drm/xe/xe_late_bind_fw: Load late binding firmware

Load late binding firmware

v2:
 - s/EAGAIN/EBUSY/
 - Flush worker in suspend and driver unload (Daniele)
v3:
 - Use retry interval of 6s, in steps of 200ms, to allow
   other OS components release MEI CL handle (Sasha)
v4:
 - return -ENODEV if component not added (Daniele)
 - parse and print status returned by csc
v5:
 - Use payload to check firmware valid (Daniele)
 - Obtain the RPM reference before scheduling the worker to
   ensure the device remains awake until the worker completes
   firmware loading (Rodrigo)
v6:
 - In case of error donot re-attempt fw download (Daniele)
v7 (Rodrigo):
 - Rename of mei structs and callback.

Signed-off-by: Badal Nilawar <badal.nilawar@intel.com>
Reviewed-by: Daniele Ceraolo Spurio <daniele.ceraolospurio@intel.com>
Signed-off-by: Rodrigo Vivi <rodrigo.vivi@intel.com>
Link: https://lore.kernel.org/r/20250905154953.3974335-6-badal.nilawar@intel.com
Signed-off-by: Lucas De Marchi <lucas.demarchi@intel.com>
This commit is contained in:
Badal Nilawar
2025-09-05 21:19:49 +05:30
committed by Lucas De Marchi
parent 45832bf9c1
commit 691a54ad94
3 changed files with 165 additions and 2 deletions

View File

@@ -16,6 +16,20 @@
#include "xe_late_bind_fw.h"
#include "xe_pcode.h"
#include "xe_pcode_api.h"
#include "xe_pm.h"
/*
* The component should load quite quickly in most cases, but it could take
* a bit. Using a very big timeout just to cover the worst case scenario
*/
#define LB_INIT_TIMEOUT_MS 20000
/*
* Retry interval set to 6 seconds, in steps of 200 ms, to allow time for
* other OS components to release the MEI CL handle
*/
#define LB_FW_LOAD_RETRY_MAXCOUNT 30
#define LB_FW_LOAD_RETRY_PAUSE_MS 200
static const u32 fw_id_to_type[] = {
[XE_LB_FW_FAN_CONTROL] = INTEL_LB_TYPE_FAN_CONTROL,
@@ -31,6 +45,30 @@ late_bind_to_xe(struct xe_late_bind *late_bind)
return container_of(late_bind, struct xe_device, late_bind);
}
static const char *xe_late_bind_parse_status(uint32_t status)
{
switch (status) {
case INTEL_LB_STATUS_SUCCESS:
return "success";
case INTEL_LB_STATUS_4ID_MISMATCH:
return "4Id Mismatch";
case INTEL_LB_STATUS_ARB_FAILURE:
return "ARB Failure";
case INTEL_LB_STATUS_GENERAL_ERROR:
return "General Error";
case INTEL_LB_STATUS_INVALID_PARAMS:
return "Invalid Params";
case INTEL_LB_STATUS_INVALID_SIGNATURE:
return "Invalid Signature";
case INTEL_LB_STATUS_INVALID_PAYLOAD:
return "Invalid Payload";
case INTEL_LB_STATUS_TIMEOUT:
return "Timeout";
default:
return "Unknown error";
}
}
static int xe_late_bind_fw_num_fans(struct xe_late_bind *late_bind)
{
struct xe_device *xe = late_bind_to_xe(late_bind);
@@ -44,6 +82,101 @@ static int xe_late_bind_fw_num_fans(struct xe_late_bind *late_bind)
return 0;
}
static void xe_late_bind_wait_for_worker_completion(struct xe_late_bind *late_bind)
{
struct xe_device *xe = late_bind_to_xe(late_bind);
struct xe_late_bind_fw *lbfw;
int fw_id;
for (fw_id = 0; fw_id < XE_LB_FW_MAX_ID; fw_id++) {
lbfw = &late_bind->late_bind_fw[fw_id];
if (lbfw->payload && late_bind->wq) {
drm_dbg(&xe->drm, "Flush work: load %s firmware\n",
fw_id_to_name[lbfw->id]);
flush_work(&lbfw->work);
}
}
}
static void xe_late_bind_work(struct work_struct *work)
{
struct xe_late_bind_fw *lbfw = container_of(work, struct xe_late_bind_fw, work);
struct xe_late_bind *late_bind = container_of(lbfw, struct xe_late_bind,
late_bind_fw[lbfw->id]);
struct xe_device *xe = late_bind_to_xe(late_bind);
int retry = LB_FW_LOAD_RETRY_MAXCOUNT;
int ret;
int slept;
xe_device_assert_mem_access(xe);
/* we can queue this before the component is bound */
for (slept = 0; slept < LB_INIT_TIMEOUT_MS; slept += 100) {
if (late_bind->component.ops)
break;
msleep(100);
}
if (!late_bind->component.ops) {
drm_err(&xe->drm, "Late bind component not bound\n");
/* Do not re-attempt fw load */
drmm_kfree(&xe->drm, (void *)lbfw->payload);
lbfw->payload = NULL;
goto out;
}
drm_dbg(&xe->drm, "Load %s firmware\n", fw_id_to_name[lbfw->id]);
do {
ret = late_bind->component.ops->push_payload(late_bind->component.mei_dev,
lbfw->type,
lbfw->flags,
lbfw->payload,
lbfw->payload_size);
if (!ret)
break;
msleep(LB_FW_LOAD_RETRY_PAUSE_MS);
} while (--retry && ret == -EBUSY);
if (!ret) {
drm_dbg(&xe->drm, "Load %s firmware successful\n",
fw_id_to_name[lbfw->id]);
goto out;
}
if (ret > 0)
drm_err(&xe->drm, "Load %s firmware failed with err %d, %s\n",
fw_id_to_name[lbfw->id], ret, xe_late_bind_parse_status(ret));
else
drm_err(&xe->drm, "Load %s firmware failed with err %d",
fw_id_to_name[lbfw->id], ret);
/* Do not re-attempt fw load */
drmm_kfree(&xe->drm, (void *)lbfw->payload);
lbfw->payload = NULL;
out:
xe_pm_runtime_put(xe);
}
int xe_late_bind_fw_load(struct xe_late_bind *late_bind)
{
struct xe_device *xe = late_bind_to_xe(late_bind);
struct xe_late_bind_fw *lbfw;
int fw_id;
if (!late_bind->component_added)
return -ENODEV;
for (fw_id = 0; fw_id < XE_LB_FW_MAX_ID; fw_id++) {
lbfw = &late_bind->late_bind_fw[fw_id];
if (lbfw->payload) {
xe_pm_runtime_get_noresume(xe);
queue_work(late_bind->wq, &lbfw->work);
}
}
return 0;
}
static int __xe_late_bind_fw_init(struct xe_late_bind *late_bind, u32 fw_id)
{
struct xe_device *xe = late_bind_to_xe(late_bind);
@@ -97,6 +230,7 @@ static int __xe_late_bind_fw_init(struct xe_late_bind *late_bind, u32 fw_id)
memcpy((void *)lb_fw->payload, fw->data, lb_fw->payload_size);
release_firmware(fw);
INIT_WORK(&lb_fw->work, xe_late_bind_work);
return 0;
}
@@ -106,11 +240,16 @@ static int xe_late_bind_fw_init(struct xe_late_bind *late_bind)
int ret;
int fw_id;
late_bind->wq = alloc_ordered_workqueue("late-bind-ordered-wq", 0);
if (!late_bind->wq)
return -ENOMEM;
for (fw_id = 0; fw_id < XE_LB_FW_MAX_ID; fw_id++) {
ret = __xe_late_bind_fw_init(late_bind, fw_id);
if (ret)
return ret;
}
return 0;
}
@@ -132,6 +271,8 @@ static void xe_late_bind_component_unbind(struct device *xe_kdev,
struct xe_device *xe = kdev_to_xe_device(xe_kdev);
struct xe_late_bind *late_bind = &xe->late_bind;
xe_late_bind_wait_for_worker_completion(late_bind);
late_bind->component.ops = NULL;
}
@@ -145,7 +286,15 @@ static void xe_late_bind_remove(void *arg)
struct xe_late_bind *late_bind = arg;
struct xe_device *xe = late_bind_to_xe(late_bind);
xe_late_bind_wait_for_worker_completion(late_bind);
late_bind->component_added = false;
component_del(xe->drm.dev, &xe_late_bind_component_ops);
if (late_bind->wq) {
destroy_workqueue(late_bind->wq);
late_bind->wq = NULL;
}
}
/**
@@ -174,9 +323,15 @@ int xe_late_bind_init(struct xe_late_bind *late_bind)
return err;
}
late_bind->component_added = true;
err = devm_add_action_or_reset(xe->drm.dev, xe_late_bind_remove, late_bind);
if (err)
return err;
return xe_late_bind_fw_init(late_bind);
err = xe_late_bind_fw_init(late_bind);
if (err)
return err;
return xe_late_bind_fw_load(late_bind);
}

View File

@@ -11,5 +11,6 @@
struct xe_late_bind;
int xe_late_bind_init(struct xe_late_bind *late_bind);
int xe_late_bind_fw_load(struct xe_late_bind *late_bind);
#endif

View File

@@ -9,6 +9,7 @@
#include <linux/iosys-map.h>
#include <linux/mutex.h>
#include <linux/types.h>
#include <linux/workqueue.h>
#define XE_LB_MAX_PAYLOAD_SIZE SZ_4K
@@ -36,6 +37,8 @@ struct xe_late_bind_fw {
const u8 *payload;
/** @payload_size: late binding blob payload_size */
size_t payload_size;
/** @work: worker to upload latebind blob */
struct work_struct work;
};
/**
@@ -47,7 +50,7 @@ struct xe_late_bind_fw {
*/
struct xe_late_bind_component {
struct device *mei_dev;
const struct late_bind_component_ops *ops;
const struct intel_lb_component_ops *ops;
};
/**
@@ -58,6 +61,10 @@ struct xe_late_bind {
struct xe_late_bind_component component;
/** @late_bind_fw: late binding firmware array */
struct xe_late_bind_fw late_bind_fw[XE_LB_FW_MAX_ID];
/** @wq: workqueue to submit request to download late bind blob */
struct workqueue_struct *wq;
/** @component_added: whether the component has been added */
bool component_added;
};
#endif