[PATCH 4/4] drm/xe/vf: Defer fixups if migrated twice fast
Tomasz Lis
tomasz.lis at intel.com
Fri Sep 20 22:29:26 UTC 2024
If another VF migration happens during post-migration recovery,
then the current worker should finish early to allow the next
one to start swiftly and cleanly.
Check for deferral in two places: before fixups, and before
sending RESFIX_DONE.
Signed-off-by: Tomasz Lis <tomasz.lis at intel.com>
---
drivers/gpu/drm/xe/xe_sriov_vf.c | 25 +++++++++++++++++++++++++
1 file changed, 25 insertions(+)
diff --git a/drivers/gpu/drm/xe/xe_sriov_vf.c b/drivers/gpu/drm/xe/xe_sriov_vf.c
index 3cea2d21525f..93817cf21701 100644
--- a/drivers/gpu/drm/xe/xe_sriov_vf.c
+++ b/drivers/gpu/drm/xe/xe_sriov_vf.c
@@ -52,6 +52,19 @@ static int vf_post_migration_reinit_guc(struct xe_device *xe)
return err;
}
+/*
+ * vf_post_migration_imminent - Check if post-migration recovery is about to run.
+ * @xe: the &xe_device struct instance
+ *
+ * Return: true if any migration_gt_flags bit is set or the migration worker is
+ * pending; false otherwise. A worker that is currently executing does not affect the result.
+ */
+static bool vf_post_migration_imminent(struct xe_device *xe)
+{
+ return xe->sriov.vf.migration_gt_flags != 0 ||
+ work_pending(&xe->sriov.vf.migration_worker);
+}
+
/*
* vf_post_migration_notify_resfix_done - Notify all GuCs about resource fixups apply finished.
* @xe: the &xe_device struct instance
@@ -64,12 +77,19 @@ static void vf_post_migration_notify_resfix_done(struct xe_device *xe)
xe_pm_runtime_get(xe);
for_each_gt(gt, xe, id) {
+ if (vf_post_migration_imminent(xe))
+ goto skip;
err = xe_gt_sriov_vf_notify_resfix_done(gt);
if (!err)
num_sent++;
}
xe_pm_runtime_put(xe);
drm_dbg(&xe->drm, "sent %d VF resource fixups done notifications\n", num_sent);
+ return;
+
+skip:
+ xe_pm_runtime_put(xe);
+ drm_dbg(&xe->drm, "another recovery imminent, skipping notifications\n");
}
static void vf_post_migration_recovery(struct xe_device *xe)
@@ -78,6 +98,8 @@ static void vf_post_migration_recovery(struct xe_device *xe)
drm_dbg(&xe->drm, "migration recovery in progress\n");
err = vf_post_migration_reinit_guc(xe);
+ if (vf_post_migration_imminent(xe))
+ goto defer;
if (unlikely(err))
goto fail;
@@ -85,6 +107,9 @@ static void vf_post_migration_recovery(struct xe_device *xe)
vf_post_migration_notify_resfix_done(xe);
drm_notice(&xe->drm, "migration recovery completed\n");
return;
+defer:
+ drm_dbg(&xe->drm, "migration recovery deferred\n");
+ return;
fail:
drm_err(&xe->drm, "migration recovery failed (%pe)\n", ERR_PTR(err));
xe_device_declare_wedged(xe);
--
2.25.1
More information about the Intel-xe
mailing list