[PATCH 1/2] drm/amdkfd: Document and define SVM event tracing macro
Felix Kuehling
felix.kuehling at amd.com
Fri Feb 16 20:16:06 UTC 2024
On 2024-02-15 10:18, Philip Yang wrote:
> Document how to use SMI system management interface to receive SVM
> events.
>
> Define SVM events message string format macro that could use by user
> mode for sscanf to parse the event. Add it to uAPI header file to make
> it obvious that is changing uAPI in future.
>
> No functional changes.
>
> Signed-off-by: Philip Yang <Philip.Yang at amd.com>
> ---
> drivers/gpu/drm/amd/amdkfd/kfd_smi_events.c | 51 +++++++-------
> include/uapi/linux/kfd_ioctl.h | 77 ++++++++++++++++++++-
> 2 files changed, 102 insertions(+), 26 deletions(-)
>
> diff --git a/drivers/gpu/drm/amd/amdkfd/kfd_smi_events.c b/drivers/gpu/drm/amd/amdkfd/kfd_smi_events.c
> index d9953c2b2661..85465eb303a9 100644
> --- a/drivers/gpu/drm/amd/amdkfd/kfd_smi_events.c
> +++ b/drivers/gpu/drm/amd/amdkfd/kfd_smi_events.c
> @@ -225,15 +225,16 @@ void kfd_smi_event_update_gpu_reset(struct kfd_node *dev, bool post_reset)
> event = KFD_SMI_EVENT_GPU_PRE_RESET;
> ++(dev->reset_seq_num);
> }
> - kfd_smi_event_add(0, dev, event, "%x\n", dev->reset_seq_num);
> + kfd_smi_event_add(0, dev, event,
> + KFD_EVENT_FMT_UPDATE_GPU_RESET(dev->reset_seq_num));
> }
>
> void kfd_smi_event_update_thermal_throttling(struct kfd_node *dev,
> uint64_t throttle_bitmask)
> {
> - kfd_smi_event_add(0, dev, KFD_SMI_EVENT_THERMAL_THROTTLE, "%llx:%llx\n",
> - throttle_bitmask,
> - amdgpu_dpm_get_thermal_throttling_counter(dev->adev));
> + kfd_smi_event_add(0, dev, KFD_SMI_EVENT_THERMAL_THROTTLE,
> + KFD_EVENT_FMT_UPDATE_THERMAL_THROTTLING(throttle_bitmask,
> + amdgpu_dpm_get_thermal_throttling_counter(dev->adev)));
> }
>
> void kfd_smi_event_update_vmfault(struct kfd_node *dev, uint16_t pasid)
> @@ -246,8 +247,8 @@ void kfd_smi_event_update_vmfault(struct kfd_node *dev, uint16_t pasid)
> if (!task_info.pid)
> return;
>
> - kfd_smi_event_add(0, dev, KFD_SMI_EVENT_VMFAULT, "%x:%s\n",
> - task_info.pid, task_info.task_name);
> + kfd_smi_event_add(0, dev, KFD_SMI_EVENT_VMFAULT,
> + KFD_EVENT_FMT_VMFAULT(task_info.pid, task_info.task_name));
> }
>
> void kfd_smi_event_page_fault_start(struct kfd_node *node, pid_t pid,
> @@ -255,16 +256,16 @@ void kfd_smi_event_page_fault_start(struct kfd_node *node, pid_t pid,
> ktime_t ts)
> {
> kfd_smi_event_add(pid, node, KFD_SMI_EVENT_PAGE_FAULT_START,
> - "%lld -%d @%lx(%x) %c\n", ktime_to_ns(ts), pid,
> - address, node->id, write_fault ? 'W' : 'R');
> + KFD_EVENT_FMT_PAGEFAULT_START(ktime_to_ns(ts), pid,
> + address, node->id, write_fault ? 'W' : 'R'));
> }
>
> void kfd_smi_event_page_fault_end(struct kfd_node *node, pid_t pid,
> unsigned long address, bool migration)
> {
> kfd_smi_event_add(pid, node, KFD_SMI_EVENT_PAGE_FAULT_END,
> - "%lld -%d @%lx(%x) %c\n", ktime_get_boottime_ns(),
> - pid, address, node->id, migration ? 'M' : 'U');
> + KFD_EVENT_FMT_PAGEFAULT_END(ktime_get_boottime_ns(),
> + pid, address, node->id, migration ? 'M' : 'U'));
> }
>
> void kfd_smi_event_migration_start(struct kfd_node *node, pid_t pid,
> @@ -274,9 +275,9 @@ void kfd_smi_event_migration_start(struct kfd_node *node, pid_t pid,
> uint32_t trigger)
> {
> kfd_smi_event_add(pid, node, KFD_SMI_EVENT_MIGRATE_START,
> - "%lld -%d @%lx(%lx) %x->%x %x:%x %d\n",
> - ktime_get_boottime_ns(), pid, start, end - start,
> - from, to, prefetch_loc, preferred_loc, trigger);
> + KFD_EVENT_FMT_MIGRATE_START(ktime_get_boottime_ns(),
> + pid, start, end - start, from, to, prefetch_loc,
> + preferred_loc, trigger));
> }
>
> void kfd_smi_event_migration_end(struct kfd_node *node, pid_t pid,
> @@ -284,24 +285,23 @@ void kfd_smi_event_migration_end(struct kfd_node *node, pid_t pid,
> uint32_t from, uint32_t to, uint32_t trigger)
> {
> kfd_smi_event_add(pid, node, KFD_SMI_EVENT_MIGRATE_END,
> - "%lld -%d @%lx(%lx) %x->%x %d\n",
> - ktime_get_boottime_ns(), pid, start, end - start,
> - from, to, trigger);
> + KFD_EVENT_FMT_MIGRATE_END(ktime_get_boottime_ns(), pid,
> + start, end - start, from, to, trigger));
> }
>
> void kfd_smi_event_queue_eviction(struct kfd_node *node, pid_t pid,
> uint32_t trigger)
> {
> kfd_smi_event_add(pid, node, KFD_SMI_EVENT_QUEUE_EVICTION,
> - "%lld -%d %x %d\n", ktime_get_boottime_ns(), pid,
> - node->id, trigger);
> + KFD_EVENT_FMT_QUEUE_EVICTION(ktime_get_boottime_ns(),
> + pid, node->id, trigger));
> }
>
> void kfd_smi_event_queue_restore(struct kfd_node *node, pid_t pid)
> {
> kfd_smi_event_add(pid, node, KFD_SMI_EVENT_QUEUE_RESTORE,
> - "%lld -%d %x\n", ktime_get_boottime_ns(), pid,
> - node->id);
> + KFD_EVENT_FMT_QUEUE_RESTORE(ktime_get_boottime_ns(),
> + pid, node->id));
> }
>
> void kfd_smi_event_queue_restore_rescheduled(struct mm_struct *mm)
> @@ -317,9 +317,10 @@ void kfd_smi_event_queue_restore_rescheduled(struct mm_struct *mm)
> struct kfd_process_device *pdd = p->pdds[i];
>
> kfd_smi_event_add(p->lead_thread->pid, pdd->dev,
> - KFD_SMI_EVENT_QUEUE_RESTORE,
> - "%lld -%d %x %c\n", ktime_get_boottime_ns(),
> - p->lead_thread->pid, pdd->dev->id, 'R');
> + KFD_SMI_EVENT_QUEUE_RESTORE_RESCHEDULED,
> + KFD_EVENT_FMT_QUEUE_RESTORE_RESCHEDULED(
> + ktime_get_boottime_ns(), p->lead_thread->pid,
> + pdd->dev->id, 'R'));
> }
> kfd_unref_process(p);
> }
> @@ -329,8 +330,8 @@ void kfd_smi_event_unmap_from_gpu(struct kfd_node *node, pid_t pid,
> uint32_t trigger)
> {
> kfd_smi_event_add(pid, node, KFD_SMI_EVENT_UNMAP_FROM_GPU,
> - "%lld -%d @%lx(%lx) %x %d\n", ktime_get_boottime_ns(),
> - pid, address, last - address + 1, node->id, trigger);
> + KFD_EVENT_FMT_UNMAP_FROM_GPU(ktime_get_boottime_ns(),
> + pid, address, last - address + 1, node->id, trigger));
> }
>
> int kfd_smi_event_open(struct kfd_node *dev, uint32_t *fd)
> diff --git a/include/uapi/linux/kfd_ioctl.h b/include/uapi/linux/kfd_ioctl.h
> index 9ce46edc62a5..430c01f4148b 100644
> --- a/include/uapi/linux/kfd_ioctl.h
> +++ b/include/uapi/linux/kfd_ioctl.h
> @@ -523,7 +523,8 @@ enum kfd_smi_event {
> KFD_SMI_EVENT_PAGE_FAULT_END = 8,
> KFD_SMI_EVENT_QUEUE_EVICTION = 9,
> KFD_SMI_EVENT_QUEUE_RESTORE = 10,
> - KFD_SMI_EVENT_UNMAP_FROM_GPU = 11,
> + KFD_SMI_EVENT_QUEUE_RESTORE_RESCHEDULED = 11,
> + KFD_SMI_EVENT_UNMAP_FROM_GPU = 12,
>
> /*
> * max event number, as a flag bit to get events from all processes,
> @@ -564,6 +565,80 @@ struct kfd_ioctl_smi_events_args {
> __u32 anon_fd; /* from KFD */
> };
>
> +/*
> + * SVM event tracing via SMI system management interface
> + *
> + * Open event file descriptor
> + * use ioctl AMDKFD_IOC_SMI_EVENTS, pass in gpuid and return a anonymous file
> + * descriptor to receive SMI events.
> + * If calling with sudo permission, then file descriptor can be used to receive
> + * SVM events from all processes, otherwise, to only receive SVM events of same
> + * process.
> + *
> + * To enable the SVM event
> + * Write event file descriptor with KFD_SMI_EVENT_MASK_FROM_INDEX(event) bitmap
> + * mask to start record the event to the kfifo, use bitmap mask combination
> + * for multiple events. New event mask will overwrite the previous event mask.
> + * KFD_SMI_EVENT_MASK_FROM_INDEX(KFD_SMI_EVENT_ALL_PROCESS) bit requires sudo
> + * permisson to receive SVM events from all process.
> + *
> + * To receive the event
> + * Application can poll file descriptor to wait for the events, then read event
> + * from the file into a buffer. Each event is one line string message, starting
> + * with the event id, then the event specific information.
> + *
> + * To decode event information
> + * The following event format string macro can be used with sscanf to decode
> + * the specific event information.
> + * event triggers: the reason to generate the event, defined as enum for unmap,
> + * eviction and migrate events.
> + * node, from, to, prefetch_loc, preferred_loc: GPU ID, or 0 for system memory.
> + * addr: user mode address, in pages
> + * size: in pages
> + * pid: the process ID to generate the event
> + * ns: timestamp in nanosecond-resolution, starts at system boot time but
> + * stops during suspend
> + * migrate_update: the GPU page is recovered by 'M' for migrate, 'U' for update
> + * rescheduled: 'R' if the queue restore failed and rescheduled to try again
> + * rw: 'W' for write page fault, 'R' for read page fault
> + */
> +#define KFD_EVENT_FMT_UPDATE_GPU_RESET(reset_seq_num)\
> + "%x\n", (reset_seq_num)
If we want user mode to use this with fscanf or sscanf, and we want this
to be extensible in the future so we can add new fields without breaking
user mode using these macros (as you do in patch 2), then the \n should
not be part of the format string here. We can add the \n in
kfd_smi_event_add instead.
Regards,
Felix
> +
> +#define KFD_EVENT_FMT_UPDATE_THERMAL_THROTTLING(bitmask, counter)\
> + "%llx:%llx\n", (bitmask), (counter)
> +
> +#define KFD_EVENT_FMT_VMFAULT(pid, task_name)\
> + "%x:%s\n", (pid), (task_name)
> +
> +#define KFD_EVENT_FMT_PAGEFAULT_START(ns, pid, addr, node, rw)\
> + "%lld -%d @%lx(%x) %c\n", (ns), (pid), (addr), (node), (rw)
> +
> +#define KFD_EVENT_FMT_PAGEFAULT_END(ns, pid, addr, node, migrate_update)\
> + "%lld -%d @%lx(%x) %c\n", (ns), (pid), (addr), (node), (migrate_update)
> +
> +#define KFD_EVENT_FMT_MIGRATE_START(ns, pid, start, size, from, to, prefetch_loc,\
> + preferred_loc, migrate_trigger)\
> + "%lld -%d @%lx(%lx) %x->%x %x:%x %d\n", (ns), (pid), (start), (size),\
> + (from), (to), (prefetch_loc), (preferred_loc), (migrate_trigger)
> +
> +#define KFD_EVENT_FMT_MIGRATE_END(ns, pid, start, size, from, to, migrate_trigger)\
> + "%lld -%d @%lx(%lx) %x->%x %d\n", (ns), (pid), (start), (size),\
> + (from), (to), (migrate_trigger)
> +
> +#define KFD_EVENT_FMT_QUEUE_EVICTION(ns, pid, node, evict_trigger)\
> + "%lld -%d %x %d\n", (ns), (pid), (node), (evict_trigger)
> +
> +#define KFD_EVENT_FMT_QUEUE_RESTORE(ns, pid, node)\
> + "%lld -%d %x\n", (ns), (pid), (node)
> +
> +#define KFD_EVENT_FMT_QUEUE_RESTORE_RESCHEDULED(ns, pid, node, rescheduled)\
> + "%lld -%d %x %c\n", (ns), (pid), (node), (rescheduled)
> +
> +#define KFD_EVENT_FMT_UNMAP_FROM_GPU(ns, pid, addr, size, node, unmap_trigger)\
> + "%lld -%d @%lx(%lx) %x %d\n", (ns), (pid), (addr), (size),\
> + (node), (unmap_trigger)
> +
> /**************************************************************************************************
> * CRIU IOCTLs (Checkpoint Restore In Userspace)
> *
More information about the amd-gfx
mailing list