AMD General

Regards,
      Prike

> -----Original Message-----
> From: Pierre-Eric Pelloux-Prayer <[email protected]>
> Sent: Wednesday, May 13, 2026 5:18 PM
> To: Liang, Prike <[email protected]>; [email protected]
> Cc: Deucher, Alexander <[email protected]>; Koenig, Christian
> <[email protected]>
> Subject: Re: [PATCH 4/4] drm/amdgpu: add eviction fence tracepoints for userq
> profiling
>
>
>
> Le 11/05/2026 à 15:54, Prike Liang a écrit :
> > Add ftrace events for the userq eviction fence lifecycle.
> >
> > Signed-off-by: Prike Liang <[email protected]>
> > ---
> >   .../drm/amd/amdgpu/amdgpu_eviction_fence.c    |  8 +++-
> >   drivers/gpu/drm/amd/amdgpu/amdgpu_trace.h     | 42 +++++++++++++++++++
> >   2 files changed, 49 insertions(+), 1 deletion(-)
> >
> > diff --git a/drivers/gpu/drm/amd/amdgpu/amdgpu_eviction_fence.c
> > b/drivers/gpu/drm/amd/amdgpu/amdgpu_eviction_fence.c
> > index 5ae477c49a53..9358f9b35914 100644
> > --- a/drivers/gpu/drm/amd/amdgpu/amdgpu_eviction_fence.c
> > +++ b/drivers/gpu/drm/amd/amdgpu/amdgpu_eviction_fence.c
> > @@ -24,6 +24,7 @@
> >   #include <linux/sched.h>
> >   #include <drm/drm_exec.h>
> >   #include "amdgpu.h"
> > +#include "amdgpu_trace.h"
> >
> >   static const char *
> >   amdgpu_eviction_fence_get_driver_name(struct dma_fence *fence) @@
> > -44,6 +45,8 @@ static bool amdgpu_eviction_fence_enable_signaling(struct
> dma_fence *f)
> >   {
> >     struct amdgpu_eviction_fence *ev_fence = to_ev_fence(f);
> >
> > +   trace_amdgpu_userq_eviction_fence_enable_signaling(f->context,
> > +                                                      f->seqno);
> >     schedule_work(&ev_fence->evf_mgr->suspend_work);
> >     return true;
> >   }
> > @@ -84,6 +87,8 @@ amdgpu_eviction_fence_suspend_worker(struct work_struct
> *work)
> >      * next fence.
> >      */
> >     dma_fence_signal(ev_fence);
> > +   trace_amdgpu_userq_eviction_fence_signal(ev_fence->context,
> > +                                            ev_fence->seqno);
> >     dma_fence_end_signalling(cookie);
> >     dma_fence_put(ev_fence);
> >
> > @@ -138,7 +143,8 @@ int amdgpu_evf_mgr_rearm(struct
> amdgpu_eviction_fence_mgr *evf_mgr,
> >     /* Remember it for newly added BOs */
> >     dma_fence_put(evf_mgr->ev_fence);
> >     evf_mgr->ev_fence = &ev_fence->base;
> > -
> > +   trace_amdgpu_userq_eviction_fence_emit(ev_fence->base.context,
> > +                                          ev_fence->base.seqno);
> >     /* And add it to all existing BOs */
> >     drm_exec_for_each_locked_object(exec, index, obj) {
> >             struct amdgpu_bo *bo = gem_to_amdgpu_bo(obj); diff --git
> > a/drivers/gpu/drm/amd/amdgpu/amdgpu_trace.h
> > b/drivers/gpu/drm/amd/amdgpu/amdgpu_trace.h
> > index d421a44ef933..5191f4e957d5 100644
> > --- a/drivers/gpu/drm/amd/amdgpu/amdgpu_trace.h
> > +++ b/drivers/gpu/drm/amd/amdgpu/amdgpu_trace.h
> > @@ -709,6 +709,48 @@ TRACE_EVENT(amdgpu_userq_fence_signal,
> >         TP_printk("context=%llu, seqno=%llu, rptr=%llu",
> >                   __entry->context, __entry->seqno, __entry->rptr)
> >   );
> > +TRACE_EVENT(amdgpu_userq_eviction_fence_emit,
> > +       TP_PROTO(u64 context, u64 seqno),
> > +       TP_ARGS(context, seqno),
> > +       TP_STRUCT__entry(
> > +                        __field(u64, context)
> > +                        __field(u64, seqno)
> > +                        ),
> > +       TP_fast_assign(
> > +                      __entry->context = context;
> > +                      __entry->seqno = seqno;
> > +                      ),
> > +       TP_printk("context=%llu, seqno=%llu",
> > +                 __entry->context, __entry->seqno)
>
> I'll leave it to others to decide if these events are useful, but if you keep 
> them please
> use "fence=%llu:%llu" for consistency.

I think this will help understanding and profiling the userq objects 
bookkeeping usage and userq eviction latency.

> Pierre-Eric
>
> > +);
> > +TRACE_EVENT(amdgpu_userq_eviction_fence_enable_signaling,
> > +       TP_PROTO(u64 context, u64 seqno),
> > +       TP_ARGS(context, seqno),
> > +       TP_STRUCT__entry(
> > +                        __field(u64, context)
> > +                        __field(u64, seqno)
> > +                        ),
> > +       TP_fast_assign(
> > +                      __entry->context = context;
> > +                      __entry->seqno = seqno;
> > +                      ),
> > +       TP_printk("context=%llu, seqno=%llu",
> > +                 __entry->context, __entry->seqno) );
> > +TRACE_EVENT(amdgpu_userq_eviction_fence_signal,
> > +       TP_PROTO(u64 context, u64 seqno),
> > +       TP_ARGS(context, seqno),
> > +       TP_STRUCT__entry(
> > +                        __field(u64, context)
> > +                        __field(u64, seqno)
> > +                        ),
> > +       TP_fast_assign(
> > +                      __entry->context = context;
> > +                      __entry->seqno = seqno;
> > +                      ),
> > +       TP_printk("context=%llu, seqno=%llu",
> > +                 __entry->context, __entry->seqno) );
> >   #undef AMDGPU_JOB_GET_TIMELINE_NAME
> >   #endif
> >

Reply via email to