On 2026-05-20 03:13, Yifan Zhang wrote:
This patch checks the SIGBUS delay time per pdd: only the pdd that belongs to the device reporting the error is consulted.

Fixes: f207b038bc38 ("drm/amdgpu: add ioctl to handle RAS poison error")
Signed-off-by: Yifan Zhang <[email protected]>
Reviewed-by: Felix Kuehling <[email protected]>
---
 drivers/gpu/drm/amd/amdkfd/kfd_events.c | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/drivers/gpu/drm/amd/amdkfd/kfd_events.c b/drivers/gpu/drm/amd/amdkfd/kfd_events.c
index 8b4e0a208e86..69fed7e5b122 100644
--- a/drivers/gpu/drm/amd/amdkfd/kfd_events.c
+++ b/drivers/gpu/drm/amd/amdkfd/kfd_events.c
@@ -1388,7 +1388,7 @@ static void kfd_signal_sigbus_delayed_fn(struct work_struct *work)
  * Rationale: if the app has explicitly opted in on any GPU it uses, it
  * wants the chance to handle the error in userspace.
  */
-static u32 kfd_get_sigbus_delay_ms(struct kfd_process *p)
+static u32 kfd_get_sigbus_delay_ms(struct kfd_process *p, struct kfd_node *dev)
 {
 	u32 result = 0;
 	int i;
@@ -1399,7 +1399,7 @@ static u32 kfd_get_sigbus_delay_ms(struct kfd_process *p)
 		struct amdgpu_fpriv *drv_priv;
 		u32 v;
 
-		if (!pdd || !pdd->drm_file)
+		if (!pdd || !pdd->drm_file || pdd->dev != dev)
 			continue;
 		if (amdgpu_file_to_fpriv(pdd->drm_file, &drv_priv))
 			continue;
@@ -1420,7 +1420,7 @@ static u32 kfd_get_sigbus_delay_ms(struct kfd_process *p)
 static void kfd_signal_sigbus_with_delay(struct kfd_node *dev,
 					 struct kfd_process *p)
 {
-	u32 delay_ms = kfd_get_sigbus_delay_ms(p);
+	u32 delay_ms = kfd_get_sigbus_delay_ms(p, dev);
 	struct kfd_sigbus_delayed_work *dw;
 
 	if (delay_ms == AMDGPU_USER_OPTIONS_KFD_SIGBUS_DELAY_DISABLED) {
