This patch fixes a multiple CPU hangs caused by the improper use of
spin_lock that are not IRQ safe. This allow the software driver to
get into some sort of deadlock/race condition. It happen of kernels
that have CONFIG_PROVE_LOCKING=y and or CONFIG_PREEMPT (full
preemption).
Fixes: 4c131aa02bc4 ("drm/amdgpu: Add profiling counters in fdinfo")
Signed-off-by: Andrew Martin <[email protected]>
---
drivers/gpu/drm/amd/amdgpu/amdgpu_vm.c | 158 ++++++++++++++++---------
1 file changed, 105 insertions(+), 53 deletions(-)
diff --git a/drivers/gpu/drm/amd/amdgpu/amdgpu_vm.c
b/drivers/gpu/drm/amd/amdgpu/amdgpu_vm.c
index 8de9b7b3cc88..dc0fbf134fc0 100644
--- a/drivers/gpu/drm/amd/amdgpu/amdgpu_vm.c
+++ b/drivers/gpu/drm/amd/amdgpu/amdgpu_vm.c
@@ -165,14 +165,16 @@ static void amdgpu_vm_bo_evicted(struct amdgpu_vm_bo_base
*vm_bo)
struct amdgpu_vm *vm = vm_bo->vm;
struct amdgpu_bo *bo = vm_bo->bo;
+ unsigned long flags;
+
vm_bo->moved = true;
amdgpu_vm_assert_locked(vm);
- spin_lock(&vm_bo->vm->status_lock);
+ spin_lock_irqsave(&vm_bo->vm->status_lock, flags);
if (bo->tbo.type == ttm_bo_type_kernel)
list_move(&vm_bo->vm_status, &vm->evicted);
else
list_move_tail(&vm_bo->vm_status, &vm->evicted);
- spin_unlock(&vm_bo->vm->status_lock);
+ spin_unlock_irqrestore(&vm_bo->vm->status_lock, flags);
}
/**
* amdgpu_vm_bo_moved - vm_bo is moved
@@ -184,10 +186,12 @@ static void amdgpu_vm_bo_evicted(struct amdgpu_vm_bo_base
*vm_bo)
*/
static void amdgpu_vm_bo_moved(struct amdgpu_vm_bo_base *vm_bo)
{
+ unsigned long flags;
+
amdgpu_vm_assert_locked(vm_bo->vm);
- spin_lock(&vm_bo->vm->status_lock);
+ spin_lock_irqsave(&vm_bo->vm->status_lock, flags);
list_move(&vm_bo->vm_status, &vm_bo->vm->moved);
- spin_unlock(&vm_bo->vm->status_lock);
+ spin_unlock_irqrestore(&vm_bo->vm->status_lock, flags);
}
/**
@@ -200,10 +204,12 @@ static void amdgpu_vm_bo_moved(struct amdgpu_vm_bo_base
*vm_bo)
*/
static void amdgpu_vm_bo_idle(struct amdgpu_vm_bo_base *vm_bo)
{
+ unsigned long flags;
+
amdgpu_vm_assert_locked(vm_bo->vm);
- spin_lock(&vm_bo->vm->status_lock);
+ spin_lock_irqsave(&vm_bo->vm->status_lock, flags);
list_move(&vm_bo->vm_status, &vm_bo->vm->idle);
- spin_unlock(&vm_bo->vm->status_lock);
+ spin_unlock_irqrestore(&vm_bo->vm->status_lock, flags);
vm_bo->moved = false;
}
@@ -217,9 +223,11 @@ static void amdgpu_vm_bo_idle(struct amdgpu_vm_bo_base
*vm_bo)
*/
static void amdgpu_vm_bo_invalidated(struct amdgpu_vm_bo_base *vm_bo)
{
- spin_lock(&vm_bo->vm->status_lock);
+ unsigned long flags;
+
+ spin_lock_irqsave(&vm_bo->vm->status_lock, flags);
list_move(&vm_bo->vm_status, &vm_bo->vm->invalidated);
- spin_unlock(&vm_bo->vm->status_lock);
+ spin_unlock_irqrestore(&vm_bo->vm->status_lock, flags);
}
/**
@@ -232,10 +240,12 @@ static void amdgpu_vm_bo_invalidated(struct
amdgpu_vm_bo_base *vm_bo)
*/
static void amdgpu_vm_bo_evicted_user(struct amdgpu_vm_bo_base *vm_bo)
{
+ unsigned long flags;
+
vm_bo->moved = true;
- spin_lock(&vm_bo->vm->status_lock);
+ spin_lock_irqsave(&vm_bo->vm->status_lock, flags);
list_move(&vm_bo->vm_status, &vm_bo->vm->evicted_user);
- spin_unlock(&vm_bo->vm->status_lock);
+ spin_unlock_irqrestore(&vm_bo->vm->status_lock, flags);
}
/**
@@ -248,11 +258,13 @@ static void amdgpu_vm_bo_evicted_user(struct
amdgpu_vm_bo_base *vm_bo)
*/
static void amdgpu_vm_bo_relocated(struct amdgpu_vm_bo_base *vm_bo)
{
+ unsigned long flags;
+
amdgpu_vm_assert_locked(vm_bo->vm);
if (vm_bo->bo->parent) {
- spin_lock(&vm_bo->vm->status_lock);
+ spin_lock_irqsave(&vm_bo->vm->status_lock, flags);
list_move(&vm_bo->vm_status, &vm_bo->vm->relocated);
- spin_unlock(&vm_bo->vm->status_lock);
+ spin_unlock_irqrestore(&vm_bo->vm->status_lock, flags);
} else {
amdgpu_vm_bo_idle(vm_bo);
}
@@ -268,10 +280,12 @@ static void amdgpu_vm_bo_relocated(struct
amdgpu_vm_bo_base *vm_bo)
*/
static void amdgpu_vm_bo_done(struct amdgpu_vm_bo_base *vm_bo)
{
+ unsigned long flags;
+
amdgpu_vm_assert_locked(vm_bo->vm);
- spin_lock(&vm_bo->vm->status_lock);
+ spin_lock_irqsave(&vm_bo->vm->status_lock, flags);
list_move(&vm_bo->vm_status, &vm_bo->vm->done);
- spin_unlock(&vm_bo->vm->status_lock);
+ spin_unlock_irqrestore(&vm_bo->vm->status_lock, flags);
}
/**
@@ -284,10 +298,11 @@ static void amdgpu_vm_bo_done(struct amdgpu_vm_bo_base
*vm_bo)
static void amdgpu_vm_bo_reset_state_machine(struct amdgpu_vm *vm)
{
struct amdgpu_vm_bo_base *vm_bo, *tmp;
+ unsigned long flags;
amdgpu_vm_assert_locked(vm);
- spin_lock(&vm->status_lock);
+ spin_lock_irqsave(&vm->status_lock, flags);
list_splice_init(&vm->done, &vm->invalidated);
list_for_each_entry(vm_bo, &vm->invalidated, vm_status)
vm_bo->moved = true;
@@ -301,7 +316,7 @@ static void amdgpu_vm_bo_reset_state_machine(struct
amdgpu_vm *vm)
else if (bo->parent)
list_move(&vm_bo->vm_status, &vm_bo->vm->relocated);
}
- spin_unlock(&vm->status_lock);
+ spin_unlock_irqrestore(&vm->status_lock, flags);
}
/**
@@ -320,8 +335,10 @@ static void amdgpu_vm_update_shared(struct
amdgpu_vm_bo_base *base)
uint32_t bo_memtype = amdgpu_bo_mem_stats_placement(bo);
bool shared;
+ unsigned long flags;
+
dma_resv_assert_held(bo->tbo.base.resv);
- spin_lock(&vm->status_lock);
+ spin_lock_irqsave(&vm->status_lock, flags);
shared = drm_gem_object_is_shared_for_memory_stats(&bo->tbo.base);
if (base->shared != shared) {
base->shared = shared;
@@ -333,7 +350,7 @@ static void amdgpu_vm_update_shared(struct
amdgpu_vm_bo_base *base)
vm->stats[bo_memtype].drm.private += size;
}
}
- spin_unlock(&vm->status_lock);
+ spin_unlock_irqrestore(&vm->status_lock, flags);
}
/**
@@ -404,10 +421,11 @@ void amdgpu_vm_update_stats(struct amdgpu_vm_bo_base
*base,
struct ttm_resource *res, int sign)
{
struct amdgpu_vm *vm = base->vm;
+ unsigned long flags;
- spin_lock(&vm->status_lock);
+ spin_lock_irqsave(&vm->status_lock, flags);
amdgpu_vm_update_stats_locked(base, res, sign);
- spin_unlock(&vm->status_lock);
+ spin_unlock_irqrestore(&vm->status_lock, flags);
}
/**
@@ -428,15 +446,17 @@ void amdgpu_vm_bo_base_init(struct amdgpu_vm_bo_base
*base,
base->next = NULL;
INIT_LIST_HEAD(&base->vm_status);
+ unsigned long flags;
+
if (!bo)
return;
base->next = bo->vm_bo;
bo->vm_bo = base;
- spin_lock(&vm->status_lock);
+ spin_lock_irqsave(&vm->status_lock, flags);
base->shared = drm_gem_object_is_shared_for_memory_stats(&bo->tbo.base);
amdgpu_vm_update_stats_locked(base, bo->tbo.resource, +1);
- spin_unlock(&vm->status_lock);
+ spin_unlock_irqrestore(&vm->status_lock, flags);
if (!amdgpu_vm_is_bo_always_valid(vm, bo))
return;
@@ -492,28 +512,29 @@ int amdgpu_vm_lock_done_list(struct amdgpu_vm *vm, struct
drm_exec *exec,
struct list_head *prev = &vm->done;
struct amdgpu_bo_va *bo_va;
struct amdgpu_bo *bo;
+ unsigned long flags;
int ret;
/* We can only trust prev->next while holding the lock */
- spin_lock(&vm->status_lock);
+ spin_lock_irqsave(&vm->status_lock, flags);
while (!list_is_head(prev->next, &vm->done)) {
bo_va = list_entry(prev->next, typeof(*bo_va), base.vm_status);
bo = bo_va->base.bo;
if (bo) {
amdgpu_bo_ref(bo);
- spin_unlock(&vm->status_lock);
+ spin_unlock_irqrestore(&vm->status_lock, flags);
ret = drm_exec_prepare_obj(exec, &bo->tbo.base, 1);
amdgpu_bo_unref(&bo);
if (unlikely(ret))
return ret;
- spin_lock(&vm->status_lock);
+ spin_lock_irqsave(&vm->status_lock, flags);
}
prev = prev->next;
}
- spin_unlock(&vm->status_lock);
+ spin_unlock_irqrestore(&vm->status_lock, flags);
return 0;
}
@@ -611,6 +632,7 @@ int amdgpu_vm_validate(struct amdgpu_device *adev, struct
amdgpu_vm *vm,
uint64_t new_vm_generation = amdgpu_vm_generation(adev, vm);
struct amdgpu_vm_bo_base *bo_base;
struct amdgpu_bo *bo;
+ unsigned long flags;
int r;
if (vm->generation != new_vm_generation) {
@@ -622,12 +644,12 @@ int amdgpu_vm_validate(struct amdgpu_device *adev, struct
amdgpu_vm *vm,
return r;
}
- spin_lock(&vm->status_lock);
+ spin_lock_irqsave(&vm->status_lock, flags);
while (!list_empty(&vm->evicted)) {
bo_base = list_first_entry(&vm->evicted,
struct amdgpu_vm_bo_base,
vm_status);
- spin_unlock(&vm->status_lock);
+ spin_unlock_irqrestore(&vm->status_lock, flags);
bo = bo_base->bo;
@@ -641,13 +663,13 @@ int amdgpu_vm_validate(struct amdgpu_device *adev, struct
amdgpu_vm *vm,
vm->update_funcs->map_table(to_amdgpu_bo_vm(bo));
amdgpu_vm_bo_relocated(bo_base);
}
- spin_lock(&vm->status_lock);
+ spin_lock_irqsave(&vm->status_lock, flags);
}
while (ticket && !list_empty(&vm->evicted_user)) {
bo_base = list_first_entry(&vm->evicted_user,
struct amdgpu_vm_bo_base,
vm_status);
- spin_unlock(&vm->status_lock);
+ spin_unlock_irqrestore(&vm->status_lock, flags);
bo = bo_base->bo;
dma_resv_assert_held(bo->tbo.base.resv);
@@ -658,9 +680,9 @@ int amdgpu_vm_validate(struct amdgpu_device *adev, struct
amdgpu_vm *vm,
amdgpu_vm_bo_invalidated(bo_base);
- spin_lock(&vm->status_lock);
+ spin_lock_irqsave(&vm->status_lock, flags);
}
- spin_unlock(&vm->status_lock);
+ spin_unlock_irqrestore(&vm->status_lock, flags);
amdgpu_vm_eviction_lock(vm);
vm->evicting = false;
@@ -681,6 +703,7 @@ int amdgpu_vm_validate(struct amdgpu_device *adev, struct
amdgpu_vm *vm,
*/
bool amdgpu_vm_ready(struct amdgpu_vm *vm)
{
+ unsigned long flags;
bool ret;
amdgpu_vm_assert_locked(vm);
@@ -689,9 +712,9 @@ bool amdgpu_vm_ready(struct amdgpu_vm *vm)
ret = !vm->evicting;
amdgpu_vm_eviction_unlock(vm);
- spin_lock(&vm->status_lock);
+ spin_lock_irqsave(&vm->status_lock, flags);
ret &= list_empty(&vm->evicted);
- spin_unlock(&vm->status_lock);
+ spin_unlock_irqrestore(&vm->status_lock, flags);
spin_lock(&vm->immediate.lock);
ret &= !vm->immediate.stopped;
@@ -990,11 +1013,13 @@ int amdgpu_vm_update_pdes(struct amdgpu_device *adev,
LIST_HEAD(relocated);
int r, idx;
+ unsigned long flags;
+
amdgpu_vm_assert_locked(vm);
- spin_lock(&vm->status_lock);
+ spin_lock_irqsave(&vm->status_lock, flags);
list_splice_init(&vm->relocated, &relocated);
- spin_unlock(&vm->status_lock);
+ spin_unlock_irqrestore(&vm->status_lock, flags);
if (list_empty(&relocated))
return 0;
@@ -1261,10 +1286,12 @@ void amdgpu_vm_get_memory(struct amdgpu_vm *vm,
struct amdgpu_mem_stats stats[__AMDGPU_PL_NUM],
struct amdgpu_process_stats *process_stats)
{
- spin_lock(&vm->status_lock);
+ unsigned long flags;
+
+ spin_lock_irqsave(&vm->status_lock, flags);
memcpy(stats, vm->stats, sizeof(*stats) * __AMDGPU_PL_NUM);
memcpy(process_stats, &vm->process_stats, sizeof(*process_stats));
- spin_unlock(&vm->status_lock);
+ spin_unlock_irqrestore(&vm->status_lock, flags);
}
/**
@@ -1634,26 +1661,27 @@ int amdgpu_vm_handle_moved(struct amdgpu_device *adev,
struct amdgpu_bo_va *bo_va;
struct dma_resv *resv;
bool clear, unlock;
+ unsigned long flags;
int r;
- spin_lock(&vm->status_lock);
+ spin_lock_irqsave(&vm->status_lock, flags);
while (!list_empty(&vm->moved)) {
bo_va = list_first_entry(&vm->moved, struct amdgpu_bo_va,
base.vm_status);
- spin_unlock(&vm->status_lock);
+ spin_unlock_irqrestore(&vm->status_lock, flags);
/* Per VM BOs never need to bo cleared in the page tables */
r = amdgpu_vm_bo_update(adev, bo_va, false);
if (r)
return r;
- spin_lock(&vm->status_lock);
+ spin_lock_irqsave(&vm->status_lock, flags);
}
while (!list_empty(&vm->invalidated)) {
bo_va = list_first_entry(&vm->invalidated, struct amdgpu_bo_va,
base.vm_status);
resv = bo_va->base.bo->tbo.base.resv;
- spin_unlock(&vm->status_lock);
+ spin_unlock_irqrestore(&vm->status_lock, flags);
/* Try to reserve the BO to avoid clearing its ptes */
if (!adev->debug_vm && dma_resv_trylock(resv)) {
@@ -1685,9 +1713,9 @@ int amdgpu_vm_handle_moved(struct amdgpu_device *adev,
bo_va->base.bo->tbo.resource->mem_type == TTM_PL_SYSTEM))
amdgpu_vm_bo_evicted_user(&bo_va->base);
- spin_lock(&vm->status_lock);
+ spin_lock_irqsave(&vm->status_lock, flags);
}
- spin_unlock(&vm->status_lock);
+ spin_unlock_irqrestore(&vm->status_lock, flags);
return 0;
}
@@ -2225,9 +2253,13 @@ void amdgpu_vm_bo_del(struct amdgpu_device *adev,
}
}
- spin_lock(&vm->status_lock);
- list_del(&bo_va->base.vm_status);
- spin_unlock(&vm->status_lock);
+ {
+ unsigned long flags;
+
+ spin_lock_irqsave(&vm->status_lock, flags);
+ list_del(&bo_va->base.vm_status);
+ spin_unlock_irqrestore(&vm->status_lock, flags);
+ }
list_for_each_entry_safe(mapping, next, &bo_va->valids, list) {
list_del(&mapping->list);
@@ -2334,11 +2366,12 @@ void amdgpu_vm_bo_move(struct amdgpu_bo *bo, struct
ttm_resource *new_mem,
for (bo_base = bo->vm_bo; bo_base; bo_base = bo_base->next) {
struct amdgpu_vm *vm = bo_base->vm;
+ unsigned long flags;
- spin_lock(&vm->status_lock);
+ spin_lock_irqsave(&vm->status_lock, flags);
amdgpu_vm_update_stats_locked(bo_base, bo->tbo.resource, -1);
amdgpu_vm_update_stats_locked(bo_base, new_mem, +1);
- spin_unlock(&vm->status_lock);
+ spin_unlock_irqrestore(&vm->status_lock, flags);
}
amdgpu_vm_bo_invalidate(bo, evicted);
@@ -3104,10 +3137,11 @@ void amdgpu_debugfs_vm_bo_info(struct amdgpu_vm *vm,
struct seq_file *m)
unsigned int total_invalidated_objs = 0;
unsigned int total_done_objs = 0;
unsigned int id = 0;
+ unsigned long flags;
amdgpu_vm_assert_locked(vm);
- spin_lock(&vm->status_lock);
+ spin_lock_irqsave(&vm->status_lock, flags);
seq_puts(m, "\tIdle BOs:\n");
list_for_each_entry_safe(bo_va, tmp, &vm->idle, base.vm_status) {
if (!bo_va->base.bo)
@@ -3159,7 +3193,7 @@ void amdgpu_debugfs_vm_bo_info(struct amdgpu_vm *vm,
struct seq_file *m)
continue;
total_done += amdgpu_bo_print_info(id++, bo_va->base.bo, m);
}
- spin_unlock(&vm->status_lock);
+ spin_unlock_irqrestore(&vm->status_lock, flags);
total_done_objs = id;
seq_printf(m, "\tTotal idle size: %12lld\tobjs:\t%d\n",
total_idle,
@@ -3260,9 +3294,27 @@ void amdgpu_sdma_set_vm_pte_scheds(struct amdgpu_device
*adev,
adev->vm_manager.vm_pte_funcs = vm_pte_funcs;
}
+/**
+ * amdgpu_vm_increment_process_counter - increment a process profiling counter
+ *
+ * @vm: the VM to update
+ * @stat_type: which counter to increment
+ *
+ * NOTE: This function is called from IRQ context in amdgpu_irq_dispatch(),
+ * so we MUST use spin_lock_irqsave/spin_unlock_irqrestore to prevent
+ * deadlock when an interrupt arrives while another context holds status_lock.
+ *
+ * The deadlock scenario without IRQ-safe locking:
+ * 1. Process context: amdgpu_vm_bo_del() acquires spin_lock(&vm->status_lock)
+ * 2. IRQ arrives on same CPU
+ * 3. IRQ handler: amdgpu_vm_increment_process_counter() tries to acquire
+ * spin_lock(&vm->status_lock) -> DEADLOCK
+ */
void amdgpu_vm_increment_process_counter(struct amdgpu_vm *vm, enum
amdgpu_process_stat_type stat_type)
{
- spin_lock(&vm->status_lock);
+ unsigned long flags;
+
+ spin_lock_irqsave(&vm->status_lock, flags);
switch (stat_type) {
case AMDGPU_VM_VMFAULT_COUNTER:
vm->process_stats.vmfault_counter++;
@@ -3282,5 +3334,5 @@ void amdgpu_vm_increment_process_counter(struct amdgpu_vm
*vm, enum amdgpu_proce
default:
pr_debug("unknown process stat type 0x%x\n", stat_type);
}
- spin_unlock(&vm->status_lock);
+ spin_unlock_irqrestore(&vm->status_lock, flags);
}
--
2.43.0