When the cgroup's memory usage is below the low/min limit and allocation
fails, try evicting some unprotected buffers to make space. Otherwise,
if other applications filled VRAM with their allocations first,
application buffers may be forced into GTT even though the cgroup's
usage is below the corresponding low/min limit.

Signed-off-by: Natalie Vock <[email protected]>
---
 drivers/gpu/drm/ttm/ttm_bo.c | 52 +++++++++++++++++++++++++++++++++++++++-----
 1 file changed, 47 insertions(+), 5 deletions(-)

diff --git a/drivers/gpu/drm/ttm/ttm_bo.c b/drivers/gpu/drm/ttm/ttm_bo.c
index a8914d20b0c32..401a6846b470f 100644
--- a/drivers/gpu/drm/ttm/ttm_bo.c
+++ b/drivers/gpu/drm/ttm/ttm_bo.c
@@ -494,6 +494,10 @@ struct ttm_bo_alloc_state {
        struct dmem_cgroup_pool_state *charge_pool;
        /** @limit_pool: Which pool limit we should test against */
        struct dmem_cgroup_pool_state *limit_pool;
+       /** @only_evict_unprotected: If only unprotected BOs, i.e. BOs whose cgroup
+        *  is exceeding its dmem low/min protection, should be considered for eviction
+        */
+       bool only_evict_unprotected;
 };
 
 /**
@@ -590,8 +594,12 @@ static int ttm_bo_evict_alloc(struct ttm_device *bdev,
        evict_walk.walk.arg.trylock_only = true;
        lret = ttm_lru_walk_for_evict(&evict_walk.walk, bdev, man, 1);
 
-       /* One more attempt if we hit low limit? */
-       if (!lret && evict_walk.hit_low) {
+       /* If we failed to find enough BOs to evict, but we skipped over
+        * some BOs because they were covered by dmem low protection, retry
+        * evicting these protected BOs too, except if we're told not to
+        * consider protected BOs at all.
+        */
+       if (!lret && evict_walk.hit_low && !state->only_evict_unprotected) {
                evict_walk.try_low = true;
                lret = ttm_lru_walk_for_evict(&evict_walk.walk, bdev, man, 1);
        }
@@ -612,7 +620,8 @@ static int ttm_bo_evict_alloc(struct ttm_device *bdev,
        } while (!lret && evict_walk.evicted);
 
        /* We hit the low limit? Try once more */
-       if (!lret && evict_walk.hit_low && !evict_walk.try_low) {
+       if (!lret && evict_walk.hit_low && !evict_walk.try_low &&
+                       !state->only_evict_unprotected) {
                evict_walk.try_low = true;
                goto retry;
        }
@@ -722,7 +731,7 @@ static int ttm_bo_alloc_at_place(struct ttm_buffer_object *bo,
                                 struct ttm_resource **res,
                                 struct ttm_bo_alloc_state *alloc_state)
 {
-       bool may_evict;
+       bool may_evict, below_low = false;
        int ret;
 
        may_evict = (force_space && place->mem_type != TTM_PL_SYSTEM);
@@ -741,10 +750,43 @@ static int ttm_bo_alloc_at_place(struct ttm_buffer_object *bo,
                return ret;
        }
 
+       /*
+        * cgroup protection plays a special role in eviction.
+        * Conceptually, protection of memory via the dmem cgroup controller
+        * entitles the protected cgroup to use a certain amount of memory.
+        * There are two types of protection - the 'low' limit is a
+        * "best-effort" protection, whereas the 'min' limit provides a hard
+        * guarantee that memory within the cgroup's allowance will not be
+        * evicted under any circumstance.
+        *
+        * To faithfully model this concept in TTM, we also need to take cgroup
+        * protection into account when allocating. When allocation in one
+        * place fails, TTM will default to trying other places first before
+        * evicting.
+        * If the allocation is covered by dmem cgroup protection, however,
+        * this prevents the allocation from using the memory it is "entitled"
+        * to. To make sure unprotected allocations cannot push new protected
+        * allocations out of places they are "entitled" to use, we should
+        * evict buffers not covered by any cgroup protection, if this
+        * allocation is covered by cgroup protection.
+        *
+        * Buffers covered by 'min' protection are a special case - the 'min'
+        * limit is a stronger guarantee than 'low', and thus buffers protected
+        * by 'low' but not 'min' should also be considered for eviction.
+        * Buffers protected by 'min' will never be considered for eviction
+        * anyway, so the regular eviction path should be triggered here.
+        * Buffers protected by 'low' but not 'min' will take a special
+        * eviction path that only evicts buffers covered by neither 'low' nor
+        * 'min' protections.
+        */
+       may_evict |= dmem_cgroup_below_min(NULL, alloc_state->charge_pool);
+       below_low = dmem_cgroup_below_low(NULL, alloc_state->charge_pool);
+       alloc_state->only_evict_unprotected = !may_evict && below_low;
+
        ret = ttm_resource_alloc(bo, place, res, alloc_state->charge_pool);
 
        if (ret) {
-               if (ret == -ENOSPC && may_evict)
+               if (ret == -ENOSPC && (may_evict || below_low))
                        ret = -EBUSY;
                return ret;
        }

-- 
2.53.0

Reply via email to