On Wed, Jun 03, 2026 at 02:56:17PM +0800, Honglei Huang wrote:
> From: Honglei Huang <[email protected]>
> 
> drm_gpusvm_pages is the layer that actually represents physical
> pages/mappings it owns the dma_addr array, the dma_iova_state...
> With the previous patch, so drm_gpusvm_pages is now strictly about
> physical pages and their DMA view.
> 
> Since now the drm_gpusvm_pages instance is inherently bound to one
> specific drm_device, make that ownership explicit by giving
> drm_gpusvm_pages its own drm_device handle, and drive all DMA through
> it instead of through the gpusvm:
> 
>   - Add drm to struct drm_gpusvm_pages and a matching drm parameter
>     to drm_gpusvm_get_pages(); the dma device is bound on first use
>     and immutable for the lifetime of the pages instance.
>   - Route all DMA in drm_gpusvm_get_pages() / __drm_gpusvm_unmap_pages()
>     through svm_pages->drm instead of gpusvm->drm.
>   - Update existing callers (drm_gpusvm_range_get_pages, xe userptr)
> 
> Suggested-by: Matthew Brost <[email protected]>
> Signed-off-by: Honglei Huang <[email protected]>
> ---
>  drivers/gpu/drm/drm_gpusvm.c    | 37 ++++++++++++++++++++++++---------
>  drivers/gpu/drm/xe/xe_userptr.c |  1 +
>  include/drm/drm_gpusvm.h        |  3 +++
>  3 files changed, 31 insertions(+), 10 deletions(-)
> 
> diff --git a/drivers/gpu/drm/drm_gpusvm.c b/drivers/gpu/drm/drm_gpusvm.c
> index 6000d587cf2..3f076178b2a 100644
> --- a/drivers/gpu/drm/drm_gpusvm.c
> +++ b/drivers/gpu/drm/drm_gpusvm.c
> @@ -1135,11 +1135,16 @@ static void __drm_gpusvm_unmap_pages(struct 
> drm_gpusvm *gpusvm,
>                                    unsigned long npages)
>  {
>       struct drm_pagemap *dpagemap = svm_pages->dpagemap;
> -     struct device *dev = gpusvm->drm->dev;
> +     struct device *dev;
>       unsigned long i, j;
>  
>       lockdep_assert_held(&gpusvm->notifier_lock);
>  
> +     if (WARN_ON_ONCE(!svm_pages->drm))

I think it is valid to reach this point without calling get_pages() and
assigning ->drm, so I don’t believe a WARN_ON is required. One example
would be creating a range, attempting to migrate it, and then failing
because the user performs a munmap() on part of the range, resulting in
the range being freed. It’s a weird race, but it’s possible, and I’m
fairly certain Xe SVM tests exercise scenarios like this.

So I would drop the WARN_ON, add a comment like “get_pages() never
called,” and bail out silently. Alternatively, if drm is NULL and
has_dma_mapping is set, then a WARN_ON might make sense, as that should
not be possible.

> +             return;
> +
> +     dev = svm_pages->drm->dev;
> +
>       if (svm_pages->flags.has_dma_mapping) {
>               struct drm_gpusvm_pages_flags flags = {
>                       .__flags = svm_pages->flags.__flags,
> @@ -1379,6 +1384,7 @@ static bool drm_gpusvm_pages_valid_unlocked(struct 
> drm_gpusvm *gpusvm,
>   * drm_gpusvm_get_pages() - Get pages and populate GPU SVM pages struct
>   * @gpusvm: Pointer to the GPU SVM structure
>   * @svm_pages: The SVM pages to populate. This will contain the dma-addresses
> + * @drm: The DRM device that will own the DMA mappings. Stored into 
> @svm_pages
>   * @mm: The mm corresponding to the CPU range
>   * @notifier: The corresponding notifier for the given CPU range
>   * @pages_start: Start CPU address for the pages
> @@ -1392,6 +1398,7 @@ static bool drm_gpusvm_pages_valid_unlocked(struct 
> drm_gpusvm *gpusvm,
>   */
>  int drm_gpusvm_get_pages(struct drm_gpusvm *gpusvm,
>                        struct drm_gpusvm_pages *svm_pages,
> +                      struct drm_device *drm,

You could also move drm into a function like drm_gpusvm_init_pages() (as
mentioned in the cover letter). I don’t have a strong preference, but if
we want a helper that calls hmm_range_fault() once and accepts an array
of drm_gpusvm_pages to DMA-map, that might make sense.

>                        struct mm_struct *mm,
>                        struct mmu_interval_notifier *notifier,
>                        unsigned long pages_start, unsigned long pages_end,
> @@ -1421,6 +1428,15 @@ int drm_gpusvm_get_pages(struct drm_gpusvm *gpusvm,
>                                                          DMA_BIDIRECTIONAL;
>       struct dma_iova_state *state = &svm_pages->state;
>  
> +     if (!drm)
> +             return -EINVAL;
> +     if (svm_pages->drm) {
> +             if (svm_pages->drm != drm)
> +                     return -EINVAL;
> +     } else {
> +             svm_pages->drm = drm;
> +     }

Style nit: If we keep this I'd write this like:

if (!drm || (svm_pages->drm && svm_pages->drm != drm))
        return -EINVAL;

svm_pages->drm = drm;

Matt

> +
>  retry:
>       if (time_after(jiffies, timeout))
>               return -EBUSY;
> @@ -1515,7 +1531,7 @@ int drm_gpusvm_get_pages(struct drm_gpusvm *gpusvm,
>  
>                               pagemap = page_pgmap(page);
>                               dpagemap = drm_pagemap_page_to_dpagemap(page);
> -                             if (drm_WARN_ON(gpusvm->drm, !dpagemap)) {
> +                             if (drm_WARN_ON(drm, !dpagemap)) {
>                                       /*
>                                        * Raced. This is not supposed to happen
>                                        * since hmm_range_fault() should've 
> migrated
> @@ -1527,10 +1543,10 @@ int drm_gpusvm_get_pages(struct drm_gpusvm *gpusvm,
>                       }
>                       svm_pages->dma_addr[j] =
>                               dpagemap->ops->device_map(dpagemap,
> -                                                       gpusvm->drm->dev,
> +                                                       drm->dev,
>                                                         page, order,
>                                                         dma_dir);
> -                     if (dma_mapping_error(gpusvm->drm->dev,
> +                     if (dma_mapping_error(drm->dev,
>                                             svm_pages->dma_addr[j].addr)) {
>                               err = -EFAULT;
>                               goto err_unmap;
> @@ -1550,11 +1566,11 @@ int drm_gpusvm_get_pages(struct drm_gpusvm *gpusvm,
>                       }
>  
>                       if (!i)
> -                             dma_iova_try_alloc(gpusvm->drm->dev, state,
> +                             dma_iova_try_alloc(drm->dev, state,
>                                                  0, npages * PAGE_SIZE);
>  
>                       if (dma_use_iova(state)) {
> -                             err = dma_iova_link(gpusvm->drm->dev, state,
> +                             err = dma_iova_link(drm->dev, state,
>                                                   hmm_pfn_to_phys(pfns[i]),
>                                                   svm_pages->state_offset,
>                                                   PAGE_SIZE << order,
> @@ -1565,11 +1581,11 @@ int drm_gpusvm_get_pages(struct drm_gpusvm *gpusvm,
>                               addr = state->addr + svm_pages->state_offset;
>                               svm_pages->state_offset += PAGE_SIZE << order;
>                       } else {
> -                             addr = dma_map_page(gpusvm->drm->dev,
> +                             addr = dma_map_page(drm->dev,
>                                                   page, 0,
>                                                   PAGE_SIZE << order,
>                                                   dma_dir);
> -                             if (dma_mapping_error(gpusvm->drm->dev, addr)) {
> +                             if (dma_mapping_error(drm->dev, addr)) {
>                                       err = -EFAULT;
>                                       goto err_unmap;
>                               }
> @@ -1585,7 +1601,7 @@ int drm_gpusvm_get_pages(struct drm_gpusvm *gpusvm,
>       }
>  
>       if (dma_use_iova(state)) {
> -             err = dma_iova_sync(gpusvm->drm->dev, state, 0,
> +             err = dma_iova_sync(drm->dev, state, 0,
>                                   svm_pages->state_offset);
>               if (err)
>                       goto err_unmap;
> @@ -1635,7 +1651,8 @@ int drm_gpusvm_range_get_pages(struct drm_gpusvm 
> *gpusvm,
>                              struct drm_gpusvm_range *range,
>                              const struct drm_gpusvm_ctx *ctx)
>  {
> -     return drm_gpusvm_get_pages(gpusvm, &range->pages, gpusvm->mm,
> +     return drm_gpusvm_get_pages(gpusvm, &range->pages, gpusvm->drm,
> +                                 gpusvm->mm,
>                                   &range->notifier->notifier,
>                                   drm_gpusvm_range_start(range),
>                                   drm_gpusvm_range_end(range), ctx);
> diff --git a/drivers/gpu/drm/xe/xe_userptr.c b/drivers/gpu/drm/xe/xe_userptr.c
> index 6761005c0b9..7e28f6868ff 100644
> --- a/drivers/gpu/drm/xe/xe_userptr.c
> +++ b/drivers/gpu/drm/xe/xe_userptr.c
> @@ -75,6 +75,7 @@ int xe_vma_userptr_pin_pages(struct xe_userptr_vma *uvma)
>               return 0;
>  
>       return drm_gpusvm_get_pages(&vm->svm.gpusvm, &uvma->userptr.pages,
> +                                 &xe->drm,
>                                   uvma->userptr.notifier.mm,
>                                   &uvma->userptr.notifier,
>                                   xe_vma_userptr(vma),
> diff --git a/include/drm/drm_gpusvm.h b/include/drm/drm_gpusvm.h
> index 3dba4b9516f..ed228d9ff6b 100644
> --- a/include/drm/drm_gpusvm.h
> +++ b/include/drm/drm_gpusvm.h
> @@ -127,6 +127,7 @@ struct drm_gpusvm_pages_flags {
>  /**
>   * struct drm_gpusvm_pages - Structure representing a GPU SVM mapped pages
>   *
> + * @drm: The DRM device that owns the dma mappings
>   * @dma_addr: Device address array
>   * @dpagemap: The struct drm_pagemap of the device pages we're dma-mapping.
>   *            Note this is assuming only one drm_pagemap per range is 
> allowed.
> @@ -136,6 +137,7 @@ struct drm_gpusvm_pages_flags {
>   * @flags: Flags for the range; see &struct drm_gpusvm_pages_flags
>   */
>  struct drm_gpusvm_pages {
> +     struct drm_device *drm;
>       struct drm_pagemap_addr *dma_addr;
>       struct drm_pagemap *dpagemap;
>       struct dma_iova_state state;
> @@ -328,6 +330,7 @@ void drm_gpusvm_range_set_unmapped(struct 
> drm_gpusvm_range *range,
>  
>  int drm_gpusvm_get_pages(struct drm_gpusvm *gpusvm,
>                        struct drm_gpusvm_pages *svm_pages,
> +                      struct drm_device *drm,
>                        struct mm_struct *mm,
>                        struct mmu_interval_notifier *notifier,
>                        unsigned long pages_start, unsigned long pages_end,
> -- 
> 2.34.1
> 

Reply via email to