Jerome Glisse wrote:
> On fault the driver is given the opportunity to perform any operation
> it sees fit in order to place the buffer into a CPU visible area of
> memory. This patch doesn't break TTM users, nouveau, vmwgfx and radeon
> should keep working properly. Future patch will take advantage of this
> infrastructure and remove the old path from TTM once driver are
> converted.
>
> V2 return VM_FAULT_NOPAGE if callback return -EBUSY or -ERESTARTSYS
>
> Signed-off-by: Jerome Glisse <jgli...@redhat.com>
>   


Jerome, See inline comments below and


1) Please make sure the patch passes checkpatch.pl without warnings or 
errors before submitting. This patch has 14 warnings.
2) There are a number of line spacing changes (empty newline changes) 
and line break changes. Please remove them from the patch.



> ---
>  drivers/gpu/drm/ttm/ttm_bo.c      |    3 +-
>  drivers/gpu/drm/ttm/ttm_bo_util.c |   92 
> +++++++++++++++++--------------------
>  drivers/gpu/drm/ttm/ttm_bo_vm.c   |   56 ++++++++++++----------
>  include/drm/ttm/ttm_bo_api.h      |    1 +
>  include/drm/ttm/ttm_bo_driver.h   |   30 ++++++++++++
>  5 files changed, 105 insertions(+), 77 deletions(-)
>
> diff --git a/drivers/gpu/drm/ttm/ttm_bo.c b/drivers/gpu/drm/ttm/ttm_bo.c
> index c7320ce..28f3fcf 100644
> --- a/drivers/gpu/drm/ttm/ttm_bo.c
> +++ b/drivers/gpu/drm/ttm/ttm_bo.c
> @@ -1581,7 +1581,8 @@ void ttm_bo_unmap_virtual(struct ttm_buffer_object *bo)
>  
>       if (!bdev->dev_mapping)
>               return;
> -
> +     if (bdev->driver->io_mem_free)
> +             bdev->driver->io_mem_free(bdev, &bo->mem);
>       unmap_mapping_range(bdev->dev_mapping, offset, holelen, 1);
>  }
>   

The user-space mappings must be taken down *before* the IO space is 
released, but please also see at the bottom for a design change for this.


>  EXPORT_SYMBOL(ttm_bo_unmap_virtual);
> diff --git a/drivers/gpu/drm/ttm/ttm_bo_util.c 
> b/drivers/gpu/drm/ttm/ttm_bo_util.c
> index 3f72fe1..10c5fc6 100644
> --- a/drivers/gpu/drm/ttm/ttm_bo_util.c
> +++ b/drivers/gpu/drm/ttm/ttm_bo_util.c
> @@ -84,26 +84,36 @@ int ttm_mem_reg_ioremap(struct ttm_bo_device *bdev, 
> struct ttm_mem_reg *mem,
>                       void **virtual)
>  {
>       struct ttm_mem_type_manager *man = &bdev->man[mem->mem_type];
> -     unsigned long bus_offset;
> -     unsigned long bus_size;
> -     unsigned long bus_base;
> +     struct ttm_bus_placement pl;
>       int ret;
>       void *addr;
>  
>       *virtual = NULL;
> -     ret = ttm_bo_pci_offset(bdev, mem, &bus_base, &bus_offset, &bus_size);
> -     if (ret || bus_size == 0)
> -             return ret;
> +     if (bdev->driver->io_mem_reserve) {
> +             ret = bdev->driver->io_mem_reserve(bdev, mem, &pl);
> +             if (unlikely(ret != 0)) {
> +                     return ret;
> +             }
> +     } else {
> +             ret = ttm_bo_pci_offset(bdev, mem, &pl.base, &pl.offset, 
> &pl.size);
> +             if (unlikely(ret != 0) || pl.size == 0) {
> +                     return ret;
> +             }
>   
> +             pl.is_iomem = (pl.size != 0);
>   

I fail to see how pl.size can be == 0 here?

> +     }
>  
>       if (!(man->flags & TTM_MEMTYPE_FLAG_NEEDS_IOREMAP))
> -             addr = (void *)(((u8 *) man->io_addr) + bus_offset);
> +             addr = (void *)(pl.base + pl.offset);
>   

This is incorrect. man->io_addr is the virtual kernel address of an 
existing iomap covering the whole aperture, if the driver has choosen to 
set up one. This is not practical on 32-bit systems, due to the limited 
vmalloc / ioremap space but may well be on 64-bit system.

>       else {
>               if (mem->placement & TTM_PL_FLAG_WC)
> -                     addr = ioremap_wc(bus_base + bus_offset, bus_size);
> +                     addr = ioremap_wc(pl.base + pl.offset, pl.size);
>               else
> -                     addr = ioremap_nocache(bus_base + bus_offset, bus_size);
> -             if (!addr)
> +                     addr = ioremap_nocache(pl.base + pl.offset, pl.size);
> +             if (!addr) {
> +                     if (bdev->driver->io_mem_free)
> +                             bdev->driver->io_mem_free(bdev, mem);
>                       return -ENOMEM;
> +             }
>       }
>       *virtual = addr;
>       return 0;
> @@ -118,6 +128,8 @@ void ttm_mem_reg_iounmap(struct ttm_bo_device *bdev, 
> struct ttm_mem_reg *mem,
>  
>       if (virtual && (man->flags & TTM_MEMTYPE_FLAG_NEEDS_IOREMAP))
>               iounmap(virtual);
> +     if (bdev->driver->io_mem_free)
> +             bdev->driver->io_mem_free(bdev, mem);
>  }
>  
>  static int ttm_copy_io_page(void *dst, void *src, unsigned long page)
> @@ -440,13 +452,12 @@ int ttm_bo_kmap(struct ttm_buffer_object *bo,
>               unsigned long start_page, unsigned long num_pages,
>               struct ttm_bo_kmap_obj *map)
>  {
> +     struct ttm_bus_placement pl;
>       int ret;
> -     unsigned long bus_base;
> -     unsigned long bus_offset;
> -     unsigned long bus_size;
>  
>       BUG_ON(!list_empty(&bo->swap));
>       map->virtual = NULL;
> +     map->bo = bo;
>       if (num_pages > bo->num_pages)
>               return -EINVAL;
>       if (start_page > bo->num_pages)
> @@ -455,16 +466,24 @@ int ttm_bo_kmap(struct ttm_buffer_object *bo,
>       if (num_pages > 1 && !DRM_SUSER(DRM_CURPROC))
>               return -EPERM;
>  #endif
> -     ret = ttm_bo_pci_offset(bo->bdev, &bo->mem, &bus_base,
> -                             &bus_offset, &bus_size);
> -     if (ret)
> -             return ret;
> -     if (bus_size == 0) {
> +     if (bo->bdev->driver->io_mem_reserve) {
> +             ret = bo->bdev->driver->io_mem_reserve(bo->bdev, &bo->mem, &pl);
> +             if (unlikely(ret != 0)) {
> +                     return ret;
> +             }
> +     } else {
> +             ret = ttm_bo_pci_offset(bo->bdev, &bo->mem, &pl.base, 
> &pl.offset, &pl.size);
> +             if (unlikely(ret != 0)) {
> +                     return ret;
> +             }
> +             pl.is_iomem = (pl.size != 0);
> +     }
> +     if (!pl.is_iomem) {
>               return ttm_bo_kmap_ttm(bo, start_page, num_pages, map);
>       } else {
> -             bus_offset += start_page << PAGE_SHIFT;
> -             bus_size = num_pages << PAGE_SHIFT;
> -             return ttm_bo_ioremap(bo, bus_base, bus_offset, bus_size, map);
> +             pl.offset += start_page << PAGE_SHIFT;
> +             pl.size = num_pages << PAGE_SHIFT;
> +             return ttm_bo_ioremap(bo, pl.base, pl.offset, pl.size, map);
>       }
>  }
>  EXPORT_SYMBOL(ttm_bo_kmap);
> @@ -476,6 +495,8 @@ void ttm_bo_kunmap(struct ttm_bo_kmap_obj *map)
>       switch (map->bo_kmap_type) {
>       case ttm_bo_map_iomap:
>               iounmap(map->virtual);
> +             if (map->bo->bdev->driver->io_mem_free)
> +                     map->bo->bdev->driver->io_mem_free(map->bo->bdev, 
> &map->bo->mem);
>   

Hmm.
What will happen if, say 10 multiple threads ttm_bo_kmap() and 
ttm_bo_kunmap() a single NO_EVICT bo racing with eachother? If I don't 
misunderstand things, that would cause a considerable mess?


>               break;
>       case ttm_bo_map_vmap:
>               vunmap(map->virtual);
> @@ -493,35 +514,6 @@ void ttm_bo_kunmap(struct ttm_bo_kmap_obj *map)
>  }
>  EXPORT_SYMBOL(ttm_bo_kunmap);
>   



>  
> -int ttm_bo_pfn_prot(struct ttm_buffer_object *bo,
> -                 unsigned long dst_offset,
> -                 unsigned long *pfn, pgprot_t *prot)
> -{
> -     struct ttm_mem_reg *mem = &bo->mem;
> -     struct ttm_bo_device *bdev = bo->bdev;
> -     unsigned long bus_offset;
> -     unsigned long bus_size;
> -     unsigned long bus_base;
> -     int ret;
> -     ret = ttm_bo_pci_offset(bdev, mem, &bus_base, &bus_offset,
> -                     &bus_size);
> -     if (ret)
> -             return -EINVAL;
> -     if (bus_size != 0)
> -             *pfn = (bus_base + bus_offset + dst_offset) >> PAGE_SHIFT;
> -     else
> -             if (!bo->ttm)
> -                     return -EINVAL;
> -             else
> -                     *pfn = page_to_pfn(ttm_tt_get_page(bo->ttm,
> -                                                        dst_offset >>
> -                                                        PAGE_SHIFT));
> -     *prot = (mem->placement & TTM_PL_FLAG_CACHED) ?
> -             PAGE_KERNEL : ttm_io_prot(mem->placement, PAGE_KERNEL);
> -
> -     return 0;
> -}
> -
>  int ttm_bo_move_accel_cleanup(struct ttm_buffer_object *bo,
>                             void *sync_obj,
>                             void *sync_obj_arg,
> diff --git a/drivers/gpu/drm/ttm/ttm_bo_vm.c b/drivers/gpu/drm/ttm/ttm_bo_vm.c
> index 668dbe8..fe4ac95 100644
> --- a/drivers/gpu/drm/ttm/ttm_bo_vm.c
> +++ b/drivers/gpu/drm/ttm/ttm_bo_vm.c
> @@ -74,9 +74,7 @@ static int ttm_bo_vm_fault(struct vm_area_struct *vma, 
> struct vm_fault *vmf)
>       struct ttm_buffer_object *bo = (struct ttm_buffer_object *)
>           vma->vm_private_data;
>       struct ttm_bo_device *bdev = bo->bdev;
> -     unsigned long bus_base;
> -     unsigned long bus_offset;
> -     unsigned long bus_size;
> +     struct ttm_bus_placement pl;
>       unsigned long page_offset;
>       unsigned long page_last;
>       unsigned long pfn;
> @@ -84,7 +82,6 @@ static int ttm_bo_vm_fault(struct vm_area_struct *vma, 
> struct vm_fault *vmf)
>       struct page *page;
>       int ret;
>       int i;
> -     bool is_iomem;
>       unsigned long address = (unsigned long)vmf->virtual_address;
>       int retval = VM_FAULT_NOPAGE;
>  
> @@ -104,11 +101,33 @@ static int ttm_bo_vm_fault(struct vm_area_struct *vma, 
> struct vm_fault *vmf)
>       if (bdev->driver->fault_reserve_notify)
>               bdev->driver->fault_reserve_notify(bo);
>  
> +     if (bdev->driver->fault_reserve) {
> +             ret = bdev->driver->fault_reserve(bo, &pl);
> +             switch (ret) {
> +             case 0:
> +                     break;
> +             case -EBUSY:
> +                     set_need_resched();
> +             case -ERESTARTSYS:
> +                     retval = VM_FAULT_NOPAGE;
> +                     goto out_unlock;
> +             default:
> +                     retval = VM_FAULT_SIGBUS;
> +                     goto out_unlock;
> +             }
> +     } else {
> +             ret = ttm_bo_pci_offset(bdev, &bo->mem, &pl.base, &pl.offset, 
> &pl.size);
> +             if (unlikely(ret != 0)) {
> +                     retval = VM_FAULT_SIGBUS;
> +                     goto out_unlock;
> +             }
> +             pl.is_iomem = (pl.size != 0);
> +     }
> +
>       /*
>        * Wait for buffer data in transit, due to a pipelined
>        * move.
>        */
> -
>   

>       spin_lock(&bo->lock);
>       if (test_bit(TTM_BO_PRIV_FLAG_MOVING, &bo->priv_flags)) {
>               ret = ttm_bo_wait(bo, false, true, false);
> @@ -122,20 +141,10 @@ static int ttm_bo_vm_fault(struct vm_area_struct *vma, 
> struct vm_fault *vmf)
>               spin_unlock(&bo->lock);
>  
>  
> -     ret = ttm_bo_pci_offset(bdev, &bo->mem, &bus_base, &bus_offset,
> -                             &bus_size);
> -     if (unlikely(ret != 0)) {
> -             retval = VM_FAULT_SIGBUS;
> -             goto out_unlock;
> -     }
> -
> -     is_iomem = (bus_size != 0);
> -
>       page_offset = ((address - vma->vm_start) >> PAGE_SHIFT) +
>           bo->vm_node->start - vma->vm_pgoff;
>       page_last = ((vma->vm_end - vma->vm_start) >> PAGE_SHIFT) +
>           bo->vm_node->start - vma->vm_pgoff;
> -
>   

>       if (unlikely(page_offset >= bo->num_pages)) {
>               retval = VM_FAULT_SIGBUS;
>               goto out_unlock;
> @@ -154,8 +163,7 @@ static int ttm_bo_vm_fault(struct vm_area_struct *vma, 
> struct vm_fault *vmf)
>        * vma->vm_page_prot when the object changes caching policy, with
>        * the correct locks held.
>        */
> -
> -     if (is_iomem) {
> +     if (pl.is_iomem) {
>               vma->vm_page_prot = ttm_io_prot(bo->mem.placement,
>                                               vma->vm_page_prot);
>   

>       } else {
> @@ -169,12 +177,9 @@ static int ttm_bo_vm_fault(struct vm_area_struct *vma, 
> struct vm_fault *vmf)
>        * Speculatively prefault a number of pages. Only error on
>        * first page.
>        */
> -
>       for (i = 0; i < TTM_BO_VM_NUM_PREFAULT; ++i) {
> -
>   

> -             if (is_iomem)
> -                     pfn = ((bus_base + bus_offset) >> PAGE_SHIFT) +
> -                         page_offset;
> +             if (pl.is_iomem)
> +                     pfn = ((pl.base + pl.offset) >> PAGE_SHIFT) + 
> page_offset;
>               else {
>                       page = ttm_tt_get_page(ttm, page_offset);
>                       if (unlikely(!page && i == 0)) {
> @@ -191,14 +196,12 @@ static int ttm_bo_vm_fault(struct vm_area_struct *vma, 
> struct vm_fault *vmf)
>                * Somebody beat us to this PTE or prefaulting to
>                * an already populated PTE, or prefaulting error.
>                */
> -
>   

>               if (unlikely((ret == -EBUSY) || (ret != 0 && i > 0)))
>                       break;
>               else if (unlikely(ret != 0)) {
>                       retval =
>                           (ret == -ENOMEM) ? VM_FAULT_OOM : VM_FAULT_SIGBUS;
>                       goto out_unlock;
> -
>   

>               }
>  
>               address += PAGE_SIZE;
> @@ -221,9 +224,10 @@ static void ttm_bo_vm_open(struct vm_area_struct *vma)
>  
>  static void ttm_bo_vm_close(struct vm_area_struct *vma)
>  {
> -     struct ttm_buffer_object *bo =
> -         (struct ttm_buffer_object *)vma->vm_private_data;
> +     struct ttm_buffer_object *bo = (struct ttm_buffer_object 
> *)vma->vm_private_data
>   

>  
> +     if (bo->bdev->driver->io_mem_free)
> +             bo->bdev->driver->io_mem_free(bo->bdev, &bo->mem);
>   

Ugh. This doesn't work. A single bo may have any number of VMAs open. 
Closing one of them should not remove the bo from mappable state. Only 
the last vm_close should. If needed, call ttm_bo_unmap_virtual just 
before the bo's vm_node is freed in ttm_bo_release(), or refcount VMAs 
on the bo. See additional comments below.

>       ttm_bo_unref(&bo);
>       vma->vm_private_data = NULL;
>  }
> diff --git a/include/drm/ttm/ttm_bo_api.h b/include/drm/ttm/ttm_bo_api.h
> index 81eb9f4..1b38c67 100644
> --- a/include/drm/ttm/ttm_bo_api.h
> +++ b/include/drm/ttm/ttm_bo_api.h
> @@ -274,6 +274,7 @@ struct ttm_bo_kmap_obj {
>               ttm_bo_map_kmap         = 3,
>               ttm_bo_map_premapped    = 4 | TTM_BO_MAP_IOMEM_MASK,
>       } bo_kmap_type;
> +     struct ttm_buffer_object *bo;
>  };
>  
>  /**
> diff --git a/include/drm/ttm/ttm_bo_driver.h b/include/drm/ttm/ttm_bo_driver.h
> index 4c4e0f8..923fecf 100644
> --- a/include/drm/ttm/ttm_bo_driver.h
> +++ b/include/drm/ttm/ttm_bo_driver.h
> @@ -240,6 +240,23 @@ struct ttm_mem_type_manager {
>  };
>  
>  /**
> + * struct ttm_bus_placement
> + *
> + * @base:            bus base address
> + * @is_iomem:                is this io memory ?
> + * @size:            size in byte
> + * @offset:          offset from the base address
> + *
> + * Structure indicating the bus placement of an object.
> + */
> +struct ttm_bus_placement {
> +     unsigned long   base;
> +     unsigned long   size;
> +     unsigned long   offset;
> +     bool            is_iomem;
> +};
> +
> +/**
>   * struct ttm_bo_driver
>   *
>   * @create_ttm_backend_entry: Callback to create a struct ttm_backend.
> @@ -358,6 +375,19 @@ struct ttm_bo_driver {
>        * notify the driver that we're about to swap out this bo
>        */
>       void (*swap_notify) (struct ttm_buffer_object *bo);
> +
> +     /**
> +      * Driver callback on bo fault, driver is responsible to fill the
> +      * bus placement and has the opportunity to move the buffer into
> +      * visible space.
> +      */
> +     int (*fault_reserve)(struct ttm_buffer_object *bo, struct 
> ttm_bus_placement *pl);
> +     /**
> +      * Driver callback on when mapping io memory (for bo_move_memcpy for 
> instance).
> +      * TTM will take care to call io_mem_free whenever the mapping is not 
> use anymore.
> +      */
> +     int (*io_mem_reserve)(struct ttm_bo_device *bdev, struct ttm_mem_reg 
> *mem, struct ttm_bus_placement *pl);
> +     void (*io_mem_free)(struct ttm_bo_device *bdev, struct ttm_mem_reg 
> *mem);
>  };
>  
>  /**
>   

Some additional comments:

I think io_mem_reserve() and io_mem_free() should carry out the 
equivalent of 'pin_mappable' and 'unpin_mappable' and additionally 
refcounted to avoid different processes racing. To make this consistent 
with the rest of TTM one would need to impose the restriction that these 
functions must be called only if the bo is in the reserved state or if 
it's pinned with NO_EVICT. That would mean that each struct ttm_mem_reg 
or whatever struct is passed to these functions would need to carry 
driver-specific info that can hold relevant refcounts and perhaps other 
information. Each io_mem_reserve() must be paired with exactly one 
io_mem_free().

Furthermore, For fault_reserve(), the only thing we need to guarantee is 
that the bo is mappable while there are user-space mappings to the bo. 
We can't pair fault_reserve() with io_mem_free() which is currently 
done. Instead we need a fault_unreserve() which should be called from 
ttm_bo_unmap_virtual().

That means also that any 'mappable space manager' that evicts a bo from 
mappable state needs to reserve the bo to be evicted with the no_wait 
flag set, and then call ttm_bo_unmap_virtual() on it. If the 'mappable 
space manager' is just a separate part of a TTM memory region, that's 
already taken care of.

Thanks,
Thomas


------------------------------------------------------------------------------
Download Intel&#174; Parallel Studio Eval
Try the new software tools for yourself. Speed compiling, find bugs
proactively, and fine-tune applications for parallel performance.
See why Intel Parallel Studio got high marks during beta.
http://p.sf.net/sfu/intel-sw-dev
--
_______________________________________________
Dri-devel mailing list
Dri-devel@lists.sourceforge.net
https://lists.sourceforge.net/lists/listinfo/dri-devel

Reply via email to