On Fri, Aug 09, 2019 at 05:18:31PM -0700, John Hubbard wrote:
> On 8/9/19 3:58 PM, ira.we...@intel.com wrote:
> > From: Ira Weiny <ira.we...@intel.com>
> > 
> > In preparation for passing more information (vaddr_pin) into
> > follow_page_pte(), follow_devmap_pud(), and follow_devmap_pmd().
> > 
> > Signed-off-by: Ira Weiny <ira.we...@intel.com>

[snip]

> > @@ -786,7 +782,8 @@ static int check_vma_flags(struct vm_area_struct *vma, unsigned long gup_flags)
> >  static long __get_user_pages(struct task_struct *tsk, struct mm_struct *mm,
> >             unsigned long start, unsigned long nr_pages,
> >             unsigned int gup_flags, struct page **pages,
> > -           struct vm_area_struct **vmas, int *nonblocking)
> > +           struct vm_area_struct **vmas, int *nonblocking,
> > +           struct vaddr_pin *vaddr_pin)
> 
> I didn't expect to see more vaddr_pin arg passing, based on the commit
> description. Did you want this as part of patch 9 or 10 instead? If not,
> then let's mention it in the commit description.

Yeah, that does seem out of place now that I look at it.  I'll update the
commit message, because this patch really does two things: it gets vaddr_pin
into the context _and_ passes it down the call stack.  With all the rebasing
I may have squashed something I did not mean to.  But I think the patch is
still OK as one piece, because it is not too complicated to see what is going
on.
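
For reference, here is the shape of the change (a condensed sketch, not the
literal hunks): vaddr_pin becomes a member of follow_page_context and a new
trailing argument to __get_user_pages(), which stashes it in the context so
the lower-level follow_page_*() helpers can reach it:

        struct follow_page_context {
                struct dev_pagemap *pgmap;
                unsigned int page_mask;
                struct vaddr_pin *vaddr_pin;    /* new member */
        };

        static long __get_user_pages(struct task_struct *tsk,
                        struct mm_struct *mm, unsigned long start,
                        unsigned long nr_pages, unsigned int gup_flags,
                        struct page **pages, struct vm_area_struct **vmas,
                        int *nonblocking, struct vaddr_pin *vaddr_pin)
        {
                struct follow_page_context ctx = { NULL };
                ...
                ctx.vaddr_pin = vaddr_pin;      /* visible down the stack */
                ...
        }

Callers that have no pin to track just pass NULL, as populate_vma_page_range()
and get_dump_page() do in the hunks below.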

Thanks,
Ira

> 
> >  {
> >     long ret = 0, i = 0;
> >     struct vm_area_struct *vma = NULL;
> > @@ -797,6 +794,8 @@ static long __get_user_pages(struct task_struct *tsk, struct mm_struct *mm,
> >  
> >     VM_BUG_ON(!!pages != !!(gup_flags & FOLL_GET));
> >  
> > +   ctx.vaddr_pin = vaddr_pin;
> > +
> >     /*
> >      * If FOLL_FORCE is set then do not force a full fault as the hinting
> >      * fault information is unrelated to the reference behaviour of a task
> > @@ -1025,7 +1024,7 @@ static __always_inline long __get_user_pages_locked(struct task_struct *tsk,
> >     lock_dropped = false;
> >     for (;;) {
> >             ret = __get_user_pages(tsk, mm, start, nr_pages, flags, pages,
> > -                                  vmas, locked);
> > +                                  vmas, locked, vaddr_pin);
> >             if (!locked)
> >                     /* VM_FAULT_RETRY couldn't trigger, bypass */
> >                     return ret;
> > @@ -1068,7 +1067,7 @@ static __always_inline long __get_user_pages_locked(struct task_struct *tsk,
> >             lock_dropped = true;
> >             down_read(&mm->mmap_sem);
> >             ret = __get_user_pages(tsk, mm, start, 1, flags | FOLL_TRIED,
> > -                                  pages, NULL, NULL);
> > +                                  pages, NULL, NULL, vaddr_pin);
> >             if (ret != 1) {
> >                     BUG_ON(ret > 1);
> >                     if (!pages_done)
> > @@ -1226,7 +1225,7 @@ long populate_vma_page_range(struct vm_area_struct *vma,
> >      * not result in a stack expansion that recurses back here.
> >      */
> >     return __get_user_pages(current, mm, start, nr_pages, gup_flags,
> > -                           NULL, NULL, nonblocking);
> > +                           NULL, NULL, nonblocking, NULL);
> >  }
> >  
> >  /*
> > @@ -1311,7 +1310,7 @@ struct page *get_dump_page(unsigned long addr)
> >  
> >     if (__get_user_pages(current, current->mm, addr, 1,
> >                          FOLL_FORCE | FOLL_DUMP | FOLL_GET, &page, &vma,
> > -                        NULL) < 1)
> > +                        NULL, NULL) < 1)
> >             return NULL;
> >     flush_cache_page(vma, addr, page_to_pfn(page));
> >     return page;
> > diff --git a/mm/huge_memory.c b/mm/huge_memory.c
> > index bc1a07a55be1..7e09f2f17ed8 100644
> > --- a/mm/huge_memory.c
> > +++ b/mm/huge_memory.c
> > @@ -916,8 +916,9 @@ static void touch_pmd(struct vm_area_struct *vma, unsigned long addr,
> >  }
> >  
> >  struct page *follow_devmap_pmd(struct vm_area_struct *vma, unsigned long addr,
> > -           pmd_t *pmd, int flags, struct dev_pagemap **pgmap)
> > +           pmd_t *pmd, int flags, struct follow_page_context *ctx)
> >  {
> > +   struct dev_pagemap **pgmap = &ctx->pgmap;
> >     unsigned long pfn = pmd_pfn(*pmd);
> >     struct mm_struct *mm = vma->vm_mm;
> >     struct page *page;
> > @@ -1068,8 +1069,9 @@ static void touch_pud(struct vm_area_struct *vma, unsigned long addr,
> >  }
> >  
> >  struct page *follow_devmap_pud(struct vm_area_struct *vma, unsigned long addr,
> > -           pud_t *pud, int flags, struct dev_pagemap **pgmap)
> > +           pud_t *pud, int flags, struct follow_page_context *ctx)
> >  {
> > +   struct dev_pagemap **pgmap = &ctx->pgmap;
> >     unsigned long pfn = pud_pfn(*pud);
> >     struct mm_struct *mm = vma->vm_mm;
> >     struct page *page;
> > diff --git a/mm/internal.h b/mm/internal.h
> > index 0d5f720c75ab..46ada5279856 100644
> > --- a/mm/internal.h
> > +++ b/mm/internal.h
> > @@ -12,6 +12,34 @@
> >  #include <linux/pagemap.h>
> >  #include <linux/tracepoint-defs.h>
> >  
> > +struct follow_page_context {
> > +   struct dev_pagemap *pgmap;
> > +   unsigned int page_mask;
> > +   struct vaddr_pin *vaddr_pin;
> > +};
> > +
> > +#ifdef CONFIG_TRANSPARENT_HUGEPAGE
> > +struct page *follow_devmap_pmd(struct vm_area_struct *vma, unsigned long addr,
> > +           pmd_t *pmd, int flags, struct follow_page_context *ctx);
> > +struct page *follow_devmap_pud(struct vm_area_struct *vma, unsigned long addr,
> > +           pud_t *pud, int flags, struct follow_page_context *ctx);
> > +#else
> > +static inline struct page *follow_devmap_pmd(struct vm_area_struct *vma,
> > +   unsigned long addr, pmd_t *pmd, int flags,
> > +   struct follow_page_context *ctx)
> > +{
> > +   return NULL;
> > +}
> > +
> > +static inline struct page *follow_devmap_pud(struct vm_area_struct *vma,
> > +   unsigned long addr, pud_t *pud, int flags,
> > +   struct follow_page_context *ctx)
> > +{
> > +   return NULL;
> > +}
> > +#endif /* CONFIG_TRANSPARENT_HUGEPAGE */
> > +
> > +
> >  /*
> >   * The set of flags that only affect watermark checking and reclaim
> >   * behaviour. This is used by the MM to obey the caller constraints
> > 
> 
> thanks,
> -- 
> John Hubbard
> NVIDIA
