mm: use a folio in copy_pte_range()

Allocate an order-0 folio instead of a page and pass it all the way down
the call chain.  Removes dozens of calls to compound_head().

Link: https://lkml.kernel.org/r/20230116191813.2145215-5-willy@infradead.org
Signed-off-by: Matthew Wilcox (Oracle) <willy@infradead.org>
Reviewed-by: Zi Yan <ziy@nvidia.com>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
This commit is contained in:
Matthew Wilcox (Oracle) 2023-01-16 19:18:12 +00:00 committed by Andrew Morton
parent 28d41a4863
commit edf5047058

View File

@@ -863,13 +863,13 @@ copy_nonpresent_pte(struct mm_struct *dst_mm, struct mm_struct *src_mm,
static inline int static inline int
copy_present_page(struct vm_area_struct *dst_vma, struct vm_area_struct *src_vma, copy_present_page(struct vm_area_struct *dst_vma, struct vm_area_struct *src_vma,
pte_t *dst_pte, pte_t *src_pte, unsigned long addr, int *rss, pte_t *dst_pte, pte_t *src_pte, unsigned long addr, int *rss,
struct page **prealloc, struct page *page) struct folio **prealloc, struct page *page)
{ {
struct page *new_page; struct folio *new_folio;
pte_t pte; pte_t pte;
new_page = *prealloc; new_folio = *prealloc;
if (!new_page) if (!new_folio)
return -EAGAIN; return -EAGAIN;
/* /*
@@ -877,14 +877,14 @@ copy_present_page(struct vm_area_struct *dst_vma, struct vm_area_struct *src_vma
* over and copy the page & arm it. * over and copy the page & arm it.
*/ */
*prealloc = NULL; *prealloc = NULL;
copy_user_highpage(new_page, page, addr, src_vma); copy_user_highpage(&new_folio->page, page, addr, src_vma);
__SetPageUptodate(new_page); __folio_mark_uptodate(new_folio);
page_add_new_anon_rmap(new_page, dst_vma, addr); folio_add_new_anon_rmap(new_folio, dst_vma, addr);
lru_cache_add_inactive_or_unevictable(new_page, dst_vma); folio_add_lru_vma(new_folio, dst_vma);
rss[mm_counter(new_page)]++; rss[MM_ANONPAGES]++;
/* All done, just insert the new page copy in the child */ /* All done, just insert the new page copy in the child */
pte = mk_pte(new_page, dst_vma->vm_page_prot); pte = mk_pte(&new_folio->page, dst_vma->vm_page_prot);
pte = maybe_mkwrite(pte_mkdirty(pte), dst_vma); pte = maybe_mkwrite(pte_mkdirty(pte), dst_vma);
if (userfaultfd_pte_wp(dst_vma, *src_pte)) if (userfaultfd_pte_wp(dst_vma, *src_pte))
/* Uffd-wp needs to be delivered to dest pte as well */ /* Uffd-wp needs to be delivered to dest pte as well */
@@ -900,7 +900,7 @@ copy_present_page(struct vm_area_struct *dst_vma, struct vm_area_struct *src_vma
static inline int static inline int
copy_present_pte(struct vm_area_struct *dst_vma, struct vm_area_struct *src_vma, copy_present_pte(struct vm_area_struct *dst_vma, struct vm_area_struct *src_vma,
pte_t *dst_pte, pte_t *src_pte, unsigned long addr, int *rss, pte_t *dst_pte, pte_t *src_pte, unsigned long addr, int *rss,
struct page **prealloc) struct folio **prealloc)
{ {
struct mm_struct *src_mm = src_vma->vm_mm; struct mm_struct *src_mm = src_vma->vm_mm;
unsigned long vm_flags = src_vma->vm_flags; unsigned long vm_flags = src_vma->vm_flags;
@@ -922,11 +922,11 @@ copy_present_pte(struct vm_area_struct *dst_vma, struct vm_area_struct *src_vma,
return copy_present_page(dst_vma, src_vma, dst_pte, src_pte, return copy_present_page(dst_vma, src_vma, dst_pte, src_pte,
addr, rss, prealloc, page); addr, rss, prealloc, page);
} }
rss[mm_counter(page)]++; rss[MM_ANONPAGES]++;
} else if (page) { } else if (page) {
get_page(page); get_page(page);
page_dup_file_rmap(page, false); page_dup_file_rmap(page, false);
rss[mm_counter(page)]++; rss[mm_counter_file(page)]++;
} }
/* /*
@@ -954,23 +954,22 @@ copy_present_pte(struct vm_area_struct *dst_vma, struct vm_area_struct *src_vma,
return 0; return 0;
} }
static inline struct page * static inline struct folio *page_copy_prealloc(struct mm_struct *src_mm,
page_copy_prealloc(struct mm_struct *src_mm, struct vm_area_struct *vma, struct vm_area_struct *vma, unsigned long addr)
unsigned long addr)
{ {
struct page *new_page; struct folio *new_folio;
new_page = alloc_page_vma(GFP_HIGHUSER_MOVABLE, vma, addr); new_folio = vma_alloc_folio(GFP_HIGHUSER_MOVABLE, 0, vma, addr, false);
if (!new_page) if (!new_folio)
return NULL; return NULL;
if (mem_cgroup_charge(page_folio(new_page), src_mm, GFP_KERNEL)) { if (mem_cgroup_charge(new_folio, src_mm, GFP_KERNEL)) {
put_page(new_page); folio_put(new_folio);
return NULL; return NULL;
} }
cgroup_throttle_swaprate(new_page, GFP_KERNEL); cgroup_throttle_swaprate(&new_folio->page, GFP_KERNEL);
return new_page; return new_folio;
} }
static int static int
@@ -986,7 +985,7 @@ copy_pte_range(struct vm_area_struct *dst_vma, struct vm_area_struct *src_vma,
int progress, ret = 0; int progress, ret = 0;
int rss[NR_MM_COUNTERS]; int rss[NR_MM_COUNTERS];
swp_entry_t entry = (swp_entry_t){0}; swp_entry_t entry = (swp_entry_t){0};
struct page *prealloc = NULL; struct folio *prealloc = NULL;
again: again:
progress = 0; progress = 0;
@@ -1056,7 +1055,7 @@ copy_pte_range(struct vm_area_struct *dst_vma, struct vm_area_struct *src_vma,
* will allocate page according to address). This * will allocate page according to address). This
* could only happen if one pinned pte changed. * could only happen if one pinned pte changed.
*/ */
put_page(prealloc); folio_put(prealloc);
prealloc = NULL; prealloc = NULL;
} }
progress += 8; progress += 8;
@@ -1093,7 +1092,7 @@ copy_pte_range(struct vm_area_struct *dst_vma, struct vm_area_struct *src_vma,
goto again; goto again;
out: out:
if (unlikely(prealloc)) if (unlikely(prealloc))
put_page(prealloc); folio_put(prealloc);
return ret; return ret;
} }