[<prev] [next>] [<thread-prev] [thread-next>] [day] [month] [year] [list]
Message-ID: <Yrkk0azmR2tqEPVt@FVFYT0MHHV2J.usts.net>
Date: Mon, 27 Jun 2022 11:32:33 +0800
From: Muchun Song <songmuchun@...edance.com>
To: Qi Zheng <zhengqi.arch@...edance.com>
Cc: mike.kravetz@...cle.com, akpm@...ux-foundation.org,
catalin.marinas@....com, will@...nel.org,
linux-arm-kernel@...ts.infradead.org, linux-kernel@...r.kernel.org,
linux-mm@...ck.org
Subject: Re: [PATCH] mm: hugetlb: kill set_huge_swap_pte_at()
On Sun, Jun 26, 2022 at 10:57:17PM +0800, Qi Zheng wrote:
> The commit e5251fd43007 ("mm/hugetlb: introduce set_huge_swap_pte_at()
> helper") add set_huge_swap_pte_at() to handle swap entries on
> architectures that support hugepages consisting of contiguous ptes.
> And currently the set_huge_swap_pte_at() is only overridden by arm64.
>
> The set_huge_swap_pte_at() provide a sz parameter to help determine
> the number of entries to be updated. But in fact, all hugetlb swap
> entries contain pfn information, so we can find the corresponding
> folio through the pfn recorded in the swap entry, then the folio_size()
> is the number of entries that need to be updated.
>
> And considering that users will easily cause bugs by ignoring the
> difference between set_huge_swap_pte_at() and set_huge_pte_at().
> Let's handle swap entries in set_huge_pte_at() and remove the
> set_huge_swap_pte_at(), then we can call set_huge_pte_at()
> anywhere, which simplifies our coding.
>
> Signed-off-by: Qi Zheng <zhengqi.arch@...edance.com>
I think it is a nice cleanup since it simplify the code enough.
We do not need to struggle between set_huge_swap_pte_at() and
set_huge_pte_at(), it is very easy to make mistakes (see commit
5d4af6195c87 and e5251fd43007).
And arm64 is the only user which needs a special
set_huge_swap_pte_at(), it would be nicer if arm64 could handle
it transparently. So
Acked-by: Muchun Song <songmuchun@...edance.com>
> ---
> arch/arm64/include/asm/hugetlb.h | 3 ---
> arch/arm64/mm/hugetlbpage.c | 34 ++++++++++++++++----------------
> include/linux/hugetlb.h | 13 ------------
> mm/hugetlb.c | 8 +++-----
> mm/rmap.c | 11 +++--------
> 5 files changed, 23 insertions(+), 46 deletions(-)
>
> diff --git a/arch/arm64/include/asm/hugetlb.h b/arch/arm64/include/asm/hugetlb.h
> index 1fd2846dbefe..d20f5da2d76f 100644
> --- a/arch/arm64/include/asm/hugetlb.h
> +++ b/arch/arm64/include/asm/hugetlb.h
> @@ -46,9 +46,6 @@ extern void huge_pte_clear(struct mm_struct *mm, unsigned long addr,
> pte_t *ptep, unsigned long sz);
> #define __HAVE_ARCH_HUGE_PTEP_GET
> extern pte_t huge_ptep_get(pte_t *ptep);
> -extern void set_huge_swap_pte_at(struct mm_struct *mm, unsigned long addr,
> - pte_t *ptep, pte_t pte, unsigned long sz);
> -#define set_huge_swap_pte_at set_huge_swap_pte_at
>
> void __init arm64_hugetlb_cma_reserve(void);
>
> diff --git a/arch/arm64/mm/hugetlbpage.c b/arch/arm64/mm/hugetlbpage.c
> index c9e076683e5d..58b89b9d13e0 100644
> --- a/arch/arm64/mm/hugetlbpage.c
> +++ b/arch/arm64/mm/hugetlbpage.c
> @@ -238,6 +238,13 @@ static void clear_flush(struct mm_struct *mm,
> flush_tlb_range(&vma, saddr, addr);
> }
>
> +static inline struct folio *hugetlb_swap_entry_to_folio(swp_entry_t entry)
> +{
> + VM_BUG_ON(!is_migration_entry(entry) && !is_hwpoison_entry(entry));
> +
> + return page_folio(pfn_to_page(swp_offset(entry)));
> +}
> +
> void set_huge_pte_at(struct mm_struct *mm, unsigned long addr,
> pte_t *ptep, pte_t pte)
> {
> @@ -247,11 +254,16 @@ void set_huge_pte_at(struct mm_struct *mm, unsigned long addr,
> unsigned long pfn, dpfn;
> pgprot_t hugeprot;
>
> - /*
> - * Code needs to be expanded to handle huge swap and migration
> - * entries. Needed for HUGETLB and MEMORY_FAILURE.
> - */
When I noticed the comments here, seems this cleanup was on the plan
a few years ago?
> - WARN_ON(!pte_present(pte));
> + if (!pte_present(pte)) {
> + struct folio *folio;
> +
> + folio = hugetlb_swap_entry_to_folio(pte_to_swp_entry(pte));
> + ncontig = num_contig_ptes(folio_size(folio), &pgsize);
> +
> + for (i = 0; i < ncontig; i++, ptep++)
> + set_pte_at(mm, addr, ptep, pte);
> + return;
> + }
>
> if (!pte_cont(pte)) {
> set_pte_at(mm, addr, ptep, pte);
> @@ -269,18 +281,6 @@ void set_huge_pte_at(struct mm_struct *mm, unsigned long addr,
> set_pte_at(mm, addr, ptep, pfn_pte(pfn, hugeprot));
> }
>
> -void set_huge_swap_pte_at(struct mm_struct *mm, unsigned long addr,
> - pte_t *ptep, pte_t pte, unsigned long sz)
> -{
> - int i, ncontig;
> - size_t pgsize;
> -
> - ncontig = num_contig_ptes(sz, &pgsize);
> -
> - for (i = 0; i < ncontig; i++, ptep++)
> - set_pte(ptep, pte);
> -}
> -
> pte_t *huge_pte_alloc(struct mm_struct *mm, struct vm_area_struct *vma,
> unsigned long addr, unsigned long sz)
> {
> diff --git a/include/linux/hugetlb.h b/include/linux/hugetlb.h
> index ee9a28ef26ee..3bb98434550a 100644
> --- a/include/linux/hugetlb.h
> +++ b/include/linux/hugetlb.h
> @@ -928,14 +928,6 @@ static inline void hugetlb_count_sub(long l, struct mm_struct *mm)
> atomic_long_sub(l, &mm->hugetlb_usage);
> }
>
> -#ifndef set_huge_swap_pte_at
> -static inline void set_huge_swap_pte_at(struct mm_struct *mm, unsigned long addr,
> - pte_t *ptep, pte_t pte, unsigned long sz)
> -{
> - set_huge_pte_at(mm, addr, ptep, pte);
> -}
> -#endif
> -
> #ifndef huge_ptep_modify_prot_start
> #define huge_ptep_modify_prot_start huge_ptep_modify_prot_start
> static inline pte_t huge_ptep_modify_prot_start(struct vm_area_struct *vma,
> @@ -1119,11 +1111,6 @@ static inline void hugetlb_count_sub(long l, struct mm_struct *mm)
> {
> }
>
> -static inline void set_huge_swap_pte_at(struct mm_struct *mm, unsigned long addr,
> - pte_t *ptep, pte_t pte, unsigned long sz)
> -{
> -}
> -
> static inline pte_t huge_ptep_clear_flush(struct vm_area_struct *vma,
> unsigned long addr, pte_t *ptep)
> {
> diff --git a/mm/hugetlb.c b/mm/hugetlb.c
> index f338640fbe4a..559084d96082 100644
> --- a/mm/hugetlb.c
> +++ b/mm/hugetlb.c
> @@ -4813,12 +4813,11 @@ int copy_hugetlb_page_range(struct mm_struct *dst, struct mm_struct *src,
> entry = swp_entry_to_pte(swp_entry);
> if (userfaultfd_wp(src_vma) && uffd_wp)
> entry = huge_pte_mkuffd_wp(entry);
> - set_huge_swap_pte_at(src, addr, src_pte,
> - entry, sz);
> + set_huge_pte_at(src, addr, src_pte, entry);
> }
> if (!userfaultfd_wp(dst_vma) && uffd_wp)
> entry = huge_pte_clear_uffd_wp(entry);
> - set_huge_swap_pte_at(dst, addr, dst_pte, entry, sz);
> + set_huge_pte_at(dst, addr, dst_pte, entry);
> } else if (unlikely(is_pte_marker(entry))) {
> /*
> * We copy the pte marker only if the dst vma has
> @@ -6375,8 +6374,7 @@ unsigned long hugetlb_change_protection(struct vm_area_struct *vma,
> newpte = pte_swp_mkuffd_wp(newpte);
> else if (uffd_wp_resolve)
> newpte = pte_swp_clear_uffd_wp(newpte);
> - set_huge_swap_pte_at(mm, address, ptep,
> - newpte, psize);
> + set_huge_pte_at(mm, address, ptep, newpte);
> pages++;
> }
> spin_unlock(ptl);
> diff --git a/mm/rmap.c b/mm/rmap.c
> index 062e8655f337..338fbb24c602 100644
> --- a/mm/rmap.c
> +++ b/mm/rmap.c
> @@ -1618,9 +1618,7 @@ static bool try_to_unmap_one(struct folio *folio, struct vm_area_struct *vma,
> pteval = swp_entry_to_pte(make_hwpoison_entry(subpage));
> if (folio_test_hugetlb(folio)) {
> hugetlb_count_sub(folio_nr_pages(folio), mm);
> - set_huge_swap_pte_at(mm, address,
> - pvmw.pte, pteval,
> - vma_mmu_pagesize(vma));
> + set_huge_pte_at(mm, address, pvmw.pte, pteval);
> } else {
> dec_mm_counter(mm, mm_counter(&folio->page));
> set_pte_at(mm, address, pvmw.pte, pteval);
> @@ -2004,9 +2002,7 @@ static bool try_to_migrate_one(struct folio *folio, struct vm_area_struct *vma,
> pteval = swp_entry_to_pte(make_hwpoison_entry(subpage));
> if (folio_test_hugetlb(folio)) {
> hugetlb_count_sub(folio_nr_pages(folio), mm);
> - set_huge_swap_pte_at(mm, address,
> - pvmw.pte, pteval,
> - vma_mmu_pagesize(vma));
> + set_huge_pte_at(mm, address, pvmw.pte, pteval);
> } else {
> dec_mm_counter(mm, mm_counter(&folio->page));
> set_pte_at(mm, address, pvmw.pte, pteval);
> @@ -2074,8 +2070,7 @@ static bool try_to_migrate_one(struct folio *folio, struct vm_area_struct *vma,
> if (pte_uffd_wp(pteval))
> swp_pte = pte_swp_mkuffd_wp(swp_pte);
> if (folio_test_hugetlb(folio))
> - set_huge_swap_pte_at(mm, address, pvmw.pte,
> - swp_pte, vma_mmu_pagesize(vma));
> + set_huge_pte_at(mm, address, pvmw.pte, swp_pte);
> else
> set_pte_at(mm, address, pvmw.pte, swp_pte);
> trace_set_migration_pte(address, pte_val(swp_pte),
> --
> 2.20.1
>
>
Powered by blists - more mailing lists