All of lore.kernel.org
 help / color / mirror / Atom feed
From: Mike Rapoport <rppt@linux.ibm.com>
To: Baolin Wang <baolin.wang@linux.alibaba.com>
Cc: akpm@linux-foundation.org, willy@infradead.org,
	linux-mm@kvack.org, linux-kernel@vger.kernel.org
Subject: Re: [RFC PATCH v2 3/3] mm: Add kernel PTE level pagetable pages account
Date: Wed, 22 Jun 2022 09:44:29 -0500	[thread overview]
Message-ID: <YrMqzWvc9x5HWm5v@linux.ibm.com> (raw)
In-Reply-To: <7882bbf467440f9a3ebe41d96ba5b6f384081bb7.1655887440.git.baolin.wang@linux.alibaba.com>

On Wed, Jun 22, 2022 at 04:58:54PM +0800, Baolin Wang wrote:
> Now the kernel PTE level ptes are always protected by mm->page_table_lock
> instead of split pagetable lock, so the kernel PTE level pagetable pages
> are not accounted. Especially the vmalloc()/vmap() can consume lots of
> kernel pagetable, so to get an accurate pagetable accounting, calling new
> helpers pgtable_set_and_inc()/pgtable_clear_and_dec() when allocating or
> freeing a kernel PTE level pagetable page.

This patch only adds accounting to the page tables allocated after boot,
please mention this in the changelog.
 
> Meanwhile converting architectures to use corresponding generic PTE pagetable
> allocation and freeing functions.
> 
> Signed-off-by: Baolin Wang <baolin.wang@linux.alibaba.com>
> Reported-by: kernel test robot <oliver.sang@intel.com>
> ---
>  arch/csky/include/asm/pgalloc.h |  2 +-
>  arch/microblaze/mm/pgtable.c    |  2 +-
>  arch/openrisc/mm/ioremap.c      |  2 +-
>  arch/x86/mm/pgtable.c           |  5 ++++-
>  include/asm-generic/pgalloc.h   | 14 ++++++++++++--
>  5 files changed, 19 insertions(+), 6 deletions(-)
> 
> diff --git a/arch/csky/include/asm/pgalloc.h b/arch/csky/include/asm/pgalloc.h
> index bbbd069..2443226 100644
> --- a/arch/csky/include/asm/pgalloc.h
> +++ b/arch/csky/include/asm/pgalloc.h
> @@ -29,7 +29,7 @@ static inline pte_t *pte_alloc_one_kernel(struct mm_struct *mm)
>  	pte_t *pte;
>  	unsigned long i;
>  
> -	pte = (pte_t *) __get_free_page(GFP_KERNEL);
> +	pte = __pte_alloc_one_kernel(mm);
>  	if (!pte)
>  		return NULL;
>  
> diff --git a/arch/microblaze/mm/pgtable.c b/arch/microblaze/mm/pgtable.c
> index 9f73265..e96dd1b 100644
> --- a/arch/microblaze/mm/pgtable.c
> +++ b/arch/microblaze/mm/pgtable.c
> @@ -245,7 +245,7 @@ unsigned long iopa(unsigned long addr)
>  __ref pte_t *pte_alloc_one_kernel(struct mm_struct *mm)
>  {
>  	if (mem_init_done)
> -		return (pte_t *)__get_free_page(GFP_KERNEL | __GFP_ZERO);
> +		return __pte_alloc_one_kernel(mm);
>  	else
>  		return memblock_alloc_try_nid(PAGE_SIZE, PAGE_SIZE,
>  					      MEMBLOCK_LOW_LIMIT,
> diff --git a/arch/openrisc/mm/ioremap.c b/arch/openrisc/mm/ioremap.c
> index daae13a..3453acc 100644
> --- a/arch/openrisc/mm/ioremap.c
> +++ b/arch/openrisc/mm/ioremap.c
> @@ -118,7 +118,7 @@ pte_t __ref *pte_alloc_one_kernel(struct mm_struct *mm)
>  	pte_t *pte;
>  
>  	if (likely(mem_init_done)) {
> -		pte = (pte_t *)get_zeroed_page(GFP_KERNEL);
> +		pte = __pte_alloc_one_kernel(mm);
>  	} else {
>  		pte = memblock_alloc(PAGE_SIZE, PAGE_SIZE);
>  		if (!pte)
> diff --git a/arch/x86/mm/pgtable.c b/arch/x86/mm/pgtable.c
> index a8ab3f9..fc2b9ef 100644
> --- a/arch/x86/mm/pgtable.c
> +++ b/arch/x86/mm/pgtable.c
> @@ -851,6 +851,7 @@ int pud_free_pmd_page(pud_t *pud, unsigned long addr)
>  int pmd_free_pte_page(pmd_t *pmd, unsigned long addr)
>  {
>  	pte_t *pte;
> +	struct page *page;
>  
>  	pte = (pte_t *)pmd_page_vaddr(*pmd);
>  	pmd_clear(pmd);
> @@ -858,7 +859,9 @@ int pmd_free_pte_page(pmd_t *pmd, unsigned long addr)
>  	/* INVLPG to clear all paging-structure caches */
>  	flush_tlb_kernel_range(addr, addr + PAGE_SIZE-1);
>  
> -	free_page((unsigned long)pte);
> +	page = virt_to_page(pte);
> +	pgtable_clear_and_dec(page);
> +	__free_page(page);
>  
>  	return 1;
>  }
> diff --git a/include/asm-generic/pgalloc.h b/include/asm-generic/pgalloc.h
> index 328a714..2e20e9e 100644
> --- a/include/asm-generic/pgalloc.h
> +++ b/include/asm-generic/pgalloc.h
> @@ -18,7 +18,14 @@
>   */
>  static inline pte_t *__pte_alloc_one_kernel(struct mm_struct *mm)
>  {
> -	return (pte_t *)__get_free_page(GFP_PGTABLE_KERNEL);
> +	struct page *page;
> +	gfp_t gfp = GFP_PGTABLE_KERNEL;
> +
> +	page = alloc_pages(gfp & ~__GFP_HIGHMEM, 0);
> +	if (!page)
> +		return NULL;
> +	pgtable_set_and_inc(page);
> +	return (pte_t *)page_address(page);

{
	pte_t *pte = (pte_t *)__get_free_page(GFP_PGTABLE_KERNEL);

	if (pte)
		pgtable_set_and_inc(virt_to_page(pte));

	return pte;
}

looks simpler, doesn't it?

>  }
>  
>  #ifndef __HAVE_ARCH_PTE_ALLOC_ONE_KERNEL
> @@ -41,7 +48,10 @@ static inline pte_t *pte_alloc_one_kernel(struct mm_struct *mm)
>   */
>  static inline void pte_free_kernel(struct mm_struct *mm, pte_t *pte)
>  {
> -	free_page((unsigned long)pte);
> +	struct page *page = virt_to_page(pte);
> +
> +	pgtable_clear_and_dec(page);
> +	__free_page(page);
>  }
>  
>  /**
> -- 
> 1.8.3.1
> 

-- 
Sincerely yours,
Mike.


  reply	other threads:[~2022-06-22 14:45 UTC|newest]

Thread overview: 18+ messages / expand[flat|nested]  mbox.gz  Atom feed  top
2022-06-22  8:58 [RFC PATCH v2 0/3] Add PUD and kernel PTE level pagetable account Baolin Wang
2022-06-22  8:58 ` [RFC PATCH v2 1/3] mm: Factor out the pagetable pages account into new helper function Baolin Wang
2022-06-23 16:07   ` Matthew Wilcox
2022-06-24  8:41     ` Baolin Wang
2022-06-22  8:58 ` [RFC PATCH v2 2/3] mm: Add PUD level pagetable account Baolin Wang
2022-06-22 14:38   ` Mike Rapoport
2022-06-23  3:32     ` Baolin Wang
2022-06-23 13:28     ` Matthew Wilcox
2022-06-24  8:52       ` Baolin Wang
2022-06-22  8:58 ` [RFC PATCH v2 3/3] mm: Add kernel PTE level pagetable pages account Baolin Wang
2022-06-22 14:44   ` Mike Rapoport [this message]
2022-06-23  3:34     ` Baolin Wang
2022-07-12  6:08   ` [mm] 0bf5cdf08f: BUG:Bad_page_state_in_process kernel test robot
2022-07-12  6:08     ` kernel test robot
2022-07-12  6:08     ` kernel test robot
2022-07-13  9:17     ` Baolin Wang
2022-07-13  9:17       ` Baolin Wang
2022-07-13  9:17       ` Baolin Wang

Reply instructions:

You may reply publicly to this message via plain-text email
using any one of the following methods:

* Save the following mbox file, import it into your mail client,
  and reply-to-all from there: mbox

  Avoid top-posting and favor interleaved quoting:
  https://en.wikipedia.org/wiki/Posting_style#Interleaved_style

* Reply using the --to, --cc, and --in-reply-to
  switches of git-send-email(1):

  git send-email \
    --in-reply-to=YrMqzWvc9x5HWm5v@linux.ibm.com \
    --to=rppt@linux.ibm.com \
    --cc=akpm@linux-foundation.org \
    --cc=baolin.wang@linux.alibaba.com \
    --cc=linux-kernel@vger.kernel.org \
    --cc=linux-mm@kvack.org \
    --cc=willy@infradead.org \
    /path/to/YOUR_REPLY

  https://kernel.org/pub/software/scm/git/docs/git-send-email.html

* If your mail client supports setting the In-Reply-To header
  via mailto: links, try the mailto: link
Be sure your reply has a Subject: header at the top and a blank line before the message body.
This is an external index of several public inboxes,
see mirroring instructions on how to clone and mirror
all data and code used by this external index.