public inbox for linux-kernel@vger.kernel.org
 help / color / mirror / Atom feed
From: "Kirill A. Shutemov" <kirill@shutemov.name>
To: Alexander Duyck <alexander.h.duyck@intel.com>
Cc: tglx@linutronix.de, mingo@redhat.com, hpa@zytor.com,
	andi@firstfloor.org, linux-kernel@vger.kernel.org,
	x86@kernel.org
Subject: Re: [PATCH v3 1/8] x86: Improve __phys_addr performance by making use of carry flags and inlining
Date: Mon, 5 Nov 2012 22:24:25 +0200	[thread overview]
Message-ID: <20121105202425.GA25671@shutemov.name> (raw)
In-Reply-To: <20121105190332.10205.22300.stgit@gitlad.jf.intel.com>

On Mon, Nov 05, 2012 at 11:04:06AM -0800, Alexander Duyck wrote:
> This patch is meant to improve overall system performance when making use of
> the __phys_addr call.  To do this I have implemented several changes.
> 
> First if CONFIG_DEBUG_VIRTUAL is not defined __phys_addr is made an inline,
> similar to how this is currently handled in 32 bit.  However in order to do
> this it is required to export phys_base so that it is available if __phys_addr
> is used in kernel modules.
> 
> The second change was to streamline the code by making use of the carry flag
> on an add operation instead of performing a compare on a 64 bit value.  The
> advantage to this is that it allows us to significantly reduce the overall
> size of the call.  On my Xeon E5 system the entire __phys_addr inline call
> consumes a little less than 32 bytes and 5 instructions.  I also applied
> similar logic to the debug version of the function.  My testing shows that the
> debug version of the function with this patch applied is slightly faster than
> the non-debug version without the patch.
> 
> When building the kernel with the first two changes applied I saw build
> warnings about __START_KERNEL_map and PAGE_OFFSET constants not fitting in
> their type.  In order to resolve the build warning I changed their type from
> UL to ULL.

What kind of warning messages did you see?
It's strange: sizeof(unsigned long) == sizeof(unsigned long long) on
x86_64.

> 
> Finally I also applied the same logic changes to __virt_addr_valid since it
> used the same general code flow as __phys_addr and could achieve similar gains
> though these changes.
> 
> Signed-off-by: Alexander Duyck <alexander.h.duyck@intel.com>
> ---
> 
> v3:  Added changes to __virt_addr_valid to keep it in sync with __phys_addr
> 
>  arch/x86/include/asm/page_64_types.h |   17 +++++++++++++-
>  arch/x86/kernel/x8664_ksyms_64.c     |    3 +++
>  arch/x86/mm/physaddr.c               |   40 +++++++++++++++++++++-------------
>  3 files changed, 43 insertions(+), 17 deletions(-)
> 
> diff --git a/arch/x86/include/asm/page_64_types.h b/arch/x86/include/asm/page_64_types.h
> index 320f7bb..1ca93d3 100644
> --- a/arch/x86/include/asm/page_64_types.h
> +++ b/arch/x86/include/asm/page_64_types.h
> @@ -30,14 +30,14 @@
>   * hypervisor to fit.  Choosing 16 slots here is arbitrary, but it's
>   * what Xen requires.
>   */
> -#define __PAGE_OFFSET           _AC(0xffff880000000000, UL)
> +#define __PAGE_OFFSET           _AC(0xffff880000000000, ULL)
>  
>  #define __PHYSICAL_START	((CONFIG_PHYSICAL_START +	 	\
>  				  (CONFIG_PHYSICAL_ALIGN - 1)) &	\
>  				 ~(CONFIG_PHYSICAL_ALIGN - 1))
>  
>  #define __START_KERNEL		(__START_KERNEL_map + __PHYSICAL_START)
> -#define __START_KERNEL_map	_AC(0xffffffff80000000, UL)
> +#define __START_KERNEL_map	_AC(0xffffffff80000000, ULL)
>  
>  /* See Documentation/x86/x86_64/mm.txt for a description of the memory map. */
>  #define __PHYSICAL_MASK_SHIFT	46
> @@ -58,7 +58,20 @@ void copy_page(void *to, void *from);
>  extern unsigned long max_pfn;
>  extern unsigned long phys_base;
>  
> +static inline unsigned long __phys_addr_nodebug(unsigned long x)
> +{
> +	unsigned long y = x - __START_KERNEL_map;

With the change above, you assign a ULL constant to an unsigned long variable. Hm?

> +
> +	/* use the carry flag to determine if x was < __START_KERNEL_map */
> +	x = y + ((x > y) ? phys_base : (__START_KERNEL_map - PAGE_OFFSET));
> +
> +	return x;
> +}
> +#ifdef CONFIG_DEBUG_VIRTUAL
>  extern unsigned long __phys_addr(unsigned long);
> +#else
> +#define __phys_addr(x)		__phys_addr_nodebug(x)
> +#endif
>  #define __phys_reloc_hide(x)	(x)
>  
>  #define vmemmap ((struct page *)VMEMMAP_START)
> diff --git a/arch/x86/kernel/x8664_ksyms_64.c b/arch/x86/kernel/x8664_ksyms_64.c
> index 1330dd1..b014d94 100644
> --- a/arch/x86/kernel/x8664_ksyms_64.c
> +++ b/arch/x86/kernel/x8664_ksyms_64.c
> @@ -59,6 +59,9 @@ EXPORT_SYMBOL(memcpy);
>  EXPORT_SYMBOL(__memcpy);
>  EXPORT_SYMBOL(memmove);
>  
> +#ifndef CONFIG_DEBUG_VIRTUAL
> +EXPORT_SYMBOL(phys_base);
> +#endif
>  EXPORT_SYMBOL(empty_zero_page);
>  #ifndef CONFIG_PARAVIRT
>  EXPORT_SYMBOL(native_load_gs_index);
> diff --git a/arch/x86/mm/physaddr.c b/arch/x86/mm/physaddr.c
> index d2e2735..fd40d75 100644
> --- a/arch/x86/mm/physaddr.c
> +++ b/arch/x86/mm/physaddr.c
> @@ -8,33 +8,43 @@
>  
>  #ifdef CONFIG_X86_64
>  
> +#ifdef CONFIG_DEBUG_VIRTUAL
>  unsigned long __phys_addr(unsigned long x)
>  {
> -	if (x >= __START_KERNEL_map) {
> -		x -= __START_KERNEL_map;
> -		VIRTUAL_BUG_ON(x >= KERNEL_IMAGE_SIZE);
> -		x += phys_base;
> +	unsigned long y = x - __START_KERNEL_map;
> +
> +	/* use the carry flag to determine if x was < __START_KERNEL_map */
> +	if (unlikely(x > y)) {
> +		x = y + phys_base;
> +
> +		VIRTUAL_BUG_ON(y >= KERNEL_IMAGE_SIZE);
>  	} else {
> -		VIRTUAL_BUG_ON(x < PAGE_OFFSET);
> -		x -= PAGE_OFFSET;
> -		VIRTUAL_BUG_ON(!phys_addr_valid(x));
> +		x = y + (__START_KERNEL_map - PAGE_OFFSET);
> +
> +		/* carry flag will be set if starting x was >= PAGE_OFFSET */
> +		VIRTUAL_BUG_ON((x > y) || !phys_addr_valid(x));
>  	}
> +
>  	return x;
>  }
>  EXPORT_SYMBOL(__phys_addr);
> +#endif
>  
>  bool __virt_addr_valid(unsigned long x)
>  {
> -	if (x >= __START_KERNEL_map) {
> -		x -= __START_KERNEL_map;
> -		if (x >= KERNEL_IMAGE_SIZE)
> +	unsigned long y = x - __START_KERNEL_map;
> +
> +	/* use the carry flag to determine if x was < __START_KERNEL_map */
> +	if (unlikely(x > y)) {
> +		x = y + phys_base;
> +
> +		if (y >= KERNEL_IMAGE_SIZE)
>  			return false;
> -		x += phys_base;
>  	} else {
> -		if (x < PAGE_OFFSET)
> -			return false;
> -		x -= PAGE_OFFSET;
> -		if (!phys_addr_valid(x))
> +		x = y + (__START_KERNEL_map - PAGE_OFFSET);
> +
> +		/* carry flag will be set if starting x was >= PAGE_OFFSET */
> +		if ((x > y) || !phys_addr_valid(x))
>  			return false;
>  	}
>  
> 
> --
> To unsubscribe from this list: send the line "unsubscribe linux-kernel" in
> the body of a message to majordomo@vger.kernel.org
> More majordomo info at  http://vger.kernel.org/majordomo-info.html
> Please read the FAQ at  http://www.tux.org/lkml/

-- 
 Kirill A. Shutemov

  reply	other threads:[~2012-11-05 20:29 UTC|newest]

Thread overview: 15+ messages / expand[flat|nested]  mbox.gz  Atom feed  top
2012-11-05 19:03 [PATCH v3 0/8] Improve performance of VM translation on x86_64 Alexander Duyck
2012-11-05 19:04 ` [PATCH v3 1/8] x86: Improve __phys_addr performance by making use of carry flags and inlining Alexander Duyck
2012-11-05 20:24   ` Kirill A. Shutemov [this message]
2012-11-05 21:56     ` Alexander Duyck
2012-11-05 22:08       ` Kirill A. Shutemov
2012-11-16 19:35         ` Alexander Duyck
2012-11-05 19:04 ` [PATCH v3 2/8] x86: Make it so that __pa_symbol can only process kernel symbols on x86_64 Alexander Duyck
2012-11-05 19:04 ` [PATCH v3 3/8] x86: Drop 4 unnecessary calls to __pa_symbol Alexander Duyck
2012-11-05 19:05 ` [PATCH v3 4/8] x86: Use __pa_symbol instead of __pa on C visible symbols Alexander Duyck
2012-11-05 19:05 ` [PATCH v3 5/8] x86/ftrace: " Alexander Duyck
2012-11-05 19:06 ` [PATCH v3 6/8] x86/xen: " Alexander Duyck
2012-11-06 15:45   ` Konrad Rzeszutek Wilk
2012-11-05 19:06 ` [PATCH v3 7/8] x86/acpi: " Alexander Duyck
2012-11-05 19:06 ` [PATCH v3 8/8] x86/lguest: " Alexander Duyck
2012-11-06  1:11   ` Rusty Russell

Reply instructions:

You may reply publicly to this message via plain-text email
using any one of the following methods:

* Save the following mbox file, import it into your mail client,
  and reply-to-all from there: mbox

  Avoid top-posting and favor interleaved quoting:
  https://en.wikipedia.org/wiki/Posting_style#Interleaved_style

* Reply using the --to, --cc, and --in-reply-to
  switches of git-send-email(1):

  git send-email \
    --in-reply-to=20121105202425.GA25671@shutemov.name \
    --to=kirill@shutemov.name \
    --cc=alexander.h.duyck@intel.com \
    --cc=andi@firstfloor.org \
    --cc=hpa@zytor.com \
    --cc=linux-kernel@vger.kernel.org \
    --cc=mingo@redhat.com \
    --cc=tglx@linutronix.de \
    --cc=x86@kernel.org \
    /path/to/YOUR_REPLY

  https://kernel.org/pub/software/scm/git/docs/git-send-email.html

* If your mail client supports setting the In-Reply-To header
  via mailto: links, try the mailto: link
Be sure your reply has a Subject: header at the top and a blank line before the message body.
This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox