public inbox for linux-kernel@vger.kernel.org
 help / color / mirror / Atom feed
From: Jinjie Ruan <ruanjinjie@huawei.com>
To: Kevin Brodsky <kevin.brodsky@arm.com>, <catalin.marinas@arm.com>,
	<will@kernel.org>, <oleg@redhat.com>, <tglx@linutronix.de>,
	<peterz@infradead.org>, <luto@kernel.org>, <shuah@kernel.org>,
	<kees@kernel.org>, <wad@chromium.org>, <deller@gmx.de>,
	<macro@orcam.me.uk>, <charlie@rivosinc.com>, <ldv@strace.io>,
	<mark.rutland@arm.com>, <song@kernel.org>, <ryan.roberts@arm.com>,
	<ada.coupriediaz@arm.com>, <anshuman.khandual@arm.com>,
	<broonie@kernel.org>, <pengcan@kylinos.cn>, <dvyukov@google.com>,
	<linux-arm-kernel@lists.infradead.org>,
	<linux-kernel@vger.kernel.org>, <linux-kselftest@vger.kernel.org>
Subject: Re: [PATCH v9 14/16] arm64: Inline el0_svc_common()
Date: Wed, 10 Dec 2025 10:56:56 +0800	[thread overview]
Message-ID: <132ceb8f-e82d-bed7-7b93-41f5dd505a03@huawei.com> (raw)
In-Reply-To: <746211f0-74b7-4935-a036-48a00bb5701b@arm.com>



On 2025/12/9 21:48, Kevin Brodsky wrote:
> On 04/12/2025 09:21, Jinjie Ruan wrote:
> >> After switching arm64 to Generic Entry, the compiler no longer inlines
> 
> Did it inline it before this series?

Yes, it did. In the disassembly of do_el0_svc() below, el0_svc_common()
is inlined:

<do_el0_svc>:
       d503201f        nop
       d503201f        nop
       d503233f        paciasp
       a9be7bfd        stp     x29, x30, [sp, #-32]!
       910003fd        mov     x29, sp
       a90153f3        stp     x19, x20, [sp, #16]
       aa0003f3        mov     x19, x0
       d5384114        mrs     x20, sp_el0
       f9400001        ldr     x1, [x0]
       f9400282        ldr     x2, [x20]
       f9008801        str     x1, [x0, #272]
       f9402001        ldr     x1, [x0, #64]
       b9011801        str     w1, [x0, #280]
       373001e2        tbnz    w2, #6, ffff80008002c0f0 <do_el0_svc+0x70>
       f278105f        tst     x2, #0x1f00
       54000261        b.ne    ffff80008002c108 <do_el0_svc+0x88>  // b.any
       52803ac2        mov     w2, #0x1d6                      // #470
       97ffffb1        bl      ffff80008002bf88 <invoke_syscall.constprop.0>
       f9400280        ldr     x0, [x20]
       92783400        and     x0, x0, #0x3fff00
       926bdc00        and     x0, x0, #0xffffffffffe01fff
       b4000060        cbz     x0, ffff80008002c0e0 <do_el0_svc+0x60>
       aa1303e0        mov     x0, x19
       97ffc835        bl      ffff80008001e1b0 <syscall_trace_exit>
       a94153f3        ldp     x19, x20, [sp, #16]
       a8c27bfd        ldp     x29, x30, [sp], #32
       d50323bf        autiasp
       d65f03c0        ret
       92804000        mov     x0, #0xfffffffffffffdff         // #-513
       f9000260        str     x0, [x19]
       a94153f3        ldp     x19, x20, [sp, #16]
       a8c27bfd        ldp     x29, x30, [sp], #32
       d50323bf        autiasp
       d65f03c0        ret
       3100043f        cmn     w1, #0x1
       54000140        b.eq    ffff80008002c134 <do_el0_svc+0xb4>  // b.none
       aa1303e0        mov     x0, x19
       97ffc7c1        bl      ffff80008001e018 <syscall_trace_enter>
       2a0003e1        mov     w1, w0
       3100041f        cmn     w0, #0x1
       54fffdc0        b.eq    ffff80008002c0d8 <do_el0_svc+0x58>  // b.none
       aa1303e0        mov     x0, x19
       52803ac2        mov     w2, #0x1d6                      // #470
       97ffff97        bl      ffff80008002bf88 <invoke_syscall.constprop.0>
       17ffffea        b       ffff80008002c0d8 <do_el0_svc+0x58>
       928004a0        mov     x0, #0xffffffffffffffda         // #-38
       f9000260        str     x0, [x19]
       17fffff5        b       ffff80008002c110 <do_el0_svc+0x90>
       d53cd044        mrs     x4, tpidr_el2
       d53cd040        mrs     x0, tpidr_el2
       d53cd041        mrs     x1, tpidr_el2
       00000000        udf     #0
       d503201f        nop
       d503201f        nop

> 
>> el0_svc_common() into do_el0_svc(). So inline el0_svc_common(), which
>> gives a 1% performance uplift on perf bench basic syscall on kunpeng920,
>> as shown below.
>>
>> | Metric     | W/O this patch | With this patch | Change    |
>> | ---------- | -------------- | --------------- | --------- |
>> | Total time | 2.195 [sec]    | 2.171 [sec]     |  ↓1.1%   |
>> | usecs/op   | 0.219575       | 0.217192        |  ↓1.1%   |
>> | ops/sec    | 4,554,260      | 4,604,225       |  ↑1.1%    |
>>
>> Signed-off-by: Jinjie Ruan <ruanjinjie@huawei.com>
> 
> I think this is sensible - do_el0_svc() is clearly hot and the small
> increase in code size is completely justified. It also removes a
> performance regression when enabling CONFIG_COMPAT (without it
> el0_svc_common() has only one caller so it should be inlined regardless).
> 
> Reviewed-by: Kevin Brodsky <kevin.brodsky@arm.com>
> 
>> ---
>>  arch/arm64/kernel/syscall.c | 4 ++--
>>  1 file changed, 2 insertions(+), 2 deletions(-)
>>
>> diff --git a/arch/arm64/kernel/syscall.c b/arch/arm64/kernel/syscall.c
>> index 47e193a1cfff..5aa51da9ec25 100644
>> --- a/arch/arm64/kernel/syscall.c
>> +++ b/arch/arm64/kernel/syscall.c
>> @@ -66,8 +66,8 @@ static void invoke_syscall(struct pt_regs *regs, unsigned int scno,
>>  	choose_random_kstack_offset(get_random_u16());
>>  }
>>  
>> -static void el0_svc_common(struct pt_regs *regs, int scno, int sc_nr,
>> -			   const syscall_fn_t syscall_table[])
>> +static __always_inline void el0_svc_common(struct pt_regs *regs, int scno, int sc_nr,
>> +					   const syscall_fn_t syscall_table[])
>>  {
>>  	unsigned long work = READ_ONCE(current_thread_info()->syscall_work);
>>  	unsigned long flags = read_thread_flags();
> 

  reply	other threads:[~2025-12-10  2:57 UTC|newest]

Thread overview: 36+ messages / expand[flat|nested]  mbox.gz  Atom feed  top
2025-12-04  8:21 [PATCH v9 00/16] arm64: entry: Convert to Generic Entry Jinjie Ruan
2025-12-04  8:21 ` [PATCH v9 01/16] arm64: Remove unused _TIF_WORK_MASK Jinjie Ruan
2025-12-08  4:42   ` Anshuman Khandual
2025-12-04  8:21 ` [PATCH v9 02/16] arm64/ptrace: Split report_syscall() Jinjie Ruan
2025-12-08  5:02   ` Anshuman Khandual
2025-12-04  8:21 ` [PATCH v9 03/16] arm64/ptrace: Return early for ptrace_report_syscall_entry() error Jinjie Ruan
2025-12-08  5:24   ` Anshuman Khandual
2025-12-08  6:31     ` Jinjie Ruan
2025-12-09 13:46   ` Kevin Brodsky
2025-12-12  4:00     ` Jinjie Ruan
2025-12-15 15:24       ` Kevin Brodsky
2025-12-04  8:21 ` [PATCH v9 04/16] arm64/ptrace: Refactor syscall_trace_enter/exit() Jinjie Ruan
2025-12-08  5:48   ` Anshuman Khandual
2025-12-08  6:24     ` Jinjie Ruan
2025-12-04  8:21 ` [PATCH v9 05/16] arm64: ptrace: Move rseq_syscall() before audit_syscall_exit() Jinjie Ruan
2025-12-04  8:21 ` [PATCH v9 06/16] arm64: syscall: Rework el0_svc_common() Jinjie Ruan
2025-12-04  8:21 ` [PATCH v9 07/16] arm64/ptrace: Not check _TIF_SECCOMP/SYSCALL_EMU for syscall_exit_work() Jinjie Ruan
2025-12-04  8:21 ` [PATCH v9 08/16] arm64/ptrace: Do not report_syscall_exit() for PTRACE_SYSEMU_SINGLESTEP Jinjie Ruan
2025-12-04  8:21 ` [PATCH v9 09/16] arm64/ptrace: Expand secure_computing() in place Jinjie Ruan
2025-12-04  8:21 ` [PATCH v9 10/16] arm64/ptrace: Use syscall_get_arguments() helper Jinjie Ruan
2025-12-04  8:21 ` [PATCH v9 11/16] entry: Split syscall_exit_to_user_mode_work() for arch reuse Jinjie Ruan
2025-12-04  8:21 ` [PATCH v9 12/16] entry: Add arch_ptrace_report_syscall_entry/exit() Jinjie Ruan
2025-12-04  8:21 ` [PATCH v9 13/16] arm64: entry: Convert to generic entry Jinjie Ruan
2025-12-09 13:47   ` Kevin Brodsky
2025-12-04  8:21 ` [PATCH v9 14/16] arm64: Inline el0_svc_common() Jinjie Ruan
2025-12-09 13:48   ` Kevin Brodsky
2025-12-10  2:56     ` Jinjie Ruan [this message]
2025-12-04  8:21 ` [PATCH v9 15/16] entry: Inline syscall_exit_work() Jinjie Ruan
2025-12-09 13:48   ` Kevin Brodsky
2025-12-11  6:55     ` Thomas Gleixner
2025-12-11  9:52       ` Kevin Brodsky
2025-12-12  1:12         ` Thomas Gleixner
2025-12-12  1:26       ` Jinjie Ruan
2025-12-12  3:49     ` Jinjie Ruan
2025-12-04  8:21 ` [PATCH v9 16/16] selftests: sud_test: Support aarch64 Jinjie Ruan
2025-12-20 14:53   ` kemal

Reply instructions:

You may reply publicly to this message via plain-text email
using any one of the following methods:

* Save the following mbox file, import it into your mail client,
  and reply-to-all from there: mbox

  Avoid top-posting and favor interleaved quoting:
  https://en.wikipedia.org/wiki/Posting_style#Interleaved_style

* Reply using the --to, --cc, and --in-reply-to
  switches of git-send-email(1):

  git send-email \
    --in-reply-to=132ceb8f-e82d-bed7-7b93-41f5dd505a03@huawei.com \
    --to=ruanjinjie@huawei.com \
    --cc=ada.coupriediaz@arm.com \
    --cc=anshuman.khandual@arm.com \
    --cc=broonie@kernel.org \
    --cc=catalin.marinas@arm.com \
    --cc=charlie@rivosinc.com \
    --cc=deller@gmx.de \
    --cc=dvyukov@google.com \
    --cc=kees@kernel.org \
    --cc=kevin.brodsky@arm.com \
    --cc=ldv@strace.io \
    --cc=linux-arm-kernel@lists.infradead.org \
    --cc=linux-kernel@vger.kernel.org \
    --cc=linux-kselftest@vger.kernel.org \
    --cc=luto@kernel.org \
    --cc=macro@orcam.me.uk \
    --cc=mark.rutland@arm.com \
    --cc=oleg@redhat.com \
    --cc=pengcan@kylinos.cn \
    --cc=peterz@infradead.org \
    --cc=ryan.roberts@arm.com \
    --cc=shuah@kernel.org \
    --cc=song@kernel.org \
    --cc=tglx@linutronix.de \
    --cc=wad@chromium.org \
    --cc=will@kernel.org \
    /path/to/YOUR_REPLY

  https://kernel.org/pub/software/scm/git/docs/git-send-email.html

* If your mail client supports setting the In-Reply-To header
  via mailto: links, try the mailto: link.

Be sure your reply has a Subject: header at the top and a blank line before the message body.
This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox