LinuxPPC-Dev Archive on lore.kernel.org
 help / color / mirror / Atom feed
From: "Christophe Leroy (CS GROUP)" <chleroy@kernel.org>
To: Shrikanth Hegde <sshegde@linux.ibm.com>,
	maddy@linux.ibm.com, linuxppc-dev@lists.ozlabs.org,
	tglx@kernel.org
Cc: linux-kernel@vger.kernel.org
Subject: Re: [PATCH 2/3] powerpc/irq: Make irqstats array based
Date: Fri, 29 May 2026 09:46:35 +0200	[thread overview]
Message-ID: <1f0b54f5-1df0-4649-89bc-9ab3a6d9a100@kernel.org> (raw)
In-Reply-To: <20260523174016.999456-3-sshegde@linux.ibm.com>



Le 23/05/2026 à 19:40, Shrikanth Hegde a écrit :
> Current irq_cpustat_t has separate member for handling each arch
> specific interrupt type. The same can be achieved with array instead
> indexed by corresponding irq counter type.
> 
> This helps to,
> 
> - Make it easy to integrate into genirq improvements by calling
>    genirq provided irq_proc_emit_counts. That speeds up quite a bit
>    by printing all 0's once as much as possible.
> 
> - Adding a new vector or software counter only requires to update the table
>    and everything just works
> 
> - Remove ifdef usage a bit.
> 
> - Instead of going through each member, it simply becomes an array
>    traversal.
> 
> Time taken to read /proc/interrupts 1000 times.
> Base and v6 details can be found in cover-letter.
> Base		:  103us
> v6		:   63us
> v6+this_patch	:   57us
> 
> A Decent 10% reduction can be seen in a system 240 CPUs. As the system
> size increases the gain would be more as emitting 0 would reduce more
> and more.
> 
> Signed-off-by: Shrikanth Hegde <sshegde@linux.ibm.com>

Reviewed-by: Christophe Leroy (CS GROUP) <chleroy@kernel.org>

> ---
>   arch/powerpc/include/asm/hardirq.h |  27 +++++---
>   arch/powerpc/kernel/dbell.c        |   2 +-
>   arch/powerpc/kernel/irq.c          | 107 ++++++++++-------------------
>   arch/powerpc/kernel/time.c         |   6 +-
>   arch/powerpc/kernel/traps.c        |  11 ++-
>   arch/powerpc/kernel/watchdog.c     |   2 +-
>   6 files changed, 64 insertions(+), 91 deletions(-)
> 
> diff --git a/arch/powerpc/include/asm/hardirq.h b/arch/powerpc/include/asm/hardirq.h
> index bf3926a0c69c..38098e35b241 100644
> --- a/arch/powerpc/include/asm/hardirq.h
> +++ b/arch/powerpc/include/asm/hardirq.h
> @@ -5,26 +5,33 @@
>   #include <linux/threads.h>
>   #include <linux/irq.h>
>   
> -typedef struct {
> -	unsigned int timer_irqs_event;
> -	unsigned int broadcast_irqs_event;
> -	unsigned int timer_irqs_others;
> -	unsigned int pmu_irqs;
> -	unsigned int mce_exceptions;
> -	unsigned int spurious_irqs;
> -	unsigned int sreset_irqs;
> +enum irq_stat_counts {
> +	IRQ_COUNT_LOC_TIMER,
> +	IRQ_COUNT_BCT_TIMER,
> +	IRQ_COUNT_OTHER_TIMER,
> +	IRQ_COUNT_SPURIOUS,
> +	IRQ_COUNT_PMI,
> +	IRQ_COUNT_MCE,
> +	IRQ_COUNT_NMI_SRESET,
>   #ifdef CONFIG_PPC_WATCHDOG
> -	unsigned int soft_nmi_irqs;
> +	IRQ_COUNT_WATCHDOG,
>   #endif
>   #ifdef CONFIG_PPC_DOORBELL
> -	unsigned int doorbell_irqs;
> +	IRQ_COUNT_DOORBELL,
>   #endif
> +	IRQ_COUNT_MAX,
> +};
> +
> +typedef struct {
> +	unsigned int counts[IRQ_COUNT_MAX];
>   } ____cacheline_aligned irq_cpustat_t;
>   
>   DECLARE_PER_CPU_SHARED_ALIGNED(irq_cpustat_t, irq_stat);
>   DECLARE_PER_CPU(unsigned int, __softirq_pending);
>   #define local_softirq_pending_ref       __softirq_pending
>   
> +#define inc_irq_stat(index)	__this_cpu_inc(irq_stat.counts[IRQ_COUNT_##index])
> +
>   #define __ARCH_IRQ_STAT
>   #define __ARCH_IRQ_EXIT_IRQS_DISABLED
>   
> diff --git a/arch/powerpc/kernel/dbell.c b/arch/powerpc/kernel/dbell.c
> index 5712dd846263..f5e298a4c4c0 100644
> --- a/arch/powerpc/kernel/dbell.c
> +++ b/arch/powerpc/kernel/dbell.c
> @@ -31,7 +31,7 @@ DEFINE_INTERRUPT_HANDLER_ASYNC(doorbell_exception)
>   		do_hard_irq_enable();
>   
>   	kvmppc_clear_host_ipi(smp_processor_id());
> -	__this_cpu_inc(irq_stat.doorbell_irqs);
> +	inc_irq_stat(DOORBELL);
>   
>   	smp_ipi_demux_relaxed(); /* already performed the barrier */
>   
> diff --git a/arch/powerpc/kernel/irq.c b/arch/powerpc/kernel/irq.c
> index f33df5e5c23f..e67a18f62142 100644
> --- a/arch/powerpc/kernel/irq.c
> +++ b/arch/powerpc/kernel/irq.c
> @@ -84,79 +84,57 @@ u32 tau_interrupts(unsigned long cpu);
>   #endif
>   #endif /* CONFIG_PPC32 */
>   
> +struct irq_stat_info {
> +	const char	*symbol;
> +	const char	*text;
> +};
> +
> +#define ISE(idx, sym, txt)[IRQ_COUNT_##idx] = { .symbol = sym, .text = txt}
> +
> +static struct irq_stat_info irq_stat_info[IRQ_COUNT_MAX] __ro_after_init = {
> +	ISE(LOC_TIMER,		"LOC", "  Local timer interrupts for timer event device\n"),
> +	ISE(BCT_TIMER,		"BCT", "  Broadcast timer interrupts for timer event device\n"),
> +	ISE(OTHER_TIMER,	"LOC", "  Local timer interrupts for others\n"),
> +	ISE(SPURIOUS,		"SPU", "  Spurious interrupts\n"),
> +	ISE(PMI,		"PMI", "  Performance monitoring interrupts\n"),
> +	ISE(MCE,		"MCE", "  Machine check exceptions\n"),
> +	ISE(NMI_SRESET,		"NMI", "  System Reset interrupts\n"),
> +#ifdef CONFIG_PPC_WATCHDOG
> +	ISE(WATCHDOG,		"WDG", "  Watchdog soft-NMI interrupts\n"),
> +#endif
> +#ifdef CONFIG_PPC_DOORBELL
> +	ISE(DOORBELL,		"DBL", "  Doorbell interrupts\n"),
> +#endif
> +};
> +
>   int arch_show_interrupts(struct seq_file *p, int prec)
>   {
> -	int j;
> +	const struct irq_stat_info *info = irq_stat_info;
> +
> +	for (unsigned int i = 0; i < ARRAY_SIZE(irq_stat_info); i++, info++) {
> +		seq_printf(p, "%*s:", prec, info->symbol);
> +		irq_proc_emit_counts(p, &irq_stat.counts[i]);
> +		seq_puts(p, info->text);
> +	}
>   
>   #if defined(CONFIG_PPC32) && defined(CONFIG_TAU_INT)
>   	if (tau_initialized) {
> +		int j;
>   		seq_printf(p, "%*s:", prec, "TAU");
>   		for_each_online_cpu(j)
>   			seq_put_decimal_ull_width(p, " ", tau_interrupts(j), 10);
>   		seq_puts(p, "  PowerPC             Thermal Assist (cpu temp)\n");
>   	}
>   #endif /* CONFIG_PPC32 && CONFIG_TAU_INT */
> -
> -	seq_printf(p, "%*s:", prec, "LOC");
> -	for_each_online_cpu(j)
> -		seq_put_decimal_ull_width(p, " ", per_cpu(irq_stat, j).timer_irqs_event, 10);
> -        seq_printf(p, "  Local timer interrupts for timer event device\n");
> -
> -	seq_printf(p, "%*s:", prec, "BCT");
> -	for_each_online_cpu(j)
> -		seq_put_decimal_ull_width(p, " ", per_cpu(irq_stat, j).broadcast_irqs_event, 10);
> -	seq_printf(p, "  Broadcast timer interrupts for timer event device\n");
> -
> -	seq_printf(p, "%*s:", prec, "LOC");
> -	for_each_online_cpu(j)
> -		seq_put_decimal_ull_width(p, " ", per_cpu(irq_stat, j).timer_irqs_others, 10);
> -        seq_printf(p, "  Local timer interrupts for others\n");
> -
> -	seq_printf(p, "%*s:", prec, "SPU");
> -	for_each_online_cpu(j)
> -		seq_put_decimal_ull_width(p, " ", per_cpu(irq_stat, j).spurious_irqs, 10);
> -	seq_printf(p, "  Spurious interrupts\n");
> -
> -	seq_printf(p, "%*s:", prec, "PMI");
> -	for_each_online_cpu(j)
> -		seq_put_decimal_ull_width(p, " ", per_cpu(irq_stat, j).pmu_irqs, 10);
> -	seq_printf(p, "  Performance monitoring interrupts\n");
> -
> -	seq_printf(p, "%*s:", prec, "MCE");
> -	for_each_online_cpu(j)
> -		seq_put_decimal_ull_width(p, " ", per_cpu(irq_stat, j).mce_exceptions, 10);
> -	seq_printf(p, "  Machine check exceptions\n");
> -
>   #ifdef CONFIG_PPC_BOOK3S_64
>   	if (cpu_has_feature(CPU_FTR_HVMODE)) {
> +		int j;
>   		seq_printf(p, "%*s:", prec, "HMI");
>   		for_each_online_cpu(j)
>   			seq_put_decimal_ull_width(p, " ", paca_ptrs[j]->hmi_irqs, 10);
>   		seq_printf(p, "  Hypervisor Maintenance Interrupts\n");
>   	}
>   #endif
> -
> -	seq_printf(p, "%*s:", prec, "NMI");
> -	for_each_online_cpu(j)
> -		seq_put_decimal_ull_width(p, " ", per_cpu(irq_stat, j).sreset_irqs, 10);
> -	seq_printf(p, "  System Reset interrupts\n");
> -
> -#ifdef CONFIG_PPC_WATCHDOG
> -	seq_printf(p, "%*s:", prec, "WDG");
> -	for_each_online_cpu(j)
> -		seq_put_decimal_ull_width(p, " ", per_cpu(irq_stat, j).soft_nmi_irqs, 10);
> -	seq_printf(p, "  Watchdog soft-NMI interrupts\n");
> -#endif
> -
> -#ifdef CONFIG_PPC_DOORBELL
> -	if (cpu_has_feature(CPU_FTR_DBELL)) {
> -		seq_printf(p, "%*s:", prec, "DBL");
> -		for_each_online_cpu(j)
> -			seq_put_decimal_ull_width(p, " ", per_cpu(irq_stat, j).doorbell_irqs, 10);
> -		seq_printf(p, "  Doorbell interrupts\n");
> -	}
> -#endif
> -
>   	return 0;
>   }
>   
> @@ -165,24 +143,15 @@ int arch_show_interrupts(struct seq_file *p, int prec)
>    */
>   u64 arch_irq_stat_cpu(unsigned int cpu)
>   {
> -	u64 sum = per_cpu(irq_stat, cpu).timer_irqs_event;
> +	irq_cpustat_t *p = per_cpu_ptr(&irq_stat, cpu);
> +	u64 sum = 0;
> +
> +	for (unsigned int i = 0; i < ARRAY_SIZE(irq_stat_info); i++)
> +		sum += p->counts[i];
>   
> -	sum += per_cpu(irq_stat, cpu).broadcast_irqs_event;
> -	sum += per_cpu(irq_stat, cpu).pmu_irqs;
> -	sum += per_cpu(irq_stat, cpu).mce_exceptions;
> -	sum += per_cpu(irq_stat, cpu).spurious_irqs;
> -	sum += per_cpu(irq_stat, cpu).timer_irqs_others;
>   #ifdef CONFIG_PPC_BOOK3S_64
>   	sum += paca_ptrs[cpu]->hmi_irqs;
>   #endif
> -	sum += per_cpu(irq_stat, cpu).sreset_irqs;
> -#ifdef CONFIG_PPC_WATCHDOG
> -	sum += per_cpu(irq_stat, cpu).soft_nmi_irqs;
> -#endif
> -#ifdef CONFIG_PPC_DOORBELL
> -	sum += per_cpu(irq_stat, cpu).doorbell_irqs;
> -#endif
> -
>   	return sum;
>   }
>   
> @@ -248,7 +217,7 @@ static void __do_irq(struct pt_regs *regs, unsigned long oldsp)
>   
>   	/* And finally process it */
>   	if (unlikely(!irq))
> -		__this_cpu_inc(irq_stat.spurious_irqs);
> +		inc_irq_stat(SPURIOUS);
>   	else
>   		generic_handle_irq(irq);
>   
> diff --git a/arch/powerpc/kernel/time.c b/arch/powerpc/kernel/time.c
> index 4bbeb8644d3d..44da7be36199 100644
> --- a/arch/powerpc/kernel/time.c
> +++ b/arch/powerpc/kernel/time.c
> @@ -572,13 +572,13 @@ DEFINE_INTERRUPT_HANDLER_ASYNC(timer_interrupt)
>   	now = get_tb();
>   	if (now >= *next_tb) {
>   		evt->event_handler(evt);
> -		__this_cpu_inc(irq_stat.timer_irqs_event);
> +		inc_irq_stat(LOC_TIMER);
>   	} else {
>   		now = *next_tb - now;
>   		if (now > decrementer_max)
>   			now = decrementer_max;
>   		set_dec_or_work(now);
> -		__this_cpu_inc(irq_stat.timer_irqs_others);
> +		inc_irq_stat(OTHER_TIMER);
>   	}
>   
>   	trace_timer_interrupt_exit(regs);
> @@ -591,7 +591,7 @@ EXPORT_SYMBOL(timer_interrupt);
>   void timer_broadcast_interrupt(void)
>   {
>   	tick_receive_broadcast();
> -	__this_cpu_inc(irq_stat.broadcast_irqs_event);
> +	inc_irq_stat(BCT_TIMER);
>   }
>   #endif
>   
> diff --git a/arch/powerpc/kernel/traps.c b/arch/powerpc/kernel/traps.c
> index cb8e9357383e..a8f15154bd9a 100644
> --- a/arch/powerpc/kernel/traps.c
> +++ b/arch/powerpc/kernel/traps.c
> @@ -459,8 +459,7 @@ DEFINE_INTERRUPT_HANDLER_NMI(system_reset_exception)
>   	}
>   
>   	hv_nmi_check_nonrecoverable(regs);
> -
> -	__this_cpu_inc(irq_stat.sreset_irqs);
> +	inc_irq_stat(NMI_SRESET);
>   
>   	/* See if any machine dependent calls */
>   	if (ppc_md.system_reset_exception) {
> @@ -817,7 +816,7 @@ static void __machine_check_exception(struct pt_regs *regs)
>   {
>   	int recover = 0;
>   
> -	__this_cpu_inc(irq_stat.mce_exceptions);
> +	inc_irq_stat(MCE);
>   
>   	add_taint(TAINT_MACHINE_CHECK, LOCKDEP_NOW_UNRELIABLE);
>   
> @@ -1932,8 +1931,7 @@ DEFINE_INTERRUPT_HANDLER(vsx_unavailable_tm)
>   DECLARE_INTERRUPT_HANDLER_NMI(performance_monitor_exception_nmi);
>   DEFINE_INTERRUPT_HANDLER_NMI(performance_monitor_exception_nmi)
>   {
> -	__this_cpu_inc(irq_stat.pmu_irqs);
> -
> +	inc_irq_stat(PMI);
>   	perf_irq(regs);
>   
>   	return 0;
> @@ -1943,8 +1941,7 @@ DEFINE_INTERRUPT_HANDLER_NMI(performance_monitor_exception_nmi)
>   DECLARE_INTERRUPT_HANDLER_ASYNC(performance_monitor_exception_async);
>   DEFINE_INTERRUPT_HANDLER_ASYNC(performance_monitor_exception_async)
>   {
> -	__this_cpu_inc(irq_stat.pmu_irqs);
> -
> +	inc_irq_stat(PMI);
>   	perf_irq(regs);
>   }
>   
> diff --git a/arch/powerpc/kernel/watchdog.c b/arch/powerpc/kernel/watchdog.c
> index 764001deb060..f516eeccc9f6 100644
> --- a/arch/powerpc/kernel/watchdog.c
> +++ b/arch/powerpc/kernel/watchdog.c
> @@ -381,7 +381,7 @@ DEFINE_INTERRUPT_HANDLER_NMI(soft_nmi_interrupt)
>   	if (!cpumask_test_cpu(cpu, &wd_cpus_enabled))
>   		return 0;
>   
> -	__this_cpu_inc(irq_stat.soft_nmi_irqs);
> +	inc_irq_stat(WATCHDOG);
>   
>   	tb = get_tb();
>   	if (tb - per_cpu(wd_timer_tb, cpu) >= wd_panic_timeout_tb) {



  reply	other threads:[~2026-05-29  7:46 UTC|newest]

Thread overview: 8+ messages / expand[flat|nested]  mbox.gz  Atom feed  top
2026-05-23 17:40 [PATCH 0/3] powerpc/irq: Use optimizations for /proc/interrupts Shrikanth Hegde
2026-05-23 17:40 ` [PATCH 1/3] powerpc/irq: Move __softirq_pending out of irq_stat Shrikanth Hegde
2026-05-29  7:43   ` Christophe Leroy (CS GROUP)
2026-05-23 17:40 ` [PATCH 2/3] powerpc/irq: Make irqstats array based Shrikanth Hegde
2026-05-29  7:46   ` Christophe Leroy (CS GROUP) [this message]
2026-05-23 17:40 ` [PATCH 3/3] powerpc/irq: Suppress unlikely interrupt stats by default Shrikanth Hegde
2026-05-29  7:51   ` Christophe Leroy (CS GROUP)
2026-05-29  8:09     ` Shrikanth Hegde

Reply instructions:

You may reply publicly to this message via plain-text email
using any one of the following methods:

* Save the following mbox file, import it into your mail client,
  and reply-to-all from there: mbox

  Avoid top-posting and favor interleaved quoting:
  https://en.wikipedia.org/wiki/Posting_style#Interleaved_style

* Reply using the --to, --cc, and --in-reply-to
  switches of git-send-email(1):

  git send-email \
    --in-reply-to=1f0b54f5-1df0-4649-89bc-9ab3a6d9a100@kernel.org \
    --to=chleroy@kernel.org \
    --cc=linux-kernel@vger.kernel.org \
    --cc=linuxppc-dev@lists.ozlabs.org \
    --cc=maddy@linux.ibm.com \
    --cc=sshegde@linux.ibm.com \
    --cc=tglx@kernel.org \
    /path/to/YOUR_REPLY

  https://kernel.org/pub/software/scm/git/docs/git-send-email.html

* If your mail client supports setting the In-Reply-To header
  via mailto: links, try the mailto: link
Be sure your reply has a Subject: header at the top and a blank line before the message body.
This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox