From: Nicholas Piggin <npiggin@gmail.com>
To: linux-alpha@vger.kernel.org
Cc: Nicholas Piggin <npiggin@gmail.com>,
Richard Henderson <richard.henderson@linaro.org>,
Ivan Kokshaysky <ink@jurassic.park.msu.ru>,
Matt Turner <mattst88@gmail.com>,
Linus Torvalds <torvalds@linux-foundation.org>
Subject: [RFC PATCH 2/6] alpha: implement simple mm_cpumask TLB flush filter
Date: Thu, 25 May 2023 03:18:18 +1000 [thread overview]
Message-ID: <20230524171822.177133-3-npiggin@gmail.com> (raw)
In-Reply-To: <20230524171822.177133-1-npiggin@gmail.com>
Implement a sticky mm_cpumask and use it to filter TLB flush IPIs.
Sticky meaning that when an mm runs on a CPU, it gets set in the mask
and never goes away. This is the "base" mm_cpumask implementation that
comes with the least complexity.
This reduces IPIs booting into a small rootfs by about 10-15% on 4CPU
system.
Signed-off-by: Nicholas Piggin <npiggin@gmail.com>
---
arch/alpha/include/asm/mmu_context.h | 19 +++++++++++++++++++
arch/alpha/kernel/smp.c | 16 ++++++++++++++--
arch/alpha/mm/init.c | 2 ++
3 files changed, 35 insertions(+), 2 deletions(-)
diff --git a/arch/alpha/include/asm/mmu_context.h b/arch/alpha/include/asm/mmu_context.h
index 8ce89350e4b3..9c9e9a8c01a4 100644
--- a/arch/alpha/include/asm/mmu_context.h
+++ b/arch/alpha/include/asm/mmu_context.h
@@ -135,6 +135,21 @@ ev5_switch_mm(struct mm_struct *prev_mm, struct mm_struct *next_mm,
#ifdef CONFIG_SMP
cpu_data[cpu].asn_lock = 1;
barrier();
+
+ if (!cpumask_test_cpu(cpu, mm_cpumask(next_mm))) {
+ cpumask_set_cpu(cpu, mm_cpumask(next_mm));
+ /*
+ * Store to mm_cpumask must be visible to CPUs performing
+ * TLB flushes before memory accesses that could bring in
+ * new TLB entries. This orders the store above with the
+ * load of the new context and subsequent loads of PTEs
+ * that can then be cached in the TLB.
+ *
+ * The other side is in the mm_cpumask testing in TLB
+ * flush.
+ */
+ smp_mb();
+ }
#endif
asn = cpu_last_asn(cpu);
mmc = next_mm->context[cpu];
@@ -151,6 +166,8 @@ ev5_switch_mm(struct mm_struct *prev_mm, struct mm_struct *next_mm,
a new mm->context (via flush_tlb_mm) without the ASN serial
number wrapping. We have no way to detect when this is needed. */
task_thread_info(next)->pcb.asn = mmc & HARDWARE_ASN_MASK;
+
+ WARN_ON(!cpumask_test_cpu(cpu, mm_cpumask(prev_mm)));
}
static inline void
@@ -195,12 +212,14 @@ do { \
static inline void
ev5_activate_mm(struct mm_struct *prev_mm, struct mm_struct *next_mm)
{
+ cpumask_set_cpu(smp_processor_id(), mm_cpumask(next_mm));
__load_new_mm_context(next_mm);
}
static inline void
ev4_activate_mm(struct mm_struct *prev_mm, struct mm_struct *next_mm)
{
+ cpumask_set_cpu(smp_processor_id(), mm_cpumask(next_mm));
__load_new_mm_context(next_mm);
tbiap();
}
diff --git a/arch/alpha/kernel/smp.c b/arch/alpha/kernel/smp.c
index 7439b2377df5..b702372fbaba 100644
--- a/arch/alpha/kernel/smp.c
+++ b/arch/alpha/kernel/smp.c
@@ -145,6 +145,7 @@ smp_callin(void)
/* All kernel threads share the same mm context. */
mmgrab(&init_mm);
current->active_mm = &init_mm;
+ cpumask_set_cpu(smp_processor_id(), mm_cpumask(&init_mm));
/* inform the notifiers about the new cpu */
notify_cpu_starting(cpuid);
@@ -655,7 +656,17 @@ flush_tlb_mm(struct mm_struct *mm)
}
}
- smp_call_function(ipi_flush_tlb_mm, mm, 1);
+ /*
+ * TLB flush IPIs will be sent to all CPUs with mm_cpumask set. The
+ * problem of ordering the load of mm_cpumask vs a CPU switching to
+ * the mm and caching a translation from a PTE being invalidated and
+ * flushed here means we must have a memory barrier. This orders the
+ * prior stores to invalidate the PTEs from the load of mm_cpumask.
+ *
+ * The other side is switch_mm.
+ */
+ smp_mb();
+ smp_call_function_many(mm_cpumask(mm), ipi_flush_tlb_mm, mm, 1);
preempt_enable();
}
@@ -706,7 +717,8 @@ flush_tlb_page(struct vm_area_struct *vma, unsigned long addr)
data.mm = mm;
data.addr = addr;
- smp_call_function(ipi_flush_tlb_page, &data, 1);
+ smp_mb(); /* see flush_tlb_mm */
+ smp_call_function_many(mm_cpumask(mm), ipi_flush_tlb_page, &data, 1);
preempt_enable();
}
diff --git a/arch/alpha/mm/init.c b/arch/alpha/mm/init.c
index a155180d7a83..33f4c0abd2c8 100644
--- a/arch/alpha/mm/init.c
+++ b/arch/alpha/mm/init.c
@@ -254,6 +254,8 @@ void __init paging_init(void)
/* Initialize the kernel's ZERO_PGE. */
memset(absolute_pointer(ZERO_PGE), 0, PAGE_SIZE);
+
+ cpumask_set_cpu(raw_smp_processor_id(), mm_cpumask(&init_mm));
}
#if defined(CONFIG_ALPHA_GENERIC) || defined(CONFIG_ALPHA_SRM)
--
2.40.1
next prev parent reply other threads:[~2023-05-24 17:18 UTC|newest]
Thread overview: 12+ messages / expand[flat|nested] mbox.gz Atom feed top
2023-05-24 17:18 [RFC PATCH 0/6] Implement MMU_LAZY_TLB_SHOOTDOWN for alpha Nicholas Piggin
2023-05-24 17:18 ` [RFC PATCH 1/6] alpha: remove extern inline from mmu_context Nicholas Piggin
2023-05-24 17:18 ` Nicholas Piggin [this message]
2023-05-24 17:18 ` [RFC PATCH 3/6] alpha: remove TLB flushing mm_users special case Nicholas Piggin
2023-05-24 17:18 ` [RFC PATCH 4/6] alpha: clean mm_cpumask when flushing TLBs Nicholas Piggin
2023-06-02 22:33 ` Matt Turner
2023-09-06 1:39 ` Matt Turner
2023-05-24 17:18 ` [RFC PATCH 5/6] alpha: enable MMU_LAZY_TLB_SHOOTDOWN Nicholas Piggin
2023-05-24 17:18 ` [RFC PATCH 6/6] alpha: shoot the lazy tlb mm when flushing TLBs Nicholas Piggin
2023-05-24 17:27 ` [RFC PATCH 0/6] Implement MMU_LAZY_TLB_SHOOTDOWN for alpha Linus Torvalds
2023-05-24 17:52 ` Matt Turner
2023-05-29 1:45 ` Nicholas Piggin
Reply instructions:
You may reply publicly to this message via plain-text email
using any one of the following methods:
* Save the following mbox file, import it into your mail client,
and reply-to-all from there: mbox
Avoid top-posting and favor interleaved quoting:
https://en.wikipedia.org/wiki/Posting_style#Interleaved_style
* Reply using the --to, --cc, and --in-reply-to
switches of git-send-email(1):
git send-email \
--in-reply-to=20230524171822.177133-3-npiggin@gmail.com \
--to=npiggin@gmail.com \
--cc=ink@jurassic.park.msu.ru \
--cc=linux-alpha@vger.kernel.org \
--cc=mattst88@gmail.com \
--cc=richard.henderson@linaro.org \
--cc=torvalds@linux-foundation.org \
/path/to/YOUR_REPLY
https://kernel.org/pub/software/scm/git/docs/git-send-email.html
* If your mail client supports setting the In-Reply-To header
via mailto: links, try the mailto: link
Be sure your reply has a Subject: header at the top and a blank line
before the message body.
This is an external index of several public inboxes,
see mirroring instructions on how to clone and mirror
all data and code used by this external index.