* [PATCH RFC 1/5] dump_stack: Make arch description buffer __ro_after_init
2024-01-18 15:25 [PATCH RFC 0/5] dump_stack: Allow runtime updates of the hardware description Nathan Lynch via B4 Relay
@ 2024-01-18 15:25 ` Nathan Lynch via B4 Relay
2024-01-18 15:25 ` [PATCH RFC 2/5] dump_stack: Allow update of arch description string at runtime Nathan Lynch via B4 Relay
` (3 subsequent siblings)
4 siblings, 0 replies; 6+ messages in thread
From: Nathan Lynch via B4 Relay @ 2024-01-18 15:25 UTC (permalink / raw)
To: Aneesh Kumar K.V, Naveen N. Rao, Brian King, Christophe Leroy,
John Ogness, Michael Ellerman, Nicholas Piggin, Petr Mladek,
Sergey Senozhatsky, Steven Rostedt
Cc: Nathan Lynch, linuxppc-dev, linux-kernel
From: Nathan Lynch <nathanl@linux.ibm.com>
The static hardware description buffer is populated by arch code
during boot and should not change afterwards, so mark it
__ro_after_init.
Signed-off-by: Nathan Lynch <nathanl@linux.ibm.com>
---
lib/dump_stack.c | 3 ++-
1 file changed, 2 insertions(+), 1 deletion(-)
diff --git a/lib/dump_stack.c b/lib/dump_stack.c
index 83471e81501a..1057f102f6f2 100644
--- a/lib/dump_stack.c
+++ b/lib/dump_stack.c
@@ -6,6 +6,7 @@
#include <linux/kernel.h>
#include <linux/buildid.h>
+#include <linux/cache.h>
#include <linux/export.h>
#include <linux/sched.h>
#include <linux/sched/debug.h>
@@ -15,7 +16,7 @@
#include <linux/utsname.h>
#include <linux/stop_machine.h>
-static char dump_stack_arch_desc_str[128];
+static char dump_stack_arch_desc_str[128] __ro_after_init;
/**
* dump_stack_set_arch_desc - set arch-specific str to show with task dumps
--
2.43.0
^ permalink raw reply related [flat|nested] 6+ messages in thread
* [PATCH RFC 2/5] dump_stack: Allow update of arch description string at runtime
2024-01-18 15:25 [PATCH RFC 0/5] dump_stack: Allow runtime updates of the hardware description Nathan Lynch via B4 Relay
2024-01-18 15:25 ` [PATCH RFC 1/5] dump_stack: Make arch description buffer __ro_after_init Nathan Lynch via B4 Relay
@ 2024-01-18 15:25 ` Nathan Lynch via B4 Relay
2024-01-18 15:25 ` [PATCH RFC 3/5] powerpc/prom: Add CPU info to hardware description string later Nathan Lynch via B4 Relay
` (2 subsequent siblings)
4 siblings, 0 replies; 6+ messages in thread
From: Nathan Lynch via B4 Relay @ 2024-01-18 15:25 UTC (permalink / raw)
To: Aneesh Kumar K.V, Naveen N. Rao, Brian King, Christophe Leroy,
John Ogness, Michael Ellerman, Nicholas Piggin, Petr Mladek,
Sergey Senozhatsky, Steven Rostedt
Cc: Nathan Lynch, linuxppc-dev, linux-kernel
From: Nathan Lynch <nathanl@linux.ibm.com>
The IBM PowerVM platform (targeted by powerpc/pseries) exposes the
physical machine model and firmware version to partitions (guests),
and this information is used to populate the arch description string,
e.g.
IBM,8408-E8E POWER8E (raw) 0x4b0201 0xf000004 \
of:IBM,FW860.50 (SV860_146) hv:phyp pSeries
The platform supports live migration of partitions between different
machine models and firmware versions, so the arch description string
set at boot can become inaccurate, potentially misleading anyone who's
analyzing stack traces produced after a migration.
Introduce an RCU-guarded pointer to the current arch description
string, initializing it to the static buffer populated at boot. Add to
dump_stack_print_info() an RCU read-side critical section that accesses
the buffer through this pointer. The majority of architectures which
don't need to update the string after boot incur only an additional
indirection.
As for platforms which do need that ability, they can use
dump_stack_update_arch_desc(), which allocates and formats a new
buffer, updates the pointer, and if appropriate frees the previous
buffer.
Signed-off-by: Nathan Lynch <nathanl@linux.ibm.com>
---
include/linux/printk.h | 5 +++++
lib/dump_stack.c | 54 ++++++++++++++++++++++++++++++++++++++++++++++----
2 files changed, 55 insertions(+), 4 deletions(-)
diff --git a/include/linux/printk.h b/include/linux/printk.h
index 8ef499ab3c1e..6138ae019d2a 100644
--- a/include/linux/printk.h
+++ b/include/linux/printk.h
@@ -187,6 +187,7 @@ u32 log_buf_len_get(void);
void log_buf_vmcoreinfo_setup(void);
void __init setup_log_buf(int early);
__printf(1, 2) void dump_stack_set_arch_desc(const char *fmt, ...);
+__printf(1, 2) void dump_stack_update_arch_desc(const char *fmt, ...);
void dump_stack_print_info(const char *log_lvl);
void show_regs_print_info(const char *log_lvl);
extern asmlinkage void dump_stack_lvl(const char *log_lvl) __cold;
@@ -253,6 +254,10 @@ static inline __printf(1, 2) void dump_stack_set_arch_desc(const char *fmt, ...)
{
}
+static inline __printf(1, 2) void dump_stack_update_arch_desc(const char *fmt, ...)
+{
+}
+
static inline void dump_stack_print_info(const char *log_lvl)
{
}
diff --git a/lib/dump_stack.c b/lib/dump_stack.c
index 1057f102f6f2..bd497e7797ee 100644
--- a/lib/dump_stack.c
+++ b/lib/dump_stack.c
@@ -8,15 +8,18 @@
#include <linux/buildid.h>
#include <linux/cache.h>
#include <linux/export.h>
+#include <linux/rcupdate.h>
#include <linux/sched.h>
#include <linux/sched/debug.h>
#include <linux/smp.h>
+#include <linux/spinlock.h>
#include <linux/atomic.h>
#include <linux/kexec.h>
#include <linux/utsname.h>
#include <linux/stop_machine.h>
static char dump_stack_arch_desc_str[128] __ro_after_init;
+static const char *dump_stack_arch_desc_ptr = dump_stack_arch_desc_str;
/**
* dump_stack_set_arch_desc - set arch-specific str to show with task dumps
@@ -28,7 +31,7 @@ static char dump_stack_arch_desc_str[128] __ro_after_init;
* arch wants to make use of such an ID string, it should initialize this
* as soon as possible during boot.
*/
-void __init dump_stack_set_arch_desc(const char *fmt, ...)
+void dump_stack_set_arch_desc(const char *fmt, ...)
{
va_list args;
@@ -38,6 +41,45 @@ void __init dump_stack_set_arch_desc(const char *fmt, ...)
va_end(args);
}
+/**
+ * dump_stack_update_arch_desc() - Update the arch description string at runtime.
+ * @fmt: printf-style format string
+ * @...: arguments for the format string
+ *
+ * A runtime counterpart of dump_stack_set_arch_desc(). Arch code
+ * should use this when the arch description set at boot potentially
+ * has become inaccurate, such as after a guest migration.
+ *
+ * Context: May sleep.
+ */
+void dump_stack_update_arch_desc(const char *fmt, ...)
+{
+ static DEFINE_SPINLOCK(arch_desc_update_lock);
+ const char *old;
+ const char *new;
+ va_list args;
+
+ va_start(args, fmt);
+ new = kvasprintf(GFP_KERNEL, fmt, args);
+ va_end(args);
+
+ if (!new)
+ return;
+
+ spin_lock(&arch_desc_update_lock);
+ old = rcu_replace_pointer(dump_stack_arch_desc_ptr, new,
+ lockdep_is_held(&arch_desc_update_lock));
+ spin_unlock(&arch_desc_update_lock);
+
+ /*
+ * Avoid freeing the static buffer initialized during boot.
+ */
+ if (old == dump_stack_arch_desc_str)
+ return;
+
+ kfree_rcu_mightsleep(old);
+}
+
#if IS_ENABLED(CONFIG_STACKTRACE_BUILD_ID)
#define BUILD_ID_FMT " %20phN"
#define BUILD_ID_VAL vmlinux_build_id
@@ -55,6 +97,8 @@ void __init dump_stack_set_arch_desc(const char *fmt, ...)
*/
void dump_stack_print_info(const char *log_lvl)
{
+ const char *arch_str;
+
printk("%sCPU: %d PID: %d Comm: %.20s %s%s %s %.*s" BUILD_ID_FMT "\n",
log_lvl, raw_smp_processor_id(), current->pid, current->comm,
kexec_crash_loaded() ? "Kdump: loaded " : "",
@@ -63,9 +107,11 @@ void dump_stack_print_info(const char *log_lvl)
(int)strcspn(init_utsname()->version, " "),
init_utsname()->version, BUILD_ID_VAL);
- if (dump_stack_arch_desc_str[0] != '\0')
- printk("%sHardware name: %s\n",
- log_lvl, dump_stack_arch_desc_str);
+ rcu_read_lock();
+ arch_str = rcu_dereference(dump_stack_arch_desc_ptr);
+ if (arch_str[0] != '\0')
+ printk("%sHardware name: %s\n", log_lvl, arch_str);
+ rcu_read_unlock();
print_worker_info(log_lvl, current);
print_stop_info(log_lvl, current);
--
2.43.0
^ permalink raw reply related [flat|nested] 6+ messages in thread
* [PATCH RFC 3/5] powerpc/prom: Add CPU info to hardware description string later
2024-01-18 15:25 [PATCH RFC 0/5] dump_stack: Allow runtime updates of the hardware description Nathan Lynch via B4 Relay
2024-01-18 15:25 ` [PATCH RFC 1/5] dump_stack: Make arch description buffer __ro_after_init Nathan Lynch via B4 Relay
2024-01-18 15:25 ` [PATCH RFC 2/5] dump_stack: Allow update of arch description string at runtime Nathan Lynch via B4 Relay
@ 2024-01-18 15:25 ` Nathan Lynch via B4 Relay
2024-01-18 15:25 ` [PATCH RFC 4/5] powerpc/pseries: Prepare pseries_add_hw_description() for runtime use Nathan Lynch via B4 Relay
2024-01-18 15:25 ` [PATCH RFC 5/5] powerpc/pseries: Update hardware description string after migration Nathan Lynch via B4 Relay
4 siblings, 0 replies; 6+ messages in thread
From: Nathan Lynch via B4 Relay @ 2024-01-18 15:25 UTC (permalink / raw)
To: Aneesh Kumar K.V, Naveen N. Rao, Brian King, Christophe Leroy,
John Ogness, Michael Ellerman, Nicholas Piggin, Petr Mladek,
Sergey Senozhatsky, Steven Rostedt
Cc: Nathan Lynch, linuxppc-dev, linux-kernel
From: Nathan Lynch <nathanl@linux.ibm.com>
cur_cpu_spec->cpu_name is appended to ppc_hw_desc before cur_cpu_spec
has taken on its final value. This is illustrated on pseries by
comparing the CPU name as reported at boot ("POWER8E (raw)") to the
contents of /proc/cpuinfo ("POWER8 (architected)"):
$ dmesg | grep Hardware
Hardware name: IBM,8408-E8E POWER8E (raw) 0x4b0201 0xf000004 \
of:IBM,FW860.50 (SV860_146) hv:phyp pSeries
$ grep -m 1 ^cpu /proc/cpuinfo
cpu : POWER8 (architected), altivec supported
Some 44x models would appear to be affected as well; see
identical_pvr_fixup().
This results in incorrect CPU information in stack dumps --
ppc_hw_desc is an input to dump_stack_set_arch_desc().
Delay gathering the CPU name until after all potential calls to
identify_cpu().
Signed-off-by: Nathan Lynch <nathanl@linux.ibm.com>
Fixes: bd649d40e0f2 ("powerpc: Add PVR & CPU name to hardware description")
---
arch/powerpc/kernel/prom.c | 12 ++++++++----
1 file changed, 8 insertions(+), 4 deletions(-)
diff --git a/arch/powerpc/kernel/prom.c b/arch/powerpc/kernel/prom.c
index 0b5878c3125b..c12b4434336f 100644
--- a/arch/powerpc/kernel/prom.c
+++ b/arch/powerpc/kernel/prom.c
@@ -327,6 +327,7 @@ static int __init early_init_dt_scan_cpus(unsigned long node,
void *data)
{
const char *type = of_get_flat_dt_prop(node, "device_type", NULL);
+ const __be32 *cpu_version = NULL;
const __be32 *prop;
const __be32 *intserv;
int i, nthreads;
@@ -398,7 +399,7 @@ static int __init early_init_dt_scan_cpus(unsigned long node,
prop = of_get_flat_dt_prop(node, "cpu-version", NULL);
if (prop && (be32_to_cpup(prop) & 0xff000000) == 0x0f000000) {
identify_cpu(0, be32_to_cpup(prop));
- seq_buf_printf(&ppc_hw_desc, "0x%04x ", be32_to_cpup(prop));
+ cpu_version = prop;
}
check_cpu_feature_properties(node);
@@ -409,6 +410,12 @@ static int __init early_init_dt_scan_cpus(unsigned long node,
}
identical_pvr_fixup(node);
+
+ // We can now add the CPU name & PVR to the hardware description
+ seq_buf_printf(&ppc_hw_desc, "%s 0x%04lx ", cur_cpu_spec->cpu_name, mfspr(SPRN_PVR));
+ if (cpu_version)
+ seq_buf_printf(&ppc_hw_desc, "0x%04x ", be32_to_cpup(cpu_version));
+
init_mmu_slb_size(node);
#ifdef CONFIG_PPC64
@@ -846,9 +853,6 @@ void __init early_init_devtree(void *params)
dt_cpu_ftrs_scan();
- // We can now add the CPU name & PVR to the hardware description
- seq_buf_printf(&ppc_hw_desc, "%s 0x%04lx ", cur_cpu_spec->cpu_name, mfspr(SPRN_PVR));
-
/* Retrieve CPU related informations from the flat tree
* (altivec support, boot CPU ID, ...)
*/
--
2.43.0
^ permalink raw reply related [flat|nested] 6+ messages in thread
* [PATCH RFC 4/5] powerpc/pseries: Prepare pseries_add_hw_description() for runtime use
2024-01-18 15:25 [PATCH RFC 0/5] dump_stack: Allow runtime updates of the hardware description Nathan Lynch via B4 Relay
` (2 preceding siblings ...)
2024-01-18 15:25 ` [PATCH RFC 3/5] powerpc/prom: Add CPU info to hardware description string later Nathan Lynch via B4 Relay
@ 2024-01-18 15:25 ` Nathan Lynch via B4 Relay
2024-01-18 15:25 ` [PATCH RFC 5/5] powerpc/pseries: Update hardware description string after migration Nathan Lynch via B4 Relay
4 siblings, 0 replies; 6+ messages in thread
From: Nathan Lynch via B4 Relay @ 2024-01-18 15:25 UTC (permalink / raw)
To: Aneesh Kumar K.V, Naveen N. Rao, Brian King, Christophe Leroy,
John Ogness, Michael Ellerman, Nicholas Piggin, Petr Mladek,
Sergey Senozhatsky, Steven Rostedt
Cc: Nathan Lynch, linuxppc-dev, linux-kernel
From: Nathan Lynch <nathanl@linux.ibm.com>
pseries_add_hw_description() will be used after boot to update the
hardware description string emitted in stack dumps. Remove the __init
and make it take a seq_buf * parameter instead of referencing
ppc_hw_desc directly.
Signed-off-by: Nathan Lynch <nathanl@linux.ibm.com>
---
arch/powerpc/platforms/pseries/setup.c | 10 +++++-----
1 file changed, 5 insertions(+), 5 deletions(-)
diff --git a/arch/powerpc/platforms/pseries/setup.c b/arch/powerpc/platforms/pseries/setup.c
index ecea85c74c43..9ae1951f8312 100644
--- a/arch/powerpc/platforms/pseries/setup.c
+++ b/arch/powerpc/platforms/pseries/setup.c
@@ -1007,7 +1007,7 @@ static void __init pSeries_cmo_feature_init(void)
pr_debug(" <- fw_cmo_feature_init()\n");
}
-static void __init pseries_add_hw_description(void)
+static void pseries_add_hw_description(struct seq_buf *sb)
{
struct device_node *dn;
const char *s;
@@ -1015,7 +1015,7 @@ static void __init pseries_add_hw_description(void)
dn = of_find_node_by_path("/openprom");
if (dn) {
if (of_property_read_string(dn, "model", &s) == 0)
- seq_buf_printf(&ppc_hw_desc, "of:%s ", s);
+ seq_buf_printf(sb, "of:%s ", s);
of_node_put(dn);
}
@@ -1023,7 +1023,7 @@ static void __init pseries_add_hw_description(void)
dn = of_find_node_by_path("/hypervisor");
if (dn) {
if (of_property_read_string(dn, "compatible", &s) == 0)
- seq_buf_printf(&ppc_hw_desc, "hv:%s ", s);
+ seq_buf_printf(sb, "hv:%s ", s);
of_node_put(dn);
return;
@@ -1031,7 +1031,7 @@ static void __init pseries_add_hw_description(void)
if (of_property_read_bool(of_root, "ibm,powervm-partition") ||
of_property_read_bool(of_root, "ibm,fw-net-version"))
- seq_buf_printf(&ppc_hw_desc, "hv:phyp ");
+ seq_buf_printf(sb, "hv:phyp ");
}
/*
@@ -1041,7 +1041,7 @@ static void __init pseries_init(void)
{
pr_debug(" -> pseries_init()\n");
- pseries_add_hw_description();
+ pseries_add_hw_description(&ppc_hw_desc);
#ifdef CONFIG_HVC_CONSOLE
if (firmware_has_feature(FW_FEATURE_LPAR))
--
2.43.0
^ permalink raw reply related [flat|nested] 6+ messages in thread
* [PATCH RFC 5/5] powerpc/pseries: Update hardware description string after migration
2024-01-18 15:25 [PATCH RFC 0/5] dump_stack: Allow runtime updates of the hardware description Nathan Lynch via B4 Relay
` (3 preceding siblings ...)
2024-01-18 15:25 ` [PATCH RFC 4/5] powerpc/pseries: Prepare pseries_add_hw_description() for runtime use Nathan Lynch via B4 Relay
@ 2024-01-18 15:25 ` Nathan Lynch via B4 Relay
4 siblings, 0 replies; 6+ messages in thread
From: Nathan Lynch via B4 Relay @ 2024-01-18 15:25 UTC (permalink / raw)
To: Aneesh Kumar K.V, Naveen N. Rao, Brian King, Christophe Leroy,
John Ogness, Michael Ellerman, Nicholas Piggin, Petr Mladek,
Sergey Senozhatsky, Steven Rostedt
Cc: Nathan Lynch, linuxppc-dev, linux-kernel
From: Nathan Lynch <nathanl@linux.ibm.com>
Introduce code that rebuilds the short hardware description printed in
stack traces. This partly duplicates code that runs at boot (mainly in
prom.c), but that code populates the string as early as possible using
APIs that aren't available later. So sharing all the code between the
boot and runtime versions isn't feasible.
To prevent "drift" between the boot and runtime versions, rebuild the
description using the new runtime APIs in a late initcall and warn if
it doesn't match the one built earlier. The initcall also invokes
dump_stack_update_arch_desc() twice to fully exercise it before any
partition migration occurs. These checks could be dropped or made
configurable later.
Call pseries_update_hw_description() immediately after updating the
device tree when resuming from a partition migration.
Signed-off-by: Nathan Lynch <nathanl@linux.ibm.com>
---
arch/powerpc/platforms/pseries/mobility.c | 5 +++
arch/powerpc/platforms/pseries/pseries.h | 1 +
arch/powerpc/platforms/pseries/setup.c | 70 +++++++++++++++++++++++++++++++
3 files changed, 76 insertions(+)
diff --git a/arch/powerpc/platforms/pseries/mobility.c b/arch/powerpc/platforms/pseries/mobility.c
index 1798f0f14d58..ff573cb5aee5 100644
--- a/arch/powerpc/platforms/pseries/mobility.c
+++ b/arch/powerpc/platforms/pseries/mobility.c
@@ -378,6 +378,11 @@ void post_mobility_fixup(void)
rc = pseries_devicetree_update(MIGRATION_SCOPE);
if (rc)
pr_err("device tree update failed: %d\n", rc);
+ /*
+ * Rebuild the hardware description printed in stack traces
+ * using the updated device tree.
+ */
+ pseries_update_hw_description();
cacheinfo_rebuild();
diff --git a/arch/powerpc/platforms/pseries/pseries.h b/arch/powerpc/platforms/pseries/pseries.h
index bba4ad192b0f..810a64fccc7e 100644
--- a/arch/powerpc/platforms/pseries/pseries.h
+++ b/arch/powerpc/platforms/pseries/pseries.h
@@ -56,6 +56,7 @@ extern int dlpar_acquire_drc(u32 drc_index);
extern int dlpar_release_drc(u32 drc_index);
extern int dlpar_unisolate_drc(u32 drc_index);
extern void post_mobility_fixup(void);
+void pseries_update_hw_description(void);
void queue_hotplug_event(struct pseries_hp_errorlog *hp_errlog);
int handle_dlpar_errorlog(struct pseries_hp_errorlog *hp_errlog);
diff --git a/arch/powerpc/platforms/pseries/setup.c b/arch/powerpc/platforms/pseries/setup.c
index 9ae1951f8312..72177411026e 100644
--- a/arch/powerpc/platforms/pseries/setup.c
+++ b/arch/powerpc/platforms/pseries/setup.c
@@ -1034,6 +1034,76 @@ static void pseries_add_hw_description(struct seq_buf *sb)
seq_buf_printf(sb, "hv:phyp ");
}
+static void pseries_rebuild_hw_desc(struct seq_buf *sb)
+{
+ struct device_node *cpudn, *root;
+ const char *model;
+ u32 cpu_version;
+
+ seq_buf_clear(sb);
+
+ root = of_find_node_by_path("/");
+ if (!of_property_read_string(root, "model", &model))
+ seq_buf_printf(sb, "%s ", model);
+ of_node_put(root);
+
+ seq_buf_printf(sb, "%s 0x%04lx ", cur_cpu_spec->cpu_name, mfspr(SPRN_PVR));
+
+ cpudn = of_get_next_cpu_node(NULL);
+ if (!of_property_read_u32(cpudn, "cpu-version", &cpu_version)) {
+ if ((cpu_version & 0xff000000) == 0x0f000000)
+ seq_buf_printf(sb, "0x%04x ", cpu_version);
+ }
+ of_node_put(cpudn);
+
+ pseries_add_hw_description(sb);
+
+ seq_buf_puts(sb, ppc_md.name);
+}
+
+void pseries_update_hw_description(void)
+{
+ struct seq_buf sb = { // todo: use DECLARE_SEQ_BUF() once it's fixed
+ .buffer = (char[128]) { 0 },
+ .size = sizeof(char[128]),
+ };
+
+ pseries_rebuild_hw_desc(&sb);
+ dump_stack_update_arch_desc("%s", seq_buf_str(&sb));
+}
+
+static int __init pseries_test_update_hw_desc(void)
+{
+ struct seq_buf sb = { // todo: use DECLARE_SEQ_BUF() once it's fixed
+ .buffer = (char[128]) { 0 },
+ .size = sizeof(char[128]),
+ };
+ bool mismatch;
+
+ /*
+ * Ensure the rebuilt description matches the one built during
+ * boot.
+ */
+ pseries_rebuild_hw_desc(&sb);
+
+ mismatch = strcmp(seq_buf_str(&ppc_hw_desc), seq_buf_str(&sb));
+ if (WARN(mismatch, "rebuilt hardware description string mismatch")) {
+ pr_err(" boot: '%s'\n", ppc_hw_desc.buffer);
+ pr_err(" runtime: '%s'\n", sb.buffer);
+ return -EINVAL;
+ }
+
+ /*
+ * Invoke dump_stack_update_arch_desc() *twice* to ensure it
+ * exercises the free path.
+ */
+ dump_stack_update_arch_desc("%s", sb.buffer);
+ dump_stack_update_arch_desc("%s", sb.buffer);
+
+ return 0;
+}
+late_initcall(pseries_test_update_hw_desc);
+
/*
* Early initialization. Relocation is on but do not reference unbolted pages
*/
--
2.43.0
^ permalink raw reply related [flat|nested] 6+ messages in thread