* [PATCH] apic: use GFP_ATOMIC in lapic_resume
@ 2010-12-28 6:48 Zhang Rui
2010-12-28 7:00 ` David Rientjes
0 siblings, 1 reply; 7+ messages in thread
From: Zhang Rui @ 2010-12-28 6:48 UTC (permalink / raw)
To: H. Peter Anvin; +Cc: LKML
The sysdev .suspend/.resume callbacks are invoked with IRQs disabled,
so GFP_ATOMIC must be used for the allocations done in lapic_resume.
Without this patch, I get the following warning messages after resume:
[ 109.780371] BUG: sleeping function called from invalid context at mm/slub.c:793
[ 109.780782] in_atomic(): 0, irqs_disabled(): 1, pid: 1391, name: bash
[ 109.781024] Pid: 1391, comm: bash Not tainted 2.6.37-rc5+ #182
[ 109.781264] Call Trace:
[ 109.781501] [<ffffffff8104156a>] __might_sleep+0xeb/0xf0
[ 109.781743] [<ffffffff8110d5e2>] slab_pre_alloc_hook.clone.33+0x28/0x31
[ 109.781987] [<ffffffff8110dcef>] __kmalloc+0x88/0x115
[ 109.782224] [<ffffffff81025e4a>] ? kzalloc.clone.19+0x13/0x15
[ 109.782465] [<ffffffff81025e4a>] kzalloc.clone.19+0x13/0x15
[ 109.782704] [<ffffffff81025ff0>] alloc_ioapic_entries+0x20/0x82
[ 109.782948] [<ffffffff81024201>] lapic_resume+0x3a/0x245
[ 109.783189] [<ffffffff813a8329>] ? cpufreq_resume+0x30/0xb0
[ 109.783431] [<ffffffff812ec4ee>] __sysdev_resume+0x25/0xc5
[ 109.783673] [<ffffffff812ec644>] sysdev_resume+0xb6/0xfb
[ 109.783914] [<ffffffff81083256>] suspend_devices_and_enter+0x13c/0x1c1
[ 109.784159] [<ffffffff810833b8>] enter_state+0xdd/0x12e
[ 109.784398] [<ffffffff81082a61>] state_store+0xae/0xcb
[ 109.784640] [<ffffffff81225737>] kobj_attr_store+0x17/0x19
[ 109.784882] [<ffffffff81173311>] sysfs_write_file+0x114/0x150
[ 109.785124] [<ffffffff8111aebb>] vfs_write+0xac/0xff
[ 109.785365] [<ffffffff8111b0c2>] sys_write+0x4a/0x6e
[ 109.785604] [<ffffffff8100ac82>] system_call_fastpath+0x16/0x1b
Signed-off-by: Zhang Rui <rui.zhang@intel.com>
---
arch/x86/include/asm/io_apic.h | 2 +-
arch/x86/kernel/apic/apic.c | 4 ++--
arch/x86/kernel/apic/io_apic.c | 7 +++----
3 files changed, 6 insertions(+), 7 deletions(-)
Index: linux-2.6/arch/x86/kernel/apic/io_apic.c
===================================================================
--- linux-2.6.orig/arch/x86/kernel/apic/io_apic.c
+++ linux-2.6/arch/x86/kernel/apic/io_apic.c
@@ -589,20 +589,19 @@ static int __init ioapic_pirq_setup(char
__setup("pirq=", ioapic_pirq_setup);
#endif /* CONFIG_X86_32 */
-struct IO_APIC_route_entry **alloc_ioapic_entries(void)
+struct IO_APIC_route_entry **alloc_ioapic_entries(gfp_t flags)
{
int apic;
struct IO_APIC_route_entry **ioapic_entries;
- ioapic_entries = kzalloc(sizeof(*ioapic_entries) * nr_ioapics,
- GFP_KERNEL);
+ ioapic_entries = kzalloc(sizeof(*ioapic_entries) * nr_ioapics, flags);
if (!ioapic_entries)
return 0;
for (apic = 0; apic < nr_ioapics; apic++) {
ioapic_entries[apic] =
kzalloc(sizeof(struct IO_APIC_route_entry) *
- nr_ioapic_registers[apic], GFP_KERNEL);
+ nr_ioapic_registers[apic], flags);
if (!ioapic_entries[apic])
goto nomem;
}
Index: linux-2.6/arch/x86/include/asm/io_apic.h
===================================================================
--- linux-2.6.orig/arch/x86/include/asm/io_apic.h
+++ linux-2.6/arch/x86/include/asm/io_apic.h
@@ -162,7 +162,7 @@ void setup_IO_APIC_irq_extra(u32 gsi);
extern void ioapic_init_mappings(void);
extern void ioapic_insert_resources(void);
-extern struct IO_APIC_route_entry **alloc_ioapic_entries(void);
+extern struct IO_APIC_route_entry **alloc_ioapic_entries(gfp_t flags);
extern void free_ioapic_entries(struct IO_APIC_route_entry **ioapic_entries);
extern int save_IO_APIC_setup(struct IO_APIC_route_entry **ioapic_entries);
extern void mask_IO_APIC_setup(struct IO_APIC_route_entry **ioapic_entries);
Index: linux-2.6/arch/x86/kernel/apic/apic.c
===================================================================
--- linux-2.6.orig/arch/x86/kernel/apic/apic.c
+++ linux-2.6/arch/x86/kernel/apic/apic.c
@@ -1459,7 +1459,7 @@ void __init enable_IR_x2apic(void)
if (dmar_table_init_ret && !x2apic_supported())
return;
- ioapic_entries = alloc_ioapic_entries();
+ ioapic_entries = alloc_ioapic_entries(GFP_KERNEL);
if (!ioapic_entries) {
pr_err("Allocate ioapic_entries failed\n");
goto out;
@@ -2084,7 +2084,7 @@ static int lapic_resume(struct sys_devic
local_irq_save(flags);
if (intr_remapping_enabled) {
- ioapic_entries = alloc_ioapic_entries();
+ ioapic_entries = alloc_ioapic_entries(GFP_ATOMIC);
if (!ioapic_entries) {
WARN(1, "Alloc ioapic_entries in lapic resume failed.");
ret = -ENOMEM;
^ permalink raw reply [flat|nested] 7+ messages in thread* Re: [PATCH] apic: use GFP_ATOMIC in lapic_resume 2010-12-28 6:48 [PATCH] apic: use GFP_ATOMIC in lapic_resume Zhang Rui @ 2010-12-28 7:00 ` David Rientjes 2010-12-28 7:22 ` Zhang Rui 0 siblings, 1 reply; 7+ messages in thread From: David Rientjes @ 2010-12-28 7:00 UTC (permalink / raw) To: Zhang Rui; +Cc: H. Peter Anvin, LKML On Tue, 28 Dec 2010, Zhang Rui wrote: > Index: linux-2.6/arch/x86/kernel/apic/apic.c > =================================================================== > --- linux-2.6.orig/arch/x86/kernel/apic/apic.c > +++ linux-2.6/arch/x86/kernel/apic/apic.c > @@ -1459,7 +1459,7 @@ void __init enable_IR_x2apic(void) > if (dmar_table_init_ret && !x2apic_supported()) > return; > > - ioapic_entries = alloc_ioapic_entries(); > + ioapic_entries = alloc_ioapic_entries(GFP_KERNEL); > if (!ioapic_entries) { > pr_err("Allocate ioapic_entries failed\n"); > goto out; > @@ -2084,7 +2084,7 @@ static int lapic_resume(struct sys_devic > > local_irq_save(flags); > if (intr_remapping_enabled) { > - ioapic_entries = alloc_ioapic_entries(); > + ioapic_entries = alloc_ioapic_entries(GFP_ATOMIC); > if (!ioapic_entries) { > WARN(1, "Alloc ioapic_entries in lapic resume failed."); > ret = -ENOMEM; You can't do the allocation before disabling irqs when intr_remapping_enabled is set? ^ permalink raw reply [flat|nested] 7+ messages in thread
* Re: [PATCH] apic: use GFP_ATOMIC in lapic_resume 2010-12-28 7:00 ` David Rientjes @ 2010-12-28 7:22 ` Zhang Rui 2010-12-28 7:39 ` David Rientjes 0 siblings, 1 reply; 7+ messages in thread From: Zhang Rui @ 2010-12-28 7:22 UTC (permalink / raw) To: David Rientjes; +Cc: H. Peter Anvin, LKML, Rafael J. Wysocki On Tue, 2010-12-28 at 15:00 +0800, David Rientjes wrote: > On Tue, 28 Dec 2010, Zhang Rui wrote: > > > Index: linux-2.6/arch/x86/kernel/apic/apic.c > > =================================================================== > > --- linux-2.6.orig/arch/x86/kernel/apic/apic.c > > +++ linux-2.6/arch/x86/kernel/apic/apic.c > > @@ -1459,7 +1459,7 @@ void __init enable_IR_x2apic(void) > > if (dmar_table_init_ret && !x2apic_supported()) > > return; > > > > - ioapic_entries = alloc_ioapic_entries(); > > + ioapic_entries = alloc_ioapic_entries(GFP_KERNEL); > > if (!ioapic_entries) { > > pr_err("Allocate ioapic_entries failed\n"); > > goto out; > > @@ -2084,7 +2084,7 @@ static int lapic_resume(struct sys_devic > > > > local_irq_save(flags); > > if (intr_remapping_enabled) { > > - ioapic_entries = alloc_ioapic_entries(); > > + ioapic_entries = alloc_ioapic_entries(GFP_ATOMIC); > > if (!ioapic_entries) { > > WARN(1, "Alloc ioapic_entries in lapic resume failed."); > > ret = -ENOMEM; > > You can't do the allocation before disabling irqs when > intr_remapping_enabled is set? yes, we can. The first idea came into my mind is to register a pm notifier callback to allocate/free the memory. But that one duplicates the code of alloc_ioapic_entries, which doesn't look nice, neither. Plus, is there any problem with this one? thanks, rui > -- > To unsubscribe from this list: send the line "unsubscribe linux-kernel" in > the body of a message to majordomo@vger.kernel.org > More majordomo info at http://vger.kernel.org/majordomo-info.html > Please read the FAQ at http://www.tux.org/lkml/ ^ permalink raw reply [flat|nested] 7+ messages in thread
* Re: [PATCH] apic: use GFP_ATOMIC in lapic_resume 2010-12-28 7:22 ` Zhang Rui @ 2010-12-28 7:39 ` David Rientjes 2010-12-28 7:56 ` Zhang Rui 0 siblings, 1 reply; 7+ messages in thread From: David Rientjes @ 2010-12-28 7:39 UTC (permalink / raw) To: Zhang Rui; +Cc: H. Peter Anvin, LKML, Rafael J. Wysocki On Tue, 28 Dec 2010, Zhang Rui wrote: > > > Index: linux-2.6/arch/x86/kernel/apic/apic.c > > > =================================================================== > > > --- linux-2.6.orig/arch/x86/kernel/apic/apic.c > > > +++ linux-2.6/arch/x86/kernel/apic/apic.c > > > @@ -1459,7 +1459,7 @@ void __init enable_IR_x2apic(void) > > > if (dmar_table_init_ret && !x2apic_supported()) > > > return; > > > > > > - ioapic_entries = alloc_ioapic_entries(); > > > + ioapic_entries = alloc_ioapic_entries(GFP_KERNEL); > > > if (!ioapic_entries) { > > > pr_err("Allocate ioapic_entries failed\n"); > > > goto out; > > > @@ -2084,7 +2084,7 @@ static int lapic_resume(struct sys_devic > > > > > > local_irq_save(flags); > > > if (intr_remapping_enabled) { > > > - ioapic_entries = alloc_ioapic_entries(); > > > + ioapic_entries = alloc_ioapic_entries(GFP_ATOMIC); > > > if (!ioapic_entries) { > > > WARN(1, "Alloc ioapic_entries in lapic resume failed."); > > > ret = -ENOMEM; > > > > You can't do the allocation before disabling irqs when > > intr_remapping_enabled is set? > > yes, we can. The first idea came into my mind is to register a pm > notifier callback to allocate/free the memory. But that one duplicates > the code of alloc_ioapic_entries, which doesn't look nice, neither. > Plus, is there any problem with this one? > We try to avoid GFP_ATOMIC whenever possible and this seems like a particularly trivial case. You can simply move the alloc_ioapic_entries() and NULL check before local_irq_save() and GFP_KERNEL will work fine. ^ permalink raw reply [flat|nested] 7+ messages in thread
* Re: [PATCH] apic: use GFP_ATOMIC in lapic_resume 2010-12-28 7:39 ` David Rientjes @ 2010-12-28 7:56 ` Zhang Rui 2010-12-28 8:48 ` Zhang Rui 0 siblings, 1 reply; 7+ messages in thread From: Zhang Rui @ 2010-12-28 7:56 UTC (permalink / raw) To: David Rientjes; +Cc: H. Peter Anvin, LKML, Rafael J. Wysocki On Tue, 2010-12-28 at 15:39 +0800, David Rientjes wrote: > On Tue, 28 Dec 2010, Zhang Rui wrote: > > > > > Index: linux-2.6/arch/x86/kernel/apic/apic.c > > > > =================================================================== > > > > --- linux-2.6.orig/arch/x86/kernel/apic/apic.c > > > > +++ linux-2.6/arch/x86/kernel/apic/apic.c > > > > @@ -1459,7 +1459,7 @@ void __init enable_IR_x2apic(void) > > > > if (dmar_table_init_ret && !x2apic_supported()) > > > > return; > > > > > > > > - ioapic_entries = alloc_ioapic_entries(); > > > > + ioapic_entries = alloc_ioapic_entries(GFP_KERNEL); > > > > if (!ioapic_entries) { > > > > pr_err("Allocate ioapic_entries failed\n"); > > > > goto out; > > > > @@ -2084,7 +2084,7 @@ static int lapic_resume(struct sys_devic > > > > > > > > local_irq_save(flags); > > > > if (intr_remapping_enabled) { > > > > - ioapic_entries = alloc_ioapic_entries(); > > > > + ioapic_entries = alloc_ioapic_entries(GFP_ATOMIC); > > > > if (!ioapic_entries) { > > > > WARN(1, "Alloc ioapic_entries in lapic resume failed."); > > > > ret = -ENOMEM; > > > > > > You can't do the allocation before disabling irqs when > > > intr_remapping_enabled is set? > > > > yes, we can. The first idea came into my mind is to register a pm > > notifier callback to allocate/free the memory. But that one duplicates > > the code of alloc_ioapic_entries, which doesn't look nice, neither. > > Plus, is there any problem with this one? > > > > We try to avoid GFP_ATOMIC whenever possible and this seems like a > particularly trivial case. You can simply move the alloc_ioapic_entries() > and NULL check before local_irq_save() and GFP_KERNEL will work fine. I'm afraid not. 
lapic_resume is invoked in sysdev_resume, which is done with irqs disabled; please refer to the code in kernel/power/suspend.c. arch_suspend_disable_irqs(); BUG_ON(!irqs_disabled()); error = sysdev_suspend(PMSG_SUSPEND); if (!error) { if (!suspend_test(TEST_CORE) && pm_check_wakeup_events()) { error = suspend_ops->enter(state); events_check_enabled = false; } sysdev_resume(); } arch_suspend_enable_irqs(); BUG_ON(irqs_disabled()); To pre-allocate the memory, we need to build a notifier block and call register_pm_notifier. thanks, rui > -- > To unsubscribe from this list: send the line "unsubscribe linux-kernel" in > the body of a message to majordomo@vger.kernel.org > More majordomo info at http://vger.kernel.org/majordomo-info.html > Please read the FAQ at http://www.tux.org/lkml/ ^ permalink raw reply [flat|nested] 7+ messages in thread
* Re: [PATCH] apic: use GFP_ATOMIC in lapic_resume 2010-12-28 7:56 ` Zhang Rui @ 2010-12-28 8:48 ` Zhang Rui 2010-12-28 9:57 ` Rafael J. Wysocki 0 siblings, 1 reply; 7+ messages in thread From: Zhang Rui @ 2010-12-28 8:48 UTC (permalink / raw) To: David Rientjes; +Cc: H. Peter Anvin, LKML, Rafael J. Wysocki On Tue, 2010-12-28 at 15:56 +0800, Zhang Rui wrote: > On Tue, 2010-12-28 at 15:39 +0800, David Rientjes wrote: > > On Tue, 28 Dec 2010, Zhang Rui wrote: > > > > > > > Index: linux-2.6/arch/x86/kernel/apic/apic.c > > > > > =================================================================== > > > > > --- linux-2.6.orig/arch/x86/kernel/apic/apic.c > > > > > +++ linux-2.6/arch/x86/kernel/apic/apic.c > > > > > @@ -1459,7 +1459,7 @@ void __init enable_IR_x2apic(void) > > > > > if (dmar_table_init_ret && !x2apic_supported()) > > > > > return; > > > > > > > > > > - ioapic_entries = alloc_ioapic_entries(); > > > > > + ioapic_entries = alloc_ioapic_entries(GFP_KERNEL); > > > > > if (!ioapic_entries) { > > > > > pr_err("Allocate ioapic_entries failed\n"); > > > > > goto out; > > > > > @@ -2084,7 +2084,7 @@ static int lapic_resume(struct sys_devic > > > > > > > > > > local_irq_save(flags); > > > > > if (intr_remapping_enabled) { > > > > > - ioapic_entries = alloc_ioapic_entries(); > > > > > + ioapic_entries = alloc_ioapic_entries(GFP_ATOMIC); > > > > > if (!ioapic_entries) { > > > > > WARN(1, "Alloc ioapic_entries in lapic resume failed."); > > > > > ret = -ENOMEM; > > > > > > > > You can't do the allocation before disabling irqs when > > > > intr_remapping_enabled is set? > > > > > > yes, we can. The first idea came into my mind is to register a pm > > > notifier callback to allocate/free the memory. But that one duplicates > > > the code of alloc_ioapic_entries, which doesn't look nice, neither. > > > Plus, is there any problem with this one? > > > > > > > We try to avoid GFP_ATOMIC whenever possible and this seems like a > > particularly trivial case. 
You can simply move the alloc_ioapic_entries() > > and NULL check before local_irq_save() and GFP_KERNEL will work fine. > > I'm afraid not. > lapic_resume is invoked in sysdev_resume, which is done with irq > disabled, please refer to the code in kernel/power/suspend.c. > > arch_suspend_disable_irqs(); > BUG_ON(!irqs_disabled()); > > error = sysdev_suspend(PMSG_SUSPEND); > if (!error) { > if (!suspend_test(TEST_CORE) && > pm_check_wakeup_events()) { > error = suspend_ops->enter(state); > events_check_enabled = false; > } > sysdev_resume(); > } > > arch_suspend_enable_irqs(); > BUG_ON(irqs_disabled()); > > To pre-allocate the memory, we need to build a notifier bloack and call > register_pm_notifier. what about this one? Note that it just builds okay, I have not test the patch yet. pre-allocate the memory used in lapic_resume because lapic_resume, as a sysdev .resume callback, is always invoked with irq disabled. Without this patch, I got the following warning messages after resume. [ 109.780371] BUG: sleeping function called from invalid context at mm/slub.c:793 [ 109.780782] in_atomic(): 0, irqs_disabled(): 1, pid: 1391, name: bash [ 109.781024] Pid: 1391, comm: bash Not tainted 2.6.37-rc5+ #182 [ 109.781264] Call Trace: [ 109.781501] [<ffffffff8104156a>] __might_sleep+0xeb/0xf0 [ 109.781743] [<ffffffff8110d5e2>] slab_pre_alloc_hook.clone.33 +0x28/0x31 [ 109.781987] [<ffffffff8110dcef>] __kmalloc+0x88/0x115 [ 109.782224] [<ffffffff81025e4a>] ? kzalloc.clone.19+0x13/0x15 [ 109.782465] [<ffffffff81025e4a>] kzalloc.clone.19+0x13/0x15 [ 109.782704] [<ffffffff81025ff0>] alloc_ioapic_entries+0x20/0x82 [ 109.782948] [<ffffffff81024201>] lapic_resume+0x3a/0x245 [ 109.783189] [<ffffffff813a8329>] ? 
cpufreq_resume+0x30/0xb0 [ 109.783431] [<ffffffff812ec4ee>] __sysdev_resume+0x25/0xc5 [ 109.783673] [<ffffffff812ec644>] sysdev_resume+0xb6/0xfb [ 109.783914] [<ffffffff81083256>] suspend_devices_and_enter +0x13c/0x1c1 [ 109.784159] [<ffffffff810833b8>] enter_state+0xdd/0x12e [ 109.784398] [<ffffffff81082a61>] state_store+0xae/0xcb [ 109.784640] [<ffffffff81225737>] kobj_attr_store+0x17/0x19 [ 109.784882] [<ffffffff81173311>] sysfs_write_file+0x114/0x150 [ 109.785124] [<ffffffff8111aebb>] vfs_write+0xac/0xff [ 109.785365] [<ffffffff8111b0c2>] sys_write+0x4a/0x6e [ 109.785604] [<ffffffff8100ac82>] system_call_fastpath+0x16/0x1b Signed-off-by: Zhang Rui <rui.zhang@intel.com> --- arch/x86/kernel/apic/apic.c | 38 +++++++++++++++++++++++++++++++++----- 1 file changed, 33 insertions(+), 5 deletions(-) Index: linux-2.6/arch/x86/kernel/apic/apic.c =================================================================== --- linux-2.6.orig/arch/x86/kernel/apic/apic.c +++ linux-2.6/arch/x86/kernel/apic/apic.c @@ -34,6 +34,7 @@ #include <linux/nmi.h> #include <linux/smp.h> #include <linux/mm.h> +#include <linux/suspend.h> #include <asm/perf_event.h> #include <asm/x86_init.h> @@ -2033,6 +2034,34 @@ static struct { unsigned int apic_thmr; } apic_pm_state; +static struct IO_APIC_route_entry **ioapic_entries; + +static int lapic_notifier_cb(struct notifier_block *nb, + unsigned long val, void *unused) +{ + switch(val) { + case PM_HIBERNATION_PREPARE: + case PM_SUSPEND_PREPARE: + case PM_RESTORE_PREPARE: + ioapic_entries = alloc_ioapic_entries(); + if (!ioapic_entries) + return NOTIFY_BAD; + return NOTIFY_OK; + case PM_POST_HIBERNATION: + case PM_POST_SUSPEND: + case PM_POST_RESTORE: + free_ioapic_entries(ioapic_entries); + ioapic_entries = NULL; + return NOTIFY_OK; + } + return NOTIFY_BAD; +} + +static struct notifier_block lapic_pm_nb = { + .notifier_call = lapic_notifier_cb, + .priority = 0, +}; + static int lapic_suspend(struct sys_device *dev, pm_message_t state) { unsigned long 
flags; @@ -2077,14 +2106,12 @@ static int lapic_resume(struct sys_devic unsigned long flags; int maxlvt; int ret = 0; - struct IO_APIC_route_entry **ioapic_entries = NULL; if (!apic_pm_state.active) return 0; local_irq_save(flags); if (intr_remapping_enabled) { - ioapic_entries = alloc_ioapic_entries(); if (!ioapic_entries) { WARN(1, "Alloc ioapic_entries in lapic resume failed."); ret = -ENOMEM; @@ -2094,7 +2121,6 @@ static int lapic_resume(struct sys_devic ret = save_IO_APIC_setup(ioapic_entries); if (ret) { WARN(1, "Saving IO-APIC state failed: %d\n", ret); - free_ioapic_entries(ioapic_entries); goto restore; } @@ -2145,7 +2171,6 @@ static int lapic_resume(struct sys_devic reenable_intr_remapping(x2apic_mode); legacy_pic->restore_mask(); restore_IO_APIC_setup(ioapic_entries); - free_ioapic_entries(ioapic_entries); } restore: local_irq_restore(flags); @@ -2183,8 +2208,11 @@ static int __init init_lapic_sysfs(void) /* XXX: remove suspend/resume procs if !apic_pm_state.active? */ error = sysdev_class_register(&lapic_sysclass); - if (!error) + if (!error) { error = sysdev_register(&device_lapic); + if (!error) + error = register_pm_notifier(&lapic_pm_nb); + } return error; } ^ permalink raw reply [flat|nested] 7+ messages in thread
* Re: [PATCH] apic: use GFP_ATOMIC in lapic_resume 2010-12-28 8:48 ` Zhang Rui @ 2010-12-28 9:57 ` Rafael J. Wysocki 0 siblings, 0 replies; 7+ messages in thread From: Rafael J. Wysocki @ 2010-12-28 9:57 UTC (permalink / raw) To: Zhang Rui; +Cc: David Rientjes, H. Peter Anvin, LKML On Tuesday, December 28, 2010, Zhang Rui wrote: > On Tue, 2010-12-28 at 15:56 +0800, Zhang Rui wrote: > > On Tue, 2010-12-28 at 15:39 +0800, David Rientjes wrote: > > > On Tue, 28 Dec 2010, Zhang Rui wrote: > > > > > > > > > Index: linux-2.6/arch/x86/kernel/apic/apic.c > > > > > > =================================================================== > > > > > > --- linux-2.6.orig/arch/x86/kernel/apic/apic.c > > > > > > +++ linux-2.6/arch/x86/kernel/apic/apic.c > > > > > > @@ -1459,7 +1459,7 @@ void __init enable_IR_x2apic(void) > > > > > > if (dmar_table_init_ret && !x2apic_supported()) > > > > > > return; > > > > > > > > > > > > - ioapic_entries = alloc_ioapic_entries(); > > > > > > + ioapic_entries = alloc_ioapic_entries(GFP_KERNEL); > > > > > > if (!ioapic_entries) { > > > > > > pr_err("Allocate ioapic_entries failed\n"); > > > > > > goto out; > > > > > > @@ -2084,7 +2084,7 @@ static int lapic_resume(struct sys_devic > > > > > > > > > > > > local_irq_save(flags); > > > > > > if (intr_remapping_enabled) { > > > > > > - ioapic_entries = alloc_ioapic_entries(); > > > > > > + ioapic_entries = alloc_ioapic_entries(GFP_ATOMIC); > > > > > > if (!ioapic_entries) { > > > > > > WARN(1, "Alloc ioapic_entries in lapic resume failed."); > > > > > > ret = -ENOMEM; > > > > > > > > > > You can't do the allocation before disabling irqs when > > > > > intr_remapping_enabled is set? > > > > > > > > yes, we can. The first idea came into my mind is to register a pm > > > > notifier callback to allocate/free the memory. But that one duplicates > > > > the code of alloc_ioapic_entries, which doesn't look nice, neither. > > > > Plus, is there any problem with this one? 
> > > > > > > > > > We try to avoid GFP_ATOMIC whenever possible and this seems like a > > > particularly trivial case. You can simply move the alloc_ioapic_entries() > > > and NULL check before local_irq_save() and GFP_KERNEL will work fine. > > > > I'm afraid not. > > lapic_resume is invoked in sysdev_resume, which is done with irq > > disabled, please refer to the code in kernel/power/suspend.c. > > > > arch_suspend_disable_irqs(); > > BUG_ON(!irqs_disabled()); > > > > error = sysdev_suspend(PMSG_SUSPEND); > > if (!error) { > > if (!suspend_test(TEST_CORE) && > > pm_check_wakeup_events()) { > > error = suspend_ops->enter(state); > > events_check_enabled = false; > > } > > sysdev_resume(); > > } > > > > arch_suspend_enable_irqs(); > > BUG_ON(irqs_disabled()); > > > > To pre-allocate the memory, we need to build a notifier bloack and call > > register_pm_notifier. > > what about this one? Quite frankly, I very much prefer the simple patch doing an atomic allocation. Using GFP_KERNEL in a sysdev callback is a plain bug and should be fixed, preferably in the simplest possible way (ie. replace GFP_KERNEL with GFP_ATOMIC). The question whether or not we can avoid allocating memory in there is a different one and I'm not sure if the solution below is the most straightforward one. Thanks, Rafael > Note that it just builds okay, I have not test the patch yet. > > pre-allocate the memory used in lapic_resume because lapic_resume, as a > sysdev .resume callback, is always invoked with irq disabled. > > Without this patch, I got the following warning messages after resume. 
> [ 109.780371] BUG: sleeping function called from invalid context at > mm/slub.c:793 > [ 109.780782] in_atomic(): 0, irqs_disabled(): 1, pid: 1391, name: bash > [ 109.781024] Pid: 1391, comm: bash Not tainted 2.6.37-rc5+ #182 > [ 109.781264] Call Trace: > [ 109.781501] [<ffffffff8104156a>] __might_sleep+0xeb/0xf0 > [ 109.781743] [<ffffffff8110d5e2>] slab_pre_alloc_hook.clone.33 > +0x28/0x31 > [ 109.781987] [<ffffffff8110dcef>] __kmalloc+0x88/0x115 > [ 109.782224] [<ffffffff81025e4a>] ? kzalloc.clone.19+0x13/0x15 > [ 109.782465] [<ffffffff81025e4a>] kzalloc.clone.19+0x13/0x15 > [ 109.782704] [<ffffffff81025ff0>] alloc_ioapic_entries+0x20/0x82 > [ 109.782948] [<ffffffff81024201>] lapic_resume+0x3a/0x245 > [ 109.783189] [<ffffffff813a8329>] ? cpufreq_resume+0x30/0xb0 > [ 109.783431] [<ffffffff812ec4ee>] __sysdev_resume+0x25/0xc5 > [ 109.783673] [<ffffffff812ec644>] sysdev_resume+0xb6/0xfb > [ 109.783914] [<ffffffff81083256>] suspend_devices_and_enter > +0x13c/0x1c1 > [ 109.784159] [<ffffffff810833b8>] enter_state+0xdd/0x12e > [ 109.784398] [<ffffffff81082a61>] state_store+0xae/0xcb > [ 109.784640] [<ffffffff81225737>] kobj_attr_store+0x17/0x19 > [ 109.784882] [<ffffffff81173311>] sysfs_write_file+0x114/0x150 > [ 109.785124] [<ffffffff8111aebb>] vfs_write+0xac/0xff > [ 109.785365] [<ffffffff8111b0c2>] sys_write+0x4a/0x6e > [ 109.785604] [<ffffffff8100ac82>] system_call_fastpath+0x16/0x1b > > Signed-off-by: Zhang Rui <rui.zhang@intel.com> > --- > arch/x86/kernel/apic/apic.c | 38 +++++++++++++++++++++++++++++++++----- > 1 file changed, 33 insertions(+), 5 deletions(-) > > Index: linux-2.6/arch/x86/kernel/apic/apic.c > =================================================================== > --- linux-2.6.orig/arch/x86/kernel/apic/apic.c > +++ linux-2.6/arch/x86/kernel/apic/apic.c > @@ -34,6 +34,7 @@ > #include <linux/nmi.h> > #include <linux/smp.h> > #include <linux/mm.h> > +#include <linux/suspend.h> > > #include <asm/perf_event.h> > #include <asm/x86_init.h> > @@ -2033,6 
+2034,34 @@ static struct { > unsigned int apic_thmr; > } apic_pm_state; > > +static struct IO_APIC_route_entry **ioapic_entries; > + > +static int lapic_notifier_cb(struct notifier_block *nb, > + unsigned long val, void *unused) > +{ > + switch(val) { > + case PM_HIBERNATION_PREPARE: > + case PM_SUSPEND_PREPARE: > + case PM_RESTORE_PREPARE: > + ioapic_entries = alloc_ioapic_entries(); > + if (!ioapic_entries) > + return NOTIFY_BAD; > + return NOTIFY_OK; > + case PM_POST_HIBERNATION: > + case PM_POST_SUSPEND: > + case PM_POST_RESTORE: > + free_ioapic_entries(ioapic_entries); > + ioapic_entries = NULL; > + return NOTIFY_OK; > + } > + return NOTIFY_BAD; > +} > + > +static struct notifier_block lapic_pm_nb = { > + .notifier_call = lapic_notifier_cb, > + .priority = 0, > +}; > + > static int lapic_suspend(struct sys_device *dev, pm_message_t state) > { > unsigned long flags; > @@ -2077,14 +2106,12 @@ static int lapic_resume(struct sys_devic > unsigned long flags; > int maxlvt; > int ret = 0; > - struct IO_APIC_route_entry **ioapic_entries = NULL; > > if (!apic_pm_state.active) > return 0; > > local_irq_save(flags); > if (intr_remapping_enabled) { > - ioapic_entries = alloc_ioapic_entries(); > if (!ioapic_entries) { > WARN(1, "Alloc ioapic_entries in lapic resume failed."); > ret = -ENOMEM; > @@ -2094,7 +2121,6 @@ static int lapic_resume(struct sys_devic > ret = save_IO_APIC_setup(ioapic_entries); > if (ret) { > WARN(1, "Saving IO-APIC state failed: %d\n", ret); > - free_ioapic_entries(ioapic_entries); > goto restore; > } > > @@ -2145,7 +2171,6 @@ static int lapic_resume(struct sys_devic > reenable_intr_remapping(x2apic_mode); > legacy_pic->restore_mask(); > restore_IO_APIC_setup(ioapic_entries); > - free_ioapic_entries(ioapic_entries); > } > restore: > local_irq_restore(flags); > @@ -2183,8 +2208,11 @@ static int __init init_lapic_sysfs(void) > /* XXX: remove suspend/resume procs if !apic_pm_state.active? 
*/ > > error = sysdev_class_register(&lapic_sysclass); > - if (!error) > + if (!error) { > error = sysdev_register(&device_lapic); > + if (!error) > + error = register_pm_notifier(&lapic_pm_nb); > + } > return error; > } > > > > > ^ permalink raw reply [flat|nested] 7+ messages in thread
end of thread, other threads:[~2010-12-28 9:58 UTC | newest] Thread overview: 7+ messages (download: mbox.gz follow: Atom feed -- links below jump to the message on this page -- 2010-12-28 6:48 [PATCH] apic: use GFP_ATOMIC in lapic_resume Zhang Rui 2010-12-28 7:00 ` David Rientjes 2010-12-28 7:22 ` Zhang Rui 2010-12-28 7:39 ` David Rientjes 2010-12-28 7:56 ` Zhang Rui 2010-12-28 8:48 ` Zhang Rui 2010-12-28 9:57 ` Rafael J. Wysocki
This is an external index of several public inboxes, see mirroring instructions on how to clone and mirror all data and code used by this external index.