Provide local_irq_{save,restore}_nmi() which will allow us to help architectures that implement NMIs using IRQ priorities like SPARC64 does. Sparc uses IRQ prio 15 for NMIs and implements local_irq_disable() as disable <= 14. However if you do that while inside an NMI you re- enable the NMI priority again, causing all kinds of fun. A more solid implementation would first check the disable level and never lower it, however that is more costly and would slow down the rest of the kernel for no particular reason. Therefore introduce local_irq_save_nmi() which can implement this slower but more solid scheme and dis-allow local_irq_save() from NMI context. Suggested-by: David Miller Signed-off-by: Peter Zijlstra --- include/linux/irqflags.h | 51 ++++++++++++++++++++++++++++++++++++++++--- kernel/lockdep.c | 7 +++++ kernel/trace/trace_irqsoff.c | 8 ++++++ 3 files changed, 63 insertions(+), 3 deletions(-) Index: linux-2.6/include/linux/irqflags.h =================================================================== --- linux-2.6.orig/include/linux/irqflags.h +++ linux-2.6/include/linux/irqflags.h @@ -18,6 +18,7 @@ extern void trace_softirqs_off(unsigned long ip); extern void trace_hardirqs_on(void); extern void trace_hardirqs_off(void); + extern void trace_hardirqs_off_no_nmi(void); # define trace_hardirq_context(p) ((p)->hardirq_context) # define trace_softirq_context(p) ((p)->softirq_context) # define trace_hardirqs_enabled(p) ((p)->hardirqs_enabled) @@ -30,6 +31,7 @@ #else # define trace_hardirqs_on() do { } while (0) # define trace_hardirqs_off() do { } while (0) +# define trace_hardirqs_off_no_nmi() do { } while (0) # define trace_softirqs_on(ip) do { } while (0) # define trace_softirqs_off(ip) do { } while (0) # define trace_hardirq_context(p) 0 @@ -59,15 +61,15 @@ #define local_irq_enable() \ do { trace_hardirqs_on(); raw_local_irq_enable(); } while (0) #define local_irq_disable() \ - do { raw_local_irq_disable(); trace_hardirqs_off(); } while (0) + do { raw_local_irq_disable(); trace_hardirqs_off_no_nmi(); } while (0) + #define local_irq_save(flags) \ do { \ typecheck(unsigned long, flags); \ raw_local_irq_save(flags); \ - trace_hardirqs_off(); \ + trace_hardirqs_off_no_nmi(); \ } while (0) - #define local_irq_restore(flags) \ do { \ typecheck(unsigned long, flags); \ @@ -79,6 +81,30 @@ raw_local_irq_restore(flags); \ } \ } while (0) + +#ifndef local_irq_save_nmi +# define local_irq_save_nmi(flags) \ + do { \ + typecheck(unsigned long, flags); \ + raw_local_irq_save(flags); \ + trace_hardirqs_off(); \ + } while (0) +#endif + +#ifndef local_irq_restore_nmi +#define local_irq_restore_nmi(flags) \ + do { \ + typecheck(unsigned long, flags); \ + if (raw_irqs_disabled_flags(flags)) { \ + raw_local_irq_restore(flags); \ + trace_hardirqs_off(); \ + } else { \ + trace_hardirqs_on(); \ + raw_local_irq_restore(flags); \ + } \ + } while (0) +#endif + #else /* !CONFIG_TRACE_IRQFLAGS_SUPPORT */ /* * The local_irq_*() APIs are equal to the raw_local_irq*() @@ -86,16 +112,35 @@ */ # define raw_local_irq_disable() local_irq_disable() # define raw_local_irq_enable() local_irq_enable() + # define raw_local_irq_save(flags) \ do { \ typecheck(unsigned long, flags); \ local_irq_save(flags); \ } while (0) + # define raw_local_irq_restore(flags) \ do { \ typecheck(unsigned long, flags); \ local_irq_restore(flags); \ } while (0) + +#ifndef local_irq_save_nmi +# define local_irq_save_nmi(flags) \ + do { \ + typecheck(unsigned long, flags); \ + local_irq_save(flags); \ + } while (0) +#endif + +#ifndef local_irq_restore_nmi +# define local_irq_restore_nmi(flags) \ + do { \ + typecheck(unsigned long, flags); \ + local_irq_restore(flags); \ + } while (0) +#endif + #endif /* CONFIG_TRACE_IRQFLAGS_SUPPORT */ #ifdef CONFIG_TRACE_IRQFLAGS_SUPPORT Index: linux-2.6/kernel/lockdep.c =================================================================== --- linux-2.6.orig/kernel/lockdep.c +++ linux-2.6/kernel/lockdep.c @@ -2369,6 +2369,13 @@ void trace_hardirqs_off(void) } EXPORT_SYMBOL(trace_hardirqs_off); +void trace_hardirqs_off_no_nmi(void) +{ + WARN_ON_ONCE(in_nmi()); + trace_hardirqs_off_caller(CALLER_ADDR0); +} +EXPORT_SYMBOL(trace_hardirqs_off_no_nmi); + /* * Softirqs will be enabled: */ Index: linux-2.6/kernel/trace/trace_irqsoff.c =================================================================== --- linux-2.6.orig/kernel/trace/trace_irqsoff.c +++ linux-2.6/kernel/trace/trace_irqsoff.c @@ -316,6 +316,14 @@ void trace_hardirqs_off(void) } EXPORT_SYMBOL(trace_hardirqs_off); +void trace_hardirqs_off_no_nmi(void) +{ + WARN_ON_ONCE(in_nmi()); + if (!preempt_trace() && irq_trace()) + start_critical_timing(CALLER_ADDR0, CALLER_ADDR1); +} +EXPORT_SYMBOL(trace_hardirqs_off_no_nmi); + void trace_hardirqs_on_caller(unsigned long caller_addr) { if (!preempt_trace() && irq_trace()) -- To unsubscribe from this list: send the line "unsubscribe linux-kernel" in the body of a message to majordomo@vger.kernel.org More majordomo info at http://vger.kernel.org/majordomo-info.html Please read the FAQ at http://www.tux.org/lkml/