On Wed, 22 Apr 2015 16:42:12 -0700 Dave Hansen <d...@sr71.net> wrote:
> > There has been a glut of tough debug issues lately that all come > back to the xsave code. This trace point helped us find and fix > a long-lived bug today, just from the data it showed. > > But, the xsave operations are in a header and they're inlined all > over the place. Including a tracepoint header in to another header > is causing some interesting issues. > > For instance arch/x86/kvm/x86.c's CREATE_TRACE_POINTS comes before > the last #include, so it tried to create *MY* tracepoints too. It > also looks like we need to be extra careful to #undef our > TRACE_SYSTEM, TRACE_INCLUDE_FILE, TRACE_INCLUDE_PATH #defines for > each trace header, or risk seeing them double-defined. Yeah, tracepoints really should not be used in header files, or for static inlines for that matter. A "trace_foo()" expands into a bit of code, that should not be called all over the place. It just bloats the kernel. One solution is to hard code a jump label and do: extern struct tracepoint __tracepoint_foo; [...] if (static_key_false(&__tracepoint_foo.key)) { call_trace_foo(x); Where call_trace_foo(x) is a function that does the tracepoint for foo: void call_trace_foo(arg x) { trace_foo(x); } This way you still get the benefit of the "zero" overhead of a disabled tracepoint, but you also avoid include hell and keep all tracepoint code out of headers. -- Steve > > I'm also seeing some odd redefinition warnings. When I go look at > ftrace_event.h:609, I don't see anything remotely xsave or FPU > related: > > arch/x86/mm/built-in.o: In function `perf_trace_buf_submit': > include/linux/ftrace_event.h:609: multiple definition of > `__tracepoint_cpu_state_xsave' > arch/x86/kernel/built-in.o:(__tracepoints+0x5c0): first defined here > arch/x86/mm/built-in.o: In function `perf_fetch_caller_regs': > include/linux/perf_event.h:688: multiple definition of > `__tracepoint_cpu_state_xrstor' > arch/x86/kernel/built-in.o:linux.git/arch/x86/kernel/process_64.c:256: first > defined here > make[2]: *** [arch/x86/built-in.o] Error 1 > > Am I doing something wrong? Are there good alternatives for when > we want to trace something that's done in a header? > > Cc: Steven Rostedt <rost...@goodmis.org> > Cc: Ingo Molnar <mi...@redhat.com> > Cc: a...@linux.intel.com > > --- > > b/arch/x86/include/asm/fpu-internal.h | 8 +- > b/arch/x86/include/asm/trace/cpustate.h | 105 > ++++++++++++++++++++++++++++++++ > b/arch/x86/include/asm/trace/mpx.h | 1 > b/arch/x86/include/asm/xsave.h | 15 +++- > b/arch/x86/kernel/xsave.c | 24 +++++++ > b/arch/x86/kvm/x86.c | 6 - > b/include/trace/events/syscalls.h | 3 > 7 files changed, 155 insertions(+), 7 deletions(-) > > diff -puN arch/x86/include/asm/fpu-internal.h~xsave-trace-0 > arch/x86/include/asm/fpu-internal.h > --- a/arch/x86/include/asm/fpu-internal.h~xsave-trace-0 2015-04-22 > 16:30:57.151296546 -0700 > +++ b/arch/x86/include/asm/fpu-internal.h 2015-04-22 16:31:19.482303717 > -0700 > @@ -22,6 +22,7 @@ > #include <asm/uaccess.h> > #include <asm/xsave.h> > #include <asm/smap.h> > +#include <asm/trace/cpustate.h> > > #ifdef CONFIG_X86_64 > # include <asm/sigcontext32.h> > @@ -532,10 +533,13 @@ static inline void user_fpu_begin(void) > static inline void __save_fpu(struct task_struct *tsk) > { > if (use_xsave()) { > + u64 requested_features = -1; > + struct xsave_struct *xsave = &tsk->thread.fpu.state->xsave; > if (unlikely(system_state == SYSTEM_BOOTING)) > - xsave_state_booting(&tsk->thread.fpu.state->xsave, -1); > + xsave_state_booting(xsave, requested_features); > else > - xsave_state(&tsk->thread.fpu.state->xsave, -1); > + xsave_state(xsave, requested_features); > + trace_cpu_state_xsave(xsave, requested_features); > } else > fpu_fxsave(&tsk->thread.fpu); > } > diff -puN /dev/null arch/x86/include/asm/trace/cpustate.h > --- /dev/null 2014-10-10 16:10:57.316716958 -0700 > +++ b/arch/x86/include/asm/trace/cpustate.h 2015-04-22 16:30:57.181297899 > -0700 > @@ -0,0 +1,105 @@ > +#undef TRACE_SYSTEM > +#define TRACE_SYSTEM cpu_state > + > +#ifdef CREATE_TRACE_POINTS > +#warning defining trace points foo > +#endif > + > +#if !defined(_TRACE_CPU_STATE_H) || defined(TRACE_HEADER_MULTI_READ) > +#define _TRACE_CPU_STATE_H > + > +#include <linux/tracepoint.h> > + > +#ifndef _TRACE_CPU_STATE_H_HELPERS > +#define _TRACE_CPU_STATE_H_HELPERS > +enum xsave_mode { > + XSAVE_MODE_XSAVE, > + XSAVE_MODE_XSAVEOPT, > + XSAVE_MODE_XSAVES, > +}; > + > +static inline enum xsave_mode get_xsave_mode(void) > +{ > + if (system_state == SYSTEM_BOOTING) { > + if (boot_cpu_has(X86_FEATURE_XSAVES)) > + return XSAVE_MODE_XSAVES; > + return XSAVE_MODE_XSAVE; > + } > + if (boot_cpu_has(X86_FEATURE_XSAVES)) > + return XSAVE_MODE_XSAVES; > + if (boot_cpu_has(X86_FEATURE_XSAVEOPT)) > + return XSAVE_MODE_XSAVEOPT; > + return XSAVE_MODE_XSAVE; > +} > +#endif /* _TRACE_CPU_STATE_H_HELPERS */ > + > +extern int xstate_bytes_saved(u64 xstate_bv); > + > +TRACE_EVENT(cpu_state_xsave, > + > + TP_PROTO(struct xsave_struct *xsave, u64 req_features), > + TP_ARGS(xsave, req_features), > + > + TP_STRUCT__entry( > + __field(u64, xstate_bv) > + __field(u64, xcomp_bv) > + __field(u64, req_features) > + __field(enum xsave_mode, mode) > + ), > + > + TP_fast_assign( > + __entry->xstate_bv = xsave->xsave_hdr.xstate_bv; > + __entry->xcomp_bv = xsave->xsave_hdr.xcomp_bv; > + __entry->req_features = req_features; > + __entry->mode = get_xsave_mode(); > + ), > + > + TP_printk("mode: %d xstate_bv: 0x%llx xcomp_bv: 0x%llx size: %d > requested features: %llx", > + __entry->mode, > + __entry->xstate_bv, > + __entry->xcomp_bv, > + xstate_bytes_saved(__entry->xstate_bv), > + __entry->req_features > + ) > +); > + > +TRACE_EVENT(cpu_state_xrstor, > + > + TP_PROTO(struct xsave_struct *xsave, u64 mask, int ret), > + TP_ARGS(xsave, mask, ret), > + > + TP_STRUCT__entry( > + __field(u64, xstate_bv) > + __field(u64, xcomp_bv) > + __field(enum xsave_mode, mode) > + __field(int, ret) > + __field(u64, mask) > + ), > + > + TP_fast_assign( > + __entry->xstate_bv = xsave->xsave_hdr.xstate_bv; > + __entry->xcomp_bv = xsave->xsave_hdr.xcomp_bv; > + __entry->mode = get_xsave_mode(); > + __entry->ret = ret; > + __entry->mask = mask; > + ), > + > + TP_printk("mode: %d xstate_bv: 0x%llx xcomp_bv: 0x%llx size: %d ret: %d > mask: %llx", > + __entry->mode, > + __entry->xstate_bv, > + __entry->xcomp_bv, > + xstate_bytes_saved(__entry->xstate_bv), > + __entry->ret, > + __entry->mask > + ) > +); > + > + > +#undef TRACE_INCLUDE_PATH > +#undef TRACE_INCLUDE_FILE > +#define TRACE_INCLUDE_PATH asm/trace/ > +#define TRACE_INCLUDE_FILE cpustate > +#endif /* _TRACE_CPU_STATE_H */ > + > +/* This part must be outside protection */ > +#include <trace/define_trace.h> > diff -puN include/trace/events/syscalls.h~xsave-trace-0 > include/trace/events/syscalls.h > --- a/include/trace/events/syscalls.h~xsave-trace-0 2015-04-22 > 16:30:57.153296636 -0700 > +++ b/include/trace/events/syscalls.h 2015-04-22 16:30:57.181297899 -0700 > @@ -1,6 +1,9 @@ > #undef TRACE_SYSTEM > #define TRACE_SYSTEM raw_syscalls > +#undef TRACE_INCLUDE_FILE > #define TRACE_INCLUDE_FILE syscalls > +#undef TRACE_INCLUDE_PATH > +#define TRACE_INCLUDE_PATH trace/events > > #if !defined(_TRACE_EVENTS_SYSCALLS_H) || defined(TRACE_HEADER_MULTI_READ) > #define _TRACE_EVENTS_SYSCALLS_H > diff -puN arch/x86/kernel/xsave.c~xsave-trace-0 arch/x86/kernel/xsave.c > --- a/arch/x86/kernel/xsave.c~xsave-trace-0 2015-04-22 16:30:57.155296727 > -0700 > +++ b/arch/x86/kernel/xsave.c 2015-04-22 16:30:57.182297945 -0700 > @@ -15,6 +15,10 @@ > #include <asm/tlbflush.h> > #include <asm/xcr.h> > > +#define CREATE_DAVE_TRACE_POINTS > +#define CREATE_TRACE_POINTS > +#include <asm/trace/cpustate.h> > + > /* > * Supported feature mask by the CPU and the kernel. > */ > @@ -555,6 +559,8 @@ static void __init setup_xstate_features > > xstate_offsets[leaf] = ebx; > xstate_sizes[leaf] = eax; > + printk("xstate[%2d]: offset: %4d size: %3d align: %d\n", > + leaf, ebx, eax, ecx); > } > } > > @@ -638,6 +644,7 @@ static void __init setup_init_fpu_buf(vo > * of any feature which is not represented by all zero's. > */ > xsave_state_booting(init_xstate_buf, -1); > + //trace_cpu_state_xsave(init_xstate_buf, -1); > } > > static enum { AUTO, ENABLE, DISABLE } eagerfpu = AUTO; > @@ -838,3 +845,20 @@ void *get_xsave_field(int xsave_field) > > return get_xsave_addr(&xstate->xsave, xsave_field); > } > + > +int xstate_bytes_saved(u64 xstate_bv) > +{ > + int i; > + int ret; > + > + if (!cpu_has_xsaves) > + return user_xstate_size; > + > + ret = FXSAVE_SIZE + XSAVE_HDR_SIZE; > + > + for (i = 2; i < xstate_features; i++) { > + if (xstate_bv & (1 << i)) > + ret += xstate_sizes[i]; > + } > + return ret; > +} > diff -puN arch/x86/kvm/x86.c~xsave-trace-0 arch/x86/kvm/x86.c > --- a/arch/x86/kvm/x86.c~xsave-trace-0 2015-04-22 16:30:57.159296906 > -0700 > +++ b/arch/x86/kvm/x86.c 2015-04-22 16:30:57.184298034 -0700 > @@ -51,9 +51,6 @@ > #include <linux/pvclock_gtod.h> > #include <trace/events/kvm.h> > > -#define CREATE_TRACE_POINTS > -#include "trace.h" > - > #include <asm/debugreg.h> > #include <asm/msr.h> > #include <asm/desc.h> > @@ -65,6 +62,9 @@ > #include <asm/pvclock.h> > #include <asm/div64.h> > > +#define CREATE_TRACE_POINTS > +#include "trace.h" > + > #define MAX_IO_MSRS 256 > #define KVM_MAX_MCE_BANKS 32 > #define KVM_MCE_CAP_SUPPORTED (MCG_CTL_P | MCG_SER_P) > diff -puN arch/x86/include/asm/xsave.h~xsave-trace-0 > arch/x86/include/asm/xsave.h > --- a/arch/x86/include/asm/xsave.h~xsave-trace-0 2015-04-22 > 16:30:57.161296997 -0700 > +++ b/arch/x86/include/asm/xsave.h 2015-04-22 16:30:57.185298079 -0700 > @@ -3,6 +3,7 @@ > > #include <linux/types.h> > #include <asm/processor.h> > +#include <asm/trace/cpustate.h> > > #define XSTATE_CPUID 0x0000000d > > @@ -91,6 +92,7 @@ static inline int xsave_state_booting(st > xstate_fault > : "D" (fx), "m" (*fx), "a" (lmask), "d" (hmask) > : "memory"); > + > return err; > } > > @@ -182,6 +184,8 @@ static inline int xrstor_state(struct xs > : "0" (0) > : "memory"); > > + trace_cpu_state_xrstor(fx, mask, err); > + > return err; > } > > @@ -190,7 +194,10 @@ static inline int xrstor_state(struct xs > */ > static inline void fpu_xsave(struct fpu *fpu) > { > - xsave_state(&fpu->state->xsave, -1); > + /* Requested Feature BitMap */ > + u64 rfbm = -1; > + xsave_state(&fpu->state->xsave, rfbm); > + trace_cpu_state_xsave(&fpu->state->xsave, rfbm); > } > > /* > @@ -198,7 +205,11 @@ static inline void fpu_xsave(struct fpu > */ > static inline int fpu_xrstor_checking(struct xsave_struct *fx) > { > - return xrstor_state(fx, -1); > + /* Requested Feature BitMap */ > + u64 rfbm = -1; > + int ret = xrstor_state(fx, rfbm); > + trace_cpu_state_xrstor(fx, rfbm, ret); > + return ret; > } > > /* > diff -puN arch/x86/include/asm/trace/mpx.h~xsave-trace-0 > arch/x86/include/asm/trace/mpx.h > --- a/arch/x86/include/asm/trace/mpx.h~xsave-trace-0 2015-04-22 > 16:30:57.172297493 -0700 > +++ b/arch/x86/include/asm/trace/mpx.h 2015-04-22 16:30:57.185298079 > -0700 > @@ -114,6 +114,7 @@ static inline void trace_bounds_exceptio > > #undef TRACE_INCLUDE_PATH > #define TRACE_INCLUDE_PATH asm/trace/ > +#undef TRACE_INCLUDE_FILE > #define TRACE_INCLUDE_FILE mpx > #endif /* _TRACE_MPX_H */ > > _ -- To unsubscribe from this list: send the line "unsubscribe linux-kernel" in the body of a message to majord...@vger.kernel.org More majordomo info at http://vger.kernel.org/majordomo-info.html Please read the FAQ at http://www.tux.org/lkml/