Hi Masami,

On Fri, 2013-06-21 at 13:18 +0900, Masami Hiramatsu wrote:
> (2013/06/21 3:31), Tom Zanussi wrote:
> > diff --git a/include/trace/ftrace.h b/include/trace/ftrace.h
> > index 88ac7da..7c5627f 100644
> > --- a/include/trace/ftrace.h
> > +++ b/include/trace/ftrace.h
> > @@ -522,14 +522,6 @@ ftrace_raw_event_##call(void *__data, proto)           
> >                 \
> >     int __data_size;                                                \
> >     int pc;                                                         \
> >                                                                     \
> > -   if (test_bit(FTRACE_EVENT_FL_TRIGGER_MODE_BIT,                  \
> > -                &ftrace_file->flags))                              \
> > -           event_triggers_call(ftrace_file);                       \
> > -                                                                   \
> > -   if (test_bit(FTRACE_EVENT_FL_SOFT_DISABLED_BIT,                 \
> > -                &ftrace_file->flags))                              \
> > -           return;                                                 \
> > -                                                                   \
> >     local_save_flags(irq_flags);                                    \
> >     pc = preempt_count();                                           \
> >                                                                     \
> > @@ -547,8 +539,22 @@ ftrace_raw_event_##call(void *__data, proto)           
> >                 \
> >                                                                     \
> >     { assign; }                                                     \
> >                                                                     \
> > +   if (test_bit(FTRACE_EVENT_FL_SOFT_DISABLED_BIT,                 \
> > +                &ftrace_file->flags)) {                            \
> > +           ring_buffer_discard_commit(buffer, event);              \
> > +                                                                   \
> > +           if (test_bit(FTRACE_EVENT_FL_TRIGGER_MODE_BIT,          \
> > +                        &ftrace_file->flags))                      \
> > +                   event_triggers_call(ftrace_file, entry);        \
> > +           return;                                                 \
> > +   }                                                               \
> > +                                                                   \
> >     if (!filter_current_check_discard(buffer, event_call, entry, event)) \
> >             trace_buffer_unlock_commit(buffer, event, irq_flags, pc); \
> > +                                                                   \
> > +   if (test_bit(FTRACE_EVENT_FL_TRIGGER_MODE_BIT,                  \
> > +                &ftrace_file->flags))                              \
> > +           event_triggers_call(ftrace_file, entry);                \
> 
> Actually, since "entry" is a part of "event" which may be already discarded,
> I think we should not access it here. It may not cause real problem because
> even if it is discarded, that does NOT mean it is freed. However, it depends
> on the ring-buffer implementation.
> 
> I recommend you to call event triggers before commit the event. It will also
> make the code simpler :)
> 

That's what I originally did, and is what I was referring to when I
mentioned the bit of 'trickiness' here. ;-)

The problem is that the trace_recursive_lock() check in
ring_buffer_lock_reserve() prevents a trigger that itself logs to the
ring buffer from reserving a slot in the buffer, since it's being done
from the same context as the triggering event.  For example, the
stacktrace trigger, which calls trace_dump_stack().

So the code is a bit more convoluted than I'd like because of that -
since we can't really invoke the triggers before the current event is
committed, it waits until the current event is either discarded (because
we're soft disabled) or committed (logging a normally-enabled event).

But you do point out a real problem with this - it means having to look
at a discarded event in the soft-disabled case, and if for example some
interrupt actually reserves and logs an event between the time we do the
discard and invoke the filter, we could end up with a false filtering
outcome.  I'm not sure how to prevent that though at this point - will
have think about it some more...

Tom

> > diff --git a/kernel/trace/trace_syscalls.c b/kernel/trace/trace_syscalls.c
> > index e287011..47fa712 100644
> > --- a/kernel/trace/trace_syscalls.c
> > +++ b/kernel/trace/trace_syscalls.c
> > @@ -319,14 +319,6 @@ static void ftrace_syscall_enter(void *data, struct 
> > pt_regs *regs, long id)
> >     if (!sys_data)
> >             return;
> >  
> > -   if (test_bit(FTRACE_EVENT_FL_TRIGGER_MODE_BIT,
> > -                &sys_data->enter_file->flags))
> > -           event_triggers_call(sys_data->enter_file);
> > -
> > -   if (test_bit(FTRACE_EVENT_FL_SOFT_DISABLED_BIT,
> > -                &sys_data->enter_file->flags))
> > -           return;
> > -
> >     size = sizeof(*entry) + sizeof(unsigned long) * sys_data->nb_args;
> >  
> >     buffer = tr->trace_buffer.buffer;
> > @@ -339,9 +331,23 @@ static void ftrace_syscall_enter(void *data, struct 
> > pt_regs *regs, long id)
> >     entry->nr = syscall_nr;
> >     syscall_get_arguments(current, regs, 0, sys_data->nb_args, entry->args);
> >  
> > +   if (test_bit(FTRACE_EVENT_FL_SOFT_DISABLED_BIT,
> > +                &sys_data->enter_file->flags)) {
> > +           ring_buffer_discard_commit(buffer, event);
> > +
> > +           if (test_bit(FTRACE_EVENT_FL_TRIGGER_MODE_BIT,
> > +                        &sys_data->enter_file->flags))
> > +                   event_triggers_call(sys_data->enter_file, entry);
> > +           return;
> > +   }
> > +
> >     if (!filter_current_check_discard(buffer, sys_data->enter_event,
> >                                       entry, event))
> >             trace_current_buffer_unlock_commit(buffer, event, 0, 0);
> > +
> > +   if (test_bit(FTRACE_EVENT_FL_TRIGGER_MODE_BIT,
> > +                &sys_data->enter_file->flags))
> > +           event_triggers_call(sys_data->enter_file, entry);
> >  }
> >  
> >  static void ftrace_syscall_exit(void *data, struct pt_regs *regs, long ret)
> > @@ -363,14 +369,6 @@ static void ftrace_syscall_exit(void *data, struct 
> > pt_regs *regs, long ret)
> >     if (!sys_data)
> >             return;
> >  
> > -   if (test_bit(FTRACE_EVENT_FL_TRIGGER_MODE_BIT,
> > -                &sys_data->exit_file->flags))
> > -           event_triggers_call(sys_data->exit_file);
> > -
> > -   if (test_bit(FTRACE_EVENT_FL_SOFT_DISABLED_BIT,
> > -                &sys_data->exit_file->flags))
> > -           return;
> > -
> >     buffer = tr->trace_buffer.buffer;
> >     event = trace_buffer_lock_reserve(buffer,
> >                     sys_data->exit_event->event.type, sizeof(*entry), 0, 0);
> > @@ -381,9 +379,23 @@ static void ftrace_syscall_exit(void *data, struct 
> > pt_regs *regs, long ret)
> >     entry->nr = syscall_nr;
> >     entry->ret = syscall_get_return_value(current, regs);
> >  
> > +   if (test_bit(FTRACE_EVENT_FL_SOFT_DISABLED_BIT,
> > +                &sys_data->exit_file->flags)) {
> > +           ring_buffer_discard_commit(buffer, event);
> > +
> > +           if (test_bit(FTRACE_EVENT_FL_TRIGGER_MODE_BIT,
> > +                        &sys_data->exit_file->flags))
> > +                   event_triggers_call(sys_data->exit_file, entry);
> > +           return;
> > +   }
> > +
> >     if (!filter_current_check_discard(buffer, sys_data->exit_event,
> >                                       entry, event))
> >             trace_current_buffer_unlock_commit(buffer, event, 0, 0);
> > +
> > +   if (test_bit(FTRACE_EVENT_FL_TRIGGER_MODE_BIT,
> > +                &sys_data->exit_file->flags))
> > +           event_triggers_call(sys_data->exit_file, entry);
> >  }
> >  
> >  static int reg_event_syscall_enter(struct ftrace_event_file *file,
> > 
> 
> Same changes are needed here.
> 
> Thank you,
> 


--
To unsubscribe from this list: send the line "unsubscribe linux-kernel" in
the body of a message to majord...@vger.kernel.org
More majordomo info at  http://vger.kernel.org/majordomo-info.html
Please read the FAQ at  http://www.tux.org/lkml/

Reply via email to