On Tue, Nov 22, 2016 at 04:01:06PM -0300, Arnaldo Carvalho de Melo wrote: > Sorry for the overly long delay, trying it now after fixing up a > conflict with a recent patchkit (branch stuff) I tested it by running > 'perf top -g' and I'm getting some assertion bugs: > > > # perf top -g > 1.34% filemap_map_pages > - 0.59% alloc_pages_vma > 1.20% __alloc_pages_nodemask > - 5.87% 0.45% [kernel] [k] handle_mm_fault > - 1.94% handle_mm_fault > 1.34% filemap_map_pages > - 0.59% alloc_pages_vma > 1.22% __alloc_pages_nodemask > + 5.75% 0.03% perf [.] > hist_entry_iter__add > + 4.46% 0.00% [unknown] [.] 0000000000000000 > - 4.06% 2.74% libc-2.23.so [.] _int_malloc > - 1.95% 0 > 1.94% _int_malloc > - 3.20% 0.23% perf [.] > iter_add_next_cumulative_entry > - 1.49% iter_add_next_cumulative_entry > - 1.43% __hists__add_entry > 2.58% 0.01% [kernel] [k] > return_from_SYSCALL_64 > 2.57% 2.55% libperl.so.5.22.2 [.] Perl_fbm_instr > - 2.54% 2.51% liblzma.so.5.2.2 [.] lzma_decode > - 2.51% lzma_decode > 2.33% 0.00% ld-2.23.so [.] _dl_sysdep_start > + 2.24% 0.04% ld-2.23.so [.] dl_main > 2.13% 0.03% [kernel] [k] ext4_readdir > 2.09% 0.01% [kernel] [k] sys_newstat > 2.08% 0.04% [kernel] [k] vfs_fstatat > 2.07% 0.02% [kernel] [k] SYSC_newstat > 2.02% 0.01% [kernel] [k] iterate_dir > - 1.96% 0.17% [kernel] [k] > __alloc_pages_nodemask > - 1.37% __alloc_pages_nodemask > perf: util/map.c:246: map__exit: Assertion > `!(!((&map->rb_node)->__rb_parent_color == (unsigned long)(&map->rb_node)))' > failed. > > Aborted (core dumped) > [root@jouet ~]# > > > I'll try to investigate this further later/tomorrow, find the updated patch > below. 
> > - Arnaldo > > commit af04d2c4a5d1f6bd7f4971118e4e1153cc7c2506 > Author: Krister Johansen <k...@templeofstupid.com> > Date: Tue Oct 11 02:28:39 2016 -0700 > > perf callchain: Fix a use after free crash due to refcounting bug > > If dso__load_kcore frees all of the existing maps, but one has already > been attached to a callchain cursor node, then we can get a SIGSEGV in > any function that happens to try to use this invalid cursor. Use the > existing map refcount mechanism to forestall cleanup of a map until the > cursor iterates past the node. > > Signed-off-by: Krister Johansen <k...@templeofstupid.com> > Cc: Frederic Weisbecker <fweis...@gmail.com> > Cc: Masami Hiramatsu <mhira...@kernel.org> > Cc: Namhyung Kim <namhy...@kernel.org> > Link: http://lkml.kernel.org/r/20161011092839.gc7...@templeofstupid.com > Signed-off-by: Arnaldo Carvalho de Melo <a...@redhat.com> > > diff --git a/tools/perf/util/callchain.c b/tools/perf/util/callchain.c > index 823befd8209a..18bb7caee535 100644 > --- a/tools/perf/util/callchain.c > +++ b/tools/perf/util/callchain.c > @@ -437,7 +437,7 @@ fill_node(struct callchain_node *node, struct > callchain_cursor *cursor) > } > call->ip = cursor_node->ip; > call->ms.sym = cursor_node->sym; > - call->ms.map = cursor_node->map; > + call->ms.map = map__get(cursor_node->map); > > if (cursor_node->branch) { > call->branch_count = 1; > @@ -477,6 +477,7 @@ add_child(struct callchain_node *parent, > > list_for_each_entry_safe(call, tmp, &new->val, list) { > list_del(&call->list); > + map__zput(call->ms.map); > free(call); > } > free(new); > @@ -761,6 +762,7 @@ merge_chain_branch(struct callchain_cursor *cursor, > list->ms.map, list->ms.sym, > false, NULL, 0, 0); > list_del(&list->list); > + map__zput(list->ms.map); > free(list); > } > > @@ -811,7 +813,8 @@ int callchain_cursor_append(struct callchain_cursor > *cursor, > } > > node->ip = ip; > - node->map = map; > + map__zput(node->map); > + node->map = map__get(map); > node->sym = sym; > 
node->branch = branch; > node->nr_loop_iter = nr_loop_iter; > @@ -868,6 +871,8 @@ int fill_callchain_info(struct addr_location *al, struct > callchain_cursor_node * > goto out; > } > > + map__get(al->map); > + > if (al->map->groups == &al->machine->kmaps) { > if (machine__is_host(al->machine)) { > al->cpumode = PERF_RECORD_MISC_KERNEL; > @@ -1142,11 +1147,13 @@ static void free_callchain_node(struct callchain_node > *node) > > list_for_each_entry_safe(list, tmp, &node->parent_val, list) { > list_del(&list->list); > + map__zput(list->ms.map); > free(list); > } > > list_for_each_entry_safe(list, tmp, &node->val, list) { > list_del(&list->list); > + map__zput(list->ms.map); > free(list); > } > > @@ -1210,6 +1217,7 @@ int callchain_node__make_parent_list(struct > callchain_node *node) > goto out; > *new = *chain; > new->has_children = false; > + map__get(new->ms.map); > list_add_tail(&new->list, &head); > } > parent = parent->parent; > @@ -1230,6 +1238,7 @@ int callchain_node__make_parent_list(struct > callchain_node *node) > out: > list_for_each_entry_safe(chain, new, &head, list) { > list_del(&chain->list); > + map__zput(chain->ms.map); > free(chain); > } > return -ENOMEM; > diff --git a/tools/perf/util/callchain.h b/tools/perf/util/callchain.h > index d9c70dccf06a..f551fd2cfe5a 100644 > --- a/tools/perf/util/callchain.h > +++ b/tools/perf/util/callchain.h > @@ -5,6 +5,7 @@ > #include <linux/list.h> > #include <linux/rbtree.h> > #include "event.h" > +#include "map.h" > #include "symbol.h" > > #define HELP_PAD "\t\t\t\t" > @@ -184,8 +185,13 @@ int callchain_merge(struct callchain_cursor *cursor, > */ > static inline void callchain_cursor_reset(struct callchain_cursor *cursor) > { > + struct callchain_cursor_node *node; > + > cursor->nr = 0; > cursor->last = &cursor->first; > + > + for (node = cursor->first; node != NULL; node = node->next) > + map__zput(node->map); > } > > int callchain_cursor_append(struct callchain_cursor *cursor, u64 ip, > diff --git 
a/tools/perf/util/hist.c b/tools/perf/util/hist.c > index e1be4132054d..be4b07145705 100644 > --- a/tools/perf/util/hist.c > +++ b/tools/perf/util/hist.c > @@ -1,6 +1,7 @@ > #include "util.h" > #include "build-id.h" > #include "hist.h" > +#include "map.h" > #include "session.h" > #include "sort.h" > #include "evlist.h" > @@ -979,6 +980,7 @@ iter_finish_cumulative_entry(struct hist_entry_iter *iter, > { > zfree(&iter->priv); > iter->he = NULL; > + map__zput(al->map); > > return 0; > }
As part of trying to tie up the year-end loose ends, I went back and re-tested a rebased version of this patch against perf/core. I ended up with a merge that's identical to yours, except that I'm not seeing any assertion failures with 'perf top -g', 'perf script', or 'perf report'. Was perf/core the branch that was giving you trouble? -K