Em Sat, Mar 18, 2017 at 10:49:28PM +0100, Milian Wolff escreveu:
> Often it is interesting to know how costly a given source line is in
> total. Previously, one had to build these sums manually based on all
> addresses that pointed to the same source line. This patch introduces
> srcline as a sort key, which will do the aggregation for us.
> 
> Paired with the recent addition of showing inline frames, this makes
> perf report much more useful for many C++ work loads.
> 
> The following shows the new feature in action. First, let's show the
> status quo output when we sort by address. The result contains many
> hist entries that generate the same output:

Looks ok, one pet peeve below
 
> ~~~~~~~~~~~~~~~~
> $ perf report --stdio --inline -g address
> # Children      Self  Command       Shared Object        Symbol
> # ........  ........  ............  ...................  
> .........................................
> #
>     99.89%    35.34%  cpp-inlining  cpp-inlining         [.] main
>             |
>             |--64.55%--main complex:655
>             |          
> /home/milian/projects/kdab/rnd/hotspot/tests/test-clients/cpp-inlining/main.cpp:39
>  (inline)
>             |          /usr/include/c++/6.3.1/complex:664 (inline)
>             |          |
>             |          |--60.31%--hypot +20
>             |          |          |
>             |          |          |--8.52%--__hypot_finite +273
>             |          |          |
>             |          |          |--7.32%--__hypot_finite +411
> ...
>              --35.34%--_start +4194346
>                        __libc_start_main +241
>                        |
>                        |--6.65%--main random.tcc:3326
>                        |          
> /home/milian/projects/kdab/rnd/hotspot/tests/test-clients/cpp-inlining/main.cpp:39
>  (inline)
>                        |          /usr/include/c++/6.3.1/bits/random.h:1809 
> (inline)
>                        |          /usr/include/c++/6.3.1/bits/random.h:1818 
> (inline)
>                        |          /usr/include/c++/6.3.1/bits/random.h:185 
> (inline)
>                        |
>                        |--2.70%--main random.tcc:3326
>                        |          
> /home/milian/projects/kdab/rnd/hotspot/tests/test-clients/cpp-inlining/main.cpp:39
>  (inline)
>                        |          /usr/include/c++/6.3.1/bits/random.h:1809 
> (inline)
>                        |          /usr/include/c++/6.3.1/bits/random.h:1818 
> (inline)
>                        |          /usr/include/c++/6.3.1/bits/random.h:185 
> (inline)
>                        |
>                        |--1.69%--main random.tcc:3326
>                        |          
> /home/milian/projects/kdab/rnd/hotspot/tests/test-clients/cpp-inlining/main.cpp:39
>  (inline)
>                        |          /usr/include/c++/6.3.1/bits/random.h:1809 
> (inline)
>                        |          /usr/include/c++/6.3.1/bits/random.h:1818 
> (inline)
>                        |          /usr/include/c++/6.3.1/bits/random.h:185 
> (inline)
> ...
> ~~~~~~~~~~~~~~~~
> 
> With this patch and `-g srcline` we instead get the following output:
> 
> ~~~~~~~~~~~~~~~~
> $ perf report --stdio --inline -g srcline
> # Children      Self  Command       Shared Object        Symbol
> # ........  ........  ............  ...................  
> .........................................
> #
>     99.89%    35.34%  cpp-inlining  cpp-inlining         [.] main
>             |
>             |--64.55%--main complex:655
>             |          
> /home/milian/projects/kdab/rnd/hotspot/tests/test-clients/cpp-inlining/main.cpp:39
>  (inline)
>             |          /usr/include/c++/6.3.1/complex:664 (inline)
>             |          |
>             |          |--64.02%--hypot
>             |          |          |
>             |          |           --59.81%--__hypot_finite
>             |          |
>             |           --0.53%--cabs
>             |
>              --35.34%--_start
>                        __libc_start_main
>                        |
>                        |--12.48%--main random.tcc:3326
>                        |          
> /home/milian/projects/kdab/rnd/hotspot/tests/test-clients/cpp-inlining/main.cpp:39
>  (inline)
>                        |          /usr/include/c++/6.3.1/bits/random.h:1809 
> (inline)
>                        |          /usr/include/c++/6.3.1/bits/random.h:1818 
> (inline)
>                        |          /usr/include/c++/6.3.1/bits/random.h:185 
> (inline)
> ...
> ~~~~~~~~~~~~~~~~
> 
> Signed-off-by: Milian Wolff <[email protected]>
> ---
>  tools/perf/Documentation/perf-report.txt |  1 +
>  tools/perf/ui/browsers/hists.c           |  3 +-
>  tools/perf/ui/stdio/hist.c               |  3 +-
>  tools/perf/util/annotate.c               |  3 +-
>  tools/perf/util/callchain.c              | 52 
> +++++++++++++++++++++++++++++---
>  tools/perf/util/callchain.h              |  3 +-
>  tools/perf/util/map.c                    |  3 +-
>  tools/perf/util/sort.c                   | 16 ++++++----
>  tools/perf/util/srcline.c                | 11 +++++--
>  tools/perf/util/util.h                   |  4 +--
>  10 files changed, 78 insertions(+), 21 deletions(-)
> 
> diff --git a/tools/perf/Documentation/perf-report.txt 
> b/tools/perf/Documentation/perf-report.txt
> index 248bba434b53..37a175914157 100644
> --- a/tools/perf/Documentation/perf-report.txt
> +++ b/tools/perf/Documentation/perf-report.txt
> @@ -235,6 +235,7 @@ OPTIONS
>       sort_key can be:
>       - function: compare on functions (default)
>       - address: compare on individual code addresses
> +     - srcline: compare on source filename and line number
>  
>       branch can be:
>       - branch: include last branch information in callgraph when available.
> diff --git a/tools/perf/ui/browsers/hists.c b/tools/perf/ui/browsers/hists.c
> index 757222bc9dad..bca08be9fd78 100644
> --- a/tools/perf/ui/browsers/hists.c
> +++ b/tools/perf/ui/browsers/hists.c
> @@ -851,7 +851,8 @@ static int hist_browser__show_inline(struct hist_browser 
> *browser,
>                       if (ui_browser__is_current_entry(&browser->b, row))
>                               color = HE_COLORSET_SELECTED;
>  
> -                     if (callchain_param.key == CCKEY_ADDRESS) {
> +                     if (callchain_param.key == CCKEY_ADDRESS ||
> +                         callchain_param.key == CCKEY_SRCLINE) {
>                               if (ilist->filename != NULL)
>                                       scnprintf(buf, sizeof(buf),
>                                                 "%s:%d (inline)",
> diff --git a/tools/perf/ui/stdio/hist.c b/tools/perf/ui/stdio/hist.c
> index 183470f25100..bf95b4a9a592 100644
> --- a/tools/perf/ui/stdio/hist.c
> +++ b/tools/perf/ui/stdio/hist.c
> @@ -53,7 +53,8 @@ static size_t inline__fprintf(struct map *map, u64 ip, int 
> left_margin,
>                               ret += fprintf(fp, "          ");
>                       }
>  
> -                     if (callchain_param.key == CCKEY_ADDRESS) {
> +                     if (callchain_param.key == CCKEY_ADDRESS ||
> +                         callchain_param.key == CCKEY_SRCLINE) {
>                               if (ilist->filename != NULL)
>                                       ret += fprintf(fp, "%s:%d (inline)",
>                                                      ilist->filename,
> diff --git a/tools/perf/util/annotate.c b/tools/perf/util/annotate.c
> index 273f21fa32b5..e7194ff88c4f 100644
> --- a/tools/perf/util/annotate.c
> +++ b/tools/perf/util/annotate.c
> @@ -1668,7 +1668,8 @@ static int symbol__get_source_line(struct symbol *sym, 
> struct map *map,
>                       goto next;
>  
>               offset = start + i;
> -             src_line->path = get_srcline(map->dso, offset, NULL, false);
> +             src_line->path = get_srcline(map->dso, offset, NULL,
> +                                          false, true);
>               insert_source_line(&tmp_root, src_line);
>  
>       next:
> diff --git a/tools/perf/util/callchain.c b/tools/perf/util/callchain.c
> index aba953421a03..d78776a20e80 100644
> --- a/tools/perf/util/callchain.c
> +++ b/tools/perf/util/callchain.c
> @@ -80,6 +80,10 @@ static int parse_callchain_sort_key(const char *value)
>               callchain_param.key = CCKEY_ADDRESS;
>               return 0;
>       }
> +     if (!strncmp(value, "srcline", strlen(value))) {
> +             callchain_param.key = CCKEY_SRCLINE;
> +             return 0;
> +     }
>       if (!strncmp(value, "branch", strlen(value))) {
>               callchain_param.branch_callstack = 1;
>               return 0;
> @@ -510,14 +514,51 @@ enum match_result {
>       MATCH_GT,
>  };
>  
> +static enum match_result match_chain_srcline(struct callchain_cursor_node 
> *node,
> +                                          struct callchain_list *cnode)
> +{
> +     char *left = get_srcline(cnode->ms.map->dso,
> +                              map__rip_2objdump(cnode->ms.map, cnode->ip),
> +                              cnode->ms.sym, true, false);
> +     char *right = get_srcline(node->map->dso,
> +                               map__rip_2objdump(node->map, node->ip),
> +                               node->sym, true, false);
> +     enum match_result ret = MATCH_EQ;
> +     int cmp;
> +
> +     if (left && right)
> +             cmp = strcmp(left, right);
> +     else if (!left && right)
> +             cmp = 1;
> +     else if (left && !right)
> +             cmp = -1;
> +     else if (cnode->ip == node->ip)
> +             cmp = 0;
> +     else
> +             cmp = (cnode->ip < node->ip) ? -1 : 1;
> +
> +     if (cmp != 0)
> +             ret = cmp < 0 ? MATCH_LT : MATCH_GT;
> +
> +     free_srcline(left);
> +     free_srcline(right);
> +     return ret;
> +}
> +
>  static enum match_result match_chain(struct callchain_cursor_node *node,
>                                    struct callchain_list *cnode)
>  {
>       struct symbol *sym = node->sym;
>       u64 left, right;
>  
> -     if (cnode->ms.sym && sym &&
> -         callchain_param.key == CCKEY_FUNCTION) {
> +     if (callchain_param.key == CCKEY_SRCLINE) {
> +             enum match_result match = match_chain_srcline(node, cnode);
> +
> +             if (match != MATCH_ERROR)
> +                     return match;
> +     }
> +
> +     if (cnode->ms.sym && sym && callchain_param.key == CCKEY_FUNCTION) {

The above line is the same as it was in those first two removed, its
just churn :-\ I.e. this part:

-       if (cnode->ms.sym && sym &&
-           callchain_param.key == CCKEY_FUNCTION) {
+       if (cnode->ms.sym && sym && callchain_param.key == CCKEY_FUNCTION) {

Please avoid doing that in the future.

>               left = cnode->ms.sym->start;
>               right = sym->start;
>       } else {
> @@ -911,15 +952,16 @@ int fill_callchain_info(struct addr_location *al, 
> struct callchain_cursor_node *
>  char *callchain_list__sym_name(struct callchain_list *cl,
>                              char *bf, size_t bfsize, bool show_dso)
>  {
> +     bool show_addr = callchain_param.key == CCKEY_ADDRESS;
> +     bool show_srcline = show_addr || callchain_param.key == CCKEY_SRCLINE;
>       int printed;
>  
>       if (cl->ms.sym) {
> -             if (callchain_param.key == CCKEY_ADDRESS &&
> -                 cl->ms.map && !cl->srcline)
> +             if (show_srcline && cl->ms.map && !cl->srcline)
>                       cl->srcline = get_srcline(cl->ms.map->dso,
>                                                 map__rip_2objdump(cl->ms.map,
>                                                                   cl->ip),
> -                                               cl->ms.sym, false);
> +                                               cl->ms.sym, false, show_addr);
>               if (cl->srcline)
>                       printed = scnprintf(bf, bfsize, "%s %s",
>                                       cl->ms.sym->name, cl->srcline);
> diff --git a/tools/perf/util/callchain.h b/tools/perf/util/callchain.h
> index 4f4b60f1558a..c56c23dbbf72 100644
> --- a/tools/perf/util/callchain.h
> +++ b/tools/perf/util/callchain.h
> @@ -77,7 +77,8 @@ typedef void (*sort_chain_func_t)(struct rb_root *, struct 
> callchain_root *,
>  
>  enum chain_key {
>       CCKEY_FUNCTION,
> -     CCKEY_ADDRESS
> +     CCKEY_ADDRESS,
> +     CCKEY_SRCLINE
>  };
>  
>  enum chain_value {
> diff --git a/tools/perf/util/map.c b/tools/perf/util/map.c
> index 1d9ebcf9e38e..c1870ac365a3 100644
> --- a/tools/perf/util/map.c
> +++ b/tools/perf/util/map.c
> @@ -405,7 +405,8 @@ int map__fprintf_srcline(struct map *map, u64 addr, const 
> char *prefix,
>  
>       if (map && map->dso) {
>               srcline = get_srcline(map->dso,
> -                                   map__rip_2objdump(map, addr), NULL, true);
> +                                   map__rip_2objdump(map, addr), NULL,
> +                                   true, true);
>               if (srcline != SRCLINE_UNKNOWN)
>                       ret = fprintf(fp, "%s%s", prefix, srcline);
>               free_srcline(srcline);
> diff --git a/tools/perf/util/sort.c b/tools/perf/util/sort.c
> index 8b0d4e39f640..73f3ec1cf2a0 100644
> --- a/tools/perf/util/sort.c
> +++ b/tools/perf/util/sort.c
> @@ -323,7 +323,7 @@ char *hist_entry__get_srcline(struct hist_entry *he)
>               return SRCLINE_UNKNOWN;
>  
>       return get_srcline(map->dso, map__rip_2objdump(map, he->ip),
> -                        he->ms.sym, true);
> +                        he->ms.sym, true, true);
>  }
>  
>  static int64_t
> @@ -366,7 +366,8 @@ sort__srcline_from_cmp(struct hist_entry *left, struct 
> hist_entry *right)
>                       left->branch_info->srcline_from = get_srcline(map->dso,
>                                          map__rip_2objdump(map,
>                                                            
> left->branch_info->from.al_addr),
> -                                                      
> left->branch_info->from.sym, true);
> +                                                      
> left->branch_info->from.sym,
> +                                                      true, true);
>       }
>       if (!right->branch_info->srcline_from) {
>               struct map *map = right->branch_info->from.map;
> @@ -376,7 +377,8 @@ sort__srcline_from_cmp(struct hist_entry *left, struct 
> hist_entry *right)
>                       right->branch_info->srcline_from = get_srcline(map->dso,
>                                            map__rip_2objdump(map,
>                                                              
> right->branch_info->from.al_addr),
> -                                                  
> right->branch_info->from.sym, true);
> +                                                  
> right->branch_info->from.sym,
> +                                                  true, true);
>       }
>       return strcmp(right->branch_info->srcline_from, 
> left->branch_info->srcline_from);
>  }
> @@ -407,7 +409,8 @@ sort__srcline_to_cmp(struct hist_entry *left, struct 
> hist_entry *right)
>                       left->branch_info->srcline_to = get_srcline(map->dso,
>                                          map__rip_2objdump(map,
>                                                            
> left->branch_info->to.al_addr),
> -                                                      
> left->branch_info->from.sym, true);
> +                                                      
> left->branch_info->from.sym,
> +                                                      true, true);
>       }
>       if (!right->branch_info->srcline_to) {
>               struct map *map = right->branch_info->to.map;
> @@ -417,7 +420,8 @@ sort__srcline_to_cmp(struct hist_entry *left, struct 
> hist_entry *right)
>                       right->branch_info->srcline_to = get_srcline(map->dso,
>                                            map__rip_2objdump(map,
>                                                              
> right->branch_info->to.al_addr),
> -                                                  
> right->branch_info->to.sym, true);
> +                                                  right->branch_info->to.sym,
> +                                                  true, true);
>       }
>       return strcmp(right->branch_info->srcline_to, 
> left->branch_info->srcline_to);
>  }
> @@ -448,7 +452,7 @@ static char *hist_entry__get_srcfile(struct hist_entry *e)
>               return no_srcfile;
>  
>       sf = __get_srcline(map->dso, map__rip_2objdump(map, e->ip),
> -                      e->ms.sym, false, true);
> +                      e->ms.sym, false, true, true);
>       if (!strcmp(sf, SRCLINE_UNKNOWN))
>               return no_srcfile;
>       p = strchr(sf, ':');
> diff --git a/tools/perf/util/srcline.c b/tools/perf/util/srcline.c
> index f9d4b47d1fb5..6f8651104990 100644
> --- a/tools/perf/util/srcline.c
> +++ b/tools/perf/util/srcline.c
> @@ -427,7 +427,7 @@ static struct inline_node *addr2inlines(const char 
> *dso_name, u64 addr,
>  #define A2L_FAIL_LIMIT 123
>  
>  char *__get_srcline(struct dso *dso, u64 addr, struct symbol *sym,
> -               bool show_sym, bool unwind_inlines)
> +               bool show_sym, bool show_addr, bool unwind_inlines)
>  {
>       char *file = NULL;
>       unsigned line = 0;
> @@ -461,6 +461,11 @@ char *__get_srcline(struct dso *dso, u64 addr, struct 
> symbol *sym,
>               dso->has_srcline = 0;
>               dso__free_a2l(dso);
>       }
> +
> +     if (!show_addr)
> +             return (show_sym && sym) ?
> +                         strndup(sym->name, sym->namelen) : NULL;
> +
>       if (sym) {
>               if (asprintf(&srcline, "%s+%" PRIu64, show_sym ? sym->name : "",
>                                       addr - sym->start) < 0)
> @@ -477,9 +482,9 @@ void free_srcline(char *srcline)
>  }
>  
>  char *get_srcline(struct dso *dso, u64 addr, struct symbol *sym,
> -               bool show_sym)
> +               bool show_sym, bool show_addr)
>  {
> -     return __get_srcline(dso, addr, sym, show_sym, false);
> +     return __get_srcline(dso, addr, sym, show_sym, show_addr, false);
>  }
>  
>  struct inline_node *dso__parse_addr_inlines(struct dso *dso, u64 addr)
> diff --git a/tools/perf/util/util.h b/tools/perf/util/util.h
> index cc0700d6fef0..7cf5752b38fd 100644
> --- a/tools/perf/util/util.h
> +++ b/tools/perf/util/util.h
> @@ -287,9 +287,9 @@ struct symbol;
>  
>  extern bool srcline_full_filename;
>  char *get_srcline(struct dso *dso, u64 addr, struct symbol *sym,
> -               bool show_sym);
> +               bool show_sym, bool show_addr);
>  char *__get_srcline(struct dso *dso, u64 addr, struct symbol *sym,
> -               bool show_sym, bool unwind_inlines);
> +               bool show_sym, bool show_addr, bool unwind_inlines);
>  void free_srcline(char *srcline);
>  
>  int perf_event_paranoid(void);
> -- 
> 2.12.0

Reply via email to