From: Andi Kleen <[email protected]>

For perf script brstackinsn also print a running cycles count.
This makes it easier to calculate cycle deltas for code sections
measured with LBRs.

% perf record -b -a sleep 1
% perf script -F +brstackinsn
...
        _dl_sysdep_start+330:
        00007eff9f20583a        insn: 75 c4                     # PRED 24 
cycles [24]
        00007eff9f205800        insn: 48 83 e8 03
        00007eff9f205804        insn: 48 83 f8 1e
        00007eff9f205808        insn: 77 26
        00007eff9f20580a        insn: 48 63 04 81
        00007eff9f20580e        insn: 48 01 c8
        00007eff9f205811        insn: ff e0                     # MISPRED 31 
cycles [7] 0.71 IPC
        00007eff9f2059c0        insn: 44 8b 62 08
        00007eff9f2059c4        insn: e9 67 fe ff ff            # PRED 55 
cycles [24] 0.04 IPC
        00007eff9f205830        insn: 48 83 c2 10
        00007eff9f205834        insn: 48 8b 02
        00007eff9f205837        insn: 48 85 c0
        00007eff9f20583a        insn: 75 c4                     # PRED 68 
cycles [13] 0.23 IPC

Signed-off-by: Andi Kleen <[email protected]>
---
 tools/perf/builtin-script.c | 12 ++++++++----
 1 file changed, 8 insertions(+), 4 deletions(-)

diff --git a/tools/perf/builtin-script.c b/tools/perf/builtin-script.c
index 3b73c3226141..84895c861b84 100644
--- a/tools/perf/builtin-script.c
+++ b/tools/perf/builtin-script.c
@@ -913,7 +913,7 @@ static int grab_bb(u8 *buffer, u64 start, u64 end,
 
 static int ip__fprintf_jump(uint64_t ip, struct branch_entry *en,
                            struct perf_insn *x, u8 *inbuf, int len,
-                           int insn, FILE *fp)
+                           int insn, FILE *fp, int *total_cycles)
 {
        int printed = fprintf(fp, "\t%016" PRIx64 "\t%-30s\t#%s%s%s%s", ip,
                              dump_insn(x, ip, inbuf, len, NULL),
@@ -922,7 +922,8 @@ static int ip__fprintf_jump(uint64_t ip, struct 
branch_entry *en,
                              en->flags.in_tx ? " INTX" : "",
                              en->flags.abort ? " ABORT" : "");
        if (en->flags.cycles) {
-               printed += fprintf(fp, " %d cycles", en->flags.cycles);
+               *total_cycles += en->flags.cycles;
+               printed += fprintf(fp, " %d cycles [%d]", *total_cycles, 
en->flags.cycles);
                if (insn)
                        printed += fprintf(fp, " %.2f IPC", (float)insn / 
en->flags.cycles);
        }
@@ -979,6 +980,7 @@ static int perf_sample__fprintf_brstackinsn(struct 
perf_sample *sample,
        u8 buffer[MAXBB];
        unsigned off;
        struct symbol *lastsym = NULL;
+       int total_cycles = 0;
 
        if (!(br && br->nr))
                return 0;
@@ -999,7 +1001,7 @@ static int perf_sample__fprintf_brstackinsn(struct 
perf_sample *sample,
                printed += ip__fprintf_sym(br->entries[nr - 1].from, thread,
                                           x.cpumode, x.cpu, &lastsym, attr, 
fp);
                printed += ip__fprintf_jump(br->entries[nr - 1].from, 
&br->entries[nr - 1],
-                                           &x, buffer, len, 0, fp);
+                                           &x, buffer, len, 0, fp, 
&total_cycles);
        }
 
        /* Print all blocks */
@@ -1027,7 +1029,9 @@ static int perf_sample__fprintf_brstackinsn(struct 
perf_sample *sample,
 
                        printed += ip__fprintf_sym(ip, thread, x.cpumode, 
x.cpu, &lastsym, attr, fp);
                        if (ip == end) {
-                               printed += ip__fprintf_jump(ip, 
&br->entries[i], &x, buffer + off, len - off, insn, fp);
+                               printed += ip__fprintf_jump(ip, &br->entries[i],
+                                               &x, buffer + off, len - off,
+                                               insn, fp, &total_cycles);
                                break;
                        } else {
                                printed += fprintf(fp, "\t%016" PRIx64 
"\t%s\n", ip,
-- 
2.17.1

Reply via email to