From: Madhavan Srinivasan <ma...@linux.vnet.ibm.com>

Introduce a new perf record option, "--hazard", to capture CPU pipeline
hazard data. Also enable "perf script -D" to dump its raw values.
Sample output:

  $ ./perf record -e r4010e --hazard -- ls
  $ ./perf script -D
  ... PERF_RECORD_SAMPLE(IP, 0x2): ...
  ... hazard information:
  .... Inst Type 0x1
  .... Inst Cache 0x1
  .... Hazard Stage 0x4
  .... Hazard Reason 0x3
  .... Stall Stage 0x4
  .... Stall Reason 0x2

Signed-off-by: Madhavan Srinivasan <ma...@linux.vnet.ibm.com>
Signed-off-by: Ravi Bangoria <ravi.bango...@linux.ibm.com>
---
 tools/perf/Documentation/perf-record.txt  |  3 +++
 tools/perf/builtin-record.c               |  1 +
 tools/perf/util/event.h                   |  1 +
 tools/perf/util/evsel.c                   | 10 ++++++++++
 tools/perf/util/perf_event_attr_fprintf.c |  1 +
 tools/perf/util/record.h                  |  1 +
 tools/perf/util/session.c                 | 16 ++++++++++++++++
 7 files changed, 33 insertions(+)

diff --git a/tools/perf/Documentation/perf-record.txt b/tools/perf/Documentation/perf-record.txt
index b23a4012a606..e7bd1b6938ce 100644
--- a/tools/perf/Documentation/perf-record.txt
+++ b/tools/perf/Documentation/perf-record.txt
@@ -283,6 +283,9 @@ OPTIONS
 --phys-data::
        Record the sample physical addresses.
 
+--hazard::
+       Record processor pipeline hazard and stall information.
+
 -T::
 --timestamp::
        Record the sample timestamps. Use it with 'perf report -D' to see the
diff --git a/tools/perf/builtin-record.c b/tools/perf/builtin-record.c
index 4c301466101b..6bd32d7bc4e9 100644
--- a/tools/perf/builtin-record.c
+++ b/tools/perf/builtin-record.c
@@ -2301,6 +2301,7 @@ static struct option __record_options[] = {
        OPT_BOOLEAN('s', "stat", &record.opts.inherit_stat,
                    "per thread counts"),
        OPT_BOOLEAN('d', "data", &record.opts.sample_address, "Record the 
sample addresses"),
+       OPT_BOOLEAN(0, "hazard", &record.opts.hazard, "Record processor 
pipeline hazard and stall information"),
        OPT_BOOLEAN(0, "phys-data", &record.opts.sample_phys_addr,
                    "Record the sample physical addresses"),
        OPT_BOOLEAN(0, "sample-cpu", &record.opts.sample_cpu, "Record the 
sample cpu"),
diff --git a/tools/perf/util/event.h b/tools/perf/util/event.h
index 85223159737c..ff0f03253a95 100644
--- a/tools/perf/util/event.h
+++ b/tools/perf/util/event.h
@@ -148,6 +148,7 @@ struct perf_sample {
        struct stack_dump user_stack;
        struct sample_read read;
        struct aux_sample aux_sample;
+       struct perf_pipeline_haz_data *pipeline_haz;
 };
 
 #define PERF_MEM_DATA_SRC_NONE \
diff --git a/tools/perf/util/evsel.c b/tools/perf/util/evsel.c
index c8dc4450884c..e37ed7929c2c 100644
--- a/tools/perf/util/evsel.c
+++ b/tools/perf/util/evsel.c
@@ -1080,6 +1080,9 @@ void perf_evsel__config(struct evsel *evsel, struct record_opts *opts,
        if (opts->sample_phys_addr)
                perf_evsel__set_sample_bit(evsel, PHYS_ADDR);
 
+       if (opts->hazard)
+               perf_evsel__set_sample_bit(evsel, PIPELINE_HAZ);
+
        if (opts->no_buffering) {
                attr->watermark = 0;
                attr->wakeup_events = 1;
@@ -2265,6 +2268,13 @@ int perf_evsel__parse_sample(struct evsel *evsel, union perf_event *event,
                array = (void *)array + sz;
        }
 
+       if (type & PERF_SAMPLE_PIPELINE_HAZ) {
+               sz = sizeof(struct perf_pipeline_haz_data);
+               OVERFLOW_CHECK(array, sz, max_size);
+               data->pipeline_haz = (struct perf_pipeline_haz_data *)array;
+               array = (void *)array + sz;
+       }
+
        return 0;
 }
 
diff --git a/tools/perf/util/perf_event_attr_fprintf.c b/tools/perf/util/perf_event_attr_fprintf.c
index 651203126c71..d97e755c886b 100644
--- a/tools/perf/util/perf_event_attr_fprintf.c
+++ b/tools/perf/util/perf_event_attr_fprintf.c
@@ -35,6 +35,7 @@ static void __p_sample_type(char *buf, size_t size, u64 value)
                bit_name(BRANCH_STACK), bit_name(REGS_USER), 
bit_name(STACK_USER),
                bit_name(IDENTIFIER), bit_name(REGS_INTR), bit_name(DATA_SRC),
                bit_name(WEIGHT), bit_name(PHYS_ADDR), bit_name(AUX),
+               bit_name(PIPELINE_HAZ),
                { .name = NULL, }
        };
 #undef bit_name
diff --git a/tools/perf/util/record.h b/tools/perf/util/record.h
index 5421fd2ad383..f1678a0bc8ce 100644
--- a/tools/perf/util/record.h
+++ b/tools/perf/util/record.h
@@ -67,6 +67,7 @@ struct record_opts {
        int           affinity;
        int           mmap_flush;
        unsigned int  comp_level;
+       bool          hazard;
 };
 
 extern const char * const *record_usage;
diff --git a/tools/perf/util/session.c b/tools/perf/util/session.c
index d0d7d25b23e3..834ca7df2349 100644
--- a/tools/perf/util/session.c
+++ b/tools/perf/util/session.c
@@ -1153,6 +1153,19 @@ static void stack_user__printf(struct stack_dump *dump)
               dump->size, dump->offset);
 }
 
+static void pipeline_hazard__printf(struct perf_sample *sample)
+{
+       struct perf_pipeline_haz_data *haz = sample->pipeline_haz;
+
+       printf("... hazard information:\n");
+       printf(".... Inst Type 0x%" PRIx32 "\n", haz->itype);
+       printf(".... Inst Cache 0x%" PRIx32 "\n", haz->icache);
+       printf(".... Hazard Stage 0x%" PRIx32 "\n", haz->hazard_stage);
+       printf(".... Hazard Reason 0x%" PRIx32 "\n", haz->hazard_reason);
+       printf(".... Stall Stage 0x%" PRIx32 "\n", haz->stall_stage);
+       printf(".... Stall Reason 0x%" PRIx32 "\n", haz->stall_reason);
+}
+
 static void perf_evlist__print_tstamp(struct evlist *evlist,
                                       union perf_event *event,
                                       struct perf_sample *sample)
@@ -1251,6 +1264,9 @@ static void dump_sample(struct evsel *evsel, union perf_event *event,
        if (sample_type & PERF_SAMPLE_STACK_USER)
                stack_user__printf(&sample->user_stack);
 
+       if (sample_type & PERF_SAMPLE_PIPELINE_HAZ)
+               pipeline_hazard__printf(sample);
+
        if (sample_type & PERF_SAMPLE_WEIGHT)
                printf("... weight: %" PRIu64 "\n", sample->weight);
 
-- 
2.21.1

Reply via email to