Em Thu, May 28, 2020 at 03:08:58PM +0300, Adrian Hunter escreveu: > Context switch events are added automatically by Intel PT and Coresight. > Make it possible to suppress them. That is useful for tracing the > scheduler without the disturbance that the switch event processing > creates. > > Example: > > Prerequisites: > > $ which perf > ~/bin/perf > $ sudo setcap > "cap_sys_rawio,cap_sys_admin,cap_sys_ptrace,cap_syslog,cap_ipc_lock=ep" > ~/bin/perf > $ sudo chmod +r /proc/kcore > > Before: > > $ perf record --no-switch-events --kcore -a -e intel_pt//k -- sleep 0.001 > [ perf record: Woken up 1 times to write data ] > [ perf record: Captured and wrote 0.938 MB perf.data ] > $ perf script -D | grep PERF_RECORD_SWITCH | wc -l > 572 > > After: > > $ perf record --no-switch-events --kcore -a -e intel_pt//k -- sleep 0.001 > Warning: > Intel Processor Trace decoding will not be possible except for kernel > tracing! > [ perf record: Woken up 1 times to write data ] > [ perf record: Captured and wrote 0.838 MB perf.data ] > $ perf script -D | grep PERF_RECORD_SWITCH | wc -l > 0 > > $ sudo chmod go-r /proc/kcore > $ sudo setcap -r ~/bin/perf
Thanks, tested as root and applied. - Arnaldo > Signed-off-by: Adrian Hunter <[email protected]> > --- > tools/perf/Documentation/perf-record.txt | 4 +++- > tools/perf/arch/arm/util/cs-etm.c | 3 ++- > tools/perf/arch/x86/util/intel-pt.c | 3 ++- > tools/perf/builtin-record.c | 5 +++-- > tools/perf/util/record.h | 6 ++++++ > 5 files changed, 16 insertions(+), 5 deletions(-) > > diff --git a/tools/perf/Documentation/perf-record.txt > b/tools/perf/Documentation/perf-record.txt > index 561ef55743e2..97b1a866ab22 100644 > --- a/tools/perf/Documentation/perf-record.txt > +++ b/tools/perf/Documentation/perf-record.txt > @@ -458,7 +458,9 @@ This option sets the time out limit. The default value is > 500 ms. > > --switch-events:: > Record context switch events i.e. events of type PERF_RECORD_SWITCH or > -PERF_RECORD_SWITCH_CPU_WIDE. > +PERF_RECORD_SWITCH_CPU_WIDE. In some cases (e.g. Intel PT or CoreSight) > +switch events will be enabled automatically, which can be suppressed > +by the option --no-switch-events. > > --clang-path=PATH:: > Path to clang binary to use for compiling BPF scriptlets. 
> diff --git a/tools/perf/arch/arm/util/cs-etm.c > b/tools/perf/arch/arm/util/cs-etm.c > index 607499b41bea..cea5e33d61d2 100644 > --- a/tools/perf/arch/arm/util/cs-etm.c > +++ b/tools/perf/arch/arm/util/cs-etm.c > @@ -265,7 +265,8 @@ static int cs_etm_recording_options(struct > auxtrace_record *itr, > ptr->evlist = evlist; > ptr->snapshot_mode = opts->auxtrace_snapshot_mode; > > - if (perf_can_record_switch_events()) > + if (!record_opts__no_switch_events(opts) && > + perf_can_record_switch_events()) > opts->record_switch_events = true; > > evlist__for_each_entry(evlist, evsel) { > diff --git a/tools/perf/arch/x86/util/intel-pt.c > b/tools/perf/arch/x86/util/intel-pt.c > index fdb917fcf511..3fc547769707 100644 > --- a/tools/perf/arch/x86/util/intel-pt.c > +++ b/tools/perf/arch/x86/util/intel-pt.c > @@ -779,7 +779,8 @@ static int intel_pt_recording_options(struct > auxtrace_record *itr, > * Per-cpu recording needs sched_switch events to distinguish different > * threads. > */ > - if (have_timing_info && !perf_cpu_map__empty(cpus)) { > + if (have_timing_info && !perf_cpu_map__empty(cpus) && > + !record_opts__no_switch_events(opts)) { > if (perf_can_record_switch_events()) { > bool cpu_wide = !target__none(&opts->target) && > !target__has_task(&opts->target); > diff --git a/tools/perf/builtin-record.c b/tools/perf/builtin-record.c > index 02d85f4e4517..dc6d5ba2fff8 100644 > --- a/tools/perf/builtin-record.c > +++ b/tools/perf/builtin-record.c > @@ -2490,8 +2490,9 @@ static struct option __record_options[] = { > "Record namespaces events"), > OPT_BOOLEAN(0, "all-cgroups", &record.opts.record_cgroup, > "Record cgroup events"), > - OPT_BOOLEAN(0, "switch-events", &record.opts.record_switch_events, > - "Record context switch events"), > + OPT_BOOLEAN_SET(0, "switch-events", &record.opts.record_switch_events, > + &record.opts.record_switch_events_set, > + "Record context switch events"), > OPT_BOOLEAN_FLAG(0, "all-kernel", &record.opts.all_kernel, > "Configure all used 
events to run in kernel space.", > PARSE_OPT_EXCLUSIVE), > diff --git a/tools/perf/util/record.h b/tools/perf/util/record.h > index dce6332f5071..84dbbc3f0204 100644 > --- a/tools/perf/util/record.h > +++ b/tools/perf/util/record.h > @@ -36,6 +36,7 @@ struct record_opts { > bool record_namespaces; > bool record_cgroup; > bool record_switch_events; > + bool record_switch_events_set; > bool all_kernel; > bool all_user; > bool kernel_callchains; > @@ -77,4 +78,9 @@ extern struct option *record_options; > > int record__parse_freq(const struct option *opt, const char *str, int unset); > > +static inline bool record_opts__no_switch_events(const struct record_opts > *opts) > +{ > + return opts->record_switch_events_set && !opts->record_switch_events; > +} > + > #endif // _PERF_RECORD_H > -- > 2.17.1 > -- - Arnaldo

