Commit 23acd3e1 authored by Ingo Molnar

Merge tag 'perf-core-for-mingo-4.13-20170630' of...

Merge tag 'perf-core-for-mingo-4.13-20170630' of git://git.kernel.org/pub/scm/linux/kernel/git/acme/linux into perf/core

Pull perf/core improvements and fixes from Arnaldo Carvalho de Melo:

Intel PT enhancements:

 - Support "ptwrite" instruction, a way to stuff 32 or 64 bit values into
   the Intel PT trace (Adrian Hunter)

 - Support power events in Intel PT to report changes to C-state (Adrian
   Hunter)

 - Synthesize Intel PT events as PERF_RECORD_SAMPLE records with a
   perf_event_attr.type (PERF_TYPE_SYNTH) just after the range used by the
   kernel, i.e. right after what is allocated for PMUs, at INT_MAX + 1U,
   attr.config will have the identification for the synthesized event and
   the PERF_SAMPLE_RAW payload will have its fields (Adrian Hunter)

Infrastructure changes:

 - Remove warning() and error(), using instead pr_warning() and
   pr_error(), consolidating error reporting (Arnaldo Carvalho de Melo)

 - Add platform dependency to 'perf test 15' (Thomas Richter)
Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com>
Signed-off-by: Ingo Molnar <mingo@kernel.org>
parents e91c8d97 644e0840
...@@ -1009,7 +1009,7 @@ GrpTable: Grp15 ...@@ -1009,7 +1009,7 @@ GrpTable: Grp15
1: fxstor | RDGSBASE Ry (F3),(11B) 1: fxstor | RDGSBASE Ry (F3),(11B)
2: vldmxcsr Md (v1) | WRFSBASE Ry (F3),(11B) 2: vldmxcsr Md (v1) | WRFSBASE Ry (F3),(11B)
3: vstmxcsr Md (v1) | WRGSBASE Ry (F3),(11B) 3: vstmxcsr Md (v1) | WRGSBASE Ry (F3),(11B)
4: XSAVE 4: XSAVE | ptwrite Ey (F3),(11B)
5: XRSTOR | lfence (11B) 5: XRSTOR | lfence (11B)
6: XSAVEOPT | clwb (66) | mfence (11B) 6: XSAVEOPT | clwb (66) | mfence (11B)
7: clflush | clflushopt (66) | sfence (11B) 7: clflush | clflushopt (66) | sfence (11B)
......
...@@ -5,6 +5,8 @@ ...@@ -5,6 +5,8 @@
#include <stddef.h> #include <stddef.h>
#include <assert.h> #include <assert.h>
#include <linux/compiler.h> #include <linux/compiler.h>
#include <endian.h>
#include <byteswap.h>
#ifndef UINT_MAX #ifndef UINT_MAX
#define UINT_MAX (~0U) #define UINT_MAX (~0U)
...@@ -67,12 +69,33 @@ ...@@ -67,12 +69,33 @@
#endif #endif
#endif #endif
/* #if __BYTE_ORDER == __BIG_ENDIAN
* Both need more care to handle endianness #define cpu_to_le16 bswap_16
* (Don't use bitmap_copy_le() for now) #define cpu_to_le32 bswap_32
*/ #define cpu_to_le64 bswap_64
#define cpu_to_le64(x) (x) #define le16_to_cpu bswap_16
#define cpu_to_le32(x) (x) #define le32_to_cpu bswap_32
#define le64_to_cpu bswap_64
#define cpu_to_be16
#define cpu_to_be32
#define cpu_to_be64
#define be16_to_cpu
#define be32_to_cpu
#define be64_to_cpu
#else
#define cpu_to_le16
#define cpu_to_le32
#define cpu_to_le64
#define le16_to_cpu
#define le32_to_cpu
#define le64_to_cpu
#define cpu_to_be16 bswap_16
#define cpu_to_be32 bswap_32
#define cpu_to_be64 bswap_64
#define be16_to_cpu bswap_16
#define be32_to_cpu bswap_32
#define be64_to_cpu bswap_64
#endif
int vscnprintf(char *buf, size_t size, const char *fmt, va_list args); int vscnprintf(char *buf, size_t size, const char *fmt, va_list args);
int scnprintf(char * buf, size_t size, const char * fmt, ...); int scnprintf(char * buf, size_t size, const char * fmt, ...);
......
...@@ -1009,7 +1009,7 @@ GrpTable: Grp15 ...@@ -1009,7 +1009,7 @@ GrpTable: Grp15
1: fxstor | RDGSBASE Ry (F3),(11B) 1: fxstor | RDGSBASE Ry (F3),(11B)
2: vldmxcsr Md (v1) | WRFSBASE Ry (F3),(11B) 2: vldmxcsr Md (v1) | WRFSBASE Ry (F3),(11B)
3: vstmxcsr Md (v1) | WRGSBASE Ry (F3),(11B) 3: vstmxcsr Md (v1) | WRGSBASE Ry (F3),(11B)
4: XSAVE 4: XSAVE | ptwrite Ey (F3),(11B)
5: XRSTOR | lfence (11B) 5: XRSTOR | lfence (11B)
6: XSAVEOPT | clwb (66) | mfence (11B) 6: XSAVEOPT | clwb (66) | mfence (11B)
7: clflush | clflushopt (66) | sfence (11B) 7: clflush | clflushopt (66) | sfence (11B)
......
...@@ -108,6 +108,9 @@ approach is available to export the data to a postgresql database. Refer to ...@@ -108,6 +108,9 @@ approach is available to export the data to a postgresql database. Refer to
script export-to-postgresql.py for more details, and to script script export-to-postgresql.py for more details, and to script
call-graph-from-postgresql.py for an example of using the database. call-graph-from-postgresql.py for an example of using the database.
There is also script intel-pt-events.py which provides an example of how to
unpack the raw data for power events and PTWRITE.
As mentioned above, it is easy to capture too much data. One way to limit the As mentioned above, it is easy to capture too much data. One way to limit the
data captured is to use 'snapshot' mode which is explained further below. data captured is to use 'snapshot' mode which is explained further below.
Refer to 'new snapshot option' and 'Intel PT modes of operation' further below. Refer to 'new snapshot option' and 'Intel PT modes of operation' further below.
...@@ -710,13 +713,15 @@ Having no option is the same as ...@@ -710,13 +713,15 @@ Having no option is the same as
which, in turn, is the same as which, in turn, is the same as
--itrace=ibxe --itrace=ibxwpe
The letters are: The letters are:
i synthesize "instructions" events i synthesize "instructions" events
b synthesize "branches" events b synthesize "branches" events
x synthesize "transactions" events x synthesize "transactions" events
w synthesize "ptwrite" events
p synthesize "power" events
c synthesize branches events (calls only) c synthesize branches events (calls only)
r synthesize branches events (returns only) r synthesize branches events (returns only)
e synthesize tracing error events e synthesize tracing error events
...@@ -735,7 +740,40 @@ and "r" can be combined to get calls and returns. ...@@ -735,7 +740,40 @@ and "r" can be combined to get calls and returns.
'flags' field can be used in perf script to determine whether the event is a 'flags' field can be used in perf script to determine whether the event is a
transaction start, commit or abort. transaction start, commit or abort.
Error events are new. They show where the decoder lost the trace. Error events Note that "instructions", "branches" and "transactions" events depend on code
flow packets which can be disabled by using the config term "branch=0". Refer
to the config terms section above.
"ptwrite" events record the payload of the ptwrite instruction and whether
"fup_on_ptw" was used. "ptwrite" events depend on PTWRITE packets which are
recorded only if the "ptw" config term was used. Refer to the config terms
section above. perf script "synth" field displays "ptwrite" information like
this: "ip: 0 payload: 0x123456789abcdef0" where "ip" is 1 if "fup_on_ptw" was
used.
"Power" events correspond to power event packets and CBR (core-to-bus ratio)
packets. While CBR packets are always recorded when tracing is enabled, power
event packets are recorded only if the "pwr_evt" config term was used. Refer to
the config terms section above. The power events record information about
C-state changes, whereas CBR is indicative of CPU frequency. perf script
"event,synth" fields display information like this:
cbr: cbr: 22 freq: 2189 MHz (200%)
mwait: hints: 0x60 extensions: 0x1
pwre: hw: 0 cstate: 2 sub-cstate: 0
exstop: ip: 1
pwrx: deepest cstate: 2 last cstate: 2 wake reason: 0x4
Where:
"cbr" includes the frequency and the percentage of maximum non-turbo
"mwait" shows mwait hints and extensions
"pwre" shows C-state transitions (to a C-state deeper than C0) and
whether initiated by hardware
"exstop" indicates execution stopped and whether the IP was recorded
exactly
"pwrx" indicates return to C0
For more details refer to the Intel 64 and IA-32 Architectures Software
Developer Manuals.
Error events show where the decoder lost the trace. Error events
are quite important. Users must know if what they are seeing is a complete are quite important. Users must know if what they are seeing is a complete
picture or not. picture or not.
......
...@@ -3,13 +3,15 @@ ...@@ -3,13 +3,15 @@
c synthesize branches events (calls only) c synthesize branches events (calls only)
r synthesize branches events (returns only) r synthesize branches events (returns only)
x synthesize transactions events x synthesize transactions events
w synthesize ptwrite events
p synthesize power events
e synthesize error events e synthesize error events
d create a debug log d create a debug log
g synthesize a call chain (use with i or x) g synthesize a call chain (use with i or x)
l synthesize last branch entries (use with i or x) l synthesize last branch entries (use with i or x)
s skip initial number of events s skip initial number of events
The default is all events i.e. the same as --itrace=ibxe The default is all events i.e. the same as --itrace=ibxwpe
In addition, the period (default 100000) for instructions events In addition, the period (default 100000) for instructions events
can be specified in units of: can be specified in units of:
...@@ -26,8 +28,8 @@ ...@@ -26,8 +28,8 @@
Also the number of last branch entries (default 64, max. 1024) for Also the number of last branch entries (default 64, max. 1024) for
instructions or transactions events can be specified. instructions or transactions events can be specified.
It is also possible to skip events generated (instructions, branches, transactions) It is also possible to skip events generated (instructions, branches, transactions,
at the beginning. This is useful to ignore initialization code. ptwrite, power) at the beginning. This is useful to ignore initialization code.
--itrace=i0nss1000000 --itrace=i0nss1000000
......
...@@ -117,7 +117,8 @@ OPTIONS ...@@ -117,7 +117,8 @@ OPTIONS
Comma separated list of fields to print. Options are: Comma separated list of fields to print. Options are:
comm, tid, pid, time, cpu, event, trace, ip, sym, dso, addr, symoff, comm, tid, pid, time, cpu, event, trace, ip, sym, dso, addr, symoff,
srcline, period, iregs, brstack, brstacksym, flags, bpf-output, brstackinsn, brstackoff, srcline, period, iregs, brstack, brstacksym, flags, bpf-output, brstackinsn, brstackoff,
callindent, insn, insnlen. Field list can be prepended with the type, trace, sw or hw, callindent, insn, insnlen, synth.
Field list can be prepended with the type, trace, sw or hw,
to indicate to which event type the field list applies. to indicate to which event type the field list applies.
e.g., -F sw:comm,tid,time,ip,sym and -F trace:time,cpu,trace e.g., -F sw:comm,tid,time,ip,sym and -F trace:time,cpu,trace
...@@ -193,6 +194,9 @@ OPTIONS ...@@ -193,6 +194,9 @@ OPTIONS
instruction bytes and the instruction length of the current instruction bytes and the instruction length of the current
instruction. instruction.
The synth field is used by synthesized events which may be created when
decoding an Instruction Trace.
Finally, a user may not set fields to none for all event types. Finally, a user may not set fields to none for all event types.
i.e., -F "" is not allowed. i.e., -F "" is not allowed.
......
...@@ -1664,3 +1664,15 @@ ...@@ -1664,3 +1664,15 @@
"0f c7 1d 78 56 34 12 \txrstors 0x12345678",}, "0f c7 1d 78 56 34 12 \txrstors 0x12345678",},
{{0x0f, 0xc7, 0x9c, 0xc8, 0x78, 0x56, 0x34, 0x12, }, 8, 0, "", "", {{0x0f, 0xc7, 0x9c, 0xc8, 0x78, 0x56, 0x34, 0x12, }, 8, 0, "", "",
"0f c7 9c c8 78 56 34 12 \txrstors 0x12345678(%eax,%ecx,8)",}, "0f c7 9c c8 78 56 34 12 \txrstors 0x12345678(%eax,%ecx,8)",},
{{0xf3, 0x0f, 0xae, 0x20, }, 4, 0, "", "",
"f3 0f ae 20 \tptwritel (%eax)",},
{{0xf3, 0x0f, 0xae, 0x25, 0x78, 0x56, 0x34, 0x12, }, 8, 0, "", "",
"f3 0f ae 25 78 56 34 12 \tptwritel 0x12345678",},
{{0xf3, 0x0f, 0xae, 0xa4, 0xc8, 0x78, 0x56, 0x34, 0x12, }, 9, 0, "", "",
"f3 0f ae a4 c8 78 56 34 12 \tptwritel 0x12345678(%eax,%ecx,8)",},
{{0xf3, 0x0f, 0xae, 0x20, }, 4, 0, "", "",
"f3 0f ae 20 \tptwritel (%eax)",},
{{0xf3, 0x0f, 0xae, 0x25, 0x78, 0x56, 0x34, 0x12, }, 8, 0, "", "",
"f3 0f ae 25 78 56 34 12 \tptwritel 0x12345678",},
{{0xf3, 0x0f, 0xae, 0xa4, 0xc8, 0x78, 0x56, 0x34, 0x12, }, 9, 0, "", "",
"f3 0f ae a4 c8 78 56 34 12 \tptwritel 0x12345678(%eax,%ecx,8)",},
...@@ -1696,3 +1696,33 @@ ...@@ -1696,3 +1696,33 @@
"0f c7 9c c8 78 56 34 12 \txrstors 0x12345678(%rax,%rcx,8)",}, "0f c7 9c c8 78 56 34 12 \txrstors 0x12345678(%rax,%rcx,8)",},
{{0x41, 0x0f, 0xc7, 0x9c, 0xc8, 0x78, 0x56, 0x34, 0x12, }, 9, 0, "", "", {{0x41, 0x0f, 0xc7, 0x9c, 0xc8, 0x78, 0x56, 0x34, 0x12, }, 9, 0, "", "",
"41 0f c7 9c c8 78 56 34 12 \txrstors 0x12345678(%r8,%rcx,8)",}, "41 0f c7 9c c8 78 56 34 12 \txrstors 0x12345678(%r8,%rcx,8)",},
{{0xf3, 0x0f, 0xae, 0x20, }, 4, 0, "", "",
"f3 0f ae 20 \tptwritel (%rax)",},
{{0xf3, 0x41, 0x0f, 0xae, 0x20, }, 5, 0, "", "",
"f3 41 0f ae 20 \tptwritel (%r8)",},
{{0xf3, 0x0f, 0xae, 0x24, 0x25, 0x78, 0x56, 0x34, 0x12, }, 9, 0, "", "",
"f3 0f ae 24 25 78 56 34 12 \tptwritel 0x12345678",},
{{0xf3, 0x0f, 0xae, 0xa4, 0xc8, 0x78, 0x56, 0x34, 0x12, }, 9, 0, "", "",
"f3 0f ae a4 c8 78 56 34 12 \tptwritel 0x12345678(%rax,%rcx,8)",},
{{0xf3, 0x41, 0x0f, 0xae, 0xa4, 0xc8, 0x78, 0x56, 0x34, 0x12, }, 10, 0, "", "",
"f3 41 0f ae a4 c8 78 56 34 12 \tptwritel 0x12345678(%r8,%rcx,8)",},
{{0xf3, 0x0f, 0xae, 0x20, }, 4, 0, "", "",
"f3 0f ae 20 \tptwritel (%rax)",},
{{0xf3, 0x41, 0x0f, 0xae, 0x20, }, 5, 0, "", "",
"f3 41 0f ae 20 \tptwritel (%r8)",},
{{0xf3, 0x0f, 0xae, 0x24, 0x25, 0x78, 0x56, 0x34, 0x12, }, 9, 0, "", "",
"f3 0f ae 24 25 78 56 34 12 \tptwritel 0x12345678",},
{{0xf3, 0x0f, 0xae, 0xa4, 0xc8, 0x78, 0x56, 0x34, 0x12, }, 9, 0, "", "",
"f3 0f ae a4 c8 78 56 34 12 \tptwritel 0x12345678(%rax,%rcx,8)",},
{{0xf3, 0x41, 0x0f, 0xae, 0xa4, 0xc8, 0x78, 0x56, 0x34, 0x12, }, 10, 0, "", "",
"f3 41 0f ae a4 c8 78 56 34 12 \tptwritel 0x12345678(%r8,%rcx,8)",},
{{0xf3, 0x48, 0x0f, 0xae, 0x20, }, 5, 0, "", "",
"f3 48 0f ae 20 \tptwriteq (%rax)",},
{{0xf3, 0x49, 0x0f, 0xae, 0x20, }, 5, 0, "", "",
"f3 49 0f ae 20 \tptwriteq (%r8)",},
{{0xf3, 0x48, 0x0f, 0xae, 0x24, 0x25, 0x78, 0x56, 0x34, 0x12, }, 10, 0, "", "",
"f3 48 0f ae 24 25 78 56 34 12 \tptwriteq 0x12345678",},
{{0xf3, 0x48, 0x0f, 0xae, 0xa4, 0xc8, 0x78, 0x56, 0x34, 0x12, }, 10, 0, "", "",
"f3 48 0f ae a4 c8 78 56 34 12 \tptwriteq 0x12345678(%rax,%rcx,8)",},
{{0xf3, 0x49, 0x0f, 0xae, 0xa4, 0xc8, 0x78, 0x56, 0x34, 0x12, }, 10, 0, "", "",
"f3 49 0f ae a4 c8 78 56 34 12 \tptwriteq 0x12345678(%r8,%rcx,8)",},
...@@ -1343,6 +1343,26 @@ int main(void) ...@@ -1343,6 +1343,26 @@ int main(void)
asm volatile("xrstors 0x12345678(%rax,%rcx,8)"); asm volatile("xrstors 0x12345678(%rax,%rcx,8)");
asm volatile("xrstors 0x12345678(%r8,%rcx,8)"); asm volatile("xrstors 0x12345678(%r8,%rcx,8)");
/* ptwrite */
asm volatile("ptwrite (%rax)");
asm volatile("ptwrite (%r8)");
asm volatile("ptwrite (0x12345678)");
asm volatile("ptwrite 0x12345678(%rax,%rcx,8)");
asm volatile("ptwrite 0x12345678(%r8,%rcx,8)");
asm volatile("ptwritel (%rax)");
asm volatile("ptwritel (%r8)");
asm volatile("ptwritel (0x12345678)");
asm volatile("ptwritel 0x12345678(%rax,%rcx,8)");
asm volatile("ptwritel 0x12345678(%r8,%rcx,8)");
asm volatile("ptwriteq (%rax)");
asm volatile("ptwriteq (%r8)");
asm volatile("ptwriteq (0x12345678)");
asm volatile("ptwriteq 0x12345678(%rax,%rcx,8)");
asm volatile("ptwriteq 0x12345678(%r8,%rcx,8)");
#else /* #ifdef __x86_64__ */ #else /* #ifdef __x86_64__ */
/* bound r32, mem (same op code as EVEX prefix) */ /* bound r32, mem (same op code as EVEX prefix) */
...@@ -2653,6 +2673,16 @@ int main(void) ...@@ -2653,6 +2673,16 @@ int main(void)
asm volatile("xrstors (0x12345678)"); asm volatile("xrstors (0x12345678)");
asm volatile("xrstors 0x12345678(%eax,%ecx,8)"); asm volatile("xrstors 0x12345678(%eax,%ecx,8)");
/* ptwrite */
asm volatile("ptwrite (%eax)");
asm volatile("ptwrite (0x12345678)");
asm volatile("ptwrite 0x12345678(%eax,%ecx,8)");
asm volatile("ptwritel (%eax)");
asm volatile("ptwritel (0x12345678)");
asm volatile("ptwritel 0x12345678(%eax,%ecx,8)");
#endif /* #ifndef __x86_64__ */ #endif /* #ifndef __x86_64__ */
/* Following line is a marker for the awk script - do not change */ /* Following line is a marker for the awk script - do not change */
......
...@@ -1725,10 +1725,10 @@ static int c2c_hists__init_sort(struct perf_hpp_list *hpp_list, char *name) ...@@ -1725,10 +1725,10 @@ static int c2c_hists__init_sort(struct perf_hpp_list *hpp_list, char *name)
tok; tok = strtok_r(NULL, ", ", &tmp)) { \ tok; tok = strtok_r(NULL, ", ", &tmp)) { \
ret = _fn(hpp_list, tok); \ ret = _fn(hpp_list, tok); \
if (ret == -EINVAL) { \ if (ret == -EINVAL) { \
error("Invalid --fields key: `%s'", tok); \ pr_err("Invalid --fields key: `%s'", tok); \
break; \ break; \
} else if (ret == -ESRCH) { \ } else if (ret == -ESRCH) { \
error("Unknown --fields key: `%s'", tok); \ pr_err("Unknown --fields key: `%s'", tok); \
break; \ break; \
} \ } \
} \ } \
......
...@@ -1302,7 +1302,10 @@ static int diff__config(const char *var, const char *value, ...@@ -1302,7 +1302,10 @@ static int diff__config(const char *var, const char *value,
void *cb __maybe_unused) void *cb __maybe_unused)
{ {
if (!strcmp(var, "diff.order")) { if (!strcmp(var, "diff.order")) {
sort_compute = perf_config_int(var, value); int ret;
if (perf_config_int(&ret, var, value) < 0)
return -1;
sort_compute = ret;
return 0; return 0;
} }
if (!strcmp(var, "diff.compute")) { if (!strcmp(var, "diff.compute")) {
......
...@@ -108,10 +108,14 @@ static int check_emacsclient_version(void) ...@@ -108,10 +108,14 @@ static int check_emacsclient_version(void)
return ret; return ret;
} }
static void exec_woman_emacs(const char *path, const char *page) static void exec_failed(const char *cmd)
{ {
char sbuf[STRERR_BUFSIZE]; char sbuf[STRERR_BUFSIZE];
pr_warning("failed to exec '%s': %s", cmd, str_error_r(errno, sbuf, sizeof(sbuf)));
}
static void exec_woman_emacs(const char *path, const char *page)
{
if (!check_emacsclient_version()) { if (!check_emacsclient_version()) {
/* This works only with emacsclient version >= 22. */ /* This works only with emacsclient version >= 22. */
char *man_page; char *man_page;
...@@ -122,8 +126,7 @@ static void exec_woman_emacs(const char *path, const char *page) ...@@ -122,8 +126,7 @@ static void exec_woman_emacs(const char *path, const char *page)
execlp(path, "emacsclient", "-e", man_page, NULL); execlp(path, "emacsclient", "-e", man_page, NULL);
free(man_page); free(man_page);
} }
warning("failed to exec '%s': %s", path, exec_failed(path);
str_error_r(errno, sbuf, sizeof(sbuf)));
} }
} }
...@@ -134,7 +137,6 @@ static void exec_man_konqueror(const char *path, const char *page) ...@@ -134,7 +137,6 @@ static void exec_man_konqueror(const char *path, const char *page)
if (display && *display) { if (display && *display) {
char *man_page; char *man_page;
const char *filename = "kfmclient"; const char *filename = "kfmclient";
char sbuf[STRERR_BUFSIZE];
/* It's simpler to launch konqueror using kfmclient. */ /* It's simpler to launch konqueror using kfmclient. */
if (path) { if (path) {
...@@ -155,33 +157,27 @@ static void exec_man_konqueror(const char *path, const char *page) ...@@ -155,33 +157,27 @@ static void exec_man_konqueror(const char *path, const char *page)
execlp(path, filename, "newTab", man_page, NULL); execlp(path, filename, "newTab", man_page, NULL);
free(man_page); free(man_page);
} }
warning("failed to exec '%s': %s", path, exec_failed(path);
str_error_r(errno, sbuf, sizeof(sbuf)));
} }
} }
static void exec_man_man(const char *path, const char *page) static void exec_man_man(const char *path, const char *page)
{ {
char sbuf[STRERR_BUFSIZE];
if (!path) if (!path)
path = "man"; path = "man";
execlp(path, "man", page, NULL); execlp(path, "man", page, NULL);
warning("failed to exec '%s': %s", path, exec_failed(path);
str_error_r(errno, sbuf, sizeof(sbuf)));
} }
static void exec_man_cmd(const char *cmd, const char *page) static void exec_man_cmd(const char *cmd, const char *page)
{ {
char sbuf[STRERR_BUFSIZE];
char *shell_cmd; char *shell_cmd;
if (asprintf(&shell_cmd, "%s %s", cmd, page) > 0) { if (asprintf(&shell_cmd, "%s %s", cmd, page) > 0) {
execl("/bin/sh", "sh", "-c", shell_cmd, NULL); execl("/bin/sh", "sh", "-c", shell_cmd, NULL);
free(shell_cmd); free(shell_cmd);
} }
warning("failed to exec '%s': %s", cmd, exec_failed(cmd);
str_error_r(errno, sbuf, sizeof(sbuf)));
} }
static void add_man_viewer(const char *name) static void add_man_viewer(const char *name)
...@@ -214,6 +210,12 @@ static void do_add_man_viewer_info(const char *name, ...@@ -214,6 +210,12 @@ static void do_add_man_viewer_info(const char *name,
man_viewer_info_list = new; man_viewer_info_list = new;
} }
static void unsupported_man_viewer(const char *name, const char *var)
{
pr_warning("'%s': path for unsupported man viewer.\n"
"Please consider using 'man.<tool>.%s' instead.", name, var);
}
static int add_man_viewer_path(const char *name, static int add_man_viewer_path(const char *name,
size_t len, size_t len,
const char *value) const char *value)
...@@ -221,9 +223,7 @@ static int add_man_viewer_path(const char *name, ...@@ -221,9 +223,7 @@ static int add_man_viewer_path(const char *name,
if (supported_man_viewer(name, len)) if (supported_man_viewer(name, len))
do_add_man_viewer_info(name, len, value); do_add_man_viewer_info(name, len, value);
else else
warning("'%s': path for unsupported man viewer.\n" unsupported_man_viewer(name, "cmd");
"Please consider using 'man.<tool>.cmd' instead.",
name);
return 0; return 0;
} }
...@@ -233,9 +233,7 @@ static int add_man_viewer_cmd(const char *name, ...@@ -233,9 +233,7 @@ static int add_man_viewer_cmd(const char *name,
const char *value) const char *value)
{ {
if (supported_man_viewer(name, len)) if (supported_man_viewer(name, len))
warning("'%s': cmd for supported man viewer.\n" unsupported_man_viewer(name, "path");
"Please consider using 'man.<tool>.path' instead.",
name);
else else
do_add_man_viewer_info(name, len, value); do_add_man_viewer_info(name, len, value);
...@@ -247,8 +245,10 @@ static int add_man_viewer_info(const char *var, const char *value) ...@@ -247,8 +245,10 @@ static int add_man_viewer_info(const char *var, const char *value)
const char *name = var + 4; const char *name = var + 4;
const char *subkey = strrchr(name, '.'); const char *subkey = strrchr(name, '.');
if (!subkey) if (!subkey) {
return error("Config with no key for man viewer: %s", name); pr_err("Config with no key for man viewer: %s", name);
return -1;
}
if (!strcmp(subkey, ".path")) { if (!strcmp(subkey, ".path")) {
if (!value) if (!value)
...@@ -261,7 +261,7 @@ static int add_man_viewer_info(const char *var, const char *value) ...@@ -261,7 +261,7 @@ static int add_man_viewer_info(const char *var, const char *value)
return add_man_viewer_cmd(name, subkey - name, value); return add_man_viewer_cmd(name, subkey - name, value);
} }
warning("'%s': unsupported man viewer sub key.", subkey); pr_warning("'%s': unsupported man viewer sub key.", subkey);
return 0; return 0;
} }
...@@ -332,7 +332,7 @@ static void setup_man_path(void) ...@@ -332,7 +332,7 @@ static void setup_man_path(void)
setenv("MANPATH", new_path, 1); setenv("MANPATH", new_path, 1);
free(new_path); free(new_path);
} else { } else {
error("Unable to setup man path"); pr_err("Unable to setup man path");
} }
} }
...@@ -349,7 +349,7 @@ static void exec_viewer(const char *name, const char *page) ...@@ -349,7 +349,7 @@ static void exec_viewer(const char *name, const char *page)
else if (info) else if (info)
exec_man_cmd(info, page); exec_man_cmd(info, page);
else else
warning("'%s': unknown man viewer.", name); pr_warning("'%s': unknown man viewer.", name);
} }
static int show_man_page(const char *perf_cmd) static int show_man_page(const char *perf_cmd)
......
...@@ -1715,7 +1715,7 @@ static int setup_slab_sorting(struct list_head *sort_list, const char *arg) ...@@ -1715,7 +1715,7 @@ static int setup_slab_sorting(struct list_head *sort_list, const char *arg)
if (!tok) if (!tok)
break; break;
if (slab_sort_dimension__add(tok, sort_list) < 0) { if (slab_sort_dimension__add(tok, sort_list) < 0) {
error("Unknown slab --sort key: '%s'", tok); pr_err("Unknown slab --sort key: '%s'", tok);
free(str); free(str);
return -1; return -1;
} }
...@@ -1741,7 +1741,7 @@ static int setup_page_sorting(struct list_head *sort_list, const char *arg) ...@@ -1741,7 +1741,7 @@ static int setup_page_sorting(struct list_head *sort_list, const char *arg)
if (!tok) if (!tok)
break; break;
if (page_sort_dimension__add(tok, sort_list) < 0) { if (page_sort_dimension__add(tok, sort_list) < 0) {
error("Unknown page --sort key: '%s'", tok); pr_err("Unknown page --sort key: '%s'", tok);
free(str); free(str);
return -1; return -1;
} }
......
...@@ -453,7 +453,7 @@ static int record__open(struct record *rec) ...@@ -453,7 +453,7 @@ static int record__open(struct record *rec)
} }
if (perf_evlist__apply_filters(evlist, &pos)) { if (perf_evlist__apply_filters(evlist, &pos)) {
error("failed to set filter \"%s\" on event %s with %d (%s)\n", pr_err("failed to set filter \"%s\" on event %s with %d (%s)\n",
pos->filter, perf_evsel__name(pos), errno, pos->filter, perf_evsel__name(pos), errno,
str_error_r(errno, msg, sizeof(msg))); str_error_r(errno, msg, sizeof(msg)));
rc = -1; rc = -1;
...@@ -461,7 +461,7 @@ static int record__open(struct record *rec) ...@@ -461,7 +461,7 @@ static int record__open(struct record *rec)
} }
if (perf_evlist__apply_drv_configs(evlist, &pos, &err_term)) { if (perf_evlist__apply_drv_configs(evlist, &pos, &err_term)) {
error("failed to set config \"%s\" on event %s with %d (%s)\n", pr_err("failed to set config \"%s\" on event %s with %d (%s)\n",
err_term->val.drv_cfg, perf_evsel__name(pos), errno, err_term->val.drv_cfg, perf_evsel__name(pos), errno,
str_error_r(errno, msg, sizeof(msg))); str_error_r(errno, msg, sizeof(msg)));
rc = -1; rc = -1;
......
...@@ -94,10 +94,9 @@ static int report__config(const char *var, const char *value, void *cb) ...@@ -94,10 +94,9 @@ static int report__config(const char *var, const char *value, void *cb)
symbol_conf.cumulate_callchain = perf_config_bool(var, value); symbol_conf.cumulate_callchain = perf_config_bool(var, value);
return 0; return 0;
} }
if (!strcmp(var, "report.queue-size")) { if (!strcmp(var, "report.queue-size"))
rep->queue_size = perf_config_u64(var, value); return perf_config_u64(&rep->queue_size, var, value);
return 0;
}
if (!strcmp(var, "report.sort_order")) { if (!strcmp(var, "report.sort_order")) {
default_sort_order = strdup(value); default_sort_order = strdup(value);
return 0; return 0;
...@@ -558,6 +557,7 @@ static int __cmd_report(struct report *rep) ...@@ -558,6 +557,7 @@ static int __cmd_report(struct report *rep)
ui__error("failed to set cpu bitmap\n"); ui__error("failed to set cpu bitmap\n");
return ret; return ret;
} }
session->itrace_synth_opts->cpu_bitmap = rep->cpu_bitmap;
} }
if (rep->show_threads) { if (rep->show_threads) {
......
...@@ -2066,7 +2066,7 @@ static void save_task_callchain(struct perf_sched *sched, ...@@ -2066,7 +2066,7 @@ static void save_task_callchain(struct perf_sched *sched,
if (thread__resolve_callchain(thread, cursor, evsel, sample, if (thread__resolve_callchain(thread, cursor, evsel, sample,
NULL, NULL, sched->max_stack + 2) != 0) { NULL, NULL, sched->max_stack + 2) != 0) {
if (verbose > 0) if (verbose > 0)
error("Failed to resolve callchain. Skipping\n"); pr_err("Failed to resolve callchain. Skipping\n");
return; return;
} }
......
This diff is collapsed.
...@@ -636,14 +636,14 @@ static int __run_perf_stat(int argc, const char **argv) ...@@ -636,14 +636,14 @@ static int __run_perf_stat(int argc, const char **argv)
} }
if (perf_evlist__apply_filters(evsel_list, &counter)) { if (perf_evlist__apply_filters(evsel_list, &counter)) {
error("failed to set filter \"%s\" on event %s with %d (%s)\n", pr_err("failed to set filter \"%s\" on event %s with %d (%s)\n",
counter->filter, perf_evsel__name(counter), errno, counter->filter, perf_evsel__name(counter), errno,
str_error_r(errno, msg, sizeof(msg))); str_error_r(errno, msg, sizeof(msg)));
return -1; return -1;
} }
if (perf_evlist__apply_drv_configs(evsel_list, &counter, &err_term)) { if (perf_evlist__apply_drv_configs(evsel_list, &counter, &err_term)) {
error("failed to set config \"%s\" on event %s with %d (%s)\n", pr_err("failed to set config \"%s\" on event %s with %d (%s)\n",
err_term->val.drv_cfg, perf_evsel__name(counter), errno, err_term->val.drv_cfg, perf_evsel__name(counter), errno,
str_error_r(errno, msg, sizeof(msg))); str_error_r(errno, msg, sizeof(msg)));
return -1; return -1;
......
...@@ -958,7 +958,7 @@ static int __cmd_top(struct perf_top *top) ...@@ -958,7 +958,7 @@ static int __cmd_top(struct perf_top *top)
ret = perf_evlist__apply_drv_configs(evlist, &pos, &err_term); ret = perf_evlist__apply_drv_configs(evlist, &pos, &err_term);
if (ret) { if (ret) {
error("failed to set config \"%s\" on event %s with %d (%s)\n", pr_err("failed to set config \"%s\" on event %s with %d (%s)\n",
err_term->val.drv_cfg, perf_evsel__name(pos), errno, err_term->val.drv_cfg, perf_evsel__name(pos), errno,
str_error_r(errno, msg, sizeof(msg))); str_error_r(errno, msg, sizeof(msg)));
goto out_delete; goto out_delete;
......
...@@ -304,7 +304,7 @@ jvmti_close(void *agent) ...@@ -304,7 +304,7 @@ jvmti_close(void *agent)
FILE *fp = agent; FILE *fp = agent;
if (!fp) { if (!fp) {
warnx("jvmti: incalid fd in close_agent"); warnx("jvmti: invalid fd in close_agent");
return -1; return -1;
} }
......
#!/bin/bash
#
# print Intel PT Power Events and PTWRITE. The intel_pt PMU event needs
# to be specified with appropriate config terms.
#
# All command-line arguments are forwarded unchanged to 'perf record'.
# The script refuses to run unless "intel_pt" appears somewhere in them.
#
if ! echo "$@" | grep -q intel_pt ; then
	echo "Options must include the Intel PT event e.g. -e intel_pt/pwr_evt,ptw/"
	echo "and for power events it probably needs to be system wide i.e. -a option"
	echo "For example: -a -e intel_pt/pwr_evt,branch=0/ sleep 1"
	exit 1
fi
# "$@" is quoted so that arguments containing whitespace or glob characters
# reach perf record exactly as the user typed them.
perf record "$@"
#!/bin/bash
# description: print Intel PT Power Events and PTWRITE
# Forwards all arguments to 'perf script' and runs the intel-pt-events.py
# handler found under $PERF_EXEC_PATH. "$@" is quoted so that arguments
# containing whitespace are not re-split by the shell.
perf script "$@" -s "$PERF_EXEC_PATH"/scripts/python/intel-pt-events.py
\ No newline at end of file
# intel-pt-events.py: Print Intel PT Power Events and PTWRITE
# Copyright (c) 2017, Intel Corporation.
#
# This program is free software; you can redistribute it and/or modify it
# under the terms and conditions of the GNU General Public License,
# version 2, as published by the Free Software Foundation.
#
# This program is distributed in the hope it will be useful, but WITHOUT
# ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
# FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
# more details.
import os
import sys
import struct
sys.path.append(os.environ['PERF_EXEC_PATH'] + \
'/scripts/python/Perf-Trace-Util/lib/Perf/Trace')
# These perf imports are not used at present
#from perf_trace_context import *
#from Core import *
def trace_begin():
    """Print the report banner.

    NOTE(review): presumably invoked by perf script's Python engine before
    the first event is delivered -- confirm against the perf-script-python
    documentation.
    """
    banner = "Intel PT Power Events and PTWRITE"
    print(banner)
def trace_end():
    """Print the closing "End" marker.

    NOTE(review): presumably invoked by perf script's Python engine after
    the last event -- confirm.
    """
    footer = "End"
    print(footer)
def trace_unhandled(event_name, context, event_fields_dict):
    """Print all fields of an event on one line as "key=value" pairs.

    The pairs are emitted in sorted item order and separated by single
    spaces.  event_name and context are accepted but not used.
    """
    pairs = []
    for key, value in sorted(event_fields_dict.items()):
        pairs.append('%s=%s' % (key, str(value)))
    print(' '.join(pairs))
def print_ptwrite(raw_buf):
data = struct.unpack_from("<IQ", raw_buf)
flags = data[0]
payload = data[1]
exact_ip = flags & 1
print "IP: %u payload: %#x" % (exact_ip, payload),
def print_cbr(raw_buf):
data = struct.unpack_from("<BBBBII", raw_buf)
cbr = data[0]
f = (data[4] + 500) / 1000
p = ((cbr * 1000 / data[2]) + 5) / 10
print "%3u freq: %4u MHz (%3u%%)" % (cbr, f, p),
def print_mwait(raw_buf):
data = struct.unpack_from("<IQ", raw_buf)
payload = data[1]
hints = payload & 0xff
extensions = (payload >> 32) & 0x3
print "hints: %#x extensions: %#x" % (hints, extensions),
def print_pwre(raw_buf):
data = struct.unpack_from("<IQ", raw_buf)
payload = data[1]
hw = (payload >> 7) & 1
cstate = (payload >> 12) & 0xf
subcstate = (payload >> 8) & 0xf
print "hw: %u cstate: %u sub-cstate: %u" % (hw, cstate, subcstate),
def print_exstop(raw_buf):
data = struct.unpack_from("<I", raw_buf)
flags = data[0]
exact_ip = flags & 1
print "IP: %u" % (exact_ip),
def print_pwrx(raw_buf):
data = struct.unpack_from("<IQ", raw_buf)
payload = data[1]
deepest_cstate = payload & 0xf
last_cstate = (payload >> 4) & 0xf
wake_reason = (payload >> 8) & 0xf
print "deepest cstate: %u last cstate: %u wake reason: %#x" % (deepest_cstate, last_cstate, wake_reason),
def print_common_start(comm, sample, name):
ts = sample["time"]
cpu = sample["cpu"]
pid = sample["pid"]
tid = sample["tid"]
print "%16s %5u/%-5u [%03u] %9u.%09u %7s:" % (comm, pid, tid, cpu, ts / 1000000000, ts %1000000000, name),
def print_common_ip(sample, symbol, dso):
ip = sample["ip"]
print "%16x %s (%s)" % (ip, symbol, dso)
def process_event(param_dict):
    """Print one line for each recognised Intel PT synthesized event.

    param_dict must contain "sample", "raw_buf", "comm" and "ev_name";
    "dso" and "symbol" are optional.  Events whose name is not one of
    ptwrite, cbr, mwait, pwre, exstop or pwrx are ignored.

    For a recognised event the line is made of the common leading columns,
    the event-specific decoding of raw_buf, and the ip/symbol/dso columns.
    """
    sample = param_dict["sample"]
    raw_buf = param_dict["raw_buf"]
    comm = param_dict["comm"]
    name = param_dict["ev_name"]

    # Symbol and dso info are not always resolved
    dso = param_dict.get("dso", "[unknown]")
    symbol = param_dict.get("symbol", "[unknown]")

    # Every event is printed the same way; only the raw data decoder differs.
    decoders = {
        "ptwrite": print_ptwrite,
        "cbr": print_cbr,
        "mwait": print_mwait,
        "pwre": print_pwre,
        "exstop": print_exstop,
        "pwrx": print_pwrx,
    }
    decoder = decoders.get(name)
    if decoder is None:
        return

    print_common_start(comm, sample, name)
    decoder(raw_buf)
    print_common_ip(sample, symbol, dso)
...@@ -18,6 +18,7 @@ ...@@ -18,6 +18,7 @@
* permissions. All the event text files are stored there. * permissions. All the event text files are stored there.
*/ */
#include <debug.h>
#include <errno.h> #include <errno.h>
#include <inttypes.h> #include <inttypes.h>
#include <stdlib.h> #include <stdlib.h>
...@@ -29,14 +30,11 @@ ...@@ -29,14 +30,11 @@
#include <sys/stat.h> #include <sys/stat.h>
#include <unistd.h> #include <unistd.h>
#include "../perf.h" #include "../perf.h"
#include "util.h"
#include <subcmd/exec-cmd.h> #include <subcmd/exec-cmd.h>
#include "tests.h" #include "tests.h"
#define ENV "PERF_TEST_ATTR" #define ENV "PERF_TEST_ATTR"
extern int verbose;
static char *dir; static char *dir;
void test_attr__init(void) void test_attr__init(void)
...@@ -138,8 +136,10 @@ void test_attr__open(struct perf_event_attr *attr, pid_t pid, int cpu, ...@@ -138,8 +136,10 @@ void test_attr__open(struct perf_event_attr *attr, pid_t pid, int cpu,
{ {
int errno_saved = errno; int errno_saved = errno;
if (store_event(attr, pid, cpu, fd, group_fd, flags)) if (store_event(attr, pid, cpu, fd, group_fd, flags)) {
die("test attr FAILED"); pr_err("test attr FAILED");
exit(128);
}
errno = errno_saved; errno = errno_saved;
} }
......
...@@ -16,6 +16,13 @@ class Fail(Exception): ...@@ -16,6 +16,13 @@ class Fail(Exception):
def getMsg(self): def getMsg(self):
return '\'%s\' - %s' % (self.test.path, self.msg) return '\'%s\' - %s' % (self.test.path, self.msg)
class Notest(Exception):
    """Signals that a test is skipped on the given architecture."""

    def __init__(self, test, arch):
        # test must provide a 'path' attribute; it is used by getMsg().
        self.test = test
        self.arch = arch

    def getMsg(self):
        """Return the architecture in brackets followed by the quoted test path."""
        fields = (self.arch, self.test.path)
        return '[%s] \'%s\'' % fields
class Unsup(Exception): class Unsup(Exception):
def __init__(self, test): def __init__(self, test):
self.test = test self.test = test
...@@ -112,6 +119,9 @@ class Event(dict): ...@@ -112,6 +119,9 @@ class Event(dict):
# 'command' - perf command name # 'command' - perf command name
# 'args' - special command arguments # 'args' - special command arguments
# 'ret' - expected command return value (0 by default) # 'ret' - expected command return value (0 by default)
# 'arch' - architecture specific test (optional)
# comma separated list, ! at the beginning
# negates it.
# #
# [eventX:base] # [eventX:base]
# - one or multiple instances in file # - one or multiple instances in file
...@@ -134,6 +144,12 @@ class Test(object): ...@@ -134,6 +144,12 @@ class Test(object):
except: except:
self.ret = 0 self.ret = 0
try:
self.arch = parser.get('config', 'arch')
log.warning("test limitation '%s'" % self.arch)
except:
self.arch = ''
self.expect = {} self.expect = {}
self.result = {} self.result = {}
log.debug(" loading expected events"); log.debug(" loading expected events");
...@@ -145,6 +161,31 @@ class Test(object): ...@@ -145,6 +161,31 @@ class Test(object):
else: else:
return True return True
def skip_test(self, myarch):
    """Return True when the test must not run on architecture myarch.

    self.arch is the test's optional 'arch' setting: a comma separated
    list of architectures.  An empty setting means the test always runs.
    A plain list names the only architectures the test runs on.  A list
    whose first item starts with '!' names the architectures the test is
    excluded from.

    Whitespace around the items is ignored, so "s390x, ppc" is read the
    same as "s390x,ppc".
    """
    # If architecture not set always run test
    if self.arch == '':
        return False

    # Allow multiple values in assignment separated by ','
    arch_list = [item.strip() for item in self.arch.split(',')]

    # Handle negated list such as !s390x,ppc.  startswith() is also safe
    # when the first item is empty (value beginning with a comma).
    negated = arch_list[0].startswith('!')
    if negated:
        arch_list[0] = arch_list[0][1:].strip()
        log.warning("excluded architecture list %s" % arch_list)

    listed = myarch in arch_list
    if negated:
        # Excluded architectures are skipped, all others run.
        return listed
    # Only the listed architectures run.
    return not listed
def load_events(self, path, events): def load_events(self, path, events):
parser_event = ConfigParser.SafeConfigParser() parser_event = ConfigParser.SafeConfigParser()
parser_event.read(path) parser_event.read(path)
...@@ -168,6 +209,11 @@ class Test(object): ...@@ -168,6 +209,11 @@ class Test(object):
events[section] = e events[section] = e
def run_cmd(self, tempdir): def run_cmd(self, tempdir):
junk1, junk2, junk3, junk4, myarch = (os.uname())
if self.skip_test(myarch):
raise Notest(self, myarch)
cmd = "PERF_TEST_ATTR=%s %s %s -o %s/perf.data %s" % (tempdir, cmd = "PERF_TEST_ATTR=%s %s %s -o %s/perf.data %s" % (tempdir,
self.perf, self.command, tempdir, self.args) self.perf, self.command, tempdir, self.args)
ret = os.WEXITSTATUS(os.system(cmd)) ret = os.WEXITSTATUS(os.system(cmd))
...@@ -265,6 +311,8 @@ def run_tests(options): ...@@ -265,6 +311,8 @@ def run_tests(options):
Test(f, options).run() Test(f, options).run()
except Unsup, obj: except Unsup, obj:
log.warning("unsupp %s" % obj.getMsg()) log.warning("unsupp %s" % obj.getMsg())
except Notest, obj:
log.warning("skipped %s" % obj.getMsg())
def setup_log(verbose): def setup_log(verbose):
global log global log
......
...@@ -1810,17 +1810,6 @@ static int test_pmu_events(void) ...@@ -1810,17 +1810,6 @@ static int test_pmu_events(void)
return ret; return ret;
} }
static void debug_warn(const char *warn, va_list params)
{
char msg[1024];
if (verbose <= 0)
return;
vsnprintf(msg, sizeof(msg), warn, params);
fprintf(stderr, " Warning: %s\n", msg);
}
int test__parse_events(int subtest __maybe_unused) int test__parse_events(int subtest __maybe_unused)
{ {
int ret1, ret2 = 0; int ret1, ret2 = 0;
...@@ -1832,8 +1821,6 @@ do { \ ...@@ -1832,8 +1821,6 @@ do { \
ret2 = ret1; \ ret2 = ret1; \
} while (0) } while (0)
set_warning_routine(debug_warn);
TEST_EVENTS(test__events); TEST_EVENTS(test__events);
if (test_pmu()) if (test_pmu())
......
...@@ -322,6 +322,13 @@ static int auxtrace_queues__add_event_buffer(struct auxtrace_queues *queues, ...@@ -322,6 +322,13 @@ static int auxtrace_queues__add_event_buffer(struct auxtrace_queues *queues,
return auxtrace_queues__add_buffer(queues, idx, buffer); return auxtrace_queues__add_buffer(queues, idx, buffer);
} }
/*
 * Return true when data for @cpu must be dropped, i.e. a CPU bitmap is set in
 * the session's itrace synth options, @cpu is a real CPU number (not -1) and
 * its bit is not set in that bitmap.
 */
static bool filter_cpu(struct perf_session *session, int cpu)
{
	unsigned long *mask = session->itrace_synth_opts->cpu_bitmap;

	/* No bitmap means no filtering; cpu == -1 is never filtered */
	if (!mask || cpu == -1)
		return false;

	return !test_bit(cpu, mask);
}
int auxtrace_queues__add_event(struct auxtrace_queues *queues, int auxtrace_queues__add_event(struct auxtrace_queues *queues,
struct perf_session *session, struct perf_session *session,
union perf_event *event, off_t data_offset, union perf_event *event, off_t data_offset,
...@@ -331,6 +338,9 @@ int auxtrace_queues__add_event(struct auxtrace_queues *queues, ...@@ -331,6 +338,9 @@ int auxtrace_queues__add_event(struct auxtrace_queues *queues,
unsigned int idx; unsigned int idx;
int err; int err;
if (filter_cpu(session, event->auxtrace.cpu))
return 0;
buffer = zalloc(sizeof(struct auxtrace_buffer)); buffer = zalloc(sizeof(struct auxtrace_buffer));
if (!buffer) if (!buffer)
return -ENOMEM; return -ENOMEM;
...@@ -947,6 +957,8 @@ void itrace_synth_opts__set_default(struct itrace_synth_opts *synth_opts) ...@@ -947,6 +957,8 @@ void itrace_synth_opts__set_default(struct itrace_synth_opts *synth_opts)
synth_opts->instructions = true; synth_opts->instructions = true;
synth_opts->branches = true; synth_opts->branches = true;
synth_opts->transactions = true; synth_opts->transactions = true;
synth_opts->ptwrites = true;
synth_opts->pwr_events = true;
synth_opts->errors = true; synth_opts->errors = true;
synth_opts->period_type = PERF_ITRACE_DEFAULT_PERIOD_TYPE; synth_opts->period_type = PERF_ITRACE_DEFAULT_PERIOD_TYPE;
synth_opts->period = PERF_ITRACE_DEFAULT_PERIOD; synth_opts->period = PERF_ITRACE_DEFAULT_PERIOD;
...@@ -1030,6 +1042,12 @@ int itrace_parse_synth_opts(const struct option *opt, const char *str, ...@@ -1030,6 +1042,12 @@ int itrace_parse_synth_opts(const struct option *opt, const char *str,
case 'x': case 'x':
synth_opts->transactions = true; synth_opts->transactions = true;
break; break;
case 'w':
synth_opts->ptwrites = true;
break;
case 'p':
synth_opts->pwr_events = true;
break;
case 'e': case 'e':
synth_opts->errors = true; synth_opts->errors = true;
break; break;
......
...@@ -59,6 +59,8 @@ enum itrace_period_type { ...@@ -59,6 +59,8 @@ enum itrace_period_type {
* @instructions: whether to synthesize 'instructions' events * @instructions: whether to synthesize 'instructions' events
* @branches: whether to synthesize 'branches' events * @branches: whether to synthesize 'branches' events
* @transactions: whether to synthesize events for transactions * @transactions: whether to synthesize events for transactions
* @ptwrites: whether to synthesize events for ptwrites
* @pwr_events: whether to synthesize power events
* @errors: whether to synthesize decoder error events * @errors: whether to synthesize decoder error events
* @dont_decode: whether to skip decoding entirely * @dont_decode: whether to skip decoding entirely
* @log: write a decoding log * @log: write a decoding log
...@@ -72,6 +74,7 @@ enum itrace_period_type { ...@@ -72,6 +74,7 @@ enum itrace_period_type {
* @period: 'instructions' events period * @period: 'instructions' events period
* @period_type: 'instructions' events period type * @period_type: 'instructions' events period type
* @initial_skip: skip N events at the beginning. * @initial_skip: skip N events at the beginning.
* @cpu_bitmap: CPUs for which to synthesize events, or NULL for all
*/ */
struct itrace_synth_opts { struct itrace_synth_opts {
bool set; bool set;
...@@ -79,6 +82,8 @@ struct itrace_synth_opts { ...@@ -79,6 +82,8 @@ struct itrace_synth_opts {
bool instructions; bool instructions;
bool branches; bool branches;
bool transactions; bool transactions;
bool ptwrites;
bool pwr_events;
bool errors; bool errors;
bool dont_decode; bool dont_decode;
bool log; bool log;
...@@ -92,6 +97,7 @@ struct itrace_synth_opts { ...@@ -92,6 +97,7 @@ struct itrace_synth_opts {
unsigned long long period; unsigned long long period;
enum itrace_period_type period_type; enum itrace_period_type period_type;
unsigned long initial_skip; unsigned long initial_skip;
unsigned long *cpu_bitmap;
}; };
/** /**
......
...@@ -335,32 +335,42 @@ static int perf_parse_long(const char *value, long *ret) ...@@ -335,32 +335,42 @@ static int perf_parse_long(const char *value, long *ret)
return 0; return 0;
} }
static void die_bad_config(const char *name) static void bad_config(const char *name)
{ {
if (config_file_name) if (config_file_name)
die("bad config value for '%s' in %s", name, config_file_name); pr_warning("bad config value for '%s' in %s, ignoring...\n", name, config_file_name);
die("bad config value for '%s'", name); else
pr_warning("bad config value for '%s', ignoring...\n", name);
} }
u64 perf_config_u64(const char *name, const char *value) int perf_config_u64(u64 *dest, const char *name, const char *value)
{ {
long long ret = 0; long long ret = 0;
if (!perf_parse_llong(value, &ret)) if (!perf_parse_llong(value, &ret)) {
die_bad_config(name); bad_config(name);
return (u64) ret; return -1;
}
*dest = ret;
return 0;
} }
int perf_config_int(const char *name, const char *value) int perf_config_int(int *dest, const char *name, const char *value)
{ {
long ret = 0; long ret = 0;
if (!perf_parse_long(value, &ret)) if (!perf_parse_long(value, &ret)) {
die_bad_config(name); bad_config(name);
return ret; return -1;
}
*dest = ret;
return 0;
} }
static int perf_config_bool_or_int(const char *name, const char *value, int *is_bool) static int perf_config_bool_or_int(const char *name, const char *value, int *is_bool)
{ {
int ret;
*is_bool = 1; *is_bool = 1;
if (!value) if (!value)
return 1; return 1;
...@@ -371,7 +381,7 @@ static int perf_config_bool_or_int(const char *name, const char *value, int *is_ ...@@ -371,7 +381,7 @@ static int perf_config_bool_or_int(const char *name, const char *value, int *is_
if (!strcasecmp(value, "false") || !strcasecmp(value, "no") || !strcasecmp(value, "off")) if (!strcasecmp(value, "false") || !strcasecmp(value, "no") || !strcasecmp(value, "off"))
return 0; return 0;
*is_bool = 0; *is_bool = 0;
return perf_config_int(name, value); return perf_config_int(&ret, name, value) < 0 ? -1 : ret;
} }
int perf_config_bool(const char *name, const char *value) int perf_config_bool(const char *name, const char *value)
...@@ -657,8 +667,7 @@ static int perf_config_set__init(struct perf_config_set *set) ...@@ -657,8 +667,7 @@ static int perf_config_set__init(struct perf_config_set *set)
user_config = strdup(mkpath("%s/.perfconfig", home)); user_config = strdup(mkpath("%s/.perfconfig", home));
if (user_config == NULL) { if (user_config == NULL) {
warning("Not enough memory to process %s/.perfconfig, " pr_warning("Not enough memory to process %s/.perfconfig, ignoring it.", home);
"ignoring it.", home);
goto out; goto out;
} }
...@@ -671,8 +680,7 @@ static int perf_config_set__init(struct perf_config_set *set) ...@@ -671,8 +680,7 @@ static int perf_config_set__init(struct perf_config_set *set)
ret = 0; ret = 0;
if (st.st_uid && (st.st_uid != geteuid())) { if (st.st_uid && (st.st_uid != geteuid())) {
warning("File %s not owned by current user or root, " pr_warning("File %s not owned by current user or root, ignoring it.", user_config);
"ignoring it.", user_config);
goto out_free; goto out_free;
} }
...@@ -795,7 +803,8 @@ void perf_config_set__delete(struct perf_config_set *set) ...@@ -795,7 +803,8 @@ void perf_config_set__delete(struct perf_config_set *set)
*/ */
int config_error_nonbool(const char *var) int config_error_nonbool(const char *var)
{ {
return error("Missing value for '%s'", var); pr_err("Missing value for '%s'", var);
return -1;
} }
void set_buildid_dir(const char *dir) void set_buildid_dir(const char *dir)
......
...@@ -27,8 +27,8 @@ extern const char *config_exclusive_filename; ...@@ -27,8 +27,8 @@ extern const char *config_exclusive_filename;
typedef int (*config_fn_t)(const char *, const char *, void *); typedef int (*config_fn_t)(const char *, const char *, void *);
int perf_default_config(const char *, const char *, void *); int perf_default_config(const char *, const char *, void *);
int perf_config(config_fn_t fn, void *); int perf_config(config_fn_t fn, void *);
int perf_config_int(const char *, const char *); int perf_config_int(int *dest, const char *, const char *);
u64 perf_config_u64(const char *, const char *); int perf_config_u64(u64 *dest, const char *, const char *);
int perf_config_bool(const char *, const char *); int perf_config_bool(const char *, const char *);
int config_error_nonbool(const char *); int config_error_nonbool(const char *);
const char *perf_etc_perfconfig(void); const char *perf_etc_perfconfig(void);
......
...@@ -1444,10 +1444,8 @@ static int convert__config(const char *var, const char *value, void *cb) ...@@ -1444,10 +1444,8 @@ static int convert__config(const char *var, const char *value, void *cb)
{ {
struct convert *c = cb; struct convert *c = cb;
if (!strcmp(var, "convert.queue-size")) { if (!strcmp(var, "convert.queue-size"))
c->queue_size = perf_config_u64(var, value); return perf_config_u64(&c->queue_size, var, value);
return 0;
}
return 0; return 0;
} }
......
...@@ -252,6 +252,127 @@ enum auxtrace_error_type { ...@@ -252,6 +252,127 @@ enum auxtrace_error_type {
PERF_AUXTRACE_ERROR_MAX PERF_AUXTRACE_ERROR_MAX
}; };
/*
 * Attribute type for custom synthesized events. The value INT_MAX + 1U is
 * computed in unsigned arithmetic and, per the change description, lies just
 * after the range of type values the kernel allocates for PMUs.
 */
#define PERF_TYPE_SYNTH (INT_MAX + 1U)
/*
 * Attribute config for custom synthesized events: identifies which kind of
 * synthesized event a sample with attribute type PERF_TYPE_SYNTH carries.
 * The enumerators take the implicit values 0..5 in the order listed.
 */
enum perf_synth_id {
PERF_SYNTH_INTEL_PTWRITE,
PERF_SYNTH_INTEL_MWAIT,
PERF_SYNTH_INTEL_PWRE,
PERF_SYNTH_INTEL_EXSTOP,
PERF_SYNTH_INTEL_PWRX,
PERF_SYNTH_INTEL_CBR,
};
/*
* Raw data formats for synthesized events. Note that 4 bytes of padding are
* present to match the 'size' member of PERF_SAMPLE_RAW data which is always
* 8-byte aligned. That means we must dereference raw_data with an offset of 4.
* Refer perf_sample__synth_ptr() and perf_synth__raw_data(). It also means the
* structure sizes are 4 bytes bigger than the raw_size, refer
* perf_synth__raw_size().
*/
/*
 * Raw data layout of a synthesized ptwrite event. The leading 'padding' word
 * is not part of the raw data itself, so the raw size is 4 bytes smaller than
 * this structure.
 */
struct perf_synth_intel_ptwrite {
u32 padding;
/* The 32 flag bits, accessible as bit-fields or as the whole 'flags' word */
union {
struct {
u32 ip : 1,
reserved : 31;
};
u32 flags;
};
/* 64-bit payload value */
u64 payload;
};
/*
 * Raw data layout of a synthesized mwait event. The leading 'padding' word is
 * not part of the raw data itself, so the raw size is 4 bytes smaller than
 * this structure.
 */
struct perf_synth_intel_mwait {
u32 padding;
u32 reserved;
/* The 64 payload bits, accessible as bit-fields or as the whole 'payload' */
union {
struct {
u64 hints : 8,
reserved1 : 24,
extensions : 2,
reserved2 : 30;
};
u64 payload;
};
};
/*
 * Raw data layout of a synthesized pwre event. The leading 'padding' word is
 * not part of the raw data itself, so the raw size is 4 bytes smaller than
 * this structure.
 */
struct perf_synth_intel_pwre {
u32 padding;
u32 reserved;
/* The 64 payload bits, accessible as bit-fields or as the whole 'payload' */
union {
struct {
u64 reserved1 : 7,
hw : 1,
subcstate : 4,
cstate : 4,
reserved2 : 48;
};
u64 payload;
};
};
/*
 * Raw data layout of a synthesized exstop event. The leading 'padding' word
 * is not part of the raw data itself, so the raw size is 4 bytes smaller than
 * this structure.
 */
struct perf_synth_intel_exstop {
u32 padding;
/* The 32 flag bits, accessible as bit-fields or as the whole 'flags' word */
union {
struct {
u32 ip : 1,
reserved : 31;
};
u32 flags;
};
};
/*
 * Raw data layout of a synthesized pwrx event. The leading 'padding' word is
 * not part of the raw data itself, so the raw size is 4 bytes smaller than
 * this structure.
 */
struct perf_synth_intel_pwrx {
u32 padding;
u32 reserved;
/* The 64 payload bits, accessible as bit-fields or as the whole 'payload' */
union {
struct {
u64 deepest_cstate : 4,
last_cstate : 4,
wake_reason : 4,
reserved1 : 52;
};
u64 payload;
};
};
/*
 * Raw data layout of a synthesized cbr event. The leading 'padding' word is
 * not part of the raw data itself, so the raw size is 4 bytes smaller than
 * this structure.
 */
struct perf_synth_intel_cbr {
u32 padding;
/* The 32 flag bits, accessible as bit-fields or as the whole 'flags' word */
union {
struct {
u32 cbr : 8,
reserved1 : 8,
max_nonturbo : 8,
reserved2 : 8;
};
u32 flags;
};
/* NOTE(review): units of freq are not stated here - confirm at the producer */
u32 freq;
u32 reserved3;
};
/*
 * Return a pointer to the synthesized event structure that contains the
 * sample's raw data. raw_data is always 4 bytes past an 8-byte boundary, so
 * stepping back 4 bytes yields an 8-byte aligned address, which is where the
 * structure's leading padding word sits.
 */
static inline void *perf_sample__synth_ptr(struct perf_sample *sample)
{
	void *raw = sample->raw_data;

	return raw - 4;
}
/*
 * Return the address 4 bytes past @p, i.e. the start of the raw data when @p
 * points at a synthesized event structure with its leading padding word.
 */
static inline void *perf_synth__raw_data(void *p)
{
	char *bytes = p;

	return bytes + 4;
}
/* Raw data size for synthesized event structure d: its size less the 4 padding bytes */
#define perf_synth__raw_size(d) (sizeof(d) - 4)

/* True when sample s holds fewer raw bytes than synthesized event structure d needs */
#define perf_sample__bad_synth_size(s, d) ((s)->raw_size < perf_synth__raw_size(d))
/* /*
* The kernel collects the number of events it couldn't send in a stretch and * The kernel collects the number of events it couldn't send in a stretch and
* when possible sends this number in a PERF_RECORD_LOST event. The number of * when possible sends this number in a PERF_RECORD_LOST event. The number of
......
...@@ -12,7 +12,7 @@ static int perf_unknown_cmd_config(const char *var, const char *value, ...@@ -12,7 +12,7 @@ static int perf_unknown_cmd_config(const char *var, const char *value,
void *cb __maybe_unused) void *cb __maybe_unused)
{ {
if (!strcmp(var, "help.autocorrect")) if (!strcmp(var, "help.autocorrect"))
autocorrect = perf_config_int(var,value); return perf_config_int(&autocorrect, var,value);
return 0; return 0;
} }
......
...@@ -711,6 +711,12 @@ static int intel_pt_calc_cyc_cb(struct intel_pt_pkt_info *pkt_info) ...@@ -711,6 +711,12 @@ static int intel_pt_calc_cyc_cb(struct intel_pt_pkt_info *pkt_info)
break; break;
case INTEL_PT_TSC: case INTEL_PT_TSC:
/*
* For now, do not support using TSC packets - refer
* intel_pt_calc_cyc_to_tsc().
*/
if (data->from_mtc)
return 1;
timestamp = pkt_info->packet.payload | timestamp = pkt_info->packet.payload |
(data->timestamp & (0xffULL << 56)); (data->timestamp & (0xffULL << 56));
if (data->from_mtc && timestamp < data->timestamp && if (data->from_mtc && timestamp < data->timestamp &&
...@@ -828,6 +834,14 @@ static void intel_pt_calc_cyc_to_tsc(struct intel_pt_decoder *decoder, ...@@ -828,6 +834,14 @@ static void intel_pt_calc_cyc_to_tsc(struct intel_pt_decoder *decoder,
.cbr_cyc_to_tsc = 0, .cbr_cyc_to_tsc = 0,
}; };
/*
* For now, do not support using TSC packets for at least the reasons:
* 1) timing might have stopped
* 2) TSC packets within PSB+ can slip against CYC packets
*/
if (!from_mtc)
return;
intel_pt_pkt_lookahead(decoder, intel_pt_calc_cyc_cb, &data); intel_pt_pkt_lookahead(decoder, intel_pt_calc_cyc_cb, &data);
} }
......
...@@ -1009,7 +1009,7 @@ GrpTable: Grp15 ...@@ -1009,7 +1009,7 @@ GrpTable: Grp15
1: fxstor | RDGSBASE Ry (F3),(11B) 1: fxstor | RDGSBASE Ry (F3),(11B)
2: vldmxcsr Md (v1) | WRFSBASE Ry (F3),(11B) 2: vldmxcsr Md (v1) | WRFSBASE Ry (F3),(11B)
3: vstmxcsr Md (v1) | WRGSBASE Ry (F3),(11B) 3: vstmxcsr Md (v1) | WRGSBASE Ry (F3),(11B)
4: XSAVE 4: XSAVE | ptwrite Ey (F3),(11B)
5: XRSTOR | lfence (11B) 5: XRSTOR | lfence (11B)
6: XSAVEOPT | clwb (66) | mfence (11B) 6: XSAVEOPT | clwb (66) | mfence (11B)
7: clflush | clflushopt (66) | sfence (11B) 7: clflush | clflushopt (66) | sfence (11B)
......
This diff is collapsed.
...@@ -2532,12 +2532,12 @@ static int setup_sort_list(struct perf_hpp_list *list, char *str, ...@@ -2532,12 +2532,12 @@ static int setup_sort_list(struct perf_hpp_list *list, char *str,
ret = sort_dimension__add(list, tok, evlist, level); ret = sort_dimension__add(list, tok, evlist, level);
if (ret == -EINVAL) { if (ret == -EINVAL) {
if (!cacheline_size && !strncasecmp(tok, "dcacheline", strlen(tok))) if (!cacheline_size && !strncasecmp(tok, "dcacheline", strlen(tok)))
error("The \"dcacheline\" --sort key needs to know the cacheline size and it couldn't be determined on this system"); pr_err("The \"dcacheline\" --sort key needs to know the cacheline size and it couldn't be determined on this system");
else else
error("Invalid --sort key: `%s'", tok); pr_err("Invalid --sort key: `%s'", tok);
break; break;
} else if (ret == -ESRCH) { } else if (ret == -ESRCH) {
error("Unknown --sort key: `%s'", tok); pr_err("Unknown --sort key: `%s'", tok);
break; break;
} }
} }
...@@ -2594,7 +2594,7 @@ static int setup_sort_order(struct perf_evlist *evlist) ...@@ -2594,7 +2594,7 @@ static int setup_sort_order(struct perf_evlist *evlist)
return 0; return 0;
if (sort_order[1] == '\0') { if (sort_order[1] == '\0') {
error("Invalid --sort key: `+'"); pr_err("Invalid --sort key: `+'");
return -EINVAL; return -EINVAL;
} }
...@@ -2604,7 +2604,7 @@ static int setup_sort_order(struct perf_evlist *evlist) ...@@ -2604,7 +2604,7 @@ static int setup_sort_order(struct perf_evlist *evlist)
*/ */
if (asprintf(&new_sort_order, "%s,%s", if (asprintf(&new_sort_order, "%s,%s",
get_default_sort_order(evlist), sort_order + 1) < 0) { get_default_sort_order(evlist), sort_order + 1) < 0) {
error("Not enough memory to set up --sort"); pr_err("Not enough memory to set up --sort");
return -ENOMEM; return -ENOMEM;
} }
...@@ -2668,7 +2668,7 @@ static int __setup_sorting(struct perf_evlist *evlist) ...@@ -2668,7 +2668,7 @@ static int __setup_sorting(struct perf_evlist *evlist)
str = strdup(sort_keys); str = strdup(sort_keys);
if (str == NULL) { if (str == NULL) {
error("Not enough memory to setup sort keys"); pr_err("Not enough memory to setup sort keys");
return -ENOMEM; return -ENOMEM;
} }
...@@ -2678,7 +2678,7 @@ static int __setup_sorting(struct perf_evlist *evlist) ...@@ -2678,7 +2678,7 @@ static int __setup_sorting(struct perf_evlist *evlist)
if (!is_strict_order(field_order)) { if (!is_strict_order(field_order)) {
str = setup_overhead(str); str = setup_overhead(str);
if (str == NULL) { if (str == NULL) {
error("Not enough memory to setup overhead keys"); pr_err("Not enough memory to setup overhead keys");
return -ENOMEM; return -ENOMEM;
} }
} }
...@@ -2834,10 +2834,10 @@ static int setup_output_list(struct perf_hpp_list *list, char *str) ...@@ -2834,10 +2834,10 @@ static int setup_output_list(struct perf_hpp_list *list, char *str)
tok; tok = strtok_r(NULL, ", ", &tmp)) { tok; tok = strtok_r(NULL, ", ", &tmp)) {
ret = output_field_add(list, tok); ret = output_field_add(list, tok);
if (ret == -EINVAL) { if (ret == -EINVAL) {
error("Invalid --fields key: `%s'", tok); pr_err("Invalid --fields key: `%s'", tok);
break; break;
} else if (ret == -ESRCH) { } else if (ret == -ESRCH) {
error("Unknown --fields key: `%s'", tok); pr_err("Unknown --fields key: `%s'", tok);
break; break;
} }
} }
...@@ -2877,7 +2877,7 @@ static int __setup_output_field(void) ...@@ -2877,7 +2877,7 @@ static int __setup_output_field(void)
strp = str = strdup(field_order); strp = str = strdup(field_order);
if (str == NULL) { if (str == NULL) {
error("Not enough memory to setup output fields"); pr_err("Not enough memory to setup output fields");
return -ENOMEM; return -ENOMEM;
} }
...@@ -2885,7 +2885,7 @@ static int __setup_output_field(void) ...@@ -2885,7 +2885,7 @@ static int __setup_output_field(void)
strp++; strp++;
if (!strlen(strp)) { if (!strlen(strp)) {
error("Invalid --fields key: `+'"); pr_err("Invalid --fields key: `+'");
goto out; goto out;
} }
......
...@@ -24,7 +24,7 @@ ...@@ -24,7 +24,7 @@
#include <errno.h> #include <errno.h>
#include "../perf.h" #include "../perf.h"
#include "util.h" #include "debug.h"
#include "trace-event.h" #include "trace-event.h"
#include "sane_ctype.h" #include "sane_ctype.h"
...@@ -150,7 +150,7 @@ void parse_ftrace_printk(struct pevent *pevent, ...@@ -150,7 +150,7 @@ void parse_ftrace_printk(struct pevent *pevent,
while (line) { while (line) {
addr_str = strtok_r(line, ":", &fmt); addr_str = strtok_r(line, ":", &fmt);
if (!addr_str) { if (!addr_str) {
warning("printk format with empty entry"); pr_warning("printk format with empty entry");
break; break;
} }
addr = strtoull(addr_str, NULL, 16); addr = strtoull(addr_str, NULL, 16);
......
...@@ -9,75 +9,17 @@ ...@@ -9,75 +9,17 @@
#include "util.h" #include "util.h"
#include "debug.h" #include "debug.h"
static void report(const char *prefix, const char *err, va_list params)
{
char msg[1024];
vsnprintf(msg, sizeof(msg), err, params);
fprintf(stderr, " %s%s\n", prefix, msg);
}
static __noreturn void usage_builtin(const char *err) static __noreturn void usage_builtin(const char *err)
{ {
fprintf(stderr, "\n Usage: %s\n", err); fprintf(stderr, "\n Usage: %s\n", err);
exit(129); exit(129);
} }
static __noreturn void die_builtin(const char *err, va_list params)
{
report(" Fatal: ", err, params);
exit(128);
}
static void error_builtin(const char *err, va_list params)
{
report(" Error: ", err, params);
}
static void warn_builtin(const char *warn, va_list params)
{
report(" Warning: ", warn, params);
}
/* If we are in a dlopen()ed .so write to a global variable would segfault /* If we are in a dlopen()ed .so write to a global variable would segfault
* (ugh), so keep things static. */ * (ugh), so keep things static. */
static void (*usage_routine)(const char *err) __noreturn = usage_builtin; static void (*usage_routine)(const char *err) __noreturn = usage_builtin;
static void (*error_routine)(const char *err, va_list params) = error_builtin;
static void (*warn_routine)(const char *err, va_list params) = warn_builtin;
void set_warning_routine(void (*routine)(const char *err, va_list params))
{
warn_routine = routine;
}
void usage(const char *err) void usage(const char *err)
{ {
usage_routine(err); usage_routine(err);
} }
void die(const char *err, ...)
{
va_list params;
va_start(params, err);
die_builtin(err, params);
va_end(params);
}
int error(const char *err, ...)
{
va_list params;
va_start(params, err);
error_routine(err, params);
va_end(params);
return -1;
}
void warning(const char *warn, ...)
{
va_list params;
va_start(params, warn);
warn_routine(warn, params);
va_end(params);
}
...@@ -16,10 +16,6 @@ ...@@ -16,10 +16,6 @@
/* General helper functions */ /* General helper functions */
void usage(const char *err) __noreturn; void usage(const char *err) __noreturn;
void die(const char *err, ...) __noreturn __printf(1, 2); void die(const char *err, ...) __noreturn __printf(1, 2);
int error(const char *err, ...) __printf(1, 2);
void warning(const char *err, ...) __printf(1, 2);
void set_warning_routine(void (*routine)(const char *err, va_list params));
static inline void *zalloc(size_t size) static inline void *zalloc(size_t size)
{ {
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment