Commit 89c683cd authored by Linus Torvalds's avatar Linus Torvalds

Merge branch 'perf-urgent-for-linus' of git://git.kernel.org/pub/scm/linux/kernel/git/tip/tip

Pull perf tooling fixes from Ingo Molnar:
 "These are all perf tooling changes: most of them are fixes.

  Note that the large CPU count related fixes go beyond regression
  fixes, but the IPI-flood symptoms are severe enough that I think
  justifies their inclusion"

* 'perf-urgent-for-linus' of git://git.kernel.org/pub/scm/linux/kernel/git/tip/tip: (38 commits)
  perf vendor events s390: Remove name from L1D_RO_EXCL_WRITES description
  perf vendor events s390: Fix counter long description for DTLB1_GPAGE_WRITES
  libtraceevent: Allow custom libdir path
  perf header: Fix false warning when there are no duplicate cache entries
  perf metricgroup: Fix printing event names of metric group with multiple events
  perf/x86/pmu-events: Fix Kernel_Utilization metric
  perf top: Do not bail out when perf_env__read_cpuid() returns ENOSYS
  perf arch: Make the default get_cpuid() return compatible error
  tools headers kvm: Sync linux/kvm.h with the kernel sources
  tools headers UAPI: Update tools's copy of drm.h headers
  tools headers UAPI: Sync drm/i915_drm.h with the kernel sources
  perf inject: Fix processing of ID index for injected instruction tracing
  perf report: Bail out --mem-mode if mem info is not available
  perf report: Make -F more strict like -s
  perf report/top TUI: Replace pr_err() with ui__error()
  libtraceevent: Copy pkg-config file to output folder when using O=
  libtraceevent: Fix lib installation with O=
  perf kvm: Clarify the 'perf kvm' -i and -o command line options
  tools arch x86: Sync asm/cpufeatures.h with the kernel sources
  perf beauty: Add CLEAR_SIGHAND support for clone's flags arg
  ...
parents 9e8a0d5f 57e04eed
...@@ -131,8 +131,9 @@ struct kvm_vcpu_events { ...@@ -131,8 +131,9 @@ struct kvm_vcpu_events {
struct { struct {
__u8 serror_pending; __u8 serror_pending;
__u8 serror_has_esr; __u8 serror_has_esr;
__u8 ext_dabt_pending;
/* Align it to 8 bytes */ /* Align it to 8 bytes */
__u8 pad[6]; __u8 pad[5];
__u64 serror_esr; __u64 serror_esr;
} exception; } exception;
__u32 reserved[12]; __u32 reserved[12];
......
...@@ -164,8 +164,9 @@ struct kvm_vcpu_events { ...@@ -164,8 +164,9 @@ struct kvm_vcpu_events {
struct { struct {
__u8 serror_pending; __u8 serror_pending;
__u8 serror_has_esr; __u8 serror_has_esr;
__u8 ext_dabt_pending;
/* Align it to 8 bytes */ /* Align it to 8 bytes */
__u8 pad[6]; __u8 pad[5];
__u64 serror_esr; __u64 serror_esr;
} exception; } exception;
__u32 reserved[12]; __u32 reserved[12];
...@@ -323,6 +324,8 @@ struct kvm_vcpu_events { ...@@ -323,6 +324,8 @@ struct kvm_vcpu_events {
#define KVM_ARM_VCPU_TIMER_CTRL 1 #define KVM_ARM_VCPU_TIMER_CTRL 1
#define KVM_ARM_VCPU_TIMER_IRQ_VTIMER 0 #define KVM_ARM_VCPU_TIMER_IRQ_VTIMER 0
#define KVM_ARM_VCPU_TIMER_IRQ_PTIMER 1 #define KVM_ARM_VCPU_TIMER_IRQ_PTIMER 1
#define KVM_ARM_VCPU_PVTIME_CTRL 2
#define KVM_ARM_VCPU_PVTIME_IPA 0
/* KVM_IRQ_LINE irq field index values */ /* KVM_IRQ_LINE irq field index values */
#define KVM_ARM_IRQ_VCPU2_SHIFT 28 #define KVM_ARM_IRQ_VCPU2_SHIFT 28
......
...@@ -667,6 +667,8 @@ struct kvm_ppc_cpu_char { ...@@ -667,6 +667,8 @@ struct kvm_ppc_cpu_char {
/* PPC64 eXternal Interrupt Controller Specification */ /* PPC64 eXternal Interrupt Controller Specification */
#define KVM_DEV_XICS_GRP_SOURCES 1 /* 64-bit source attributes */ #define KVM_DEV_XICS_GRP_SOURCES 1 /* 64-bit source attributes */
#define KVM_DEV_XICS_GRP_CTRL 2
#define KVM_DEV_XICS_NR_SERVERS 1
/* Layout of 64-bit source attribute values */ /* Layout of 64-bit source attribute values */
#define KVM_XICS_DESTINATION_SHIFT 0 #define KVM_XICS_DESTINATION_SHIFT 0
...@@ -683,6 +685,7 @@ struct kvm_ppc_cpu_char { ...@@ -683,6 +685,7 @@ struct kvm_ppc_cpu_char {
#define KVM_DEV_XIVE_GRP_CTRL 1 #define KVM_DEV_XIVE_GRP_CTRL 1
#define KVM_DEV_XIVE_RESET 1 #define KVM_DEV_XIVE_RESET 1
#define KVM_DEV_XIVE_EQ_SYNC 2 #define KVM_DEV_XIVE_EQ_SYNC 2
#define KVM_DEV_XIVE_NR_SERVERS 3
#define KVM_DEV_XIVE_GRP_SOURCE 2 /* 64-bit source identifier */ #define KVM_DEV_XIVE_GRP_SOURCE 2 /* 64-bit source identifier */
#define KVM_DEV_XIVE_GRP_SOURCE_CONFIG 3 /* 64-bit source identifier */ #define KVM_DEV_XIVE_GRP_SOURCE_CONFIG 3 /* 64-bit source identifier */
#define KVM_DEV_XIVE_GRP_EQ_CONFIG 4 /* 64-bit EQ identifier */ #define KVM_DEV_XIVE_GRP_EQ_CONFIG 4 /* 64-bit EQ identifier */
......
...@@ -292,6 +292,7 @@ ...@@ -292,6 +292,7 @@
#define X86_FEATURE_CLZERO (13*32+ 0) /* CLZERO instruction */ #define X86_FEATURE_CLZERO (13*32+ 0) /* CLZERO instruction */
#define X86_FEATURE_IRPERF (13*32+ 1) /* Instructions Retired Count */ #define X86_FEATURE_IRPERF (13*32+ 1) /* Instructions Retired Count */
#define X86_FEATURE_XSAVEERPTR (13*32+ 2) /* Always save/restore FP error pointers */ #define X86_FEATURE_XSAVEERPTR (13*32+ 2) /* Always save/restore FP error pointers */
#define X86_FEATURE_RDPRU (13*32+ 4) /* Read processor register at user level */
#define X86_FEATURE_WBNOINVD (13*32+ 9) /* WBNOINVD instruction */ #define X86_FEATURE_WBNOINVD (13*32+ 9) /* WBNOINVD instruction */
#define X86_FEATURE_AMD_IBPB (13*32+12) /* "" Indirect Branch Prediction Barrier */ #define X86_FEATURE_AMD_IBPB (13*32+12) /* "" Indirect Branch Prediction Barrier */
#define X86_FEATURE_AMD_IBRS (13*32+14) /* "" Indirect Branch Restricted Speculation */ #define X86_FEATURE_AMD_IBRS (13*32+14) /* "" Indirect Branch Restricted Speculation */
...@@ -399,5 +400,7 @@ ...@@ -399,5 +400,7 @@
#define X86_BUG_MDS X86_BUG(19) /* CPU is affected by Microarchitectural data sampling */ #define X86_BUG_MDS X86_BUG(19) /* CPU is affected by Microarchitectural data sampling */
#define X86_BUG_MSBDS_ONLY X86_BUG(20) /* CPU is only affected by the MSDBS variant of BUG_MDS */ #define X86_BUG_MSBDS_ONLY X86_BUG(20) /* CPU is only affected by the MSDBS variant of BUG_MDS */
#define X86_BUG_SWAPGS X86_BUG(21) /* CPU is affected by speculation through SWAPGS */ #define X86_BUG_SWAPGS X86_BUG(21) /* CPU is affected by speculation through SWAPGS */
#define X86_BUG_TAA X86_BUG(22) /* CPU is affected by TSX Async Abort(TAA) */
#define X86_BUG_ITLB_MULTIHIT X86_BUG(23) /* CPU may incur MCE during certain page attribute changes */
#endif /* _ASM_X86_CPUFEATURES_H */ #endif /* _ASM_X86_CPUFEATURES_H */
...@@ -93,6 +93,18 @@ ...@@ -93,6 +93,18 @@
* Microarchitectural Data * Microarchitectural Data
* Sampling (MDS) vulnerabilities. * Sampling (MDS) vulnerabilities.
*/ */
#define ARCH_CAP_PSCHANGE_MC_NO BIT(6) /*
* The processor is not susceptible to a
* machine check error due to modifying the
* code page size along with either the
* physical address or cache type
* without TLB invalidation.
*/
#define ARCH_CAP_TSX_CTRL_MSR BIT(7) /* MSR for TSX control is available. */
#define ARCH_CAP_TAA_NO BIT(8) /*
* Not susceptible to
* TSX Async Abort (TAA) vulnerabilities.
*/
#define MSR_IA32_FLUSH_CMD 0x0000010b #define MSR_IA32_FLUSH_CMD 0x0000010b
#define L1D_FLUSH BIT(0) /* #define L1D_FLUSH BIT(0) /*
...@@ -103,6 +115,10 @@ ...@@ -103,6 +115,10 @@
#define MSR_IA32_BBL_CR_CTL 0x00000119 #define MSR_IA32_BBL_CR_CTL 0x00000119
#define MSR_IA32_BBL_CR_CTL3 0x0000011e #define MSR_IA32_BBL_CR_CTL3 0x0000011e
#define MSR_IA32_TSX_CTRL 0x00000122
#define TSX_CTRL_RTM_DISABLE BIT(0) /* Disable RTM feature */
#define TSX_CTRL_CPUID_CLEAR BIT(1) /* Disable TSX enumeration */
#define MSR_IA32_SYSENTER_CS 0x00000174 #define MSR_IA32_SYSENTER_CS 0x00000174
#define MSR_IA32_SYSENTER_ESP 0x00000175 #define MSR_IA32_SYSENTER_ESP 0x00000175
#define MSR_IA32_SYSENTER_EIP 0x00000176 #define MSR_IA32_SYSENTER_EIP 0x00000176
...@@ -393,6 +409,8 @@ ...@@ -393,6 +409,8 @@
#define MSR_AMD_PSTATE_DEF_BASE 0xc0010064 #define MSR_AMD_PSTATE_DEF_BASE 0xc0010064
#define MSR_AMD64_OSVW_ID_LENGTH 0xc0010140 #define MSR_AMD64_OSVW_ID_LENGTH 0xc0010140
#define MSR_AMD64_OSVW_STATUS 0xc0010141 #define MSR_AMD64_OSVW_STATUS 0xc0010141
#define MSR_AMD_PPIN_CTL 0xc00102f0
#define MSR_AMD_PPIN 0xc00102f1
#define MSR_AMD64_LS_CFG 0xc0011020 #define MSR_AMD64_LS_CFG 0xc0011020
#define MSR_AMD64_DC_CFG 0xc0011022 #define MSR_AMD64_DC_CFG 0xc0011022
#define MSR_AMD64_BU_CFG2 0xc001102a #define MSR_AMD64_BU_CFG2 0xc001102a
......
...@@ -28,8 +28,8 @@ ...@@ -28,8 +28,8 @@
* Output: * Output:
* rax original destination * rax original destination
*/ */
ENTRY(__memcpy) SYM_FUNC_START_ALIAS(__memcpy)
ENTRY(memcpy) SYM_FUNC_START_LOCAL(memcpy)
ALTERNATIVE_2 "jmp memcpy_orig", "", X86_FEATURE_REP_GOOD, \ ALTERNATIVE_2 "jmp memcpy_orig", "", X86_FEATURE_REP_GOOD, \
"jmp memcpy_erms", X86_FEATURE_ERMS "jmp memcpy_erms", X86_FEATURE_ERMS
...@@ -41,8 +41,8 @@ ENTRY(memcpy) ...@@ -41,8 +41,8 @@ ENTRY(memcpy)
movl %edx, %ecx movl %edx, %ecx
rep movsb rep movsb
ret ret
ENDPROC(memcpy) SYM_FUNC_END(memcpy)
ENDPROC(__memcpy) SYM_FUNC_END_ALIAS(__memcpy)
EXPORT_SYMBOL(memcpy) EXPORT_SYMBOL(memcpy)
EXPORT_SYMBOL(__memcpy) EXPORT_SYMBOL(__memcpy)
...@@ -50,14 +50,14 @@ EXPORT_SYMBOL(__memcpy) ...@@ -50,14 +50,14 @@ EXPORT_SYMBOL(__memcpy)
* memcpy_erms() - enhanced fast string memcpy. This is faster and * memcpy_erms() - enhanced fast string memcpy. This is faster and
* simpler than memcpy. Use memcpy_erms when possible. * simpler than memcpy. Use memcpy_erms when possible.
*/ */
ENTRY(memcpy_erms) SYM_FUNC_START(memcpy_erms)
movq %rdi, %rax movq %rdi, %rax
movq %rdx, %rcx movq %rdx, %rcx
rep movsb rep movsb
ret ret
ENDPROC(memcpy_erms) SYM_FUNC_END(memcpy_erms)
ENTRY(memcpy_orig) SYM_FUNC_START(memcpy_orig)
movq %rdi, %rax movq %rdi, %rax
cmpq $0x20, %rdx cmpq $0x20, %rdx
...@@ -182,7 +182,7 @@ ENTRY(memcpy_orig) ...@@ -182,7 +182,7 @@ ENTRY(memcpy_orig)
.Lend: .Lend:
retq retq
ENDPROC(memcpy_orig) SYM_FUNC_END(memcpy_orig)
#ifndef CONFIG_UML #ifndef CONFIG_UML
...@@ -193,7 +193,7 @@ MCSAFE_TEST_CTL ...@@ -193,7 +193,7 @@ MCSAFE_TEST_CTL
* Note that we only catch machine checks when reading the source addresses. * Note that we only catch machine checks when reading the source addresses.
* Writes to target are posted and don't generate machine checks. * Writes to target are posted and don't generate machine checks.
*/ */
ENTRY(__memcpy_mcsafe) SYM_FUNC_START(__memcpy_mcsafe)
cmpl $8, %edx cmpl $8, %edx
/* Less than 8 bytes? Go to byte copy loop */ /* Less than 8 bytes? Go to byte copy loop */
jb .L_no_whole_words jb .L_no_whole_words
...@@ -260,7 +260,7 @@ ENTRY(__memcpy_mcsafe) ...@@ -260,7 +260,7 @@ ENTRY(__memcpy_mcsafe)
xorl %eax, %eax xorl %eax, %eax
.L_done: .L_done:
ret ret
ENDPROC(__memcpy_mcsafe) SYM_FUNC_END(__memcpy_mcsafe)
EXPORT_SYMBOL_GPL(__memcpy_mcsafe) EXPORT_SYMBOL_GPL(__memcpy_mcsafe)
.section .fixup, "ax" .section .fixup, "ax"
......
...@@ -18,8 +18,8 @@ ...@@ -18,8 +18,8 @@
* *
* rax original destination * rax original destination
*/ */
ENTRY(memset) SYM_FUNC_START_ALIAS(memset)
ENTRY(__memset) SYM_FUNC_START(__memset)
/* /*
* Some CPUs support enhanced REP MOVSB/STOSB feature. It is recommended * Some CPUs support enhanced REP MOVSB/STOSB feature. It is recommended
* to use it when possible. If not available, use fast string instructions. * to use it when possible. If not available, use fast string instructions.
...@@ -42,8 +42,8 @@ ENTRY(__memset) ...@@ -42,8 +42,8 @@ ENTRY(__memset)
rep stosb rep stosb
movq %r9,%rax movq %r9,%rax
ret ret
ENDPROC(memset) SYM_FUNC_END(__memset)
ENDPROC(__memset) SYM_FUNC_END_ALIAS(memset)
/* /*
* ISO C memset - set a memory block to a byte value. This function uses * ISO C memset - set a memory block to a byte value. This function uses
...@@ -56,16 +56,16 @@ ENDPROC(__memset) ...@@ -56,16 +56,16 @@ ENDPROC(__memset)
* *
* rax original destination * rax original destination
*/ */
ENTRY(memset_erms) SYM_FUNC_START(memset_erms)
movq %rdi,%r9 movq %rdi,%r9
movb %sil,%al movb %sil,%al
movq %rdx,%rcx movq %rdx,%rcx
rep stosb rep stosb
movq %r9,%rax movq %r9,%rax
ret ret
ENDPROC(memset_erms) SYM_FUNC_END(memset_erms)
ENTRY(memset_orig) SYM_FUNC_START(memset_orig)
movq %rdi,%r10 movq %rdi,%r10
/* expand byte value */ /* expand byte value */
...@@ -136,4 +136,4 @@ ENTRY(memset_orig) ...@@ -136,4 +136,4 @@ ENTRY(memset_orig)
subq %r8,%rdx subq %r8,%rdx
jmp .Lafter_bad_alignment jmp .Lafter_bad_alignment
.Lfinal: .Lfinal:
ENDPROC(memset_orig) SYM_FUNC_END(memset_orig)
...@@ -778,11 +778,12 @@ struct drm_syncobj_array { ...@@ -778,11 +778,12 @@ struct drm_syncobj_array {
__u32 pad; __u32 pad;
}; };
#define DRM_SYNCOBJ_QUERY_FLAGS_LAST_SUBMITTED (1 << 0) /* last available point on timeline syncobj */
struct drm_syncobj_timeline_array { struct drm_syncobj_timeline_array {
__u64 handles; __u64 handles;
__u64 points; __u64 points;
__u32 count_handles; __u32 count_handles;
__u32 pad; __u32 flags;
}; };
......
...@@ -611,6 +611,13 @@ typedef struct drm_i915_irq_wait { ...@@ -611,6 +611,13 @@ typedef struct drm_i915_irq_wait {
* See I915_EXEC_FENCE_OUT and I915_EXEC_FENCE_SUBMIT. * See I915_EXEC_FENCE_OUT and I915_EXEC_FENCE_SUBMIT.
*/ */
#define I915_PARAM_HAS_EXEC_SUBMIT_FENCE 53 #define I915_PARAM_HAS_EXEC_SUBMIT_FENCE 53
/*
* Revision of the i915-perf uAPI. The value returned helps determine what
* i915-perf features are available. See drm_i915_perf_property_id.
*/
#define I915_PARAM_PERF_REVISION 54
/* Must be kept compact -- no holes and well documented */ /* Must be kept compact -- no holes and well documented */
typedef struct drm_i915_getparam { typedef struct drm_i915_getparam {
...@@ -1565,6 +1572,21 @@ struct drm_i915_gem_context_param { ...@@ -1565,6 +1572,21 @@ struct drm_i915_gem_context_param {
* i915_context_engines_bond (I915_CONTEXT_ENGINES_EXT_BOND) * i915_context_engines_bond (I915_CONTEXT_ENGINES_EXT_BOND)
*/ */
#define I915_CONTEXT_PARAM_ENGINES 0xa #define I915_CONTEXT_PARAM_ENGINES 0xa
/*
* I915_CONTEXT_PARAM_PERSISTENCE:
*
* Allow the context and active rendering to survive the process until
* completion. Persistence allows fire-and-forget clients to queue up a
* bunch of work, hand the output over to a display server and then quit.
* If the context is marked as not persistent, upon closing (either via
* an explicit DRM_I915_GEM_CONTEXT_DESTROY or implicitly from file closure
* or process termination), the context and any outstanding requests will be
* cancelled (and exported fences for cancelled requests marked as -EIO).
*
* By default, new contexts allow persistence.
*/
#define I915_CONTEXT_PARAM_PERSISTENCE 0xb
/* Must be kept compact -- no holes and well documented */ /* Must be kept compact -- no holes and well documented */
__u64 value; __u64 value;
...@@ -1844,23 +1866,31 @@ enum drm_i915_perf_property_id { ...@@ -1844,23 +1866,31 @@ enum drm_i915_perf_property_id {
* Open the stream for a specific context handle (as used with * Open the stream for a specific context handle (as used with
* execbuffer2). A stream opened for a specific context this way * execbuffer2). A stream opened for a specific context this way
* won't typically require root privileges. * won't typically require root privileges.
*
* This property is available in perf revision 1.
*/ */
DRM_I915_PERF_PROP_CTX_HANDLE = 1, DRM_I915_PERF_PROP_CTX_HANDLE = 1,
/** /**
* A value of 1 requests the inclusion of raw OA unit reports as * A value of 1 requests the inclusion of raw OA unit reports as
* part of stream samples. * part of stream samples.
*
* This property is available in perf revision 1.
*/ */
DRM_I915_PERF_PROP_SAMPLE_OA, DRM_I915_PERF_PROP_SAMPLE_OA,
/** /**
* The value specifies which set of OA unit metrics should be * The value specifies which set of OA unit metrics should be
* be configured, defining the contents of any OA unit reports. * be configured, defining the contents of any OA unit reports.
*
* This property is available in perf revision 1.
*/ */
DRM_I915_PERF_PROP_OA_METRICS_SET, DRM_I915_PERF_PROP_OA_METRICS_SET,
/** /**
* The value specifies the size and layout of OA unit reports. * The value specifies the size and layout of OA unit reports.
*
* This property is available in perf revision 1.
*/ */
DRM_I915_PERF_PROP_OA_FORMAT, DRM_I915_PERF_PROP_OA_FORMAT,
...@@ -1870,9 +1900,22 @@ enum drm_i915_perf_property_id { ...@@ -1870,9 +1900,22 @@ enum drm_i915_perf_property_id {
* from this exponent as follows: * from this exponent as follows:
* *
* 80ns * 2^(period_exponent + 1) * 80ns * 2^(period_exponent + 1)
*
* This property is available in perf revision 1.
*/ */
DRM_I915_PERF_PROP_OA_EXPONENT, DRM_I915_PERF_PROP_OA_EXPONENT,
/**
* Specifying this property is only valid when specifying a context to
* filter with DRM_I915_PERF_PROP_CTX_HANDLE. Specifying this property
* will hold preemption of the particular context we want to gather
* performance data about. The execbuf2 submissions must include a
* drm_i915_gem_execbuffer_ext_perf parameter for this to apply.
*
* This property is available in perf revision 3.
*/
DRM_I915_PERF_PROP_HOLD_PREEMPTION,
DRM_I915_PERF_PROP_MAX /* non-ABI */ DRM_I915_PERF_PROP_MAX /* non-ABI */
}; };
...@@ -1901,6 +1944,8 @@ struct drm_i915_perf_open_param { ...@@ -1901,6 +1944,8 @@ struct drm_i915_perf_open_param {
* to close and re-open a stream with the same configuration. * to close and re-open a stream with the same configuration.
* *
* It's undefined whether any pending data for the stream will be lost. * It's undefined whether any pending data for the stream will be lost.
*
* This ioctl is available in perf revision 1.
*/ */
#define I915_PERF_IOCTL_ENABLE _IO('i', 0x0) #define I915_PERF_IOCTL_ENABLE _IO('i', 0x0)
...@@ -1908,9 +1953,24 @@ struct drm_i915_perf_open_param { ...@@ -1908,9 +1953,24 @@ struct drm_i915_perf_open_param {
* Disable data capture for a stream. * Disable data capture for a stream.
* *
* It is an error to try and read a stream that is disabled. * It is an error to try and read a stream that is disabled.
*
* This ioctl is available in perf revision 1.
*/ */
#define I915_PERF_IOCTL_DISABLE _IO('i', 0x1) #define I915_PERF_IOCTL_DISABLE _IO('i', 0x1)
/**
* Change metrics_set captured by a stream.
*
* If the stream is bound to a specific context, the configuration change
* will be performed inline with that context such that it takes effect before
* the next execbuf submission.
*
* Returns the previously bound metrics set id, or a negative error code.
*
* This ioctl is available in perf revision 2.
*/
#define I915_PERF_IOCTL_CONFIG _IO('i', 0x2)
/** /**
* Common to all i915 perf records * Common to all i915 perf records
*/ */
...@@ -1984,6 +2044,7 @@ struct drm_i915_query_item { ...@@ -1984,6 +2044,7 @@ struct drm_i915_query_item {
__u64 query_id; __u64 query_id;
#define DRM_I915_QUERY_TOPOLOGY_INFO 1 #define DRM_I915_QUERY_TOPOLOGY_INFO 1
#define DRM_I915_QUERY_ENGINE_INFO 2 #define DRM_I915_QUERY_ENGINE_INFO 2
#define DRM_I915_QUERY_PERF_CONFIG 3
/* Must be kept compact -- no holes and well documented */ /* Must be kept compact -- no holes and well documented */
/* /*
...@@ -1995,9 +2056,18 @@ struct drm_i915_query_item { ...@@ -1995,9 +2056,18 @@ struct drm_i915_query_item {
__s32 length; __s32 length;
/* /*
* Unused for now. Must be cleared to zero. * When query_id == DRM_I915_QUERY_TOPOLOGY_INFO, must be 0.
*
* When query_id == DRM_I915_QUERY_PERF_CONFIG, must be one of the
* following :
* - DRM_I915_QUERY_PERF_CONFIG_LIST
* - DRM_I915_QUERY_PERF_CONFIG_DATA_FOR_UUID
* - DRM_I915_QUERY_PERF_CONFIG_DATA_FOR_ID
*/ */
__u32 flags; __u32 flags;
#define DRM_I915_QUERY_PERF_CONFIG_LIST 1
#define DRM_I915_QUERY_PERF_CONFIG_DATA_FOR_UUID 2
#define DRM_I915_QUERY_PERF_CONFIG_DATA_FOR_ID 3
/* /*
* Data will be written at the location pointed by data_ptr when the * Data will be written at the location pointed by data_ptr when the
...@@ -2033,8 +2103,10 @@ struct drm_i915_query { ...@@ -2033,8 +2103,10 @@ struct drm_i915_query {
* (data[X / 8] >> (X % 8)) & 1 * (data[X / 8] >> (X % 8)) & 1
* *
* - the subslice mask for each slice with one bit per subslice telling * - the subslice mask for each slice with one bit per subslice telling
* whether a subslice is available. The availability of subslice Y in slice * whether a subslice is available. Gen12 has dual-subslices, which are
* X can be queried with the following formula : * similar to two gen11 subslices. For gen12, this array represents dual-
* subslices. The availability of subslice Y in slice X can be queried
* with the following formula :
* *
* (data[subslice_offset + * (data[subslice_offset +
* X * subslice_stride + * X * subslice_stride +
...@@ -2123,6 +2195,56 @@ struct drm_i915_query_engine_info { ...@@ -2123,6 +2195,56 @@ struct drm_i915_query_engine_info {
struct drm_i915_engine_info engines[]; struct drm_i915_engine_info engines[];
}; };
/*
 * Data written by the kernel with query DRM_I915_QUERY_PERF_CONFIG.
 *
 * The leading union is interpreted according to the value of
 * query_item.flags (one of the DRM_I915_QUERY_PERF_CONFIG_* values);
 * only one of its members is meaningful for a given query.
 */
struct drm_i915_query_perf_config {
union {
/*
 * When query_item.flags == DRM_I915_QUERY_PERF_CONFIG_LIST, i915 sets
 * this field to the number of configurations available.
 */
__u64 n_configs;
/*
 * When query_item.flags == DRM_I915_QUERY_PERF_CONFIG_DATA_FOR_ID,
 * i915 will use the value in this field as configuration
 * identifier to decide what data to write into config_ptr.
 *
 * NOTE(review): no member named config_ptr is visible in this
 * struct; presumably this refers to the trailing data[] array -
 * confirm.
 */
__u64 config;
/*
 * When query_item.flags == DRM_I915_QUERY_PERF_CONFIG_DATA_FOR_UUID,
 * i915 will use the value in this field as configuration
 * identifier to decide what data to write into config_ptr.
 *
 * String formatted like "%08x-%04x-%04x-%04x-%012x"
 *
 * That format is exactly 36 characters long, so this array has no
 * room for a terminating NUL byte.
 */
char uuid[36];
};
/*
 * Unused for now. Must be cleared to zero.
 */
__u32 flags;
/*
 * When query_item.flags == DRM_I915_QUERY_PERF_CONFIG_LIST, i915 will
 * write an array of __u64 of configuration identifiers.
 *
 * When query_item.flags == DRM_I915_QUERY_PERF_CONFIG_DATA, i915 will
 * write a struct drm_i915_perf_oa_config. If the following fields of
 * drm_i915_perf_oa_config are not set to 0, i915 will write into
 * the associated pointers the values submitted when the
 * configuration was created :
 *
 * - n_mux_regs
 * - n_boolean_regs
 * - n_flex_regs
 *
 * NOTE(review): DRM_I915_QUERY_PERF_CONFIG_DATA is not one of the flag
 * values visible here; presumably it stands for both
 * DRM_I915_QUERY_PERF_CONFIG_DATA_FOR_UUID and
 * DRM_I915_QUERY_PERF_CONFIG_DATA_FOR_ID - confirm.
 */
__u8 data[];
};
#if defined(__cplusplus) #if defined(__cplusplus)
} }
#endif #endif
......
...@@ -17,7 +17,8 @@ ...@@ -17,7 +17,8 @@
#define FSCRYPT_POLICY_FLAGS_PAD_32 0x03 #define FSCRYPT_POLICY_FLAGS_PAD_32 0x03
#define FSCRYPT_POLICY_FLAGS_PAD_MASK 0x03 #define FSCRYPT_POLICY_FLAGS_PAD_MASK 0x03
#define FSCRYPT_POLICY_FLAG_DIRECT_KEY 0x04 #define FSCRYPT_POLICY_FLAG_DIRECT_KEY 0x04
#define FSCRYPT_POLICY_FLAGS_VALID 0x07 #define FSCRYPT_POLICY_FLAG_IV_INO_LBLK_64 0x08
#define FSCRYPT_POLICY_FLAGS_VALID 0x0F
/* Encryption algorithms */ /* Encryption algorithms */
#define FSCRYPT_MODE_AES_256_XTS 1 #define FSCRYPT_MODE_AES_256_XTS 1
......
...@@ -235,6 +235,7 @@ struct kvm_hyperv_exit { ...@@ -235,6 +235,7 @@ struct kvm_hyperv_exit {
#define KVM_EXIT_S390_STSI 25 #define KVM_EXIT_S390_STSI 25
#define KVM_EXIT_IOAPIC_EOI 26 #define KVM_EXIT_IOAPIC_EOI 26
#define KVM_EXIT_HYPERV 27 #define KVM_EXIT_HYPERV 27
#define KVM_EXIT_ARM_NISV 28
/* For KVM_EXIT_INTERNAL_ERROR */ /* For KVM_EXIT_INTERNAL_ERROR */
/* Emulate instruction failed. */ /* Emulate instruction failed. */
...@@ -394,6 +395,11 @@ struct kvm_run { ...@@ -394,6 +395,11 @@ struct kvm_run {
} eoi; } eoi;
/* KVM_EXIT_HYPERV */ /* KVM_EXIT_HYPERV */
struct kvm_hyperv_exit hyperv; struct kvm_hyperv_exit hyperv;
/* KVM_EXIT_ARM_NISV */
struct {
__u64 esr_iss;
__u64 fault_ipa;
} arm_nisv;
/* Fix the size of the union. */ /* Fix the size of the union. */
char padding[256]; char padding[256];
}; };
...@@ -1000,6 +1006,9 @@ struct kvm_ppc_resize_hpt { ...@@ -1000,6 +1006,9 @@ struct kvm_ppc_resize_hpt {
#define KVM_CAP_PMU_EVENT_FILTER 173 #define KVM_CAP_PMU_EVENT_FILTER 173
#define KVM_CAP_ARM_IRQ_LINE_LAYOUT_2 174 #define KVM_CAP_ARM_IRQ_LINE_LAYOUT_2 174
#define KVM_CAP_HYPERV_DIRECT_TLBFLUSH 175 #define KVM_CAP_HYPERV_DIRECT_TLBFLUSH 175
#define KVM_CAP_PPC_GUEST_DEBUG_SSTEP 176
#define KVM_CAP_ARM_NISV_TO_USER 177
#define KVM_CAP_ARM_INJECT_EXT_DABT 178
#ifdef KVM_CAP_IRQ_ROUTING #ifdef KVM_CAP_IRQ_ROUTING
...@@ -1227,6 +1236,8 @@ enum kvm_device_type { ...@@ -1227,6 +1236,8 @@ enum kvm_device_type {
#define KVM_DEV_TYPE_ARM_VGIC_ITS KVM_DEV_TYPE_ARM_VGIC_ITS #define KVM_DEV_TYPE_ARM_VGIC_ITS KVM_DEV_TYPE_ARM_VGIC_ITS
KVM_DEV_TYPE_XIVE, KVM_DEV_TYPE_XIVE,
#define KVM_DEV_TYPE_XIVE KVM_DEV_TYPE_XIVE #define KVM_DEV_TYPE_XIVE KVM_DEV_TYPE_XIVE
KVM_DEV_TYPE_ARM_PV_TIME,
#define KVM_DEV_TYPE_ARM_PV_TIME KVM_DEV_TYPE_ARM_PV_TIME
KVM_DEV_TYPE_MAX, KVM_DEV_TYPE_MAX,
}; };
...@@ -1337,6 +1348,7 @@ struct kvm_s390_ucas_mapping { ...@@ -1337,6 +1348,7 @@ struct kvm_s390_ucas_mapping {
#define KVM_PPC_GET_CPU_CHAR _IOR(KVMIO, 0xb1, struct kvm_ppc_cpu_char) #define KVM_PPC_GET_CPU_CHAR _IOR(KVMIO, 0xb1, struct kvm_ppc_cpu_char)
/* Available with KVM_CAP_PMU_EVENT_FILTER */ /* Available with KVM_CAP_PMU_EVENT_FILTER */
#define KVM_SET_PMU_EVENT_FILTER _IOW(KVMIO, 0xb2, struct kvm_pmu_event_filter) #define KVM_SET_PMU_EVENT_FILTER _IOW(KVMIO, 0xb2, struct kvm_pmu_event_filter)
#define KVM_PPC_SVM_OFF _IO(KVMIO, 0xb3)
/* ioctl for vm fd */ /* ioctl for vm fd */
#define KVM_CREATE_DEVICE _IOWR(KVMIO, 0xe0, struct kvm_create_device) #define KVM_CREATE_DEVICE _IOWR(KVMIO, 0xe0, struct kvm_create_device)
......
...@@ -33,27 +33,48 @@ ...@@ -33,27 +33,48 @@
#define CLONE_NEWNET 0x40000000 /* New network namespace */ #define CLONE_NEWNET 0x40000000 /* New network namespace */
#define CLONE_IO 0x80000000 /* Clone io context */ #define CLONE_IO 0x80000000 /* Clone io context */
/* Flags for the clone3() syscall. */
#define CLONE_CLEAR_SIGHAND 0x100000000ULL /* Clear any signal handler and reset to SIG_DFL. */
#ifndef __ASSEMBLY__ #ifndef __ASSEMBLY__
/** /**
* struct clone_args - arguments for the clone3 syscall * struct clone_args - arguments for the clone3 syscall
* @flags: Flags for the new process as listed above. * @flags: Flags for the new process as listed above.
* All flags are valid except for CSIGNAL and * All flags are valid except for CSIGNAL and
* CLONE_DETACHED. * CLONE_DETACHED.
* @pidfd: If CLONE_PIDFD is set, a pidfd will be * @pidfd: If CLONE_PIDFD is set, a pidfd will be
* returned in this argument. * returned in this argument.
* @child_tid: If CLONE_CHILD_SETTID is set, the TID of the * @child_tid: If CLONE_CHILD_SETTID is set, the TID of the
* child process will be returned in the child's * child process will be returned in the child's
* memory. * memory.
* @parent_tid: If CLONE_PARENT_SETTID is set, the TID of * @parent_tid: If CLONE_PARENT_SETTID is set, the TID of
* the child process will be returned in the * the child process will be returned in the
* parent's memory. * parent's memory.
* @exit_signal: The exit_signal the parent process will be * @exit_signal: The exit_signal the parent process will be
* sent when the child exits. * sent when the child exits.
* @stack: Specify the location of the stack for the * @stack: Specify the location of the stack for the
* child process. * child process.
* @stack_size: The size of the stack for the child process. * Note, @stack is expected to point to the
* @tls: If CLONE_SETTLS is set, the tls descriptor * lowest address. The stack direction will be
* is set to tls. * determined by the kernel and set up
* appropriately based on @stack_size.
* @stack_size: The size of the stack for the child process.
* @tls: If CLONE_SETTLS is set, the tls descriptor
* is set to tls.
* @set_tid: Pointer to an array of type *pid_t. The size
* of the array is defined using @set_tid_size.
* This array is used to select PIDs/TIDs for
* newly created processes. The first element in
* this defines the PID in the most nested PID
* namespace. Each additional element in the array
* defines the PID in the parent PID namespace of
* the original PID namespace. If the array has
* less entries than the number of currently
* nested PID namespaces only the PIDs in the
* corresponding namespaces are set.
* @set_tid_size: This defines the size of the array referenced
* in @set_tid. This cannot be larger than the
* kernel's limit of nested PID namespaces.
* *
* The structure is versioned by size and thus extensible. * The structure is versioned by size and thus extensible.
* New struct members must go at the end of the struct and * New struct members must go at the end of the struct and
...@@ -68,10 +89,13 @@ struct clone_args { ...@@ -68,10 +89,13 @@ struct clone_args {
__aligned_u64 stack; __aligned_u64 stack;
__aligned_u64 stack_size; __aligned_u64 stack_size;
__aligned_u64 tls; __aligned_u64 tls;
__aligned_u64 set_tid;
__aligned_u64 set_tid_size;
}; };
#endif #endif
#define CLONE_ARGS_SIZE_VER0 64 /* sizeof first published struct */ #define CLONE_ARGS_SIZE_VER0 64 /* sizeof first published struct */
#define CLONE_ARGS_SIZE_VER1 80 /* sizeof second published struct */
/* /*
* Scheduling policies * Scheduling policies
......
...@@ -167,8 +167,8 @@ struct statx { ...@@ -167,8 +167,8 @@ struct statx {
#define STATX_ATTR_APPEND 0x00000020 /* [I] File is append-only */ #define STATX_ATTR_APPEND 0x00000020 /* [I] File is append-only */
#define STATX_ATTR_NODUMP 0x00000040 /* [I] File is not to be dumped */ #define STATX_ATTR_NODUMP 0x00000040 /* [I] File is not to be dumped */
#define STATX_ATTR_ENCRYPTED 0x00000800 /* [I] File requires key to decrypt in fs */ #define STATX_ATTR_ENCRYPTED 0x00000800 /* [I] File requires key to decrypt in fs */
#define STATX_ATTR_AUTOMOUNT 0x00001000 /* Dir: Automount trigger */ #define STATX_ATTR_AUTOMOUNT 0x00001000 /* Dir: Automount trigger */
#define STATX_ATTR_VERITY 0x00100000 /* [I] Verity protected file */
#endif /* _UAPI_LINUX_STAT_H */ #endif /* _UAPI_LINUX_STAT_H */
...@@ -39,11 +39,12 @@ DESTDIR_SQ = '$(subst ','\'',$(DESTDIR))' ...@@ -39,11 +39,12 @@ DESTDIR_SQ = '$(subst ','\'',$(DESTDIR))'
LP64 := $(shell echo __LP64__ | ${CC} ${CFLAGS} -E -x c - | tail -n 1) LP64 := $(shell echo __LP64__ | ${CC} ${CFLAGS} -E -x c - | tail -n 1)
ifeq ($(LP64), 1) ifeq ($(LP64), 1)
libdir_relative = lib64 libdir_relative_temp = lib64
else else
libdir_relative = lib libdir_relative_temp = lib
endif endif
libdir_relative ?= $(libdir_relative_temp)
prefix ?= /usr/local prefix ?= /usr/local
libdir = $(prefix)/$(libdir_relative) libdir = $(prefix)/$(libdir_relative)
man_dir = $(prefix)/share/man man_dir = $(prefix)/share/man
...@@ -97,6 +98,7 @@ EVENT_PARSE_VERSION = $(EP_VERSION).$(EP_PATCHLEVEL).$(EP_EXTRAVERSION) ...@@ -97,6 +98,7 @@ EVENT_PARSE_VERSION = $(EP_VERSION).$(EP_PATCHLEVEL).$(EP_EXTRAVERSION)
LIB_TARGET = libtraceevent.a libtraceevent.so.$(EVENT_PARSE_VERSION) LIB_TARGET = libtraceevent.a libtraceevent.so.$(EVENT_PARSE_VERSION)
LIB_INSTALL = libtraceevent.a libtraceevent.so* LIB_INSTALL = libtraceevent.a libtraceevent.so*
LIB_INSTALL := $(addprefix $(OUTPUT),$(LIB_INSTALL))
INCLUDES = -I. -I $(srctree)/tools/include $(CONFIG_INCLUDES) INCLUDES = -I. -I $(srctree)/tools/include $(CONFIG_INCLUDES)
...@@ -207,10 +209,11 @@ define do_install ...@@ -207,10 +209,11 @@ define do_install
$(INSTALL) $(if $3,-m $3,) $1 '$(DESTDIR_SQ)$2' $(INSTALL) $(if $3,-m $3,) $1 '$(DESTDIR_SQ)$2'
endef endef
PKG_CONFIG_FILE = libtraceevent.pc PKG_CONFIG_SOURCE_FILE = libtraceevent.pc
PKG_CONFIG_FILE := $(addprefix $(OUTPUT),$(PKG_CONFIG_SOURCE_FILE))
define do_install_pkgconfig_file define do_install_pkgconfig_file
if [ -n "${pkgconfig_dir}" ]; then \ if [ -n "${pkgconfig_dir}" ]; then \
cp -f ${PKG_CONFIG_FILE}.template ${PKG_CONFIG_FILE}; \ cp -f ${PKG_CONFIG_SOURCE_FILE}.template ${PKG_CONFIG_FILE}; \
sed -i "s|INSTALL_PREFIX|${1}|g" ${PKG_CONFIG_FILE}; \ sed -i "s|INSTALL_PREFIX|${1}|g" ${PKG_CONFIG_FILE}; \
sed -i "s|LIB_VERSION|${EVENT_PARSE_VERSION}|g" ${PKG_CONFIG_FILE}; \ sed -i "s|LIB_VERSION|${EVENT_PARSE_VERSION}|g" ${PKG_CONFIG_FILE}; \
sed -i "s|LIB_DIR|${libdir}|g" ${PKG_CONFIG_FILE}; \ sed -i "s|LIB_DIR|${libdir}|g" ${PKG_CONFIG_FILE}; \
......
...@@ -32,11 +32,12 @@ DESTDIR_SQ = '$(subst ','\'',$(DESTDIR))' ...@@ -32,11 +32,12 @@ DESTDIR_SQ = '$(subst ','\'',$(DESTDIR))'
LP64 := $(shell echo __LP64__ | ${CC} ${CFLAGS} -E -x c - | tail -n 1) LP64 := $(shell echo __LP64__ | ${CC} ${CFLAGS} -E -x c - | tail -n 1)
ifeq ($(LP64), 1) ifeq ($(LP64), 1)
libdir_relative = lib64 libdir_relative_tmp = lib64
else else
libdir_relative = lib libdir_relative_tmp = lib
endif endif
libdir_relative ?= $(libdir_relative_tmp)
prefix ?= /usr/local prefix ?= /usr/local
libdir = $(prefix)/$(libdir_relative) libdir = $(prefix)/$(libdir_relative)
......
...@@ -68,10 +68,11 @@ OPTIONS ...@@ -68,10 +68,11 @@ OPTIONS
------- -------
-i:: -i::
--input=<path>:: --input=<path>::
Input file name. Input file name, for the 'report', 'diff' and 'buildid-list' subcommands.
-o:: -o::
--output=<path>:: --output=<path>::
Output file name. Output file name, for the 'record' subcommand. Doesn't work with 'report',
just redirect the output to a file when using 'report'.
--host:: --host::
Collect host side performance profile. Collect host side performance profile.
--guest:: --guest::
......
...@@ -37,7 +37,7 @@ ...@@ -37,7 +37,7 @@
.text .text
.type perf_regs_load,%function .type perf_regs_load,%function
ENTRY(perf_regs_load) SYM_FUNC_START(perf_regs_load)
str r0, [r0, #R0] str r0, [r0, #R0]
str r1, [r0, #R1] str r1, [r0, #R1]
str r2, [r0, #R2] str r2, [r0, #R2]
...@@ -56,4 +56,4 @@ ENTRY(perf_regs_load) ...@@ -56,4 +56,4 @@ ENTRY(perf_regs_load)
str lr, [r0, #PC] // store pc as lr in order to skip the call str lr, [r0, #PC] // store pc as lr in order to skip the call
// to this function // to this function
mov pc, lr mov pc, lr
ENDPROC(perf_regs_load) SYM_FUNC_END(perf_regs_load)
...@@ -7,7 +7,7 @@ ...@@ -7,7 +7,7 @@
#define LDR_REG(r) ldr x##r, [x0, 8 * r] #define LDR_REG(r) ldr x##r, [x0, 8 * r]
#define SP (8 * 31) #define SP (8 * 31)
#define PC (8 * 32) #define PC (8 * 32)
ENTRY(perf_regs_load) SYM_FUNC_START(perf_regs_load)
STR_REG(0) STR_REG(0)
STR_REG(1) STR_REG(1)
STR_REG(2) STR_REG(2)
...@@ -44,4 +44,4 @@ ENTRY(perf_regs_load) ...@@ -44,4 +44,4 @@ ENTRY(perf_regs_load)
str x30, [x0, #PC] str x30, [x0, #PC]
LDR_REG(1) LDR_REG(1)
ret ret
ENDPROC(perf_regs_load) SYM_FUNC_END(perf_regs_load)
...@@ -28,7 +28,7 @@ ...@@ -28,7 +28,7 @@
.text .text
#ifdef HAVE_ARCH_X86_64_SUPPORT #ifdef HAVE_ARCH_X86_64_SUPPORT
ENTRY(perf_regs_load) SYM_FUNC_START(perf_regs_load)
movq %rax, AX(%rdi) movq %rax, AX(%rdi)
movq %rbx, BX(%rdi) movq %rbx, BX(%rdi)
movq %rcx, CX(%rdi) movq %rcx, CX(%rdi)
...@@ -60,9 +60,9 @@ ENTRY(perf_regs_load) ...@@ -60,9 +60,9 @@ ENTRY(perf_regs_load)
movq %r14, R14(%rdi) movq %r14, R14(%rdi)
movq %r15, R15(%rdi) movq %r15, R15(%rdi)
ret ret
ENDPROC(perf_regs_load) SYM_FUNC_END(perf_regs_load)
#else #else
ENTRY(perf_regs_load) SYM_FUNC_START(perf_regs_load)
push %edi push %edi
movl 8(%esp), %edi movl 8(%esp), %edi
movl %eax, AX(%edi) movl %eax, AX(%edi)
...@@ -88,7 +88,7 @@ ENTRY(perf_regs_load) ...@@ -88,7 +88,7 @@ ENTRY(perf_regs_load)
movl $0, FS(%edi) movl $0, FS(%edi)
movl $0, GS(%edi) movl $0, GS(%edi)
ret ret
ENDPROC(perf_regs_load) SYM_FUNC_END(perf_regs_load)
#endif #endif
/* /*
......
...@@ -403,17 +403,6 @@ static int perf_event__repipe_tracing_data(struct perf_session *session, ...@@ -403,17 +403,6 @@ static int perf_event__repipe_tracing_data(struct perf_session *session,
return err; return err;
} }
/*
 * Hand the ID index event to perf_event__repipe_synth() (its result is not
 * checked), then let perf_event__process_id_index() handle it. Only the
 * processing status is reported back to the caller.
 */
static int perf_event__repipe_id_index(struct perf_session *session,
				       union perf_event *event)
{
	perf_event__repipe_synth(session->tool, event);

	return perf_event__process_id_index(session, event);
}
static int dso__read_build_id(struct dso *dso) static int dso__read_build_id(struct dso *dso)
{ {
if (dso->has_build_id) if (dso->has_build_id)
...@@ -651,7 +640,7 @@ static int __cmd_inject(struct perf_inject *inject) ...@@ -651,7 +640,7 @@ static int __cmd_inject(struct perf_inject *inject)
inject->tool.comm = perf_event__repipe_comm; inject->tool.comm = perf_event__repipe_comm;
inject->tool.namespaces = perf_event__repipe_namespaces; inject->tool.namespaces = perf_event__repipe_namespaces;
inject->tool.exit = perf_event__repipe_exit; inject->tool.exit = perf_event__repipe_exit;
inject->tool.id_index = perf_event__repipe_id_index; inject->tool.id_index = perf_event__process_id_index;
inject->tool.auxtrace_info = perf_event__process_auxtrace_info; inject->tool.auxtrace_info = perf_event__process_auxtrace_info;
inject->tool.auxtrace = perf_event__process_auxtrace; inject->tool.auxtrace = perf_event__process_auxtrace;
inject->tool.aux = perf_event__drop_aux; inject->tool.aux = perf_event__drop_aux;
......
...@@ -832,7 +832,7 @@ static int record__open(struct record *rec) ...@@ -832,7 +832,7 @@ static int record__open(struct record *rec)
if ((errno == EINVAL || errno == EBADF) && if ((errno == EINVAL || errno == EBADF) &&
pos->leader != pos && pos->leader != pos &&
pos->weak_group) { pos->weak_group) {
pos = perf_evlist__reset_weak_group(evlist, pos); pos = perf_evlist__reset_weak_group(evlist, pos, true);
goto try_again; goto try_again;
} }
rc = -errno; rc = -errno;
......
...@@ -388,6 +388,14 @@ static int report__setup_sample_type(struct report *rep) ...@@ -388,6 +388,14 @@ static int report__setup_sample_type(struct report *rep)
} }
} }
if (sort__mode == SORT_MODE__MEMORY) {
if (!is_pipe && !(sample_type & PERF_SAMPLE_DATA_SRC)) {
ui__error("Selected --mem-mode but no mem data. "
"Did you call perf record without -d?\n");
return -1;
}
}
if (symbol_conf.use_callchain || symbol_conf.cumulate_callchain) { if (symbol_conf.use_callchain || symbol_conf.cumulate_callchain) {
if ((sample_type & PERF_SAMPLE_REGS_USER) && if ((sample_type & PERF_SAMPLE_REGS_USER) &&
(sample_type & PERF_SAMPLE_STACK_USER)) { (sample_type & PERF_SAMPLE_STACK_USER)) {
......
This diff is collapsed.
...@@ -1568,9 +1568,13 @@ int cmd_top(int argc, const char **argv) ...@@ -1568,9 +1568,13 @@ int cmd_top(int argc, const char **argv)
*/ */
status = perf_env__read_cpuid(&perf_env); status = perf_env__read_cpuid(&perf_env);
if (status) { if (status) {
pr_err("Couldn't read the cpuid for this machine: %s\n", /*
str_error_r(errno, errbuf, sizeof(errbuf))); * Some arches do not provide a get_cpuid(), so just use pr_debug, otherwise
goto out_delete_evlist; * warn the user explicitly.
*/
eprintf(status == ENOSYS ? 1 : 0, verbose,
"Couldn't read the cpuid for this machine: %s\n",
str_error_r(errno, errbuf, sizeof(errbuf)));
} }
top.evlist->env = &perf_env; top.evlist->env = &perf_env;
......
...@@ -110,8 +110,8 @@ for i in $FILES; do ...@@ -110,8 +110,8 @@ for i in $FILES; do
done done
# diff with extra ignore lines # diff with extra ignore lines
check arch/x86/lib/memcpy_64.S '-I "^EXPORT_SYMBOL" -I "^#include <asm/export.h>"' check arch/x86/lib/memcpy_64.S '-I "^EXPORT_SYMBOL" -I "^#include <asm/export.h>" -I"^SYM_FUNC_START\(_LOCAL\)*(memcpy_\(erms\|orig\))"'
check arch/x86/lib/memset_64.S '-I "^EXPORT_SYMBOL" -I "^#include <asm/export.h>"' check arch/x86/lib/memset_64.S '-I "^EXPORT_SYMBOL" -I "^#include <asm/export.h>" -I"^SYM_FUNC_START\(_LOCAL\)*(memset_\(erms\|orig\))"'
check include/uapi/asm-generic/mman.h '-I "^#include <\(uapi/\)*asm-generic/mman-common\(-tools\)*.h>"' check include/uapi/asm-generic/mman.h '-I "^#include <\(uapi/\)*asm-generic/mman-common\(-tools\)*.h>"'
check include/uapi/linux/mman.h '-I "^#include <\(uapi/\)*asm/mman.h>"' check include/uapi/linux/mman.h '-I "^#include <\(uapi/\)*asm/mman.h>"'
check include/linux/ctype.h '-I "isdigit("' check include/linux/ctype.h '-I "isdigit("'
......
...@@ -68,14 +68,28 @@ static struct perf_cpu_map *cpu_map__default_new(void) ...@@ -68,14 +68,28 @@ static struct perf_cpu_map *cpu_map__default_new(void)
return cpus; return cpus;
} }
/*
 * qsort() comparator that orders two ints ascending.
 *
 * Returns a negative value, zero or a positive value when *a is smaller
 * than, equal to or greater than *b.
 *
 * Comparisons are used instead of "*a - *b": the subtraction overflows
 * (undefined behaviour for signed int) when the operands are far apart and
 * can then yield a result with the wrong sign.
 */
static int cmp_int(const void *a, const void *b)
{
	int lhs = *(const int *)a;
	int rhs = *(const int *)b;

	return (lhs > rhs) - (lhs < rhs);
}
static struct perf_cpu_map *cpu_map__trim_new(int nr_cpus, int *tmp_cpus) static struct perf_cpu_map *cpu_map__trim_new(int nr_cpus, int *tmp_cpus)
{ {
size_t payload_size = nr_cpus * sizeof(int); size_t payload_size = nr_cpus * sizeof(int);
struct perf_cpu_map *cpus = malloc(sizeof(*cpus) + payload_size); struct perf_cpu_map *cpus = malloc(sizeof(*cpus) + payload_size);
int i, j;
if (cpus != NULL) { if (cpus != NULL) {
cpus->nr = nr_cpus;
memcpy(cpus->map, tmp_cpus, payload_size); memcpy(cpus->map, tmp_cpus, payload_size);
qsort(cpus->map, nr_cpus, sizeof(int), cmp_int);
/* Remove dups */
j = 0;
for (i = 0; i < nr_cpus; i++) {
if (i == 0 || cpus->map[i] != cpus->map[i - 1])
cpus->map[j++] = cpus->map[i];
}
cpus->nr = j;
assert(j <= nr_cpus);
refcount_set(&cpus->refcnt, 1); refcount_set(&cpus->refcnt, 1);
} }
...@@ -272,3 +286,60 @@ int perf_cpu_map__max(struct perf_cpu_map *map) ...@@ -272,3 +286,60 @@ int perf_cpu_map__max(struct perf_cpu_map *map)
return max; return max;
} }
/*
 * Build the union of two cpu maps.
 *
 * Reference handling, "realloc"-like for orig:
 *  - other == NULL: orig is returned untouched (NULL when both are NULL).
 *  - orig == NULL: other is returned after taking one extra reference on it.
 *  - both maps hold the same entries: orig is returned, no reference change.
 *  - otherwise a new map is built from both, the caller's reference on orig
 *    is dropped and the new map is returned; other is only read.
 *
 * Returns NULL when the scratch buffer cannot be allocated; orig is not
 * released on that path. The merge loop relies on both inputs being sorted
 * in ascending order.
 */
struct perf_cpu_map *perf_cpu_map__merge(struct perf_cpu_map *orig,
					 struct perf_cpu_map *other)
{
	struct perf_cpu_map *result;
	int *scratch;
	int capacity;
	int a = 0, b = 0, out = 0;

	/* Nothing to add: orig (possibly NULL) is already the answer. */
	if (!other)
		return orig;

	/* Nothing to extend: share other with the caller. */
	if (!orig) {
		perf_cpu_map__get(other);
		return other;
	}

	/* Same contents: keep using orig as is. */
	if (orig->nr == other->nr &&
	    memcmp(orig->map, other->map, orig->nr * sizeof(int)) == 0)
		return orig;

	/* Worst case: the two maps have no entry in common. */
	capacity = orig->nr + other->nr;
	scratch = malloc(capacity * sizeof(int));
	if (!scratch)
		return NULL;

	/* Two-way merge; an entry present in both maps is emitted once. */
	while (a < orig->nr && b < other->nr) {
		int lhs = orig->map[a];
		int rhs = other->map[b];

		if (lhs > rhs) {
			scratch[out++] = rhs;
			b++;
			continue;
		}
		if (lhs == rhs)
			b++;
		scratch[out++] = lhs;
		a++;
	}

	/* At most one of the inputs still has entries left. */
	for (; a < orig->nr; a++)
		scratch[out++] = orig->map[a];
	for (; b < other->nr; b++)
		scratch[out++] = other->map[b];

	assert(out <= capacity);

	result = cpu_map__trim_new(out, scratch);
	free(scratch);
	perf_cpu_map__put(orig);
	return result;
}
...@@ -54,6 +54,7 @@ static void __perf_evlist__propagate_maps(struct perf_evlist *evlist, ...@@ -54,6 +54,7 @@ static void __perf_evlist__propagate_maps(struct perf_evlist *evlist,
perf_thread_map__put(evsel->threads); perf_thread_map__put(evsel->threads);
evsel->threads = perf_thread_map__get(evlist->threads); evsel->threads = perf_thread_map__get(evlist->threads);
evlist->all_cpus = perf_cpu_map__merge(evlist->all_cpus, evsel->cpus);
} }
static void perf_evlist__propagate_maps(struct perf_evlist *evlist) static void perf_evlist__propagate_maps(struct perf_evlist *evlist)
......
...@@ -114,16 +114,23 @@ int perf_evsel__open(struct perf_evsel *evsel, struct perf_cpu_map *cpus, ...@@ -114,16 +114,23 @@ int perf_evsel__open(struct perf_evsel *evsel, struct perf_cpu_map *cpus,
return err; return err;
} }
/*
 * Close every valid descriptor stored in evsel->fd for the given first
 * index ('cpu') and reset each of that index's slots to -1, whether or not
 * it held an open descriptor.
 */
static void perf_evsel__close_fd_cpu(struct perf_evsel *evsel, int cpu)
{
	int t = 0;

	while (t < xyarray__max_y(evsel->fd)) {
		int fd = FD(evsel, cpu, t);

		if (fd >= 0)
			close(fd);
		FD(evsel, cpu, t) = -1;
		t++;
	}
}
void perf_evsel__close_fd(struct perf_evsel *evsel) void perf_evsel__close_fd(struct perf_evsel *evsel)
{ {
int cpu, thread; int cpu;
for (cpu = 0; cpu < xyarray__max_x(evsel->fd); cpu++) for (cpu = 0; cpu < xyarray__max_x(evsel->fd); cpu++)
for (thread = 0; thread < xyarray__max_y(evsel->fd); ++thread) { perf_evsel__close_fd_cpu(evsel, cpu);
if (FD(evsel, cpu, thread) >= 0)
close(FD(evsel, cpu, thread));
FD(evsel, cpu, thread) = -1;
}
} }
void perf_evsel__free_fd(struct perf_evsel *evsel) void perf_evsel__free_fd(struct perf_evsel *evsel)
...@@ -141,6 +148,14 @@ void perf_evsel__close(struct perf_evsel *evsel) ...@@ -141,6 +148,14 @@ void perf_evsel__close(struct perf_evsel *evsel)
perf_evsel__free_fd(evsel); perf_evsel__free_fd(evsel);
} }
/*
 * Close the descriptors of a single cpu index of @evsel. Does nothing when
 * the evsel has no fd array.
 */
void perf_evsel__close_cpu(struct perf_evsel *evsel, int cpu)
{
	if (evsel->fd != NULL)
		perf_evsel__close_fd_cpu(evsel, cpu);
}
int perf_evsel__read_size(struct perf_evsel *evsel) int perf_evsel__read_size(struct perf_evsel *evsel)
{ {
u64 read_format = evsel->attr.read_format; u64 read_format = evsel->attr.read_format;
...@@ -183,38 +198,61 @@ int perf_evsel__read(struct perf_evsel *evsel, int cpu, int thread, ...@@ -183,38 +198,61 @@ int perf_evsel__read(struct perf_evsel *evsel, int cpu, int thread,
} }
static int perf_evsel__run_ioctl(struct perf_evsel *evsel, static int perf_evsel__run_ioctl(struct perf_evsel *evsel,
int ioc, void *arg) int ioc, void *arg,
int cpu)
{ {
int cpu, thread; int thread;
for (cpu = 0; cpu < xyarray__max_x(evsel->fd); cpu++) { for (thread = 0; thread < xyarray__max_y(evsel->fd); thread++) {
for (thread = 0; thread < xyarray__max_y(evsel->fd); thread++) { int fd = FD(evsel, cpu, thread),
int fd = FD(evsel, cpu, thread), err = ioctl(fd, ioc, arg);
err = ioctl(fd, ioc, arg);
if (err) if (err)
return err; return err;
}
} }
return 0; return 0;
} }
/*
 * Issue PERF_EVENT_IOC_ENABLE, with a NULL argument, for one cpu of @evsel
 * through perf_evsel__run_ioctl().
 *
 * @cpu is forwarded unchanged; perf_evsel__enable() passes positions in
 * evsel->fd here, so it looks like an index into the fd array rather than a
 * CPU number - NOTE(review): confirm against callers.
 *
 * Returns whatever perf_evsel__run_ioctl() returns.
 */
int perf_evsel__enable_cpu(struct perf_evsel *evsel, int cpu)
{
return perf_evsel__run_ioctl(evsel, PERF_EVENT_IOC_ENABLE, NULL, cpu);
}
int perf_evsel__enable(struct perf_evsel *evsel) int perf_evsel__enable(struct perf_evsel *evsel)
{ {
return perf_evsel__run_ioctl(evsel, PERF_EVENT_IOC_ENABLE, 0); int i;
int err = 0;
for (i = 0; i < xyarray__max_x(evsel->fd) && !err; i++)
err = perf_evsel__run_ioctl(evsel, PERF_EVENT_IOC_ENABLE, NULL, i);
return err;
}
/*
 * Issue PERF_EVENT_IOC_DISABLE, with a NULL argument, for one cpu of @evsel
 * through perf_evsel__run_ioctl().
 *
 * @cpu is forwarded unchanged; perf_evsel__disable() passes positions in
 * evsel->fd here, so it looks like an index into the fd array rather than a
 * CPU number - NOTE(review): confirm against callers.
 *
 * Returns whatever perf_evsel__run_ioctl() returns.
 */
int perf_evsel__disable_cpu(struct perf_evsel *evsel, int cpu)
{
return perf_evsel__run_ioctl(evsel, PERF_EVENT_IOC_DISABLE, NULL, cpu);
}
int perf_evsel__disable(struct perf_evsel *evsel) int perf_evsel__disable(struct perf_evsel *evsel)
{ {
return perf_evsel__run_ioctl(evsel, PERF_EVENT_IOC_DISABLE, 0); int i;
int err = 0;
for (i = 0; i < xyarray__max_x(evsel->fd) && !err; i++)
err = perf_evsel__run_ioctl(evsel, PERF_EVENT_IOC_DISABLE, NULL, i);
return err;
} }
int perf_evsel__apply_filter(struct perf_evsel *evsel, const char *filter) int perf_evsel__apply_filter(struct perf_evsel *evsel, const char *filter)
{ {
return perf_evsel__run_ioctl(evsel, int err = 0, i;
for (i = 0; i < evsel->cpus->nr && !err; i++)
err = perf_evsel__run_ioctl(evsel,
PERF_EVENT_IOC_SET_FILTER, PERF_EVENT_IOC_SET_FILTER,
(void *)filter); (void *)filter, i);
return err;
} }
struct perf_cpu_map *perf_evsel__cpus(struct perf_evsel *evsel) struct perf_cpu_map *perf_evsel__cpus(struct perf_evsel *evsel)
......
...@@ -18,6 +18,7 @@ struct perf_evlist { ...@@ -18,6 +18,7 @@ struct perf_evlist {
int nr_entries; int nr_entries;
bool has_user_cpus; bool has_user_cpus;
struct perf_cpu_map *cpus; struct perf_cpu_map *cpus;
struct perf_cpu_map *all_cpus;
struct perf_thread_map *threads; struct perf_thread_map *threads;
int nr_mmaps; int nr_mmaps;
size_t mmap_len; size_t mmap_len;
......
...@@ -12,6 +12,8 @@ LIBPERF_API struct perf_cpu_map *perf_cpu_map__dummy_new(void); ...@@ -12,6 +12,8 @@ LIBPERF_API struct perf_cpu_map *perf_cpu_map__dummy_new(void);
LIBPERF_API struct perf_cpu_map *perf_cpu_map__new(const char *cpu_list); LIBPERF_API struct perf_cpu_map *perf_cpu_map__new(const char *cpu_list);
LIBPERF_API struct perf_cpu_map *perf_cpu_map__read(FILE *file); LIBPERF_API struct perf_cpu_map *perf_cpu_map__read(FILE *file);
LIBPERF_API struct perf_cpu_map *perf_cpu_map__get(struct perf_cpu_map *map); LIBPERF_API struct perf_cpu_map *perf_cpu_map__get(struct perf_cpu_map *map);
LIBPERF_API struct perf_cpu_map *perf_cpu_map__merge(struct perf_cpu_map *orig,
struct perf_cpu_map *other);
LIBPERF_API void perf_cpu_map__put(struct perf_cpu_map *map); LIBPERF_API void perf_cpu_map__put(struct perf_cpu_map *map);
LIBPERF_API int perf_cpu_map__cpu(const struct perf_cpu_map *cpus, int idx); LIBPERF_API int perf_cpu_map__cpu(const struct perf_cpu_map *cpus, int idx);
LIBPERF_API int perf_cpu_map__nr(const struct perf_cpu_map *cpus); LIBPERF_API int perf_cpu_map__nr(const struct perf_cpu_map *cpus);
......
...@@ -26,10 +26,13 @@ LIBPERF_API void perf_evsel__delete(struct perf_evsel *evsel); ...@@ -26,10 +26,13 @@ LIBPERF_API void perf_evsel__delete(struct perf_evsel *evsel);
LIBPERF_API int perf_evsel__open(struct perf_evsel *evsel, struct perf_cpu_map *cpus, LIBPERF_API int perf_evsel__open(struct perf_evsel *evsel, struct perf_cpu_map *cpus,
struct perf_thread_map *threads); struct perf_thread_map *threads);
LIBPERF_API void perf_evsel__close(struct perf_evsel *evsel); LIBPERF_API void perf_evsel__close(struct perf_evsel *evsel);
LIBPERF_API void perf_evsel__close_cpu(struct perf_evsel *evsel, int cpu);
LIBPERF_API int perf_evsel__read(struct perf_evsel *evsel, int cpu, int thread, LIBPERF_API int perf_evsel__read(struct perf_evsel *evsel, int cpu, int thread,
struct perf_counts_values *count); struct perf_counts_values *count);
LIBPERF_API int perf_evsel__enable(struct perf_evsel *evsel); LIBPERF_API int perf_evsel__enable(struct perf_evsel *evsel);
LIBPERF_API int perf_evsel__enable_cpu(struct perf_evsel *evsel, int cpu);
LIBPERF_API int perf_evsel__disable(struct perf_evsel *evsel); LIBPERF_API int perf_evsel__disable(struct perf_evsel *evsel);
LIBPERF_API int perf_evsel__disable_cpu(struct perf_evsel *evsel, int cpu);
LIBPERF_API struct perf_cpu_map *perf_evsel__cpus(struct perf_evsel *evsel); LIBPERF_API struct perf_cpu_map *perf_evsel__cpus(struct perf_evsel *evsel);
LIBPERF_API struct perf_thread_map *perf_evsel__threads(struct perf_evsel *evsel); LIBPERF_API struct perf_thread_map *perf_evsel__threads(struct perf_evsel *evsel);
LIBPERF_API struct perf_event_attr *perf_evsel__attr(struct perf_evsel *evsel); LIBPERF_API struct perf_event_attr *perf_evsel__attr(struct perf_evsel *evsel);
......
...@@ -32,7 +32,7 @@ ...@@ -32,7 +32,7 @@
"EventCode": "132", "EventCode": "132",
"EventName": "DTLB1_GPAGE_WRITES", "EventName": "DTLB1_GPAGE_WRITES",
"BriefDescription": "DTLB1 Two-Gigabyte Page Writes", "BriefDescription": "DTLB1 Two-Gigabyte Page Writes",
"PublicDescription": "Counter:132 Name:DTLB1_GPAGE_WRITES A translation entry has been written to the Level-1 Data Translation Lookaside Buffer for a two-gigabyte page." "PublicDescription": "A translation entry has been written to the Level-1 Data Translation Lookaside Buffer for a two-gigabyte page."
}, },
{ {
"Unit": "CPU-M-CF", "Unit": "CPU-M-CF",
......
...@@ -4,7 +4,7 @@ ...@@ -4,7 +4,7 @@
"EventCode": "128", "EventCode": "128",
"EventName": "L1D_RO_EXCL_WRITES", "EventName": "L1D_RO_EXCL_WRITES",
"BriefDescription": "L1D Read-only Exclusive Writes", "BriefDescription": "L1D Read-only Exclusive Writes",
"PublicDescription": "L1D_RO_EXCL_WRITES A directory write to the Level-1 Data cache where the line was originally in a Read-Only state in the cache but has been updated to be in the Exclusive state that allows stores to the cache line" "PublicDescription": "A directory write to the Level-1 Data cache where the line was originally in a Read-Only state in the cache but has been updated to be in the Exclusive state that allows stores to the cache line"
}, },
{ {
"Unit": "CPU-M-CF", "Unit": "CPU-M-CF",
......
...@@ -297,7 +297,7 @@ ...@@ -297,7 +297,7 @@
}, },
{ {
"BriefDescription": "Fraction of cycles spent in Kernel mode", "BriefDescription": "Fraction of cycles spent in Kernel mode",
"MetricExpr": "CPU_CLK_UNHALTED.REF_TSC:u / CPU_CLK_UNHALTED.REF_TSC", "MetricExpr": "CPU_CLK_UNHALTED.REF_TSC:k / CPU_CLK_UNHALTED.REF_TSC",
"MetricGroup": "Summary", "MetricGroup": "Summary",
"MetricName": "Kernel_Utilization" "MetricName": "Kernel_Utilization"
}, },
......
...@@ -115,7 +115,7 @@ ...@@ -115,7 +115,7 @@
}, },
{ {
"BriefDescription": "Fraction of cycles spent in Kernel mode", "BriefDescription": "Fraction of cycles spent in Kernel mode",
"MetricExpr": "CPU_CLK_UNHALTED.REF_TSC:u / CPU_CLK_UNHALTED.REF_TSC", "MetricExpr": "CPU_CLK_UNHALTED.REF_TSC:k / CPU_CLK_UNHALTED.REF_TSC",
"MetricGroup": "Summary", "MetricGroup": "Summary",
"MetricName": "Kernel_Utilization" "MetricName": "Kernel_Utilization"
}, },
......
...@@ -297,7 +297,7 @@ ...@@ -297,7 +297,7 @@
}, },
{ {
"BriefDescription": "Fraction of cycles spent in Kernel mode", "BriefDescription": "Fraction of cycles spent in Kernel mode",
"MetricExpr": "CPU_CLK_UNHALTED.REF_TSC:u / CPU_CLK_UNHALTED.REF_TSC", "MetricExpr": "CPU_CLK_UNHALTED.REF_TSC:k / CPU_CLK_UNHALTED.REF_TSC",
"MetricGroup": "Summary", "MetricGroup": "Summary",
"MetricName": "Kernel_Utilization" "MetricName": "Kernel_Utilization"
}, },
......
...@@ -315,7 +315,7 @@ ...@@ -315,7 +315,7 @@
}, },
{ {
"BriefDescription": "Fraction of cycles spent in Kernel mode", "BriefDescription": "Fraction of cycles spent in Kernel mode",
"MetricExpr": "CPU_CLK_UNHALTED.REF_TSC:u / CPU_CLK_UNHALTED.REF_TSC", "MetricExpr": "CPU_CLK_UNHALTED.REF_TSC:k / CPU_CLK_UNHALTED.REF_TSC",
"MetricGroup": "Summary", "MetricGroup": "Summary",
"MetricName": "Kernel_Utilization" "MetricName": "Kernel_Utilization"
}, },
......
...@@ -267,7 +267,7 @@ ...@@ -267,7 +267,7 @@
}, },
{ {
"BriefDescription": "Fraction of cycles spent in Kernel mode", "BriefDescription": "Fraction of cycles spent in Kernel mode",
"MetricExpr": "CPU_CLK_UNHALTED.REF_TSC:u / CPU_CLK_UNHALTED.REF_TSC", "MetricExpr": "CPU_CLK_UNHALTED.REF_TSC:k / CPU_CLK_UNHALTED.REF_TSC",
"MetricGroup": "Summary", "MetricGroup": "Summary",
"MetricName": "Kernel_Utilization" "MetricName": "Kernel_Utilization"
}, },
......
...@@ -267,7 +267,7 @@ ...@@ -267,7 +267,7 @@
}, },
{ {
"BriefDescription": "Fraction of cycles spent in Kernel mode", "BriefDescription": "Fraction of cycles spent in Kernel mode",
"MetricExpr": "CPU_CLK_UNHALTED.REF_TSC:u / CPU_CLK_UNHALTED.REF_TSC", "MetricExpr": "CPU_CLK_UNHALTED.REF_TSC:k / CPU_CLK_UNHALTED.REF_TSC",
"MetricGroup": "Summary", "MetricGroup": "Summary",
"MetricName": "Kernel_Utilization" "MetricName": "Kernel_Utilization"
}, },
......
...@@ -285,7 +285,7 @@ ...@@ -285,7 +285,7 @@
}, },
{ {
"BriefDescription": "Fraction of cycles spent in Kernel mode", "BriefDescription": "Fraction of cycles spent in Kernel mode",
"MetricExpr": "CPU_CLK_UNHALTED.REF_TSC:u / CPU_CLK_UNHALTED.REF_TSC", "MetricExpr": "CPU_CLK_UNHALTED.REF_TSC:k / CPU_CLK_UNHALTED.REF_TSC",
"MetricGroup": "Summary", "MetricGroup": "Summary",
"MetricName": "Kernel_Utilization" "MetricName": "Kernel_Utilization"
}, },
......
...@@ -285,7 +285,7 @@ ...@@ -285,7 +285,7 @@
}, },
{ {
"BriefDescription": "Fraction of cycles spent in Kernel mode", "BriefDescription": "Fraction of cycles spent in Kernel mode",
"MetricExpr": "CPU_CLK_UNHALTED.REF_TSC:u / CPU_CLK_UNHALTED.REF_TSC", "MetricExpr": "CPU_CLK_UNHALTED.REF_TSC:k / CPU_CLK_UNHALTED.REF_TSC",
"MetricGroup": "Summary", "MetricGroup": "Summary",
"MetricName": "Kernel_Utilization" "MetricName": "Kernel_Utilization"
}, },
......
...@@ -171,7 +171,7 @@ ...@@ -171,7 +171,7 @@
}, },
{ {
"BriefDescription": "Fraction of cycles spent in Kernel mode", "BriefDescription": "Fraction of cycles spent in Kernel mode",
"MetricExpr": "CPU_CLK_UNHALTED.REF_TSC:u / CPU_CLK_UNHALTED.REF_TSC", "MetricExpr": "CPU_CLK_UNHALTED.REF_TSC:k / CPU_CLK_UNHALTED.REF_TSC",
"MetricGroup": "Summary", "MetricGroup": "Summary",
"MetricName": "Kernel_Utilization" "MetricName": "Kernel_Utilization"
}, },
......
...@@ -171,7 +171,7 @@ ...@@ -171,7 +171,7 @@
}, },
{ {
"BriefDescription": "Fraction of cycles spent in Kernel mode", "BriefDescription": "Fraction of cycles spent in Kernel mode",
"MetricExpr": "CPU_CLK_UNHALTED.REF_TSC:u / CPU_CLK_UNHALTED.REF_TSC", "MetricExpr": "CPU_CLK_UNHALTED.REF_TSC:k / CPU_CLK_UNHALTED.REF_TSC",
"MetricGroup": "Summary", "MetricGroup": "Summary",
"MetricName": "Kernel_Utilization" "MetricName": "Kernel_Utilization"
}, },
......
...@@ -303,7 +303,7 @@ ...@@ -303,7 +303,7 @@
}, },
{ {
"BriefDescription": "Fraction of cycles spent in Kernel mode", "BriefDescription": "Fraction of cycles spent in Kernel mode",
"MetricExpr": "CPU_CLK_UNHALTED.REF_TSC:u / CPU_CLK_UNHALTED.REF_TSC", "MetricExpr": "CPU_CLK_UNHALTED.REF_TSC:k / CPU_CLK_UNHALTED.REF_TSC",
"MetricGroup": "Summary", "MetricGroup": "Summary",
"MetricName": "Kernel_Utilization" "MetricName": "Kernel_Utilization"
}, },
......
...@@ -315,7 +315,7 @@ ...@@ -315,7 +315,7 @@
}, },
{ {
"BriefDescription": "Fraction of cycles spent in Kernel mode", "BriefDescription": "Fraction of cycles spent in Kernel mode",
"MetricExpr": "CPU_CLK_UNHALTED.REF_TSC:u / CPU_CLK_UNHALTED.REF_TSC", "MetricExpr": "CPU_CLK_UNHALTED.REF_TSC:k / CPU_CLK_UNHALTED.REF_TSC",
"MetricGroup": "Summary", "MetricGroup": "Summary",
"MetricName": "Kernel_Utilization" "MetricName": "Kernel_Utilization"
}, },
......
...@@ -54,6 +54,7 @@ perf-y += unit_number__scnprintf.o ...@@ -54,6 +54,7 @@ perf-y += unit_number__scnprintf.o
perf-y += mem2node.o perf-y += mem2node.o
perf-y += maps.o perf-y += maps.o
perf-y += time-utils-test.o perf-y += time-utils-test.o
perf-y += genelf.o
$(OUTPUT)tests/llvm-src-base.c: tests/bpf-script-example.c tests/Build $(OUTPUT)tests/llvm-src-base.c: tests/bpf-script-example.c tests/Build
$(call rule_mkdir) $(call rule_mkdir)
......
...@@ -259,6 +259,11 @@ static struct test generic_tests[] = { ...@@ -259,6 +259,11 @@ static struct test generic_tests[] = {
.desc = "Print cpu map", .desc = "Print cpu map",
.func = test__cpu_map_print, .func = test__cpu_map_print,
}, },
{
.desc = "Merge cpu map",
.func = test__cpu_map_merge,
},
{ {
.desc = "Probe SDT events", .desc = "Probe SDT events",
.func = test__sdt_event, .func = test__sdt_event,
...@@ -296,6 +301,10 @@ static struct test generic_tests[] = { ...@@ -296,6 +301,10 @@ static struct test generic_tests[] = {
.desc = "time utils", .desc = "time utils",
.func = test__time_utils, .func = test__time_utils,
}, },
{
.desc = "Test jit_write_elf",
.func = test__jit_write_elf,
},
{ {
.desc = "maps__merge_in", .desc = "maps__merge_in",
.func = test__maps__merge_in, .func = test__maps__merge_in,
......
...@@ -120,3 +120,19 @@ int test__cpu_map_print(struct test *test __maybe_unused, int subtest __maybe_un ...@@ -120,3 +120,19 @@ int test__cpu_map_print(struct test *test __maybe_unused, int subtest __maybe_un
TEST_ASSERT_VAL("failed to convert map", cpu_map_print("1-10,12-20,22-30,32-40")); TEST_ASSERT_VAL("failed to convert map", cpu_map_print("1-10,12-20,22-30,32-40"));
return 0; return 0;
} }
/*
 * Merge two overlapping cpu lists, given in unsorted order, and check that
 * the result holds the five distinct cpus and prints as "1-2,4-5,7".
 */
int test__cpu_map_merge(struct test *test __maybe_unused, int subtest __maybe_unused)
{
	struct perf_cpu_map *a = perf_cpu_map__new("4,2,1");
	struct perf_cpu_map *b = perf_cpu_map__new("4,5,7");
	struct perf_cpu_map *c = perf_cpu_map__merge(a, b);
	char buf[100];

	/* perf_cpu_map__merge() returns NULL when it cannot allocate. */
	TEST_ASSERT_VAL("failed to merge map: no result", c != NULL);
	TEST_ASSERT_VAL("failed to merge map: bad nr", c->nr == 5);
	cpu_map__snprint(c, buf, sizeof(buf));
	TEST_ASSERT_VAL("failed to merge map: bad result", !strcmp(buf, "1-2,4-5,7"));

	/*
	 * Do not put 'a' here: perf_cpu_map__merge() treats its first argument
	 * like realloc() does and has already dropped our reference on it
	 * when it built 'c'. A second put would touch a released map.
	 */
	perf_cpu_map__put(b);
	perf_cpu_map__put(c);
	return 0;
}
...@@ -125,7 +125,7 @@ static int attach__cpu_disabled(struct evlist *evlist) ...@@ -125,7 +125,7 @@ static int attach__cpu_disabled(struct evlist *evlist)
evsel->core.attr.disabled = 1; evsel->core.attr.disabled = 1;
err = perf_evsel__open_per_cpu(evsel, cpus); err = perf_evsel__open_per_cpu(evsel, cpus, -1);
if (err) { if (err) {
if (err == -EACCES) if (err == -EACCES)
return TEST_SKIP; return TEST_SKIP;
...@@ -152,7 +152,7 @@ static int attach__cpu_enabled(struct evlist *evlist) ...@@ -152,7 +152,7 @@ static int attach__cpu_enabled(struct evlist *evlist)
return -1; return -1;
} }
err = perf_evsel__open_per_cpu(evsel, cpus); err = perf_evsel__open_per_cpu(evsel, cpus, -1);
if (err == -EACCES) if (err == -EACCES)
return TEST_SKIP; return TEST_SKIP;
......
// SPDX-License-Identifier: GPL-2.0-only
#include <limits.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <unistd.h>
#include <linux/compiler.h>
#include "debug.h"
#include "tests.h"
#ifdef HAVE_JITDUMP
#include <libelf.h>
#include "../util/genelf.h"
#endif
#define TEMPL "/tmp/perf-test-XXXXXX"
/*
 * Smoke test for jit_write_elf(): write a tiny x86 code blob, named "main",
 * as an ELF image into a scratch file created from TEMPL, then remove the
 * file again.
 *
 * Returns TEST_SKIP when built without HAVE_JITDUMP, TEST_FAIL when the
 * scratch file cannot be created or jit_write_elf() reports an error, and
 * 0 otherwise.
 */
int test__jit_write_elf(struct test *test __maybe_unused,
			int subtest __maybe_unused)
{
#ifndef HAVE_JITDUMP
	return TEST_SKIP;
#else
	static unsigned char x86_code[] = {
		0xBB, 0x2A, 0x00, 0x00, 0x00, /* movl $42, %ebx */
		0xB8, 0x01, 0x00, 0x00, 0x00, /* movl $1, %eax */
		0xCD, 0x80            /* int $0x80 */
	};
	char tmp_path[PATH_MAX];
	int out_fd;
	int err;

	/* mkstemp() rewrites the XXXXXX suffix in place, so work on a copy. */
	strcpy(tmp_path, TEMPL);

	out_fd = mkstemp(tmp_path);
	if (out_fd < 0) {
		perror("mkstemp failed");
		return TEST_FAIL;
	}

	pr_info("Writing jit code to: %s\n", tmp_path);

	err = jit_write_elf(out_fd, 0, "main", x86_code, sizeof(x86_code),
			    NULL, 0, NULL, 0, 0);

	/* The file is only scratch space; drop it whatever the outcome. */
	close(out_fd);
	unlink(tmp_path);

	if (err)
		return TEST_FAIL;
	return 0;
#endif
}
...@@ -98,6 +98,7 @@ int test__event_update(struct test *test, int subtest); ...@@ -98,6 +98,7 @@ int test__event_update(struct test *test, int subtest);
int test__event_times(struct test *test, int subtest); int test__event_times(struct test *test, int subtest);
int test__backward_ring_buffer(struct test *test, int subtest); int test__backward_ring_buffer(struct test *test, int subtest);
int test__cpu_map_print(struct test *test, int subtest); int test__cpu_map_print(struct test *test, int subtest);
int test__cpu_map_merge(struct test *test, int subtest);
int test__sdt_event(struct test *test, int subtest); int test__sdt_event(struct test *test, int subtest);
int test__is_printable_array(struct test *test, int subtest); int test__is_printable_array(struct test *test, int subtest);
int test__bitmap_print(struct test *test, int subtest); int test__bitmap_print(struct test *test, int subtest);
...@@ -109,6 +110,7 @@ int test__unit_number__scnprint(struct test *test, int subtest); ...@@ -109,6 +110,7 @@ int test__unit_number__scnprint(struct test *test, int subtest);
int test__mem2node(struct test *t, int subtest); int test__mem2node(struct test *t, int subtest);
int test__maps__merge_in(struct test *t, int subtest); int test__maps__merge_in(struct test *t, int subtest);
int test__time_utils(struct test *t, int subtest); int test__time_utils(struct test *t, int subtest);
int test__jit_write_elf(struct test *test, int subtest);
bool test__bp_signal_is_supported(void); bool test__bp_signal_is_supported(void);
bool test__bp_account_is_supported(void); bool test__bp_account_is_supported(void);
......
...@@ -45,6 +45,7 @@ static size_t clone__scnprintf_flags(unsigned long flags, char *bf, size_t size, ...@@ -45,6 +45,7 @@ static size_t clone__scnprintf_flags(unsigned long flags, char *bf, size_t size,
P_FLAG(NEWPID); P_FLAG(NEWPID);
P_FLAG(NEWNET); P_FLAG(NEWNET);
P_FLAG(IO); P_FLAG(IO);
P_FLAG(CLEAR_SIGHAND);
#undef P_FLAG #undef P_FLAG
if (flags) if (flags)
......
...@@ -63,4 +63,5 @@ int cpu_map__build_map(struct perf_cpu_map *cpus, struct perf_cpu_map **res, ...@@ -63,4 +63,5 @@ int cpu_map__build_map(struct perf_cpu_map *cpus, struct perf_cpu_map **res,
int cpu_map__cpu(struct perf_cpu_map *cpus, int idx); int cpu_map__cpu(struct perf_cpu_map *cpus, int idx);
bool cpu_map__has(struct perf_cpu_map *cpus, int cpu); bool cpu_map__has(struct perf_cpu_map *cpus, int cpu);
#endif /* __PERF_CPUMAP_H */ #endif /* __PERF_CPUMAP_H */
...@@ -18,6 +18,7 @@ ...@@ -18,6 +18,7 @@
#include "debug.h" #include "debug.h"
#include "units.h" #include "units.h"
#include <internal/lib.h> // page_size #include <internal/lib.h> // page_size
#include "affinity.h"
#include "../perf.h" #include "../perf.h"
#include "asm/bug.h" #include "asm/bug.h"
#include "bpf-event.h" #include "bpf-event.h"
...@@ -342,14 +343,63 @@ static int perf_evlist__nr_threads(struct evlist *evlist, ...@@ -342,14 +343,63 @@ static int perf_evlist__nr_threads(struct evlist *evlist,
return perf_thread_map__nr(evlist->core.threads); return perf_thread_map__nr(evlist->core.threads);
} }
void evlist__cpu_iter_start(struct evlist *evlist)
{
struct evsel *pos;
/*
* Reset the per evsel cpu_iter. This is needed because
* each evsel's cpumap may have a different index space,
* and some operations need the index to modify
* the FD xyarray (e.g. open, close)
*/
evlist__for_each_entry(evlist, pos)
pos->cpu_iter = 0;
}
/*
 * Decide whether @ev should be skipped for @cpu, without advancing the
 * evsel's cpu_iter cursor.
 *
 * Returns true when the cursor has run past the end of ev->core.cpus, or
 * when @cpu is non-negative and differs from the map entry at the cursor.
 * A negative @cpu never causes a skip on its own.
 */
bool evsel__cpu_iter_skip_no_inc(struct evsel *ev, int cpu)
{
	const int idx = ev->cpu_iter;

	/* Cursor exhausted: nothing left in this evsel's map. */
	if (idx >= ev->core.cpus->nr)
		return true;

	return cpu >= 0 && ev->core.cpus->map[idx] != cpu;
}
/*
 * Like evsel__cpu_iter_skip_no_inc(), but advance the cursor on a match.
 *
 * Returns true (cursor untouched) when @ev must be skipped for @cpu.
 * Returns false after incrementing ev->cpu_iter, so the entry that just
 * matched is at index ev->cpu_iter - 1.
 */
bool evsel__cpu_iter_skip(struct evsel *ev, int cpu)
{
	if (evsel__cpu_iter_skip_no_inc(ev, cpu))
		return true;

	ev->cpu_iter++;
	return false;
}
void evlist__disable(struct evlist *evlist) void evlist__disable(struct evlist *evlist)
{ {
struct evsel *pos; struct evsel *pos;
struct affinity affinity;
int cpu, i;
if (affinity__setup(&affinity) < 0)
return;
evlist__for_each_cpu(evlist, i, cpu) {
affinity__set(&affinity, cpu);
evlist__for_each_entry(evlist, pos) {
if (evsel__cpu_iter_skip(pos, cpu))
continue;
if (pos->disabled || !perf_evsel__is_group_leader(pos) || !pos->core.fd)
continue;
evsel__disable_cpu(pos, pos->cpu_iter - 1);
}
}
affinity__cleanup(&affinity);
evlist__for_each_entry(evlist, pos) { evlist__for_each_entry(evlist, pos) {
if (pos->disabled || !perf_evsel__is_group_leader(pos) || !pos->core.fd) if (!perf_evsel__is_group_leader(pos) || !pos->core.fd)
continue; continue;
evsel__disable(pos); pos->disabled = true;
} }
evlist->enabled = false; evlist->enabled = false;
...@@ -358,11 +408,28 @@ void evlist__disable(struct evlist *evlist) ...@@ -358,11 +408,28 @@ void evlist__disable(struct evlist *evlist)
void evlist__enable(struct evlist *evlist) void evlist__enable(struct evlist *evlist)
{ {
struct evsel *pos; struct evsel *pos;
struct affinity affinity;
int cpu, i;
if (affinity__setup(&affinity) < 0)
return;
evlist__for_each_cpu(evlist, i, cpu) {
affinity__set(&affinity, cpu);
evlist__for_each_entry(evlist, pos) {
if (evsel__cpu_iter_skip(pos, cpu))
continue;
if (!perf_evsel__is_group_leader(pos) || !pos->core.fd)
continue;
evsel__enable_cpu(pos, pos->cpu_iter - 1);
}
}
affinity__cleanup(&affinity);
evlist__for_each_entry(evlist, pos) { evlist__for_each_entry(evlist, pos) {
if (!perf_evsel__is_group_leader(pos) || !pos->core.fd) if (!perf_evsel__is_group_leader(pos) || !pos->core.fd)
continue; continue;
evsel__enable(pos); pos->disabled = false;
} }
evlist->enabled = true; evlist->enabled = true;
...@@ -1137,9 +1204,35 @@ void perf_evlist__set_selected(struct evlist *evlist, ...@@ -1137,9 +1204,35 @@ void perf_evlist__set_selected(struct evlist *evlist,
void evlist__close(struct evlist *evlist) void evlist__close(struct evlist *evlist)
{ {
struct evsel *evsel; struct evsel *evsel;
struct affinity affinity;
int cpu, i;
evlist__for_each_entry_reverse(evlist, evsel) /*
evsel__close(evsel); * With perf record core.cpus is usually NULL.
* Use the old method to handle this for now.
*/
if (!evlist->core.cpus) {
evlist__for_each_entry_reverse(evlist, evsel)
evsel__close(evsel);
return;
}
if (affinity__setup(&affinity) < 0)
return;
evlist__for_each_cpu(evlist, i, cpu) {
affinity__set(&affinity, cpu);
evlist__for_each_entry_reverse(evlist, evsel) {
if (evsel__cpu_iter_skip(evsel, cpu))
continue;
perf_evsel__close_cpu(&evsel->core, evsel->cpu_iter - 1);
}
}
affinity__cleanup(&affinity);
evlist__for_each_entry_reverse(evlist, evsel) {
perf_evsel__free_fd(&evsel->core);
perf_evsel__free_id(&evsel->core);
}
} }
static int perf_evlist__create_syswide_maps(struct evlist *evlist) static int perf_evlist__create_syswide_maps(struct evlist *evlist)
...@@ -1577,7 +1670,8 @@ void perf_evlist__force_leader(struct evlist *evlist) ...@@ -1577,7 +1670,8 @@ void perf_evlist__force_leader(struct evlist *evlist)
} }
struct evsel *perf_evlist__reset_weak_group(struct evlist *evsel_list, struct evsel *perf_evlist__reset_weak_group(struct evlist *evsel_list,
struct evsel *evsel) struct evsel *evsel,
bool close)
{ {
struct evsel *c2, *leader; struct evsel *c2, *leader;
bool is_open = true; bool is_open = true;
...@@ -1594,10 +1688,15 @@ struct evsel *perf_evlist__reset_weak_group(struct evlist *evsel_list, ...@@ -1594,10 +1688,15 @@ struct evsel *perf_evlist__reset_weak_group(struct evlist *evsel_list,
if (c2 == evsel) if (c2 == evsel)
is_open = false; is_open = false;
if (c2->leader == leader) { if (c2->leader == leader) {
if (is_open) if (is_open && close)
perf_evsel__close(&c2->core); perf_evsel__close(&c2->core);
c2->leader = c2; c2->leader = c2;
c2->core.nr_members = 0; c2->core.nr_members = 0;
/*
* Set this for all former members of the group
* to indicate they get reopened.
*/
c2->reset_group = true;
} }
} }
return leader; return leader;
......
...@@ -334,9 +334,17 @@ void perf_evlist__to_front(struct evlist *evlist, ...@@ -334,9 +334,17 @@ void perf_evlist__to_front(struct evlist *evlist,
#define evlist__for_each_entry_safe(evlist, tmp, evsel) \ #define evlist__for_each_entry_safe(evlist, tmp, evsel) \
__evlist__for_each_entry_safe(&(evlist)->core.entries, tmp, evsel) __evlist__for_each_entry_safe(&(evlist)->core.entries, tmp, evsel)
/*
 * Walk (evlist)->core.all_cpus with perf_cpu_map__for_each_cpu(), after
 * first resetting every evsel's cpu_iter via evlist__cpu_iter_start().
 *
 * NOTE: this expands to TWO statements (the reset call, then the loop
 * header). Do not use it as the unbraced body of an if/else/for/while:
 * only the reset call would be governed by the enclosing statement.
 * @evlist is also evaluated twice.
 */
#define evlist__for_each_cpu(evlist, index, cpu) \
evlist__cpu_iter_start(evlist); \
perf_cpu_map__for_each_cpu (cpu, index, (evlist)->core.all_cpus)
void perf_evlist__set_tracking_event(struct evlist *evlist, void perf_evlist__set_tracking_event(struct evlist *evlist,
struct evsel *tracking_evsel); struct evsel *tracking_evsel);
void evlist__cpu_iter_start(struct evlist *evlist);
bool evsel__cpu_iter_skip(struct evsel *ev, int cpu);
bool evsel__cpu_iter_skip_no_inc(struct evsel *ev, int cpu);
struct evsel * struct evsel *
perf_evlist__find_evsel_by_str(struct evlist *evlist, const char *str); perf_evlist__find_evsel_by_str(struct evlist *evlist, const char *str);
...@@ -348,5 +356,6 @@ bool perf_evlist__exclude_kernel(struct evlist *evlist); ...@@ -348,5 +356,6 @@ bool perf_evlist__exclude_kernel(struct evlist *evlist);
void perf_evlist__force_leader(struct evlist *evlist); void perf_evlist__force_leader(struct evlist *evlist);
struct evsel *perf_evlist__reset_weak_group(struct evlist *evlist, struct evsel *perf_evlist__reset_weak_group(struct evlist *evlist,
struct evsel *evsel); struct evsel *evsel,
bool close);
#endif /* __PERF_EVLIST_H */ #endif /* __PERF_EVLIST_H */
...@@ -1223,16 +1223,27 @@ int perf_evsel__append_addr_filter(struct evsel *evsel, const char *filter) ...@@ -1223,16 +1223,27 @@ int perf_evsel__append_addr_filter(struct evsel *evsel, const char *filter)
return perf_evsel__append_filter(evsel, "%s,%s", filter); return perf_evsel__append_filter(evsel, "%s,%s", filter);
} }
/*
 * Enable @evsel for a single cpu slot by forwarding to
 * perf_evsel__enable_cpu() and returning its result.
 *
 * Unlike evsel__enable(), this leaves evsel->disabled untouched: the
 * caller has to clear disabled after going through all CPUs.
 *
 * NOTE(review): the evlist code passes cpu_iter - 1 here, i.e. an index
 * into the evsel's cpu map rather than a cpu number.
 */
int evsel__enable_cpu(struct evsel *evsel, int cpu)
{
	int err = perf_evsel__enable_cpu(&evsel->core, cpu);

	return err;
}
int evsel__enable(struct evsel *evsel) int evsel__enable(struct evsel *evsel)
{ {
int err = perf_evsel__enable(&evsel->core); int err = perf_evsel__enable(&evsel->core);
if (!err) if (!err)
evsel->disabled = false; evsel->disabled = false;
return err; return err;
} }
/*
 * Disable @evsel for a single cpu slot by forwarding to
 * perf_evsel__disable_cpu() and returning its result.
 *
 * This does not update evsel->disabled: the caller has to set disabled
 * after going through all CPUs.
 *
 * NOTE(review): the evlist code passes cpu_iter - 1 here, i.e. an index
 * into the evsel's cpu map rather than a cpu number.
 */
int evsel__disable_cpu(struct evsel *evsel, int cpu)
{
	int err = perf_evsel__disable_cpu(&evsel->core, cpu);

	return err;
}
int evsel__disable(struct evsel *evsel) int evsel__disable(struct evsel *evsel)
{ {
int err = perf_evsel__disable(&evsel->core); int err = perf_evsel__disable(&evsel->core);
...@@ -1587,8 +1598,9 @@ static int perf_event_open(struct evsel *evsel, ...@@ -1587,8 +1598,9 @@ static int perf_event_open(struct evsel *evsel,
return fd; return fd;
} }
int evsel__open(struct evsel *evsel, struct perf_cpu_map *cpus, static int evsel__open_cpu(struct evsel *evsel, struct perf_cpu_map *cpus,
struct perf_thread_map *threads) struct perf_thread_map *threads,
int start_cpu, int end_cpu)
{ {
int cpu, thread, nthreads; int cpu, thread, nthreads;
unsigned long flags = PERF_FLAG_FD_CLOEXEC; unsigned long flags = PERF_FLAG_FD_CLOEXEC;
...@@ -1665,7 +1677,7 @@ int evsel__open(struct evsel *evsel, struct perf_cpu_map *cpus, ...@@ -1665,7 +1677,7 @@ int evsel__open(struct evsel *evsel, struct perf_cpu_map *cpus,
display_attr(&evsel->core.attr); display_attr(&evsel->core.attr);
for (cpu = 0; cpu < cpus->nr; cpu++) { for (cpu = start_cpu; cpu < end_cpu; cpu++) {
for (thread = 0; thread < nthreads; thread++) { for (thread = 0; thread < nthreads; thread++) {
int fd, group_fd; int fd, group_fd;
...@@ -1843,6 +1855,12 @@ int evsel__open(struct evsel *evsel, struct perf_cpu_map *cpus, ...@@ -1843,6 +1855,12 @@ int evsel__open(struct evsel *evsel, struct perf_cpu_map *cpus,
return err; return err;
} }
/*
 * Open @evsel over the whole cpu map: delegates to evsel__open_cpu() with
 * the index range [0, cpus->nr), or [0, 1) when @cpus is NULL.
 *
 * Returns whatever evsel__open_cpu() returns.
 */
int evsel__open(struct evsel *evsel, struct perf_cpu_map *cpus,
		struct perf_thread_map *threads)
{
	int end_cpu = 1;	/* a NULL map is treated as a single slot */

	if (cpus)
		end_cpu = cpus->nr;

	return evsel__open_cpu(evsel, cpus, threads, 0, end_cpu);
}
void evsel__close(struct evsel *evsel) void evsel__close(struct evsel *evsel)
{ {
perf_evsel__close(&evsel->core); perf_evsel__close(&evsel->core);
...@@ -1850,9 +1868,14 @@ void evsel__close(struct evsel *evsel) ...@@ -1850,9 +1868,14 @@ void evsel__close(struct evsel *evsel)
} }
int perf_evsel__open_per_cpu(struct evsel *evsel, int perf_evsel__open_per_cpu(struct evsel *evsel,
struct perf_cpu_map *cpus) struct perf_cpu_map *cpus,
int cpu)
{ {
return evsel__open(evsel, cpus, NULL); if (cpu == -1)
return evsel__open_cpu(evsel, cpus, NULL, 0,
cpus ? cpus->nr : 1);
return evsel__open_cpu(evsel, cpus, NULL, cpu, cpu + 1);
} }
int perf_evsel__open_per_thread(struct evsel *evsel, int perf_evsel__open_per_thread(struct evsel *evsel,
......
...@@ -86,6 +86,7 @@ struct evsel { ...@@ -86,6 +86,7 @@ struct evsel {
struct list_head config_terms; struct list_head config_terms;
struct bpf_object *bpf_obj; struct bpf_object *bpf_obj;
int bpf_fd; int bpf_fd;
int err;
bool auto_merge_stats; bool auto_merge_stats;
bool merged_stat; bool merged_stat;
const char * metric_expr; const char * metric_expr;
...@@ -94,7 +95,10 @@ struct evsel { ...@@ -94,7 +95,10 @@ struct evsel {
struct evsel *metric_leader; struct evsel *metric_leader;
bool collect_stat; bool collect_stat;
bool weak_group; bool weak_group;
bool reset_group;
bool errored;
bool percore; bool percore;
int cpu_iter;
const char *pmu_name; const char *pmu_name;
struct { struct {
perf_evsel__sb_cb_t *cb; perf_evsel__sb_cb_t *cb;
...@@ -218,11 +222,14 @@ int perf_evsel__set_filter(struct evsel *evsel, const char *filter); ...@@ -218,11 +222,14 @@ int perf_evsel__set_filter(struct evsel *evsel, const char *filter);
int perf_evsel__append_tp_filter(struct evsel *evsel, const char *filter); int perf_evsel__append_tp_filter(struct evsel *evsel, const char *filter);
int perf_evsel__append_addr_filter(struct evsel *evsel, int perf_evsel__append_addr_filter(struct evsel *evsel,
const char *filter); const char *filter);
int evsel__enable_cpu(struct evsel *evsel, int cpu);
int evsel__enable(struct evsel *evsel); int evsel__enable(struct evsel *evsel);
int evsel__disable(struct evsel *evsel); int evsel__disable(struct evsel *evsel);
int evsel__disable_cpu(struct evsel *evsel, int cpu);
int perf_evsel__open_per_cpu(struct evsel *evsel, int perf_evsel__open_per_cpu(struct evsel *evsel,
struct perf_cpu_map *cpus); struct perf_cpu_map *cpus,
int cpu);
int perf_evsel__open_per_thread(struct evsel *evsel, int perf_evsel__open_per_thread(struct evsel *evsel,
struct perf_thread_map *threads); struct perf_thread_map *threads);
int evsel__open(struct evsel *evsel, struct perf_cpu_map *cpus, int evsel__open(struct evsel *evsel, struct perf_cpu_map *cpus,
......
...@@ -8,15 +8,12 @@ ...@@ -8,15 +8,12 @@
*/ */
#include <sys/types.h> #include <sys/types.h>
#include <stdio.h>
#include <getopt.h>
#include <stddef.h> #include <stddef.h>
#include <libelf.h> #include <libelf.h>
#include <string.h> #include <string.h>
#include <stdlib.h> #include <stdlib.h>
#include <unistd.h> #include <unistd.h>
#include <inttypes.h> #include <inttypes.h>
#include <limits.h>
#include <fcntl.h> #include <fcntl.h>
#include <err.h> #include <err.h>
#ifdef HAVE_DWARF_SUPPORT #ifdef HAVE_DWARF_SUPPORT
...@@ -31,8 +28,6 @@ ...@@ -31,8 +28,6 @@
#define NT_GNU_BUILD_ID 3 #define NT_GNU_BUILD_ID 3
#endif #endif
#define JVMTI
#define BUILD_ID_URANDOM /* different uuid for each run */ #define BUILD_ID_URANDOM /* different uuid for each run */
#ifdef HAVE_LIBCRYPTO #ifdef HAVE_LIBCRYPTO
...@@ -511,44 +506,3 @@ jit_write_elf(int fd, uint64_t load_addr, const char *sym, ...@@ -511,44 +506,3 @@ jit_write_elf(int fd, uint64_t load_addr, const char *sym,
return retval; return retval;
} }
#ifndef JVMTI
static unsigned char x86_code[] = {
0xBB, 0x2A, 0x00, 0x00, 0x00, /* movl $42, %ebx */
0xB8, 0x01, 0x00, 0x00, 0x00, /* movl $1, %eax */
0xCD, 0x80 /* int $0x80 */
};
static struct options options;
int main(int argc, char **argv)
{
int c, fd, ret;
while ((c = getopt(argc, argv, "o:h")) != -1) {
switch (c) {
case 'o':
options.output = optarg;
break;
case 'h':
printf("Usage: genelf -o output_file [-h]\n");
return 0;
default:
errx(1, "unknown option");
}
}
fd = open(options.output, O_CREAT|O_TRUNC|O_RDWR, 0666);
if (fd == -1)
err(1, "cannot create file %s", options.output);
ret = jit_write_elf(fd, "main", x86_code, sizeof(x86_code));
close(fd);
if (ret != 0)
unlink(options.output);
return ret;
}
#endif
...@@ -850,7 +850,7 @@ int __weak strcmp_cpuid_str(const char *mapcpuid, const char *cpuid) ...@@ -850,7 +850,7 @@ int __weak strcmp_cpuid_str(const char *mapcpuid, const char *cpuid)
*/ */
int __weak get_cpuid(char *buffer __maybe_unused, size_t sz __maybe_unused) int __weak get_cpuid(char *buffer __maybe_unused, size_t sz __maybe_unused)
{ {
return -1; return ENOSYS; /* Not implemented */
} }
static int write_cpuid(struct feat_fd *ff, static int write_cpuid(struct feat_fd *ff,
...@@ -1089,21 +1089,18 @@ static void cpu_cache_level__fprintf(FILE *out, struct cpu_cache_level *c) ...@@ -1089,21 +1089,18 @@ static void cpu_cache_level__fprintf(FILE *out, struct cpu_cache_level *c)
fprintf(out, "L%d %-15s %8s [%s]\n", c->level, c->type, c->size, c->map); fprintf(out, "L%d %-15s %8s [%s]\n", c->level, c->type, c->size, c->map);
} }
static int build_caches(struct cpu_cache_level caches[], u32 size, u32 *cntp) #define MAX_CACHE_LVL 4
static int build_caches(struct cpu_cache_level caches[], u32 *cntp)
{ {
u32 i, cnt = 0; u32 i, cnt = 0;
long ncpus;
u32 nr, cpu; u32 nr, cpu;
u16 level; u16 level;
ncpus = sysconf(_SC_NPROCESSORS_CONF); nr = cpu__max_cpu();
if (ncpus < 0)
return -1;
nr = (u32)(ncpus & UINT_MAX);
for (cpu = 0; cpu < nr; cpu++) { for (cpu = 0; cpu < nr; cpu++) {
for (level = 0; level < 10; level++) { for (level = 0; level < MAX_CACHE_LVL; level++) {
struct cpu_cache_level c; struct cpu_cache_level c;
int err; int err;
...@@ -1123,18 +1120,12 @@ static int build_caches(struct cpu_cache_level caches[], u32 size, u32 *cntp) ...@@ -1123,18 +1120,12 @@ static int build_caches(struct cpu_cache_level caches[], u32 size, u32 *cntp)
caches[cnt++] = c; caches[cnt++] = c;
else else
cpu_cache_level__free(&c); cpu_cache_level__free(&c);
if (WARN_ONCE(cnt == size, "way too many cpu caches.."))
goto out;
} }
} }
out:
*cntp = cnt; *cntp = cnt;
return 0; return 0;
} }
#define MAX_CACHE_LVL 4
static int write_cache(struct feat_fd *ff, static int write_cache(struct feat_fd *ff,
struct evlist *evlist __maybe_unused) struct evlist *evlist __maybe_unused)
{ {
...@@ -1143,7 +1134,7 @@ static int write_cache(struct feat_fd *ff, ...@@ -1143,7 +1134,7 @@ static int write_cache(struct feat_fd *ff,
u32 cnt = 0, i, version = 1; u32 cnt = 0, i, version = 1;
int ret; int ret;
ret = build_caches(caches, max_caches, &cnt); ret = build_caches(caches, &cnt);
if (ret) if (ret)
goto out; goto out;
......
...@@ -5,10 +5,93 @@ ...@@ -5,10 +5,93 @@
/* linkage.h ... for including arch/x86/lib/memcpy_64.S */ /* linkage.h ... for including arch/x86/lib/memcpy_64.S */
#define ENTRY(name) \ /* Some toolchains use other characters (e.g. '`') to mark new line in macro */
.globl name; \ #ifndef ASM_NL
#define ASM_NL ;
#endif
#ifndef __ALIGN
#define __ALIGN .align 4,0x90
#define __ALIGN_STR ".align 4,0x90"
#endif
/* SYM_T_FUNC -- type used by assembler to mark functions */
#ifndef SYM_T_FUNC
#define SYM_T_FUNC STT_FUNC
#endif
/* SYM_A_* -- align the symbol? */
#define SYM_A_ALIGN ALIGN
/* SYM_L_* -- linkage of symbols */
#define SYM_L_GLOBAL(name) .globl name
#define SYM_L_LOCAL(name) /* nothing */
#define ALIGN __ALIGN
/* === generic annotations === */
/* SYM_ENTRY -- use only if you have to for non-paired symbols */
#ifndef SYM_ENTRY
#define SYM_ENTRY(name, linkage, align...) \
linkage(name) ASM_NL \
align ASM_NL \
name: name:
#endif
/* SYM_START -- use only if you have to */
#ifndef SYM_START
#define SYM_START(name, linkage, align...) \
SYM_ENTRY(name, linkage, align)
#endif
/* SYM_END -- use only if you have to */
#ifndef SYM_END
#define SYM_END(name, sym_type) \
.type name sym_type ASM_NL \
.size name, .-name
#endif
/*
* SYM_FUNC_START_ALIAS -- use where there are two global names for one
* function
*/
#ifndef SYM_FUNC_START_ALIAS
#define SYM_FUNC_START_ALIAS(name) \
SYM_START(name, SYM_L_GLOBAL, SYM_A_ALIGN)
#endif
/* SYM_FUNC_START -- use for global functions */
#ifndef SYM_FUNC_START
/*
* The same as SYM_FUNC_START_ALIAS, but we will need to distinguish these two
* later.
*/
#define SYM_FUNC_START(name) \
SYM_START(name, SYM_L_GLOBAL, SYM_A_ALIGN)
#endif
/* SYM_FUNC_START_LOCAL -- use for local functions */
#ifndef SYM_FUNC_START_LOCAL
/* the same as SYM_FUNC_START_LOCAL_ALIAS, see comment near SYM_FUNC_START */
#define SYM_FUNC_START_LOCAL(name) \
SYM_START(name, SYM_L_LOCAL, SYM_A_ALIGN)
#endif
/* SYM_FUNC_END_ALIAS -- the end of LOCAL_ALIASed or ALIASed function */
#ifndef SYM_FUNC_END_ALIAS
#define SYM_FUNC_END_ALIAS(name) \
SYM_END(name, SYM_T_FUNC)
#endif
#define ENDPROC(name) /*
* SYM_FUNC_END -- the end of SYM_FUNC_START_LOCAL, SYM_FUNC_START,
* SYM_FUNC_START_WEAK, ...
*/
#ifndef SYM_FUNC_END
/* the same as SYM_FUNC_END_ALIAS, see comment near SYM_FUNC_START */
#define SYM_FUNC_END(name) \
SYM_END(name, SYM_T_FUNC)
#endif
#endif /* PERF_LINUX_LINKAGE_H_ */ #endif /* PERF_LINUX_LINKAGE_H_ */
...@@ -2446,6 +2446,7 @@ static int append_inlines(struct callchain_cursor *cursor, struct map_symbol *ms ...@@ -2446,6 +2446,7 @@ static int append_inlines(struct callchain_cursor *cursor, struct map_symbol *ms
list_for_each_entry(ilist, &inline_node->val, list) { list_for_each_entry(ilist, &inline_node->val, list) {
struct map_symbol ilist_ms = { struct map_symbol ilist_ms = {
.maps = ms->maps,
.map = map, .map = map,
.sym = ilist->symbol, .sym = ilist->symbol,
}; };
......
...@@ -103,8 +103,11 @@ static struct evsel *find_evsel_group(struct evlist *perf_evlist, ...@@ -103,8 +103,11 @@ static struct evsel *find_evsel_group(struct evlist *perf_evlist,
if (!strcmp(ev->name, ids[i])) { if (!strcmp(ev->name, ids[i])) {
if (!metric_events[i]) if (!metric_events[i])
metric_events[i] = ev; metric_events[i] = ev;
i++;
if (i == idnum)
break;
} else { } else {
if (++i == idnum) { if (i + 1 == idnum) {
/* Discard the whole match and start again */ /* Discard the whole match and start again */
i = 0; i = 0;
memset(metric_events, 0, memset(metric_events, 0,
...@@ -124,7 +127,7 @@ static struct evsel *find_evsel_group(struct evlist *perf_evlist, ...@@ -124,7 +127,7 @@ static struct evsel *find_evsel_group(struct evlist *perf_evlist,
} }
} }
if (i != idnum - 1) { if (i != idnum) {
/* Not whole match */ /* Not whole match */
return NULL; return NULL;
} }
......
...@@ -2681,12 +2681,12 @@ static int setup_sort_list(struct perf_hpp_list *list, char *str, ...@@ -2681,12 +2681,12 @@ static int setup_sort_list(struct perf_hpp_list *list, char *str,
ret = sort_dimension__add(list, tok, evlist, level); ret = sort_dimension__add(list, tok, evlist, level);
if (ret == -EINVAL) { if (ret == -EINVAL) {
if (!cacheline_size() && !strncasecmp(tok, "dcacheline", strlen(tok))) if (!cacheline_size() && !strncasecmp(tok, "dcacheline", strlen(tok)))
pr_err("The \"dcacheline\" --sort key needs to know the cacheline size and it couldn't be determined on this system"); ui__error("The \"dcacheline\" --sort key needs to know the cacheline size and it couldn't be determined on this system");
else else
pr_err("Invalid --sort key: `%s'", tok); ui__error("Invalid --sort key: `%s'", tok);
break; break;
} else if (ret == -ESRCH) { } else if (ret == -ESRCH) {
pr_err("Unknown --sort key: `%s'", tok); ui__error("Unknown --sort key: `%s'", tok);
break; break;
} }
} }
...@@ -2743,7 +2743,7 @@ static int setup_sort_order(struct evlist *evlist) ...@@ -2743,7 +2743,7 @@ static int setup_sort_order(struct evlist *evlist)
return 0; return 0;
if (sort_order[1] == '\0') { if (sort_order[1] == '\0') {
pr_err("Invalid --sort key: `+'"); ui__error("Invalid --sort key: `+'");
return -EINVAL; return -EINVAL;
} }
...@@ -2959,6 +2959,9 @@ int output_field_add(struct perf_hpp_list *list, char *tok) ...@@ -2959,6 +2959,9 @@ int output_field_add(struct perf_hpp_list *list, char *tok)
if (strncasecmp(tok, sd->name, strlen(tok))) if (strncasecmp(tok, sd->name, strlen(tok)))
continue; continue;
if (sort__mode != SORT_MODE__MEMORY)
return -EINVAL;
return __sort_dimension__add_output(list, sd); return __sort_dimension__add_output(list, sd);
} }
...@@ -2968,6 +2971,9 @@ int output_field_add(struct perf_hpp_list *list, char *tok) ...@@ -2968,6 +2971,9 @@ int output_field_add(struct perf_hpp_list *list, char *tok)
if (strncasecmp(tok, sd->name, strlen(tok))) if (strncasecmp(tok, sd->name, strlen(tok)))
continue; continue;
if (sort__mode != SORT_MODE__BRANCH)
return -EINVAL;
return __sort_dimension__add_output(list, sd); return __sort_dimension__add_output(list, sd);
} }
...@@ -3034,7 +3040,7 @@ static int __setup_output_field(void) ...@@ -3034,7 +3040,7 @@ static int __setup_output_field(void)
strp++; strp++;
if (!strlen(strp)) { if (!strlen(strp)) {
pr_err("Invalid --fields key: `+'"); ui__error("Invalid --fields key: `+'");
goto out; goto out;
} }
......
...@@ -464,7 +464,8 @@ size_t perf_event__fprintf_stat_config(union perf_event *event, FILE *fp) ...@@ -464,7 +464,8 @@ size_t perf_event__fprintf_stat_config(union perf_event *event, FILE *fp)
int create_perf_stat_counter(struct evsel *evsel, int create_perf_stat_counter(struct evsel *evsel,
struct perf_stat_config *config, struct perf_stat_config *config,
struct target *target) struct target *target,
int cpu)
{ {
struct perf_event_attr *attr = &evsel->core.attr; struct perf_event_attr *attr = &evsel->core.attr;
struct evsel *leader = evsel->leader; struct evsel *leader = evsel->leader;
...@@ -518,7 +519,7 @@ int create_perf_stat_counter(struct evsel *evsel, ...@@ -518,7 +519,7 @@ int create_perf_stat_counter(struct evsel *evsel,
} }
if (target__has_cpu(target) && !target__has_per_thread(target)) if (target__has_cpu(target) && !target__has_per_thread(target))
return perf_evsel__open_per_cpu(evsel, evsel__cpus(evsel)); return perf_evsel__open_per_cpu(evsel, evsel__cpus(evsel), cpu);
return perf_evsel__open_per_thread(evsel, evsel->core.threads); return perf_evsel__open_per_thread(evsel, evsel->core.threads);
} }
...@@ -214,7 +214,8 @@ size_t perf_event__fprintf_stat_config(union perf_event *event, FILE *fp); ...@@ -214,7 +214,8 @@ size_t perf_event__fprintf_stat_config(union perf_event *event, FILE *fp);
int create_perf_stat_counter(struct evsel *evsel, int create_perf_stat_counter(struct evsel *evsel,
struct perf_stat_config *config, struct perf_stat_config *config,
struct target *target); struct target *target,
int cpu);
void void
perf_evlist__print_counters(struct evlist *evlist, perf_evlist__print_counters(struct evlist *evlist,
struct perf_stat_config *config, struct perf_stat_config *config,
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment