Commit 26c923ab authored by Linus Torvalds's avatar Linus Torvalds

Merge branch 'perf-urgent-for-linus' of git://git.kernel.org/pub/scm/linux/kernel/git/tip/tip

Pull perf fixes from Ingo Molnar:
 "Some tooling fixes plus three kernel fixes: a memory leak fix, a
  statistics fix and a crash fix"

* 'perf-urgent-for-linus' of git://git.kernel.org/pub/scm/linux/kernel/git/tip/tip:
  perf/x86/intel/uncore: Fix memory leaks on allocation failures
  perf/core: Fix cgroup time when scheduling descendants
  perf/core: Avoid freeing static PMU contexts when PMU is unregistered
  tools include uapi bpf.h: Sync kernel ABI header with tooling header
  perf pmu: Unbreak perf record for arm/arm64 with events with explicit PMU
  perf script: Add missing separator for "-F ip,brstack" (and brstackoff)
  perf callchain: Compare dsos (as well) for CCKEY_FUNCTION
parents 60a6ca6c 47a74bdc
...@@ -822,7 +822,7 @@ static int __init uncore_type_init(struct intel_uncore_type *type, bool setid) ...@@ -822,7 +822,7 @@ static int __init uncore_type_init(struct intel_uncore_type *type, bool setid)
pmus[i].type = type; pmus[i].type = type;
pmus[i].boxes = kzalloc(size, GFP_KERNEL); pmus[i].boxes = kzalloc(size, GFP_KERNEL);
if (!pmus[i].boxes) if (!pmus[i].boxes)
return -ENOMEM; goto err;
} }
type->pmus = pmus; type->pmus = pmus;
...@@ -836,7 +836,7 @@ static int __init uncore_type_init(struct intel_uncore_type *type, bool setid) ...@@ -836,7 +836,7 @@ static int __init uncore_type_init(struct intel_uncore_type *type, bool setid)
attr_group = kzalloc(sizeof(struct attribute *) * (i + 1) + attr_group = kzalloc(sizeof(struct attribute *) * (i + 1) +
sizeof(*attr_group), GFP_KERNEL); sizeof(*attr_group), GFP_KERNEL);
if (!attr_group) if (!attr_group)
return -ENOMEM; goto err;
attrs = (struct attribute **)(attr_group + 1); attrs = (struct attribute **)(attr_group + 1);
attr_group->name = "events"; attr_group->name = "events";
...@@ -849,7 +849,15 @@ static int __init uncore_type_init(struct intel_uncore_type *type, bool setid) ...@@ -849,7 +849,15 @@ static int __init uncore_type_init(struct intel_uncore_type *type, bool setid)
} }
type->pmu_group = &uncore_pmu_attr_group; type->pmu_group = &uncore_pmu_attr_group;
return 0; return 0;
err:
for (i = 0; i < type->num_boxes; i++)
kfree(pmus[i].boxes);
kfree(pmus);
return -ENOMEM;
} }
static int __init static int __init
......
...@@ -662,7 +662,7 @@ static inline void update_cgrp_time_from_event(struct perf_event *event) ...@@ -662,7 +662,7 @@ static inline void update_cgrp_time_from_event(struct perf_event *event)
/* /*
* Do not update time when cgroup is not active * Do not update time when cgroup is not active
*/ */
if (cgrp == event->cgrp) if (cgroup_is_descendant(cgrp->css.cgroup, event->cgrp->css.cgroup))
__update_cgrp_time(event->cgrp); __update_cgrp_time(event->cgrp);
} }
...@@ -8955,6 +8955,14 @@ static struct perf_cpu_context __percpu *find_pmu_context(int ctxn) ...@@ -8955,6 +8955,14 @@ static struct perf_cpu_context __percpu *find_pmu_context(int ctxn)
static void free_pmu_context(struct pmu *pmu) static void free_pmu_context(struct pmu *pmu)
{ {
/*
* Static contexts such as perf_sw_context have a global lifetime
* and may be shared between different PMUs. Avoid freeing them
* when a single PMU is going away.
*/
if (pmu->task_ctx_nr > perf_invalid_context)
return;
mutex_lock(&pmus_lock); mutex_lock(&pmus_lock);
free_percpu(pmu->pmu_cpu_context); free_percpu(pmu->pmu_cpu_context);
mutex_unlock(&pmus_lock); mutex_unlock(&pmus_lock);
......
...@@ -312,7 +312,7 @@ union bpf_attr { ...@@ -312,7 +312,7 @@ union bpf_attr {
* jump into another BPF program * jump into another BPF program
* @ctx: context pointer passed to next program * @ctx: context pointer passed to next program
* @prog_array_map: pointer to map which type is BPF_MAP_TYPE_PROG_ARRAY * @prog_array_map: pointer to map which type is BPF_MAP_TYPE_PROG_ARRAY
* @index: index inside array that selects specific program to run * @index: 32-bit index inside array that selects specific program to run
* Return: 0 on success or negative error * Return: 0 on success or negative error
* *
* int bpf_clone_redirect(skb, ifindex, flags) * int bpf_clone_redirect(skb, ifindex, flags)
......
...@@ -586,7 +586,7 @@ static void print_sample_brstack(struct perf_sample *sample, ...@@ -586,7 +586,7 @@ static void print_sample_brstack(struct perf_sample *sample,
thread__find_addr_map(thread, sample->cpumode, MAP__FUNCTION, to, &alt); thread__find_addr_map(thread, sample->cpumode, MAP__FUNCTION, to, &alt);
} }
printf("0x%"PRIx64, from); printf(" 0x%"PRIx64, from);
if (PRINT_FIELD(DSO)) { if (PRINT_FIELD(DSO)) {
printf("("); printf("(");
map__fprintf_dsoname(alf.map, stdout); map__fprintf_dsoname(alf.map, stdout);
...@@ -681,7 +681,7 @@ static void print_sample_brstackoff(struct perf_sample *sample, ...@@ -681,7 +681,7 @@ static void print_sample_brstackoff(struct perf_sample *sample,
if (alt.map && !alt.map->dso->adjust_symbols) if (alt.map && !alt.map->dso->adjust_symbols)
to = map__map_ip(alt.map, to); to = map__map_ip(alt.map, to);
printf("0x%"PRIx64, from); printf(" 0x%"PRIx64, from);
if (PRINT_FIELD(DSO)) { if (PRINT_FIELD(DSO)) {
printf("("); printf("(");
map__fprintf_dsoname(alf.map, stdout); map__fprintf_dsoname(alf.map, stdout);
......
...@@ -685,6 +685,8 @@ static enum match_result match_chain(struct callchain_cursor_node *node, ...@@ -685,6 +685,8 @@ static enum match_result match_chain(struct callchain_cursor_node *node,
{ {
struct symbol *sym = node->sym; struct symbol *sym = node->sym;
u64 left, right; u64 left, right;
struct dso *left_dso = NULL;
struct dso *right_dso = NULL;
if (callchain_param.key == CCKEY_SRCLINE) { if (callchain_param.key == CCKEY_SRCLINE) {
enum match_result match = match_chain_srcline(node, cnode); enum match_result match = match_chain_srcline(node, cnode);
...@@ -696,12 +698,14 @@ static enum match_result match_chain(struct callchain_cursor_node *node, ...@@ -696,12 +698,14 @@ static enum match_result match_chain(struct callchain_cursor_node *node,
if (cnode->ms.sym && sym && callchain_param.key == CCKEY_FUNCTION) { if (cnode->ms.sym && sym && callchain_param.key == CCKEY_FUNCTION) {
left = cnode->ms.sym->start; left = cnode->ms.sym->start;
right = sym->start; right = sym->start;
left_dso = cnode->ms.map->dso;
right_dso = node->map->dso;
} else { } else {
left = cnode->ip; left = cnode->ip;
right = node->ip; right = node->ip;
} }
if (left == right) { if (left == right && left_dso == right_dso) {
if (node->branch) { if (node->branch) {
cnode->branch_count++; cnode->branch_count++;
......
...@@ -309,10 +309,11 @@ static char *get_config_name(struct list_head *head_terms) ...@@ -309,10 +309,11 @@ static char *get_config_name(struct list_head *head_terms)
static struct perf_evsel * static struct perf_evsel *
__add_event(struct list_head *list, int *idx, __add_event(struct list_head *list, int *idx,
struct perf_event_attr *attr, struct perf_event_attr *attr,
char *name, struct cpu_map *cpus, char *name, struct perf_pmu *pmu,
struct list_head *config_terms, bool auto_merge_stats) struct list_head *config_terms, bool auto_merge_stats)
{ {
struct perf_evsel *evsel; struct perf_evsel *evsel;
struct cpu_map *cpus = pmu ? pmu->cpus : NULL;
event_attr_init(attr); event_attr_init(attr);
...@@ -323,7 +324,7 @@ __add_event(struct list_head *list, int *idx, ...@@ -323,7 +324,7 @@ __add_event(struct list_head *list, int *idx,
(*idx)++; (*idx)++;
evsel->cpus = cpu_map__get(cpus); evsel->cpus = cpu_map__get(cpus);
evsel->own_cpus = cpu_map__get(cpus); evsel->own_cpus = cpu_map__get(cpus);
evsel->system_wide = !!cpus; evsel->system_wide = pmu ? pmu->is_uncore : false;
evsel->auto_merge_stats = auto_merge_stats; evsel->auto_merge_stats = auto_merge_stats;
if (name) if (name)
...@@ -1233,7 +1234,7 @@ static int __parse_events_add_pmu(struct parse_events_state *parse_state, ...@@ -1233,7 +1234,7 @@ static int __parse_events_add_pmu(struct parse_events_state *parse_state,
if (!head_config) { if (!head_config) {
attr.type = pmu->type; attr.type = pmu->type;
evsel = __add_event(list, &parse_state->idx, &attr, NULL, pmu->cpus, NULL, auto_merge_stats); evsel = __add_event(list, &parse_state->idx, &attr, NULL, pmu, NULL, auto_merge_stats);
return evsel ? 0 : -ENOMEM; return evsel ? 0 : -ENOMEM;
} }
...@@ -1254,7 +1255,7 @@ static int __parse_events_add_pmu(struct parse_events_state *parse_state, ...@@ -1254,7 +1255,7 @@ static int __parse_events_add_pmu(struct parse_events_state *parse_state,
return -EINVAL; return -EINVAL;
evsel = __add_event(list, &parse_state->idx, &attr, evsel = __add_event(list, &parse_state->idx, &attr,
get_config_name(head_config), pmu->cpus, get_config_name(head_config), pmu,
&config_terms, auto_merge_stats); &config_terms, auto_merge_stats);
if (evsel) { if (evsel) {
evsel->unit = info.unit; evsel->unit = info.unit;
......
...@@ -470,17 +470,36 @@ static void pmu_read_sysfs(void) ...@@ -470,17 +470,36 @@ static void pmu_read_sysfs(void)
closedir(dir); closedir(dir);
} }
static struct cpu_map *__pmu_cpumask(const char *path)
{
FILE *file;
struct cpu_map *cpus;
file = fopen(path, "r");
if (!file)
return NULL;
cpus = cpu_map__read(file);
fclose(file);
return cpus;
}
/*
* Uncore PMUs have a "cpumask" file under sysfs. CPU PMUs (e.g. on arm/arm64)
* may have a "cpus" file.
*/
#define CPUS_TEMPLATE_UNCORE "%s/bus/event_source/devices/%s/cpumask"
#define CPUS_TEMPLATE_CPU "%s/bus/event_source/devices/%s/cpus"
static struct cpu_map *pmu_cpumask(const char *name) static struct cpu_map *pmu_cpumask(const char *name)
{ {
struct stat st;
char path[PATH_MAX]; char path[PATH_MAX];
FILE *file;
struct cpu_map *cpus; struct cpu_map *cpus;
const char *sysfs = sysfs__mountpoint(); const char *sysfs = sysfs__mountpoint();
const char *templates[] = { const char *templates[] = {
"%s/bus/event_source/devices/%s/cpumask", CPUS_TEMPLATE_UNCORE,
"%s/bus/event_source/devices/%s/cpus", CPUS_TEMPLATE_CPU,
NULL NULL
}; };
const char **template; const char **template;
...@@ -489,20 +508,25 @@ static struct cpu_map *pmu_cpumask(const char *name) ...@@ -489,20 +508,25 @@ static struct cpu_map *pmu_cpumask(const char *name)
for (template = templates; *template; template++) { for (template = templates; *template; template++) {
snprintf(path, PATH_MAX, *template, sysfs, name); snprintf(path, PATH_MAX, *template, sysfs, name);
if (stat(path, &st) == 0) cpus = __pmu_cpumask(path);
break; if (cpus)
return cpus;
} }
if (!*template) return NULL;
return NULL; }
file = fopen(path, "r"); static bool pmu_is_uncore(const char *name)
if (!file) {
return NULL; char path[PATH_MAX];
struct cpu_map *cpus;
const char *sysfs = sysfs__mountpoint();
cpus = cpu_map__read(file); snprintf(path, PATH_MAX, CPUS_TEMPLATE_UNCORE, sysfs, name);
fclose(file); cpus = __pmu_cpumask(path);
return cpus; cpu_map__put(cpus);
return !!cpus;
} }
/* /*
...@@ -617,6 +641,8 @@ static struct perf_pmu *pmu_lookup(const char *name) ...@@ -617,6 +641,8 @@ static struct perf_pmu *pmu_lookup(const char *name)
pmu->cpus = pmu_cpumask(name); pmu->cpus = pmu_cpumask(name);
pmu->is_uncore = pmu_is_uncore(name);
INIT_LIST_HEAD(&pmu->format); INIT_LIST_HEAD(&pmu->format);
INIT_LIST_HEAD(&pmu->aliases); INIT_LIST_HEAD(&pmu->aliases);
list_splice(&format, &pmu->format); list_splice(&format, &pmu->format);
......
...@@ -22,6 +22,7 @@ struct perf_pmu { ...@@ -22,6 +22,7 @@ struct perf_pmu {
char *name; char *name;
__u32 type; __u32 type;
bool selectable; bool selectable;
bool is_uncore;
struct perf_event_attr *default_config; struct perf_event_attr *default_config;
struct cpu_map *cpus; struct cpu_map *cpus;
struct list_head format; /* HEAD struct perf_pmu_format -> list */ struct list_head format; /* HEAD struct perf_pmu_format -> list */
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment