Commit ced47e30 authored by Song Liu, committed by Alexei Starovoitov

bpf: runqslower: Use task local storage

Replace hashtab with task local storage in runqslower. This improves the
performance of these BPF programs. The following table summarizes average
runtime of these programs, in nanoseconds:

                          task-local   hash-prealloc   hash-no-prealloc
handle__sched_wakeup             125             340               3124
handle__sched_wakeup_new        2812            1510               2998
handle__sched_switch             151             208                991

Note that task local storage gives better performance than hashtab for
handle__sched_wakeup and handle__sched_switch. On the other hand, for
handle__sched_wakeup_new, task local storage is slower than hashtab with
prealloc. This is because handle__sched_wakeup_new accesses the data for
the first time, so it has to allocate the data for task local storage.
Once the initial allocation is done, subsequent accesses, such as those in
handle__sched_wakeup, are much faster with task local storage. If we
disable hashtab prealloc, task local storage is much faster for all 3
functions.

Signed-off-by: Song Liu <songliubraving@fb.com>
Signed-off-by: Alexei Starovoitov <ast@kernel.org>
Acked-by: Andrii Nakryiko <andrii@kernel.org>
Link: https://lore.kernel.org/bpf/20210225234319.336131-7-songliubraving@fb.com
parent 4b0d2d41
...@@ -11,9 +11,9 @@ const volatile __u64 min_us = 0; ...@@ -11,9 +11,9 @@ const volatile __u64 min_us = 0;
const volatile pid_t targ_pid = 0; const volatile pid_t targ_pid = 0;
struct { struct {
__uint(type, BPF_MAP_TYPE_HASH); __uint(type, BPF_MAP_TYPE_TASK_STORAGE);
__uint(max_entries, 10240); __uint(map_flags, BPF_F_NO_PREALLOC);
__type(key, u32); __type(key, int);
__type(value, u64); __type(value, u64);
} start SEC(".maps"); } start SEC(".maps");
...@@ -25,15 +25,20 @@ struct { ...@@ -25,15 +25,20 @@ struct {
/* record enqueue timestamp */ /* record enqueue timestamp */
__always_inline __always_inline
static int trace_enqueue(u32 tgid, u32 pid) static int trace_enqueue(struct task_struct *t)
{ {
u64 ts; u32 pid = t->pid;
u64 *ptr;
if (!pid || (targ_pid && targ_pid != pid)) if (!pid || (targ_pid && targ_pid != pid))
return 0; return 0;
ts = bpf_ktime_get_ns(); ptr = bpf_task_storage_get(&start, t, 0,
bpf_map_update_elem(&start, &pid, &ts, 0); BPF_LOCAL_STORAGE_GET_F_CREATE);
if (!ptr)
return 0;
*ptr = bpf_ktime_get_ns();
return 0; return 0;
} }
...@@ -43,7 +48,7 @@ int handle__sched_wakeup(u64 *ctx) ...@@ -43,7 +48,7 @@ int handle__sched_wakeup(u64 *ctx)
/* TP_PROTO(struct task_struct *p) */ /* TP_PROTO(struct task_struct *p) */
struct task_struct *p = (void *)ctx[0]; struct task_struct *p = (void *)ctx[0];
return trace_enqueue(p->tgid, p->pid); return trace_enqueue(p);
} }
SEC("tp_btf/sched_wakeup_new") SEC("tp_btf/sched_wakeup_new")
...@@ -52,7 +57,7 @@ int handle__sched_wakeup_new(u64 *ctx) ...@@ -52,7 +57,7 @@ int handle__sched_wakeup_new(u64 *ctx)
/* TP_PROTO(struct task_struct *p) */ /* TP_PROTO(struct task_struct *p) */
struct task_struct *p = (void *)ctx[0]; struct task_struct *p = (void *)ctx[0];
return trace_enqueue(p->tgid, p->pid); return trace_enqueue(p);
} }
SEC("tp_btf/sched_switch") SEC("tp_btf/sched_switch")
...@@ -70,12 +75,16 @@ int handle__sched_switch(u64 *ctx) ...@@ -70,12 +75,16 @@ int handle__sched_switch(u64 *ctx)
/* ivcsw: treat like an enqueue event and store timestamp */ /* ivcsw: treat like an enqueue event and store timestamp */
if (prev->state == TASK_RUNNING) if (prev->state == TASK_RUNNING)
trace_enqueue(prev->tgid, prev->pid); trace_enqueue(prev);
pid = next->pid; pid = next->pid;
/* For pid mismatch, save a bpf_task_storage_get */
if (!pid || (targ_pid && targ_pid != pid))
return 0;
/* fetch timestamp and calculate delta */ /* fetch timestamp and calculate delta */
tsp = bpf_map_lookup_elem(&start, &pid); tsp = bpf_task_storage_get(&start, next, 0, 0);
if (!tsp) if (!tsp)
return 0; /* missed enqueue */ return 0; /* missed enqueue */
...@@ -91,7 +100,7 @@ int handle__sched_switch(u64 *ctx) ...@@ -91,7 +100,7 @@ int handle__sched_switch(u64 *ctx)
bpf_perf_event_output(ctx, &events, BPF_F_CURRENT_CPU, bpf_perf_event_output(ctx, &events, BPF_F_CURRENT_CPU,
&event, sizeof(event)); &event, sizeof(event));
bpf_map_delete_elem(&start, &pid); bpf_task_storage_delete(&start, next);
return 0; return 0;
} }
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment