Commit a5499b37, authored by Adrian Hunter, committed by Arnaldo Carvalho de Melo

perf tools: Ensure thread-stack is flushed

The thread-stack represents a thread's current stack.  When a thread
exits there can still be many functions on the stack e.g. exit() can be
called many levels deep, so all the callers will never return.  To get
that information output, the thread-stack must be flushed.

Previously it was assumed the thread-stack would be flushed when the
struct thread was deleted.  With thread ref-counting it is no longer
clear when that will be, if ever. So instead explicitly flush all the
thread-stacks at the end of a session.
Signed-off-by: Adrian Hunter <adrian.hunter@intel.com>
Cc: Jiri Olsa <jolsa@redhat.com>
Link: http://lkml.kernel.org/r/1432906425-9911-3-git-send-email-adrian.hunter@intel.com
Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com>
parent 79928928
...@@ -1890,6 +1890,27 @@ int machine__for_each_thread(struct machine *machine, ...@@ -1890,6 +1890,27 @@ int machine__for_each_thread(struct machine *machine,
return rc; return rc;
} }
/*
 * Run machine__for_each_thread() with @fn and @priv on the host machine
 * first, then on each guest machine found by walking the machines->guests
 * rb-tree with rb_first()/rb_next().
 *
 * The walk stops at the first non-zero result, which is returned to the
 * caller unchanged. Returns 0 when every call returned 0.
 */
int machines__for_each_thread(struct machines *machines,
			      int (*fn)(struct thread *thread, void *p),
			      void *priv)
{
	struct rb_node *node;
	int ret;

	/* Host machine is handled before any guest is looked at. */
	ret = machine__for_each_thread(&machines->host, fn, priv);
	if (ret)
		return ret;

	node = rb_first(&machines->guests);
	while (node) {
		struct machine *guest = rb_entry(node, struct machine, rb_node);

		ret = machine__for_each_thread(guest, fn, priv);
		if (ret)
			break;

		node = rb_next(node);
	}

	return ret;
}
int __machine__synthesize_threads(struct machine *machine, struct perf_tool *tool, int __machine__synthesize_threads(struct machine *machine, struct perf_tool *tool,
struct target *target, struct thread_map *threads, struct target *target, struct thread_map *threads,
perf_event__handler_t process, bool data_mmap) perf_event__handler_t process, bool data_mmap)
......
...@@ -216,6 +216,9 @@ size_t machine__fprintf_vmlinux_path(struct machine *machine, FILE *fp); ...@@ -216,6 +216,9 @@ size_t machine__fprintf_vmlinux_path(struct machine *machine, FILE *fp);
int machine__for_each_thread(struct machine *machine, int machine__for_each_thread(struct machine *machine,
int (*fn)(struct thread *thread, void *p), int (*fn)(struct thread *thread, void *p),
void *priv); void *priv);
int machines__for_each_thread(struct machines *machines,
int (*fn)(struct thread *thread, void *p),
void *priv);
int __machine__synthesize_threads(struct machine *machine, struct perf_tool *tool, int __machine__synthesize_threads(struct machine *machine, struct perf_tool *tool,
struct target *target, struct thread_map *threads, struct target *target, struct thread_map *threads,
......
...@@ -16,6 +16,7 @@ ...@@ -16,6 +16,7 @@
#include "perf_regs.h" #include "perf_regs.h"
#include "asm/bug.h" #include "asm/bug.h"
#include "auxtrace.h" #include "auxtrace.h"
#include "thread-stack.h"
static int perf_session__deliver_event(struct perf_session *session, static int perf_session__deliver_event(struct perf_session *session,
union perf_event *event, union perf_event *event,
...@@ -1361,6 +1362,19 @@ static void perf_session__warn_about_errors(const struct perf_session *session) ...@@ -1361,6 +1362,19 @@ static void perf_session__warn_about_errors(const struct perf_session *session)
events_stats__auxtrace_error_warn(stats); events_stats__auxtrace_error_warn(stats);
} }
/*
 * Per-thread callback matching the fn signature taken by
 * machines__for_each_thread(): hands @thread to thread_stack__flush() and
 * returns its result. The private pointer is not used.
 */
static int perf_session__flush_thread_stack(struct thread *thread,
					    void *p __maybe_unused)
{
	int err;

	err = thread_stack__flush(thread);

	return err;
}
/*
 * Apply perf_session__flush_thread_stack() through
 * machines__for_each_thread() over session->machines. No private data is
 * passed to the callback. Returns whatever machines__for_each_thread()
 * returns.
 */
static int perf_session__flush_thread_stacks(struct perf_session *session)
{
	int err;

	err = machines__for_each_thread(&session->machines,
					perf_session__flush_thread_stack,
					NULL);
	return err;
}
volatile int session_done; volatile int session_done;
static int __perf_session__process_pipe_events(struct perf_session *session) static int __perf_session__process_pipe_events(struct perf_session *session)
...@@ -1450,6 +1464,9 @@ static int __perf_session__process_pipe_events(struct perf_session *session) ...@@ -1450,6 +1464,9 @@ static int __perf_session__process_pipe_events(struct perf_session *session)
if (err) if (err)
goto out_err; goto out_err;
err = auxtrace__flush_events(session, tool); err = auxtrace__flush_events(session, tool);
if (err)
goto out_err;
err = perf_session__flush_thread_stacks(session);
out_err: out_err:
free(buf); free(buf);
perf_session__warn_about_errors(session); perf_session__warn_about_errors(session);
...@@ -1600,6 +1617,9 @@ static int __perf_session__process_events(struct perf_session *session, ...@@ -1600,6 +1617,9 @@ static int __perf_session__process_events(struct perf_session *session,
if (err) if (err)
goto out_err; goto out_err;
err = auxtrace__flush_events(session, tool); err = auxtrace__flush_events(session, tool);
if (err)
goto out_err;
err = perf_session__flush_thread_stacks(session);
out_err: out_err:
ui_progress__finish(); ui_progress__finish();
perf_session__warn_about_errors(session); perf_session__warn_about_errors(session);
......
...@@ -219,7 +219,7 @@ static int thread_stack__call_return(struct thread *thread, ...@@ -219,7 +219,7 @@ static int thread_stack__call_return(struct thread *thread,
return crp->process(&cr, crp->data); return crp->process(&cr, crp->data);
} }
static int thread_stack__flush(struct thread *thread, struct thread_stack *ts) static int __thread_stack__flush(struct thread *thread, struct thread_stack *ts)
{ {
struct call_return_processor *crp = ts->crp; struct call_return_processor *crp = ts->crp;
int err; int err;
...@@ -242,6 +242,14 @@ static int thread_stack__flush(struct thread *thread, struct thread_stack *ts) ...@@ -242,6 +242,14 @@ static int thread_stack__flush(struct thread *thread, struct thread_stack *ts)
return 0; return 0;
} }
/*
 * Public entry point for flushing a thread's thread-stack.
 *
 * A thread with no thread-stack (thread->ts is NULL) has nothing to flush
 * and yields 0; otherwise the result of __thread_stack__flush() is returned.
 */
int thread_stack__flush(struct thread *thread)
{
	if (!thread->ts)
		return 0;

	return __thread_stack__flush(thread, thread->ts);
}
int thread_stack__event(struct thread *thread, u32 flags, u64 from_ip, int thread_stack__event(struct thread *thread, u32 flags, u64 from_ip,
u64 to_ip, u16 insn_len, u64 trace_nr) u64 to_ip, u16 insn_len, u64 trace_nr)
{ {
...@@ -264,7 +272,7 @@ int thread_stack__event(struct thread *thread, u32 flags, u64 from_ip, ...@@ -264,7 +272,7 @@ int thread_stack__event(struct thread *thread, u32 flags, u64 from_ip,
*/ */
if (trace_nr != thread->ts->trace_nr) { if (trace_nr != thread->ts->trace_nr) {
if (thread->ts->trace_nr) if (thread->ts->trace_nr)
thread_stack__flush(thread, thread->ts); __thread_stack__flush(thread, thread->ts);
thread->ts->trace_nr = trace_nr; thread->ts->trace_nr = trace_nr;
} }
...@@ -297,7 +305,7 @@ void thread_stack__set_trace_nr(struct thread *thread, u64 trace_nr) ...@@ -297,7 +305,7 @@ void thread_stack__set_trace_nr(struct thread *thread, u64 trace_nr)
if (trace_nr != thread->ts->trace_nr) { if (trace_nr != thread->ts->trace_nr) {
if (thread->ts->trace_nr) if (thread->ts->trace_nr)
thread_stack__flush(thread, thread->ts); __thread_stack__flush(thread, thread->ts);
thread->ts->trace_nr = trace_nr; thread->ts->trace_nr = trace_nr;
} }
} }
...@@ -305,7 +313,7 @@ void thread_stack__set_trace_nr(struct thread *thread, u64 trace_nr) ...@@ -305,7 +313,7 @@ void thread_stack__set_trace_nr(struct thread *thread, u64 trace_nr)
void thread_stack__free(struct thread *thread) void thread_stack__free(struct thread *thread)
{ {
if (thread->ts) { if (thread->ts) {
thread_stack__flush(thread, thread->ts); __thread_stack__flush(thread, thread->ts);
zfree(&thread->ts->stack); zfree(&thread->ts->stack);
zfree(&thread->ts); zfree(&thread->ts);
} }
...@@ -689,7 +697,7 @@ int thread_stack__process(struct thread *thread, struct comm *comm, ...@@ -689,7 +697,7 @@ int thread_stack__process(struct thread *thread, struct comm *comm,
/* Flush stack on exec */ /* Flush stack on exec */
if (ts->comm != comm && thread->pid_ == thread->tid) { if (ts->comm != comm && thread->pid_ == thread->tid) {
err = thread_stack__flush(thread, ts); err = __thread_stack__flush(thread, ts);
if (err) if (err)
return err; return err;
ts->comm = comm; ts->comm = comm;
......
...@@ -96,6 +96,7 @@ int thread_stack__event(struct thread *thread, u32 flags, u64 from_ip, ...@@ -96,6 +96,7 @@ int thread_stack__event(struct thread *thread, u32 flags, u64 from_ip,
void thread_stack__set_trace_nr(struct thread *thread, u64 trace_nr); void thread_stack__set_trace_nr(struct thread *thread, u64 trace_nr);
void thread_stack__sample(struct thread *thread, struct ip_callchain *chain, void thread_stack__sample(struct thread *thread, struct ip_callchain *chain,
size_t sz, u64 ip); size_t sz, u64 ip);
int thread_stack__flush(struct thread *thread);
void thread_stack__free(struct thread *thread); void thread_stack__free(struct thread *thread);
struct call_return_processor * struct call_return_processor *
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment