-#define _GNU_SOURCE
-#include <sys/types.h>
-#include <sys/stat.h>
-#include <sys/time.h>
-#include <unistd.h>
-#include <stdint.h>
-#include <stdbool.h>
-#include <stdlib.h>
-#include <string.h>
-#include <limits.h>
-#include <fcntl.h>
-#include <stdio.h>
-#include <errno.h>
-#include <ctype.h>
-#include <time.h>
-#include <getopt.h>
-#include <assert.h>
-#include <search.h>
-
-#include <sys/ioctl.h>
-#include <sys/poll.h>
-#include <sys/prctl.h>
-#include <sys/wait.h>
-#include <sys/mman.h>
-#include <sys/types.h>
-#include <sys/stat.h>
-
-#include <linux/unistd.h>
-#include <linux/types.h>
-
-#include "../../include/linux/perf_counter.h"
-#include "list.h"
+/*
+ * builtin-report.c
+ *
+ * Builtin report command: Analyze the perf.data input file,
+ * look up and read DSOs and symbol information and display
+ * a histogram of results, along various sorting keys.
+ */
+#include "builtin.h"
+
+#include "util/util.h"
+
+#include "util/list.h"
+#include "util/cache.h"
+#include "util/rbtree.h"
+#include "util/symbol.h"
+#include "util/string.h"
+
+#include "perf.h"
+
+#include "util/parse-options.h"
+#include "util/parse-events.h"
#define SHOW_KERNEL 1
#define SHOW_USER 2
#define SHOW_HV 4
-static char const *input_name = "output.perf";
+static char const *input_name = "perf.data";
+static char *vmlinux = NULL;
+
+static char default_sort_order[] = "comm,dso";
+static char *sort_order = default_sort_order;
+
static int input;
static int show_mask = SHOW_KERNEL | SHOW_USER | SHOW_HV;
+static int dump_trace = 0;
+#define dprintf(x...) do { if (dump_trace) printf(x); } while (0)
+
+static int verbose;
+static int full_paths;
+
static unsigned long page_size;
static unsigned long mmap_window = 32;
-static const char *perf_event_names[] = {
+const char *perf_event_names[] = {
[PERF_EVENT_MMAP] = " PERF_EVENT_MMAP",
[PERF_EVENT_MUNMAP] = " PERF_EVENT_MUNMAP",
[PERF_EVENT_COMM] = " PERF_EVENT_COMM",
__u64 ip;
__u32 pid, tid;
};
+
struct mmap_event {
struct perf_event_header header;
__u32 pid, tid;
__u64 pgoff;
char filename[PATH_MAX];
};
+
struct comm_event {
struct perf_event_header header;
- __u32 pid,tid;
+ __u32 pid, tid;
char comm[16];
};
struct comm_event comm;
} event_t;
-struct section {
- struct list_head node;
- uint64_t start;
- uint64_t end;
- uint64_t offset;
- char name[0];
-};
+static LIST_HEAD(dsos);
+static struct dso *kernel_dso;
-static struct section *section__new(uint64_t start, uint64_t size,
- uint64_t offset, char *name)
+static void dsos__add(struct dso *dso)
{
- struct section *self = malloc(sizeof(*self) + strlen(name) + 1);
+ list_add_tail(&dso->node, &dsos);
+}
- if (self != NULL) {
- self->start = start;
- self->end = start + size;
- self->offset = offset;
- strcpy(self->name, name);
+/*
+ * Look up an already registered DSO by exact name.
+ *
+ * Returns the matching entry of the dsos list, or NULL when no entry
+ * carries that name.
+ */
+static struct dso *dsos__find(const char *name)
+{
+	struct dso *dso;
+
+	list_for_each_entry(dso, &dsos, node) {
+		if (!strcmp(dso->name, name))
+			return dso;
+	}
+
+	return NULL;
+}
+
+/*
+ * Return the DSO registered under @name, creating, loading and
+ * registering it on first use.
+ *
+ * Returns NULL when the DSO cannot be allocated or when dso__load()
+ * reports a failure (negative return).  A DSO that loads with zero
+ * symbols is still registered and returned; with verbose set a hint is
+ * printed to stderr in that case.
+ */
+static struct dso *dsos__findnew(const char *name)
+{
+	struct dso *dso = dsos__find(name);
+	int nr;
+
+	if (dso)
+		return dso;
+
+	dso = dso__new(name, 0);
+	/*
+	 * Nothing was allocated, so there is nothing to delete: return
+	 * directly instead of handing a NULL pointer to dso__delete().
+	 */
+	if (!dso)
+		return NULL;
+
+	nr = dso__load(dso, NULL, verbose);
+	if (nr < 0) {
+		if (verbose)
+			fprintf(stderr, "Failed to open: %s\n", name);
+		goto out_delete_dso;
+	}
+	if (!nr && verbose) {
+		fprintf(stderr,
+			"No symbols found in: %s, maybe install a debug package?\n",
+			name);
}
- return self;
+	dsos__add(dso);
+
+	return dso;
+
+out_delete_dso:
+	dso__delete(dso);
+	return NULL;
}
-static void section__delete(struct section *self)
+static void dsos__fprintf(FILE *fp)
{
- free(self);
+ struct dso *pos;
+
+ list_for_each_entry(pos, &dsos, node)
+ dso__fprintf(pos, fp);
+}
+
+/*
+ * Create the "[kernel]" DSO and load its symbols with dso__load_kernel().
+ *
+ * Returns -1 if the DSO cannot be allocated, otherwise the value
+ * returned by dso__load_kernel(): when that is zero the DSO is added to
+ * the dsos list, when it is non-zero the DSO is deleted again and
+ * kernel_dso is reset to NULL.
+ */
+static int load_kernel(void)
+{
+	int err;
+
+	kernel_dso = dso__new("[kernel]", 0);
+	if (kernel_dso == NULL)
+		return -1;
+
+	err = dso__load_kernel(kernel_dso, vmlinux, NULL, verbose);
+	if (err == 0) {
+		dsos__add(kernel_dso);
+		return err;
+	}
+
+	/* Loading failed: drop the half-initialised DSO. */
+	dso__delete(kernel_dso);
+	kernel_dso = NULL;
+
+	return err;
+}
+
+static char __cwd[PATH_MAX];
+static char *cwd = __cwd;
+static int cwdlen;
+
+/*
+ * Length of the common leading part of @pathname and the cached
+ * working directory (cwd), never more than cwdlen.
+ */
+static int strcommon(const char *pathname)
+{
+	int n = 0;
+
+	/* Test the bound first so cwd[n] is only read while n < cwdlen. */
+	while (n < cwdlen && pathname[n] == cwd[n])
+		++n;
+
+	return n;
}
-struct symbol {
+struct map {
struct list_head node;
uint64_t start;
uint64_t end;
- char name[0];
+ uint64_t pgoff;
+ struct dso *dso;
};
-static struct symbol *symbol__new(uint64_t start, uint64_t len, const char *name)
+static struct map *map__new(struct mmap_event *event)
{
- struct symbol *self = malloc(sizeof(*self) + strlen(name) + 1);
+ struct map *self = malloc(sizeof(*self));
if (self != NULL) {
- self->start = start;
- self->end = start + len;
- strcpy(self->name, name);
- }
+ const char *filename = event->filename;
+ char newfilename[PATH_MAX];
- return self;
-}
+ if (cwd) {
+ int n = strcommon(filename);
-static void symbol__delete(struct symbol *self)
-{
+ if (n == cwdlen) {
+ snprintf(newfilename, sizeof(newfilename),
+ ".%s", filename + n);
+ filename = newfilename;
+ }
+ }
+
+ self->start = event->start;
+ self->end = event->start + event->len;
+ self->pgoff = event->pgoff;
+
+ self->dso = dsos__findnew(filename);
+ if (self->dso == NULL)
+ goto out_delete;
+ }
+ return self;
+out_delete:
free(self);
+ return NULL;
}
-static size_t symbol__fprintf(struct symbol *self, FILE *fp)
-{
- return fprintf(fp, " %lx-%lx %s\n",
- self->start, self->end, self->name);
-}
+struct thread;
-struct dso {
- struct list_head node;
- struct list_head sections;
- struct list_head syms;
- char name[0];
+struct thread {
+ struct rb_node rb_node;
+ struct list_head maps;
+ pid_t pid;
+ char *comm;
};
-static struct dso *dso__new(const char *name)
+static struct thread *thread__new(pid_t pid)
{
- struct dso *self = malloc(sizeof(*self) + strlen(name) + 1);
+ struct thread *self = malloc(sizeof(*self));
if (self != NULL) {
- strcpy(self->name, name);
- INIT_LIST_HEAD(&self->sections);
- INIT_LIST_HEAD(&self->syms);
+ self->pid = pid;
+ self->comm = malloc(32);
+ if (self->comm)
+ snprintf(self->comm, 32, ":%d", self->pid);
+ INIT_LIST_HEAD(&self->maps);
}
return self;
}
-static void dso__delete_sections(struct dso *self)
+static int thread__set_comm(struct thread *self, const char *comm)
{
- struct section *pos, *n;
-
- list_for_each_entry_safe(pos, n, &self->sections, node)
- section__delete(pos);
+ if (self->comm)
+ free(self->comm);
+ self->comm = strdup(comm);
+ return self->comm ? 0 : -ENOMEM;
}
-static void dso__delete_symbols(struct dso *self)
+static struct rb_root threads;
+static struct thread *last_match;
+
+static struct thread *threads__findnew(pid_t pid)
{
- struct symbol *pos, *n;
+ struct rb_node **p = &threads.rb_node;
+ struct rb_node *parent = NULL;
+ struct thread *th;
+
+ /*
+ * Front-end cache - PID lookups come in blocks,
+ * so most of the time we don't have to look up
+ * the full rbtree:
+ */
+ if (last_match && last_match->pid == pid)
+ return last_match;
+
+ while (*p != NULL) {
+ parent = *p;
+ th = rb_entry(parent, struct thread, rb_node);
+
+ if (th->pid == pid) {
+ last_match = th;
+ return th;
+ }
- list_for_each_entry_safe(pos, n, &self->syms, node)
- symbol__delete(pos);
-}
+ if (pid < th->pid)
+ p = &(*p)->rb_left;
+ else
+ p = &(*p)->rb_right;
+ }
-static void dso__delete(struct dso *self)
-{
- dso__delete_sections(self);
- dso__delete_symbols(self);
- free(self);
+ th = thread__new(pid);
+ if (th != NULL) {
+ rb_link_node(&th->rb_node, parent, p);
+ rb_insert_color(&th->rb_node, &threads);
+ last_match = th;
+ }
+
+ return th;
}
-static void dso__insert_symbol(struct dso *self, struct symbol *sym)
+static void thread__insert_map(struct thread *self, struct map *map)
{
- list_add_tail(&sym->node, &self->syms);
+ list_add_tail(&map->node, &self->maps);
}
-static struct symbol *dso__find_symbol(struct dso *self, uint64_t ip)
+static struct map *thread__find_map(struct thread *self, uint64_t ip)
{
+ struct map *pos;
+
if (self == NULL)
return NULL;
- struct symbol *pos;
-
- list_for_each_entry(pos, &self->syms, node)
+ list_for_each_entry(pos, &self->maps, node)
if (ip >= pos->start && ip <= pos->end)
return pos;
return NULL;
}
-static int dso__load(struct dso *self)
+/*
+ * histogram, sorted on item, collects counts
+ */
+
+static struct rb_root hist;
+
+struct hist_entry { /* one histogram bucket: a sample key plus its hit count */
+ struct rb_node rb_node; /* node in the hist, collapse_hists or output_hists tree */
+
+ struct thread *thread; /* thread the sample was attributed to */
+ struct map *map; /* map handed to hist_entry__add(); may be NULL */
+ struct dso *dso; /* dso handed to hist_entry__add(); may be NULL */
+ struct symbol *sym; /* symbol handed to hist_entry__add(); may be NULL */
+ uint64_t ip; /* sample address as handed to hist_entry__add() */
+ char level; /* 'k', '.' or 'H', as chosen by process_overflow_event() */
+
+ uint32_t count; /* number of samples folded into this entry */
+};
+
+/*
+ * configurable sorting bits
+ */
+
+struct sort_entry { /* one selectable sort key / output column */
+ struct list_head list; /* link on hist_entry__sort_list once the key is selected */
+
+ char *header; /* column title printed by output__fprintf() */
+
+ int64_t (*cmp)(struct hist_entry *, struct hist_entry *); /* ordering used by hist_entry__cmp() */
+ int64_t (*collapse)(struct hist_entry *, struct hist_entry *); /* optional; hist_entry__collapse() falls back to cmp when NULL */
+ size_t (*print)(FILE *fp, struct hist_entry *); /* prints this column for one entry, returns the fprintf() count */
+};
+
+/* --sort pid */
+
+static int64_t
+sort__thread_cmp(struct hist_entry *left, struct hist_entry *right)
{
- /* FIXME */
- return 0;
+ return right->thread->pid - left->thread->pid;
}
-static size_t dso__fprintf(struct dso *self, FILE *fp)
+static size_t
+sort__thread_print(FILE *fp, struct hist_entry *self)
{
- struct symbol *pos;
- size_t ret = fprintf(fp, "dso: %s\n", self->name);
-
- list_for_each_entry(pos, &self->syms, node)
- ret += symbol__fprintf(pos, fp);
-
- return ret;
+ return fprintf(fp, "%16s:%5d", self->thread->comm ?: "", self->thread->pid);
}
-static LIST_HEAD(dsos);
-static struct dso *kernel_dso;
+static struct sort_entry sort_thread = {
+ .header = " Command: Pid",
+ .cmp = sort__thread_cmp,
+ .print = sort__thread_print,
+};
-static void dsos__add(struct dso *dso)
+/* --sort comm */
+
+static int64_t
+sort__comm_cmp(struct hist_entry *left, struct hist_entry *right)
{
- list_add_tail(&dso->node, &dsos);
+ return right->thread->pid - left->thread->pid;
}
-static struct dso *dsos__find(const char *name)
+static int64_t
+sort__comm_collapse(struct hist_entry *left, struct hist_entry *right)
{
- struct dso *pos;
+ char *comm_l = left->thread->comm;
+ char *comm_r = right->thread->comm;
+
+ if (!comm_l || !comm_r) {
+ if (!comm_l && !comm_r)
+ return 0;
+ else if (!comm_l)
+ return -1;
+ else
+ return 1;
+ }
- list_for_each_entry(pos, &dsos, node)
- if (strcmp(pos->name, name) == 0)
- return pos;
- return NULL;
+ return strcmp(comm_l, comm_r);
}
-static struct dso *dsos__findnew(const char *name)
+/*
+ * Print the command-name column of @self, right-aligned in 16 columns.
+ * Returns the number of characters written by fprintf().
+ */
+static size_t
+sort__comm_print(FILE *fp, struct hist_entry *self)
{
- struct dso *dso = dsos__find(name);
+	/*
+	 * comm is NULL when the allocation in thread__new() or
+	 * thread__set_comm() failed; print an empty name instead of
+	 * passing NULL to %s, as sort__thread_print() already does.
+	 */
+	return fprintf(fp, "%16s", self->thread->comm ?: "");
+}
- if (dso == NULL) {
- dso = dso__new(name);
- if (dso != NULL && dso__load(dso) < 0)
- goto out_delete_dso;
+static struct sort_entry sort_comm = {
+ .header = " Command",
+ .cmp = sort__comm_cmp,
+ .collapse = sort__comm_collapse,
+ .print = sort__comm_print,
+};
- dsos__add(dso);
- }
+/* --sort dso */
- return dso;
+static int64_t
+sort__dso_cmp(struct hist_entry *left, struct hist_entry *right)
+{
+ struct dso *dso_l = left->dso;
+ struct dso *dso_r = right->dso;
+
+ if (!dso_l || !dso_r) {
+ if (!dso_l && !dso_r)
+ return 0;
+ else if (!dso_l)
+ return -1;
+ else
+ return 1;
+ }
-out_delete_dso:
- dso__delete(dso);
- return NULL;
+ return strcmp(dso_l->name, dso_r->name);
}
-static void dsos__fprintf(FILE *fp)
+static size_t
+sort__dso_print(FILE *fp, struct hist_entry *self)
{
- struct dso *pos;
+ if (self->dso)
+ return fprintf(fp, "%-25s", self->dso->name);
- list_for_each_entry(pos, &dsos, node)
- dso__fprintf(pos, fp);
+ return fprintf(fp, "%016llx ", (__u64)self->ip);
}
-static int load_kallsyms(void)
-{
- kernel_dso = dso__new("[kernel]");
- if (kernel_dso == NULL)
- return -1;
+static struct sort_entry sort_dso = {
+ .header = "Shared Object ",
+ .cmp = sort__dso_cmp,
+ .print = sort__dso_print,
+};
- FILE *file = fopen("/proc/kallsyms", "r");
+/* --sort symbol */
- if (file == NULL)
- goto out_delete_dso;
+static int64_t
+sort__sym_cmp(struct hist_entry *left, struct hist_entry *right)
+{
+ uint64_t ip_l, ip_r;
- char *line = NULL;
- size_t n;
+ if (left->sym == right->sym)
+ return 0;
- while (!feof(file)) {
- unsigned long long start;
- char c, symbf[4096];
+ ip_l = left->sym ? left->sym->start : left->ip;
+ ip_r = right->sym ? right->sym->start : right->ip;
- if (getline(&line, &n, file) < 0)
- break;
+ return (int64_t)(ip_r - ip_l);
+}
- if (!line)
- goto out_delete_dso;
+static size_t
+sort__sym_print(FILE *fp, struct hist_entry *self)
+{
+ size_t ret = 0;
- if (sscanf(line, "%llx %c %s", &start, &c, symbf) == 3) {
- struct symbol *sym = symbol__new(start, 0x1000000, symbf);
+ if (verbose)
+ ret += fprintf(fp, "%#018llx ", (__u64)self->ip);
- if (sym == NULL)
- goto out_delete_dso;
+ if (self->sym)
+ ret += fprintf(fp, "%s", self->sym->name);
+ else
+ ret += fprintf(fp, "%#016llx", (__u64)self->ip);
- dso__insert_symbol(kernel_dso, sym);
- }
- }
+ return ret;
+}
- dsos__add(kernel_dso);
- free(line);
- fclose(file);
- return 0;
+static struct sort_entry sort_sym = {
+ .header = "Symbol",
+ .cmp = sort__sym_cmp,
+ .print = sort__sym_print,
+};
-out_delete_dso:
- dso__delete(kernel_dso);
- return -1;
-}
+static int sort__need_collapse = 0;
-struct map {
- struct list_head node;
- uint64_t start;
- uint64_t end;
- uint64_t pgoff;
- struct dso *dso;
+struct sort_dimension {
+ char *name;
+ struct sort_entry *entry;
+ int taken;
};
-static struct map *map__new(struct mmap_event *event)
+static struct sort_dimension sort_dimensions[] = {
+ { .name = "pid", .entry = &sort_thread, },
+ { .name = "comm", .entry = &sort_comm, },
+ { .name = "dso", .entry = &sort_dso, },
+ { .name = "symbol", .entry = &sort_sym, },
+};
+
+static LIST_HEAD(hist_entry__sort_list);
+
+static int sort_dimension__add(char *tok)
{
- struct map *self = malloc(sizeof(*self));
+ int i;
- if (self != NULL) {
- self->start = event->start;
- self->end = event->start + event->len;
- self->pgoff = event->pgoff;
+ for (i = 0; i < ARRAY_SIZE(sort_dimensions); i++) {
+ struct sort_dimension *sd = &sort_dimensions[i];
- self->dso = dsos__findnew(event->filename);
- if (self->dso == NULL)
- goto out_delete;
- }
- return self;
-out_delete:
- free(self);
- return NULL;
-}
+ if (sd->taken)
+ continue;
-static size_t map__fprintf(struct map *self, FILE *fp)
-{
- return fprintf(fp, " %lx-%lx %lx %s\n",
- self->start, self->end, self->pgoff, self->dso->name);
-}
+ if (strncasecmp(tok, sd->name, strlen(tok)))
+ continue;
-struct symhist {
- struct list_head node;
- struct dso *dso;
- struct symbol *sym;
- uint32_t count;
- char level;
-};
+ if (sd->entry->collapse)
+ sort__need_collapse = 1;
-static struct symhist *symhist__new(struct symbol *sym, struct dso *dso,
- char level)
-{
- struct symhist *self = malloc(sizeof(*self));
+ list_add_tail(&sd->entry->list, &hist_entry__sort_list);
+ sd->taken = 1;
- if (self != NULL) {
- self->sym = sym;
- self->dso = dso;
- self->level = level;
- self->count = 0;
+ return 0;
}
- return self;
+ return -ESRCH;
}
-static void symhist__delete(struct symhist *self)
+static int64_t
+hist_entry__cmp(struct hist_entry *left, struct hist_entry *right)
{
- free(self);
-}
+ struct sort_entry *se;
+ int64_t cmp = 0;
-static bool symhist__equal(struct symhist *self, struct symbol *sym,
- struct dso *dso, char level)
-{
- return self->level == level && self->sym == sym && self->dso == dso;
-}
+ list_for_each_entry(se, &hist_entry__sort_list, list) {
+ cmp = se->cmp(left, right);
+ if (cmp)
+ break;
+ }
-static void symhist__inc(struct symhist *self)
-{
- ++self->count;
+ return cmp;
}
-static size_t symhist__fprintf(struct symhist *self, FILE *fp)
+static int64_t
+hist_entry__collapse(struct hist_entry *left, struct hist_entry *right)
{
- size_t ret = fprintf(fp, "[%c] ", self->level);
+ struct sort_entry *se;
+ int64_t cmp = 0;
- if (self->level != '.')
- ret += fprintf(fp, "%s", self->sym->name);
- else
- ret += fprintf(fp, "%s: %s",
- self->dso ? self->dso->name : "<unknown",
- self->sym ? self->sym->name : "<unknown>");
- return ret + fprintf(fp, ": %u\n", self->count);
-}
+ list_for_each_entry(se, &hist_entry__sort_list, list) {
+ int64_t (*f)(struct hist_entry *, struct hist_entry *);
-struct thread {
- struct list_head node;
- struct list_head maps;
- struct list_head symhists;
- pid_t pid;
- char *comm;
-};
-
-static struct thread *thread__new(pid_t pid)
-{
- struct thread *self = malloc(sizeof(*self));
+ f = se->collapse ?: se->cmp;
- if (self != NULL) {
- self->pid = pid;
- self->comm = NULL;
- INIT_LIST_HEAD(&self->maps);
- INIT_LIST_HEAD(&self->symhists);
+ cmp = f(left, right);
+ if (cmp)
+ break;
}
- return self;
+ return cmp;
}
-static void thread__insert_symhist(struct thread *self,
- struct symhist *symhist)
+static size_t
+hist_entry__fprintf(FILE *fp, struct hist_entry *self, uint64_t total_samples)
{
- list_add_tail(&symhist->node, &self->symhists);
-}
-
-static struct symhist *thread__symhists_find(struct thread *self,
- struct symbol *sym,
- struct dso *dso, char level)
-{
- struct symhist *pos;
+ struct sort_entry *se;
+ size_t ret;
+
+ if (total_samples) {
+ ret = fprintf(fp, " %6.2f%%",
+ (self->count * 100.0) / total_samples);
+ } else
+ ret = fprintf(fp, "%12d ", self->count);
+
+ list_for_each_entry(se, &hist_entry__sort_list, list) {
+ fprintf(fp, " ");
+ ret += se->print(fp, self);
+ }
- list_for_each_entry(pos, &self->symhists, node)
- if (symhist__equal(pos, sym, dso, level))
- return pos;
+ ret += fprintf(fp, "\n");
- return NULL;
+ return ret;
}
-static int thread__symbol_incnew(struct thread *self, struct symbol *sym,
- struct dso *dso, char level)
+/*
+ * collect histogram counts
+ */
+
+/*
+ * Account one sample in the hist tree.
+ *
+ * The tree is ordered by hist_entry__cmp().  When an entry comparing
+ * equal already exists its count is incremented, otherwise a new entry
+ * with count 1 is allocated and inserted.
+ *
+ * Returns 0 on success, -ENOMEM when the new entry cannot be allocated.
+ */
+static int
+hist_entry__add(struct thread *thread, struct map *map, struct dso *dso,
+		struct symbol *sym, uint64_t ip, char level)
{
- struct symhist *symhist = thread__symhists_find(self, sym, dso, level);
+	struct rb_node **p = &hist.rb_node;
+	struct rb_node *parent = NULL;
+	struct hist_entry *he;
+	struct hist_entry entry = {
+		.thread	= thread,
+		.map	= map,
+		.dso	= dso,
+		.sym	= sym,
+		.ip	= ip,
+		.level	= level,
+		.count	= 1,
+	};
+	/*
+	 * Must be as wide as the comparator's return type: the sort
+	 * callbacks return 64-bit differences, and narrowing them to
+	 * int could flip the sign or turn a non-zero result into 0.
+	 */
+	int64_t cmp;
+
+	while (*p != NULL) {
+		parent = *p;
+		he = rb_entry(parent, struct hist_entry, rb_node);
+
+		cmp = hist_entry__cmp(&entry, he);
+
+		if (!cmp) {
+			he->count++;
+			return 0;
+		}
- if (symhist == NULL) {
- symhist = symhist__new(sym, dso, level);
- if (symhist == NULL)
- goto out_error;
- thread__insert_symhist(self, symhist);
+		if (cmp < 0)
+			p = &(*p)->rb_left;
+		else
+			p = &(*p)->rb_right;
}
- symhist__inc(symhist);
+	he = malloc(sizeof(*he));
+	if (!he)
+		return -ENOMEM;
+	*he = entry;
+	rb_link_node(&he->rb_node, parent, p);
+	rb_insert_color(&he->rb_node, &hist);
+
return 0;
-out_error:
- return -ENOMEM;
}
-static int thread__set_comm(struct thread *self, const char *comm)
+static void hist_entry__free(struct hist_entry *he)
{
- self->comm = strdup(comm);
- return self->comm ? 0 : -ENOMEM;
+ free(he);
}
-static size_t thread__maps_fprintf(struct thread *self, FILE *fp)
+/*
+ * collapse the histogram
+ */
+
+static struct rb_root collapse_hists;
+
+static void collapse__insert_entry(struct hist_entry *he)
{
- struct map *pos;
- size_t ret = 0;
+ struct rb_node **p = &collapse_hists.rb_node;
+ struct rb_node *parent = NULL;
+ struct hist_entry *iter;
+ int64_t cmp;
- list_for_each_entry(pos, &self->maps, node)
- ret += map__fprintf(pos, fp);
+ while (*p != NULL) {
+ parent = *p;
+ iter = rb_entry(parent, struct hist_entry, rb_node);
- return ret;
+ cmp = hist_entry__collapse(iter, he);
+
+ if (!cmp) {
+ iter->count += he->count;
+ hist_entry__free(he);
+ return;
+ }
+
+ if (cmp < 0)
+ p = &(*p)->rb_left;
+ else
+ p = &(*p)->rb_right;
+ }
+
+ rb_link_node(&he->rb_node, parent, p);
+ rb_insert_color(&he->rb_node, &collapse_hists);
}
-static size_t thread__fprintf(struct thread *self, FILE *fp)
+static void collapse__resort(void)
{
- struct symhist *pos;
- int ret = fprintf(fp, "thread: %d %s\n", self->pid, self->comm);
+ struct rb_node *next;
+ struct hist_entry *n;
- list_for_each_entry(pos, &self->symhists, node)
- ret += symhist__fprintf(pos, fp);
+ if (!sort__need_collapse)
+ return;
- return ret;
+ next = rb_first(&hist);
+ while (next) {
+ n = rb_entry(next, struct hist_entry, rb_node);
+ next = rb_next(&n->rb_node);
+
+ rb_erase(&n->rb_node, &hist);
+ collapse__insert_entry(n);
+ }
}
-static LIST_HEAD(threads);
+/*
+ * reverse the map, sort on count.
+ */
-static void threads__add(struct thread *thread)
-{
- list_add_tail(&thread->node, &threads);
-}
+static struct rb_root output_hists;
-static struct thread *threads__find(pid_t pid)
+static void output__insert_entry(struct hist_entry *he)
{
- struct thread *pos;
+ struct rb_node **p = &output_hists.rb_node;
+ struct rb_node *parent = NULL;
+ struct hist_entry *iter;
+
+ while (*p != NULL) {
+ parent = *p;
+ iter = rb_entry(parent, struct hist_entry, rb_node);
+
+ if (he->count > iter->count)
+ p = &(*p)->rb_left;
+ else
+ p = &(*p)->rb_right;
+ }
- list_for_each_entry(pos, &threads, node)
- if (pos->pid == pid)
- return pos;
- return NULL;
+ rb_link_node(&he->rb_node, parent, p);
+ rb_insert_color(&he->rb_node, &output_hists);
}
-static struct thread *threads__findnew(pid_t pid)
+static void output__resort(void)
{
- struct thread *thread = threads__find(pid);
+ struct rb_node *next;
+ struct hist_entry *n;
+ struct rb_root *tree = &hist;
- if (thread == NULL) {
- thread = thread__new(pid);
- if (thread != NULL)
- threads__add(thread);
- }
+ if (sort__need_collapse)
+ tree = &collapse_hists;
- return thread;
-}
+ next = rb_first(tree);
-static void thread__insert_map(struct thread *self, struct map *map)
-{
- list_add_tail(&map->node, &self->maps);
+ while (next) {
+ n = rb_entry(next, struct hist_entry, rb_node);
+ next = rb_next(&n->rb_node);
+
+ rb_erase(&n->rb_node, tree);
+ output__insert_entry(n);
+ }
}
-static struct map *thread__find_map(struct thread *self, uint64_t ip)
+static size_t output__fprintf(FILE *fp, uint64_t total_samples)
{
- if (self == NULL)
- return NULL;
+ struct hist_entry *pos;
+ struct sort_entry *se;
+ struct rb_node *nd;
+ size_t ret = 0;
- struct map *pos;
+ fprintf(fp, "\n");
+ fprintf(fp, "#\n");
+ fprintf(fp, "# (%Ld profiler events)\n", (__u64)total_samples);
+ fprintf(fp, "#\n");
- list_for_each_entry(pos, &self->maps, node)
- if (ip >= pos->start && ip <= pos->end)
- return pos;
+ fprintf(fp, "# Overhead");
+ list_for_each_entry(se, &hist_entry__sort_list, list)
+ fprintf(fp, " %s", se->header);
+ fprintf(fp, "\n");
- return NULL;
+ fprintf(fp, "# ........");
+ list_for_each_entry(se, &hist_entry__sort_list, list) {
+ int i;
+
+ fprintf(fp, " ");
+ for (i = 0; i < strlen(se->header); i++)
+ fprintf(fp, ".");
+ }
+ fprintf(fp, "\n");
+
+ fprintf(fp, "#\n");
+
+ for (nd = rb_first(&output_hists); nd; nd = rb_next(nd)) {
+ pos = rb_entry(nd, struct hist_entry, rb_node);
+ ret += hist_entry__fprintf(fp, pos, total_samples);
+ }
+
+ if (!strcmp(sort_order, default_sort_order)) {
+ fprintf(fp, "#\n");
+ fprintf(fp, "# (For more details, try: perf report --sort comm,dso,symbol)\n");
+ fprintf(fp, "#\n");
+ }
+ fprintf(fp, "\n");
+
+ return ret;
}
-static void threads__fprintf(FILE *fp)
+static void register_idle_thread(void)
{
- struct thread *pos;
+ struct thread *thread = threads__findnew(0);
- list_for_each_entry(pos, &threads, node)
- thread__fprintf(pos, fp);
+ if (thread == NULL ||
+ thread__set_comm(thread, "[idle]")) {
+ fprintf(stderr, "problem inserting idle task.\n");
+ exit(-1);
+ }
}
-#if 0
-static std::string resolve_user_symbol(int pid, uint64_t ip)
+static unsigned long total = 0, total_mmap = 0, total_comm = 0, total_unknown = 0;
+
+/*
+ * Account one overflow (IP sample) event.
+ *
+ * The sample is classified as kernel, user or hypervisor from
+ * header.misc, resolved to a dso and symbol, and added to the histogram
+ * when its class is enabled in show_mask.  Every processed sample bumps
+ * the global total.
+ *
+ * Returns 0 on success, -1 when the thread cannot be found or created
+ * or when the histogram entry cannot be added.
+ */
+static int
+process_overflow_event(event_t *event, unsigned long offset, unsigned long head)
{
- std::string sym = "<unknown>";
+	char level;
+	int show = 0;
+	struct dso *dso = NULL;
+	struct thread *thread = threads__findnew(event->ip.pid);
+	uint64_t ip = event->ip.ip;
+	struct map *map = NULL;
+
+	dprintf("%p [%p]: PERF_EVENT (IP, %d): %d: %p\n",
+		(void *)(offset + head),
+		(void *)(long)(event->header.size),
+		event->header.misc,
+		event->ip.pid,
+		(void *)(long)ip);
+
+	if (thread == NULL) {
+		fprintf(stderr, "problem processing %d event, skipping it.\n",
+			event->header.type);
+		return -1;
+	}
+
+	/* Only touch the thread once it is known to be non-NULL. */
+	dprintf(" ... thread: %s:%d\n", thread->comm, thread->pid);
+
- maps_t &m = maps[pid];
- maps_t::const_iterator mi = m.upper_bound(map(ip));
- if (mi == m.end())
- return sym;
+	if (event->header.misc & PERF_EVENT_MISC_KERNEL) {
+		show = SHOW_KERNEL;
+		level = 'k';
- ip -= mi->start + mi->pgoff;
+		dso = kernel_dso;
- symbols_t &s = dsos[mi->dso].syms;
- symbols_t::const_iterator si = s.upper_bound(symbol(ip));
+		dprintf(" ...... dso: %s\n", dso->name);
- sym = mi->dso + ": <unknown>";
+	} else if (event->header.misc & PERF_EVENT_MISC_USER) {
- if (si == s.begin())
- return sym;
- si--;
+		show = SHOW_USER;
+		level = '.';
- if (si->start <= ip && ip < si->end)
- sym = mi->dso + ": " + si->name;
-#if 0
- else if (si->start <= ip)
- sym = mi->dso + ": ?" + si->name;
-#endif
+		map = thread__find_map(thread, ip);
+		if (map != NULL) {
+			dso = map->dso;
+			ip -= map->start + map->pgoff;
+		} else {
+			/*
+			 * If this is outside of all known maps,
+			 * and is a negative address, try to look it
+			 * up in the kernel dso, as it might be a
+			 * vsyscall (which executes in user-mode):
+			 */
+			if ((long long)ip < 0)
+				dso = kernel_dso;
+		}
+		dprintf(" ...... dso: %s\n", dso ? dso->name : "<not found>");
+
+	} else {
+		show = SHOW_HV;
+		level = 'H';
+		dprintf(" ...... dso: [hypervisor]\n");
+	}
+
+	if (show & show_mask) {
+		struct symbol *sym = dso__find_symbol(dso, ip);
- return sym;
+		if (hist_entry__add(thread, map, dso, sym, ip, level)) {
+			fprintf(stderr,
+				"problem incrementing symbol count, skipping event\n");
+			return -1;
+		}
+	}
+	total++;
+
+	return 0;
}
-#endif
-static void display_help(void)
+/*
+ * Record a PERF_EVENT_MMAP event: build a map from the event and attach
+ * it to the thread identified by the event's pid.
+ *
+ * Always returns 0; an event whose thread or map cannot be set up is
+ * skipped (and reported through dprintf()).
+ */
+static int
+process_mmap_event(event_t *event, unsigned long offset, unsigned long head)
{
- printf(
- "Usage: perf-report [<options>]\n"
- " -i file --input=<file> # input file\n"
- );
+	struct thread *thread = threads__findnew(event->mmap.pid);
+	struct map *map = map__new(&event->mmap);
+
+	dprintf("%p [%p]: PERF_EVENT_MMAP: [%p(%p) @ %p]: %s\n",
+		(void *)(offset + head),
+		(void *)(long)(event->header.size),
+		(void *)(long)event->mmap.start,
+		(void *)(long)event->mmap.len,
+		(void *)(long)event->mmap.pgoff,
+		event->mmap.filename);
+
+	if (thread == NULL || map == NULL) {
+		dprintf("problem processing PERF_EVENT_MMAP, skipping event.\n");
+		/*
+		 * The map is malloc()ed by map__new() and nobody else
+		 * holds it yet, so release it when only the thread
+		 * lookup failed.  free(NULL) is a no-op.
+		 */
+		free(map);
+		return 0;
+	}
+
+	thread__insert_map(thread, map);
+	total_mmap++;
- exit(0);
+	return 0;
}
-static void process_options(int argc, char *argv[])
+static int
+process_comm_event(event_t *event, unsigned long offset, unsigned long head)
{
- int error = 0;
+ struct thread *thread = threads__findnew(event->comm.pid);
- for (;;) {
- int option_index = 0;
- /** Options for getopt */
- static struct option long_options[] = {
- {"input", required_argument, NULL, 'i'},
- {"no-user", no_argument, NULL, 'u'},
- {"no-kernel", no_argument, NULL, 'k'},
- {"no-hv", no_argument, NULL, 'h'},
- {NULL, 0, NULL, 0 }
- };
- int c = getopt_long(argc, argv, "+:i:kuh",
- long_options, &option_index);
- if (c == -1)
- break;
+ dprintf("%p [%p]: PERF_EVENT_COMM: %s:%d\n",
+ (void *)(offset + head),
+ (void *)(long)(event->header.size),
+ event->comm.comm, event->comm.pid);
- switch (c) {
- case 'i': input_name = strdup(optarg); break;
- case 'k': show_mask &= ~SHOW_KERNEL; break;
- case 'u': show_mask &= ~SHOW_USER; break;
- case 'h': show_mask &= ~SHOW_HV; break;
- default: error = 1; break;
- }
+ if (thread == NULL ||
+ thread__set_comm(thread, event->comm.comm)) {
+ dprintf("problem processing PERF_EVENT_COMM, skipping event.\n");
+ return -1;
}
+ total_comm++;
- if (error)
- display_help();
+ return 0;
}
-int cmd_report(int argc, char **argv)
+/*
+ * Dispatch one event to its handler.
+ *
+ * Events flagged PERF_EVENT_MISC_OVERFLOW are handled as IP samples no
+ * matter what their type is; everything else is dispatched on
+ * header.type.
+ *
+ * Returns the handler's result, 0 for known types that are ignored on
+ * purpose, and -1 for an unknown type.
+ */
+static int
+process_event(event_t *event, unsigned long offset, unsigned long head)
{
+	if (event->header.misc & PERF_EVENT_MISC_OVERFLOW)
+		return process_overflow_event(event, offset, head);
+
+	switch (event->header.type) {
+	case PERF_EVENT_MMAP:
+		return process_mmap_event(event, offset, head);
+
+	case PERF_EVENT_COMM:
+		return process_comm_event(event, offset, head);
+
+	/*
+	 * We don't process them right now but they are fine:
+	 */
+	case PERF_EVENT_MUNMAP:
+	case PERF_EVENT_PERIOD:
+	case PERF_EVENT_THROTTLE:
+	case PERF_EVENT_UNTHROTTLE:
+		return 0;
+
+	default:
+		return -1;
+	}
+}
+
+static int __cmd_report(void)
+{
+ int ret, rc = EXIT_FAILURE;
unsigned long offset = 0;
unsigned long head = 0;
struct stat stat;
- char *buf;
event_t *event;
- int ret, rc = EXIT_FAILURE;
- unsigned long total = 0;
-
- page_size = getpagesize();
+ uint32_t size;
+ char *buf;
- process_options(argc, argv);
+ register_idle_thread();
input = open(input_name, O_RDONLY);
if (input < 0) {
exit(0);
}
- if (load_kallsyms() < 0) {
- perror("failed to open kallsyms");
+ if (load_kernel() < 0) {
+ perror("failed to load kernel symbols");
return EXIT_FAILURE;
}
+ if (!full_paths) {
+ if (getcwd(__cwd, sizeof(__cwd)) == NULL) {
+ perror("failed to get the current directory");
+ return EXIT_FAILURE;
+ }
+ cwdlen = strlen(cwd);
+ } else {
+ cwd = NULL;
+ cwdlen = 0;
+ }
remap:
buf = (char *)mmap(NULL, page_size * mmap_window, PROT_READ,
MAP_SHARED, input, offset);
more:
event = (event_t *)(buf + head);
+ size = event->header.size;
+ if (!size)
+ size = 8;
+
if (head + event->header.size >= page_size * mmap_window) {
unsigned long shift = page_size * (head / page_size);
int ret;
goto remap;
}
+ size = event->header.size;
- if (!event->header.size) {
- fprintf(stderr, "zero-sized event at file offset %ld\n", offset + head);
- fprintf(stderr, "skipping %ld bytes of events.\n", stat.st_size - offset - head);
- goto done;
- }
+ if (!size || process_event(event, offset, head) < 0) {
- head += event->header.size;
+ dprintf("%p [%p]: skipping unknown header type: %d\n",
+ (void *)(offset + head),
+ (void *)(long)(event->header.size),
+ event->header.type);
- if (event->header.misc & PERF_EVENT_MISC_OVERFLOW) {
- char level;
- int show = 0;
- struct dso *dso = NULL;
- struct thread *thread = threads__findnew(event->ip.pid);
+ total_unknown++;
- if (thread == NULL)
- goto done;
+ /*
+ * assume we lost track of the stream, check alignment, and
+ * increment a single u64 in the hope to catch on again 'soon'.
+ */
- if (event->header.misc & PERF_EVENT_MISC_KERNEL) {
- show = SHOW_KERNEL;
- level = 'k';
- dso = kernel_dso;
- } else if (event->header.misc & PERF_EVENT_MISC_USER) {
- show = SHOW_USER;
- level = '.';
- struct map *map = thread__find_map(thread, event->ip.ip);
- if (map != NULL)
- dso = map->dso;
- } else {
- show = SHOW_HV;
- level = 'H';
- }
+ if (unlikely(head & 7))
+ head &= ~7ULL;
- if (show & show_mask) {
- struct symbol *sym = dso__find_symbol(dso, event->ip.ip);
-
- if (thread__symbol_incnew(thread, sym, dso, level))
- goto done;
- }
- total++;
- } else switch (event->header.type) {
- case PERF_EVENT_MMAP: {
- struct thread *thread = threads__findnew(event->mmap.pid);
- struct map *map = map__new(&event->mmap);
-
- if (thread == NULL || map == NULL )
- goto done;
- thread__insert_map(thread, map);
- break;
+ size = 8;
}
- case PERF_EVENT_COMM: {
- struct thread *thread = threads__findnew(event->comm.pid);
- if (thread == NULL ||
- thread__set_comm(thread, event->comm.comm))
- goto done;
- break;
- }
- }
+ head += size;
if (offset + head < stat.st_size)
goto more;
rc = EXIT_SUCCESS;
-done:
close(input);
- //dsos__fprintf(stdout);
- threads__fprintf(stdout);
-#if 0
- std::map<std::string, int>::iterator hi = hist.begin();
- while (hi != hist.end()) {
- rev_hist.insert(std::pair<int, std::string>(hi->second, hi->first));
- hist.erase(hi++);
- }
+ dprintf(" IP events: %10ld\n", total);
+ dprintf(" mmap events: %10ld\n", total_mmap);
+ dprintf(" comm events: %10ld\n", total_comm);
+ dprintf(" unknown events: %10ld\n", total_unknown);
- std::multimap<int, std::string>::const_iterator ri = rev_hist.begin();
+ if (dump_trace)
+ return 0;
+
+ if (verbose >= 2)
+ dsos__fprintf(stdout);
+
+ collapse__resort();
+ output__resort();
+ output__fprintf(stdout, total);
- while (ri != rev_hist.end()) {
- printf(" %5.2f %s\n", (100.0 * ri->first)/total, ri->second.c_str());
- ri++;
- }
-#endif
return rc;
}
+static const char * const report_usage[] = {
+ "perf report [<options>] <command>",
+ NULL
+};
+
+/*
+ * Command line options of "perf report".  Each entry stores its value
+ * directly in the file-scope variable it names.
+ */
+static const struct option options[] = {
+	OPT_STRING('i', "input", &input_name, "file",
+		    "input file name"),
+	OPT_BOOLEAN('v', "verbose", &verbose,
+		    "be more verbose (show symbol address, etc)"),
+	OPT_BOOLEAN('D', "dump-raw-trace", &dump_trace,
+		    "dump raw trace in ASCII"),
+	OPT_STRING('k', "vmlinux", &vmlinux, "file", "vmlinux pathname"),
+	/* The advertised default must match default_sort_order. */
+	OPT_STRING('s', "sort", &sort_order, "key[,key2...]",
+		   "sort by key(s): pid, comm, dso, symbol. Default: comm,dso"),
+	OPT_BOOLEAN('P', "full-paths", &full_paths,
+		    "Don't shorten the pathnames taking into account the cwd"),
+	OPT_END()
+};
+
+/*
+ * Split sort_order on commas and spaces and register every key with
+ * sort_dimension__add().  An unknown key is reported and the usage text
+ * is shown via usage_with_options().
+ */
+static void setup_sorting(void)
+{
+	char *tmp, *tok, *str = strdup(sort_order);
+
+	/*
+	 * strtok_r() writes into its argument, hence the private copy.
+	 * Without one there is nothing to tokenize, and calling
+	 * strtok_r(NULL, ...) with an unset save pointer is undefined.
+	 */
+	if (str == NULL) {
+		error("Not enough memory to setup sort keys");
+		exit(-1);
+	}
+
+	for (tok = strtok_r(str, ", ", &tmp);
+			tok; tok = strtok_r(NULL, ", ", &tmp)) {
+		if (sort_dimension__add(tok) < 0) {
+			error("Unknown --sort key: `%s'", tok);
+			usage_with_options(report_usage, options);
+		}
+	}
+
+	free(str);
+}
+
+/*
+ * Entry point of "perf report": initialise the symbol code, parse the
+ * command line, register the sort keys, start the pager and run the
+ * report.  The result of __cmd_report() is passed through unchanged;
+ * @prefix is not used.
+ */
+int cmd_report(int argc, const char **argv, const char *prefix)
+{
+	int status;
+
+	symbol__init();
+
+	page_size = getpagesize();
+
+	parse_options(argc, argv, options, report_usage, 0);
+	setup_sorting();
+	setup_pager();
+
+	status = __cmd_report();
+
+	return status;
+}