1b3a0e9592
The callchains are fed with an array of a fixed size. As a result we iterate over each callchains three times: - 1st to resolve symbols - 2nd to filter out context boundaries - 3rd for the insertion into the tree This also involves some pairs of memory allocation/deallocation everytime we insert a callchain, for the filtered out array of addresses and for the array of symbols that comes along. Instead, feed the callchains through a linked list with persistent allocations. It brings several pros like: - Merge the 1st and 2nd iterations in one. That was possible before but in a way that would involve allocating an array slightly taller than necessary because we don't know in advance the number of context boundaries to filter out. - Much lesser allocations/deallocations. The linked list keeps persistent empty entries for the next usages and is extendable at will. - Makes it easier for multiple sources of callchains to feed a stacktrace together. This is deemed to pave the way for cfi based callchains wherein traditional frame pointer based kernel stacktraces will precede cfi based user ones, producing an overall callchain which size is hardly predictable. This requirement makes the static array obsolete and makes a linked list based iterator a much more flexible fit. Basic testing on a big perf file containing callchains (~ 176 MB) has shown a throughput gain of about 11% with perf report. Cc: Ingo Molnar <mingo@elte.hu> Cc: Paul Mackerras <paulus@samba.org> Cc: Peter Zijlstra <a.p.zijlstra@chello.nl> LKML-Reference: <1294977121-5700-2-git-send-email-fweisbec@gmail.com> Signed-off-by: Frederic Weisbecker <fweisbec@gmail.com> Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com>
152 lines
4.2 KiB
C
152 lines
4.2 KiB
C
#ifndef __PERF_HIST_H
|
|
#define __PERF_HIST_H
|
|
|
|
#include <linux/types.h>
|
|
#include "callchain.h"
|
|
|
|
extern struct callchain_param callchain_param;
|
|
|
|
struct hist_entry;
|
|
struct addr_location;
|
|
struct symbol;
|
|
struct rb_root;
|
|
|
|
struct objdump_line {
|
|
struct list_head node;
|
|
s64 offset;
|
|
char *line;
|
|
};
|
|
|
|
void objdump_line__free(struct objdump_line *self);
|
|
struct objdump_line *objdump__get_next_ip_line(struct list_head *head,
|
|
struct objdump_line *pos);
|
|
|
|
struct sym_hist {
|
|
u64 sum;
|
|
u64 ip[0];
|
|
};
|
|
|
|
struct sym_ext {
|
|
struct rb_node node;
|
|
double percent;
|
|
char *path;
|
|
};
|
|
|
|
struct sym_priv {
|
|
struct sym_hist *hist;
|
|
struct sym_ext *ext;
|
|
};
|
|
|
|
/*
|
|
* The kernel collects the number of events it couldn't send in a stretch and
|
|
* when possible sends this number in a PERF_RECORD_LOST event. The number of
|
|
* such "chunks" of lost events is stored in .nr_events[PERF_EVENT_LOST] while
|
|
* total_lost tells exactly how many events the kernel in fact lost, i.e. it is
|
|
* the sum of all struct lost_event.lost fields reported.
|
|
*
|
|
* The total_period is needed because by default auto-freq is used, so
|
|
* multipling nr_events[PERF_EVENT_SAMPLE] by a frequency isn't possible to get
|
|
* the total number of low level events, it is necessary to to sum all struct
|
|
* sample_event.period and stash the result in total_period.
|
|
*/
|
|
struct events_stats {
|
|
u64 total_period;
|
|
u64 total_lost;
|
|
u64 total_invalid_chains;
|
|
u32 nr_events[PERF_RECORD_HEADER_MAX];
|
|
u32 nr_unknown_events;
|
|
u32 nr_invalid_chains;
|
|
};
|
|
|
|
enum hist_column {
|
|
HISTC_SYMBOL,
|
|
HISTC_DSO,
|
|
HISTC_THREAD,
|
|
HISTC_COMM,
|
|
HISTC_PARENT,
|
|
HISTC_CPU,
|
|
HISTC_NR_COLS, /* Last entry */
|
|
};
|
|
|
|
struct hists {
|
|
struct rb_node rb_node;
|
|
struct rb_root entries;
|
|
u64 nr_entries;
|
|
struct events_stats stats;
|
|
u64 config;
|
|
u64 event_stream;
|
|
u32 type;
|
|
u16 col_len[HISTC_NR_COLS];
|
|
/* Best would be to reuse the session callchain cursor */
|
|
struct callchain_cursor callchain_cursor;
|
|
};
|
|
|
|
struct hist_entry *__hists__add_entry(struct hists *self,
|
|
struct addr_location *al,
|
|
struct symbol *parent, u64 period);
|
|
extern int64_t hist_entry__cmp(struct hist_entry *, struct hist_entry *);
|
|
extern int64_t hist_entry__collapse(struct hist_entry *, struct hist_entry *);
|
|
int hist_entry__fprintf(struct hist_entry *self, struct hists *hists,
|
|
struct hists *pair_hists, bool show_displacement,
|
|
long displacement, FILE *fp, u64 total);
|
|
int hist_entry__snprintf(struct hist_entry *self, char *bf, size_t size,
|
|
struct hists *hists, struct hists *pair_hists,
|
|
bool show_displacement, long displacement,
|
|
bool color, u64 total);
|
|
void hist_entry__free(struct hist_entry *);
|
|
|
|
void hists__output_resort(struct hists *self);
|
|
void hists__collapse_resort(struct hists *self);
|
|
|
|
void hists__inc_nr_events(struct hists *self, u32 type);
|
|
size_t hists__fprintf_nr_events(struct hists *self, FILE *fp);
|
|
|
|
size_t hists__fprintf(struct hists *self, struct hists *pair,
|
|
bool show_displacement, FILE *fp);
|
|
|
|
int hist_entry__inc_addr_samples(struct hist_entry *self, u64 ip);
|
|
int hist_entry__annotate(struct hist_entry *self, struct list_head *head,
|
|
size_t privsize);
|
|
|
|
void hists__filter_by_dso(struct hists *self, const struct dso *dso);
|
|
void hists__filter_by_thread(struct hists *self, const struct thread *thread);
|
|
|
|
u16 hists__col_len(struct hists *self, enum hist_column col);
|
|
void hists__set_col_len(struct hists *self, enum hist_column col, u16 len);
|
|
bool hists__new_col_len(struct hists *self, enum hist_column col, u16 len);
|
|
|
|
#ifdef NO_NEWT_SUPPORT
|
|
static inline int hists__browse(struct hists *self __used,
|
|
const char *helpline __used,
|
|
const char *ev_name __used)
|
|
{
|
|
return 0;
|
|
}
|
|
|
|
static inline int hists__tui_browse_tree(struct rb_root *self __used,
|
|
const char *help __used)
|
|
{
|
|
return 0;
|
|
}
|
|
|
|
static inline int hist_entry__tui_annotate(struct hist_entry *self __used)
|
|
{
|
|
return 0;
|
|
}
|
|
#define KEY_LEFT -1
|
|
#define KEY_RIGHT -2
|
|
#else
|
|
#include <newt.h>
|
|
int hists__browse(struct hists *self, const char *helpline,
|
|
const char *ev_name);
|
|
int hist_entry__tui_annotate(struct hist_entry *self);
|
|
|
|
#define KEY_LEFT NEWT_KEY_LEFT
|
|
#define KEY_RIGHT NEWT_KEY_RIGHT
|
|
|
|
int hists__tui_browse_tree(struct rb_root *self, const char *help);
|
|
#endif
|
|
|
|
unsigned int hists__sort_list_width(struct hists *self);
|
|
|
|
#endif /* __PERF_HIST_H */
|