4 #include "util/cache.h"
5 #include "util/symbol.h"
6 #include "util/thread.h"
7 #include "util/header.h"
9 #include "util/parse-options.h"
12 #include "util/debug.h"
14 #include "util/trace-event.h"
/* Path of the input file; opened read-only in __cmd_trace(). */
16 static char const *input_name = "perf.data";
/* System page size; assigned from getpagesize() in cmd_trace(). */
18 static unsigned long page_size;
/* Length of the mmap window over the input file, in pages: the mapping is page_size * mmap_window bytes. */
19 static unsigned long mmap_window = 32;
/* NOTE(review): no use of the two counters below is visible in this part of the file -- confirm they are still needed. */
21 static unsigned long total = 0;
22 static unsigned long total_comm = 0;
/* Root of the rb-tree of known threads; handed to threads__findnew() and register_idle_thread(). */
24 static struct rb_root threads;
/* Passed alongside 'threads' to the same helpers; presumably caches the last thread looked up -- confirm in util/thread.h. */
25 static struct thread *last_match;
/* Header of the input file, as returned by perf_header__read(). */
27 static struct perf_header *header;
/* Value of perf_header__sample_type(header); tested against PERF_SAMPLE_* bits when decoding sample events. */
28 static u64 sample_type;
32 process_comm_event(event_t *event, unsigned long offset, unsigned long head)
34 struct thread *thread;
36 thread = threads__findnew(event->comm.pid, &threads, &last_match);
38 dump_printf("%p [%p]: PERF_RECORD_COMM: %s:%d\n",
39 (void *)(offset + head),
40 (void *)(long)(event->header.size),
41 event->comm.comm, event->comm.pid);
44 thread__set_comm(thread, event->comm.comm)) {
45 dump_printf("problem processing PERF_RECORD_COMM, skipping event.\n");
54 process_sample_event(event_t *event, unsigned long offset, unsigned long head)
56 struct thread *thread;
57 u64 ip = event->ip.ip;
61 void *more_data = event->ip.__more_data;
63 thread = threads__findnew(event->ip.pid, &threads, &last_match);
65 if (sample_type & PERF_SAMPLE_TIME) {
66 timestamp = *(u64 *)more_data;
67 more_data += sizeof(u64);
70 if (sample_type & PERF_SAMPLE_CPU) {
71 cpu = *(u32 *)more_data;
72 more_data += sizeof(u32);
73 more_data += sizeof(u32); /* reserved */
76 if (sample_type & PERF_SAMPLE_PERIOD) {
77 period = *(u64 *)more_data;
78 more_data += sizeof(u64);
81 dump_printf("%p [%p]: PERF_RECORD_SAMPLE (IP, %d): %d/%d: %p period: %Ld\n",
82 (void *)(offset + head),
83 (void *)(long)(event->header.size),
85 event->ip.pid, event->ip.tid,
89 dump_printf(" ... thread: %s:%d\n", thread->comm, thread->pid);
92 eprintf("problem processing %d event, skipping it.\n",
97 if (sample_type & PERF_SAMPLE_RAW) {
104 * FIXME: better to resolve the pid from the struct trace_entry
105 * field, although it should be the same as this perf
108 print_event(cpu, raw->data, raw->size, timestamp, thread->comm);
116 process_event(event_t *event, unsigned long offset, unsigned long head)
120 switch (event->header.type) {
121 case PERF_RECORD_MMAP ... PERF_RECORD_LOST:
124 case PERF_RECORD_COMM:
125 return process_comm_event(event, offset, head);
127 case PERF_RECORD_EXIT ... PERF_RECORD_READ:
130 case PERF_RECORD_SAMPLE:
131 return process_sample_event(event, offset, head);
133 case PERF_RECORD_MAX:
141 static int __cmd_trace(void)
143 int ret, rc = EXIT_FAILURE;
144 unsigned long offset = 0;
145 unsigned long head = 0;
146 struct stat perf_stat;
152 register_idle_thread(&threads, &last_match);
154 input = open(input_name, O_RDONLY);
156 perror("failed to open file");
160 ret = fstat(input, &perf_stat);
162 perror("failed to stat file");
166 if (!perf_stat.st_size) {
167 fprintf(stderr, "zero-sized file, nothing to do!\n");
170 header = perf_header__read(input);
171 head = header->data_offset;
172 sample_type = perf_header__sample_type(header);
174 if (!(sample_type & PERF_SAMPLE_RAW))
175 die("No trace sample to read. Did you call perf record "
178 if (load_kernel() < 0) {
179 perror("failed to load kernel symbols");
184 buf = (char *)mmap(NULL, page_size * mmap_window, PROT_READ,
185 MAP_SHARED, input, offset);
186 if (buf == MAP_FAILED) {
187 perror("failed to mmap file");
192 event = (event_t *)(buf + head);
194 if (head + event->header.size >= page_size * mmap_window) {
195 unsigned long shift = page_size * (head / page_size);
198 res = munmap(buf, page_size * mmap_window);
206 size = event->header.size;
208 if (!size || process_event(event, offset, head) < 0) {
211 * assume we lost track of the stream, check alignment, and
212 * increment a single u64 in the hope to catch on again 'soon'.
215 if (unlikely(head & 7))
223 if (offset + head < (unsigned long)perf_stat.st_size)
232 static const char * const annotate_usage[] = {
233 "perf trace [<options>] <command>",
237 static const struct option options[] = {
238 OPT_BOOLEAN('D', "dump-raw-trace", &dump_trace,
239 "dump raw trace in ASCII"),
240 OPT_BOOLEAN('v', "verbose", &verbose,
241 "be more verbose (show symbol address, etc)"),
245 int cmd_trace(int argc, const char **argv, const char *prefix __used)
248 page_size = getpagesize();
250 argc = parse_options(argc, argv, options, annotate_usage, 0);
253 * Special case: if there's an argument left then assume that
254 * it's a symbol filter:
257 usage_with_options(annotate_usage, options);
262 return __cmd_trace();