blob: 810fc275ca65c95d69d2894249ad68f516759734 [file] [log] [blame]
Peter Zijlstrade9ac072009-04-08 15:01:31 +02001
2
Peter Zijlstra1a482f32009-05-23 18:28:58 +02003#include "perf.h"
Ingo Molnar16f762a2009-05-27 09:10:38 +02004#include "builtin.h"
Thomas Gleixner6eda5832009-05-01 18:29:57 +02005#include "util/util.h"
Ingo Molnar0e9b20b2009-05-26 09:17:18 +02006#include "util/parse-options.h"
Ingo Molnar8ad8db32009-05-26 11:10:09 +02007#include "util/parse-events.h"
Arnaldo Carvalho de Meloa0055ae2009-06-01 17:50:19 -03008#include "util/string.h"
Thomas Gleixner6eda5832009-05-01 18:29:57 +02009
Peter Zijlstrade9ac072009-04-08 15:01:31 +020010#include <sched.h>
Peter Zijlstrade9ac072009-04-08 15:01:31 +020011
/*
 * ALIGN(x, a) rounds x up to the next multiple of a.  The mask arithmetic
 * only yields a correct result when a is a power of two.  The alignment is
 * cast to the type of x so the mask has the same width as the value.
 *
 * __typeof__ is used instead of the bare typeof keyword so the macro also
 * compiles when the compiler is run in a strict ISO mode.
 */
#define ALIGN(x, a)		__ALIGN_MASK(x, (__typeof__(x))(a) - 1)
#define __ALIGN_MASK(x, mask)	(((x) + (mask)) & ~(mask))
Arnaldo Carvalho de Melo1a853e32009-05-14 22:50:46 -030014
Peter Zijlstrade9ac072009-04-08 15:01:31 +020015static int default_interval = 100000;
16static int event_count[MAX_COUNTERS];
Ingo Molnar8ad8db32009-05-26 11:10:09 +020017
Peter Zijlstrade9ac072009-04-08 15:01:31 +020018static int fd[MAX_NR_CPUS][MAX_COUNTERS];
19static int nr_cpus = 0;
20static unsigned int page_size;
21static unsigned int mmap_pages = 16;
22static int output;
Ingo Molnar23ac9cb2009-05-27 09:33:18 +020023static const char *output_name = "perf.data";
Peter Zijlstrade9ac072009-04-08 15:01:31 +020024static int group = 0;
Peter Zijlstra16c8a102009-05-05 17:50:27 +020025static unsigned int realtime_prio = 0;
26static int system_wide = 0;
Arnaldo Carvalho de Melo1a853e32009-05-14 22:50:46 -030027static pid_t target_pid = -1;
Peter Zijlstra16c8a102009-05-05 17:50:27 +020028static int inherit = 1;
29static int nmi = 1;
Peter Zijlstrade9ac072009-04-08 15:01:31 +020030
/*
 * Table of default sample counts.  Nothing in the visible part of this file
 * reads it; it has external linkage, so other translation units may.
 */
const unsigned int default_count[] = {
	1000000,
	1000000,
	  10000,
	  10000,
	1000000,
	  10000,
};
39
/*
 * Reader-side state for one counter's mmap()ed buffer.
 */
struct mmap_data {
	int		counter;	/* index of the counter this mapping belongs to */
	void		*base;		/* start of the mapping; data begins one page in */
	unsigned int	mask;		/* data area size in bytes, minus one */
	unsigned int	prev;		/* head position consumed by the last mmap_read() */
};
46
47static unsigned int mmap_read_head(struct mmap_data *md)
48{
49 struct perf_counter_mmap_page *pc = md->base;
50 int head;
51
52 head = pc->data_head;
53 rmb();
54
55 return head;
56}
57
58static long events;
59static struct timeval last_read, this_read;
60
61static void mmap_read(struct mmap_data *md)
62{
63 unsigned int head = mmap_read_head(md);
64 unsigned int old = md->prev;
65 unsigned char *data = md->base + page_size;
66 unsigned long size;
67 void *buf;
68 int diff;
69
70 gettimeofday(&this_read, NULL);
71
72 /*
73 * If we're further behind than half the buffer, there's a chance
74 * the writer will bite our tail and screw up the events under us.
75 *
76 * If we somehow ended up ahead of the head, we got messed up.
77 *
78 * In either case, truncate and restart at head.
79 */
80 diff = head - old;
81 if (diff > md->mask / 2 || diff < 0) {
82 struct timeval iv;
83 unsigned long msecs;
84
85 timersub(&this_read, &last_read, &iv);
86 msecs = iv.tv_sec*1000 + iv.tv_usec/1000;
87
88 fprintf(stderr, "WARNING: failed to keep up with mmap data."
89 " Last read %lu msecs ago.\n", msecs);
90
91 /*
92 * head points to a known good entry, start there.
93 */
94 old = head;
95 }
96
97 last_read = this_read;
98
99 if (old != head)
100 events++;
101
102 size = head - old;
103
104 if ((old & md->mask) + size != (head & md->mask)) {
105 buf = &data[old & md->mask];
106 size = md->mask + 1 - (old & md->mask);
107 old += size;
108 while (size) {
109 int ret = write(output, buf, size);
110 if (ret < 0) {
111 perror("failed to write");
112 exit(-1);
113 }
114 size -= ret;
115 buf += ret;
116 }
117 }
118
119 buf = &data[old & md->mask];
120 size = head - old;
121 old += size;
122 while (size) {
123 int ret = write(output, buf, size);
124 if (ret < 0) {
125 perror("failed to write");
126 exit(-1);
127 }
128 size -= ret;
129 buf += ret;
130 }
131
132 md->prev = old;
133}
134
/*
 * Set from the signal handler and polled by the main recording loop.
 * sig_atomic_t is the type the C standard guarantees can be written
 * safely from a signal handler.
 */
static volatile sig_atomic_t done = 0;

/* Signal handler: request termination of the recording loop. */
static void sig_handler(int sig)
{
	(void)sig;	/* every signal this is installed for means "stop" */
	done = 1;
}
141
Peter Zijlstra16c8a102009-05-05 17:50:27 +0200142static struct pollfd event_array[MAX_NR_CPUS * MAX_COUNTERS];
143static struct mmap_data mmap_array[MAX_NR_CPUS][MAX_COUNTERS];
144
145static int nr_poll;
146static int nr_cpu;
147
Arnaldo Carvalho de Melo1a853e32009-05-14 22:50:46 -0300148struct mmap_event {
Ingo Molnar16f762a2009-05-27 09:10:38 +0200149 struct perf_event_header header;
150 __u32 pid;
151 __u32 tid;
152 __u64 start;
153 __u64 len;
154 __u64 pgoff;
155 char filename[PATH_MAX];
Arnaldo Carvalho de Melo1a853e32009-05-14 22:50:46 -0300156};
Ingo Molnar16f762a2009-05-27 09:10:38 +0200157
Arnaldo Carvalho de Melo1a853e32009-05-14 22:50:46 -0300158struct comm_event {
Ingo Molnar16f762a2009-05-27 09:10:38 +0200159 struct perf_event_header header;
160 __u32 pid;
161 __u32 tid;
162 char comm[16];
Arnaldo Carvalho de Melo1a853e32009-05-14 22:50:46 -0300163};
164
Peter Zijlstraf70e87d2009-06-02 14:13:24 +0200165static void pid_synthesize_comm_event(pid_t pid, int full)
Arnaldo Carvalho de Melo1a853e32009-05-14 22:50:46 -0300166{
Arnaldo Carvalho de Melo1a853e32009-05-14 22:50:46 -0300167 struct comm_event comm_ev;
Ingo Molnar16f762a2009-05-27 09:10:38 +0200168 char filename[PATH_MAX];
Ingo Molnar16f762a2009-05-27 09:10:38 +0200169 char bf[BUFSIZ];
Arnaldo Carvalho de Meloa0055ae2009-06-01 17:50:19 -0300170 int fd, ret;
Arnaldo Carvalho de Melo1a853e32009-05-14 22:50:46 -0300171 size_t size;
Arnaldo Carvalho de Meloa0055ae2009-06-01 17:50:19 -0300172 char *field, *sep;
Peter Zijlstraf70e87d2009-06-02 14:13:24 +0200173 DIR *tasks;
174 struct dirent dirent, *next;
Arnaldo Carvalho de Melo1a853e32009-05-14 22:50:46 -0300175
176 snprintf(filename, sizeof(filename), "/proc/%d/stat", pid);
177
178 fd = open(filename, O_RDONLY);
179 if (fd < 0) {
180 fprintf(stderr, "couldn't open %s\n", filename);
181 exit(EXIT_FAILURE);
182 }
183 if (read(fd, bf, sizeof(bf)) < 0) {
184 fprintf(stderr, "couldn't read %s\n", filename);
185 exit(EXIT_FAILURE);
186 }
187 close(fd);
188
Arnaldo Carvalho de Meloa0055ae2009-06-01 17:50:19 -0300189 /* 9027 (cat) R 6747 9027 6747 34816 9027 ... */
Arnaldo Carvalho de Melo1a853e32009-05-14 22:50:46 -0300190 memset(&comm_ev, 0, sizeof(comm_ev));
Arnaldo Carvalho de Meloa0055ae2009-06-01 17:50:19 -0300191 field = strchr(bf, '(');
192 if (field == NULL)
193 goto out_failure;
194 sep = strchr(++field, ')');
195 if (sep == NULL)
196 goto out_failure;
197 size = sep - field;
198 memcpy(comm_ev.comm, field, size++);
Peter Zijlstraf70e87d2009-06-02 14:13:24 +0200199
200 comm_ev.pid = pid;
Arnaldo Carvalho de Melo1a853e32009-05-14 22:50:46 -0300201 comm_ev.header.type = PERF_EVENT_COMM;
Arnaldo Carvalho de Melo1a853e32009-05-14 22:50:46 -0300202 size = ALIGN(size, sizeof(uint64_t));
203 comm_ev.header.size = sizeof(comm_ev) - (sizeof(comm_ev.comm) - size);
Ingo Molnar16f762a2009-05-27 09:10:38 +0200204
Peter Zijlstraf70e87d2009-06-02 14:13:24 +0200205 if (!full) {
206 comm_ev.tid = pid;
207
208 ret = write(output, &comm_ev, comm_ev.header.size);
209 if (ret < 0) {
210 perror("failed to write");
211 exit(-1);
212 }
213 return;
Arnaldo Carvalho de Melo1a853e32009-05-14 22:50:46 -0300214 }
Peter Zijlstraf70e87d2009-06-02 14:13:24 +0200215
216 snprintf(filename, sizeof(filename), "/proc/%d/task", pid);
217
218 tasks = opendir(filename);
219 while (!readdir_r(tasks, &dirent, &next) && next) {
220 char *end;
221 pid = strtol(dirent.d_name, &end, 10);
222 if (*end)
223 continue;
224
225 comm_ev.tid = pid;
226
227 ret = write(output, &comm_ev, comm_ev.header.size);
228 if (ret < 0) {
229 perror("failed to write");
230 exit(-1);
231 }
232 }
233 closedir(tasks);
234 return;
235
Arnaldo Carvalho de Meloa0055ae2009-06-01 17:50:19 -0300236out_failure:
237 fprintf(stderr, "couldn't get COMM and pgid, malformed %s\n",
238 filename);
239 exit(EXIT_FAILURE);
Arnaldo Carvalho de Melo1a853e32009-05-14 22:50:46 -0300240}
241
Peter Zijlstraf70e87d2009-06-02 14:13:24 +0200242static void pid_synthesize_mmap_events(pid_t pid)
Arnaldo Carvalho de Melo1a853e32009-05-14 22:50:46 -0300243{
244 char filename[PATH_MAX];
245 FILE *fp;
246
247 snprintf(filename, sizeof(filename), "/proc/%d/maps", pid);
248
249 fp = fopen(filename, "r");
250 if (fp == NULL) {
251 fprintf(stderr, "couldn't open %s\n", filename);
252 exit(EXIT_FAILURE);
253 }
254 while (1) {
Arnaldo Carvalho de Meloa0055ae2009-06-01 17:50:19 -0300255 char bf[BUFSIZ], *pbf = bf;
Arnaldo Carvalho de Melo1a853e32009-05-14 22:50:46 -0300256 struct mmap_event mmap_ev = {
257 .header.type = PERF_EVENT_MMAP,
258 };
Arnaldo Carvalho de Meloa0055ae2009-06-01 17:50:19 -0300259 int n;
Arnaldo Carvalho de Melo1a853e32009-05-14 22:50:46 -0300260 size_t size;
261 if (fgets(bf, sizeof(bf), fp) == NULL)
262 break;
263
264 /* 00400000-0040c000 r-xp 00000000 fd:01 41038 /bin/cat */
Arnaldo Carvalho de Meloa0055ae2009-06-01 17:50:19 -0300265 n = hex2u64(pbf, &mmap_ev.start);
266 if (n < 0)
267 continue;
268 pbf += n + 1;
269 n = hex2u64(pbf, &mmap_ev.len);
270 if (n < 0)
271 continue;
272 pbf += n + 3;
273 if (*pbf == 'x') { /* vm_exec */
Arnaldo Carvalho de Melo1a853e32009-05-14 22:50:46 -0300274 char *execname = strrchr(bf, ' ');
275
276 if (execname == NULL || execname[1] != '/')
277 continue;
278
279 execname += 1;
280 size = strlen(execname);
281 execname[size - 1] = '\0'; /* Remove \n */
282 memcpy(mmap_ev.filename, execname, size);
283 size = ALIGN(size, sizeof(uint64_t));
284 mmap_ev.len -= mmap_ev.start;
285 mmap_ev.header.size = (sizeof(mmap_ev) -
286 (sizeof(mmap_ev.filename) - size));
Peter Zijlstraf70e87d2009-06-02 14:13:24 +0200287 mmap_ev.pid = pid;
Arnaldo Carvalho de Melo1a853e32009-05-14 22:50:46 -0300288 mmap_ev.tid = pid;
289
290 if (write(output, &mmap_ev, mmap_ev.header.size) < 0) {
291 perror("failed to write");
292 exit(-1);
293 }
294 }
295 }
296
297 fclose(fp);
298}
299
/*
 * Walk /proc and synthesize comm and mmap records for every task that has
 * a purely numeric directory entry there.
 *
 * Failure to open /proc is fatal, like the other /proc failures in this
 * file; previously the NULL handle was passed straight to readdir_r().
 */
static void synthesize_events(void)
{
	DIR *proc;
	struct dirent dirent, *next;

	proc = opendir("/proc");
	if (proc == NULL) {
		fprintf(stderr, "couldn't open %s\n", "/proc");
		exit(EXIT_FAILURE);
	}

	while (!readdir_r(proc, &dirent, &next) && next) {
		char *end;
		pid_t pid;

		pid = strtol(dirent.d_name, &end, 10);
		if (*end) /* only interested in proper numerical dirents */
			continue;

		pid_synthesize_comm_event(pid, 1);
		pid_synthesize_mmap_events(pid);
	}

	closedir(proc);
}
321
Arnaldo Carvalho de Melo1a853e32009-05-14 22:50:46 -0300322static void open_counters(int cpu, pid_t pid)
Peter Zijlstrade9ac072009-04-08 15:01:31 +0200323{
Peter Zijlstrade9ac072009-04-08 15:01:31 +0200324 struct perf_counter_hw_event hw_event;
Peter Zijlstra16c8a102009-05-05 17:50:27 +0200325 int counter, group_fd;
326 int track = 1;
Peter Zijlstra16c8a102009-05-05 17:50:27 +0200327
Arnaldo Carvalho de Melo1a853e32009-05-14 22:50:46 -0300328 if (pid > 0) {
Peter Zijlstraf70e87d2009-06-02 14:13:24 +0200329 pid_synthesize_comm_event(pid, 0);
330 pid_synthesize_mmap_events(pid);
Arnaldo Carvalho de Melo1a853e32009-05-14 22:50:46 -0300331 }
Peter Zijlstra16c8a102009-05-05 17:50:27 +0200332
333 group_fd = -1;
334 for (counter = 0; counter < nr_counters; counter++) {
335
336 memset(&hw_event, 0, sizeof(hw_event));
337 hw_event.config = event_id[counter];
338 hw_event.irq_period = event_count[counter];
339 hw_event.record_type = PERF_RECORD_IP | PERF_RECORD_TID;
340 hw_event.nmi = nmi;
341 hw_event.mmap = track;
342 hw_event.comm = track;
343 hw_event.inherit = (cpu < 0) && inherit;
344
345 track = 0; // only the first counter needs these
346
347 fd[nr_cpu][counter] =
348 sys_perf_counter_open(&hw_event, pid, cpu, group_fd, 0);
349
350 if (fd[nr_cpu][counter] < 0) {
351 int err = errno;
352 printf("kerneltop error: syscall returned with %d (%s)\n",
353 fd[nr_cpu][counter], strerror(err));
354 if (err == EPERM)
355 printf("Are you root?\n");
356 exit(-1);
357 }
358 assert(fd[nr_cpu][counter] >= 0);
359 fcntl(fd[nr_cpu][counter], F_SETFL, O_NONBLOCK);
360
361 /*
362 * First counter acts as the group leader:
363 */
364 if (group && group_fd == -1)
365 group_fd = fd[nr_cpu][counter];
366
367 event_array[nr_poll].fd = fd[nr_cpu][counter];
368 event_array[nr_poll].events = POLLIN;
369 nr_poll++;
370
371 mmap_array[nr_cpu][counter].counter = counter;
372 mmap_array[nr_cpu][counter].prev = 0;
373 mmap_array[nr_cpu][counter].mask = mmap_pages*page_size - 1;
374 mmap_array[nr_cpu][counter].base = mmap(NULL, (mmap_pages+1)*page_size,
375 PROT_READ, MAP_SHARED, fd[nr_cpu][counter], 0);
376 if (mmap_array[nr_cpu][counter].base == MAP_FAILED) {
377 printf("kerneltop error: failed to mmap with %d (%s)\n",
378 errno, strerror(errno));
379 exit(-1);
380 }
381 }
382 nr_cpu++;
383}
384
Ingo Molnar0e9b20b2009-05-26 09:17:18 +0200385static int __cmd_record(int argc, const char **argv)
Peter Zijlstra16c8a102009-05-05 17:50:27 +0200386{
387 int i, counter;
Peter Zijlstrade9ac072009-04-08 15:01:31 +0200388 pid_t pid;
389 int ret;
390
391 page_size = sysconf(_SC_PAGE_SIZE);
Peter Zijlstrade9ac072009-04-08 15:01:31 +0200392 nr_cpus = sysconf(_SC_NPROCESSORS_ONLN);
393 assert(nr_cpus <= MAX_NR_CPUS);
394 assert(nr_cpus >= 0);
395
Peter Zijlstraf70e87d2009-06-02 14:13:24 +0200396 output = open(output_name, O_CREAT|O_EXCL|O_TRUNC|O_RDWR, S_IRUSR|S_IWUSR);
Peter Zijlstrade9ac072009-04-08 15:01:31 +0200397 if (output < 0) {
398 perror("failed to create output file");
399 exit(-1);
400 }
401
Arnaldo Carvalho de Melo1a853e32009-05-14 22:50:46 -0300402 if (!system_wide) {
403 open_counters(-1, target_pid != -1 ? target_pid : 0);
404 } else for (i = 0; i < nr_cpus; i++)
405 open_counters(i, target_pid);
Peter Zijlstrade9ac072009-04-08 15:01:31 +0200406
Peter Zijlstra16c8a102009-05-05 17:50:27 +0200407 signal(SIGCHLD, sig_handler);
408 signal(SIGINT, sig_handler);
Peter Zijlstrade9ac072009-04-08 15:01:31 +0200409
Mike Galbraithef65b2a2009-05-27 10:10:51 +0200410 if (target_pid == -1 && argc) {
Arnaldo Carvalho de Melo1a853e32009-05-14 22:50:46 -0300411 pid = fork();
412 if (pid < 0)
413 perror("failed to fork");
Peter Zijlstrade9ac072009-04-08 15:01:31 +0200414
Arnaldo Carvalho de Melo1a853e32009-05-14 22:50:46 -0300415 if (!pid) {
Ingo Molnar0e9b20b2009-05-26 09:17:18 +0200416 if (execvp(argv[0], (char **)argv)) {
Arnaldo Carvalho de Melo1a853e32009-05-14 22:50:46 -0300417 perror(argv[0]);
418 exit(-1);
419 }
Peter Zijlstrade9ac072009-04-08 15:01:31 +0200420 }
421 }
422
423 if (realtime_prio) {
424 struct sched_param param;
425
426 param.sched_priority = realtime_prio;
427 if (sched_setscheduler(0, SCHED_FIFO, &param)) {
428 printf("Could not set realtime priority.\n");
429 exit(-1);
430 }
431 }
432
Peter Zijlstraf70e87d2009-06-02 14:13:24 +0200433 if (system_wide)
434 synthesize_events();
Peter Zijlstrade9ac072009-04-08 15:01:31 +0200435
436 while (!done) {
437 int hits = events;
438
Peter Zijlstra16c8a102009-05-05 17:50:27 +0200439 for (i = 0; i < nr_cpu; i++) {
Peter Zijlstrade9ac072009-04-08 15:01:31 +0200440 for (counter = 0; counter < nr_counters; counter++)
441 mmap_read(&mmap_array[i][counter]);
442 }
443
444 if (hits == events)
445 ret = poll(event_array, nr_poll, 100);
446 }
447
448 return 0;
449}
Ingo Molnar0e9b20b2009-05-26 09:17:18 +0200450
/* NULL-terminated list of usage lines passed to the option parser. */
static const char * const record_usage[] = {
	"perf record [<options>] [<command>]",
	"perf record [<options>] -- <command> [<options>]",
	NULL
};
456
Ingo Molnar8ad8db32009-05-26 11:10:09 +0200457static char events_help_msg[EVENTS_HELP_MAX];
458
Ingo Molnar52425192009-05-26 09:17:18 +0200459static const struct option options[] = {
Ingo Molnar0e9b20b2009-05-26 09:17:18 +0200460 OPT_CALLBACK('e', "event", NULL, "event",
Ingo Molnar8ad8db32009-05-26 11:10:09 +0200461 events_help_msg, parse_events),
Ingo Molnar0e9b20b2009-05-26 09:17:18 +0200462 OPT_INTEGER('c', "count", &default_interval,
463 "event period to sample"),
464 OPT_INTEGER('m', "mmap-pages", &mmap_pages,
465 "number of mmap data pages"),
466 OPT_STRING('o', "output", &output_name, "file",
467 "output file name"),
468 OPT_BOOLEAN('i', "inherit", &inherit,
469 "child tasks inherit counters"),
470 OPT_INTEGER('p', "pid", &target_pid,
471 "record events on existing pid"),
472 OPT_INTEGER('r', "realtime", &realtime_prio,
473 "collect data with this RT SCHED_FIFO priority"),
474 OPT_BOOLEAN('a', "all-cpus", &system_wide,
475 "system-wide collection from all CPUs"),
476 OPT_END()
477};
478
479int cmd_record(int argc, const char **argv, const char *prefix)
480{
481 int counter;
482
Ingo Molnar8ad8db32009-05-26 11:10:09 +0200483 create_events_help(events_help_msg);
Ingo Molnar0e9b20b2009-05-26 09:17:18 +0200484
485 argc = parse_options(argc, argv, options, record_usage, 0);
Mike Galbraithef65b2a2009-05-27 10:10:51 +0200486 if (!argc && target_pid == -1 && !system_wide)
Ingo Molnar0e9b20b2009-05-26 09:17:18 +0200487 usage_with_options(record_usage, options);
488
489 if (!nr_counters) {
490 nr_counters = 1;
491 event_id[0] = 0;
492 }
493
494 for (counter = 0; counter < nr_counters; counter++) {
495 if (event_count[counter])
496 continue;
497
498 event_count[counter] = default_interval;
499 }
500
501 return __cmd_record(argc, argv);
502}