blob: 9c151ded22fabc74a5209660786628288d8bc6cb [file] [log] [blame]
Peter Zijlstrade9ac072009-04-08 15:01:31 +02001
2
Peter Zijlstra1a482f32009-05-23 18:28:58 +02003#include "perf.h"
Ingo Molnar16f762a2009-05-27 09:10:38 +02004#include "builtin.h"
Thomas Gleixner6eda5832009-05-01 18:29:57 +02005#include "util/util.h"
Ingo Molnar0e9b20b2009-05-26 09:17:18 +02006#include "util/parse-options.h"
Ingo Molnar8ad8db32009-05-26 11:10:09 +02007#include "util/parse-events.h"
Arnaldo Carvalho de Meloa0055ae2009-06-01 17:50:19 -03008#include "util/string.h"
Thomas Gleixner6eda5832009-05-01 18:29:57 +02009
Peter Zijlstrade9ac072009-04-08 15:01:31 +020010#include <sched.h>
Peter Zijlstrade9ac072009-04-08 15:01:31 +020011
/*
 * ALIGN(x, a): round x up to the next multiple of a.
 *
 * The mask arithmetic only works when a is a power of two.  The mask is
 * cast to the type of x so the whole computation happens at x's width.
 * __typeof__ is spelled with underscores so the macro also builds in
 * strict ISO modes (-std=c99 / -std=c11), where plain typeof is disabled.
 */
#define __ALIGN_MASK(x, mask)	(((x) + (mask)) & ~(mask))
#define ALIGN(x, a)		__ALIGN_MASK(x, (__typeof__(x))(a) - 1)
Arnaldo Carvalho de Melo1a853e32009-05-14 22:50:46 -030014
Peter Zijlstrade9ac072009-04-08 15:01:31 +020015static int default_interval = 100000;
16static int event_count[MAX_COUNTERS];
Ingo Molnar8ad8db32009-05-26 11:10:09 +020017
Peter Zijlstrade9ac072009-04-08 15:01:31 +020018static int fd[MAX_NR_CPUS][MAX_COUNTERS];
19static int nr_cpus = 0;
20static unsigned int page_size;
21static unsigned int mmap_pages = 16;
22static int output;
Ingo Molnar23ac9cb2009-05-27 09:33:18 +020023static const char *output_name = "perf.data";
Peter Zijlstrade9ac072009-04-08 15:01:31 +020024static int group = 0;
Peter Zijlstra16c8a102009-05-05 17:50:27 +020025static unsigned int realtime_prio = 0;
26static int system_wide = 0;
Arnaldo Carvalho de Melo1a853e32009-05-14 22:50:46 -030027static pid_t target_pid = -1;
Peter Zijlstra16c8a102009-05-05 17:50:27 +020028static int inherit = 1;
29static int nmi = 1;
Peter Zijlstrade9ac072009-04-08 15:01:31 +020030
/*
 * Table of six default count values.  It has external linkage and is not
 * referenced from the visible part of this file.
 */
const unsigned int default_count[] = {
	[0] = 1000000,
	[1] = 1000000,
	[2] =   10000,
	[3] =   10000,
	[4] = 1000000,
	[5] =   10000,
};
39
/* Reader-side state for the mmap()ed buffer of one counter. */
struct mmap_data {
	int		counter;	/* index of the counter this mapping belongs to */
	void		*base;		/* address returned by mmap(); data starts one page in */
	unsigned int	mask;		/* size of the data area in bytes, minus one */
	unsigned int	prev;		/* head position up to which data was already written out */
};
46
47static unsigned int mmap_read_head(struct mmap_data *md)
48{
49 struct perf_counter_mmap_page *pc = md->base;
50 int head;
51
52 head = pc->data_head;
53 rmb();
54
55 return head;
56}
57
/* Incremented by every mmap_read() call that found new data to copy. */
static long events;

/* Start time of the previous and of the current mmap_read() call. */
static struct timeval last_read;
static struct timeval this_read;
60
61static void mmap_read(struct mmap_data *md)
62{
63 unsigned int head = mmap_read_head(md);
64 unsigned int old = md->prev;
65 unsigned char *data = md->base + page_size;
66 unsigned long size;
67 void *buf;
68 int diff;
69
70 gettimeofday(&this_read, NULL);
71
72 /*
73 * If we're further behind than half the buffer, there's a chance
74 * the writer will bite our tail and screw up the events under us.
75 *
76 * If we somehow ended up ahead of the head, we got messed up.
77 *
78 * In either case, truncate and restart at head.
79 */
80 diff = head - old;
81 if (diff > md->mask / 2 || diff < 0) {
82 struct timeval iv;
83 unsigned long msecs;
84
85 timersub(&this_read, &last_read, &iv);
86 msecs = iv.tv_sec*1000 + iv.tv_usec/1000;
87
88 fprintf(stderr, "WARNING: failed to keep up with mmap data."
89 " Last read %lu msecs ago.\n", msecs);
90
91 /*
92 * head points to a known good entry, start there.
93 */
94 old = head;
95 }
96
97 last_read = this_read;
98
99 if (old != head)
100 events++;
101
102 size = head - old;
103
104 if ((old & md->mask) + size != (head & md->mask)) {
105 buf = &data[old & md->mask];
106 size = md->mask + 1 - (old & md->mask);
107 old += size;
108 while (size) {
109 int ret = write(output, buf, size);
110 if (ret < 0) {
111 perror("failed to write");
112 exit(-1);
113 }
114 size -= ret;
115 buf += ret;
116 }
117 }
118
119 buf = &data[old & md->mask];
120 size = head - old;
121 old += size;
122 while (size) {
123 int ret = write(output, buf, size);
124 if (ret < 0) {
125 perror("failed to write");
126 exit(-1);
127 }
128 size -= ret;
129 buf += ret;
130 }
131
132 md->prev = old;
133}
134
/*
 * Set by sig_handler() and polled by the main record loop.  It is written
 * from a signal handler, hence volatile sig_atomic_t.
 */
static volatile sig_atomic_t done = 0;

/*
 * Signal handler: request termination of the record loop.
 * @sig is ignored; every signal this is installed for gets the same action.
 */
static void sig_handler(int sig)
{
	(void)sig;
	done = 1;
}
141
Peter Zijlstra16c8a102009-05-05 17:50:27 +0200142static struct pollfd event_array[MAX_NR_CPUS * MAX_COUNTERS];
143static struct mmap_data mmap_array[MAX_NR_CPUS][MAX_COUNTERS];
144
145static int nr_poll;
146static int nr_cpu;
147
Arnaldo Carvalho de Melo1a853e32009-05-14 22:50:46 -0300148struct mmap_event {
Ingo Molnar16f762a2009-05-27 09:10:38 +0200149 struct perf_event_header header;
150 __u32 pid;
151 __u32 tid;
152 __u64 start;
153 __u64 len;
154 __u64 pgoff;
155 char filename[PATH_MAX];
Arnaldo Carvalho de Melo1a853e32009-05-14 22:50:46 -0300156};
Ingo Molnar16f762a2009-05-27 09:10:38 +0200157
Arnaldo Carvalho de Melo1a853e32009-05-14 22:50:46 -0300158struct comm_event {
Ingo Molnar16f762a2009-05-27 09:10:38 +0200159 struct perf_event_header header;
160 __u32 pid;
161 __u32 tid;
162 char comm[16];
Arnaldo Carvalho de Melo1a853e32009-05-14 22:50:46 -0300163};
164
165static pid_t pid_synthesize_comm_event(pid_t pid)
166{
Arnaldo Carvalho de Melo1a853e32009-05-14 22:50:46 -0300167 struct comm_event comm_ev;
Ingo Molnar16f762a2009-05-27 09:10:38 +0200168 char filename[PATH_MAX];
Ingo Molnar16f762a2009-05-27 09:10:38 +0200169 char bf[BUFSIZ];
Arnaldo Carvalho de Meloa0055ae2009-06-01 17:50:19 -0300170 int fd, ret;
Arnaldo Carvalho de Melo1a853e32009-05-14 22:50:46 -0300171 size_t size;
Arnaldo Carvalho de Meloa0055ae2009-06-01 17:50:19 -0300172 char *field, *sep;
Arnaldo Carvalho de Melo1a853e32009-05-14 22:50:46 -0300173
174 snprintf(filename, sizeof(filename), "/proc/%d/stat", pid);
175
176 fd = open(filename, O_RDONLY);
177 if (fd < 0) {
178 fprintf(stderr, "couldn't open %s\n", filename);
179 exit(EXIT_FAILURE);
180 }
181 if (read(fd, bf, sizeof(bf)) < 0) {
182 fprintf(stderr, "couldn't read %s\n", filename);
183 exit(EXIT_FAILURE);
184 }
185 close(fd);
186
Arnaldo Carvalho de Meloa0055ae2009-06-01 17:50:19 -0300187 /* 9027 (cat) R 6747 9027 6747 34816 9027 ... */
Arnaldo Carvalho de Melo1a853e32009-05-14 22:50:46 -0300188 memset(&comm_ev, 0, sizeof(comm_ev));
Arnaldo Carvalho de Meloa0055ae2009-06-01 17:50:19 -0300189 field = strchr(bf, '(');
190 if (field == NULL)
191 goto out_failure;
192 sep = strchr(++field, ')');
193 if (sep == NULL)
194 goto out_failure;
195 size = sep - field;
196 memcpy(comm_ev.comm, field, size++);
197 field = strchr(sep + 4, ' ');
198 if (field == NULL)
199 goto out_failure;
200 comm_ev.pid = atoi(++field);
Arnaldo Carvalho de Melo1a853e32009-05-14 22:50:46 -0300201 comm_ev.header.type = PERF_EVENT_COMM;
202 comm_ev.tid = pid;
Arnaldo Carvalho de Melo1a853e32009-05-14 22:50:46 -0300203 size = ALIGN(size, sizeof(uint64_t));
204 comm_ev.header.size = sizeof(comm_ev) - (sizeof(comm_ev.comm) - size);
Ingo Molnar16f762a2009-05-27 09:10:38 +0200205
206 ret = write(output, &comm_ev, comm_ev.header.size);
Arnaldo Carvalho de Melo1a853e32009-05-14 22:50:46 -0300207 if (ret < 0) {
208 perror("failed to write");
209 exit(-1);
210 }
211 return comm_ev.pid;
Arnaldo Carvalho de Meloa0055ae2009-06-01 17:50:19 -0300212out_failure:
213 fprintf(stderr, "couldn't get COMM and pgid, malformed %s\n",
214 filename);
215 exit(EXIT_FAILURE);
216 return -1;
Arnaldo Carvalho de Melo1a853e32009-05-14 22:50:46 -0300217}
218
219static void pid_synthesize_mmap_events(pid_t pid, pid_t pgid)
220{
221 char filename[PATH_MAX];
222 FILE *fp;
223
224 snprintf(filename, sizeof(filename), "/proc/%d/maps", pid);
225
226 fp = fopen(filename, "r");
227 if (fp == NULL) {
228 fprintf(stderr, "couldn't open %s\n", filename);
229 exit(EXIT_FAILURE);
230 }
231 while (1) {
Arnaldo Carvalho de Meloa0055ae2009-06-01 17:50:19 -0300232 char bf[BUFSIZ], *pbf = bf;
Arnaldo Carvalho de Melo1a853e32009-05-14 22:50:46 -0300233 struct mmap_event mmap_ev = {
234 .header.type = PERF_EVENT_MMAP,
235 };
Arnaldo Carvalho de Meloa0055ae2009-06-01 17:50:19 -0300236 int n;
Arnaldo Carvalho de Melo1a853e32009-05-14 22:50:46 -0300237 size_t size;
238 if (fgets(bf, sizeof(bf), fp) == NULL)
239 break;
240
241 /* 00400000-0040c000 r-xp 00000000 fd:01 41038 /bin/cat */
Arnaldo Carvalho de Meloa0055ae2009-06-01 17:50:19 -0300242 n = hex2u64(pbf, &mmap_ev.start);
243 if (n < 0)
244 continue;
245 pbf += n + 1;
246 n = hex2u64(pbf, &mmap_ev.len);
247 if (n < 0)
248 continue;
249 pbf += n + 3;
250 if (*pbf == 'x') { /* vm_exec */
Arnaldo Carvalho de Melo1a853e32009-05-14 22:50:46 -0300251 char *execname = strrchr(bf, ' ');
252
253 if (execname == NULL || execname[1] != '/')
254 continue;
255
256 execname += 1;
257 size = strlen(execname);
258 execname[size - 1] = '\0'; /* Remove \n */
259 memcpy(mmap_ev.filename, execname, size);
260 size = ALIGN(size, sizeof(uint64_t));
261 mmap_ev.len -= mmap_ev.start;
262 mmap_ev.header.size = (sizeof(mmap_ev) -
263 (sizeof(mmap_ev.filename) - size));
264 mmap_ev.pid = pgid;
265 mmap_ev.tid = pid;
266
267 if (write(output, &mmap_ev, mmap_ev.header.size) < 0) {
268 perror("failed to write");
269 exit(-1);
270 }
271 }
272 }
273
274 fclose(fp);
275}
276
277static void open_counters(int cpu, pid_t pid)
Peter Zijlstrade9ac072009-04-08 15:01:31 +0200278{
Peter Zijlstrade9ac072009-04-08 15:01:31 +0200279 struct perf_counter_hw_event hw_event;
Peter Zijlstra16c8a102009-05-05 17:50:27 +0200280 int counter, group_fd;
281 int track = 1;
Peter Zijlstra16c8a102009-05-05 17:50:27 +0200282
Arnaldo Carvalho de Melo1a853e32009-05-14 22:50:46 -0300283 if (pid > 0) {
284 pid_t pgid = pid_synthesize_comm_event(pid);
285 pid_synthesize_mmap_events(pid, pgid);
286 }
Peter Zijlstra16c8a102009-05-05 17:50:27 +0200287
288 group_fd = -1;
289 for (counter = 0; counter < nr_counters; counter++) {
290
291 memset(&hw_event, 0, sizeof(hw_event));
292 hw_event.config = event_id[counter];
293 hw_event.irq_period = event_count[counter];
294 hw_event.record_type = PERF_RECORD_IP | PERF_RECORD_TID;
295 hw_event.nmi = nmi;
296 hw_event.mmap = track;
297 hw_event.comm = track;
298 hw_event.inherit = (cpu < 0) && inherit;
299
300 track = 0; // only the first counter needs these
301
302 fd[nr_cpu][counter] =
303 sys_perf_counter_open(&hw_event, pid, cpu, group_fd, 0);
304
305 if (fd[nr_cpu][counter] < 0) {
306 int err = errno;
307 printf("kerneltop error: syscall returned with %d (%s)\n",
308 fd[nr_cpu][counter], strerror(err));
309 if (err == EPERM)
310 printf("Are you root?\n");
311 exit(-1);
312 }
313 assert(fd[nr_cpu][counter] >= 0);
314 fcntl(fd[nr_cpu][counter], F_SETFL, O_NONBLOCK);
315
316 /*
317 * First counter acts as the group leader:
318 */
319 if (group && group_fd == -1)
320 group_fd = fd[nr_cpu][counter];
321
322 event_array[nr_poll].fd = fd[nr_cpu][counter];
323 event_array[nr_poll].events = POLLIN;
324 nr_poll++;
325
326 mmap_array[nr_cpu][counter].counter = counter;
327 mmap_array[nr_cpu][counter].prev = 0;
328 mmap_array[nr_cpu][counter].mask = mmap_pages*page_size - 1;
329 mmap_array[nr_cpu][counter].base = mmap(NULL, (mmap_pages+1)*page_size,
330 PROT_READ, MAP_SHARED, fd[nr_cpu][counter], 0);
331 if (mmap_array[nr_cpu][counter].base == MAP_FAILED) {
332 printf("kerneltop error: failed to mmap with %d (%s)\n",
333 errno, strerror(errno));
334 exit(-1);
335 }
336 }
337 nr_cpu++;
338}
339
Ingo Molnar0e9b20b2009-05-26 09:17:18 +0200340static int __cmd_record(int argc, const char **argv)
Peter Zijlstra16c8a102009-05-05 17:50:27 +0200341{
342 int i, counter;
Peter Zijlstrade9ac072009-04-08 15:01:31 +0200343 pid_t pid;
344 int ret;
345
346 page_size = sysconf(_SC_PAGE_SIZE);
Peter Zijlstrade9ac072009-04-08 15:01:31 +0200347 nr_cpus = sysconf(_SC_NPROCESSORS_ONLN);
348 assert(nr_cpus <= MAX_NR_CPUS);
349 assert(nr_cpus >= 0);
350
Mike Galbraith229c4ee2009-05-28 16:28:53 +0200351 output = open(output_name, O_CREAT|O_EXCL|O_RDWR, S_IRWXU);
Peter Zijlstrade9ac072009-04-08 15:01:31 +0200352 if (output < 0) {
353 perror("failed to create output file");
354 exit(-1);
355 }
356
Arnaldo Carvalho de Melo1a853e32009-05-14 22:50:46 -0300357 if (!system_wide) {
358 open_counters(-1, target_pid != -1 ? target_pid : 0);
359 } else for (i = 0; i < nr_cpus; i++)
360 open_counters(i, target_pid);
Peter Zijlstrade9ac072009-04-08 15:01:31 +0200361
Peter Zijlstra16c8a102009-05-05 17:50:27 +0200362 signal(SIGCHLD, sig_handler);
363 signal(SIGINT, sig_handler);
Peter Zijlstrade9ac072009-04-08 15:01:31 +0200364
Mike Galbraithef65b2a2009-05-27 10:10:51 +0200365 if (target_pid == -1 && argc) {
Arnaldo Carvalho de Melo1a853e32009-05-14 22:50:46 -0300366 pid = fork();
367 if (pid < 0)
368 perror("failed to fork");
Peter Zijlstrade9ac072009-04-08 15:01:31 +0200369
Arnaldo Carvalho de Melo1a853e32009-05-14 22:50:46 -0300370 if (!pid) {
Ingo Molnar0e9b20b2009-05-26 09:17:18 +0200371 if (execvp(argv[0], (char **)argv)) {
Arnaldo Carvalho de Melo1a853e32009-05-14 22:50:46 -0300372 perror(argv[0]);
373 exit(-1);
374 }
Peter Zijlstrade9ac072009-04-08 15:01:31 +0200375 }
376 }
377
378 if (realtime_prio) {
379 struct sched_param param;
380
381 param.sched_priority = realtime_prio;
382 if (sched_setscheduler(0, SCHED_FIFO, &param)) {
383 printf("Could not set realtime priority.\n");
384 exit(-1);
385 }
386 }
387
388 /*
389 * TODO: store the current /proc/$/maps information somewhere
390 */
391
392 while (!done) {
393 int hits = events;
394
Peter Zijlstra16c8a102009-05-05 17:50:27 +0200395 for (i = 0; i < nr_cpu; i++) {
Peter Zijlstrade9ac072009-04-08 15:01:31 +0200396 for (counter = 0; counter < nr_counters; counter++)
397 mmap_read(&mmap_array[i][counter]);
398 }
399
400 if (hits == events)
401 ret = poll(event_array, nr_poll, 100);
402 }
403
404 return 0;
405}
Ingo Molnar0e9b20b2009-05-26 09:17:18 +0200406
/* NULL-terminated list of usage lines, passed to the option parser. */
static const char * const record_usage[] = {
	[0] = "perf record [<options>] [<command>]",
	[1] = "perf record [<options>] -- <command> [<options>]",
	[2] = NULL
};
412
Ingo Molnar8ad8db32009-05-26 11:10:09 +0200413static char events_help_msg[EVENTS_HELP_MAX];
414
Ingo Molnar52425192009-05-26 09:17:18 +0200415static const struct option options[] = {
Ingo Molnar0e9b20b2009-05-26 09:17:18 +0200416 OPT_CALLBACK('e', "event", NULL, "event",
Ingo Molnar8ad8db32009-05-26 11:10:09 +0200417 events_help_msg, parse_events),
Ingo Molnar0e9b20b2009-05-26 09:17:18 +0200418 OPT_INTEGER('c', "count", &default_interval,
419 "event period to sample"),
420 OPT_INTEGER('m', "mmap-pages", &mmap_pages,
421 "number of mmap data pages"),
422 OPT_STRING('o', "output", &output_name, "file",
423 "output file name"),
424 OPT_BOOLEAN('i', "inherit", &inherit,
425 "child tasks inherit counters"),
426 OPT_INTEGER('p', "pid", &target_pid,
427 "record events on existing pid"),
428 OPT_INTEGER('r', "realtime", &realtime_prio,
429 "collect data with this RT SCHED_FIFO priority"),
430 OPT_BOOLEAN('a', "all-cpus", &system_wide,
431 "system-wide collection from all CPUs"),
432 OPT_END()
433};
434
435int cmd_record(int argc, const char **argv, const char *prefix)
436{
437 int counter;
438
Ingo Molnar8ad8db32009-05-26 11:10:09 +0200439 create_events_help(events_help_msg);
Ingo Molnar0e9b20b2009-05-26 09:17:18 +0200440
441 argc = parse_options(argc, argv, options, record_usage, 0);
Mike Galbraithef65b2a2009-05-27 10:10:51 +0200442 if (!argc && target_pid == -1 && !system_wide)
Ingo Molnar0e9b20b2009-05-26 09:17:18 +0200443 usage_with_options(record_usage, options);
444
445 if (!nr_counters) {
446 nr_counters = 1;
447 event_id[0] = 0;
448 }
449
450 for (counter = 0; counter < nr_counters; counter++) {
451 if (event_count[counter])
452 continue;
453
454 event_count[counter] = default_interval;
455 }
456
457 return __cmd_record(argc, argv);
458}