perf session: Fallback to unordered processing if no sample_id_all
[deliverable/linux.git] / tools / perf / builtin-record.c
CommitLineData
abaff32a 1/*
bf9e1876
IM
2 * builtin-record.c
3 *
4 * Builtin record command: Record the profile of a workload
5 * (or a CPU, or a PID) into the perf.data output file - for
6 * later analysis via perf report.
abaff32a 7 */
b8f46c5a
XG
8#define _FILE_OFFSET_BITS 64
9
16f762a2 10#include "builtin.h"
bf9e1876
IM
11
12#include "perf.h"
13
6122e4e4 14#include "util/build-id.h"
6eda5838 15#include "util/util.h"
0e9b20b8 16#include "util/parse-options.h"
8ad8db37 17#include "util/parse-events.h"
6eda5838 18
7c6a1c65 19#include "util/header.h"
66e274f3 20#include "util/event.h"
8f28827a 21#include "util/debug.h"
94c744b6 22#include "util/session.h"
8d06367f 23#include "util/symbol.h"
a12b51c4 24#include "util/cpumap.h"
7c6a1c65 25
97124d5e 26#include <unistd.h>
de9ac07b 27#include <sched.h>
a41794cd 28#include <sys/mman.h>
de9ac07b 29
/*
 * Policy for an output file that already exists:
 *  - WRITE_FORCE:  start a fresh file (the open uses O_TRUNC).
 *  - WRITE_APPEND: keep the existing contents and add to them.
 */
enum write_mode_t {
	WRITE_FORCE	= 0,
	WRITE_APPEND	= 1,
};
34
d6d901c2 35static int *fd[MAX_NR_CPUS][MAX_COUNTERS];
a21ca2ca 36
3de29cab
SE
37static u64 user_interval = ULLONG_MAX;
38static u64 default_interval = 0;
640c03ce 39static u64 sample_type;
a21ca2ca 40
42e59d7d 41static int nr_cpus = 0;
de9ac07b 42static unsigned int page_size;
42e59d7d 43static unsigned int mmap_pages = 128;
f9212819 44static unsigned int user_freq = UINT_MAX;
42e59d7d 45static int freq = 1000;
de9ac07b 46static int output;
529870e3 47static int pipe_output = 0;
23ac9cbe 48static const char *output_name = "perf.data";
42e59d7d 49static int group = 0;
1967936d 50static int realtime_prio = 0;
c0555642 51static bool raw_samples = false;
9c90a61c 52static bool sample_id_all_avail = true;
c0555642 53static bool system_wide = false;
42e59d7d 54static pid_t target_pid = -1;
d6d901c2
ZY
55static pid_t target_tid = -1;
56static pid_t *all_tids = NULL;
57static int thread_num = 0;
42e59d7d 58static pid_t child_pid = -1;
2e6cdf99 59static bool no_inherit = false;
7865e817 60static enum write_mode_t write_mode = WRITE_FORCE;
c0555642
IM
61static bool call_graph = false;
62static bool inherit_stat = false;
63static bool no_samples = false;
64static bool sample_address = false;
9c90a61c 65static bool sample_time = false;
a1ac1d3c 66static bool no_buildid = false;
baa2f6ce 67static bool no_buildid_cache = false;
42e59d7d
IM
68
69static long samples = 0;
42e59d7d 70static u64 bytes_written = 0;
a21ca2ca 71
d6d901c2 72static struct pollfd *event_array;
a21ca2ca 73
42e59d7d
IM
74static int nr_poll = 0;
75static int nr_cpu = 0;
a21ca2ca 76
42e59d7d 77static int file_new = 1;
6122e4e4 78static off_t post_processing_offset;
7c6a1c65 79
94c744b6 80static struct perf_session *session;
c45c6ea2 81static const char *cpu_list;
f5970550 82
de9ac07b 83struct mmap_data {
a21ca2ca
IM
84 int counter;
85 void *base;
86 unsigned int mask;
87 unsigned int prev;
de9ac07b
PZ
88};
89
0e2e63dd 90static struct mmap_data mmap_array[MAX_NR_CPUS];
a21ca2ca 91
9d91a6f7 92static unsigned long mmap_read_head(struct mmap_data *md)
de9ac07b 93{
cdd6c482 94 struct perf_event_mmap_page *pc = md->base;
9d91a6f7 95 long head;
de9ac07b
PZ
96
97 head = pc->data_head;
98 rmb();
99
100 return head;
101}
102
9d91a6f7
PZ
103static void mmap_write_tail(struct mmap_data *md, unsigned long tail)
104{
cdd6c482 105 struct perf_event_mmap_page *pc = md->base;
9d91a6f7
PZ
106
107 /*
108 * ensure all reads are done before we write the tail out.
109 */
110 /* mb(); */
111 pc->data_tail = tail;
112}
113
9215545e
TZ
114static void advance_output(size_t size)
115{
116 bytes_written += size;
117}
118
f5970550
PZ
119static void write_output(void *buf, size_t size)
120{
121 while (size) {
122 int ret = write(output, buf, size);
123
124 if (ret < 0)
125 die("failed to write");
126
127 size -= ret;
128 buf += ret;
129
130 bytes_written += ret;
131 }
132}
133
d8f66248 134static int process_synthesized_event(event_t *event,
640c03ce 135 struct sample_data *sample __used,
d8f66248 136 struct perf_session *self __used)
234fbbf5 137{
6122e4e4 138 write_output(event, event->header.size);
234fbbf5
ACM
139 return 0;
140}
141
de9ac07b
PZ
142static void mmap_read(struct mmap_data *md)
143{
144 unsigned int head = mmap_read_head(md);
145 unsigned int old = md->prev;
146 unsigned char *data = md->base + page_size;
147 unsigned long size;
148 void *buf;
149 int diff;
150
de9ac07b
PZ
151 /*
152 * If we're further behind than half the buffer, there's a chance
2debbc83 153 * the writer will bite our tail and mess up the samples under us.
de9ac07b
PZ
154 *
155 * If we somehow ended up ahead of the head, we got messed up.
156 *
157 * In either case, truncate and restart at head.
158 */
159 diff = head - old;
9d91a6f7 160 if (diff < 0) {
ef365cef 161 fprintf(stderr, "WARNING: failed to keep up with mmap data\n");
de9ac07b
PZ
162 /*
163 * head points to a known good entry, start there.
164 */
165 old = head;
166 }
167
de9ac07b 168 if (old != head)
2debbc83 169 samples++;
de9ac07b
PZ
170
171 size = head - old;
172
173 if ((old & md->mask) + size != (head & md->mask)) {
174 buf = &data[old & md->mask];
175 size = md->mask + 1 - (old & md->mask);
176 old += size;
021e9f47 177
6122e4e4 178 write_output(buf, size);
de9ac07b
PZ
179 }
180
181 buf = &data[old & md->mask];
182 size = head - old;
183 old += size;
021e9f47 184
6122e4e4 185 write_output(buf, size);
de9ac07b
PZ
186
187 md->prev = old;
9d91a6f7 188 mmap_write_tail(md, old);
de9ac07b
PZ
189}
190
/* Set to 1 by sig_handler(); the record loop stops once it sees this. */
static volatile int done;
/* Number of the signal that was caught, -1 while none has been. */
static volatile int signr = -1;

/*
 * Signal handler: flag completion and remember which signal arrived.
 */
static void sig_handler(int sig)
{
	done = 1;
	signr = sig;
}
199
200static void sig_atexit(void)
201{
5ffc8881 202 if (child_pid > 0)
933da83a
CW
203 kill(child_pid, SIGTERM);
204
18483b81 205 if (signr == -1 || signr == SIGUSR1)
f7b7c26e
PZ
206 return;
207
208 signal(signr, SIG_DFL);
209 kill(getpid(), signr);
de9ac07b
PZ
210}
211
f250c030
IM
212static int group_fd;
213
cdd6c482 214static struct perf_header_attr *get_header_attr(struct perf_event_attr *a, int nr)
7c6a1c65
PZ
215{
216 struct perf_header_attr *h_attr;
217
94c744b6
ACM
218 if (nr < session->header.attrs) {
219 h_attr = session->header.attr[nr];
7c6a1c65
PZ
220 } else {
221 h_attr = perf_header_attr__new(a);
dc79c0fc 222 if (h_attr != NULL)
94c744b6 223 if (perf_header__add_attr(&session->header, h_attr) < 0) {
11deb1f9
ACM
224 perf_header_attr__delete(h_attr);
225 h_attr = NULL;
226 }
7c6a1c65
PZ
227 }
228
229 return h_attr;
230}
231
d6d901c2 232static void create_counter(int counter, int cpu)
de9ac07b 233{
c171b552 234 char *filter = filters[counter];
cdd6c482 235 struct perf_event_attr *attr = attrs + counter;
7c6a1c65
PZ
236 struct perf_header_attr *h_attr;
237 int track = !counter; /* only the first counter needs these */
d6d901c2 238 int thread_index;
c171b552 239 int ret;
7c6a1c65
PZ
240 struct {
241 u64 count;
242 u64 time_enabled;
243 u64 time_running;
244 u64 id;
245 } read_data;
246
247 attr->read_format = PERF_FORMAT_TOTAL_TIME_ENABLED |
248 PERF_FORMAT_TOTAL_TIME_RUNNING |
249 PERF_FORMAT_ID;
16c8a109 250
3a9f131f 251 attr->sample_type |= PERF_SAMPLE_IP | PERF_SAMPLE_TID;
3efa1cc9 252
8907fd60
EM
253 if (nr_counters > 1)
254 attr->sample_type |= PERF_SAMPLE_ID;
255
f9212819
FW
256 /*
257 * We default some events to a 1 default interval. But keep
258 * it a weak assumption overridable by the user.
259 */
260 if (!attr->sample_period || (user_freq != UINT_MAX &&
3de29cab 261 user_interval != ULLONG_MAX)) {
f9212819
FW
262 if (freq) {
263 attr->sample_type |= PERF_SAMPLE_PERIOD;
264 attr->freq = 1;
265 attr->sample_freq = freq;
266 } else {
267 attr->sample_period = default_interval;
268 }
1dba15e7 269 }
3efa1cc9 270
649c48a9
PZ
271 if (no_samples)
272 attr->sample_freq = 0;
273
274 if (inherit_stat)
275 attr->inherit_stat = 1;
276
3af9e859 277 if (sample_address) {
4bba828d 278 attr->sample_type |= PERF_SAMPLE_ADDR;
3af9e859
EM
279 attr->mmap_data = track;
280 }
4bba828d 281
3efa1cc9
IM
282 if (call_graph)
283 attr->sample_type |= PERF_SAMPLE_CALLCHAIN;
284
f60f3593
AS
285 if (system_wide)
286 attr->sample_type |= PERF_SAMPLE_CPU;
287
9c90a61c
ACM
288 if (sample_time)
289 attr->sample_type |= PERF_SAMPLE_TIME;
290
cd6feeea 291 if (raw_samples) {
6ddf259d 292 attr->sample_type |= PERF_SAMPLE_TIME;
daac07b2 293 attr->sample_type |= PERF_SAMPLE_RAW;
cd6feeea
IM
294 attr->sample_type |= PERF_SAMPLE_CPU;
295 }
f413cdb8 296
640c03ce
ACM
297 if (!sample_type)
298 sample_type = attr->sample_type;
299
a21ca2ca
IM
300 attr->mmap = track;
301 attr->comm = track;
2e6cdf99
SE
302 attr->inherit = !no_inherit;
303 if (target_pid == -1 && target_tid == -1 && !system_wide) {
46be604b 304 attr->disabled = 1;
bedbfdea 305 attr->enable_on_exec = 1;
46be604b 306 }
9c90a61c
ACM
307retry_sample_id:
308 attr->sample_id_all = sample_id_all_avail ? 1 : 0;
bedbfdea 309
d6d901c2 310 for (thread_index = 0; thread_index < thread_num; thread_index++) {
3da297a6 311try_again:
d6d901c2
ZY
312 fd[nr_cpu][counter][thread_index] = sys_perf_event_open(attr,
313 all_tids[thread_index], cpu, group_fd, 0);
314
315 if (fd[nr_cpu][counter][thread_index] < 0) {
316 int err = errno;
317
318 if (err == EPERM || err == EACCES)
319 die("Permission error - are you root?\n"
320 "\t Consider tweaking"
321 " /proc/sys/kernel/perf_event_paranoid.\n");
c45c6ea2 322 else if (err == ENODEV && cpu_list) {
d6d901c2
ZY
323 die("No such device - did you specify"
324 " an out-of-range profile CPU?\n");
9c90a61c
ACM
325 } else if (err == EINVAL && sample_id_all_avail) {
326 /*
327 * Old kernel, no attr->sample_id_type_all field
328 */
329 sample_id_all_avail = false;
330 goto retry_sample_id;
d6d901c2 331 }
3da297a6 332
d6d901c2
ZY
333 /*
334 * If it's cycles then fall back to hrtimer
335 * based cpu-clock-tick sw counter, which
336 * is always available even if no PMU support:
337 */
338 if (attr->type == PERF_TYPE_HARDWARE
339 && attr->config == PERF_COUNT_HW_CPU_CYCLES) {
340
341 if (verbose)
342 warning(" ... trying to fall back to cpu-clock-ticks\n");
343 attr->type = PERF_TYPE_SOFTWARE;
344 attr->config = PERF_COUNT_SW_CPU_CLOCK;
345 goto try_again;
346 }
347 printf("\n");
d9cf837e 348 error("sys_perf_event_open() syscall returned with %d (%s). /bin/dmesg may provide additional information.\n",
d6d901c2 349 fd[nr_cpu][counter][thread_index], strerror(err));
bfd45118
SK
350
351#if defined(__i386__) || defined(__x86_64__)
d6d901c2
ZY
352 if (attr->type == PERF_TYPE_HARDWARE && err == EOPNOTSUPP)
353 die("No hardware sampling interrupt available."
354 " No APIC? If so then you can boot the kernel"
355 " with the \"lapic\" boot parameter to"
356 " force-enable it.\n");
bfd45118
SK
357#endif
358
d6d901c2
ZY
359 die("No CONFIG_PERF_EVENTS=y kernel support configured?\n");
360 exit(-1);
361 }
3da297a6 362
d6d901c2
ZY
363 h_attr = get_header_attr(attr, counter);
364 if (h_attr == NULL)
365 die("nomem\n");
7c6a1c65 366
d6d901c2
ZY
367 if (!file_new) {
368 if (memcmp(&h_attr->attr, attr, sizeof(*attr))) {
369 fprintf(stderr, "incompatible append\n");
370 exit(-1);
371 }
7c6a1c65 372 }
7c6a1c65 373
d6d901c2 374 if (read(fd[nr_cpu][counter][thread_index], &read_data, sizeof(read_data)) == -1) {
0ab7368f 375 perror("Unable to read perf file descriptor");
d6d901c2
ZY
376 exit(-1);
377 }
7c6a1c65 378
d6d901c2
ZY
379 if (perf_header_attr__add_id(h_attr, read_data.id) < 0) {
380 pr_warning("Not enough memory to add id\n");
381 exit(-1);
382 }
7c6a1c65 383
d6d901c2
ZY
384 assert(fd[nr_cpu][counter][thread_index] >= 0);
385 fcntl(fd[nr_cpu][counter][thread_index], F_SETFL, O_NONBLOCK);
16c8a109 386
d6d901c2
ZY
387 /*
388 * First counter acts as the group leader:
389 */
390 if (group && group_fd == -1)
391 group_fd = fd[nr_cpu][counter][thread_index];
f250c030 392
0e2e63dd
PZ
393 if (counter || thread_index) {
394 ret = ioctl(fd[nr_cpu][counter][thread_index],
395 PERF_EVENT_IOC_SET_OUTPUT,
396 fd[nr_cpu][0][0]);
397 if (ret) {
398 error("failed to set output: %d (%s)\n", errno,
399 strerror(errno));
400 exit(-1);
401 }
402 } else {
403 mmap_array[nr_cpu].counter = counter;
404 mmap_array[nr_cpu].prev = 0;
405 mmap_array[nr_cpu].mask = mmap_pages*page_size - 1;
406 mmap_array[nr_cpu].base = mmap(NULL, (mmap_pages+1)*page_size,
407 PROT_READ|PROT_WRITE, MAP_SHARED, fd[nr_cpu][counter][thread_index], 0);
408 if (mmap_array[nr_cpu].base == MAP_FAILED) {
409 error("failed to mmap with %d (%s)\n", errno, strerror(errno));
410 exit(-1);
411 }
412
413 event_array[nr_poll].fd = fd[nr_cpu][counter][thread_index];
414 event_array[nr_poll].events = POLLIN;
415 nr_poll++;
ea57c4f5 416 }
d1302522 417
d6d901c2
ZY
418 if (filter != NULL) {
419 ret = ioctl(fd[nr_cpu][counter][thread_index],
420 PERF_EVENT_IOC_SET_FILTER, filter);
421 if (ret) {
422 error("failed to set filter with %d (%s)\n", errno,
423 strerror(errno));
424 exit(-1);
425 }
c171b552
LZ
426 }
427 }
f250c030 428}
f2521b6e 429
d6d901c2 430static void open_counters(int cpu)
f250c030
IM
431{
432 int counter;
16c8a109 433
f250c030
IM
434 group_fd = -1;
435 for (counter = 0; counter < nr_counters; counter++)
d6d901c2 436 create_counter(counter, cpu);
f250c030 437
16c8a109
PZ
438 nr_cpu++;
439}
440
6122e4e4
ACM
441static int process_buildids(void)
442{
443 u64 size = lseek(output, 0, SEEK_CUR);
444
9f591fd7
ACM
445 if (size == 0)
446 return 0;
447
6122e4e4
ACM
448 session->fd = output;
449 return __perf_session__process_events(session, post_processing_offset,
450 size - post_processing_offset,
451 size, &build_id__mark_dso_hit_ops);
452}
453
f5970550
PZ
454static void atexit_header(void)
455{
c7929e47
TZ
456 if (!pipe_output) {
457 session->header.data_size += bytes_written;
f5970550 458
baa2f6ce
ACM
459 if (!no_buildid)
460 process_buildids();
c7929e47 461 perf_header__write(&session->header, output, true);
39d17dac 462 perf_session__delete(session);
d65a458b 463 symbol__exit();
c7929e47 464 }
f5970550
PZ
465}
466
23346f21 467static void event__synthesize_guest_os(struct machine *machine, void *data)
a1645ce1
ZY
468{
469 int err;
23346f21 470 struct perf_session *psession = data;
a1645ce1 471
23346f21 472 if (machine__is_host(machine))
a1645ce1
ZY
473 return;
474
475 /*
476 *As for guest kernel when processing subcommand record&report,
477 *we arrange module mmap prior to guest kernel mmap and trigger
478 *a preload dso because default guest module symbols are loaded
479 *from guest kallsyms instead of /lib/modules/XXX/XXX. This
480 *method is used to avoid symbol missing when the first addr is
481 *in module instead of in guest kernel.
482 */
483 err = event__synthesize_modules(process_synthesized_event,
23346f21 484 psession, machine);
a1645ce1
ZY
485 if (err < 0)
486 pr_err("Couldn't record guest kernel [%d]'s reference"
23346f21 487 " relocation symbol.\n", machine->pid);
a1645ce1 488
a1645ce1
ZY
489 /*
490 * We use _stext for guest kernel because guest kernel's /proc/kallsyms
491 * have no _text sometimes.
492 */
493 err = event__synthesize_kernel_mmap(process_synthesized_event,
23346f21 494 psession, machine, "_text");
a1645ce1
ZY
495 if (err < 0)
496 err = event__synthesize_kernel_mmap(process_synthesized_event,
23346f21 497 psession, machine, "_stext");
a1645ce1
ZY
498 if (err < 0)
499 pr_err("Couldn't record guest kernel [%d]'s reference"
23346f21 500 " relocation symbol.\n", machine->pid);
a1645ce1
ZY
501}
502
98402807
FW
503static struct perf_event_header finished_round_event = {
504 .size = sizeof(struct perf_event_header),
505 .type = PERF_RECORD_FINISHED_ROUND,
506};
507
508static void mmap_read_all(void)
509{
0e2e63dd 510 int i;
98402807
FW
511
512 for (i = 0; i < nr_cpu; i++) {
0e2e63dd
PZ
513 if (mmap_array[i].base)
514 mmap_read(&mmap_array[i]);
98402807
FW
515 }
516
517 if (perf_header__has_feat(&session->header, HEADER_TRACE_INFO))
518 write_output(&finished_round_event, sizeof(finished_round_event));
519}
520
d4db3f16 521static int __cmd_record(int argc, const char **argv)
16c8a109
PZ
522{
523 int i, counter;
abaff32a 524 struct stat st;
abaff32a 525 int flags;
4dc0a04b 526 int err;
8b412664 527 unsigned long waking = 0;
856e9660 528 int child_ready_pipe[2], go_pipe[2];
46be604b 529 const bool forks = argc > 0;
856e9660 530 char buf;
23346f21 531 struct machine *machine;
de9ac07b
PZ
532
533 page_size = sysconf(_SC_PAGE_SIZE);
de9ac07b 534
f5970550
PZ
535 atexit(sig_atexit);
536 signal(SIGCHLD, sig_handler);
537 signal(SIGINT, sig_handler);
18483b81 538 signal(SIGUSR1, sig_handler);
f5970550 539
d4db3f16 540 if (forks && (pipe(child_ready_pipe) < 0 || pipe(go_pipe) < 0)) {
856e9660
PZ
541 perror("failed to create pipes");
542 exit(-1);
543 }
544
529870e3
TZ
545 if (!strcmp(output_name, "-"))
546 pipe_output = 1;
547 else if (!stat(output_name, &st) && st.st_size) {
7865e817 548 if (write_mode == WRITE_FORCE) {
b38d3464
ACM
549 char oldname[PATH_MAX];
550 snprintf(oldname, sizeof(oldname), "%s.old",
551 output_name);
552 unlink(oldname);
553 rename(output_name, oldname);
266e0e21 554 }
7865e817
FW
555 } else if (write_mode == WRITE_APPEND) {
556 write_mode = WRITE_FORCE;
97124d5e
PZ
557 }
558
f887f301 559 flags = O_CREAT|O_RDWR;
7865e817 560 if (write_mode == WRITE_APPEND)
f5970550 561 file_new = 0;
abaff32a
IM
562 else
563 flags |= O_TRUNC;
564
529870e3
TZ
565 if (pipe_output)
566 output = STDOUT_FILENO;
567 else
568 output = open(output_name, flags, S_IRUSR | S_IWUSR);
de9ac07b
PZ
569 if (output < 0) {
570 perror("failed to create output file");
571 exit(-1);
572 }
573
7865e817 574 session = perf_session__new(output_name, O_WRONLY,
21ef97f0 575 write_mode == WRITE_FORCE, false, NULL);
94c744b6 576 if (session == NULL) {
a9a70bbc
ACM
577 pr_err("Not enough memory for reading perf file header\n");
578 return -1;
579 }
580
baa2f6ce
ACM
581 if (!no_buildid)
582 perf_header__set_feat(&session->header, HEADER_BUILD_ID);
583
4dc0a04b 584 if (!file_new) {
8dc58101 585 err = perf_header__read(session, output);
4dc0a04b 586 if (err < 0)
39d17dac 587 goto out_delete_session;
4dc0a04b
ACM
588 }
589
db620b1c 590 if (have_tracepoints(attrs, nr_counters))
94c744b6 591 perf_header__set_feat(&session->header, HEADER_TRACE_INFO);
03456a15 592
39d17dac
ACM
593 /*
594 * perf_session__delete(session) will be called at atexit_header()
595 */
f5970550
PZ
596 atexit(atexit_header);
597
d4db3f16 598 if (forks) {
46be604b 599 child_pid = fork();
2fb750e8 600 if (child_pid < 0) {
856e9660
PZ
601 perror("failed to fork");
602 exit(-1);
603 }
7c6a1c65 604
46be604b 605 if (!child_pid) {
529870e3
TZ
606 if (pipe_output)
607 dup2(2, 1);
856e9660
PZ
608 close(child_ready_pipe[0]);
609 close(go_pipe[1]);
610 fcntl(go_pipe[0], F_SETFD, FD_CLOEXEC);
611
612 /*
613 * Do a dummy execvp to get the PLT entry resolved,
614 * so we avoid the resolver overhead on the real
615 * execvp call.
616 */
617 execvp("", (char **)argv);
618
619 /*
620 * Tell the parent we're ready to go
621 */
622 close(child_ready_pipe[1]);
623
624 /*
625 * Wait until the parent tells us to go.
626 */
627 if (read(go_pipe[0], &buf, 1) == -1)
628 perror("unable to read pipe");
629
630 execvp(argv[0], (char **)argv);
631
632 perror(argv[0]);
18483b81 633 kill(getppid(), SIGUSR1);
856e9660 634 exit(-1);
0a5ac846 635 }
856e9660 636
d6d901c2
ZY
637 if (!system_wide && target_tid == -1 && target_pid == -1)
638 all_tids[0] = child_pid;
639
856e9660
PZ
640 close(child_ready_pipe[1]);
641 close(go_pipe[0]);
642 /*
643 * wait for child to settle
644 */
645 if (read(child_ready_pipe[0], &buf, 1) == -1) {
646 perror("unable to read pipe");
647 exit(-1);
648 }
649 close(child_ready_pipe[0]);
650 }
651
c45c6ea2
SE
652 nr_cpus = read_cpu_map(cpu_list);
653 if (nr_cpus < 1) {
0ab7368f 654 perror("failed to collect number of CPUs");
c45c6ea2
SE
655 return -1;
656 }
657
658 if (!system_wide && no_inherit && !cpu_list) {
659 open_counters(-1);
856e9660
PZ
660 } else {
661 for (i = 0; i < nr_cpus; i++)
d6d901c2 662 open_counters(cpumap[i]);
0a5ac846 663 }
de9ac07b 664
640c03ce
ACM
665 perf_session__set_sample_type(session, sample_type);
666
529870e3
TZ
667 if (pipe_output) {
668 err = perf_header__write_pipe(output);
669 if (err < 0)
670 return err;
671 } else if (file_new) {
94c744b6 672 err = perf_header__write(&session->header, output, false);
d5eed904
ACM
673 if (err < 0)
674 return err;
56b03f3c
ACM
675 }
676
6122e4e4
ACM
677 post_processing_offset = lseek(output, 0, SEEK_CUR);
678
9c90a61c
ACM
679 perf_session__set_sample_id_all(session, sample_id_all_avail);
680
2c46dbb5
TZ
681 if (pipe_output) {
682 err = event__synthesize_attrs(&session->header,
683 process_synthesized_event,
684 session);
685 if (err < 0) {
686 pr_err("Couldn't synthesize attrs.\n");
687 return err;
688 }
cd19a035
TZ
689
690 err = event__synthesize_event_types(process_synthesized_event,
691 session);
692 if (err < 0) {
693 pr_err("Couldn't synthesize event_types.\n");
694 return err;
695 }
9215545e 696
63e0c771
TZ
697 if (have_tracepoints(attrs, nr_counters)) {
698 /*
699 * FIXME err <= 0 here actually means that
700 * there were no tracepoints so its not really
701 * an error, just that we don't need to
702 * synthesize anything. We really have to
703 * return this more properly and also
704 * propagate errors that now are calling die()
705 */
706 err = event__synthesize_tracing_data(output, attrs,
707 nr_counters,
708 process_synthesized_event,
709 session);
710 if (err <= 0) {
711 pr_err("Couldn't record tracing data.\n");
712 return err;
713 }
2c9faa06 714 advance_output(err);
63e0c771 715 }
2c46dbb5
TZ
716 }
717
23346f21
ACM
718 machine = perf_session__find_host_machine(session);
719 if (!machine) {
a1645ce1
ZY
720 pr_err("Couldn't find native kernel information.\n");
721 return -1;
722 }
723
56b03f3c 724 err = event__synthesize_kernel_mmap(process_synthesized_event,
23346f21 725 session, machine, "_text");
70162138
ACM
726 if (err < 0)
727 err = event__synthesize_kernel_mmap(process_synthesized_event,
23346f21 728 session, machine, "_stext");
c1a3a4b9
ACM
729 if (err < 0)
730 pr_err("Couldn't record kernel reference relocation symbol\n"
731 "Symbol resolution may be skewed if relocation was used (e.g. kexec).\n"
732 "Check /proc/kallsyms permission or run as root.\n");
b7cece76 733
a1645ce1 734 err = event__synthesize_modules(process_synthesized_event,
23346f21 735 session, machine);
c1a3a4b9
ACM
736 if (err < 0)
737 pr_err("Couldn't record kernel module information.\n"
738 "Symbol resolution may be skewed if relocation was used (e.g. kexec).\n"
739 "Check /proc/modules permission or run as root.\n");
740
a1645ce1 741 if (perf_guest)
23346f21 742 perf_session__process_machines(session, event__synthesize_guest_os);
7c6a1c65 743
cf103a14 744 if (!system_wide)
d6d901c2 745 event__synthesize_thread(target_tid, process_synthesized_event,
d8f66248 746 session);
234fbbf5 747 else
d8f66248 748 event__synthesize_threads(process_synthesized_event, session);
7c6a1c65 749
de9ac07b
PZ
750 if (realtime_prio) {
751 struct sched_param param;
752
753 param.sched_priority = realtime_prio;
754 if (sched_setscheduler(0, SCHED_FIFO, &param)) {
6beba7ad 755 pr_err("Could not set realtime priority.\n");
de9ac07b
PZ
756 exit(-1);
757 }
758 }
759
856e9660
PZ
760 /*
761 * Let the child rip
762 */
d4db3f16
ACM
763 if (forks)
764 close(go_pipe[1]);
856e9660 765
649c48a9 766 for (;;) {
2debbc83 767 int hits = samples;
d6d901c2 768 int thread;
de9ac07b 769
98402807 770 mmap_read_all();
de9ac07b 771
649c48a9
PZ
772 if (hits == samples) {
773 if (done)
774 break;
4dc0a04b 775 err = poll(event_array, nr_poll, -1);
8b412664
PZ
776 waking++;
777 }
778
779 if (done) {
780 for (i = 0; i < nr_cpu; i++) {
d6d901c2
ZY
781 for (counter = 0;
782 counter < nr_counters;
783 counter++) {
784 for (thread = 0;
785 thread < thread_num;
786 thread++)
787 ioctl(fd[i][counter][thread],
788 PERF_EVENT_IOC_DISABLE);
789 }
8b412664 790 }
649c48a9 791 }
de9ac07b
PZ
792 }
793
18483b81 794 if (quiet || signr == SIGUSR1)
b44308f5
ACM
795 return 0;
796
8b412664
PZ
797 fprintf(stderr, "[ perf record: Woken up %ld times to write data ]\n", waking);
798
021e9f47
IM
799 /*
800 * Approximate RIP event size: 24 bytes.
801 */
802 fprintf(stderr,
2debbc83 803 "[ perf record: Captured and wrote %.3f MB %s (~%lld samples) ]\n",
021e9f47
IM
804 (double)bytes_written / 1024.0 / 1024.0,
805 output_name,
806 bytes_written / 24);
addc2785 807
de9ac07b 808 return 0;
39d17dac
ACM
809
810out_delete_session:
811 perf_session__delete(session);
812 return err;
de9ac07b 813}
0e9b20b8 814
/* NULL-terminated usage lines passed to the option parser. */
static const char * const record_usage[] = {
	"perf record [<options>] [<command>]",
	"perf record [<options>] -- <command> [<options>]",
	NULL,
};
820
7865e817
FW
821static bool force, append_file;
822
bca647aa 823const struct option record_options[] = {
0e9b20b8 824 OPT_CALLBACK('e', "event", NULL, "event",
86847b62
TG
825 "event selector. use 'perf list' to list available events",
826 parse_events),
c171b552
LZ
827 OPT_CALLBACK(0, "filter", NULL, "filter",
828 "event filter", parse_filter),
0e9b20b8 829 OPT_INTEGER('p', "pid", &target_pid,
d6d901c2
ZY
830 "record events on existing process id"),
831 OPT_INTEGER('t', "tid", &target_tid,
832 "record events on existing thread id"),
0e9b20b8
IM
833 OPT_INTEGER('r', "realtime", &realtime_prio,
834 "collect data with this RT SCHED_FIFO priority"),
daac07b2
FW
835 OPT_BOOLEAN('R', "raw-samples", &raw_samples,
836 "collect raw sample records from all opened counters"),
0e9b20b8
IM
837 OPT_BOOLEAN('a', "all-cpus", &system_wide,
838 "system-wide collection from all CPUs"),
abaff32a
IM
839 OPT_BOOLEAN('A', "append", &append_file,
840 "append to the output file to do incremental profiling"),
c45c6ea2
SE
841 OPT_STRING('C', "cpu", &cpu_list, "cpu",
842 "list of cpus to monitor"),
97124d5e 843 OPT_BOOLEAN('f', "force", &force,
7865e817 844 "overwrite existing data file (deprecated)"),
3de29cab 845 OPT_U64('c', "count", &user_interval, "event period to sample"),
abaff32a
IM
846 OPT_STRING('o', "output", &output_name, "file",
847 "output file name"),
2e6cdf99
SE
848 OPT_BOOLEAN('i', "no-inherit", &no_inherit,
849 "child tasks do not inherit counters"),
1967936d
ACM
850 OPT_UINTEGER('F', "freq", &user_freq, "profile at this frequency"),
851 OPT_UINTEGER('m', "mmap-pages", &mmap_pages, "number of mmap data pages"),
3efa1cc9
IM
852 OPT_BOOLEAN('g', "call-graph", &call_graph,
853 "do call-graph (stack chain/backtrace) recording"),
c0555642 854 OPT_INCR('v', "verbose", &verbose,
3da297a6 855 "be more verbose (show counter open errors, etc)"),
b44308f5 856 OPT_BOOLEAN('q', "quiet", &quiet, "don't print any message"),
649c48a9
PZ
857 OPT_BOOLEAN('s', "stat", &inherit_stat,
858 "per thread counts"),
4bba828d
AB
859 OPT_BOOLEAN('d', "data", &sample_address,
860 "Sample addresses"),
9c90a61c 861 OPT_BOOLEAN('T', "timestamp", &sample_time, "Sample timestamps"),
649c48a9
PZ
862 OPT_BOOLEAN('n', "no-samples", &no_samples,
863 "don't sample"),
baa2f6ce 864 OPT_BOOLEAN('N', "no-buildid-cache", &no_buildid_cache,
a1ac1d3c 865 "do not update the buildid cache"),
baa2f6ce
ACM
866 OPT_BOOLEAN('B', "no-buildid", &no_buildid,
867 "do not collect buildids in perf.data"),
0e9b20b8
IM
868 OPT_END()
869};
870
f37a291c 871int cmd_record(int argc, const char **argv, const char *prefix __used)
0e9b20b8 872{
39d17dac 873 int i, j, err = -ENOMEM;
0e9b20b8 874
bca647aa 875 argc = parse_options(argc, argv, record_options, record_usage,
655000e7 876 PARSE_OPT_STOP_AT_NON_OPTION);
d6d901c2 877 if (!argc && target_pid == -1 && target_tid == -1 &&
c45c6ea2 878 !system_wide && !cpu_list)
bca647aa 879 usage_with_options(record_usage, record_options);
0e9b20b8 880
7865e817
FW
881 if (force && append_file) {
882 fprintf(stderr, "Can't overwrite and append at the same time."
883 " You need to choose between -f and -A");
bca647aa 884 usage_with_options(record_usage, record_options);
7865e817
FW
885 } else if (append_file) {
886 write_mode = WRITE_APPEND;
887 } else {
888 write_mode = WRITE_FORCE;
889 }
890
655000e7 891 symbol__init();
baa2f6ce
ACM
892
893 if (no_buildid_cache || no_buildid)
a1ac1d3c 894 disable_buildid_cache();
655000e7 895
bbd36e5e
PZ
896 if (!nr_counters) {
897 nr_counters = 1;
898 attrs[0].type = PERF_TYPE_HARDWARE;
899 attrs[0].config = PERF_COUNT_HW_CPU_CYCLES;
900 }
0e9b20b8 901
d6d901c2
ZY
902 if (target_pid != -1) {
903 target_tid = target_pid;
904 thread_num = find_all_tid(target_pid, &all_tids);
905 if (thread_num <= 0) {
906 fprintf(stderr, "Can't find all threads of pid %d\n",
907 target_pid);
bca647aa 908 usage_with_options(record_usage, record_options);
d6d901c2
ZY
909 }
910 } else {
911 all_tids=malloc(sizeof(pid_t));
912 if (!all_tids)
d65a458b 913 goto out_symbol_exit;
d6d901c2
ZY
914
915 all_tids[0] = target_tid;
916 thread_num = 1;
917 }
918
919 for (i = 0; i < MAX_NR_CPUS; i++) {
920 for (j = 0; j < MAX_COUNTERS; j++) {
921 fd[i][j] = malloc(sizeof(int)*thread_num);
0e2e63dd 922 if (!fd[i][j])
39d17dac 923 goto out_free_fd;
d6d901c2
ZY
924 }
925 }
926 event_array = malloc(
927 sizeof(struct pollfd)*MAX_NR_CPUS*MAX_COUNTERS*thread_num);
928 if (!event_array)
39d17dac 929 goto out_free_fd;
d6d901c2 930
3de29cab 931 if (user_interval != ULLONG_MAX)
f9212819
FW
932 default_interval = user_interval;
933 if (user_freq != UINT_MAX)
934 freq = user_freq;
935
7e4ff9e3
MG
936 /*
937 * User specified count overrides default frequency.
938 */
939 if (default_interval)
940 freq = 0;
941 else if (freq) {
942 default_interval = freq;
943 } else {
944 fprintf(stderr, "frequency and count are zero, aborting\n");
39d17dac
ACM
945 err = -EINVAL;
946 goto out_free_event_array;
7e4ff9e3
MG
947 }
948
39d17dac
ACM
949 err = __cmd_record(argc, argv);
950
951out_free_event_array:
952 free(event_array);
953out_free_fd:
954 for (i = 0; i < MAX_NR_CPUS; i++) {
955 for (j = 0; j < MAX_COUNTERS; j++)
956 free(fd[i][j]);
957 }
958 free(all_tids);
959 all_tids = NULL;
d65a458b
ACM
960out_symbol_exit:
961 symbol__exit();
39d17dac 962 return err;
0e9b20b8 963}
This page took 0.251257 seconds and 5 git commands to generate.