blob: bf1f18366726e4272bffb8980cd3ea8cf1e591ae [file] [log] [blame]
// SPDX-License-Identifier: GPL-2.0
/*
 * builtin-record.c
 *
 * Builtin record command: Record the profile of a workload
 * (or a CPU, or a PID) into the perf.data output file - for
 * later analysis via perf report.
 */
Ingo Molnar16f762a2009-05-27 09:10:38 +02009#include "builtin.h"
Ingo Molnarbf9e1872009-06-02 23:37:05 +020010
Arnaldo Carvalho de Melo6122e4e2010-02-03 16:52:05 -020011#include "util/build-id.h"
Josh Poimboeuf4b6ab942015-12-15 09:39:39 -060012#include <subcmd/parse-options.h>
Ingo Molnar8ad8db32009-05-26 11:10:09 +020013#include "util/parse-events.h"
Taeung Song41840d22016-06-23 17:55:17 +090014#include "util/config.h"
Thomas Gleixner6eda5832009-05-01 18:29:57 +020015
Arnaldo Carvalho de Melo8f651ea2014-10-09 16:12:24 -030016#include "util/callchain.h"
Arnaldo Carvalho de Melof14d5702014-10-17 12:17:40 -030017#include "util/cgroup.h"
Peter Zijlstra7c6a1c62009-06-25 17:05:54 +020018#include "util/header.h"
Frederic Weisbecker66e274f2009-08-12 11:07:25 +020019#include "util/event.h"
Arnaldo Carvalho de Melo361c99a2011-01-11 20:56:53 -020020#include "util/evlist.h"
Arnaldo Carvalho de Melo69aad6f2011-01-03 16:39:04 -020021#include "util/evsel.h"
Frederic Weisbecker8f288272009-08-16 22:05:48 +020022#include "util/debug.h"
Arnaldo Carvalho de Meloe0fcfb02019-09-23 12:20:38 -030023#include "util/mmap.h"
Arnaldo Carvalho de Meloaeb00b12019-08-22 15:40:29 -030024#include "util/target.h"
Arnaldo Carvalho de Melo94c744b2009-12-11 21:24:02 -020025#include "util/session.h"
Arnaldo Carvalho de Melo45694aa2011-11-28 08:30:20 -020026#include "util/tool.h"
Arnaldo Carvalho de Melo8d063672009-11-04 18:50:43 -020027#include "util/symbol.h"
Arnaldo Carvalho de Meloaeb00b12019-08-22 15:40:29 -030028#include "util/record.h"
Paul Mackerrasa12b51c2010-03-10 20:36:09 +110029#include "util/cpumap.h"
Arnaldo Carvalho de Melofd782602011-01-18 15:15:24 -020030#include "util/thread_map.h"
Jiri Olsaf5fc14122013-10-15 16:27:32 +020031#include "util/data.h"
Stephane Eranianbcc84ec2015-08-31 18:41:12 +020032#include "util/perf_regs.h"
Adrian Hunteref149c22015-04-09 18:53:45 +030033#include "util/auxtrace.h"
Adrian Hunter46bc29b2016-03-08 10:38:44 +020034#include "util/tsc.h"
Andi Kleenf00898f2015-05-27 10:51:51 -070035#include "util/parse-branch-options.h"
Stephane Eranianbcc84ec2015-08-31 18:41:12 +020036#include "util/parse-regs-options.h"
Arnaldo Carvalho de Melo40c7d242020-05-05 11:49:08 -030037#include "util/perf_api_probe.h"
Wang Nan71dc23262015-10-14 12:41:19 +000038#include "util/llvm-utils.h"
Wang Nan8690a2a2016-02-22 09:10:32 +000039#include "util/bpf-loader.h"
Wang Nan5f9cf592016-04-20 18:59:49 +000040#include "util/trigger.h"
Wang Nana0748652016-11-26 07:03:28 +000041#include "util/perf-hooks.h"
Alexey Budankovf13de662019-01-22 20:50:57 +030042#include "util/cpu-set-sched.h"
Arnaldo Carvalho de Meloea49e012019-09-18 11:36:13 -030043#include "util/synthetic-events.h"
Arnaldo Carvalho de Meloc5e40272017-04-19 16:12:39 -030044#include "util/time-utils.h"
Arnaldo Carvalho de Melo58db1d62017-04-19 16:05:56 -030045#include "util/units.h"
Song Liu7b612e22019-01-17 08:15:19 -080046#include "util/bpf-event.h"
Stephane Eraniand99c22e2020-04-22 08:50:38 -070047#include "util/util.h"
Stephane Eranian70943492020-05-05 11:29:43 -070048#include "util/pfm.h"
Wang Nand8871ea2016-02-26 09:32:06 +000049#include "asm/bug.h"
Arnaldo Carvalho de Meloc1a604d2019-08-29 15:20:59 -030050#include "perf.h"
Peter Zijlstra7c6a1c62009-06-25 17:05:54 +020051
Arnaldo Carvalho de Meloa43783a2017-04-18 10:46:11 -030052#include <errno.h>
Arnaldo Carvalho de Melofd20e812017-04-17 15:23:08 -030053#include <inttypes.h>
Arnaldo Carvalho de Melo67230472018-03-01 13:46:23 -030054#include <locale.h>
Arnaldo Carvalho de Melo42087352017-04-19 19:06:30 -030055#include <poll.h>
Stephane Eraniand99c22e2020-04-22 08:50:38 -070056#include <pthread.h>
Peter Zijlstra97124d5e2009-06-02 15:52:24 +020057#include <unistd.h>
Peter Zijlstrade9ac072009-04-08 15:01:31 +020058#include <sched.h>
Arnaldo Carvalho de Melo9607ad32017-04-19 15:49:18 -030059#include <signal.h>
Anand K Mistryda231332020-05-13 12:20:23 +100060#ifdef HAVE_EVENTFD_SUPPORT
61#include <sys/eventfd.h>
62#endif
Arnaldo Carvalho de Meloa41794c2010-05-18 18:29:23 -030063#include <sys/mman.h>
Arnaldo Carvalho de Melo42087352017-04-19 19:06:30 -030064#include <sys/wait.h>
Adrian Huntereeb399b2019-10-04 11:31:21 +030065#include <sys/types.h>
66#include <sys/stat.h>
67#include <fcntl.h>
Mamatha Inamdar6ef81c52019-08-22 12:50:49 +053068#include <linux/err.h>
Arnaldo Carvalho de Melo8520a982019-08-29 16:18:59 -030069#include <linux/string.h>
Arnaldo Carvalho de Melo0693e682016-08-08 15:05:46 -030070#include <linux/time64.h>
Arnaldo Carvalho de Melod8f9da22019-07-04 12:06:20 -030071#include <linux/zalloc.h>
Alexey Budankov8384a262019-12-03 14:45:27 +030072#include <linux/bitmap.h>
Bernhard Rosenkraenzer78da39f2012-10-08 09:43:26 +030073
/*
 * Settings and state for switching the output file during a session.
 *
 * The signal, size and time members are the ones tested by
 * switch_output_signal(), switch_output_size() and switch_output_time().
 */
struct switch_output {
	bool		 enabled;
	bool		 signal;	/* tested by switch_output_signal() */
	unsigned long	 size;		/* compared with rec->bytes_written; 0 disables the check */
	unsigned long	 time;		/* non-zero enables switch_output_time() */
	const char	*str;
	bool		 set;
	char		**filenames;
	int		 num_files;
	int		 cur_file;
};
85
Arnaldo Carvalho de Melo8c6f45a2013-12-19 14:38:03 -030086struct record {
Arnaldo Carvalho de Melo45694aa2011-11-28 08:30:20 -020087 struct perf_tool tool;
Arnaldo Carvalho de Melob4006792013-12-19 14:43:45 -030088 struct record_opts opts;
Arnaldo Carvalho de Melod20deb62011-11-25 08:19:45 -020089 u64 bytes_written;
Jiri Olsa8ceb41d2017-01-23 22:07:59 +010090 struct perf_data data;
Adrian Hunteref149c22015-04-09 18:53:45 +030091 struct auxtrace_record *itr;
Jiri Olsa63503db2019-07-21 13:23:52 +020092 struct evlist *evlist;
Arnaldo Carvalho de Melod20deb62011-11-25 08:19:45 -020093 struct perf_session *session;
Arnaldo Carvalho de Melobc477d792020-04-24 10:24:04 -030094 struct evlist *sb_evlist;
Arnaldo Carvalho de Melo899e5ff2020-04-27 17:56:37 -030095 pthread_t thread_id;
Arnaldo Carvalho de Melod20deb62011-11-25 08:19:45 -020096 int realtime_prio;
Arnaldo Carvalho de Melo899e5ff2020-04-27 17:56:37 -030097 bool switch_output_event_set;
Arnaldo Carvalho de Melod20deb62011-11-25 08:19:45 -020098 bool no_buildid;
Wang Nand2db9a92016-01-25 09:56:19 +000099 bool no_buildid_set;
Arnaldo Carvalho de Melod20deb62011-11-25 08:19:45 -0200100 bool no_buildid_cache;
Wang Nand2db9a92016-01-25 09:56:19 +0000101 bool no_buildid_cache_set;
Namhyung Kim61566812016-01-11 22:37:09 +0900102 bool buildid_all;
Wang Nanecfd7a92016-04-13 08:21:07 +0000103 bool timestamp_filename;
Jin Yao68588ba2017-12-08 21:13:42 +0800104 bool timestamp_boundary;
Jiri Olsa1b43b702017-01-09 10:51:56 +0100105 struct switch_output switch_output;
Yang Shi9f065192015-09-29 14:49:43 -0700106 unsigned long long samples;
Alexey Budankov8384a262019-12-03 14:45:27 +0300107 struct mmap_cpu_mask affinity_mask;
Jiwei Sun6d575812019-10-22 16:09:01 +0800108 unsigned long output_max_size; /* = 0: unlimited */
Arnaldo Carvalho de Melo0f82ebc2011-11-08 14:41:57 -0200109};
Ingo Molnara21ca2c2009-06-06 09:58:57 +0200110
Jiwei Sun6d575812019-10-22 16:09:01 +0800111static volatile int done;
112
Jiri Olsadc0c6122017-01-09 10:51:58 +0100113static volatile int auxtrace_record__snapshot_started;
114static DEFINE_TRIGGER(auxtrace_snapshot_trigger);
115static DEFINE_TRIGGER(switch_output_trigger);
116
Alexey Budankov9d2ed642019-01-22 20:47:43 +0300117static const char *affinity_tags[PERF_AFFINITY_MAX] = {
118 "SYS", "NODE", "CPU"
119};
120
Jiri Olsadc0c6122017-01-09 10:51:58 +0100121static bool switch_output_signal(struct record *rec)
122{
123 return rec->switch_output.signal &&
124 trigger_is_ready(&switch_output_trigger);
125}
126
127static bool switch_output_size(struct record *rec)
128{
129 return rec->switch_output.size &&
130 trigger_is_ready(&switch_output_trigger) &&
131 (rec->bytes_written >= rec->switch_output.size);
132}
133
Jiri Olsabfacbe32017-01-09 10:52:00 +0100134static bool switch_output_time(struct record *rec)
135{
136 return rec->switch_output.time &&
137 trigger_is_ready(&switch_output_trigger);
138}
139
Jiwei Sun6d575812019-10-22 16:09:01 +0800140static bool record__output_max_size_exceeded(struct record *rec)
141{
142 return rec->output_max_size &&
143 (rec->bytes_written >= rec->output_max_size);
144}
145
Jiri Olsaa5830532019-07-27 20:30:53 +0200146static int record__write(struct record *rec, struct mmap *map __maybe_unused,
Jiri Olsaded2b8f2018-09-13 14:54:06 +0200147 void *bf, size_t size)
Peter Zijlstraf5970552009-06-18 23:22:55 +0200148{
Jiri Olsaded2b8f2018-09-13 14:54:06 +0200149 struct perf_data_file *file = &rec->session->data->file;
150
151 if (perf_data_file__write(file, bf, size) < 0) {
Jiri Olsa50a9b862013-11-22 13:11:24 +0100152 pr_err("failed to write perf data, error: %m\n");
153 return -1;
Peter Zijlstraf5970552009-06-18 23:22:55 +0200154 }
David Ahern8d3eca22012-08-26 12:24:47 -0600155
Arnaldo Carvalho de Melocf8b2e62013-12-19 14:26:26 -0300156 rec->bytes_written += size;
Jiri Olsadc0c6122017-01-09 10:51:58 +0100157
Jiwei Sun6d575812019-10-22 16:09:01 +0800158 if (record__output_max_size_exceeded(rec) && !done) {
159 fprintf(stderr, "[ perf record: perf size limit reached (%" PRIu64 " KB),"
160 " stopping session ]\n",
161 rec->bytes_written >> 10);
162 done = 1;
163 }
164
Jiri Olsadc0c6122017-01-09 10:51:58 +0100165 if (switch_output_size(rec))
166 trigger_hit(&switch_output_trigger);
167
David Ahern8d3eca22012-08-26 12:24:47 -0600168 return 0;
Peter Zijlstraf5970552009-06-18 23:22:55 +0200169}
170
/*
 * Forward declarations for helpers used by the AIO code below.
 * record__aio_enabled() and record__comp_enabled() are defined later in
 * this file; zstd_compress() is not defined in this part of the file.
 */
static int record__aio_enabled(struct record *rec);
static int record__comp_enabled(struct record *rec);
static size_t zstd_compress(struct perf_session *session, void *dst, size_t dst_size,
			    void *src, size_t src_size);
175
Alexey Budankovd3d1af62018-11-06 12:04:58 +0300176#ifdef HAVE_AIO_SUPPORT
/*
 * Fill in 'cblock' for an asynchronous write of 'size' bytes from 'buf' to
 * 'trace_fd' at offset 'off' and queue it, retrying for as long as
 * aio_write() fails with EAGAIN.
 *
 * On any other failure the control block is marked unused
 * (aio_fildes = -1) and the error is logged.
 *
 * Returns the result of the last aio_write() call: 0 once queued,
 * non-zero on failure.
 */
static int record__aio_write(struct aiocb *cblock, int trace_fd,
		void *buf, size_t size, off_t off)
{
	int rc;

	cblock->aio_fildes = trace_fd;
	cblock->aio_buf    = buf;
	cblock->aio_nbytes = size;
	cblock->aio_offset = off;
	cblock->aio_sigevent.sigev_notify = SIGEV_NONE;

	for (;;) {
		rc = aio_write(cblock);
		if (rc == 0)
			break;

		if (errno != EAGAIN) {
			cblock->aio_fildes = -1;
			pr_err("failed to queue perf data, error: %m\n");
			break;
		}
	}

	return rc;
}
201
Jiri Olsaa5830532019-07-27 20:30:53 +0200202static int record__aio_complete(struct mmap *md, struct aiocb *cblock)
Alexey Budankovd3d1af62018-11-06 12:04:58 +0300203{
204 void *rem_buf;
205 off_t rem_off;
206 size_t rem_size;
207 int rc, aio_errno;
208 ssize_t aio_ret, written;
209
210 aio_errno = aio_error(cblock);
211 if (aio_errno == EINPROGRESS)
212 return 0;
213
214 written = aio_ret = aio_return(cblock);
215 if (aio_ret < 0) {
216 if (aio_errno != EINTR)
217 pr_err("failed to write perf data, error: %m\n");
218 written = 0;
219 }
220
221 rem_size = cblock->aio_nbytes - written;
222
223 if (rem_size == 0) {
224 cblock->aio_fildes = -1;
225 /*
Alexey Budankovef781122019-03-18 20:44:12 +0300226 * md->refcount is incremented in record__aio_pushfn() for
227 * every aio write request started in record__aio_push() so
228 * decrement it because the request is now complete.
Alexey Budankovd3d1af62018-11-06 12:04:58 +0300229 */
Jiri Olsa80e53d12019-10-07 14:53:15 +0200230 perf_mmap__put(&md->core);
Alexey Budankovd3d1af62018-11-06 12:04:58 +0300231 rc = 1;
232 } else {
233 /*
234 * aio write request may require restart with the
235 * reminder if the kernel didn't write whole
236 * chunk at once.
237 */
238 rem_off = cblock->aio_offset + written;
239 rem_buf = (void *)(cblock->aio_buf + written);
240 record__aio_write(cblock, cblock->aio_fildes,
241 rem_buf, rem_size, rem_off);
242 rc = 0;
243 }
244
245 return rc;
246}
247
Jiri Olsaa5830532019-07-27 20:30:53 +0200248static int record__aio_sync(struct mmap *md, bool sync_all)
Alexey Budankovd3d1af62018-11-06 12:04:58 +0300249{
Alexey Budankov93f20c02018-11-06 12:07:19 +0300250 struct aiocb **aiocb = md->aio.aiocb;
251 struct aiocb *cblocks = md->aio.cblocks;
Alexey Budankovd3d1af62018-11-06 12:04:58 +0300252 struct timespec timeout = { 0, 1000 * 1000 * 1 }; /* 1ms */
Alexey Budankov93f20c02018-11-06 12:07:19 +0300253 int i, do_suspend;
Alexey Budankovd3d1af62018-11-06 12:04:58 +0300254
255 do {
Alexey Budankov93f20c02018-11-06 12:07:19 +0300256 do_suspend = 0;
257 for (i = 0; i < md->aio.nr_cblocks; ++i) {
258 if (cblocks[i].aio_fildes == -1 || record__aio_complete(md, &cblocks[i])) {
259 if (sync_all)
260 aiocb[i] = NULL;
261 else
262 return i;
263 } else {
264 /*
265 * Started aio write is not complete yet
266 * so it has to be waited before the
267 * next allocation.
268 */
269 aiocb[i] = &cblocks[i];
270 do_suspend = 1;
271 }
272 }
273 if (!do_suspend)
274 return -1;
Alexey Budankovd3d1af62018-11-06 12:04:58 +0300275
Alexey Budankov93f20c02018-11-06 12:07:19 +0300276 while (aio_suspend((const struct aiocb **)aiocb, md->aio.nr_cblocks, &timeout)) {
Alexey Budankovd3d1af62018-11-06 12:04:58 +0300277 if (!(errno == EAGAIN || errno == EINTR))
278 pr_err("failed to sync perf data, error: %m\n");
279 }
280 } while (1);
281}
282
/* Context handed to record__aio_pushfn() through perf_mmap__push(). */
struct record_aio {
	struct record	*rec;
	void		*data;	/* destination buffer, set from map->aio.data[] in record__aio_push() */
	size_t		 size;	/* bytes placed into 'data' so far */
};
288
Jiri Olsaa5830532019-07-27 20:30:53 +0200289static int record__aio_pushfn(struct mmap *map, void *to, void *buf, size_t size)
Alexey Budankovd3d1af62018-11-06 12:04:58 +0300290{
Alexey Budankovef781122019-03-18 20:44:12 +0300291 struct record_aio *aio = to;
292
293 /*
Jiri Olsa547740f2019-07-27 22:07:44 +0200294 * map->core.base data pointed by buf is copied into free map->aio.data[] buffer
Alexey Budankovef781122019-03-18 20:44:12 +0300295 * to release space in the kernel buffer as fast as possible, calling
296 * perf_mmap__consume() from perf_mmap__push() function.
297 *
298 * That lets the kernel to proceed with storing more profiling data into
299 * the kernel buffer earlier than other per-cpu kernel buffers are handled.
300 *
301 * Coping can be done in two steps in case the chunk of profiling data
302 * crosses the upper bound of the kernel buffer. In this case we first move
303 * part of data from map->start till the upper bound and then the reminder
304 * from the beginning of the kernel buffer till the end of the data chunk.
305 */
306
307 if (record__comp_enabled(aio->rec)) {
308 size = zstd_compress(aio->rec->session, aio->data + aio->size,
Jiri Olsabf59b302019-10-07 14:53:11 +0200309 mmap__mmap_len(map) - aio->size,
Alexey Budankovef781122019-03-18 20:44:12 +0300310 buf, size);
311 } else {
312 memcpy(aio->data + aio->size, buf, size);
313 }
314
315 if (!aio->size) {
316 /*
317 * Increment map->refcount to guard map->aio.data[] buffer
318 * from premature deallocation because map object can be
319 * released earlier than aio write request started on
320 * map->aio.data[] buffer is complete.
321 *
322 * perf_mmap__put() is done at record__aio_complete()
323 * after started aio request completion or at record__aio_push()
324 * if the request failed to start.
325 */
Jiri Olsae75710f2019-10-07 14:53:13 +0200326 perf_mmap__get(&map->core);
Alexey Budankovef781122019-03-18 20:44:12 +0300327 }
328
329 aio->size += size;
330
331 return size;
332}
333
Jiri Olsaa5830532019-07-27 20:30:53 +0200334static int record__aio_push(struct record *rec, struct mmap *map, off_t *off)
Alexey Budankovef781122019-03-18 20:44:12 +0300335{
336 int ret, idx;
337 int trace_fd = rec->session->data->file.fd;
338 struct record_aio aio = { .rec = rec, .size = 0 };
339
340 /*
341 * Call record__aio_sync() to wait till map->aio.data[] buffer
342 * becomes available after previous aio write operation.
343 */
344
345 idx = record__aio_sync(map, false);
346 aio.data = map->aio.data[idx];
347 ret = perf_mmap__push(map, &aio, record__aio_pushfn);
348 if (ret != 0) /* ret > 0 - no data, ret < 0 - error */
349 return ret;
Alexey Budankovd3d1af62018-11-06 12:04:58 +0300350
351 rec->samples++;
Alexey Budankovef781122019-03-18 20:44:12 +0300352 ret = record__aio_write(&(map->aio.cblocks[idx]), trace_fd, aio.data, aio.size, *off);
Alexey Budankovd3d1af62018-11-06 12:04:58 +0300353 if (!ret) {
Alexey Budankovef781122019-03-18 20:44:12 +0300354 *off += aio.size;
355 rec->bytes_written += aio.size;
Alexey Budankovd3d1af62018-11-06 12:04:58 +0300356 if (switch_output_size(rec))
357 trigger_hit(&switch_output_trigger);
Alexey Budankovef781122019-03-18 20:44:12 +0300358 } else {
359 /*
360 * Decrement map->refcount incremented in record__aio_pushfn()
361 * back if record__aio_write() operation failed to start, otherwise
362 * map->refcount is decremented in record__aio_complete() after
363 * aio write operation finishes successfully.
364 */
Jiri Olsa80e53d12019-10-07 14:53:15 +0200365 perf_mmap__put(&map->core);
Alexey Budankovd3d1af62018-11-06 12:04:58 +0300366 }
367
368 return ret;
369}
370
/*
 * Return the current file offset of 'trace_fd' as reported by lseek(),
 * which is (off_t)-1 on failure.
 */
static off_t record__aio_get_pos(int trace_fd)
{
	off_t pos = lseek(trace_fd, 0, SEEK_CUR);

	return pos;
}
375
/* Set the file offset of 'trace_fd' to 'pos'; the lseek() result is not checked. */
static void record__aio_set_pos(int trace_fd, off_t pos)
{
	(void)lseek(trace_fd, pos, SEEK_SET);
}
380
381static void record__aio_mmap_read_sync(struct record *rec)
382{
383 int i;
Jiri Olsa63503db2019-07-21 13:23:52 +0200384 struct evlist *evlist = rec->evlist;
Jiri Olsaa5830532019-07-27 20:30:53 +0200385 struct mmap *maps = evlist->mmap;
Alexey Budankovd3d1af62018-11-06 12:04:58 +0300386
Alexey Budankovef781122019-03-18 20:44:12 +0300387 if (!record__aio_enabled(rec))
Alexey Budankovd3d1af62018-11-06 12:04:58 +0300388 return;
389
Jiri Olsac976ee12019-07-30 13:04:59 +0200390 for (i = 0; i < evlist->core.nr_mmaps; i++) {
Jiri Olsaa5830532019-07-27 20:30:53 +0200391 struct mmap *map = &maps[i];
Alexey Budankovd3d1af62018-11-06 12:04:58 +0300392
Jiri Olsa547740f2019-07-27 22:07:44 +0200393 if (map->core.base)
Alexey Budankov93f20c02018-11-06 12:07:19 +0300394 record__aio_sync(map, true);
Alexey Budankovd3d1af62018-11-06 12:04:58 +0300395 }
396}
397
398static int nr_cblocks_default = 1;
Alexey Budankov93f20c02018-11-06 12:07:19 +0300399static int nr_cblocks_max = 4;
Alexey Budankovd3d1af62018-11-06 12:04:58 +0300400
401static int record__aio_parse(const struct option *opt,
Alexey Budankov93f20c02018-11-06 12:07:19 +0300402 const char *str,
Alexey Budankovd3d1af62018-11-06 12:04:58 +0300403 int unset)
404{
405 struct record_opts *opts = (struct record_opts *)opt->value;
406
Alexey Budankov93f20c02018-11-06 12:07:19 +0300407 if (unset) {
Alexey Budankovd3d1af62018-11-06 12:04:58 +0300408 opts->nr_cblocks = 0;
Alexey Budankov93f20c02018-11-06 12:07:19 +0300409 } else {
410 if (str)
411 opts->nr_cblocks = strtol(str, NULL, 0);
412 if (!opts->nr_cblocks)
413 opts->nr_cblocks = nr_cblocks_default;
414 }
Alexey Budankovd3d1af62018-11-06 12:04:58 +0300415
416 return 0;
417}
418#else /* HAVE_AIO_SUPPORT */
/* Built without HAVE_AIO_SUPPORT: the maximum number of control blocks is 0. */
static int nr_cblocks_max = 0;
420
Jiri Olsaa5830532019-07-27 20:30:53 +0200421static int record__aio_push(struct record *rec __maybe_unused, struct mmap *map __maybe_unused,
Alexey Budankovef781122019-03-18 20:44:12 +0300422 off_t *off __maybe_unused)
Alexey Budankovd3d1af62018-11-06 12:04:58 +0300423{
424 return -1;
425}
426
427static off_t record__aio_get_pos(int trace_fd __maybe_unused)
428{
429 return -1;
430}
431
432static void record__aio_set_pos(int trace_fd __maybe_unused, off_t pos __maybe_unused)
433{
434}
435
436static void record__aio_mmap_read_sync(struct record *rec __maybe_unused)
437{
438}
439#endif
440
441static int record__aio_enabled(struct record *rec)
442{
443 return rec->opts.nr_cblocks > 0;
444}
445
Alexey Budankov470530b2019-03-18 20:40:26 +0300446#define MMAP_FLUSH_DEFAULT 1
447static int record__mmap_flush_parse(const struct option *opt,
448 const char *str,
449 int unset)
450{
451 int flush_max;
452 struct record_opts *opts = (struct record_opts *)opt->value;
453 static struct parse_tag tags[] = {
454 { .tag = 'B', .mult = 1 },
455 { .tag = 'K', .mult = 1 << 10 },
456 { .tag = 'M', .mult = 1 << 20 },
457 { .tag = 'G', .mult = 1 << 30 },
458 { .tag = 0 },
459 };
460
461 if (unset)
462 return 0;
463
464 if (str) {
465 opts->mmap_flush = parse_tag_value(str, tags);
466 if (opts->mmap_flush == (int)-1)
467 opts->mmap_flush = strtol(str, NULL, 0);
468 }
469
470 if (!opts->mmap_flush)
471 opts->mmap_flush = MMAP_FLUSH_DEFAULT;
472
Jiri Olsa9521b5f2019-07-28 12:45:35 +0200473 flush_max = evlist__mmap_size(opts->mmap_pages);
Alexey Budankov470530b2019-03-18 20:40:26 +0300474 flush_max /= 4;
475 if (opts->mmap_flush > flush_max)
476 opts->mmap_flush = flush_max;
477
478 return 0;
479}
480
Alexey Budankov504c1ad2019-03-18 20:44:42 +0300481#ifdef HAVE_ZSTD_SUPPORT
482static unsigned int comp_level_default = 1;
483
484static int record__parse_comp_level(const struct option *opt, const char *str, int unset)
485{
486 struct record_opts *opts = opt->value;
487
488 if (unset) {
489 opts->comp_level = 0;
490 } else {
491 if (str)
492 opts->comp_level = strtol(str, NULL, 0);
493 if (!opts->comp_level)
494 opts->comp_level = comp_level_default;
495 }
496
497 return 0;
498}
499#endif
/* Upper bound for the compression level; its users are outside this part of the file. */
static unsigned int comp_level_max = 22;
501
Alexey Budankov42e1fd82019-03-18 20:41:33 +0300502static int record__comp_enabled(struct record *rec)
503{
504 return rec->opts.comp_level > 0;
505}
506
Arnaldo Carvalho de Melo45694aa2011-11-28 08:30:20 -0200507static int process_synthesized_event(struct perf_tool *tool,
Arnaldo Carvalho de Melod20deb62011-11-25 08:19:45 -0200508 union perf_event *event,
Irina Tirdea1d037ca2012-09-11 01:15:03 +0300509 struct perf_sample *sample __maybe_unused,
510 struct machine *machine __maybe_unused)
Arnaldo Carvalho de Melo234fbbf2009-10-26 19:23:18 -0200511{
Arnaldo Carvalho de Melo8c6f45a2013-12-19 14:38:03 -0300512 struct record *rec = container_of(tool, struct record, tool);
Jiri Olsaded2b8f2018-09-13 14:54:06 +0200513 return record__write(rec, NULL, event, event->header.size);
Arnaldo Carvalho de Melo234fbbf2009-10-26 19:23:18 -0200514}
515
Stephane Eraniand99c22e2020-04-22 08:50:38 -0700516static int process_locked_synthesized_event(struct perf_tool *tool,
517 union perf_event *event,
518 struct perf_sample *sample __maybe_unused,
519 struct machine *machine __maybe_unused)
520{
521 static pthread_mutex_t synth_lock = PTHREAD_MUTEX_INITIALIZER;
522 int ret;
523
524 pthread_mutex_lock(&synth_lock);
525 ret = process_synthesized_event(tool, event, sample, machine);
526 pthread_mutex_unlock(&synth_lock);
527 return ret;
528}
529
Jiri Olsaa5830532019-07-27 20:30:53 +0200530static int record__pushfn(struct mmap *map, void *to, void *bf, size_t size)
Arnaldo Carvalho de Melod37f1582017-10-05 16:39:55 -0300531{
532 struct record *rec = to;
533
Alexey Budankov5d7f4112019-03-18 20:43:35 +0300534 if (record__comp_enabled(rec)) {
Jiri Olsabf59b302019-10-07 14:53:11 +0200535 size = zstd_compress(rec->session, map->data, mmap__mmap_len(map), bf, size);
Alexey Budankov5d7f4112019-03-18 20:43:35 +0300536 bf = map->data;
537 }
538
Arnaldo Carvalho de Melod37f1582017-10-05 16:39:55 -0300539 rec->samples++;
Jiri Olsaded2b8f2018-09-13 14:54:06 +0200540 return record__write(rec, map, bf, size);
Arnaldo Carvalho de Melod37f1582017-10-05 16:39:55 -0300541}
542
/* Number of the terminating signal seen by sig_handler(), -1 if none. */
static volatile int signr = -1;
/* Set by sig_handler() on SIGCHLD. */
static volatile int child_finished;
#ifdef HAVE_EVENTFD_SUPPORT
/* Written by sig_handler() to wake up the poll(); -1 until it is set up. */
static int done_fd = -1;
#endif
Wang Nanc0bdc1c2016-04-13 08:21:06 +0000548
Adrian Hunter2dd6d8a2015-04-30 17:37:32 +0300549static void sig_handler(int sig)
550{
551 if (sig == SIGCHLD)
552 child_finished = 1;
553 else
554 signr = sig;
555
556 done = 1;
Anand K Mistryda231332020-05-13 12:20:23 +1000557#ifdef HAVE_EVENTFD_SUPPORT
558{
559 u64 tmp = 1;
560 /*
561 * It is possible for this signal handler to run after done is checked
562 * in the main loop, but before the perf counter fds are polled. If this
563 * happens, the poll() will continue to wait even though done is set,
564 * and will only break out if either another signal is received, or the
565 * counters are ready for read. To ensure the poll() doesn't sleep when
566 * done is set, use an eventfd (done_fd) to wake up the poll().
567 */
568 if (write(done_fd, &tmp, sizeof(tmp)) < 0)
569 pr_err("failed to signal wakeup fd, error: %m\n");
570}
571#endif // HAVE_EVENTFD_SUPPORT
Adrian Hunter2dd6d8a2015-04-30 17:37:32 +0300572}
573
/*
 * SIGSEGV handler: give perf hooks a chance to recover first, then dump
 * the stack for the signal.
 */
static void sigsegv_handler(int sig)
{
	perf_hooks__recover();

	sighandler_dump_stack(sig);
}
579
Adrian Hunter2dd6d8a2015-04-30 17:37:32 +0300580static void record__sig_exit(void)
581{
582 if (signr == -1)
583 return;
584
585 signal(signr, SIG_DFL);
586 raise(signr);
587}
588
Adrian Huntere31f0d02015-04-30 17:37:27 +0300589#ifdef HAVE_AUXTRACE_SUPPORT
590
Adrian Hunteref149c22015-04-09 18:53:45 +0300591static int record__process_auxtrace(struct perf_tool *tool,
Jiri Olsaa5830532019-07-27 20:30:53 +0200592 struct mmap *map,
Adrian Hunteref149c22015-04-09 18:53:45 +0300593 union perf_event *event, void *data1,
594 size_t len1, void *data2, size_t len2)
595{
596 struct record *rec = container_of(tool, struct record, tool);
Jiri Olsa8ceb41d2017-01-23 22:07:59 +0100597 struct perf_data *data = &rec->data;
Adrian Hunteref149c22015-04-09 18:53:45 +0300598 size_t padding;
599 u8 pad[8] = {0};
600
Adrian Hunter46e201e2019-10-04 11:31:20 +0300601 if (!perf_data__is_pipe(data) && perf_data__is_single_file(data)) {
Adrian Hunter99fa2982015-04-30 17:37:25 +0300602 off_t file_offset;
Jiri Olsa8ceb41d2017-01-23 22:07:59 +0100603 int fd = perf_data__fd(data);
Adrian Hunter99fa2982015-04-30 17:37:25 +0300604 int err;
605
606 file_offset = lseek(fd, 0, SEEK_CUR);
607 if (file_offset == -1)
608 return -1;
609 err = auxtrace_index__auxtrace_event(&rec->session->auxtrace_index,
610 event, file_offset);
611 if (err)
612 return err;
613 }
614
Adrian Hunteref149c22015-04-09 18:53:45 +0300615 /* event.auxtrace.size includes padding, see __auxtrace_mmap__read() */
616 padding = (len1 + len2) & 7;
617 if (padding)
618 padding = 8 - padding;
619
Jiri Olsaded2b8f2018-09-13 14:54:06 +0200620 record__write(rec, map, event, event->header.size);
621 record__write(rec, map, data1, len1);
Adrian Hunteref149c22015-04-09 18:53:45 +0300622 if (len2)
Jiri Olsaded2b8f2018-09-13 14:54:06 +0200623 record__write(rec, map, data2, len2);
624 record__write(rec, map, &pad, padding);
Adrian Hunteref149c22015-04-09 18:53:45 +0300625
626 return 0;
627}
628
629static int record__auxtrace_mmap_read(struct record *rec,
Jiri Olsaa5830532019-07-27 20:30:53 +0200630 struct mmap *map)
Adrian Hunteref149c22015-04-09 18:53:45 +0300631{
632 int ret;
633
Jiri Olsae035f4c2018-09-13 14:54:05 +0200634 ret = auxtrace_mmap__read(map, rec->itr, &rec->tool,
Adrian Hunteref149c22015-04-09 18:53:45 +0300635 record__process_auxtrace);
636 if (ret < 0)
637 return ret;
638
639 if (ret)
640 rec->samples++;
641
642 return 0;
643}
644
Adrian Hunter2dd6d8a2015-04-30 17:37:32 +0300645static int record__auxtrace_mmap_read_snapshot(struct record *rec,
Jiri Olsaa5830532019-07-27 20:30:53 +0200646 struct mmap *map)
Adrian Hunter2dd6d8a2015-04-30 17:37:32 +0300647{
648 int ret;
649
Jiri Olsae035f4c2018-09-13 14:54:05 +0200650 ret = auxtrace_mmap__read_snapshot(map, rec->itr, &rec->tool,
Adrian Hunter2dd6d8a2015-04-30 17:37:32 +0300651 record__process_auxtrace,
652 rec->opts.auxtrace_snapshot_size);
653 if (ret < 0)
654 return ret;
655
656 if (ret)
657 rec->samples++;
658
659 return 0;
660}
661
662static int record__auxtrace_read_snapshot_all(struct record *rec)
663{
664 int i;
665 int rc = 0;
666
Jiri Olsac976ee12019-07-30 13:04:59 +0200667 for (i = 0; i < rec->evlist->core.nr_mmaps; i++) {
Jiri Olsaa5830532019-07-27 20:30:53 +0200668 struct mmap *map = &rec->evlist->mmap[i];
Adrian Hunter2dd6d8a2015-04-30 17:37:32 +0300669
Jiri Olsae035f4c2018-09-13 14:54:05 +0200670 if (!map->auxtrace_mmap.base)
Adrian Hunter2dd6d8a2015-04-30 17:37:32 +0300671 continue;
672
Jiri Olsae035f4c2018-09-13 14:54:05 +0200673 if (record__auxtrace_mmap_read_snapshot(rec, map) != 0) {
Adrian Hunter2dd6d8a2015-04-30 17:37:32 +0300674 rc = -1;
675 goto out;
676 }
677 }
678out:
679 return rc;
680}
681
Alexander Shishkince7b0e42019-08-06 17:41:01 +0300682static void record__read_auxtrace_snapshot(struct record *rec, bool on_exit)
Adrian Hunter2dd6d8a2015-04-30 17:37:32 +0300683{
684 pr_debug("Recording AUX area tracing snapshot\n");
685 if (record__auxtrace_read_snapshot_all(rec) < 0) {
Wang Nan5f9cf592016-04-20 18:59:49 +0000686 trigger_error(&auxtrace_snapshot_trigger);
Adrian Hunter2dd6d8a2015-04-30 17:37:32 +0300687 } else {
Alexander Shishkince7b0e42019-08-06 17:41:01 +0300688 if (auxtrace_record__snapshot_finish(rec->itr, on_exit))
Wang Nan5f9cf592016-04-20 18:59:49 +0000689 trigger_error(&auxtrace_snapshot_trigger);
690 else
691 trigger_ready(&auxtrace_snapshot_trigger);
Adrian Hunter2dd6d8a2015-04-30 17:37:32 +0300692 }
693}
694
Alexander Shishkince7b0e42019-08-06 17:41:01 +0300695static int record__auxtrace_snapshot_exit(struct record *rec)
696{
697 if (trigger_is_error(&auxtrace_snapshot_trigger))
698 return 0;
699
700 if (!auxtrace_record__snapshot_started &&
701 auxtrace_record__snapshot_start(rec->itr))
702 return -1;
703
704 record__read_auxtrace_snapshot(rec, true);
705 if (trigger_is_error(&auxtrace_snapshot_trigger))
706 return -1;
707
708 return 0;
709}
710
Adrian Hunter4b5ea3b2018-03-06 11:13:12 +0200711static int record__auxtrace_init(struct record *rec)
712{
713 int err;
714
715 if (!rec->itr) {
716 rec->itr = auxtrace_record__init(rec->evlist, &err);
717 if (err)
718 return err;
719 }
720
721 err = auxtrace_parse_snapshot_options(rec->itr, &rec->opts,
722 rec->opts.auxtrace_snapshot_opts);
723 if (err)
724 return err;
725
Adrian Hunterc0a6de02019-11-15 14:42:16 +0200726 err = auxtrace_parse_sample_options(rec->itr, rec->evlist, &rec->opts,
727 rec->opts.auxtrace_sample_opts);
728 if (err)
729 return err;
730
Adrian Hunter4b5ea3b2018-03-06 11:13:12 +0200731 return auxtrace_parse_filters(rec->evlist);
732}
733
Adrian Huntere31f0d02015-04-30 17:37:27 +0300734#else
735
736static inline
737int record__auxtrace_mmap_read(struct record *rec __maybe_unused,
Jiri Olsaa5830532019-07-27 20:30:53 +0200738 struct mmap *map __maybe_unused)
Adrian Huntere31f0d02015-04-30 17:37:27 +0300739{
740 return 0;
741}
742
Adrian Hunter2dd6d8a2015-04-30 17:37:32 +0300743static inline
Alexander Shishkince7b0e42019-08-06 17:41:01 +0300744void record__read_auxtrace_snapshot(struct record *rec __maybe_unused,
745 bool on_exit __maybe_unused)
Adrian Hunter2dd6d8a2015-04-30 17:37:32 +0300746{
747}
748
749static inline
750int auxtrace_record__snapshot_start(struct auxtrace_record *itr __maybe_unused)
751{
752 return 0;
753}
754
Alexander Shishkince7b0e42019-08-06 17:41:01 +0300755static inline
756int record__auxtrace_snapshot_exit(struct record *rec __maybe_unused)
757{
758 return 0;
759}
760
Adrian Hunter4b5ea3b2018-03-06 11:13:12 +0200761static int record__auxtrace_init(struct record *rec __maybe_unused)
762{
763 return 0;
764}
765
Adrian Huntere31f0d02015-04-30 17:37:27 +0300766#endif
767
Adrian Huntereeb399b2019-10-04 11:31:21 +0300768static bool record__kcore_readable(struct machine *machine)
769{
770 char kcore[PATH_MAX];
771 int fd;
772
773 scnprintf(kcore, sizeof(kcore), "%s/proc/kcore", machine->root_dir);
774
775 fd = open(kcore, O_RDONLY);
776 if (fd < 0)
777 return false;
778
779 close(fd);
780
781 return true;
782}
783
784static int record__kcore_copy(struct machine *machine, struct perf_data *data)
785{
786 char from_dir[PATH_MAX];
787 char kcore_dir[PATH_MAX];
788 int ret;
789
790 snprintf(from_dir, sizeof(from_dir), "%s/proc", machine->root_dir);
791
792 ret = perf_data__make_kcore_dir(data, kcore_dir, sizeof(kcore_dir));
793 if (ret)
794 return ret;
795
796 return kcore_copy(from_dir, kcore_dir);
797}
798
Wang Nancda57a82016-06-27 10:24:03 +0000799static int record__mmap_evlist(struct record *rec,
Jiri Olsa63503db2019-07-21 13:23:52 +0200800 struct evlist *evlist)
Wang Nancda57a82016-06-27 10:24:03 +0000801{
802 struct record_opts *opts = &rec->opts;
Adrian Hunterc0a6de02019-11-15 14:42:16 +0200803 bool auxtrace_overwrite = opts->auxtrace_snapshot_mode ||
804 opts->auxtrace_sample_mode;
Wang Nancda57a82016-06-27 10:24:03 +0000805 char msg[512];
806
Alexey Budankovf13de662019-01-22 20:50:57 +0300807 if (opts->affinity != PERF_AFFINITY_SYS)
808 cpu__setup_cpunode_map();
809
Jiri Olsa9521b5f2019-07-28 12:45:35 +0200810 if (evlist__mmap_ex(evlist, opts->mmap_pages,
Wang Nancda57a82016-06-27 10:24:03 +0000811 opts->auxtrace_mmap_pages,
Adrian Hunterc0a6de02019-11-15 14:42:16 +0200812 auxtrace_overwrite,
Alexey Budankov470530b2019-03-18 20:40:26 +0300813 opts->nr_cblocks, opts->affinity,
Alexey Budankov51255a82019-03-18 20:42:19 +0300814 opts->mmap_flush, opts->comp_level) < 0) {
Wang Nancda57a82016-06-27 10:24:03 +0000815 if (errno == EPERM) {
816 pr_err("Permission error mapping pages.\n"
817 "Consider increasing "
818 "/proc/sys/kernel/perf_event_mlock_kb,\n"
819 "or try again with a smaller value of -m/--mmap_pages.\n"
820 "(current value: %u,%u)\n",
821 opts->mmap_pages, opts->auxtrace_mmap_pages);
822 return -errno;
823 } else {
824 pr_err("failed to mmap with %d (%s)\n", errno,
Arnaldo Carvalho de Meloc8b5f2c2016-07-06 11:56:20 -0300825 str_error_r(errno, msg, sizeof(msg)));
Wang Nancda57a82016-06-27 10:24:03 +0000826 if (errno)
827 return -errno;
828 else
829 return -EINVAL;
830 }
831 }
832 return 0;
833}
834
835static int record__mmap(struct record *rec)
836{
837 return record__mmap_evlist(rec, rec->evlist);
838}
839
Arnaldo Carvalho de Melo8c6f45a2013-12-19 14:38:03 -0300840static int record__open(struct record *rec)
Arnaldo Carvalho de Melodd7927f2011-01-12 14:28:51 -0200841{
Arnaldo Carvalho de Melod6195a62017-02-13 16:45:24 -0300842 char msg[BUFSIZ];
Jiri Olsa32dcd022019-07-21 13:23:51 +0200843 struct evsel *pos;
Jiri Olsa63503db2019-07-21 13:23:52 +0200844 struct evlist *evlist = rec->evlist;
Arnaldo Carvalho de Melod20deb62011-11-25 08:19:45 -0200845 struct perf_session *session = rec->session;
Arnaldo Carvalho de Melob4006792013-12-19 14:43:45 -0300846 struct record_opts *opts = &rec->opts;
David Ahern8d3eca22012-08-26 12:24:47 -0600847 int rc = 0;
Arnaldo Carvalho de Melodd7927f2011-01-12 14:28:51 -0200848
Arnaldo Carvalho de Melod3dbf432017-11-03 15:34:34 -0300849 /*
Ian Rogers0a892c12020-04-22 10:36:15 -0700850 * For initial_delay or system wide, we need to add a dummy event so
851 * that we can track PERF_RECORD_MMAP to cover the delay of waiting or
852 * event synthesis.
Arnaldo Carvalho de Melod3dbf432017-11-03 15:34:34 -0300853 */
Ian Rogers0a892c12020-04-22 10:36:15 -0700854 if (opts->initial_delay || target__has_cpu(&opts->target)) {
Adrian Hunter442ad2252020-06-29 12:19:51 +0300855 pos = perf_evlist__get_tracking_event(evlist);
856 if (!evsel__is_dummy_event(pos)) {
857 /* Set up dummy event. */
Arnaldo Carvalho de Melofacbf0b2020-07-08 13:49:15 -0300858 if (evlist__add_dummy(evlist))
Adrian Hunter442ad2252020-06-29 12:19:51 +0300859 return -ENOMEM;
860 pos = evlist__last(evlist);
861 perf_evlist__set_tracking_event(evlist, pos);
862 }
Arnaldo Carvalho de Melod3dbf432017-11-03 15:34:34 -0300863
Ian Rogers0a892c12020-04-22 10:36:15 -0700864 /*
865 * Enable the dummy event when the process is forked for
866 * initial_delay, immediately for system wide.
867 */
Adrian Hunter442ad2252020-06-29 12:19:51 +0300868 if (opts->initial_delay && !pos->immediate)
Ian Rogers0a892c12020-04-22 10:36:15 -0700869 pos->core.attr.enable_on_exec = 1;
870 else
871 pos->immediate = 1;
Arnaldo Carvalho de Melod3dbf432017-11-03 15:34:34 -0300872 }
873
Arnaldo Carvalho de Meloe68ae9c2016-04-11 18:15:29 -0300874 perf_evlist__config(evlist, opts, &callchain_param);
Jiri Olsacac21422012-11-12 18:34:00 +0100875
Arnaldo Carvalho de Meloe5cadb92016-06-23 11:26:15 -0300876 evlist__for_each_entry(evlist, pos) {
Ingo Molnar3da297a2009-06-07 17:39:02 +0200877try_again:
Jiri Olsaaf663bd2019-07-21 13:24:39 +0200878 if (evsel__open(pos, pos->core.cpus, pos->core.threads) < 0) {
Arnaldo Carvalho de Meloae430892020-04-30 11:46:15 -0300879 if (evsel__fallback(pos, errno, msg, sizeof(msg))) {
Namhyung Kimbb963e12017-02-17 17:17:38 +0900880 if (verbose > 0)
Arnaldo Carvalho de Meloc0a54342012-12-13 14:16:30 -0300881 ui__warning("%s\n", msg);
Zhang, Yanmind6d901c2010-03-18 11:36:05 -0300882 goto try_again;
883 }
Andi Kleencf99ad12018-10-01 12:59:27 -0700884 if ((errno == EINVAL || errno == EBADF) &&
885 pos->leader != pos &&
886 pos->weak_group) {
Andi Kleen4804e012019-11-20 16:15:19 -0800887 pos = perf_evlist__reset_weak_group(evlist, pos, true);
Andi Kleencf99ad12018-10-01 12:59:27 -0700888 goto try_again;
889 }
Arnaldo Carvalho de Melo56e52e82012-12-13 15:10:58 -0300890 rc = -errno;
Arnaldo Carvalho de Melo2bb72db2020-05-04 13:43:03 -0300891 evsel__open_strerror(pos, &opts->target, errno, msg, sizeof(msg));
Arnaldo Carvalho de Melo56e52e82012-12-13 15:10:58 -0300892 ui__error("%s\n", msg);
David Ahern8d3eca22012-08-26 12:24:47 -0600893 goto out;
Zhang, Yanmind6d901c2010-03-18 11:36:05 -0300894 }
Andi Kleenbfd8f722017-11-17 13:42:58 -0800895
896 pos->supported = true;
Li Zefanc171b552009-10-15 11:22:07 +0800897 }
Arnaldo Carvalho de Meloa43d3f02010-12-25 12:12:25 -0200898
Arnaldo Carvalho de Meloc8b567c2019-09-23 11:07:29 -0300899 if (symbol_conf.kptr_restrict && !perf_evlist__exclude_kernel(evlist)) {
900 pr_warning(
901"WARNING: Kernel address maps (/proc/{kallsyms,modules}) are restricted,\n"
902"check /proc/sys/kernel/kptr_restrict and /proc/sys/kernel/perf_event_paranoid.\n\n"
903"Samples in kernel functions may not be resolved if a suitable vmlinux\n"
904"file is not found in the buildid cache or in the vmlinux path.\n\n"
905"Samples in kernel modules won't be resolved at all.\n\n"
906"If some relocation was applied (e.g. kexec) symbols may be misresolved\n"
907"even with a suitable vmlinux or kallsyms file.\n\n");
908 }
909
Arnaldo Carvalho de Melo23d4aad2015-03-24 19:23:47 -0300910 if (perf_evlist__apply_filters(evlist, &pos)) {
Arnaldo Carvalho de Melo62d94b02017-06-27 11:22:31 -0300911 pr_err("failed to set filter \"%s\" on event %s with %d (%s)\n",
Arnaldo Carvalho de Melo8ab2e962020-04-29 16:07:09 -0300912 pos->filter, evsel__name(pos), errno,
Arnaldo Carvalho de Meloc8b5f2c2016-07-06 11:56:20 -0300913 str_error_r(errno, msg, sizeof(msg)));
David Ahern8d3eca22012-08-26 12:24:47 -0600914 rc = -1;
915 goto out;
Frederic Weisbecker0a102472011-02-26 04:51:54 +0100916 }
917
Wang Nancda57a82016-06-27 10:24:03 +0000918 rc = record__mmap(rec);
919 if (rc)
David Ahern8d3eca22012-08-26 12:24:47 -0600920 goto out;
Arnaldo Carvalho de Melo0a27d7f2011-01-14 15:50:51 -0200921
Jiri Olsa563aecb2013-06-05 13:35:06 +0200922 session->evlist = evlist;
Arnaldo Carvalho de Melo7b56cce2012-08-01 19:31:00 -0300923 perf_session__set_id_hdr_size(session);
David Ahern8d3eca22012-08-26 12:24:47 -0600924out:
925 return rc;
Peter Zijlstra16c8a102009-05-05 17:50:27 +0200926}
927
Namhyung Kime3d59112015-01-29 17:06:44 +0900928static int process_sample_event(struct perf_tool *tool,
929 union perf_event *event,
930 struct perf_sample *sample,
Jiri Olsa32dcd022019-07-21 13:23:51 +0200931 struct evsel *evsel,
Namhyung Kime3d59112015-01-29 17:06:44 +0900932 struct machine *machine)
933{
934 struct record *rec = container_of(tool, struct record, tool);
935
Jin Yao68588ba2017-12-08 21:13:42 +0800936 if (rec->evlist->first_sample_time == 0)
937 rec->evlist->first_sample_time = sample->time;
Namhyung Kime3d59112015-01-29 17:06:44 +0900938
Jin Yao68588ba2017-12-08 21:13:42 +0800939 rec->evlist->last_sample_time = sample->time;
940
941 if (rec->buildid_all)
942 return 0;
943
944 rec->samples++;
Namhyung Kime3d59112015-01-29 17:06:44 +0900945 return build_id__mark_dso_hit(tool, event, sample, evsel, machine);
946}
947
Arnaldo Carvalho de Melo8c6f45a2013-12-19 14:38:03 -0300948static int process_buildids(struct record *rec)
Arnaldo Carvalho de Melo6122e4e2010-02-03 16:52:05 -0200949{
Jiri Olsaf5fc14122013-10-15 16:27:32 +0200950 struct perf_session *session = rec->session;
Arnaldo Carvalho de Melo6122e4e2010-02-03 16:52:05 -0200951
Jiri Olsa45112e82019-02-21 10:41:29 +0100952 if (perf_data__size(&rec->data) == 0)
Arnaldo Carvalho de Melo9f591fd2010-03-11 15:53:11 -0300953 return 0;
954
Namhyung Kim00dc8652014-11-04 10:14:32 +0900955 /*
956 * During this process, it'll load kernel map and replace the
957 * dso->long_name to a real pathname it found. In this case
958 * we prefer the vmlinux path like
959 * /lib/modules/3.16.4/build/vmlinux
960 *
961 * rather than build-id path (in debug directory).
962 * $HOME/.debug/.build-id/f0/6e17aa50adf4d00b88925e03775de107611551
963 */
964 symbol_conf.ignore_vmlinux_buildid = true;
965
Namhyung Kim61566812016-01-11 22:37:09 +0900966 /*
967 * If --buildid-all is given, it marks all DSO regardless of hits,
Jin Yao68588ba2017-12-08 21:13:42 +0800968 * so no need to process samples. But if timestamp_boundary is enabled,
969 * it still needs to walk on all samples to get the timestamps of
970 * first/last samples.
Namhyung Kim61566812016-01-11 22:37:09 +0900971 */
Jin Yao68588ba2017-12-08 21:13:42 +0800972 if (rec->buildid_all && !rec->timestamp_boundary)
Namhyung Kim61566812016-01-11 22:37:09 +0900973 rec->tool.sample = NULL;
974
Arnaldo Carvalho de Melob7b61cb2015-03-03 11:58:45 -0300975 return perf_session__process_events(session);
Arnaldo Carvalho de Melo6122e4e2010-02-03 16:52:05 -0200976}
977
Arnaldo Carvalho de Melo8115d602011-01-29 14:01:45 -0200978static void perf_event__synthesize_guest_os(struct machine *machine, void *data)
Zhang, Yanmina1645ce2010-04-19 13:32:50 +0800979{
980 int err;
Arnaldo Carvalho de Melo45694aa2011-11-28 08:30:20 -0200981 struct perf_tool *tool = data;
Zhang, Yanmina1645ce2010-04-19 13:32:50 +0800982 /*
983 *As for guest kernel when processing subcommand record&report,
984 *we arrange module mmap prior to guest kernel mmap and trigger
985 *a preload dso because default guest module symbols are loaded
986 *from guest kallsyms instead of /lib/modules/XXX/XXX. This
987 *method is used to avoid symbol missing when the first addr is
988 *in module instead of in guest kernel.
989 */
Arnaldo Carvalho de Melo45694aa2011-11-28 08:30:20 -0200990 err = perf_event__synthesize_modules(tool, process_synthesized_event,
Arnaldo Carvalho de Melo743eb862011-11-28 07:56:39 -0200991 machine);
Zhang, Yanmina1645ce2010-04-19 13:32:50 +0800992 if (err < 0)
993 pr_err("Couldn't record guest kernel [%d]'s reference"
Arnaldo Carvalho de Melo23346f22010-04-27 21:17:50 -0300994 " relocation symbol.\n", machine->pid);
Zhang, Yanmina1645ce2010-04-19 13:32:50 +0800995
Zhang, Yanmina1645ce2010-04-19 13:32:50 +0800996 /*
997 * We use _stext for guest kernel because guest kernel's /proc/kallsyms
998 * have no _text sometimes.
999 */
Arnaldo Carvalho de Melo45694aa2011-11-28 08:30:20 -02001000 err = perf_event__synthesize_kernel_mmap(tool, process_synthesized_event,
Adrian Hunter0ae617b2014-01-29 16:14:40 +02001001 machine);
Zhang, Yanmina1645ce2010-04-19 13:32:50 +08001002 if (err < 0)
1003 pr_err("Couldn't record guest kernel [%d]'s reference"
Arnaldo Carvalho de Melo23346f22010-04-27 21:17:50 -03001004 " relocation symbol.\n", machine->pid);
Zhang, Yanmina1645ce2010-04-19 13:32:50 +08001005}
1006
Frederic Weisbecker98402802010-05-02 22:05:29 +02001007static struct perf_event_header finished_round_event = {
1008 .size = sizeof(struct perf_event_header),
1009 .type = PERF_RECORD_FINISHED_ROUND,
1010};
1011
Jiri Olsaa5830532019-07-27 20:30:53 +02001012static void record__adjust_affinity(struct record *rec, struct mmap *map)
Alexey Budankovf13de662019-01-22 20:50:57 +03001013{
1014 if (rec->opts.affinity != PERF_AFFINITY_SYS &&
Alexey Budankov8384a262019-12-03 14:45:27 +03001015 !bitmap_equal(rec->affinity_mask.bits, map->affinity_mask.bits,
1016 rec->affinity_mask.nbits)) {
1017 bitmap_zero(rec->affinity_mask.bits, rec->affinity_mask.nbits);
1018 bitmap_or(rec->affinity_mask.bits, rec->affinity_mask.bits,
1019 map->affinity_mask.bits, rec->affinity_mask.nbits);
1020 sched_setaffinity(0, MMAP_CPU_MASK_BYTES(&rec->affinity_mask),
1021 (cpu_set_t *)rec->affinity_mask.bits);
1022 if (verbose == 2)
1023 mmap_cpu_mask__scnprintf(&rec->affinity_mask, "thread");
Alexey Budankovf13de662019-01-22 20:50:57 +03001024 }
1025}
1026
Alexey Budankov5d7f4112019-03-18 20:43:35 +03001027static size_t process_comp_header(void *record, size_t increment)
1028{
Jiri Olsa72932372019-08-28 15:57:16 +02001029 struct perf_record_compressed *event = record;
Alexey Budankov5d7f4112019-03-18 20:43:35 +03001030 size_t size = sizeof(*event);
1031
1032 if (increment) {
1033 event->header.size += increment;
1034 return increment;
1035 }
1036
1037 event->header.type = PERF_RECORD_COMPRESSED;
1038 event->header.size = size;
1039
1040 return size;
1041}
1042
1043static size_t zstd_compress(struct perf_session *session, void *dst, size_t dst_size,
1044 void *src, size_t src_size)
1045{
1046 size_t compressed;
Jiri Olsa72932372019-08-28 15:57:16 +02001047 size_t max_record_size = PERF_SAMPLE_MAX_SIZE - sizeof(struct perf_record_compressed) - 1;
Alexey Budankov5d7f4112019-03-18 20:43:35 +03001048
1049 compressed = zstd_compress_stream_to_records(&session->zstd_data, dst, dst_size, src, src_size,
1050 max_record_size, process_comp_header);
1051
1052 session->bytes_transferred += src_size;
1053 session->bytes_compressed += compressed;
1054
1055 return compressed;
1056}
1057
Jiri Olsa63503db2019-07-21 13:23:52 +02001058static int record__mmap_read_evlist(struct record *rec, struct evlist *evlist,
Alexey Budankov470530b2019-03-18 20:40:26 +03001059 bool overwrite, bool synch)
Frederic Weisbecker98402802010-05-02 22:05:29 +02001060{
Jiri Olsadcabb502014-07-25 16:56:16 +02001061 u64 bytes_written = rec->bytes_written;
Peter Zijlstra0e2e63d2010-05-20 14:45:26 +02001062 int i;
David Ahern8d3eca22012-08-26 12:24:47 -06001063 int rc = 0;
Jiri Olsaa5830532019-07-27 20:30:53 +02001064 struct mmap *maps;
Alexey Budankovd3d1af62018-11-06 12:04:58 +03001065 int trace_fd = rec->data.file.fd;
Alexey Budankovef781122019-03-18 20:44:12 +03001066 off_t off = 0;
Frederic Weisbecker98402802010-05-02 22:05:29 +02001067
Wang Nancb216862016-06-27 10:24:04 +00001068 if (!evlist)
1069 return 0;
Adrian Hunteref149c22015-04-09 18:53:45 +03001070
Wang Nan0b72d692017-12-04 16:51:07 +00001071 maps = overwrite ? evlist->overwrite_mmap : evlist->mmap;
Wang Nana4ea0ec2016-07-14 08:34:36 +00001072 if (!maps)
1073 return 0;
Wang Nancb216862016-06-27 10:24:04 +00001074
Wang Nan0b72d692017-12-04 16:51:07 +00001075 if (overwrite && evlist->bkw_mmap_state != BKW_MMAP_DATA_PENDING)
Wang Nan54cc54d2016-07-14 08:34:42 +00001076 return 0;
1077
Alexey Budankovd3d1af62018-11-06 12:04:58 +03001078 if (record__aio_enabled(rec))
1079 off = record__aio_get_pos(trace_fd);
1080
Jiri Olsac976ee12019-07-30 13:04:59 +02001081 for (i = 0; i < evlist->core.nr_mmaps; i++) {
Alexey Budankov470530b2019-03-18 20:40:26 +03001082 u64 flush = 0;
Jiri Olsaa5830532019-07-27 20:30:53 +02001083 struct mmap *map = &maps[i];
Wang Nana4ea0ec2016-07-14 08:34:36 +00001084
Jiri Olsa547740f2019-07-27 22:07:44 +02001085 if (map->core.base) {
Alexey Budankovf13de662019-01-22 20:50:57 +03001086 record__adjust_affinity(rec, map);
Alexey Budankov470530b2019-03-18 20:40:26 +03001087 if (synch) {
Jiri Olsa65aa2e62019-08-27 16:05:18 +02001088 flush = map->core.flush;
1089 map->core.flush = 1;
Alexey Budankov470530b2019-03-18 20:40:26 +03001090 }
Alexey Budankovd3d1af62018-11-06 12:04:58 +03001091 if (!record__aio_enabled(rec)) {
Alexey Budankovef781122019-03-18 20:44:12 +03001092 if (perf_mmap__push(map, rec, record__pushfn) < 0) {
Alexey Budankov470530b2019-03-18 20:40:26 +03001093 if (synch)
Jiri Olsa65aa2e62019-08-27 16:05:18 +02001094 map->core.flush = flush;
Alexey Budankovd3d1af62018-11-06 12:04:58 +03001095 rc = -1;
1096 goto out;
1097 }
1098 } else {
Alexey Budankovef781122019-03-18 20:44:12 +03001099 if (record__aio_push(rec, map, &off) < 0) {
Alexey Budankovd3d1af62018-11-06 12:04:58 +03001100 record__aio_set_pos(trace_fd, off);
Alexey Budankov470530b2019-03-18 20:40:26 +03001101 if (synch)
Jiri Olsa65aa2e62019-08-27 16:05:18 +02001102 map->core.flush = flush;
Alexey Budankovd3d1af62018-11-06 12:04:58 +03001103 rc = -1;
1104 goto out;
1105 }
David Ahern8d3eca22012-08-26 12:24:47 -06001106 }
Alexey Budankov470530b2019-03-18 20:40:26 +03001107 if (synch)
Jiri Olsa65aa2e62019-08-27 16:05:18 +02001108 map->core.flush = flush;
David Ahern8d3eca22012-08-26 12:24:47 -06001109 }
Adrian Hunteref149c22015-04-09 18:53:45 +03001110
Jiri Olsae035f4c2018-09-13 14:54:05 +02001111 if (map->auxtrace_mmap.base && !rec->opts.auxtrace_snapshot_mode &&
Adrian Hunterc0a6de02019-11-15 14:42:16 +02001112 !rec->opts.auxtrace_sample_mode &&
Jiri Olsae035f4c2018-09-13 14:54:05 +02001113 record__auxtrace_mmap_read(rec, map) != 0) {
Adrian Hunteref149c22015-04-09 18:53:45 +03001114 rc = -1;
1115 goto out;
1116 }
Frederic Weisbecker98402802010-05-02 22:05:29 +02001117 }
1118
Alexey Budankovd3d1af62018-11-06 12:04:58 +03001119 if (record__aio_enabled(rec))
1120 record__aio_set_pos(trace_fd, off);
1121
Jiri Olsadcabb502014-07-25 16:56:16 +02001122 /*
1123 * Mark the round finished in case we wrote
1124 * at least one event.
1125 */
1126 if (bytes_written != rec->bytes_written)
Jiri Olsaded2b8f2018-09-13 14:54:06 +02001127 rc = record__write(rec, NULL, &finished_round_event, sizeof(finished_round_event));
David Ahern8d3eca22012-08-26 12:24:47 -06001128
Wang Nan0b72d692017-12-04 16:51:07 +00001129 if (overwrite)
Wang Nan54cc54d2016-07-14 08:34:42 +00001130 perf_evlist__toggle_bkw_mmap(evlist, BKW_MMAP_EMPTY);
David Ahern8d3eca22012-08-26 12:24:47 -06001131out:
1132 return rc;
Frederic Weisbecker98402802010-05-02 22:05:29 +02001133}
1134
Alexey Budankov470530b2019-03-18 20:40:26 +03001135static int record__mmap_read_all(struct record *rec, bool synch)
Wang Nancb216862016-06-27 10:24:04 +00001136{
1137 int err;
1138
Alexey Budankov470530b2019-03-18 20:40:26 +03001139 err = record__mmap_read_evlist(rec, rec->evlist, false, synch);
Wang Nancb216862016-06-27 10:24:04 +00001140 if (err)
1141 return err;
1142
Alexey Budankov470530b2019-03-18 20:40:26 +03001143 return record__mmap_read_evlist(rec, rec->evlist, true, synch);
Wang Nancb216862016-06-27 10:24:04 +00001144}
1145
Arnaldo Carvalho de Melo8c6f45a2013-12-19 14:38:03 -03001146static void record__init_features(struct record *rec)
David Ahern57706ab2013-11-06 11:41:34 -07001147{
David Ahern57706ab2013-11-06 11:41:34 -07001148 struct perf_session *session = rec->session;
1149 int feat;
1150
1151 for (feat = HEADER_FIRST_FEATURE; feat < HEADER_LAST_FEATURE; feat++)
1152 perf_header__set_feat(&session->header, feat);
1153
1154 if (rec->no_buildid)
1155 perf_header__clear_feat(&session->header, HEADER_BUILD_ID);
1156
Jiri Olsace9036a2019-07-21 13:24:23 +02001157 if (!have_tracepoints(&rec->evlist->core.entries))
David Ahern57706ab2013-11-06 11:41:34 -07001158 perf_header__clear_feat(&session->header, HEADER_TRACING_DATA);
1159
1160 if (!rec->opts.branch_stack)
1161 perf_header__clear_feat(&session->header, HEADER_BRANCH_STACK);
Adrian Hunteref149c22015-04-09 18:53:45 +03001162
1163 if (!rec->opts.full_auxtrace)
1164 perf_header__clear_feat(&session->header, HEADER_AUXTRACE);
Jiri Olsaffa517a2015-10-25 15:51:43 +01001165
Alexey Budankovcf790512018-10-09 17:36:24 +03001166 if (!(rec->opts.use_clockid && rec->opts.clockid_res_ns))
1167 perf_header__clear_feat(&session->header, HEADER_CLOCKID);
1168
Jiri Olsa258031c2019-03-08 14:47:39 +01001169 perf_header__clear_feat(&session->header, HEADER_DIR_FORMAT);
Alexey Budankov42e1fd82019-03-18 20:41:33 +03001170 if (!record__comp_enabled(rec))
1171 perf_header__clear_feat(&session->header, HEADER_COMPRESSED);
Jiri Olsa258031c2019-03-08 14:47:39 +01001172
Jiri Olsaffa517a2015-10-25 15:51:43 +01001173 perf_header__clear_feat(&session->header, HEADER_STAT);
David Ahern57706ab2013-11-06 11:41:34 -07001174}
1175
Wang Nane1ab48b2016-02-26 09:32:10 +00001176static void
1177record__finish_output(struct record *rec)
1178{
Jiri Olsa8ceb41d2017-01-23 22:07:59 +01001179 struct perf_data *data = &rec->data;
1180 int fd = perf_data__fd(data);
Wang Nane1ab48b2016-02-26 09:32:10 +00001181
Jiri Olsa8ceb41d2017-01-23 22:07:59 +01001182 if (data->is_pipe)
Wang Nane1ab48b2016-02-26 09:32:10 +00001183 return;
1184
1185 rec->session->header.data_size += rec->bytes_written;
Jiri Olsa45112e82019-02-21 10:41:29 +01001186 data->file.size = lseek(perf_data__fd(data), 0, SEEK_CUR);
Wang Nane1ab48b2016-02-26 09:32:10 +00001187
1188 if (!rec->no_buildid) {
1189 process_buildids(rec);
1190
1191 if (rec->buildid_all)
1192 dsos__hit_all(rec->session);
1193 }
1194 perf_session__write_header(rec->session, rec->evlist, fd, true);
1195
1196 return;
1197}
1198
Wang Nan4ea648a2016-07-14 08:34:47 +00001199static int record__synthesize_workload(struct record *rec, bool tail)
Wang Nanbe7b0c92016-04-20 18:59:54 +00001200{
Arnaldo Carvalho de Melo9d6aae72017-02-14 10:59:04 -03001201 int err;
Jiri Olsa9749b902019-07-21 13:23:50 +02001202 struct perf_thread_map *thread_map;
Wang Nanbe7b0c92016-04-20 18:59:54 +00001203
Wang Nan4ea648a2016-07-14 08:34:47 +00001204 if (rec->opts.tail_synthesize != tail)
1205 return 0;
1206
Arnaldo Carvalho de Melo9d6aae72017-02-14 10:59:04 -03001207 thread_map = thread_map__new_by_tid(rec->evlist->workload.pid);
1208 if (thread_map == NULL)
1209 return -1;
1210
1211 err = perf_event__synthesize_thread_map(&rec->tool, thread_map,
Wang Nanbe7b0c92016-04-20 18:59:54 +00001212 process_synthesized_event,
1213 &rec->session->machines.host,
Mark Drayton3fcb10e2018-12-04 12:34:20 -08001214 rec->opts.sample_address);
Jiri Olsa7836e522019-07-21 13:24:20 +02001215 perf_thread_map__put(thread_map);
Arnaldo Carvalho de Melo9d6aae72017-02-14 10:59:04 -03001216 return err;
Wang Nanbe7b0c92016-04-20 18:59:54 +00001217}
1218
Wang Nan4ea648a2016-07-14 08:34:47 +00001219static int record__synthesize(struct record *rec, bool tail);
Wang Nan3c1cb7e2016-04-20 18:59:50 +00001220
Wang Nanecfd7a92016-04-13 08:21:07 +00001221static int
1222record__switch_output(struct record *rec, bool at_exit)
1223{
Jiri Olsa8ceb41d2017-01-23 22:07:59 +01001224 struct perf_data *data = &rec->data;
Wang Nanecfd7a92016-04-13 08:21:07 +00001225 int fd, err;
Andi Kleen03724b22019-03-14 15:49:55 -07001226 char *new_filename;
Wang Nanecfd7a92016-04-13 08:21:07 +00001227
1228 /* Same Size: "2015122520103046"*/
1229 char timestamp[] = "InvalidTimestamp";
1230
Alexey Budankovd3d1af62018-11-06 12:04:58 +03001231 record__aio_mmap_read_sync(rec);
1232
Wang Nan4ea648a2016-07-14 08:34:47 +00001233 record__synthesize(rec, true);
1234 if (target__none(&rec->opts.target))
1235 record__synthesize_workload(rec, true);
1236
Wang Nanecfd7a92016-04-13 08:21:07 +00001237 rec->samples = 0;
1238 record__finish_output(rec);
1239 err = fetch_current_timestamp(timestamp, sizeof(timestamp));
1240 if (err) {
1241 pr_err("Failed to get current timestamp\n");
1242 return -EINVAL;
1243 }
1244
Jiri Olsa8ceb41d2017-01-23 22:07:59 +01001245 fd = perf_data__switch(data, timestamp,
Wang Nanecfd7a92016-04-13 08:21:07 +00001246 rec->session->header.data_offset,
Andi Kleen03724b22019-03-14 15:49:55 -07001247 at_exit, &new_filename);
Wang Nanecfd7a92016-04-13 08:21:07 +00001248 if (fd >= 0 && !at_exit) {
1249 rec->bytes_written = 0;
1250 rec->session->header.data_size = 0;
1251 }
1252
1253 if (!quiet)
1254 fprintf(stderr, "[ perf record: Dump %s.%s ]\n",
Jiri Olsa2d4f2792019-02-21 10:41:30 +01001255 data->path, timestamp);
Wang Nan3c1cb7e2016-04-20 18:59:50 +00001256
Andi Kleen03724b22019-03-14 15:49:55 -07001257 if (rec->switch_output.num_files) {
1258 int n = rec->switch_output.cur_file + 1;
1259
1260 if (n >= rec->switch_output.num_files)
1261 n = 0;
1262 rec->switch_output.cur_file = n;
1263 if (rec->switch_output.filenames[n]) {
1264 remove(rec->switch_output.filenames[n]);
Arnaldo Carvalho de Melod8f9da22019-07-04 12:06:20 -03001265 zfree(&rec->switch_output.filenames[n]);
Andi Kleen03724b22019-03-14 15:49:55 -07001266 }
1267 rec->switch_output.filenames[n] = new_filename;
1268 } else {
1269 free(new_filename);
1270 }
1271
Wang Nan3c1cb7e2016-04-20 18:59:50 +00001272 /* Output tracking events */
Wang Nanbe7b0c92016-04-20 18:59:54 +00001273 if (!at_exit) {
Wang Nan4ea648a2016-07-14 08:34:47 +00001274 record__synthesize(rec, false);
Wang Nan3c1cb7e2016-04-20 18:59:50 +00001275
Wang Nanbe7b0c92016-04-20 18:59:54 +00001276 /*
1277 * In 'perf record --switch-output' without -a,
1278 * record__synthesize() in record__switch_output() won't
1279 * generate tracking events because there's no thread_map
1280 * in evlist. Which causes newly created perf.data doesn't
1281 * contain map and comm information.
1282 * Create a fake thread_map and directly call
1283 * perf_event__synthesize_thread_map() for those events.
1284 */
1285 if (target__none(&rec->opts.target))
Wang Nan4ea648a2016-07-14 08:34:47 +00001286 record__synthesize_workload(rec, false);
Wang Nanbe7b0c92016-04-20 18:59:54 +00001287 }
Wang Nanecfd7a92016-04-13 08:21:07 +00001288 return fd;
1289}
1290
Arnaldo Carvalho de Melof33cbe72014-01-02 15:11:25 -03001291static volatile int workload_exec_errno;
1292
1293/*
1294 * perf_evlist__prepare_workload will send a SIGUSR1
1295 * if the fork fails, since we asked by setting its
1296 * want_signal to true.
1297 */
Namhyung Kim45604712014-05-12 09:47:24 +09001298static void workload_exec_failed_signal(int signo __maybe_unused,
1299 siginfo_t *info,
Arnaldo Carvalho de Melof33cbe72014-01-02 15:11:25 -03001300 void *ucontext __maybe_unused)
1301{
1302 workload_exec_errno = info->si_value.sival_int;
1303 done = 1;
Arnaldo Carvalho de Melof33cbe72014-01-02 15:11:25 -03001304 child_finished = 1;
1305}
1306
Adrian Hunter2dd6d8a2015-04-30 17:37:32 +03001307static void snapshot_sig_handler(int sig);
Jiri Olsabfacbe32017-01-09 10:52:00 +01001308static void alarm_sig_handler(int sig);
Adrian Hunter2dd6d8a2015-04-30 17:37:32 +03001309
Wang Nanee667f92016-06-27 10:24:05 +00001310static const struct perf_event_mmap_page *
Jiri Olsa63503db2019-07-21 13:23:52 +02001311perf_evlist__pick_pc(struct evlist *evlist)
Wang Nanee667f92016-06-27 10:24:05 +00001312{
Wang Nanb2cb6152016-07-14 08:34:39 +00001313 if (evlist) {
Jiri Olsa547740f2019-07-27 22:07:44 +02001314 if (evlist->mmap && evlist->mmap[0].core.base)
1315 return evlist->mmap[0].core.base;
1316 if (evlist->overwrite_mmap && evlist->overwrite_mmap[0].core.base)
1317 return evlist->overwrite_mmap[0].core.base;
Wang Nanb2cb6152016-07-14 08:34:39 +00001318 }
Wang Nanee667f92016-06-27 10:24:05 +00001319 return NULL;
1320}
1321
Wang Nanc45628b2016-05-24 02:28:59 +00001322static const struct perf_event_mmap_page *record__pick_pc(struct record *rec)
1323{
Wang Nanee667f92016-06-27 10:24:05 +00001324 const struct perf_event_mmap_page *pc;
1325
1326 pc = perf_evlist__pick_pc(rec->evlist);
1327 if (pc)
1328 return pc;
Wang Nanc45628b2016-05-24 02:28:59 +00001329 return NULL;
1330}
1331
Wang Nan4ea648a2016-07-14 08:34:47 +00001332static int record__synthesize(struct record *rec, bool tail)
Wang Nanc45c86e2016-02-26 09:32:07 +00001333{
1334 struct perf_session *session = rec->session;
1335 struct machine *machine = &session->machines.host;
Jiri Olsa8ceb41d2017-01-23 22:07:59 +01001336 struct perf_data *data = &rec->data;
Wang Nanc45c86e2016-02-26 09:32:07 +00001337 struct record_opts *opts = &rec->opts;
1338 struct perf_tool *tool = &rec->tool;
Jiri Olsa8ceb41d2017-01-23 22:07:59 +01001339 int fd = perf_data__fd(data);
Wang Nanc45c86e2016-02-26 09:32:07 +00001340 int err = 0;
Stephane Eraniand99c22e2020-04-22 08:50:38 -07001341 event_op f = process_synthesized_event;
Wang Nanc45c86e2016-02-26 09:32:07 +00001342
Wang Nan4ea648a2016-07-14 08:34:47 +00001343 if (rec->opts.tail_synthesize != tail)
1344 return 0;
1345
Jiri Olsa8ceb41d2017-01-23 22:07:59 +01001346 if (data->is_pipe) {
Jiri Olsaa2015512018-03-14 10:22:04 +01001347 /*
1348 * We need to synthesize events first, because some
1349 * features works on top of them (on report side).
1350 */
Jiri Olsa318ec182018-08-30 08:32:15 +02001351 err = perf_event__synthesize_attrs(tool, rec->evlist,
Wang Nanc45c86e2016-02-26 09:32:07 +00001352 process_synthesized_event);
1353 if (err < 0) {
1354 pr_err("Couldn't synthesize attrs.\n");
1355 goto out;
1356 }
1357
Jiri Olsaa2015512018-03-14 10:22:04 +01001358 err = perf_event__synthesize_features(tool, session, rec->evlist,
1359 process_synthesized_event);
1360 if (err < 0) {
1361 pr_err("Couldn't synthesize features.\n");
1362 return err;
1363 }
1364
Jiri Olsace9036a2019-07-21 13:24:23 +02001365 if (have_tracepoints(&rec->evlist->core.entries)) {
Wang Nanc45c86e2016-02-26 09:32:07 +00001366 /*
1367 * FIXME err <= 0 here actually means that
1368 * there were no tracepoints so its not really
1369 * an error, just that we don't need to
1370 * synthesize anything. We really have to
1371 * return this more properly and also
1372 * propagate errors that now are calling die()
1373 */
1374 err = perf_event__synthesize_tracing_data(tool, fd, rec->evlist,
1375 process_synthesized_event);
1376 if (err <= 0) {
1377 pr_err("Couldn't record tracing data.\n");
1378 goto out;
1379 }
1380 rec->bytes_written += err;
1381 }
1382 }
1383
Wang Nanc45628b2016-05-24 02:28:59 +00001384 err = perf_event__synth_time_conv(record__pick_pc(rec), tool,
Adrian Hunter46bc29b2016-03-08 10:38:44 +02001385 process_synthesized_event, machine);
1386 if (err)
1387 goto out;
1388
Adrian Hunterc0a6de02019-11-15 14:42:16 +02001389 /* Synthesize id_index before auxtrace_info */
1390 if (rec->opts.auxtrace_sample_mode) {
1391 err = perf_event__synthesize_id_index(tool,
1392 process_synthesized_event,
1393 session->evlist, machine);
1394 if (err)
1395 goto out;
1396 }
1397
Wang Nanc45c86e2016-02-26 09:32:07 +00001398 if (rec->opts.full_auxtrace) {
1399 err = perf_event__synthesize_auxtrace_info(rec->itr, tool,
1400 session, process_synthesized_event);
1401 if (err)
1402 goto out;
1403 }
1404
Arnaldo Carvalho de Melo6c443952017-11-14 11:03:19 -03001405 if (!perf_evlist__exclude_kernel(rec->evlist)) {
1406 err = perf_event__synthesize_kernel_mmap(tool, process_synthesized_event,
1407 machine);
1408 WARN_ONCE(err < 0, "Couldn't record kernel reference relocation symbol\n"
1409 "Symbol resolution may be skewed if relocation was used (e.g. kexec).\n"
1410 "Check /proc/kallsyms permission or run as root.\n");
Wang Nanc45c86e2016-02-26 09:32:07 +00001411
Arnaldo Carvalho de Melo6c443952017-11-14 11:03:19 -03001412 err = perf_event__synthesize_modules(tool, process_synthesized_event,
1413 machine);
1414 WARN_ONCE(err < 0, "Couldn't record kernel module information.\n"
1415 "Symbol resolution may be skewed if relocation was used (e.g. kexec).\n"
1416 "Check /proc/modules permission or run as root.\n");
1417 }
Wang Nanc45c86e2016-02-26 09:32:07 +00001418
1419 if (perf_guest) {
1420 machines__process_guests(&session->machines,
1421 perf_event__synthesize_guest_os, tool);
1422 }
1423
Andi Kleenbfd8f722017-11-17 13:42:58 -08001424 err = perf_event__synthesize_extra_attr(&rec->tool,
1425 rec->evlist,
1426 process_synthesized_event,
1427 data->is_pipe);
1428 if (err)
1429 goto out;
1430
Jiri Olsa03617c22019-07-21 13:24:42 +02001431 err = perf_event__synthesize_thread_map2(&rec->tool, rec->evlist->core.threads,
Andi Kleen373565d2017-11-17 13:42:59 -08001432 process_synthesized_event,
1433 NULL);
1434 if (err < 0) {
1435 pr_err("Couldn't synthesize thread map.\n");
1436 return err;
1437 }
1438
Jiri Olsaf72f9012019-07-21 13:24:41 +02001439 err = perf_event__synthesize_cpu_map(&rec->tool, rec->evlist->core.cpus,
Andi Kleen373565d2017-11-17 13:42:59 -08001440 process_synthesized_event, NULL);
1441 if (err < 0) {
1442 pr_err("Couldn't synthesize cpu map.\n");
1443 return err;
1444 }
1445
Song Liue5416952019-03-11 22:30:41 -07001446 err = perf_event__synthesize_bpf_events(session, process_synthesized_event,
Song Liu7b612e22019-01-17 08:15:19 -08001447 machine, opts);
1448 if (err < 0)
1449 pr_warning("Couldn't synthesize bpf events.\n");
1450
Namhyung Kimab640692020-03-25 21:45:33 +09001451 err = perf_event__synthesize_cgroups(tool, process_synthesized_event,
1452 machine);
1453 if (err < 0)
1454 pr_warning("Couldn't synthesize cgroup events.\n");
1455
Stephane Eraniand99c22e2020-04-22 08:50:38 -07001456 if (rec->opts.nr_threads_synthesize > 1) {
1457 perf_set_multithreaded();
1458 f = process_locked_synthesized_event;
1459 }
1460
Jiri Olsa03617c22019-07-21 13:24:42 +02001461 err = __machine__synthesize_threads(machine, tool, &opts->target, rec->evlist->core.threads,
Stephane Eraniand99c22e2020-04-22 08:50:38 -07001462 f, opts->sample_address,
1463 rec->opts.nr_threads_synthesize);
1464
1465 if (rec->opts.nr_threads_synthesize > 1)
1466 perf_set_singlethreaded();
1467
Wang Nanc45c86e2016-02-26 09:32:07 +00001468out:
1469 return err;
1470}
1471
Arnaldo Carvalho de Melo899e5ff2020-04-27 17:56:37 -03001472static int record__process_signal_event(union perf_event *event __maybe_unused, void *data)
1473{
1474 struct record *rec = data;
1475 pthread_kill(rec->thread_id, SIGUSR2);
1476 return 0;
1477}
1478
Arnaldo Carvalho de Melo23cbb412020-04-28 14:58:29 -03001479static int record__setup_sb_evlist(struct record *rec)
1480{
1481 struct record_opts *opts = &rec->opts;
1482
1483 if (rec->sb_evlist != NULL) {
1484 /*
1485 * We get here if --switch-output-event populated the
1486 * sb_evlist, so associate a callback that will send a SIGUSR2
1487 * to the main thread.
1488 */
1489 evlist__set_cb(rec->sb_evlist, record__process_signal_event, rec);
1490 rec->thread_id = pthread_self();
1491 }
1492
1493 if (!opts->no_bpf_event) {
1494 if (rec->sb_evlist == NULL) {
1495 rec->sb_evlist = evlist__new();
1496
1497 if (rec->sb_evlist == NULL) {
1498 pr_err("Couldn't create side band evlist.\n.");
1499 return -1;
1500 }
1501 }
1502
1503 if (evlist__add_bpf_sb_event(rec->sb_evlist, &rec->session->header.env)) {
1504 pr_err("Couldn't ask for PERF_RECORD_BPF_EVENT side band events.\n.");
1505 return -1;
1506 }
1507 }
1508
1509 if (perf_evlist__start_sb_thread(rec->sb_evlist, &rec->opts.target)) {
1510 pr_debug("Couldn't start the BPF side band thread:\nBPF programs starting from now on won't be annotatable\n");
1511 opts->no_bpf_event = true;
1512 }
1513
1514 return 0;
1515}
1516
Arnaldo Carvalho de Melo8c6f45a2013-12-19 14:38:03 -03001517static int __cmd_record(struct record *rec, int argc, const char **argv)
Peter Zijlstra16c8a102009-05-05 17:50:27 +02001518{
David Ahern57706ab2013-11-06 11:41:34 -07001519 int err;
Namhyung Kim45604712014-05-12 09:47:24 +09001520 int status = 0;
Peter Zijlstra8b412662009-09-17 19:59:05 +02001521 unsigned long waking = 0;
Zhang, Yanmin46be6042010-03-18 11:36:04 -03001522 const bool forks = argc > 0;
Arnaldo Carvalho de Melo45694aa2011-11-28 08:30:20 -02001523 struct perf_tool *tool = &rec->tool;
Arnaldo Carvalho de Melob4006792013-12-19 14:43:45 -03001524 struct record_opts *opts = &rec->opts;
Jiri Olsa8ceb41d2017-01-23 22:07:59 +01001525 struct perf_data *data = &rec->data;
Arnaldo Carvalho de Melod20deb62011-11-25 08:19:45 -02001526 struct perf_session *session;
Arnaldo Carvalho de Melo6dcf45ef2014-08-13 11:33:59 -03001527 bool disabled = false, draining = false;
Namhyung Kim42aa2762015-01-29 17:06:48 +09001528 int fd;
Alexey Budankovd3c8c082019-03-18 20:41:02 +03001529 float ratio = 0;
Peter Zijlstrade9ac072009-04-08 15:01:31 +02001530
Namhyung Kim45604712014-05-12 09:47:24 +09001531 atexit(record__sig_exit);
Peter Zijlstraf5970552009-06-18 23:22:55 +02001532 signal(SIGCHLD, sig_handler);
1533 signal(SIGINT, sig_handler);
David Ahern804f7ac2013-05-06 12:24:23 -06001534 signal(SIGTERM, sig_handler);
Wang Nana0748652016-11-26 07:03:28 +00001535 signal(SIGSEGV, sigsegv_handler);
Wang Nanc0bdc1c2016-04-13 08:21:06 +00001536
Hari Bathinif3b36142017-03-08 02:11:43 +05301537 if (rec->opts.record_namespaces)
1538 tool->namespace_events = true;
1539
Namhyung Kim8fb4b672020-03-25 21:45:34 +09001540 if (rec->opts.record_cgroup) {
1541#ifdef HAVE_FILE_HANDLE
1542 tool->cgroup_events = true;
1543#else
1544 pr_err("cgroup tracking is not supported\n");
1545 return -1;
1546#endif
1547 }
1548
Jiri Olsadc0c6122017-01-09 10:51:58 +01001549 if (rec->opts.auxtrace_snapshot_mode || rec->switch_output.enabled) {
Adrian Hunter2dd6d8a2015-04-30 17:37:32 +03001550 signal(SIGUSR2, snapshot_sig_handler);
Wang Nan3c1cb7e2016-04-20 18:59:50 +00001551 if (rec->opts.auxtrace_snapshot_mode)
1552 trigger_on(&auxtrace_snapshot_trigger);
Jiri Olsadc0c6122017-01-09 10:51:58 +01001553 if (rec->switch_output.enabled)
Wang Nan3c1cb7e2016-04-20 18:59:50 +00001554 trigger_on(&switch_output_trigger);
Wang Nanc0bdc1c2016-04-13 08:21:06 +00001555 } else {
Adrian Hunter2dd6d8a2015-04-30 17:37:32 +03001556 signal(SIGUSR2, SIG_IGN);
Wang Nanc0bdc1c2016-04-13 08:21:06 +00001557 }
Peter Zijlstraf5970552009-06-18 23:22:55 +02001558
Jiri Olsa8ceb41d2017-01-23 22:07:59 +01001559 session = perf_session__new(data, false, tool);
Mamatha Inamdar6ef81c52019-08-22 12:50:49 +05301560 if (IS_ERR(session)) {
Adrien BAKffa91882014-04-18 11:00:43 +09001561 pr_err("Perf session creation failed.\n");
Mamatha Inamdar6ef81c52019-08-22 12:50:49 +05301562 return PTR_ERR(session);
Arnaldo Carvalho de Meloa9a70bb2009-11-17 01:18:11 -02001563 }
1564
Jiri Olsa8ceb41d2017-01-23 22:07:59 +01001565 fd = perf_data__fd(data);
Arnaldo Carvalho de Melod20deb62011-11-25 08:19:45 -02001566 rec->session = session;
1567
Alexey Budankov5d7f4112019-03-18 20:43:35 +03001568 if (zstd_init(&session->zstd_data, rec->opts.comp_level) < 0) {
1569 pr_err("Compression initialization failed.\n");
1570 return -1;
1571 }
Anand K Mistryda231332020-05-13 12:20:23 +10001572#ifdef HAVE_EVENTFD_SUPPORT
1573 done_fd = eventfd(0, EFD_NONBLOCK);
1574 if (done_fd < 0) {
1575 pr_err("Failed to create wakeup eventfd, error: %m\n");
1576 status = -1;
1577 goto out_delete_session;
1578 }
1579 err = evlist__add_pollfd(rec->evlist, done_fd);
1580 if (err < 0) {
1581 pr_err("Failed to add wakeup eventfd to poll list\n");
1582 status = err;
1583 goto out_delete_session;
1584 }
1585#endif // HAVE_EVENTFD_SUPPORT
Alexey Budankov5d7f4112019-03-18 20:43:35 +03001586
1587 session->header.env.comp_type = PERF_COMP_ZSTD;
1588 session->header.env.comp_level = rec->opts.comp_level;
1589
Adrian Huntereeb399b2019-10-04 11:31:21 +03001590 if (rec->opts.kcore &&
1591 !record__kcore_readable(&session->machines.host)) {
1592 pr_err("ERROR: kcore is not readable.\n");
1593 return -1;
1594 }
1595
Arnaldo Carvalho de Melo8c6f45a2013-12-19 14:38:03 -03001596 record__init_features(rec);
Stephane Eranian330aa672012-03-08 23:47:46 +01001597
Alexey Budankovcf790512018-10-09 17:36:24 +03001598 if (rec->opts.use_clockid && rec->opts.clockid_res_ns)
1599 session->header.env.clockid_res_ns = rec->opts.clockid_res_ns;
1600
Arnaldo Carvalho de Melod4db3f12009-12-27 21:36:57 -02001601 if (forks) {
Arnaldo Carvalho de Melo3e2be2d2014-01-03 15:03:26 -03001602 err = perf_evlist__prepare_workload(rec->evlist, &opts->target,
Jiri Olsa8ceb41d2017-01-23 22:07:59 +01001603 argv, data->is_pipe,
Arnaldo Carvalho de Melo735f7e02014-01-03 14:56:49 -03001604 workload_exec_failed_signal);
Arnaldo Carvalho de Melo35b9d882011-11-09 08:47:15 -02001605 if (err < 0) {
1606 pr_err("Couldn't run the workload!\n");
Namhyung Kim45604712014-05-12 09:47:24 +09001607 status = err;
Arnaldo Carvalho de Melo35b9d882011-11-09 08:47:15 -02001608 goto out_delete_session;
Jens Axboe0a5ac842009-08-12 11:18:01 +02001609 }
Peter Zijlstra856e9662009-12-16 17:55:55 +01001610 }
1611
Jiri Olsaad46e48c2018-03-02 17:13:54 +01001612 /*
1613 * If we have just single event and are sending data
1614 * through pipe, we need to force the ids allocation,
1615 * because we synthesize event name through the pipe
1616 * and need the id for that.
1617 */
Jiri Olsa6484d2f2019-07-21 13:24:28 +02001618 if (data->is_pipe && rec->evlist->core.nr_entries == 1)
Jiri Olsaad46e48c2018-03-02 17:13:54 +01001619 rec->opts.sample_id = true;
1620
Arnaldo Carvalho de Melo8c6f45a2013-12-19 14:38:03 -03001621 if (record__open(rec) != 0) {
David Ahern8d3eca22012-08-26 12:24:47 -06001622 err = -1;
Namhyung Kim45604712014-05-12 09:47:24 +09001623 goto out_child;
David Ahern8d3eca22012-08-26 12:24:47 -06001624 }
Jiri Olsaf6fa4372019-08-06 15:14:05 +02001625 session->header.env.comp_mmap_len = session->evlist->core.mmap_len;
Peter Zijlstrade9ac072009-04-08 15:01:31 +02001626
Adrian Huntereeb399b2019-10-04 11:31:21 +03001627 if (rec->opts.kcore) {
1628 err = record__kcore_copy(&session->machines.host, data);
1629 if (err) {
1630 pr_err("ERROR: Failed to copy kcore\n");
1631 goto out_child;
1632 }
1633 }
1634
Wang Nan8690a2a2016-02-22 09:10:32 +00001635 err = bpf__apply_obj_config();
1636 if (err) {
1637 char errbuf[BUFSIZ];
1638
1639 bpf__strerror_apply_obj_config(err, errbuf, sizeof(errbuf));
1640 pr_err("ERROR: Apply config to BPF failed: %s\n",
1641 errbuf);
1642 goto out_child;
1643 }
1644
Adrian Huntercca84822015-08-19 17:29:21 +03001645 /*
1646 * Normally perf_session__new would do this, but it doesn't have the
1647 * evlist.
1648 */
Arnaldo Carvalho de Melo8cedf3a2020-06-17 09:29:48 -03001649 if (rec->tool.ordered_events && !evlist__sample_id_all(rec->evlist)) {
Adrian Huntercca84822015-08-19 17:29:21 +03001650 pr_warning("WARNING: No sample_id_all support, falling back to unordered processing\n");
1651 rec->tool.ordered_events = false;
1652 }
1653
Arnaldo Carvalho de Melo3e2be2d2014-01-03 15:03:26 -03001654 if (!rec->evlist->nr_groups)
Namhyung Kima8bb5592013-01-22 18:09:31 +09001655 perf_header__clear_feat(&session->header, HEADER_GROUP_DESC);
1656
Jiri Olsa8ceb41d2017-01-23 22:07:59 +01001657 if (data->is_pipe) {
Namhyung Kim42aa2762015-01-29 17:06:48 +09001658 err = perf_header__write_pipe(fd);
Tom Zanussi529870e2010-04-01 23:59:16 -05001659 if (err < 0)
Namhyung Kim45604712014-05-12 09:47:24 +09001660 goto out_child;
Jiri Olsa563aecb2013-06-05 13:35:06 +02001661 } else {
Namhyung Kim42aa2762015-01-29 17:06:48 +09001662 err = perf_session__write_header(session, rec->evlist, fd, false);
Arnaldo Carvalho de Melod5eed902009-11-19 14:55:56 -02001663 if (err < 0)
Namhyung Kim45604712014-05-12 09:47:24 +09001664 goto out_child;
Arnaldo Carvalho de Melod5eed902009-11-19 14:55:56 -02001665 }
Peter Zijlstra7c6a1c62009-06-25 17:05:54 +02001666
Arnaldo Carvalho de Melob38d85e2020-04-24 12:24:51 -03001667 err = -1;
David Ahernd3665492012-02-06 15:27:52 -07001668 if (!rec->no_buildid
Robert Richtere20960c2011-12-07 10:02:55 +01001669 && !perf_header__has_feat(&session->header, HEADER_BUILD_ID)) {
David Ahernd3665492012-02-06 15:27:52 -07001670 pr_err("Couldn't generate buildids. "
Robert Richtere20960c2011-12-07 10:02:55 +01001671 "Use --no-buildid to profile anyway.\n");
Namhyung Kim45604712014-05-12 09:47:24 +09001672 goto out_child;
Robert Richtere20960c2011-12-07 10:02:55 +01001673 }
1674
Arnaldo Carvalho de Melo23cbb412020-04-28 14:58:29 -03001675 err = record__setup_sb_evlist(rec);
1676 if (err)
1677 goto out_child;
Song Liu657ee552019-03-11 22:30:50 -07001678
Wang Nan4ea648a2016-07-14 08:34:47 +00001679 err = record__synthesize(rec, false);
Wang Nanc45c86e2016-02-26 09:32:07 +00001680 if (err < 0)
Namhyung Kim45604712014-05-12 09:47:24 +09001681 goto out_child;
David Ahern8d3eca22012-08-26 12:24:47 -06001682
Arnaldo Carvalho de Melod20deb62011-11-25 08:19:45 -02001683 if (rec->realtime_prio) {
Peter Zijlstrade9ac072009-04-08 15:01:31 +02001684 struct sched_param param;
1685
Arnaldo Carvalho de Melod20deb62011-11-25 08:19:45 -02001686 param.sched_priority = rec->realtime_prio;
Peter Zijlstrade9ac072009-04-08 15:01:31 +02001687 if (sched_setscheduler(0, SCHED_FIFO, &param)) {
Arnaldo Carvalho de Melo6beba7a2009-10-21 17:34:06 -02001688 pr_err("Could not set realtime priority.\n");
David Ahern8d3eca22012-08-26 12:24:47 -06001689 err = -1;
Namhyung Kim45604712014-05-12 09:47:24 +09001690 goto out_child;
Peter Zijlstrade9ac072009-04-08 15:01:31 +02001691 }
1692 }
1693
Jiri Olsa774cb492012-11-12 18:34:01 +01001694 /*
1695 * When perf is starting the traced process, all the events
1696 * (apart from group members) have enable_on_exec=1 set,
1697 * so don't spoil it by prematurely enabling them.
1698 */
Andi Kleen6619a532014-01-11 13:38:27 -08001699 if (!target__none(&opts->target) && !opts->initial_delay)
Jiri Olsa1c87f162019-07-21 13:24:08 +02001700 evlist__enable(rec->evlist);
David Ahern764e16a32011-08-25 10:17:55 -06001701
Peter Zijlstra856e9662009-12-16 17:55:55 +01001702 /*
1703 * Let the child rip
1704 */
Namhyung Kime803cf92015-09-22 09:24:55 +09001705 if (forks) {
Jiri Olsa20a8a3c2018-03-07 16:50:04 +01001706 struct machine *machine = &session->machines.host;
Namhyung Kime5bed562015-09-30 10:45:24 +09001707 union perf_event *event;
Hari Bathinie907caf2017-03-08 02:11:51 +05301708 pid_t tgid;
Namhyung Kime5bed562015-09-30 10:45:24 +09001709
1710 event = malloc(sizeof(event->comm) + machine->id_hdr_size);
1711 if (event == NULL) {
1712 err = -ENOMEM;
1713 goto out_child;
1714 }
1715
Namhyung Kime803cf92015-09-22 09:24:55 +09001716 /*
1717 * Some H/W events are generated before COMM event
1718 * which is emitted during exec(), so perf script
1719 * cannot see a correct process name for those events.
1720 * Synthesize COMM event to prevent it.
1721 */
Hari Bathinie907caf2017-03-08 02:11:51 +05301722 tgid = perf_event__synthesize_comm(tool, event,
1723 rec->evlist->workload.pid,
1724 process_synthesized_event,
1725 machine);
1726 free(event);
1727
1728 if (tgid == -1)
1729 goto out_child;
1730
1731 event = malloc(sizeof(event->namespaces) +
1732 (NR_NAMESPACES * sizeof(struct perf_ns_link_info)) +
1733 machine->id_hdr_size);
1734 if (event == NULL) {
1735 err = -ENOMEM;
1736 goto out_child;
1737 }
1738
1739 /*
1740 * Synthesize NAMESPACES event for the command specified.
1741 */
1742 perf_event__synthesize_namespaces(tool, event,
1743 rec->evlist->workload.pid,
1744 tgid, process_synthesized_event,
1745 machine);
Namhyung Kime5bed562015-09-30 10:45:24 +09001746 free(event);
Namhyung Kime803cf92015-09-22 09:24:55 +09001747
Arnaldo Carvalho de Melo3e2be2d2014-01-03 15:03:26 -03001748 perf_evlist__start_workload(rec->evlist);
Namhyung Kime803cf92015-09-22 09:24:55 +09001749 }
Peter Zijlstra856e9662009-12-16 17:55:55 +01001750
Andi Kleen6619a532014-01-11 13:38:27 -08001751 if (opts->initial_delay) {
Arnaldo Carvalho de Melo0693e682016-08-08 15:05:46 -03001752 usleep(opts->initial_delay * USEC_PER_MSEC);
Jiri Olsa1c87f162019-07-21 13:24:08 +02001753 evlist__enable(rec->evlist);
Andi Kleen6619a532014-01-11 13:38:27 -08001754 }
1755
Wang Nan5f9cf592016-04-20 18:59:49 +00001756 trigger_ready(&auxtrace_snapshot_trigger);
Wang Nan3c1cb7e2016-04-20 18:59:50 +00001757 trigger_ready(&switch_output_trigger);
Wang Nana0748652016-11-26 07:03:28 +00001758 perf_hooks__invoke_record_start();
Peter Zijlstra649c48a2009-06-24 21:12:48 +02001759 for (;;) {
Yang Shi9f065192015-09-29 14:49:43 -07001760 unsigned long long hits = rec->samples;
Peter Zijlstrade9ac072009-04-08 15:01:31 +02001761
Wang Nan057374642016-07-14 08:34:43 +00001762 /*
1763 * rec->evlist->bkw_mmap_state is possible to be
1764 * BKW_MMAP_EMPTY here: when done == true and
1765 * hits != rec->samples in previous round.
1766 *
1767 * perf_evlist__toggle_bkw_mmap ensure we never
1768 * convert BKW_MMAP_EMPTY to BKW_MMAP_DATA_PENDING.
1769 */
1770 if (trigger_is_hit(&switch_output_trigger) || done || draining)
1771 perf_evlist__toggle_bkw_mmap(rec->evlist, BKW_MMAP_DATA_PENDING);
1772
Alexey Budankov470530b2019-03-18 20:40:26 +03001773 if (record__mmap_read_all(rec, false) < 0) {
Wang Nan5f9cf592016-04-20 18:59:49 +00001774 trigger_error(&auxtrace_snapshot_trigger);
Wang Nan3c1cb7e2016-04-20 18:59:50 +00001775 trigger_error(&switch_output_trigger);
David Ahern8d3eca22012-08-26 12:24:47 -06001776 err = -1;
Namhyung Kim45604712014-05-12 09:47:24 +09001777 goto out_child;
David Ahern8d3eca22012-08-26 12:24:47 -06001778 }
Peter Zijlstrade9ac072009-04-08 15:01:31 +02001779
Adrian Hunter2dd6d8a2015-04-30 17:37:32 +03001780 if (auxtrace_record__snapshot_started) {
1781 auxtrace_record__snapshot_started = 0;
Wang Nan5f9cf592016-04-20 18:59:49 +00001782 if (!trigger_is_error(&auxtrace_snapshot_trigger))
Alexander Shishkince7b0e42019-08-06 17:41:01 +03001783 record__read_auxtrace_snapshot(rec, false);
Wang Nan5f9cf592016-04-20 18:59:49 +00001784 if (trigger_is_error(&auxtrace_snapshot_trigger)) {
Adrian Hunter2dd6d8a2015-04-30 17:37:32 +03001785 pr_err("AUX area tracing snapshot failed\n");
1786 err = -1;
1787 goto out_child;
1788 }
1789 }
1790
Wang Nan3c1cb7e2016-04-20 18:59:50 +00001791 if (trigger_is_hit(&switch_output_trigger)) {
Wang Nan057374642016-07-14 08:34:43 +00001792 /*
1793 * If switch_output_trigger is hit, the data in
1794 * overwritable ring buffer should have been collected,
1795 * so bkw_mmap_state should be set to BKW_MMAP_EMPTY.
1796 *
1797 * If SIGUSR2 raise after or during record__mmap_read_all(),
1798 * record__mmap_read_all() didn't collect data from
1799 * overwritable ring buffer. Read again.
1800 */
1801 if (rec->evlist->bkw_mmap_state == BKW_MMAP_RUNNING)
1802 continue;
Wang Nan3c1cb7e2016-04-20 18:59:50 +00001803 trigger_ready(&switch_output_trigger);
1804
Wang Nan057374642016-07-14 08:34:43 +00001805 /*
1806 * Reenable events in overwrite ring buffer after
1807 * record__mmap_read_all(): we should have collected
1808 * data from it.
1809 */
1810 perf_evlist__toggle_bkw_mmap(rec->evlist, BKW_MMAP_RUNNING);
1811
Wang Nan3c1cb7e2016-04-20 18:59:50 +00001812 if (!quiet)
1813 fprintf(stderr, "[ perf record: dump data: Woken up %ld times ]\n",
1814 waking);
1815 waking = 0;
1816 fd = record__switch_output(rec, false);
1817 if (fd < 0) {
1818 pr_err("Failed to switch to new file\n");
1819 trigger_error(&switch_output_trigger);
1820 err = fd;
1821 goto out_child;
1822 }
Jiri Olsabfacbe32017-01-09 10:52:00 +01001823
1824 /* re-arm the alarm */
1825 if (rec->switch_output.time)
1826 alarm(rec->switch_output.time);
Wang Nan3c1cb7e2016-04-20 18:59:50 +00001827 }
1828
Arnaldo Carvalho de Melod20deb62011-11-25 08:19:45 -02001829 if (hits == rec->samples) {
Arnaldo Carvalho de Melo6dcf45ef2014-08-13 11:33:59 -03001830 if (done || draining)
Peter Zijlstra649c48a2009-06-24 21:12:48 +02001831 break;
Jiri Olsa80ab2982019-08-31 22:48:33 +02001832 err = evlist__poll(rec->evlist, -1);
Jiri Olsaa5151142014-06-02 13:44:23 -04001833 /*
1834 * Propagate error, only if there's any. Ignore positive
1835 * number of returned events and interrupt error.
1836 */
1837 if (err > 0 || (err < 0 && errno == EINTR))
Namhyung Kim45604712014-05-12 09:47:24 +09001838 err = 0;
Peter Zijlstra8b412662009-09-17 19:59:05 +02001839 waking++;
Arnaldo Carvalho de Melo6dcf45ef2014-08-13 11:33:59 -03001840
Jiri Olsaf4009e72019-08-16 16:00:45 +02001841 if (evlist__filter_pollfd(rec->evlist, POLLERR | POLLHUP) == 0)
Arnaldo Carvalho de Melo6dcf45ef2014-08-13 11:33:59 -03001842 draining = true;
Peter Zijlstra8b412662009-09-17 19:59:05 +02001843 }
1844
Jiri Olsa774cb492012-11-12 18:34:01 +01001845 /*
1846 * When perf is starting the traced process, at the end events
1847 * die with the process and we wait for that. Thus no need to
1848 * disable events in this case.
1849 */
Arnaldo Carvalho de Melo602ad872013-11-12 16:46:16 -03001850 if (done && !disabled && !target__none(&opts->target)) {
Wang Nan5f9cf592016-04-20 18:59:49 +00001851 trigger_off(&auxtrace_snapshot_trigger);
Jiri Olsae74676d2019-07-21 13:24:09 +02001852 evlist__disable(rec->evlist);
Jiri Olsa27119262012-11-12 18:34:02 +01001853 disabled = true;
1854 }
Peter Zijlstrade9ac072009-04-08 15:01:31 +02001855 }
Alexander Shishkince7b0e42019-08-06 17:41:01 +03001856
Wang Nan5f9cf592016-04-20 18:59:49 +00001857 trigger_off(&auxtrace_snapshot_trigger);
Wang Nan3c1cb7e2016-04-20 18:59:50 +00001858 trigger_off(&switch_output_trigger);
Peter Zijlstrade9ac072009-04-08 15:01:31 +02001859
Alexander Shishkince7b0e42019-08-06 17:41:01 +03001860 if (opts->auxtrace_snapshot_on_exit)
1861 record__auxtrace_snapshot_exit(rec);
1862
Arnaldo Carvalho de Melof33cbe72014-01-02 15:11:25 -03001863 if (forks && workload_exec_errno) {
Masami Hiramatsu35550da2014-08-14 02:22:43 +00001864 char msg[STRERR_BUFSIZE];
Arnaldo Carvalho de Meloc8b5f2c2016-07-06 11:56:20 -03001865 const char *emsg = str_error_r(workload_exec_errno, msg, sizeof(msg));
Arnaldo Carvalho de Melof33cbe72014-01-02 15:11:25 -03001866 pr_err("Workload failed: %s\n", emsg);
1867 err = -1;
Namhyung Kim45604712014-05-12 09:47:24 +09001868 goto out_child;
Arnaldo Carvalho de Melof33cbe72014-01-02 15:11:25 -03001869 }
1870
Namhyung Kime3d59112015-01-29 17:06:44 +09001871 if (!quiet)
Namhyung Kim45604712014-05-12 09:47:24 +09001872 fprintf(stderr, "[ perf record: Woken up %ld times to write data ]\n", waking);
Arnaldo Carvalho de Melob44308f2010-10-26 15:20:09 -02001873
Wang Nan4ea648a2016-07-14 08:34:47 +00001874 if (target__none(&rec->opts.target))
1875 record__synthesize_workload(rec, true);
1876
Namhyung Kim45604712014-05-12 09:47:24 +09001877out_child:
Alexey Budankov470530b2019-03-18 20:40:26 +03001878 record__mmap_read_all(rec, true);
Alexey Budankovd3d1af62018-11-06 12:04:58 +03001879 record__aio_mmap_read_sync(rec);
1880
Alexey Budankovd3c8c082019-03-18 20:41:02 +03001881 if (rec->session->bytes_transferred && rec->session->bytes_compressed) {
1882 ratio = (float)rec->session->bytes_transferred/(float)rec->session->bytes_compressed;
1883 session->header.env.comp_ratio = ratio + 0.5;
1884 }
1885
Namhyung Kim45604712014-05-12 09:47:24 +09001886 if (forks) {
1887 int exit_status;
Ingo Molnaraddc2782009-06-02 23:43:11 +02001888
Namhyung Kim45604712014-05-12 09:47:24 +09001889 if (!child_finished)
1890 kill(rec->evlist->workload.pid, SIGTERM);
1891
1892 wait(&exit_status);
1893
1894 if (err < 0)
1895 status = err;
1896 else if (WIFEXITED(exit_status))
1897 status = WEXITSTATUS(exit_status);
1898 else if (WIFSIGNALED(exit_status))
1899 signr = WTERMSIG(exit_status);
1900 } else
1901 status = err;
1902
Wang Nan4ea648a2016-07-14 08:34:47 +00001903 record__synthesize(rec, true);
Namhyung Kime3d59112015-01-29 17:06:44 +09001904 /* this will be recalculated during process_buildids() */
1905 rec->samples = 0;
1906
Wang Nanecfd7a92016-04-13 08:21:07 +00001907 if (!err) {
1908 if (!rec->timestamp_filename) {
1909 record__finish_output(rec);
1910 } else {
1911 fd = record__switch_output(rec, true);
1912 if (fd < 0) {
1913 status = fd;
1914 goto out_delete_session;
1915 }
1916 }
1917 }
Arnaldo Carvalho de Melo39d17da2010-07-29 14:08:55 -03001918
Wang Nana0748652016-11-26 07:03:28 +00001919 perf_hooks__invoke_record_end();
1920
Namhyung Kime3d59112015-01-29 17:06:44 +09001921 if (!err && !quiet) {
1922 char samples[128];
Wang Nanecfd7a92016-04-13 08:21:07 +00001923 const char *postfix = rec->timestamp_filename ?
1924 ".<timestamp>" : "";
Namhyung Kime3d59112015-01-29 17:06:44 +09001925
Adrian Hunteref149c22015-04-09 18:53:45 +03001926 if (rec->samples && !rec->opts.full_auxtrace)
Namhyung Kime3d59112015-01-29 17:06:44 +09001927 scnprintf(samples, sizeof(samples),
1928 " (%" PRIu64 " samples)", rec->samples);
1929 else
1930 samples[0] = '\0';
1931
Alexey Budankovd3c8c082019-03-18 20:41:02 +03001932 fprintf(stderr, "[ perf record: Captured and wrote %.3f MB %s%s%s",
Jiri Olsa8ceb41d2017-01-23 22:07:59 +01001933 perf_data__size(data) / 1024.0 / 1024.0,
Jiri Olsa2d4f2792019-02-21 10:41:30 +01001934 data->path, postfix, samples);
Alexey Budankovd3c8c082019-03-18 20:41:02 +03001935 if (ratio) {
1936 fprintf(stderr, ", compressed (original %.3f MB, ratio is %.3f)",
1937 rec->session->bytes_transferred / 1024.0 / 1024.0,
1938 ratio);
1939 }
1940 fprintf(stderr, " ]\n");
Namhyung Kime3d59112015-01-29 17:06:44 +09001941 }
1942
Arnaldo Carvalho de Melo39d17da2010-07-29 14:08:55 -03001943out_delete_session:
Anand K Mistryda231332020-05-13 12:20:23 +10001944#ifdef HAVE_EVENTFD_SUPPORT
1945 if (done_fd >= 0)
1946 close(done_fd);
1947#endif
Alexey Budankov5d7f4112019-03-18 20:43:35 +03001948 zstd_fini(&session->zstd_data);
Arnaldo Carvalho de Melo39d17da2010-07-29 14:08:55 -03001949 perf_session__delete(session);
Song Liu657ee552019-03-11 22:30:50 -07001950
1951 if (!opts->no_bpf_event)
Arnaldo Carvalho de Melobc477d792020-04-24 10:24:04 -03001952 perf_evlist__stop_sb_thread(rec->sb_evlist);
Namhyung Kim45604712014-05-12 09:47:24 +09001953 return status;
Peter Zijlstrade9ac072009-04-08 15:01:31 +02001954}
Ingo Molnar0e9b20b2009-05-26 09:17:18 +02001955
Arnaldo Carvalho de Melo0883e822016-04-15 16:37:17 -03001956static void callchain_debug(struct callchain_param *callchain)
Jiri Olsa09b0fd42013-10-26 16:25:33 +02001957{
Kan Liangaad2b212015-01-05 13:23:04 -05001958 static const char *str[CALLCHAIN_MAX] = { "NONE", "FP", "DWARF", "LBR" };
Jiri Olsaa601fdf2014-02-03 12:44:43 +01001959
Arnaldo Carvalho de Melo0883e822016-04-15 16:37:17 -03001960 pr_debug("callchain: type %s\n", str[callchain->record_mode]);
Jiri Olsa09b0fd42013-10-26 16:25:33 +02001961
Arnaldo Carvalho de Melo0883e822016-04-15 16:37:17 -03001962 if (callchain->record_mode == CALLCHAIN_DWARF)
Jiri Olsa09b0fd42013-10-26 16:25:33 +02001963 pr_debug("callchain: stack dump size %d\n",
Arnaldo Carvalho de Melo0883e822016-04-15 16:37:17 -03001964 callchain->dump_size);
1965}
1966
1967int record_opts__parse_callchain(struct record_opts *record,
1968 struct callchain_param *callchain,
1969 const char *arg, bool unset)
1970{
1971 int ret;
Arnaldo Carvalho de Melo0883e822016-04-15 16:37:17 -03001972 callchain->enabled = !unset;
1973
1974 /* --no-call-graph */
1975 if (unset) {
1976 callchain->record_mode = CALLCHAIN_NONE;
1977 pr_debug("callchain: disabled\n");
1978 return 0;
1979 }
1980
1981 ret = parse_callchain_record_opt(arg, callchain);
1982 if (!ret) {
1983 /* Enable data address sampling for DWARF unwind. */
1984 if (callchain->record_mode == CALLCHAIN_DWARF)
1985 record->sample_address = true;
1986 callchain_debug(callchain);
1987 }
1988
1989 return ret;
Jiri Olsa09b0fd42013-10-26 16:25:33 +02001990}
1991
Kan Liangc421e802015-07-29 05:42:12 -04001992int record_parse_callchain_opt(const struct option *opt,
Jiri Olsa09b0fd42013-10-26 16:25:33 +02001993 const char *arg,
1994 int unset)
1995{
Arnaldo Carvalho de Melo0883e822016-04-15 16:37:17 -03001996 return record_opts__parse_callchain(opt->value, &callchain_param, arg, unset);
Jiri Olsa26d33022012-08-07 15:20:47 +02001997}
1998
Kan Liangc421e802015-07-29 05:42:12 -04001999int record_callchain_opt(const struct option *opt,
Jiri Olsa09b0fd42013-10-26 16:25:33 +02002000 const char *arg __maybe_unused,
2001 int unset __maybe_unused)
2002{
Arnaldo Carvalho de Melo2ddd5c02016-04-18 12:09:08 -03002003 struct callchain_param *callchain = opt->value;
Kan Liangc421e802015-07-29 05:42:12 -04002004
Arnaldo Carvalho de Melo2ddd5c02016-04-18 12:09:08 -03002005 callchain->enabled = true;
Jiri Olsa09b0fd42013-10-26 16:25:33 +02002006
Arnaldo Carvalho de Melo2ddd5c02016-04-18 12:09:08 -03002007 if (callchain->record_mode == CALLCHAIN_NONE)
2008 callchain->record_mode = CALLCHAIN_FP;
Jiri Olsaeb853e82014-02-03 12:44:42 +01002009
Arnaldo Carvalho de Melo2ddd5c02016-04-18 12:09:08 -03002010 callchain_debug(callchain);
Jiri Olsa09b0fd42013-10-26 16:25:33 +02002011 return 0;
2012}
2013
Jiri Olsaeb853e82014-02-03 12:44:42 +01002014static int perf_record_config(const char *var, const char *value, void *cb)
2015{
Namhyung Kim7a29c082015-12-15 10:49:56 +09002016 struct record *rec = cb;
2017
2018 if (!strcmp(var, "record.build-id")) {
2019 if (!strcmp(value, "cache"))
2020 rec->no_buildid_cache = false;
2021 else if (!strcmp(value, "no-cache"))
2022 rec->no_buildid_cache = true;
2023 else if (!strcmp(value, "skip"))
2024 rec->no_buildid = true;
2025 else
2026 return -1;
2027 return 0;
2028 }
Yisheng Xiecff17202018-03-12 19:25:57 +08002029 if (!strcmp(var, "record.call-graph")) {
2030 var = "call-graph.record-mode";
2031 return perf_default_config(var, value, cb);
2032 }
Alexey Budankov93f20c02018-11-06 12:07:19 +03002033#ifdef HAVE_AIO_SUPPORT
2034 if (!strcmp(var, "record.aio")) {
2035 rec->opts.nr_cblocks = strtol(value, NULL, 0);
2036 if (!rec->opts.nr_cblocks)
2037 rec->opts.nr_cblocks = nr_cblocks_default;
2038 }
2039#endif
Jiri Olsaeb853e82014-02-03 12:44:42 +01002040
Yisheng Xiecff17202018-03-12 19:25:57 +08002041 return 0;
Jiri Olsaeb853e82014-02-03 12:44:42 +01002042}
2043
/* One entry of the clock name table: a clock name and its numeric clockid. */
struct clockid_map {
	const char *name;
	int clockid;
};

/* Build one table entry mapping the name @n to the clockid @c. */
#define CLOCKID_MAP(n, c)	\
	{ .name = n, .clockid = (c), }

/* Table terminator: an entry whose name is NULL. */
#define CLOCKID_END	{ .name = NULL, }


/*
 * Add the missing ones, we need to build on many distros...
 */
#ifndef CLOCK_MONOTONIC_RAW
#define CLOCK_MONOTONIC_RAW 4
#endif
#ifndef CLOCK_BOOTTIME
#define CLOCK_BOOTTIME 7
#endif
#ifndef CLOCK_TAI
#define CLOCK_TAI 11
#endif

/*
 * Clock names accepted by parse_clockid(), which compares them
 * case-insensitively and stops at the CLOCKID_END entry.
 */
static const struct clockid_map clockids[] = {
	/* available for all events, NMI safe */
	CLOCKID_MAP("monotonic", CLOCK_MONOTONIC),
	CLOCKID_MAP("monotonic_raw", CLOCK_MONOTONIC_RAW),

	/* available for some events */
	CLOCKID_MAP("realtime", CLOCK_REALTIME),
	CLOCKID_MAP("boottime", CLOCK_BOOTTIME),
	CLOCKID_MAP("tai", CLOCK_TAI),

	/* available for the lazy */
	CLOCKID_MAP("mono", CLOCK_MONOTONIC),
	CLOCKID_MAP("raw", CLOCK_MONOTONIC_RAW),
	CLOCKID_MAP("real", CLOCK_REALTIME),
	CLOCKID_MAP("boot", CLOCK_BOOTTIME),

	CLOCKID_END,
};
2086
Alexey Budankovcf790512018-10-09 17:36:24 +03002087static int get_clockid_res(clockid_t clk_id, u64 *res_ns)
2088{
2089 struct timespec res;
2090
2091 *res_ns = 0;
2092 if (!clock_getres(clk_id, &res))
2093 *res_ns = res.tv_nsec + res.tv_sec * NSEC_PER_SEC;
2094 else
2095 pr_warning("WARNING: Failed to determine specified clock resolution.\n");
2096
2097 return 0;
2098}
2099
Peter Zijlstra814c8c32015-03-31 00:19:31 +02002100static int parse_clockid(const struct option *opt, const char *str, int unset)
2101{
2102 struct record_opts *opts = (struct record_opts *)opt->value;
2103 const struct clockid_map *cm;
2104 const char *ostr = str;
2105
2106 if (unset) {
2107 opts->use_clockid = 0;
2108 return 0;
2109 }
2110
2111 /* no arg passed */
2112 if (!str)
2113 return 0;
2114
2115 /* no setting it twice */
2116 if (opts->use_clockid)
2117 return -1;
2118
2119 opts->use_clockid = true;
2120
2121 /* if its a number, we're done */
2122 if (sscanf(str, "%d", &opts->clockid) == 1)
Alexey Budankovcf790512018-10-09 17:36:24 +03002123 return get_clockid_res(opts->clockid, &opts->clockid_res_ns);
Peter Zijlstra814c8c32015-03-31 00:19:31 +02002124
2125 /* allow a "CLOCK_" prefix to the name */
2126 if (!strncasecmp(str, "CLOCK_", 6))
2127 str += 6;
2128
2129 for (cm = clockids; cm->name; cm++) {
2130 if (!strcasecmp(str, cm->name)) {
2131 opts->clockid = cm->clockid;
Alexey Budankovcf790512018-10-09 17:36:24 +03002132 return get_clockid_res(opts->clockid,
2133 &opts->clockid_res_ns);
Peter Zijlstra814c8c32015-03-31 00:19:31 +02002134 }
2135 }
2136
2137 opts->use_clockid = false;
2138 ui__warning("unknown clockid %s, check man page\n", ostr);
2139 return -1;
2140}
2141
Alexey Budankovf4fe11b2019-01-22 20:52:03 +03002142static int record__parse_affinity(const struct option *opt, const char *str, int unset)
2143{
2144 struct record_opts *opts = (struct record_opts *)opt->value;
2145
2146 if (unset || !str)
2147 return 0;
2148
2149 if (!strcasecmp(str, "node"))
2150 opts->affinity = PERF_AFFINITY_NODE;
2151 else if (!strcasecmp(str, "cpu"))
2152 opts->affinity = PERF_AFFINITY_CPU;
2153
2154 return 0;
2155}
2156
Jiwei Sun6d575812019-10-22 16:09:01 +08002157static int parse_output_max_size(const struct option *opt,
2158 const char *str, int unset)
2159{
2160 unsigned long *s = (unsigned long *)opt->value;
2161 static struct parse_tag tags_size[] = {
2162 { .tag = 'B', .mult = 1 },
2163 { .tag = 'K', .mult = 1 << 10 },
2164 { .tag = 'M', .mult = 1 << 20 },
2165 { .tag = 'G', .mult = 1 << 30 },
2166 { .tag = 0 },
2167 };
2168 unsigned long val;
2169
2170 if (unset) {
2171 *s = 0;
2172 return 0;
2173 }
2174
2175 val = parse_tag_value(str, tags_size);
2176 if (val != (unsigned long) -1) {
2177 *s = val;
2178 return 0;
2179 }
2180
2181 return -1;
2182}
2183
Adrian Huntere9db1312015-04-09 18:53:46 +03002184static int record__parse_mmap_pages(const struct option *opt,
2185 const char *str,
2186 int unset __maybe_unused)
2187{
2188 struct record_opts *opts = opt->value;
2189 char *s, *p;
2190 unsigned int mmap_pages;
2191 int ret;
2192
2193 if (!str)
2194 return -EINVAL;
2195
2196 s = strdup(str);
2197 if (!s)
2198 return -ENOMEM;
2199
2200 p = strchr(s, ',');
2201 if (p)
2202 *p = '\0';
2203
2204 if (*s) {
2205 ret = __perf_evlist__parse_mmap_pages(&mmap_pages, s);
2206 if (ret)
2207 goto out_free;
2208 opts->mmap_pages = mmap_pages;
2209 }
2210
2211 if (!p) {
2212 ret = 0;
2213 goto out_free;
2214 }
2215
2216 ret = __perf_evlist__parse_mmap_pages(&mmap_pages, p + 1);
2217 if (ret)
2218 goto out_free;
2219
2220 opts->auxtrace_mmap_pages = mmap_pages;
2221
2222out_free:
2223 free(s);
2224 return ret;
2225}
2226
Jiri Olsa0c582442017-01-09 10:51:59 +01002227static void switch_output_size_warn(struct record *rec)
2228{
Jiri Olsa9521b5f2019-07-28 12:45:35 +02002229 u64 wakeup_size = evlist__mmap_size(rec->opts.mmap_pages);
Jiri Olsa0c582442017-01-09 10:51:59 +01002230 struct switch_output *s = &rec->switch_output;
2231
2232 wakeup_size /= 2;
2233
2234 if (s->size < wakeup_size) {
2235 char buf[100];
2236
2237 unit_number__scnprintf(buf, sizeof(buf), wakeup_size);
2238 pr_warning("WARNING: switch-output data size lower than "
2239 "wakeup kernel buffer size (%s) "
2240 "expect bigger perf.data sizes\n", buf);
2241 }
2242}
2243
Jiri Olsacb4e1eb2017-01-09 10:51:57 +01002244static int switch_output_setup(struct record *rec)
2245{
2246 struct switch_output *s = &rec->switch_output;
Jiri Olsadc0c6122017-01-09 10:51:58 +01002247 static struct parse_tag tags_size[] = {
2248 { .tag = 'B', .mult = 1 },
2249 { .tag = 'K', .mult = 1 << 10 },
2250 { .tag = 'M', .mult = 1 << 20 },
2251 { .tag = 'G', .mult = 1 << 30 },
2252 { .tag = 0 },
2253 };
Jiri Olsabfacbe32017-01-09 10:52:00 +01002254 static struct parse_tag tags_time[] = {
2255 { .tag = 's', .mult = 1 },
2256 { .tag = 'm', .mult = 60 },
2257 { .tag = 'h', .mult = 60*60 },
2258 { .tag = 'd', .mult = 60*60*24 },
2259 { .tag = 0 },
2260 };
Jiri Olsadc0c6122017-01-09 10:51:58 +01002261 unsigned long val;
Jiri Olsacb4e1eb2017-01-09 10:51:57 +01002262
Arnaldo Carvalho de Melo899e5ff2020-04-27 17:56:37 -03002263 /*
2264 * If we're using --switch-output-events, then we imply its
2265 * --switch-output=signal, as we'll send a SIGUSR2 from the side band
2266 * thread to its parent.
2267 */
2268 if (rec->switch_output_event_set)
2269 goto do_signal;
2270
Jiri Olsacb4e1eb2017-01-09 10:51:57 +01002271 if (!s->set)
2272 return 0;
2273
2274 if (!strcmp(s->str, "signal")) {
Arnaldo Carvalho de Melo899e5ff2020-04-27 17:56:37 -03002275do_signal:
Jiri Olsacb4e1eb2017-01-09 10:51:57 +01002276 s->signal = true;
2277 pr_debug("switch-output with SIGUSR2 signal\n");
Jiri Olsadc0c6122017-01-09 10:51:58 +01002278 goto enabled;
2279 }
2280
2281 val = parse_tag_value(s->str, tags_size);
2282 if (val != (unsigned long) -1) {
2283 s->size = val;
2284 pr_debug("switch-output with %s size threshold\n", s->str);
2285 goto enabled;
Jiri Olsacb4e1eb2017-01-09 10:51:57 +01002286 }
2287
Jiri Olsabfacbe32017-01-09 10:52:00 +01002288 val = parse_tag_value(s->str, tags_time);
2289 if (val != (unsigned long) -1) {
2290 s->time = val;
2291 pr_debug("switch-output with %s time threshold (%lu seconds)\n",
2292 s->str, s->time);
2293 goto enabled;
2294 }
2295
Jiri Olsacb4e1eb2017-01-09 10:51:57 +01002296 return -1;
Jiri Olsadc0c6122017-01-09 10:51:58 +01002297
2298enabled:
2299 rec->timestamp_filename = true;
2300 s->enabled = true;
Jiri Olsa0c582442017-01-09 10:51:59 +01002301
2302 if (s->size && !rec->opts.no_buffering)
2303 switch_output_size_warn(rec);
2304
Jiri Olsadc0c6122017-01-09 10:51:58 +01002305 return 0;
Jiri Olsacb4e1eb2017-01-09 10:51:57 +01002306}
2307
/* NULL-terminated usage lines for 'perf record'. */
static const char * const __record_usage[] = {
	"perf record [<options>] [<command>]",
	"perf record [<options>] -- <command> [<options>]",
	NULL
};

/* Non-static alias of the usage table above. */
const char * const *record_usage = __record_usage;
Ingo Molnar0e9b20b2009-05-26 09:17:18 +02002314
Arnaldo Carvalho de Melo6e0a9b32019-11-14 12:15:34 -03002315static int build_id__process_mmap(struct perf_tool *tool, union perf_event *event,
2316 struct perf_sample *sample, struct machine *machine)
2317{
2318 /*
2319 * We already have the kernel maps, put in place via perf_session__create_kernel_maps()
2320 * no need to add them twice.
2321 */
2322 if (!(event->header.misc & PERF_RECORD_MISC_USER))
2323 return 0;
2324 return perf_event__process_mmap(tool, event, sample, machine);
2325}
2326
2327static int build_id__process_mmap2(struct perf_tool *tool, union perf_event *event,
2328 struct perf_sample *sample, struct machine *machine)
2329{
2330 /*
2331 * We already have the kernel maps, put in place via perf_session__create_kernel_maps()
2332 * no need to add them twice.
2333 */
2334 if (!(event->header.misc & PERF_RECORD_MISC_USER))
2335 return 0;
2336
2337 return perf_event__process_mmap2(tool, event, sample, machine);
2338}
2339
/*
 * XXX Ideally would be local to cmd_record() and passed to a record__new
 * because we need to have access to it in record__exit, that is called
 * after cmd_record() exits, but since record_options need to be accessible to
 * builtin-script, leave it here.
 *
 * At least we don't touch it in all the other functions here directly.
 *
 * Just say no to tons of global variables, sigh.
 */
Arnaldo Carvalho de Melo8c6f45a2013-12-19 14:38:03 -03002350static struct record record = {
Arnaldo Carvalho de Melod20deb62011-11-25 08:19:45 -02002351 .opts = {
Andi Kleen8affc2b2014-07-31 14:45:04 +08002352 .sample_time = true,
Arnaldo Carvalho de Melod20deb62011-11-25 08:19:45 -02002353 .mmap_pages = UINT_MAX,
2354 .user_freq = UINT_MAX,
2355 .user_interval = ULLONG_MAX,
Arnaldo Carvalho de Melo447a6012012-05-22 13:14:18 -03002356 .freq = 4000,
Namhyung Kimd1cb9fc2012-05-16 18:45:49 +09002357 .target = {
2358 .uses_mmap = true,
Adrian Hunter3aa59392013-11-15 15:52:29 +02002359 .default_per_cpu = true,
Namhyung Kimd1cb9fc2012-05-16 18:45:49 +09002360 },
Alexey Budankov470530b2019-03-18 20:40:26 +03002361 .mmap_flush = MMAP_FLUSH_DEFAULT,
Stephane Eraniand99c22e2020-04-22 08:50:38 -07002362 .nr_threads_synthesize = 1,
Arnaldo Carvalho de Melod20deb62011-11-25 08:19:45 -02002363 },
Namhyung Kime3d59112015-01-29 17:06:44 +09002364 .tool = {
2365 .sample = process_sample_event,
2366 .fork = perf_event__process_fork,
Adrian Huntercca84822015-08-19 17:29:21 +03002367 .exit = perf_event__process_exit,
Namhyung Kime3d59112015-01-29 17:06:44 +09002368 .comm = perf_event__process_comm,
Hari Bathinif3b36142017-03-08 02:11:43 +05302369 .namespaces = perf_event__process_namespaces,
Arnaldo Carvalho de Melo6e0a9b32019-11-14 12:15:34 -03002370 .mmap = build_id__process_mmap,
2371 .mmap2 = build_id__process_mmap2,
Adrian Huntercca84822015-08-19 17:29:21 +03002372 .ordered_events = true,
Namhyung Kime3d59112015-01-29 17:06:44 +09002373 },
Arnaldo Carvalho de Melod20deb62011-11-25 08:19:45 -02002374};
Frederic Weisbecker7865e812010-04-14 19:42:07 +02002375
Namhyung Kim76a26542015-10-22 23:28:32 +09002376const char record_callchain_help[] = CALLCHAIN_RECORD_HELP
2377 "\n\t\t\t\tDefault: fp";
Arnaldo Carvalho de Melo61eaa3b2012-10-01 15:20:58 -03002378
Wang Nan0aab2132016-06-16 08:02:41 +00002379static bool dry_run;
2380
Arnaldo Carvalho de Melod20deb62011-11-25 08:19:45 -02002381/*
2382 * XXX Will stay a global variable till we fix builtin-script.c to stop messing
2383 * with it and switch to use the library functions in perf_evlist that came
Arnaldo Carvalho de Melob4006792013-12-19 14:43:45 -03002384 * from builtin-record.c, i.e. use record_opts,
Arnaldo Carvalho de Melod20deb62011-11-25 08:19:45 -02002385 * perf_evlist__prepare_workload, etc instead of fork+exec'in 'perf record',
2386 * using pipes, etc.
2387 */
Jiri Olsaefd21302017-01-03 09:19:55 +01002388static struct option __record_options[] = {
Arnaldo Carvalho de Melod20deb62011-11-25 08:19:45 -02002389 OPT_CALLBACK('e', "event", &record.evlist, "event",
Thomas Gleixner86847b62009-06-06 12:24:17 +02002390 "event selector. use 'perf list' to list available events",
Jiri Olsaf120f9d2011-07-14 11:25:32 +02002391 parse_events_option),
Arnaldo Carvalho de Melod20deb62011-11-25 08:19:45 -02002392 OPT_CALLBACK(0, "filter", &record.evlist, "filter",
Li Zefanc171b552009-10-15 11:22:07 +08002393 "event filter", parse_filter),
Wang Nan4ba1faa2015-07-10 07:36:10 +00002394 OPT_CALLBACK_NOOPT(0, "exclude-perf", &record.evlist,
2395 NULL, "don't record events from perf itself",
2396 exclude_perf),
Namhyung Kimbea03402012-04-26 14:15:15 +09002397 OPT_STRING('p', "pid", &record.opts.target.pid, "pid",
Zhang, Yanmind6d901c2010-03-18 11:36:05 -03002398 "record events on existing process id"),
Namhyung Kimbea03402012-04-26 14:15:15 +09002399 OPT_STRING('t', "tid", &record.opts.target.tid, "tid",
Zhang, Yanmind6d901c2010-03-18 11:36:05 -03002400 "record events on existing thread id"),
Arnaldo Carvalho de Melod20deb62011-11-25 08:19:45 -02002401 OPT_INTEGER('r', "realtime", &record.realtime_prio,
Ingo Molnar0e9b20b2009-05-26 09:17:18 +02002402 "collect data with this RT SCHED_FIFO priority"),
Arnaldo Carvalho de Melo509051e2014-01-14 17:52:14 -03002403 OPT_BOOLEAN(0, "no-buffering", &record.opts.no_buffering,
Kirill Smelkovacac03f2011-01-12 17:59:36 +03002404 "collect data without buffering"),
Arnaldo Carvalho de Melod20deb62011-11-25 08:19:45 -02002405 OPT_BOOLEAN('R', "raw-samples", &record.opts.raw_samples,
Frederic Weisbeckerdaac07b2009-08-13 10:27:19 +02002406 "collect raw sample records from all opened counters"),
Namhyung Kimbea03402012-04-26 14:15:15 +09002407 OPT_BOOLEAN('a', "all-cpus", &record.opts.target.system_wide,
Ingo Molnar0e9b20b2009-05-26 09:17:18 +02002408 "system-wide collection from all CPUs"),
Namhyung Kimbea03402012-04-26 14:15:15 +09002409 OPT_STRING('C', "cpu", &record.opts.target.cpu_list, "cpu",
Stephane Eranianc45c6ea2010-05-28 12:00:01 +02002410 "list of cpus to monitor"),
Arnaldo Carvalho de Melod20deb62011-11-25 08:19:45 -02002411 OPT_U64('c', "count", &record.opts.user_interval, "event period to sample"),
Jiri Olsa2d4f2792019-02-21 10:41:30 +01002412 OPT_STRING('o', "output", &record.data.path, "file",
Ingo Molnarabaff322009-06-02 22:59:57 +02002413 "output file name"),
Adrian Hunter69e7e5b2013-11-18 11:55:57 +02002414 OPT_BOOLEAN_SET('i', "no-inherit", &record.opts.no_inherit,
2415 &record.opts.no_inherit_set,
2416 "child tasks do not inherit counters"),
Wang Nan4ea648a2016-07-14 08:34:47 +00002417 OPT_BOOLEAN(0, "tail-synthesize", &record.opts.tail_synthesize,
2418 "synthesize non-sample events at the end of output"),
Wang Nan626a6b72016-07-14 08:34:45 +00002419 OPT_BOOLEAN(0, "overwrite", &record.opts.overwrite, "use overwrite mode"),
Song Liu71184c62019-03-11 22:30:37 -07002420 OPT_BOOLEAN(0, "no-bpf-event", &record.opts.no_bpf_event, "record bpf events"),
Arnaldo Carvalho de Melob09c2362018-03-01 14:52:50 -03002421 OPT_BOOLEAN(0, "strict-freq", &record.opts.strict_freq,
2422 "Fail if the specified frequency can't be used"),
Arnaldo Carvalho de Melo67230472018-03-01 13:46:23 -03002423 OPT_CALLBACK('F', "freq", &record.opts, "freq or 'max'",
2424 "profile at this frequency",
2425 record__parse_freq),
Adrian Huntere9db1312015-04-09 18:53:46 +03002426 OPT_CALLBACK('m', "mmap-pages", &record.opts, "pages[,pages]",
2427 "number of mmap data pages and AUX area tracing mmap pages",
2428 record__parse_mmap_pages),
Alexey Budankov470530b2019-03-18 20:40:26 +03002429 OPT_CALLBACK(0, "mmap-flush", &record.opts, "number",
2430 "Minimal number of bytes that is extracted from mmap data pages (default: 1)",
2431 record__mmap_flush_parse),
Arnaldo Carvalho de Melod20deb62011-11-25 08:19:45 -02002432 OPT_BOOLEAN(0, "group", &record.opts.group,
Lin Ming43bece72011-08-17 18:42:07 +08002433 "put the counters into a counter group"),
Arnaldo Carvalho de Melo2ddd5c02016-04-18 12:09:08 -03002434 OPT_CALLBACK_NOOPT('g', NULL, &callchain_param,
Jiri Olsa09b0fd42013-10-26 16:25:33 +02002435 NULL, "enables call-graph recording" ,
2436 &record_callchain_opt),
2437 OPT_CALLBACK(0, "call-graph", &record.opts,
Namhyung Kim76a26542015-10-22 23:28:32 +09002438 "record_mode[,record_size]", record_callchain_help,
Jiri Olsa09b0fd42013-10-26 16:25:33 +02002439 &record_parse_callchain_opt),
Ian Munsiec0555642010-04-13 18:37:33 +10002440 OPT_INCR('v', "verbose", &verbose,
Ingo Molnar3da297a2009-06-07 17:39:02 +02002441 "be more verbose (show counter open errors, etc)"),
Arnaldo Carvalho de Melob44308f2010-10-26 15:20:09 -02002442 OPT_BOOLEAN('q', "quiet", &quiet, "don't print any message"),
Arnaldo Carvalho de Melod20deb62011-11-25 08:19:45 -02002443 OPT_BOOLEAN('s', "stat", &record.opts.inherit_stat,
Peter Zijlstra649c48a2009-06-24 21:12:48 +02002444 "per thread counts"),
Peter Zijlstra56100322015-06-10 16:48:50 +02002445 OPT_BOOLEAN('d', "data", &record.opts.sample_address, "Record the sample addresses"),
Kan Liang3b0a5da2017-08-29 13:11:08 -04002446 OPT_BOOLEAN(0, "phys-data", &record.opts.sample_phys_addr,
2447 "Record the sample physical addresses"),
Jiri Olsab6f35ed2016-08-01 20:02:35 +02002448 OPT_BOOLEAN(0, "sample-cpu", &record.opts.sample_cpu, "Record the sample cpu"),
Adrian Hunter3abebc52015-07-06 14:51:01 +03002449 OPT_BOOLEAN_SET('T', "timestamp", &record.opts.sample_time,
2450 &record.opts.sample_time_set,
2451 "Record the sample timestamps"),
Jiri Olsaf290aa12018-02-01 09:38:11 +01002452 OPT_BOOLEAN_SET('P', "period", &record.opts.period, &record.opts.period_set,
2453 "Record the sample period"),
Arnaldo Carvalho de Melod20deb62011-11-25 08:19:45 -02002454 OPT_BOOLEAN('n', "no-samples", &record.opts.no_samples,
Peter Zijlstra649c48a2009-06-24 21:12:48 +02002455 "don't sample"),
Wang Nand2db9a92016-01-25 09:56:19 +00002456 OPT_BOOLEAN_SET('N', "no-buildid-cache", &record.no_buildid_cache,
2457 &record.no_buildid_cache_set,
2458 "do not update the buildid cache"),
2459 OPT_BOOLEAN_SET('B', "no-buildid", &record.no_buildid,
2460 &record.no_buildid_set,
2461 "do not collect buildids in perf.data"),
Arnaldo Carvalho de Melod20deb62011-11-25 08:19:45 -02002462 OPT_CALLBACK('G', "cgroup", &record.evlist, "name",
Stephane Eranian023695d2011-02-14 11:20:01 +02002463 "monitor event in cgroup name only",
2464 parse_cgroups),
Arnaldo Carvalho de Meloa6205a32014-01-14 17:58:12 -03002465 OPT_UINTEGER('D', "delay", &record.opts.initial_delay,
Andi Kleen6619a532014-01-11 13:38:27 -08002466 "ms to wait before starting measurement after program start"),
Adrian Huntereeb399b2019-10-04 11:31:21 +03002467 OPT_BOOLEAN(0, "kcore", &record.opts.kcore, "copy /proc/kcore"),
Namhyung Kimbea03402012-04-26 14:15:15 +09002468 OPT_STRING('u', "uid", &record.opts.target.uid_str, "user",
2469 "user to profile"),
Stephane Eraniana5aabda2012-03-08 23:47:45 +01002470
2471 OPT_CALLBACK_NOOPT('b', "branch-any", &record.opts.branch_stack,
2472 "branch any", "sample any taken branches",
2473 parse_branch_stack),
2474
2475 OPT_CALLBACK('j', "branch-filter", &record.opts.branch_stack,
2476 "branch filter mask", "branch stack filter modes",
Roberto Agostino Vitillobdfebd82012-02-09 23:21:02 +01002477 parse_branch_stack),
Andi Kleen05484292013-01-24 16:10:29 +01002478 OPT_BOOLEAN('W', "weight", &record.opts.sample_weight,
2479 "sample by weight (on special events only)"),
Andi Kleen475eeab2013-09-20 07:40:43 -07002480 OPT_BOOLEAN(0, "transaction", &record.opts.sample_transaction,
2481 "sample transaction flags (special events only)"),
Adrian Hunter3aa59392013-11-15 15:52:29 +02002482 OPT_BOOLEAN(0, "per-thread", &record.opts.target.per_thread,
2483 "use per-thread mmaps"),
Stephane Eranianbcc84ec2015-08-31 18:41:12 +02002484 OPT_CALLBACK_OPTARG('I', "intr-regs", &record.opts.sample_intr_regs, NULL, "any register",
2485 "sample selected machine registers on interrupt,"
Kan Liangaeea9062019-05-14 13:19:32 -07002486 " use '-I?' to list register names", parse_intr_regs),
Andi Kleen84c41742017-09-05 10:00:28 -07002487 OPT_CALLBACK_OPTARG(0, "user-regs", &record.opts.sample_user_regs, NULL, "any register",
2488 "sample selected machine registers on interrupt,"
Kan Liangaeea9062019-05-14 13:19:32 -07002489 " use '--user-regs=?' to list register names", parse_user_regs),
Andi Kleen85c273d2015-02-24 15:13:40 -08002490 OPT_BOOLEAN(0, "running-time", &record.opts.running_time,
2491 "Record running/enabled time of read (:S) events"),
Peter Zijlstra814c8c32015-03-31 00:19:31 +02002492 OPT_CALLBACK('k', "clockid", &record.opts,
2493 "clockid", "clockid to use for events, see clock_gettime()",
2494 parse_clockid),
Adrian Hunter2dd6d8a2015-04-30 17:37:32 +03002495 OPT_STRING_OPTARG('S', "snapshot", &record.opts.auxtrace_snapshot_opts,
2496 "opts", "AUX area tracing Snapshot Mode", ""),
Adrian Hunterc0a6de02019-11-15 14:42:16 +02002497 OPT_STRING_OPTARG(0, "aux-sample", &record.opts.auxtrace_sample_opts,
2498 "opts", "sample AUX area", ""),
Mark Drayton3fcb10e2018-12-04 12:34:20 -08002499 OPT_UINTEGER(0, "proc-map-timeout", &proc_map_timeout,
Kan Liang9d9cad72015-06-17 09:51:11 -04002500 "per thread proc mmap processing timeout in ms"),
Hari Bathinif3b36142017-03-08 02:11:43 +05302501 OPT_BOOLEAN(0, "namespaces", &record.opts.record_namespaces,
2502 "Record namespaces events"),
Namhyung Kim8fb4b672020-03-25 21:45:34 +09002503 OPT_BOOLEAN(0, "all-cgroups", &record.opts.record_cgroup,
2504 "Record cgroup events"),
Adrian Hunter16b4b4e2020-05-28 15:08:58 +03002505 OPT_BOOLEAN_SET(0, "switch-events", &record.opts.record_switch_events,
2506 &record.opts.record_switch_events_set,
2507 "Record context switch events"),
Jiri Olsa85723882016-02-15 09:34:31 +01002508 OPT_BOOLEAN_FLAG(0, "all-kernel", &record.opts.all_kernel,
2509 "Configure all used events to run in kernel space.",
2510 PARSE_OPT_EXCLUSIVE),
2511 OPT_BOOLEAN_FLAG(0, "all-user", &record.opts.all_user,
2512 "Configure all used events to run in user space.",
2513 PARSE_OPT_EXCLUSIVE),
yuzhoujian53651b22019-05-30 14:29:22 +01002514 OPT_BOOLEAN(0, "kernel-callchains", &record.opts.kernel_callchains,
2515 "collect kernel callchains"),
2516 OPT_BOOLEAN(0, "user-callchains", &record.opts.user_callchains,
2517 "collect user callchains"),
Wang Nan71dc23262015-10-14 12:41:19 +00002518 OPT_STRING(0, "clang-path", &llvm_param.clang_path, "clang path",
2519 "clang binary to use for compiling BPF scriptlets"),
2520 OPT_STRING(0, "clang-opt", &llvm_param.clang_opt, "clang options",
2521 "options passed to clang when compiling BPF scriptlets"),
He Kuang7efe0e02015-12-14 10:39:23 +00002522 OPT_STRING(0, "vmlinux", &symbol_conf.vmlinux_name,
2523 "file", "vmlinux pathname"),
Namhyung Kim61566812016-01-11 22:37:09 +09002524 OPT_BOOLEAN(0, "buildid-all", &record.buildid_all,
2525 "Record build-id of all DSOs regardless of hits"),
Wang Nanecfd7a92016-04-13 08:21:07 +00002526 OPT_BOOLEAN(0, "timestamp-filename", &record.timestamp_filename,
2527 "append timestamp to output filename"),
Jin Yao68588ba2017-12-08 21:13:42 +08002528 OPT_BOOLEAN(0, "timestamp-boundary", &record.timestamp_boundary,
2529 "Record timestamp boundary (time of first/last samples)"),
Jiri Olsacb4e1eb2017-01-09 10:51:57 +01002530 OPT_STRING_OPTARG_SET(0, "switch-output", &record.switch_output.str,
Andi Kleenc38dab72019-03-14 15:49:56 -07002531 &record.switch_output.set, "signal or size[BKMG] or time[smhd]",
2532 "Switch output when receiving SIGUSR2 (signal) or cross a size or time threshold",
Jiri Olsadc0c6122017-01-09 10:51:58 +01002533 "signal"),
Arnaldo Carvalho de Melo899e5ff2020-04-27 17:56:37 -03002534 OPT_CALLBACK_SET(0, "switch-output-event", &record.sb_evlist, &record.switch_output_event_set, "switch output event",
2535 "switch output event selector. use 'perf list' to list available events",
2536 parse_events_option_new_evlist),
Andi Kleen03724b22019-03-14 15:49:55 -07002537 OPT_INTEGER(0, "switch-max-files", &record.switch_output.num_files,
2538 "Limit number of switch output generated files"),
Wang Nan0aab2132016-06-16 08:02:41 +00002539 OPT_BOOLEAN(0, "dry-run", &dry_run,
2540 "Parse options then exit"),
Alexey Budankovd3d1af62018-11-06 12:04:58 +03002541#ifdef HAVE_AIO_SUPPORT
Alexey Budankov93f20c02018-11-06 12:07:19 +03002542 OPT_CALLBACK_OPTARG(0, "aio", &record.opts,
2543 &nr_cblocks_default, "n", "Use <n> control blocks in asynchronous trace writing mode (default: 1, max: 4)",
Alexey Budankovd3d1af62018-11-06 12:04:58 +03002544 record__aio_parse),
2545#endif
Alexey Budankovf4fe11b2019-01-22 20:52:03 +03002546 OPT_CALLBACK(0, "affinity", &record.opts, "node|cpu",
2547 "Set affinity mask of trace reading thread to NUMA node cpu mask or cpu of processed mmap buffer",
2548 record__parse_affinity),
Alexey Budankov504c1ad2019-03-18 20:44:42 +03002549#ifdef HAVE_ZSTD_SUPPORT
2550 OPT_CALLBACK_OPTARG('z', "compression-level", &record.opts, &comp_level_default,
2551 "n", "Compressed records using specified level (default: 1 - fastest compression, 22 - greatest compression)",
2552 record__parse_comp_level),
2553#endif
Jiwei Sun6d575812019-10-22 16:09:01 +08002554 OPT_CALLBACK(0, "max-size", &record.output_max_size,
2555 "size", "Limit the maximum size of the output file", parse_output_max_size),
Stephane Eraniand99c22e2020-04-22 08:50:38 -07002556 OPT_UINTEGER(0, "num-thread-synthesize",
2557 &record.opts.nr_threads_synthesize,
2558 "number of threads to run for event synthesis"),
Stephane Eranian70943492020-05-05 11:29:43 -07002559#ifdef HAVE_LIBPFM
2560 OPT_CALLBACK(0, "pfm-events", &record.evlist, "event",
2561 "libpfm4 event selector. use 'perf list' to list available events",
2562 parse_libpfm_events_option),
2563#endif
Ingo Molnar0e9b20b2009-05-26 09:17:18 +02002564 OPT_END()
2565};
2566
Namhyung Kime5b2c202014-10-23 00:15:46 +09002567struct option *record_options = __record_options;
2568
Arnaldo Carvalho de Melob0ad8ea2017-03-27 11:47:20 -03002569int cmd_record(int argc, const char **argv)
Ingo Molnar0e9b20b2009-05-26 09:17:18 +02002570{
Adrian Hunteref149c22015-04-09 18:53:45 +03002571 int err;
Arnaldo Carvalho de Melo8c6f45a2013-12-19 14:38:03 -03002572 struct record *rec = &record;
Namhyung Kim16ad2ff2012-05-07 14:09:02 +09002573 char errbuf[BUFSIZ];
Ingo Molnar0e9b20b2009-05-26 09:17:18 +02002574
Arnaldo Carvalho de Melo67230472018-03-01 13:46:23 -03002575 setlocale(LC_ALL, "");
2576
Wang Nan48e1cab2015-12-14 10:39:22 +00002577#ifndef HAVE_LIBBPF_SUPPORT
2578# define set_nobuild(s, l, c) set_option_nobuild(record_options, s, l, "NO_LIBBPF=1", c)
2579 set_nobuild('\0', "clang-path", true);
2580 set_nobuild('\0', "clang-opt", true);
2581# undef set_nobuild
2582#endif
2583
He Kuang7efe0e02015-12-14 10:39:23 +00002584#ifndef HAVE_BPF_PROLOGUE
2585# if !defined (HAVE_DWARF_SUPPORT)
2586# define REASON "NO_DWARF=1"
2587# elif !defined (HAVE_LIBBPF_SUPPORT)
2588# define REASON "NO_LIBBPF=1"
2589# else
2590# define REASON "this architecture doesn't support BPF prologue"
2591# endif
2592# define set_nobuild(s, l, c) set_option_nobuild(record_options, s, l, REASON, c)
2593 set_nobuild('\0', "vmlinux", true);
2594# undef set_nobuild
2595# undef REASON
2596#endif
2597
Alexey Budankov9d2ed642019-01-22 20:47:43 +03002598 rec->opts.affinity = PERF_AFFINITY_SYS;
2599
Jiri Olsa0f98b112019-07-21 13:23:55 +02002600 rec->evlist = evlist__new();
Arnaldo Carvalho de Melo3e2be2d2014-01-03 15:03:26 -03002601 if (rec->evlist == NULL)
Arnaldo Carvalho de Melo361c99a2011-01-11 20:56:53 -02002602 return -ENOMEM;
2603
Arnaldo Carvalho de Meloecc4c562017-01-24 13:44:10 -03002604 err = perf_config(perf_record_config, rec);
2605 if (err)
2606 return err;
Jiri Olsaeb853e82014-02-03 12:44:42 +01002607
Tom Zanussibca647a2010-11-10 08:11:30 -06002608 argc = parse_options(argc, argv, record_options, record_usage,
Arnaldo Carvalho de Melo655000e2009-12-15 20:04:40 -02002609 PARSE_OPT_STOP_AT_NON_OPTION);
Namhyung Kim68ba3232017-02-17 17:17:42 +09002610 if (quiet)
2611 perf_quiet_option();
Jiri Olsa483635a2017-02-17 18:00:18 +01002612
2613 /* Make system wide (-a) the default target. */
Arnaldo Carvalho de Melo602ad872013-11-12 16:46:16 -03002614 if (!argc && target__none(&rec->opts.target))
Jiri Olsa483635a2017-02-17 18:00:18 +01002615 rec->opts.target.system_wide = true;
Ingo Molnar0e9b20b2009-05-26 09:17:18 +02002616
Namhyung Kimbea03402012-04-26 14:15:15 +09002617 if (nr_cgroups && !rec->opts.target.system_wide) {
Namhyung Kimc7118362015-10-25 00:49:27 +09002618 usage_with_options_msg(record_usage, record_options,
2619 "cgroup monitoring only available in system-wide mode");
2620
Stephane Eranian023695d2011-02-14 11:20:01 +02002621 }
Alexey Budankov504c1ad2019-03-18 20:44:42 +03002622
Adrian Huntereeb399b2019-10-04 11:31:21 +03002623 if (rec->opts.kcore)
2624 rec->data.is_dir = true;
2625
Alexey Budankov504c1ad2019-03-18 20:44:42 +03002626 if (rec->opts.comp_level != 0) {
2627 pr_debug("Compression enabled, disabling build id collection at the end of the session.\n");
2628 rec->no_buildid = true;
2629 }
2630
Adrian Hunterb757bb02015-07-21 12:44:04 +03002631 if (rec->opts.record_switch_events &&
2632 !perf_can_record_switch_events()) {
Namhyung Kimc7118362015-10-25 00:49:27 +09002633 ui__error("kernel does not support recording context switch events\n");
2634 parse_options_usage(record_usage, record_options, "switch-events", 0);
2635 return -EINVAL;
Adrian Hunterb757bb02015-07-21 12:44:04 +03002636 }
Stephane Eranian023695d2011-02-14 11:20:01 +02002637
Jiri Olsacb4e1eb2017-01-09 10:51:57 +01002638 if (switch_output_setup(rec)) {
2639 parse_options_usage(record_usage, record_options, "switch-output", 0);
2640 return -EINVAL;
2641 }
2642
Jiri Olsabfacbe32017-01-09 10:52:00 +01002643 if (rec->switch_output.time) {
2644 signal(SIGALRM, alarm_sig_handler);
2645 alarm(rec->switch_output.time);
2646 }
2647
Andi Kleen03724b22019-03-14 15:49:55 -07002648 if (rec->switch_output.num_files) {
2649 rec->switch_output.filenames = calloc(sizeof(char *),
2650 rec->switch_output.num_files);
2651 if (!rec->switch_output.filenames)
2652 return -EINVAL;
2653 }
2654
Adrian Hunter1b36c032016-09-23 17:38:39 +03002655 /*
2656 * Allow aliases to facilitate the lookup of symbols for address
2657 * filters. Refer to auxtrace_parse_filters().
2658 */
2659 symbol_conf.allow_aliases = true;
2660
2661 symbol__init(NULL);
2662
Alexey Budankov8384a262019-12-03 14:45:27 +03002663 if (rec->opts.affinity != PERF_AFFINITY_SYS) {
2664 rec->affinity_mask.nbits = cpu__max_cpu();
2665 rec->affinity_mask.bits = bitmap_alloc(rec->affinity_mask.nbits);
2666 if (!rec->affinity_mask.bits) {
2667 pr_err("Failed to allocate thread mask for %zd cpus\n", rec->affinity_mask.nbits);
2668 return -ENOMEM;
2669 }
2670 pr_debug2("thread mask[%zd]: empty\n", rec->affinity_mask.nbits);
2671 }
2672
Adrian Hunter4b5ea3b2018-03-06 11:13:12 +02002673 err = record__auxtrace_init(rec);
Adrian Hunter1b36c032016-09-23 17:38:39 +03002674 if (err)
2675 goto out;
2676
Wang Nan0aab2132016-06-16 08:02:41 +00002677 if (dry_run)
Adrian Hunter5c01ad602016-09-23 17:38:37 +03002678 goto out;
Wang Nan0aab2132016-06-16 08:02:41 +00002679
Wang Nand7888572016-04-08 15:07:24 +00002680 err = bpf__setup_stdout(rec->evlist);
2681 if (err) {
2682 bpf__strerror_setup_stdout(rec->evlist, err, errbuf, sizeof(errbuf));
2683 pr_err("ERROR: Setup BPF stdout failed: %s\n",
2684 errbuf);
Adrian Hunter5c01ad602016-09-23 17:38:37 +03002685 goto out;
Wang Nand7888572016-04-08 15:07:24 +00002686 }
2687
Adrian Hunteref149c22015-04-09 18:53:45 +03002688 err = -ENOMEM;
2689
Wang Nan0c1d46a2016-04-20 18:59:52 +00002690 if (rec->no_buildid_cache || rec->no_buildid) {
Stephane Eraniana1ac1d32010-06-17 11:39:01 +02002691 disable_buildid_cache();
Jiri Olsadc0c6122017-01-09 10:51:58 +01002692 } else if (rec->switch_output.enabled) {
Wang Nan0c1d46a2016-04-20 18:59:52 +00002693 /*
2694 * In 'perf record --switch-output', disable buildid
2695 * generation by default to reduce data file switching
2696 * overhead. Still generate buildid if they are required
2697 * explicitly using
2698 *
Jiri Olsa60437ac2017-01-03 09:19:56 +01002699 * perf record --switch-output --no-no-buildid \
Wang Nan0c1d46a2016-04-20 18:59:52 +00002700 * --no-no-buildid-cache
2701 *
2702 * Following code equals to:
2703 *
2704 * if ((rec->no_buildid || !rec->no_buildid_set) &&
2705 * (rec->no_buildid_cache || !rec->no_buildid_cache_set))
2706 * disable_buildid_cache();
2707 */
2708 bool disable = true;
2709
2710 if (rec->no_buildid_set && !rec->no_buildid)
2711 disable = false;
2712 if (rec->no_buildid_cache_set && !rec->no_buildid_cache)
2713 disable = false;
2714 if (disable) {
2715 rec->no_buildid = true;
2716 rec->no_buildid_cache = true;
2717 disable_buildid_cache();
2718 }
2719 }
Arnaldo Carvalho de Melo655000e2009-12-15 20:04:40 -02002720
Wang Nan4ea648a2016-07-14 08:34:47 +00002721 if (record.opts.overwrite)
2722 record.opts.tail_synthesize = true;
2723
Jiri Olsa6484d2f2019-07-21 13:24:28 +02002724 if (rec->evlist->core.nr_entries == 0 &&
Arnaldo Carvalho de Meloe251abe2020-06-17 09:16:20 -03002725 __evlist__add_default(rec->evlist, !record.opts.no_samples) < 0) {
Arnaldo Carvalho de Melo69aad6f2011-01-03 16:39:04 -02002726 pr_err("Not enough memory for event selector list\n");
Adrian Hunter394c01e2016-09-23 17:38:36 +03002727 goto out;
Peter Zijlstrabbd36e52009-06-11 23:11:50 +02002728 }
Ingo Molnar0e9b20b2009-05-26 09:17:18 +02002729
Adrian Hunter69e7e5b2013-11-18 11:55:57 +02002730 if (rec->opts.target.tid && !rec->opts.no_inherit_set)
2731 rec->opts.no_inherit = true;
2732
Arnaldo Carvalho de Melo602ad872013-11-12 16:46:16 -03002733 err = target__validate(&rec->opts.target);
Namhyung Kim16ad2ff2012-05-07 14:09:02 +09002734 if (err) {
Arnaldo Carvalho de Melo602ad872013-11-12 16:46:16 -03002735 target__strerror(&rec->opts.target, err, errbuf, BUFSIZ);
Jiri Olsac3dec272018-02-06 19:17:58 +01002736 ui__warning("%s\n", errbuf);
Namhyung Kim16ad2ff2012-05-07 14:09:02 +09002737 }
Namhyung Kim4bd0f2d2012-04-26 14:15:18 +09002738
Arnaldo Carvalho de Melo602ad872013-11-12 16:46:16 -03002739 err = target__parse_uid(&rec->opts.target);
Namhyung Kim16ad2ff2012-05-07 14:09:02 +09002740 if (err) {
2741 int saved_errno = errno;
2742
Arnaldo Carvalho de Melo602ad872013-11-12 16:46:16 -03002743 target__strerror(&rec->opts.target, err, errbuf, BUFSIZ);
Namhyung Kim3780f482012-05-29 13:22:57 +09002744 ui__error("%s", errbuf);
Namhyung Kim16ad2ff2012-05-07 14:09:02 +09002745
2746 err = -saved_errno;
Adrian Hunter394c01e2016-09-23 17:38:36 +03002747 goto out;
Namhyung Kim16ad2ff2012-05-07 14:09:02 +09002748 }
Arnaldo Carvalho de Melo0d37aa32012-01-19 14:08:15 -02002749
Mengting Zhangca800062017-12-13 15:01:53 +08002750 /* Enable ignoring missing threads when -u/-p option is defined. */
2751 rec->opts.ignore_missing_thread = rec->opts.target.uid != UINT_MAX || rec->opts.target.pid;
Jiri Olsa23dc4f12016-12-12 11:35:43 +01002752
Namhyung Kim16ad2ff2012-05-07 14:09:02 +09002753 err = -ENOMEM;
Arnaldo Carvalho de Melo3e2be2d2014-01-03 15:03:26 -03002754 if (perf_evlist__create_maps(rec->evlist, &rec->opts.target) < 0)
Arnaldo Carvalho de Melodd7927f2011-01-12 14:28:51 -02002755 usage_with_options(record_usage, record_options);
Arnaldo Carvalho de Melo69aad6f2011-01-03 16:39:04 -02002756
Adrian Hunteref149c22015-04-09 18:53:45 +03002757 err = auxtrace_record__options(rec->itr, rec->evlist, &rec->opts);
2758 if (err)
Adrian Hunter394c01e2016-09-23 17:38:36 +03002759 goto out;
Adrian Hunteref149c22015-04-09 18:53:45 +03002760
Namhyung Kim61566812016-01-11 22:37:09 +09002761 /*
2762 * We take all buildids when the file contains
2763 * AUX area tracing data because we do not decode the
2764 * trace because it would take too long.
2765 */
2766 if (rec->opts.full_auxtrace)
2767 rec->buildid_all = true;
2768
Arnaldo Carvalho de Melob4006792013-12-19 14:43:45 -03002769 if (record_opts__config(&rec->opts)) {
Arnaldo Carvalho de Melo39d17da2010-07-29 14:08:55 -03002770 err = -EINVAL;
Adrian Hunter394c01e2016-09-23 17:38:36 +03002771 goto out;
Mike Galbraith7e4ff9e2009-10-12 07:56:03 +02002772 }
2773
Alexey Budankov93f20c02018-11-06 12:07:19 +03002774 if (rec->opts.nr_cblocks > nr_cblocks_max)
2775 rec->opts.nr_cblocks = nr_cblocks_max;
Alexey Budankov5d7f4112019-03-18 20:43:35 +03002776 pr_debug("nr_cblocks: %d\n", rec->opts.nr_cblocks);
Alexey Budankovd3d1af62018-11-06 12:04:58 +03002777
Alexey Budankov9d2ed642019-01-22 20:47:43 +03002778 pr_debug("affinity: %s\n", affinity_tags[rec->opts.affinity]);
Alexey Budankov470530b2019-03-18 20:40:26 +03002779 pr_debug("mmap flush: %d\n", rec->opts.mmap_flush);
Alexey Budankov9d2ed642019-01-22 20:47:43 +03002780
Alexey Budankov51255a82019-03-18 20:42:19 +03002781 if (rec->opts.comp_level > comp_level_max)
2782 rec->opts.comp_level = comp_level_max;
2783 pr_debug("comp level: %d\n", rec->opts.comp_level);
2784
Arnaldo Carvalho de Melod20deb62011-11-25 08:19:45 -02002785 err = __cmd_record(&record, argc, argv);
Adrian Hunter394c01e2016-09-23 17:38:36 +03002786out:
Alexey Budankov8384a262019-12-03 14:45:27 +03002787 bitmap_free(rec->affinity_mask.bits);
Jiri Olsac12995a2019-07-21 13:23:56 +02002788 evlist__delete(rec->evlist);
Arnaldo Carvalho de Melod65a4582010-07-30 18:31:28 -03002789 symbol__exit();
Adrian Hunteref149c22015-04-09 18:53:45 +03002790 auxtrace_record__free(rec->itr);
Arnaldo Carvalho de Melo39d17da2010-07-29 14:08:55 -03002791 return err;
Ingo Molnar0e9b20b2009-05-26 09:17:18 +02002792}
Adrian Hunter2dd6d8a2015-04-30 17:37:32 +03002793
2794static void snapshot_sig_handler(int sig __maybe_unused)
2795{
Jiri Olsadc0c6122017-01-09 10:51:58 +01002796 struct record *rec = &record;
2797
Wang Nan5f9cf592016-04-20 18:59:49 +00002798 if (trigger_is_ready(&auxtrace_snapshot_trigger)) {
2799 trigger_hit(&auxtrace_snapshot_trigger);
2800 auxtrace_record__snapshot_started = 1;
2801 if (auxtrace_record__snapshot_start(record.itr))
2802 trigger_error(&auxtrace_snapshot_trigger);
2803 }
Wang Nan3c1cb7e2016-04-20 18:59:50 +00002804
Jiri Olsadc0c6122017-01-09 10:51:58 +01002805 if (switch_output_signal(rec))
Wang Nan3c1cb7e2016-04-20 18:59:50 +00002806 trigger_hit(&switch_output_trigger);
Adrian Hunter2dd6d8a2015-04-30 17:37:32 +03002807}
Jiri Olsabfacbe32017-01-09 10:52:00 +01002808
2809static void alarm_sig_handler(int sig __maybe_unused)
2810{
2811 struct record *rec = &record;
2812
2813 if (switch_output_time(rec))
2814 trigger_hit(&switch_output_trigger);
2815}