Merge branch 'locking-urgent-for-linus' of git://git.kernel.org/pub/scm/linux/kernel...
[cris-mirror.git] / tools / perf / util / jitdump.c
bloba1863000e972dbca938ed0003fb3632bf25e35c0
1 // SPDX-License-Identifier: GPL-2.0
2 #include <sys/sysmacros.h>
3 #include <sys/types.h>
4 #include <errno.h>
5 #include <stdio.h>
6 #include <stdlib.h>
7 #include <string.h>
8 #include <fcntl.h>
9 #include <unistd.h>
10 #include <inttypes.h>
11 #include <byteswap.h>
12 #include <sys/stat.h>
13 #include <sys/mman.h>
14 #include <linux/stringify.h>
16 #include "util.h"
17 #include "event.h"
18 #include "debug.h"
19 #include "evlist.h"
20 #include "symbol.h"
21 #include <elf.h>
23 #include "tsc.h"
24 #include "session.h"
25 #include "jit.h"
26 #include "jitdump.h"
27 #include "genelf.h"
28 #include "../builtin.h"
30 #include "sane_ctype.h"
32 struct jit_buf_desc {
33 struct perf_data *output;
34 struct perf_session *session;
35 struct machine *machine;
36 union jr_entry *entry;
37 void *buf;
38 uint64_t sample_type;
39 size_t bufsize;
40 FILE *in;
41 bool needs_bswap; /* handles cross-endianess */
42 bool use_arch_timestamp;
43 void *debug_data;
44 void *unwinding_data;
45 uint64_t unwinding_size;
46 uint64_t unwinding_mapped_size;
47 uint64_t eh_frame_hdr_size;
48 size_t nr_debug_entries;
49 uint32_t code_load_count;
50 u64 bytes_written;
51 struct rb_root code_root;
52 char dir[PATH_MAX];
55 struct debug_line_info {
56 unsigned long vma;
57 unsigned int lineno;
58 /* The filename format is unspecified, absolute path, relative etc. */
59 char const filename[0];
62 struct jit_tool {
63 struct perf_tool tool;
64 struct perf_data output;
65 struct perf_data input;
66 u64 bytes_written;
69 #define hmax(a, b) ((a) > (b) ? (a) : (b))
70 #define get_jit_tool(t) (container_of(tool, struct jit_tool, tool))
72 static int
73 jit_emit_elf(char *filename,
74 const char *sym,
75 uint64_t code_addr,
76 const void *code,
77 int csize,
78 void *debug,
79 int nr_debug_entries,
80 void *unwinding,
81 uint32_t unwinding_header_size,
82 uint32_t unwinding_size)
84 int ret, fd;
86 if (verbose > 0)
87 fprintf(stderr, "write ELF image %s\n", filename);
89 fd = open(filename, O_CREAT|O_TRUNC|O_WRONLY, 0644);
90 if (fd == -1) {
91 pr_warning("cannot create jit ELF %s: %s\n", filename, strerror(errno));
92 return -1;
95 ret = jit_write_elf(fd, code_addr, sym, (const void *)code, csize, debug, nr_debug_entries,
96 unwinding, unwinding_header_size, unwinding_size);
98 close(fd);
100 if (ret)
101 unlink(filename);
103 return ret;
106 static void
107 jit_close(struct jit_buf_desc *jd)
109 if (!(jd && jd->in))
110 return;
111 funlockfile(jd->in);
112 fclose(jd->in);
113 jd->in = NULL;
116 static int
117 jit_validate_events(struct perf_session *session)
119 struct perf_evsel *evsel;
122 * check that all events use CLOCK_MONOTONIC
124 evlist__for_each_entry(session->evlist, evsel) {
125 if (evsel->attr.use_clockid == 0 || evsel->attr.clockid != CLOCK_MONOTONIC)
126 return -1;
128 return 0;
131 static int
132 jit_open(struct jit_buf_desc *jd, const char *name)
134 struct jitheader header;
135 struct jr_prefix *prefix;
136 ssize_t bs, bsz = 0;
137 void *n, *buf = NULL;
138 int ret, retval = -1;
140 jd->in = fopen(name, "r");
141 if (!jd->in)
142 return -1;
144 bsz = hmax(sizeof(header), sizeof(*prefix));
146 buf = malloc(bsz);
147 if (!buf)
148 goto error;
151 * protect from writer modifying the file while we are reading it
153 flockfile(jd->in);
155 ret = fread(buf, sizeof(header), 1, jd->in);
156 if (ret != 1)
157 goto error;
159 memcpy(&header, buf, sizeof(header));
161 if (header.magic != JITHEADER_MAGIC) {
162 if (header.magic != JITHEADER_MAGIC_SW)
163 goto error;
164 jd->needs_bswap = true;
167 if (jd->needs_bswap) {
168 header.version = bswap_32(header.version);
169 header.total_size = bswap_32(header.total_size);
170 header.pid = bswap_32(header.pid);
171 header.elf_mach = bswap_32(header.elf_mach);
172 header.timestamp = bswap_64(header.timestamp);
173 header.flags = bswap_64(header.flags);
176 jd->use_arch_timestamp = header.flags & JITDUMP_FLAGS_ARCH_TIMESTAMP;
178 if (verbose > 2)
179 pr_debug("version=%u\nhdr.size=%u\nts=0x%llx\npid=%d\nelf_mach=%d\nuse_arch_timestamp=%d\n",
180 header.version,
181 header.total_size,
182 (unsigned long long)header.timestamp,
183 header.pid,
184 header.elf_mach,
185 jd->use_arch_timestamp);
187 if (header.version > JITHEADER_VERSION) {
188 pr_err("wrong jitdump version %u, expected " __stringify(JITHEADER_VERSION),
189 header.version);
190 goto error;
193 if (header.flags & JITDUMP_FLAGS_RESERVED) {
194 pr_err("jitdump file contains invalid or unsupported flags 0x%llx\n",
195 (unsigned long long)header.flags & JITDUMP_FLAGS_RESERVED);
196 goto error;
199 if (jd->use_arch_timestamp && !jd->session->time_conv.time_mult) {
200 pr_err("jitdump file uses arch timestamps but there is no timestamp conversion\n");
201 goto error;
205 * validate event is using the correct clockid
207 if (!jd->use_arch_timestamp && jit_validate_events(jd->session)) {
208 pr_err("error, jitted code must be sampled with perf record -k 1\n");
209 goto error;
212 bs = header.total_size - sizeof(header);
214 if (bs > bsz) {
215 n = realloc(buf, bs);
216 if (!n)
217 goto error;
218 bsz = bs;
219 buf = n;
220 /* read extra we do not know about */
221 ret = fread(buf, bs - bsz, 1, jd->in);
222 if (ret != 1)
223 goto error;
226 * keep dirname for generating files and mmap records
228 strcpy(jd->dir, name);
229 dirname(jd->dir);
231 return 0;
232 error:
233 funlockfile(jd->in);
234 fclose(jd->in);
235 return retval;
238 static union jr_entry *
239 jit_get_next_entry(struct jit_buf_desc *jd)
241 struct jr_prefix *prefix;
242 union jr_entry *jr;
243 void *addr;
244 size_t bs, size;
245 int id, ret;
247 if (!(jd && jd->in))
248 return NULL;
250 if (jd->buf == NULL) {
251 size_t sz = getpagesize();
252 if (sz < sizeof(*prefix))
253 sz = sizeof(*prefix);
255 jd->buf = malloc(sz);
256 if (jd->buf == NULL)
257 return NULL;
259 jd->bufsize = sz;
262 prefix = jd->buf;
265 * file is still locked at this point
267 ret = fread(prefix, sizeof(*prefix), 1, jd->in);
268 if (ret != 1)
269 return NULL;
271 if (jd->needs_bswap) {
272 prefix->id = bswap_32(prefix->id);
273 prefix->total_size = bswap_32(prefix->total_size);
274 prefix->timestamp = bswap_64(prefix->timestamp);
276 id = prefix->id;
277 size = prefix->total_size;
279 bs = (size_t)size;
280 if (bs < sizeof(*prefix))
281 return NULL;
283 if (id >= JIT_CODE_MAX) {
284 pr_warning("next_entry: unknown record type %d, skipping\n", id);
286 if (bs > jd->bufsize) {
287 void *n;
288 n = realloc(jd->buf, bs);
289 if (!n)
290 return NULL;
291 jd->buf = n;
292 jd->bufsize = bs;
295 addr = ((void *)jd->buf) + sizeof(*prefix);
297 ret = fread(addr, bs - sizeof(*prefix), 1, jd->in);
298 if (ret != 1)
299 return NULL;
301 jr = (union jr_entry *)jd->buf;
303 switch(id) {
304 case JIT_CODE_DEBUG_INFO:
305 if (jd->needs_bswap) {
306 uint64_t n;
307 jr->info.code_addr = bswap_64(jr->info.code_addr);
308 jr->info.nr_entry = bswap_64(jr->info.nr_entry);
309 for (n = 0 ; n < jr->info.nr_entry; n++) {
310 jr->info.entries[n].addr = bswap_64(jr->info.entries[n].addr);
311 jr->info.entries[n].lineno = bswap_32(jr->info.entries[n].lineno);
312 jr->info.entries[n].discrim = bswap_32(jr->info.entries[n].discrim);
315 break;
316 case JIT_CODE_UNWINDING_INFO:
317 if (jd->needs_bswap) {
318 jr->unwinding.unwinding_size = bswap_64(jr->unwinding.unwinding_size);
319 jr->unwinding.eh_frame_hdr_size = bswap_64(jr->unwinding.eh_frame_hdr_size);
320 jr->unwinding.mapped_size = bswap_64(jr->unwinding.mapped_size);
322 break;
323 case JIT_CODE_CLOSE:
324 break;
325 case JIT_CODE_LOAD:
326 if (jd->needs_bswap) {
327 jr->load.pid = bswap_32(jr->load.pid);
328 jr->load.tid = bswap_32(jr->load.tid);
329 jr->load.vma = bswap_64(jr->load.vma);
330 jr->load.code_addr = bswap_64(jr->load.code_addr);
331 jr->load.code_size = bswap_64(jr->load.code_size);
332 jr->load.code_index= bswap_64(jr->load.code_index);
334 jd->code_load_count++;
335 break;
336 case JIT_CODE_MOVE:
337 if (jd->needs_bswap) {
338 jr->move.pid = bswap_32(jr->move.pid);
339 jr->move.tid = bswap_32(jr->move.tid);
340 jr->move.vma = bswap_64(jr->move.vma);
341 jr->move.old_code_addr = bswap_64(jr->move.old_code_addr);
342 jr->move.new_code_addr = bswap_64(jr->move.new_code_addr);
343 jr->move.code_size = bswap_64(jr->move.code_size);
344 jr->move.code_index = bswap_64(jr->move.code_index);
346 break;
347 case JIT_CODE_MAX:
348 default:
349 /* skip unknown record (we have read them) */
350 break;
352 return jr;
355 static int
356 jit_inject_event(struct jit_buf_desc *jd, union perf_event *event)
358 ssize_t size;
360 size = perf_data__write(jd->output, event, event->header.size);
361 if (size < 0)
362 return -1;
364 jd->bytes_written += size;
365 return 0;
368 static uint64_t convert_timestamp(struct jit_buf_desc *jd, uint64_t timestamp)
370 struct perf_tsc_conversion tc;
372 if (!jd->use_arch_timestamp)
373 return timestamp;
375 tc.time_shift = jd->session->time_conv.time_shift;
376 tc.time_mult = jd->session->time_conv.time_mult;
377 tc.time_zero = jd->session->time_conv.time_zero;
379 if (!tc.time_mult)
380 return 0;
382 return tsc_to_perf_time(timestamp, &tc);
385 static int jit_repipe_code_load(struct jit_buf_desc *jd, union jr_entry *jr)
387 struct perf_sample sample;
388 union perf_event *event;
389 struct perf_tool *tool = jd->session->tool;
390 uint64_t code, addr;
391 uintptr_t uaddr;
392 char *filename;
393 struct stat st;
394 size_t size;
395 u16 idr_size;
396 const char *sym;
397 uint32_t count;
398 int ret, csize, usize;
399 pid_t pid, tid;
400 struct {
401 u32 pid, tid;
402 u64 time;
403 } *id;
405 pid = jr->load.pid;
406 tid = jr->load.tid;
407 csize = jr->load.code_size;
408 usize = jd->unwinding_mapped_size;
409 addr = jr->load.code_addr;
410 sym = (void *)((unsigned long)jr + sizeof(jr->load));
411 code = (unsigned long)jr + jr->load.p.total_size - csize;
412 count = jr->load.code_index;
413 idr_size = jd->machine->id_hdr_size;
415 event = calloc(1, sizeof(*event) + idr_size);
416 if (!event)
417 return -1;
419 filename = event->mmap2.filename;
420 size = snprintf(filename, PATH_MAX, "%s/jitted-%d-%u.so",
421 jd->dir,
422 pid,
423 count);
425 size++; /* for \0 */
427 size = PERF_ALIGN(size, sizeof(u64));
428 uaddr = (uintptr_t)code;
429 ret = jit_emit_elf(filename, sym, addr, (const void *)uaddr, csize, jd->debug_data, jd->nr_debug_entries,
430 jd->unwinding_data, jd->eh_frame_hdr_size, jd->unwinding_size);
432 if (jd->debug_data && jd->nr_debug_entries) {
433 free(jd->debug_data);
434 jd->debug_data = NULL;
435 jd->nr_debug_entries = 0;
438 if (jd->unwinding_data && jd->eh_frame_hdr_size) {
439 free(jd->unwinding_data);
440 jd->unwinding_data = NULL;
441 jd->eh_frame_hdr_size = 0;
442 jd->unwinding_mapped_size = 0;
443 jd->unwinding_size = 0;
446 if (ret) {
447 free(event);
448 return -1;
450 if (stat(filename, &st))
451 memset(&st, 0, sizeof(st));
453 event->mmap2.header.type = PERF_RECORD_MMAP2;
454 event->mmap2.header.misc = PERF_RECORD_MISC_USER;
455 event->mmap2.header.size = (sizeof(event->mmap2) -
456 (sizeof(event->mmap2.filename) - size) + idr_size);
458 event->mmap2.pgoff = GEN_ELF_TEXT_OFFSET;
459 event->mmap2.start = addr;
460 event->mmap2.len = usize ? ALIGN_8(csize) + usize : csize;
461 event->mmap2.pid = pid;
462 event->mmap2.tid = tid;
463 event->mmap2.ino = st.st_ino;
464 event->mmap2.maj = major(st.st_dev);
465 event->mmap2.min = minor(st.st_dev);
466 event->mmap2.prot = st.st_mode;
467 event->mmap2.flags = MAP_SHARED;
468 event->mmap2.ino_generation = 1;
470 id = (void *)((unsigned long)event + event->mmap.header.size - idr_size);
471 if (jd->sample_type & PERF_SAMPLE_TID) {
472 id->pid = pid;
473 id->tid = tid;
475 if (jd->sample_type & PERF_SAMPLE_TIME)
476 id->time = convert_timestamp(jd, jr->load.p.timestamp);
479 * create pseudo sample to induce dso hit increment
480 * use first address as sample address
482 memset(&sample, 0, sizeof(sample));
483 sample.cpumode = PERF_RECORD_MISC_USER;
484 sample.pid = pid;
485 sample.tid = tid;
486 sample.time = id->time;
487 sample.ip = addr;
489 ret = perf_event__process_mmap2(tool, event, &sample, jd->machine);
490 if (ret)
491 return ret;
493 ret = jit_inject_event(jd, event);
495 * mark dso as use to generate buildid in the header
497 if (!ret)
498 build_id__mark_dso_hit(tool, event, &sample, NULL, jd->machine);
500 return ret;
503 static int jit_repipe_code_move(struct jit_buf_desc *jd, union jr_entry *jr)
505 struct perf_sample sample;
506 union perf_event *event;
507 struct perf_tool *tool = jd->session->tool;
508 char *filename;
509 size_t size;
510 struct stat st;
511 int usize;
512 u16 idr_size;
513 int ret;
514 pid_t pid, tid;
515 struct {
516 u32 pid, tid;
517 u64 time;
518 } *id;
520 pid = jr->move.pid;
521 tid = jr->move.tid;
522 usize = jd->unwinding_mapped_size;
523 idr_size = jd->machine->id_hdr_size;
526 * +16 to account for sample_id_all (hack)
528 event = calloc(1, sizeof(*event) + 16);
529 if (!event)
530 return -1;
532 filename = event->mmap2.filename;
533 size = snprintf(filename, PATH_MAX, "%s/jitted-%d-%"PRIu64,
534 jd->dir,
535 pid,
536 jr->move.code_index);
538 size++; /* for \0 */
540 if (stat(filename, &st))
541 memset(&st, 0, sizeof(st));
543 size = PERF_ALIGN(size, sizeof(u64));
545 event->mmap2.header.type = PERF_RECORD_MMAP2;
546 event->mmap2.header.misc = PERF_RECORD_MISC_USER;
547 event->mmap2.header.size = (sizeof(event->mmap2) -
548 (sizeof(event->mmap2.filename) - size) + idr_size);
549 event->mmap2.pgoff = GEN_ELF_TEXT_OFFSET;
550 event->mmap2.start = jr->move.new_code_addr;
551 event->mmap2.len = usize ? ALIGN_8(jr->move.code_size) + usize
552 : jr->move.code_size;
553 event->mmap2.pid = pid;
554 event->mmap2.tid = tid;
555 event->mmap2.ino = st.st_ino;
556 event->mmap2.maj = major(st.st_dev);
557 event->mmap2.min = minor(st.st_dev);
558 event->mmap2.prot = st.st_mode;
559 event->mmap2.flags = MAP_SHARED;
560 event->mmap2.ino_generation = 1;
562 id = (void *)((unsigned long)event + event->mmap.header.size - idr_size);
563 if (jd->sample_type & PERF_SAMPLE_TID) {
564 id->pid = pid;
565 id->tid = tid;
567 if (jd->sample_type & PERF_SAMPLE_TIME)
568 id->time = convert_timestamp(jd, jr->load.p.timestamp);
571 * create pseudo sample to induce dso hit increment
572 * use first address as sample address
574 memset(&sample, 0, sizeof(sample));
575 sample.cpumode = PERF_RECORD_MISC_USER;
576 sample.pid = pid;
577 sample.tid = tid;
578 sample.time = id->time;
579 sample.ip = jr->move.new_code_addr;
581 ret = perf_event__process_mmap2(tool, event, &sample, jd->machine);
582 if (ret)
583 return ret;
585 ret = jit_inject_event(jd, event);
586 if (!ret)
587 build_id__mark_dso_hit(tool, event, &sample, NULL, jd->machine);
589 return ret;
592 static int jit_repipe_debug_info(struct jit_buf_desc *jd, union jr_entry *jr)
594 void *data;
595 size_t sz;
597 if (!(jd && jr))
598 return -1;
600 sz = jr->prefix.total_size - sizeof(jr->info);
601 data = malloc(sz);
602 if (!data)
603 return -1;
605 memcpy(data, &jr->info.entries, sz);
607 jd->debug_data = data;
610 * we must use nr_entry instead of size here because
611 * we cannot distinguish actual entry from padding otherwise
613 jd->nr_debug_entries = jr->info.nr_entry;
615 return 0;
618 static int
619 jit_repipe_unwinding_info(struct jit_buf_desc *jd, union jr_entry *jr)
621 void *unwinding_data;
622 uint32_t unwinding_data_size;
624 if (!(jd && jr))
625 return -1;
627 unwinding_data_size = jr->prefix.total_size - sizeof(jr->unwinding);
628 unwinding_data = malloc(unwinding_data_size);
629 if (!unwinding_data)
630 return -1;
632 memcpy(unwinding_data, &jr->unwinding.unwinding_data,
633 unwinding_data_size);
635 jd->eh_frame_hdr_size = jr->unwinding.eh_frame_hdr_size;
636 jd->unwinding_size = jr->unwinding.unwinding_size;
637 jd->unwinding_mapped_size = jr->unwinding.mapped_size;
638 jd->unwinding_data = unwinding_data;
640 return 0;
643 static int
644 jit_process_dump(struct jit_buf_desc *jd)
646 union jr_entry *jr;
647 int ret = 0;
649 while ((jr = jit_get_next_entry(jd))) {
650 switch(jr->prefix.id) {
651 case JIT_CODE_LOAD:
652 ret = jit_repipe_code_load(jd, jr);
653 break;
654 case JIT_CODE_MOVE:
655 ret = jit_repipe_code_move(jd, jr);
656 break;
657 case JIT_CODE_DEBUG_INFO:
658 ret = jit_repipe_debug_info(jd, jr);
659 break;
660 case JIT_CODE_UNWINDING_INFO:
661 ret = jit_repipe_unwinding_info(jd, jr);
662 break;
663 default:
664 ret = 0;
665 continue;
668 return ret;
671 static int
672 jit_inject(struct jit_buf_desc *jd, char *path)
674 int ret;
676 if (verbose > 0)
677 fprintf(stderr, "injecting: %s\n", path);
679 ret = jit_open(jd, path);
680 if (ret)
681 return -1;
683 ret = jit_process_dump(jd);
685 jit_close(jd);
687 if (verbose > 0)
688 fprintf(stderr, "injected: %s (%d)\n", path, ret);
690 return 0;
694 * File must be with pattern .../jit-XXXX.dump
695 * where XXXX is the PID of the process which did the mmap()
696 * as captured in the RECORD_MMAP record
698 static int
699 jit_detect(char *mmap_name, pid_t pid)
701 char *p;
702 char *end = NULL;
703 pid_t pid2;
705 if (verbose > 2)
706 fprintf(stderr, "jit marker trying : %s\n", mmap_name);
708 * get file name
710 p = strrchr(mmap_name, '/');
711 if (!p)
712 return -1;
715 * match prefix
717 if (strncmp(p, "/jit-", 5))
718 return -1;
721 * skip prefix
723 p += 5;
726 * must be followed by a pid
728 if (!isdigit(*p))
729 return -1;
731 pid2 = (int)strtol(p, &end, 10);
732 if (!end)
733 return -1;
736 * pid does not match mmap pid
737 * pid==0 in system-wide mode (synthesized)
739 if (pid && pid2 != pid)
740 return -1;
742 * validate suffix
744 if (strcmp(end, ".dump"))
745 return -1;
747 if (verbose > 0)
748 fprintf(stderr, "jit marker found: %s\n", mmap_name);
750 return 0;
754 jit_process(struct perf_session *session,
755 struct perf_data *output,
756 struct machine *machine,
757 char *filename,
758 pid_t pid,
759 u64 *nbytes)
761 struct perf_evsel *first;
762 struct jit_buf_desc jd;
763 int ret;
766 * first, detect marker mmap (i.e., the jitdump mmap)
768 if (jit_detect(filename, pid))
769 return 0;
771 memset(&jd, 0, sizeof(jd));
773 jd.session = session;
774 jd.output = output;
775 jd.machine = machine;
778 * track sample_type to compute id_all layout
779 * perf sets the same sample type to all events as of now
781 first = perf_evlist__first(session->evlist);
782 jd.sample_type = first->attr.sample_type;
784 *nbytes = 0;
786 ret = jit_inject(&jd, filename);
787 if (!ret) {
788 *nbytes = jd.bytes_written;
789 ret = 1;
792 return ret;