of: MSI: Simplify irqdomain lookup
[linux/fpc-iii.git] / tools / perf / util / auxtrace.c
blob360fda01f3b0d17369254d03fe16daf24f30c698
/*
 * auxtrace.c: AUX area trace support
 * Copyright (c) 2013-2015, Intel Corporation.
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms and conditions of the GNU General Public License,
 * version 2, as published by the Free Software Foundation.
 *
 * This program is distributed in the hope it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License for
 * more details.
 */
16 #include <sys/types.h>
17 #include <sys/mman.h>
18 #include <stdbool.h>
20 #include <linux/kernel.h>
21 #include <linux/perf_event.h>
22 #include <linux/types.h>
23 #include <linux/bitops.h>
24 #include <linux/log2.h>
25 #include <linux/string.h>
27 #include <sys/param.h>
28 #include <stdlib.h>
29 #include <stdio.h>
30 #include <string.h>
31 #include <limits.h>
32 #include <errno.h>
33 #include <linux/list.h>
35 #include "../perf.h"
36 #include "util.h"
37 #include "evlist.h"
38 #include "cpumap.h"
39 #include "thread_map.h"
40 #include "asm/bug.h"
41 #include "auxtrace.h"
43 #include <linux/hash.h>
45 #include "event.h"
46 #include "session.h"
47 #include "debug.h"
48 #include <subcmd/parse-options.h>
50 #include "intel-pt.h"
51 #include "intel-bts.h"
53 int auxtrace_mmap__mmap(struct auxtrace_mmap *mm,
54 struct auxtrace_mmap_params *mp,
55 void *userpg, int fd)
57 struct perf_event_mmap_page *pc = userpg;
59 WARN_ONCE(mm->base, "Uninitialized auxtrace_mmap\n");
61 mm->userpg = userpg;
62 mm->mask = mp->mask;
63 mm->len = mp->len;
64 mm->prev = 0;
65 mm->idx = mp->idx;
66 mm->tid = mp->tid;
67 mm->cpu = mp->cpu;
69 if (!mp->len) {
70 mm->base = NULL;
71 return 0;
74 #if BITS_PER_LONG != 64 && !defined(HAVE_SYNC_COMPARE_AND_SWAP_SUPPORT)
75 pr_err("Cannot use AUX area tracing mmaps\n");
76 return -1;
77 #endif
79 pc->aux_offset = mp->offset;
80 pc->aux_size = mp->len;
82 mm->base = mmap(NULL, mp->len, mp->prot, MAP_SHARED, fd, mp->offset);
83 if (mm->base == MAP_FAILED) {
84 pr_debug2("failed to mmap AUX area\n");
85 mm->base = NULL;
86 return -1;
89 return 0;
92 void auxtrace_mmap__munmap(struct auxtrace_mmap *mm)
94 if (mm->base) {
95 munmap(mm->base, mm->len);
96 mm->base = NULL;
100 void auxtrace_mmap_params__init(struct auxtrace_mmap_params *mp,
101 off_t auxtrace_offset,
102 unsigned int auxtrace_pages,
103 bool auxtrace_overwrite)
105 if (auxtrace_pages) {
106 mp->offset = auxtrace_offset;
107 mp->len = auxtrace_pages * (size_t)page_size;
108 mp->mask = is_power_of_2(mp->len) ? mp->len - 1 : 0;
109 mp->prot = PROT_READ | (auxtrace_overwrite ? 0 : PROT_WRITE);
110 pr_debug2("AUX area mmap length %zu\n", mp->len);
111 } else {
112 mp->len = 0;
116 void auxtrace_mmap_params__set_idx(struct auxtrace_mmap_params *mp,
117 struct perf_evlist *evlist, int idx,
118 bool per_cpu)
120 mp->idx = idx;
122 if (per_cpu) {
123 mp->cpu = evlist->cpus->map[idx];
124 if (evlist->threads)
125 mp->tid = thread_map__pid(evlist->threads, 0);
126 else
127 mp->tid = -1;
128 } else {
129 mp->cpu = -1;
130 mp->tid = thread_map__pid(evlist->threads, idx);
134 #define AUXTRACE_INIT_NR_QUEUES 32
136 static struct auxtrace_queue *auxtrace_alloc_queue_array(unsigned int nr_queues)
138 struct auxtrace_queue *queue_array;
139 unsigned int max_nr_queues, i;
141 max_nr_queues = UINT_MAX / sizeof(struct auxtrace_queue);
142 if (nr_queues > max_nr_queues)
143 return NULL;
145 queue_array = calloc(nr_queues, sizeof(struct auxtrace_queue));
146 if (!queue_array)
147 return NULL;
149 for (i = 0; i < nr_queues; i++) {
150 INIT_LIST_HEAD(&queue_array[i].head);
151 queue_array[i].priv = NULL;
154 return queue_array;
157 int auxtrace_queues__init(struct auxtrace_queues *queues)
159 queues->nr_queues = AUXTRACE_INIT_NR_QUEUES;
160 queues->queue_array = auxtrace_alloc_queue_array(queues->nr_queues);
161 if (!queues->queue_array)
162 return -ENOMEM;
163 return 0;
166 static int auxtrace_queues__grow(struct auxtrace_queues *queues,
167 unsigned int new_nr_queues)
169 unsigned int nr_queues = queues->nr_queues;
170 struct auxtrace_queue *queue_array;
171 unsigned int i;
173 if (!nr_queues)
174 nr_queues = AUXTRACE_INIT_NR_QUEUES;
176 while (nr_queues && nr_queues < new_nr_queues)
177 nr_queues <<= 1;
179 if (nr_queues < queues->nr_queues || nr_queues < new_nr_queues)
180 return -EINVAL;
182 queue_array = auxtrace_alloc_queue_array(nr_queues);
183 if (!queue_array)
184 return -ENOMEM;
186 for (i = 0; i < queues->nr_queues; i++) {
187 list_splice_tail(&queues->queue_array[i].head,
188 &queue_array[i].head);
189 queue_array[i].priv = queues->queue_array[i].priv;
192 queues->nr_queues = nr_queues;
193 queues->queue_array = queue_array;
195 return 0;
198 static void *auxtrace_copy_data(u64 size, struct perf_session *session)
200 int fd = perf_data_file__fd(session->file);
201 void *p;
202 ssize_t ret;
204 if (size > SSIZE_MAX)
205 return NULL;
207 p = malloc(size);
208 if (!p)
209 return NULL;
211 ret = readn(fd, p, size);
212 if (ret != (ssize_t)size) {
213 free(p);
214 return NULL;
217 return p;
220 static int auxtrace_queues__add_buffer(struct auxtrace_queues *queues,
221 unsigned int idx,
222 struct auxtrace_buffer *buffer)
224 struct auxtrace_queue *queue;
225 int err;
227 if (idx >= queues->nr_queues) {
228 err = auxtrace_queues__grow(queues, idx + 1);
229 if (err)
230 return err;
233 queue = &queues->queue_array[idx];
235 if (!queue->set) {
236 queue->set = true;
237 queue->tid = buffer->tid;
238 queue->cpu = buffer->cpu;
239 } else if (buffer->cpu != queue->cpu || buffer->tid != queue->tid) {
240 pr_err("auxtrace queue conflict: cpu %d, tid %d vs cpu %d, tid %d\n",
241 queue->cpu, queue->tid, buffer->cpu, buffer->tid);
242 return -EINVAL;
245 buffer->buffer_nr = queues->next_buffer_nr++;
247 list_add_tail(&buffer->list, &queue->head);
249 queues->new_data = true;
250 queues->populated = true;
252 return 0;
255 /* Limit buffers to 32MiB on 32-bit */
256 #define BUFFER_LIMIT_FOR_32_BIT (32 * 1024 * 1024)
258 static int auxtrace_queues__split_buffer(struct auxtrace_queues *queues,
259 unsigned int idx,
260 struct auxtrace_buffer *buffer)
262 u64 sz = buffer->size;
263 bool consecutive = false;
264 struct auxtrace_buffer *b;
265 int err;
267 while (sz > BUFFER_LIMIT_FOR_32_BIT) {
268 b = memdup(buffer, sizeof(struct auxtrace_buffer));
269 if (!b)
270 return -ENOMEM;
271 b->size = BUFFER_LIMIT_FOR_32_BIT;
272 b->consecutive = consecutive;
273 err = auxtrace_queues__add_buffer(queues, idx, b);
274 if (err) {
275 auxtrace_buffer__free(b);
276 return err;
278 buffer->data_offset += BUFFER_LIMIT_FOR_32_BIT;
279 sz -= BUFFER_LIMIT_FOR_32_BIT;
280 consecutive = true;
283 buffer->size = sz;
284 buffer->consecutive = consecutive;
286 return 0;
289 static int auxtrace_queues__add_event_buffer(struct auxtrace_queues *queues,
290 struct perf_session *session,
291 unsigned int idx,
292 struct auxtrace_buffer *buffer)
294 if (session->one_mmap) {
295 buffer->data = buffer->data_offset - session->one_mmap_offset +
296 session->one_mmap_addr;
297 } else if (perf_data_file__is_pipe(session->file)) {
298 buffer->data = auxtrace_copy_data(buffer->size, session);
299 if (!buffer->data)
300 return -ENOMEM;
301 buffer->data_needs_freeing = true;
302 } else if (BITS_PER_LONG == 32 &&
303 buffer->size > BUFFER_LIMIT_FOR_32_BIT) {
304 int err;
306 err = auxtrace_queues__split_buffer(queues, idx, buffer);
307 if (err)
308 return err;
311 return auxtrace_queues__add_buffer(queues, idx, buffer);
314 int auxtrace_queues__add_event(struct auxtrace_queues *queues,
315 struct perf_session *session,
316 union perf_event *event, off_t data_offset,
317 struct auxtrace_buffer **buffer_ptr)
319 struct auxtrace_buffer *buffer;
320 unsigned int idx;
321 int err;
323 buffer = zalloc(sizeof(struct auxtrace_buffer));
324 if (!buffer)
325 return -ENOMEM;
327 buffer->pid = -1;
328 buffer->tid = event->auxtrace.tid;
329 buffer->cpu = event->auxtrace.cpu;
330 buffer->data_offset = data_offset;
331 buffer->offset = event->auxtrace.offset;
332 buffer->reference = event->auxtrace.reference;
333 buffer->size = event->auxtrace.size;
334 idx = event->auxtrace.idx;
336 err = auxtrace_queues__add_event_buffer(queues, session, idx, buffer);
337 if (err)
338 goto out_err;
340 if (buffer_ptr)
341 *buffer_ptr = buffer;
343 return 0;
345 out_err:
346 auxtrace_buffer__free(buffer);
347 return err;
350 static int auxtrace_queues__add_indexed_event(struct auxtrace_queues *queues,
351 struct perf_session *session,
352 off_t file_offset, size_t sz)
354 union perf_event *event;
355 int err;
356 char buf[PERF_SAMPLE_MAX_SIZE];
358 err = perf_session__peek_event(session, file_offset, buf,
359 PERF_SAMPLE_MAX_SIZE, &event, NULL);
360 if (err)
361 return err;
363 if (event->header.type == PERF_RECORD_AUXTRACE) {
364 if (event->header.size < sizeof(struct auxtrace_event) ||
365 event->header.size != sz) {
366 err = -EINVAL;
367 goto out;
369 file_offset += event->header.size;
370 err = auxtrace_queues__add_event(queues, session, event,
371 file_offset, NULL);
373 out:
374 return err;
377 void auxtrace_queues__free(struct auxtrace_queues *queues)
379 unsigned int i;
381 for (i = 0; i < queues->nr_queues; i++) {
382 while (!list_empty(&queues->queue_array[i].head)) {
383 struct auxtrace_buffer *buffer;
385 buffer = list_entry(queues->queue_array[i].head.next,
386 struct auxtrace_buffer, list);
387 list_del(&buffer->list);
388 auxtrace_buffer__free(buffer);
392 zfree(&queues->queue_array);
393 queues->nr_queues = 0;
396 static void auxtrace_heapify(struct auxtrace_heap_item *heap_array,
397 unsigned int pos, unsigned int queue_nr,
398 u64 ordinal)
400 unsigned int parent;
402 while (pos) {
403 parent = (pos - 1) >> 1;
404 if (heap_array[parent].ordinal <= ordinal)
405 break;
406 heap_array[pos] = heap_array[parent];
407 pos = parent;
409 heap_array[pos].queue_nr = queue_nr;
410 heap_array[pos].ordinal = ordinal;
413 int auxtrace_heap__add(struct auxtrace_heap *heap, unsigned int queue_nr,
414 u64 ordinal)
416 struct auxtrace_heap_item *heap_array;
418 if (queue_nr >= heap->heap_sz) {
419 unsigned int heap_sz = AUXTRACE_INIT_NR_QUEUES;
421 while (heap_sz <= queue_nr)
422 heap_sz <<= 1;
423 heap_array = realloc(heap->heap_array,
424 heap_sz * sizeof(struct auxtrace_heap_item));
425 if (!heap_array)
426 return -ENOMEM;
427 heap->heap_array = heap_array;
428 heap->heap_sz = heap_sz;
431 auxtrace_heapify(heap->heap_array, heap->heap_cnt++, queue_nr, ordinal);
433 return 0;
436 void auxtrace_heap__free(struct auxtrace_heap *heap)
438 zfree(&heap->heap_array);
439 heap->heap_cnt = 0;
440 heap->heap_sz = 0;
443 void auxtrace_heap__pop(struct auxtrace_heap *heap)
445 unsigned int pos, last, heap_cnt = heap->heap_cnt;
446 struct auxtrace_heap_item *heap_array;
448 if (!heap_cnt)
449 return;
451 heap->heap_cnt -= 1;
453 heap_array = heap->heap_array;
455 pos = 0;
456 while (1) {
457 unsigned int left, right;
459 left = (pos << 1) + 1;
460 if (left >= heap_cnt)
461 break;
462 right = left + 1;
463 if (right >= heap_cnt) {
464 heap_array[pos] = heap_array[left];
465 return;
467 if (heap_array[left].ordinal < heap_array[right].ordinal) {
468 heap_array[pos] = heap_array[left];
469 pos = left;
470 } else {
471 heap_array[pos] = heap_array[right];
472 pos = right;
476 last = heap_cnt - 1;
477 auxtrace_heapify(heap_array, pos, heap_array[last].queue_nr,
478 heap_array[last].ordinal);
481 size_t auxtrace_record__info_priv_size(struct auxtrace_record *itr)
483 if (itr)
484 return itr->info_priv_size(itr);
485 return 0;
/* Report that AUX area tracing is unavailable; always returns -EINVAL. */
static int auxtrace_not_supported(void)
{
	pr_err("AUX area tracing is not supported on this architecture\n");

	return -EINVAL;
}
494 int auxtrace_record__info_fill(struct auxtrace_record *itr,
495 struct perf_session *session,
496 struct auxtrace_info_event *auxtrace_info,
497 size_t priv_size)
499 if (itr)
500 return itr->info_fill(itr, session, auxtrace_info, priv_size);
501 return auxtrace_not_supported();
504 void auxtrace_record__free(struct auxtrace_record *itr)
506 if (itr)
507 itr->free(itr);
510 int auxtrace_record__snapshot_start(struct auxtrace_record *itr)
512 if (itr && itr->snapshot_start)
513 return itr->snapshot_start(itr);
514 return 0;
517 int auxtrace_record__snapshot_finish(struct auxtrace_record *itr)
519 if (itr && itr->snapshot_finish)
520 return itr->snapshot_finish(itr);
521 return 0;
524 int auxtrace_record__find_snapshot(struct auxtrace_record *itr, int idx,
525 struct auxtrace_mmap *mm,
526 unsigned char *data, u64 *head, u64 *old)
528 if (itr && itr->find_snapshot)
529 return itr->find_snapshot(itr, idx, mm, data, head, old);
530 return 0;
533 int auxtrace_record__options(struct auxtrace_record *itr,
534 struct perf_evlist *evlist,
535 struct record_opts *opts)
537 if (itr)
538 return itr->recording_options(itr, evlist, opts);
539 return 0;
542 u64 auxtrace_record__reference(struct auxtrace_record *itr)
544 if (itr)
545 return itr->reference(itr);
546 return 0;
549 int auxtrace_parse_snapshot_options(struct auxtrace_record *itr,
550 struct record_opts *opts, const char *str)
552 if (!str)
553 return 0;
555 if (itr)
556 return itr->parse_snapshot_options(itr, opts, str);
558 pr_err("No AUX area tracing to snapshot\n");
559 return -EINVAL;
562 struct auxtrace_record *__weak
563 auxtrace_record__init(struct perf_evlist *evlist __maybe_unused, int *err)
565 *err = 0;
566 return NULL;
569 static int auxtrace_index__alloc(struct list_head *head)
571 struct auxtrace_index *auxtrace_index;
573 auxtrace_index = malloc(sizeof(struct auxtrace_index));
574 if (!auxtrace_index)
575 return -ENOMEM;
577 auxtrace_index->nr = 0;
578 INIT_LIST_HEAD(&auxtrace_index->list);
580 list_add_tail(&auxtrace_index->list, head);
582 return 0;
585 void auxtrace_index__free(struct list_head *head)
587 struct auxtrace_index *auxtrace_index, *n;
589 list_for_each_entry_safe(auxtrace_index, n, head, list) {
590 list_del(&auxtrace_index->list);
591 free(auxtrace_index);
595 static struct auxtrace_index *auxtrace_index__last(struct list_head *head)
597 struct auxtrace_index *auxtrace_index;
598 int err;
600 if (list_empty(head)) {
601 err = auxtrace_index__alloc(head);
602 if (err)
603 return NULL;
606 auxtrace_index = list_entry(head->prev, struct auxtrace_index, list);
608 if (auxtrace_index->nr >= PERF_AUXTRACE_INDEX_ENTRY_COUNT) {
609 err = auxtrace_index__alloc(head);
610 if (err)
611 return NULL;
612 auxtrace_index = list_entry(head->prev, struct auxtrace_index,
613 list);
616 return auxtrace_index;
619 int auxtrace_index__auxtrace_event(struct list_head *head,
620 union perf_event *event, off_t file_offset)
622 struct auxtrace_index *auxtrace_index;
623 size_t nr;
625 auxtrace_index = auxtrace_index__last(head);
626 if (!auxtrace_index)
627 return -ENOMEM;
629 nr = auxtrace_index->nr;
630 auxtrace_index->entries[nr].file_offset = file_offset;
631 auxtrace_index->entries[nr].sz = event->header.size;
632 auxtrace_index->nr += 1;
634 return 0;
637 static int auxtrace_index__do_write(int fd,
638 struct auxtrace_index *auxtrace_index)
640 struct auxtrace_index_entry ent;
641 size_t i;
643 for (i = 0; i < auxtrace_index->nr; i++) {
644 ent.file_offset = auxtrace_index->entries[i].file_offset;
645 ent.sz = auxtrace_index->entries[i].sz;
646 if (writen(fd, &ent, sizeof(ent)) != sizeof(ent))
647 return -errno;
649 return 0;
652 int auxtrace_index__write(int fd, struct list_head *head)
654 struct auxtrace_index *auxtrace_index;
655 u64 total = 0;
656 int err;
658 list_for_each_entry(auxtrace_index, head, list)
659 total += auxtrace_index->nr;
661 if (writen(fd, &total, sizeof(total)) != sizeof(total))
662 return -errno;
664 list_for_each_entry(auxtrace_index, head, list) {
665 err = auxtrace_index__do_write(fd, auxtrace_index);
666 if (err)
667 return err;
670 return 0;
673 static int auxtrace_index__process_entry(int fd, struct list_head *head,
674 bool needs_swap)
676 struct auxtrace_index *auxtrace_index;
677 struct auxtrace_index_entry ent;
678 size_t nr;
680 if (readn(fd, &ent, sizeof(ent)) != sizeof(ent))
681 return -1;
683 auxtrace_index = auxtrace_index__last(head);
684 if (!auxtrace_index)
685 return -1;
687 nr = auxtrace_index->nr;
688 if (needs_swap) {
689 auxtrace_index->entries[nr].file_offset =
690 bswap_64(ent.file_offset);
691 auxtrace_index->entries[nr].sz = bswap_64(ent.sz);
692 } else {
693 auxtrace_index->entries[nr].file_offset = ent.file_offset;
694 auxtrace_index->entries[nr].sz = ent.sz;
697 auxtrace_index->nr = nr + 1;
699 return 0;
702 int auxtrace_index__process(int fd, u64 size, struct perf_session *session,
703 bool needs_swap)
705 struct list_head *head = &session->auxtrace_index;
706 u64 nr;
708 if (readn(fd, &nr, sizeof(u64)) != sizeof(u64))
709 return -1;
711 if (needs_swap)
712 nr = bswap_64(nr);
714 if (sizeof(u64) + nr * sizeof(struct auxtrace_index_entry) > size)
715 return -1;
717 while (nr--) {
718 int err;
720 err = auxtrace_index__process_entry(fd, head, needs_swap);
721 if (err)
722 return -1;
725 return 0;
728 static int auxtrace_queues__process_index_entry(struct auxtrace_queues *queues,
729 struct perf_session *session,
730 struct auxtrace_index_entry *ent)
732 return auxtrace_queues__add_indexed_event(queues, session,
733 ent->file_offset, ent->sz);
736 int auxtrace_queues__process_index(struct auxtrace_queues *queues,
737 struct perf_session *session)
739 struct auxtrace_index *auxtrace_index;
740 struct auxtrace_index_entry *ent;
741 size_t i;
742 int err;
744 list_for_each_entry(auxtrace_index, &session->auxtrace_index, list) {
745 for (i = 0; i < auxtrace_index->nr; i++) {
746 ent = &auxtrace_index->entries[i];
747 err = auxtrace_queues__process_index_entry(queues,
748 session,
749 ent);
750 if (err)
751 return err;
754 return 0;
757 struct auxtrace_buffer *auxtrace_buffer__next(struct auxtrace_queue *queue,
758 struct auxtrace_buffer *buffer)
760 if (buffer) {
761 if (list_is_last(&buffer->list, &queue->head))
762 return NULL;
763 return list_entry(buffer->list.next, struct auxtrace_buffer,
764 list);
765 } else {
766 if (list_empty(&queue->head))
767 return NULL;
768 return list_entry(queue->head.next, struct auxtrace_buffer,
769 list);
773 void *auxtrace_buffer__get_data(struct auxtrace_buffer *buffer, int fd)
775 size_t adj = buffer->data_offset & (page_size - 1);
776 size_t size = buffer->size + adj;
777 off_t file_offset = buffer->data_offset - adj;
778 void *addr;
780 if (buffer->data)
781 return buffer->data;
783 addr = mmap(NULL, size, PROT_READ, MAP_SHARED, fd, file_offset);
784 if (addr == MAP_FAILED)
785 return NULL;
787 buffer->mmap_addr = addr;
788 buffer->mmap_size = size;
790 buffer->data = addr + adj;
792 return buffer->data;
795 void auxtrace_buffer__put_data(struct auxtrace_buffer *buffer)
797 if (!buffer->data || !buffer->mmap_addr)
798 return;
799 munmap(buffer->mmap_addr, buffer->mmap_size);
800 buffer->mmap_addr = NULL;
801 buffer->mmap_size = 0;
802 buffer->data = NULL;
803 buffer->use_data = NULL;
806 void auxtrace_buffer__drop_data(struct auxtrace_buffer *buffer)
808 auxtrace_buffer__put_data(buffer);
809 if (buffer->data_needs_freeing) {
810 buffer->data_needs_freeing = false;
811 zfree(&buffer->data);
812 buffer->use_data = NULL;
813 buffer->size = 0;
/* Drop the data of @buffer, then free the buffer itself. */
void auxtrace_buffer__free(struct auxtrace_buffer *buffer)
{
	auxtrace_buffer__drop_data(buffer);

	free(buffer);
}
823 void auxtrace_synth_error(struct auxtrace_error_event *auxtrace_error, int type,
824 int code, int cpu, pid_t pid, pid_t tid, u64 ip,
825 const char *msg)
827 size_t size;
829 memset(auxtrace_error, 0, sizeof(struct auxtrace_error_event));
831 auxtrace_error->header.type = PERF_RECORD_AUXTRACE_ERROR;
832 auxtrace_error->type = type;
833 auxtrace_error->code = code;
834 auxtrace_error->cpu = cpu;
835 auxtrace_error->pid = pid;
836 auxtrace_error->tid = tid;
837 auxtrace_error->ip = ip;
838 strlcpy(auxtrace_error->msg, msg, MAX_AUXTRACE_ERROR_MSG);
840 size = (void *)auxtrace_error->msg - (void *)auxtrace_error +
841 strlen(auxtrace_error->msg) + 1;
842 auxtrace_error->header.size = PERF_ALIGN(size, sizeof(u64));
845 int perf_event__synthesize_auxtrace_info(struct auxtrace_record *itr,
846 struct perf_tool *tool,
847 struct perf_session *session,
848 perf_event__handler_t process)
850 union perf_event *ev;
851 size_t priv_size;
852 int err;
854 pr_debug2("Synthesizing auxtrace information\n");
855 priv_size = auxtrace_record__info_priv_size(itr);
856 ev = zalloc(sizeof(struct auxtrace_info_event) + priv_size);
857 if (!ev)
858 return -ENOMEM;
860 ev->auxtrace_info.header.type = PERF_RECORD_AUXTRACE_INFO;
861 ev->auxtrace_info.header.size = sizeof(struct auxtrace_info_event) +
862 priv_size;
863 err = auxtrace_record__info_fill(itr, session, &ev->auxtrace_info,
864 priv_size);
865 if (err)
866 goto out_free;
868 err = process(tool, ev, NULL, NULL);
869 out_free:
870 free(ev);
871 return err;
874 static bool auxtrace__dont_decode(struct perf_session *session)
876 return !session->itrace_synth_opts ||
877 session->itrace_synth_opts->dont_decode;
880 int perf_event__process_auxtrace_info(struct perf_tool *tool __maybe_unused,
881 union perf_event *event,
882 struct perf_session *session)
884 enum auxtrace_type type = event->auxtrace_info.type;
886 if (dump_trace)
887 fprintf(stdout, " type: %u\n", type);
889 switch (type) {
890 case PERF_AUXTRACE_INTEL_PT:
891 return intel_pt_process_auxtrace_info(event, session);
892 case PERF_AUXTRACE_INTEL_BTS:
893 return intel_bts_process_auxtrace_info(event, session);
894 case PERF_AUXTRACE_UNKNOWN:
895 default:
896 return -EINVAL;
900 s64 perf_event__process_auxtrace(struct perf_tool *tool,
901 union perf_event *event,
902 struct perf_session *session)
904 s64 err;
906 if (dump_trace)
907 fprintf(stdout, " size: %#"PRIx64" offset: %#"PRIx64" ref: %#"PRIx64" idx: %u tid: %d cpu: %d\n",
908 event->auxtrace.size, event->auxtrace.offset,
909 event->auxtrace.reference, event->auxtrace.idx,
910 event->auxtrace.tid, event->auxtrace.cpu);
912 if (auxtrace__dont_decode(session))
913 return event->auxtrace.size;
915 if (!session->auxtrace || event->header.type != PERF_RECORD_AUXTRACE)
916 return -EINVAL;
918 err = session->auxtrace->process_auxtrace_event(session, event, tool);
919 if (err < 0)
920 return err;
922 return event->auxtrace.size;
925 #define PERF_ITRACE_DEFAULT_PERIOD_TYPE PERF_ITRACE_PERIOD_NANOSECS
926 #define PERF_ITRACE_DEFAULT_PERIOD 100000
927 #define PERF_ITRACE_DEFAULT_CALLCHAIN_SZ 16
928 #define PERF_ITRACE_MAX_CALLCHAIN_SZ 1024
929 #define PERF_ITRACE_DEFAULT_LAST_BRANCH_SZ 64
930 #define PERF_ITRACE_MAX_LAST_BRANCH_SZ 1024
932 void itrace_synth_opts__set_default(struct itrace_synth_opts *synth_opts)
934 synth_opts->instructions = true;
935 synth_opts->branches = true;
936 synth_opts->transactions = true;
937 synth_opts->errors = true;
938 synth_opts->period_type = PERF_ITRACE_DEFAULT_PERIOD_TYPE;
939 synth_opts->period = PERF_ITRACE_DEFAULT_PERIOD;
940 synth_opts->callchain_sz = PERF_ITRACE_DEFAULT_CALLCHAIN_SZ;
941 synth_opts->last_branch_sz = PERF_ITRACE_DEFAULT_LAST_BRANCH_SZ;
945 * Please check tools/perf/Documentation/perf-script.txt for information
946 * about the options parsed here, which is introduced after this cset,
947 * when support in 'perf script' for these options is introduced.
949 int itrace_parse_synth_opts(const struct option *opt, const char *str,
950 int unset)
952 struct itrace_synth_opts *synth_opts = opt->value;
953 const char *p;
954 char *endptr;
955 bool period_type_set = false;
956 bool period_set = false;
958 synth_opts->set = true;
960 if (unset) {
961 synth_opts->dont_decode = true;
962 return 0;
965 if (!str) {
966 itrace_synth_opts__set_default(synth_opts);
967 return 0;
970 for (p = str; *p;) {
971 switch (*p++) {
972 case 'i':
973 synth_opts->instructions = true;
974 while (*p == ' ' || *p == ',')
975 p += 1;
976 if (isdigit(*p)) {
977 synth_opts->period = strtoull(p, &endptr, 10);
978 period_set = true;
979 p = endptr;
980 while (*p == ' ' || *p == ',')
981 p += 1;
982 switch (*p++) {
983 case 'i':
984 synth_opts->period_type =
985 PERF_ITRACE_PERIOD_INSTRUCTIONS;
986 period_type_set = true;
987 break;
988 case 't':
989 synth_opts->period_type =
990 PERF_ITRACE_PERIOD_TICKS;
991 period_type_set = true;
992 break;
993 case 'm':
994 synth_opts->period *= 1000;
995 /* Fall through */
996 case 'u':
997 synth_opts->period *= 1000;
998 /* Fall through */
999 case 'n':
1000 if (*p++ != 's')
1001 goto out_err;
1002 synth_opts->period_type =
1003 PERF_ITRACE_PERIOD_NANOSECS;
1004 period_type_set = true;
1005 break;
1006 case '\0':
1007 goto out;
1008 default:
1009 goto out_err;
1012 break;
1013 case 'b':
1014 synth_opts->branches = true;
1015 break;
1016 case 'x':
1017 synth_opts->transactions = true;
1018 break;
1019 case 'e':
1020 synth_opts->errors = true;
1021 break;
1022 case 'd':
1023 synth_opts->log = true;
1024 break;
1025 case 'c':
1026 synth_opts->branches = true;
1027 synth_opts->calls = true;
1028 break;
1029 case 'r':
1030 synth_opts->branches = true;
1031 synth_opts->returns = true;
1032 break;
1033 case 'g':
1034 synth_opts->callchain = true;
1035 synth_opts->callchain_sz =
1036 PERF_ITRACE_DEFAULT_CALLCHAIN_SZ;
1037 while (*p == ' ' || *p == ',')
1038 p += 1;
1039 if (isdigit(*p)) {
1040 unsigned int val;
1042 val = strtoul(p, &endptr, 10);
1043 p = endptr;
1044 if (!val || val > PERF_ITRACE_MAX_CALLCHAIN_SZ)
1045 goto out_err;
1046 synth_opts->callchain_sz = val;
1048 break;
1049 case 'l':
1050 synth_opts->last_branch = true;
1051 synth_opts->last_branch_sz =
1052 PERF_ITRACE_DEFAULT_LAST_BRANCH_SZ;
1053 while (*p == ' ' || *p == ',')
1054 p += 1;
1055 if (isdigit(*p)) {
1056 unsigned int val;
1058 val = strtoul(p, &endptr, 10);
1059 p = endptr;
1060 if (!val ||
1061 val > PERF_ITRACE_MAX_LAST_BRANCH_SZ)
1062 goto out_err;
1063 synth_opts->last_branch_sz = val;
1065 break;
1066 case ' ':
1067 case ',':
1068 break;
1069 default:
1070 goto out_err;
1073 out:
1074 if (synth_opts->instructions) {
1075 if (!period_type_set)
1076 synth_opts->period_type =
1077 PERF_ITRACE_DEFAULT_PERIOD_TYPE;
1078 if (!period_set)
1079 synth_opts->period = PERF_ITRACE_DEFAULT_PERIOD;
1082 return 0;
1084 out_err:
1085 pr_err("Bad Instruction Tracing options '%s'\n", str);
1086 return -EINVAL;
1089 static const char * const auxtrace_error_type_name[] = {
1090 [PERF_AUXTRACE_ERROR_ITRACE] = "instruction trace",
1093 static const char *auxtrace_error_name(int type)
1095 const char *error_type_name = NULL;
1097 if (type < PERF_AUXTRACE_ERROR_MAX)
1098 error_type_name = auxtrace_error_type_name[type];
1099 if (!error_type_name)
1100 error_type_name = "unknown AUX";
1101 return error_type_name;
1104 size_t perf_event__fprintf_auxtrace_error(union perf_event *event, FILE *fp)
1106 struct auxtrace_error_event *e = &event->auxtrace_error;
1107 int ret;
1109 ret = fprintf(fp, " %s error type %u",
1110 auxtrace_error_name(e->type), e->type);
1111 ret += fprintf(fp, " cpu %d pid %d tid %d ip %#"PRIx64" code %u: %s\n",
1112 e->cpu, e->pid, e->tid, e->ip, e->code, e->msg);
1113 return ret;
1116 void perf_session__auxtrace_error_inc(struct perf_session *session,
1117 union perf_event *event)
1119 struct auxtrace_error_event *e = &event->auxtrace_error;
1121 if (e->type < PERF_AUXTRACE_ERROR_MAX)
1122 session->evlist->stats.nr_auxtrace_errors[e->type] += 1;
1125 void events_stats__auxtrace_error_warn(const struct events_stats *stats)
1127 int i;
1129 for (i = 0; i < PERF_AUXTRACE_ERROR_MAX; i++) {
1130 if (!stats->nr_auxtrace_errors[i])
1131 continue;
1132 ui__warning("%u %s errors\n",
1133 stats->nr_auxtrace_errors[i],
1134 auxtrace_error_name(i));
1138 int perf_event__process_auxtrace_error(struct perf_tool *tool __maybe_unused,
1139 union perf_event *event,
1140 struct perf_session *session)
1142 if (auxtrace__dont_decode(session))
1143 return 0;
1145 perf_event__fprintf_auxtrace_error(event, stdout);
1146 return 0;
1149 static int __auxtrace_mmap__read(struct auxtrace_mmap *mm,
1150 struct auxtrace_record *itr,
1151 struct perf_tool *tool, process_auxtrace_t fn,
1152 bool snapshot, size_t snapshot_size)
1154 u64 head, old = mm->prev, offset, ref;
1155 unsigned char *data = mm->base;
1156 size_t size, head_off, old_off, len1, len2, padding;
1157 union perf_event ev;
1158 void *data1, *data2;
1160 if (snapshot) {
1161 head = auxtrace_mmap__read_snapshot_head(mm);
1162 if (auxtrace_record__find_snapshot(itr, mm->idx, mm, data,
1163 &head, &old))
1164 return -1;
1165 } else {
1166 head = auxtrace_mmap__read_head(mm);
1169 if (old == head)
1170 return 0;
1172 pr_debug3("auxtrace idx %d old %#"PRIx64" head %#"PRIx64" diff %#"PRIx64"\n",
1173 mm->idx, old, head, head - old);
1175 if (mm->mask) {
1176 head_off = head & mm->mask;
1177 old_off = old & mm->mask;
1178 } else {
1179 head_off = head % mm->len;
1180 old_off = old % mm->len;
1183 if (head_off > old_off)
1184 size = head_off - old_off;
1185 else
1186 size = mm->len - (old_off - head_off);
1188 if (snapshot && size > snapshot_size)
1189 size = snapshot_size;
1191 ref = auxtrace_record__reference(itr);
1193 if (head > old || size <= head || mm->mask) {
1194 offset = head - size;
1195 } else {
1197 * When the buffer size is not a power of 2, 'head' wraps at the
1198 * highest multiple of the buffer size, so we have to subtract
1199 * the remainder here.
1201 u64 rem = (0ULL - mm->len) % mm->len;
1203 offset = head - size - rem;
1206 if (size > head_off) {
1207 len1 = size - head_off;
1208 data1 = &data[mm->len - len1];
1209 len2 = head_off;
1210 data2 = &data[0];
1211 } else {
1212 len1 = size;
1213 data1 = &data[head_off - len1];
1214 len2 = 0;
1215 data2 = NULL;
1218 if (itr->alignment) {
1219 unsigned int unwanted = len1 % itr->alignment;
1221 len1 -= unwanted;
1222 size -= unwanted;
1225 /* padding must be written by fn() e.g. record__process_auxtrace() */
1226 padding = size & 7;
1227 if (padding)
1228 padding = 8 - padding;
1230 memset(&ev, 0, sizeof(ev));
1231 ev.auxtrace.header.type = PERF_RECORD_AUXTRACE;
1232 ev.auxtrace.header.size = sizeof(ev.auxtrace);
1233 ev.auxtrace.size = size + padding;
1234 ev.auxtrace.offset = offset;
1235 ev.auxtrace.reference = ref;
1236 ev.auxtrace.idx = mm->idx;
1237 ev.auxtrace.tid = mm->tid;
1238 ev.auxtrace.cpu = mm->cpu;
1240 if (fn(tool, &ev, data1, len1, data2, len2))
1241 return -1;
1243 mm->prev = head;
1245 if (!snapshot) {
1246 auxtrace_mmap__write_tail(mm, head);
1247 if (itr->read_finish) {
1248 int err;
1250 err = itr->read_finish(itr, mm->idx);
1251 if (err < 0)
1252 return err;
1256 return 1;
1259 int auxtrace_mmap__read(struct auxtrace_mmap *mm, struct auxtrace_record *itr,
1260 struct perf_tool *tool, process_auxtrace_t fn)
1262 return __auxtrace_mmap__read(mm, itr, tool, fn, false, 0);
1265 int auxtrace_mmap__read_snapshot(struct auxtrace_mmap *mm,
1266 struct auxtrace_record *itr,
1267 struct perf_tool *tool, process_auxtrace_t fn,
1268 size_t snapshot_size)
1270 return __auxtrace_mmap__read(mm, itr, tool, fn, true, snapshot_size);
/**
 * struct auxtrace_cache - hash table to implement a cache
 * @hashtable: the hashtable
 * @sz: hashtable size (number of hlists)
 * @entry_size: size of an entry
 * @limit: limit the number of entries to this maximum, when reached the cache
 *         is dropped and caching begins again with an empty cache
 * @cnt: current number of entries
 * @bits: hashtable size (@sz = 2^@bits)
 */
struct auxtrace_cache {
	struct hlist_head	*hashtable;
	size_t			sz;
	size_t			entry_size;
	size_t			limit;
	size_t			cnt;
	unsigned int		bits;
};
1292 struct auxtrace_cache *auxtrace_cache__new(unsigned int bits, size_t entry_size,
1293 unsigned int limit_percent)
1295 struct auxtrace_cache *c;
1296 struct hlist_head *ht;
1297 size_t sz, i;
1299 c = zalloc(sizeof(struct auxtrace_cache));
1300 if (!c)
1301 return NULL;
1303 sz = 1UL << bits;
1305 ht = calloc(sz, sizeof(struct hlist_head));
1306 if (!ht)
1307 goto out_free;
1309 for (i = 0; i < sz; i++)
1310 INIT_HLIST_HEAD(&ht[i]);
1312 c->hashtable = ht;
1313 c->sz = sz;
1314 c->entry_size = entry_size;
1315 c->limit = (c->sz * limit_percent) / 100;
1316 c->bits = bits;
1318 return c;
1320 out_free:
1321 free(c);
1322 return NULL;
1325 static void auxtrace_cache__drop(struct auxtrace_cache *c)
1327 struct auxtrace_cache_entry *entry;
1328 struct hlist_node *tmp;
1329 size_t i;
1331 if (!c)
1332 return;
1334 for (i = 0; i < c->sz; i++) {
1335 hlist_for_each_entry_safe(entry, tmp, &c->hashtable[i], hash) {
1336 hlist_del(&entry->hash);
1337 auxtrace_cache__free_entry(c, entry);
1341 c->cnt = 0;
1344 void auxtrace_cache__free(struct auxtrace_cache *c)
1346 if (!c)
1347 return;
1349 auxtrace_cache__drop(c);
1350 free(c->hashtable);
1351 free(c);
1354 void *auxtrace_cache__alloc_entry(struct auxtrace_cache *c)
1356 return malloc(c->entry_size);
1359 void auxtrace_cache__free_entry(struct auxtrace_cache *c __maybe_unused,
1360 void *entry)
1362 free(entry);
1365 int auxtrace_cache__add(struct auxtrace_cache *c, u32 key,
1366 struct auxtrace_cache_entry *entry)
1368 if (c->limit && ++c->cnt > c->limit)
1369 auxtrace_cache__drop(c);
1371 entry->key = key;
1372 hlist_add_head(&entry->hash, &c->hashtable[hash_32(key, c->bits)]);
1374 return 0;
1377 void *auxtrace_cache__lookup(struct auxtrace_cache *c, u32 key)
1379 struct auxtrace_cache_entry *entry;
1380 struct hlist_head *hlist;
1382 if (!c)
1383 return NULL;
1385 hlist = &c->hashtable[hash_32(key, c->bits)];
1386 hlist_for_each_entry(entry, hlist, hash) {
1387 if (entry->key == key)
1388 return entry;
1391 return NULL;