1 #include "util.h"
2 #include <sys/types.h>
3 #include <byteswap.h>
4 #include <unistd.h>
5 #include <stdio.h>
6 #include <stdlib.h>
7 #include <linux/list.h>
8 #include <linux/kernel.h>
9 #include <linux/bitops.h>
10 #include <sys/utsname.h>
11
12 #include "evlist.h"
13 #include "evsel.h"
14 #include "header.h"
15 #include "../perf.h"
16 #include "trace-event.h"
17 #include "session.h"
18 #include "symbol.h"
19 #include "debug.h"
20 #include "cpumap.h"
21 #include "pmu.h"
22 #include "vdso.h"
23 #include "strbuf.h"
24 #include "build-id.h"
25 #include "data.h"
26
27 static u32 header_argc;
28 static const char **header_argv;
29
30 /*
31 * magic2 = "PERFILE2"
32 * must be a numerical value to let the endianness
33 * determine the memory layout. That way we are able
34 * to detect endianness when reading the perf.data file
35 * back.
36 *
37 * we check for legacy (PERFFILE) format.
38 */
39 static const char *__perf_magic1 = "PERFFILE";
40 static const u64 __perf_magic2 = 0x32454c4946524550ULL;
41 static const u64 __perf_magic2_sw = 0x50455246494c4532ULL;
42
43 #define PERF_MAGIC __perf_magic2
44
45 struct perf_file_attr {
46 struct perf_event_attr attr;
47 struct perf_file_section ids;
48 };
49
perf_header__set_feat(struct perf_header * header,int feat)50 void perf_header__set_feat(struct perf_header *header, int feat)
51 {
52 set_bit(feat, header->adds_features);
53 }
54
perf_header__clear_feat(struct perf_header * header,int feat)55 void perf_header__clear_feat(struct perf_header *header, int feat)
56 {
57 clear_bit(feat, header->adds_features);
58 }
59
perf_header__has_feat(const struct perf_header * header,int feat)60 bool perf_header__has_feat(const struct perf_header *header, int feat)
61 {
62 return test_bit(feat, header->adds_features);
63 }
64
do_write(int fd,const void * buf,size_t size)65 static int do_write(int fd, const void *buf, size_t size)
66 {
67 while (size) {
68 int ret = write(fd, buf, size);
69
70 if (ret < 0)
71 return -errno;
72
73 size -= ret;
74 buf += ret;
75 }
76
77 return 0;
78 }
79
write_padded(int fd,const void * bf,size_t count,size_t count_aligned)80 int write_padded(int fd, const void *bf, size_t count, size_t count_aligned)
81 {
82 static const char zero_buf[NAME_ALIGN];
83 int err = do_write(fd, bf, count);
84
85 if (!err)
86 err = do_write(fd, zero_buf, count_aligned - count);
87
88 return err;
89 }
90
do_write_string(int fd,const char * str)91 static int do_write_string(int fd, const char *str)
92 {
93 u32 len, olen;
94 int ret;
95
96 olen = strlen(str) + 1;
97 len = PERF_ALIGN(olen, NAME_ALIGN);
98
99 /* write len, incl. \0 */
100 ret = do_write(fd, &len, sizeof(len));
101 if (ret < 0)
102 return ret;
103
104 return write_padded(fd, str, olen, len);
105 }
106
do_read_string(int fd,struct perf_header * ph)107 static char *do_read_string(int fd, struct perf_header *ph)
108 {
109 ssize_t sz, ret;
110 u32 len;
111 char *buf;
112
113 sz = readn(fd, &len, sizeof(len));
114 if (sz < (ssize_t)sizeof(len))
115 return NULL;
116
117 if (ph->needs_swap)
118 len = bswap_32(len);
119
120 buf = malloc(len);
121 if (!buf)
122 return NULL;
123
124 ret = readn(fd, buf, len);
125 if (ret == (ssize_t)len) {
126 /*
127 * strings are padded by zeroes
128 * thus the actual strlen of buf
129 * may be less than len
130 */
131 return buf;
132 }
133
134 free(buf);
135 return NULL;
136 }
137
138 int
perf_header__set_cmdline(int argc,const char ** argv)139 perf_header__set_cmdline(int argc, const char **argv)
140 {
141 int i;
142
143 /*
144 * If header_argv has already been set, do not override it.
145 * This allows a command to set the cmdline, parse args and
146 * then call another builtin function that implements a
147 * command -- e.g, cmd_kvm calling cmd_record.
148 */
149 if (header_argv)
150 return 0;
151
152 header_argc = (u32)argc;
153
154 /* do not include NULL termination */
155 header_argv = calloc(argc, sizeof(char *));
156 if (!header_argv)
157 return -ENOMEM;
158
159 /*
160 * must copy argv contents because it gets moved
161 * around during option parsing
162 */
163 for (i = 0; i < argc ; i++)
164 header_argv[i] = argv[i];
165
166 return 0;
167 }
168
write_tracing_data(int fd,struct perf_header * h __maybe_unused,struct perf_evlist * evlist)169 static int write_tracing_data(int fd, struct perf_header *h __maybe_unused,
170 struct perf_evlist *evlist)
171 {
172 return read_tracing_data(fd, &evlist->entries);
173 }
174
175
write_build_id(int fd,struct perf_header * h,struct perf_evlist * evlist __maybe_unused)176 static int write_build_id(int fd, struct perf_header *h,
177 struct perf_evlist *evlist __maybe_unused)
178 {
179 struct perf_session *session;
180 int err;
181
182 session = container_of(h, struct perf_session, header);
183
184 if (!perf_session__read_build_ids(session, true))
185 return -1;
186
187 err = perf_session__write_buildid_table(session, fd);
188 if (err < 0) {
189 pr_debug("failed to write buildid table\n");
190 return err;
191 }
192 perf_session__cache_build_ids(session);
193
194 return 0;
195 }
196
write_hostname(int fd,struct perf_header * h __maybe_unused,struct perf_evlist * evlist __maybe_unused)197 static int write_hostname(int fd, struct perf_header *h __maybe_unused,
198 struct perf_evlist *evlist __maybe_unused)
199 {
200 struct utsname uts;
201 int ret;
202
203 ret = uname(&uts);
204 if (ret < 0)
205 return -1;
206
207 return do_write_string(fd, uts.nodename);
208 }
209
write_osrelease(int fd,struct perf_header * h __maybe_unused,struct perf_evlist * evlist __maybe_unused)210 static int write_osrelease(int fd, struct perf_header *h __maybe_unused,
211 struct perf_evlist *evlist __maybe_unused)
212 {
213 struct utsname uts;
214 int ret;
215
216 ret = uname(&uts);
217 if (ret < 0)
218 return -1;
219
220 return do_write_string(fd, uts.release);
221 }
222
write_arch(int fd,struct perf_header * h __maybe_unused,struct perf_evlist * evlist __maybe_unused)223 static int write_arch(int fd, struct perf_header *h __maybe_unused,
224 struct perf_evlist *evlist __maybe_unused)
225 {
226 struct utsname uts;
227 int ret;
228
229 ret = uname(&uts);
230 if (ret < 0)
231 return -1;
232
233 return do_write_string(fd, uts.machine);
234 }
235
write_version(int fd,struct perf_header * h __maybe_unused,struct perf_evlist * evlist __maybe_unused)236 static int write_version(int fd, struct perf_header *h __maybe_unused,
237 struct perf_evlist *evlist __maybe_unused)
238 {
239 return do_write_string(fd, perf_version_string);
240 }
241
__write_cpudesc(int fd,const char * cpuinfo_proc)242 static int __write_cpudesc(int fd, const char *cpuinfo_proc)
243 {
244 FILE *file;
245 char *buf = NULL;
246 char *s, *p;
247 const char *search = cpuinfo_proc;
248 size_t len = 0;
249 int ret = -1;
250
251 if (!search)
252 return -1;
253
254 file = fopen("/proc/cpuinfo", "r");
255 if (!file)
256 return -1;
257
258 while (getline(&buf, &len, file) > 0) {
259 ret = strncmp(buf, search, strlen(search));
260 if (!ret)
261 break;
262 }
263
264 if (ret) {
265 ret = -1;
266 goto done;
267 }
268
269 s = buf;
270
271 p = strchr(buf, ':');
272 if (p && *(p+1) == ' ' && *(p+2))
273 s = p + 2;
274 p = strchr(s, '\n');
275 if (p)
276 *p = '\0';
277
278 /* squash extra space characters (branding string) */
279 p = s;
280 while (*p) {
281 if (isspace(*p)) {
282 char *r = p + 1;
283 char *q = r;
284 *p = ' ';
285 while (*q && isspace(*q))
286 q++;
287 if (q != (p+1))
288 while ((*r++ = *q++));
289 }
290 p++;
291 }
292 ret = do_write_string(fd, s);
293 done:
294 free(buf);
295 fclose(file);
296 return ret;
297 }
298
write_cpudesc(int fd,struct perf_header * h __maybe_unused,struct perf_evlist * evlist __maybe_unused)299 static int write_cpudesc(int fd, struct perf_header *h __maybe_unused,
300 struct perf_evlist *evlist __maybe_unused)
301 {
302 #ifndef CPUINFO_PROC
303 #define CPUINFO_PROC {"model name", }
304 #endif
305 const char *cpuinfo_procs[] = CPUINFO_PROC;
306 unsigned int i;
307
308 for (i = 0; i < ARRAY_SIZE(cpuinfo_procs); i++) {
309 int ret;
310 ret = __write_cpudesc(fd, cpuinfo_procs[i]);
311 if (ret >= 0)
312 return ret;
313 }
314 return -1;
315 }
316
317
write_nrcpus(int fd,struct perf_header * h __maybe_unused,struct perf_evlist * evlist __maybe_unused)318 static int write_nrcpus(int fd, struct perf_header *h __maybe_unused,
319 struct perf_evlist *evlist __maybe_unused)
320 {
321 long nr;
322 u32 nrc, nra;
323 int ret;
324
325 nr = sysconf(_SC_NPROCESSORS_CONF);
326 if (nr < 0)
327 return -1;
328
329 nrc = (u32)(nr & UINT_MAX);
330
331 nr = sysconf(_SC_NPROCESSORS_ONLN);
332 if (nr < 0)
333 return -1;
334
335 nra = (u32)(nr & UINT_MAX);
336
337 ret = do_write(fd, &nrc, sizeof(nrc));
338 if (ret < 0)
339 return ret;
340
341 return do_write(fd, &nra, sizeof(nra));
342 }
343
write_event_desc(int fd,struct perf_header * h __maybe_unused,struct perf_evlist * evlist)344 static int write_event_desc(int fd, struct perf_header *h __maybe_unused,
345 struct perf_evlist *evlist)
346 {
347 struct perf_evsel *evsel;
348 u32 nre, nri, sz;
349 int ret;
350
351 nre = evlist->nr_entries;
352
353 /*
354 * write number of events
355 */
356 ret = do_write(fd, &nre, sizeof(nre));
357 if (ret < 0)
358 return ret;
359
360 /*
361 * size of perf_event_attr struct
362 */
363 sz = (u32)sizeof(evsel->attr);
364 ret = do_write(fd, &sz, sizeof(sz));
365 if (ret < 0)
366 return ret;
367
368 evlist__for_each(evlist, evsel) {
369 ret = do_write(fd, &evsel->attr, sz);
370 if (ret < 0)
371 return ret;
372 /*
373 * write number of unique id per event
374 * there is one id per instance of an event
375 *
376 * copy into an nri to be independent of the
377 * type of ids,
378 */
379 nri = evsel->ids;
380 ret = do_write(fd, &nri, sizeof(nri));
381 if (ret < 0)
382 return ret;
383
384 /*
385 * write event string as passed on cmdline
386 */
387 ret = do_write_string(fd, perf_evsel__name(evsel));
388 if (ret < 0)
389 return ret;
390 /*
391 * write unique ids for this event
392 */
393 ret = do_write(fd, evsel->id, evsel->ids * sizeof(u64));
394 if (ret < 0)
395 return ret;
396 }
397 return 0;
398 }
399
write_cmdline(int fd,struct perf_header * h __maybe_unused,struct perf_evlist * evlist __maybe_unused)400 static int write_cmdline(int fd, struct perf_header *h __maybe_unused,
401 struct perf_evlist *evlist __maybe_unused)
402 {
403 char buf[MAXPATHLEN];
404 char proc[32];
405 u32 i, n;
406 int ret;
407
408 /*
409 * actual atual path to perf binary
410 */
411 sprintf(proc, "/proc/%d/exe", getpid());
412 ret = readlink(proc, buf, sizeof(buf));
413 if (ret <= 0)
414 return -1;
415
416 /* readlink() does not add null termination */
417 buf[ret] = '\0';
418
419 /* account for binary path */
420 n = header_argc + 1;
421
422 ret = do_write(fd, &n, sizeof(n));
423 if (ret < 0)
424 return ret;
425
426 ret = do_write_string(fd, buf);
427 if (ret < 0)
428 return ret;
429
430 for (i = 0 ; i < header_argc; i++) {
431 ret = do_write_string(fd, header_argv[i]);
432 if (ret < 0)
433 return ret;
434 }
435 return 0;
436 }
437
438 #define CORE_SIB_FMT \
439 "/sys/devices/system/cpu/cpu%d/topology/core_siblings_list"
440 #define THRD_SIB_FMT \
441 "/sys/devices/system/cpu/cpu%d/topology/thread_siblings_list"
442
443 struct cpu_topo {
444 u32 core_sib;
445 u32 thread_sib;
446 char **core_siblings;
447 char **thread_siblings;
448 };
449
build_cpu_topo(struct cpu_topo * tp,int cpu)450 static int build_cpu_topo(struct cpu_topo *tp, int cpu)
451 {
452 FILE *fp;
453 char filename[MAXPATHLEN];
454 char *buf = NULL, *p;
455 size_t len = 0;
456 ssize_t sret;
457 u32 i = 0;
458 int ret = -1;
459
460 sprintf(filename, CORE_SIB_FMT, cpu);
461 fp = fopen(filename, "r");
462 if (!fp)
463 goto try_threads;
464
465 sret = getline(&buf, &len, fp);
466 fclose(fp);
467 if (sret <= 0)
468 goto try_threads;
469
470 p = strchr(buf, '\n');
471 if (p)
472 *p = '\0';
473
474 for (i = 0; i < tp->core_sib; i++) {
475 if (!strcmp(buf, tp->core_siblings[i]))
476 break;
477 }
478 if (i == tp->core_sib) {
479 tp->core_siblings[i] = buf;
480 tp->core_sib++;
481 buf = NULL;
482 len = 0;
483 }
484 ret = 0;
485
486 try_threads:
487 sprintf(filename, THRD_SIB_FMT, cpu);
488 fp = fopen(filename, "r");
489 if (!fp)
490 goto done;
491
492 if (getline(&buf, &len, fp) <= 0)
493 goto done;
494
495 p = strchr(buf, '\n');
496 if (p)
497 *p = '\0';
498
499 for (i = 0; i < tp->thread_sib; i++) {
500 if (!strcmp(buf, tp->thread_siblings[i]))
501 break;
502 }
503 if (i == tp->thread_sib) {
504 tp->thread_siblings[i] = buf;
505 tp->thread_sib++;
506 buf = NULL;
507 }
508 ret = 0;
509 done:
510 if(fp)
511 fclose(fp);
512 free(buf);
513 return ret;
514 }
515
free_cpu_topo(struct cpu_topo * tp)516 static void free_cpu_topo(struct cpu_topo *tp)
517 {
518 u32 i;
519
520 if (!tp)
521 return;
522
523 for (i = 0 ; i < tp->core_sib; i++)
524 zfree(&tp->core_siblings[i]);
525
526 for (i = 0 ; i < tp->thread_sib; i++)
527 zfree(&tp->thread_siblings[i]);
528
529 free(tp);
530 }
531
build_cpu_topology(void)532 static struct cpu_topo *build_cpu_topology(void)
533 {
534 struct cpu_topo *tp;
535 void *addr;
536 u32 nr, i;
537 size_t sz;
538 long ncpus;
539 int ret = -1;
540
541 ncpus = sysconf(_SC_NPROCESSORS_CONF);
542 if (ncpus < 0)
543 return NULL;
544
545 nr = (u32)(ncpus & UINT_MAX);
546
547 sz = nr * sizeof(char *);
548
549 addr = calloc(1, sizeof(*tp) + 2 * sz);
550 if (!addr)
551 return NULL;
552
553 tp = addr;
554
555 addr += sizeof(*tp);
556 tp->core_siblings = addr;
557 addr += sz;
558 tp->thread_siblings = addr;
559
560 for (i = 0; i < nr; i++) {
561 ret = build_cpu_topo(tp, i);
562 if (ret < 0)
563 break;
564 }
565 if (ret) {
566 free_cpu_topo(tp);
567 tp = NULL;
568 }
569 return tp;
570 }
571
write_cpu_topology(int fd,struct perf_header * h __maybe_unused,struct perf_evlist * evlist __maybe_unused)572 static int write_cpu_topology(int fd, struct perf_header *h __maybe_unused,
573 struct perf_evlist *evlist __maybe_unused)
574 {
575 struct cpu_topo *tp;
576 u32 i;
577 int ret;
578
579 tp = build_cpu_topology();
580 if (!tp)
581 return -1;
582
583 ret = do_write(fd, &tp->core_sib, sizeof(tp->core_sib));
584 if (ret < 0)
585 goto done;
586
587 for (i = 0; i < tp->core_sib; i++) {
588 ret = do_write_string(fd, tp->core_siblings[i]);
589 if (ret < 0)
590 goto done;
591 }
592 ret = do_write(fd, &tp->thread_sib, sizeof(tp->thread_sib));
593 if (ret < 0)
594 goto done;
595
596 for (i = 0; i < tp->thread_sib; i++) {
597 ret = do_write_string(fd, tp->thread_siblings[i]);
598 if (ret < 0)
599 break;
600 }
601 done:
602 free_cpu_topo(tp);
603 return ret;
604 }
605
606
607
write_total_mem(int fd,struct perf_header * h __maybe_unused,struct perf_evlist * evlist __maybe_unused)608 static int write_total_mem(int fd, struct perf_header *h __maybe_unused,
609 struct perf_evlist *evlist __maybe_unused)
610 {
611 char *buf = NULL;
612 FILE *fp;
613 size_t len = 0;
614 int ret = -1, n;
615 uint64_t mem;
616
617 fp = fopen("/proc/meminfo", "r");
618 if (!fp)
619 return -1;
620
621 while (getline(&buf, &len, fp) > 0) {
622 ret = strncmp(buf, "MemTotal:", 9);
623 if (!ret)
624 break;
625 }
626 if (!ret) {
627 n = sscanf(buf, "%*s %"PRIu64, &mem);
628 if (n == 1)
629 ret = do_write(fd, &mem, sizeof(mem));
630 } else
631 ret = -1;
632 free(buf);
633 fclose(fp);
634 return ret;
635 }
636
write_topo_node(int fd,int node)637 static int write_topo_node(int fd, int node)
638 {
639 char str[MAXPATHLEN];
640 char field[32];
641 char *buf = NULL, *p;
642 size_t len = 0;
643 FILE *fp;
644 u64 mem_total, mem_free, mem;
645 int ret = -1;
646
647 sprintf(str, "/sys/devices/system/node/node%d/meminfo", node);
648 fp = fopen(str, "r");
649 if (!fp)
650 return -1;
651
652 while (getline(&buf, &len, fp) > 0) {
653 /* skip over invalid lines */
654 if (!strchr(buf, ':'))
655 continue;
656 if (sscanf(buf, "%*s %*d %31s %"PRIu64, field, &mem) != 2)
657 goto done;
658 if (!strcmp(field, "MemTotal:"))
659 mem_total = mem;
660 if (!strcmp(field, "MemFree:"))
661 mem_free = mem;
662 }
663
664 fclose(fp);
665 fp = NULL;
666
667 ret = do_write(fd, &mem_total, sizeof(u64));
668 if (ret)
669 goto done;
670
671 ret = do_write(fd, &mem_free, sizeof(u64));
672 if (ret)
673 goto done;
674
675 ret = -1;
676 sprintf(str, "/sys/devices/system/node/node%d/cpulist", node);
677
678 fp = fopen(str, "r");
679 if (!fp)
680 goto done;
681
682 if (getline(&buf, &len, fp) <= 0)
683 goto done;
684
685 p = strchr(buf, '\n');
686 if (p)
687 *p = '\0';
688
689 ret = do_write_string(fd, buf);
690 done:
691 free(buf);
692 if (fp)
693 fclose(fp);
694 return ret;
695 }
696
write_numa_topology(int fd,struct perf_header * h __maybe_unused,struct perf_evlist * evlist __maybe_unused)697 static int write_numa_topology(int fd, struct perf_header *h __maybe_unused,
698 struct perf_evlist *evlist __maybe_unused)
699 {
700 char *buf = NULL;
701 size_t len = 0;
702 FILE *fp;
703 struct cpu_map *node_map = NULL;
704 char *c;
705 u32 nr, i, j;
706 int ret = -1;
707
708 fp = fopen("/sys/devices/system/node/online", "r");
709 if (!fp)
710 return -1;
711
712 if (getline(&buf, &len, fp) <= 0)
713 goto done;
714
715 c = strchr(buf, '\n');
716 if (c)
717 *c = '\0';
718
719 node_map = cpu_map__new(buf);
720 if (!node_map)
721 goto done;
722
723 nr = (u32)node_map->nr;
724
725 ret = do_write(fd, &nr, sizeof(nr));
726 if (ret < 0)
727 goto done;
728
729 for (i = 0; i < nr; i++) {
730 j = (u32)node_map->map[i];
731 ret = do_write(fd, &j, sizeof(j));
732 if (ret < 0)
733 break;
734
735 ret = write_topo_node(fd, i);
736 if (ret < 0)
737 break;
738 }
739 done:
740 free(buf);
741 fclose(fp);
742 free(node_map);
743 return ret;
744 }
745
746 /*
747 * File format:
748 *
749 * struct pmu_mappings {
750 * u32 pmu_num;
751 * struct pmu_map {
752 * u32 type;
753 * char name[];
754 * }[pmu_num];
755 * };
756 */
757
write_pmu_mappings(int fd,struct perf_header * h __maybe_unused,struct perf_evlist * evlist __maybe_unused)758 static int write_pmu_mappings(int fd, struct perf_header *h __maybe_unused,
759 struct perf_evlist *evlist __maybe_unused)
760 {
761 struct perf_pmu *pmu = NULL;
762 off_t offset = lseek(fd, 0, SEEK_CUR);
763 __u32 pmu_num = 0;
764 int ret;
765
766 /* write real pmu_num later */
767 ret = do_write(fd, &pmu_num, sizeof(pmu_num));
768 if (ret < 0)
769 return ret;
770
771 while ((pmu = perf_pmu__scan(pmu))) {
772 if (!pmu->name)
773 continue;
774 pmu_num++;
775
776 ret = do_write(fd, &pmu->type, sizeof(pmu->type));
777 if (ret < 0)
778 return ret;
779
780 ret = do_write_string(fd, pmu->name);
781 if (ret < 0)
782 return ret;
783 }
784
785 if (pwrite(fd, &pmu_num, sizeof(pmu_num), offset) != sizeof(pmu_num)) {
786 /* discard all */
787 lseek(fd, offset, SEEK_SET);
788 return -1;
789 }
790
791 return 0;
792 }
793
794 /*
795 * File format:
796 *
797 * struct group_descs {
798 * u32 nr_groups;
799 * struct group_desc {
800 * char name[];
801 * u32 leader_idx;
802 * u32 nr_members;
803 * }[nr_groups];
804 * };
805 */
write_group_desc(int fd,struct perf_header * h __maybe_unused,struct perf_evlist * evlist)806 static int write_group_desc(int fd, struct perf_header *h __maybe_unused,
807 struct perf_evlist *evlist)
808 {
809 u32 nr_groups = evlist->nr_groups;
810 struct perf_evsel *evsel;
811 int ret;
812
813 ret = do_write(fd, &nr_groups, sizeof(nr_groups));
814 if (ret < 0)
815 return ret;
816
817 evlist__for_each(evlist, evsel) {
818 if (perf_evsel__is_group_leader(evsel) &&
819 evsel->nr_members > 1) {
820 const char *name = evsel->group_name ?: "{anon_group}";
821 u32 leader_idx = evsel->idx;
822 u32 nr_members = evsel->nr_members;
823
824 ret = do_write_string(fd, name);
825 if (ret < 0)
826 return ret;
827
828 ret = do_write(fd, &leader_idx, sizeof(leader_idx));
829 if (ret < 0)
830 return ret;
831
832 ret = do_write(fd, &nr_members, sizeof(nr_members));
833 if (ret < 0)
834 return ret;
835 }
836 }
837 return 0;
838 }
839
840 /*
841 * default get_cpuid(): nothing gets recorded
842 * actual implementation must be in arch/$(ARCH)/util/header.c
843 */
get_cpuid(char * buffer __maybe_unused,size_t sz __maybe_unused)844 int __attribute__ ((weak)) get_cpuid(char *buffer __maybe_unused,
845 size_t sz __maybe_unused)
846 {
847 return -1;
848 }
849
write_cpuid(int fd,struct perf_header * h __maybe_unused,struct perf_evlist * evlist __maybe_unused)850 static int write_cpuid(int fd, struct perf_header *h __maybe_unused,
851 struct perf_evlist *evlist __maybe_unused)
852 {
853 char buffer[64];
854 int ret;
855
856 ret = get_cpuid(buffer, sizeof(buffer));
857 if (!ret)
858 goto write_it;
859
860 return -1;
861 write_it:
862 return do_write_string(fd, buffer);
863 }
864
write_branch_stack(int fd __maybe_unused,struct perf_header * h __maybe_unused,struct perf_evlist * evlist __maybe_unused)865 static int write_branch_stack(int fd __maybe_unused,
866 struct perf_header *h __maybe_unused,
867 struct perf_evlist *evlist __maybe_unused)
868 {
869 return 0;
870 }
871
print_hostname(struct perf_header * ph,int fd __maybe_unused,FILE * fp)872 static void print_hostname(struct perf_header *ph, int fd __maybe_unused,
873 FILE *fp)
874 {
875 fprintf(fp, "# hostname : %s\n", ph->env.hostname);
876 }
877
print_osrelease(struct perf_header * ph,int fd __maybe_unused,FILE * fp)878 static void print_osrelease(struct perf_header *ph, int fd __maybe_unused,
879 FILE *fp)
880 {
881 fprintf(fp, "# os release : %s\n", ph->env.os_release);
882 }
883
print_arch(struct perf_header * ph,int fd __maybe_unused,FILE * fp)884 static void print_arch(struct perf_header *ph, int fd __maybe_unused, FILE *fp)
885 {
886 fprintf(fp, "# arch : %s\n", ph->env.arch);
887 }
888
print_cpudesc(struct perf_header * ph,int fd __maybe_unused,FILE * fp)889 static void print_cpudesc(struct perf_header *ph, int fd __maybe_unused,
890 FILE *fp)
891 {
892 fprintf(fp, "# cpudesc : %s\n", ph->env.cpu_desc);
893 }
894
print_nrcpus(struct perf_header * ph,int fd __maybe_unused,FILE * fp)895 static void print_nrcpus(struct perf_header *ph, int fd __maybe_unused,
896 FILE *fp)
897 {
898 fprintf(fp, "# nrcpus online : %u\n", ph->env.nr_cpus_online);
899 fprintf(fp, "# nrcpus avail : %u\n", ph->env.nr_cpus_avail);
900 }
901
print_version(struct perf_header * ph,int fd __maybe_unused,FILE * fp)902 static void print_version(struct perf_header *ph, int fd __maybe_unused,
903 FILE *fp)
904 {
905 fprintf(fp, "# perf version : %s\n", ph->env.version);
906 }
907
print_cmdline(struct perf_header * ph,int fd __maybe_unused,FILE * fp)908 static void print_cmdline(struct perf_header *ph, int fd __maybe_unused,
909 FILE *fp)
910 {
911 int nr, i;
912 char *str;
913
914 nr = ph->env.nr_cmdline;
915 str = ph->env.cmdline;
916
917 fprintf(fp, "# cmdline : ");
918
919 for (i = 0; i < nr; i++) {
920 fprintf(fp, "%s ", str);
921 str += strlen(str) + 1;
922 }
923 fputc('\n', fp);
924 }
925
print_cpu_topology(struct perf_header * ph,int fd __maybe_unused,FILE * fp)926 static void print_cpu_topology(struct perf_header *ph, int fd __maybe_unused,
927 FILE *fp)
928 {
929 int nr, i;
930 char *str;
931
932 nr = ph->env.nr_sibling_cores;
933 str = ph->env.sibling_cores;
934
935 for (i = 0; i < nr; i++) {
936 fprintf(fp, "# sibling cores : %s\n", str);
937 str += strlen(str) + 1;
938 }
939
940 nr = ph->env.nr_sibling_threads;
941 str = ph->env.sibling_threads;
942
943 for (i = 0; i < nr; i++) {
944 fprintf(fp, "# sibling threads : %s\n", str);
945 str += strlen(str) + 1;
946 }
947 }
948
free_event_desc(struct perf_evsel * events)949 static void free_event_desc(struct perf_evsel *events)
950 {
951 struct perf_evsel *evsel;
952
953 if (!events)
954 return;
955
956 for (evsel = events; evsel->attr.size; evsel++) {
957 zfree(&evsel->name);
958 zfree(&evsel->id);
959 }
960
961 free(events);
962 }
963
964 static struct perf_evsel *
read_event_desc(struct perf_header * ph,int fd)965 read_event_desc(struct perf_header *ph, int fd)
966 {
967 struct perf_evsel *evsel, *events = NULL;
968 u64 *id;
969 void *buf = NULL;
970 u32 nre, sz, nr, i, j;
971 ssize_t ret;
972 size_t msz;
973
974 /* number of events */
975 ret = readn(fd, &nre, sizeof(nre));
976 if (ret != (ssize_t)sizeof(nre))
977 goto error;
978
979 if (ph->needs_swap)
980 nre = bswap_32(nre);
981
982 ret = readn(fd, &sz, sizeof(sz));
983 if (ret != (ssize_t)sizeof(sz))
984 goto error;
985
986 if (ph->needs_swap)
987 sz = bswap_32(sz);
988
989 /* buffer to hold on file attr struct */
990 buf = malloc(sz);
991 if (!buf)
992 goto error;
993
994 /* the last event terminates with evsel->attr.size == 0: */
995 events = calloc(nre + 1, sizeof(*events));
996 if (!events)
997 goto error;
998
999 msz = sizeof(evsel->attr);
1000 if (sz < msz)
1001 msz = sz;
1002
1003 for (i = 0, evsel = events; i < nre; evsel++, i++) {
1004 evsel->idx = i;
1005
1006 /*
1007 * must read entire on-file attr struct to
1008 * sync up with layout.
1009 */
1010 ret = readn(fd, buf, sz);
1011 if (ret != (ssize_t)sz)
1012 goto error;
1013
1014 if (ph->needs_swap)
1015 perf_event__attr_swap(buf);
1016
1017 memcpy(&evsel->attr, buf, msz);
1018
1019 ret = readn(fd, &nr, sizeof(nr));
1020 if (ret != (ssize_t)sizeof(nr))
1021 goto error;
1022
1023 if (ph->needs_swap) {
1024 nr = bswap_32(nr);
1025 evsel->needs_swap = true;
1026 }
1027
1028 evsel->name = do_read_string(fd, ph);
1029
1030 if (!nr)
1031 continue;
1032
1033 id = calloc(nr, sizeof(*id));
1034 if (!id)
1035 goto error;
1036 evsel->ids = nr;
1037 evsel->id = id;
1038
1039 for (j = 0 ; j < nr; j++) {
1040 ret = readn(fd, id, sizeof(*id));
1041 if (ret != (ssize_t)sizeof(*id))
1042 goto error;
1043 if (ph->needs_swap)
1044 *id = bswap_64(*id);
1045 id++;
1046 }
1047 }
1048 out:
1049 free(buf);
1050 return events;
1051 error:
1052 if (events)
1053 free_event_desc(events);
1054 events = NULL;
1055 goto out;
1056 }
1057
__desc_attr__fprintf(FILE * fp,const char * name,const char * val,void * priv)1058 static int __desc_attr__fprintf(FILE *fp, const char *name, const char *val,
1059 void *priv __attribute__((unused)))
1060 {
1061 return fprintf(fp, ", %s = %s", name, val);
1062 }
1063
print_event_desc(struct perf_header * ph,int fd,FILE * fp)1064 static void print_event_desc(struct perf_header *ph, int fd, FILE *fp)
1065 {
1066 struct perf_evsel *evsel, *events = read_event_desc(ph, fd);
1067 u32 j;
1068 u64 *id;
1069
1070 if (!events) {
1071 fprintf(fp, "# event desc: not available or unable to read\n");
1072 return;
1073 }
1074
1075 for (evsel = events; evsel->attr.size; evsel++) {
1076 fprintf(fp, "# event : name = %s, ", evsel->name);
1077
1078 if (evsel->ids) {
1079 fprintf(fp, ", id = {");
1080 for (j = 0, id = evsel->id; j < evsel->ids; j++, id++) {
1081 if (j)
1082 fputc(',', fp);
1083 fprintf(fp, " %"PRIu64, *id);
1084 }
1085 fprintf(fp, " }");
1086 }
1087
1088 perf_event_attr__fprintf(fp, &evsel->attr, __desc_attr__fprintf, NULL);
1089
1090 fputc('\n', fp);
1091 }
1092
1093 free_event_desc(events);
1094 }
1095
print_total_mem(struct perf_header * ph,int fd __maybe_unused,FILE * fp)1096 static void print_total_mem(struct perf_header *ph, int fd __maybe_unused,
1097 FILE *fp)
1098 {
1099 fprintf(fp, "# total memory : %Lu kB\n", ph->env.total_mem);
1100 }
1101
print_numa_topology(struct perf_header * ph,int fd __maybe_unused,FILE * fp)1102 static void print_numa_topology(struct perf_header *ph, int fd __maybe_unused,
1103 FILE *fp)
1104 {
1105 u32 nr, c, i;
1106 char *str, *tmp;
1107 uint64_t mem_total, mem_free;
1108
1109 /* nr nodes */
1110 nr = ph->env.nr_numa_nodes;
1111 str = ph->env.numa_nodes;
1112
1113 for (i = 0; i < nr; i++) {
1114 /* node number */
1115 c = strtoul(str, &tmp, 0);
1116 if (*tmp != ':')
1117 goto error;
1118
1119 str = tmp + 1;
1120 mem_total = strtoull(str, &tmp, 0);
1121 if (*tmp != ':')
1122 goto error;
1123
1124 str = tmp + 1;
1125 mem_free = strtoull(str, &tmp, 0);
1126 if (*tmp != ':')
1127 goto error;
1128
1129 fprintf(fp, "# node%u meminfo : total = %"PRIu64" kB,"
1130 " free = %"PRIu64" kB\n",
1131 c, mem_total, mem_free);
1132
1133 str = tmp + 1;
1134 fprintf(fp, "# node%u cpu list : %s\n", c, str);
1135
1136 str += strlen(str) + 1;
1137 }
1138 return;
1139 error:
1140 fprintf(fp, "# numa topology : not available\n");
1141 }
1142
print_cpuid(struct perf_header * ph,int fd __maybe_unused,FILE * fp)1143 static void print_cpuid(struct perf_header *ph, int fd __maybe_unused, FILE *fp)
1144 {
1145 fprintf(fp, "# cpuid : %s\n", ph->env.cpuid);
1146 }
1147
print_branch_stack(struct perf_header * ph __maybe_unused,int fd __maybe_unused,FILE * fp)1148 static void print_branch_stack(struct perf_header *ph __maybe_unused,
1149 int fd __maybe_unused, FILE *fp)
1150 {
1151 fprintf(fp, "# contains samples with branch stack\n");
1152 }
1153
print_pmu_mappings(struct perf_header * ph,int fd __maybe_unused,FILE * fp)1154 static void print_pmu_mappings(struct perf_header *ph, int fd __maybe_unused,
1155 FILE *fp)
1156 {
1157 const char *delimiter = "# pmu mappings: ";
1158 char *str, *tmp;
1159 u32 pmu_num;
1160 u32 type;
1161
1162 pmu_num = ph->env.nr_pmu_mappings;
1163 if (!pmu_num) {
1164 fprintf(fp, "# pmu mappings: not available\n");
1165 return;
1166 }
1167
1168 str = ph->env.pmu_mappings;
1169
1170 while (pmu_num) {
1171 type = strtoul(str, &tmp, 0);
1172 if (*tmp != ':')
1173 goto error;
1174
1175 str = tmp + 1;
1176 fprintf(fp, "%s%s = %" PRIu32, delimiter, str, type);
1177
1178 delimiter = ", ";
1179 str += strlen(str) + 1;
1180 pmu_num--;
1181 }
1182
1183 fprintf(fp, "\n");
1184
1185 if (!pmu_num)
1186 return;
1187 error:
1188 fprintf(fp, "# pmu mappings: unable to read\n");
1189 }
1190
print_group_desc(struct perf_header * ph,int fd __maybe_unused,FILE * fp)1191 static void print_group_desc(struct perf_header *ph, int fd __maybe_unused,
1192 FILE *fp)
1193 {
1194 struct perf_session *session;
1195 struct perf_evsel *evsel;
1196 u32 nr = 0;
1197
1198 session = container_of(ph, struct perf_session, header);
1199
1200 evlist__for_each(session->evlist, evsel) {
1201 if (perf_evsel__is_group_leader(evsel) &&
1202 evsel->nr_members > 1) {
1203 fprintf(fp, "# group: %s{%s", evsel->group_name ?: "",
1204 perf_evsel__name(evsel));
1205
1206 nr = evsel->nr_members - 1;
1207 } else if (nr) {
1208 fprintf(fp, ",%s", perf_evsel__name(evsel));
1209
1210 if (--nr == 0)
1211 fprintf(fp, "}\n");
1212 }
1213 }
1214 }
1215
__event_process_build_id(struct build_id_event * bev,char * filename,struct perf_session * session)1216 static int __event_process_build_id(struct build_id_event *bev,
1217 char *filename,
1218 struct perf_session *session)
1219 {
1220 int err = -1;
1221 struct dsos *dsos;
1222 struct machine *machine;
1223 u16 misc;
1224 struct dso *dso;
1225 enum dso_kernel_type dso_type;
1226
1227 machine = perf_session__findnew_machine(session, bev->pid);
1228 if (!machine)
1229 goto out;
1230
1231 misc = bev->header.misc & PERF_RECORD_MISC_CPUMODE_MASK;
1232
1233 switch (misc) {
1234 case PERF_RECORD_MISC_KERNEL:
1235 dso_type = DSO_TYPE_KERNEL;
1236 dsos = &machine->kernel_dsos;
1237 break;
1238 case PERF_RECORD_MISC_GUEST_KERNEL:
1239 dso_type = DSO_TYPE_GUEST_KERNEL;
1240 dsos = &machine->kernel_dsos;
1241 break;
1242 case PERF_RECORD_MISC_USER:
1243 case PERF_RECORD_MISC_GUEST_USER:
1244 dso_type = DSO_TYPE_USER;
1245 dsos = &machine->user_dsos;
1246 break;
1247 default:
1248 goto out;
1249 }
1250
1251 dso = __dsos__findnew(dsos, filename);
1252 if (dso != NULL) {
1253 char sbuild_id[BUILD_ID_SIZE * 2 + 1];
1254
1255 dso__set_build_id(dso, &bev->build_id);
1256
1257 if (!is_kernel_module(filename))
1258 dso->kernel = dso_type;
1259
1260 build_id__sprintf(dso->build_id, sizeof(dso->build_id),
1261 sbuild_id);
1262 pr_debug("build id event received for %s: %s\n",
1263 dso->long_name, sbuild_id);
1264 }
1265
1266 err = 0;
1267 out:
1268 return err;
1269 }
1270
perf_header__read_build_ids_abi_quirk(struct perf_header * header,int input,u64 offset,u64 size)1271 static int perf_header__read_build_ids_abi_quirk(struct perf_header *header,
1272 int input, u64 offset, u64 size)
1273 {
1274 struct perf_session *session = container_of(header, struct perf_session, header);
1275 struct {
1276 struct perf_event_header header;
1277 u8 build_id[PERF_ALIGN(BUILD_ID_SIZE, sizeof(u64))];
1278 char filename[0];
1279 } old_bev;
1280 struct build_id_event bev;
1281 char filename[PATH_MAX];
1282 u64 limit = offset + size;
1283
1284 while (offset < limit) {
1285 ssize_t len;
1286
1287 if (readn(input, &old_bev, sizeof(old_bev)) != sizeof(old_bev))
1288 return -1;
1289
1290 if (header->needs_swap)
1291 perf_event_header__bswap(&old_bev.header);
1292
1293 len = old_bev.header.size - sizeof(old_bev);
1294 if (readn(input, filename, len) != len)
1295 return -1;
1296
1297 bev.header = old_bev.header;
1298
1299 /*
1300 * As the pid is the missing value, we need to fill
1301 * it properly. The header.misc value give us nice hint.
1302 */
1303 bev.pid = HOST_KERNEL_ID;
1304 if (bev.header.misc == PERF_RECORD_MISC_GUEST_USER ||
1305 bev.header.misc == PERF_RECORD_MISC_GUEST_KERNEL)
1306 bev.pid = DEFAULT_GUEST_KERNEL_ID;
1307
1308 memcpy(bev.build_id, old_bev.build_id, sizeof(bev.build_id));
1309 __event_process_build_id(&bev, filename, session);
1310
1311 offset += bev.header.size;
1312 }
1313
1314 return 0;
1315 }
1316
perf_header__read_build_ids(struct perf_header * header,int input,u64 offset,u64 size)1317 static int perf_header__read_build_ids(struct perf_header *header,
1318 int input, u64 offset, u64 size)
1319 {
1320 struct perf_session *session = container_of(header, struct perf_session, header);
1321 struct build_id_event bev;
1322 char filename[PATH_MAX];
1323 u64 limit = offset + size, orig_offset = offset;
1324 int err = -1;
1325
1326 while (offset < limit) {
1327 ssize_t len;
1328
1329 if (readn(input, &bev, sizeof(bev)) != sizeof(bev))
1330 goto out;
1331
1332 if (header->needs_swap)
1333 perf_event_header__bswap(&bev.header);
1334
1335 len = bev.header.size - sizeof(bev);
1336 if (readn(input, filename, len) != len)
1337 goto out;
1338 /*
1339 * The a1645ce1 changeset:
1340 *
1341 * "perf: 'perf kvm' tool for monitoring guest performance from host"
1342 *
1343 * Added a field to struct build_id_event that broke the file
1344 * format.
1345 *
1346 * Since the kernel build-id is the first entry, process the
1347 * table using the old format if the well known
1348 * '[kernel.kallsyms]' string for the kernel build-id has the
1349 * first 4 characters chopped off (where the pid_t sits).
1350 */
1351 if (memcmp(filename, "nel.kallsyms]", 13) == 0) {
1352 if (lseek(input, orig_offset, SEEK_SET) == (off_t)-1)
1353 return -1;
1354 return perf_header__read_build_ids_abi_quirk(header, input, offset, size);
1355 }
1356
1357 __event_process_build_id(&bev, filename, session);
1358
1359 offset += bev.header.size;
1360 }
1361 err = 0;
1362 out:
1363 return err;
1364 }
1365
process_tracing_data(struct perf_file_section * section __maybe_unused,struct perf_header * ph __maybe_unused,int fd,void * data)1366 static int process_tracing_data(struct perf_file_section *section __maybe_unused,
1367 struct perf_header *ph __maybe_unused,
1368 int fd, void *data)
1369 {
1370 ssize_t ret = trace_report(fd, data, false);
1371 return ret < 0 ? -1 : 0;
1372 }
1373
process_build_id(struct perf_file_section * section,struct perf_header * ph,int fd,void * data __maybe_unused)1374 static int process_build_id(struct perf_file_section *section,
1375 struct perf_header *ph, int fd,
1376 void *data __maybe_unused)
1377 {
1378 if (perf_header__read_build_ids(ph, fd, section->offset, section->size))
1379 pr_debug("Failed to read buildids, continuing...\n");
1380 return 0;
1381 }
1382
process_hostname(struct perf_file_section * section __maybe_unused,struct perf_header * ph,int fd,void * data __maybe_unused)1383 static int process_hostname(struct perf_file_section *section __maybe_unused,
1384 struct perf_header *ph, int fd,
1385 void *data __maybe_unused)
1386 {
1387 ph->env.hostname = do_read_string(fd, ph);
1388 return ph->env.hostname ? 0 : -ENOMEM;
1389 }
1390
process_osrelease(struct perf_file_section * section __maybe_unused,struct perf_header * ph,int fd,void * data __maybe_unused)1391 static int process_osrelease(struct perf_file_section *section __maybe_unused,
1392 struct perf_header *ph, int fd,
1393 void *data __maybe_unused)
1394 {
1395 ph->env.os_release = do_read_string(fd, ph);
1396 return ph->env.os_release ? 0 : -ENOMEM;
1397 }
1398
process_version(struct perf_file_section * section __maybe_unused,struct perf_header * ph,int fd,void * data __maybe_unused)1399 static int process_version(struct perf_file_section *section __maybe_unused,
1400 struct perf_header *ph, int fd,
1401 void *data __maybe_unused)
1402 {
1403 ph->env.version = do_read_string(fd, ph);
1404 return ph->env.version ? 0 : -ENOMEM;
1405 }
1406
process_arch(struct perf_file_section * section __maybe_unused,struct perf_header * ph,int fd,void * data __maybe_unused)1407 static int process_arch(struct perf_file_section *section __maybe_unused,
1408 struct perf_header *ph, int fd,
1409 void *data __maybe_unused)
1410 {
1411 ph->env.arch = do_read_string(fd, ph);
1412 return ph->env.arch ? 0 : -ENOMEM;
1413 }
1414
process_nrcpus(struct perf_file_section * section __maybe_unused,struct perf_header * ph,int fd,void * data __maybe_unused)1415 static int process_nrcpus(struct perf_file_section *section __maybe_unused,
1416 struct perf_header *ph, int fd,
1417 void *data __maybe_unused)
1418 {
1419 ssize_t ret;
1420 u32 nr;
1421
1422 ret = readn(fd, &nr, sizeof(nr));
1423 if (ret != sizeof(nr))
1424 return -1;
1425
1426 if (ph->needs_swap)
1427 nr = bswap_32(nr);
1428
1429 ph->env.nr_cpus_avail = nr;
1430
1431 ret = readn(fd, &nr, sizeof(nr));
1432 if (ret != sizeof(nr))
1433 return -1;
1434
1435 if (ph->needs_swap)
1436 nr = bswap_32(nr);
1437
1438 ph->env.nr_cpus_online = nr;
1439 return 0;
1440 }
1441
process_cpudesc(struct perf_file_section * section __maybe_unused,struct perf_header * ph,int fd,void * data __maybe_unused)1442 static int process_cpudesc(struct perf_file_section *section __maybe_unused,
1443 struct perf_header *ph, int fd,
1444 void *data __maybe_unused)
1445 {
1446 ph->env.cpu_desc = do_read_string(fd, ph);
1447 return ph->env.cpu_desc ? 0 : -ENOMEM;
1448 }
1449
process_cpuid(struct perf_file_section * section __maybe_unused,struct perf_header * ph,int fd,void * data __maybe_unused)1450 static int process_cpuid(struct perf_file_section *section __maybe_unused,
1451 struct perf_header *ph, int fd,
1452 void *data __maybe_unused)
1453 {
1454 ph->env.cpuid = do_read_string(fd, ph);
1455 return ph->env.cpuid ? 0 : -ENOMEM;
1456 }
1457
process_total_mem(struct perf_file_section * section __maybe_unused,struct perf_header * ph,int fd,void * data __maybe_unused)1458 static int process_total_mem(struct perf_file_section *section __maybe_unused,
1459 struct perf_header *ph, int fd,
1460 void *data __maybe_unused)
1461 {
1462 uint64_t mem;
1463 ssize_t ret;
1464
1465 ret = readn(fd, &mem, sizeof(mem));
1466 if (ret != sizeof(mem))
1467 return -1;
1468
1469 if (ph->needs_swap)
1470 mem = bswap_64(mem);
1471
1472 ph->env.total_mem = mem;
1473 return 0;
1474 }
1475
1476 static struct perf_evsel *
perf_evlist__find_by_index(struct perf_evlist * evlist,int idx)1477 perf_evlist__find_by_index(struct perf_evlist *evlist, int idx)
1478 {
1479 struct perf_evsel *evsel;
1480
1481 evlist__for_each(evlist, evsel) {
1482 if (evsel->idx == idx)
1483 return evsel;
1484 }
1485
1486 return NULL;
1487 }
1488
1489 static void
perf_evlist__set_event_name(struct perf_evlist * evlist,struct perf_evsel * event)1490 perf_evlist__set_event_name(struct perf_evlist *evlist,
1491 struct perf_evsel *event)
1492 {
1493 struct perf_evsel *evsel;
1494
1495 if (!event->name)
1496 return;
1497
1498 evsel = perf_evlist__find_by_index(evlist, event->idx);
1499 if (!evsel)
1500 return;
1501
1502 if (evsel->name)
1503 return;
1504
1505 evsel->name = strdup(event->name);
1506 }
1507
1508 static int
process_event_desc(struct perf_file_section * section __maybe_unused,struct perf_header * header,int fd,void * data __maybe_unused)1509 process_event_desc(struct perf_file_section *section __maybe_unused,
1510 struct perf_header *header, int fd,
1511 void *data __maybe_unused)
1512 {
1513 struct perf_session *session;
1514 struct perf_evsel *evsel, *events = read_event_desc(header, fd);
1515
1516 if (!events)
1517 return 0;
1518
1519 session = container_of(header, struct perf_session, header);
1520 for (evsel = events; evsel->attr.size; evsel++)
1521 perf_evlist__set_event_name(session->evlist, evsel);
1522
1523 free_event_desc(events);
1524
1525 return 0;
1526 }
1527
process_cmdline(struct perf_file_section * section __maybe_unused,struct perf_header * ph,int fd,void * data __maybe_unused)1528 static int process_cmdline(struct perf_file_section *section __maybe_unused,
1529 struct perf_header *ph, int fd,
1530 void *data __maybe_unused)
1531 {
1532 ssize_t ret;
1533 char *str;
1534 u32 nr, i;
1535 struct strbuf sb;
1536
1537 ret = readn(fd, &nr, sizeof(nr));
1538 if (ret != sizeof(nr))
1539 return -1;
1540
1541 if (ph->needs_swap)
1542 nr = bswap_32(nr);
1543
1544 ph->env.nr_cmdline = nr;
1545 strbuf_init(&sb, 128);
1546
1547 for (i = 0; i < nr; i++) {
1548 str = do_read_string(fd, ph);
1549 if (!str)
1550 goto error;
1551
1552 /* include a NULL character at the end */
1553 strbuf_add(&sb, str, strlen(str) + 1);
1554 free(str);
1555 }
1556 ph->env.cmdline = strbuf_detach(&sb, NULL);
1557 return 0;
1558
1559 error:
1560 strbuf_release(&sb);
1561 return -1;
1562 }
1563
process_cpu_topology(struct perf_file_section * section __maybe_unused,struct perf_header * ph,int fd,void * data __maybe_unused)1564 static int process_cpu_topology(struct perf_file_section *section __maybe_unused,
1565 struct perf_header *ph, int fd,
1566 void *data __maybe_unused)
1567 {
1568 ssize_t ret;
1569 u32 nr, i;
1570 char *str;
1571 struct strbuf sb;
1572
1573 ret = readn(fd, &nr, sizeof(nr));
1574 if (ret != sizeof(nr))
1575 return -1;
1576
1577 if (ph->needs_swap)
1578 nr = bswap_32(nr);
1579
1580 ph->env.nr_sibling_cores = nr;
1581 strbuf_init(&sb, 128);
1582
1583 for (i = 0; i < nr; i++) {
1584 str = do_read_string(fd, ph);
1585 if (!str)
1586 goto error;
1587
1588 /* include a NULL character at the end */
1589 strbuf_add(&sb, str, strlen(str) + 1);
1590 free(str);
1591 }
1592 ph->env.sibling_cores = strbuf_detach(&sb, NULL);
1593
1594 ret = readn(fd, &nr, sizeof(nr));
1595 if (ret != sizeof(nr))
1596 return -1;
1597
1598 if (ph->needs_swap)
1599 nr = bswap_32(nr);
1600
1601 ph->env.nr_sibling_threads = nr;
1602
1603 for (i = 0; i < nr; i++) {
1604 str = do_read_string(fd, ph);
1605 if (!str)
1606 goto error;
1607
1608 /* include a NULL character at the end */
1609 strbuf_add(&sb, str, strlen(str) + 1);
1610 free(str);
1611 }
1612 ph->env.sibling_threads = strbuf_detach(&sb, NULL);
1613 return 0;
1614
1615 error:
1616 strbuf_release(&sb);
1617 return -1;
1618 }
1619
process_numa_topology(struct perf_file_section * section __maybe_unused,struct perf_header * ph,int fd,void * data __maybe_unused)1620 static int process_numa_topology(struct perf_file_section *section __maybe_unused,
1621 struct perf_header *ph, int fd,
1622 void *data __maybe_unused)
1623 {
1624 ssize_t ret;
1625 u32 nr, node, i;
1626 char *str;
1627 uint64_t mem_total, mem_free;
1628 struct strbuf sb;
1629
1630 /* nr nodes */
1631 ret = readn(fd, &nr, sizeof(nr));
1632 if (ret != sizeof(nr))
1633 goto error;
1634
1635 if (ph->needs_swap)
1636 nr = bswap_32(nr);
1637
1638 ph->env.nr_numa_nodes = nr;
1639 strbuf_init(&sb, 256);
1640
1641 for (i = 0; i < nr; i++) {
1642 /* node number */
1643 ret = readn(fd, &node, sizeof(node));
1644 if (ret != sizeof(node))
1645 goto error;
1646
1647 ret = readn(fd, &mem_total, sizeof(u64));
1648 if (ret != sizeof(u64))
1649 goto error;
1650
1651 ret = readn(fd, &mem_free, sizeof(u64));
1652 if (ret != sizeof(u64))
1653 goto error;
1654
1655 if (ph->needs_swap) {
1656 node = bswap_32(node);
1657 mem_total = bswap_64(mem_total);
1658 mem_free = bswap_64(mem_free);
1659 }
1660
1661 strbuf_addf(&sb, "%u:%"PRIu64":%"PRIu64":",
1662 node, mem_total, mem_free);
1663
1664 str = do_read_string(fd, ph);
1665 if (!str)
1666 goto error;
1667
1668 /* include a NULL character at the end */
1669 strbuf_add(&sb, str, strlen(str) + 1);
1670 free(str);
1671 }
1672 ph->env.numa_nodes = strbuf_detach(&sb, NULL);
1673 return 0;
1674
1675 error:
1676 strbuf_release(&sb);
1677 return -1;
1678 }
1679
process_pmu_mappings(struct perf_file_section * section __maybe_unused,struct perf_header * ph,int fd,void * data __maybe_unused)1680 static int process_pmu_mappings(struct perf_file_section *section __maybe_unused,
1681 struct perf_header *ph, int fd,
1682 void *data __maybe_unused)
1683 {
1684 ssize_t ret;
1685 char *name;
1686 u32 pmu_num;
1687 u32 type;
1688 struct strbuf sb;
1689
1690 ret = readn(fd, &pmu_num, sizeof(pmu_num));
1691 if (ret != sizeof(pmu_num))
1692 return -1;
1693
1694 if (ph->needs_swap)
1695 pmu_num = bswap_32(pmu_num);
1696
1697 if (!pmu_num) {
1698 pr_debug("pmu mappings not available\n");
1699 return 0;
1700 }
1701
1702 ph->env.nr_pmu_mappings = pmu_num;
1703 strbuf_init(&sb, 128);
1704
1705 while (pmu_num) {
1706 if (readn(fd, &type, sizeof(type)) != sizeof(type))
1707 goto error;
1708 if (ph->needs_swap)
1709 type = bswap_32(type);
1710
1711 name = do_read_string(fd, ph);
1712 if (!name)
1713 goto error;
1714
1715 strbuf_addf(&sb, "%u:%s", type, name);
1716 /* include a NULL character at the end */
1717 strbuf_add(&sb, "", 1);
1718
1719 free(name);
1720 pmu_num--;
1721 }
1722 ph->env.pmu_mappings = strbuf_detach(&sb, NULL);
1723 return 0;
1724
1725 error:
1726 strbuf_release(&sb);
1727 return -1;
1728 }
1729
process_group_desc(struct perf_file_section * section __maybe_unused,struct perf_header * ph,int fd,void * data __maybe_unused)1730 static int process_group_desc(struct perf_file_section *section __maybe_unused,
1731 struct perf_header *ph, int fd,
1732 void *data __maybe_unused)
1733 {
1734 size_t ret = -1;
1735 u32 i, nr, nr_groups;
1736 struct perf_session *session;
1737 struct perf_evsel *evsel, *leader = NULL;
1738 struct group_desc {
1739 char *name;
1740 u32 leader_idx;
1741 u32 nr_members;
1742 } *desc;
1743
1744 if (readn(fd, &nr_groups, sizeof(nr_groups)) != sizeof(nr_groups))
1745 return -1;
1746
1747 if (ph->needs_swap)
1748 nr_groups = bswap_32(nr_groups);
1749
1750 ph->env.nr_groups = nr_groups;
1751 if (!nr_groups) {
1752 pr_debug("group desc not available\n");
1753 return 0;
1754 }
1755
1756 desc = calloc(nr_groups, sizeof(*desc));
1757 if (!desc)
1758 return -1;
1759
1760 for (i = 0; i < nr_groups; i++) {
1761 desc[i].name = do_read_string(fd, ph);
1762 if (!desc[i].name)
1763 goto out_free;
1764
1765 if (readn(fd, &desc[i].leader_idx, sizeof(u32)) != sizeof(u32))
1766 goto out_free;
1767
1768 if (readn(fd, &desc[i].nr_members, sizeof(u32)) != sizeof(u32))
1769 goto out_free;
1770
1771 if (ph->needs_swap) {
1772 desc[i].leader_idx = bswap_32(desc[i].leader_idx);
1773 desc[i].nr_members = bswap_32(desc[i].nr_members);
1774 }
1775 }
1776
1777 /*
1778 * Rebuild group relationship based on the group_desc
1779 */
1780 session = container_of(ph, struct perf_session, header);
1781 session->evlist->nr_groups = nr_groups;
1782
1783 i = nr = 0;
1784 evlist__for_each(session->evlist, evsel) {
1785 if (evsel->idx == (int) desc[i].leader_idx) {
1786 evsel->leader = evsel;
1787 /* {anon_group} is a dummy name */
1788 if (strcmp(desc[i].name, "{anon_group}")) {
1789 evsel->group_name = desc[i].name;
1790 desc[i].name = NULL;
1791 }
1792 evsel->nr_members = desc[i].nr_members;
1793
1794 if (i >= nr_groups || nr > 0) {
1795 pr_debug("invalid group desc\n");
1796 goto out_free;
1797 }
1798
1799 leader = evsel;
1800 nr = evsel->nr_members - 1;
1801 i++;
1802 } else if (nr) {
1803 /* This is a group member */
1804 evsel->leader = leader;
1805
1806 nr--;
1807 }
1808 }
1809
1810 if (i != nr_groups || nr != 0) {
1811 pr_debug("invalid group desc\n");
1812 goto out_free;
1813 }
1814
1815 ret = 0;
1816 out_free:
1817 for (i = 0; i < nr_groups; i++)
1818 zfree(&desc[i].name);
1819 free(desc);
1820
1821 return ret;
1822 }
1823
1824 struct feature_ops {
1825 int (*write)(int fd, struct perf_header *h, struct perf_evlist *evlist);
1826 void (*print)(struct perf_header *h, int fd, FILE *fp);
1827 int (*process)(struct perf_file_section *section,
1828 struct perf_header *h, int fd, void *data);
1829 const char *name;
1830 bool full_only;
1831 };
1832
1833 #define FEAT_OPA(n, func) \
1834 [n] = { .name = #n, .write = write_##func, .print = print_##func }
1835 #define FEAT_OPP(n, func) \
1836 [n] = { .name = #n, .write = write_##func, .print = print_##func, \
1837 .process = process_##func }
1838 #define FEAT_OPF(n, func) \
1839 [n] = { .name = #n, .write = write_##func, .print = print_##func, \
1840 .process = process_##func, .full_only = true }
1841
1842 /* feature_ops not implemented: */
1843 #define print_tracing_data NULL
1844 #define print_build_id NULL
1845
1846 static const struct feature_ops feat_ops[HEADER_LAST_FEATURE] = {
1847 FEAT_OPP(HEADER_TRACING_DATA, tracing_data),
1848 FEAT_OPP(HEADER_BUILD_ID, build_id),
1849 FEAT_OPP(HEADER_HOSTNAME, hostname),
1850 FEAT_OPP(HEADER_OSRELEASE, osrelease),
1851 FEAT_OPP(HEADER_VERSION, version),
1852 FEAT_OPP(HEADER_ARCH, arch),
1853 FEAT_OPP(HEADER_NRCPUS, nrcpus),
1854 FEAT_OPP(HEADER_CPUDESC, cpudesc),
1855 FEAT_OPP(HEADER_CPUID, cpuid),
1856 FEAT_OPP(HEADER_TOTAL_MEM, total_mem),
1857 FEAT_OPP(HEADER_EVENT_DESC, event_desc),
1858 FEAT_OPP(HEADER_CMDLINE, cmdline),
1859 FEAT_OPF(HEADER_CPU_TOPOLOGY, cpu_topology),
1860 FEAT_OPF(HEADER_NUMA_TOPOLOGY, numa_topology),
1861 FEAT_OPA(HEADER_BRANCH_STACK, branch_stack),
1862 FEAT_OPP(HEADER_PMU_MAPPINGS, pmu_mappings),
1863 FEAT_OPP(HEADER_GROUP_DESC, group_desc),
1864 };
1865
1866 struct header_print_data {
1867 FILE *fp;
1868 bool full; /* extended list of headers */
1869 };
1870
perf_file_section__fprintf_info(struct perf_file_section * section,struct perf_header * ph,int feat,int fd,void * data)1871 static int perf_file_section__fprintf_info(struct perf_file_section *section,
1872 struct perf_header *ph,
1873 int feat, int fd, void *data)
1874 {
1875 struct header_print_data *hd = data;
1876
1877 if (lseek(fd, section->offset, SEEK_SET) == (off_t)-1) {
1878 pr_debug("Failed to lseek to %" PRIu64 " offset for feature "
1879 "%d, continuing...\n", section->offset, feat);
1880 return 0;
1881 }
1882 if (feat >= HEADER_LAST_FEATURE) {
1883 pr_warning("unknown feature %d\n", feat);
1884 return 0;
1885 }
1886 if (!feat_ops[feat].print)
1887 return 0;
1888
1889 if (!feat_ops[feat].full_only || hd->full)
1890 feat_ops[feat].print(ph, fd, hd->fp);
1891 else
1892 fprintf(hd->fp, "# %s info available, use -I to display\n",
1893 feat_ops[feat].name);
1894
1895 return 0;
1896 }
1897
perf_header__fprintf_info(struct perf_session * session,FILE * fp,bool full)1898 int perf_header__fprintf_info(struct perf_session *session, FILE *fp, bool full)
1899 {
1900 struct header_print_data hd;
1901 struct perf_header *header = &session->header;
1902 int fd = perf_data_file__fd(session->file);
1903 hd.fp = fp;
1904 hd.full = full;
1905
1906 perf_header__process_sections(header, fd, &hd,
1907 perf_file_section__fprintf_info);
1908 return 0;
1909 }
1910
do_write_feat(int fd,struct perf_header * h,int type,struct perf_file_section ** p,struct perf_evlist * evlist)1911 static int do_write_feat(int fd, struct perf_header *h, int type,
1912 struct perf_file_section **p,
1913 struct perf_evlist *evlist)
1914 {
1915 int err;
1916 int ret = 0;
1917
1918 if (perf_header__has_feat(h, type)) {
1919 if (!feat_ops[type].write)
1920 return -1;
1921
1922 (*p)->offset = lseek(fd, 0, SEEK_CUR);
1923
1924 err = feat_ops[type].write(fd, h, evlist);
1925 if (err < 0) {
1926 pr_debug("failed to write feature %d\n", type);
1927
1928 /* undo anything written */
1929 lseek(fd, (*p)->offset, SEEK_SET);
1930
1931 return -1;
1932 }
1933 (*p)->size = lseek(fd, 0, SEEK_CUR) - (*p)->offset;
1934 (*p)++;
1935 }
1936 return ret;
1937 }
1938
perf_header__adds_write(struct perf_header * header,struct perf_evlist * evlist,int fd)1939 static int perf_header__adds_write(struct perf_header *header,
1940 struct perf_evlist *evlist, int fd)
1941 {
1942 int nr_sections;
1943 struct perf_file_section *feat_sec, *p;
1944 int sec_size;
1945 u64 sec_start;
1946 int feat;
1947 int err;
1948
1949 nr_sections = bitmap_weight(header->adds_features, HEADER_FEAT_BITS);
1950 if (!nr_sections)
1951 return 0;
1952
1953 feat_sec = p = calloc(nr_sections, sizeof(*feat_sec));
1954 if (feat_sec == NULL)
1955 return -ENOMEM;
1956
1957 sec_size = sizeof(*feat_sec) * nr_sections;
1958
1959 sec_start = header->feat_offset;
1960 lseek(fd, sec_start + sec_size, SEEK_SET);
1961
1962 for_each_set_bit(feat, header->adds_features, HEADER_FEAT_BITS) {
1963 if (do_write_feat(fd, header, feat, &p, evlist))
1964 perf_header__clear_feat(header, feat);
1965 }
1966
1967 lseek(fd, sec_start, SEEK_SET);
1968 /*
1969 * may write more than needed due to dropped feature, but
1970 * this is okay, reader will skip the mising entries
1971 */
1972 err = do_write(fd, feat_sec, sec_size);
1973 if (err < 0)
1974 pr_debug("failed to write feature section\n");
1975 free(feat_sec);
1976 return err;
1977 }
1978
perf_header__write_pipe(int fd)1979 int perf_header__write_pipe(int fd)
1980 {
1981 struct perf_pipe_file_header f_header;
1982 int err;
1983
1984 f_header = (struct perf_pipe_file_header){
1985 .magic = PERF_MAGIC,
1986 .size = sizeof(f_header),
1987 };
1988
1989 err = do_write(fd, &f_header, sizeof(f_header));
1990 if (err < 0) {
1991 pr_debug("failed to write perf pipe header\n");
1992 return err;
1993 }
1994
1995 return 0;
1996 }
1997
perf_session__write_header(struct perf_session * session,struct perf_evlist * evlist,int fd,bool at_exit)1998 int perf_session__write_header(struct perf_session *session,
1999 struct perf_evlist *evlist,
2000 int fd, bool at_exit)
2001 {
2002 struct perf_file_header f_header;
2003 struct perf_file_attr f_attr;
2004 struct perf_header *header = &session->header;
2005 struct perf_evsel *evsel;
2006 u64 attr_offset;
2007 int err;
2008
2009 lseek(fd, sizeof(f_header), SEEK_SET);
2010
2011 evlist__for_each(session->evlist, evsel) {
2012 evsel->id_offset = lseek(fd, 0, SEEK_CUR);
2013 err = do_write(fd, evsel->id, evsel->ids * sizeof(u64));
2014 if (err < 0) {
2015 pr_debug("failed to write perf header\n");
2016 return err;
2017 }
2018 }
2019
2020 attr_offset = lseek(fd, 0, SEEK_CUR);
2021
2022 evlist__for_each(evlist, evsel) {
2023 f_attr = (struct perf_file_attr){
2024 .attr = evsel->attr,
2025 .ids = {
2026 .offset = evsel->id_offset,
2027 .size = evsel->ids * sizeof(u64),
2028 }
2029 };
2030 err = do_write(fd, &f_attr, sizeof(f_attr));
2031 if (err < 0) {
2032 pr_debug("failed to write perf header attribute\n");
2033 return err;
2034 }
2035 }
2036
2037 if (!header->data_offset)
2038 header->data_offset = lseek(fd, 0, SEEK_CUR);
2039 header->feat_offset = header->data_offset + header->data_size;
2040
2041 if (at_exit) {
2042 err = perf_header__adds_write(header, evlist, fd);
2043 if (err < 0)
2044 return err;
2045 }
2046
2047 f_header = (struct perf_file_header){
2048 .magic = PERF_MAGIC,
2049 .size = sizeof(f_header),
2050 .attr_size = sizeof(f_attr),
2051 .attrs = {
2052 .offset = attr_offset,
2053 .size = evlist->nr_entries * sizeof(f_attr),
2054 },
2055 .data = {
2056 .offset = header->data_offset,
2057 .size = header->data_size,
2058 },
2059 /* event_types is ignored, store zeros */
2060 };
2061
2062 memcpy(&f_header.adds_features, &header->adds_features, sizeof(header->adds_features));
2063
2064 lseek(fd, 0, SEEK_SET);
2065 err = do_write(fd, &f_header, sizeof(f_header));
2066 if (err < 0) {
2067 pr_debug("failed to write perf header\n");
2068 return err;
2069 }
2070 lseek(fd, header->data_offset + header->data_size, SEEK_SET);
2071
2072 return 0;
2073 }
2074
perf_header__getbuffer64(struct perf_header * header,int fd,void * buf,size_t size)2075 static int perf_header__getbuffer64(struct perf_header *header,
2076 int fd, void *buf, size_t size)
2077 {
2078 if (readn(fd, buf, size) <= 0)
2079 return -1;
2080
2081 if (header->needs_swap)
2082 mem_bswap_64(buf, size);
2083
2084 return 0;
2085 }
2086
perf_header__process_sections(struct perf_header * header,int fd,void * data,int (* process)(struct perf_file_section * section,struct perf_header * ph,int feat,int fd,void * data))2087 int perf_header__process_sections(struct perf_header *header, int fd,
2088 void *data,
2089 int (*process)(struct perf_file_section *section,
2090 struct perf_header *ph,
2091 int feat, int fd, void *data))
2092 {
2093 struct perf_file_section *feat_sec, *sec;
2094 int nr_sections;
2095 int sec_size;
2096 int feat;
2097 int err;
2098
2099 nr_sections = bitmap_weight(header->adds_features, HEADER_FEAT_BITS);
2100 if (!nr_sections)
2101 return 0;
2102
2103 feat_sec = sec = calloc(nr_sections, sizeof(*feat_sec));
2104 if (!feat_sec)
2105 return -1;
2106
2107 sec_size = sizeof(*feat_sec) * nr_sections;
2108
2109 lseek(fd, header->feat_offset, SEEK_SET);
2110
2111 err = perf_header__getbuffer64(header, fd, feat_sec, sec_size);
2112 if (err < 0)
2113 goto out_free;
2114
2115 for_each_set_bit(feat, header->adds_features, HEADER_LAST_FEATURE) {
2116 err = process(sec++, header, feat, fd, data);
2117 if (err < 0)
2118 goto out_free;
2119 }
2120 err = 0;
2121 out_free:
2122 free(feat_sec);
2123 return err;
2124 }
2125
2126 static const int attr_file_abi_sizes[] = {
2127 [0] = PERF_ATTR_SIZE_VER0,
2128 [1] = PERF_ATTR_SIZE_VER1,
2129 [2] = PERF_ATTR_SIZE_VER2,
2130 [3] = PERF_ATTR_SIZE_VER3,
2131 [4] = PERF_ATTR_SIZE_VER4,
2132 0,
2133 };
2134
2135 /*
2136 * In the legacy file format, the magic number is not used to encode endianness.
2137 * hdr_sz was used to encode endianness. But given that hdr_sz can vary based
2138 * on ABI revisions, we need to try all combinations for all endianness to
2139 * detect the endianness.
2140 */
try_all_file_abis(uint64_t hdr_sz,struct perf_header * ph)2141 static int try_all_file_abis(uint64_t hdr_sz, struct perf_header *ph)
2142 {
2143 uint64_t ref_size, attr_size;
2144 int i;
2145
2146 for (i = 0 ; attr_file_abi_sizes[i]; i++) {
2147 ref_size = attr_file_abi_sizes[i]
2148 + sizeof(struct perf_file_section);
2149 if (hdr_sz != ref_size) {
2150 attr_size = bswap_64(hdr_sz);
2151 if (attr_size != ref_size)
2152 continue;
2153
2154 ph->needs_swap = true;
2155 }
2156 pr_debug("ABI%d perf.data file detected, need_swap=%d\n",
2157 i,
2158 ph->needs_swap);
2159 return 0;
2160 }
2161 /* could not determine endianness */
2162 return -1;
2163 }
2164
2165 #define PERF_PIPE_HDR_VER0 16
2166
2167 static const size_t attr_pipe_abi_sizes[] = {
2168 [0] = PERF_PIPE_HDR_VER0,
2169 0,
2170 };
2171
2172 /*
2173 * In the legacy pipe format, there is an implicit assumption that endiannesss
2174 * between host recording the samples, and host parsing the samples is the
2175 * same. This is not always the case given that the pipe output may always be
2176 * redirected into a file and analyzed on a different machine with possibly a
2177 * different endianness and perf_event ABI revsions in the perf tool itself.
2178 */
try_all_pipe_abis(uint64_t hdr_sz,struct perf_header * ph)2179 static int try_all_pipe_abis(uint64_t hdr_sz, struct perf_header *ph)
2180 {
2181 u64 attr_size;
2182 int i;
2183
2184 for (i = 0 ; attr_pipe_abi_sizes[i]; i++) {
2185 if (hdr_sz != attr_pipe_abi_sizes[i]) {
2186 attr_size = bswap_64(hdr_sz);
2187 if (attr_size != hdr_sz)
2188 continue;
2189
2190 ph->needs_swap = true;
2191 }
2192 pr_debug("Pipe ABI%d perf.data file detected\n", i);
2193 return 0;
2194 }
2195 return -1;
2196 }
2197
is_perf_magic(u64 magic)2198 bool is_perf_magic(u64 magic)
2199 {
2200 if (!memcmp(&magic, __perf_magic1, sizeof(magic))
2201 || magic == __perf_magic2
2202 || magic == __perf_magic2_sw)
2203 return true;
2204
2205 return false;
2206 }
2207
check_magic_endian(u64 magic,uint64_t hdr_sz,bool is_pipe,struct perf_header * ph)2208 static int check_magic_endian(u64 magic, uint64_t hdr_sz,
2209 bool is_pipe, struct perf_header *ph)
2210 {
2211 int ret;
2212
2213 /* check for legacy format */
2214 ret = memcmp(&magic, __perf_magic1, sizeof(magic));
2215 if (ret == 0) {
2216 ph->version = PERF_HEADER_VERSION_1;
2217 pr_debug("legacy perf.data format\n");
2218 if (is_pipe)
2219 return try_all_pipe_abis(hdr_sz, ph);
2220
2221 return try_all_file_abis(hdr_sz, ph);
2222 }
2223 /*
2224 * the new magic number serves two purposes:
2225 * - unique number to identify actual perf.data files
2226 * - encode endianness of file
2227 */
2228 ph->version = PERF_HEADER_VERSION_2;
2229
2230 /* check magic number with one endianness */
2231 if (magic == __perf_magic2)
2232 return 0;
2233
2234 /* check magic number with opposite endianness */
2235 if (magic != __perf_magic2_sw)
2236 return -1;
2237
2238 ph->needs_swap = true;
2239
2240 return 0;
2241 }
2242
perf_file_header__read(struct perf_file_header * header,struct perf_header * ph,int fd)2243 int perf_file_header__read(struct perf_file_header *header,
2244 struct perf_header *ph, int fd)
2245 {
2246 ssize_t ret;
2247
2248 lseek(fd, 0, SEEK_SET);
2249
2250 ret = readn(fd, header, sizeof(*header));
2251 if (ret <= 0)
2252 return -1;
2253
2254 if (check_magic_endian(header->magic,
2255 header->attr_size, false, ph) < 0) {
2256 pr_debug("magic/endian check failed\n");
2257 return -1;
2258 }
2259
2260 if (ph->needs_swap) {
2261 mem_bswap_64(header, offsetof(struct perf_file_header,
2262 adds_features));
2263 }
2264
2265 if (header->size != sizeof(*header)) {
2266 /* Support the previous format */
2267 if (header->size == offsetof(typeof(*header), adds_features))
2268 bitmap_zero(header->adds_features, HEADER_FEAT_BITS);
2269 else
2270 return -1;
2271 } else if (ph->needs_swap) {
2272 /*
2273 * feature bitmap is declared as an array of unsigned longs --
2274 * not good since its size can differ between the host that
2275 * generated the data file and the host analyzing the file.
2276 *
2277 * We need to handle endianness, but we don't know the size of
2278 * the unsigned long where the file was generated. Take a best
2279 * guess at determining it: try 64-bit swap first (ie., file
2280 * created on a 64-bit host), and check if the hostname feature
2281 * bit is set (this feature bit is forced on as of fbe96f2).
2282 * If the bit is not, undo the 64-bit swap and try a 32-bit
2283 * swap. If the hostname bit is still not set (e.g., older data
2284 * file), punt and fallback to the original behavior --
2285 * clearing all feature bits and setting buildid.
2286 */
2287 mem_bswap_64(&header->adds_features,
2288 BITS_TO_U64(HEADER_FEAT_BITS));
2289
2290 if (!test_bit(HEADER_HOSTNAME, header->adds_features)) {
2291 /* unswap as u64 */
2292 mem_bswap_64(&header->adds_features,
2293 BITS_TO_U64(HEADER_FEAT_BITS));
2294
2295 /* unswap as u32 */
2296 mem_bswap_32(&header->adds_features,
2297 BITS_TO_U32(HEADER_FEAT_BITS));
2298 }
2299
2300 if (!test_bit(HEADER_HOSTNAME, header->adds_features)) {
2301 bitmap_zero(header->adds_features, HEADER_FEAT_BITS);
2302 set_bit(HEADER_BUILD_ID, header->adds_features);
2303 }
2304 }
2305
2306 memcpy(&ph->adds_features, &header->adds_features,
2307 sizeof(ph->adds_features));
2308
2309 ph->data_offset = header->data.offset;
2310 ph->data_size = header->data.size;
2311 ph->feat_offset = header->data.offset + header->data.size;
2312 return 0;
2313 }
2314
perf_file_section__process(struct perf_file_section * section,struct perf_header * ph,int feat,int fd,void * data)2315 static int perf_file_section__process(struct perf_file_section *section,
2316 struct perf_header *ph,
2317 int feat, int fd, void *data)
2318 {
2319 if (lseek(fd, section->offset, SEEK_SET) == (off_t)-1) {
2320 pr_debug("Failed to lseek to %" PRIu64 " offset for feature "
2321 "%d, continuing...\n", section->offset, feat);
2322 return 0;
2323 }
2324
2325 if (feat >= HEADER_LAST_FEATURE) {
2326 pr_debug("unknown feature %d, continuing...\n", feat);
2327 return 0;
2328 }
2329
2330 if (!feat_ops[feat].process)
2331 return 0;
2332
2333 return feat_ops[feat].process(section, ph, fd, data);
2334 }
2335
perf_file_header__read_pipe(struct perf_pipe_file_header * header,struct perf_header * ph,int fd,bool repipe)2336 static int perf_file_header__read_pipe(struct perf_pipe_file_header *header,
2337 struct perf_header *ph, int fd,
2338 bool repipe)
2339 {
2340 ssize_t ret;
2341
2342 ret = readn(fd, header, sizeof(*header));
2343 if (ret <= 0)
2344 return -1;
2345
2346 if (check_magic_endian(header->magic, header->size, true, ph) < 0) {
2347 pr_debug("endian/magic failed\n");
2348 return -1;
2349 }
2350
2351 if (ph->needs_swap)
2352 header->size = bswap_64(header->size);
2353
2354 if (repipe && do_write(STDOUT_FILENO, header, sizeof(*header)) < 0)
2355 return -1;
2356
2357 return 0;
2358 }
2359
perf_header__read_pipe(struct perf_session * session)2360 static int perf_header__read_pipe(struct perf_session *session)
2361 {
2362 struct perf_header *header = &session->header;
2363 struct perf_pipe_file_header f_header;
2364
2365 if (perf_file_header__read_pipe(&f_header, header,
2366 perf_data_file__fd(session->file),
2367 session->repipe) < 0) {
2368 pr_debug("incompatible file format\n");
2369 return -EINVAL;
2370 }
2371
2372 return 0;
2373 }
2374
read_attr(int fd,struct perf_header * ph,struct perf_file_attr * f_attr)2375 static int read_attr(int fd, struct perf_header *ph,
2376 struct perf_file_attr *f_attr)
2377 {
2378 struct perf_event_attr *attr = &f_attr->attr;
2379 size_t sz, left;
2380 size_t our_sz = sizeof(f_attr->attr);
2381 ssize_t ret;
2382
2383 memset(f_attr, 0, sizeof(*f_attr));
2384
2385 /* read minimal guaranteed structure */
2386 ret = readn(fd, attr, PERF_ATTR_SIZE_VER0);
2387 if (ret <= 0) {
2388 pr_debug("cannot read %d bytes of header attr\n",
2389 PERF_ATTR_SIZE_VER0);
2390 return -1;
2391 }
2392
2393 /* on file perf_event_attr size */
2394 sz = attr->size;
2395
2396 if (ph->needs_swap)
2397 sz = bswap_32(sz);
2398
2399 if (sz == 0) {
2400 /* assume ABI0 */
2401 sz = PERF_ATTR_SIZE_VER0;
2402 } else if (sz > our_sz) {
2403 pr_debug("file uses a more recent and unsupported ABI"
2404 " (%zu bytes extra)\n", sz - our_sz);
2405 return -1;
2406 }
2407 /* what we have not yet read and that we know about */
2408 left = sz - PERF_ATTR_SIZE_VER0;
2409 if (left) {
2410 void *ptr = attr;
2411 ptr += PERF_ATTR_SIZE_VER0;
2412
2413 ret = readn(fd, ptr, left);
2414 }
2415 /* read perf_file_section, ids are read in caller */
2416 ret = readn(fd, &f_attr->ids, sizeof(f_attr->ids));
2417
2418 return ret <= 0 ? -1 : 0;
2419 }
2420
perf_evsel__prepare_tracepoint_event(struct perf_evsel * evsel,struct pevent * pevent)2421 static int perf_evsel__prepare_tracepoint_event(struct perf_evsel *evsel,
2422 struct pevent *pevent)
2423 {
2424 struct event_format *event;
2425 char bf[128];
2426
2427 /* already prepared */
2428 if (evsel->tp_format)
2429 return 0;
2430
2431 if (pevent == NULL) {
2432 pr_debug("broken or missing trace data\n");
2433 return -1;
2434 }
2435
2436 event = pevent_find_event(pevent, evsel->attr.config);
2437 if (event == NULL)
2438 return -1;
2439
2440 if (!evsel->name) {
2441 snprintf(bf, sizeof(bf), "%s:%s", event->system, event->name);
2442 evsel->name = strdup(bf);
2443 if (evsel->name == NULL)
2444 return -1;
2445 }
2446
2447 evsel->tp_format = event;
2448 return 0;
2449 }
2450
perf_evlist__prepare_tracepoint_events(struct perf_evlist * evlist,struct pevent * pevent)2451 static int perf_evlist__prepare_tracepoint_events(struct perf_evlist *evlist,
2452 struct pevent *pevent)
2453 {
2454 struct perf_evsel *pos;
2455
2456 evlist__for_each(evlist, pos) {
2457 if (pos->attr.type == PERF_TYPE_TRACEPOINT &&
2458 perf_evsel__prepare_tracepoint_event(pos, pevent))
2459 return -1;
2460 }
2461
2462 return 0;
2463 }
2464
perf_session__read_header(struct perf_session * session)2465 int perf_session__read_header(struct perf_session *session)
2466 {
2467 struct perf_data_file *file = session->file;
2468 struct perf_header *header = &session->header;
2469 struct perf_file_header f_header;
2470 struct perf_file_attr f_attr;
2471 u64 f_id;
2472 int nr_attrs, nr_ids, i, j;
2473 int fd = perf_data_file__fd(file);
2474
2475 session->evlist = perf_evlist__new();
2476 if (session->evlist == NULL)
2477 return -ENOMEM;
2478
2479 if (perf_data_file__is_pipe(file))
2480 return perf_header__read_pipe(session);
2481
2482 if (perf_file_header__read(&f_header, header, fd) < 0)
2483 return -EINVAL;
2484
2485 /*
2486 * Sanity check that perf.data was written cleanly; data size is
2487 * initialized to 0 and updated only if the on_exit function is run.
2488 * If data size is still 0 then the file contains only partial
2489 * information. Just warn user and process it as much as it can.
2490 */
2491 if (f_header.data.size == 0) {
2492 pr_warning("WARNING: The %s file's data size field is 0 which is unexpected.\n"
2493 "Was the 'perf record' command properly terminated?\n",
2494 file->path);
2495 }
2496
2497 nr_attrs = f_header.attrs.size / f_header.attr_size;
2498 lseek(fd, f_header.attrs.offset, SEEK_SET);
2499
2500 for (i = 0; i < nr_attrs; i++) {
2501 struct perf_evsel *evsel;
2502 off_t tmp;
2503
2504 if (read_attr(fd, header, &f_attr) < 0)
2505 goto out_errno;
2506
2507 if (header->needs_swap) {
2508 f_attr.ids.size = bswap_64(f_attr.ids.size);
2509 f_attr.ids.offset = bswap_64(f_attr.ids.offset);
2510 perf_event__attr_swap(&f_attr.attr);
2511 }
2512
2513 tmp = lseek(fd, 0, SEEK_CUR);
2514 evsel = perf_evsel__new(&f_attr.attr);
2515
2516 if (evsel == NULL)
2517 goto out_delete_evlist;
2518
2519 evsel->needs_swap = header->needs_swap;
2520 /*
2521 * Do it before so that if perf_evsel__alloc_id fails, this
2522 * entry gets purged too at perf_evlist__delete().
2523 */
2524 perf_evlist__add(session->evlist, evsel);
2525
2526 nr_ids = f_attr.ids.size / sizeof(u64);
2527 /*
2528 * We don't have the cpu and thread maps on the header, so
2529 * for allocating the perf_sample_id table we fake 1 cpu and
2530 * hattr->ids threads.
2531 */
2532 if (perf_evsel__alloc_id(evsel, 1, nr_ids))
2533 goto out_delete_evlist;
2534
2535 lseek(fd, f_attr.ids.offset, SEEK_SET);
2536
2537 for (j = 0; j < nr_ids; j++) {
2538 if (perf_header__getbuffer64(header, fd, &f_id, sizeof(f_id)))
2539 goto out_errno;
2540
2541 perf_evlist__id_add(session->evlist, evsel, 0, j, f_id);
2542 }
2543
2544 lseek(fd, tmp, SEEK_SET);
2545 }
2546
2547 symbol_conf.nr_events = nr_attrs;
2548
2549 perf_header__process_sections(header, fd, &session->tevent,
2550 perf_file_section__process);
2551
2552 if (perf_evlist__prepare_tracepoint_events(session->evlist,
2553 session->tevent.pevent))
2554 goto out_delete_evlist;
2555
2556 return 0;
2557 out_errno:
2558 return -errno;
2559
2560 out_delete_evlist:
2561 perf_evlist__delete(session->evlist);
2562 session->evlist = NULL;
2563 return -ENOMEM;
2564 }
2565
perf_event__synthesize_attr(struct perf_tool * tool,struct perf_event_attr * attr,u32 ids,u64 * id,perf_event__handler_t process)2566 int perf_event__synthesize_attr(struct perf_tool *tool,
2567 struct perf_event_attr *attr, u32 ids, u64 *id,
2568 perf_event__handler_t process)
2569 {
2570 union perf_event *ev;
2571 size_t size;
2572 int err;
2573
2574 size = sizeof(struct perf_event_attr);
2575 size = PERF_ALIGN(size, sizeof(u64));
2576 size += sizeof(struct perf_event_header);
2577 size += ids * sizeof(u64);
2578
2579 ev = malloc(size);
2580
2581 if (ev == NULL)
2582 return -ENOMEM;
2583
2584 ev->attr.attr = *attr;
2585 memcpy(ev->attr.id, id, ids * sizeof(u64));
2586
2587 ev->attr.header.type = PERF_RECORD_HEADER_ATTR;
2588 ev->attr.header.size = (u16)size;
2589
2590 if (ev->attr.header.size == size)
2591 err = process(tool, ev, NULL, NULL);
2592 else
2593 err = -E2BIG;
2594
2595 free(ev);
2596
2597 return err;
2598 }
2599
perf_event__synthesize_attrs(struct perf_tool * tool,struct perf_session * session,perf_event__handler_t process)2600 int perf_event__synthesize_attrs(struct perf_tool *tool,
2601 struct perf_session *session,
2602 perf_event__handler_t process)
2603 {
2604 struct perf_evsel *evsel;
2605 int err = 0;
2606
2607 evlist__for_each(session->evlist, evsel) {
2608 err = perf_event__synthesize_attr(tool, &evsel->attr, evsel->ids,
2609 evsel->id, process);
2610 if (err) {
2611 pr_debug("failed to create perf header attribute\n");
2612 return err;
2613 }
2614 }
2615
2616 return err;
2617 }
2618
perf_event__process_attr(struct perf_tool * tool __maybe_unused,union perf_event * event,struct perf_evlist ** pevlist)2619 int perf_event__process_attr(struct perf_tool *tool __maybe_unused,
2620 union perf_event *event,
2621 struct perf_evlist **pevlist)
2622 {
2623 u32 i, ids, n_ids;
2624 struct perf_evsel *evsel;
2625 struct perf_evlist *evlist = *pevlist;
2626
2627 if (evlist == NULL) {
2628 *pevlist = evlist = perf_evlist__new();
2629 if (evlist == NULL)
2630 return -ENOMEM;
2631 }
2632
2633 evsel = perf_evsel__new(&event->attr.attr);
2634 if (evsel == NULL)
2635 return -ENOMEM;
2636
2637 perf_evlist__add(evlist, evsel);
2638
2639 ids = event->header.size;
2640 ids -= (void *)&event->attr.id - (void *)event;
2641 n_ids = ids / sizeof(u64);
2642 /*
2643 * We don't have the cpu and thread maps on the header, so
2644 * for allocating the perf_sample_id table we fake 1 cpu and
2645 * hattr->ids threads.
2646 */
2647 if (perf_evsel__alloc_id(evsel, 1, n_ids))
2648 return -ENOMEM;
2649
2650 for (i = 0; i < n_ids; i++) {
2651 perf_evlist__id_add(evlist, evsel, 0, i, event->attr.id[i]);
2652 }
2653
2654 symbol_conf.nr_events = evlist->nr_entries;
2655
2656 return 0;
2657 }
2658
perf_event__synthesize_tracing_data(struct perf_tool * tool,int fd,struct perf_evlist * evlist,perf_event__handler_t process)2659 int perf_event__synthesize_tracing_data(struct perf_tool *tool, int fd,
2660 struct perf_evlist *evlist,
2661 perf_event__handler_t process)
2662 {
2663 union perf_event ev;
2664 struct tracing_data *tdata;
2665 ssize_t size = 0, aligned_size = 0, padding;
2666 int err __maybe_unused = 0;
2667
2668 /*
2669 * We are going to store the size of the data followed
2670 * by the data contents. Since the fd descriptor is a pipe,
2671 * we cannot seek back to store the size of the data once
2672 * we know it. Instead we:
2673 *
2674 * - write the tracing data to the temp file
2675 * - get/write the data size to pipe
2676 * - write the tracing data from the temp file
2677 * to the pipe
2678 */
2679 tdata = tracing_data_get(&evlist->entries, fd, true);
2680 if (!tdata)
2681 return -1;
2682
2683 memset(&ev, 0, sizeof(ev));
2684
2685 ev.tracing_data.header.type = PERF_RECORD_HEADER_TRACING_DATA;
2686 size = tdata->size;
2687 aligned_size = PERF_ALIGN(size, sizeof(u64));
2688 padding = aligned_size - size;
2689 ev.tracing_data.header.size = sizeof(ev.tracing_data);
2690 ev.tracing_data.size = aligned_size;
2691
2692 process(tool, &ev, NULL, NULL);
2693
2694 /*
2695 * The put function will copy all the tracing data
2696 * stored in temp file to the pipe.
2697 */
2698 tracing_data_put(tdata);
2699
2700 write_padded(fd, NULL, 0, padding);
2701
2702 return aligned_size;
2703 }
2704
perf_event__process_tracing_data(struct perf_tool * tool __maybe_unused,union perf_event * event,struct perf_session * session)2705 int perf_event__process_tracing_data(struct perf_tool *tool __maybe_unused,
2706 union perf_event *event,
2707 struct perf_session *session)
2708 {
2709 ssize_t size_read, padding, size = event->tracing_data.size;
2710 int fd = perf_data_file__fd(session->file);
2711 off_t offset = lseek(fd, 0, SEEK_CUR);
2712 char buf[BUFSIZ];
2713
2714 /* setup for reading amidst mmap */
2715 lseek(fd, offset + sizeof(struct tracing_data_event),
2716 SEEK_SET);
2717
2718 size_read = trace_report(fd, &session->tevent,
2719 session->repipe);
2720 padding = PERF_ALIGN(size_read, sizeof(u64)) - size_read;
2721
2722 if (readn(fd, buf, padding) < 0) {
2723 pr_err("%s: reading input file", __func__);
2724 return -1;
2725 }
2726 if (session->repipe) {
2727 int retw = write(STDOUT_FILENO, buf, padding);
2728 if (retw <= 0 || retw != padding) {
2729 pr_err("%s: repiping tracing data padding", __func__);
2730 return -1;
2731 }
2732 }
2733
2734 if (size_read + padding != size) {
2735 pr_err("%s: tracing data size mismatch", __func__);
2736 return -1;
2737 }
2738
2739 perf_evlist__prepare_tracepoint_events(session->evlist,
2740 session->tevent.pevent);
2741
2742 return size_read + padding;
2743 }
2744
perf_event__synthesize_build_id(struct perf_tool * tool,struct dso * pos,u16 misc,perf_event__handler_t process,struct machine * machine)2745 int perf_event__synthesize_build_id(struct perf_tool *tool,
2746 struct dso *pos, u16 misc,
2747 perf_event__handler_t process,
2748 struct machine *machine)
2749 {
2750 union perf_event ev;
2751 size_t len;
2752 int err = 0;
2753
2754 if (!pos->hit)
2755 return err;
2756
2757 memset(&ev, 0, sizeof(ev));
2758
2759 len = pos->long_name_len + 1;
2760 len = PERF_ALIGN(len, NAME_ALIGN);
2761 memcpy(&ev.build_id.build_id, pos->build_id, sizeof(pos->build_id));
2762 ev.build_id.header.type = PERF_RECORD_HEADER_BUILD_ID;
2763 ev.build_id.header.misc = misc;
2764 ev.build_id.pid = machine->pid;
2765 ev.build_id.header.size = sizeof(ev.build_id) + len;
2766 memcpy(&ev.build_id.filename, pos->long_name, pos->long_name_len);
2767
2768 err = process(tool, &ev, NULL, machine);
2769
2770 return err;
2771 }
2772
perf_event__process_build_id(struct perf_tool * tool __maybe_unused,union perf_event * event,struct perf_session * session)2773 int perf_event__process_build_id(struct perf_tool *tool __maybe_unused,
2774 union perf_event *event,
2775 struct perf_session *session)
2776 {
2777 __event_process_build_id(&event->build_id,
2778 event->build_id.filename,
2779 session);
2780 return 0;
2781 }
2782