e2ba261d158358f41a9148eed39546a4f83c4145
[linux-2.6-microblaze.git] / tools / perf / util / header.c
1 // SPDX-License-Identifier: GPL-2.0
2 #include <errno.h>
3 #include <inttypes.h>
4 #include "string2.h"
5 #include <sys/param.h>
6 #include <sys/types.h>
7 #include <byteswap.h>
8 #include <unistd.h>
9 #include <stdio.h>
10 #include <stdlib.h>
11 #include <linux/compiler.h>
12 #include <linux/list.h>
13 #include <linux/kernel.h>
14 #include <linux/bitops.h>
15 #include <linux/string.h>
16 #include <linux/stringify.h>
17 #include <linux/zalloc.h>
18 #include <sys/stat.h>
19 #include <sys/utsname.h>
20 #include <linux/time64.h>
21 #include <dirent.h>
22 #ifdef HAVE_LIBBPF_SUPPORT
23 #include <bpf/libbpf.h>
24 #endif
25 #include <perf/cpumap.h>
26
27 #include "dso.h"
28 #include "evlist.h"
29 #include "evsel.h"
30 #include "util/evsel_fprintf.h"
31 #include "header.h"
32 #include "memswap.h"
33 #include "trace-event.h"
34 #include "session.h"
35 #include "symbol.h"
36 #include "debug.h"
37 #include "cpumap.h"
38 #include "pmu.h"
39 #include "vdso.h"
40 #include "strbuf.h"
41 #include "build-id.h"
42 #include "data.h"
43 #include <api/fs/fs.h>
44 #include "asm/bug.h"
45 #include "tool.h"
46 #include "time-utils.h"
47 #include "units.h"
48 #include "util/util.h" // perf_exe()
49 #include "cputopo.h"
50 #include "bpf-event.h"
51 #include "bpf-utils.h"
52 #include "clockid.h"
53 #include "pmu-hybrid.h"
54
55 #include <linux/ctype.h>
56 #include <internal/lib.h>
57
58 /*
59  * magic2 = "PERFILE2"
60  * must be a numerical value to let the endianness
61  * determine the memory layout. That way we are able
62  * to detect endianness when reading the perf.data file
63  * back.
64  *
65  * we check for legacy (PERFFILE) format.
66  */
67 static const char *__perf_magic1 = "PERFFILE";
68 static const u64 __perf_magic2    = 0x32454c4946524550ULL;
69 static const u64 __perf_magic2_sw = 0x50455246494c4532ULL;
70
71 #define PERF_MAGIC      __perf_magic2
72
73 const char perf_version_string[] = PERF_VERSION;
74
75 struct perf_file_attr {
76         struct perf_event_attr  attr;
77         struct perf_file_section        ids;
78 };
79
80 void perf_header__set_feat(struct perf_header *header, int feat)
81 {
82         set_bit(feat, header->adds_features);
83 }
84
85 void perf_header__clear_feat(struct perf_header *header, int feat)
86 {
87         clear_bit(feat, header->adds_features);
88 }
89
90 bool perf_header__has_feat(const struct perf_header *header, int feat)
91 {
92         return test_bit(feat, header->adds_features);
93 }
94
95 static int __do_write_fd(struct feat_fd *ff, const void *buf, size_t size)
96 {
97         ssize_t ret = writen(ff->fd, buf, size);
98
99         if (ret != (ssize_t)size)
100                 return ret < 0 ? (int)ret : -1;
101         return 0;
102 }
103
104 static int __do_write_buf(struct feat_fd *ff,  const void *buf, size_t size)
105 {
106         /* struct perf_event_header::size is u16 */
107         const size_t max_size = 0xffff - sizeof(struct perf_event_header);
108         size_t new_size = ff->size;
109         void *addr;
110
111         if (size + ff->offset > max_size)
112                 return -E2BIG;
113
114         while (size > (new_size - ff->offset))
115                 new_size <<= 1;
116         new_size = min(max_size, new_size);
117
118         if (ff->size < new_size) {
119                 addr = realloc(ff->buf, new_size);
120                 if (!addr)
121                         return -ENOMEM;
122                 ff->buf = addr;
123                 ff->size = new_size;
124         }
125
126         memcpy(ff->buf + ff->offset, buf, size);
127         ff->offset += size;
128
129         return 0;
130 }
131
132 /* Return: 0 if succeeded, -ERR if failed. */
133 int do_write(struct feat_fd *ff, const void *buf, size_t size)
134 {
135         if (!ff->buf)
136                 return __do_write_fd(ff, buf, size);
137         return __do_write_buf(ff, buf, size);
138 }
139
140 /* Return: 0 if succeeded, -ERR if failed. */
141 static int do_write_bitmap(struct feat_fd *ff, unsigned long *set, u64 size)
142 {
143         u64 *p = (u64 *) set;
144         int i, ret;
145
146         ret = do_write(ff, &size, sizeof(size));
147         if (ret < 0)
148                 return ret;
149
150         for (i = 0; (u64) i < BITS_TO_U64(size); i++) {
151                 ret = do_write(ff, p + i, sizeof(*p));
152                 if (ret < 0)
153                         return ret;
154         }
155
156         return 0;
157 }
158
159 /* Return: 0 if succeeded, -ERR if failed. */
160 int write_padded(struct feat_fd *ff, const void *bf,
161                  size_t count, size_t count_aligned)
162 {
163         static const char zero_buf[NAME_ALIGN];
164         int err = do_write(ff, bf, count);
165
166         if (!err)
167                 err = do_write(ff, zero_buf, count_aligned - count);
168
169         return err;
170 }
171
172 #define string_size(str)                                                \
173         (PERF_ALIGN((strlen(str) + 1), NAME_ALIGN) + sizeof(u32))
174
175 /* Return: 0 if succeeded, -ERR if failed. */
176 static int do_write_string(struct feat_fd *ff, const char *str)
177 {
178         u32 len, olen;
179         int ret;
180
181         olen = strlen(str) + 1;
182         len = PERF_ALIGN(olen, NAME_ALIGN);
183
184         /* write len, incl. \0 */
185         ret = do_write(ff, &len, sizeof(len));
186         if (ret < 0)
187                 return ret;
188
189         return write_padded(ff, str, olen, len);
190 }
191
192 static int __do_read_fd(struct feat_fd *ff, void *addr, ssize_t size)
193 {
194         ssize_t ret = readn(ff->fd, addr, size);
195
196         if (ret != size)
197                 return ret < 0 ? (int)ret : -1;
198         return 0;
199 }
200
201 static int __do_read_buf(struct feat_fd *ff, void *addr, ssize_t size)
202 {
203         if (size > (ssize_t)ff->size - ff->offset)
204                 return -1;
205
206         memcpy(addr, ff->buf + ff->offset, size);
207         ff->offset += size;
208
209         return 0;
210
211 }
212
213 static int __do_read(struct feat_fd *ff, void *addr, ssize_t size)
214 {
215         if (!ff->buf)
216                 return __do_read_fd(ff, addr, size);
217         return __do_read_buf(ff, addr, size);
218 }
219
220 static int do_read_u32(struct feat_fd *ff, u32 *addr)
221 {
222         int ret;
223
224         ret = __do_read(ff, addr, sizeof(*addr));
225         if (ret)
226                 return ret;
227
228         if (ff->ph->needs_swap)
229                 *addr = bswap_32(*addr);
230         return 0;
231 }
232
233 static int do_read_u64(struct feat_fd *ff, u64 *addr)
234 {
235         int ret;
236
237         ret = __do_read(ff, addr, sizeof(*addr));
238         if (ret)
239                 return ret;
240
241         if (ff->ph->needs_swap)
242                 *addr = bswap_64(*addr);
243         return 0;
244 }
245
246 static char *do_read_string(struct feat_fd *ff)
247 {
248         u32 len;
249         char *buf;
250
251         if (do_read_u32(ff, &len))
252                 return NULL;
253
254         buf = malloc(len);
255         if (!buf)
256                 return NULL;
257
258         if (!__do_read(ff, buf, len)) {
259                 /*
260                  * strings are padded by zeroes
261                  * thus the actual strlen of buf
262                  * may be less than len
263                  */
264                 return buf;
265         }
266
267         free(buf);
268         return NULL;
269 }
270
271 /* Return: 0 if succeeded, -ERR if failed. */
272 static int do_read_bitmap(struct feat_fd *ff, unsigned long **pset, u64 *psize)
273 {
274         unsigned long *set;
275         u64 size, *p;
276         int i, ret;
277
278         ret = do_read_u64(ff, &size);
279         if (ret)
280                 return ret;
281
282         set = bitmap_zalloc(size);
283         if (!set)
284                 return -ENOMEM;
285
286         p = (u64 *) set;
287
288         for (i = 0; (u64) i < BITS_TO_U64(size); i++) {
289                 ret = do_read_u64(ff, p + i);
290                 if (ret < 0) {
291                         free(set);
292                         return ret;
293                 }
294         }
295
296         *pset  = set;
297         *psize = size;
298         return 0;
299 }
300
301 static int write_tracing_data(struct feat_fd *ff,
302                               struct evlist *evlist)
303 {
304         if (WARN(ff->buf, "Error: calling %s in pipe-mode.\n", __func__))
305                 return -1;
306
307         return read_tracing_data(ff->fd, &evlist->core.entries);
308 }
309
310 static int write_build_id(struct feat_fd *ff,
311                           struct evlist *evlist __maybe_unused)
312 {
313         struct perf_session *session;
314         int err;
315
316         session = container_of(ff->ph, struct perf_session, header);
317
318         if (!perf_session__read_build_ids(session, true))
319                 return -1;
320
321         if (WARN(ff->buf, "Error: calling %s in pipe-mode.\n", __func__))
322                 return -1;
323
324         err = perf_session__write_buildid_table(session, ff);
325         if (err < 0) {
326                 pr_debug("failed to write buildid table\n");
327                 return err;
328         }
329         perf_session__cache_build_ids(session);
330
331         return 0;
332 }
333
334 static int write_hostname(struct feat_fd *ff,
335                           struct evlist *evlist __maybe_unused)
336 {
337         struct utsname uts;
338         int ret;
339
340         ret = uname(&uts);
341         if (ret < 0)
342                 return -1;
343
344         return do_write_string(ff, uts.nodename);
345 }
346
347 static int write_osrelease(struct feat_fd *ff,
348                            struct evlist *evlist __maybe_unused)
349 {
350         struct utsname uts;
351         int ret;
352
353         ret = uname(&uts);
354         if (ret < 0)
355                 return -1;
356
357         return do_write_string(ff, uts.release);
358 }
359
360 static int write_arch(struct feat_fd *ff,
361                       struct evlist *evlist __maybe_unused)
362 {
363         struct utsname uts;
364         int ret;
365
366         ret = uname(&uts);
367         if (ret < 0)
368                 return -1;
369
370         return do_write_string(ff, uts.machine);
371 }
372
373 static int write_version(struct feat_fd *ff,
374                          struct evlist *evlist __maybe_unused)
375 {
376         return do_write_string(ff, perf_version_string);
377 }
378
379 static int __write_cpudesc(struct feat_fd *ff, const char *cpuinfo_proc)
380 {
381         FILE *file;
382         char *buf = NULL;
383         char *s, *p;
384         const char *search = cpuinfo_proc;
385         size_t len = 0;
386         int ret = -1;
387
388         if (!search)
389                 return -1;
390
391         file = fopen("/proc/cpuinfo", "r");
392         if (!file)
393                 return -1;
394
395         while (getline(&buf, &len, file) > 0) {
396                 ret = strncmp(buf, search, strlen(search));
397                 if (!ret)
398                         break;
399         }
400
401         if (ret) {
402                 ret = -1;
403                 goto done;
404         }
405
406         s = buf;
407
408         p = strchr(buf, ':');
409         if (p && *(p+1) == ' ' && *(p+2))
410                 s = p + 2;
411         p = strchr(s, '\n');
412         if (p)
413                 *p = '\0';
414
415         /* squash extra space characters (branding string) */
416         p = s;
417         while (*p) {
418                 if (isspace(*p)) {
419                         char *r = p + 1;
420                         char *q = skip_spaces(r);
421                         *p = ' ';
422                         if (q != (p+1))
423                                 while ((*r++ = *q++));
424                 }
425                 p++;
426         }
427         ret = do_write_string(ff, s);
428 done:
429         free(buf);
430         fclose(file);
431         return ret;
432 }
433
434 static int write_cpudesc(struct feat_fd *ff,
435                        struct evlist *evlist __maybe_unused)
436 {
437 #if defined(__powerpc__) || defined(__hppa__) || defined(__sparc__)
438 #define CPUINFO_PROC    { "cpu", }
439 #elif defined(__s390__)
440 #define CPUINFO_PROC    { "vendor_id", }
441 #elif defined(__sh__)
442 #define CPUINFO_PROC    { "cpu type", }
443 #elif defined(__alpha__) || defined(__mips__)
444 #define CPUINFO_PROC    { "cpu model", }
445 #elif defined(__arm__)
446 #define CPUINFO_PROC    { "model name", "Processor", }
447 #elif defined(__arc__)
448 #define CPUINFO_PROC    { "Processor", }
449 #elif defined(__xtensa__)
450 #define CPUINFO_PROC    { "core ID", }
451 #else
452 #define CPUINFO_PROC    { "model name", }
453 #endif
454         const char *cpuinfo_procs[] = CPUINFO_PROC;
455 #undef CPUINFO_PROC
456         unsigned int i;
457
458         for (i = 0; i < ARRAY_SIZE(cpuinfo_procs); i++) {
459                 int ret;
460                 ret = __write_cpudesc(ff, cpuinfo_procs[i]);
461                 if (ret >= 0)
462                         return ret;
463         }
464         return -1;
465 }
466
467
468 static int write_nrcpus(struct feat_fd *ff,
469                         struct evlist *evlist __maybe_unused)
470 {
471         long nr;
472         u32 nrc, nra;
473         int ret;
474
475         nrc = cpu__max_present_cpu();
476
477         nr = sysconf(_SC_NPROCESSORS_ONLN);
478         if (nr < 0)
479                 return -1;
480
481         nra = (u32)(nr & UINT_MAX);
482
483         ret = do_write(ff, &nrc, sizeof(nrc));
484         if (ret < 0)
485                 return ret;
486
487         return do_write(ff, &nra, sizeof(nra));
488 }
489
490 static int write_event_desc(struct feat_fd *ff,
491                             struct evlist *evlist)
492 {
493         struct evsel *evsel;
494         u32 nre, nri, sz;
495         int ret;
496
497         nre = evlist->core.nr_entries;
498
499         /*
500          * write number of events
501          */
502         ret = do_write(ff, &nre, sizeof(nre));
503         if (ret < 0)
504                 return ret;
505
506         /*
507          * size of perf_event_attr struct
508          */
509         sz = (u32)sizeof(evsel->core.attr);
510         ret = do_write(ff, &sz, sizeof(sz));
511         if (ret < 0)
512                 return ret;
513
514         evlist__for_each_entry(evlist, evsel) {
515                 ret = do_write(ff, &evsel->core.attr, sz);
516                 if (ret < 0)
517                         return ret;
518                 /*
519                  * write number of unique id per event
520                  * there is one id per instance of an event
521                  *
522                  * copy into an nri to be independent of the
523                  * type of ids,
524                  */
525                 nri = evsel->core.ids;
526                 ret = do_write(ff, &nri, sizeof(nri));
527                 if (ret < 0)
528                         return ret;
529
530                 /*
531                  * write event string as passed on cmdline
532                  */
533                 ret = do_write_string(ff, evsel__name(evsel));
534                 if (ret < 0)
535                         return ret;
536                 /*
537                  * write unique ids for this event
538                  */
539                 ret = do_write(ff, evsel->core.id, evsel->core.ids * sizeof(u64));
540                 if (ret < 0)
541                         return ret;
542         }
543         return 0;
544 }
545
546 static int write_cmdline(struct feat_fd *ff,
547                          struct evlist *evlist __maybe_unused)
548 {
549         char pbuf[MAXPATHLEN], *buf;
550         int i, ret, n;
551
552         /* actual path to perf binary */
553         buf = perf_exe(pbuf, MAXPATHLEN);
554
555         /* account for binary path */
556         n = perf_env.nr_cmdline + 1;
557
558         ret = do_write(ff, &n, sizeof(n));
559         if (ret < 0)
560                 return ret;
561
562         ret = do_write_string(ff, buf);
563         if (ret < 0)
564                 return ret;
565
566         for (i = 0 ; i < perf_env.nr_cmdline; i++) {
567                 ret = do_write_string(ff, perf_env.cmdline_argv[i]);
568                 if (ret < 0)
569                         return ret;
570         }
571         return 0;
572 }
573
574
575 static int write_cpu_topology(struct feat_fd *ff,
576                               struct evlist *evlist __maybe_unused)
577 {
578         struct cpu_topology *tp;
579         u32 i;
580         int ret, j;
581
582         tp = cpu_topology__new();
583         if (!tp)
584                 return -1;
585
586         ret = do_write(ff, &tp->package_cpus_lists, sizeof(tp->package_cpus_lists));
587         if (ret < 0)
588                 goto done;
589
590         for (i = 0; i < tp->package_cpus_lists; i++) {
591                 ret = do_write_string(ff, tp->package_cpus_list[i]);
592                 if (ret < 0)
593                         goto done;
594         }
595         ret = do_write(ff, &tp->thread_sib, sizeof(tp->thread_sib));
596         if (ret < 0)
597                 goto done;
598
599         for (i = 0; i < tp->thread_sib; i++) {
600                 ret = do_write_string(ff, tp->thread_siblings[i]);
601                 if (ret < 0)
602                         break;
603         }
604
605         ret = perf_env__read_cpu_topology_map(&perf_env);
606         if (ret < 0)
607                 goto done;
608
609         for (j = 0; j < perf_env.nr_cpus_avail; j++) {
610                 ret = do_write(ff, &perf_env.cpu[j].core_id,
611                                sizeof(perf_env.cpu[j].core_id));
612                 if (ret < 0)
613                         return ret;
614                 ret = do_write(ff, &perf_env.cpu[j].socket_id,
615                                sizeof(perf_env.cpu[j].socket_id));
616                 if (ret < 0)
617                         return ret;
618         }
619
620         if (!tp->die_cpus_lists)
621                 goto done;
622
623         ret = do_write(ff, &tp->die_cpus_lists, sizeof(tp->die_cpus_lists));
624         if (ret < 0)
625                 goto done;
626
627         for (i = 0; i < tp->die_cpus_lists; i++) {
628                 ret = do_write_string(ff, tp->die_cpus_list[i]);
629                 if (ret < 0)
630                         goto done;
631         }
632
633         for (j = 0; j < perf_env.nr_cpus_avail; j++) {
634                 ret = do_write(ff, &perf_env.cpu[j].die_id,
635                                sizeof(perf_env.cpu[j].die_id));
636                 if (ret < 0)
637                         return ret;
638         }
639
640 done:
641         cpu_topology__delete(tp);
642         return ret;
643 }
644
645
646
647 static int write_total_mem(struct feat_fd *ff,
648                            struct evlist *evlist __maybe_unused)
649 {
650         char *buf = NULL;
651         FILE *fp;
652         size_t len = 0;
653         int ret = -1, n;
654         uint64_t mem;
655
656         fp = fopen("/proc/meminfo", "r");
657         if (!fp)
658                 return -1;
659
660         while (getline(&buf, &len, fp) > 0) {
661                 ret = strncmp(buf, "MemTotal:", 9);
662                 if (!ret)
663                         break;
664         }
665         if (!ret) {
666                 n = sscanf(buf, "%*s %"PRIu64, &mem);
667                 if (n == 1)
668                         ret = do_write(ff, &mem, sizeof(mem));
669         } else
670                 ret = -1;
671         free(buf);
672         fclose(fp);
673         return ret;
674 }
675
676 static int write_numa_topology(struct feat_fd *ff,
677                                struct evlist *evlist __maybe_unused)
678 {
679         struct numa_topology *tp;
680         int ret = -1;
681         u32 i;
682
683         tp = numa_topology__new();
684         if (!tp)
685                 return -ENOMEM;
686
687         ret = do_write(ff, &tp->nr, sizeof(u32));
688         if (ret < 0)
689                 goto err;
690
691         for (i = 0; i < tp->nr; i++) {
692                 struct numa_topology_node *n = &tp->nodes[i];
693
694                 ret = do_write(ff, &n->node, sizeof(u32));
695                 if (ret < 0)
696                         goto err;
697
698                 ret = do_write(ff, &n->mem_total, sizeof(u64));
699                 if (ret)
700                         goto err;
701
702                 ret = do_write(ff, &n->mem_free, sizeof(u64));
703                 if (ret)
704                         goto err;
705
706                 ret = do_write_string(ff, n->cpus);
707                 if (ret < 0)
708                         goto err;
709         }
710
711         ret = 0;
712
713 err:
714         numa_topology__delete(tp);
715         return ret;
716 }
717
718 /*
719  * File format:
720  *
721  * struct pmu_mappings {
722  *      u32     pmu_num;
723  *      struct pmu_map {
724  *              u32     type;
725  *              char    name[];
726  *      }[pmu_num];
727  * };
728  */
729
730 static int write_pmu_mappings(struct feat_fd *ff,
731                               struct evlist *evlist __maybe_unused)
732 {
733         struct perf_pmu *pmu = NULL;
734         u32 pmu_num = 0;
735         int ret;
736
737         /*
738          * Do a first pass to count number of pmu to avoid lseek so this
739          * works in pipe mode as well.
740          */
741         while ((pmu = perf_pmu__scan(pmu))) {
742                 if (!pmu->name)
743                         continue;
744                 pmu_num++;
745         }
746
747         ret = do_write(ff, &pmu_num, sizeof(pmu_num));
748         if (ret < 0)
749                 return ret;
750
751         while ((pmu = perf_pmu__scan(pmu))) {
752                 if (!pmu->name)
753                         continue;
754
755                 ret = do_write(ff, &pmu->type, sizeof(pmu->type));
756                 if (ret < 0)
757                         return ret;
758
759                 ret = do_write_string(ff, pmu->name);
760                 if (ret < 0)
761                         return ret;
762         }
763
764         return 0;
765 }
766
767 /*
768  * File format:
769  *
770  * struct group_descs {
771  *      u32     nr_groups;
772  *      struct group_desc {
773  *              char    name[];
774  *              u32     leader_idx;
775  *              u32     nr_members;
776  *      }[nr_groups];
777  * };
778  */
779 static int write_group_desc(struct feat_fd *ff,
780                             struct evlist *evlist)
781 {
782         u32 nr_groups = evlist->core.nr_groups;
783         struct evsel *evsel;
784         int ret;
785
786         ret = do_write(ff, &nr_groups, sizeof(nr_groups));
787         if (ret < 0)
788                 return ret;
789
790         evlist__for_each_entry(evlist, evsel) {
791                 if (evsel__is_group_leader(evsel) && evsel->core.nr_members > 1) {
792                         const char *name = evsel->group_name ?: "{anon_group}";
793                         u32 leader_idx = evsel->core.idx;
794                         u32 nr_members = evsel->core.nr_members;
795
796                         ret = do_write_string(ff, name);
797                         if (ret < 0)
798                                 return ret;
799
800                         ret = do_write(ff, &leader_idx, sizeof(leader_idx));
801                         if (ret < 0)
802                                 return ret;
803
804                         ret = do_write(ff, &nr_members, sizeof(nr_members));
805                         if (ret < 0)
806                                 return ret;
807                 }
808         }
809         return 0;
810 }
811
812 /*
813  * Return the CPU id as a raw string.
814  *
815  * Each architecture should provide a more precise id string that
816  * can be use to match the architecture's "mapfile".
817  */
818 char * __weak get_cpuid_str(struct perf_pmu *pmu __maybe_unused)
819 {
820         return NULL;
821 }
822
823 /* Return zero when the cpuid from the mapfile.csv matches the
824  * cpuid string generated on this platform.
825  * Otherwise return non-zero.
826  */
827 int __weak strcmp_cpuid_str(const char *mapcpuid, const char *cpuid)
828 {
829         regex_t re;
830         regmatch_t pmatch[1];
831         int match;
832
833         if (regcomp(&re, mapcpuid, REG_EXTENDED) != 0) {
834                 /* Warn unable to generate match particular string. */
835                 pr_info("Invalid regular expression %s\n", mapcpuid);
836                 return 1;
837         }
838
839         match = !regexec(&re, cpuid, 1, pmatch, 0);
840         regfree(&re);
841         if (match) {
842                 size_t match_len = (pmatch[0].rm_eo - pmatch[0].rm_so);
843
844                 /* Verify the entire string matched. */
845                 if (match_len == strlen(cpuid))
846                         return 0;
847         }
848         return 1;
849 }
850
851 /*
852  * default get_cpuid(): nothing gets recorded
853  * actual implementation must be in arch/$(SRCARCH)/util/header.c
854  */
855 int __weak get_cpuid(char *buffer __maybe_unused, size_t sz __maybe_unused)
856 {
857         return ENOSYS; /* Not implemented */
858 }
859
860 static int write_cpuid(struct feat_fd *ff,
861                        struct evlist *evlist __maybe_unused)
862 {
863         char buffer[64];
864         int ret;
865
866         ret = get_cpuid(buffer, sizeof(buffer));
867         if (ret)
868                 return -1;
869
870         return do_write_string(ff, buffer);
871 }
872
873 static int write_branch_stack(struct feat_fd *ff __maybe_unused,
874                               struct evlist *evlist __maybe_unused)
875 {
876         return 0;
877 }
878
879 static int write_auxtrace(struct feat_fd *ff,
880                           struct evlist *evlist __maybe_unused)
881 {
882         struct perf_session *session;
883         int err;
884
885         if (WARN(ff->buf, "Error: calling %s in pipe-mode.\n", __func__))
886                 return -1;
887
888         session = container_of(ff->ph, struct perf_session, header);
889
890         err = auxtrace_index__write(ff->fd, &session->auxtrace_index);
891         if (err < 0)
892                 pr_err("Failed to write auxtrace index\n");
893         return err;
894 }
895
896 static int write_clockid(struct feat_fd *ff,
897                          struct evlist *evlist __maybe_unused)
898 {
899         return do_write(ff, &ff->ph->env.clock.clockid_res_ns,
900                         sizeof(ff->ph->env.clock.clockid_res_ns));
901 }
902
903 static int write_clock_data(struct feat_fd *ff,
904                             struct evlist *evlist __maybe_unused)
905 {
906         u64 *data64;
907         u32 data32;
908         int ret;
909
910         /* version */
911         data32 = 1;
912
913         ret = do_write(ff, &data32, sizeof(data32));
914         if (ret < 0)
915                 return ret;
916
917         /* clockid */
918         data32 = ff->ph->env.clock.clockid;
919
920         ret = do_write(ff, &data32, sizeof(data32));
921         if (ret < 0)
922                 return ret;
923
924         /* TOD ref time */
925         data64 = &ff->ph->env.clock.tod_ns;
926
927         ret = do_write(ff, data64, sizeof(*data64));
928         if (ret < 0)
929                 return ret;
930
931         /* clockid ref time */
932         data64 = &ff->ph->env.clock.clockid_ns;
933
934         return do_write(ff, data64, sizeof(*data64));
935 }
936
937 static int write_hybrid_topology(struct feat_fd *ff,
938                                  struct evlist *evlist __maybe_unused)
939 {
940         struct hybrid_topology *tp;
941         int ret;
942         u32 i;
943
944         tp = hybrid_topology__new();
945         if (!tp)
946                 return -ENOENT;
947
948         ret = do_write(ff, &tp->nr, sizeof(u32));
949         if (ret < 0)
950                 goto err;
951
952         for (i = 0; i < tp->nr; i++) {
953                 struct hybrid_topology_node *n = &tp->nodes[i];
954
955                 ret = do_write_string(ff, n->pmu_name);
956                 if (ret < 0)
957                         goto err;
958
959                 ret = do_write_string(ff, n->cpus);
960                 if (ret < 0)
961                         goto err;
962         }
963
964         ret = 0;
965
966 err:
967         hybrid_topology__delete(tp);
968         return ret;
969 }
970
971 static int write_dir_format(struct feat_fd *ff,
972                             struct evlist *evlist __maybe_unused)
973 {
974         struct perf_session *session;
975         struct perf_data *data;
976
977         session = container_of(ff->ph, struct perf_session, header);
978         data = session->data;
979
980         if (WARN_ON(!perf_data__is_dir(data)))
981                 return -1;
982
983         return do_write(ff, &data->dir.version, sizeof(data->dir.version));
984 }
985
986 #ifdef HAVE_LIBBPF_SUPPORT
987 static int write_bpf_prog_info(struct feat_fd *ff,
988                                struct evlist *evlist __maybe_unused)
989 {
990         struct perf_env *env = &ff->ph->env;
991         struct rb_root *root;
992         struct rb_node *next;
993         int ret;
994
995         down_read(&env->bpf_progs.lock);
996
997         ret = do_write(ff, &env->bpf_progs.infos_cnt,
998                        sizeof(env->bpf_progs.infos_cnt));
999         if (ret < 0)
1000                 goto out;
1001
1002         root = &env->bpf_progs.infos;
1003         next = rb_first(root);
1004         while (next) {
1005                 struct bpf_prog_info_node *node;
1006                 size_t len;
1007
1008                 node = rb_entry(next, struct bpf_prog_info_node, rb_node);
1009                 next = rb_next(&node->rb_node);
1010                 len = sizeof(struct perf_bpil) +
1011                         node->info_linear->data_len;
1012
1013                 /* before writing to file, translate address to offset */
1014                 bpil_addr_to_offs(node->info_linear);
1015                 ret = do_write(ff, node->info_linear, len);
1016                 /*
1017                  * translate back to address even when do_write() fails,
1018                  * so that this function never changes the data.
1019                  */
1020                 bpil_offs_to_addr(node->info_linear);
1021                 if (ret < 0)
1022                         goto out;
1023         }
1024 out:
1025         up_read(&env->bpf_progs.lock);
1026         return ret;
1027 }
1028
1029 static int write_bpf_btf(struct feat_fd *ff,
1030                          struct evlist *evlist __maybe_unused)
1031 {
1032         struct perf_env *env = &ff->ph->env;
1033         struct rb_root *root;
1034         struct rb_node *next;
1035         int ret;
1036
1037         down_read(&env->bpf_progs.lock);
1038
1039         ret = do_write(ff, &env->bpf_progs.btfs_cnt,
1040                        sizeof(env->bpf_progs.btfs_cnt));
1041
1042         if (ret < 0)
1043                 goto out;
1044
1045         root = &env->bpf_progs.btfs;
1046         next = rb_first(root);
1047         while (next) {
1048                 struct btf_node *node;
1049
1050                 node = rb_entry(next, struct btf_node, rb_node);
1051                 next = rb_next(&node->rb_node);
1052                 ret = do_write(ff, &node->id,
1053                                sizeof(u32) * 2 + node->data_size);
1054                 if (ret < 0)
1055                         goto out;
1056         }
1057 out:
1058         up_read(&env->bpf_progs.lock);
1059         return ret;
1060 }
1061 #endif // HAVE_LIBBPF_SUPPORT
1062
1063 static int cpu_cache_level__sort(const void *a, const void *b)
1064 {
1065         struct cpu_cache_level *cache_a = (struct cpu_cache_level *)a;
1066         struct cpu_cache_level *cache_b = (struct cpu_cache_level *)b;
1067
1068         return cache_a->level - cache_b->level;
1069 }
1070
1071 static bool cpu_cache_level__cmp(struct cpu_cache_level *a, struct cpu_cache_level *b)
1072 {
1073         if (a->level != b->level)
1074                 return false;
1075
1076         if (a->line_size != b->line_size)
1077                 return false;
1078
1079         if (a->sets != b->sets)
1080                 return false;
1081
1082         if (a->ways != b->ways)
1083                 return false;
1084
1085         if (strcmp(a->type, b->type))
1086                 return false;
1087
1088         if (strcmp(a->size, b->size))
1089                 return false;
1090
1091         if (strcmp(a->map, b->map))
1092                 return false;
1093
1094         return true;
1095 }
1096
1097 static int cpu_cache_level__read(struct cpu_cache_level *cache, u32 cpu, u16 level)
1098 {
1099         char path[PATH_MAX], file[PATH_MAX];
1100         struct stat st;
1101         size_t len;
1102
1103         scnprintf(path, PATH_MAX, "devices/system/cpu/cpu%d/cache/index%d/", cpu, level);
1104         scnprintf(file, PATH_MAX, "%s/%s", sysfs__mountpoint(), path);
1105
1106         if (stat(file, &st))
1107                 return 1;
1108
1109         scnprintf(file, PATH_MAX, "%s/level", path);
1110         if (sysfs__read_int(file, (int *) &cache->level))
1111                 return -1;
1112
1113         scnprintf(file, PATH_MAX, "%s/coherency_line_size", path);
1114         if (sysfs__read_int(file, (int *) &cache->line_size))
1115                 return -1;
1116
1117         scnprintf(file, PATH_MAX, "%s/number_of_sets", path);
1118         if (sysfs__read_int(file, (int *) &cache->sets))
1119                 return -1;
1120
1121         scnprintf(file, PATH_MAX, "%s/ways_of_associativity", path);
1122         if (sysfs__read_int(file, (int *) &cache->ways))
1123                 return -1;
1124
1125         scnprintf(file, PATH_MAX, "%s/type", path);
1126         if (sysfs__read_str(file, &cache->type, &len))
1127                 return -1;
1128
1129         cache->type[len] = 0;
1130         cache->type = strim(cache->type);
1131
1132         scnprintf(file, PATH_MAX, "%s/size", path);
1133         if (sysfs__read_str(file, &cache->size, &len)) {
1134                 zfree(&cache->type);
1135                 return -1;
1136         }
1137
1138         cache->size[len] = 0;
1139         cache->size = strim(cache->size);
1140
1141         scnprintf(file, PATH_MAX, "%s/shared_cpu_list", path);
1142         if (sysfs__read_str(file, &cache->map, &len)) {
1143                 zfree(&cache->size);
1144                 zfree(&cache->type);
1145                 return -1;
1146         }
1147
1148         cache->map[len] = 0;
1149         cache->map = strim(cache->map);
1150         return 0;
1151 }
1152
1153 static void cpu_cache_level__fprintf(FILE *out, struct cpu_cache_level *c)
1154 {
1155         fprintf(out, "L%d %-15s %8s [%s]\n", c->level, c->type, c->size, c->map);
1156 }
1157
1158 #define MAX_CACHE_LVL 4
1159
1160 static int build_caches(struct cpu_cache_level caches[], u32 *cntp)
1161 {
1162         u32 i, cnt = 0;
1163         u32 nr, cpu;
1164         u16 level;
1165
1166         nr = cpu__max_cpu();
1167
1168         for (cpu = 0; cpu < nr; cpu++) {
1169                 for (level = 0; level < MAX_CACHE_LVL; level++) {
1170                         struct cpu_cache_level c;
1171                         int err;
1172
1173                         err = cpu_cache_level__read(&c, cpu, level);
1174                         if (err < 0)
1175                                 return err;
1176
1177                         if (err == 1)
1178                                 break;
1179
1180                         for (i = 0; i < cnt; i++) {
1181                                 if (cpu_cache_level__cmp(&c, &caches[i]))
1182                                         break;
1183                         }
1184
1185                         if (i == cnt)
1186                                 caches[cnt++] = c;
1187                         else
1188                                 cpu_cache_level__free(&c);
1189                 }
1190         }
1191         *cntp = cnt;
1192         return 0;
1193 }
1194
1195 static int write_cache(struct feat_fd *ff,
1196                        struct evlist *evlist __maybe_unused)
1197 {
1198         u32 max_caches = cpu__max_cpu() * MAX_CACHE_LVL;
1199         struct cpu_cache_level caches[max_caches];
1200         u32 cnt = 0, i, version = 1;
1201         int ret;
1202
1203         ret = build_caches(caches, &cnt);
1204         if (ret)
1205                 goto out;
1206
1207         qsort(&caches, cnt, sizeof(struct cpu_cache_level), cpu_cache_level__sort);
1208
1209         ret = do_write(ff, &version, sizeof(u32));
1210         if (ret < 0)
1211                 goto out;
1212
1213         ret = do_write(ff, &cnt, sizeof(u32));
1214         if (ret < 0)
1215                 goto out;
1216
1217         for (i = 0; i < cnt; i++) {
1218                 struct cpu_cache_level *c = &caches[i];
1219
1220                 #define _W(v)                                   \
1221                         ret = do_write(ff, &c->v, sizeof(u32)); \
1222                         if (ret < 0)                            \
1223                                 goto out;
1224
1225                 _W(level)
1226                 _W(line_size)
1227                 _W(sets)
1228                 _W(ways)
1229                 #undef _W
1230
1231                 #define _W(v)                                           \
1232                         ret = do_write_string(ff, (const char *) c->v); \
1233                         if (ret < 0)                                    \
1234                                 goto out;
1235
1236                 _W(type)
1237                 _W(size)
1238                 _W(map)
1239                 #undef _W
1240         }
1241
1242 out:
1243         for (i = 0; i < cnt; i++)
1244                 cpu_cache_level__free(&caches[i]);
1245         return ret;
1246 }
1247
1248 static int write_stat(struct feat_fd *ff __maybe_unused,
1249                       struct evlist *evlist __maybe_unused)
1250 {
1251         return 0;
1252 }
1253
1254 static int write_sample_time(struct feat_fd *ff,
1255                              struct evlist *evlist)
1256 {
1257         int ret;
1258
1259         ret = do_write(ff, &evlist->first_sample_time,
1260                        sizeof(evlist->first_sample_time));
1261         if (ret < 0)
1262                 return ret;
1263
1264         return do_write(ff, &evlist->last_sample_time,
1265                         sizeof(evlist->last_sample_time));
1266 }
1267
1268
1269 static int memory_node__read(struct memory_node *n, unsigned long idx)
1270 {
1271         unsigned int phys, size = 0;
1272         char path[PATH_MAX];
1273         struct dirent *ent;
1274         DIR *dir;
1275
1276 #define for_each_memory(mem, dir)                                       \
1277         while ((ent = readdir(dir)))                                    \
1278                 if (strcmp(ent->d_name, ".") &&                         \
1279                     strcmp(ent->d_name, "..") &&                        \
1280                     sscanf(ent->d_name, "memory%u", &mem) == 1)
1281
1282         scnprintf(path, PATH_MAX,
1283                   "%s/devices/system/node/node%lu",
1284                   sysfs__mountpoint(), idx);
1285
1286         dir = opendir(path);
1287         if (!dir) {
1288                 pr_warning("failed: can't open memory sysfs data\n");
1289                 return -1;
1290         }
1291
1292         for_each_memory(phys, dir) {
1293                 size = max(phys, size);
1294         }
1295
1296         size++;
1297
1298         n->set = bitmap_zalloc(size);
1299         if (!n->set) {
1300                 closedir(dir);
1301                 return -ENOMEM;
1302         }
1303
1304         n->node = idx;
1305         n->size = size;
1306
1307         rewinddir(dir);
1308
1309         for_each_memory(phys, dir) {
1310                 set_bit(phys, n->set);
1311         }
1312
1313         closedir(dir);
1314         return 0;
1315 }
1316
1317 static int memory_node__sort(const void *a, const void *b)
1318 {
1319         const struct memory_node *na = a;
1320         const struct memory_node *nb = b;
1321
1322         return na->node - nb->node;
1323 }
1324
1325 static int build_mem_topology(struct memory_node *nodes, u64 size, u64 *cntp)
1326 {
1327         char path[PATH_MAX];
1328         struct dirent *ent;
1329         DIR *dir;
1330         u64 cnt = 0;
1331         int ret = 0;
1332
1333         scnprintf(path, PATH_MAX, "%s/devices/system/node/",
1334                   sysfs__mountpoint());
1335
1336         dir = opendir(path);
1337         if (!dir) {
1338                 pr_debug2("%s: could't read %s, does this arch have topology information?\n",
1339                           __func__, path);
1340                 return -1;
1341         }
1342
1343         while (!ret && (ent = readdir(dir))) {
1344                 unsigned int idx;
1345                 int r;
1346
1347                 if (!strcmp(ent->d_name, ".") ||
1348                     !strcmp(ent->d_name, ".."))
1349                         continue;
1350
1351                 r = sscanf(ent->d_name, "node%u", &idx);
1352                 if (r != 1)
1353                         continue;
1354
1355                 if (WARN_ONCE(cnt >= size,
1356                         "failed to write MEM_TOPOLOGY, way too many nodes\n")) {
1357                         closedir(dir);
1358                         return -1;
1359                 }
1360
1361                 ret = memory_node__read(&nodes[cnt++], idx);
1362         }
1363
1364         *cntp = cnt;
1365         closedir(dir);
1366
1367         if (!ret)
1368                 qsort(nodes, cnt, sizeof(nodes[0]), memory_node__sort);
1369
1370         return ret;
1371 }
1372
1373 #define MAX_MEMORY_NODES 2000
1374
1375 /*
1376  * The MEM_TOPOLOGY holds physical memory map for every
1377  * node in system. The format of data is as follows:
1378  *
1379  *  0 - version          | for future changes
1380  *  8 - block_size_bytes | /sys/devices/system/memory/block_size_bytes
1381  * 16 - count            | number of nodes
1382  *
1383  * For each node we store map of physical indexes for
1384  * each node:
1385  *
1386  * 32 - node id          | node index
1387  * 40 - size             | size of bitmap
1388  * 48 - bitmap           | bitmap of memory indexes that belongs to node
1389  */
1390 static int write_mem_topology(struct feat_fd *ff __maybe_unused,
1391                               struct evlist *evlist __maybe_unused)
1392 {
1393         static struct memory_node nodes[MAX_MEMORY_NODES];
1394         u64 bsize, version = 1, i, nr;
1395         int ret;
1396
1397         ret = sysfs__read_xll("devices/system/memory/block_size_bytes",
1398                               (unsigned long long *) &bsize);
1399         if (ret)
1400                 return ret;
1401
1402         ret = build_mem_topology(&nodes[0], MAX_MEMORY_NODES, &nr);
1403         if (ret)
1404                 return ret;
1405
1406         ret = do_write(ff, &version, sizeof(version));
1407         if (ret < 0)
1408                 goto out;
1409
1410         ret = do_write(ff, &bsize, sizeof(bsize));
1411         if (ret < 0)
1412                 goto out;
1413
1414         ret = do_write(ff, &nr, sizeof(nr));
1415         if (ret < 0)
1416                 goto out;
1417
1418         for (i = 0; i < nr; i++) {
1419                 struct memory_node *n = &nodes[i];
1420
1421                 #define _W(v)                                           \
1422                         ret = do_write(ff, &n->v, sizeof(n->v));        \
1423                         if (ret < 0)                                    \
1424                                 goto out;
1425
1426                 _W(node)
1427                 _W(size)
1428
1429                 #undef _W
1430
1431                 ret = do_write_bitmap(ff, n->set, n->size);
1432                 if (ret < 0)
1433                         goto out;
1434         }
1435
1436 out:
1437         return ret;
1438 }
1439
1440 static int write_compressed(struct feat_fd *ff __maybe_unused,
1441                             struct evlist *evlist __maybe_unused)
1442 {
1443         int ret;
1444
1445         ret = do_write(ff, &(ff->ph->env.comp_ver), sizeof(ff->ph->env.comp_ver));
1446         if (ret)
1447                 return ret;
1448
1449         ret = do_write(ff, &(ff->ph->env.comp_type), sizeof(ff->ph->env.comp_type));
1450         if (ret)
1451                 return ret;
1452
1453         ret = do_write(ff, &(ff->ph->env.comp_level), sizeof(ff->ph->env.comp_level));
1454         if (ret)
1455                 return ret;
1456
1457         ret = do_write(ff, &(ff->ph->env.comp_ratio), sizeof(ff->ph->env.comp_ratio));
1458         if (ret)
1459                 return ret;
1460
1461         return do_write(ff, &(ff->ph->env.comp_mmap_len), sizeof(ff->ph->env.comp_mmap_len));
1462 }
1463
1464 static int write_per_cpu_pmu_caps(struct feat_fd *ff, struct perf_pmu *pmu,
1465                                   bool write_pmu)
1466 {
1467         struct perf_pmu_caps *caps = NULL;
1468         int nr_caps;
1469         int ret;
1470
1471         nr_caps = perf_pmu__caps_parse(pmu);
1472         if (nr_caps < 0)
1473                 return nr_caps;
1474
1475         ret = do_write(ff, &nr_caps, sizeof(nr_caps));
1476         if (ret < 0)
1477                 return ret;
1478
1479         list_for_each_entry(caps, &pmu->caps, list) {
1480                 ret = do_write_string(ff, caps->name);
1481                 if (ret < 0)
1482                         return ret;
1483
1484                 ret = do_write_string(ff, caps->value);
1485                 if (ret < 0)
1486                         return ret;
1487         }
1488
1489         if (write_pmu) {
1490                 ret = do_write_string(ff, pmu->name);
1491                 if (ret < 0)
1492                         return ret;
1493         }
1494
1495         return ret;
1496 }
1497
1498 static int write_cpu_pmu_caps(struct feat_fd *ff,
1499                               struct evlist *evlist __maybe_unused)
1500 {
1501         struct perf_pmu *cpu_pmu = perf_pmu__find("cpu");
1502
1503         if (!cpu_pmu)
1504                 return -ENOENT;
1505
1506         return write_per_cpu_pmu_caps(ff, cpu_pmu, false);
1507 }
1508
1509 static int write_hybrid_cpu_pmu_caps(struct feat_fd *ff,
1510                                      struct evlist *evlist __maybe_unused)
1511 {
1512         struct perf_pmu *pmu;
1513         u32 nr_pmu = perf_pmu__hybrid_pmu_num();
1514         int ret;
1515
1516         if (nr_pmu == 0)
1517                 return -ENOENT;
1518
1519         ret = do_write(ff, &nr_pmu, sizeof(nr_pmu));
1520         if (ret < 0)
1521                 return ret;
1522
1523         perf_pmu__for_each_hybrid_pmu(pmu) {
1524                 ret = write_per_cpu_pmu_caps(ff, pmu, true);
1525                 if (ret < 0)
1526                         return ret;
1527         }
1528
1529         return 0;
1530 }
1531
1532 static void print_hostname(struct feat_fd *ff, FILE *fp)
1533 {
1534         fprintf(fp, "# hostname : %s\n", ff->ph->env.hostname);
1535 }
1536
1537 static void print_osrelease(struct feat_fd *ff, FILE *fp)
1538 {
1539         fprintf(fp, "# os release : %s\n", ff->ph->env.os_release);
1540 }
1541
1542 static void print_arch(struct feat_fd *ff, FILE *fp)
1543 {
1544         fprintf(fp, "# arch : %s\n", ff->ph->env.arch);
1545 }
1546
1547 static void print_cpudesc(struct feat_fd *ff, FILE *fp)
1548 {
1549         fprintf(fp, "# cpudesc : %s\n", ff->ph->env.cpu_desc);
1550 }
1551
1552 static void print_nrcpus(struct feat_fd *ff, FILE *fp)
1553 {
1554         fprintf(fp, "# nrcpus online : %u\n", ff->ph->env.nr_cpus_online);
1555         fprintf(fp, "# nrcpus avail : %u\n", ff->ph->env.nr_cpus_avail);
1556 }
1557
1558 static void print_version(struct feat_fd *ff, FILE *fp)
1559 {
1560         fprintf(fp, "# perf version : %s\n", ff->ph->env.version);
1561 }
1562
1563 static void print_cmdline(struct feat_fd *ff, FILE *fp)
1564 {
1565         int nr, i;
1566
1567         nr = ff->ph->env.nr_cmdline;
1568
1569         fprintf(fp, "# cmdline : ");
1570
1571         for (i = 0; i < nr; i++) {
1572                 char *argv_i = strdup(ff->ph->env.cmdline_argv[i]);
1573                 if (!argv_i) {
1574                         fprintf(fp, "%s ", ff->ph->env.cmdline_argv[i]);
1575                 } else {
1576                         char *mem = argv_i;
1577                         do {
1578                                 char *quote = strchr(argv_i, '\'');
1579                                 if (!quote)
1580                                         break;
1581                                 *quote++ = '\0';
1582                                 fprintf(fp, "%s\\\'", argv_i);
1583                                 argv_i = quote;
1584                         } while (1);
1585                         fprintf(fp, "%s ", argv_i);
1586                         free(mem);
1587                 }
1588         }
1589         fputc('\n', fp);
1590 }
1591
1592 static void print_cpu_topology(struct feat_fd *ff, FILE *fp)
1593 {
1594         struct perf_header *ph = ff->ph;
1595         int cpu_nr = ph->env.nr_cpus_avail;
1596         int nr, i;
1597         char *str;
1598
1599         nr = ph->env.nr_sibling_cores;
1600         str = ph->env.sibling_cores;
1601
1602         for (i = 0; i < nr; i++) {
1603                 fprintf(fp, "# sibling sockets : %s\n", str);
1604                 str += strlen(str) + 1;
1605         }
1606
1607         if (ph->env.nr_sibling_dies) {
1608                 nr = ph->env.nr_sibling_dies;
1609                 str = ph->env.sibling_dies;
1610
1611                 for (i = 0; i < nr; i++) {
1612                         fprintf(fp, "# sibling dies    : %s\n", str);
1613                         str += strlen(str) + 1;
1614                 }
1615         }
1616
1617         nr = ph->env.nr_sibling_threads;
1618         str = ph->env.sibling_threads;
1619
1620         for (i = 0; i < nr; i++) {
1621                 fprintf(fp, "# sibling threads : %s\n", str);
1622                 str += strlen(str) + 1;
1623         }
1624
1625         if (ph->env.nr_sibling_dies) {
1626                 if (ph->env.cpu != NULL) {
1627                         for (i = 0; i < cpu_nr; i++)
1628                                 fprintf(fp, "# CPU %d: Core ID %d, "
1629                                             "Die ID %d, Socket ID %d\n",
1630                                             i, ph->env.cpu[i].core_id,
1631                                             ph->env.cpu[i].die_id,
1632                                             ph->env.cpu[i].socket_id);
1633                 } else
1634                         fprintf(fp, "# Core ID, Die ID and Socket ID "
1635                                     "information is not available\n");
1636         } else {
1637                 if (ph->env.cpu != NULL) {
1638                         for (i = 0; i < cpu_nr; i++)
1639                                 fprintf(fp, "# CPU %d: Core ID %d, "
1640                                             "Socket ID %d\n",
1641                                             i, ph->env.cpu[i].core_id,
1642                                             ph->env.cpu[i].socket_id);
1643                 } else
1644                         fprintf(fp, "# Core ID and Socket ID "
1645                                     "information is not available\n");
1646         }
1647 }
1648
1649 static void print_clockid(struct feat_fd *ff, FILE *fp)
1650 {
1651         fprintf(fp, "# clockid frequency: %"PRIu64" MHz\n",
1652                 ff->ph->env.clock.clockid_res_ns * 1000);
1653 }
1654
1655 static void print_clock_data(struct feat_fd *ff, FILE *fp)
1656 {
1657         struct timespec clockid_ns;
1658         char tstr[64], date[64];
1659         struct timeval tod_ns;
1660         clockid_t clockid;
1661         struct tm ltime;
1662         u64 ref;
1663
1664         if (!ff->ph->env.clock.enabled) {
1665                 fprintf(fp, "# reference time disabled\n");
1666                 return;
1667         }
1668
1669         /* Compute TOD time. */
1670         ref = ff->ph->env.clock.tod_ns;
1671         tod_ns.tv_sec = ref / NSEC_PER_SEC;
1672         ref -= tod_ns.tv_sec * NSEC_PER_SEC;
1673         tod_ns.tv_usec = ref / NSEC_PER_USEC;
1674
1675         /* Compute clockid time. */
1676         ref = ff->ph->env.clock.clockid_ns;
1677         clockid_ns.tv_sec = ref / NSEC_PER_SEC;
1678         ref -= clockid_ns.tv_sec * NSEC_PER_SEC;
1679         clockid_ns.tv_nsec = ref;
1680
1681         clockid = ff->ph->env.clock.clockid;
1682
1683         if (localtime_r(&tod_ns.tv_sec, &ltime) == NULL)
1684                 snprintf(tstr, sizeof(tstr), "<error>");
1685         else {
1686                 strftime(date, sizeof(date), "%F %T", &ltime);
1687                 scnprintf(tstr, sizeof(tstr), "%s.%06d",
1688                           date, (int) tod_ns.tv_usec);
1689         }
1690
1691         fprintf(fp, "# clockid: %s (%u)\n", clockid_name(clockid), clockid);
1692         fprintf(fp, "# reference time: %s = %ld.%06d (TOD) = %ld.%09ld (%s)\n",
1693                     tstr, (long) tod_ns.tv_sec, (int) tod_ns.tv_usec,
1694                     (long) clockid_ns.tv_sec, clockid_ns.tv_nsec,
1695                     clockid_name(clockid));
1696 }
1697
1698 static void print_hybrid_topology(struct feat_fd *ff, FILE *fp)
1699 {
1700         int i;
1701         struct hybrid_node *n;
1702
1703         fprintf(fp, "# hybrid cpu system:\n");
1704         for (i = 0; i < ff->ph->env.nr_hybrid_nodes; i++) {
1705                 n = &ff->ph->env.hybrid_nodes[i];
1706                 fprintf(fp, "# %s cpu list : %s\n", n->pmu_name, n->cpus);
1707         }
1708 }
1709
1710 static void print_dir_format(struct feat_fd *ff, FILE *fp)
1711 {
1712         struct perf_session *session;
1713         struct perf_data *data;
1714
1715         session = container_of(ff->ph, struct perf_session, header);
1716         data = session->data;
1717
1718         fprintf(fp, "# directory data version : %"PRIu64"\n", data->dir.version);
1719 }
1720
1721 #ifdef HAVE_LIBBPF_SUPPORT
1722 static void print_bpf_prog_info(struct feat_fd *ff, FILE *fp)
1723 {
1724         struct perf_env *env = &ff->ph->env;
1725         struct rb_root *root;
1726         struct rb_node *next;
1727
1728         down_read(&env->bpf_progs.lock);
1729
1730         root = &env->bpf_progs.infos;
1731         next = rb_first(root);
1732
1733         while (next) {
1734                 struct bpf_prog_info_node *node;
1735
1736                 node = rb_entry(next, struct bpf_prog_info_node, rb_node);
1737                 next = rb_next(&node->rb_node);
1738
1739                 bpf_event__print_bpf_prog_info(&node->info_linear->info,
1740                                                env, fp);
1741         }
1742
1743         up_read(&env->bpf_progs.lock);
1744 }
1745
1746 static void print_bpf_btf(struct feat_fd *ff, FILE *fp)
1747 {
1748         struct perf_env *env = &ff->ph->env;
1749         struct rb_root *root;
1750         struct rb_node *next;
1751
1752         down_read(&env->bpf_progs.lock);
1753
1754         root = &env->bpf_progs.btfs;
1755         next = rb_first(root);
1756
1757         while (next) {
1758                 struct btf_node *node;
1759
1760                 node = rb_entry(next, struct btf_node, rb_node);
1761                 next = rb_next(&node->rb_node);
1762                 fprintf(fp, "# btf info of id %u\n", node->id);
1763         }
1764
1765         up_read(&env->bpf_progs.lock);
1766 }
1767 #endif // HAVE_LIBBPF_SUPPORT
1768
1769 static void free_event_desc(struct evsel *events)
1770 {
1771         struct evsel *evsel;
1772
1773         if (!events)
1774                 return;
1775
1776         for (evsel = events; evsel->core.attr.size; evsel++) {
1777                 zfree(&evsel->name);
1778                 zfree(&evsel->core.id);
1779         }
1780
1781         free(events);
1782 }
1783
1784 static bool perf_attr_check(struct perf_event_attr *attr)
1785 {
1786         if (attr->__reserved_1 || attr->__reserved_2 || attr->__reserved_3) {
1787                 pr_warning("Reserved bits are set unexpectedly. "
1788                            "Please update perf tool.\n");
1789                 return false;
1790         }
1791
1792         if (attr->sample_type & ~(PERF_SAMPLE_MAX-1)) {
1793                 pr_warning("Unknown sample type (0x%llx) is detected. "
1794                            "Please update perf tool.\n",
1795                            attr->sample_type);
1796                 return false;
1797         }
1798
1799         if (attr->read_format & ~(PERF_FORMAT_MAX-1)) {
1800                 pr_warning("Unknown read format (0x%llx) is detected. "
1801                            "Please update perf tool.\n",
1802                            attr->read_format);
1803                 return false;
1804         }
1805
1806         if ((attr->sample_type & PERF_SAMPLE_BRANCH_STACK) &&
1807             (attr->branch_sample_type & ~(PERF_SAMPLE_BRANCH_MAX-1))) {
1808                 pr_warning("Unknown branch sample type (0x%llx) is detected. "
1809                            "Please update perf tool.\n",
1810                            attr->branch_sample_type);
1811
1812                 return false;
1813         }
1814
1815         return true;
1816 }
1817
1818 static struct evsel *read_event_desc(struct feat_fd *ff)
1819 {
1820         struct evsel *evsel, *events = NULL;
1821         u64 *id;
1822         void *buf = NULL;
1823         u32 nre, sz, nr, i, j;
1824         size_t msz;
1825
1826         /* number of events */
1827         if (do_read_u32(ff, &nre))
1828                 goto error;
1829
1830         if (do_read_u32(ff, &sz))
1831                 goto error;
1832
1833         /* buffer to hold on file attr struct */
1834         buf = malloc(sz);
1835         if (!buf)
1836                 goto error;
1837
1838         /* the last event terminates with evsel->core.attr.size == 0: */
1839         events = calloc(nre + 1, sizeof(*events));
1840         if (!events)
1841                 goto error;
1842
1843         msz = sizeof(evsel->core.attr);
1844         if (sz < msz)
1845                 msz = sz;
1846
1847         for (i = 0, evsel = events; i < nre; evsel++, i++) {
1848                 evsel->core.idx = i;
1849
1850                 /*
1851                  * must read entire on-file attr struct to
1852                  * sync up with layout.
1853                  */
1854                 if (__do_read(ff, buf, sz))
1855                         goto error;
1856
1857                 if (ff->ph->needs_swap)
1858                         perf_event__attr_swap(buf);
1859
1860                 memcpy(&evsel->core.attr, buf, msz);
1861
1862                 if (!perf_attr_check(&evsel->core.attr))
1863                         goto error;
1864
1865                 if (do_read_u32(ff, &nr))
1866                         goto error;
1867
1868                 if (ff->ph->needs_swap)
1869                         evsel->needs_swap = true;
1870
1871                 evsel->name = do_read_string(ff);
1872                 if (!evsel->name)
1873                         goto error;
1874
1875                 if (!nr)
1876                         continue;
1877
1878                 id = calloc(nr, sizeof(*id));
1879                 if (!id)
1880                         goto error;
1881                 evsel->core.ids = nr;
1882                 evsel->core.id = id;
1883
1884                 for (j = 0 ; j < nr; j++) {
1885                         if (do_read_u64(ff, id))
1886                                 goto error;
1887                         id++;
1888                 }
1889         }
1890 out:
1891         free(buf);
1892         return events;
1893 error:
1894         free_event_desc(events);
1895         events = NULL;
1896         goto out;
1897 }
1898
1899 static int __desc_attr__fprintf(FILE *fp, const char *name, const char *val,
1900                                 void *priv __maybe_unused)
1901 {
1902         return fprintf(fp, ", %s = %s", name, val);
1903 }
1904
1905 static void print_event_desc(struct feat_fd *ff, FILE *fp)
1906 {
1907         struct evsel *evsel, *events;
1908         u32 j;
1909         u64 *id;
1910
1911         if (ff->events)
1912                 events = ff->events;
1913         else
1914                 events = read_event_desc(ff);
1915
1916         if (!events) {
1917                 fprintf(fp, "# event desc: not available or unable to read\n");
1918                 return;
1919         }
1920
1921         for (evsel = events; evsel->core.attr.size; evsel++) {
1922                 fprintf(fp, "# event : name = %s, ", evsel->name);
1923
1924                 if (evsel->core.ids) {
1925                         fprintf(fp, ", id = {");
1926                         for (j = 0, id = evsel->core.id; j < evsel->core.ids; j++, id++) {
1927                                 if (j)
1928                                         fputc(',', fp);
1929                                 fprintf(fp, " %"PRIu64, *id);
1930                         }
1931                         fprintf(fp, " }");
1932                 }
1933
1934                 perf_event_attr__fprintf(fp, &evsel->core.attr, __desc_attr__fprintf, NULL);
1935
1936                 fputc('\n', fp);
1937         }
1938
1939         free_event_desc(events);
1940         ff->events = NULL;
1941 }
1942
1943 static void print_total_mem(struct feat_fd *ff, FILE *fp)
1944 {
1945         fprintf(fp, "# total memory : %llu kB\n", ff->ph->env.total_mem);
1946 }
1947
1948 static void print_numa_topology(struct feat_fd *ff, FILE *fp)
1949 {
1950         int i;
1951         struct numa_node *n;
1952
1953         for (i = 0; i < ff->ph->env.nr_numa_nodes; i++) {
1954                 n = &ff->ph->env.numa_nodes[i];
1955
1956                 fprintf(fp, "# node%u meminfo  : total = %"PRIu64" kB,"
1957                             " free = %"PRIu64" kB\n",
1958                         n->node, n->mem_total, n->mem_free);
1959
1960                 fprintf(fp, "# node%u cpu list : ", n->node);
1961                 cpu_map__fprintf(n->map, fp);
1962         }
1963 }
1964
1965 static void print_cpuid(struct feat_fd *ff, FILE *fp)
1966 {
1967         fprintf(fp, "# cpuid : %s\n", ff->ph->env.cpuid);
1968 }
1969
1970 static void print_branch_stack(struct feat_fd *ff __maybe_unused, FILE *fp)
1971 {
1972         fprintf(fp, "# contains samples with branch stack\n");
1973 }
1974
1975 static void print_auxtrace(struct feat_fd *ff __maybe_unused, FILE *fp)
1976 {
1977         fprintf(fp, "# contains AUX area data (e.g. instruction trace)\n");
1978 }
1979
1980 static void print_stat(struct feat_fd *ff __maybe_unused, FILE *fp)
1981 {
1982         fprintf(fp, "# contains stat data\n");
1983 }
1984
1985 static void print_cache(struct feat_fd *ff, FILE *fp __maybe_unused)
1986 {
1987         int i;
1988
1989         fprintf(fp, "# CPU cache info:\n");
1990         for (i = 0; i < ff->ph->env.caches_cnt; i++) {
1991                 fprintf(fp, "#  ");
1992                 cpu_cache_level__fprintf(fp, &ff->ph->env.caches[i]);
1993         }
1994 }
1995
1996 static void print_compressed(struct feat_fd *ff, FILE *fp)
1997 {
1998         fprintf(fp, "# compressed : %s, level = %d, ratio = %d\n",
1999                 ff->ph->env.comp_type == PERF_COMP_ZSTD ? "Zstd" : "Unknown",
2000                 ff->ph->env.comp_level, ff->ph->env.comp_ratio);
2001 }
2002
2003 static void print_per_cpu_pmu_caps(FILE *fp, int nr_caps, char *cpu_pmu_caps,
2004                                    char *pmu_name)
2005 {
2006         const char *delimiter;
2007         char *str, buf[128];
2008
2009         if (!nr_caps) {
2010                 if (!pmu_name)
2011                         fprintf(fp, "# cpu pmu capabilities: not available\n");
2012                 else
2013                         fprintf(fp, "# %s pmu capabilities: not available\n", pmu_name);
2014                 return;
2015         }
2016
2017         if (!pmu_name)
2018                 scnprintf(buf, sizeof(buf), "# cpu pmu capabilities: ");
2019         else
2020                 scnprintf(buf, sizeof(buf), "# %s pmu capabilities: ", pmu_name);
2021
2022         delimiter = buf;
2023
2024         str = cpu_pmu_caps;
2025         while (nr_caps--) {
2026                 fprintf(fp, "%s%s", delimiter, str);
2027                 delimiter = ", ";
2028                 str += strlen(str) + 1;
2029         }
2030
2031         fprintf(fp, "\n");
2032 }
2033
2034 static void print_cpu_pmu_caps(struct feat_fd *ff, FILE *fp)
2035 {
2036         print_per_cpu_pmu_caps(fp, ff->ph->env.nr_cpu_pmu_caps,
2037                                ff->ph->env.cpu_pmu_caps, NULL);
2038 }
2039
2040 static void print_hybrid_cpu_pmu_caps(struct feat_fd *ff, FILE *fp)
2041 {
2042         struct hybrid_cpc_node *n;
2043
2044         for (int i = 0; i < ff->ph->env.nr_hybrid_cpc_nodes; i++) {
2045                 n = &ff->ph->env.hybrid_cpc_nodes[i];
2046                 print_per_cpu_pmu_caps(fp, n->nr_cpu_pmu_caps,
2047                                        n->cpu_pmu_caps,
2048                                        n->pmu_name);
2049         }
2050 }
2051
2052 static void print_pmu_mappings(struct feat_fd *ff, FILE *fp)
2053 {
2054         const char *delimiter = "# pmu mappings: ";
2055         char *str, *tmp;
2056         u32 pmu_num;
2057         u32 type;
2058
2059         pmu_num = ff->ph->env.nr_pmu_mappings;
2060         if (!pmu_num) {
2061                 fprintf(fp, "# pmu mappings: not available\n");
2062                 return;
2063         }
2064
2065         str = ff->ph->env.pmu_mappings;
2066
2067         while (pmu_num) {
2068                 type = strtoul(str, &tmp, 0);
2069                 if (*tmp != ':')
2070                         goto error;
2071
2072                 str = tmp + 1;
2073                 fprintf(fp, "%s%s = %" PRIu32, delimiter, str, type);
2074
2075                 delimiter = ", ";
2076                 str += strlen(str) + 1;
2077                 pmu_num--;
2078         }
2079
2080         fprintf(fp, "\n");
2081
2082         if (!pmu_num)
2083                 return;
2084 error:
2085         fprintf(fp, "# pmu mappings: unable to read\n");
2086 }
2087
2088 static void print_group_desc(struct feat_fd *ff, FILE *fp)
2089 {
2090         struct perf_session *session;
2091         struct evsel *evsel;
2092         u32 nr = 0;
2093
2094         session = container_of(ff->ph, struct perf_session, header);
2095
2096         evlist__for_each_entry(session->evlist, evsel) {
2097                 if (evsel__is_group_leader(evsel) && evsel->core.nr_members > 1) {
2098                         fprintf(fp, "# group: %s{%s", evsel->group_name ?: "", evsel__name(evsel));
2099
2100                         nr = evsel->core.nr_members - 1;
2101                 } else if (nr) {
2102                         fprintf(fp, ",%s", evsel__name(evsel));
2103
2104                         if (--nr == 0)
2105                                 fprintf(fp, "}\n");
2106                 }
2107         }
2108 }
2109
2110 static void print_sample_time(struct feat_fd *ff, FILE *fp)
2111 {
2112         struct perf_session *session;
2113         char time_buf[32];
2114         double d;
2115
2116         session = container_of(ff->ph, struct perf_session, header);
2117
2118         timestamp__scnprintf_usec(session->evlist->first_sample_time,
2119                                   time_buf, sizeof(time_buf));
2120         fprintf(fp, "# time of first sample : %s\n", time_buf);
2121
2122         timestamp__scnprintf_usec(session->evlist->last_sample_time,
2123                                   time_buf, sizeof(time_buf));
2124         fprintf(fp, "# time of last sample : %s\n", time_buf);
2125
2126         d = (double)(session->evlist->last_sample_time -
2127                 session->evlist->first_sample_time) / NSEC_PER_MSEC;
2128
2129         fprintf(fp, "# sample duration : %10.3f ms\n", d);
2130 }
2131
2132 static void memory_node__fprintf(struct memory_node *n,
2133                                  unsigned long long bsize, FILE *fp)
2134 {
2135         char buf_map[100], buf_size[50];
2136         unsigned long long size;
2137
2138         size = bsize * bitmap_weight(n->set, n->size);
2139         unit_number__scnprintf(buf_size, 50, size);
2140
2141         bitmap_scnprintf(n->set, n->size, buf_map, 100);
2142         fprintf(fp, "#  %3" PRIu64 " [%s]: %s\n", n->node, buf_size, buf_map);
2143 }
2144
2145 static void print_mem_topology(struct feat_fd *ff, FILE *fp)
2146 {
2147         struct memory_node *nodes;
2148         int i, nr;
2149
2150         nodes = ff->ph->env.memory_nodes;
2151         nr    = ff->ph->env.nr_memory_nodes;
2152
2153         fprintf(fp, "# memory nodes (nr %d, block size 0x%llx):\n",
2154                 nr, ff->ph->env.memory_bsize);
2155
2156         for (i = 0; i < nr; i++) {
2157                 memory_node__fprintf(&nodes[i], ff->ph->env.memory_bsize, fp);
2158         }
2159 }
2160
2161 static int __event_process_build_id(struct perf_record_header_build_id *bev,
2162                                     char *filename,
2163                                     struct perf_session *session)
2164 {
2165         int err = -1;
2166         struct machine *machine;
2167         u16 cpumode;
2168         struct dso *dso;
2169         enum dso_space_type dso_space;
2170
2171         machine = perf_session__findnew_machine(session, bev->pid);
2172         if (!machine)
2173                 goto out;
2174
2175         cpumode = bev->header.misc & PERF_RECORD_MISC_CPUMODE_MASK;
2176
2177         switch (cpumode) {
2178         case PERF_RECORD_MISC_KERNEL:
2179                 dso_space = DSO_SPACE__KERNEL;
2180                 break;
2181         case PERF_RECORD_MISC_GUEST_KERNEL:
2182                 dso_space = DSO_SPACE__KERNEL_GUEST;
2183                 break;
2184         case PERF_RECORD_MISC_USER:
2185         case PERF_RECORD_MISC_GUEST_USER:
2186                 dso_space = DSO_SPACE__USER;
2187                 break;
2188         default:
2189                 goto out;
2190         }
2191
2192         dso = machine__findnew_dso(machine, filename);
2193         if (dso != NULL) {
2194                 char sbuild_id[SBUILD_ID_SIZE];
2195                 struct build_id bid;
2196                 size_t size = BUILD_ID_SIZE;
2197
2198                 if (bev->header.misc & PERF_RECORD_MISC_BUILD_ID_SIZE)
2199                         size = bev->size;
2200
2201                 build_id__init(&bid, bev->data, size);
2202                 dso__set_build_id(dso, &bid);
2203
2204                 if (dso_space != DSO_SPACE__USER) {
2205                         struct kmod_path m = { .name = NULL, };
2206
2207                         if (!kmod_path__parse_name(&m, filename) && m.kmod)
2208                                 dso__set_module_info(dso, &m, machine);
2209
2210                         dso->kernel = dso_space;
2211                         free(m.name);
2212                 }
2213
2214                 build_id__sprintf(&dso->bid, sbuild_id);
2215                 pr_debug("build id event received for %s: %s [%zu]\n",
2216                          dso->long_name, sbuild_id, size);
2217                 dso__put(dso);
2218         }
2219
2220         err = 0;
2221 out:
2222         return err;
2223 }
2224
2225 static int perf_header__read_build_ids_abi_quirk(struct perf_header *header,
2226                                                  int input, u64 offset, u64 size)
2227 {
2228         struct perf_session *session = container_of(header, struct perf_session, header);
2229         struct {
2230                 struct perf_event_header   header;
2231                 u8                         build_id[PERF_ALIGN(BUILD_ID_SIZE, sizeof(u64))];
2232                 char                       filename[0];
2233         } old_bev;
2234         struct perf_record_header_build_id bev;
2235         char filename[PATH_MAX];
2236         u64 limit = offset + size;
2237
2238         while (offset < limit) {
2239                 ssize_t len;
2240
2241                 if (readn(input, &old_bev, sizeof(old_bev)) != sizeof(old_bev))
2242                         return -1;
2243
2244                 if (header->needs_swap)
2245                         perf_event_header__bswap(&old_bev.header);
2246
2247                 len = old_bev.header.size - sizeof(old_bev);
2248                 if (readn(input, filename, len) != len)
2249                         return -1;
2250
2251                 bev.header = old_bev.header;
2252
2253                 /*
2254                  * As the pid is the missing value, we need to fill
2255                  * it properly. The header.misc value give us nice hint.
2256                  */
2257                 bev.pid = HOST_KERNEL_ID;
2258                 if (bev.header.misc == PERF_RECORD_MISC_GUEST_USER ||
2259                     bev.header.misc == PERF_RECORD_MISC_GUEST_KERNEL)
2260                         bev.pid = DEFAULT_GUEST_KERNEL_ID;
2261
2262                 memcpy(bev.build_id, old_bev.build_id, sizeof(bev.build_id));
2263                 __event_process_build_id(&bev, filename, session);
2264
2265                 offset += bev.header.size;
2266         }
2267
2268         return 0;
2269 }
2270
2271 static int perf_header__read_build_ids(struct perf_header *header,
2272                                        int input, u64 offset, u64 size)
2273 {
2274         struct perf_session *session = container_of(header, struct perf_session, header);
2275         struct perf_record_header_build_id bev;
2276         char filename[PATH_MAX];
2277         u64 limit = offset + size, orig_offset = offset;
2278         int err = -1;
2279
2280         while (offset < limit) {
2281                 ssize_t len;
2282
2283                 if (readn(input, &bev, sizeof(bev)) != sizeof(bev))
2284                         goto out;
2285
2286                 if (header->needs_swap)
2287                         perf_event_header__bswap(&bev.header);
2288
2289                 len = bev.header.size - sizeof(bev);
2290                 if (readn(input, filename, len) != len)
2291                         goto out;
2292                 /*
2293                  * The a1645ce1 changeset:
2294                  *
2295                  * "perf: 'perf kvm' tool for monitoring guest performance from host"
2296                  *
2297                  * Added a field to struct perf_record_header_build_id that broke the file
2298                  * format.
2299                  *
2300                  * Since the kernel build-id is the first entry, process the
2301                  * table using the old format if the well known
2302                  * '[kernel.kallsyms]' string for the kernel build-id has the
2303                  * first 4 characters chopped off (where the pid_t sits).
2304                  */
2305                 if (memcmp(filename, "nel.kallsyms]", 13) == 0) {
2306                         if (lseek(input, orig_offset, SEEK_SET) == (off_t)-1)
2307                                 return -1;
2308                         return perf_header__read_build_ids_abi_quirk(header, input, offset, size);
2309                 }
2310
2311                 __event_process_build_id(&bev, filename, session);
2312
2313                 offset += bev.header.size;
2314         }
2315         err = 0;
2316 out:
2317         return err;
2318 }
2319
2320 /* Macro for features that simply need to read and store a string. */
2321 #define FEAT_PROCESS_STR_FUN(__feat, __feat_env) \
2322 static int process_##__feat(struct feat_fd *ff, void *data __maybe_unused) \
2323 {\
2324         ff->ph->env.__feat_env = do_read_string(ff); \
2325         return ff->ph->env.__feat_env ? 0 : -ENOMEM; \
2326 }
2327
2328 FEAT_PROCESS_STR_FUN(hostname, hostname);
2329 FEAT_PROCESS_STR_FUN(osrelease, os_release);
2330 FEAT_PROCESS_STR_FUN(version, version);
2331 FEAT_PROCESS_STR_FUN(arch, arch);
2332 FEAT_PROCESS_STR_FUN(cpudesc, cpu_desc);
2333 FEAT_PROCESS_STR_FUN(cpuid, cpuid);
2334
2335 static int process_tracing_data(struct feat_fd *ff, void *data)
2336 {
2337         ssize_t ret = trace_report(ff->fd, data, false);
2338
2339         return ret < 0 ? -1 : 0;
2340 }
2341
2342 static int process_build_id(struct feat_fd *ff, void *data __maybe_unused)
2343 {
2344         if (perf_header__read_build_ids(ff->ph, ff->fd, ff->offset, ff->size))
2345                 pr_debug("Failed to read buildids, continuing...\n");
2346         return 0;
2347 }
2348
2349 static int process_nrcpus(struct feat_fd *ff, void *data __maybe_unused)
2350 {
2351         int ret;
2352         u32 nr_cpus_avail, nr_cpus_online;
2353
2354         ret = do_read_u32(ff, &nr_cpus_avail);
2355         if (ret)
2356                 return ret;
2357
2358         ret = do_read_u32(ff, &nr_cpus_online);
2359         if (ret)
2360                 return ret;
2361         ff->ph->env.nr_cpus_avail = (int)nr_cpus_avail;
2362         ff->ph->env.nr_cpus_online = (int)nr_cpus_online;
2363         return 0;
2364 }
2365
2366 static int process_total_mem(struct feat_fd *ff, void *data __maybe_unused)
2367 {
2368         u64 total_mem;
2369         int ret;
2370
2371         ret = do_read_u64(ff, &total_mem);
2372         if (ret)
2373                 return -1;
2374         ff->ph->env.total_mem = (unsigned long long)total_mem;
2375         return 0;
2376 }
2377
2378 static struct evsel *evlist__find_by_index(struct evlist *evlist, int idx)
2379 {
2380         struct evsel *evsel;
2381
2382         evlist__for_each_entry(evlist, evsel) {
2383                 if (evsel->core.idx == idx)
2384                         return evsel;
2385         }
2386
2387         return NULL;
2388 }
2389
2390 static void evlist__set_event_name(struct evlist *evlist, struct evsel *event)
2391 {
2392         struct evsel *evsel;
2393
2394         if (!event->name)
2395                 return;
2396
2397         evsel = evlist__find_by_index(evlist, event->core.idx);
2398         if (!evsel)
2399                 return;
2400
2401         if (evsel->name)
2402                 return;
2403
2404         evsel->name = strdup(event->name);
2405 }
2406
2407 static int
2408 process_event_desc(struct feat_fd *ff, void *data __maybe_unused)
2409 {
2410         struct perf_session *session;
2411         struct evsel *evsel, *events = read_event_desc(ff);
2412
2413         if (!events)
2414                 return 0;
2415
2416         session = container_of(ff->ph, struct perf_session, header);
2417
2418         if (session->data->is_pipe) {
2419                 /* Save events for reading later by print_event_desc,
2420                  * since they can't be read again in pipe mode. */
2421                 ff->events = events;
2422         }
2423
2424         for (evsel = events; evsel->core.attr.size; evsel++)
2425                 evlist__set_event_name(session->evlist, evsel);
2426
2427         if (!session->data->is_pipe)
2428                 free_event_desc(events);
2429
2430         return 0;
2431 }
2432
2433 static int process_cmdline(struct feat_fd *ff, void *data __maybe_unused)
2434 {
2435         char *str, *cmdline = NULL, **argv = NULL;
2436         u32 nr, i, len = 0;
2437
2438         if (do_read_u32(ff, &nr))
2439                 return -1;
2440
2441         ff->ph->env.nr_cmdline = nr;
2442
2443         cmdline = zalloc(ff->size + nr + 1);
2444         if (!cmdline)
2445                 return -1;
2446
2447         argv = zalloc(sizeof(char *) * (nr + 1));
2448         if (!argv)
2449                 goto error;
2450
2451         for (i = 0; i < nr; i++) {
2452                 str = do_read_string(ff);
2453                 if (!str)
2454                         goto error;
2455
2456                 argv[i] = cmdline + len;
2457                 memcpy(argv[i], str, strlen(str) + 1);
2458                 len += strlen(str) + 1;
2459                 free(str);
2460         }
2461         ff->ph->env.cmdline = cmdline;
2462         ff->ph->env.cmdline_argv = (const char **) argv;
2463         return 0;
2464
2465 error:
2466         free(argv);
2467         free(cmdline);
2468         return -1;
2469 }
2470
2471 static int process_cpu_topology(struct feat_fd *ff, void *data __maybe_unused)
2472 {
2473         u32 nr, i;
2474         char *str;
2475         struct strbuf sb;
2476         int cpu_nr = ff->ph->env.nr_cpus_avail;
2477         u64 size = 0;
2478         struct perf_header *ph = ff->ph;
2479         bool do_core_id_test = true;
2480
2481         ph->env.cpu = calloc(cpu_nr, sizeof(*ph->env.cpu));
2482         if (!ph->env.cpu)
2483                 return -1;
2484
2485         if (do_read_u32(ff, &nr))
2486                 goto free_cpu;
2487
2488         ph->env.nr_sibling_cores = nr;
2489         size += sizeof(u32);
2490         if (strbuf_init(&sb, 128) < 0)
2491                 goto free_cpu;
2492
2493         for (i = 0; i < nr; i++) {
2494                 str = do_read_string(ff);
2495                 if (!str)
2496                         goto error;
2497
2498                 /* include a NULL character at the end */
2499                 if (strbuf_add(&sb, str, strlen(str) + 1) < 0)
2500                         goto error;
2501                 size += string_size(str);
2502                 free(str);
2503         }
2504         ph->env.sibling_cores = strbuf_detach(&sb, NULL);
2505
2506         if (do_read_u32(ff, &nr))
2507                 return -1;
2508
2509         ph->env.nr_sibling_threads = nr;
2510         size += sizeof(u32);
2511
2512         for (i = 0; i < nr; i++) {
2513                 str = do_read_string(ff);
2514                 if (!str)
2515                         goto error;
2516
2517                 /* include a NULL character at the end */
2518                 if (strbuf_add(&sb, str, strlen(str) + 1) < 0)
2519                         goto error;
2520                 size += string_size(str);
2521                 free(str);
2522         }
2523         ph->env.sibling_threads = strbuf_detach(&sb, NULL);
2524
2525         /*
2526          * The header may be from old perf,
2527          * which doesn't include core id and socket id information.
2528          */
2529         if (ff->size <= size) {
2530                 zfree(&ph->env.cpu);
2531                 return 0;
2532         }
2533
2534         /* On s390 the socket_id number is not related to the numbers of cpus.
2535          * The socket_id number might be higher than the numbers of cpus.
2536          * This depends on the configuration.
2537          * AArch64 is the same.
2538          */
2539         if (ph->env.arch && (!strncmp(ph->env.arch, "s390", 4)
2540                           || !strncmp(ph->env.arch, "aarch64", 7)))
2541                 do_core_id_test = false;
2542
2543         for (i = 0; i < (u32)cpu_nr; i++) {
2544                 if (do_read_u32(ff, &nr))
2545                         goto free_cpu;
2546
2547                 ph->env.cpu[i].core_id = nr;
2548                 size += sizeof(u32);
2549
2550                 if (do_read_u32(ff, &nr))
2551                         goto free_cpu;
2552
2553                 if (do_core_id_test && nr != (u32)-1 && nr > (u32)cpu_nr) {
2554                         pr_debug("socket_id number is too big."
2555                                  "You may need to upgrade the perf tool.\n");
2556                         goto free_cpu;
2557                 }
2558
2559                 ph->env.cpu[i].socket_id = nr;
2560                 size += sizeof(u32);
2561         }
2562
2563         /*
2564          * The header may be from old perf,
2565          * which doesn't include die information.
2566          */
2567         if (ff->size <= size)
2568                 return 0;
2569
2570         if (do_read_u32(ff, &nr))
2571                 return -1;
2572
2573         ph->env.nr_sibling_dies = nr;
2574         size += sizeof(u32);
2575
2576         for (i = 0; i < nr; i++) {
2577                 str = do_read_string(ff);
2578                 if (!str)
2579                         goto error;
2580
2581                 /* include a NULL character at the end */
2582                 if (strbuf_add(&sb, str, strlen(str) + 1) < 0)
2583                         goto error;
2584                 size += string_size(str);
2585                 free(str);
2586         }
2587         ph->env.sibling_dies = strbuf_detach(&sb, NULL);
2588
2589         for (i = 0; i < (u32)cpu_nr; i++) {
2590                 if (do_read_u32(ff, &nr))
2591                         goto free_cpu;
2592
2593                 ph->env.cpu[i].die_id = nr;
2594         }
2595
2596         return 0;
2597
2598 error:
2599         strbuf_release(&sb);
2600 free_cpu:
2601         zfree(&ph->env.cpu);
2602         return -1;
2603 }
2604
2605 static int process_numa_topology(struct feat_fd *ff, void *data __maybe_unused)
2606 {
2607         struct numa_node *nodes, *n;
2608         u32 nr, i;
2609         char *str;
2610
2611         /* nr nodes */
2612         if (do_read_u32(ff, &nr))
2613                 return -1;
2614
2615         nodes = zalloc(sizeof(*nodes) * nr);
2616         if (!nodes)
2617                 return -ENOMEM;
2618
2619         for (i = 0; i < nr; i++) {
2620                 n = &nodes[i];
2621
2622                 /* node number */
2623                 if (do_read_u32(ff, &n->node))
2624                         goto error;
2625
2626                 if (do_read_u64(ff, &n->mem_total))
2627                         goto error;
2628
2629                 if (do_read_u64(ff, &n->mem_free))
2630                         goto error;
2631
2632                 str = do_read_string(ff);
2633                 if (!str)
2634                         goto error;
2635
2636                 n->map = perf_cpu_map__new(str);
2637                 if (!n->map)
2638                         goto error;
2639
2640                 free(str);
2641         }
2642         ff->ph->env.nr_numa_nodes = nr;
2643         ff->ph->env.numa_nodes = nodes;
2644         return 0;
2645
2646 error:
2647         free(nodes);
2648         return -1;
2649 }
2650
2651 static int process_pmu_mappings(struct feat_fd *ff, void *data __maybe_unused)
2652 {
2653         char *name;
2654         u32 pmu_num;
2655         u32 type;
2656         struct strbuf sb;
2657
2658         if (do_read_u32(ff, &pmu_num))
2659                 return -1;
2660
2661         if (!pmu_num) {
2662                 pr_debug("pmu mappings not available\n");
2663                 return 0;
2664         }
2665
2666         ff->ph->env.nr_pmu_mappings = pmu_num;
2667         if (strbuf_init(&sb, 128) < 0)
2668                 return -1;
2669
2670         while (pmu_num) {
2671                 if (do_read_u32(ff, &type))
2672                         goto error;
2673
2674                 name = do_read_string(ff);
2675                 if (!name)
2676                         goto error;
2677
2678                 if (strbuf_addf(&sb, "%u:%s", type, name) < 0)
2679                         goto error;
2680                 /* include a NULL character at the end */
2681                 if (strbuf_add(&sb, "", 1) < 0)
2682                         goto error;
2683
2684                 if (!strcmp(name, "msr"))
2685                         ff->ph->env.msr_pmu_type = type;
2686
2687                 free(name);
2688                 pmu_num--;
2689         }
2690         ff->ph->env.pmu_mappings = strbuf_detach(&sb, NULL);
2691         return 0;
2692
2693 error:
2694         strbuf_release(&sb);
2695         return -1;
2696 }
2697
2698 static int process_group_desc(struct feat_fd *ff, void *data __maybe_unused)
2699 {
2700         size_t ret = -1;
2701         u32 i, nr, nr_groups;
2702         struct perf_session *session;
2703         struct evsel *evsel, *leader = NULL;
2704         struct group_desc {
2705                 char *name;
2706                 u32 leader_idx;
2707                 u32 nr_members;
2708         } *desc;
2709
2710         if (do_read_u32(ff, &nr_groups))
2711                 return -1;
2712
2713         ff->ph->env.nr_groups = nr_groups;
2714         if (!nr_groups) {
2715                 pr_debug("group desc not available\n");
2716                 return 0;
2717         }
2718
2719         desc = calloc(nr_groups, sizeof(*desc));
2720         if (!desc)
2721                 return -1;
2722
2723         for (i = 0; i < nr_groups; i++) {
2724                 desc[i].name = do_read_string(ff);
2725                 if (!desc[i].name)
2726                         goto out_free;
2727
2728                 if (do_read_u32(ff, &desc[i].leader_idx))
2729                         goto out_free;
2730
2731                 if (do_read_u32(ff, &desc[i].nr_members))
2732                         goto out_free;
2733         }
2734
2735         /*
2736          * Rebuild group relationship based on the group_desc
2737          */
2738         session = container_of(ff->ph, struct perf_session, header);
2739         session->evlist->core.nr_groups = nr_groups;
2740
2741         i = nr = 0;
2742         evlist__for_each_entry(session->evlist, evsel) {
2743                 if (evsel->core.idx == (int) desc[i].leader_idx) {
2744                         evsel__set_leader(evsel, evsel);
2745                         /* {anon_group} is a dummy name */
2746                         if (strcmp(desc[i].name, "{anon_group}")) {
2747                                 evsel->group_name = desc[i].name;
2748                                 desc[i].name = NULL;
2749                         }
2750                         evsel->core.nr_members = desc[i].nr_members;
2751
2752                         if (i >= nr_groups || nr > 0) {
2753                                 pr_debug("invalid group desc\n");
2754                                 goto out_free;
2755                         }
2756
2757                         leader = evsel;
2758                         nr = evsel->core.nr_members - 1;
2759                         i++;
2760                 } else if (nr) {
2761                         /* This is a group member */
2762                         evsel__set_leader(evsel, leader);
2763
2764                         nr--;
2765                 }
2766         }
2767
2768         if (i != nr_groups || nr != 0) {
2769                 pr_debug("invalid group desc\n");
2770                 goto out_free;
2771         }
2772
2773         ret = 0;
2774 out_free:
2775         for (i = 0; i < nr_groups; i++)
2776                 zfree(&desc[i].name);
2777         free(desc);
2778
2779         return ret;
2780 }
2781
2782 static int process_auxtrace(struct feat_fd *ff, void *data __maybe_unused)
2783 {
2784         struct perf_session *session;
2785         int err;
2786
2787         session = container_of(ff->ph, struct perf_session, header);
2788
2789         err = auxtrace_index__process(ff->fd, ff->size, session,
2790                                       ff->ph->needs_swap);
2791         if (err < 0)
2792                 pr_err("Failed to process auxtrace index\n");
2793         return err;
2794 }
2795
2796 static int process_cache(struct feat_fd *ff, void *data __maybe_unused)
2797 {
2798         struct cpu_cache_level *caches;
2799         u32 cnt, i, version;
2800
2801         if (do_read_u32(ff, &version))
2802                 return -1;
2803
2804         if (version != 1)
2805                 return -1;
2806
2807         if (do_read_u32(ff, &cnt))
2808                 return -1;
2809
2810         caches = zalloc(sizeof(*caches) * cnt);
2811         if (!caches)
2812                 return -1;
2813
2814         for (i = 0; i < cnt; i++) {
2815                 struct cpu_cache_level c;
2816
2817                 #define _R(v)                                           \
2818                         if (do_read_u32(ff, &c.v))\
2819                                 goto out_free_caches;                   \
2820
2821                 _R(level)
2822                 _R(line_size)
2823                 _R(sets)
2824                 _R(ways)
2825                 #undef _R
2826
2827                 #define _R(v)                                   \
2828                         c.v = do_read_string(ff);               \
2829                         if (!c.v)                               \
2830                                 goto out_free_caches;
2831
2832                 _R(type)
2833                 _R(size)
2834                 _R(map)
2835                 #undef _R
2836
2837                 caches[i] = c;
2838         }
2839
2840         ff->ph->env.caches = caches;
2841         ff->ph->env.caches_cnt = cnt;
2842         return 0;
2843 out_free_caches:
2844         free(caches);
2845         return -1;
2846 }
2847
2848 static int process_sample_time(struct feat_fd *ff, void *data __maybe_unused)
2849 {
2850         struct perf_session *session;
2851         u64 first_sample_time, last_sample_time;
2852         int ret;
2853
2854         session = container_of(ff->ph, struct perf_session, header);
2855
2856         ret = do_read_u64(ff, &first_sample_time);
2857         if (ret)
2858                 return -1;
2859
2860         ret = do_read_u64(ff, &last_sample_time);
2861         if (ret)
2862                 return -1;
2863
2864         session->evlist->first_sample_time = first_sample_time;
2865         session->evlist->last_sample_time = last_sample_time;
2866         return 0;
2867 }
2868
2869 static int process_mem_topology(struct feat_fd *ff,
2870                                 void *data __maybe_unused)
2871 {
2872         struct memory_node *nodes;
2873         u64 version, i, nr, bsize;
2874         int ret = -1;
2875
2876         if (do_read_u64(ff, &version))
2877                 return -1;
2878
2879         if (version != 1)
2880                 return -1;
2881
2882         if (do_read_u64(ff, &bsize))
2883                 return -1;
2884
2885         if (do_read_u64(ff, &nr))
2886                 return -1;
2887
2888         nodes = zalloc(sizeof(*nodes) * nr);
2889         if (!nodes)
2890                 return -1;
2891
2892         for (i = 0; i < nr; i++) {
2893                 struct memory_node n;
2894
2895                 #define _R(v)                           \
2896                         if (do_read_u64(ff, &n.v))      \
2897                                 goto out;               \
2898
2899                 _R(node)
2900                 _R(size)
2901
2902                 #undef _R
2903
2904                 if (do_read_bitmap(ff, &n.set, &n.size))
2905                         goto out;
2906
2907                 nodes[i] = n;
2908         }
2909
2910         ff->ph->env.memory_bsize    = bsize;
2911         ff->ph->env.memory_nodes    = nodes;
2912         ff->ph->env.nr_memory_nodes = nr;
2913         ret = 0;
2914
2915 out:
2916         if (ret)
2917                 free(nodes);
2918         return ret;
2919 }
2920
2921 static int process_clockid(struct feat_fd *ff,
2922                            void *data __maybe_unused)
2923 {
2924         if (do_read_u64(ff, &ff->ph->env.clock.clockid_res_ns))
2925                 return -1;
2926
2927         return 0;
2928 }
2929
2930 static int process_clock_data(struct feat_fd *ff,
2931                               void *_data __maybe_unused)
2932 {
2933         u32 data32;
2934         u64 data64;
2935
2936         /* version */
2937         if (do_read_u32(ff, &data32))
2938                 return -1;
2939
2940         if (data32 != 1)
2941                 return -1;
2942
2943         /* clockid */
2944         if (do_read_u32(ff, &data32))
2945                 return -1;
2946
2947         ff->ph->env.clock.clockid = data32;
2948
2949         /* TOD ref time */
2950         if (do_read_u64(ff, &data64))
2951                 return -1;
2952
2953         ff->ph->env.clock.tod_ns = data64;
2954
2955         /* clockid ref time */
2956         if (do_read_u64(ff, &data64))
2957                 return -1;
2958
2959         ff->ph->env.clock.clockid_ns = data64;
2960         ff->ph->env.clock.enabled = true;
2961         return 0;
2962 }
2963
2964 static int process_hybrid_topology(struct feat_fd *ff,
2965                                    void *data __maybe_unused)
2966 {
2967         struct hybrid_node *nodes, *n;
2968         u32 nr, i;
2969
2970         /* nr nodes */
2971         if (do_read_u32(ff, &nr))
2972                 return -1;
2973
2974         nodes = zalloc(sizeof(*nodes) * nr);
2975         if (!nodes)
2976                 return -ENOMEM;
2977
2978         for (i = 0; i < nr; i++) {
2979                 n = &nodes[i];
2980
2981                 n->pmu_name = do_read_string(ff);
2982                 if (!n->pmu_name)
2983                         goto error;
2984
2985                 n->cpus = do_read_string(ff);
2986                 if (!n->cpus)
2987                         goto error;
2988         }
2989
2990         ff->ph->env.nr_hybrid_nodes = nr;
2991         ff->ph->env.hybrid_nodes = nodes;
2992         return 0;
2993
2994 error:
2995         for (i = 0; i < nr; i++) {
2996                 free(nodes[i].pmu_name);
2997                 free(nodes[i].cpus);
2998         }
2999
3000         free(nodes);
3001         return -1;
3002 }
3003
3004 static int process_dir_format(struct feat_fd *ff,
3005                               void *_data __maybe_unused)
3006 {
3007         struct perf_session *session;
3008         struct perf_data *data;
3009
3010         session = container_of(ff->ph, struct perf_session, header);
3011         data = session->data;
3012
3013         if (WARN_ON(!perf_data__is_dir(data)))
3014                 return -1;
3015
3016         return do_read_u64(ff, &data->dir.version);
3017 }
3018
3019 #ifdef HAVE_LIBBPF_SUPPORT
3020 static int process_bpf_prog_info(struct feat_fd *ff, void *data __maybe_unused)
3021 {
3022         struct bpf_prog_info_node *info_node;
3023         struct perf_env *env = &ff->ph->env;
3024         struct perf_bpil *info_linear;
3025         u32 count, i;
3026         int err = -1;
3027
3028         if (ff->ph->needs_swap) {
3029                 pr_warning("interpreting bpf_prog_info from systems with endianness is not yet supported\n");
3030                 return 0;
3031         }
3032
3033         if (do_read_u32(ff, &count))
3034                 return -1;
3035
3036         down_write(&env->bpf_progs.lock);
3037
3038         for (i = 0; i < count; ++i) {
3039                 u32 info_len, data_len;
3040
3041                 info_linear = NULL;
3042                 info_node = NULL;
3043                 if (do_read_u32(ff, &info_len))
3044                         goto out;
3045                 if (do_read_u32(ff, &data_len))
3046                         goto out;
3047
3048                 if (info_len > sizeof(struct bpf_prog_info)) {
3049                         pr_warning("detected invalid bpf_prog_info\n");
3050                         goto out;
3051                 }
3052
3053                 info_linear = malloc(sizeof(struct perf_bpil) +
3054                                      data_len);
3055                 if (!info_linear)
3056                         goto out;
3057                 info_linear->info_len = sizeof(struct bpf_prog_info);
3058                 info_linear->data_len = data_len;
3059                 if (do_read_u64(ff, (u64 *)(&info_linear->arrays)))
3060                         goto out;
3061                 if (__do_read(ff, &info_linear->info, info_len))
3062                         goto out;
3063                 if (info_len < sizeof(struct bpf_prog_info))
3064                         memset(((void *)(&info_linear->info)) + info_len, 0,
3065                                sizeof(struct bpf_prog_info) - info_len);
3066
3067                 if (__do_read(ff, info_linear->data, data_len))
3068                         goto out;
3069
3070                 info_node = malloc(sizeof(struct bpf_prog_info_node));
3071                 if (!info_node)
3072                         goto out;
3073
3074                 /* after reading from file, translate offset to address */
3075                 bpil_offs_to_addr(info_linear);
3076                 info_node->info_linear = info_linear;
3077                 perf_env__insert_bpf_prog_info(env, info_node);
3078         }
3079
3080         up_write(&env->bpf_progs.lock);
3081         return 0;
3082 out:
3083         free(info_linear);
3084         free(info_node);
3085         up_write(&env->bpf_progs.lock);
3086         return err;
3087 }
3088
3089 static int process_bpf_btf(struct feat_fd *ff, void *data __maybe_unused)
3090 {
3091         struct perf_env *env = &ff->ph->env;
3092         struct btf_node *node = NULL;
3093         u32 count, i;
3094         int err = -1;
3095
3096         if (ff->ph->needs_swap) {
3097                 pr_warning("interpreting btf from systems with endianness is not yet supported\n");
3098                 return 0;
3099         }
3100
3101         if (do_read_u32(ff, &count))
3102                 return -1;
3103
3104         down_write(&env->bpf_progs.lock);
3105
3106         for (i = 0; i < count; ++i) {
3107                 u32 id, data_size;
3108
3109                 if (do_read_u32(ff, &id))
3110                         goto out;
3111                 if (do_read_u32(ff, &data_size))
3112                         goto out;
3113
3114                 node = malloc(sizeof(struct btf_node) + data_size);
3115                 if (!node)
3116                         goto out;
3117
3118                 node->id = id;
3119                 node->data_size = data_size;
3120
3121                 if (__do_read(ff, node->data, data_size))
3122                         goto out;
3123
3124                 perf_env__insert_btf(env, node);
3125                 node = NULL;
3126         }
3127
3128         err = 0;
3129 out:
3130         up_write(&env->bpf_progs.lock);
3131         free(node);
3132         return err;
3133 }
3134 #endif // HAVE_LIBBPF_SUPPORT
3135
3136 static int process_compressed(struct feat_fd *ff,
3137                               void *data __maybe_unused)
3138 {
3139         if (do_read_u32(ff, &(ff->ph->env.comp_ver)))
3140                 return -1;
3141
3142         if (do_read_u32(ff, &(ff->ph->env.comp_type)))
3143                 return -1;
3144
3145         if (do_read_u32(ff, &(ff->ph->env.comp_level)))
3146                 return -1;
3147
3148         if (do_read_u32(ff, &(ff->ph->env.comp_ratio)))
3149                 return -1;
3150
3151         if (do_read_u32(ff, &(ff->ph->env.comp_mmap_len)))
3152                 return -1;
3153
3154         return 0;
3155 }
3156
3157 static int process_per_cpu_pmu_caps(struct feat_fd *ff, int *nr_cpu_pmu_caps,
3158                                     char **cpu_pmu_caps,
3159                                     unsigned int *max_branches)
3160 {
3161         char *name, *value;
3162         struct strbuf sb;
3163         u32 nr_caps;
3164
3165         if (do_read_u32(ff, &nr_caps))
3166                 return -1;
3167
3168         if (!nr_caps) {
3169                 pr_debug("cpu pmu capabilities not available\n");
3170                 return 0;
3171         }
3172
3173         *nr_cpu_pmu_caps = nr_caps;
3174
3175         if (strbuf_init(&sb, 128) < 0)
3176                 return -1;
3177
3178         while (nr_caps--) {
3179                 name = do_read_string(ff);
3180                 if (!name)
3181                         goto error;
3182
3183                 value = do_read_string(ff);
3184                 if (!value)
3185                         goto free_name;
3186
3187                 if (strbuf_addf(&sb, "%s=%s", name, value) < 0)
3188                         goto free_value;
3189
3190                 /* include a NULL character at the end */
3191                 if (strbuf_add(&sb, "", 1) < 0)
3192                         goto free_value;
3193
3194                 if (!strcmp(name, "branches"))
3195                         *max_branches = atoi(value);
3196
3197                 free(value);
3198                 free(name);
3199         }
3200         *cpu_pmu_caps = strbuf_detach(&sb, NULL);
3201         return 0;
3202
3203 free_value:
3204         free(value);
3205 free_name:
3206         free(name);
3207 error:
3208         strbuf_release(&sb);
3209         return -1;
3210 }
3211
3212 static int process_cpu_pmu_caps(struct feat_fd *ff,
3213                                 void *data __maybe_unused)
3214 {
3215         return process_per_cpu_pmu_caps(ff, &ff->ph->env.nr_cpu_pmu_caps,
3216                                         &ff->ph->env.cpu_pmu_caps,
3217                                         &ff->ph->env.max_branches);
3218 }
3219
3220 static int process_hybrid_cpu_pmu_caps(struct feat_fd *ff,
3221                                        void *data __maybe_unused)
3222 {
3223         struct hybrid_cpc_node *nodes;
3224         u32 nr_pmu, i;
3225         int ret;
3226
3227         if (do_read_u32(ff, &nr_pmu))
3228                 return -1;
3229
3230         if (!nr_pmu) {
3231                 pr_debug("hybrid cpu pmu capabilities not available\n");
3232                 return 0;
3233         }
3234
3235         nodes = zalloc(sizeof(*nodes) * nr_pmu);
3236         if (!nodes)
3237                 return -ENOMEM;
3238
3239         for (i = 0; i < nr_pmu; i++) {
3240                 struct hybrid_cpc_node *n = &nodes[i];
3241
3242                 ret = process_per_cpu_pmu_caps(ff, &n->nr_cpu_pmu_caps,
3243                                                &n->cpu_pmu_caps,
3244                                                &n->max_branches);
3245                 if (ret)
3246                         goto err;
3247
3248                 n->pmu_name = do_read_string(ff);
3249                 if (!n->pmu_name) {
3250                         ret = -1;
3251                         goto err;
3252                 }
3253         }
3254
3255         ff->ph->env.nr_hybrid_cpc_nodes = nr_pmu;
3256         ff->ph->env.hybrid_cpc_nodes = nodes;
3257         return 0;
3258
3259 err:
3260         for (i = 0; i < nr_pmu; i++) {
3261                 free(nodes[i].cpu_pmu_caps);
3262                 free(nodes[i].pmu_name);
3263         }
3264
3265         free(nodes);
3266         return ret;
3267 }
3268
3269 #define FEAT_OPR(n, func, __full_only) \
3270         [HEADER_##n] = {                                        \
3271                 .name       = __stringify(n),                   \
3272                 .write      = write_##func,                     \
3273                 .print      = print_##func,                     \
3274                 .full_only  = __full_only,                      \
3275                 .process    = process_##func,                   \
3276                 .synthesize = true                              \
3277         }
3278
3279 #define FEAT_OPN(n, func, __full_only) \
3280         [HEADER_##n] = {                                        \
3281                 .name       = __stringify(n),                   \
3282                 .write      = write_##func,                     \
3283                 .print      = print_##func,                     \
3284                 .full_only  = __full_only,                      \
3285                 .process    = process_##func                    \
3286         }
3287
3288 /* feature_ops not implemented: */
3289 #define print_tracing_data      NULL
3290 #define print_build_id          NULL
3291
3292 #define process_branch_stack    NULL
3293 #define process_stat            NULL
3294
3295 // Only used in util/synthetic-events.c
3296 const struct perf_header_feature_ops feat_ops[HEADER_LAST_FEATURE];
3297
3298 const struct perf_header_feature_ops feat_ops[HEADER_LAST_FEATURE] = {
3299         FEAT_OPN(TRACING_DATA,  tracing_data,   false),
3300         FEAT_OPN(BUILD_ID,      build_id,       false),
3301         FEAT_OPR(HOSTNAME,      hostname,       false),
3302         FEAT_OPR(OSRELEASE,     osrelease,      false),
3303         FEAT_OPR(VERSION,       version,        false),
3304         FEAT_OPR(ARCH,          arch,           false),
3305         FEAT_OPR(NRCPUS,        nrcpus,         false),
3306         FEAT_OPR(CPUDESC,       cpudesc,        false),
3307         FEAT_OPR(CPUID,         cpuid,          false),
3308         FEAT_OPR(TOTAL_MEM,     total_mem,      false),
3309         FEAT_OPR(EVENT_DESC,    event_desc,     false),
3310         FEAT_OPR(CMDLINE,       cmdline,        false),
3311         FEAT_OPR(CPU_TOPOLOGY,  cpu_topology,   true),
3312         FEAT_OPR(NUMA_TOPOLOGY, numa_topology,  true),
3313         FEAT_OPN(BRANCH_STACK,  branch_stack,   false),
3314         FEAT_OPR(PMU_MAPPINGS,  pmu_mappings,   false),
3315         FEAT_OPR(GROUP_DESC,    group_desc,     false),
3316         FEAT_OPN(AUXTRACE,      auxtrace,       false),
3317         FEAT_OPN(STAT,          stat,           false),
3318         FEAT_OPN(CACHE,         cache,          true),
3319         FEAT_OPR(SAMPLE_TIME,   sample_time,    false),
3320         FEAT_OPR(MEM_TOPOLOGY,  mem_topology,   true),
3321         FEAT_OPR(CLOCKID,       clockid,        false),
3322         FEAT_OPN(DIR_FORMAT,    dir_format,     false),
3323 #ifdef HAVE_LIBBPF_SUPPORT
3324         FEAT_OPR(BPF_PROG_INFO, bpf_prog_info,  false),
3325         FEAT_OPR(BPF_BTF,       bpf_btf,        false),
3326 #endif
3327         FEAT_OPR(COMPRESSED,    compressed,     false),
3328         FEAT_OPR(CPU_PMU_CAPS,  cpu_pmu_caps,   false),
3329         FEAT_OPR(CLOCK_DATA,    clock_data,     false),
3330         FEAT_OPN(HYBRID_TOPOLOGY,       hybrid_topology,        true),
3331         FEAT_OPR(HYBRID_CPU_PMU_CAPS,   hybrid_cpu_pmu_caps,    false),
3332 };
3333
3334 struct header_print_data {
3335         FILE *fp;
3336         bool full; /* extended list of headers */
3337 };
3338
3339 static int perf_file_section__fprintf_info(struct perf_file_section *section,
3340                                            struct perf_header *ph,
3341                                            int feat, int fd, void *data)
3342 {
3343         struct header_print_data *hd = data;
3344         struct feat_fd ff;
3345
3346         if (lseek(fd, section->offset, SEEK_SET) == (off_t)-1) {
3347                 pr_debug("Failed to lseek to %" PRIu64 " offset for feature "
3348                                 "%d, continuing...\n", section->offset, feat);
3349                 return 0;
3350         }
3351         if (feat >= HEADER_LAST_FEATURE) {
3352                 pr_warning("unknown feature %d\n", feat);
3353                 return 0;
3354         }
3355         if (!feat_ops[feat].print)
3356                 return 0;
3357
3358         ff = (struct  feat_fd) {
3359                 .fd = fd,
3360                 .ph = ph,
3361         };
3362
3363         if (!feat_ops[feat].full_only || hd->full)
3364                 feat_ops[feat].print(&ff, hd->fp);
3365         else
3366                 fprintf(hd->fp, "# %s info available, use -I to display\n",
3367                         feat_ops[feat].name);
3368
3369         return 0;
3370 }
3371
3372 int perf_header__fprintf_info(struct perf_session *session, FILE *fp, bool full)
3373 {
3374         struct header_print_data hd;
3375         struct perf_header *header = &session->header;
3376         int fd = perf_data__fd(session->data);
3377         struct stat st;
3378         time_t stctime;
3379         int ret, bit;
3380
3381         hd.fp = fp;
3382         hd.full = full;
3383
3384         ret = fstat(fd, &st);
3385         if (ret == -1)
3386                 return -1;
3387
3388         stctime = st.st_mtime;
3389         fprintf(fp, "# captured on    : %s", ctime(&stctime));
3390
3391         fprintf(fp, "# header version : %u\n", header->version);
3392         fprintf(fp, "# data offset    : %" PRIu64 "\n", header->data_offset);
3393         fprintf(fp, "# data size      : %" PRIu64 "\n", header->data_size);
3394         fprintf(fp, "# feat offset    : %" PRIu64 "\n", header->feat_offset);
3395
3396         perf_header__process_sections(header, fd, &hd,
3397                                       perf_file_section__fprintf_info);
3398
3399         if (session->data->is_pipe)
3400                 return 0;
3401
3402         fprintf(fp, "# missing features: ");
3403         for_each_clear_bit(bit, header->adds_features, HEADER_LAST_FEATURE) {
3404                 if (bit)
3405                         fprintf(fp, "%s ", feat_ops[bit].name);
3406         }
3407
3408         fprintf(fp, "\n");
3409         return 0;
3410 }
3411
3412 static int do_write_feat(struct feat_fd *ff, int type,
3413                          struct perf_file_section **p,
3414                          struct evlist *evlist)
3415 {
3416         int err;
3417         int ret = 0;
3418
3419         if (perf_header__has_feat(ff->ph, type)) {
3420                 if (!feat_ops[type].write)
3421                         return -1;
3422
3423                 if (WARN(ff->buf, "Error: calling %s in pipe-mode.\n", __func__))
3424                         return -1;
3425
3426                 (*p)->offset = lseek(ff->fd, 0, SEEK_CUR);
3427
3428                 err = feat_ops[type].write(ff, evlist);
3429                 if (err < 0) {
3430                         pr_debug("failed to write feature %s\n", feat_ops[type].name);
3431
3432                         /* undo anything written */
3433                         lseek(ff->fd, (*p)->offset, SEEK_SET);
3434
3435                         return -1;
3436                 }
3437                 (*p)->size = lseek(ff->fd, 0, SEEK_CUR) - (*p)->offset;
3438                 (*p)++;
3439         }
3440         return ret;
3441 }
3442
3443 static int perf_header__adds_write(struct perf_header *header,
3444                                    struct evlist *evlist, int fd)
3445 {
3446         int nr_sections;
3447         struct feat_fd ff;
3448         struct perf_file_section *feat_sec, *p;
3449         int sec_size;
3450         u64 sec_start;
3451         int feat;
3452         int err;
3453
3454         ff = (struct feat_fd){
3455                 .fd  = fd,
3456                 .ph = header,
3457         };
3458
3459         nr_sections = bitmap_weight(header->adds_features, HEADER_FEAT_BITS);
3460         if (!nr_sections)
3461                 return 0;
3462
3463         feat_sec = p = calloc(nr_sections, sizeof(*feat_sec));
3464         if (feat_sec == NULL)
3465                 return -ENOMEM;
3466
3467         sec_size = sizeof(*feat_sec) * nr_sections;
3468
3469         sec_start = header->feat_offset;
3470         lseek(fd, sec_start + sec_size, SEEK_SET);
3471
3472         for_each_set_bit(feat, header->adds_features, HEADER_FEAT_BITS) {
3473                 if (do_write_feat(&ff, feat, &p, evlist))
3474                         perf_header__clear_feat(header, feat);
3475         }
3476
3477         lseek(fd, sec_start, SEEK_SET);
3478         /*
3479          * may write more than needed due to dropped feature, but
3480          * this is okay, reader will skip the missing entries
3481          */
3482         err = do_write(&ff, feat_sec, sec_size);
3483         if (err < 0)
3484                 pr_debug("failed to write feature section\n");
3485         free(feat_sec);
3486         return err;
3487 }
3488
3489 int perf_header__write_pipe(int fd)
3490 {
3491         struct perf_pipe_file_header f_header;
3492         struct feat_fd ff;
3493         int err;
3494
3495         ff = (struct feat_fd){ .fd = fd };
3496
3497         f_header = (struct perf_pipe_file_header){
3498                 .magic     = PERF_MAGIC,
3499                 .size      = sizeof(f_header),
3500         };
3501
3502         err = do_write(&ff, &f_header, sizeof(f_header));
3503         if (err < 0) {
3504                 pr_debug("failed to write perf pipe header\n");
3505                 return err;
3506         }
3507
3508         return 0;
3509 }
3510
3511 int perf_session__write_header(struct perf_session *session,
3512                                struct evlist *evlist,
3513                                int fd, bool at_exit)
3514 {
3515         struct perf_file_header f_header;
3516         struct perf_file_attr   f_attr;
3517         struct perf_header *header = &session->header;
3518         struct evsel *evsel;
3519         struct feat_fd ff;
3520         u64 attr_offset;
3521         int err;
3522
3523         ff = (struct feat_fd){ .fd = fd};
3524         lseek(fd, sizeof(f_header), SEEK_SET);
3525
3526         evlist__for_each_entry(session->evlist, evsel) {
3527                 evsel->id_offset = lseek(fd, 0, SEEK_CUR);
3528                 err = do_write(&ff, evsel->core.id, evsel->core.ids * sizeof(u64));
3529                 if (err < 0) {
3530                         pr_debug("failed to write perf header\n");
3531                         return err;
3532                 }
3533         }
3534
3535         attr_offset = lseek(ff.fd, 0, SEEK_CUR);
3536
3537         evlist__for_each_entry(evlist, evsel) {
3538                 if (evsel->core.attr.size < sizeof(evsel->core.attr)) {
3539                         /*
3540                          * We are likely in "perf inject" and have read
3541                          * from an older file. Update attr size so that
3542                          * reader gets the right offset to the ids.
3543                          */
3544                         evsel->core.attr.size = sizeof(evsel->core.attr);
3545                 }
3546                 f_attr = (struct perf_file_attr){
3547                         .attr = evsel->core.attr,
3548                         .ids  = {
3549                                 .offset = evsel->id_offset,
3550                                 .size   = evsel->core.ids * sizeof(u64),
3551                         }
3552                 };
3553                 err = do_write(&ff, &f_attr, sizeof(f_attr));
3554                 if (err < 0) {
3555                         pr_debug("failed to write perf header attribute\n");
3556                         return err;
3557                 }
3558         }
3559
3560         if (!header->data_offset)
3561                 header->data_offset = lseek(fd, 0, SEEK_CUR);
3562         header->feat_offset = header->data_offset + header->data_size;
3563
3564         if (at_exit) {
3565                 err = perf_header__adds_write(header, evlist, fd);
3566                 if (err < 0)
3567                         return err;
3568         }
3569
3570         f_header = (struct perf_file_header){
3571                 .magic     = PERF_MAGIC,
3572                 .size      = sizeof(f_header),
3573                 .attr_size = sizeof(f_attr),
3574                 .attrs = {
3575                         .offset = attr_offset,
3576                         .size   = evlist->core.nr_entries * sizeof(f_attr),
3577                 },
3578                 .data = {
3579                         .offset = header->data_offset,
3580                         .size   = header->data_size,
3581                 },
3582                 /* event_types is ignored, store zeros */
3583         };
3584
3585         memcpy(&f_header.adds_features, &header->adds_features, sizeof(header->adds_features));
3586
3587         lseek(fd, 0, SEEK_SET);
3588         err = do_write(&ff, &f_header, sizeof(f_header));
3589         if (err < 0) {
3590                 pr_debug("failed to write perf header\n");
3591                 return err;
3592         }
3593         lseek(fd, header->data_offset + header->data_size, SEEK_SET);
3594
3595         return 0;
3596 }
3597
3598 static int perf_header__getbuffer64(struct perf_header *header,
3599                                     int fd, void *buf, size_t size)
3600 {
3601         if (readn(fd, buf, size) <= 0)
3602                 return -1;
3603
3604         if (header->needs_swap)
3605                 mem_bswap_64(buf, size);
3606
3607         return 0;
3608 }
3609
3610 int perf_header__process_sections(struct perf_header *header, int fd,
3611                                   void *data,
3612                                   int (*process)(struct perf_file_section *section,
3613                                                  struct perf_header *ph,
3614                                                  int feat, int fd, void *data))
3615 {
3616         struct perf_file_section *feat_sec, *sec;
3617         int nr_sections;
3618         int sec_size;
3619         int feat;
3620         int err;
3621
3622         nr_sections = bitmap_weight(header->adds_features, HEADER_FEAT_BITS);
3623         if (!nr_sections)
3624                 return 0;
3625
3626         feat_sec = sec = calloc(nr_sections, sizeof(*feat_sec));
3627         if (!feat_sec)
3628                 return -1;
3629
3630         sec_size = sizeof(*feat_sec) * nr_sections;
3631
3632         lseek(fd, header->feat_offset, SEEK_SET);
3633
3634         err = perf_header__getbuffer64(header, fd, feat_sec, sec_size);
3635         if (err < 0)
3636                 goto out_free;
3637
3638         for_each_set_bit(feat, header->adds_features, HEADER_LAST_FEATURE) {
3639                 err = process(sec++, header, feat, fd, data);
3640                 if (err < 0)
3641                         goto out_free;
3642         }
3643         err = 0;
3644 out_free:
3645         free(feat_sec);
3646         return err;
3647 }
3648
3649 static const int attr_file_abi_sizes[] = {
3650         [0] = PERF_ATTR_SIZE_VER0,
3651         [1] = PERF_ATTR_SIZE_VER1,
3652         [2] = PERF_ATTR_SIZE_VER2,
3653         [3] = PERF_ATTR_SIZE_VER3,
3654         [4] = PERF_ATTR_SIZE_VER4,
3655         0,
3656 };
3657
3658 /*
3659  * In the legacy file format, the magic number is not used to encode endianness.
3660  * hdr_sz was used to encode endianness. But given that hdr_sz can vary based
3661  * on ABI revisions, we need to try all combinations for all endianness to
3662  * detect the endianness.
3663  */
3664 static int try_all_file_abis(uint64_t hdr_sz, struct perf_header *ph)
3665 {
3666         uint64_t ref_size, attr_size;
3667         int i;
3668
3669         for (i = 0 ; attr_file_abi_sizes[i]; i++) {
3670                 ref_size = attr_file_abi_sizes[i]
3671                          + sizeof(struct perf_file_section);
3672                 if (hdr_sz != ref_size) {
3673                         attr_size = bswap_64(hdr_sz);
3674                         if (attr_size != ref_size)
3675                                 continue;
3676
3677                         ph->needs_swap = true;
3678                 }
3679                 pr_debug("ABI%d perf.data file detected, need_swap=%d\n",
3680                          i,
3681                          ph->needs_swap);
3682                 return 0;
3683         }
3684         /* could not determine endianness */
3685         return -1;
3686 }
3687
3688 #define PERF_PIPE_HDR_VER0      16
3689
3690 static const size_t attr_pipe_abi_sizes[] = {
3691         [0] = PERF_PIPE_HDR_VER0,
3692         0,
3693 };
3694
3695 /*
3696  * In the legacy pipe format, there is an implicit assumption that endianness
3697  * between host recording the samples, and host parsing the samples is the
3698  * same. This is not always the case given that the pipe output may always be
3699  * redirected into a file and analyzed on a different machine with possibly a
3700  * different endianness and perf_event ABI revisions in the perf tool itself.
3701  */
3702 static int try_all_pipe_abis(uint64_t hdr_sz, struct perf_header *ph)
3703 {
3704         u64 attr_size;
3705         int i;
3706
3707         for (i = 0 ; attr_pipe_abi_sizes[i]; i++) {
3708                 if (hdr_sz != attr_pipe_abi_sizes[i]) {
3709                         attr_size = bswap_64(hdr_sz);
3710                         if (attr_size != hdr_sz)
3711                                 continue;
3712
3713                         ph->needs_swap = true;
3714                 }
3715                 pr_debug("Pipe ABI%d perf.data file detected\n", i);
3716                 return 0;
3717         }
3718         return -1;
3719 }
3720
3721 bool is_perf_magic(u64 magic)
3722 {
3723         if (!memcmp(&magic, __perf_magic1, sizeof(magic))
3724                 || magic == __perf_magic2
3725                 || magic == __perf_magic2_sw)
3726                 return true;
3727
3728         return false;
3729 }
3730
3731 static int check_magic_endian(u64 magic, uint64_t hdr_sz,
3732                               bool is_pipe, struct perf_header *ph)
3733 {
3734         int ret;
3735
3736         /* check for legacy format */
3737         ret = memcmp(&magic, __perf_magic1, sizeof(magic));
3738         if (ret == 0) {
3739                 ph->version = PERF_HEADER_VERSION_1;
3740                 pr_debug("legacy perf.data format\n");
3741                 if (is_pipe)
3742                         return try_all_pipe_abis(hdr_sz, ph);
3743
3744                 return try_all_file_abis(hdr_sz, ph);
3745         }
3746         /*
3747          * the new magic number serves two purposes:
3748          * - unique number to identify actual perf.data files
3749          * - encode endianness of file
3750          */
3751         ph->version = PERF_HEADER_VERSION_2;
3752
3753         /* check magic number with one endianness */
3754         if (magic == __perf_magic2)
3755                 return 0;
3756
3757         /* check magic number with opposite endianness */
3758         if (magic != __perf_magic2_sw)
3759                 return -1;
3760
3761         ph->needs_swap = true;
3762
3763         return 0;
3764 }
3765
3766 int perf_file_header__read(struct perf_file_header *header,
3767                            struct perf_header *ph, int fd)
3768 {
3769         ssize_t ret;
3770
3771         lseek(fd, 0, SEEK_SET);
3772
3773         ret = readn(fd, header, sizeof(*header));
3774         if (ret <= 0)
3775                 return -1;
3776
3777         if (check_magic_endian(header->magic,
3778                                header->attr_size, false, ph) < 0) {
3779                 pr_debug("magic/endian check failed\n");
3780                 return -1;
3781         }
3782
3783         if (ph->needs_swap) {
3784                 mem_bswap_64(header, offsetof(struct perf_file_header,
3785                              adds_features));
3786         }
3787
3788         if (header->size != sizeof(*header)) {
3789                 /* Support the previous format */
3790                 if (header->size == offsetof(typeof(*header), adds_features))
3791                         bitmap_zero(header->adds_features, HEADER_FEAT_BITS);
3792                 else
3793                         return -1;
3794         } else if (ph->needs_swap) {
3795                 /*
3796                  * feature bitmap is declared as an array of unsigned longs --
3797                  * not good since its size can differ between the host that
3798                  * generated the data file and the host analyzing the file.
3799                  *
3800                  * We need to handle endianness, but we don't know the size of
3801                  * the unsigned long where the file was generated. Take a best
3802                  * guess at determining it: try 64-bit swap first (ie., file
3803                  * created on a 64-bit host), and check if the hostname feature
3804                  * bit is set (this feature bit is forced on as of fbe96f2).
3805                  * If the bit is not, undo the 64-bit swap and try a 32-bit
3806                  * swap. If the hostname bit is still not set (e.g., older data
3807                  * file), punt and fallback to the original behavior --
3808                  * clearing all feature bits and setting buildid.
3809                  */
3810                 mem_bswap_64(&header->adds_features,
3811                             BITS_TO_U64(HEADER_FEAT_BITS));
3812
3813                 if (!test_bit(HEADER_HOSTNAME, header->adds_features)) {
3814                         /* unswap as u64 */
3815                         mem_bswap_64(&header->adds_features,
3816                                     BITS_TO_U64(HEADER_FEAT_BITS));
3817
3818                         /* unswap as u32 */
3819                         mem_bswap_32(&header->adds_features,
3820                                     BITS_TO_U32(HEADER_FEAT_BITS));
3821                 }
3822
3823                 if (!test_bit(HEADER_HOSTNAME, header->adds_features)) {
3824                         bitmap_zero(header->adds_features, HEADER_FEAT_BITS);
3825                         set_bit(HEADER_BUILD_ID, header->adds_features);
3826                 }
3827         }
3828
3829         memcpy(&ph->adds_features, &header->adds_features,
3830                sizeof(ph->adds_features));
3831
3832         ph->data_offset  = header->data.offset;
3833         ph->data_size    = header->data.size;
3834         ph->feat_offset  = header->data.offset + header->data.size;
3835         return 0;
3836 }
3837
3838 static int perf_file_section__process(struct perf_file_section *section,
3839                                       struct perf_header *ph,
3840                                       int feat, int fd, void *data)
3841 {
3842         struct feat_fd fdd = {
3843                 .fd     = fd,
3844                 .ph     = ph,
3845                 .size   = section->size,
3846                 .offset = section->offset,
3847         };
3848
3849         if (lseek(fd, section->offset, SEEK_SET) == (off_t)-1) {
3850                 pr_debug("Failed to lseek to %" PRIu64 " offset for feature "
3851                           "%d, continuing...\n", section->offset, feat);
3852                 return 0;
3853         }
3854
3855         if (feat >= HEADER_LAST_FEATURE) {
3856                 pr_debug("unknown feature %d, continuing...\n", feat);
3857                 return 0;
3858         }
3859
3860         if (!feat_ops[feat].process)
3861                 return 0;
3862
3863         return feat_ops[feat].process(&fdd, data);
3864 }
3865
3866 static int perf_file_header__read_pipe(struct perf_pipe_file_header *header,
3867                                        struct perf_header *ph,
3868                                        struct perf_data* data,
3869                                        bool repipe, int repipe_fd)
3870 {
3871         struct feat_fd ff = {
3872                 .fd = repipe_fd,
3873                 .ph = ph,
3874         };
3875         ssize_t ret;
3876
3877         ret = perf_data__read(data, header, sizeof(*header));
3878         if (ret <= 0)
3879                 return -1;
3880
3881         if (check_magic_endian(header->magic, header->size, true, ph) < 0) {
3882                 pr_debug("endian/magic failed\n");
3883                 return -1;
3884         }
3885
3886         if (ph->needs_swap)
3887                 header->size = bswap_64(header->size);
3888
3889         if (repipe && do_write(&ff, header, sizeof(*header)) < 0)
3890                 return -1;
3891
3892         return 0;
3893 }
3894
3895 static int perf_header__read_pipe(struct perf_session *session, int repipe_fd)
3896 {
3897         struct perf_header *header = &session->header;
3898         struct perf_pipe_file_header f_header;
3899
3900         if (perf_file_header__read_pipe(&f_header, header, session->data,
3901                                         session->repipe, repipe_fd) < 0) {
3902                 pr_debug("incompatible file format\n");
3903                 return -EINVAL;
3904         }
3905
3906         return f_header.size == sizeof(f_header) ? 0 : -1;
3907 }
3908
3909 static int read_attr(int fd, struct perf_header *ph,
3910                      struct perf_file_attr *f_attr)
3911 {
3912         struct perf_event_attr *attr = &f_attr->attr;
3913         size_t sz, left;
3914         size_t our_sz = sizeof(f_attr->attr);
3915         ssize_t ret;
3916
3917         memset(f_attr, 0, sizeof(*f_attr));
3918
3919         /* read minimal guaranteed structure */
3920         ret = readn(fd, attr, PERF_ATTR_SIZE_VER0);
3921         if (ret <= 0) {
3922                 pr_debug("cannot read %d bytes of header attr\n",
3923                          PERF_ATTR_SIZE_VER0);
3924                 return -1;
3925         }
3926
3927         /* on file perf_event_attr size */
3928         sz = attr->size;
3929
3930         if (ph->needs_swap)
3931                 sz = bswap_32(sz);
3932
3933         if (sz == 0) {
3934                 /* assume ABI0 */
3935                 sz =  PERF_ATTR_SIZE_VER0;
3936         } else if (sz > our_sz) {
3937                 pr_debug("file uses a more recent and unsupported ABI"
3938                          " (%zu bytes extra)\n", sz - our_sz);
3939                 return -1;
3940         }
3941         /* what we have not yet read and that we know about */
3942         left = sz - PERF_ATTR_SIZE_VER0;
3943         if (left) {
3944                 void *ptr = attr;
3945                 ptr += PERF_ATTR_SIZE_VER0;
3946
3947                 ret = readn(fd, ptr, left);
3948         }
3949         /* read perf_file_section, ids are read in caller */
3950         ret = readn(fd, &f_attr->ids, sizeof(f_attr->ids));
3951
3952         return ret <= 0 ? -1 : 0;
3953 }
3954
3955 static int evsel__prepare_tracepoint_event(struct evsel *evsel, struct tep_handle *pevent)
3956 {
3957         struct tep_event *event;
3958         char bf[128];
3959
3960         /* already prepared */
3961         if (evsel->tp_format)
3962                 return 0;
3963
3964         if (pevent == NULL) {
3965                 pr_debug("broken or missing trace data\n");
3966                 return -1;
3967         }
3968
3969         event = tep_find_event(pevent, evsel->core.attr.config);
3970         if (event == NULL) {
3971                 pr_debug("cannot find event format for %d\n", (int)evsel->core.attr.config);
3972                 return -1;
3973         }
3974
3975         if (!evsel->name) {
3976                 snprintf(bf, sizeof(bf), "%s:%s", event->system, event->name);
3977                 evsel->name = strdup(bf);
3978                 if (evsel->name == NULL)
3979                         return -1;
3980         }
3981
3982         evsel->tp_format = event;
3983         return 0;
3984 }
3985
3986 static int evlist__prepare_tracepoint_events(struct evlist *evlist, struct tep_handle *pevent)
3987 {
3988         struct evsel *pos;
3989
3990         evlist__for_each_entry(evlist, pos) {
3991                 if (pos->core.attr.type == PERF_TYPE_TRACEPOINT &&
3992                     evsel__prepare_tracepoint_event(pos, pevent))
3993                         return -1;
3994         }
3995
3996         return 0;
3997 }
3998
3999 int perf_session__read_header(struct perf_session *session, int repipe_fd)
4000 {
4001         struct perf_data *data = session->data;
4002         struct perf_header *header = &session->header;
4003         struct perf_file_header f_header;
4004         struct perf_file_attr   f_attr;
4005         u64                     f_id;
4006         int nr_attrs, nr_ids, i, j, err;
4007         int fd = perf_data__fd(data);
4008
4009         session->evlist = evlist__new();
4010         if (session->evlist == NULL)
4011                 return -ENOMEM;
4012
4013         session->evlist->env = &header->env;
4014         session->machines.host.env = &header->env;
4015
4016         /*
4017          * We can read 'pipe' data event from regular file,
4018          * check for the pipe header regardless of source.
4019          */
4020         err = perf_header__read_pipe(session, repipe_fd);
4021         if (!err || perf_data__is_pipe(data)) {
4022                 data->is_pipe = true;
4023                 return err;
4024         }
4025
4026         if (perf_file_header__read(&f_header, header, fd) < 0)
4027                 return -EINVAL;
4028
4029         if (header->needs_swap && data->in_place_update) {
4030                 pr_err("In-place update not supported when byte-swapping is required\n");
4031                 return -EINVAL;
4032         }
4033
4034         /*
4035          * Sanity check that perf.data was written cleanly; data size is
4036          * initialized to 0 and updated only if the on_exit function is run.
4037          * If data size is still 0 then the file contains only partial
4038          * information.  Just warn user and process it as much as it can.
4039          */
4040         if (f_header.data.size == 0) {
4041                 pr_warning("WARNING: The %s file's data size field is 0 which is unexpected.\n"
4042                            "Was the 'perf record' command properly terminated?\n",
4043                            data->file.path);
4044         }
4045
4046         if (f_header.attr_size == 0) {
4047                 pr_err("ERROR: The %s file's attr size field is 0 which is unexpected.\n"
4048                        "Was the 'perf record' command properly terminated?\n",
4049                        data->file.path);
4050                 return -EINVAL;
4051         }
4052
4053         nr_attrs = f_header.attrs.size / f_header.attr_size;
4054         lseek(fd, f_header.attrs.offset, SEEK_SET);
4055
4056         for (i = 0; i < nr_attrs; i++) {
4057                 struct evsel *evsel;
4058                 off_t tmp;
4059
4060                 if (read_attr(fd, header, &f_attr) < 0)
4061                         goto out_errno;
4062
4063                 if (header->needs_swap) {
4064                         f_attr.ids.size   = bswap_64(f_attr.ids.size);
4065                         f_attr.ids.offset = bswap_64(f_attr.ids.offset);
4066                         perf_event__attr_swap(&f_attr.attr);
4067                 }
4068
4069                 tmp = lseek(fd, 0, SEEK_CUR);
4070                 evsel = evsel__new(&f_attr.attr);
4071
4072                 if (evsel == NULL)
4073                         goto out_delete_evlist;
4074
4075                 evsel->needs_swap = header->needs_swap;
4076                 /*
4077                  * Do it before so that if perf_evsel__alloc_id fails, this
4078                  * entry gets purged too at evlist__delete().
4079                  */
4080                 evlist__add(session->evlist, evsel);
4081
4082                 nr_ids = f_attr.ids.size / sizeof(u64);
4083                 /*
4084                  * We don't have the cpu and thread maps on the header, so
4085                  * for allocating the perf_sample_id table we fake 1 cpu and
4086                  * hattr->ids threads.
4087                  */
4088                 if (perf_evsel__alloc_id(&evsel->core, 1, nr_ids))
4089                         goto out_delete_evlist;
4090
4091                 lseek(fd, f_attr.ids.offset, SEEK_SET);
4092
4093                 for (j = 0; j < nr_ids; j++) {
4094                         if (perf_header__getbuffer64(header, fd, &f_id, sizeof(f_id)))
4095                                 goto out_errno;
4096
4097                         perf_evlist__id_add(&session->evlist->core, &evsel->core, 0, j, f_id);
4098                 }
4099
4100                 lseek(fd, tmp, SEEK_SET);
4101         }
4102
4103         perf_header__process_sections(header, fd, &session->tevent,
4104                                       perf_file_section__process);
4105
4106         if (evlist__prepare_tracepoint_events(session->evlist, session->tevent.pevent))
4107                 goto out_delete_evlist;
4108
4109         return 0;
4110 out_errno:
4111         return -errno;
4112
4113 out_delete_evlist:
4114         evlist__delete(session->evlist);
4115         session->evlist = NULL;
4116         return -ENOMEM;
4117 }
4118
4119 int perf_event__process_feature(struct perf_session *session,
4120                                 union perf_event *event)
4121 {
4122         struct perf_tool *tool = session->tool;
4123         struct feat_fd ff = { .fd = 0 };
4124         struct perf_record_header_feature *fe = (struct perf_record_header_feature *)event;
4125         int type = fe->header.type;
4126         u64 feat = fe->feat_id;
4127
4128         if (type < 0 || type >= PERF_RECORD_HEADER_MAX) {
4129                 pr_warning("invalid record type %d in pipe-mode\n", type);
4130                 return 0;
4131         }
4132         if (feat == HEADER_RESERVED || feat >= HEADER_LAST_FEATURE) {
4133                 pr_warning("invalid record type %d in pipe-mode\n", type);
4134                 return -1;
4135         }
4136
4137         if (!feat_ops[feat].process)
4138                 return 0;
4139
4140         ff.buf  = (void *)fe->data;
4141         ff.size = event->header.size - sizeof(*fe);
4142         ff.ph = &session->header;
4143
4144         if (feat_ops[feat].process(&ff, NULL))
4145                 return -1;
4146
4147         if (!feat_ops[feat].print || !tool->show_feat_hdr)
4148                 return 0;
4149
4150         if (!feat_ops[feat].full_only ||
4151             tool->show_feat_hdr >= SHOW_FEAT_HEADER_FULL_INFO) {
4152                 feat_ops[feat].print(&ff, stdout);
4153         } else {
4154                 fprintf(stdout, "# %s info available, use -I to display\n",
4155                         feat_ops[feat].name);
4156         }
4157
4158         return 0;
4159 }
4160
4161 size_t perf_event__fprintf_event_update(union perf_event *event, FILE *fp)
4162 {
4163         struct perf_record_event_update *ev = &event->event_update;
4164         struct perf_record_event_update_scale *ev_scale;
4165         struct perf_record_event_update_cpus *ev_cpus;
4166         struct perf_cpu_map *map;
4167         size_t ret;
4168
4169         ret = fprintf(fp, "\n... id:    %" PRI_lu64 "\n", ev->id);
4170
4171         switch (ev->type) {
4172         case PERF_EVENT_UPDATE__SCALE:
4173                 ev_scale = (struct perf_record_event_update_scale *)ev->data;
4174                 ret += fprintf(fp, "... scale: %f\n", ev_scale->scale);
4175                 break;
4176         case PERF_EVENT_UPDATE__UNIT:
4177                 ret += fprintf(fp, "... unit:  %s\n", ev->data);
4178                 break;
4179         case PERF_EVENT_UPDATE__NAME:
4180                 ret += fprintf(fp, "... name:  %s\n", ev->data);
4181                 break;
4182         case PERF_EVENT_UPDATE__CPUS:
4183                 ev_cpus = (struct perf_record_event_update_cpus *)ev->data;
4184                 ret += fprintf(fp, "... ");
4185
4186                 map = cpu_map__new_data(&ev_cpus->cpus);
4187                 if (map)
4188                         ret += cpu_map__fprintf(map, fp);
4189                 else
4190                         ret += fprintf(fp, "failed to get cpus\n");
4191                 break;
4192         default:
4193                 ret += fprintf(fp, "... unknown type\n");
4194                 break;
4195         }
4196
4197         return ret;
4198 }
4199
4200 int perf_event__process_attr(struct perf_tool *tool __maybe_unused,
4201                              union perf_event *event,
4202                              struct evlist **pevlist)
4203 {
4204         u32 i, ids, n_ids;
4205         struct evsel *evsel;
4206         struct evlist *evlist = *pevlist;
4207
4208         if (evlist == NULL) {
4209                 *pevlist = evlist = evlist__new();
4210                 if (evlist == NULL)
4211                         return -ENOMEM;
4212         }
4213
4214         evsel = evsel__new(&event->attr.attr);
4215         if (evsel == NULL)
4216                 return -ENOMEM;
4217
4218         evlist__add(evlist, evsel);
4219
4220         ids = event->header.size;
4221         ids -= (void *)&event->attr.id - (void *)event;
4222         n_ids = ids / sizeof(u64);
4223         /*
4224          * We don't have the cpu and thread maps on the header, so
4225          * for allocating the perf_sample_id table we fake 1 cpu and
4226          * hattr->ids threads.
4227          */
4228         if (perf_evsel__alloc_id(&evsel->core, 1, n_ids))
4229                 return -ENOMEM;
4230
4231         for (i = 0; i < n_ids; i++) {
4232                 perf_evlist__id_add(&evlist->core, &evsel->core, 0, i, event->attr.id[i]);
4233         }
4234
4235         return 0;
4236 }
4237
4238 int perf_event__process_event_update(struct perf_tool *tool __maybe_unused,
4239                                      union perf_event *event,
4240                                      struct evlist **pevlist)
4241 {
4242         struct perf_record_event_update *ev = &event->event_update;
4243         struct perf_record_event_update_scale *ev_scale;
4244         struct perf_record_event_update_cpus *ev_cpus;
4245         struct evlist *evlist;
4246         struct evsel *evsel;
4247         struct perf_cpu_map *map;
4248
4249         if (!pevlist || *pevlist == NULL)
4250                 return -EINVAL;
4251
4252         evlist = *pevlist;
4253
4254         evsel = evlist__id2evsel(evlist, ev->id);
4255         if (evsel == NULL)
4256                 return -EINVAL;
4257
4258         switch (ev->type) {
4259         case PERF_EVENT_UPDATE__UNIT:
4260                 evsel->unit = strdup(ev->data);
4261                 break;
4262         case PERF_EVENT_UPDATE__NAME:
4263                 evsel->name = strdup(ev->data);
4264                 break;
4265         case PERF_EVENT_UPDATE__SCALE:
4266                 ev_scale = (struct perf_record_event_update_scale *)ev->data;
4267                 evsel->scale = ev_scale->scale;
4268                 break;
4269         case PERF_EVENT_UPDATE__CPUS:
4270                 ev_cpus = (struct perf_record_event_update_cpus *)ev->data;
4271
4272                 map = cpu_map__new_data(&ev_cpus->cpus);
4273                 if (map)
4274                         evsel->core.own_cpus = map;
4275                 else
4276                         pr_err("failed to get event_update cpus\n");
4277         default:
4278                 break;
4279         }
4280
4281         return 0;
4282 }
4283
4284 int perf_event__process_tracing_data(struct perf_session *session,
4285                                      union perf_event *event)
4286 {
4287         ssize_t size_read, padding, size = event->tracing_data.size;
4288         int fd = perf_data__fd(session->data);
4289         char buf[BUFSIZ];
4290
4291         /*
4292          * The pipe fd is already in proper place and in any case
4293          * we can't move it, and we'd screw the case where we read
4294          * 'pipe' data from regular file. The trace_report reads
4295          * data from 'fd' so we need to set it directly behind the
4296          * event, where the tracing data starts.
4297          */
4298         if (!perf_data__is_pipe(session->data)) {
4299                 off_t offset = lseek(fd, 0, SEEK_CUR);
4300
4301                 /* setup for reading amidst mmap */
4302                 lseek(fd, offset + sizeof(struct perf_record_header_tracing_data),
4303                       SEEK_SET);
4304         }
4305
4306         size_read = trace_report(fd, &session->tevent,
4307                                  session->repipe);
4308         padding = PERF_ALIGN(size_read, sizeof(u64)) - size_read;
4309
4310         if (readn(fd, buf, padding) < 0) {
4311                 pr_err("%s: reading input file", __func__);
4312                 return -1;
4313         }
4314         if (session->repipe) {
4315                 int retw = write(STDOUT_FILENO, buf, padding);
4316                 if (retw <= 0 || retw != padding) {
4317                         pr_err("%s: repiping tracing data padding", __func__);
4318                         return -1;
4319                 }
4320         }
4321
4322         if (size_read + padding != size) {
4323                 pr_err("%s: tracing data size mismatch", __func__);
4324                 return -1;
4325         }
4326
4327         evlist__prepare_tracepoint_events(session->evlist, session->tevent.pevent);
4328
4329         return size_read + padding;
4330 }
4331
4332 int perf_event__process_build_id(struct perf_session *session,
4333                                  union perf_event *event)
4334 {
4335         __event_process_build_id(&event->build_id,
4336                                  event->build_id.filename,
4337                                  session);
4338         return 0;
4339 }