perf tools: handle spaces in file names obtained from /proc/pid/maps
[linux-2.6-block.git] / tools / perf / util / symbol-elf.c
CommitLineData
e5a1845f
NK
1#include <fcntl.h>
2#include <stdio.h>
3#include <errno.h>
4#include <string.h>
5#include <unistd.h>
6#include <inttypes.h>
7
8#include "symbol.h"
8fa7d87f 9#include "machine.h"
922d0e4d 10#include "vdso.h"
c506c96b 11#include <symbol/kallsyms.h>
e5a1845f
NK
12#include "debug.h"
13
e370a3d5
DA
/* Fallback for ELF headers that do not define the AArch64 machine number. */
#if !defined(EM_AARCH64)
#define EM_AARCH64	183	/* ARM 64 bit */
#endif
17
18
aaba4e12
ACM
19#ifdef HAVE_CPLUS_DEMANGLE_SUPPORT
20extern char *cplus_demangle(const char *, int);
21
22static inline char *bfd_demangle(void __maybe_unused *v, const char *c, int i)
23{
24 return cplus_demangle(c, i);
25}
26#else
27#ifdef NO_DEMANGLE
28static inline char *bfd_demangle(void __maybe_unused *v,
29 const char __maybe_unused *c,
30 int __maybe_unused i)
31{
32 return NULL;
33}
34#else
35#define PACKAGE 'perf'
36#include <bfd.h>
37#endif
38#endif
39
89fe808a 40#ifndef HAVE_ELF_GETPHDRNUM_SUPPORT
179f36dd 41static int elf_getphdrnum(Elf *elf, size_t *dst)
e955d5c4
AH
42{
43 GElf_Ehdr gehdr;
44 GElf_Ehdr *ehdr;
45
46 ehdr = gelf_getehdr(elf, &gehdr);
47 if (!ehdr)
48 return -1;
49
50 *dst = ehdr->e_phnum;
51
52 return 0;
53}
54#endif
55
e5a1845f
NK
/* Fallback for headers that do not define the GNU build-id note type. */
#if !defined(NT_GNU_BUILD_ID)
#define NT_GNU_BUILD_ID	3
#endif
59
/**
 * elf_symtab__for_each_symbol - walk every entry of a symbol table
 *
 * @syms: symbol table data handed to gelf_getsym()
 * @nr_syms: number of entries to visit
 * @idx: index variable, runs from 0 to @nr_syms - 1 inside the body
 * @sym: GElf_Sym storage that gelf_getsym() fills for the current @idx
 *
 * gelf_getsym() is also invoked once with @idx == @nr_syms when the loop
 * finishes; its return value is never checked.
 */
#define elf_symtab__for_each_symbol(syms, nr_syms, idx, sym)	\
	for (idx = 0, gelf_getsym(syms, idx, &sym);		\
	     idx < nr_syms;					\
	     idx++, gelf_getsym(syms, idx, &sym))
71
72static inline uint8_t elf_sym__type(const GElf_Sym *sym)
73{
74 return GELF_ST_TYPE(sym->st_info);
75}
76
4e31050f
VL
/* Fallback for headers that do not define the GNU indirect-function type. */
#if !defined(STT_GNU_IFUNC)
#define STT_GNU_IFUNC	10
#endif
80
e5a1845f
NK
81static inline int elf_sym__is_function(const GElf_Sym *sym)
82{
a2f3b6bf
AH
83 return (elf_sym__type(sym) == STT_FUNC ||
84 elf_sym__type(sym) == STT_GNU_IFUNC) &&
e5a1845f
NK
85 sym->st_name != 0 &&
86 sym->st_shndx != SHN_UNDEF;
87}
88
89static inline bool elf_sym__is_object(const GElf_Sym *sym)
90{
91 return elf_sym__type(sym) == STT_OBJECT &&
92 sym->st_name != 0 &&
93 sym->st_shndx != SHN_UNDEF;
94}
95
96static inline int elf_sym__is_label(const GElf_Sym *sym)
97{
98 return elf_sym__type(sym) == STT_NOTYPE &&
99 sym->st_name != 0 &&
100 sym->st_shndx != SHN_UNDEF &&
101 sym->st_shndx != SHN_ABS;
102}
103
104static bool elf_sym__is_a(GElf_Sym *sym, enum map_type type)
105{
106 switch (type) {
107 case MAP__FUNCTION:
108 return elf_sym__is_function(sym);
109 case MAP__VARIABLE:
110 return elf_sym__is_object(sym);
111 default:
112 return false;
113 }
114}
115
116static inline const char *elf_sym__name(const GElf_Sym *sym,
117 const Elf_Data *symstrs)
118{
119 return symstrs->d_buf + sym->st_name;
120}
121
122static inline const char *elf_sec__name(const GElf_Shdr *shdr,
123 const Elf_Data *secstrs)
124{
125 return secstrs->d_buf + shdr->sh_name;
126}
127
128static inline int elf_sec__is_text(const GElf_Shdr *shdr,
129 const Elf_Data *secstrs)
130{
131 return strstr(elf_sec__name(shdr, secstrs), "text") != NULL;
132}
133
134static inline bool elf_sec__is_data(const GElf_Shdr *shdr,
135 const Elf_Data *secstrs)
136{
137 return strstr(elf_sec__name(shdr, secstrs), "data") != NULL;
138}
139
140static bool elf_sec__is_a(GElf_Shdr *shdr, Elf_Data *secstrs,
141 enum map_type type)
142{
143 switch (type) {
144 case MAP__FUNCTION:
145 return elf_sec__is_text(shdr, secstrs);
146 case MAP__VARIABLE:
147 return elf_sec__is_data(shdr, secstrs);
148 default:
149 return false;
150 }
151}
152
153static size_t elf_addr_to_index(Elf *elf, GElf_Addr addr)
154{
155 Elf_Scn *sec = NULL;
156 GElf_Shdr shdr;
157 size_t cnt = 1;
158
159 while ((sec = elf_nextscn(elf, sec)) != NULL) {
160 gelf_getshdr(sec, &shdr);
161
162 if ((addr >= shdr.sh_addr) &&
163 (addr < (shdr.sh_addr + shdr.sh_size)))
164 return cnt;
165
166 ++cnt;
167 }
168
169 return -1;
170}
171
99ca4233
MH
172Elf_Scn *elf_section_by_name(Elf *elf, GElf_Ehdr *ep,
173 GElf_Shdr *shp, const char *name, size_t *idx)
e5a1845f
NK
174{
175 Elf_Scn *sec = NULL;
176 size_t cnt = 1;
177
49274654
CS
178 /* Elf is corrupted/truncated, avoid calling elf_strptr. */
179 if (!elf_rawdata(elf_getscn(elf, ep->e_shstrndx), NULL))
180 return NULL;
181
e5a1845f
NK
182 while ((sec = elf_nextscn(elf, sec)) != NULL) {
183 char *str;
184
185 gelf_getshdr(sec, shp);
186 str = elf_strptr(elf, ep->e_shstrndx, shp->sh_name);
155b3a13 187 if (str && !strcmp(name, str)) {
e5a1845f
NK
188 if (idx)
189 *idx = cnt;
155b3a13 190 return sec;
e5a1845f
NK
191 }
192 ++cnt;
193 }
194
155b3a13 195 return NULL;
e5a1845f
NK
196}
197
/*
 * Iterate over the @nr_entries relocations held in @reldata.
 *
 * @pos receives the return value of gelf_getrel()/gelf_getrela() for the
 * current @idx, and @pos_mem is the storage passed to that call.  The getter
 * is also called once with @idx == @nr_entries when the loop ends.
 */
#define elf_section__for_each_rel(reldata, pos, pos_mem, idx, nr_entries)	\
	for (idx = 0, pos = gelf_getrel(reldata, 0, &pos_mem);			\
	     idx < nr_entries;							\
	     ++idx, pos = gelf_getrel(reldata, idx, &pos_mem))

#define elf_section__for_each_rela(reldata, pos, pos_mem, idx, nr_entries)	\
	for (idx = 0, pos = gelf_getrela(reldata, 0, &pos_mem);			\
	     idx < nr_entries;							\
	     ++idx, pos = gelf_getrela(reldata, idx, &pos_mem))
207
208/*
209 * We need to check if we have a .dynsym, so that we can handle the
210 * .plt, synthesizing its symbols, that aren't on the symtabs (be it
211 * .dynsym or .symtab).
212 * And always look at the original dso, not at debuginfo packages, that
213 * have the PLT data stripped out (shdr_rel_plt.sh_type == SHT_NOBITS).
214 */
a44f605b 215int dso__synthesize_plt_symbols(struct dso *dso, struct symsrc *ss, struct map *map,
e5a1845f
NK
216 symbol_filter_t filter)
217{
218 uint32_t nr_rel_entries, idx;
219 GElf_Sym sym;
220 u64 plt_offset;
221 GElf_Shdr shdr_plt;
222 struct symbol *f;
223 GElf_Shdr shdr_rel_plt, shdr_dynsym;
224 Elf_Data *reldata, *syms, *symstrs;
225 Elf_Scn *scn_plt_rel, *scn_symstrs, *scn_dynsym;
226 size_t dynsym_idx;
227 GElf_Ehdr ehdr;
228 char sympltname[1024];
229 Elf *elf;
a44f605b 230 int nr = 0, symidx, err = 0;
e5a1845f 231
f47b58b7
DA
232 if (!ss->dynsym)
233 return 0;
234
a44f605b
CS
235 elf = ss->elf;
236 ehdr = ss->ehdr;
e5a1845f 237
a44f605b
CS
238 scn_dynsym = ss->dynsym;
239 shdr_dynsym = ss->dynshdr;
240 dynsym_idx = ss->dynsym_idx;
e5a1845f 241
e5a1845f
NK
242 if (scn_dynsym == NULL)
243 goto out_elf_end;
244
245 scn_plt_rel = elf_section_by_name(elf, &ehdr, &shdr_rel_plt,
246 ".rela.plt", NULL);
247 if (scn_plt_rel == NULL) {
248 scn_plt_rel = elf_section_by_name(elf, &ehdr, &shdr_rel_plt,
249 ".rel.plt", NULL);
250 if (scn_plt_rel == NULL)
251 goto out_elf_end;
252 }
253
254 err = -1;
255
256 if (shdr_rel_plt.sh_link != dynsym_idx)
257 goto out_elf_end;
258
259 if (elf_section_by_name(elf, &ehdr, &shdr_plt, ".plt", NULL) == NULL)
260 goto out_elf_end;
261
262 /*
263 * Fetch the relocation section to find the idxes to the GOT
264 * and the symbols in the .dynsym they refer to.
265 */
266 reldata = elf_getdata(scn_plt_rel, NULL);
267 if (reldata == NULL)
268 goto out_elf_end;
269
270 syms = elf_getdata(scn_dynsym, NULL);
271 if (syms == NULL)
272 goto out_elf_end;
273
274 scn_symstrs = elf_getscn(elf, shdr_dynsym.sh_link);
275 if (scn_symstrs == NULL)
276 goto out_elf_end;
277
278 symstrs = elf_getdata(scn_symstrs, NULL);
279 if (symstrs == NULL)
280 goto out_elf_end;
281
52f9ddba
CS
282 if (symstrs->d_size == 0)
283 goto out_elf_end;
284
e5a1845f
NK
285 nr_rel_entries = shdr_rel_plt.sh_size / shdr_rel_plt.sh_entsize;
286 plt_offset = shdr_plt.sh_offset;
287
288 if (shdr_rel_plt.sh_type == SHT_RELA) {
289 GElf_Rela pos_mem, *pos;
290
291 elf_section__for_each_rela(reldata, pos, pos_mem, idx,
292 nr_rel_entries) {
293 symidx = GELF_R_SYM(pos->r_info);
294 plt_offset += shdr_plt.sh_entsize;
295 gelf_getsym(syms, symidx, &sym);
296 snprintf(sympltname, sizeof(sympltname),
297 "%s@plt", elf_sym__name(&sym, symstrs));
298
299 f = symbol__new(plt_offset, shdr_plt.sh_entsize,
300 STB_GLOBAL, sympltname);
301 if (!f)
302 goto out_elf_end;
303
304 if (filter && filter(map, f))
305 symbol__delete(f);
306 else {
307 symbols__insert(&dso->symbols[map->type], f);
308 ++nr;
309 }
310 }
311 } else if (shdr_rel_plt.sh_type == SHT_REL) {
312 GElf_Rel pos_mem, *pos;
313 elf_section__for_each_rel(reldata, pos, pos_mem, idx,
314 nr_rel_entries) {
315 symidx = GELF_R_SYM(pos->r_info);
316 plt_offset += shdr_plt.sh_entsize;
317 gelf_getsym(syms, symidx, &sym);
318 snprintf(sympltname, sizeof(sympltname),
319 "%s@plt", elf_sym__name(&sym, symstrs));
320
321 f = symbol__new(plt_offset, shdr_plt.sh_entsize,
322 STB_GLOBAL, sympltname);
323 if (!f)
324 goto out_elf_end;
325
326 if (filter && filter(map, f))
327 symbol__delete(f);
328 else {
329 symbols__insert(&dso->symbols[map->type], f);
330 ++nr;
331 }
332 }
333 }
334
335 err = 0;
336out_elf_end:
e5a1845f
NK
337 if (err == 0)
338 return nr;
e5a1845f
NK
339 pr_debug("%s: problems reading %s PLT info.\n",
340 __func__, dso->long_name);
341 return 0;
342}
343
/*
 * Round @n up to the next multiple of 4, the alignment used for note name
 * and descriptor data.
 */
#define NOTE_ALIGN(n)	(((n) + 3) & ~3U)
348
349static int elf_read_build_id(Elf *elf, void *bf, size_t size)
350{
351 int err = -1;
352 GElf_Ehdr ehdr;
353 GElf_Shdr shdr;
354 Elf_Data *data;
355 Elf_Scn *sec;
356 Elf_Kind ek;
357 void *ptr;
358
359 if (size < BUILD_ID_SIZE)
360 goto out;
361
362 ek = elf_kind(elf);
363 if (ek != ELF_K_ELF)
364 goto out;
365
366 if (gelf_getehdr(elf, &ehdr) == NULL) {
367 pr_err("%s: cannot get elf header.\n", __func__);
368 goto out;
369 }
370
371 /*
372 * Check following sections for notes:
373 * '.note.gnu.build-id'
374 * '.notes'
375 * '.note' (VDSO specific)
376 */
377 do {
378 sec = elf_section_by_name(elf, &ehdr, &shdr,
379 ".note.gnu.build-id", NULL);
380 if (sec)
381 break;
382
383 sec = elf_section_by_name(elf, &ehdr, &shdr,
384 ".notes", NULL);
385 if (sec)
386 break;
387
388 sec = elf_section_by_name(elf, &ehdr, &shdr,
389 ".note", NULL);
390 if (sec)
391 break;
392
393 return err;
394
395 } while (0);
396
397 data = elf_getdata(sec, NULL);
398 if (data == NULL)
399 goto out;
400
401 ptr = data->d_buf;
402 while (ptr < (data->d_buf + data->d_size)) {
403 GElf_Nhdr *nhdr = ptr;
404 size_t namesz = NOTE_ALIGN(nhdr->n_namesz),
405 descsz = NOTE_ALIGN(nhdr->n_descsz);
406 const char *name;
407
408 ptr += sizeof(*nhdr);
409 name = ptr;
410 ptr += namesz;
411 if (nhdr->n_type == NT_GNU_BUILD_ID &&
412 nhdr->n_namesz == sizeof("GNU")) {
413 if (memcmp(name, "GNU", sizeof("GNU")) == 0) {
414 size_t sz = min(size, descsz);
415 memcpy(bf, ptr, sz);
416 memset(bf + sz, 0, size - sz);
417 err = descsz;
418 break;
419 }
420 }
421 ptr += descsz;
422 }
423
424out:
425 return err;
426}
427
428int filename__read_build_id(const char *filename, void *bf, size_t size)
429{
430 int fd, err = -1;
431 Elf *elf;
432
433 if (size < BUILD_ID_SIZE)
434 goto out;
435
436 fd = open(filename, O_RDONLY);
437 if (fd < 0)
438 goto out;
439
440 elf = elf_begin(fd, PERF_ELF_C_READ_MMAP, NULL);
441 if (elf == NULL) {
442 pr_debug2("%s: cannot read %s ELF file.\n", __func__, filename);
443 goto out_close;
444 }
445
446 err = elf_read_build_id(elf, bf, size);
447
448 elf_end(elf);
449out_close:
450 close(fd);
451out:
452 return err;
453}
454
455int sysfs__read_build_id(const char *filename, void *build_id, size_t size)
456{
457 int fd, err = -1;
458
459 if (size < BUILD_ID_SIZE)
460 goto out;
461
462 fd = open(filename, O_RDONLY);
463 if (fd < 0)
464 goto out;
465
466 while (1) {
467 char bf[BUFSIZ];
468 GElf_Nhdr nhdr;
469 size_t namesz, descsz;
470
471 if (read(fd, &nhdr, sizeof(nhdr)) != sizeof(nhdr))
472 break;
473
474 namesz = NOTE_ALIGN(nhdr.n_namesz);
475 descsz = NOTE_ALIGN(nhdr.n_descsz);
476 if (nhdr.n_type == NT_GNU_BUILD_ID &&
477 nhdr.n_namesz == sizeof("GNU")) {
478 if (read(fd, bf, namesz) != (ssize_t)namesz)
479 break;
480 if (memcmp(bf, "GNU", sizeof("GNU")) == 0) {
481 size_t sz = min(descsz, size);
482 if (read(fd, build_id, sz) == (ssize_t)sz) {
483 memset(build_id + sz, 0, size - sz);
484 err = 0;
485 break;
486 }
487 } else if (read(fd, bf, descsz) != (ssize_t)descsz)
488 break;
489 } else {
490 int n = namesz + descsz;
491 if (read(fd, bf, n) != n)
492 break;
493 }
494 }
495 close(fd);
496out:
497 return err;
498}
499
500int filename__read_debuglink(const char *filename, char *debuglink,
501 size_t size)
502{
503 int fd, err = -1;
504 Elf *elf;
505 GElf_Ehdr ehdr;
506 GElf_Shdr shdr;
507 Elf_Data *data;
508 Elf_Scn *sec;
509 Elf_Kind ek;
510
511 fd = open(filename, O_RDONLY);
512 if (fd < 0)
513 goto out;
514
515 elf = elf_begin(fd, PERF_ELF_C_READ_MMAP, NULL);
516 if (elf == NULL) {
517 pr_debug2("%s: cannot read %s ELF file.\n", __func__, filename);
518 goto out_close;
519 }
520
521 ek = elf_kind(elf);
522 if (ek != ELF_K_ELF)
784f3390 523 goto out_elf_end;
e5a1845f
NK
524
525 if (gelf_getehdr(elf, &ehdr) == NULL) {
526 pr_err("%s: cannot get elf header.\n", __func__);
784f3390 527 goto out_elf_end;
e5a1845f
NK
528 }
529
530 sec = elf_section_by_name(elf, &ehdr, &shdr,
531 ".gnu_debuglink", NULL);
532 if (sec == NULL)
784f3390 533 goto out_elf_end;
e5a1845f
NK
534
535 data = elf_getdata(sec, NULL);
536 if (data == NULL)
784f3390 537 goto out_elf_end;
e5a1845f
NK
538
539 /* the start of this section is a zero-terminated string */
540 strncpy(debuglink, data->d_buf, size);
541
0d3dc5e8
SE
542 err = 0;
543
784f3390 544out_elf_end:
e5a1845f 545 elf_end(elf);
e5a1845f
NK
546out_close:
547 close(fd);
548out:
549 return err;
550}
551
552static int dso__swap_init(struct dso *dso, unsigned char eidata)
553{
554 static unsigned int const endian = 1;
555
556 dso->needs_swap = DSO_SWAP__NO;
557
558 switch (eidata) {
559 case ELFDATA2LSB:
560 /* We are big endian, DSO is little endian. */
561 if (*(unsigned char const *)&endian != 1)
562 dso->needs_swap = DSO_SWAP__YES;
563 break;
564
565 case ELFDATA2MSB:
566 /* We are little endian, DSO is big endian. */
567 if (*(unsigned char const *)&endian != 0)
568 dso->needs_swap = DSO_SWAP__YES;
569 break;
570
571 default:
572 pr_err("unrecognized DSO data encoding %d\n", eidata);
573 return -EINVAL;
574 }
575
576 return 0;
577}
578
c00c48fc
NK
579static int decompress_kmodule(struct dso *dso, const char *name,
580 enum dso_binary_type type)
581{
914f85c4 582 int fd = -1;
c00c48fc 583 char tmpbuf[] = "/tmp/perf-kmod-XXXXXX";
914f85c4 584 struct kmod_path m;
c00c48fc 585
0b064f43
NK
586 if (type != DSO_BINARY_TYPE__SYSTEM_PATH_KMODULE_COMP &&
587 type != DSO_BINARY_TYPE__GUEST_KMODULE_COMP &&
588 type != DSO_BINARY_TYPE__BUILD_ID_CACHE)
c00c48fc
NK
589 return -1;
590
914f85c4
JO
591 if (type == DSO_BINARY_TYPE__BUILD_ID_CACHE)
592 name = dso->long_name;
593
594 if (kmod_path__parse_ext(&m, name) || !m.comp)
595 return -1;
c00c48fc
NK
596
597 fd = mkstemp(tmpbuf);
18425f13
ACM
598 if (fd < 0) {
599 dso->load_errno = errno;
914f85c4 600 goto out;
18425f13 601 }
c00c48fc 602
914f85c4 603 if (!decompress_to_file(m.ext, name, fd)) {
18425f13 604 dso->load_errno = DSO_LOAD_ERRNO__DECOMPRESSION_FAILURE;
c00c48fc
NK
605 close(fd);
606 fd = -1;
607 }
608
609 unlink(tmpbuf);
610
914f85c4
JO
611out:
612 free(m.ext);
c00c48fc
NK
613 return fd;
614}
615
3aafe5ae
CS
616bool symsrc__possibly_runtime(struct symsrc *ss)
617{
618 return ss->dynsym || ss->opdsec;
619}
620
d26cd12b
CS
621bool symsrc__has_symtab(struct symsrc *ss)
622{
623 return ss->symtab != NULL;
624}
b68e2f91
CS
625
626void symsrc__destroy(struct symsrc *ss)
627{
74cf249d 628 zfree(&ss->name);
b68e2f91
CS
629 elf_end(ss->elf);
630 close(ss->fd);
631}
632
d2332098
NR
633bool __weak elf__needs_adjust_symbols(GElf_Ehdr ehdr)
634{
635 return ehdr.e_type == ET_EXEC || ehdr.e_type == ET_REL;
636}
637
b68e2f91
CS
638int symsrc__init(struct symsrc *ss, struct dso *dso, const char *name,
639 enum dso_binary_type type)
e5a1845f 640{
e5a1845f 641 int err = -1;
e5a1845f 642 GElf_Ehdr ehdr;
e5a1845f 643 Elf *elf;
b68e2f91
CS
644 int fd;
645
18425f13 646 if (dso__needs_decompress(dso)) {
c00c48fc 647 fd = decompress_kmodule(dso, name, type);
18425f13
ACM
648 if (fd < 0)
649 return -1;
650 } else {
c00c48fc 651 fd = open(name, O_RDONLY);
18425f13
ACM
652 if (fd < 0) {
653 dso->load_errno = errno;
654 return -1;
655 }
656 }
e5a1845f
NK
657
658 elf = elf_begin(fd, PERF_ELF_C_READ_MMAP, NULL);
659 if (elf == NULL) {
660 pr_debug("%s: cannot read %s ELF file.\n", __func__, name);
18425f13 661 dso->load_errno = DSO_LOAD_ERRNO__INVALID_ELF;
e5a1845f
NK
662 goto out_close;
663 }
664
665 if (gelf_getehdr(elf, &ehdr) == NULL) {
18425f13 666 dso->load_errno = DSO_LOAD_ERRNO__INVALID_ELF;
e5a1845f
NK
667 pr_debug("%s: cannot get elf header.\n", __func__);
668 goto out_elf_end;
669 }
670
18425f13
ACM
671 if (dso__swap_init(dso, ehdr.e_ident[EI_DATA])) {
672 dso->load_errno = DSO_LOAD_ERRNO__INTERNAL_ERROR;
e5a1845f 673 goto out_elf_end;
18425f13 674 }
e5a1845f
NK
675
676 /* Always reject images with a mismatched build-id: */
677 if (dso->has_build_id) {
678 u8 build_id[BUILD_ID_SIZE];
679
18425f13
ACM
680 if (elf_read_build_id(elf, build_id, BUILD_ID_SIZE) < 0) {
681 dso->load_errno = DSO_LOAD_ERRNO__CANNOT_READ_BUILDID;
e5a1845f 682 goto out_elf_end;
18425f13 683 }
e5a1845f 684
18425f13 685 if (!dso__build_id_equal(dso, build_id)) {
468f3d29 686 pr_debug("%s: build id mismatch for %s.\n", __func__, name);
18425f13 687 dso->load_errno = DSO_LOAD_ERRNO__MISMATCHING_BUILDID;
e5a1845f 688 goto out_elf_end;
18425f13 689 }
e5a1845f
NK
690 }
691
c6d8f2a4
AH
692 ss->is_64_bit = (gelf_getclass(elf) == ELFCLASS64);
693
b68e2f91
CS
694 ss->symtab = elf_section_by_name(elf, &ehdr, &ss->symshdr, ".symtab",
695 NULL);
696 if (ss->symshdr.sh_type != SHT_SYMTAB)
697 ss->symtab = NULL;
698
699 ss->dynsym_idx = 0;
700 ss->dynsym = elf_section_by_name(elf, &ehdr, &ss->dynshdr, ".dynsym",
701 &ss->dynsym_idx);
702 if (ss->dynshdr.sh_type != SHT_DYNSYM)
703 ss->dynsym = NULL;
704
705 ss->opdidx = 0;
706 ss->opdsec = elf_section_by_name(elf, &ehdr, &ss->opdshdr, ".opd",
707 &ss->opdidx);
708 if (ss->opdshdr.sh_type != SHT_PROGBITS)
709 ss->opdsec = NULL;
710
711 if (dso->kernel == DSO_TYPE_USER) {
712 GElf_Shdr shdr;
713 ss->adjust_symbols = (ehdr.e_type == ET_EXEC ||
0131c4ec 714 ehdr.e_type == ET_REL ||
51682dc7 715 dso__is_vdso(dso) ||
b68e2f91
CS
716 elf_section_by_name(elf, &ehdr, &shdr,
717 ".gnu.prelink_undo",
718 NULL) != NULL);
719 } else {
d2332098 720 ss->adjust_symbols = elf__needs_adjust_symbols(ehdr);
b68e2f91
CS
721 }
722
723 ss->name = strdup(name);
18425f13
ACM
724 if (!ss->name) {
725 dso->load_errno = errno;
b68e2f91 726 goto out_elf_end;
18425f13 727 }
b68e2f91
CS
728
729 ss->elf = elf;
730 ss->fd = fd;
731 ss->ehdr = ehdr;
732 ss->type = type;
733
734 return 0;
735
736out_elf_end:
737 elf_end(elf);
738out_close:
739 close(fd);
740 return err;
741}
742
39b12f78
AH
743/**
744 * ref_reloc_sym_not_found - has kernel relocation symbol been found.
745 * @kmap: kernel maps and relocation reference symbol
746 *
747 * This function returns %true if we are dealing with the kernel maps and the
748 * relocation reference symbol has not yet been found. Otherwise %false is
749 * returned.
750 */
751static bool ref_reloc_sym_not_found(struct kmap *kmap)
752{
753 return kmap && kmap->ref_reloc_sym && kmap->ref_reloc_sym->name &&
754 !kmap->ref_reloc_sym->unrelocated_addr;
755}
756
757/**
758 * ref_reloc - kernel relocation offset.
759 * @kmap: kernel maps and relocation reference symbol
760 *
761 * This function returns the offset of kernel addresses as determined by using
762 * the relocation reference symbol i.e. if the kernel has not been relocated
763 * then the return value is zero.
764 */
765static u64 ref_reloc(struct kmap *kmap)
766{
767 if (kmap && kmap->ref_reloc_sym &&
768 kmap->ref_reloc_sym->unrelocated_addr)
769 return kmap->ref_reloc_sym->addr -
770 kmap->ref_reloc_sym->unrelocated_addr;
771 return 0;
772}
773
763122ad
AK
774static bool want_demangle(bool is_kernel_sym)
775{
776 return is_kernel_sym ? symbol_conf.demangle_kernel : symbol_conf.demangle;
777}
778
c50fc0a4
AM
779void __weak arch__elf_sym_adjust(GElf_Sym *sym __maybe_unused) { }
780
261360b6
CS
781int dso__load_sym(struct dso *dso, struct map *map,
782 struct symsrc *syms_ss, struct symsrc *runtime_ss,
d26cd12b 783 symbol_filter_t filter, int kmodule)
b68e2f91
CS
784{
785 struct kmap *kmap = dso->kernel ? map__kmap(map) : NULL;
ba92732e 786 struct map_groups *kmaps = kmap ? map__kmaps(map) : NULL;
b68e2f91
CS
787 struct map *curr_map = map;
788 struct dso *curr_dso = dso;
789 Elf_Data *symstrs, *secstrs;
790 uint32_t nr_syms;
791 int err = -1;
792 uint32_t idx;
793 GElf_Ehdr ehdr;
261360b6 794 GElf_Shdr shdr;
b68e2f91
CS
795 Elf_Data *syms, *opddata = NULL;
796 GElf_Sym sym;
261360b6 797 Elf_Scn *sec, *sec_strndx;
b68e2f91
CS
798 Elf *elf;
799 int nr = 0;
39b12f78 800 bool remap_kernel = false, adjust_kernel_syms = false;
b68e2f91 801
ba92732e
WN
802 if (kmap && !kmaps)
803 return -1;
804
261360b6 805 dso->symtab_type = syms_ss->type;
c6d8f2a4 806 dso->is_64_bit = syms_ss->is_64_bit;
0131c4ec
AH
807 dso->rel = syms_ss->ehdr.e_type == ET_REL;
808
809 /*
810 * Modules may already have symbols from kallsyms, but those symbols
811 * have the wrong values for the dso maps, so remove them.
812 */
813 if (kmodule && syms_ss->symtab)
814 symbols__delete(&dso->symbols[map->type]);
005f9294 815
261360b6 816 if (!syms_ss->symtab) {
d0b0d040
AB
817 /*
818 * If the vmlinux is stripped, fail so we will fall back
819 * to using kallsyms. The vmlinux runtime symbols aren't
820 * of much use.
821 */
822 if (dso->kernel)
823 goto out_elf_end;
824
261360b6
CS
825 syms_ss->symtab = syms_ss->dynsym;
826 syms_ss->symshdr = syms_ss->dynshdr;
d26cd12b
CS
827 }
828
261360b6
CS
829 elf = syms_ss->elf;
830 ehdr = syms_ss->ehdr;
831 sec = syms_ss->symtab;
832 shdr = syms_ss->symshdr;
b68e2f91 833
261360b6
CS
834 if (runtime_ss->opdsec)
835 opddata = elf_rawdata(runtime_ss->opdsec, NULL);
e5a1845f
NK
836
837 syms = elf_getdata(sec, NULL);
838 if (syms == NULL)
839 goto out_elf_end;
840
841 sec = elf_getscn(elf, shdr.sh_link);
842 if (sec == NULL)
843 goto out_elf_end;
844
845 symstrs = elf_getdata(sec, NULL);
846 if (symstrs == NULL)
847 goto out_elf_end;
848
f247fb81 849 sec_strndx = elf_getscn(runtime_ss->elf, runtime_ss->ehdr.e_shstrndx);
e5a1845f
NK
850 if (sec_strndx == NULL)
851 goto out_elf_end;
852
853 secstrs = elf_getdata(sec_strndx, NULL);
854 if (secstrs == NULL)
855 goto out_elf_end;
856
857 nr_syms = shdr.sh_size / shdr.sh_entsize;
858
859 memset(&sym, 0, sizeof(sym));
39b12f78
AH
860
861 /*
862 * The kernel relocation symbol is needed in advance in order to adjust
863 * kernel maps correctly.
864 */
865 if (ref_reloc_sym_not_found(kmap)) {
866 elf_symtab__for_each_symbol(syms, nr_syms, idx, sym) {
867 const char *elf_name = elf_sym__name(&sym, symstrs);
868
869 if (strcmp(elf_name, kmap->ref_reloc_sym->name))
870 continue;
871 kmap->ref_reloc_sym->unrelocated_addr = sym.st_value;
9176753d
AH
872 map->reloc = kmap->ref_reloc_sym->addr -
873 kmap->ref_reloc_sym->unrelocated_addr;
39b12f78
AH
874 break;
875 }
876 }
877
f0ee3b46
AH
878 /*
879 * Handle any relocation of vdso necessary because older kernels
880 * attempted to prelink vdso to its virtual address.
881 */
882 if (dso__is_vdso(dso)) {
883 GElf_Shdr tshdr;
884
885 if (elf_section_by_name(elf, &ehdr, &tshdr, ".text", NULL))
886 map->reloc = map->start - tshdr.sh_addr + tshdr.sh_offset;
887 }
888
39b12f78
AH
889 dso->adjust_symbols = runtime_ss->adjust_symbols || ref_reloc(kmap);
890 /*
891 * Initial kernel and module mappings do not map to the dso. For
892 * function mappings, flag the fixups.
893 */
894 if (map->type == MAP__FUNCTION && (dso->kernel || kmodule)) {
895 remap_kernel = true;
896 adjust_kernel_syms = dso->adjust_symbols;
897 }
e5a1845f
NK
898 elf_symtab__for_each_symbol(syms, nr_syms, idx, sym) {
899 struct symbol *f;
900 const char *elf_name = elf_sym__name(&sym, symstrs);
901 char *demangled = NULL;
902 int is_label = elf_sym__is_label(&sym);
903 const char *section_name;
261360b6 904 bool used_opd = false;
e5a1845f 905
e5a1845f
NK
906 if (!is_label && !elf_sym__is_a(&sym, map->type))
907 continue;
908
909 /* Reject ARM ELF "mapping symbols": these aren't unique and
910 * don't identify functions, so will confuse the profile
911 * output: */
4886f2ca
VK
912 if (ehdr.e_machine == EM_ARM || ehdr.e_machine == EM_AARCH64) {
913 if (elf_name[0] == '$' && strchr("adtx", elf_name[1])
914 && (elf_name[2] == '\0' || elf_name[2] == '.'))
e5a1845f
NK
915 continue;
916 }
917
261360b6
CS
918 if (runtime_ss->opdsec && sym.st_shndx == runtime_ss->opdidx) {
919 u32 offset = sym.st_value - syms_ss->opdshdr.sh_addr;
e5a1845f
NK
920 u64 *opd = opddata->d_buf + offset;
921 sym.st_value = DSO__SWAP(dso, u64, *opd);
261360b6
CS
922 sym.st_shndx = elf_addr_to_index(runtime_ss->elf,
923 sym.st_value);
924 used_opd = true;
e5a1845f 925 }
3843b05d
NK
926 /*
927 * When loading symbols in a data mapping, ABS symbols (which
928 * has a value of SHN_ABS in its st_shndx) failed at
929 * elf_getscn(). And it marks the loading as a failure so
930 * already loaded symbols cannot be fixed up.
931 *
932 * I'm not sure what should be done. Just ignore them for now.
933 * - Namhyung Kim
934 */
935 if (sym.st_shndx == SHN_ABS)
936 continue;
e5a1845f 937
261360b6 938 sec = elf_getscn(runtime_ss->elf, sym.st_shndx);
e5a1845f
NK
939 if (!sec)
940 goto out_elf_end;
941
942 gelf_getshdr(sec, &shdr);
943
944 if (is_label && !elf_sec__is_a(&shdr, secstrs, map->type))
945 continue;
946
947 section_name = elf_sec__name(&shdr, secstrs);
948
949 /* On ARM, symbols for thumb functions have 1 added to
950 * the symbol address as a flag - remove it */
951 if ((ehdr.e_machine == EM_ARM) &&
952 (map->type == MAP__FUNCTION) &&
953 (sym.st_value & 1))
954 --sym.st_value;
955
c50fc0a4
AM
956 arch__elf_sym_adjust(&sym);
957
39b12f78 958 if (dso->kernel || kmodule) {
e5a1845f
NK
959 char dso_name[PATH_MAX];
960
39b12f78
AH
961 /* Adjust symbol to map to file offset */
962 if (adjust_kernel_syms)
963 sym.st_value -= shdr.sh_addr - shdr.sh_offset;
964
e5a1845f
NK
965 if (strcmp(section_name,
966 (curr_dso->short_name +
967 dso->short_name_len)) == 0)
968 goto new_symbol;
969
970 if (strcmp(section_name, ".text") == 0) {
39b12f78
AH
971 /*
972 * The initial kernel mapping is based on
973 * kallsyms and identity maps. Overwrite it to
974 * map to the kernel dso.
975 */
976 if (remap_kernel && dso->kernel) {
977 remap_kernel = false;
978 map->start = shdr.sh_addr +
979 ref_reloc(kmap);
980 map->end = map->start + shdr.sh_size;
981 map->pgoff = shdr.sh_offset;
982 map->map_ip = map__map_ip;
983 map->unmap_ip = map__unmap_ip;
984 /* Ensure maps are correctly ordered */
ba92732e 985 if (kmaps) {
84c2cafa 986 map__get(map);
ba92732e
WN
987 map_groups__remove(kmaps, map);
988 map_groups__insert(kmaps, map);
84c2cafa 989 map__put(map);
ba92732e 990 }
39b12f78
AH
991 }
992
0131c4ec
AH
993 /*
994 * The initial module mapping is based on
995 * /proc/modules mapped to offset zero.
996 * Overwrite it to map to the module dso.
997 */
998 if (remap_kernel && kmodule) {
999 remap_kernel = false;
1000 map->pgoff = shdr.sh_offset;
1001 }
1002
e5a1845f
NK
1003 curr_map = map;
1004 curr_dso = dso;
1005 goto new_symbol;
1006 }
1007
0131c4ec
AH
1008 if (!kmap)
1009 goto new_symbol;
1010
e5a1845f
NK
1011 snprintf(dso_name, sizeof(dso_name),
1012 "%s%s", dso->short_name, section_name);
1013
ba92732e 1014 curr_map = map_groups__find_by_name(kmaps, map->type, dso_name);
e5a1845f
NK
1015 if (curr_map == NULL) {
1016 u64 start = sym.st_value;
1017
1018 if (kmodule)
1019 start += map->start + shdr.sh_offset;
1020
1021 curr_dso = dso__new(dso_name);
1022 if (curr_dso == NULL)
1023 goto out_elf_end;
1024 curr_dso->kernel = dso->kernel;
1025 curr_dso->long_name = dso->long_name;
1026 curr_dso->long_name_len = dso->long_name_len;
1027 curr_map = map__new2(start, curr_dso,
1028 map->type);
e7a7865c 1029 dso__put(curr_dso);
e5a1845f 1030 if (curr_map == NULL) {
e5a1845f
NK
1031 goto out_elf_end;
1032 }
39b12f78
AH
1033 if (adjust_kernel_syms) {
1034 curr_map->start = shdr.sh_addr +
1035 ref_reloc(kmap);
1036 curr_map->end = curr_map->start +
1037 shdr.sh_size;
1038 curr_map->pgoff = shdr.sh_offset;
1039 } else {
1040 curr_map->map_ip = identity__map_ip;
1041 curr_map->unmap_ip = identity__map_ip;
1042 }
e5a1845f 1043 curr_dso->symtab_type = dso->symtab_type;
ba92732e 1044 map_groups__insert(kmaps, curr_map);
e7a7865c
MH
1045 /*
1046 * Add it before we drop the referece to curr_map,
1047 * i.e. while we still are sure to have a reference
1048 * to this DSO via curr_map->dso.
1049 */
1050 dsos__add(&map->groups->machine->dsos, curr_dso);
8d5c340d
MH
1051 /* kmaps already got it */
1052 map__put(curr_map);
e5a1845f
NK
1053 dso__set_loaded(curr_dso, map->type);
1054 } else
1055 curr_dso = curr_map->dso;
1056
1057 goto new_symbol;
1058 }
1059
261360b6
CS
1060 if ((used_opd && runtime_ss->adjust_symbols)
1061 || (!used_opd && syms_ss->adjust_symbols)) {
e5a1845f
NK
1062 pr_debug4("%s: adjusting symbol: st_value: %#" PRIx64 " "
1063 "sh_addr: %#" PRIx64 " sh_offset: %#" PRIx64 "\n", __func__,
1064 (u64)sym.st_value, (u64)shdr.sh_addr,
1065 (u64)shdr.sh_offset);
1066 sym.st_value -= shdr.sh_addr - shdr.sh_offset;
1067 }
950b8354 1068new_symbol:
e5a1845f
NK
1069 /*
1070 * We need to figure out if the object was created from C++ sources
1071 * DWARF DW_compile_unit has this, but we don't always have access
1072 * to it...
1073 */
763122ad 1074 if (want_demangle(dso->kernel || kmodule)) {
e71e7945
NK
1075 int demangle_flags = DMGL_NO_OPTS;
1076 if (verbose)
1077 demangle_flags = DMGL_PARAMS | DMGL_ANSI;
1078
1079 demangled = bfd_demangle(NULL, elf_name, demangle_flags);
328ccdac
NK
1080 if (demangled != NULL)
1081 elf_name = demangled;
1082 }
e5a1845f
NK
1083 f = symbol__new(sym.st_value, sym.st_size,
1084 GELF_ST_BIND(sym.st_info), elf_name);
1085 free(demangled);
1086 if (!f)
1087 goto out_elf_end;
1088
1089 if (filter && filter(curr_map, f))
1090 symbol__delete(f);
1091 else {
1092 symbols__insert(&curr_dso->symbols[curr_map->type], f);
1093 nr++;
1094 }
1095 }
1096
1097 /*
1098 * For misannotated, zeroed, ASM function sizes.
1099 */
1100 if (nr > 0) {
680d926a
NK
1101 if (!symbol_conf.allow_aliases)
1102 symbols__fixup_duplicate(&dso->symbols[map->type]);
e5a1845f
NK
1103 symbols__fixup_end(&dso->symbols[map->type]);
1104 if (kmap) {
1105 /*
1106 * We need to fixup this here too because we create new
1107 * maps here, for things like vsyscall sections.
1108 */
ba92732e 1109 __map_groups__fixup_end(kmaps, map->type);
e5a1845f
NK
1110 }
1111 }
1112 err = nr;
1113out_elf_end:
e5a1845f
NK
1114 return err;
1115}
1116
8e0cf965
AH
1117static int elf_read_maps(Elf *elf, bool exe, mapfn_t mapfn, void *data)
1118{
1119 GElf_Phdr phdr;
1120 size_t i, phdrnum;
1121 int err;
1122 u64 sz;
1123
1124 if (elf_getphdrnum(elf, &phdrnum))
1125 return -1;
1126
1127 for (i = 0; i < phdrnum; i++) {
1128 if (gelf_getphdr(elf, i, &phdr) == NULL)
1129 return -1;
1130 if (phdr.p_type != PT_LOAD)
1131 continue;
1132 if (exe) {
1133 if (!(phdr.p_flags & PF_X))
1134 continue;
1135 } else {
1136 if (!(phdr.p_flags & PF_R))
1137 continue;
1138 }
1139 sz = min(phdr.p_memsz, phdr.p_filesz);
1140 if (!sz)
1141 continue;
1142 err = mapfn(phdr.p_vaddr, sz, phdr.p_offset, data);
1143 if (err)
1144 return err;
1145 }
1146 return 0;
1147}
1148
1149int file__read_maps(int fd, bool exe, mapfn_t mapfn, void *data,
1150 bool *is_64_bit)
1151{
1152 int err;
1153 Elf *elf;
1154
1155 elf = elf_begin(fd, PERF_ELF_C_READ_MMAP, NULL);
1156 if (elf == NULL)
1157 return -1;
1158
1159 if (is_64_bit)
1160 *is_64_bit = (gelf_getclass(elf) == ELFCLASS64);
1161
1162 err = elf_read_maps(elf, exe, mapfn, data);
1163
1164 elf_end(elf);
1165 return err;
1166}
1167
2b5b8bb2
AH
1168enum dso_type dso__type_fd(int fd)
1169{
1170 enum dso_type dso_type = DSO__TYPE_UNKNOWN;
1171 GElf_Ehdr ehdr;
1172 Elf_Kind ek;
1173 Elf *elf;
1174
1175 elf = elf_begin(fd, PERF_ELF_C_READ_MMAP, NULL);
1176 if (elf == NULL)
1177 goto out;
1178
1179 ek = elf_kind(elf);
1180 if (ek != ELF_K_ELF)
1181 goto out_end;
1182
1183 if (gelf_getclass(elf) == ELFCLASS64) {
1184 dso_type = DSO__TYPE_64BIT;
1185 goto out_end;
1186 }
1187
1188 if (gelf_getehdr(elf, &ehdr) == NULL)
1189 goto out_end;
1190
1191 if (ehdr.e_machine == EM_X86_64)
1192 dso_type = DSO__TYPE_X32BIT;
1193 else
1194 dso_type = DSO__TYPE_32BIT;
1195out_end:
1196 elf_end(elf);
1197out:
1198 return dso_type;
1199}
1200
afba19d9
AH
1201static int copy_bytes(int from, off_t from_offs, int to, off_t to_offs, u64 len)
1202{
1203 ssize_t r;
1204 size_t n;
1205 int err = -1;
1206 char *buf = malloc(page_size);
1207
1208 if (buf == NULL)
1209 return -1;
1210
1211 if (lseek(to, to_offs, SEEK_SET) != to_offs)
1212 goto out;
1213
1214 if (lseek(from, from_offs, SEEK_SET) != from_offs)
1215 goto out;
1216
1217 while (len) {
1218 n = page_size;
1219 if (len < n)
1220 n = len;
1221 /* Use read because mmap won't work on proc files */
1222 r = read(from, buf, n);
1223 if (r < 0)
1224 goto out;
1225 if (!r)
1226 break;
1227 n = r;
1228 r = write(to, buf, n);
1229 if (r < 0)
1230 goto out;
1231 if ((size_t)r != n)
1232 goto out;
1233 len -= n;
1234 }
1235
1236 err = 0;
1237out:
1238 free(buf);
1239 return err;
1240}
1241
1242struct kcore {
1243 int fd;
1244 int elfclass;
1245 Elf *elf;
1246 GElf_Ehdr ehdr;
1247};
1248
1249static int kcore__open(struct kcore *kcore, const char *filename)
1250{
1251 GElf_Ehdr *ehdr;
1252
1253 kcore->fd = open(filename, O_RDONLY);
1254 if (kcore->fd == -1)
1255 return -1;
1256
1257 kcore->elf = elf_begin(kcore->fd, ELF_C_READ, NULL);
1258 if (!kcore->elf)
1259 goto out_close;
1260
1261 kcore->elfclass = gelf_getclass(kcore->elf);
1262 if (kcore->elfclass == ELFCLASSNONE)
1263 goto out_end;
1264
1265 ehdr = gelf_getehdr(kcore->elf, &kcore->ehdr);
1266 if (!ehdr)
1267 goto out_end;
1268
1269 return 0;
1270
1271out_end:
1272 elf_end(kcore->elf);
1273out_close:
1274 close(kcore->fd);
1275 return -1;
1276}
1277
1278static int kcore__init(struct kcore *kcore, char *filename, int elfclass,
1279 bool temp)
1280{
afba19d9
AH
1281 kcore->elfclass = elfclass;
1282
1283 if (temp)
1284 kcore->fd = mkstemp(filename);
1285 else
1286 kcore->fd = open(filename, O_WRONLY | O_CREAT | O_EXCL, 0400);
1287 if (kcore->fd == -1)
1288 return -1;
1289
1290 kcore->elf = elf_begin(kcore->fd, ELF_C_WRITE, NULL);
1291 if (!kcore->elf)
1292 goto out_close;
1293
1294 if (!gelf_newehdr(kcore->elf, elfclass))
1295 goto out_end;
1296
b5cabbcb 1297 memset(&kcore->ehdr, 0, sizeof(GElf_Ehdr));
afba19d9
AH
1298
1299 return 0;
1300
1301out_end:
1302 elf_end(kcore->elf);
1303out_close:
1304 close(kcore->fd);
1305 unlink(filename);
1306 return -1;
1307}
1308
1309static void kcore__close(struct kcore *kcore)
1310{
1311 elf_end(kcore->elf);
1312 close(kcore->fd);
1313}
1314
1315static int kcore__copy_hdr(struct kcore *from, struct kcore *to, size_t count)
1316{
1317 GElf_Ehdr *ehdr = &to->ehdr;
1318 GElf_Ehdr *kehdr = &from->ehdr;
1319
1320 memcpy(ehdr->e_ident, kehdr->e_ident, EI_NIDENT);
1321 ehdr->e_type = kehdr->e_type;
1322 ehdr->e_machine = kehdr->e_machine;
1323 ehdr->e_version = kehdr->e_version;
1324 ehdr->e_entry = 0;
1325 ehdr->e_shoff = 0;
1326 ehdr->e_flags = kehdr->e_flags;
1327 ehdr->e_phnum = count;
1328 ehdr->e_shentsize = 0;
1329 ehdr->e_shnum = 0;
1330 ehdr->e_shstrndx = 0;
1331
1332 if (from->elfclass == ELFCLASS32) {
1333 ehdr->e_phoff = sizeof(Elf32_Ehdr);
1334 ehdr->e_ehsize = sizeof(Elf32_Ehdr);
1335 ehdr->e_phentsize = sizeof(Elf32_Phdr);
1336 } else {
1337 ehdr->e_phoff = sizeof(Elf64_Ehdr);
1338 ehdr->e_ehsize = sizeof(Elf64_Ehdr);
1339 ehdr->e_phentsize = sizeof(Elf64_Phdr);
1340 }
1341
1342 if (!gelf_update_ehdr(to->elf, ehdr))
1343 return -1;
1344
1345 if (!gelf_newphdr(to->elf, count))
1346 return -1;
1347
1348 return 0;
1349}
1350
1351static int kcore__add_phdr(struct kcore *kcore, int idx, off_t offset,
1352 u64 addr, u64 len)
1353{
b5cabbcb
AH
1354 GElf_Phdr phdr = {
1355 .p_type = PT_LOAD,
1356 .p_flags = PF_R | PF_W | PF_X,
1357 .p_offset = offset,
1358 .p_vaddr = addr,
1359 .p_paddr = 0,
1360 .p_filesz = len,
1361 .p_memsz = len,
1362 .p_align = page_size,
1363 };
1364
1365 if (!gelf_update_phdr(kcore->elf, idx, &phdr))
afba19d9
AH
1366 return -1;
1367
1368 return 0;
1369}
1370
1371static off_t kcore__write(struct kcore *kcore)
1372{
1373 return elf_update(kcore->elf, ELF_C_WRITE);
1374}
1375
fc1b691d
AH
1376struct phdr_data {
1377 off_t offset;
1378 u64 addr;
1379 u64 len;
1380};
1381
1382struct kcore_copy_info {
1383 u64 stext;
1384 u64 etext;
1385 u64 first_symbol;
1386 u64 last_symbol;
1387 u64 first_module;
1388 u64 last_module_symbol;
1389 struct phdr_data kernel_map;
1390 struct phdr_data modules_map;
1391};
1392
1393static int kcore_copy__process_kallsyms(void *arg, const char *name, char type,
1394 u64 start)
1395{
1396 struct kcore_copy_info *kci = arg;
1397
1398 if (!symbol_type__is_a(type, MAP__FUNCTION))
1399 return 0;
1400
1401 if (strchr(name, '[')) {
1402 if (start > kci->last_module_symbol)
1403 kci->last_module_symbol = start;
1404 return 0;
1405 }
1406
1407 if (!kci->first_symbol || start < kci->first_symbol)
1408 kci->first_symbol = start;
1409
1410 if (!kci->last_symbol || start > kci->last_symbol)
1411 kci->last_symbol = start;
1412
1413 if (!strcmp(name, "_stext")) {
1414 kci->stext = start;
1415 return 0;
1416 }
1417
1418 if (!strcmp(name, "_etext")) {
1419 kci->etext = start;
1420 return 0;
1421 }
1422
1423 return 0;
1424}
1425
1426static int kcore_copy__parse_kallsyms(struct kcore_copy_info *kci,
1427 const char *dir)
1428{
1429 char kallsyms_filename[PATH_MAX];
1430
1431 scnprintf(kallsyms_filename, PATH_MAX, "%s/kallsyms", dir);
1432
1433 if (symbol__restricted_filename(kallsyms_filename, "/proc/kallsyms"))
1434 return -1;
1435
1436 if (kallsyms__parse(kallsyms_filename, kci,
1437 kcore_copy__process_kallsyms) < 0)
1438 return -1;
1439
1440 return 0;
1441}
1442
1443static int kcore_copy__process_modules(void *arg,
1444 const char *name __maybe_unused,
1445 u64 start)
1446{
1447 struct kcore_copy_info *kci = arg;
1448
1449 if (!kci->first_module || start < kci->first_module)
1450 kci->first_module = start;
1451
1452 return 0;
1453}
1454
1455static int kcore_copy__parse_modules(struct kcore_copy_info *kci,
1456 const char *dir)
1457{
1458 char modules_filename[PATH_MAX];
1459
1460 scnprintf(modules_filename, PATH_MAX, "%s/modules", dir);
1461
1462 if (symbol__restricted_filename(modules_filename, "/proc/modules"))
1463 return -1;
1464
1465 if (modules__parse(modules_filename, kci,
1466 kcore_copy__process_modules) < 0)
1467 return -1;
1468
1469 return 0;
1470}
1471
1472static void kcore_copy__map(struct phdr_data *p, u64 start, u64 end, u64 pgoff,
1473 u64 s, u64 e)
1474{
1475 if (p->addr || s < start || s >= end)
1476 return;
1477
1478 p->addr = s;
1479 p->offset = (s - start) + pgoff;
1480 p->len = e < end ? e - s : end - s;
1481}
1482
1483static int kcore_copy__read_map(u64 start, u64 len, u64 pgoff, void *data)
1484{
1485 struct kcore_copy_info *kci = data;
1486 u64 end = start + len;
1487
1488 kcore_copy__map(&kci->kernel_map, start, end, pgoff, kci->stext,
1489 kci->etext);
1490
1491 kcore_copy__map(&kci->modules_map, start, end, pgoff, kci->first_module,
1492 kci->last_module_symbol);
1493
1494 return 0;
1495}
1496
1497static int kcore_copy__read_maps(struct kcore_copy_info *kci, Elf *elf)
1498{
1499 if (elf_read_maps(elf, true, kcore_copy__read_map, kci) < 0)
1500 return -1;
1501
1502 return 0;
1503}
1504
1505static int kcore_copy__calc_maps(struct kcore_copy_info *kci, const char *dir,
1506 Elf *elf)
1507{
1508 if (kcore_copy__parse_kallsyms(kci, dir))
1509 return -1;
1510
1511 if (kcore_copy__parse_modules(kci, dir))
1512 return -1;
1513
1514 if (kci->stext)
1515 kci->stext = round_down(kci->stext, page_size);
1516 else
1517 kci->stext = round_down(kci->first_symbol, page_size);
1518
1519 if (kci->etext) {
1520 kci->etext = round_up(kci->etext, page_size);
1521 } else if (kci->last_symbol) {
1522 kci->etext = round_up(kci->last_symbol, page_size);
1523 kci->etext += page_size;
1524 }
1525
1526 kci->first_module = round_down(kci->first_module, page_size);
1527
1528 if (kci->last_module_symbol) {
1529 kci->last_module_symbol = round_up(kci->last_module_symbol,
1530 page_size);
1531 kci->last_module_symbol += page_size;
1532 }
1533
1534 if (!kci->stext || !kci->etext)
1535 return -1;
1536
1537 if (kci->first_module && !kci->last_module_symbol)
1538 return -1;
1539
1540 return kcore_copy__read_maps(kci, elf);
1541}
1542
1543static int kcore_copy__copy_file(const char *from_dir, const char *to_dir,
1544 const char *name)
1545{
1546 char from_filename[PATH_MAX];
1547 char to_filename[PATH_MAX];
1548
1549 scnprintf(from_filename, PATH_MAX, "%s/%s", from_dir, name);
1550 scnprintf(to_filename, PATH_MAX, "%s/%s", to_dir, name);
1551
1552 return copyfile_mode(from_filename, to_filename, 0400);
1553}
1554
1555static int kcore_copy__unlink(const char *dir, const char *name)
1556{
1557 char filename[PATH_MAX];
1558
1559 scnprintf(filename, PATH_MAX, "%s/%s", dir, name);
1560
1561 return unlink(filename);
1562}
1563
1564static int kcore_copy__compare_fds(int from, int to)
1565{
1566 char *buf_from;
1567 char *buf_to;
1568 ssize_t ret;
1569 size_t len;
1570 int err = -1;
1571
1572 buf_from = malloc(page_size);
1573 buf_to = malloc(page_size);
1574 if (!buf_from || !buf_to)
1575 goto out;
1576
1577 while (1) {
1578 /* Use read because mmap won't work on proc files */
1579 ret = read(from, buf_from, page_size);
1580 if (ret < 0)
1581 goto out;
1582
1583 if (!ret)
1584 break;
1585
1586 len = ret;
1587
1588 if (readn(to, buf_to, len) != (int)len)
1589 goto out;
1590
1591 if (memcmp(buf_from, buf_to, len))
1592 goto out;
1593 }
1594
1595 err = 0;
1596out:
1597 free(buf_to);
1598 free(buf_from);
1599 return err;
1600}
1601
/*
 * Open both files read-only and compare them with kcore_copy__compare_fds().
 * Returns -1 if either file cannot be opened, otherwise the comparison result.
 */
static int kcore_copy__compare_files(const char *from_filename,
				     const char *to_filename)
{
	int from_fd, to_fd;
	int ret = -1;

	from_fd = open(from_filename, O_RDONLY);
	if (from_fd < 0)
		return -1;

	to_fd = open(to_filename, O_RDONLY);
	if (to_fd >= 0) {
		ret = kcore_copy__compare_fds(from_fd, to_fd);
		close(to_fd);
	}

	close(from_fd);
	return ret;
}
1622
1623static int kcore_copy__compare_file(const char *from_dir, const char *to_dir,
1624 const char *name)
1625{
1626 char from_filename[PATH_MAX];
1627 char to_filename[PATH_MAX];
1628
1629 scnprintf(from_filename, PATH_MAX, "%s/%s", from_dir, name);
1630 scnprintf(to_filename, PATH_MAX, "%s/%s", to_dir, name);
1631
1632 return kcore_copy__compare_files(from_filename, to_filename);
1633}
1634
1635/**
1636 * kcore_copy - copy kallsyms, modules and kcore from one directory to another.
1637 * @from_dir: from directory
1638 * @to_dir: to directory
1639 *
1640 * This function copies kallsyms, modules and kcore files from one directory to
1641 * another. kallsyms and modules are copied entirely. Only code segments are
1642 * copied from kcore. It is assumed that two segments suffice: one for the
1643 * kernel proper and one for all the modules. The code segments are determined
1644 * from kallsyms and modules files. The kernel map starts at _stext or the
1645 * lowest function symbol, and ends at _etext or the highest function symbol.
1646 * The module map starts at the lowest module address and ends at the highest
1647 * module symbol. Start addresses are rounded down to the nearest page. End
1648 * addresses are rounded up to the nearest page. An extra page is added to the
1649 * highest kernel symbol and highest module symbol to, hopefully, encompass that
1650 * symbol too. Because it contains only code sections, the resulting kcore is
1651 * unusual. One significant peculiarity is that the mapping (start -> pgoff)
1652 * is not the same for the kernel map and the modules map. That happens because
1653 * the data is copied adjacently whereas the original kcore has gaps. Finally,
1654 * kallsyms and modules files are compared with their copies to check that
1655 * modules have not been loaded or unloaded while the copies were taking place.
1656 *
1657 * Return: %0 on success, %-1 on failure.
1658 */
1659int kcore_copy(const char *from_dir, const char *to_dir)
1660{
1661 struct kcore kcore;
1662 struct kcore extract;
1663 size_t count = 2;
1664 int idx = 0, err = -1;
1665 off_t offset = page_size, sz, modules_offset = 0;
1666 struct kcore_copy_info kci = { .stext = 0, };
1667 char kcore_filename[PATH_MAX];
1668 char extract_filename[PATH_MAX];
1669
1670 if (kcore_copy__copy_file(from_dir, to_dir, "kallsyms"))
1671 return -1;
1672
1673 if (kcore_copy__copy_file(from_dir, to_dir, "modules"))
1674 goto out_unlink_kallsyms;
1675
1676 scnprintf(kcore_filename, PATH_MAX, "%s/kcore", from_dir);
1677 scnprintf(extract_filename, PATH_MAX, "%s/kcore", to_dir);
1678
1679 if (kcore__open(&kcore, kcore_filename))
1680 goto out_unlink_modules;
1681
1682 if (kcore_copy__calc_maps(&kci, from_dir, kcore.elf))
1683 goto out_kcore_close;
1684
1685 if (kcore__init(&extract, extract_filename, kcore.elfclass, false))
1686 goto out_kcore_close;
1687
1688 if (!kci.modules_map.addr)
1689 count -= 1;
1690
1691 if (kcore__copy_hdr(&kcore, &extract, count))
1692 goto out_extract_close;
1693
1694 if (kcore__add_phdr(&extract, idx++, offset, kci.kernel_map.addr,
1695 kci.kernel_map.len))
1696 goto out_extract_close;
1697
1698 if (kci.modules_map.addr) {
1699 modules_offset = offset + kci.kernel_map.len;
1700 if (kcore__add_phdr(&extract, idx, modules_offset,
1701 kci.modules_map.addr, kci.modules_map.len))
1702 goto out_extract_close;
1703 }
1704
1705 sz = kcore__write(&extract);
1706 if (sz < 0 || sz > offset)
1707 goto out_extract_close;
1708
1709 if (copy_bytes(kcore.fd, kci.kernel_map.offset, extract.fd, offset,
1710 kci.kernel_map.len))
1711 goto out_extract_close;
1712
1713 if (modules_offset && copy_bytes(kcore.fd, kci.modules_map.offset,
1714 extract.fd, modules_offset,
1715 kci.modules_map.len))
1716 goto out_extract_close;
1717
1718 if (kcore_copy__compare_file(from_dir, to_dir, "modules"))
1719 goto out_extract_close;
1720
1721 if (kcore_copy__compare_file(from_dir, to_dir, "kallsyms"))
1722 goto out_extract_close;
1723
1724 err = 0;
1725
1726out_extract_close:
1727 kcore__close(&extract);
1728 if (err)
1729 unlink(extract_filename);
1730out_kcore_close:
1731 kcore__close(&kcore);
1732out_unlink_modules:
1733 if (err)
1734 kcore_copy__unlink(to_dir, "modules");
1735out_unlink_kallsyms:
1736 if (err)
1737 kcore_copy__unlink(to_dir, "kallsyms");
1738
1739 return err;
1740}
1741
afba19d9
AH
1742int kcore_extract__create(struct kcore_extract *kce)
1743{
1744 struct kcore kcore;
1745 struct kcore extract;
1746 size_t count = 1;
1747 int idx = 0, err = -1;
1748 off_t offset = page_size, sz;
1749
1750 if (kcore__open(&kcore, kce->kcore_filename))
1751 return -1;
1752
1753 strcpy(kce->extract_filename, PERF_KCORE_EXTRACT);
1754 if (kcore__init(&extract, kce->extract_filename, kcore.elfclass, true))
1755 goto out_kcore_close;
1756
1757 if (kcore__copy_hdr(&kcore, &extract, count))
1758 goto out_extract_close;
1759
1760 if (kcore__add_phdr(&extract, idx, offset, kce->addr, kce->len))
1761 goto out_extract_close;
1762
1763 sz = kcore__write(&extract);
1764 if (sz < 0 || sz > offset)
1765 goto out_extract_close;
1766
1767 if (copy_bytes(kcore.fd, kce->offs, extract.fd, offset, kce->len))
1768 goto out_extract_close;
1769
1770 err = 0;
1771
1772out_extract_close:
1773 kcore__close(&extract);
1774 if (err)
1775 unlink(kce->extract_filename);
1776out_kcore_close:
1777 kcore__close(&kcore);
1778
1779 return err;
1780}
1781
1782void kcore_extract__delete(struct kcore_extract *kce)
1783{
1784 unlink(kce->extract_filename);
1785}
1786
e5a1845f
NK
1787void symbol__elf_init(void)
1788{
1789 elf_version(EV_CURRENT);
1790}