/*
 * Fallback elf_getphdrnum(), compiled only when HAVE_ELF_GETPHDRNUM is not
 * defined. The visible part of the body fetches the ELF header with
 * gelf_getehdr().
 * NOTE(review): the remainder of the body is not visible in this excerpt;
 * presumably it stores the program header count in *dst - confirm.
 */
11 #ifndef HAVE_ELF_GETPHDRNUM
12 static int elf_getphdrnum(Elf *elf, size_t *dst)
17 ehdr = gelf_getehdr(elf, &gehdr);
/* Define NT_GNU_BUILD_ID as 3 when it has not already been defined. */
27 #ifndef NT_GNU_BUILD_ID
28 #define NT_GNU_BUILD_ID 3
32 * elf_symtab__for_each_symbol - iterate through all the symbols
34 * @syms: struct elf_symtab instance to iterate
36 * @sym: GElf_Sym iterator
/*
 * Loop header macro: sets idx to 0 and calls gelf_getsym(syms, idx, &sym)
 * before the first pass, then increments idx and calls gelf_getsym() again
 * after every pass. idx is assigned to and the address of sym is taken, so
 * both arguments must be lvalues.
 * NOTE(review): the loop condition line is not visible in this excerpt;
 * presumably it bounds idx by nr_syms - confirm.
 */
38 #define elf_symtab__for_each_symbol(syms, nr_syms, idx, sym) \
39 for (idx = 0, gelf_getsym(syms, idx, &sym);\
41 idx++, gelf_getsym(syms, idx, &sym))
/* Return the type field that GELF_ST_TYPE() extracts from sym->st_info. */
43 static inline uint8_t elf_sym__type(const GElf_Sym *sym)
45 return GELF_ST_TYPE(sym->st_info);
/*
 * Non-zero when sym has type STT_FUNC and its section index is not
 * SHN_UNDEF.
 * NOTE(review): the embedded line numbers skip one line between the two
 * visible conditions, so a further condition may exist - confirm.
 */
48 static inline int elf_sym__is_function(const GElf_Sym *sym)
50 return elf_sym__type(sym) == STT_FUNC &&
52 sym->st_shndx != SHN_UNDEF;
/*
 * True when sym has type STT_OBJECT and its section index is not SHN_UNDEF.
 * NOTE(review): the embedded line numbers skip one line between the two
 * visible conditions, so a further condition may exist - confirm.
 */
55 static inline bool elf_sym__is_object(const GElf_Sym *sym)
57 return elf_sym__type(sym) == STT_OBJECT &&
59 sym->st_shndx != SHN_UNDEF;
/*
 * Non-zero when sym has type STT_NOTYPE and its section index is neither
 * SHN_UNDEF nor SHN_ABS.
 * NOTE(review): the embedded line numbers skip one line after the type
 * test, so a further condition may exist - confirm.
 */
62 static inline int elf_sym__is_label(const GElf_Sym *sym)
64 return elf_sym__type(sym) == STT_NOTYPE &&
66 sym->st_shndx != SHN_UNDEF &&
67 sym->st_shndx != SHN_ABS;
/*
 * Classify sym for the given map type by delegating to
 * elf_sym__is_function() or elf_sym__is_object().
 * NOTE(review): the selection logic (which @type value picks which helper,
 * and any default result) is not visible in this excerpt - confirm.
 */
70 static bool elf_sym__is_a(GElf_Sym *sym, enum map_type type)
74 return elf_sym__is_function(sym);
76 return elf_sym__is_object(sym);
/*
 * Return a pointer into the string table buffer symstrs->d_buf at offset
 * sym->st_name. No bounds check against the buffer size is made here.
 */
82 static inline const char *elf_sym__name(const GElf_Sym *sym,
83 const Elf_Data *symstrs)
85 return symstrs->d_buf + sym->st_name;
/*
 * Return a pointer into the section-name string buffer secstrs->d_buf at
 * offset shdr->sh_name. No bounds check against the buffer size is made here.
 */
88 static inline const char *elf_sec__name(const GElf_Shdr *shdr,
89 const Elf_Data *secstrs)
91 return secstrs->d_buf + shdr->sh_name;
/*
 * Non-zero when the section name contains the substring "text" anywhere
 * (strstr match, not an exact comparison).
 */
94 static inline int elf_sec__is_text(const GElf_Shdr *shdr,
95 const Elf_Data *secstrs)
97 return strstr(elf_sec__name(shdr, secstrs), "text") != NULL;
/*
 * True when the section name contains the substring "data" anywhere
 * (strstr match, not an exact comparison).
 */
100 static inline bool elf_sec__is_data(const GElf_Shdr *shdr,
101 const Elf_Data *secstrs)
103 return strstr(elf_sec__name(shdr, secstrs), "data") != NULL;
/*
 * Classify a section by delegating to elf_sec__is_text() or
 * elf_sec__is_data().
 * NOTE(review): the remaining parameter(s) and the selection logic are not
 * visible in this excerpt - confirm which value picks which helper.
 */
106 static bool elf_sec__is_a(GElf_Shdr *shdr, Elf_Data *secstrs,
111 return elf_sec__is_text(shdr, secstrs);
113 return elf_sec__is_data(shdr, secstrs);
/*
 * Walk the sections of @elf with elf_nextscn() and test whether @addr lies
 * in the half-open range [sh_addr, sh_addr + sh_size) of each one.
 * NOTE(review): what is returned on a hit or a miss is not visible in this
 * excerpt. The result of gelf_getshdr() is not checked on the visible line,
 * so shdr may be stale or uninitialized if that call fails - confirm.
 */
119 static size_t elf_addr_to_index(Elf *elf, GElf_Addr addr)
125 while ((sec = elf_nextscn(elf, sec)) != NULL) {
126 gelf_getshdr(sec, &shdr);
128 if ((addr >= shdr.sh_addr) &&
129 (addr < (shdr.sh_addr + shdr.sh_size)))
/*
 * Search @elf for a section whose name equals @name.
 *
 * The section-header string table (index ep->e_shstrndx) is probed with
 * elf_rawdata() first. Each section header is then read into @shp and its
 * name, looked up with elf_strptr(), is compared to @name with strcmp().
 *
 * NOTE(review): the trailing parameter(s), the return statements and the
 * action taken on a match are not visible in this excerpt. The result of
 * elf_strptr() reaches strcmp() without a visible NULL check, and the result
 * of gelf_getshdr() is not checked on the visible line - confirm.
 */
138 static Elf_Scn *elf_section_by_name(Elf *elf, GElf_Ehdr *ep,
139 GElf_Shdr *shp, const char *name,
145 /* Elf is corrupted/truncated, avoid calling elf_strptr. */
146 if (!elf_rawdata(elf_getscn(elf, ep->e_shstrndx), NULL))
149 while ((sec = elf_nextscn(elf, sec)) != NULL) {
152 gelf_getshdr(sec, shp);
153 str = elf_strptr(elf, ep->e_shstrndx, shp->sh_name);
154 if (!strcmp(name, str)) {
/*
 * Loop header macro over REL entries: sets idx to 0 and loads entry 0 with
 * gelf_getrel() into pos_mem, assigning the returned pointer to pos; after
 * each pass idx is incremented and the next entry is loaded the same way.
 * NOTE(review): the loop condition line is not visible in this excerpt;
 * presumably it bounds idx by nr_entries - confirm.
 */
165 #define elf_section__for_each_rel(reldata, pos, pos_mem, idx, nr_entries) \
166 for (idx = 0, pos = gelf_getrel(reldata, 0, &pos_mem); \
168 ++idx, pos = gelf_getrel(reldata, idx, &pos_mem))
/*
 * Loop header macro over RELA entries: sets idx to 0 and loads entry 0 with
 * gelf_getrela() into pos_mem, assigning the returned pointer to pos; after
 * each pass idx is incremented and the next entry is loaded the same way.
 * NOTE(review): the loop condition line is not visible in this excerpt;
 * presumably it bounds idx by nr_entries - confirm.
 */
170 #define elf_section__for_each_rela(reldata, pos, pos_mem, idx, nr_entries) \
171 for (idx = 0, pos = gelf_getrela(reldata, 0, &pos_mem); \
173 ++idx, pos = gelf_getrela(reldata, idx, &pos_mem))
176 * We need to check if we have a .dynsym, so that we can handle the
177 * .plt, synthesizing its symbols, that aren't on the symtabs (be it
178 * .dynsym or .symtab).
179 * And always look at the original dso, not at debuginfo packages, that
180 * have the PLT data stripped out (shdr_rel_plt.sh_type == SHT_NOBITS).
/*
 * Create "<name>@plt" symbols for the PLT entries of @dso.
 *
 * Visible flow: the .dynsym section, its header and its index are taken from
 * @ss. The PLT relocation section is looked up by name (a second lookup is
 * made when the first returns NULL) and its sh_link is compared with the
 * .dynsym index. The ".plt" section header is fetched, then the relocation
 * data, the .dynsym data and the string table named by shdr_dynsym.sh_link.
 * The relocation entries are walked as SHT_RELA or SHT_REL. For each entry
 * the symbol index comes from GELF_R_SYM(r_info), plt_offset advances by
 * shdr_plt.sh_entsize, and symbol__new() creates a STB_GLOBAL symbol named
 * "%s@plt" that is inserted into dso->symbols[map->type]. When @filter is
 * set it is called with (map, f) before the insert.
 *
 * NOTE(review): return values, error labels, and the action taken when
 * @filter returns non-zero are not visible in this excerpt.
 */
182 int dso__synthesize_plt_symbols(struct dso *dso, struct symsrc *ss, struct map *map,
183 symbol_filter_t filter)
185 uint32_t nr_rel_entries, idx;
190 GElf_Shdr shdr_rel_plt, shdr_dynsym;
191 Elf_Data *reldata, *syms, *symstrs;
192 Elf_Scn *scn_plt_rel, *scn_symstrs, *scn_dynsym;
195 char sympltname[1024];
197 int nr = 0, symidx, err = 0;
205 scn_dynsym = ss->dynsym;
206 shdr_dynsym = ss->dynshdr;
207 dynsym_idx = ss->dynsym_idx;
209 if (scn_dynsym == NULL)
212 scn_plt_rel = elf_section_by_name(elf, &ehdr, &shdr_rel_plt,
214 if (scn_plt_rel == NULL) {
215 scn_plt_rel = elf_section_by_name(elf, &ehdr, &shdr_rel_plt,
217 if (scn_plt_rel == NULL)
223 if (shdr_rel_plt.sh_link != dynsym_idx)
226 if (elf_section_by_name(elf, &ehdr, &shdr_plt, ".plt", NULL) == NULL)
230 * Fetch the relocation section to find the idxes to the GOT
231 * and the symbols in the .dynsym they refer to.
233 reldata = elf_getdata(scn_plt_rel, NULL);
237 syms = elf_getdata(scn_dynsym, NULL);
241 scn_symstrs = elf_getscn(elf, shdr_dynsym.sh_link);
242 if (scn_symstrs == NULL)
245 symstrs = elf_getdata(scn_symstrs, NULL);
249 if (symstrs->d_size == 0)
/* NOTE(review): no visible guard against shdr_rel_plt.sh_entsize == 0 before this division - confirm. */
252 nr_rel_entries = shdr_rel_plt.sh_size / shdr_rel_plt.sh_entsize;
253 plt_offset = shdr_plt.sh_offset;
255 if (shdr_rel_plt.sh_type == SHT_RELA) {
256 GElf_Rela pos_mem, *pos;
258 elf_section__for_each_rela(reldata, pos, pos_mem, idx,
260 symidx = GELF_R_SYM(pos->r_info);
261 plt_offset += shdr_plt.sh_entsize;
262 gelf_getsym(syms, symidx, &sym);
263 snprintf(sympltname, sizeof(sympltname),
264 "%s@plt", elf_sym__name(&sym, symstrs));
266 f = symbol__new(plt_offset, shdr_plt.sh_entsize,
267 STB_GLOBAL, sympltname);
271 if (filter && filter(map, f))
274 symbols__insert(&dso->symbols[map->type], f);
278 } else if (shdr_rel_plt.sh_type == SHT_REL) {
279 GElf_Rel pos_mem, *pos;
280 elf_section__for_each_rel(reldata, pos, pos_mem, idx,
282 symidx = GELF_R_SYM(pos->r_info);
283 plt_offset += shdr_plt.sh_entsize;
284 gelf_getsym(syms, symidx, &sym);
285 snprintf(sympltname, sizeof(sympltname),
286 "%s@plt", elf_sym__name(&sym, symstrs));
288 f = symbol__new(plt_offset, shdr_plt.sh_entsize,
289 STB_GLOBAL, sympltname);
293 if (filter && filter(map, f))
296 symbols__insert(&dso->symbols[map->type], f);
306 pr_debug("%s: problems reading %s PLT info.\n",
307 __func__, dso->long_name);
312 * Align offset to 4 bytes as needed for note name and descriptor data.
/* Round n up to the next multiple of 4: add 3, then clear the two low bits by masking with -4U. */
314 #define NOTE_ALIGN(n) (((n) + 3) & -4U)
/*
 * Search @elf for a GNU build-id note and deliver it through @bf.
 *
 * @size is compared against BUILD_ID_SIZE first. Note sections are looked up
 * by name with elf_section_by_name(), beginning with ".note.gnu.build-id";
 * two further lookups follow (their names are not all visible here). The
 * section data is then walked note by note. A note matches when n_type is
 * NT_GNU_BUILD_ID, n_namesz equals sizeof("GNU") and the name bytes equal
 * "GNU". On a match sz = min(size, descsz) is computed and the bytes of @bf
 * from sz up to @size are zeroed.
 *
 * NOTE(review): the copy of the descriptor into @bf, the return values and
 * the pointer advance between notes are not visible in this excerpt.
 */
316 static int elf_read_build_id(Elf *elf, void *bf, size_t size)
326 if (size < BUILD_ID_SIZE)
333 if (gelf_getehdr(elf, &ehdr) == NULL) {
334 pr_err("%s: cannot get elf header.\n", __func__);
339 * Check following sections for notes:
340 * '.note.gnu.build-id'
342 * '.note' (VDSO specific)
345 sec = elf_section_by_name(elf, &ehdr, &shdr,
346 ".note.gnu.build-id", NULL);
350 sec = elf_section_by_name(elf, &ehdr, &shdr,
355 sec = elf_section_by_name(elf, &ehdr, &shdr,
364 data = elf_getdata(sec, NULL);
369 while (ptr < (data->d_buf + data->d_size)) {
/* NOTE(review): the note header is read through ptr with no visible check that a whole GElf_Nhdr fits before the end of the buffer - confirm. */
370 GElf_Nhdr *nhdr = ptr;
371 size_t namesz = NOTE_ALIGN(nhdr->n_namesz),
372 descsz = NOTE_ALIGN(nhdr->n_descsz);
375 ptr += sizeof(*nhdr);
378 if (nhdr->n_type == NT_GNU_BUILD_ID &&
379 nhdr->n_namesz == sizeof("GNU")) {
380 if (memcmp(name, "GNU", sizeof("GNU")) == 0) {
381 size_t sz = min(size, descsz);
383 memset(bf + sz, 0, size - sz);
/*
 * Read the build-id of the ELF file @filename into @bf.
 *
 * @size is compared against BUILD_ID_SIZE first. The file is opened
 * read-only, an Elf handle is created with
 * elf_begin(fd, PERF_ELF_C_READ_MMAP, NULL), and the work is delegated to
 * elf_read_build_id(); its result is stored in err.
 *
 * NOTE(review): the error returns and the cleanup of elf/fd are not visible
 * in this excerpt.
 */
395 int filename__read_build_id(const char *filename, void *bf, size_t size)
400 if (size < BUILD_ID_SIZE)
403 fd = open(filename, O_RDONLY);
407 elf = elf_begin(fd, PERF_ELF_C_READ_MMAP, NULL);
409 pr_debug2("%s: cannot read %s ELF file.\n", __func__, filename);
413 err = elf_read_build_id(elf, bf, size);
/*
 * Read a GNU build-id from a file containing raw ELF notes.
 *
 * @size is compared against BUILD_ID_SIZE first. The file is opened
 * read-only and parsed sequentially with read(): a note header, then the
 * 4-byte-aligned name. When n_type is NT_GNU_BUILD_ID, n_namesz equals
 * sizeof("GNU") and the name equals "GNU", min(descsz, size) bytes are read
 * into @build_id and the rest of @build_id up to @size is zeroed. When only
 * the name differs, the descriptor is consumed into bf. Other notes are
 * consumed by reading namesz + descsz bytes into bf.
 *
 * NOTE(review): the declaration and size of bf, the loop construct and the
 * return values are not visible in this excerpt. The reads into bf are sized
 * by namesz/descsz taken from the file, with no visible bound against the
 * size of bf - confirm. n is an int while namesz and descsz are size_t.
 */
422 int sysfs__read_build_id(const char *filename, void *build_id, size_t size)
426 if (size < BUILD_ID_SIZE)
429 fd = open(filename, O_RDONLY);
436 size_t namesz, descsz;
438 if (read(fd, &nhdr, sizeof(nhdr)) != sizeof(nhdr))
441 namesz = NOTE_ALIGN(nhdr.n_namesz);
442 descsz = NOTE_ALIGN(nhdr.n_descsz);
443 if (nhdr.n_type == NT_GNU_BUILD_ID &&
444 nhdr.n_namesz == sizeof("GNU")) {
445 if (read(fd, bf, namesz) != (ssize_t)namesz)
447 if (memcmp(bf, "GNU", sizeof("GNU")) == 0) {
448 size_t sz = min(descsz, size);
449 if (read(fd, build_id, sz) == (ssize_t)sz) {
450 memset(build_id + sz, 0, size - sz);
454 } else if (read(fd, bf, descsz) != (ssize_t)descsz)
457 int n = namesz + descsz;
458 if (read(fd, bf, n) != n)
/*
 * Copy the contents of the ".gnu_debuglink" section of @filename into
 * @debuglink.
 *
 * The file is opened read-only, an Elf handle is created with
 * elf_begin(fd, PERF_ELF_C_READ_MMAP, NULL), the ELF header is fetched, the
 * section is located with elf_section_by_name() and its data is copied with
 * strncpy().
 *
 * NOTE(review): the trailing parameter(s), return values and cleanup are not
 * visible in this excerpt.
 */
467 int filename__read_debuglink(const char *filename, char *debuglink,
478 fd = open(filename, O_RDONLY);
482 elf = elf_begin(fd, PERF_ELF_C_READ_MMAP, NULL);
484 pr_debug2("%s: cannot read %s ELF file.\n", __func__, filename);
492 if (gelf_getehdr(elf, &ehdr) == NULL) {
493 pr_err("%s: cannot get elf header.\n", __func__);
497 sec = elf_section_by_name(elf, &ehdr, &shdr,
498 ".gnu_debuglink", NULL);
502 data = elf_getdata(sec, NULL);
/* NOTE(review): strncpy() leaves debuglink unterminated when the source has no NUL within the first size bytes, and the copy is not bounded by data->d_size - confirm callers tolerate this. */
506 /* the start of this section is a zero-terminated string */
507 strncpy(debuglink, data->d_buf, size);
/*
 * Decide whether data read from @dso needs byte swapping.
 *
 * dso->needs_swap starts as DSO_SWAP__NO. Host byte order is detected by
 * inspecting the first byte of a static unsigned int holding 1: that byte is
 * 1 on a little-endian host and 0 on a big-endian host. needs_swap becomes
 * DSO_SWAP__YES when the host order differs from the order named by @eidata.
 * An unrecognized @eidata value is reported with pr_err().
 *
 * NOTE(review): the switch/case labels and the return values are not
 * visible in this excerpt.
 */
517 static int dso__swap_init(struct dso *dso, unsigned char eidata)
519 static unsigned int const endian = 1;
521 dso->needs_swap = DSO_SWAP__NO;
525 /* We are big endian, DSO is little endian. */
526 if (*(unsigned char const *)&endian != 1)
527 dso->needs_swap = DSO_SWAP__YES;
531 /* We are little endian, DSO is big endian. */
532 if (*(unsigned char const *)&endian != 0)
533 dso->needs_swap = DSO_SWAP__YES;
537 pr_err("unrecognized DSO data encoding %d\n", eidata);
/* True when @ss has a .dynsym section or an .opd section recorded (either pointer non-NULL). */
544 bool symsrc__possibly_runtime(struct symsrc *ss)
546 return ss->dynsym || ss->opdsec;
/* True when @ss has a symbol table section recorded (ss->symtab is non-NULL). */
549 bool symsrc__has_symtab(struct symsrc *ss)
551 return ss->symtab != NULL;
/*
 * NOTE(review): only the signature is visible in this excerpt; presumably
 * this releases what symsrc__init() acquired for @ss - confirm.
 */
554 void symsrc__destroy(struct symsrc *ss)
/*
 * Open the ELF file @name and populate @ss from it.
 *
 * Visible steps: open the file read-only; create an Elf handle with
 * elf_begin(fd, PERF_ELF_C_READ_MMAP, NULL); fetch the ELF header; call
 * dso__swap_init() with ehdr.e_ident[EI_DATA]; when @dso has a build-id,
 * read the build-id of the file and compare it with dso__build_id_equal();
 * look up ".symtab", ".dynsym" and ".opd" by name and compare each section
 * header type with SHT_SYMTAB, SHT_DYNSYM and SHT_PROGBITS respectively;
 * compute ss->adjust_symbols from ehdr.e_type (ET_EXEC or ET_REL), with one
 * extra section lookup for user dsos; and duplicate @name into ss->name.
 *
 * NOTE(review): the action taken when a section type does not match, the
 * error paths and the return values are not visible in this excerpt. Where
 * a lookup returns NULL, the matching section header may not have been
 * filled in before its sh_type is tested - confirm.
 */
561 int symsrc__init(struct symsrc *ss, struct dso *dso, const char *name,
562 enum dso_binary_type type)
569 fd = open(name, O_RDONLY);
573 elf = elf_begin(fd, PERF_ELF_C_READ_MMAP, NULL);
575 pr_debug("%s: cannot read %s ELF file.\n", __func__, name);
579 if (gelf_getehdr(elf, &ehdr) == NULL) {
580 pr_debug("%s: cannot get elf header.\n", __func__);
584 if (dso__swap_init(dso, ehdr.e_ident[EI_DATA]))
587 /* Always reject images with a mismatched build-id: */
588 if (dso->has_build_id) {
589 u8 build_id[BUILD_ID_SIZE];
591 if (elf_read_build_id(elf, build_id, BUILD_ID_SIZE) < 0)
594 if (!dso__build_id_equal(dso, build_id))
598 ss->symtab = elf_section_by_name(elf, &ehdr, &ss->symshdr, ".symtab",
600 if (ss->symshdr.sh_type != SHT_SYMTAB)
604 ss->dynsym = elf_section_by_name(elf, &ehdr, &ss->dynshdr, ".dynsym",
606 if (ss->dynshdr.sh_type != SHT_DYNSYM)
610 ss->opdsec = elf_section_by_name(elf, &ehdr, &ss->opdshdr, ".opd",
612 if (ss->opdshdr.sh_type != SHT_PROGBITS)
615 if (dso->kernel == DSO_TYPE_USER) {
617 ss->adjust_symbols = (ehdr.e_type == ET_EXEC ||
618 ehdr.e_type == ET_REL ||
619 elf_section_by_name(elf, &ehdr, &shdr,
623 ss->adjust_symbols = ehdr.e_type == ET_EXEC ||
624 ehdr.e_type == ET_REL;
627 ss->name = strdup(name);
646 * ref_reloc_sym_not_found - has kernel relocation symbol been found.
647 * @kmap: kernel maps and relocation reference symbol
649 * This function returns %true if we are dealing with the kernel maps and the
650 * relocation reference symbol has not yet been found. Otherwise %false is
/*
 * True only when @kmap is non-NULL, has a ref_reloc_sym with a non-NULL
 * name, and that symbol's unrelocated_addr is still zero.
 */
653 static bool ref_reloc_sym_not_found(struct kmap *kmap)
655 return kmap && kmap->ref_reloc_sym && kmap->ref_reloc_sym->name &&
656 !kmap->ref_reloc_sym->unrelocated_addr;
660 * ref_reloc - kernel relocation offset.
661 * @kmap: kernel maps and relocation reference symbol
663 * This function returns the offset of kernel addresses as determined by using
664 * the relocation reference symbol i.e. if the kernel has not been relocated
665 * then the return value is zero.
/*
 * When @kmap is non-NULL and its ref_reloc_sym has a non-zero
 * unrelocated_addr, return ref_reloc_sym->addr minus that unrelocated_addr.
 * NOTE(review): the fall-through return is not visible in this excerpt.
 */
667 static u64 ref_reloc(struct kmap *kmap)
669 if (kmap && kmap->ref_reloc_sym &&
670 kmap->ref_reloc_sym->unrelocated_addr)
671 return kmap->ref_reloc_sym->addr -
672 kmap->ref_reloc_sym->unrelocated_addr;
/*
 * Load symbols from an ELF symbol table into @dso for the map type of @map.
 *
 * Visible flow:
 *  - @syms_ss supplies the symbol table (falling back to its .dynsym when it
 *    has no .symtab); @runtime_ss supplies the .opd section and the Elf
 *    handle used for section lookups.
 *  - For kernel modules with a symtab, symbols already present for this map
 *    type are deleted first.
 *  - When the kernel relocation reference symbol has not been found yet, the
 *    symbol table is scanned for it by name and its st_value is recorded as
 *    unrelocated_addr.
 *  - Every symbol is then examined: it must be a label or match the map
 *    type; ARM mapping symbols ("$a", "$d", "$t") are tested for; symbols in
 *    .opd are resolved through the .opd data; SHN_ABS symbols are tested
 *    for; the symbol's section header is fetched.
 *  - For kernel and module dsos the symbol may be rebased to a file offset
 *    and attached to a per-section map/dso found by name or created with
 *    dso__new()/map__new2().
 *  - Otherwise st_value is adjusted by sh_addr - sh_offset when the relevant
 *    symsrc asks for it.
 *  - The name is optionally demangled, a symbol is created with
 *    symbol__new(), offered to @filter and inserted into curr_dso.
 *  - Afterwards duplicates and symbol ends are fixed up, and map ends are
 *    fixed up through kmap->kmaps.
 *
 * NOTE(review): many lines (skip/continue statements, error labels, returns,
 * several conditions) are not visible in this excerpt, so the exact action
 * taken by each test above must be confirmed against the full file.
 */
676 int dso__load_sym(struct dso *dso, struct map *map,
677 struct symsrc *syms_ss, struct symsrc *runtime_ss,
678 symbol_filter_t filter, int kmodule)
680 struct kmap *kmap = dso->kernel ? map__kmap(map) : NULL;
681 struct map *curr_map = map;
682 struct dso *curr_dso = dso;
683 Elf_Data *symstrs, *secstrs;
689 Elf_Data *syms, *opddata = NULL;
691 Elf_Scn *sec, *sec_strndx;
694 bool remap_kernel = false, adjust_kernel_syms = false;
696 dso->symtab_type = syms_ss->type;
697 dso->rel = syms_ss->ehdr.e_type == ET_REL;
700 * Modules may already have symbols from kallsyms, but those symbols
701 * have the wrong values for the dso maps, so remove them.
703 if (kmodule && syms_ss->symtab)
704 symbols__delete(&dso->symbols[map->type]);
706 if (!syms_ss->symtab) {
707 syms_ss->symtab = syms_ss->dynsym;
708 syms_ss->symshdr = syms_ss->dynshdr;
712 ehdr = syms_ss->ehdr;
713 sec = syms_ss->symtab;
714 shdr = syms_ss->symshdr;
716 if (runtime_ss->opdsec)
717 opddata = elf_rawdata(runtime_ss->opdsec, NULL);
719 syms = elf_getdata(sec, NULL);
723 sec = elf_getscn(elf, shdr.sh_link);
727 symstrs = elf_getdata(sec, NULL);
731 sec_strndx = elf_getscn(elf, ehdr.e_shstrndx);
732 if (sec_strndx == NULL)
735 secstrs = elf_getdata(sec_strndx, NULL);
/* NOTE(review): no visible guard against shdr.sh_entsize == 0 before this division - confirm. */
739 nr_syms = shdr.sh_size / shdr.sh_entsize;
741 memset(&sym, 0, sizeof(sym));
744 * The kernel relocation symbol is needed in advance in order to adjust
745 * kernel maps correctly.
747 if (ref_reloc_sym_not_found(kmap)) {
748 elf_symtab__for_each_symbol(syms, nr_syms, idx, sym) {
749 const char *elf_name = elf_sym__name(&sym, symstrs);
751 if (strcmp(elf_name, kmap->ref_reloc_sym->name))
753 kmap->ref_reloc_sym->unrelocated_addr = sym.st_value;
758 dso->adjust_symbols = runtime_ss->adjust_symbols || ref_reloc(kmap);
760 * Initial kernel and module mappings do not map to the dso. For
761 * function mappings, flag the fixups.
763 if (map->type == MAP__FUNCTION && (dso->kernel || kmodule)) {
765 adjust_kernel_syms = dso->adjust_symbols;
767 elf_symtab__for_each_symbol(syms, nr_syms, idx, sym) {
769 const char *elf_name = elf_sym__name(&sym, symstrs);
770 char *demangled = NULL;
771 int is_label = elf_sym__is_label(&sym);
772 const char *section_name;
773 bool used_opd = false;
775 if (!is_label && !elf_sym__is_a(&sym, map->type))
778 /* Reject ARM ELF "mapping symbols": these aren't unique and
779 * don't identify functions, so will confuse the profile
781 if (ehdr.e_machine == EM_ARM) {
782 if (!strcmp(elf_name, "$a") ||
783 !strcmp(elf_name, "$d") ||
784 !strcmp(elf_name, "$t"))
788 if (runtime_ss->opdsec && sym.st_shndx == runtime_ss->opdidx) {
789 u32 offset = sym.st_value - syms_ss->opdshdr.sh_addr;
/* NOTE(review): opddata comes from elf_rawdata() with no visible NULL check, and offset is not visibly bounded by the .opd data size - confirm. */
790 u64 *opd = opddata->d_buf + offset;
791 sym.st_value = DSO__SWAP(dso, u64, *opd);
792 sym.st_shndx = elf_addr_to_index(runtime_ss->elf,
797 * When loading symbols in a data mapping, ABS symbols (which
798 * has a value of SHN_ABS in its st_shndx) failed at
799 * elf_getscn(). And it marks the loading as a failure so
800 * already loaded symbols cannot be fixed up.
802 * I'm not sure what should be done. Just ignore them for now.
805 if (sym.st_shndx == SHN_ABS)
808 sec = elf_getscn(runtime_ss->elf, sym.st_shndx);
812 gelf_getshdr(sec, &shdr);
814 if (is_label && !elf_sec__is_a(&shdr, secstrs, map->type))
817 section_name = elf_sec__name(&shdr, secstrs);
819 /* On ARM, symbols for thumb functions have 1 added to
820 * the symbol address as a flag - remove it */
821 if ((ehdr.e_machine == EM_ARM) &&
822 (map->type == MAP__FUNCTION) &&
826 if (dso->kernel || kmodule) {
827 char dso_name[PATH_MAX];
829 /* Adjust symbol to map to file offset */
830 if (adjust_kernel_syms)
831 sym.st_value -= shdr.sh_addr - shdr.sh_offset;
833 if (strcmp(section_name,
834 (curr_dso->short_name +
835 dso->short_name_len)) == 0)
838 if (strcmp(section_name, ".text") == 0) {
840 * The initial kernel mapping is based on
841 * kallsyms and identity maps. Overwrite it to
842 * map to the kernel dso.
844 if (remap_kernel && dso->kernel) {
845 remap_kernel = false;
846 map->start = shdr.sh_addr +
848 map->end = map->start + shdr.sh_size;
849 map->pgoff = shdr.sh_offset;
850 map->map_ip = map__map_ip;
851 map->unmap_ip = map__unmap_ip;
852 /* Ensure maps are correctly ordered */
853 map_groups__remove(kmap->kmaps, map);
854 map_groups__insert(kmap->kmaps, map);
858 * The initial module mapping is based on
859 * /proc/modules mapped to offset zero.
860 * Overwrite it to map to the module dso.
862 if (remap_kernel && kmodule) {
863 remap_kernel = false;
864 map->pgoff = shdr.sh_offset;
875 snprintf(dso_name, sizeof(dso_name),
876 "%s%s", dso->short_name, section_name);
878 curr_map = map_groups__find_by_name(kmap->kmaps, map->type, dso_name);
879 if (curr_map == NULL) {
880 u64 start = sym.st_value;
883 start += map->start + shdr.sh_offset;
885 curr_dso = dso__new(dso_name);
886 if (curr_dso == NULL)
888 curr_dso->kernel = dso->kernel;
889 curr_dso->long_name = dso->long_name;
890 curr_dso->long_name_len = dso->long_name_len;
891 curr_map = map__new2(start, curr_dso,
893 if (curr_map == NULL) {
894 dso__delete(curr_dso);
897 if (adjust_kernel_syms) {
898 curr_map->start = shdr.sh_addr +
900 curr_map->end = curr_map->start +
902 curr_map->pgoff = shdr.sh_offset;
904 curr_map->map_ip = identity__map_ip;
905 curr_map->unmap_ip = identity__map_ip;
907 curr_dso->symtab_type = dso->symtab_type;
908 map_groups__insert(kmap->kmaps, curr_map);
909 dsos__add(&dso->node, curr_dso);
910 dso__set_loaded(curr_dso, map->type);
912 curr_dso = curr_map->dso;
917 if ((used_opd && runtime_ss->adjust_symbols)
918 || (!used_opd && syms_ss->adjust_symbols)) {
919 pr_debug4("%s: adjusting symbol: st_value: %#" PRIx64 " "
920 "sh_addr: %#" PRIx64 " sh_offset: %#" PRIx64 "\n", __func__,
921 (u64)sym.st_value, (u64)shdr.sh_addr,
922 (u64)shdr.sh_offset);
923 sym.st_value -= shdr.sh_addr - shdr.sh_offset;
926 * We need to figure out if the object was created from C++ sources
927 * DWARF DW_compile_unit has this, but we don't always have access
930 if (symbol_conf.demangle) {
931 demangled = bfd_demangle(NULL, elf_name,
932 DMGL_PARAMS | DMGL_ANSI);
933 if (demangled != NULL)
934 elf_name = demangled;
937 f = symbol__new(sym.st_value, sym.st_size,
938 GELF_ST_BIND(sym.st_info), elf_name);
943 if (filter && filter(curr_map, f))
946 symbols__insert(&curr_dso->symbols[curr_map->type], f);
952 * For misannotated, zeroed, ASM function sizes.
955 symbols__fixup_duplicate(&dso->symbols[map->type]);
956 symbols__fixup_end(&dso->symbols[map->type]);
959 * We need to fixup this here too because we create new
960 * maps here, for things like vsyscall sections.
962 __map_groups__fixup_end(kmap->kmaps, map->type);
/*
 * Call @mapfn for program headers of @elf.
 *
 * The header count comes from elf_getphdrnum(). Each header is fetched with
 * gelf_getphdr(), its p_type is compared with PT_LOAD, and its flags are
 * tested for PF_X and PF_R. The size passed on is min(p_memsz, p_filesz).
 * @mapfn receives (p_vaddr, sz, p_offset, data) and its result is stored in
 * err.
 *
 * NOTE(review): how @exe selects between the PF_X and PF_R tests, the action
 * on each failed test, and the return values are not visible in this
 * excerpt.
 */
970 static int elf_read_maps(Elf *elf, bool exe, mapfn_t mapfn, void *data)
977 if (elf_getphdrnum(elf, &phdrnum))
980 for (i = 0; i < phdrnum; i++) {
981 if (gelf_getphdr(elf, i, &phdr) == NULL)
983 if (phdr.p_type != PT_LOAD)
986 if (!(phdr.p_flags & PF_X))
989 if (!(phdr.p_flags & PF_R))
992 sz = min(phdr.p_memsz, phdr.p_filesz);
995 err = mapfn(phdr.p_vaddr, sz, phdr.p_offset, data);
/*
 * Create an Elf handle for the already-open descriptor @fd with
 * elf_begin(fd, PERF_ELF_C_READ_MMAP, NULL), store in *is_64_bit whether
 * the ELF class is ELFCLASS64, and delegate to elf_read_maps().
 * NOTE(review): the trailing parameter declaration, any NULL check around
 * the *is_64_bit store, the cleanup and the return values are not visible
 * in this excerpt.
 */
1002 int file__read_maps(int fd, bool exe, mapfn_t mapfn, void *data,
1008 elf = elf_begin(fd, PERF_ELF_C_READ_MMAP, NULL);
1013 *is_64_bit = (gelf_getclass(elf) == ELFCLASS64);
1015 err = elf_read_maps(elf, exe, mapfn, data);
/*
 * Initialize libelf by calling elf_version(EV_CURRENT). The return value is
 * not inspected on the visible line.
 */
1021 void symbol__elf_init(void)
1023 elf_version(EV_CURRENT);