Commit | Line | Data |
---|---|---|
a2928c42 ACM |
1 | #include "util.h" |
2 | #include "../perf.h" | |
a0055ae2 | 3 | #include "string.h" |
a2928c42 ACM |
4 | #include "symbol.h" |
5 | ||
8f28827a FW |
6 | #include "debug.h" |
7 | ||
a2928c42 ACM |
8 | #include <libelf.h> |
9 | #include <gelf.h> | |
10 | #include <elf.h> | |
2cdbc46d | 11 | |
0b73da3f IM |
/*
 * Name of the symbol to keep a histogram for: when a new symbol's name
 * equals this string, symbol__new() allocates its ->hist array.
 */
const char *sym_hist_filter;

/*
 * Where the symbols of a dso were obtained from.  The values double as
 * indices into the table in dso__symtab_origin() and dso__load() walks
 * them in increasing order starting at DSO__ORIG_FEDORA, so the order
 * of the enumerators is significant.
 */
enum dso_origin {
	DSO__ORIG_KERNEL    = 0,
	DSO__ORIG_JAVA_JIT  = 1,
	DSO__ORIG_FEDORA    = 2,
	DSO__ORIG_UBUNTU    = 3,
	DSO__ORIG_BUILDID   = 4,
	DSO__ORIG_DSO       = 5,
	DSO__ORIG_NOT_FOUND = 6,
};
23 | ||
9cffa8d5 | 24 | static struct symbol *symbol__new(u64 start, u64 len, |
0b73da3f | 25 | const char *name, unsigned int priv_size, |
83a0944f | 26 | u64 obj_start, int v) |
a2928c42 | 27 | { |
0085c954 | 28 | size_t namelen = strlen(name) + 1; |
0b73da3f | 29 | struct symbol *self = calloc(1, priv_size + sizeof(*self) + namelen); |
a2928c42 | 30 | |
0b73da3f IM |
31 | if (!self) |
32 | return NULL; | |
33 | ||
83a0944f | 34 | if (v >= 2) |
0b73da3f | 35 | printf("new symbol: %016Lx [%08lx]: %s, hist: %p, obj_start: %p\n", |
9cffa8d5 | 36 | (u64)start, (unsigned long)len, name, self->hist, (void *)(unsigned long)obj_start); |
0b73da3f IM |
37 | |
38 | self->obj_start= obj_start; | |
39 | self->hist = NULL; | |
40 | self->hist_sum = 0; | |
41 | ||
42 | if (sym_hist_filter && !strcmp(name, sym_hist_filter)) | |
9cffa8d5 | 43 | self->hist = calloc(sizeof(u64), len); |
0b73da3f IM |
44 | |
45 | if (priv_size) { | |
46 | memset(self, 0, priv_size); | |
47 | self = ((void *)self) + priv_size; | |
a2928c42 | 48 | } |
0b73da3f | 49 | self->start = start; |
6cfcc53e | 50 | self->end = len ? start + len - 1 : start; |
0b73da3f | 51 | memcpy(self->name, name, namelen); |
a2928c42 ACM |
52 | |
53 | return self; | |
54 | } | |
55 | ||
/*
 * Release a symbol obtained from symbol__new().  @priv_size must be the
 * value used at creation time: the allocation starts that many bytes in
 * front of @self.
 */
static void symbol__delete(struct symbol *self, unsigned int priv_size)
{
	char *alloc_base = (char *)self - priv_size;

	free(alloc_base);
}
60 | ||
61 | static size_t symbol__fprintf(struct symbol *self, FILE *fp) | |
62 | { | |
6cfcc53e MG |
63 | if (!self->module) |
64 | return fprintf(fp, " %llx-%llx %s\n", | |
a2928c42 | 65 | self->start, self->end, self->name); |
6cfcc53e MG |
66 | else |
67 | return fprintf(fp, " %llx-%llx %s \t[%s]\n", | |
68 | self->start, self->end, self->name, self->module->name); | |
a2928c42 ACM |
69 | } |
70 | ||
0085c954 | 71 | struct dso *dso__new(const char *name, unsigned int sym_priv_size) |
a2928c42 ACM |
72 | { |
73 | struct dso *self = malloc(sizeof(*self) + strlen(name) + 1); | |
74 | ||
75 | if (self != NULL) { | |
76 | strcpy(self->name, name); | |
77 | self->syms = RB_ROOT; | |
0085c954 | 78 | self->sym_priv_size = sym_priv_size; |
fc54db51 | 79 | self->find_symbol = dso__find_symbol; |
52d422de | 80 | self->slen_calculated = 0; |
94cb9e38 | 81 | self->origin = DSO__ORIG_NOT_FOUND; |
a2928c42 ACM |
82 | } |
83 | ||
84 | return self; | |
85 | } | |
86 | ||
87 | static void dso__delete_symbols(struct dso *self) | |
88 | { | |
89 | struct symbol *pos; | |
90 | struct rb_node *next = rb_first(&self->syms); | |
91 | ||
92 | while (next) { | |
93 | pos = rb_entry(next, struct symbol, rb_node); | |
94 | next = rb_next(&pos->rb_node); | |
c8c96525 | 95 | rb_erase(&pos->rb_node, &self->syms); |
0085c954 | 96 | symbol__delete(pos, self->sym_priv_size); |
a2928c42 ACM |
97 | } |
98 | } | |
99 | ||
/*
 * dso__delete - free a dso together with all of its symbols
 *
 * Like free(), a NULL @self is accepted and ignored so that error paths
 * can call this unconditionally.
 */
void dso__delete(struct dso *self)
{
	if (self == NULL)
		return;

	dso__delete_symbols(self);
	free(self);
}
105 | ||
106 | static void dso__insert_symbol(struct dso *self, struct symbol *sym) | |
107 | { | |
108 | struct rb_node **p = &self->syms.rb_node; | |
109 | struct rb_node *parent = NULL; | |
9cffa8d5 | 110 | const u64 ip = sym->start; |
a2928c42 ACM |
111 | struct symbol *s; |
112 | ||
113 | while (*p != NULL) { | |
114 | parent = *p; | |
115 | s = rb_entry(parent, struct symbol, rb_node); | |
116 | if (ip < s->start) | |
117 | p = &(*p)->rb_left; | |
118 | else | |
119 | p = &(*p)->rb_right; | |
120 | } | |
121 | rb_link_node(&sym->rb_node, parent, p); | |
122 | rb_insert_color(&sym->rb_node, &self->syms); | |
123 | } | |
124 | ||
9cffa8d5 | 125 | struct symbol *dso__find_symbol(struct dso *self, u64 ip) |
a2928c42 ACM |
126 | { |
127 | struct rb_node *n; | |
128 | ||
129 | if (self == NULL) | |
130 | return NULL; | |
131 | ||
132 | n = self->syms.rb_node; | |
133 | ||
134 | while (n) { | |
135 | struct symbol *s = rb_entry(n, struct symbol, rb_node); | |
136 | ||
137 | if (ip < s->start) | |
138 | n = n->rb_left; | |
139 | else if (ip > s->end) | |
140 | n = n->rb_right; | |
141 | else | |
142 | return s; | |
143 | } | |
144 | ||
145 | return NULL; | |
146 | } | |
147 | ||
148 | size_t dso__fprintf(struct dso *self, FILE *fp) | |
149 | { | |
150 | size_t ret = fprintf(fp, "dso: %s\n", self->name); | |
151 | ||
152 | struct rb_node *nd; | |
153 | for (nd = rb_first(&self->syms); nd; nd = rb_next(nd)) { | |
154 | struct symbol *pos = rb_entry(nd, struct symbol, rb_node); | |
155 | ret += symbol__fprintf(pos, fp); | |
156 | } | |
157 | ||
158 | return ret; | |
159 | } | |
160 | ||
83a0944f | 161 | static int dso__load_kallsyms(struct dso *self, symbol_filter_t filter, int v) |
a2928c42 ACM |
162 | { |
163 | struct rb_node *nd, *prevnd; | |
164 | char *line = NULL; | |
165 | size_t n; | |
166 | FILE *file = fopen("/proc/kallsyms", "r"); | |
9974f496 | 167 | int count = 0; |
a2928c42 ACM |
168 | |
169 | if (file == NULL) | |
170 | goto out_failure; | |
171 | ||
172 | while (!feof(file)) { | |
9cffa8d5 | 173 | u64 start; |
a2928c42 ACM |
174 | struct symbol *sym; |
175 | int line_len, len; | |
176 | char symbol_type; | |
177 | ||
178 | line_len = getline(&line, &n, file); | |
179 | if (line_len < 0) | |
180 | break; | |
181 | ||
182 | if (!line) | |
183 | goto out_failure; | |
184 | ||
185 | line[--line_len] = '\0'; /* \n */ | |
186 | ||
a0055ae2 | 187 | len = hex2u64(line, &start); |
a2928c42 ACM |
188 | |
189 | len++; | |
190 | if (len + 2 >= line_len) | |
191 | continue; | |
192 | ||
193 | symbol_type = toupper(line[len]); | |
194 | /* | |
195 | * We're interested only in code ('T'ext) | |
196 | */ | |
197 | if (symbol_type != 'T' && symbol_type != 'W') | |
198 | continue; | |
199 | /* | |
200 | * Well fix up the end later, when we have all sorted. | |
201 | */ | |
0085c954 | 202 | sym = symbol__new(start, 0xdead, line + len + 2, |
83a0944f | 203 | self->sym_priv_size, 0, v); |
a2928c42 ACM |
204 | |
205 | if (sym == NULL) | |
206 | goto out_delete_line; | |
207 | ||
69ee69f6 ACM |
208 | if (filter && filter(self, sym)) |
209 | symbol__delete(sym, self->sym_priv_size); | |
9974f496 | 210 | else { |
69ee69f6 | 211 | dso__insert_symbol(self, sym); |
9974f496 MG |
212 | count++; |
213 | } | |
a2928c42 ACM |
214 | } |
215 | ||
216 | /* | |
217 | * Now that we have all sorted out, just set the ->end of all | |
218 | * symbols | |
219 | */ | |
220 | prevnd = rb_first(&self->syms); | |
221 | ||
222 | if (prevnd == NULL) | |
223 | goto out_delete_line; | |
224 | ||
225 | for (nd = rb_next(prevnd); nd; nd = rb_next(nd)) { | |
226 | struct symbol *prev = rb_entry(prevnd, struct symbol, rb_node), | |
227 | *curr = rb_entry(nd, struct symbol, rb_node); | |
228 | ||
229 | prev->end = curr->start - 1; | |
230 | prevnd = nd; | |
231 | } | |
232 | ||
233 | free(line); | |
234 | fclose(file); | |
235 | ||
9974f496 | 236 | return count; |
a2928c42 ACM |
237 | |
238 | out_delete_line: | |
239 | free(line); | |
240 | out_failure: | |
241 | return -1; | |
242 | } | |
243 | ||
83a0944f | 244 | static int dso__load_perf_map(struct dso *self, symbol_filter_t filter, int v) |
80d496be PE |
245 | { |
246 | char *line = NULL; | |
247 | size_t n; | |
248 | FILE *file; | |
249 | int nr_syms = 0; | |
250 | ||
251 | file = fopen(self->name, "r"); | |
252 | if (file == NULL) | |
253 | goto out_failure; | |
254 | ||
255 | while (!feof(file)) { | |
9cffa8d5 | 256 | u64 start, size; |
80d496be PE |
257 | struct symbol *sym; |
258 | int line_len, len; | |
259 | ||
260 | line_len = getline(&line, &n, file); | |
261 | if (line_len < 0) | |
262 | break; | |
263 | ||
264 | if (!line) | |
265 | goto out_failure; | |
266 | ||
267 | line[--line_len] = '\0'; /* \n */ | |
268 | ||
269 | len = hex2u64(line, &start); | |
270 | ||
271 | len++; | |
272 | if (len + 2 >= line_len) | |
273 | continue; | |
274 | ||
275 | len += hex2u64(line + len, &size); | |
276 | ||
277 | len++; | |
278 | if (len + 2 >= line_len) | |
279 | continue; | |
280 | ||
281 | sym = symbol__new(start, size, line + len, | |
83a0944f | 282 | self->sym_priv_size, start, v); |
80d496be PE |
283 | |
284 | if (sym == NULL) | |
285 | goto out_delete_line; | |
286 | ||
287 | if (filter && filter(self, sym)) | |
288 | symbol__delete(sym, self->sym_priv_size); | |
289 | else { | |
290 | dso__insert_symbol(self, sym); | |
291 | nr_syms++; | |
292 | } | |
293 | } | |
294 | ||
295 | free(line); | |
296 | fclose(file); | |
297 | ||
298 | return nr_syms; | |
299 | ||
300 | out_delete_line: | |
301 | free(line); | |
302 | out_failure: | |
303 | return -1; | |
304 | } | |
305 | ||
a2928c42 ACM |
/**
 * elf_symtab__for_each_symbol - iterate thru all the symbols
 *
 * @syms: Elf_Data of the symbol table to iterate
 * @nr_syms: number of entries in @syms
 * @idx: uint32_t idx
 * @sym: GElf_Sym iterator, filled in by gelf_getsym() for each index
 *
 * Note that gelf_getsym() is also invoked once with @idx == @nr_syms
 * before the loop condition ends the iteration.
 */
#define elf_symtab__for_each_symbol(syms, nr_syms, idx, sym) \
	for ((idx) = 0, gelf_getsym((syms), (idx), &(sym)); \
	     (idx) < (nr_syms); \
	     (idx)++, gelf_getsym((syms), (idx), &(sym)))
a2928c42 ACM |
317 | |
318 | static inline uint8_t elf_sym__type(const GElf_Sym *sym) | |
319 | { | |
320 | return GELF_ST_TYPE(sym->st_info); | |
321 | } | |
322 | ||
323 | static inline int elf_sym__is_function(const GElf_Sym *sym) | |
324 | { | |
325 | return elf_sym__type(sym) == STT_FUNC && | |
326 | sym->st_name != 0 && | |
327 | sym->st_shndx != SHN_UNDEF && | |
328 | sym->st_size != 0; | |
329 | } | |
330 | ||
6cfcc53e MG |
331 | static inline int elf_sym__is_label(const GElf_Sym *sym) |
332 | { | |
333 | return elf_sym__type(sym) == STT_NOTYPE && | |
334 | sym->st_name != 0 && | |
335 | sym->st_shndx != SHN_UNDEF && | |
336 | sym->st_shndx != SHN_ABS; | |
337 | } | |
338 | ||
339 | static inline const char *elf_sec__name(const GElf_Shdr *shdr, | |
340 | const Elf_Data *secstrs) | |
341 | { | |
342 | return secstrs->d_buf + shdr->sh_name; | |
343 | } | |
344 | ||
345 | static inline int elf_sec__is_text(const GElf_Shdr *shdr, | |
346 | const Elf_Data *secstrs) | |
347 | { | |
348 | return strstr(elf_sec__name(shdr, secstrs), "text") != NULL; | |
349 | } | |
350 | ||
a2928c42 ACM |
351 | static inline const char *elf_sym__name(const GElf_Sym *sym, |
352 | const Elf_Data *symstrs) | |
353 | { | |
354 | return symstrs->d_buf + sym->st_name; | |
355 | } | |
356 | ||
357 | static Elf_Scn *elf_section_by_name(Elf *elf, GElf_Ehdr *ep, | |
358 | GElf_Shdr *shp, const char *name, | |
83a0944f | 359 | size_t *idx) |
a2928c42 ACM |
360 | { |
361 | Elf_Scn *sec = NULL; | |
362 | size_t cnt = 1; | |
363 | ||
364 | while ((sec = elf_nextscn(elf, sec)) != NULL) { | |
365 | char *str; | |
366 | ||
367 | gelf_getshdr(sec, shp); | |
368 | str = elf_strptr(elf, ep->e_shstrndx, shp->sh_name); | |
369 | if (!strcmp(name, str)) { | |
83a0944f IM |
370 | if (idx) |
371 | *idx = cnt; | |
a2928c42 ACM |
372 | break; |
373 | } | |
374 | ++cnt; | |
375 | } | |
376 | ||
377 | return sec; | |
378 | } | |
379 | ||
8ce998d6 ACM |
/*
 * Iterate over the @nr_entries relocations in @reldata.
 *
 * @pos is set to the result of gelf_getrel()/gelf_getrela() for the entry
 * at @idx, using @pos_mem as storage.  The getter is also called once with
 * @idx == @nr_entries before the loop condition terminates the walk.
 */
#define elf_section__for_each_rel(reldata, pos, pos_mem, idx, nr_entries) \
	for ((idx) = 0, (pos) = gelf_getrel((reldata), 0, &(pos_mem)); \
	     (idx) < (nr_entries); \
	     ++(idx), (pos) = gelf_getrel((reldata), (idx), &(pos_mem)))

#define elf_section__for_each_rela(reldata, pos, pos_mem, idx, nr_entries) \
	for ((idx) = 0, (pos) = gelf_getrela((reldata), 0, &(pos_mem)); \
	     (idx) < (nr_entries); \
	     ++(idx), (pos) = gelf_getrela((reldata), (idx), &(pos_mem)))
389 | ||
a25e46c4 ACM |
390 | /* |
391 | * We need to check if we have a .dynsym, so that we can handle the | |
392 | * .plt, synthesizing its symbols, that aren't on the symtabs (be it | |
393 | * .dynsym or .symtab). | |
394 | * And always look at the original dso, not at debuginfo packages, that | |
395 | * have the PLT data stripped out (shdr_rel_plt.sh_type == SHT_NOBITS). | |
396 | */ | |
83a0944f | 397 | static int dso__synthesize_plt_symbols(struct dso *self, int v) |
8ce998d6 ACM |
398 | { |
399 | uint32_t nr_rel_entries, idx; | |
400 | GElf_Sym sym; | |
9cffa8d5 | 401 | u64 plt_offset; |
8ce998d6 ACM |
402 | GElf_Shdr shdr_plt; |
403 | struct symbol *f; | |
a25e46c4 | 404 | GElf_Shdr shdr_rel_plt, shdr_dynsym; |
8ce998d6 | 405 | Elf_Data *reldata, *syms, *symstrs; |
a25e46c4 ACM |
406 | Elf_Scn *scn_plt_rel, *scn_symstrs, *scn_dynsym; |
407 | size_t dynsym_idx; | |
408 | GElf_Ehdr ehdr; | |
8ce998d6 | 409 | char sympltname[1024]; |
a25e46c4 ACM |
410 | Elf *elf; |
411 | int nr = 0, symidx, fd, err = 0; | |
412 | ||
413 | fd = open(self->name, O_RDONLY); | |
414 | if (fd < 0) | |
415 | goto out; | |
416 | ||
417 | elf = elf_begin(fd, ELF_C_READ_MMAP, NULL); | |
418 | if (elf == NULL) | |
419 | goto out_close; | |
420 | ||
421 | if (gelf_getehdr(elf, &ehdr) == NULL) | |
422 | goto out_elf_end; | |
423 | ||
424 | scn_dynsym = elf_section_by_name(elf, &ehdr, &shdr_dynsym, | |
425 | ".dynsym", &dynsym_idx); | |
426 | if (scn_dynsym == NULL) | |
427 | goto out_elf_end; | |
8ce998d6 | 428 | |
a25e46c4 | 429 | scn_plt_rel = elf_section_by_name(elf, &ehdr, &shdr_rel_plt, |
8ce998d6 ACM |
430 | ".rela.plt", NULL); |
431 | if (scn_plt_rel == NULL) { | |
a25e46c4 | 432 | scn_plt_rel = elf_section_by_name(elf, &ehdr, &shdr_rel_plt, |
8ce998d6 ACM |
433 | ".rel.plt", NULL); |
434 | if (scn_plt_rel == NULL) | |
a25e46c4 | 435 | goto out_elf_end; |
8ce998d6 ACM |
436 | } |
437 | ||
a25e46c4 ACM |
438 | err = -1; |
439 | ||
8ce998d6 | 440 | if (shdr_rel_plt.sh_link != dynsym_idx) |
a25e46c4 | 441 | goto out_elf_end; |
8ce998d6 | 442 | |
a25e46c4 ACM |
443 | if (elf_section_by_name(elf, &ehdr, &shdr_plt, ".plt", NULL) == NULL) |
444 | goto out_elf_end; | |
8ce998d6 ACM |
445 | |
446 | /* | |
83a0944f | 447 | * Fetch the relocation section to find the idxes to the GOT |
8ce998d6 ACM |
448 | * and the symbols in the .dynsym they refer to. |
449 | */ | |
450 | reldata = elf_getdata(scn_plt_rel, NULL); | |
451 | if (reldata == NULL) | |
a25e46c4 | 452 | goto out_elf_end; |
8ce998d6 ACM |
453 | |
454 | syms = elf_getdata(scn_dynsym, NULL); | |
455 | if (syms == NULL) | |
a25e46c4 | 456 | goto out_elf_end; |
8ce998d6 | 457 | |
a25e46c4 | 458 | scn_symstrs = elf_getscn(elf, shdr_dynsym.sh_link); |
8ce998d6 | 459 | if (scn_symstrs == NULL) |
a25e46c4 | 460 | goto out_elf_end; |
8ce998d6 ACM |
461 | |
462 | symstrs = elf_getdata(scn_symstrs, NULL); | |
463 | if (symstrs == NULL) | |
a25e46c4 | 464 | goto out_elf_end; |
8ce998d6 ACM |
465 | |
466 | nr_rel_entries = shdr_rel_plt.sh_size / shdr_rel_plt.sh_entsize; | |
467 | plt_offset = shdr_plt.sh_offset; | |
468 | ||
469 | if (shdr_rel_plt.sh_type == SHT_RELA) { | |
470 | GElf_Rela pos_mem, *pos; | |
471 | ||
472 | elf_section__for_each_rela(reldata, pos, pos_mem, idx, | |
473 | nr_rel_entries) { | |
474 | symidx = GELF_R_SYM(pos->r_info); | |
475 | plt_offset += shdr_plt.sh_entsize; | |
476 | gelf_getsym(syms, symidx, &sym); | |
477 | snprintf(sympltname, sizeof(sympltname), | |
478 | "%s@plt", elf_sym__name(&sym, symstrs)); | |
479 | ||
480 | f = symbol__new(plt_offset, shdr_plt.sh_entsize, | |
83a0944f | 481 | sympltname, self->sym_priv_size, 0, v); |
8ce998d6 | 482 | if (!f) |
a25e46c4 | 483 | goto out_elf_end; |
8ce998d6 ACM |
484 | |
485 | dso__insert_symbol(self, f); | |
486 | ++nr; | |
487 | } | |
488 | } else if (shdr_rel_plt.sh_type == SHT_REL) { | |
489 | GElf_Rel pos_mem, *pos; | |
490 | elf_section__for_each_rel(reldata, pos, pos_mem, idx, | |
491 | nr_rel_entries) { | |
492 | symidx = GELF_R_SYM(pos->r_info); | |
493 | plt_offset += shdr_plt.sh_entsize; | |
494 | gelf_getsym(syms, symidx, &sym); | |
495 | snprintf(sympltname, sizeof(sympltname), | |
496 | "%s@plt", elf_sym__name(&sym, symstrs)); | |
497 | ||
498 | f = symbol__new(plt_offset, shdr_plt.sh_entsize, | |
83a0944f | 499 | sympltname, self->sym_priv_size, 0, v); |
8ce998d6 | 500 | if (!f) |
a25e46c4 | 501 | goto out_elf_end; |
8ce998d6 ACM |
502 | |
503 | dso__insert_symbol(self, f); | |
504 | ++nr; | |
505 | } | |
8ce998d6 ACM |
506 | } |
507 | ||
a25e46c4 ACM |
508 | err = 0; |
509 | out_elf_end: | |
510 | elf_end(elf); | |
511 | out_close: | |
512 | close(fd); | |
513 | ||
514 | if (err == 0) | |
515 | return nr; | |
516 | out: | |
517 | fprintf(stderr, "%s: problems reading %s PLT info.\n", | |
518 | __func__, self->name); | |
519 | return 0; | |
8ce998d6 ACM |
520 | } |
521 | ||
69ee69f6 | 522 | static int dso__load_sym(struct dso *self, int fd, const char *name, |
83a0944f | 523 | symbol_filter_t filter, int v, struct module *mod) |
a2928c42 | 524 | { |
6cfcc53e | 525 | Elf_Data *symstrs, *secstrs; |
a2928c42 ACM |
526 | uint32_t nr_syms; |
527 | int err = -1; | |
83a0944f | 528 | uint32_t idx; |
a2928c42 ACM |
529 | GElf_Ehdr ehdr; |
530 | GElf_Shdr shdr; | |
531 | Elf_Data *syms; | |
532 | GElf_Sym sym; | |
a25e46c4 | 533 | Elf_Scn *sec, *sec_strndx; |
a2928c42 | 534 | Elf *elf; |
d20ff6bd | 535 | int nr = 0, kernel = !strcmp("[kernel]", self->name); |
a2928c42 ACM |
536 | |
537 | elf = elf_begin(fd, ELF_C_READ_MMAP, NULL); | |
538 | if (elf == NULL) { | |
83a0944f | 539 | if (v) |
bd74137e IM |
540 | fprintf(stderr, "%s: cannot read %s ELF file.\n", |
541 | __func__, name); | |
a2928c42 ACM |
542 | goto out_close; |
543 | } | |
544 | ||
545 | if (gelf_getehdr(elf, &ehdr) == NULL) { | |
83a0944f | 546 | if (v) |
bd74137e | 547 | fprintf(stderr, "%s: cannot get elf header.\n", __func__); |
a2928c42 ACM |
548 | goto out_elf_end; |
549 | } | |
550 | ||
551 | sec = elf_section_by_name(elf, &ehdr, &shdr, ".symtab", NULL); | |
8ce998d6 | 552 | if (sec == NULL) { |
a25e46c4 ACM |
553 | sec = elf_section_by_name(elf, &ehdr, &shdr, ".dynsym", NULL); |
554 | if (sec == NULL) | |
8ce998d6 | 555 | goto out_elf_end; |
8ce998d6 | 556 | } |
a2928c42 ACM |
557 | |
558 | syms = elf_getdata(sec, NULL); | |
559 | if (syms == NULL) | |
560 | goto out_elf_end; | |
561 | ||
562 | sec = elf_getscn(elf, shdr.sh_link); | |
563 | if (sec == NULL) | |
564 | goto out_elf_end; | |
565 | ||
566 | symstrs = elf_getdata(sec, NULL); | |
567 | if (symstrs == NULL) | |
568 | goto out_elf_end; | |
569 | ||
6cfcc53e MG |
570 | sec_strndx = elf_getscn(elf, ehdr.e_shstrndx); |
571 | if (sec_strndx == NULL) | |
572 | goto out_elf_end; | |
573 | ||
574 | secstrs = elf_getdata(sec_strndx, NULL); | |
9b30a26b | 575 | if (secstrs == NULL) |
6cfcc53e MG |
576 | goto out_elf_end; |
577 | ||
a2928c42 ACM |
578 | nr_syms = shdr.sh_size / shdr.sh_entsize; |
579 | ||
e9fbc9dc | 580 | memset(&sym, 0, sizeof(sym)); |
d20ff6bd MG |
581 | if (!kernel) { |
582 | self->adjust_symbols = (ehdr.e_type == ET_EXEC || | |
30d7a77d ACM |
583 | elf_section_by_name(elf, &ehdr, &shdr, |
584 | ".gnu.prelink_undo", | |
585 | NULL) != NULL); | |
d20ff6bd MG |
586 | } else self->adjust_symbols = 0; |
587 | ||
83a0944f | 588 | elf_symtab__for_each_symbol(syms, nr_syms, idx, sym) { |
a2928c42 | 589 | struct symbol *f; |
83a0944f | 590 | const char *elf_name; |
28ac909b | 591 | char *demangled; |
9cffa8d5 | 592 | u64 obj_start; |
6cfcc53e MG |
593 | struct section *section = NULL; |
594 | int is_label = elf_sym__is_label(&sym); | |
595 | const char *section_name; | |
a2928c42 | 596 | |
6cfcc53e | 597 | if (!is_label && !elf_sym__is_function(&sym)) |
a2928c42 ACM |
598 | continue; |
599 | ||
600 | sec = elf_getscn(elf, sym.st_shndx); | |
601 | if (!sec) | |
602 | goto out_elf_end; | |
603 | ||
604 | gelf_getshdr(sec, &shdr); | |
6cfcc53e MG |
605 | |
606 | if (is_label && !elf_sec__is_text(&shdr, secstrs)) | |
607 | continue; | |
608 | ||
609 | section_name = elf_sec__name(&shdr, secstrs); | |
0b73da3f IM |
610 | obj_start = sym.st_value; |
611 | ||
30d7a77d | 612 | if (self->adjust_symbols) { |
83a0944f | 613 | if (v >= 2) |
f5812a7a ACM |
614 | printf("adjusting symbol: st_value: %Lx sh_addr: %Lx sh_offset: %Lx\n", |
615 | (u64)sym.st_value, (u64)shdr.sh_addr, (u64)shdr.sh_offset); | |
520f2c34 | 616 | |
f5812a7a ACM |
617 | sym.st_value -= shdr.sh_addr - shdr.sh_offset; |
618 | } | |
a2928c42 | 619 | |
6cfcc53e MG |
620 | if (mod) { |
621 | section = mod->sections->find_section(mod->sections, section_name); | |
622 | if (section) | |
623 | sym.st_value += section->vma; | |
624 | else { | |
625 | fprintf(stderr, "dso__load_sym() module %s lookup of %s failed\n", | |
626 | mod->name, section_name); | |
627 | goto out_elf_end; | |
628 | } | |
629 | } | |
28ac909b ACM |
630 | /* |
631 | * We need to figure out if the object was created from C++ sources | |
632 | * DWARF DW_compile_unit has this, but we don't always have access | |
633 | * to it... | |
634 | */ | |
83a0944f IM |
635 | elf_name = elf_sym__name(&sym, symstrs); |
636 | demangled = bfd_demangle(NULL, elf_name, DMGL_PARAMS | DMGL_ANSI); | |
28ac909b | 637 | if (demangled != NULL) |
83a0944f | 638 | elf_name = demangled; |
6cfcc53e | 639 | |
83a0944f IM |
640 | f = symbol__new(sym.st_value, sym.st_size, elf_name, |
641 | self->sym_priv_size, obj_start, v); | |
28ac909b | 642 | free(demangled); |
a2928c42 ACM |
643 | if (!f) |
644 | goto out_elf_end; | |
645 | ||
69ee69f6 ACM |
646 | if (filter && filter(self, f)) |
647 | symbol__delete(f, self->sym_priv_size); | |
648 | else { | |
6cfcc53e | 649 | f->module = mod; |
69ee69f6 ACM |
650 | dso__insert_symbol(self, f); |
651 | nr++; | |
652 | } | |
a2928c42 ACM |
653 | } |
654 | ||
655 | err = nr; | |
656 | out_elf_end: | |
657 | elf_end(elf); | |
658 | out_close: | |
659 | return err; | |
660 | } | |
661 | ||
4d1e00a8 ACM |
662 | #define BUILD_ID_SIZE 128 |
663 | ||
83a0944f | 664 | static char *dso__read_build_id(struct dso *self, int v) |
4d1e00a8 ACM |
665 | { |
666 | int i; | |
667 | GElf_Ehdr ehdr; | |
668 | GElf_Shdr shdr; | |
669 | Elf_Data *build_id_data; | |
670 | Elf_Scn *sec; | |
671 | char *build_id = NULL, *bid; | |
672 | unsigned char *raw; | |
673 | Elf *elf; | |
674 | int fd = open(self->name, O_RDONLY); | |
675 | ||
676 | if (fd < 0) | |
677 | goto out; | |
678 | ||
679 | elf = elf_begin(fd, ELF_C_READ_MMAP, NULL); | |
680 | if (elf == NULL) { | |
83a0944f | 681 | if (v) |
4d1e00a8 ACM |
682 | fprintf(stderr, "%s: cannot read %s ELF file.\n", |
683 | __func__, self->name); | |
684 | goto out_close; | |
685 | } | |
686 | ||
687 | if (gelf_getehdr(elf, &ehdr) == NULL) { | |
83a0944f | 688 | if (v) |
4d1e00a8 ACM |
689 | fprintf(stderr, "%s: cannot get elf header.\n", __func__); |
690 | goto out_elf_end; | |
691 | } | |
692 | ||
693 | sec = elf_section_by_name(elf, &ehdr, &shdr, ".note.gnu.build-id", NULL); | |
694 | if (sec == NULL) | |
695 | goto out_elf_end; | |
696 | ||
697 | build_id_data = elf_getdata(sec, NULL); | |
698 | if (build_id_data == NULL) | |
699 | goto out_elf_end; | |
700 | build_id = malloc(BUILD_ID_SIZE); | |
701 | if (build_id == NULL) | |
702 | goto out_elf_end; | |
703 | raw = build_id_data->d_buf + 16; | |
704 | bid = build_id; | |
705 | ||
706 | for (i = 0; i < 20; ++i) { | |
707 | sprintf(bid, "%02x", *raw); | |
708 | ++raw; | |
709 | bid += 2; | |
710 | } | |
83a0944f | 711 | if (v >= 2) |
4d1e00a8 ACM |
712 | printf("%s(%s): %s\n", __func__, self->name, build_id); |
713 | out_elf_end: | |
714 | elf_end(elf); | |
715 | out_close: | |
716 | close(fd); | |
717 | out: | |
718 | return build_id; | |
719 | } | |
720 | ||
94cb9e38 ACM |
721 | char dso__symtab_origin(const struct dso *self) |
722 | { | |
723 | static const char origin[] = { | |
724 | [DSO__ORIG_KERNEL] = 'k', | |
725 | [DSO__ORIG_JAVA_JIT] = 'j', | |
726 | [DSO__ORIG_FEDORA] = 'f', | |
727 | [DSO__ORIG_UBUNTU] = 'u', | |
728 | [DSO__ORIG_BUILDID] = 'b', | |
729 | [DSO__ORIG_DSO] = 'd', | |
730 | }; | |
731 | ||
732 | if (self == NULL || self->origin == DSO__ORIG_NOT_FOUND) | |
733 | return '!'; | |
734 | return origin[self->origin]; | |
735 | } | |
736 | ||
83a0944f | 737 | int dso__load(struct dso *self, symbol_filter_t filter, int v) |
a2928c42 | 738 | { |
4d1e00a8 ACM |
739 | int size = PATH_MAX; |
740 | char *name = malloc(size), *build_id = NULL; | |
a2928c42 ACM |
741 | int ret = -1; |
742 | int fd; | |
743 | ||
744 | if (!name) | |
745 | return -1; | |
746 | ||
30d7a77d | 747 | self->adjust_symbols = 0; |
f5812a7a | 748 | |
94cb9e38 | 749 | if (strncmp(self->name, "/tmp/perf-", 10) == 0) { |
83a0944f | 750 | ret = dso__load_perf_map(self, filter, v); |
94cb9e38 ACM |
751 | self->origin = ret > 0 ? DSO__ORIG_JAVA_JIT : |
752 | DSO__ORIG_NOT_FOUND; | |
753 | return ret; | |
754 | } | |
755 | ||
756 | self->origin = DSO__ORIG_FEDORA - 1; | |
80d496be | 757 | |
a2928c42 ACM |
758 | more: |
759 | do { | |
94cb9e38 ACM |
760 | self->origin++; |
761 | switch (self->origin) { | |
762 | case DSO__ORIG_FEDORA: | |
a2928c42 ACM |
763 | snprintf(name, size, "/usr/lib/debug%s.debug", self->name); |
764 | break; | |
94cb9e38 | 765 | case DSO__ORIG_UBUNTU: |
a2928c42 ACM |
766 | snprintf(name, size, "/usr/lib/debug%s", self->name); |
767 | break; | |
94cb9e38 | 768 | case DSO__ORIG_BUILDID: |
83a0944f | 769 | build_id = dso__read_build_id(self, v); |
4d1e00a8 ACM |
770 | if (build_id != NULL) { |
771 | snprintf(name, size, | |
772 | "/usr/lib/debug/.build-id/%.2s/%s.debug", | |
773 | build_id, build_id + 2); | |
774 | free(build_id); | |
775 | break; | |
776 | } | |
94cb9e38 | 777 | self->origin++; |
4d1e00a8 | 778 | /* Fall thru */ |
94cb9e38 | 779 | case DSO__ORIG_DSO: |
a2928c42 ACM |
780 | snprintf(name, size, "%s", self->name); |
781 | break; | |
782 | ||
783 | default: | |
784 | goto out; | |
785 | } | |
a2928c42 ACM |
786 | |
787 | fd = open(name, O_RDONLY); | |
788 | } while (fd < 0); | |
789 | ||
83a0944f | 790 | ret = dso__load_sym(self, fd, name, filter, v, NULL); |
a2928c42 ACM |
791 | close(fd); |
792 | ||
793 | /* | |
794 | * Some people seem to have debuginfo files _WITHOUT_ debug info!?!? | |
795 | */ | |
796 | if (!ret) | |
797 | goto more; | |
798 | ||
a25e46c4 | 799 | if (ret > 0) { |
83a0944f | 800 | int nr_plt = dso__synthesize_plt_symbols(self, v); |
a25e46c4 ACM |
801 | if (nr_plt > 0) |
802 | ret += nr_plt; | |
803 | } | |
a2928c42 ACM |
804 | out: |
805 | free(name); | |
1340e6bb ACM |
806 | if (ret < 0 && strstr(self->name, " (deleted)") != NULL) |
807 | return 0; | |
a2928c42 ACM |
808 | return ret; |
809 | } | |
810 | ||
6cfcc53e | 811 | static int dso__load_module(struct dso *self, struct mod_dso *mods, const char *name, |
83a0944f | 812 | symbol_filter_t filter, int v) |
6cfcc53e MG |
813 | { |
814 | struct module *mod = mod_dso__find_module(mods, name); | |
815 | int err = 0, fd; | |
816 | ||
817 | if (mod == NULL || !mod->active) | |
818 | return err; | |
819 | ||
820 | fd = open(mod->path, O_RDONLY); | |
821 | ||
822 | if (fd < 0) | |
823 | return err; | |
824 | ||
83a0944f | 825 | err = dso__load_sym(self, fd, name, filter, v, mod); |
6cfcc53e MG |
826 | close(fd); |
827 | ||
828 | return err; | |
829 | } | |
830 | ||
83a0944f | 831 | int dso__load_modules(struct dso *self, symbol_filter_t filter, int v) |
6cfcc53e MG |
832 | { |
833 | struct mod_dso *mods = mod_dso__new_dso("modules"); | |
834 | struct module *pos; | |
835 | struct rb_node *next; | |
836 | int err; | |
837 | ||
838 | err = mod_dso__load_modules(mods); | |
839 | ||
840 | if (err <= 0) | |
841 | return err; | |
842 | ||
843 | /* | |
844 | * Iterate over modules, and load active symbols. | |
845 | */ | |
846 | next = rb_first(&mods->mods); | |
847 | while (next) { | |
848 | pos = rb_entry(next, struct module, rb_node); | |
83a0944f | 849 | err = dso__load_module(self, mods, pos->name, filter, v); |
6cfcc53e MG |
850 | |
851 | if (err < 0) | |
852 | break; | |
853 | ||
854 | next = rb_next(&pos->rb_node); | |
855 | } | |
856 | ||
857 | if (err < 0) { | |
858 | mod_dso__delete_modules(mods); | |
859 | mod_dso__delete_self(mods); | |
860 | } | |
861 | ||
862 | return err; | |
863 | } | |
864 | ||
865 | static inline void dso__fill_symbol_holes(struct dso *self) | |
866 | { | |
867 | struct symbol *prev = NULL; | |
868 | struct rb_node *nd; | |
869 | ||
870 | for (nd = rb_last(&self->syms); nd; nd = rb_prev(nd)) { | |
871 | struct symbol *pos = rb_entry(nd, struct symbol, rb_node); | |
872 | ||
873 | if (prev) { | |
874 | u64 hole = 0; | |
875 | int alias = pos->start == prev->start; | |
876 | ||
877 | if (!alias) | |
878 | hole = prev->start - pos->end - 1; | |
879 | ||
880 | if (hole || alias) { | |
881 | if (alias) | |
882 | pos->end = prev->end; | |
883 | else if (hole) | |
884 | pos->end = prev->start - 1; | |
885 | } | |
886 | } | |
887 | prev = pos; | |
888 | } | |
889 | } | |
890 | ||
69ee69f6 | 891 | static int dso__load_vmlinux(struct dso *self, const char *vmlinux, |
83a0944f | 892 | symbol_filter_t filter, int v) |
a2928c42 ACM |
893 | { |
894 | int err, fd = open(vmlinux, O_RDONLY); | |
895 | ||
896 | if (fd < 0) | |
897 | return -1; | |
898 | ||
83a0944f | 899 | err = dso__load_sym(self, fd, vmlinux, filter, v, NULL); |
6cfcc53e MG |
900 | |
901 | if (err > 0) | |
902 | dso__fill_symbol_holes(self); | |
903 | ||
a2928c42 ACM |
904 | close(fd); |
905 | ||
906 | return err; | |
907 | } | |
908 | ||
bd74137e | 909 | int dso__load_kernel(struct dso *self, const char *vmlinux, |
83a0944f | 910 | symbol_filter_t filter, int v, int use_modules) |
a827c875 ACM |
911 | { |
912 | int err = -1; | |
913 | ||
6cfcc53e | 914 | if (vmlinux) { |
83a0944f IM |
915 | err = dso__load_vmlinux(self, vmlinux, filter, v); |
916 | if (err > 0 && use_modules) | |
917 | err = dso__load_modules(self, filter, v); | |
6cfcc53e | 918 | } |
a827c875 | 919 | |
9974f496 | 920 | if (err <= 0) |
83a0944f | 921 | err = dso__load_kallsyms(self, filter, v); |
a827c875 | 922 | |
94cb9e38 ACM |
923 | if (err > 0) |
924 | self->origin = DSO__ORIG_KERNEL; | |
925 | ||
a827c875 ACM |
926 | return err; |
927 | } | |
928 | ||
cd84c2ac FW |
/* All registered dsos; dsos__add() appends to the tail. */
LIST_HEAD(dsos);

/* Special dsos, set up by load_kernel(). */
struct dso *kernel_dso;
struct dso *vdso;
struct dso *hypervisor_dso;

/* vmlinux image that load_kernel() hands to dso__load_kernel(). */
const char *vmlinux_name = "vmlinux";

/* Passed by load_kernel() as the use_modules flag of dso__load_kernel(). */
int modules;
936 | ||
937 | static void dsos__add(struct dso *dso) | |
938 | { | |
939 | list_add_tail(&dso->node, &dsos); | |
940 | } | |
941 | ||
942 | static struct dso *dsos__find(const char *name) | |
943 | { | |
944 | struct dso *pos; | |
945 | ||
946 | list_for_each_entry(pos, &dsos, node) | |
947 | if (strcmp(pos->name, name) == 0) | |
948 | return pos; | |
949 | return NULL; | |
950 | } | |
951 | ||
952 | struct dso *dsos__findnew(const char *name) | |
953 | { | |
954 | struct dso *dso = dsos__find(name); | |
955 | int nr; | |
956 | ||
957 | if (dso) | |
958 | return dso; | |
959 | ||
960 | dso = dso__new(name, 0); | |
961 | if (!dso) | |
962 | goto out_delete_dso; | |
963 | ||
964 | nr = dso__load(dso, NULL, verbose); | |
965 | if (nr < 0) { | |
966 | eprintf("Failed to open: %s\n", name); | |
967 | goto out_delete_dso; | |
968 | } | |
969 | if (!nr) | |
970 | eprintf("No symbols found in: %s, maybe install a debug package?\n", name); | |
971 | ||
972 | dsos__add(dso); | |
973 | ||
974 | return dso; | |
975 | ||
976 | out_delete_dso: | |
977 | dso__delete(dso); | |
978 | return NULL; | |
979 | } | |
980 | ||
981 | void dsos__fprintf(FILE *fp) | |
982 | { | |
983 | struct dso *pos; | |
984 | ||
985 | list_for_each_entry(pos, &dsos, node) | |
986 | dso__fprintf(pos, fp); | |
987 | } | |
988 | ||
989 | static struct symbol *vdso__find_symbol(struct dso *dso, u64 ip) | |
990 | { | |
991 | return dso__find_symbol(dso, ip); | |
992 | } | |
993 | ||
994 | int load_kernel(void) | |
995 | { | |
996 | int err; | |
997 | ||
998 | kernel_dso = dso__new("[kernel]", 0); | |
999 | if (!kernel_dso) | |
1000 | return -1; | |
1001 | ||
83a0944f | 1002 | err = dso__load_kernel(kernel_dso, vmlinux_name, NULL, verbose, modules); |
cd84c2ac FW |
1003 | if (err <= 0) { |
1004 | dso__delete(kernel_dso); | |
1005 | kernel_dso = NULL; | |
1006 | } else | |
1007 | dsos__add(kernel_dso); | |
1008 | ||
1009 | vdso = dso__new("[vdso]", 0); | |
1010 | if (!vdso) | |
1011 | return -1; | |
1012 | ||
1013 | vdso->find_symbol = vdso__find_symbol; | |
1014 | ||
1015 | dsos__add(vdso); | |
1016 | ||
1017 | hypervisor_dso = dso__new("[hypervisor]", 0); | |
1018 | if (!hypervisor_dso) | |
1019 | return -1; | |
1020 | dsos__add(hypervisor_dso); | |
1021 | ||
1022 | return err; | |
1023 | } | |
1024 | ||
1025 | ||
a2928c42 ACM |
1026 | void symbol__init(void) |
1027 | { | |
1028 | elf_version(EV_CURRENT); | |
1029 | } |