symbol.c 8.6 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450
  1. #include "util.h"
  2. #include "../perf.h"
  3. #include "symbol.h"
  4. #include <libelf.h>
  5. #include <gelf.h>
  6. #include <elf.h>
  7. static struct symbol *symbol__new(uint64_t start, uint64_t len,
  8. const char *name, unsigned int priv_size)
  9. {
  10. size_t namelen = strlen(name) + 1;
  11. struct symbol *self = malloc(priv_size + sizeof(*self) + namelen);
  12. if (self != NULL) {
  13. if (priv_size) {
  14. memset(self, 0, priv_size);
  15. self = ((void *)self) + priv_size;
  16. }
  17. self->start = start;
  18. self->end = start + len;
  19. memcpy(self->name, name, namelen);
  20. }
  21. return self;
  22. }
  /*
   * Release a symbol obtained from symbol__new().
   *
   * @priv_size must be the same value that was used at allocation time: the
   * allocation base lies priv_size bytes before @self, and that base is what
   * gets passed to free().
   */
  static void symbol__delete(struct symbol *self, unsigned int priv_size)
  {
      char *base = (char *)self - priv_size;

      free(base);
  }
  27. static size_t symbol__fprintf(struct symbol *self, FILE *fp)
  28. {
  29. return fprintf(fp, " %llx-%llx %s\n",
  30. self->start, self->end, self->name);
  31. }
  32. struct dso *dso__new(const char *name, unsigned int sym_priv_size)
  33. {
  34. struct dso *self = malloc(sizeof(*self) + strlen(name) + 1);
  35. if (self != NULL) {
  36. strcpy(self->name, name);
  37. self->syms = RB_ROOT;
  38. self->sym_priv_size = sym_priv_size;
  39. }
  40. return self;
  41. }
  42. static void dso__delete_symbols(struct dso *self)
  43. {
  44. struct symbol *pos;
  45. struct rb_node *next = rb_first(&self->syms);
  46. while (next) {
  47. pos = rb_entry(next, struct symbol, rb_node);
  48. next = rb_next(&pos->rb_node);
  49. symbol__delete(pos, self->sym_priv_size);
  50. }
  51. }
  /*
   * Destroy a dso: free all of its symbols, then the dso itself.
   *
   * A NULL @self is accepted and ignored, mirroring free() and the NULL
   * tolerance of dso__find_symbol().
   */
  void dso__delete(struct dso *self)
  {
      if (self == NULL)
          return;

      dso__delete_symbols(self);
      free(self);
  }
  57. static void dso__insert_symbol(struct dso *self, struct symbol *sym)
  58. {
  59. struct rb_node **p = &self->syms.rb_node;
  60. struct rb_node *parent = NULL;
  61. const uint64_t ip = sym->start;
  62. struct symbol *s;
  63. while (*p != NULL) {
  64. parent = *p;
  65. s = rb_entry(parent, struct symbol, rb_node);
  66. if (ip < s->start)
  67. p = &(*p)->rb_left;
  68. else
  69. p = &(*p)->rb_right;
  70. }
  71. rb_link_node(&sym->rb_node, parent, p);
  72. rb_insert_color(&sym->rb_node, &self->syms);
  73. }
  74. struct symbol *dso__find_symbol(struct dso *self, uint64_t ip)
  75. {
  76. struct rb_node *n;
  77. if (self == NULL)
  78. return NULL;
  79. n = self->syms.rb_node;
  80. while (n) {
  81. struct symbol *s = rb_entry(n, struct symbol, rb_node);
  82. if (ip < s->start)
  83. n = n->rb_left;
  84. else if (ip > s->end)
  85. n = n->rb_right;
  86. else
  87. return s;
  88. }
  89. return NULL;
  90. }
  91. size_t dso__fprintf(struct dso *self, FILE *fp)
  92. {
  93. size_t ret = fprintf(fp, "dso: %s\n", self->name);
  94. struct rb_node *nd;
  95. for (nd = rb_first(&self->syms); nd; nd = rb_next(nd)) {
  96. struct symbol *pos = rb_entry(nd, struct symbol, rb_node);
  97. ret += symbol__fprintf(pos, fp);
  98. }
  99. return ret;
  100. }
  /*
   * Convert one hexadecimal digit character to its numeric value.
   *
   * Accepts '0'-'9', 'a'-'f' and 'A'-'F'.
   * Returns 0..15 for a valid digit, -1 for any other character.
   */
  static int hex(char ch)
  {
      int digit = -1;

      if ('0' <= ch && ch <= '9')
          digit = ch - '0';
      else if ('a' <= ch && ch <= 'f')
          digit = 10 + (ch - 'a');
      else if ('A' <= ch && ch <= 'F')
          digit = 10 + (ch - 'A');

      return digit;
  }
  /*
   * Parse the leading run of hexadecimal digits in @ptr into *@long_val.
   *
   * Parsing stops at the first character that is not a hex digit or at the
   * end of the string.  *@long_val is set to 0 when there are no leading
   * digits.
   *
   * Returns the number of characters consumed.
   */
  static int hex2long(char *ptr, unsigned long *long_val)
  {
      const char *cursor;

      *long_val = 0;
      for (cursor = ptr; *cursor != '\0'; cursor++) {
          const int digit = hex(*cursor);

          if (digit < 0)
              break;
          /* Shift in the next nibble. */
          *long_val = (*long_val << 4) | digit;
      }

      return cursor - ptr;
  }
  128. static int dso__load_kallsyms(struct dso *self, symbol_filter_t filter)
  129. {
  130. struct rb_node *nd, *prevnd;
  131. char *line = NULL;
  132. size_t n;
  133. FILE *file = fopen("/proc/kallsyms", "r");
  134. if (file == NULL)
  135. goto out_failure;
  136. while (!feof(file)) {
  137. unsigned long start;
  138. struct symbol *sym;
  139. int line_len, len;
  140. char symbol_type;
  141. line_len = getline(&line, &n, file);
  142. if (line_len < 0)
  143. break;
  144. if (!line)
  145. goto out_failure;
  146. line[--line_len] = '\0'; /* \n */
  147. len = hex2long(line, &start);
  148. len++;
  149. if (len + 2 >= line_len)
  150. continue;
  151. symbol_type = toupper(line[len]);
  152. /*
  153. * We're interested only in code ('T'ext)
  154. */
  155. if (symbol_type != 'T' && symbol_type != 'W')
  156. continue;
  157. /*
  158. * Well fix up the end later, when we have all sorted.
  159. */
  160. sym = symbol__new(start, 0xdead, line + len + 2,
  161. self->sym_priv_size);
  162. if (sym == NULL)
  163. goto out_delete_line;
  164. if (filter && filter(self, sym))
  165. symbol__delete(sym, self->sym_priv_size);
  166. else
  167. dso__insert_symbol(self, sym);
  168. }
  169. /*
  170. * Now that we have all sorted out, just set the ->end of all
  171. * symbols
  172. */
  173. prevnd = rb_first(&self->syms);
  174. if (prevnd == NULL)
  175. goto out_delete_line;
  176. for (nd = rb_next(prevnd); nd; nd = rb_next(nd)) {
  177. struct symbol *prev = rb_entry(prevnd, struct symbol, rb_node),
  178. *curr = rb_entry(nd, struct symbol, rb_node);
  179. prev->end = curr->start - 1;
  180. prevnd = nd;
  181. }
  182. free(line);
  183. fclose(file);
  184. return 0;
  185. out_delete_line:
  186. free(line);
  187. out_failure:
  188. return -1;
  189. }
  /**
   * elf_symtab__for_each_symbol - iterate through all the symbols
   *
   * @syms: Elf_Data of the symbol table, as passed to gelf_getsym()
   * @nr_syms: number of entries to visit
   * @index: uint32_t index
   * @sym: GElf_Sym iterator, filled in by gelf_getsym() for each entry
   *
   * Note that the step expression fetches the next entry before the bound is
   * re-checked, so gelf_getsym() is also called once with @index equal to
   * @nr_syms when the loop terminates.
   */
  #define elf_symtab__for_each_symbol(syms, nr_syms, index, sym) \
      for ((index) = 0, gelf_getsym((syms), (index), &(sym)); \
           (index) < (nr_syms); \
           (index)++, gelf_getsym((syms), (index), &(sym)))
  201. static inline uint8_t elf_sym__type(const GElf_Sym *sym)
  202. {
  203. return GELF_ST_TYPE(sym->st_info);
  204. }
  205. static inline int elf_sym__is_function(const GElf_Sym *sym)
  206. {
  207. return elf_sym__type(sym) == STT_FUNC &&
  208. sym->st_name != 0 &&
  209. sym->st_shndx != SHN_UNDEF &&
  210. sym->st_size != 0;
  211. }
  212. static inline const char *elf_sym__name(const GElf_Sym *sym,
  213. const Elf_Data *symstrs)
  214. {
  215. return symstrs->d_buf + sym->st_name;
  216. }
  217. static Elf_Scn *elf_section_by_name(Elf *elf, GElf_Ehdr *ep,
  218. GElf_Shdr *shp, const char *name,
  219. size_t *index)
  220. {
  221. Elf_Scn *sec = NULL;
  222. size_t cnt = 1;
  223. while ((sec = elf_nextscn(elf, sec)) != NULL) {
  224. char *str;
  225. gelf_getshdr(sec, shp);
  226. str = elf_strptr(elf, ep->e_shstrndx, shp->sh_name);
  227. if (!strcmp(name, str)) {
  228. if (index)
  229. *index = cnt;
  230. break;
  231. }
  232. ++cnt;
  233. }
  234. return sec;
  235. }
  236. static int dso__load_sym(struct dso *self, int fd, const char *name,
  237. symbol_filter_t filter)
  238. {
  239. Elf_Data *symstrs;
  240. uint32_t nr_syms;
  241. int err = -1;
  242. uint32_t index;
  243. GElf_Ehdr ehdr;
  244. GElf_Shdr shdr;
  245. Elf_Data *syms;
  246. GElf_Sym sym;
  247. Elf_Scn *sec;
  248. Elf *elf;
  249. int nr = 0;
  250. elf = elf_begin(fd, ELF_C_READ_MMAP, NULL);
  251. if (elf == NULL) {
  252. fprintf(stderr, "%s: cannot read %s ELF file.\n",
  253. __func__, name);
  254. goto out_close;
  255. }
  256. if (gelf_getehdr(elf, &ehdr) == NULL) {
  257. fprintf(stderr, "%s: cannot get elf header.\n", __func__);
  258. goto out_elf_end;
  259. }
  260. sec = elf_section_by_name(elf, &ehdr, &shdr, ".symtab", NULL);
  261. if (sec == NULL)
  262. sec = elf_section_by_name(elf, &ehdr, &shdr, ".dynsym", NULL);
  263. if (sec == NULL)
  264. goto out_elf_end;
  265. syms = elf_getdata(sec, NULL);
  266. if (syms == NULL)
  267. goto out_elf_end;
  268. sec = elf_getscn(elf, shdr.sh_link);
  269. if (sec == NULL)
  270. goto out_elf_end;
  271. symstrs = elf_getdata(sec, NULL);
  272. if (symstrs == NULL)
  273. goto out_elf_end;
  274. nr_syms = shdr.sh_size / shdr.sh_entsize;
  275. elf_symtab__for_each_symbol(syms, nr_syms, index, sym) {
  276. struct symbol *f;
  277. if (!elf_sym__is_function(&sym))
  278. continue;
  279. sec = elf_getscn(elf, sym.st_shndx);
  280. if (!sec)
  281. goto out_elf_end;
  282. gelf_getshdr(sec, &shdr);
  283. sym.st_value -= shdr.sh_addr - shdr.sh_offset;
  284. f = symbol__new(sym.st_value, sym.st_size,
  285. elf_sym__name(&sym, symstrs),
  286. self->sym_priv_size);
  287. if (!f)
  288. goto out_elf_end;
  289. if (filter && filter(self, f))
  290. symbol__delete(f, self->sym_priv_size);
  291. else {
  292. dso__insert_symbol(self, f);
  293. nr++;
  294. }
  295. }
  296. err = nr;
  297. out_elf_end:
  298. elf_end(elf);
  299. out_close:
  300. return err;
  301. }
  302. int dso__load(struct dso *self, symbol_filter_t filter)
  303. {
  304. int size = strlen(self->name) + sizeof("/usr/lib/debug%s.debug");
  305. char *name = malloc(size);
  306. int variant = 0;
  307. int ret = -1;
  308. int fd;
  309. if (!name)
  310. return -1;
  311. more:
  312. do {
  313. switch (variant) {
  314. case 0: /* Fedora */
  315. snprintf(name, size, "/usr/lib/debug%s.debug", self->name);
  316. break;
  317. case 1: /* Ubuntu */
  318. snprintf(name, size, "/usr/lib/debug%s", self->name);
  319. break;
  320. case 2: /* Sane people */
  321. snprintf(name, size, "%s", self->name);
  322. break;
  323. default:
  324. goto out;
  325. }
  326. variant++;
  327. fd = open(name, O_RDONLY);
  328. } while (fd < 0);
  329. ret = dso__load_sym(self, fd, name, filter);
  330. close(fd);
  331. /*
  332. * Some people seem to have debuginfo files _WITHOUT_ debug info!?!?
  333. */
  334. if (!ret)
  335. goto more;
  336. out:
  337. free(name);
  338. return ret;
  339. }
  340. static int dso__load_vmlinux(struct dso *self, const char *vmlinux,
  341. symbol_filter_t filter)
  342. {
  343. int err, fd = open(vmlinux, O_RDONLY);
  344. if (fd < 0)
  345. return -1;
  346. err = dso__load_sym(self, fd, vmlinux, filter);
  347. close(fd);
  348. return err;
  349. }
  350. int dso__load_kernel(struct dso *self, const char *vmlinux, symbol_filter_t filter)
  351. {
  352. int err = -1;
  353. if (vmlinux)
  354. err = dso__load_vmlinux(self, vmlinux, filter);
  355. if (err)
  356. err = dso__load_kallsyms(self, filter);
  357. return err;
  358. }
  359. void symbol__init(void)
  360. {
  361. elf_version(EV_CURRENT);
  362. }