builtin-annotate.c 7.4 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309
  1. /*
  2. * builtin-annotate.c
  3. *
  4. * Builtin annotate command: Analyze the perf.data input file,
  5. * look up and read DSOs and symbol information and display
  6. * a histogram of results, along various sorting keys.
  7. */
  8. #include "builtin.h"
  9. #include "util/util.h"
  10. #include "util/color.h"
  11. #include <linux/list.h>
  12. #include "util/cache.h"
  13. #include <linux/rbtree.h>
  14. #include "util/symbol.h"
  15. #include "perf.h"
  16. #include "util/debug.h"
  17. #include "util/evlist.h"
  18. #include "util/evsel.h"
  19. #include "util/annotate.h"
  20. #include "util/event.h"
  21. #include "util/parse-options.h"
  22. #include "util/parse-events.h"
  23. #include "util/thread.h"
  24. #include "util/sort.h"
  25. #include "util/hist.h"
  26. #include "util/session.h"
  27. #include <linux/bitmap.h>
  /* Path of the perf data file to read; settable with -i/--input. */
  static const char *input_name = "perf.data";

  /* Handed to perf_session__new() when opening input_name (-f/--force). */
  static bool force;

  /* --tui / --stdio: consulted once in cmd_annotate() to pick use_browser. */
  static bool use_tui;
  static bool use_stdio;

  /* -P/--full-paths and -l/--print-line: forwarded to symbol__tty_annotate(). */
  static bool full_paths;
  static bool print_line;

  /* When non-NULL, only samples resolving to a symbol with this name are kept. */
  static const char *sym_hist_filter;

  /*
   * -c/--cpu: textual CPU list and the bitmap built from it by
   * perf_session__cpu_bitmap(); samples whose CPU bit is clear are skipped.
   */
  static const char *cpu_list;
  static DECLARE_BITMAP(cpu_bitmap, MAX_NR_CPUS);
  35. static int perf_evlist__add_sample(struct perf_evlist *evlist,
  36. struct perf_sample *sample,
  37. struct perf_evsel *evsel,
  38. struct addr_location *al)
  39. {
  40. struct hist_entry *he;
  41. int ret;
  42. if (sym_hist_filter != NULL &&
  43. (al->sym == NULL || strcmp(sym_hist_filter, al->sym->name) != 0)) {
  44. /* We're only interested in a symbol named sym_hist_filter */
  45. if (al->sym != NULL) {
  46. rb_erase(&al->sym->rb_node,
  47. &al->map->dso->symbols[al->map->type]);
  48. symbol__delete(al->sym);
  49. }
  50. return 0;
  51. }
  52. he = __hists__add_entry(&evsel->hists, al, NULL, 1);
  53. if (he == NULL)
  54. return -ENOMEM;
  55. ret = 0;
  56. if (he->ms.sym != NULL) {
  57. struct annotation *notes = symbol__annotation(he->ms.sym);
  58. if (notes->src == NULL &&
  59. symbol__alloc_hist(he->ms.sym, evlist->nr_entries) < 0)
  60. return -ENOMEM;
  61. ret = hist_entry__inc_addr_samples(he, evsel->idx, al->addr);
  62. }
  63. evsel->hists.stats.total_period += sample->period;
  64. hists__inc_nr_events(&evsel->hists, PERF_RECORD_SAMPLE);
  65. return ret;
  66. }
  67. static int process_sample_event(union perf_event *event,
  68. struct perf_sample *sample,
  69. struct perf_evsel *evsel,
  70. struct perf_session *session)
  71. {
  72. struct addr_location al;
  73. if (perf_event__preprocess_sample(event, session, &al, sample,
  74. symbol__annotate_init) < 0) {
  75. pr_warning("problem processing %d event, skipping it.\n",
  76. event->header.type);
  77. return -1;
  78. }
  79. if (cpu_list && !test_bit(sample->cpu, cpu_bitmap))
  80. return 0;
  81. if (!al.filtered &&
  82. perf_evlist__add_sample(session->evlist, sample, evsel, &al)) {
  83. pr_warning("problem incrementing symbol count, "
  84. "skipping event\n");
  85. return -1;
  86. }
  87. return 0;
  88. }
  89. static int hist_entry__tty_annotate(struct hist_entry *he, int evidx)
  90. {
  91. return symbol__tty_annotate(he->ms.sym, he->ms.map, evidx,
  92. print_line, full_paths, 0, 0);
  93. }
  94. static void hists__find_annotations(struct hists *self, int evidx)
  95. {
  96. struct rb_node *nd = rb_first(&self->entries), *next;
  97. int key = KEY_RIGHT;
  98. while (nd) {
  99. struct hist_entry *he = rb_entry(nd, struct hist_entry, rb_node);
  100. struct annotation *notes;
  101. if (he->ms.sym == NULL || he->ms.map->dso->annotate_warned)
  102. goto find_next;
  103. notes = symbol__annotation(he->ms.sym);
  104. if (notes->src == NULL) {
  105. find_next:
  106. if (key == KEY_LEFT)
  107. nd = rb_prev(nd);
  108. else
  109. nd = rb_next(nd);
  110. continue;
  111. }
  112. if (use_browser > 0) {
  113. key = hist_entry__tui_annotate(he, evidx);
  114. switch (key) {
  115. case KEY_RIGHT:
  116. next = rb_next(nd);
  117. break;
  118. case KEY_LEFT:
  119. next = rb_prev(nd);
  120. break;
  121. default:
  122. return;
  123. }
  124. if (next != NULL)
  125. nd = next;
  126. } else {
  127. hist_entry__tty_annotate(he, evidx);
  128. nd = rb_next(nd);
  129. /*
  130. * Since we have a hist_entry per IP for the same
  131. * symbol, free he->ms.sym->src to signal we already
  132. * processed this symbol.
  133. */
  134. free(notes->src);
  135. notes->src = NULL;
  136. }
  137. }
  138. }
  139. static struct perf_event_ops event_ops = {
  140. .sample = process_sample_event,
  141. .mmap = perf_event__process_mmap,
  142. .comm = perf_event__process_comm,
  143. .fork = perf_event__process_task,
  144. .ordered_samples = true,
  145. .ordering_requires_timestamps = true,
  146. };
  147. static int __cmd_annotate(void)
  148. {
  149. int ret;
  150. struct perf_session *session;
  151. struct perf_evsel *pos;
  152. u64 total_nr_samples;
  153. session = perf_session__new(input_name, O_RDONLY, force, false, &event_ops);
  154. if (session == NULL)
  155. return -ENOMEM;
  156. if (cpu_list) {
  157. ret = perf_session__cpu_bitmap(session, cpu_list, cpu_bitmap);
  158. if (ret)
  159. goto out_delete;
  160. }
  161. ret = perf_session__process_events(session, &event_ops);
  162. if (ret)
  163. goto out_delete;
  164. if (dump_trace) {
  165. perf_session__fprintf_nr_events(session, stdout);
  166. goto out_delete;
  167. }
  168. if (verbose > 3)
  169. perf_session__fprintf(session, stdout);
  170. if (verbose > 2)
  171. perf_session__fprintf_dsos(session, stdout);
  172. total_nr_samples = 0;
  173. list_for_each_entry(pos, &session->evlist->entries, node) {
  174. struct hists *hists = &pos->hists;
  175. u32 nr_samples = hists->stats.nr_events[PERF_RECORD_SAMPLE];
  176. if (nr_samples > 0) {
  177. total_nr_samples += nr_samples;
  178. hists__collapse_resort(hists);
  179. hists__output_resort(hists);
  180. hists__find_annotations(hists, pos->idx);
  181. }
  182. }
  183. if (total_nr_samples == 0) {
  184. ui__warning("The %s file has no samples!\n", input_name);
  185. goto out_delete;
  186. }
  187. out_delete:
  188. /*
  189. * Speed up the exit process, for large files this can
  190. * take quite a while.
  191. *
  192. * XXX Enable this when using valgrind or if we ever
  193. * librarize this command.
  194. *
  195. * Also experiment with obstacks to see how much speed
  196. * up we'll get here.
  197. *
  198. * perf_session__delete(session);
  199. */
  200. return ret;
  201. }
  /* NULL-terminated usage lines passed to parse_options() and usage_with_options(). */
  static const char * const annotate_usage[] = {
      "perf annotate [<options>] <command>",
      NULL,
  };
  206. static const struct option options[] = {
  207. OPT_STRING('i', "input", &input_name, "file",
  208. "input file name"),
  209. OPT_STRING('d', "dsos", &symbol_conf.dso_list_str, "dso[,dso...]",
  210. "only consider symbols in these dsos"),
  211. OPT_STRING('s', "symbol", &sym_hist_filter, "symbol",
  212. "symbol to annotate"),
  213. OPT_BOOLEAN('f', "force", &force, "don't complain, do it"),
  214. OPT_INCR('v', "verbose", &verbose,
  215. "be more verbose (show symbol address, etc)"),
  216. OPT_BOOLEAN('D', "dump-raw-trace", &dump_trace,
  217. "dump raw trace in ASCII"),
  218. OPT_BOOLEAN(0, "tui", &use_tui, "Use the TUI interface"),
  219. OPT_BOOLEAN(0, "stdio", &use_stdio, "Use the stdio interface"),
  220. OPT_STRING('k', "vmlinux", &symbol_conf.vmlinux_name,
  221. "file", "vmlinux pathname"),
  222. OPT_BOOLEAN('m', "modules", &symbol_conf.use_modules,
  223. "load module symbols - WARNING: use only with -k and LIVE kernel"),
  224. OPT_BOOLEAN('l', "print-line", &print_line,
  225. "print matching source lines (may be slow)"),
  226. OPT_BOOLEAN('P', "full-paths", &full_paths,
  227. "Don't shorten the displayed pathnames"),
  228. OPT_STRING('c', "cpu", &cpu_list, "cpu", "list of cpus to profile"),
  229. OPT_END()
  230. };
  231. int cmd_annotate(int argc, const char **argv, const char *prefix __used)
  232. {
  233. argc = parse_options(argc, argv, options, annotate_usage, 0);
  234. if (use_stdio)
  235. use_browser = 0;
  236. else if (use_tui)
  237. use_browser = 1;
  238. setup_browser(true);
  239. symbol_conf.priv_size = sizeof(struct annotation);
  240. symbol_conf.try_vmlinux_path = true;
  241. if (symbol__init() < 0)
  242. return -1;
  243. setup_sorting(annotate_usage, options);
  244. if (argc) {
  245. /*
  246. * Special case: if there's an argument left then assume tha
  247. * it's a symbol filter:
  248. */
  249. if (argc > 1)
  250. usage_with_options(annotate_usage, options);
  251. sym_hist_filter = argv[0];
  252. }
  253. if (field_sep && *field_sep == '.') {
  254. pr_err("'.' is the only non valid --field-separator argument\n");
  255. return -1;
  256. }
  257. return __cmd_annotate();
  258. }