session.c 17 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710
  1. #define _FILE_OFFSET_BITS 64
  2. #include <linux/kernel.h>
  3. #include <byteswap.h>
  4. #include <unistd.h>
  5. #include <sys/types.h>
  6. #include "session.h"
  7. #include "sort.h"
  8. #include "util.h"
  9. static int perf_session__open(struct perf_session *self, bool force)
  10. {
  11. struct stat input_stat;
  12. if (!strcmp(self->filename, "-")) {
  13. self->fd_pipe = true;
  14. self->fd = STDIN_FILENO;
  15. if (perf_header__read(self, self->fd) < 0)
  16. pr_err("incompatible file format");
  17. return 0;
  18. }
  19. self->fd = open(self->filename, O_RDONLY);
  20. if (self->fd < 0) {
  21. pr_err("failed to open file: %s", self->filename);
  22. if (!strcmp(self->filename, "perf.data"))
  23. pr_err(" (try 'perf record' first)");
  24. pr_err("\n");
  25. return -errno;
  26. }
  27. if (fstat(self->fd, &input_stat) < 0)
  28. goto out_close;
  29. if (!force && input_stat.st_uid && (input_stat.st_uid != geteuid())) {
  30. pr_err("file %s not owned by current user or root\n",
  31. self->filename);
  32. goto out_close;
  33. }
  34. if (!input_stat.st_size) {
  35. pr_info("zero-sized file (%s), nothing to do!\n",
  36. self->filename);
  37. goto out_close;
  38. }
  39. if (perf_header__read(self, self->fd) < 0) {
  40. pr_err("incompatible file format");
  41. goto out_close;
  42. }
  43. self->size = input_stat.st_size;
  44. return 0;
  45. out_close:
  46. close(self->fd);
  47. self->fd = -1;
  48. return -1;
  49. }
  50. void perf_session__update_sample_type(struct perf_session *self)
  51. {
  52. self->sample_type = perf_header__sample_type(&self->header);
  53. }
  54. struct perf_session *perf_session__new(const char *filename, int mode, bool force)
  55. {
  56. size_t len = filename ? strlen(filename) + 1 : 0;
  57. struct perf_session *self = zalloc(sizeof(*self) + len);
  58. if (self == NULL)
  59. goto out;
  60. if (perf_header__init(&self->header) < 0)
  61. goto out_free;
  62. memcpy(self->filename, filename, len);
  63. self->threads = RB_ROOT;
  64. self->stats_by_id = RB_ROOT;
  65. self->last_match = NULL;
  66. self->mmap_window = 32;
  67. self->cwd = NULL;
  68. self->cwdlen = 0;
  69. self->unknown_events = 0;
  70. map_groups__init(&self->kmaps);
  71. if (mode == O_RDONLY) {
  72. if (perf_session__open(self, force) < 0)
  73. goto out_delete;
  74. } else if (mode == O_WRONLY) {
  75. /*
  76. * In O_RDONLY mode this will be performed when reading the
  77. * kernel MMAP event, in event__process_mmap().
  78. */
  79. if (perf_session__create_kernel_maps(self) < 0)
  80. goto out_delete;
  81. }
  82. perf_session__update_sample_type(self);
  83. out:
  84. return self;
  85. out_free:
  86. free(self);
  87. return NULL;
  88. out_delete:
  89. perf_session__delete(self);
  90. return NULL;
  91. }
  92. void perf_session__delete(struct perf_session *self)
  93. {
  94. perf_header__exit(&self->header);
  95. close(self->fd);
  96. free(self->cwd);
  97. free(self);
  98. }
  99. static bool symbol__match_parent_regex(struct symbol *sym)
  100. {
  101. if (sym->name && !regexec(&parent_regex, sym->name, 0, NULL, 0))
  102. return 1;
  103. return 0;
  104. }
  105. struct map_symbol *perf_session__resolve_callchain(struct perf_session *self,
  106. struct thread *thread,
  107. struct ip_callchain *chain,
  108. struct symbol **parent)
  109. {
  110. u8 cpumode = PERF_RECORD_MISC_USER;
  111. unsigned int i;
  112. struct map_symbol *syms = calloc(chain->nr, sizeof(*syms));
  113. if (!syms)
  114. return NULL;
  115. for (i = 0; i < chain->nr; i++) {
  116. u64 ip = chain->ips[i];
  117. struct addr_location al;
  118. if (ip >= PERF_CONTEXT_MAX) {
  119. switch (ip) {
  120. case PERF_CONTEXT_HV:
  121. cpumode = PERF_RECORD_MISC_HYPERVISOR; break;
  122. case PERF_CONTEXT_KERNEL:
  123. cpumode = PERF_RECORD_MISC_KERNEL; break;
  124. case PERF_CONTEXT_USER:
  125. cpumode = PERF_RECORD_MISC_USER; break;
  126. default:
  127. break;
  128. }
  129. continue;
  130. }
  131. thread__find_addr_location(thread, self, cpumode,
  132. MAP__FUNCTION, ip, &al, NULL);
  133. if (al.sym != NULL) {
  134. if (sort__has_parent && !*parent &&
  135. symbol__match_parent_regex(al.sym))
  136. *parent = al.sym;
  137. if (!symbol_conf.use_callchain)
  138. break;
  139. syms[i].map = al.map;
  140. syms[i].sym = al.sym;
  141. }
  142. }
  143. return syms;
  144. }
  145. static int process_event_stub(event_t *event __used,
  146. struct perf_session *session __used)
  147. {
  148. dump_printf(": unhandled!\n");
  149. return 0;
  150. }
  151. static void perf_event_ops__fill_defaults(struct perf_event_ops *handler)
  152. {
  153. if (handler->sample == NULL)
  154. handler->sample = process_event_stub;
  155. if (handler->mmap == NULL)
  156. handler->mmap = process_event_stub;
  157. if (handler->comm == NULL)
  158. handler->comm = process_event_stub;
  159. if (handler->fork == NULL)
  160. handler->fork = process_event_stub;
  161. if (handler->exit == NULL)
  162. handler->exit = process_event_stub;
  163. if (handler->lost == NULL)
  164. handler->lost = process_event_stub;
  165. if (handler->read == NULL)
  166. handler->read = process_event_stub;
  167. if (handler->throttle == NULL)
  168. handler->throttle = process_event_stub;
  169. if (handler->unthrottle == NULL)
  170. handler->unthrottle = process_event_stub;
  171. if (handler->attr == NULL)
  172. handler->attr = process_event_stub;
  173. if (handler->event_type == NULL)
  174. handler->event_type = process_event_stub;
  175. if (handler->tracing_data == NULL)
  176. handler->tracing_data = process_event_stub;
  177. }
  178. static const char *event__name[] = {
  179. [0] = "TOTAL",
  180. [PERF_RECORD_MMAP] = "MMAP",
  181. [PERF_RECORD_LOST] = "LOST",
  182. [PERF_RECORD_COMM] = "COMM",
  183. [PERF_RECORD_EXIT] = "EXIT",
  184. [PERF_RECORD_THROTTLE] = "THROTTLE",
  185. [PERF_RECORD_UNTHROTTLE] = "UNTHROTTLE",
  186. [PERF_RECORD_FORK] = "FORK",
  187. [PERF_RECORD_READ] = "READ",
  188. [PERF_RECORD_SAMPLE] = "SAMPLE",
  189. [PERF_RECORD_HEADER_ATTR] = "ATTR",
  190. [PERF_RECORD_HEADER_EVENT_TYPE] = "EVENT_TYPE",
  191. [PERF_RECORD_HEADER_TRACING_DATA] = "TRACING_DATA",
  192. };
  193. unsigned long event__total[PERF_RECORD_HEADER_MAX];
  194. void event__print_totals(void)
  195. {
  196. int i;
  197. for (i = 0; i < PERF_RECORD_HEADER_MAX; ++i) {
  198. if (!event__name[i])
  199. continue;
  200. pr_info("%10s events: %10ld\n",
  201. event__name[i], event__total[i]);
  202. }
  203. }
  204. void mem_bswap_64(void *src, int byte_size)
  205. {
  206. u64 *m = src;
  207. while (byte_size > 0) {
  208. *m = bswap_64(*m);
  209. byte_size -= sizeof(u64);
  210. ++m;
  211. }
  212. }
  213. static void event__all64_swap(event_t *self)
  214. {
  215. struct perf_event_header *hdr = &self->header;
  216. mem_bswap_64(hdr + 1, self->header.size - sizeof(*hdr));
  217. }
  218. static void event__comm_swap(event_t *self)
  219. {
  220. self->comm.pid = bswap_32(self->comm.pid);
  221. self->comm.tid = bswap_32(self->comm.tid);
  222. }
  223. static void event__mmap_swap(event_t *self)
  224. {
  225. self->mmap.pid = bswap_32(self->mmap.pid);
  226. self->mmap.tid = bswap_32(self->mmap.tid);
  227. self->mmap.start = bswap_64(self->mmap.start);
  228. self->mmap.len = bswap_64(self->mmap.len);
  229. self->mmap.pgoff = bswap_64(self->mmap.pgoff);
  230. }
  231. static void event__task_swap(event_t *self)
  232. {
  233. self->fork.pid = bswap_32(self->fork.pid);
  234. self->fork.tid = bswap_32(self->fork.tid);
  235. self->fork.ppid = bswap_32(self->fork.ppid);
  236. self->fork.ptid = bswap_32(self->fork.ptid);
  237. self->fork.time = bswap_64(self->fork.time);
  238. }
  239. static void event__read_swap(event_t *self)
  240. {
  241. self->read.pid = bswap_32(self->read.pid);
  242. self->read.tid = bswap_32(self->read.tid);
  243. self->read.value = bswap_64(self->read.value);
  244. self->read.time_enabled = bswap_64(self->read.time_enabled);
  245. self->read.time_running = bswap_64(self->read.time_running);
  246. self->read.id = bswap_64(self->read.id);
  247. }
  248. static void event__attr_swap(event_t *self)
  249. {
  250. size_t size;
  251. self->attr.attr.type = bswap_32(self->attr.attr.type);
  252. self->attr.attr.size = bswap_32(self->attr.attr.size);
  253. self->attr.attr.config = bswap_64(self->attr.attr.config);
  254. self->attr.attr.sample_period = bswap_64(self->attr.attr.sample_period);
  255. self->attr.attr.sample_type = bswap_64(self->attr.attr.sample_type);
  256. self->attr.attr.read_format = bswap_64(self->attr.attr.read_format);
  257. self->attr.attr.wakeup_events = bswap_32(self->attr.attr.wakeup_events);
  258. self->attr.attr.bp_type = bswap_32(self->attr.attr.bp_type);
  259. self->attr.attr.bp_addr = bswap_64(self->attr.attr.bp_addr);
  260. self->attr.attr.bp_len = bswap_64(self->attr.attr.bp_len);
  261. size = self->header.size;
  262. size -= (void *)&self->attr.id - (void *)self;
  263. mem_bswap_64(self->attr.id, size);
  264. }
  265. static void event__event_type_swap(event_t *self)
  266. {
  267. self->event_type.event_type.event_id =
  268. bswap_64(self->event_type.event_type.event_id);
  269. }
  270. static void event__tracing_data_swap(event_t *self)
  271. {
  272. self->tracing_data.size = bswap_32(self->tracing_data.size);
  273. }
  274. typedef void (*event__swap_op)(event_t *self);
  275. static event__swap_op event__swap_ops[] = {
  276. [PERF_RECORD_MMAP] = event__mmap_swap,
  277. [PERF_RECORD_COMM] = event__comm_swap,
  278. [PERF_RECORD_FORK] = event__task_swap,
  279. [PERF_RECORD_EXIT] = event__task_swap,
  280. [PERF_RECORD_LOST] = event__all64_swap,
  281. [PERF_RECORD_READ] = event__read_swap,
  282. [PERF_RECORD_SAMPLE] = event__all64_swap,
  283. [PERF_RECORD_HEADER_ATTR] = event__attr_swap,
  284. [PERF_RECORD_HEADER_EVENT_TYPE] = event__event_type_swap,
  285. [PERF_RECORD_HEADER_TRACING_DATA] = event__tracing_data_swap,
  286. [PERF_RECORD_HEADER_MAX] = NULL,
  287. };
  288. static int perf_session__process_event(struct perf_session *self,
  289. event_t *event,
  290. struct perf_event_ops *ops,
  291. u64 offset, u64 head)
  292. {
  293. trace_event(event);
  294. if (event->header.type < PERF_RECORD_HEADER_MAX) {
  295. dump_printf("%#Lx [%#x]: PERF_RECORD_%s",
  296. offset + head, event->header.size,
  297. event__name[event->header.type]);
  298. ++event__total[0];
  299. ++event__total[event->header.type];
  300. }
  301. if (self->header.needs_swap && event__swap_ops[event->header.type])
  302. event__swap_ops[event->header.type](event);
  303. switch (event->header.type) {
  304. case PERF_RECORD_SAMPLE:
  305. return ops->sample(event, self);
  306. case PERF_RECORD_MMAP:
  307. return ops->mmap(event, self);
  308. case PERF_RECORD_COMM:
  309. return ops->comm(event, self);
  310. case PERF_RECORD_FORK:
  311. return ops->fork(event, self);
  312. case PERF_RECORD_EXIT:
  313. return ops->exit(event, self);
  314. case PERF_RECORD_LOST:
  315. return ops->lost(event, self);
  316. case PERF_RECORD_READ:
  317. return ops->read(event, self);
  318. case PERF_RECORD_THROTTLE:
  319. return ops->throttle(event, self);
  320. case PERF_RECORD_UNTHROTTLE:
  321. return ops->unthrottle(event, self);
  322. case PERF_RECORD_HEADER_ATTR:
  323. return ops->attr(event, self);
  324. case PERF_RECORD_HEADER_EVENT_TYPE:
  325. return ops->event_type(event, self);
  326. case PERF_RECORD_HEADER_TRACING_DATA:
  327. /* setup for reading amidst mmap */
  328. lseek(self->fd, offset + head, SEEK_SET);
  329. return ops->tracing_data(event, self);
  330. default:
  331. self->unknown_events++;
  332. return -1;
  333. }
  334. }
  335. void perf_event_header__bswap(struct perf_event_header *self)
  336. {
  337. self->type = bswap_32(self->type);
  338. self->misc = bswap_16(self->misc);
  339. self->size = bswap_16(self->size);
  340. }
  341. int perf_header__read_build_ids(struct perf_header *self,
  342. int input, u64 offset, u64 size)
  343. {
  344. struct build_id_event bev;
  345. char filename[PATH_MAX];
  346. u64 limit = offset + size;
  347. int err = -1;
  348. while (offset < limit) {
  349. struct dso *dso;
  350. ssize_t len;
  351. struct list_head *head = &dsos__user;
  352. if (read(input, &bev, sizeof(bev)) != sizeof(bev))
  353. goto out;
  354. if (self->needs_swap)
  355. perf_event_header__bswap(&bev.header);
  356. len = bev.header.size - sizeof(bev);
  357. if (read(input, filename, len) != len)
  358. goto out;
  359. if (bev.header.misc & PERF_RECORD_MISC_KERNEL)
  360. head = &dsos__kernel;
  361. dso = __dsos__findnew(head, filename);
  362. if (dso != NULL) {
  363. dso__set_build_id(dso, &bev.build_id);
  364. if (head == &dsos__kernel && filename[0] == '[')
  365. dso->kernel = 1;
  366. }
  367. offset += bev.header.size;
  368. }
  369. err = 0;
  370. out:
  371. return err;
  372. }
  373. static struct thread *perf_session__register_idle_thread(struct perf_session *self)
  374. {
  375. struct thread *thread = perf_session__findnew(self, 0);
  376. if (thread == NULL || thread__set_comm(thread, "swapper")) {
  377. pr_err("problem inserting idle task.\n");
  378. thread = NULL;
  379. }
  380. return thread;
  381. }
  382. int do_read(int fd, void *buf, size_t size)
  383. {
  384. void *buf_start = buf;
  385. while (size) {
  386. int ret = read(fd, buf, size);
  387. if (ret <= 0)
  388. return ret;
  389. size -= ret;
  390. buf += ret;
  391. }
  392. return buf - buf_start;
  393. }
  394. #define session_done() (*(volatile int *)(&session_done))
  395. volatile int session_done;
  396. static int __perf_session__process_pipe_events(struct perf_session *self,
  397. struct perf_event_ops *ops)
  398. {
  399. event_t event;
  400. uint32_t size;
  401. int skip = 0;
  402. u64 head;
  403. int err;
  404. void *p;
  405. perf_event_ops__fill_defaults(ops);
  406. head = 0;
  407. more:
  408. err = do_read(self->fd, &event, sizeof(struct perf_event_header));
  409. if (err <= 0) {
  410. if (err == 0)
  411. goto done;
  412. pr_err("failed to read event header\n");
  413. goto out_err;
  414. }
  415. if (self->header.needs_swap)
  416. perf_event_header__bswap(&event.header);
  417. size = event.header.size;
  418. if (size == 0)
  419. size = 8;
  420. p = &event;
  421. p += sizeof(struct perf_event_header);
  422. err = do_read(self->fd, p, size - sizeof(struct perf_event_header));
  423. if (err <= 0) {
  424. if (err == 0) {
  425. pr_err("unexpected end of event stream\n");
  426. goto done;
  427. }
  428. pr_err("failed to read event data\n");
  429. goto out_err;
  430. }
  431. if (size == 0 ||
  432. (skip = perf_session__process_event(self, &event, ops,
  433. 0, head)) < 0) {
  434. dump_printf("%#Lx [%#x]: skipping unknown header type: %d\n",
  435. head, event.header.size, event.header.type);
  436. /*
  437. * assume we lost track of the stream, check alignment, and
  438. * increment a single u64 in the hope to catch on again 'soon'.
  439. */
  440. if (unlikely(head & 7))
  441. head &= ~7ULL;
  442. size = 8;
  443. }
  444. head += size;
  445. dump_printf("\n%#Lx [%#x]: event: %d\n",
  446. head, event.header.size, event.header.type);
  447. if (skip > 0)
  448. head += skip;
  449. if (!session_done())
  450. goto more;
  451. done:
  452. err = 0;
  453. out_err:
  454. return err;
  455. }
  456. int __perf_session__process_events(struct perf_session *self,
  457. u64 data_offset, u64 data_size,
  458. u64 file_size, struct perf_event_ops *ops)
  459. {
  460. int err, mmap_prot, mmap_flags;
  461. u64 head, shift;
  462. u64 offset = 0;
  463. size_t page_size;
  464. event_t *event;
  465. uint32_t size;
  466. char *buf;
  467. struct ui_progress *progress = ui_progress__new("Processing events...",
  468. self->size);
  469. if (progress == NULL)
  470. return -1;
  471. perf_event_ops__fill_defaults(ops);
  472. page_size = sysconf(_SC_PAGESIZE);
  473. head = data_offset;
  474. shift = page_size * (head / page_size);
  475. offset += shift;
  476. head -= shift;
  477. mmap_prot = PROT_READ;
  478. mmap_flags = MAP_SHARED;
  479. if (self->header.needs_swap) {
  480. mmap_prot |= PROT_WRITE;
  481. mmap_flags = MAP_PRIVATE;
  482. }
  483. remap:
  484. buf = mmap(NULL, page_size * self->mmap_window, mmap_prot,
  485. mmap_flags, self->fd, offset);
  486. if (buf == MAP_FAILED) {
  487. pr_err("failed to mmap file\n");
  488. err = -errno;
  489. goto out_err;
  490. }
  491. more:
  492. event = (event_t *)(buf + head);
  493. ui_progress__update(progress, offset);
  494. if (self->header.needs_swap)
  495. perf_event_header__bswap(&event->header);
  496. size = event->header.size;
  497. if (size == 0)
  498. size = 8;
  499. if (head + event->header.size >= page_size * self->mmap_window) {
  500. int munmap_ret;
  501. shift = page_size * (head / page_size);
  502. munmap_ret = munmap(buf, page_size * self->mmap_window);
  503. assert(munmap_ret == 0);
  504. offset += shift;
  505. head -= shift;
  506. goto remap;
  507. }
  508. size = event->header.size;
  509. dump_printf("\n%#Lx [%#x]: event: %d\n",
  510. offset + head, event->header.size, event->header.type);
  511. if (size == 0 ||
  512. perf_session__process_event(self, event, ops, offset, head) < 0) {
  513. dump_printf("%#Lx [%#x]: skipping unknown header type: %d\n",
  514. offset + head, event->header.size,
  515. event->header.type);
  516. /*
  517. * assume we lost track of the stream, check alignment, and
  518. * increment a single u64 in the hope to catch on again 'soon'.
  519. */
  520. if (unlikely(head & 7))
  521. head &= ~7ULL;
  522. size = 8;
  523. }
  524. head += size;
  525. if (offset + head >= data_offset + data_size)
  526. goto done;
  527. if (offset + head < file_size)
  528. goto more;
  529. done:
  530. err = 0;
  531. out_err:
  532. ui_progress__delete(progress);
  533. return err;
  534. }
  535. int perf_session__process_events(struct perf_session *self,
  536. struct perf_event_ops *ops)
  537. {
  538. int err;
  539. if (perf_session__register_idle_thread(self) == NULL)
  540. return -ENOMEM;
  541. if (!symbol_conf.full_paths) {
  542. char bf[PATH_MAX];
  543. if (getcwd(bf, sizeof(bf)) == NULL) {
  544. err = -errno;
  545. out_getcwd_err:
  546. pr_err("failed to get the current directory\n");
  547. goto out_err;
  548. }
  549. self->cwd = strdup(bf);
  550. if (self->cwd == NULL) {
  551. err = -ENOMEM;
  552. goto out_getcwd_err;
  553. }
  554. self->cwdlen = strlen(self->cwd);
  555. }
  556. if (!self->fd_pipe)
  557. err = __perf_session__process_events(self,
  558. self->header.data_offset,
  559. self->header.data_size,
  560. self->size, ops);
  561. else
  562. err = __perf_session__process_pipe_events(self, ops);
  563. out_err:
  564. return err;
  565. }
  566. bool perf_session__has_traces(struct perf_session *self, const char *msg)
  567. {
  568. if (!(self->sample_type & PERF_SAMPLE_RAW)) {
  569. pr_err("No trace sample to read. Did you call 'perf %s'?\n", msg);
  570. return false;
  571. }
  572. return true;
  573. }
  574. int perf_session__set_kallsyms_ref_reloc_sym(struct perf_session *self,
  575. const char *symbol_name,
  576. u64 addr)
  577. {
  578. char *bracket;
  579. enum map_type i;
  580. self->ref_reloc_sym.name = strdup(symbol_name);
  581. if (self->ref_reloc_sym.name == NULL)
  582. return -ENOMEM;
  583. bracket = strchr(self->ref_reloc_sym.name, ']');
  584. if (bracket)
  585. *bracket = '\0';
  586. self->ref_reloc_sym.addr = addr;
  587. for (i = 0; i < MAP__NR_TYPES; ++i) {
  588. struct kmap *kmap = map__kmap(self->vmlinux_maps[i]);
  589. kmap->ref_reloc_sym = &self->ref_reloc_sym;
  590. }
  591. return 0;
  592. }