session.c 16 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685
  #define _FILE_OFFSET_BITS 64
  #include <linux/kernel.h>
  #include <byteswap.h>
  #include <stdint.h>
  #include <unistd.h>
  #include <sys/types.h>
  #include "session.h"
  #include "sort.h"
  #include "util.h"
  9. static int perf_session__open(struct perf_session *self, bool force)
  10. {
  11. struct stat input_stat;
  12. if (!strcmp(self->filename, "-")) {
  13. self->fd_pipe = true;
  14. self->fd = STDIN_FILENO;
  15. if (perf_header__read(self, self->fd) < 0)
  16. pr_err("incompatible file format");
  17. return 0;
  18. }
  19. self->fd = open(self->filename, O_RDONLY);
  20. if (self->fd < 0) {
  21. pr_err("failed to open file: %s", self->filename);
  22. if (!strcmp(self->filename, "perf.data"))
  23. pr_err(" (try 'perf record' first)");
  24. pr_err("\n");
  25. return -errno;
  26. }
  27. if (fstat(self->fd, &input_stat) < 0)
  28. goto out_close;
  29. if (!force && input_stat.st_uid && (input_stat.st_uid != geteuid())) {
  30. pr_err("file %s not owned by current user or root\n",
  31. self->filename);
  32. goto out_close;
  33. }
  34. if (!input_stat.st_size) {
  35. pr_info("zero-sized file (%s), nothing to do!\n",
  36. self->filename);
  37. goto out_close;
  38. }
  39. if (perf_header__read(self, self->fd) < 0) {
  40. pr_err("incompatible file format");
  41. goto out_close;
  42. }
  43. self->size = input_stat.st_size;
  44. return 0;
  45. out_close:
  46. close(self->fd);
  47. self->fd = -1;
  48. return -1;
  49. }
  50. void perf_session__update_sample_type(struct perf_session *self)
  51. {
  52. self->sample_type = perf_header__sample_type(&self->header);
  53. }
  54. struct perf_session *perf_session__new(const char *filename, int mode, bool force)
  55. {
  56. size_t len = filename ? strlen(filename) + 1 : 0;
  57. struct perf_session *self = zalloc(sizeof(*self) + len);
  58. if (self == NULL)
  59. goto out;
  60. if (perf_header__init(&self->header) < 0)
  61. goto out_free;
  62. memcpy(self->filename, filename, len);
  63. self->threads = RB_ROOT;
  64. self->stats_by_id = RB_ROOT;
  65. self->last_match = NULL;
  66. self->mmap_window = 32;
  67. self->cwd = NULL;
  68. self->cwdlen = 0;
  69. self->unknown_events = 0;
  70. map_groups__init(&self->kmaps);
  71. if (mode == O_RDONLY) {
  72. if (perf_session__open(self, force) < 0)
  73. goto out_delete;
  74. } else if (mode == O_WRONLY) {
  75. /*
  76. * In O_RDONLY mode this will be performed when reading the
  77. * kernel MMAP event, in event__process_mmap().
  78. */
  79. if (perf_session__create_kernel_maps(self) < 0)
  80. goto out_delete;
  81. }
  82. perf_session__update_sample_type(self);
  83. out:
  84. return self;
  85. out_free:
  86. free(self);
  87. return NULL;
  88. out_delete:
  89. perf_session__delete(self);
  90. return NULL;
  91. }
  92. void perf_session__delete(struct perf_session *self)
  93. {
  94. perf_header__exit(&self->header);
  95. close(self->fd);
  96. free(self->cwd);
  97. free(self);
  98. }
  99. static bool symbol__match_parent_regex(struct symbol *sym)
  100. {
  101. if (sym->name && !regexec(&parent_regex, sym->name, 0, NULL, 0))
  102. return 1;
  103. return 0;
  104. }
  105. struct map_symbol *perf_session__resolve_callchain(struct perf_session *self,
  106. struct thread *thread,
  107. struct ip_callchain *chain,
  108. struct symbol **parent)
  109. {
  110. u8 cpumode = PERF_RECORD_MISC_USER;
  111. unsigned int i;
  112. struct map_symbol *syms = calloc(chain->nr, sizeof(*syms));
  113. if (!syms)
  114. return NULL;
  115. for (i = 0; i < chain->nr; i++) {
  116. u64 ip = chain->ips[i];
  117. struct addr_location al;
  118. if (ip >= PERF_CONTEXT_MAX) {
  119. switch (ip) {
  120. case PERF_CONTEXT_HV:
  121. cpumode = PERF_RECORD_MISC_HYPERVISOR; break;
  122. case PERF_CONTEXT_KERNEL:
  123. cpumode = PERF_RECORD_MISC_KERNEL; break;
  124. case PERF_CONTEXT_USER:
  125. cpumode = PERF_RECORD_MISC_USER; break;
  126. default:
  127. break;
  128. }
  129. continue;
  130. }
  131. thread__find_addr_location(thread, self, cpumode,
  132. MAP__FUNCTION, ip, &al, NULL);
  133. if (al.sym != NULL) {
  134. if (sort__has_parent && !*parent &&
  135. symbol__match_parent_regex(al.sym))
  136. *parent = al.sym;
  137. if (!symbol_conf.use_callchain)
  138. break;
  139. syms[i].map = al.map;
  140. syms[i].sym = al.sym;
  141. }
  142. }
  143. return syms;
  144. }
  145. static int process_event_stub(event_t *event __used,
  146. struct perf_session *session __used)
  147. {
  148. dump_printf(": unhandled!\n");
  149. return 0;
  150. }
  151. static void perf_event_ops__fill_defaults(struct perf_event_ops *handler)
  152. {
  153. if (handler->sample == NULL)
  154. handler->sample = process_event_stub;
  155. if (handler->mmap == NULL)
  156. handler->mmap = process_event_stub;
  157. if (handler->comm == NULL)
  158. handler->comm = process_event_stub;
  159. if (handler->fork == NULL)
  160. handler->fork = process_event_stub;
  161. if (handler->exit == NULL)
  162. handler->exit = process_event_stub;
  163. if (handler->lost == NULL)
  164. handler->lost = process_event_stub;
  165. if (handler->read == NULL)
  166. handler->read = process_event_stub;
  167. if (handler->throttle == NULL)
  168. handler->throttle = process_event_stub;
  169. if (handler->unthrottle == NULL)
  170. handler->unthrottle = process_event_stub;
  171. if (handler->attr == NULL)
  172. handler->attr = process_event_stub;
  173. }
  174. static const char *event__name[] = {
  175. [0] = "TOTAL",
  176. [PERF_RECORD_MMAP] = "MMAP",
  177. [PERF_RECORD_LOST] = "LOST",
  178. [PERF_RECORD_COMM] = "COMM",
  179. [PERF_RECORD_EXIT] = "EXIT",
  180. [PERF_RECORD_THROTTLE] = "THROTTLE",
  181. [PERF_RECORD_UNTHROTTLE] = "UNTHROTTLE",
  182. [PERF_RECORD_FORK] = "FORK",
  183. [PERF_RECORD_READ] = "READ",
  184. [PERF_RECORD_SAMPLE] = "SAMPLE",
  185. [PERF_RECORD_HEADER_ATTR] = "ATTR",
  186. };
  187. unsigned long event__total[PERF_RECORD_HEADER_MAX];
  188. void event__print_totals(void)
  189. {
  190. int i;
  191. for (i = 0; i < PERF_RECORD_HEADER_MAX; ++i) {
  192. if (!event__name[i])
  193. continue;
  194. pr_info("%10s events: %10ld\n",
  195. event__name[i], event__total[i]);
  196. }
  197. }
  /*
   * Byte-swap, in place, every complete 64-bit word in the first
   * @byte_size bytes at @src.
   *
   * Only whole words are touched: if @byte_size is not a multiple of 8 the
   * trailing bytes are left as they are instead of being swapped together
   * with whatever lies past the end of the buffer.  A zero or negative
   * @byte_size does nothing.
   */
  void mem_bswap_64(void *src, int byte_size)
  {
      uint64_t *word = src;
      size_t nr_words;

      if (byte_size <= 0)
          return;

      nr_words = (size_t)byte_size / sizeof(*word);
      while (nr_words--) {
          *word = bswap_64(*word);
          ++word;
      }
  }
  207. static void event__all64_swap(event_t *self)
  208. {
  209. struct perf_event_header *hdr = &self->header;
  210. mem_bswap_64(hdr + 1, self->header.size - sizeof(*hdr));
  211. }
  212. static void event__comm_swap(event_t *self)
  213. {
  214. self->comm.pid = bswap_32(self->comm.pid);
  215. self->comm.tid = bswap_32(self->comm.tid);
  216. }
  217. static void event__mmap_swap(event_t *self)
  218. {
  219. self->mmap.pid = bswap_32(self->mmap.pid);
  220. self->mmap.tid = bswap_32(self->mmap.tid);
  221. self->mmap.start = bswap_64(self->mmap.start);
  222. self->mmap.len = bswap_64(self->mmap.len);
  223. self->mmap.pgoff = bswap_64(self->mmap.pgoff);
  224. }
  225. static void event__task_swap(event_t *self)
  226. {
  227. self->fork.pid = bswap_32(self->fork.pid);
  228. self->fork.tid = bswap_32(self->fork.tid);
  229. self->fork.ppid = bswap_32(self->fork.ppid);
  230. self->fork.ptid = bswap_32(self->fork.ptid);
  231. self->fork.time = bswap_64(self->fork.time);
  232. }
  233. static void event__read_swap(event_t *self)
  234. {
  235. self->read.pid = bswap_32(self->read.pid);
  236. self->read.tid = bswap_32(self->read.tid);
  237. self->read.value = bswap_64(self->read.value);
  238. self->read.time_enabled = bswap_64(self->read.time_enabled);
  239. self->read.time_running = bswap_64(self->read.time_running);
  240. self->read.id = bswap_64(self->read.id);
  241. }
  242. static void event__attr_swap(event_t *self)
  243. {
  244. size_t size;
  245. self->attr.attr.type = bswap_32(self->attr.attr.type);
  246. self->attr.attr.size = bswap_32(self->attr.attr.size);
  247. self->attr.attr.config = bswap_64(self->attr.attr.config);
  248. self->attr.attr.sample_period = bswap_64(self->attr.attr.sample_period);
  249. self->attr.attr.sample_type = bswap_64(self->attr.attr.sample_type);
  250. self->attr.attr.read_format = bswap_64(self->attr.attr.read_format);
  251. self->attr.attr.wakeup_events = bswap_32(self->attr.attr.wakeup_events);
  252. self->attr.attr.bp_type = bswap_32(self->attr.attr.bp_type);
  253. self->attr.attr.bp_addr = bswap_64(self->attr.attr.bp_addr);
  254. self->attr.attr.bp_len = bswap_64(self->attr.attr.bp_len);
  255. size = self->header.size;
  256. size -= (void *)&self->attr.id - (void *)self;
  257. mem_bswap_64(self->attr.id, size);
  258. }
  259. typedef void (*event__swap_op)(event_t *self);
  260. static event__swap_op event__swap_ops[] = {
  261. [PERF_RECORD_MMAP] = event__mmap_swap,
  262. [PERF_RECORD_COMM] = event__comm_swap,
  263. [PERF_RECORD_FORK] = event__task_swap,
  264. [PERF_RECORD_EXIT] = event__task_swap,
  265. [PERF_RECORD_LOST] = event__all64_swap,
  266. [PERF_RECORD_READ] = event__read_swap,
  267. [PERF_RECORD_SAMPLE] = event__all64_swap,
  268. [PERF_RECORD_HEADER_ATTR] = event__attr_swap,
  269. [PERF_RECORD_HEADER_MAX] = NULL,
  270. };
  271. static int perf_session__process_event(struct perf_session *self,
  272. event_t *event,
  273. struct perf_event_ops *ops,
  274. u64 offset, u64 head)
  275. {
  276. trace_event(event);
  277. if (event->header.type < PERF_RECORD_HEADER_MAX) {
  278. dump_printf("%#Lx [%#x]: PERF_RECORD_%s",
  279. offset + head, event->header.size,
  280. event__name[event->header.type]);
  281. ++event__total[0];
  282. ++event__total[event->header.type];
  283. }
  284. if (self->header.needs_swap && event__swap_ops[event->header.type])
  285. event__swap_ops[event->header.type](event);
  286. switch (event->header.type) {
  287. case PERF_RECORD_SAMPLE:
  288. return ops->sample(event, self);
  289. case PERF_RECORD_MMAP:
  290. return ops->mmap(event, self);
  291. case PERF_RECORD_COMM:
  292. return ops->comm(event, self);
  293. case PERF_RECORD_FORK:
  294. return ops->fork(event, self);
  295. case PERF_RECORD_EXIT:
  296. return ops->exit(event, self);
  297. case PERF_RECORD_LOST:
  298. return ops->lost(event, self);
  299. case PERF_RECORD_READ:
  300. return ops->read(event, self);
  301. case PERF_RECORD_THROTTLE:
  302. return ops->throttle(event, self);
  303. case PERF_RECORD_UNTHROTTLE:
  304. return ops->unthrottle(event, self);
  305. case PERF_RECORD_HEADER_ATTR:
  306. return ops->attr(event, self);
  307. default:
  308. self->unknown_events++;
  309. return -1;
  310. }
  311. }
  312. void perf_event_header__bswap(struct perf_event_header *self)
  313. {
  314. self->type = bswap_32(self->type);
  315. self->misc = bswap_16(self->misc);
  316. self->size = bswap_16(self->size);
  317. }
  318. int perf_header__read_build_ids(struct perf_header *self,
  319. int input, u64 offset, u64 size)
  320. {
  321. struct build_id_event bev;
  322. char filename[PATH_MAX];
  323. u64 limit = offset + size;
  324. int err = -1;
  325. while (offset < limit) {
  326. struct dso *dso;
  327. ssize_t len;
  328. struct list_head *head = &dsos__user;
  329. if (read(input, &bev, sizeof(bev)) != sizeof(bev))
  330. goto out;
  331. if (self->needs_swap)
  332. perf_event_header__bswap(&bev.header);
  333. len = bev.header.size - sizeof(bev);
  334. if (read(input, filename, len) != len)
  335. goto out;
  336. if (bev.header.misc & PERF_RECORD_MISC_KERNEL)
  337. head = &dsos__kernel;
  338. dso = __dsos__findnew(head, filename);
  339. if (dso != NULL) {
  340. dso__set_build_id(dso, &bev.build_id);
  341. if (head == &dsos__kernel && filename[0] == '[')
  342. dso->kernel = 1;
  343. }
  344. offset += bev.header.size;
  345. }
  346. err = 0;
  347. out:
  348. return err;
  349. }
  /*
   * Look up (or create) the thread with pid 0 and name it "swapper".
   * Returns the thread, or NULL after logging an error if either step
   * fails.
   */
  static struct thread *perf_session__register_idle_thread(struct perf_session *self)
  {
      struct thread *idle = perf_session__findnew(self, 0);

      if (idle != NULL && thread__set_comm(idle, "swapper") == 0)
          return idle;

      pr_err("problem inserting idle task.\n");
      return NULL;
  }
  /*
   * Read exactly @size bytes from @fd into @buf, looping over short reads.
   *
   * Returns the number of bytes read (equal to @size) on success.  If
   * read() reports end of file or an error before @size bytes have
   * arrived, that read() result (0 or -1) is returned instead, even when
   * some bytes were already stored.  A @size of 0 returns 0 without
   * reading.
   */
  int do_read(int fd, void *buf, size_t size)
  {
      /* Step through the buffer as bytes; void * arithmetic is not ISO C. */
      char *cursor = buf;
      size_t remaining = size;

      while (remaining) {
          ssize_t nr = read(fd, cursor, remaining);

          if (nr <= 0)
              return (int)nr;

          remaining -= (size_t)nr;
          cursor += nr;
      }

      return (int)(cursor - (char *)buf);
  }
  /*
   * Flag polled by the pipe event loop; a non-zero value makes the loop
   * stop after the current event.  Presumably set asynchronously by code
   * outside this file (e.g. a signal handler) -- TODO confirm.
   */
  volatile int session_done;

  /* Read the flag through a volatile access so each check hits memory. */
  #define session_done() (*(volatile int *)(&session_done))
  373. static int __perf_session__process_pipe_events(struct perf_session *self,
  374. struct perf_event_ops *ops)
  375. {
  376. event_t event;
  377. uint32_t size;
  378. int skip = 0;
  379. u64 head;
  380. int err;
  381. void *p;
  382. perf_event_ops__fill_defaults(ops);
  383. head = 0;
  384. more:
  385. err = do_read(self->fd, &event, sizeof(struct perf_event_header));
  386. if (err <= 0) {
  387. if (err == 0)
  388. goto done;
  389. pr_err("failed to read event header\n");
  390. goto out_err;
  391. }
  392. if (self->header.needs_swap)
  393. perf_event_header__bswap(&event.header);
  394. size = event.header.size;
  395. if (size == 0)
  396. size = 8;
  397. p = &event;
  398. p += sizeof(struct perf_event_header);
  399. err = do_read(self->fd, p, size - sizeof(struct perf_event_header));
  400. if (err <= 0) {
  401. if (err == 0) {
  402. pr_err("unexpected end of event stream\n");
  403. goto done;
  404. }
  405. pr_err("failed to read event data\n");
  406. goto out_err;
  407. }
  408. if (size == 0 ||
  409. (skip = perf_session__process_event(self, &event, ops,
  410. 0, head)) < 0) {
  411. dump_printf("%#Lx [%#x]: skipping unknown header type: %d\n",
  412. head, event.header.size, event.header.type);
  413. /*
  414. * assume we lost track of the stream, check alignment, and
  415. * increment a single u64 in the hope to catch on again 'soon'.
  416. */
  417. if (unlikely(head & 7))
  418. head &= ~7ULL;
  419. size = 8;
  420. }
  421. head += size;
  422. dump_printf("\n%#Lx [%#x]: event: %d\n",
  423. head, event.header.size, event.header.type);
  424. if (skip > 0)
  425. head += skip;
  426. if (!session_done())
  427. goto more;
  428. done:
  429. err = 0;
  430. out_err:
  431. return err;
  432. }
  433. int __perf_session__process_events(struct perf_session *self,
  434. u64 data_offset, u64 data_size,
  435. u64 file_size, struct perf_event_ops *ops)
  436. {
  437. int err, mmap_prot, mmap_flags;
  438. u64 head, shift;
  439. u64 offset = 0;
  440. size_t page_size;
  441. event_t *event;
  442. uint32_t size;
  443. char *buf;
  444. struct ui_progress *progress = ui_progress__new("Processing events...",
  445. self->size);
  446. if (progress == NULL)
  447. return -1;
  448. perf_event_ops__fill_defaults(ops);
  449. page_size = sysconf(_SC_PAGESIZE);
  450. head = data_offset;
  451. shift = page_size * (head / page_size);
  452. offset += shift;
  453. head -= shift;
  454. mmap_prot = PROT_READ;
  455. mmap_flags = MAP_SHARED;
  456. if (self->header.needs_swap) {
  457. mmap_prot |= PROT_WRITE;
  458. mmap_flags = MAP_PRIVATE;
  459. }
  460. remap:
  461. buf = mmap(NULL, page_size * self->mmap_window, mmap_prot,
  462. mmap_flags, self->fd, offset);
  463. if (buf == MAP_FAILED) {
  464. pr_err("failed to mmap file\n");
  465. err = -errno;
  466. goto out_err;
  467. }
  468. more:
  469. event = (event_t *)(buf + head);
  470. ui_progress__update(progress, offset);
  471. if (self->header.needs_swap)
  472. perf_event_header__bswap(&event->header);
  473. size = event->header.size;
  474. if (size == 0)
  475. size = 8;
  476. if (head + event->header.size >= page_size * self->mmap_window) {
  477. int munmap_ret;
  478. shift = page_size * (head / page_size);
  479. munmap_ret = munmap(buf, page_size * self->mmap_window);
  480. assert(munmap_ret == 0);
  481. offset += shift;
  482. head -= shift;
  483. goto remap;
  484. }
  485. size = event->header.size;
  486. dump_printf("\n%#Lx [%#x]: event: %d\n",
  487. offset + head, event->header.size, event->header.type);
  488. if (size == 0 ||
  489. perf_session__process_event(self, event, ops, offset, head) < 0) {
  490. dump_printf("%#Lx [%#x]: skipping unknown header type: %d\n",
  491. offset + head, event->header.size,
  492. event->header.type);
  493. /*
  494. * assume we lost track of the stream, check alignment, and
  495. * increment a single u64 in the hope to catch on again 'soon'.
  496. */
  497. if (unlikely(head & 7))
  498. head &= ~7ULL;
  499. size = 8;
  500. }
  501. head += size;
  502. if (offset + head >= data_offset + data_size)
  503. goto done;
  504. if (offset + head < file_size)
  505. goto more;
  506. done:
  507. err = 0;
  508. out_err:
  509. ui_progress__delete(progress);
  510. return err;
  511. }
  512. int perf_session__process_events(struct perf_session *self,
  513. struct perf_event_ops *ops)
  514. {
  515. int err;
  516. if (perf_session__register_idle_thread(self) == NULL)
  517. return -ENOMEM;
  518. if (!symbol_conf.full_paths) {
  519. char bf[PATH_MAX];
  520. if (getcwd(bf, sizeof(bf)) == NULL) {
  521. err = -errno;
  522. out_getcwd_err:
  523. pr_err("failed to get the current directory\n");
  524. goto out_err;
  525. }
  526. self->cwd = strdup(bf);
  527. if (self->cwd == NULL) {
  528. err = -ENOMEM;
  529. goto out_getcwd_err;
  530. }
  531. self->cwdlen = strlen(self->cwd);
  532. }
  533. if (!self->fd_pipe)
  534. err = __perf_session__process_events(self,
  535. self->header.data_offset,
  536. self->header.data_size,
  537. self->size, ops);
  538. else
  539. err = __perf_session__process_pipe_events(self, ops);
  540. out_err:
  541. return err;
  542. }
  543. bool perf_session__has_traces(struct perf_session *self, const char *msg)
  544. {
  545. if (!(self->sample_type & PERF_SAMPLE_RAW)) {
  546. pr_err("No trace sample to read. Did you call 'perf %s'?\n", msg);
  547. return false;
  548. }
  549. return true;
  550. }
  551. int perf_session__set_kallsyms_ref_reloc_sym(struct perf_session *self,
  552. const char *symbol_name,
  553. u64 addr)
  554. {
  555. char *bracket;
  556. enum map_type i;
  557. self->ref_reloc_sym.name = strdup(symbol_name);
  558. if (self->ref_reloc_sym.name == NULL)
  559. return -ENOMEM;
  560. bracket = strchr(self->ref_reloc_sym.name, ']');
  561. if (bracket)
  562. *bracket = '\0';
  563. self->ref_reloc_sym.addr = addr;
  564. for (i = 0; i < MAP__NR_TYPES; ++i) {
  565. struct kmap *kmap = map__kmap(self->vmlinux_maps[i]);
  566. kmap->ref_reloc_sym = &self->ref_reloc_sym;
  567. }
  568. return 0;
  569. }