/* session.c */

#include <linux/kernel.h>
#include <traceevent/event-parse.h>

#include <byteswap.h>
#include <unistd.h>
#include <sys/types.h>
#include <sys/mman.h>

#include "evlist.h"
#include "evsel.h"
#include "session.h"
#include "tool.h"
#include "sort.h"
#include "util.h"
#include "cpumap.h"
#include "perf_regs.h"
#include "vdso.h"
static int perf_session__open(struct perf_session *self, bool force)
{
	struct stat input_stat;

	if (!strcmp(self->filename, "-")) {
		self->fd_pipe = true;
		self->fd = STDIN_FILENO;

		if (perf_session__read_header(self) < 0)
			pr_err("incompatible file format (rerun with -v to learn more)");

		return 0;
	}

	self->fd = open(self->filename, O_RDONLY);
	if (self->fd < 0) {
		int err = errno;

		pr_err("failed to open %s: %s", self->filename, strerror(err));
		if (err == ENOENT && !strcmp(self->filename, "perf.data"))
			pr_err(" (try 'perf record' first)");
		pr_err("\n");
		return -errno;
	}

	if (fstat(self->fd, &input_stat) < 0)
		goto out_close;

	if (!force && input_stat.st_uid && (input_stat.st_uid != geteuid())) {
		pr_err("file %s not owned by current user or root\n",
		       self->filename);
		goto out_close;
	}

	if (!input_stat.st_size) {
		pr_info("zero-sized file (%s), nothing to do!\n",
			self->filename);
		goto out_close;
	}

	if (perf_session__read_header(self) < 0) {
		pr_err("incompatible file format (rerun with -v to learn more)");
		goto out_close;
	}

	if (!perf_evlist__valid_sample_type(self->evlist)) {
		pr_err("non matching sample_type");
		goto out_close;
	}

	if (!perf_evlist__valid_sample_id_all(self->evlist)) {
		pr_err("non matching sample_id_all");
		goto out_close;
	}

	if (!perf_evlist__valid_read_format(self->evlist)) {
		pr_err("non matching read_format");
		goto out_close;
	}

	self->size = input_stat.st_size;
	return 0;

out_close:
	close(self->fd);
	self->fd = -1;
	return -1;
}
void perf_session__set_id_hdr_size(struct perf_session *session)
{
	u16 id_hdr_size = perf_evlist__id_hdr_size(session->evlist);

	machines__set_id_hdr_size(&session->machines, id_hdr_size);
}

int perf_session__create_kernel_maps(struct perf_session *self)
{
	int ret = machine__create_kernel_maps(&self->machines.host);

	if (ret >= 0)
		ret = machines__create_guest_kernel_maps(&self->machines);
	return ret;
}

static void perf_session__destroy_kernel_maps(struct perf_session *self)
{
	machines__destroy_kernel_maps(&self->machines);
}

struct perf_session *perf_session__new(const char *filename, int mode,
				       bool force, bool repipe,
				       struct perf_tool *tool)
{
	struct perf_session *self;
	struct stat st;
	size_t len;

	if (!filename || !strlen(filename)) {
		if (!fstat(STDIN_FILENO, &st) && S_ISFIFO(st.st_mode))
			filename = "-";
		else
			filename = "perf.data";
	}

	len = strlen(filename);
	self = zalloc(sizeof(*self) + len);

	if (self == NULL)
		goto out;

	memcpy(self->filename, filename, len);
	self->repipe = repipe;
	INIT_LIST_HEAD(&self->ordered_samples.samples);
	INIT_LIST_HEAD(&self->ordered_samples.sample_cache);
	INIT_LIST_HEAD(&self->ordered_samples.to_free);
	machines__init(&self->machines);

	if (mode == O_RDONLY) {
		if (perf_session__open(self, force) < 0)
			goto out_delete;
		perf_session__set_id_hdr_size(self);
	} else if (mode == O_WRONLY) {
		/*
		 * In O_RDONLY mode this will be performed when reading the
		 * kernel MMAP event, in perf_event__process_mmap().
		 */
		if (perf_session__create_kernel_maps(self) < 0)
			goto out_delete;
	}

	if (tool && tool->ordering_requires_timestamps &&
	    tool->ordered_samples && !perf_evlist__sample_id_all(self->evlist)) {
		dump_printf("WARNING: No sample_id_all support, falling back to unordered processing\n");
		tool->ordered_samples = false;
	}

out:
	return self;
out_delete:
	perf_session__delete(self);
	return NULL;
}
static void perf_session__delete_dead_threads(struct perf_session *session)
{
	machine__delete_dead_threads(&session->machines.host);
}

static void perf_session__delete_threads(struct perf_session *session)
{
	machine__delete_threads(&session->machines.host);
}

static void perf_session_env__delete(struct perf_session_env *env)
{
	free(env->hostname);
	free(env->os_release);
	free(env->version);
	free(env->arch);
	free(env->cpu_desc);
	free(env->cpuid);

	free(env->cmdline);
	free(env->sibling_cores);
	free(env->sibling_threads);
	free(env->numa_nodes);
	free(env->pmu_mappings);
}

void perf_session__delete(struct perf_session *self)
{
	perf_session__destroy_kernel_maps(self);
	perf_session__delete_dead_threads(self);
	perf_session__delete_threads(self);
	perf_session_env__delete(&self->header.env);
	machines__exit(&self->machines);
	close(self->fd);
	free(self);
	vdso__exit();
}
static int process_event_synth_tracing_data_stub(struct perf_tool *tool
						 __maybe_unused,
						 union perf_event *event
						 __maybe_unused,
						 struct perf_session *session
						 __maybe_unused)
{
	dump_printf(": unhandled!\n");
	return 0;
}

static int process_event_synth_attr_stub(struct perf_tool *tool __maybe_unused,
					 union perf_event *event __maybe_unused,
					 struct perf_evlist **pevlist
					 __maybe_unused)
{
	dump_printf(": unhandled!\n");
	return 0;
}

static int process_event_sample_stub(struct perf_tool *tool __maybe_unused,
				     union perf_event *event __maybe_unused,
				     struct perf_sample *sample __maybe_unused,
				     struct perf_evsel *evsel __maybe_unused,
				     struct machine *machine __maybe_unused)
{
	dump_printf(": unhandled!\n");
	return 0;
}

static int process_event_stub(struct perf_tool *tool __maybe_unused,
			      union perf_event *event __maybe_unused,
			      struct perf_sample *sample __maybe_unused,
			      struct machine *machine __maybe_unused)
{
	dump_printf(": unhandled!\n");
	return 0;
}

static int process_finished_round_stub(struct perf_tool *tool __maybe_unused,
				       union perf_event *event __maybe_unused,
				       struct perf_session *perf_session
				       __maybe_unused)
{
	dump_printf(": unhandled!\n");
	return 0;
}

static int process_finished_round(struct perf_tool *tool,
				  union perf_event *event,
				  struct perf_session *session);

void perf_tool__fill_defaults(struct perf_tool *tool)
{
	if (tool->sample == NULL)
		tool->sample = process_event_sample_stub;
	if (tool->mmap == NULL)
		tool->mmap = process_event_stub;
	if (tool->mmap2 == NULL)
		tool->mmap2 = process_event_stub;
	if (tool->comm == NULL)
		tool->comm = process_event_stub;
	if (tool->fork == NULL)
		tool->fork = process_event_stub;
	if (tool->exit == NULL)
		tool->exit = process_event_stub;
	if (tool->lost == NULL)
		tool->lost = perf_event__process_lost;
	if (tool->read == NULL)
		tool->read = process_event_sample_stub;
	if (tool->throttle == NULL)
		tool->throttle = process_event_stub;
	if (tool->unthrottle == NULL)
		tool->unthrottle = process_event_stub;
	if (tool->attr == NULL)
		tool->attr = process_event_synth_attr_stub;
	if (tool->tracing_data == NULL)
		tool->tracing_data = process_event_synth_tracing_data_stub;
	if (tool->build_id == NULL)
		tool->build_id = process_finished_round_stub;
	if (tool->finished_round == NULL) {
		if (tool->ordered_samples)
			tool->finished_round = process_finished_round;
		else
			tool->finished_round = process_finished_round_stub;
	}
}
void mem_bswap_32(void *src, int byte_size)
{
	u32 *m = src;

	while (byte_size > 0) {
		*m = bswap_32(*m);
		byte_size -= sizeof(u32);
		++m;
	}
}

void mem_bswap_64(void *src, int byte_size)
{
	u64 *m = src;

	while (byte_size > 0) {
		*m = bswap_64(*m);
		byte_size -= sizeof(u64);
		++m;
	}
}
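
/*
 * Note: both helpers above swap whole words, so byte_size is expected to be
 * a multiple of the word size; the 64-bit callers below guarantee this (see
 * the BUG_ON in swap_sample_id_all()).
 */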
static void swap_sample_id_all(union perf_event *event, void *data)
{
	void *end = (void *) event + event->header.size;
	int size = end - data;

	BUG_ON(size % sizeof(u64));
	mem_bswap_64(data, size);
}

static void perf_event__all64_swap(union perf_event *event,
				   bool sample_id_all __maybe_unused)
{
	struct perf_event_header *hdr = &event->header;

	mem_bswap_64(hdr + 1, event->header.size - sizeof(*hdr));
}

static void perf_event__comm_swap(union perf_event *event, bool sample_id_all)
{
	event->comm.pid = bswap_32(event->comm.pid);
	event->comm.tid = bswap_32(event->comm.tid);

	if (sample_id_all) {
		void *data = &event->comm.comm;

		data += PERF_ALIGN(strlen(data) + 1, sizeof(u64));
		swap_sample_id_all(event, data);
	}
}

static void perf_event__mmap_swap(union perf_event *event,
				  bool sample_id_all)
{
	event->mmap.pid = bswap_32(event->mmap.pid);
	event->mmap.tid = bswap_32(event->mmap.tid);
	event->mmap.start = bswap_64(event->mmap.start);
	event->mmap.len = bswap_64(event->mmap.len);
	event->mmap.pgoff = bswap_64(event->mmap.pgoff);

	if (sample_id_all) {
		void *data = &event->mmap.filename;

		data += PERF_ALIGN(strlen(data) + 1, sizeof(u64));
		swap_sample_id_all(event, data);
	}
}

static void perf_event__mmap2_swap(union perf_event *event,
				   bool sample_id_all)
{
	event->mmap2.pid = bswap_32(event->mmap2.pid);
	event->mmap2.tid = bswap_32(event->mmap2.tid);
	event->mmap2.start = bswap_64(event->mmap2.start);
	event->mmap2.len = bswap_64(event->mmap2.len);
	event->mmap2.pgoff = bswap_64(event->mmap2.pgoff);
	event->mmap2.maj = bswap_32(event->mmap2.maj);
	event->mmap2.min = bswap_32(event->mmap2.min);
	event->mmap2.ino = bswap_64(event->mmap2.ino);

	if (sample_id_all) {
		void *data = &event->mmap2.filename;

		data += PERF_ALIGN(strlen(data) + 1, sizeof(u64));
		swap_sample_id_all(event, data);
	}
}

static void perf_event__task_swap(union perf_event *event, bool sample_id_all)
{
	event->fork.pid = bswap_32(event->fork.pid);
	event->fork.tid = bswap_32(event->fork.tid);
	event->fork.ppid = bswap_32(event->fork.ppid);
	event->fork.ptid = bswap_32(event->fork.ptid);
	event->fork.time = bswap_64(event->fork.time);

	if (sample_id_all)
		swap_sample_id_all(event, &event->fork + 1);
}

static void perf_event__read_swap(union perf_event *event, bool sample_id_all)
{
	event->read.pid = bswap_32(event->read.pid);
	event->read.tid = bswap_32(event->read.tid);
	event->read.value = bswap_64(event->read.value);
	event->read.time_enabled = bswap_64(event->read.time_enabled);
	event->read.time_running = bswap_64(event->read.time_running);
	event->read.id = bswap_64(event->read.id);

	if (sample_id_all)
		swap_sample_id_all(event, &event->read + 1);
}

static void perf_event__throttle_swap(union perf_event *event,
				      bool sample_id_all)
{
	event->throttle.time = bswap_64(event->throttle.time);
	event->throttle.id = bswap_64(event->throttle.id);
	event->throttle.stream_id = bswap_64(event->throttle.stream_id);

	if (sample_id_all)
		swap_sample_id_all(event, &event->throttle + 1);
}

static u8 revbyte(u8 b)
{
	int rev = (b >> 4) | ((b & 0xf) << 4);
	rev = ((rev & 0xcc) >> 2) | ((rev & 0x33) << 2);
	rev = ((rev & 0xaa) >> 1) | ((rev & 0x55) << 1);
	return (u8) rev;
}
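
/*
 * For example, revbyte(0x1e) == 0x78: bits 00011110 become 01111000.
 * The three steps swap the nibbles, then the bit pairs within each nibble,
 * then adjacent bits, which together reverse the bit order of the byte.
 */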
/*
 * XXX this is a hack in an attempt to carry the flags bitfield
 * through the endian village. The ABI says:
 *
 * Bit-fields are allocated from right to left (least to most significant)
 * on little-endian implementations and from left to right (most to least
 * significant) on big-endian implementations.
 *
 * The above seems to be byte specific, so we need to reverse each
 * byte of the bitfield. 'Internet' also says this might be implementation
 * specific and we probably need a proper fix that carries the
 * perf_event_attr bitfield flags in a separate FEAT_ section of the data
 * file. Though this seems to work for now.
 */
static void swap_bitfield(u8 *p, unsigned len)
{
	unsigned i;

	for (i = 0; i < len; i++) {
		*p = revbyte(*p);
		p++;
	}
}

/* exported for swapping attributes in file header */
void perf_event__attr_swap(struct perf_event_attr *attr)
{
	attr->type = bswap_32(attr->type);
	attr->size = bswap_32(attr->size);
	attr->config = bswap_64(attr->config);
	attr->sample_period = bswap_64(attr->sample_period);
	attr->sample_type = bswap_64(attr->sample_type);
	attr->read_format = bswap_64(attr->read_format);
	attr->wakeup_events = bswap_32(attr->wakeup_events);
	attr->bp_type = bswap_32(attr->bp_type);
	attr->bp_addr = bswap_64(attr->bp_addr);
	attr->bp_len = bswap_64(attr->bp_len);
	attr->branch_sample_type = bswap_64(attr->branch_sample_type);
	attr->sample_regs_user = bswap_64(attr->sample_regs_user);
	attr->sample_stack_user = bswap_32(attr->sample_stack_user);

	swap_bitfield((u8 *) (&attr->read_format + 1), sizeof(u64));
}
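
/*
 * The (&attr->read_format + 1) above points at the u64 of bit-flags
 * (disabled, inherit, exclude_*, ...) that immediately follows read_format
 * in struct perf_event_attr; that word is the bitfield being byte-reversed.
 */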
static void perf_event__hdr_attr_swap(union perf_event *event,
				      bool sample_id_all __maybe_unused)
{
	size_t size;

	perf_event__attr_swap(&event->attr.attr);

	size = event->header.size;
	size -= (void *)&event->attr.id - (void *)event;
	mem_bswap_64(event->attr.id, size);
}

static void perf_event__event_type_swap(union perf_event *event,
					bool sample_id_all __maybe_unused)
{
	event->event_type.event_type.event_id =
		bswap_64(event->event_type.event_type.event_id);
}

static void perf_event__tracing_data_swap(union perf_event *event,
					  bool sample_id_all __maybe_unused)
{
	event->tracing_data.size = bswap_32(event->tracing_data.size);
}

typedef void (*perf_event__swap_op)(union perf_event *event,
				    bool sample_id_all);

static perf_event__swap_op perf_event__swap_ops[] = {
	[PERF_RECORD_MMAP] = perf_event__mmap_swap,
	[PERF_RECORD_MMAP2] = perf_event__mmap2_swap,
	[PERF_RECORD_COMM] = perf_event__comm_swap,
	[PERF_RECORD_FORK] = perf_event__task_swap,
	[PERF_RECORD_EXIT] = perf_event__task_swap,
	[PERF_RECORD_LOST] = perf_event__all64_swap,
	[PERF_RECORD_READ] = perf_event__read_swap,
	[PERF_RECORD_THROTTLE] = perf_event__throttle_swap,
	[PERF_RECORD_UNTHROTTLE] = perf_event__throttle_swap,
	[PERF_RECORD_SAMPLE] = perf_event__all64_swap,
	[PERF_RECORD_HEADER_ATTR] = perf_event__hdr_attr_swap,
	[PERF_RECORD_HEADER_EVENT_TYPE] = perf_event__event_type_swap,
	[PERF_RECORD_HEADER_TRACING_DATA] = perf_event__tracing_data_swap,
	[PERF_RECORD_HEADER_BUILD_ID] = NULL,
	[PERF_RECORD_HEADER_MAX] = NULL,
};
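
/*
 * The table is indexed by PERF_RECORD_* type. A NULL slot simply means no
 * body-swap handler is invoked for that record type; event_swap() below
 * checks the pointer before calling through it.
 */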
struct sample_queue {
	u64 timestamp;
	u64 file_offset;
	union perf_event *event;
	struct list_head list;
};

static void perf_session_free_sample_buffers(struct perf_session *session)
{
	struct ordered_samples *os = &session->ordered_samples;

	while (!list_empty(&os->to_free)) {
		struct sample_queue *sq;

		sq = list_entry(os->to_free.next, struct sample_queue, list);
		list_del(&sq->list);
		free(sq);
	}
}

static int perf_session_deliver_event(struct perf_session *session,
				      union perf_event *event,
				      struct perf_sample *sample,
				      struct perf_tool *tool,
				      u64 file_offset);

static int flush_sample_queue(struct perf_session *s,
			      struct perf_tool *tool)
{
	struct ordered_samples *os = &s->ordered_samples;
	struct list_head *head = &os->samples;
	struct sample_queue *tmp, *iter;
	struct perf_sample sample;
	u64 limit = os->next_flush;
	u64 last_ts = os->last_sample ? os->last_sample->timestamp : 0ULL;
	unsigned idx = 0, progress_next = os->nr_samples / 16;
	bool show_progress = limit == ULLONG_MAX;
	int ret;

	if (!tool->ordered_samples || !limit)
		return 0;

	list_for_each_entry_safe(iter, tmp, head, list) {
		if (session_done())
			return 0;
		if (iter->timestamp > limit)
			break;

		ret = perf_evlist__parse_sample(s->evlist, iter->event, &sample);
		if (ret)
			pr_err("Can't parse sample, err = %d\n", ret);
		else {
			ret = perf_session_deliver_event(s, iter->event, &sample, tool,
							 iter->file_offset);
			if (ret)
				return ret;
		}

		os->last_flush = iter->timestamp;
		list_del(&iter->list);
		list_add(&iter->list, &os->sample_cache);
		if (show_progress && (++idx >= progress_next)) {
			progress_next += os->nr_samples / 16;
			ui_progress__update(idx, os->nr_samples,
					    "Processing time ordered events...");
		}
	}

	if (list_empty(head)) {
		os->last_sample = NULL;
	} else if (last_ts <= limit) {
		os->last_sample =
			list_entry(head->prev, struct sample_queue, list);
	}

	os->nr_samples = 0;

	return 0;
}
/*
 * When perf record finishes a pass over all buffers, it records this pseudo
 * event.
 * We record the max timestamp t found in pass n.
 * Assuming these timestamps are monotonic across cpus, we know that if
 * a buffer still has events with timestamps below t, they will all be
 * available and read in pass n + 1.
 * Hence when we start to read pass n + 2, we can safely flush all
 * events with timestamps below t.
 *
 *    ============ PASS n =================
 *       CPU 0         |   CPU 1
 *                     |
 *    cnt1 timestamps  |   cnt2 timestamps
 *          1          |         2
 *          2          |         3
 *          -          |         4  <--- max recorded
 *
 *    ============ PASS n + 1 ==============
 *       CPU 0         |   CPU 1
 *                     |
 *    cnt1 timestamps  |   cnt2 timestamps
 *          3          |         5
 *          4          |         6
 *          5          |         7 <---- max recorded
 *
 *      Flush all events below timestamp 4
 *
 *    ============ PASS n + 2 ==============
 *       CPU 0         |   CPU 1
 *                     |
 *    cnt1 timestamps  |   cnt2 timestamps
 *          6          |         8
 *          7          |         9
 *          -          |         10
 *
 *      Flush all events below timestamp 7
 *      etc...
 */
static int process_finished_round(struct perf_tool *tool,
				  union perf_event *event __maybe_unused,
				  struct perf_session *session)
{
	int ret = flush_sample_queue(session, tool);

	if (!ret)
		session->ordered_samples.next_flush = session->ordered_samples.max_timestamp;

	return ret;
}

/* The queue is ordered by time */
static void __queue_event(struct sample_queue *new, struct perf_session *s)
{
	struct ordered_samples *os = &s->ordered_samples;
	struct sample_queue *sample = os->last_sample;
	u64 timestamp = new->timestamp;
	struct list_head *p;

	++os->nr_samples;
	os->last_sample = new;

	if (!sample) {
		list_add(&new->list, &os->samples);
		os->max_timestamp = timestamp;
		return;
	}

	/*
	 * last_sample might point to some random place in the list as it's
	 * the last queued event. We expect that the new event is close to
	 * this.
	 */
	if (sample->timestamp <= timestamp) {
		while (sample->timestamp <= timestamp) {
			p = sample->list.next;
			if (p == &os->samples) {
				list_add_tail(&new->list, &os->samples);
				os->max_timestamp = timestamp;
				return;
			}
			sample = list_entry(p, struct sample_queue, list);
		}
		list_add_tail(&new->list, &sample->list);
	} else {
		while (sample->timestamp > timestamp) {
			p = sample->list.prev;
			if (p == &os->samples) {
				list_add(&new->list, &os->samples);
				return;
			}
			sample = list_entry(p, struct sample_queue, list);
		}
		list_add(&new->list, &sample->list);
	}
}
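
/*
 * Starting the walk at last_sample rather than at the list head means a
 * nearly-in-order stream is inserted after just a few comparisons; the
 * walk only grows long when timestamps arrive far out of order.
 */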
#define MAX_SAMPLE_BUFFER	(64 * 1024 / sizeof(struct sample_queue))

int perf_session_queue_event(struct perf_session *s, union perf_event *event,
			     struct perf_sample *sample, u64 file_offset)
{
	struct ordered_samples *os = &s->ordered_samples;
	struct list_head *sc = &os->sample_cache;
	u64 timestamp = sample->time;
	struct sample_queue *new;

	if (!timestamp || timestamp == ~0ULL)
		return -ETIME;

	if (timestamp < s->ordered_samples.last_flush) {
		printf("Warning: Timestamp below last timeslice flush\n");
		return -EINVAL;
	}

	if (!list_empty(sc)) {
		new = list_entry(sc->next, struct sample_queue, list);
		list_del(&new->list);
	} else if (os->sample_buffer) {
		new = os->sample_buffer + os->sample_buffer_idx;
		if (++os->sample_buffer_idx == MAX_SAMPLE_BUFFER)
			os->sample_buffer = NULL;
	} else {
		os->sample_buffer = malloc(MAX_SAMPLE_BUFFER * sizeof(*new));
		if (!os->sample_buffer)
			return -ENOMEM;
		list_add(&os->sample_buffer->list, &os->to_free);
		os->sample_buffer_idx = 2;
		new = os->sample_buffer + 1;
	}

	new->timestamp = timestamp;
	new->file_offset = file_offset;
	new->event = event;

	__queue_event(new, s);

	return 0;
}
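
/*
 * Allocation note: entries come from the recycled sample_cache first, then
 * from the current 64KB chunk. Slot 0 of each chunk is never handed out;
 * its embedded list node is what links the chunk onto os->to_free, so
 * perf_session_free_sample_buffers() can release whole chunks at once.
 */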
static void callchain__printf(struct perf_sample *sample)
{
	unsigned int i;

	printf("... chain: nr:%" PRIu64 "\n", sample->callchain->nr);

	for (i = 0; i < sample->callchain->nr; i++)
		printf("..... %2d: %016" PRIx64 "\n",
		       i, sample->callchain->ips[i]);
}

static void branch_stack__printf(struct perf_sample *sample)
{
	uint64_t i;

	printf("... branch stack: nr:%" PRIu64 "\n", sample->branch_stack->nr);

	for (i = 0; i < sample->branch_stack->nr; i++)
		printf("..... %2"PRIu64": %016" PRIx64 " -> %016" PRIx64 "\n",
		       i, sample->branch_stack->entries[i].from,
		       sample->branch_stack->entries[i].to);
}

static void regs_dump__printf(u64 mask, u64 *regs)
{
	unsigned rid, i = 0;

	for_each_set_bit(rid, (unsigned long *) &mask, sizeof(mask) * 8) {
		u64 val = regs[i++];

		printf(".... %-5s 0x%" PRIx64 "\n",
		       perf_reg_name(rid), val);
	}
}

static void regs_user__printf(struct perf_sample *sample, u64 mask)
{
	struct regs_dump *user_regs = &sample->user_regs;

	if (user_regs->regs) {
		printf("... user regs: mask 0x%" PRIx64 "\n", mask);
		regs_dump__printf(mask, user_regs->regs);
	}
}

static void stack_user__printf(struct stack_dump *dump)
{
	printf("... ustack: size %" PRIu64 ", offset 0x%x\n",
	       dump->size, dump->offset);
}

static void perf_session__print_tstamp(struct perf_session *session,
				       union perf_event *event,
				       struct perf_sample *sample)
{
	u64 sample_type = __perf_evlist__combined_sample_type(session->evlist);

	if (event->header.type != PERF_RECORD_SAMPLE &&
	    !perf_evlist__sample_id_all(session->evlist)) {
		fputs("-1 -1 ", stdout);
		return;
	}

	if ((sample_type & PERF_SAMPLE_CPU))
		printf("%u ", sample->cpu);

	if (sample_type & PERF_SAMPLE_TIME)
		printf("%" PRIu64 " ", sample->time);
}

static void sample_read__printf(struct perf_sample *sample, u64 read_format)
{
	printf("... sample_read:\n");

	if (read_format & PERF_FORMAT_TOTAL_TIME_ENABLED)
		printf("...... time enabled %016" PRIx64 "\n",
		       sample->read.time_enabled);

	if (read_format & PERF_FORMAT_TOTAL_TIME_RUNNING)
		printf("...... time running %016" PRIx64 "\n",
		       sample->read.time_running);

	if (read_format & PERF_FORMAT_GROUP) {
		u64 i;

		printf(".... group nr %" PRIu64 "\n", sample->read.group.nr);

		for (i = 0; i < sample->read.group.nr; i++) {
			struct sample_read_value *value;

			value = &sample->read.group.values[i];
			printf("..... id %016" PRIx64
			       ", value %016" PRIx64 "\n",
			       value->id, value->value);
		}
	} else
		printf("..... id %016" PRIx64 ", value %016" PRIx64 "\n",
		       sample->read.one.id, sample->read.one.value);
}

static void dump_event(struct perf_session *session, union perf_event *event,
		       u64 file_offset, struct perf_sample *sample)
{
	if (!dump_trace)
		return;

	printf("\n%#" PRIx64 " [%#x]: event: %d\n",
	       file_offset, event->header.size, event->header.type);

	trace_event(event);

	if (sample)
		perf_session__print_tstamp(session, event, sample);

	printf("%#" PRIx64 " [%#x]: PERF_RECORD_%s", file_offset,
	       event->header.size, perf_event__name(event->header.type));
}
static void dump_sample(struct perf_evsel *evsel, union perf_event *event,
			struct perf_sample *sample)
{
	u64 sample_type;

	if (!dump_trace)
		return;

	printf("(IP, %d): %d/%d: %#" PRIx64 " period: %" PRIu64 " addr: %#" PRIx64 "\n",
	       event->header.misc, sample->pid, sample->tid, sample->ip,
	       sample->period, sample->addr);

	sample_type = evsel->attr.sample_type;

	if (sample_type & PERF_SAMPLE_CALLCHAIN)
		callchain__printf(sample);

	if (sample_type & PERF_SAMPLE_BRANCH_STACK)
		branch_stack__printf(sample);

	if (sample_type & PERF_SAMPLE_REGS_USER)
		regs_user__printf(sample, evsel->attr.sample_regs_user);

	if (sample_type & PERF_SAMPLE_STACK_USER)
		stack_user__printf(&sample->user_stack);

	if (sample_type & PERF_SAMPLE_WEIGHT)
		printf("... weight: %" PRIu64 "\n", sample->weight);

	if (sample_type & PERF_SAMPLE_DATA_SRC)
		printf(" . data_src: 0x%"PRIx64"\n", sample->data_src);

	if (sample_type & PERF_SAMPLE_TRANSACTION)
		printf("... transaction: %" PRIx64 "\n", sample->transaction);

	if (sample_type & PERF_SAMPLE_READ)
		sample_read__printf(sample, evsel->attr.read_format);
}
static struct machine *
	perf_session__find_machine_for_cpumode(struct perf_session *session,
					       union perf_event *event,
					       struct perf_sample *sample)
{
	const u8 cpumode = event->header.misc & PERF_RECORD_MISC_CPUMODE_MASK;

	if (perf_guest &&
	    ((cpumode == PERF_RECORD_MISC_GUEST_KERNEL) ||
	     (cpumode == PERF_RECORD_MISC_GUEST_USER))) {
		u32 pid;

		if (event->header.type == PERF_RECORD_MMAP
		    || event->header.type == PERF_RECORD_MMAP2)
			pid = event->mmap.pid;
		else
			pid = sample->pid;

		return perf_session__findnew_machine(session, pid);
	}

	return &session->machines.host;
}

static int deliver_sample_value(struct perf_session *session,
				struct perf_tool *tool,
				union perf_event *event,
				struct perf_sample *sample,
				struct sample_read_value *v,
				struct machine *machine)
{
	struct perf_sample_id *sid;

	sid = perf_evlist__id2sid(session->evlist, v->id);
	if (sid) {
		sample->id = v->id;
		sample->period = v->value - sid->period;
		sid->period = v->value;
	}

	if (!sid || sid->evsel == NULL) {
		++session->stats.nr_unknown_id;
		return 0;
	}

	return tool->sample(tool, event, sample, sid->evsel, machine);
}

static int deliver_sample_group(struct perf_session *session,
				struct perf_tool *tool,
				union perf_event *event,
				struct perf_sample *sample,
				struct machine *machine)
{
	int ret = -EINVAL;
	u64 i;

	for (i = 0; i < sample->read.group.nr; i++) {
		ret = deliver_sample_value(session, tool, event, sample,
					   &sample->read.group.values[i],
					   machine);
		if (ret)
			break;
	}

	return ret;
}
static int
perf_session__deliver_sample(struct perf_session *session,
			     struct perf_tool *tool,
			     union perf_event *event,
			     struct perf_sample *sample,
			     struct perf_evsel *evsel,
			     struct machine *machine)
{
	/* We know evsel != NULL. */
	u64 sample_type = evsel->attr.sample_type;
	u64 read_format = evsel->attr.read_format;

	/* Standard sample delivery. */
	if (!(sample_type & PERF_SAMPLE_READ))
		return tool->sample(tool, event, sample, evsel, machine);

	/* For PERF_SAMPLE_READ we have either single or group mode. */
	if (read_format & PERF_FORMAT_GROUP)
		return deliver_sample_group(session, tool, event, sample,
					    machine);
	else
		return deliver_sample_value(session, tool, event, sample,
					    &sample->read.one, machine);
}
static int perf_session_deliver_event(struct perf_session *session,
				      union perf_event *event,
				      struct perf_sample *sample,
				      struct perf_tool *tool,
				      u64 file_offset)
{
	struct perf_evsel *evsel;
	struct machine *machine;

	dump_event(session, event, file_offset, sample);

	evsel = perf_evlist__id2evsel(session->evlist, sample->id);
	if (evsel != NULL && event->header.type != PERF_RECORD_SAMPLE) {
		/*
		 * XXX We're leaving PERF_RECORD_SAMPLE unaccounted here
		 * because the tools right now may apply filters, discarding
		 * some of the samples. For consistency, in the future we
		 * should have something like nr_filtered_samples and remove
		 * the sample->period from total_sample_period, etc, KISS for
		 * now though.
		 *
		 * Also testing against NULL allows us to handle files without
		 * attr.sample_id_all and/or without PERF_SAMPLE_ID. In the
		 * future it'll probably be a good idea to restrict event
		 * processing via perf_session to files with both set.
		 */
		hists__inc_nr_events(&evsel->hists, event->header.type);
	}

	machine = perf_session__find_machine_for_cpumode(session, event,
							 sample);

	switch (event->header.type) {
	case PERF_RECORD_SAMPLE:
		dump_sample(evsel, event, sample);
		if (evsel == NULL) {
			++session->stats.nr_unknown_id;
			return 0;
		}
		if (machine == NULL) {
			++session->stats.nr_unprocessable_samples;
			return 0;
		}
		return perf_session__deliver_sample(session, tool, event,
						    sample, evsel, machine);
	case PERF_RECORD_MMAP:
		return tool->mmap(tool, event, sample, machine);
	case PERF_RECORD_MMAP2:
		return tool->mmap2(tool, event, sample, machine);
	case PERF_RECORD_COMM:
		return tool->comm(tool, event, sample, machine);
	case PERF_RECORD_FORK:
		return tool->fork(tool, event, sample, machine);
	case PERF_RECORD_EXIT:
		return tool->exit(tool, event, sample, machine);
	case PERF_RECORD_LOST:
		if (tool->lost == perf_event__process_lost)
			session->stats.total_lost += event->lost.lost;
		return tool->lost(tool, event, sample, machine);
	case PERF_RECORD_READ:
		return tool->read(tool, event, sample, evsel, machine);
	case PERF_RECORD_THROTTLE:
		return tool->throttle(tool, event, sample, machine);
	case PERF_RECORD_UNTHROTTLE:
		return tool->unthrottle(tool, event, sample, machine);
	default:
		++session->stats.nr_unknown_events;
		return -1;
	}
}
static int perf_session__process_user_event(struct perf_session *session, union perf_event *event,
					    struct perf_tool *tool, u64 file_offset)
{
	int err;

	dump_event(session, event, file_offset, NULL);

	/* These events are processed right away */
	switch (event->header.type) {
	case PERF_RECORD_HEADER_ATTR:
		err = tool->attr(tool, event, &session->evlist);
		if (err == 0)
			perf_session__set_id_hdr_size(session);
		return err;
	case PERF_RECORD_HEADER_TRACING_DATA:
		/* setup for reading amidst mmap */
		lseek(session->fd, file_offset, SEEK_SET);
		return tool->tracing_data(tool, event, session);
	case PERF_RECORD_HEADER_BUILD_ID:
		return tool->build_id(tool, event, session);
	case PERF_RECORD_FINISHED_ROUND:
		return tool->finished_round(tool, event, session);
	default:
		return -EINVAL;
	}
}

static void event_swap(union perf_event *event, bool sample_id_all)
{
	perf_event__swap_op swap;

	swap = perf_event__swap_ops[event->header.type];
	if (swap)
		swap(event, sample_id_all);
}
static int perf_session__process_event(struct perf_session *session,
				       union perf_event *event,
				       struct perf_tool *tool,
				       u64 file_offset)
{
	struct perf_sample sample;
	int ret;

	if (session->header.needs_swap)
		event_swap(event, perf_evlist__sample_id_all(session->evlist));

	if (event->header.type >= PERF_RECORD_HEADER_MAX)
		return -EINVAL;

	events_stats__inc(&session->stats, event->header.type);

	if (event->header.type >= PERF_RECORD_USER_TYPE_START)
		return perf_session__process_user_event(session, event, tool, file_offset);

	/*
	 * For all kernel events we get the sample data
	 */
	ret = perf_evlist__parse_sample(session->evlist, event, &sample);
	if (ret)
		return ret;

	if (tool->ordered_samples) {
		ret = perf_session_queue_event(session, event, &sample,
					       file_offset);
		if (ret != -ETIME)
			return ret;
	}

	return perf_session_deliver_event(session, event, &sample, tool,
					  file_offset);
}
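
/*
 * Note the -ETIME fallthrough above: events that carry no usable timestamp
 * cannot be queued for time reordering, so they are delivered immediately
 * even when the tool asked for ordered samples.
 */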
void perf_event_header__bswap(struct perf_event_header *self)
{
	self->type = bswap_32(self->type);
	self->misc = bswap_16(self->misc);
	self->size = bswap_16(self->size);
}

struct thread *perf_session__findnew(struct perf_session *session, pid_t pid)
{
	return machine__findnew_thread(&session->machines.host, 0, pid);
}

static struct thread *perf_session__register_idle_thread(struct perf_session *self)
{
	struct thread *thread = perf_session__findnew(self, 0);

	if (thread == NULL || thread__set_comm(thread, "swapper")) {
		pr_err("problem inserting idle task.\n");
		thread = NULL;
	}

	return thread;
}

static void perf_session__warn_about_errors(const struct perf_session *session,
					    const struct perf_tool *tool)
{
	if (tool->lost == perf_event__process_lost &&
	    session->stats.nr_events[PERF_RECORD_LOST] != 0) {
		ui__warning("Processed %d events and lost %d chunks!\n\n"
			    "Check IO/CPU overload!\n\n",
			    session->stats.nr_events[0],
			    session->stats.nr_events[PERF_RECORD_LOST]);
	}

	if (session->stats.nr_unknown_events != 0) {
		ui__warning("Found %u unknown events!\n\n"
			    "Is this an older tool processing a perf.data "
			    "file generated by a more recent tool?\n\n"
			    "If that is not the case, consider "
			    "reporting to linux-kernel@vger.kernel.org.\n\n",
			    session->stats.nr_unknown_events);
	}

	if (session->stats.nr_unknown_id != 0) {
		ui__warning("%u samples with id not present in the header\n",
			    session->stats.nr_unknown_id);
	}

	if (session->stats.nr_invalid_chains != 0) {
		ui__warning("Found invalid callchains!\n\n"
			    "%u out of %u events were discarded for this reason.\n\n"
			    "Consider reporting to linux-kernel@vger.kernel.org.\n\n",
			    session->stats.nr_invalid_chains,
			    session->stats.nr_events[PERF_RECORD_SAMPLE]);
	}

	if (session->stats.nr_unprocessable_samples != 0) {
		ui__warning("%u unprocessable samples recorded.\n"
			    "Do you have a KVM guest running and not using 'perf kvm'?\n",
			    session->stats.nr_unprocessable_samples);
	}
}
volatile int session_done;

static int __perf_session__process_pipe_events(struct perf_session *self,
					       struct perf_tool *tool)
{
	union perf_event *event;
	uint32_t size, cur_size = 0;
	void *buf = NULL;
	int skip = 0;
	u64 head;
	int err;
	void *p;

	perf_tool__fill_defaults(tool);

	head = 0;
	cur_size = sizeof(union perf_event);

	buf = malloc(cur_size);
	if (!buf)
		return -errno;
more:
	event = buf;
	err = readn(self->fd, event, sizeof(struct perf_event_header));
	if (err <= 0) {
		if (err == 0)
			goto done;

		pr_err("failed to read event header\n");
		goto out_err;
	}

	if (self->header.needs_swap)
		perf_event_header__bswap(&event->header);

	size = event->header.size;
	if (size < sizeof(struct perf_event_header)) {
		pr_err("bad event header size\n");
		goto out_err;
	}

	if (size > cur_size) {
		void *new = realloc(buf, size);

		if (!new) {
			pr_err("failed to allocate memory to read event\n");
			goto out_err;
		}
		buf = new;
		cur_size = size;
		event = buf;
	}
	p = event;
	p += sizeof(struct perf_event_header);

	if (size - sizeof(struct perf_event_header)) {
		err = readn(self->fd, p, size - sizeof(struct perf_event_header));
		if (err <= 0) {
			if (err == 0) {
				pr_err("unexpected end of event stream\n");
				goto done;
			}

			pr_err("failed to read event data\n");
			goto out_err;
		}
	}

	if ((skip = perf_session__process_event(self, event, tool, head)) < 0) {
		pr_err("%#" PRIx64 " [%#x]: failed to process type: %d\n",
		       head, event->header.size, event->header.type);
		err = -EINVAL;
		goto out_err;
	}

	head += size;

	if (skip > 0)
		head += skip;

	if (!session_done())
		goto more;
done:
	/* do the final flush for ordered samples */
	self->ordered_samples.next_flush = ULLONG_MAX;
	err = flush_sample_queue(self, tool);
out_err:
	free(buf);
	perf_session__warn_about_errors(self, tool);
	perf_session_free_sample_buffers(self);
	return err;
}
static union perf_event *
fetch_mmaped_event(struct perf_session *session,
		   u64 head, size_t mmap_size, char *buf)
{
	union perf_event *event;

	/*
	 * Ensure we have enough space remaining to read
	 * the size of the event in the headers.
	 */
	if (head + sizeof(event->header) > mmap_size)
		return NULL;

	event = (union perf_event *)(buf + head);

	if (session->header.needs_swap)
		perf_event_header__bswap(&event->header);

	if (head + event->header.size > mmap_size) {
		/* We're not fetching the event so swap back again */
		if (session->header.needs_swap)
			perf_event_header__bswap(&event->header);
		return NULL;
	}

	return event;
}
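
/*
 * A NULL return means the next event straddles the end of this mapping;
 * the caller reacts by sliding the mmap window forward (see the remap
 * label below) and retrying from the new, page-aligned offset.
 */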
/*
 * On 64bit we can mmap the data file in one go. No need for tiny mmap
 * slices. On 32bit we use 32MB.
 */
#if BITS_PER_LONG == 64
#define MMAP_SIZE ULLONG_MAX
#define NUM_MMAPS 1
#else
#define MMAP_SIZE (32 * 1024 * 1024ULL)
#define NUM_MMAPS 128
#endif
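
/*
 * An MMAP_SIZE of ULLONG_MAX is safe because the mapping length is clamped
 * to the file size before use. Up to NUM_MMAPS old windows are kept mapped
 * and only unmapped lazily, presumably so events still queued for time
 * ordering keep pointing at valid memory.
 */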
int __perf_session__process_events(struct perf_session *session,
				   u64 data_offset, u64 data_size,
				   u64 file_size, struct perf_tool *tool)
{
	u64 head, page_offset, file_offset, file_pos, progress_next;
	int err, mmap_prot, mmap_flags, map_idx = 0;
	size_t mmap_size;
	char *buf, *mmaps[NUM_MMAPS];
	union perf_event *event;
	uint32_t size;

	perf_tool__fill_defaults(tool);

	page_offset = page_size * (data_offset / page_size);
	file_offset = page_offset;
	head = data_offset - page_offset;

	if (data_size && (data_offset + data_size < file_size))
		file_size = data_offset + data_size;

	progress_next = file_size / 16;

	mmap_size = MMAP_SIZE;
	if (mmap_size > file_size)
		mmap_size = file_size;

	memset(mmaps, 0, sizeof(mmaps));

	mmap_prot = PROT_READ;
	mmap_flags = MAP_SHARED;

	if (session->header.needs_swap) {
		mmap_prot |= PROT_WRITE;
		mmap_flags = MAP_PRIVATE;
	}
remap:
	buf = mmap(NULL, mmap_size, mmap_prot, mmap_flags, session->fd,
		   file_offset);
	if (buf == MAP_FAILED) {
		pr_err("failed to mmap file\n");
		err = -errno;
		goto out_err;
	}
	mmaps[map_idx] = buf;
	map_idx = (map_idx + 1) & (ARRAY_SIZE(mmaps) - 1);
	file_pos = file_offset + head;
more:
	event = fetch_mmaped_event(session, head, mmap_size, buf);
	if (!event) {
		if (mmaps[map_idx]) {
			munmap(mmaps[map_idx], mmap_size);
			mmaps[map_idx] = NULL;
		}

		page_offset = page_size * (head / page_size);
		file_offset += page_offset;
		head -= page_offset;
		goto remap;
	}

	size = event->header.size;

	if (size < sizeof(struct perf_event_header) ||
	    perf_session__process_event(session, event, tool, file_pos) < 0) {
		pr_err("%#" PRIx64 " [%#x]: failed to process type: %d\n",
		       file_offset + head, event->header.size,
		       event->header.type);
		err = -EINVAL;
		goto out_err;
	}

	head += size;
	file_pos += size;

	if (file_pos >= progress_next) {
		progress_next += file_size / 16;
		ui_progress__update(file_pos, file_size,
				    "Processing events...");
	}

	if (session_done())
		goto out;

	if (file_pos < file_size)
		goto more;
out:
	/* do the final flush for ordered samples */
	session->ordered_samples.next_flush = ULLONG_MAX;
	err = flush_sample_queue(session, tool);
out_err:
	ui_progress__finish();
	perf_session__warn_about_errors(session, tool);
	perf_session_free_sample_buffers(session);
	return err;
}
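
/*
 * The PROT_WRITE + MAP_PRIVATE combination above exists because byte
 * swapping is done in place inside the mapped buffer when the data file
 * comes from a machine of the opposite endianness; MAP_PRIVATE keeps those
 * writes from ever reaching the file itself.
 */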
int perf_session__process_events(struct perf_session *self,
				 struct perf_tool *tool)
{
	int err;

	if (perf_session__register_idle_thread(self) == NULL)
		return -ENOMEM;

	if (!self->fd_pipe)
		err = __perf_session__process_events(self,
						     self->header.data_offset,
						     self->header.data_size,
						     self->size, tool);
	else
		err = __perf_session__process_pipe_events(self, tool);

	return err;
}

bool perf_session__has_traces(struct perf_session *session, const char *msg)
{
	struct perf_evsel *evsel;

	list_for_each_entry(evsel, &session->evlist->entries, node) {
		if (evsel->attr.type == PERF_TYPE_TRACEPOINT)
			return true;
	}

	pr_err("No trace sample to read. Did you call 'perf %s'?\n", msg);
	return false;
}

int maps__set_kallsyms_ref_reloc_sym(struct map **maps,
				     const char *symbol_name, u64 addr)
{
	char *bracket;
	enum map_type i;
	struct ref_reloc_sym *ref;

	ref = zalloc(sizeof(struct ref_reloc_sym));
	if (ref == NULL)
		return -ENOMEM;

	ref->name = strdup(symbol_name);
	if (ref->name == NULL) {
		free(ref);
		return -ENOMEM;
	}

	bracket = strchr(ref->name, ']');
	if (bracket)
		*bracket = '\0';

	ref->addr = addr;

	for (i = 0; i < MAP__NR_TYPES; ++i) {
		struct kmap *kmap = map__kmap(maps[i]);
		kmap->ref_reloc_sym = ref;
	}

	return 0;
}
size_t perf_session__fprintf_dsos(struct perf_session *self, FILE *fp)
{
	return machines__fprintf_dsos(&self->machines, fp);
}

size_t perf_session__fprintf_dsos_buildid(struct perf_session *self, FILE *fp,
					  bool (skip)(struct dso *dso, int parm), int parm)
{
	return machines__fprintf_dsos_buildid(&self->machines, fp, skip, parm);
}

size_t perf_session__fprintf_nr_events(struct perf_session *session, FILE *fp)
{
	struct perf_evsel *pos;
	size_t ret = fprintf(fp, "Aggregated stats:\n");

	ret += events_stats__fprintf(&session->stats, fp);

	list_for_each_entry(pos, &session->evlist->entries, node) {
		ret += fprintf(fp, "%s stats:\n", perf_evsel__name(pos));
		ret += events_stats__fprintf(&pos->hists.stats, fp);
	}

	return ret;
}

size_t perf_session__fprintf(struct perf_session *session, FILE *fp)
{
	/*
	 * FIXME: Here we have to actually print all the machines in this
	 * session, not just the host...
	 */
	return machine__fprintf(&session->machines.host, fp);
}

struct perf_evsel *perf_session__find_first_evtype(struct perf_session *session,
						   unsigned int type)
{
	struct perf_evsel *pos;

	list_for_each_entry(pos, &session->evlist->entries, node) {
		if (pos->attr.type == type)
			return pos;
	}

	return NULL;
}
void perf_evsel__print_ip(struct perf_evsel *evsel, union perf_event *event,
			  struct perf_sample *sample, struct machine *machine,
			  unsigned int print_opts, unsigned int stack_depth)
{
	struct addr_location al;
	struct callchain_cursor_node *node;
	int print_ip = print_opts & PRINT_IP_OPT_IP;
	int print_sym = print_opts & PRINT_IP_OPT_SYM;
	int print_dso = print_opts & PRINT_IP_OPT_DSO;
	int print_symoffset = print_opts & PRINT_IP_OPT_SYMOFFSET;
	int print_oneline = print_opts & PRINT_IP_OPT_ONELINE;
	char s = print_oneline ? ' ' : '\t';

	if (perf_event__preprocess_sample(event, machine, &al, sample) < 0) {
		error("problem processing %d event, skipping it.\n",
		      event->header.type);
		return;
	}

	if (symbol_conf.use_callchain && sample->callchain) {

		if (machine__resolve_callchain(machine, evsel, al.thread,
					       sample, NULL, NULL) != 0) {
			if (verbose)
				error("Failed to resolve callchain. Skipping\n");
			return;
		}
		callchain_cursor_commit(&callchain_cursor);

		while (stack_depth) {
			node = callchain_cursor_current(&callchain_cursor);
			if (!node)
				break;

			if (print_ip)
				printf("%c%16" PRIx64, s, node->ip);

			if (print_sym) {
				printf(" ");
				if (print_symoffset) {
					al.addr = node->ip;
					al.map = node->map;
					symbol__fprintf_symname_offs(node->sym, &al, stdout);
				} else
					symbol__fprintf_symname(node->sym, stdout);
			}

			if (print_dso) {
				printf(" (");
				map__fprintf_dsoname(node->map, stdout);
				printf(")");
			}

			if (!print_oneline)
				printf("\n");

			callchain_cursor_advance(&callchain_cursor);

			stack_depth--;
		}

	} else {
		if (print_ip)
			printf("%16" PRIx64, sample->ip);

		if (print_sym) {
			printf(" ");
			if (print_symoffset)
				symbol__fprintf_symname_offs(al.sym, &al,
							     stdout);
			else
				symbol__fprintf_symname(al.sym, stdout);
		}

		if (print_dso) {
			printf(" (");
			map__fprintf_dsoname(al.map, stdout);
			printf(")");
		}
	}
}
int perf_session__cpu_bitmap(struct perf_session *session,
			     const char *cpu_list, unsigned long *cpu_bitmap)
{
	int i;
	struct cpu_map *map;

	for (i = 0; i < PERF_TYPE_MAX; ++i) {
		struct perf_evsel *evsel;

		evsel = perf_session__find_first_evtype(session, i);
		if (!evsel)
			continue;

		if (!(evsel->attr.sample_type & PERF_SAMPLE_CPU)) {
			pr_err("File does not contain CPU events. "
			       "Remove -c option to proceed.\n");
			return -1;
		}
	}

	map = cpu_map__new(cpu_list);
	if (map == NULL) {
		pr_err("Invalid cpu_list\n");
		return -1;
	}

	for (i = 0; i < map->nr; i++) {
		int cpu = map->map[i];

		if (cpu >= MAX_NR_CPUS) {
			pr_err("Requested CPU %d too large. "
			       "Consider raising MAX_NR_CPUS\n", cpu);
			return -1;
		}

		set_bit(cpu, cpu_bitmap);
	}

	return 0;
}

void perf_session__fprintf_info(struct perf_session *session, FILE *fp,
				bool full)
{
	struct stat st;
	int ret;

	if (session == NULL || fp == NULL)
		return;

	ret = fstat(session->fd, &st);
	if (ret == -1)
		return;

	fprintf(fp, "# ========\n");
	fprintf(fp, "# captured on: %s", ctime(&st.st_ctime));
	perf_header__fprintf_info(session, fp, full);
	fprintf(fp, "# ========\n#\n");
}

int __perf_session__set_tracepoints_handlers(struct perf_session *session,
					     const struct perf_evsel_str_handler *assocs,
					     size_t nr_assocs)
{
	struct perf_evsel *evsel;
	size_t i;
	int err;

	for (i = 0; i < nr_assocs; i++) {
		/*
		 * If we're adding a handler for an event not in the
		 * session, just ignore it.
		 */
		evsel = perf_evlist__find_tracepoint_by_name(session->evlist, assocs[i].name);
		if (evsel == NULL)
			continue;

		err = -EEXIST;
		if (evsel->handler.func != NULL)
			goto out;
		evsel->handler.func = assocs[i].handler;
	}

	err = 0;
out:
	return err;
}