trace_irqsoff.c

/*
 * trace irqs off critical timings
 *
 * Copyright (C) 2007-2008 Steven Rostedt <srostedt@redhat.com>
 * Copyright (C) 2008 Ingo Molnar <mingo@redhat.com>
 *
 * From code in the latency_tracer, that is:
 *
 *  Copyright (C) 2004-2006 Ingo Molnar
 *  Copyright (C) 2004 William Lee Irwin III
 */
#include <linux/kallsyms.h>
#include <linux/debugfs.h>
#include <linux/uaccess.h>
#include <linux/module.h>
#include <linux/ftrace.h>
#include <linux/fs.h>

#include "trace.h"
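
/*
 * Usage note (added comment, not part of the original file): the tracers
 * registered below are normally driven through the ftrace debugfs
 * interface.  A typical session, assuming debugfs is mounted at
 * /sys/kernel/debug (older setups often used /debug) and that this
 * kernel exposes the usual control files:
 *
 *      echo irqsoff > /sys/kernel/debug/tracing/current_tracer
 *      cat /sys/kernel/debug/tracing/tracing_max_latency
 *      cat /sys/kernel/debug/tracing/latency_trace
 *
 * Exact file names and mount points depend on the surrounding ftrace
 * version and are assumptions here.
 */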

static struct trace_array *irqsoff_trace __read_mostly;
static int tracer_enabled __read_mostly;

static DEFINE_PER_CPU(int, tracing_cpu);

enum {
        TRACER_IRQS_OFF         = (1 << 1),
        TRACER_PREEMPT_OFF      = (1 << 2),
};

static int trace_type __read_mostly;

#ifdef CONFIG_PREEMPT_TRACER
static inline int notrace
preempt_trace(void)
{
        return ((trace_type & TRACER_PREEMPT_OFF) && preempt_count());
}
#else
# define preempt_trace() (0)
#endif

#ifdef CONFIG_IRQSOFF_TRACER
static inline int notrace
irq_trace(void)
{
        return ((trace_type & TRACER_IRQS_OFF) &&
                irqs_disabled());
}
#else
# define irq_trace() (0)
#endif

/*
 * Sequence count - we record it when starting a measurement and
 * skip the latency if the sequence has changed - some other section
 * did a maximum and could disturb our measurement with serial console
 * printouts, etc. Truly coinciding maximum latencies should be rare
 * and what happens together happens separately as well, so this doesn't
 * decrease the validity of the maximum found:
 */
static __cacheline_aligned_in_smp unsigned long max_sequence;
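
/*
 * Overview (added comment): irqsoff_tracer_call() below is the function
 * tracer callback; trace_ops is registered with register_ftrace_function()
 * from start_irqsoff_tracer(), so the callback runs on (almost) every
 * traced function entry.  It only records entries while the current CPU
 * is inside a measured critical section (its per-cpu tracing_cpu flag is
 * set) and interrupts really are disabled.
 */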

#ifdef CONFIG_FTRACE
/*
 * irqsoff uses its own tracer function to keep the overhead down:
 */
static void notrace
irqsoff_tracer_call(unsigned long ip, unsigned long parent_ip)
{
        struct trace_array *tr = irqsoff_trace;
        struct trace_array_cpu *data;
        unsigned long flags;
        long disabled;
        int cpu;

        /*
         * Does not matter if we preempt. We test the flags
         * afterward, to see if irqs are disabled or not.
         * If we preempt and get a false positive, the flags
         * test will fail.
         */
        cpu = raw_smp_processor_id();
        if (likely(!per_cpu(tracing_cpu, cpu)))
                return;

        local_save_flags(flags);
        /* slight chance to get a false positive on tracing_cpu */
        if (!irqs_disabled_flags(flags))
                return;

        data = tr->data[cpu];
        disabled = atomic_inc_return(&data->disabled);

        if (likely(disabled == 1))
                ftrace(tr, data, ip, parent_ip, flags);

        atomic_dec(&data->disabled);
}

static struct ftrace_ops trace_ops __read_mostly =
{
        .func = irqsoff_tracer_call,
};
#endif /* CONFIG_FTRACE */

/*
 * Should this new latency be reported/recorded?
 */
static int notrace report_latency(cycle_t delta)
{
        if (tracing_thresh) {
                if (delta < tracing_thresh)
                        return 0;
        } else {
                if (delta <= tracing_max_latency)
                        return 0;
        }
        return 1;
}
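
/*
 * check_critical_timing() (added comment): computes how long the current
 * critical section has lasted (now(cpu) - data->preempt_timestamp), asks
 * report_latency() whether it qualifies, and verifies that max_sequence
 * has not moved underneath us (i.e. no other section recorded a maximum
 * in the meantime).  If the section is a new maximum it updates
 * tracing_max_latency, saves the trace with update_max_tr_single() and
 * prints a summary plus a stack dump; either way the per-cpu data is
 * re-armed for the next measurement at the "out" label.
 */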

static void notrace
check_critical_timing(struct trace_array *tr,
                      struct trace_array_cpu *data,
                      unsigned long parent_ip,
                      int cpu)
{
        unsigned long latency, t0, t1;
        cycle_t T0, T1, T2, delta;
        unsigned long flags;

        /*
         * usecs conversion is slow so we try to delay the conversion
         * as long as possible:
         */
        T0 = data->preempt_timestamp;
        T1 = now(cpu);
        delta = T1 - T0;

        local_save_flags(flags);

        if (!report_latency(delta))
                goto out;

        ftrace(tr, data, CALLER_ADDR0, parent_ip, flags);
        /*
         * Update the timestamp, because the trace entry above
         * might change it (it can only get larger so the latency
         * is fair to be reported):
         */
        T2 = now(cpu);

        delta = T2 - T0;

        latency = nsecs_to_usecs(delta);

        if (data->critical_sequence != max_sequence)
                goto out;

        tracing_max_latency = delta;
        t0 = nsecs_to_usecs(T0);
        t1 = nsecs_to_usecs(T1);

        data->critical_end = parent_ip;

        update_max_tr_single(tr, current, cpu);

        if (tracing_thresh)
                printk(KERN_INFO "(%16s-%-5d|#%d): %lu us critical section "
                       "violates %lu us threshold.\n"
                       " => started at timestamp %lu: ",
                       current->comm, current->pid,
                       raw_smp_processor_id(),
                       latency, nsecs_to_usecs(tracing_thresh), t0);
        else
                printk(KERN_INFO "(%16s-%-5d|#%d):"
                       " new %lu us maximum-latency "
                       "critical section.\n => started at timestamp %lu: ",
                       current->comm, current->pid,
                       raw_smp_processor_id(),
                       latency, t0);

        print_symbol(KERN_CONT "<%s>\n", data->critical_start);
        printk(KERN_CONT " => ended at timestamp %lu: ", t1);
        print_symbol(KERN_CONT "<%s>\n", data->critical_end);
        dump_stack();
        t1 = nsecs_to_usecs(now(cpu));
        printk(KERN_CONT " => dump-end timestamp %lu\n\n", t1);

        max_sequence++;

out:
        data->critical_sequence = max_sequence;
        data->preempt_timestamp = now(cpu);
        tracing_reset(data);
        ftrace(tr, data, CALLER_ADDR0, parent_ip, flags);
}
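
/*
 * start_critical_timing() (added comment): called when interrupts and/or
 * preemption get disabled.  If the tracer is enabled and this CPU is not
 * already inside a measured section, it records the current sequence
 * number, timestamp and start address, resets the per-cpu buffer, logs
 * the opening entry and sets tracing_cpu so that the function tracer
 * callback starts recording on this CPU.
 */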

static inline void notrace
start_critical_timing(unsigned long ip, unsigned long parent_ip)
{
        int cpu;
        struct trace_array *tr = irqsoff_trace;
        struct trace_array_cpu *data;
        unsigned long flags;

        if (likely(!tracer_enabled))
                return;

        if (__get_cpu_var(tracing_cpu))
                return;

        cpu = raw_smp_processor_id();
        data = tr->data[cpu];

        if (unlikely(!data) || unlikely(!data->trace) ||
            atomic_read(&data->disabled))
                return;

        atomic_inc(&data->disabled);

        data->critical_sequence = max_sequence;
        data->preempt_timestamp = now(cpu);
        data->critical_start = parent_ip ? : ip;
        tracing_reset(data);

        local_save_flags(flags);
        ftrace(tr, data, ip, parent_ip, flags);

        __get_cpu_var(tracing_cpu) = 1;

        atomic_dec(&data->disabled);
}
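
/*
 * stop_critical_timing() (added comment): the mirror of the above.  It
 * clears tracing_cpu first so the function tracer callback stops
 * recording, then logs the closing entry and lets check_critical_timing()
 * decide whether this section is worth reporting.
 */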

static inline void notrace
stop_critical_timing(unsigned long ip, unsigned long parent_ip)
{
        int cpu;
        struct trace_array *tr = irqsoff_trace;
        struct trace_array_cpu *data;
        unsigned long flags;

        /* Always clear the tracing cpu on stopping the trace */
        if (unlikely(__get_cpu_var(tracing_cpu)))
                __get_cpu_var(tracing_cpu) = 0;
        else
                return;

        if (!tracer_enabled)
                return;

        cpu = raw_smp_processor_id();
        data = tr->data[cpu];

        if (unlikely(!data) || unlikely(!data->trace) ||
            !data->critical_start || atomic_read(&data->disabled))
                return;

        atomic_inc(&data->disabled);
        local_save_flags(flags);
        ftrace(tr, data, ip, parent_ip, flags);
        check_critical_timing(tr, data, parent_ip ? : ip, cpu);
        data->critical_start = 0;
        atomic_dec(&data->disabled);
}

/* start and stop critical timings - used to stop the measurement across sections such as idle */
void notrace start_critical_timings(void)
{
        if (preempt_trace() || irq_trace())
                start_critical_timing(CALLER_ADDR0, CALLER_ADDR1);
}

void notrace stop_critical_timings(void)
{
        if (preempt_trace() || irq_trace())
                stop_critical_timing(CALLER_ADDR0, CALLER_ADDR1);
}
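
/*
 * Hook wiring (added comment): with CONFIG_PROVE_LOCKING, lockdep owns
 * trace_hardirqs_on()/trace_hardirqs_off() and calls back into
 * time_hardirqs_on()/time_hardirqs_off() below.  Without it, this file
 * provides trace_hardirqs_*() itself, together with empty stubs for the
 * other irq-tracing hooks that lockdep would normally supply.
 */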

#ifdef CONFIG_IRQSOFF_TRACER
#ifdef CONFIG_PROVE_LOCKING
void notrace time_hardirqs_on(unsigned long a0, unsigned long a1)
{
        if (!preempt_trace() && irq_trace())
                stop_critical_timing(a0, a1);
}

void notrace time_hardirqs_off(unsigned long a0, unsigned long a1)
{
        if (!preempt_trace() && irq_trace())
                start_critical_timing(a0, a1);
}

#else /* !CONFIG_PROVE_LOCKING */

/*
 * Stubs:
 */

void early_boot_irqs_off(void)
{
}

void early_boot_irqs_on(void)
{
}

void trace_softirqs_on(unsigned long ip)
{
}

void trace_softirqs_off(unsigned long ip)
{
}

inline void print_irqtrace_events(struct task_struct *curr)
{
}

/*
 * We are only interested in hardirq on/off events:
 */
void notrace trace_hardirqs_on(void)
{
        if (!preempt_trace() && irq_trace())
                stop_critical_timing(CALLER_ADDR0, CALLER_ADDR1);
}
EXPORT_SYMBOL(trace_hardirqs_on);

void notrace trace_hardirqs_off(void)
{
        if (!preempt_trace() && irq_trace())
                start_critical_timing(CALLER_ADDR0, CALLER_ADDR1);
}
EXPORT_SYMBOL(trace_hardirqs_off);

void notrace trace_hardirqs_on_caller(unsigned long caller_addr)
{
        if (!preempt_trace() && irq_trace())
                stop_critical_timing(CALLER_ADDR0, caller_addr);
}
EXPORT_SYMBOL(trace_hardirqs_on_caller);

void notrace trace_hardirqs_off_caller(unsigned long caller_addr)
{
        if (!preempt_trace() && irq_trace())
                start_critical_timing(CALLER_ADDR0, caller_addr);
}
EXPORT_SYMBOL(trace_hardirqs_off_caller);

#endif /* CONFIG_PROVE_LOCKING */
#endif /* CONFIG_IRQSOFF_TRACER */

#ifdef CONFIG_PREEMPT_TRACER
void notrace trace_preempt_on(unsigned long a0, unsigned long a1)
{
        stop_critical_timing(a0, a1);
}

void notrace trace_preempt_off(unsigned long a0, unsigned long a1)
{
        start_critical_timing(a0, a1);
}
#endif /* CONFIG_PREEMPT_TRACER */
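
/*
 * Tracer plumbing (added comment): start_irqsoff_tracer() flips
 * tracer_enabled and registers the function tracer callback;
 * stop_irqsoff_tracer() does the reverse.  The open/close callbacks stop
 * the tracer while a trace is being dumped so the buffer is not
 * overwritten mid-read.
 */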

static void start_irqsoff_tracer(struct trace_array *tr)
{
        tracer_enabled = 1;
        register_ftrace_function(&trace_ops);
}

static void stop_irqsoff_tracer(struct trace_array *tr)
{
        unregister_ftrace_function(&trace_ops);
        tracer_enabled = 0;
}

static void __irqsoff_tracer_init(struct trace_array *tr)
{
        irqsoff_trace = tr;
        /* make sure that the tracer is visible */
        smp_wmb();

        if (tr->ctrl)
                start_irqsoff_tracer(tr);
}

static void irqsoff_tracer_reset(struct trace_array *tr)
{
        if (tr->ctrl)
                stop_irqsoff_tracer(tr);
}

static void irqsoff_tracer_ctrl_update(struct trace_array *tr)
{
        if (tr->ctrl)
                start_irqsoff_tracer(tr);
        else
                stop_irqsoff_tracer(tr);
}

static void notrace irqsoff_tracer_open(struct trace_iterator *iter)
{
        /* stop the trace while dumping */
        if (iter->tr->ctrl)
                stop_irqsoff_tracer(iter->tr);
}

static void notrace irqsoff_tracer_close(struct trace_iterator *iter)
{
        if (iter->tr->ctrl)
                start_irqsoff_tracer(iter->tr);
}

#ifdef CONFIG_IRQSOFF_TRACER
static void irqsoff_tracer_init(struct trace_array *tr)
{
        trace_type = TRACER_IRQS_OFF;

        __irqsoff_tracer_init(tr);
}
static struct tracer irqsoff_tracer __read_mostly =
{
        .name           = "irqsoff",
        .init           = irqsoff_tracer_init,
        .reset          = irqsoff_tracer_reset,
        .open           = irqsoff_tracer_open,
        .close          = irqsoff_tracer_close,
        .ctrl_update    = irqsoff_tracer_ctrl_update,
        .print_max      = 1,
};
# define register_irqsoff(trace) register_tracer(&trace)
#else
# define register_irqsoff(trace) do { } while (0)
#endif

#ifdef CONFIG_PREEMPT_TRACER
static void preemptoff_tracer_init(struct trace_array *tr)
{
        trace_type = TRACER_PREEMPT_OFF;

        __irqsoff_tracer_init(tr);
}
static struct tracer preemptoff_tracer __read_mostly =
{
        .name           = "preemptoff",
        .init           = preemptoff_tracer_init,
        .reset          = irqsoff_tracer_reset,
        .open           = irqsoff_tracer_open,
        .close          = irqsoff_tracer_close,
        .ctrl_update    = irqsoff_tracer_ctrl_update,
        .print_max      = 1,
};
# define register_preemptoff(trace) register_tracer(&trace)
#else
# define register_preemptoff(trace) do { } while (0)
#endif

#if defined(CONFIG_IRQSOFF_TRACER) && \
        defined(CONFIG_PREEMPT_TRACER)

static void preemptirqsoff_tracer_init(struct trace_array *tr)
{
        trace_type = TRACER_IRQS_OFF | TRACER_PREEMPT_OFF;

        __irqsoff_tracer_init(tr);
}

static struct tracer preemptirqsoff_tracer __read_mostly =
{
        .name           = "preemptirqsoff",
        .init           = preemptirqsoff_tracer_init,
        .reset          = irqsoff_tracer_reset,
        .open           = irqsoff_tracer_open,
        .close          = irqsoff_tracer_close,
        .ctrl_update    = irqsoff_tracer_ctrl_update,
        .print_max      = 1,
};

# define register_preemptirqsoff(trace) register_tracer(&trace)
#else
# define register_preemptirqsoff(trace) do { } while (0)
#endif
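
/*
 * Registration (added comment): each register_* macro above expands to
 * register_tracer() only when the matching config option is set, so
 * init_irqsoff_tracer() registers just the tracers that are built into
 * this kernel (irqsoff, preemptoff and/or preemptirqsoff).
 */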

__init static int init_irqsoff_tracer(void)
{
        register_irqsoff(irqsoff_tracer);
        register_preemptoff(preemptoff_tracer);
        register_preemptirqsoff(preemptirqsoff_tracer);

        return 0;
}
device_initcall(init_irqsoff_tracer);