perf_event_v7.c 32 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043104410451046104710481049105010511052105310541055105610571058105910601061106210631064106510661067106810691070107110721073107410751076107710781079108010811082108310841085108610871088108910901091109210931094109510961097109810991100110111021103110411051106110711081109111011111112111311141115111611171118111911201121112211231124112511261127112811291130113111321133113411351136113711381139114011411142114311441145114611471148114911501151115211531154115511561157115811591160116111621163116411651166116711681169117011711172117311741175117611771178117911801181118211831184118511861187
  1. /*
  2. * ARMv7 Cortex-A8 and Cortex-A9 Performance Events handling code.
  3. *
  4. * ARMv7 support: Jean Pihet <jpihet@mvista.com>
  5. * 2010 (c) MontaVista Software, LLC.
  6. *
  7. * Copied from ARMv6 code, with the low level code inspired
  8. * by the ARMv7 Oprofile code.
  9. *
  10. * Cortex-A8 has up to 4 configurable performance counters and
  11. * a single cycle counter.
  12. * Cortex-A9 has up to 31 configurable performance counters and
  13. * a single cycle counter.
  14. *
  15. * All counters can be enabled/disabled and IRQ masked separately. The cycle
  16. * counter and all 4 performance counters together can be reset separately.
  17. */
  18. #ifdef CONFIG_CPU_V7
  19. static struct arm_pmu armv7pmu;
  20. /*
  21. * Common ARMv7 event types
  22. *
  23. * Note: An implementation may not be able to count all of these events
  24. * but the encodings are considered to be `reserved' in the case that
  25. * they are not available.
  26. */
  27. enum armv7_perf_types {
  28. ARMV7_PERFCTR_PMNC_SW_INCR = 0x00,
  29. ARMV7_PERFCTR_L1_ICACHE_REFILL = 0x01,
  30. ARMV7_PERFCTR_ITLB_REFILL = 0x02,
  31. ARMV7_PERFCTR_L1_DCACHE_REFILL = 0x03,
  32. ARMV7_PERFCTR_L1_DCACHE_ACCESS = 0x04,
  33. ARMV7_PERFCTR_DTLB_REFILL = 0x05,
  34. ARMV7_PERFCTR_MEM_READ = 0x06,
  35. ARMV7_PERFCTR_MEM_WRITE = 0x07,
  36. ARMV7_PERFCTR_INSTR_EXECUTED = 0x08,
  37. ARMV7_PERFCTR_EXC_TAKEN = 0x09,
  38. ARMV7_PERFCTR_EXC_EXECUTED = 0x0A,
  39. ARMV7_PERFCTR_CID_WRITE = 0x0B,
  40. /*
  41. * ARMV7_PERFCTR_PC_WRITE is equivalent to HW_BRANCH_INSTRUCTIONS.
  42. * It counts:
  43. * - all (taken) branch instructions,
  44. * - instructions that explicitly write the PC,
  45. * - exception generating instructions.
  46. */
  47. ARMV7_PERFCTR_PC_WRITE = 0x0C,
  48. ARMV7_PERFCTR_PC_IMM_BRANCH = 0x0D,
  49. ARMV7_PERFCTR_PC_PROC_RETURN = 0x0E,
  50. ARMV7_PERFCTR_MEM_UNALIGNED_ACCESS = 0x0F,
  51. ARMV7_PERFCTR_PC_BRANCH_MIS_PRED = 0x10,
  52. ARMV7_PERFCTR_CLOCK_CYCLES = 0x11,
  53. ARMV7_PERFCTR_PC_BRANCH_PRED = 0x12,
  54. /* These events are defined by the PMUv2 supplement (ARM DDI 0457A). */
  55. ARMV7_PERFCTR_MEM_ACCESS = 0x13,
  56. ARMV7_PERFCTR_L1_ICACHE_ACCESS = 0x14,
  57. ARMV7_PERFCTR_L1_DCACHE_WB = 0x15,
  58. ARMV7_PERFCTR_L2_CACHE_ACCESS = 0x16,
  59. ARMV7_PERFCTR_L2_CACHE_REFILL = 0x17,
  60. ARMV7_PERFCTR_L2_CACHE_WB = 0x18,
  61. ARMV7_PERFCTR_BUS_ACCESS = 0x19,
  62. ARMV7_PERFCTR_MEM_ERROR = 0x1A,
  63. ARMV7_PERFCTR_INSTR_SPEC = 0x1B,
  64. ARMV7_PERFCTR_TTBR_WRITE = 0x1C,
  65. ARMV7_PERFCTR_BUS_CYCLES = 0x1D,
  66. ARMV7_PERFCTR_CPU_CYCLES = 0xFF
  67. };
  68. /* ARMv7 Cortex-A8 specific event types */
  69. enum armv7_a8_perf_types {
  70. ARMV7_A8_PERFCTR_L2_CACHE_ACCESS = 0x43,
  71. ARMV7_A8_PERFCTR_L2_CACHE_REFILL = 0x44,
  72. ARMV7_A8_PERFCTR_L1_ICACHE_ACCESS = 0x50,
  73. ARMV7_A8_PERFCTR_STALL_ISIDE = 0x56,
  74. };
  75. /* ARMv7 Cortex-A9 specific event types */
  76. enum armv7_a9_perf_types {
  77. ARMV7_A9_PERFCTR_INSTR_CORE_RENAME = 0x68,
  78. ARMV7_A9_PERFCTR_STALL_ICACHE = 0x60,
  79. ARMV7_A9_PERFCTR_STALL_DISPATCH = 0x66,
  80. };
  81. /* ARMv7 Cortex-A5 specific event types */
  82. enum armv7_a5_perf_types {
  83. ARMV7_A5_PERFCTR_PREFETCH_LINEFILL = 0xc2,
  84. ARMV7_A5_PERFCTR_PREFETCH_LINEFILL_DROP = 0xc3,
  85. };
  86. /* ARMv7 Cortex-A15 specific event types */
  87. enum armv7_a15_perf_types {
  88. ARMV7_A15_PERFCTR_L1_DCACHE_ACCESS_READ = 0x40,
  89. ARMV7_A15_PERFCTR_L1_DCACHE_ACCESS_WRITE = 0x41,
  90. ARMV7_A15_PERFCTR_L1_DCACHE_REFILL_READ = 0x42,
  91. ARMV7_A15_PERFCTR_L1_DCACHE_REFILL_WRITE = 0x43,
  92. ARMV7_A15_PERFCTR_DTLB_REFILL_L1_READ = 0x4C,
  93. ARMV7_A15_PERFCTR_DTLB_REFILL_L1_WRITE = 0x4D,
  94. ARMV7_A15_PERFCTR_L2_CACHE_ACCESS_READ = 0x50,
  95. ARMV7_A15_PERFCTR_L2_CACHE_ACCESS_WRITE = 0x51,
  96. ARMV7_A15_PERFCTR_L2_CACHE_REFILL_READ = 0x52,
  97. ARMV7_A15_PERFCTR_L2_CACHE_REFILL_WRITE = 0x53,
  98. ARMV7_A15_PERFCTR_PC_WRITE_SPEC = 0x76,
  99. };
  100. /*
  101. * Cortex-A8 HW events mapping
  102. *
  103. * The hardware events that we support. We do support cache operations but
  104. * we have harvard caches and no way to combine instruction and data
  105. * accesses/misses in hardware.
  106. */
  107. static const unsigned armv7_a8_perf_map[PERF_COUNT_HW_MAX] = {
  108. [PERF_COUNT_HW_CPU_CYCLES] = ARMV7_PERFCTR_CPU_CYCLES,
  109. [PERF_COUNT_HW_INSTRUCTIONS] = ARMV7_PERFCTR_INSTR_EXECUTED,
  110. [PERF_COUNT_HW_CACHE_REFERENCES] = ARMV7_PERFCTR_L1_DCACHE_ACCESS,
  111. [PERF_COUNT_HW_CACHE_MISSES] = ARMV7_PERFCTR_L1_DCACHE_REFILL,
  112. [PERF_COUNT_HW_BRANCH_INSTRUCTIONS] = ARMV7_PERFCTR_PC_WRITE,
  113. [PERF_COUNT_HW_BRANCH_MISSES] = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
  114. [PERF_COUNT_HW_BUS_CYCLES] = HW_OP_UNSUPPORTED,
  115. [PERF_COUNT_HW_STALLED_CYCLES_FRONTEND] = ARMV7_A8_PERFCTR_STALL_ISIDE,
  116. [PERF_COUNT_HW_STALLED_CYCLES_BACKEND] = HW_OP_UNSUPPORTED,
  117. };
  118. static const unsigned armv7_a8_perf_cache_map[PERF_COUNT_HW_CACHE_MAX]
  119. [PERF_COUNT_HW_CACHE_OP_MAX]
  120. [PERF_COUNT_HW_CACHE_RESULT_MAX] = {
  121. [C(L1D)] = {
  122. /*
  123. * The performance counters don't differentiate between read
  124. * and write accesses/misses so this isn't strictly correct,
  125. * but it's the best we can do. Writes and reads get
  126. * combined.
  127. */
  128. [C(OP_READ)] = {
  129. [C(RESULT_ACCESS)] = ARMV7_PERFCTR_L1_DCACHE_ACCESS,
  130. [C(RESULT_MISS)] = ARMV7_PERFCTR_L1_DCACHE_REFILL,
  131. },
  132. [C(OP_WRITE)] = {
  133. [C(RESULT_ACCESS)] = ARMV7_PERFCTR_L1_DCACHE_ACCESS,
  134. [C(RESULT_MISS)] = ARMV7_PERFCTR_L1_DCACHE_REFILL,
  135. },
  136. [C(OP_PREFETCH)] = {
  137. [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
  138. [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
  139. },
  140. },
  141. [C(L1I)] = {
  142. [C(OP_READ)] = {
  143. [C(RESULT_ACCESS)] = ARMV7_A8_PERFCTR_L1_ICACHE_ACCESS,
  144. [C(RESULT_MISS)] = ARMV7_PERFCTR_L1_ICACHE_REFILL,
  145. },
  146. [C(OP_WRITE)] = {
  147. [C(RESULT_ACCESS)] = ARMV7_A8_PERFCTR_L1_ICACHE_ACCESS,
  148. [C(RESULT_MISS)] = ARMV7_PERFCTR_L1_ICACHE_REFILL,
  149. },
  150. [C(OP_PREFETCH)] = {
  151. [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
  152. [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
  153. },
  154. },
  155. [C(LL)] = {
  156. [C(OP_READ)] = {
  157. [C(RESULT_ACCESS)] = ARMV7_A8_PERFCTR_L2_CACHE_ACCESS,
  158. [C(RESULT_MISS)] = ARMV7_A8_PERFCTR_L2_CACHE_REFILL,
  159. },
  160. [C(OP_WRITE)] = {
  161. [C(RESULT_ACCESS)] = ARMV7_A8_PERFCTR_L2_CACHE_ACCESS,
  162. [C(RESULT_MISS)] = ARMV7_A8_PERFCTR_L2_CACHE_REFILL,
  163. },
  164. [C(OP_PREFETCH)] = {
  165. [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
  166. [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
  167. },
  168. },
  169. [C(DTLB)] = {
  170. [C(OP_READ)] = {
  171. [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
  172. [C(RESULT_MISS)] = ARMV7_PERFCTR_DTLB_REFILL,
  173. },
  174. [C(OP_WRITE)] = {
  175. [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
  176. [C(RESULT_MISS)] = ARMV7_PERFCTR_DTLB_REFILL,
  177. },
  178. [C(OP_PREFETCH)] = {
  179. [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
  180. [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
  181. },
  182. },
  183. [C(ITLB)] = {
  184. [C(OP_READ)] = {
  185. [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
  186. [C(RESULT_MISS)] = ARMV7_PERFCTR_ITLB_REFILL,
  187. },
  188. [C(OP_WRITE)] = {
  189. [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
  190. [C(RESULT_MISS)] = ARMV7_PERFCTR_ITLB_REFILL,
  191. },
  192. [C(OP_PREFETCH)] = {
  193. [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
  194. [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
  195. },
  196. },
  197. [C(BPU)] = {
  198. [C(OP_READ)] = {
  199. [C(RESULT_ACCESS)] = ARMV7_PERFCTR_PC_BRANCH_PRED,
  200. [C(RESULT_MISS)] = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
  201. },
  202. [C(OP_WRITE)] = {
  203. [C(RESULT_ACCESS)] = ARMV7_PERFCTR_PC_BRANCH_PRED,
  204. [C(RESULT_MISS)] = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
  205. },
  206. [C(OP_PREFETCH)] = {
  207. [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
  208. [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
  209. },
  210. },
  211. [C(NODE)] = {
  212. [C(OP_READ)] = {
  213. [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
  214. [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
  215. },
  216. [C(OP_WRITE)] = {
  217. [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
  218. [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
  219. },
  220. [C(OP_PREFETCH)] = {
  221. [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
  222. [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
  223. },
  224. },
  225. };
  226. /*
  227. * Cortex-A9 HW events mapping
  228. */
  229. static const unsigned armv7_a9_perf_map[PERF_COUNT_HW_MAX] = {
  230. [PERF_COUNT_HW_CPU_CYCLES] = ARMV7_PERFCTR_CPU_CYCLES,
  231. [PERF_COUNT_HW_INSTRUCTIONS] = ARMV7_A9_PERFCTR_INSTR_CORE_RENAME,
  232. [PERF_COUNT_HW_CACHE_REFERENCES] = ARMV7_PERFCTR_L1_DCACHE_ACCESS,
  233. [PERF_COUNT_HW_CACHE_MISSES] = ARMV7_PERFCTR_L1_DCACHE_REFILL,
  234. [PERF_COUNT_HW_BRANCH_INSTRUCTIONS] = ARMV7_PERFCTR_PC_WRITE,
  235. [PERF_COUNT_HW_BRANCH_MISSES] = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
  236. [PERF_COUNT_HW_BUS_CYCLES] = HW_OP_UNSUPPORTED,
  237. [PERF_COUNT_HW_STALLED_CYCLES_FRONTEND] = ARMV7_A9_PERFCTR_STALL_ICACHE,
  238. [PERF_COUNT_HW_STALLED_CYCLES_BACKEND] = ARMV7_A9_PERFCTR_STALL_DISPATCH,
  239. };
  240. static const unsigned armv7_a9_perf_cache_map[PERF_COUNT_HW_CACHE_MAX]
  241. [PERF_COUNT_HW_CACHE_OP_MAX]
  242. [PERF_COUNT_HW_CACHE_RESULT_MAX] = {
  243. [C(L1D)] = {
  244. /*
  245. * The performance counters don't differentiate between read
  246. * and write accesses/misses so this isn't strictly correct,
  247. * but it's the best we can do. Writes and reads get
  248. * combined.
  249. */
  250. [C(OP_READ)] = {
  251. [C(RESULT_ACCESS)] = ARMV7_PERFCTR_L1_DCACHE_ACCESS,
  252. [C(RESULT_MISS)] = ARMV7_PERFCTR_L1_DCACHE_REFILL,
  253. },
  254. [C(OP_WRITE)] = {
  255. [C(RESULT_ACCESS)] = ARMV7_PERFCTR_L1_DCACHE_ACCESS,
  256. [C(RESULT_MISS)] = ARMV7_PERFCTR_L1_DCACHE_REFILL,
  257. },
  258. [C(OP_PREFETCH)] = {
  259. [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
  260. [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
  261. },
  262. },
  263. [C(L1I)] = {
  264. [C(OP_READ)] = {
  265. [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
  266. [C(RESULT_MISS)] = ARMV7_PERFCTR_L1_ICACHE_REFILL,
  267. },
  268. [C(OP_WRITE)] = {
  269. [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
  270. [C(RESULT_MISS)] = ARMV7_PERFCTR_L1_ICACHE_REFILL,
  271. },
  272. [C(OP_PREFETCH)] = {
  273. [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
  274. [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
  275. },
  276. },
  277. [C(LL)] = {
  278. [C(OP_READ)] = {
  279. [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
  280. [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
  281. },
  282. [C(OP_WRITE)] = {
  283. [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
  284. [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
  285. },
  286. [C(OP_PREFETCH)] = {
  287. [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
  288. [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
  289. },
  290. },
  291. [C(DTLB)] = {
  292. [C(OP_READ)] = {
  293. [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
  294. [C(RESULT_MISS)] = ARMV7_PERFCTR_DTLB_REFILL,
  295. },
  296. [C(OP_WRITE)] = {
  297. [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
  298. [C(RESULT_MISS)] = ARMV7_PERFCTR_DTLB_REFILL,
  299. },
  300. [C(OP_PREFETCH)] = {
  301. [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
  302. [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
  303. },
  304. },
  305. [C(ITLB)] = {
  306. [C(OP_READ)] = {
  307. [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
  308. [C(RESULT_MISS)] = ARMV7_PERFCTR_ITLB_REFILL,
  309. },
  310. [C(OP_WRITE)] = {
  311. [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
  312. [C(RESULT_MISS)] = ARMV7_PERFCTR_ITLB_REFILL,
  313. },
  314. [C(OP_PREFETCH)] = {
  315. [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
  316. [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
  317. },
  318. },
  319. [C(BPU)] = {
  320. [C(OP_READ)] = {
  321. [C(RESULT_ACCESS)] = ARMV7_PERFCTR_PC_BRANCH_PRED,
  322. [C(RESULT_MISS)] = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
  323. },
  324. [C(OP_WRITE)] = {
  325. [C(RESULT_ACCESS)] = ARMV7_PERFCTR_PC_BRANCH_PRED,
  326. [C(RESULT_MISS)] = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
  327. },
  328. [C(OP_PREFETCH)] = {
  329. [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
  330. [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
  331. },
  332. },
  333. [C(NODE)] = {
  334. [C(OP_READ)] = {
  335. [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
  336. [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
  337. },
  338. [C(OP_WRITE)] = {
  339. [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
  340. [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
  341. },
  342. [C(OP_PREFETCH)] = {
  343. [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
  344. [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
  345. },
  346. },
  347. };
  348. /*
  349. * Cortex-A5 HW events mapping
  350. */
  351. static const unsigned armv7_a5_perf_map[PERF_COUNT_HW_MAX] = {
  352. [PERF_COUNT_HW_CPU_CYCLES] = ARMV7_PERFCTR_CPU_CYCLES,
  353. [PERF_COUNT_HW_INSTRUCTIONS] = ARMV7_PERFCTR_INSTR_EXECUTED,
  354. [PERF_COUNT_HW_CACHE_REFERENCES] = ARMV7_PERFCTR_L1_DCACHE_ACCESS,
  355. [PERF_COUNT_HW_CACHE_MISSES] = ARMV7_PERFCTR_L1_DCACHE_REFILL,
  356. [PERF_COUNT_HW_BRANCH_INSTRUCTIONS] = ARMV7_PERFCTR_PC_WRITE,
  357. [PERF_COUNT_HW_BRANCH_MISSES] = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
  358. [PERF_COUNT_HW_BUS_CYCLES] = HW_OP_UNSUPPORTED,
  359. [PERF_COUNT_HW_STALLED_CYCLES_FRONTEND] = HW_OP_UNSUPPORTED,
  360. [PERF_COUNT_HW_STALLED_CYCLES_BACKEND] = HW_OP_UNSUPPORTED,
  361. };
  362. static const unsigned armv7_a5_perf_cache_map[PERF_COUNT_HW_CACHE_MAX]
  363. [PERF_COUNT_HW_CACHE_OP_MAX]
  364. [PERF_COUNT_HW_CACHE_RESULT_MAX] = {
  365. [C(L1D)] = {
  366. [C(OP_READ)] = {
  367. [C(RESULT_ACCESS)] = ARMV7_PERFCTR_L1_DCACHE_ACCESS,
  368. [C(RESULT_MISS)] = ARMV7_PERFCTR_L1_DCACHE_REFILL,
  369. },
  370. [C(OP_WRITE)] = {
  371. [C(RESULT_ACCESS)] = ARMV7_PERFCTR_L1_DCACHE_ACCESS,
  372. [C(RESULT_MISS)] = ARMV7_PERFCTR_L1_DCACHE_REFILL,
  373. },
  374. [C(OP_PREFETCH)] = {
  375. [C(RESULT_ACCESS)] = ARMV7_A5_PERFCTR_PREFETCH_LINEFILL,
  376. [C(RESULT_MISS)] = ARMV7_A5_PERFCTR_PREFETCH_LINEFILL_DROP,
  377. },
  378. },
  379. [C(L1I)] = {
  380. [C(OP_READ)] = {
  381. [C(RESULT_ACCESS)] = ARMV7_PERFCTR_L1_ICACHE_ACCESS,
  382. [C(RESULT_MISS)] = ARMV7_PERFCTR_L1_ICACHE_REFILL,
  383. },
  384. [C(OP_WRITE)] = {
  385. [C(RESULT_ACCESS)] = ARMV7_PERFCTR_L1_ICACHE_ACCESS,
  386. [C(RESULT_MISS)] = ARMV7_PERFCTR_L1_ICACHE_REFILL,
  387. },
  388. /*
  389. * The prefetch counters don't differentiate between the I
  390. * side and the D side.
  391. */
  392. [C(OP_PREFETCH)] = {
  393. [C(RESULT_ACCESS)] = ARMV7_A5_PERFCTR_PREFETCH_LINEFILL,
  394. [C(RESULT_MISS)] = ARMV7_A5_PERFCTR_PREFETCH_LINEFILL_DROP,
  395. },
  396. },
  397. [C(LL)] = {
  398. [C(OP_READ)] = {
  399. [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
  400. [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
  401. },
  402. [C(OP_WRITE)] = {
  403. [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
  404. [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
  405. },
  406. [C(OP_PREFETCH)] = {
  407. [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
  408. [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
  409. },
  410. },
  411. [C(DTLB)] = {
  412. [C(OP_READ)] = {
  413. [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
  414. [C(RESULT_MISS)] = ARMV7_PERFCTR_DTLB_REFILL,
  415. },
  416. [C(OP_WRITE)] = {
  417. [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
  418. [C(RESULT_MISS)] = ARMV7_PERFCTR_DTLB_REFILL,
  419. },
  420. [C(OP_PREFETCH)] = {
  421. [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
  422. [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
  423. },
  424. },
  425. [C(ITLB)] = {
  426. [C(OP_READ)] = {
  427. [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
  428. [C(RESULT_MISS)] = ARMV7_PERFCTR_ITLB_REFILL,
  429. },
  430. [C(OP_WRITE)] = {
  431. [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
  432. [C(RESULT_MISS)] = ARMV7_PERFCTR_ITLB_REFILL,
  433. },
  434. [C(OP_PREFETCH)] = {
  435. [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
  436. [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
  437. },
  438. },
  439. [C(BPU)] = {
  440. [C(OP_READ)] = {
  441. [C(RESULT_ACCESS)] = ARMV7_PERFCTR_PC_BRANCH_PRED,
  442. [C(RESULT_MISS)] = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
  443. },
  444. [C(OP_WRITE)] = {
  445. [C(RESULT_ACCESS)] = ARMV7_PERFCTR_PC_BRANCH_PRED,
  446. [C(RESULT_MISS)] = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
  447. },
  448. [C(OP_PREFETCH)] = {
  449. [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
  450. [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
  451. },
  452. },
  453. [C(NODE)] = {
  454. [C(OP_READ)] = {
  455. [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
  456. [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
  457. },
  458. [C(OP_WRITE)] = {
  459. [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
  460. [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
  461. },
  462. [C(OP_PREFETCH)] = {
  463. [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
  464. [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
  465. },
  466. },
  467. };
  468. /*
  469. * Cortex-A15 HW events mapping
  470. */
  471. static const unsigned armv7_a15_perf_map[PERF_COUNT_HW_MAX] = {
  472. [PERF_COUNT_HW_CPU_CYCLES] = ARMV7_PERFCTR_CPU_CYCLES,
  473. [PERF_COUNT_HW_INSTRUCTIONS] = ARMV7_PERFCTR_INSTR_EXECUTED,
  474. [PERF_COUNT_HW_CACHE_REFERENCES] = ARMV7_PERFCTR_L1_DCACHE_ACCESS,
  475. [PERF_COUNT_HW_CACHE_MISSES] = ARMV7_PERFCTR_L1_DCACHE_REFILL,
  476. [PERF_COUNT_HW_BRANCH_INSTRUCTIONS] = ARMV7_A15_PERFCTR_PC_WRITE_SPEC,
  477. [PERF_COUNT_HW_BRANCH_MISSES] = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
  478. [PERF_COUNT_HW_BUS_CYCLES] = ARMV7_PERFCTR_BUS_CYCLES,
  479. [PERF_COUNT_HW_STALLED_CYCLES_FRONTEND] = HW_OP_UNSUPPORTED,
  480. [PERF_COUNT_HW_STALLED_CYCLES_BACKEND] = HW_OP_UNSUPPORTED,
  481. };
  482. static const unsigned armv7_a15_perf_cache_map[PERF_COUNT_HW_CACHE_MAX]
  483. [PERF_COUNT_HW_CACHE_OP_MAX]
  484. [PERF_COUNT_HW_CACHE_RESULT_MAX] = {
  485. [C(L1D)] = {
  486. [C(OP_READ)] = {
  487. [C(RESULT_ACCESS)] = ARMV7_A15_PERFCTR_L1_DCACHE_ACCESS_READ,
  488. [C(RESULT_MISS)] = ARMV7_A15_PERFCTR_L1_DCACHE_REFILL_READ,
  489. },
  490. [C(OP_WRITE)] = {
  491. [C(RESULT_ACCESS)] = ARMV7_A15_PERFCTR_L1_DCACHE_ACCESS_WRITE,
  492. [C(RESULT_MISS)] = ARMV7_A15_PERFCTR_L1_DCACHE_REFILL_WRITE,
  493. },
  494. [C(OP_PREFETCH)] = {
  495. [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
  496. [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
  497. },
  498. },
  499. [C(L1I)] = {
  500. /*
  501. * Not all performance counters differentiate between read
  502. * and write accesses/misses so we're not always strictly
  503. * correct, but it's the best we can do. Writes and reads get
  504. * combined in these cases.
  505. */
  506. [C(OP_READ)] = {
  507. [C(RESULT_ACCESS)] = ARMV7_PERFCTR_L1_ICACHE_ACCESS,
  508. [C(RESULT_MISS)] = ARMV7_PERFCTR_L1_ICACHE_REFILL,
  509. },
  510. [C(OP_WRITE)] = {
  511. [C(RESULT_ACCESS)] = ARMV7_PERFCTR_L1_ICACHE_ACCESS,
  512. [C(RESULT_MISS)] = ARMV7_PERFCTR_L1_ICACHE_REFILL,
  513. },
  514. [C(OP_PREFETCH)] = {
  515. [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
  516. [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
  517. },
  518. },
  519. [C(LL)] = {
  520. [C(OP_READ)] = {
  521. [C(RESULT_ACCESS)] = ARMV7_A15_PERFCTR_L2_CACHE_ACCESS_READ,
  522. [C(RESULT_MISS)] = ARMV7_A15_PERFCTR_L2_CACHE_REFILL_READ,
  523. },
  524. [C(OP_WRITE)] = {
  525. [C(RESULT_ACCESS)] = ARMV7_A15_PERFCTR_L2_CACHE_ACCESS_WRITE,
  526. [C(RESULT_MISS)] = ARMV7_A15_PERFCTR_L2_CACHE_REFILL_WRITE,
  527. },
  528. [C(OP_PREFETCH)] = {
  529. [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
  530. [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
  531. },
  532. },
  533. [C(DTLB)] = {
  534. [C(OP_READ)] = {
  535. [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
  536. [C(RESULT_MISS)] = ARMV7_A15_PERFCTR_DTLB_REFILL_L1_READ,
  537. },
  538. [C(OP_WRITE)] = {
  539. [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
  540. [C(RESULT_MISS)] = ARMV7_A15_PERFCTR_DTLB_REFILL_L1_WRITE,
  541. },
  542. [C(OP_PREFETCH)] = {
  543. [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
  544. [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
  545. },
  546. },
  547. [C(ITLB)] = {
  548. [C(OP_READ)] = {
  549. [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
  550. [C(RESULT_MISS)] = ARMV7_PERFCTR_ITLB_REFILL,
  551. },
  552. [C(OP_WRITE)] = {
  553. [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
  554. [C(RESULT_MISS)] = ARMV7_PERFCTR_ITLB_REFILL,
  555. },
  556. [C(OP_PREFETCH)] = {
  557. [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
  558. [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
  559. },
  560. },
  561. [C(BPU)] = {
  562. [C(OP_READ)] = {
  563. [C(RESULT_ACCESS)] = ARMV7_PERFCTR_PC_BRANCH_PRED,
  564. [C(RESULT_MISS)] = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
  565. },
  566. [C(OP_WRITE)] = {
  567. [C(RESULT_ACCESS)] = ARMV7_PERFCTR_PC_BRANCH_PRED,
  568. [C(RESULT_MISS)] = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
  569. },
  570. [C(OP_PREFETCH)] = {
  571. [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
  572. [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
  573. },
  574. },
  575. [C(NODE)] = {
  576. [C(OP_READ)] = {
  577. [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
  578. [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
  579. },
  580. [C(OP_WRITE)] = {
  581. [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
  582. [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
  583. },
  584. [C(OP_PREFETCH)] = {
  585. [C(RESULT_ACCESS)] = CACHE_OP_UNSUPPORTED,
  586. [C(RESULT_MISS)] = CACHE_OP_UNSUPPORTED,
  587. },
  588. },
  589. };
  590. /*
  591. * Perf Events' indices
  592. */
  593. #define ARMV7_IDX_CYCLE_COUNTER 0
  594. #define ARMV7_IDX_COUNTER0 1
  595. #define ARMV7_IDX_COUNTER_LAST (ARMV7_IDX_CYCLE_COUNTER + cpu_pmu->num_events - 1)
  596. #define ARMV7_MAX_COUNTERS 32
  597. #define ARMV7_COUNTER_MASK (ARMV7_MAX_COUNTERS - 1)
  598. /*
  599. * ARMv7 low level PMNC access
  600. */
  601. /*
  602. * Perf Event to low level counters mapping
  603. */
  604. #define ARMV7_IDX_TO_COUNTER(x) \
  605. (((x) - ARMV7_IDX_COUNTER0) & ARMV7_COUNTER_MASK)
  606. /*
  607. * Per-CPU PMNC: config reg
  608. */
  609. #define ARMV7_PMNC_E (1 << 0) /* Enable all counters */
  610. #define ARMV7_PMNC_P (1 << 1) /* Reset all counters */
  611. #define ARMV7_PMNC_C (1 << 2) /* Cycle counter reset */
  612. #define ARMV7_PMNC_D (1 << 3) /* CCNT counts every 64th cpu cycle */
  613. #define ARMV7_PMNC_X (1 << 4) /* Export to ETM */
  614. #define ARMV7_PMNC_DP (1 << 5) /* Disable CCNT if non-invasive debug*/
  615. #define ARMV7_PMNC_N_SHIFT 11 /* Number of counters supported */
  616. #define ARMV7_PMNC_N_MASK 0x1f
  617. #define ARMV7_PMNC_MASK 0x3f /* Mask for writable bits */
  618. /*
  619. * FLAG: counters overflow flag status reg
  620. */
  621. #define ARMV7_FLAG_MASK 0xffffffff /* Mask for writable bits */
  622. #define ARMV7_OVERFLOWED_MASK ARMV7_FLAG_MASK
  623. /*
  624. * PMXEVTYPER: Event selection reg
  625. */
  626. #define ARMV7_EVTYPE_MASK 0xc00000ff /* Mask for writable bits */
  627. #define ARMV7_EVTYPE_EVENT 0xff /* Mask for EVENT bits */
  628. /*
  629. * Event filters for PMUv2
  630. */
  631. #define ARMV7_EXCLUDE_PL1 (1 << 31)
  632. #define ARMV7_EXCLUDE_USER (1 << 30)
  633. #define ARMV7_INCLUDE_HYP (1 << 27)
  634. static inline u32 armv7_pmnc_read(void)
  635. {
  636. u32 val;
  637. asm volatile("mrc p15, 0, %0, c9, c12, 0" : "=r"(val));
  638. return val;
  639. }
  640. static inline void armv7_pmnc_write(u32 val)
  641. {
  642. val &= ARMV7_PMNC_MASK;
  643. isb();
  644. asm volatile("mcr p15, 0, %0, c9, c12, 0" : : "r"(val));
  645. }
  646. static inline int armv7_pmnc_has_overflowed(u32 pmnc)
  647. {
  648. return pmnc & ARMV7_OVERFLOWED_MASK;
  649. }
  650. static inline int armv7_pmnc_counter_valid(int idx)
  651. {
  652. return idx >= ARMV7_IDX_CYCLE_COUNTER && idx <= ARMV7_IDX_COUNTER_LAST;
  653. }
  654. static inline int armv7_pmnc_counter_has_overflowed(u32 pmnc, int idx)
  655. {
  656. int ret = 0;
  657. u32 counter;
  658. if (!armv7_pmnc_counter_valid(idx)) {
  659. pr_err("CPU%u checking wrong counter %d overflow status\n",
  660. smp_processor_id(), idx);
  661. } else {
  662. counter = ARMV7_IDX_TO_COUNTER(idx);
  663. ret = pmnc & BIT(counter);
  664. }
  665. return ret;
  666. }
  667. static inline int armv7_pmnc_select_counter(int idx)
  668. {
  669. u32 counter;
  670. if (!armv7_pmnc_counter_valid(idx)) {
  671. pr_err("CPU%u selecting wrong PMNC counter %d\n",
  672. smp_processor_id(), idx);
  673. return -EINVAL;
  674. }
  675. counter = ARMV7_IDX_TO_COUNTER(idx);
  676. asm volatile("mcr p15, 0, %0, c9, c12, 5" : : "r" (counter));
  677. isb();
  678. return idx;
  679. }
  680. static inline u32 armv7pmu_read_counter(int idx)
  681. {
  682. u32 value = 0;
  683. if (!armv7_pmnc_counter_valid(idx))
  684. pr_err("CPU%u reading wrong counter %d\n",
  685. smp_processor_id(), idx);
  686. else if (idx == ARMV7_IDX_CYCLE_COUNTER)
  687. asm volatile("mrc p15, 0, %0, c9, c13, 0" : "=r" (value));
  688. else if (armv7_pmnc_select_counter(idx) == idx)
  689. asm volatile("mrc p15, 0, %0, c9, c13, 2" : "=r" (value));
  690. return value;
  691. }
  692. static inline void armv7pmu_write_counter(int idx, u32 value)
  693. {
  694. if (!armv7_pmnc_counter_valid(idx))
  695. pr_err("CPU%u writing wrong counter %d\n",
  696. smp_processor_id(), idx);
  697. else if (idx == ARMV7_IDX_CYCLE_COUNTER)
  698. asm volatile("mcr p15, 0, %0, c9, c13, 0" : : "r" (value));
  699. else if (armv7_pmnc_select_counter(idx) == idx)
  700. asm volatile("mcr p15, 0, %0, c9, c13, 2" : : "r" (value));
  701. }
  702. static inline void armv7_pmnc_write_evtsel(int idx, u32 val)
  703. {
  704. if (armv7_pmnc_select_counter(idx) == idx) {
  705. val &= ARMV7_EVTYPE_MASK;
  706. asm volatile("mcr p15, 0, %0, c9, c13, 1" : : "r" (val));
  707. }
  708. }
  709. static inline int armv7_pmnc_enable_counter(int idx)
  710. {
  711. u32 counter;
  712. if (!armv7_pmnc_counter_valid(idx)) {
  713. pr_err("CPU%u enabling wrong PMNC counter %d\n",
  714. smp_processor_id(), idx);
  715. return -EINVAL;
  716. }
  717. counter = ARMV7_IDX_TO_COUNTER(idx);
  718. asm volatile("mcr p15, 0, %0, c9, c12, 1" : : "r" (BIT(counter)));
  719. return idx;
  720. }
  721. static inline int armv7_pmnc_disable_counter(int idx)
  722. {
  723. u32 counter;
  724. if (!armv7_pmnc_counter_valid(idx)) {
  725. pr_err("CPU%u disabling wrong PMNC counter %d\n",
  726. smp_processor_id(), idx);
  727. return -EINVAL;
  728. }
  729. counter = ARMV7_IDX_TO_COUNTER(idx);
  730. asm volatile("mcr p15, 0, %0, c9, c12, 2" : : "r" (BIT(counter)));
  731. return idx;
  732. }
  733. static inline int armv7_pmnc_enable_intens(int idx)
  734. {
  735. u32 counter;
  736. if (!armv7_pmnc_counter_valid(idx)) {
  737. pr_err("CPU%u enabling wrong PMNC counter IRQ enable %d\n",
  738. smp_processor_id(), idx);
  739. return -EINVAL;
  740. }
  741. counter = ARMV7_IDX_TO_COUNTER(idx);
  742. asm volatile("mcr p15, 0, %0, c9, c14, 1" : : "r" (BIT(counter)));
  743. return idx;
  744. }
  745. static inline int armv7_pmnc_disable_intens(int idx)
  746. {
  747. u32 counter;
  748. if (!armv7_pmnc_counter_valid(idx)) {
  749. pr_err("CPU%u disabling wrong PMNC counter IRQ enable %d\n",
  750. smp_processor_id(), idx);
  751. return -EINVAL;
  752. }
  753. counter = ARMV7_IDX_TO_COUNTER(idx);
  754. asm volatile("mcr p15, 0, %0, c9, c14, 2" : : "r" (BIT(counter)));
  755. isb();
  756. /* Clear the overflow flag in case an interrupt is pending. */
  757. asm volatile("mcr p15, 0, %0, c9, c12, 3" : : "r" (BIT(counter)));
  758. isb();
  759. return idx;
  760. }
  761. static inline u32 armv7_pmnc_getreset_flags(void)
  762. {
  763. u32 val;
  764. /* Read */
  765. asm volatile("mrc p15, 0, %0, c9, c12, 3" : "=r" (val));
  766. /* Write to clear flags */
  767. val &= ARMV7_FLAG_MASK;
  768. asm volatile("mcr p15, 0, %0, c9, c12, 3" : : "r" (val));
  769. return val;
  770. }
  771. #ifdef DEBUG
  772. static void armv7_pmnc_dump_regs(void)
  773. {
  774. u32 val;
  775. unsigned int cnt;
  776. printk(KERN_INFO "PMNC registers dump:\n");
  777. asm volatile("mrc p15, 0, %0, c9, c12, 0" : "=r" (val));
  778. printk(KERN_INFO "PMNC =0x%08x\n", val);
  779. asm volatile("mrc p15, 0, %0, c9, c12, 1" : "=r" (val));
  780. printk(KERN_INFO "CNTENS=0x%08x\n", val);
  781. asm volatile("mrc p15, 0, %0, c9, c14, 1" : "=r" (val));
  782. printk(KERN_INFO "INTENS=0x%08x\n", val);
  783. asm volatile("mrc p15, 0, %0, c9, c12, 3" : "=r" (val));
  784. printk(KERN_INFO "FLAGS =0x%08x\n", val);
  785. asm volatile("mrc p15, 0, %0, c9, c12, 5" : "=r" (val));
  786. printk(KERN_INFO "SELECT=0x%08x\n", val);
  787. asm volatile("mrc p15, 0, %0, c9, c13, 0" : "=r" (val));
  788. printk(KERN_INFO "CCNT =0x%08x\n", val);
  789. for (cnt = ARMV7_IDX_COUNTER0; cnt <= ARMV7_IDX_COUNTER_LAST; cnt++) {
  790. armv7_pmnc_select_counter(cnt);
  791. asm volatile("mrc p15, 0, %0, c9, c13, 2" : "=r" (val));
  792. printk(KERN_INFO "CNT[%d] count =0x%08x\n",
  793. ARMV7_IDX_TO_COUNTER(cnt), val);
  794. asm volatile("mrc p15, 0, %0, c9, c13, 1" : "=r" (val));
  795. printk(KERN_INFO "CNT[%d] evtsel=0x%08x\n",
  796. ARMV7_IDX_TO_COUNTER(cnt), val);
  797. }
  798. }
  799. #endif
  800. static void armv7pmu_enable_event(struct hw_perf_event *hwc, int idx)
  801. {
  802. unsigned long flags;
  803. struct pmu_hw_events *events = cpu_pmu->get_hw_events();
  804. /*
  805. * Enable counter and interrupt, and set the counter to count
  806. * the event that we're interested in.
  807. */
  808. raw_spin_lock_irqsave(&events->pmu_lock, flags);
  809. /*
  810. * Disable counter
  811. */
  812. armv7_pmnc_disable_counter(idx);
  813. /*
  814. * Set event (if destined for PMNx counters)
  815. * We only need to set the event for the cycle counter if we
  816. * have the ability to perform event filtering.
  817. */
  818. if (armv7pmu.set_event_filter || idx != ARMV7_IDX_CYCLE_COUNTER)
  819. armv7_pmnc_write_evtsel(idx, hwc->config_base);
  820. /*
  821. * Enable interrupt for this counter
  822. */
  823. armv7_pmnc_enable_intens(idx);
  824. /*
  825. * Enable counter
  826. */
  827. armv7_pmnc_enable_counter(idx);
  828. raw_spin_unlock_irqrestore(&events->pmu_lock, flags);
  829. }
  830. static void armv7pmu_disable_event(struct hw_perf_event *hwc, int idx)
  831. {
  832. unsigned long flags;
  833. struct pmu_hw_events *events = cpu_pmu->get_hw_events();
  834. /*
  835. * Disable counter and interrupt
  836. */
  837. raw_spin_lock_irqsave(&events->pmu_lock, flags);
  838. /*
  839. * Disable counter
  840. */
  841. armv7_pmnc_disable_counter(idx);
  842. /*
  843. * Disable interrupt for this counter
  844. */
  845. armv7_pmnc_disable_intens(idx);
  846. raw_spin_unlock_irqrestore(&events->pmu_lock, flags);
  847. }
  848. static irqreturn_t armv7pmu_handle_irq(int irq_num, void *dev)
  849. {
  850. u32 pmnc;
  851. struct perf_sample_data data;
  852. struct pmu_hw_events *cpuc;
  853. struct pt_regs *regs;
  854. int idx;
  855. /*
  856. * Get and reset the IRQ flags
  857. */
  858. pmnc = armv7_pmnc_getreset_flags();
  859. /*
  860. * Did an overflow occur?
  861. */
  862. if (!armv7_pmnc_has_overflowed(pmnc))
  863. return IRQ_NONE;
  864. /*
  865. * Handle the counter(s) overflow(s)
  866. */
  867. regs = get_irq_regs();
  868. perf_sample_data_init(&data, 0);
  869. cpuc = &__get_cpu_var(cpu_hw_events);
  870. for (idx = 0; idx < cpu_pmu->num_events; ++idx) {
  871. struct perf_event *event = cpuc->events[idx];
  872. struct hw_perf_event *hwc;
  873. /* Ignore if we don't have an event. */
  874. if (!event)
  875. continue;
  876. /*
  877. * We have a single interrupt for all counters. Check that
  878. * each counter has overflowed before we process it.
  879. */
  880. if (!armv7_pmnc_counter_has_overflowed(pmnc, idx))
  881. continue;
  882. hwc = &event->hw;
  883. armpmu_event_update(event, hwc, idx);
  884. data.period = event->hw.last_period;
  885. if (!armpmu_event_set_period(event, hwc, idx))
  886. continue;
  887. if (perf_event_overflow(event, &data, regs))
  888. cpu_pmu->disable(hwc, idx);
  889. }
  890. /*
  891. * Handle the pending perf events.
  892. *
  893. * Note: this call *must* be run with interrupts disabled. For
  894. * platforms that can have the PMU interrupts raised as an NMI, this
  895. * will not work.
  896. */
  897. irq_work_run();
  898. return IRQ_HANDLED;
  899. }
  900. static void armv7pmu_start(void)
  901. {
  902. unsigned long flags;
  903. struct pmu_hw_events *events = cpu_pmu->get_hw_events();
  904. raw_spin_lock_irqsave(&events->pmu_lock, flags);
  905. /* Enable all counters */
  906. armv7_pmnc_write(armv7_pmnc_read() | ARMV7_PMNC_E);
  907. raw_spin_unlock_irqrestore(&events->pmu_lock, flags);
  908. }
  909. static void armv7pmu_stop(void)
  910. {
  911. unsigned long flags;
  912. struct pmu_hw_events *events = cpu_pmu->get_hw_events();
  913. raw_spin_lock_irqsave(&events->pmu_lock, flags);
  914. /* Disable all counters */
  915. armv7_pmnc_write(armv7_pmnc_read() & ~ARMV7_PMNC_E);
  916. raw_spin_unlock_irqrestore(&events->pmu_lock, flags);
  917. }
  918. static int armv7pmu_get_event_idx(struct pmu_hw_events *cpuc,
  919. struct hw_perf_event *event)
  920. {
  921. int idx;
  922. unsigned long evtype = event->config_base & ARMV7_EVTYPE_EVENT;
  923. /* Always place a cycle counter into the cycle counter. */
  924. if (evtype == ARMV7_PERFCTR_CPU_CYCLES) {
  925. if (test_and_set_bit(ARMV7_IDX_CYCLE_COUNTER, cpuc->used_mask))
  926. return -EAGAIN;
  927. return ARMV7_IDX_CYCLE_COUNTER;
  928. }
  929. /*
  930. * For anything other than a cycle counter, try and use
  931. * the events counters
  932. */
  933. for (idx = ARMV7_IDX_COUNTER0; idx < cpu_pmu->num_events; ++idx) {
  934. if (!test_and_set_bit(idx, cpuc->used_mask))
  935. return idx;
  936. }
  937. /* The counters are all in use. */
  938. return -EAGAIN;
  939. }
  940. /*
  941. * Add an event filter to a given event. This will only work for PMUv2 PMUs.
  942. */
  943. static int armv7pmu_set_event_filter(struct hw_perf_event *event,
  944. struct perf_event_attr *attr)
  945. {
  946. unsigned long config_base = 0;
  947. if (attr->exclude_idle)
  948. return -EPERM;
  949. if (attr->exclude_user)
  950. config_base |= ARMV7_EXCLUDE_USER;
  951. if (attr->exclude_kernel)
  952. config_base |= ARMV7_EXCLUDE_PL1;
  953. if (!attr->exclude_hv)
  954. config_base |= ARMV7_INCLUDE_HYP;
  955. /*
  956. * Install the filter into config_base as this is used to
  957. * construct the event type.
  958. */
  959. event->config_base = config_base;
  960. return 0;
  961. }
  962. static void armv7pmu_reset(void *info)
  963. {
  964. u32 idx, nb_cnt = cpu_pmu->num_events;
  965. /* The counter and interrupt enable registers are unknown at reset. */
  966. for (idx = ARMV7_IDX_CYCLE_COUNTER; idx < nb_cnt; ++idx)
  967. armv7pmu_disable_event(NULL, idx);
  968. /* Initialize & Reset PMNC: C and P bits */
  969. armv7_pmnc_write(ARMV7_PMNC_P | ARMV7_PMNC_C);
  970. }
  971. static int armv7_a8_map_event(struct perf_event *event)
  972. {
  973. return map_cpu_event(event, &armv7_a8_perf_map,
  974. &armv7_a8_perf_cache_map, 0xFF);
  975. }
  976. static int armv7_a9_map_event(struct perf_event *event)
  977. {
  978. return map_cpu_event(event, &armv7_a9_perf_map,
  979. &armv7_a9_perf_cache_map, 0xFF);
  980. }
  981. static int armv7_a5_map_event(struct perf_event *event)
  982. {
  983. return map_cpu_event(event, &armv7_a5_perf_map,
  984. &armv7_a5_perf_cache_map, 0xFF);
  985. }
  986. static int armv7_a15_map_event(struct perf_event *event)
  987. {
  988. return map_cpu_event(event, &armv7_a15_perf_map,
  989. &armv7_a15_perf_cache_map, 0xFF);
  990. }
  991. static struct arm_pmu armv7pmu = {
  992. .handle_irq = armv7pmu_handle_irq,
  993. .enable = armv7pmu_enable_event,
  994. .disable = armv7pmu_disable_event,
  995. .read_counter = armv7pmu_read_counter,
  996. .write_counter = armv7pmu_write_counter,
  997. .get_event_idx = armv7pmu_get_event_idx,
  998. .start = armv7pmu_start,
  999. .stop = armv7pmu_stop,
  1000. .reset = armv7pmu_reset,
  1001. .max_period = (1LLU << 32) - 1,
  1002. };
  1003. static u32 __init armv7_read_num_pmnc_events(void)
  1004. {
  1005. u32 nb_cnt;
  1006. /* Read the nb of CNTx counters supported from PMNC */
  1007. nb_cnt = (armv7_pmnc_read() >> ARMV7_PMNC_N_SHIFT) & ARMV7_PMNC_N_MASK;
  1008. /* Add the CPU cycles counter and return */
  1009. return nb_cnt + 1;
  1010. }
  1011. static struct arm_pmu *__init armv7_a8_pmu_init(void)
  1012. {
  1013. armv7pmu.id = ARM_PERF_PMU_ID_CA8;
  1014. armv7pmu.name = "ARMv7 Cortex-A8";
  1015. armv7pmu.map_event = armv7_a8_map_event;
  1016. armv7pmu.num_events = armv7_read_num_pmnc_events();
  1017. return &armv7pmu;
  1018. }
  1019. static struct arm_pmu *__init armv7_a9_pmu_init(void)
  1020. {
  1021. armv7pmu.id = ARM_PERF_PMU_ID_CA9;
  1022. armv7pmu.name = "ARMv7 Cortex-A9";
  1023. armv7pmu.map_event = armv7_a9_map_event;
  1024. armv7pmu.num_events = armv7_read_num_pmnc_events();
  1025. return &armv7pmu;
  1026. }
  1027. static struct arm_pmu *__init armv7_a5_pmu_init(void)
  1028. {
  1029. armv7pmu.id = ARM_PERF_PMU_ID_CA5;
  1030. armv7pmu.name = "ARMv7 Cortex-A5";
  1031. armv7pmu.map_event = armv7_a5_map_event;
  1032. armv7pmu.num_events = armv7_read_num_pmnc_events();
  1033. return &armv7pmu;
  1034. }
  1035. static struct arm_pmu *__init armv7_a15_pmu_init(void)
  1036. {
  1037. armv7pmu.id = ARM_PERF_PMU_ID_CA15;
  1038. armv7pmu.name = "ARMv7 Cortex-A15";
  1039. armv7pmu.map_event = armv7_a15_map_event;
  1040. armv7pmu.num_events = armv7_read_num_pmnc_events();
  1041. armv7pmu.set_event_filter = armv7pmu_set_event_filter;
  1042. return &armv7pmu;
  1043. }
  1044. #else
  1045. static struct arm_pmu *__init armv7_a8_pmu_init(void)
  1046. {
  1047. return NULL;
  1048. }
  1049. static struct arm_pmu *__init armv7_a9_pmu_init(void)
  1050. {
  1051. return NULL;
  1052. }
  1053. static struct arm_pmu *__init armv7_a5_pmu_init(void)
  1054. {
  1055. return NULL;
  1056. }
  1057. static struct arm_pmu *__init armv7_a15_pmu_init(void)
  1058. {
  1059. return NULL;
  1060. }
  1061. #endif /* CONFIG_CPU_V7 */