c-r4k.c 32 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043104410451046104710481049105010511052105310541055105610571058105910601061106210631064106510661067106810691070107110721073107410751076107710781079108010811082108310841085108610871088108910901091109210931094109510961097109810991100110111021103110411051106110711081109111011111112111311141115111611171118111911201121112211231124112511261127112811291130113111321133113411351136113711381139114011411142114311441145114611471148114911501151115211531154115511561157115811591160116111621163116411651166116711681169117011711172117311741175117611771178117911801181118211831184118511861187118811891190119111921193119411951196119711981199120012011202120312041205120612071208120912101211121212131214
  1. /*
  2. * This file is subject to the terms and conditions of the GNU General Public
  3. * License. See the file "COPYING" in the main directory of this archive
  4. * for more details.
  5. *
  6. * Copyright (C) 1996 David S. Miller (dm@engr.sgi.com)
  7. * Copyright (C) 1997, 1998, 1999, 2000, 2001, 2002 Ralf Baechle (ralf@gnu.org)
  8. * Copyright (C) 1999, 2000 Silicon Graphics, Inc.
  9. */
  10. #include <linux/config.h>
  11. #include <linux/init.h>
  12. #include <linux/kernel.h>
  13. #include <linux/sched.h>
  14. #include <linux/mm.h>
  15. #include <linux/bitops.h>
  16. #include <asm/bcache.h>
  17. #include <asm/bootinfo.h>
  18. #include <asm/cache.h>
  19. #include <asm/cacheops.h>
  20. #include <asm/cpu.h>
  21. #include <asm/cpu-features.h>
  22. #include <asm/io.h>
  23. #include <asm/page.h>
  24. #include <asm/pgtable.h>
  25. #include <asm/r4kcache.h>
  26. #include <asm/system.h>
  27. #include <asm/mmu_context.h>
  28. #include <asm/war.h>
  29. #include <asm/cacheflush.h> /* for run_uncached() */
  30. /*
  31. * Must die.
  32. */
  33. static unsigned long icache_size __read_mostly;
  34. static unsigned long dcache_size __read_mostly;
  35. static unsigned long scache_size __read_mostly;
  36. /*
  37. * Dummy cache handling routines for machines without boardcaches
  38. */
  39. static void no_sc_noop(void) {}
  40. static struct bcache_ops no_sc_ops = {
  41. .bc_enable = (void *)no_sc_noop,
  42. .bc_disable = (void *)no_sc_noop,
  43. .bc_wback_inv = (void *)no_sc_noop,
  44. .bc_inv = (void *)no_sc_noop
  45. };
  46. struct bcache_ops *bcops = &no_sc_ops;
  47. #define cpu_is_r4600_v1_x() ((read_c0_prid() & 0xfffffff0) == 0x00002010)
  48. #define cpu_is_r4600_v2_x() ((read_c0_prid() & 0xfffffff0) == 0x00002020)
  49. #define R4600_HIT_CACHEOP_WAR_IMPL \
  50. do { \
  51. if (R4600_V2_HIT_CACHEOP_WAR && cpu_is_r4600_v2_x()) \
  52. *(volatile unsigned long *)CKSEG1; \
  53. if (R4600_V1_HIT_CACHEOP_WAR) \
  54. __asm__ __volatile__("nop;nop;nop;nop"); \
  55. } while (0)
  56. static void (*r4k_blast_dcache_page)(unsigned long addr);
  57. static inline void r4k_blast_dcache_page_dc32(unsigned long addr)
  58. {
  59. R4600_HIT_CACHEOP_WAR_IMPL;
  60. blast_dcache32_page(addr);
  61. }
  62. static inline void r4k_blast_dcache_page_setup(void)
  63. {
  64. unsigned long dc_lsize = cpu_dcache_line_size();
  65. if (dc_lsize == 16)
  66. r4k_blast_dcache_page = blast_dcache16_page;
  67. else if (dc_lsize == 32)
  68. r4k_blast_dcache_page = r4k_blast_dcache_page_dc32;
  69. }
  70. static void (* r4k_blast_dcache_page_indexed)(unsigned long addr);
  71. static inline void r4k_blast_dcache_page_indexed_setup(void)
  72. {
  73. unsigned long dc_lsize = cpu_dcache_line_size();
  74. if (dc_lsize == 16)
  75. r4k_blast_dcache_page_indexed = blast_dcache16_page_indexed;
  76. else if (dc_lsize == 32)
  77. r4k_blast_dcache_page_indexed = blast_dcache32_page_indexed;
  78. }
  79. static void (* r4k_blast_dcache)(void);
  80. static inline void r4k_blast_dcache_setup(void)
  81. {
  82. unsigned long dc_lsize = cpu_dcache_line_size();
  83. if (dc_lsize == 16)
  84. r4k_blast_dcache = blast_dcache16;
  85. else if (dc_lsize == 32)
  86. r4k_blast_dcache = blast_dcache32;
  87. }
  88. /* force code alignment (used for TX49XX_ICACHE_INDEX_INV_WAR) */
  89. #define JUMP_TO_ALIGN(order) \
  90. __asm__ __volatile__( \
  91. "b\t1f\n\t" \
  92. ".align\t" #order "\n\t" \
  93. "1:\n\t" \
  94. )
  95. #define CACHE32_UNROLL32_ALIGN JUMP_TO_ALIGN(10) /* 32 * 32 = 1024 */
  96. #define CACHE32_UNROLL32_ALIGN2 JUMP_TO_ALIGN(11)
  97. static inline void blast_r4600_v1_icache32(void)
  98. {
  99. unsigned long flags;
  100. local_irq_save(flags);
  101. blast_icache32();
  102. local_irq_restore(flags);
  103. }
  104. static inline void tx49_blast_icache32(void)
  105. {
  106. unsigned long start = INDEX_BASE;
  107. unsigned long end = start + current_cpu_data.icache.waysize;
  108. unsigned long ws_inc = 1UL << current_cpu_data.icache.waybit;
  109. unsigned long ws_end = current_cpu_data.icache.ways <<
  110. current_cpu_data.icache.waybit;
  111. unsigned long ws, addr;
  112. CACHE32_UNROLL32_ALIGN2;
  113. /* I'm in even chunk. blast odd chunks */
  114. for (ws = 0; ws < ws_end; ws += ws_inc)
  115. for (addr = start + 0x400; addr < end; addr += 0x400 * 2)
  116. cache32_unroll32(addr|ws,Index_Invalidate_I);
  117. CACHE32_UNROLL32_ALIGN;
  118. /* I'm in odd chunk. blast even chunks */
  119. for (ws = 0; ws < ws_end; ws += ws_inc)
  120. for (addr = start; addr < end; addr += 0x400 * 2)
  121. cache32_unroll32(addr|ws,Index_Invalidate_I);
  122. }
  123. static inline void blast_icache32_r4600_v1_page_indexed(unsigned long page)
  124. {
  125. unsigned long flags;
  126. local_irq_save(flags);
  127. blast_icache32_page_indexed(page);
  128. local_irq_restore(flags);
  129. }
  130. static inline void tx49_blast_icache32_page_indexed(unsigned long page)
  131. {
  132. unsigned long start = page;
  133. unsigned long end = start + PAGE_SIZE;
  134. unsigned long ws_inc = 1UL << current_cpu_data.icache.waybit;
  135. unsigned long ws_end = current_cpu_data.icache.ways <<
  136. current_cpu_data.icache.waybit;
  137. unsigned long ws, addr;
  138. CACHE32_UNROLL32_ALIGN2;
  139. /* I'm in even chunk. blast odd chunks */
  140. for (ws = 0; ws < ws_end; ws += ws_inc)
  141. for (addr = start + 0x400; addr < end; addr += 0x400 * 2)
  142. cache32_unroll32(addr|ws,Index_Invalidate_I);
  143. CACHE32_UNROLL32_ALIGN;
  144. /* I'm in odd chunk. blast even chunks */
  145. for (ws = 0; ws < ws_end; ws += ws_inc)
  146. for (addr = start; addr < end; addr += 0x400 * 2)
  147. cache32_unroll32(addr|ws,Index_Invalidate_I);
  148. }
  149. static void (* r4k_blast_icache_page)(unsigned long addr);
  150. static inline void r4k_blast_icache_page_setup(void)
  151. {
  152. unsigned long ic_lsize = cpu_icache_line_size();
  153. if (ic_lsize == 16)
  154. r4k_blast_icache_page = blast_icache16_page;
  155. else if (ic_lsize == 32)
  156. r4k_blast_icache_page = blast_icache32_page;
  157. else if (ic_lsize == 64)
  158. r4k_blast_icache_page = blast_icache64_page;
  159. }
  160. static void (* r4k_blast_icache_page_indexed)(unsigned long addr);
  161. static inline void r4k_blast_icache_page_indexed_setup(void)
  162. {
  163. unsigned long ic_lsize = cpu_icache_line_size();
  164. if (ic_lsize == 16)
  165. r4k_blast_icache_page_indexed = blast_icache16_page_indexed;
  166. else if (ic_lsize == 32) {
  167. if (R4600_V1_INDEX_ICACHEOP_WAR && cpu_is_r4600_v1_x())
  168. r4k_blast_icache_page_indexed =
  169. blast_icache32_r4600_v1_page_indexed;
  170. else if (TX49XX_ICACHE_INDEX_INV_WAR)
  171. r4k_blast_icache_page_indexed =
  172. tx49_blast_icache32_page_indexed;
  173. else
  174. r4k_blast_icache_page_indexed =
  175. blast_icache32_page_indexed;
  176. } else if (ic_lsize == 64)
  177. r4k_blast_icache_page_indexed = blast_icache64_page_indexed;
  178. }
  179. static void (* r4k_blast_icache)(void);
  180. static inline void r4k_blast_icache_setup(void)
  181. {
  182. unsigned long ic_lsize = cpu_icache_line_size();
  183. if (ic_lsize == 16)
  184. r4k_blast_icache = blast_icache16;
  185. else if (ic_lsize == 32) {
  186. if (R4600_V1_INDEX_ICACHEOP_WAR && cpu_is_r4600_v1_x())
  187. r4k_blast_icache = blast_r4600_v1_icache32;
  188. else if (TX49XX_ICACHE_INDEX_INV_WAR)
  189. r4k_blast_icache = tx49_blast_icache32;
  190. else
  191. r4k_blast_icache = blast_icache32;
  192. } else if (ic_lsize == 64)
  193. r4k_blast_icache = blast_icache64;
  194. }
  195. static void (* r4k_blast_scache_page)(unsigned long addr);
  196. static inline void r4k_blast_scache_page_setup(void)
  197. {
  198. unsigned long sc_lsize = cpu_scache_line_size();
  199. if (scache_size == 0)
  200. r4k_blast_scache_page = (void *)no_sc_noop;
  201. else if (sc_lsize == 16)
  202. r4k_blast_scache_page = blast_scache16_page;
  203. else if (sc_lsize == 32)
  204. r4k_blast_scache_page = blast_scache32_page;
  205. else if (sc_lsize == 64)
  206. r4k_blast_scache_page = blast_scache64_page;
  207. else if (sc_lsize == 128)
  208. r4k_blast_scache_page = blast_scache128_page;
  209. }
  210. static void (* r4k_blast_scache_page_indexed)(unsigned long addr);
  211. static inline void r4k_blast_scache_page_indexed_setup(void)
  212. {
  213. unsigned long sc_lsize = cpu_scache_line_size();
  214. if (scache_size == 0)
  215. r4k_blast_scache_page_indexed = (void *)no_sc_noop;
  216. else if (sc_lsize == 16)
  217. r4k_blast_scache_page_indexed = blast_scache16_page_indexed;
  218. else if (sc_lsize == 32)
  219. r4k_blast_scache_page_indexed = blast_scache32_page_indexed;
  220. else if (sc_lsize == 64)
  221. r4k_blast_scache_page_indexed = blast_scache64_page_indexed;
  222. else if (sc_lsize == 128)
  223. r4k_blast_scache_page_indexed = blast_scache128_page_indexed;
  224. }
  225. static void (* r4k_blast_scache)(void);
  226. static inline void r4k_blast_scache_setup(void)
  227. {
  228. unsigned long sc_lsize = cpu_scache_line_size();
  229. if (scache_size == 0)
  230. r4k_blast_scache = (void *)no_sc_noop;
  231. else if (sc_lsize == 16)
  232. r4k_blast_scache = blast_scache16;
  233. else if (sc_lsize == 32)
  234. r4k_blast_scache = blast_scache32;
  235. else if (sc_lsize == 64)
  236. r4k_blast_scache = blast_scache64;
  237. else if (sc_lsize == 128)
  238. r4k_blast_scache = blast_scache128;
  239. }
  240. /*
  241. * This is former mm's flush_cache_all() which really should be
  242. * flush_cache_vunmap these days ...
  243. */
  244. static inline void local_r4k_flush_cache_all(void * args)
  245. {
  246. r4k_blast_dcache();
  247. r4k_blast_icache();
  248. }
  249. static void r4k_flush_cache_all(void)
  250. {
  251. if (!cpu_has_dc_aliases)
  252. return;
  253. on_each_cpu(local_r4k_flush_cache_all, NULL, 1, 1);
  254. }
  255. static inline void local_r4k___flush_cache_all(void * args)
  256. {
  257. r4k_blast_dcache();
  258. r4k_blast_icache();
  259. switch (current_cpu_data.cputype) {
  260. case CPU_R4000SC:
  261. case CPU_R4000MC:
  262. case CPU_R4400SC:
  263. case CPU_R4400MC:
  264. case CPU_R10000:
  265. case CPU_R12000:
  266. r4k_blast_scache();
  267. }
  268. }
  269. static void r4k___flush_cache_all(void)
  270. {
  271. on_each_cpu(local_r4k___flush_cache_all, NULL, 1, 1);
  272. }
  273. static inline void local_r4k_flush_cache_range(void * args)
  274. {
  275. struct vm_area_struct *vma = args;
  276. int exec;
  277. if (!(cpu_context(smp_processor_id(), vma->vm_mm)))
  278. return;
  279. exec = vma->vm_flags & VM_EXEC;
  280. if (cpu_has_dc_aliases || exec)
  281. r4k_blast_dcache();
  282. if (exec)
  283. r4k_blast_icache();
  284. }
  285. static void r4k_flush_cache_range(struct vm_area_struct *vma,
  286. unsigned long start, unsigned long end)
  287. {
  288. on_each_cpu(local_r4k_flush_cache_range, vma, 1, 1);
  289. }
  290. static inline void local_r4k_flush_cache_mm(void * args)
  291. {
  292. struct mm_struct *mm = args;
  293. if (!cpu_context(smp_processor_id(), mm))
  294. return;
  295. r4k_blast_dcache();
  296. r4k_blast_icache();
  297. /*
  298. * Kludge alert. For obscure reasons R4000SC and R4400SC go nuts if we
  299. * only flush the primary caches but R10000 and R12000 behave sane ...
  300. */
  301. if (current_cpu_data.cputype == CPU_R4000SC ||
  302. current_cpu_data.cputype == CPU_R4000MC ||
  303. current_cpu_data.cputype == CPU_R4400SC ||
  304. current_cpu_data.cputype == CPU_R4400MC)
  305. r4k_blast_scache();
  306. }
  307. static void r4k_flush_cache_mm(struct mm_struct *mm)
  308. {
  309. if (!cpu_has_dc_aliases)
  310. return;
  311. on_each_cpu(local_r4k_flush_cache_mm, mm, 1, 1);
  312. }
  313. struct flush_cache_page_args {
  314. struct vm_area_struct *vma;
  315. unsigned long addr;
  316. unsigned long pfn;
  317. };
  318. static inline void local_r4k_flush_cache_page(void *args)
  319. {
  320. struct flush_cache_page_args *fcp_args = args;
  321. struct vm_area_struct *vma = fcp_args->vma;
  322. unsigned long addr = fcp_args->addr;
  323. unsigned long paddr = fcp_args->pfn << PAGE_SHIFT;
  324. int exec = vma->vm_flags & VM_EXEC;
  325. struct mm_struct *mm = vma->vm_mm;
  326. pgd_t *pgdp;
  327. pud_t *pudp;
  328. pmd_t *pmdp;
  329. pte_t *ptep;
  330. /*
  331. * If ownes no valid ASID yet, cannot possibly have gotten
  332. * this page into the cache.
  333. */
  334. if (cpu_context(smp_processor_id(), mm) == 0)
  335. return;
  336. addr &= PAGE_MASK;
  337. pgdp = pgd_offset(mm, addr);
  338. pudp = pud_offset(pgdp, addr);
  339. pmdp = pmd_offset(pudp, addr);
  340. ptep = pte_offset(pmdp, addr);
  341. /*
  342. * If the page isn't marked valid, the page cannot possibly be
  343. * in the cache.
  344. */
  345. if (!(pte_val(*ptep) & _PAGE_PRESENT))
  346. return;
  347. /*
  348. * Doing flushes for another ASID than the current one is
  349. * too difficult since stupid R4k caches do a TLB translation
  350. * for every cache flush operation. So we do indexed flushes
  351. * in that case, which doesn't overly flush the cache too much.
  352. */
  353. if ((mm == current->active_mm) && (pte_val(*ptep) & _PAGE_VALID)) {
  354. if (cpu_has_dc_aliases || (exec && !cpu_has_ic_fills_f_dc)) {
  355. r4k_blast_dcache_page(addr);
  356. if (exec && !cpu_icache_snoops_remote_store)
  357. r4k_blast_scache_page(addr);
  358. }
  359. if (exec)
  360. r4k_blast_icache_page(addr);
  361. return;
  362. }
  363. /*
  364. * Do indexed flush, too much work to get the (possible) TLB refills
  365. * to work correctly.
  366. */
  367. if (cpu_has_dc_aliases || (exec && !cpu_has_ic_fills_f_dc)) {
  368. r4k_blast_dcache_page_indexed(cpu_has_pindexed_dcache ?
  369. paddr : addr);
  370. if (exec && !cpu_icache_snoops_remote_store) {
  371. r4k_blast_scache_page_indexed(paddr);
  372. }
  373. }
  374. if (exec) {
  375. if (cpu_has_vtag_icache) {
  376. int cpu = smp_processor_id();
  377. if (cpu_context(cpu, mm) != 0)
  378. drop_mmu_context(mm, cpu);
  379. } else
  380. r4k_blast_icache_page_indexed(addr);
  381. }
  382. }
  383. static void r4k_flush_cache_page(struct vm_area_struct *vma,
  384. unsigned long addr, unsigned long pfn)
  385. {
  386. struct flush_cache_page_args args;
  387. args.vma = vma;
  388. args.addr = addr;
  389. args.pfn = pfn;
  390. on_each_cpu(local_r4k_flush_cache_page, &args, 1, 1);
  391. }
  392. static inline void local_r4k_flush_data_cache_page(void * addr)
  393. {
  394. r4k_blast_dcache_page((unsigned long) addr);
  395. }
  396. static void r4k_flush_data_cache_page(unsigned long addr)
  397. {
  398. on_each_cpu(local_r4k_flush_data_cache_page, (void *) addr, 1, 1);
  399. }
  400. struct flush_icache_range_args {
  401. unsigned long start;
  402. unsigned long end;
  403. };
  404. static inline void local_r4k_flush_icache_range(void *args)
  405. {
  406. struct flush_icache_range_args *fir_args = args;
  407. unsigned long start = fir_args->start;
  408. unsigned long end = fir_args->end;
  409. if (!cpu_has_ic_fills_f_dc) {
  410. if (end - start > dcache_size) {
  411. r4k_blast_dcache();
  412. } else {
  413. R4600_HIT_CACHEOP_WAR_IMPL;
  414. protected_blast_dcache_range(start, end);
  415. }
  416. if (!cpu_icache_snoops_remote_store && scache_size) {
  417. if (end - start > scache_size)
  418. r4k_blast_scache();
  419. else
  420. protected_blast_scache_range(start, end);
  421. }
  422. }
  423. if (end - start > icache_size)
  424. r4k_blast_icache();
  425. else
  426. protected_blast_icache_range(start, end);
  427. }
  428. static void r4k_flush_icache_range(unsigned long start, unsigned long end)
  429. {
  430. struct flush_icache_range_args args;
  431. args.start = start;
  432. args.end = end;
  433. on_each_cpu(local_r4k_flush_icache_range, &args, 1, 1);
  434. instruction_hazard();
  435. }
  436. /*
  437. * Ok, this seriously sucks. We use them to flush a user page but don't
  438. * know the virtual address, so we have to blast away the whole icache
  439. * which is significantly more expensive than the real thing. Otoh we at
  440. * least know the kernel address of the page so we can flush it
  441. * selectivly.
  442. */
  443. struct flush_icache_page_args {
  444. struct vm_area_struct *vma;
  445. struct page *page;
  446. };
  447. static inline void local_r4k_flush_icache_page(void *args)
  448. {
  449. struct flush_icache_page_args *fip_args = args;
  450. struct vm_area_struct *vma = fip_args->vma;
  451. struct page *page = fip_args->page;
  452. /*
  453. * Tricky ... Because we don't know the virtual address we've got the
  454. * choice of either invalidating the entire primary and secondary
  455. * caches or invalidating the secondary caches also. With the subset
  456. * enforcment on R4000SC, R4400SC, R10000 and R12000 invalidating the
  457. * secondary cache will result in any entries in the primary caches
  458. * also getting invalidated which hopefully is a bit more economical.
  459. */
  460. if (cpu_has_subset_pcaches) {
  461. unsigned long addr = (unsigned long) page_address(page);
  462. r4k_blast_scache_page(addr);
  463. ClearPageDcacheDirty(page);
  464. return;
  465. }
  466. if (!cpu_has_ic_fills_f_dc) {
  467. unsigned long addr = (unsigned long) page_address(page);
  468. r4k_blast_dcache_page(addr);
  469. if (!cpu_icache_snoops_remote_store)
  470. r4k_blast_scache_page(addr);
  471. ClearPageDcacheDirty(page);
  472. }
  473. /*
  474. * We're not sure of the virtual address(es) involved here, so
  475. * we have to flush the entire I-cache.
  476. */
  477. if (cpu_has_vtag_icache) {
  478. int cpu = smp_processor_id();
  479. if (cpu_context(cpu, vma->vm_mm) != 0)
  480. drop_mmu_context(vma->vm_mm, cpu);
  481. } else
  482. r4k_blast_icache();
  483. }
  484. static void r4k_flush_icache_page(struct vm_area_struct *vma,
  485. struct page *page)
  486. {
  487. struct flush_icache_page_args args;
  488. /*
  489. * If there's no context yet, or the page isn't executable, no I-cache
  490. * flush is needed.
  491. */
  492. if (!(vma->vm_flags & VM_EXEC))
  493. return;
  494. args.vma = vma;
  495. args.page = page;
  496. on_each_cpu(local_r4k_flush_icache_page, &args, 1, 1);
  497. }
  498. #ifdef CONFIG_DMA_NONCOHERENT
  499. static void r4k_dma_cache_wback_inv(unsigned long addr, unsigned long size)
  500. {
  501. /* Catch bad driver code */
  502. BUG_ON(size == 0);
  503. if (cpu_has_subset_pcaches) {
  504. if (size >= scache_size)
  505. r4k_blast_scache();
  506. else
  507. blast_scache_range(addr, addr + size);
  508. return;
  509. }
  510. /*
  511. * Either no secondary cache or the available caches don't have the
  512. * subset property so we have to flush the primary caches
  513. * explicitly
  514. */
  515. if (size >= dcache_size) {
  516. r4k_blast_dcache();
  517. } else {
  518. R4600_HIT_CACHEOP_WAR_IMPL;
  519. blast_dcache_range(addr, addr + size);
  520. }
  521. bc_wback_inv(addr, size);
  522. }
  523. static void r4k_dma_cache_inv(unsigned long addr, unsigned long size)
  524. {
  525. /* Catch bad driver code */
  526. BUG_ON(size == 0);
  527. if (cpu_has_subset_pcaches) {
  528. if (size >= scache_size)
  529. r4k_blast_scache();
  530. else
  531. blast_scache_range(addr, addr + size);
  532. return;
  533. }
  534. if (size >= dcache_size) {
  535. r4k_blast_dcache();
  536. } else {
  537. R4600_HIT_CACHEOP_WAR_IMPL;
  538. blast_dcache_range(addr, addr + size);
  539. }
  540. bc_inv(addr, size);
  541. }
  542. #endif /* CONFIG_DMA_NONCOHERENT */
  543. /*
  544. * While we're protected against bad userland addresses we don't care
  545. * very much about what happens in that case. Usually a segmentation
  546. * fault will dump the process later on anyway ...
  547. */
  548. static void local_r4k_flush_cache_sigtramp(void * arg)
  549. {
  550. unsigned long ic_lsize = cpu_icache_line_size();
  551. unsigned long dc_lsize = cpu_dcache_line_size();
  552. unsigned long sc_lsize = cpu_scache_line_size();
  553. unsigned long addr = (unsigned long) arg;
  554. R4600_HIT_CACHEOP_WAR_IMPL;
  555. protected_writeback_dcache_line(addr & ~(dc_lsize - 1));
  556. if (!cpu_icache_snoops_remote_store && scache_size)
  557. protected_writeback_scache_line(addr & ~(sc_lsize - 1));
  558. protected_flush_icache_line(addr & ~(ic_lsize - 1));
  559. if (MIPS4K_ICACHE_REFILL_WAR) {
  560. __asm__ __volatile__ (
  561. ".set push\n\t"
  562. ".set noat\n\t"
  563. ".set mips3\n\t"
  564. #ifdef CONFIG_32BIT
  565. "la $at,1f\n\t"
  566. #endif
  567. #ifdef CONFIG_64BIT
  568. "dla $at,1f\n\t"
  569. #endif
  570. "cache %0,($at)\n\t"
  571. "nop; nop; nop\n"
  572. "1:\n\t"
  573. ".set pop"
  574. :
  575. : "i" (Hit_Invalidate_I));
  576. }
  577. if (MIPS_CACHE_SYNC_WAR)
  578. __asm__ __volatile__ ("sync");
  579. }
  580. static void r4k_flush_cache_sigtramp(unsigned long addr)
  581. {
  582. on_each_cpu(local_r4k_flush_cache_sigtramp, (void *) addr, 1, 1);
  583. }
  584. static void r4k_flush_icache_all(void)
  585. {
  586. if (cpu_has_vtag_icache)
  587. r4k_blast_icache();
  588. }
  589. static inline void rm7k_erratum31(void)
  590. {
  591. const unsigned long ic_lsize = 32;
  592. unsigned long addr;
  593. /* RM7000 erratum #31. The icache is screwed at startup. */
  594. write_c0_taglo(0);
  595. write_c0_taghi(0);
  596. for (addr = INDEX_BASE; addr <= INDEX_BASE + 4096; addr += ic_lsize) {
  597. __asm__ __volatile__ (
  598. ".set push\n\t"
  599. ".set noreorder\n\t"
  600. ".set mips3\n\t"
  601. "cache\t%1, 0(%0)\n\t"
  602. "cache\t%1, 0x1000(%0)\n\t"
  603. "cache\t%1, 0x2000(%0)\n\t"
  604. "cache\t%1, 0x3000(%0)\n\t"
  605. "cache\t%2, 0(%0)\n\t"
  606. "cache\t%2, 0x1000(%0)\n\t"
  607. "cache\t%2, 0x2000(%0)\n\t"
  608. "cache\t%2, 0x3000(%0)\n\t"
  609. "cache\t%1, 0(%0)\n\t"
  610. "cache\t%1, 0x1000(%0)\n\t"
  611. "cache\t%1, 0x2000(%0)\n\t"
  612. "cache\t%1, 0x3000(%0)\n\t"
  613. ".set pop\n"
  614. :
  615. : "r" (addr), "i" (Index_Store_Tag_I), "i" (Fill));
  616. }
  617. }
  618. static char *way_string[] __initdata = { NULL, "direct mapped", "2-way",
  619. "3-way", "4-way", "5-way", "6-way", "7-way", "8-way"
  620. };
  621. static void __init probe_pcache(void)
  622. {
  623. struct cpuinfo_mips *c = &current_cpu_data;
  624. unsigned int config = read_c0_config();
  625. unsigned int prid = read_c0_prid();
  626. unsigned long config1;
  627. unsigned int lsize;
  628. switch (c->cputype) {
  629. case CPU_R4600: /* QED style two way caches? */
  630. case CPU_R4700:
  631. case CPU_R5000:
  632. case CPU_NEVADA:
  633. icache_size = 1 << (12 + ((config & CONF_IC) >> 9));
  634. c->icache.linesz = 16 << ((config & CONF_IB) >> 5);
  635. c->icache.ways = 2;
  636. c->icache.waybit = ffs(icache_size/2) - 1;
  637. dcache_size = 1 << (12 + ((config & CONF_DC) >> 6));
  638. c->dcache.linesz = 16 << ((config & CONF_DB) >> 4);
  639. c->dcache.ways = 2;
  640. c->dcache.waybit= ffs(dcache_size/2) - 1;
  641. c->options |= MIPS_CPU_CACHE_CDEX_P;
  642. break;
  643. case CPU_R5432:
  644. case CPU_R5500:
  645. icache_size = 1 << (12 + ((config & CONF_IC) >> 9));
  646. c->icache.linesz = 16 << ((config & CONF_IB) >> 5);
  647. c->icache.ways = 2;
  648. c->icache.waybit= 0;
  649. dcache_size = 1 << (12 + ((config & CONF_DC) >> 6));
  650. c->dcache.linesz = 16 << ((config & CONF_DB) >> 4);
  651. c->dcache.ways = 2;
  652. c->dcache.waybit = 0;
  653. c->options |= MIPS_CPU_CACHE_CDEX_P;
  654. break;
  655. case CPU_TX49XX:
  656. icache_size = 1 << (12 + ((config & CONF_IC) >> 9));
  657. c->icache.linesz = 16 << ((config & CONF_IB) >> 5);
  658. c->icache.ways = 4;
  659. c->icache.waybit= 0;
  660. dcache_size = 1 << (12 + ((config & CONF_DC) >> 6));
  661. c->dcache.linesz = 16 << ((config & CONF_DB) >> 4);
  662. c->dcache.ways = 4;
  663. c->dcache.waybit = 0;
  664. c->options |= MIPS_CPU_CACHE_CDEX_P;
  665. c->options |= MIPS_CPU_PREFETCH;
  666. break;
  667. case CPU_R4000PC:
  668. case CPU_R4000SC:
  669. case CPU_R4000MC:
  670. case CPU_R4400PC:
  671. case CPU_R4400SC:
  672. case CPU_R4400MC:
  673. case CPU_R4300:
  674. icache_size = 1 << (12 + ((config & CONF_IC) >> 9));
  675. c->icache.linesz = 16 << ((config & CONF_IB) >> 5);
  676. c->icache.ways = 1;
  677. c->icache.waybit = 0; /* doesn't matter */
  678. dcache_size = 1 << (12 + ((config & CONF_DC) >> 6));
  679. c->dcache.linesz = 16 << ((config & CONF_DB) >> 4);
  680. c->dcache.ways = 1;
  681. c->dcache.waybit = 0; /* does not matter */
  682. c->options |= MIPS_CPU_CACHE_CDEX_P;
  683. break;
  684. case CPU_R10000:
  685. case CPU_R12000:
  686. icache_size = 1 << (12 + ((config & R10K_CONF_IC) >> 29));
  687. c->icache.linesz = 64;
  688. c->icache.ways = 2;
  689. c->icache.waybit = 0;
  690. dcache_size = 1 << (12 + ((config & R10K_CONF_DC) >> 26));
  691. c->dcache.linesz = 32;
  692. c->dcache.ways = 2;
  693. c->dcache.waybit = 0;
  694. c->options |= MIPS_CPU_PREFETCH;
  695. break;
  696. case CPU_VR4133:
  697. write_c0_config(config & ~CONF_EB);
  698. case CPU_VR4131:
  699. /* Workaround for cache instruction bug of VR4131 */
  700. if (c->processor_id == 0x0c80U || c->processor_id == 0x0c81U ||
  701. c->processor_id == 0x0c82U) {
  702. config &= ~0x00000030U;
  703. config |= 0x00410000U;
  704. write_c0_config(config);
  705. }
  706. icache_size = 1 << (10 + ((config & CONF_IC) >> 9));
  707. c->icache.linesz = 16 << ((config & CONF_IB) >> 5);
  708. c->icache.ways = 2;
  709. c->icache.waybit = ffs(icache_size/2) - 1;
  710. dcache_size = 1 << (10 + ((config & CONF_DC) >> 6));
  711. c->dcache.linesz = 16 << ((config & CONF_DB) >> 4);
  712. c->dcache.ways = 2;
  713. c->dcache.waybit = ffs(dcache_size/2) - 1;
  714. c->options |= MIPS_CPU_CACHE_CDEX_P;
  715. break;
  716. case CPU_VR41XX:
  717. case CPU_VR4111:
  718. case CPU_VR4121:
  719. case CPU_VR4122:
  720. case CPU_VR4181:
  721. case CPU_VR4181A:
  722. icache_size = 1 << (10 + ((config & CONF_IC) >> 9));
  723. c->icache.linesz = 16 << ((config & CONF_IB) >> 5);
  724. c->icache.ways = 1;
  725. c->icache.waybit = 0; /* doesn't matter */
  726. dcache_size = 1 << (10 + ((config & CONF_DC) >> 6));
  727. c->dcache.linesz = 16 << ((config & CONF_DB) >> 4);
  728. c->dcache.ways = 1;
  729. c->dcache.waybit = 0; /* does not matter */
  730. c->options |= MIPS_CPU_CACHE_CDEX_P;
  731. break;
  732. case CPU_RM7000:
  733. rm7k_erratum31();
  734. case CPU_RM9000:
  735. icache_size = 1 << (12 + ((config & CONF_IC) >> 9));
  736. c->icache.linesz = 16 << ((config & CONF_IB) >> 5);
  737. c->icache.ways = 4;
  738. c->icache.waybit = ffs(icache_size / c->icache.ways) - 1;
  739. dcache_size = 1 << (12 + ((config & CONF_DC) >> 6));
  740. c->dcache.linesz = 16 << ((config & CONF_DB) >> 4);
  741. c->dcache.ways = 4;
  742. c->dcache.waybit = ffs(dcache_size / c->dcache.ways) - 1;
  743. #if !defined(CONFIG_SMP) || !defined(RM9000_CDEX_SMP_WAR)
  744. c->options |= MIPS_CPU_CACHE_CDEX_P;
  745. #endif
  746. c->options |= MIPS_CPU_PREFETCH;
  747. break;
  748. default:
  749. if (!(config & MIPS_CONF_M))
  750. panic("Don't know how to probe P-caches on this cpu.");
  751. /*
  752. * So we seem to be a MIPS32 or MIPS64 CPU
  753. * So let's probe the I-cache ...
  754. */
  755. config1 = read_c0_config1();
  756. if ((lsize = ((config1 >> 19) & 7)))
  757. c->icache.linesz = 2 << lsize;
  758. else
  759. c->icache.linesz = lsize;
  760. c->icache.sets = 64 << ((config1 >> 22) & 7);
  761. c->icache.ways = 1 + ((config1 >> 16) & 7);
  762. icache_size = c->icache.sets *
  763. c->icache.ways *
  764. c->icache.linesz;
  765. c->icache.waybit = ffs(icache_size/c->icache.ways) - 1;
  766. if (config & 0x8) /* VI bit */
  767. c->icache.flags |= MIPS_CACHE_VTAG;
  768. /*
  769. * Now probe the MIPS32 / MIPS64 data cache.
  770. */
  771. c->dcache.flags = 0;
  772. if ((lsize = ((config1 >> 10) & 7)))
  773. c->dcache.linesz = 2 << lsize;
  774. else
  775. c->dcache.linesz= lsize;
  776. c->dcache.sets = 64 << ((config1 >> 13) & 7);
  777. c->dcache.ways = 1 + ((config1 >> 7) & 7);
  778. dcache_size = c->dcache.sets *
  779. c->dcache.ways *
  780. c->dcache.linesz;
  781. c->dcache.waybit = ffs(dcache_size/c->dcache.ways) - 1;
  782. c->options |= MIPS_CPU_PREFETCH;
  783. break;
  784. }
  785. /*
  786. * Processor configuration sanity check for the R4000SC erratum
  787. * #5. With page sizes larger than 32kB there is no possibility
  788. * to get a VCE exception anymore so we don't care about this
  789. * misconfiguration. The case is rather theoretical anyway;
  790. * presumably no vendor is shipping his hardware in the "bad"
  791. * configuration.
  792. */
  793. if ((prid & 0xff00) == PRID_IMP_R4000 && (prid & 0xff) < 0x40 &&
  794. !(config & CONF_SC) && c->icache.linesz != 16 &&
  795. PAGE_SIZE <= 0x8000)
  796. panic("Improper R4000SC processor configuration detected");
  797. /* compute a couple of other cache variables */
  798. c->icache.waysize = icache_size / c->icache.ways;
  799. c->dcache.waysize = dcache_size / c->dcache.ways;
  800. c->icache.sets = icache_size / (c->icache.linesz * c->icache.ways);
  801. c->dcache.sets = dcache_size / (c->dcache.linesz * c->dcache.ways);
  802. /*
  803. * R10000 and R12000 P-caches are odd in a positive way. They're 32kB
  804. * 2-way virtually indexed so normally would suffer from aliases. So
  805. * normally they'd suffer from aliases but magic in the hardware deals
  806. * with that for us so we don't need to take care ourselves.
  807. */
  808. switch (c->cputype) {
  809. case CPU_20KC:
  810. case CPU_25KF:
  811. c->dcache.flags |= MIPS_CACHE_PINDEX;
  812. case CPU_R10000:
  813. case CPU_R12000:
  814. case CPU_SB1:
  815. break;
  816. case CPU_24K:
  817. if (!(read_c0_config7() & (1 << 16)))
  818. default:
  819. if (c->dcache.waysize > PAGE_SIZE)
  820. c->dcache.flags |= MIPS_CACHE_ALIASES;
  821. }
  822. switch (c->cputype) {
  823. case CPU_20KC:
  824. /*
  825. * Some older 20Kc chips doesn't have the 'VI' bit in
  826. * the config register.
  827. */
  828. c->icache.flags |= MIPS_CACHE_VTAG;
  829. break;
  830. case CPU_AU1000:
  831. case CPU_AU1500:
  832. case CPU_AU1100:
  833. case CPU_AU1550:
  834. case CPU_AU1200:
  835. c->icache.flags |= MIPS_CACHE_IC_F_DC;
  836. break;
  837. }
  838. printk("Primary instruction cache %ldkB, %s, %s, linesize %d bytes.\n",
  839. icache_size >> 10,
  840. cpu_has_vtag_icache ? "virtually tagged" : "physically tagged",
  841. way_string[c->icache.ways], c->icache.linesz);
  842. printk("Primary data cache %ldkB, %s, linesize %d bytes.\n",
  843. dcache_size >> 10, way_string[c->dcache.ways], c->dcache.linesz);
  844. }
  845. /*
  846. * If you even _breathe_ on this function, look at the gcc output and make sure
  847. * it does not pop things on and off the stack for the cache sizing loop that
  848. * executes in KSEG1 space or else you will crash and burn badly. You have
  849. * been warned.
  850. */
  851. static int __init probe_scache(void)
  852. {
  853. extern unsigned long stext;
  854. unsigned long flags, addr, begin, end, pow2;
  855. unsigned int config = read_c0_config();
  856. struct cpuinfo_mips *c = &current_cpu_data;
  857. int tmp;
  858. if (config & CONF_SC)
  859. return 0;
  860. begin = (unsigned long) &stext;
  861. begin &= ~((4 * 1024 * 1024) - 1);
  862. end = begin + (4 * 1024 * 1024);
  863. /*
  864. * This is such a bitch, you'd think they would make it easy to do
  865. * this. Away you daemons of stupidity!
  866. */
  867. local_irq_save(flags);
  868. /* Fill each size-multiple cache line with a valid tag. */
  869. pow2 = (64 * 1024);
  870. for (addr = begin; addr < end; addr = (begin + pow2)) {
  871. unsigned long *p = (unsigned long *) addr;
  872. __asm__ __volatile__("nop" : : "r" (*p)); /* whee... */
  873. pow2 <<= 1;
  874. }
  875. /* Load first line with zero (therefore invalid) tag. */
  876. write_c0_taglo(0);
  877. write_c0_taghi(0);
  878. __asm__ __volatile__("nop; nop; nop; nop;"); /* avoid the hazard */
  879. cache_op(Index_Store_Tag_I, begin);
  880. cache_op(Index_Store_Tag_D, begin);
  881. cache_op(Index_Store_Tag_SD, begin);
  882. /* Now search for the wrap around point. */
  883. pow2 = (128 * 1024);
  884. tmp = 0;
  885. for (addr = begin + (128 * 1024); addr < end; addr = begin + pow2) {
  886. cache_op(Index_Load_Tag_SD, addr);
  887. __asm__ __volatile__("nop; nop; nop; nop;"); /* hazard... */
  888. if (!read_c0_taglo())
  889. break;
  890. pow2 <<= 1;
  891. }
  892. local_irq_restore(flags);
  893. addr -= begin;
  894. scache_size = addr;
  895. c->scache.linesz = 16 << ((config & R4K_CONF_SB) >> 22);
  896. c->scache.ways = 1;
  897. c->dcache.waybit = 0; /* does not matter */
  898. return 1;
  899. }
  900. extern int r5k_sc_init(void);
  901. extern int rm7k_sc_init(void);
  902. static void __init setup_scache(void)
  903. {
  904. struct cpuinfo_mips *c = &current_cpu_data;
  905. unsigned int config = read_c0_config();
  906. int sc_present = 0;
  907. /*
  908. * Do the probing thing on R4000SC and R4400SC processors. Other
  909. * processors don't have a S-cache that would be relevant to the
  910. * Linux memory managment.
  911. */
  912. switch (c->cputype) {
  913. case CPU_R4000SC:
  914. case CPU_R4000MC:
  915. case CPU_R4400SC:
  916. case CPU_R4400MC:
  917. sc_present = run_uncached(probe_scache);
  918. if (sc_present)
  919. c->options |= MIPS_CPU_CACHE_CDEX_S;
  920. break;
  921. case CPU_R10000:
  922. case CPU_R12000:
  923. scache_size = 0x80000 << ((config & R10K_CONF_SS) >> 16);
  924. c->scache.linesz = 64 << ((config >> 13) & 1);
  925. c->scache.ways = 2;
  926. c->scache.waybit= 0;
  927. sc_present = 1;
  928. break;
  929. case CPU_R5000:
  930. case CPU_NEVADA:
  931. #ifdef CONFIG_R5000_CPU_SCACHE
  932. r5k_sc_init();
  933. #endif
  934. return;
  935. case CPU_RM7000:
  936. case CPU_RM9000:
  937. #ifdef CONFIG_RM7000_CPU_SCACHE
  938. rm7k_sc_init();
  939. #endif
  940. return;
  941. default:
  942. sc_present = 0;
  943. }
  944. if (!sc_present)
  945. return;
  946. if ((c->isa_level == MIPS_CPU_ISA_M32R1 ||
  947. c->isa_level == MIPS_CPU_ISA_M64R1) &&
  948. !(c->scache.flags & MIPS_CACHE_NOT_PRESENT))
  949. panic("Dunno how to handle MIPS32 / MIPS64 second level cache");
  950. /* compute a couple of other cache variables */
  951. c->scache.waysize = scache_size / c->scache.ways;
  952. c->scache.sets = scache_size / (c->scache.linesz * c->scache.ways);
  953. printk("Unified secondary cache %ldkB %s, linesize %d bytes.\n",
  954. scache_size >> 10, way_string[c->scache.ways], c->scache.linesz);
  955. c->options |= MIPS_CPU_SUBSET_CACHES;
  956. }
  957. static inline void coherency_setup(void)
  958. {
  959. change_c0_config(CONF_CM_CMASK, CONF_CM_DEFAULT);
  960. /*
  961. * c0_status.cu=0 specifies that updates by the sc instruction use
  962. * the coherency mode specified by the TLB; 1 means cachable
  963. * coherent update on write will be used. Not all processors have
  964. * this bit and; some wire it to zero, others like Toshiba had the
  965. * silly idea of putting something else there ...
  966. */
  967. switch (current_cpu_data.cputype) {
  968. case CPU_R4000PC:
  969. case CPU_R4000SC:
  970. case CPU_R4000MC:
  971. case CPU_R4400PC:
  972. case CPU_R4400SC:
  973. case CPU_R4400MC:
  974. clear_c0_config(CONF_CU);
  975. break;
  976. }
  977. }
  978. void __init r4k_cache_init(void)
  979. {
  980. extern void build_clear_page(void);
  981. extern void build_copy_page(void);
  982. extern char except_vec2_generic;
  983. struct cpuinfo_mips *c = &current_cpu_data;
  984. /* Default cache error handler for R4000 and R5000 family */
  985. set_uncached_handler (0x100, &except_vec2_generic, 0x80);
  986. probe_pcache();
  987. setup_scache();
  988. r4k_blast_dcache_page_setup();
  989. r4k_blast_dcache_page_indexed_setup();
  990. r4k_blast_dcache_setup();
  991. r4k_blast_icache_page_setup();
  992. r4k_blast_icache_page_indexed_setup();
  993. r4k_blast_icache_setup();
  994. r4k_blast_scache_page_setup();
  995. r4k_blast_scache_page_indexed_setup();
  996. r4k_blast_scache_setup();
  997. /*
  998. * Some MIPS32 and MIPS64 processors have physically indexed caches.
  999. * This code supports virtually indexed processors and will be
  1000. * unnecessarily inefficient on physically indexed processors.
  1001. */
  1002. shm_align_mask = max_t( unsigned long,
  1003. c->dcache.sets * c->dcache.linesz - 1,
  1004. PAGE_SIZE - 1);
  1005. flush_cache_all = r4k_flush_cache_all;
  1006. __flush_cache_all = r4k___flush_cache_all;
  1007. flush_cache_mm = r4k_flush_cache_mm;
  1008. flush_cache_page = r4k_flush_cache_page;
  1009. flush_icache_page = r4k_flush_icache_page;
  1010. flush_cache_range = r4k_flush_cache_range;
  1011. flush_cache_sigtramp = r4k_flush_cache_sigtramp;
  1012. flush_icache_all = r4k_flush_icache_all;
  1013. flush_data_cache_page = r4k_flush_data_cache_page;
  1014. flush_icache_range = r4k_flush_icache_range;
  1015. #ifdef CONFIG_DMA_NONCOHERENT
  1016. _dma_cache_wback_inv = r4k_dma_cache_wback_inv;
  1017. _dma_cache_wback = r4k_dma_cache_wback_inv;
  1018. _dma_cache_inv = r4k_dma_cache_inv;
  1019. #endif
  1020. build_clear_page();
  1021. build_copy_page();
  1022. local_r4k___flush_cache_all(NULL);
  1023. coherency_setup();
  1024. }