unaligned.c 20 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729
  1. /* $Id: unaligned.c,v 1.24 2002/02/09 19:49:31 davem Exp $
  2. * unaligned.c: Unaligned load/store trap handling with special
  3. * cases for the kernel to do them more quickly.
  4. *
  5. * Copyright (C) 1996 David S. Miller (davem@caip.rutgers.edu)
  6. * Copyright (C) 1996,1997 Jakub Jelinek (jj@sunsite.mff.cuni.cz)
  7. */
  8. #include <linux/kernel.h>
  9. #include <linux/sched.h>
  10. #include <linux/mm.h>
  11. #include <linux/module.h>
  12. #include <asm/asi.h>
  13. #include <asm/ptrace.h>
  14. #include <asm/pstate.h>
  15. #include <asm/processor.h>
  16. #include <asm/system.h>
  17. #include <asm/uaccess.h>
  18. #include <linux/smp.h>
  19. #include <linux/smp_lock.h>
  20. #include <linux/bitops.h>
  21. #include <asm/fpumacro.h>
  22. /* #define DEBUG_MNA */
  23. enum direction {
  24. load, /* ld, ldd, ldh, ldsh */
  25. store, /* st, std, sth, stsh */
  26. both, /* Swap, ldstub, cas, ... */
  27. fpld,
  28. fpst,
  29. invalid,
  30. };
  31. #ifdef DEBUG_MNA
  32. static char *dirstrings[] = {
  33. "load", "store", "both", "fpload", "fpstore", "invalid"
  34. };
  35. #endif
  36. static inline enum direction decode_direction(unsigned int insn)
  37. {
  38. unsigned long tmp = (insn >> 21) & 1;
  39. if (!tmp)
  40. return load;
  41. else {
  42. switch ((insn>>19)&0xf) {
  43. case 15: /* swap* */
  44. return both;
  45. default:
  46. return store;
  47. }
  48. }
  49. }
  50. /* 16 = double-word, 8 = extra-word, 4 = word, 2 = half-word */
  51. static inline int decode_access_size(unsigned int insn)
  52. {
  53. unsigned int tmp;
  54. tmp = ((insn >> 19) & 0xf);
  55. if (tmp == 11 || tmp == 14) /* ldx/stx */
  56. return 8;
  57. tmp &= 3;
  58. if (!tmp)
  59. return 4;
  60. else if (tmp == 3)
  61. return 16; /* ldd/std - Although it is actually 8 */
  62. else if (tmp == 2)
  63. return 2;
  64. else {
  65. printk("Impossible unaligned trap. insn=%08x\n", insn);
  66. die_if_kernel("Byte sized unaligned access?!?!", current_thread_info()->kregs);
  67. /* GCC should never warn that control reaches the end
  68. * of this function without returning a value because
  69. * die_if_kernel() is marked with attribute 'noreturn'.
  70. * Alas, some versions do...
  71. */
  72. return 0;
  73. }
  74. }
  75. static inline int decode_asi(unsigned int insn, struct pt_regs *regs)
  76. {
  77. if (insn & 0x800000) {
  78. if (insn & 0x2000)
  79. return (unsigned char)(regs->tstate >> 24); /* %asi */
  80. else
  81. return (unsigned char)(insn >> 5); /* imm_asi */
  82. } else
  83. return ASI_P;
  84. }
  85. /* 0x400000 = signed, 0 = unsigned */
  86. static inline int decode_signedness(unsigned int insn)
  87. {
  88. return (insn & 0x400000);
  89. }
  90. static inline void maybe_flush_windows(unsigned int rs1, unsigned int rs2,
  91. unsigned int rd, int from_kernel)
  92. {
  93. if (rs2 >= 16 || rs1 >= 16 || rd >= 16) {
  94. if (from_kernel != 0)
  95. __asm__ __volatile__("flushw");
  96. else
  97. flushw_user();
  98. }
  99. }
  100. static inline long sign_extend_imm13(long imm)
  101. {
  102. return imm << 51 >> 51;
  103. }
  104. static unsigned long fetch_reg(unsigned int reg, struct pt_regs *regs)
  105. {
  106. unsigned long value;
  107. if (reg < 16)
  108. return (!reg ? 0 : regs->u_regs[reg]);
  109. if (regs->tstate & TSTATE_PRIV) {
  110. struct reg_window *win;
  111. win = (struct reg_window *)(regs->u_regs[UREG_FP] + STACK_BIAS);
  112. value = win->locals[reg - 16];
  113. } else if (test_thread_flag(TIF_32BIT)) {
  114. struct reg_window32 __user *win32;
  115. win32 = (struct reg_window32 __user *)((unsigned long)((u32)regs->u_regs[UREG_FP]));
  116. get_user(value, &win32->locals[reg - 16]);
  117. } else {
  118. struct reg_window __user *win;
  119. win = (struct reg_window __user *)(regs->u_regs[UREG_FP] + STACK_BIAS);
  120. get_user(value, &win->locals[reg - 16]);
  121. }
  122. return value;
  123. }
  124. static unsigned long *fetch_reg_addr(unsigned int reg, struct pt_regs *regs)
  125. {
  126. if (reg < 16)
  127. return &regs->u_regs[reg];
  128. if (regs->tstate & TSTATE_PRIV) {
  129. struct reg_window *win;
  130. win = (struct reg_window *)(regs->u_regs[UREG_FP] + STACK_BIAS);
  131. return &win->locals[reg - 16];
  132. } else if (test_thread_flag(TIF_32BIT)) {
  133. struct reg_window32 *win32;
  134. win32 = (struct reg_window32 *)((unsigned long)((u32)regs->u_regs[UREG_FP]));
  135. return (unsigned long *)&win32->locals[reg - 16];
  136. } else {
  137. struct reg_window *win;
  138. win = (struct reg_window *)(regs->u_regs[UREG_FP] + STACK_BIAS);
  139. return &win->locals[reg - 16];
  140. }
  141. }
  142. unsigned long compute_effective_address(struct pt_regs *regs,
  143. unsigned int insn, unsigned int rd)
  144. {
  145. unsigned int rs1 = (insn >> 14) & 0x1f;
  146. unsigned int rs2 = insn & 0x1f;
  147. int from_kernel = (regs->tstate & TSTATE_PRIV) != 0;
  148. if (insn & 0x2000) {
  149. maybe_flush_windows(rs1, 0, rd, from_kernel);
  150. return (fetch_reg(rs1, regs) + sign_extend_imm13(insn));
  151. } else {
  152. maybe_flush_windows(rs1, rs2, rd, from_kernel);
  153. return (fetch_reg(rs1, regs) + fetch_reg(rs2, regs));
  154. }
  155. }
  156. /* This is just to make gcc think die_if_kernel does return... */
  157. static void __attribute_used__ unaligned_panic(char *str, struct pt_regs *regs)
  158. {
  159. die_if_kernel(str, regs);
  160. }
  161. #define do_integer_load(dest_reg, size, saddr, is_signed, asi, errh) ({ \
  162. __asm__ __volatile__ ( \
  163. "wr %4, 0, %%asi\n\t" \
  164. "cmp %1, 8\n\t" \
  165. "bge,pn %%icc, 9f\n\t" \
  166. " cmp %1, 4\n\t" \
  167. "be,pt %%icc, 6f\n" \
  168. "4:\t" " lduba [%2] %%asi, %%l1\n" \
  169. "5:\t" "lduba [%2 + 1] %%asi, %%l2\n\t" \
  170. "sll %%l1, 8, %%l1\n\t" \
  171. "brz,pt %3, 3f\n\t" \
  172. " add %%l1, %%l2, %%l1\n\t" \
  173. "sllx %%l1, 48, %%l1\n\t" \
  174. "srax %%l1, 48, %%l1\n" \
  175. "3:\t" "ba,pt %%xcc, 0f\n\t" \
  176. " stx %%l1, [%0]\n" \
  177. "6:\t" "lduba [%2 + 1] %%asi, %%l2\n\t" \
  178. "sll %%l1, 24, %%l1\n" \
  179. "7:\t" "lduba [%2 + 2] %%asi, %%g7\n\t" \
  180. "sll %%l2, 16, %%l2\n" \
  181. "8:\t" "lduba [%2 + 3] %%asi, %%g1\n\t" \
  182. "sll %%g7, 8, %%g7\n\t" \
  183. "or %%l1, %%l2, %%l1\n\t" \
  184. "or %%g7, %%g1, %%g7\n\t" \
  185. "or %%l1, %%g7, %%l1\n\t" \
  186. "brnz,a,pt %3, 3f\n\t" \
  187. " sra %%l1, 0, %%l1\n" \
  188. "3:\t" "ba,pt %%xcc, 0f\n\t" \
  189. " stx %%l1, [%0]\n" \
  190. "9:\t" "lduba [%2] %%asi, %%l1\n" \
  191. "10:\t" "lduba [%2 + 1] %%asi, %%l2\n\t" \
  192. "sllx %%l1, 56, %%l1\n" \
  193. "11:\t" "lduba [%2 + 2] %%asi, %%g7\n\t" \
  194. "sllx %%l2, 48, %%l2\n" \
  195. "12:\t" "lduba [%2 + 3] %%asi, %%g1\n\t" \
  196. "sllx %%g7, 40, %%g7\n\t" \
  197. "sllx %%g1, 32, %%g1\n\t" \
  198. "or %%l1, %%l2, %%l1\n\t" \
  199. "or %%g7, %%g1, %%g7\n" \
  200. "13:\t" "lduba [%2 + 4] %%asi, %%l2\n\t" \
  201. "or %%l1, %%g7, %%g7\n" \
  202. "14:\t" "lduba [%2 + 5] %%asi, %%g1\n\t" \
  203. "sllx %%l2, 24, %%l2\n" \
  204. "15:\t" "lduba [%2 + 6] %%asi, %%l1\n\t" \
  205. "sllx %%g1, 16, %%g1\n\t" \
  206. "or %%g7, %%l2, %%g7\n" \
  207. "16:\t" "lduba [%2 + 7] %%asi, %%l2\n\t" \
  208. "sllx %%l1, 8, %%l1\n\t" \
  209. "or %%g7, %%g1, %%g7\n\t" \
  210. "or %%l1, %%l2, %%l1\n\t" \
  211. "or %%g7, %%l1, %%g7\n\t" \
  212. "cmp %1, 8\n\t" \
  213. "be,a,pt %%icc, 0f\n\t" \
  214. " stx %%g7, [%0]\n\t" \
  215. "srlx %%g7, 32, %%l1\n\t" \
  216. "sra %%g7, 0, %%g7\n\t" \
  217. "stx %%l1, [%0]\n\t" \
  218. "stx %%g7, [%0 + 8]\n" \
  219. "0:\n\t" \
  220. "wr %%g0, %5, %%asi\n\n\t" \
  221. ".section __ex_table\n\t" \
  222. ".word 4b, " #errh "\n\t" \
  223. ".word 5b, " #errh "\n\t" \
  224. ".word 6b, " #errh "\n\t" \
  225. ".word 7b, " #errh "\n\t" \
  226. ".word 8b, " #errh "\n\t" \
  227. ".word 9b, " #errh "\n\t" \
  228. ".word 10b, " #errh "\n\t" \
  229. ".word 11b, " #errh "\n\t" \
  230. ".word 12b, " #errh "\n\t" \
  231. ".word 13b, " #errh "\n\t" \
  232. ".word 14b, " #errh "\n\t" \
  233. ".word 15b, " #errh "\n\t" \
  234. ".word 16b, " #errh "\n\n\t" \
  235. ".previous\n\t" \
  236. : : "r" (dest_reg), "r" (size), "r" (saddr), "r" (is_signed), \
  237. "r" (asi), "i" (ASI_AIUS) \
  238. : "l1", "l2", "g7", "g1", "cc"); \
  239. })
  240. #define store_common(dst_addr, size, src_val, asi, errh) ({ \
  241. __asm__ __volatile__ ( \
  242. "wr %3, 0, %%asi\n\t" \
  243. "ldx [%2], %%l1\n" \
  244. "cmp %1, 2\n\t" \
  245. "be,pn %%icc, 2f\n\t" \
  246. " cmp %1, 4\n\t" \
  247. "be,pt %%icc, 1f\n\t" \
  248. " srlx %%l1, 24, %%l2\n\t" \
  249. "srlx %%l1, 56, %%g1\n\t" \
  250. "srlx %%l1, 48, %%g7\n" \
  251. "4:\t" "stba %%g1, [%0] %%asi\n\t" \
  252. "srlx %%l1, 40, %%g1\n" \
  253. "5:\t" "stba %%g7, [%0 + 1] %%asi\n\t" \
  254. "srlx %%l1, 32, %%g7\n" \
  255. "6:\t" "stba %%g1, [%0 + 2] %%asi\n" \
  256. "7:\t" "stba %%g7, [%0 + 3] %%asi\n\t" \
  257. "srlx %%l1, 16, %%g1\n" \
  258. "8:\t" "stba %%l2, [%0 + 4] %%asi\n\t" \
  259. "srlx %%l1, 8, %%g7\n" \
  260. "9:\t" "stba %%g1, [%0 + 5] %%asi\n" \
  261. "10:\t" "stba %%g7, [%0 + 6] %%asi\n\t" \
  262. "ba,pt %%xcc, 0f\n" \
  263. "11:\t" " stba %%l1, [%0 + 7] %%asi\n" \
  264. "1:\t" "srl %%l1, 16, %%g7\n" \
  265. "12:\t" "stba %%l2, [%0] %%asi\n\t" \
  266. "srl %%l1, 8, %%l2\n" \
  267. "13:\t" "stba %%g7, [%0 + 1] %%asi\n" \
  268. "14:\t" "stba %%l2, [%0 + 2] %%asi\n\t" \
  269. "ba,pt %%xcc, 0f\n" \
  270. "15:\t" " stba %%l1, [%0 + 3] %%asi\n" \
  271. "2:\t" "srl %%l1, 8, %%l2\n" \
  272. "16:\t" "stba %%l2, [%0] %%asi\n" \
  273. "17:\t" "stba %%l1, [%0 + 1] %%asi\n" \
  274. "0:\n\t" \
  275. "wr %%g0, %4, %%asi\n\n\t" \
  276. ".section __ex_table\n\t" \
  277. ".word 4b, " #errh "\n\t" \
  278. ".word 5b, " #errh "\n\t" \
  279. ".word 6b, " #errh "\n\t" \
  280. ".word 7b, " #errh "\n\t" \
  281. ".word 8b, " #errh "\n\t" \
  282. ".word 9b, " #errh "\n\t" \
  283. ".word 10b, " #errh "\n\t" \
  284. ".word 11b, " #errh "\n\t" \
  285. ".word 12b, " #errh "\n\t" \
  286. ".word 13b, " #errh "\n\t" \
  287. ".word 14b, " #errh "\n\t" \
  288. ".word 15b, " #errh "\n\t" \
  289. ".word 16b, " #errh "\n\t" \
  290. ".word 17b, " #errh "\n\n\t" \
  291. ".previous\n\t" \
  292. : : "r" (dst_addr), "r" (size), "r" (src_val), "r" (asi), "i" (ASI_AIUS)\
  293. : "l1", "l2", "g7", "g1", "cc"); \
  294. })
  295. #define do_integer_store(reg_num, size, dst_addr, regs, asi, errh) ({ \
  296. unsigned long zero = 0; \
  297. unsigned long *src_val = &zero; \
  298. \
  299. if (size == 16) { \
  300. size = 8; \
  301. zero = (((long)(reg_num ? \
  302. (unsigned)fetch_reg(reg_num, regs) : 0)) << 32) | \
  303. (unsigned)fetch_reg(reg_num + 1, regs); \
  304. } else if (reg_num) src_val = fetch_reg_addr(reg_num, regs); \
  305. store_common(dst_addr, size, src_val, asi, errh); \
  306. })
  307. extern void smp_capture(void);
  308. extern void smp_release(void);
  309. #define do_atomic(srcdest_reg, mem, errh) ({ \
  310. unsigned long flags, tmp; \
  311. \
  312. smp_capture(); \
  313. local_irq_save(flags); \
  314. tmp = *srcdest_reg; \
  315. do_integer_load(srcdest_reg, 4, mem, 0, errh); \
  316. store_common(mem, 4, &tmp, errh); \
  317. local_irq_restore(flags); \
  318. smp_release(); \
  319. })
  320. static inline void advance(struct pt_regs *regs)
  321. {
  322. regs->tpc = regs->tnpc;
  323. regs->tnpc += 4;
  324. if (test_thread_flag(TIF_32BIT)) {
  325. regs->tpc &= 0xffffffff;
  326. regs->tnpc &= 0xffffffff;
  327. }
  328. }
  329. static inline int floating_point_load_or_store_p(unsigned int insn)
  330. {
  331. return (insn >> 24) & 1;
  332. }
  333. static inline int ok_for_kernel(unsigned int insn)
  334. {
  335. return !floating_point_load_or_store_p(insn);
  336. }
  337. void kernel_mna_trap_fault(struct pt_regs *regs, unsigned int insn) __asm__ ("kernel_mna_trap_fault");
  338. void kernel_mna_trap_fault(struct pt_regs *regs, unsigned int insn)
  339. {
  340. unsigned long g2 = regs->u_regs [UREG_G2];
  341. unsigned long fixup = search_extables_range(regs->tpc, &g2);
  342. if (!fixup) {
  343. unsigned long address = compute_effective_address(regs, insn, ((insn >> 25) & 0x1f));
  344. if (address < PAGE_SIZE) {
  345. printk(KERN_ALERT "Unable to handle kernel NULL pointer dereference in mna handler");
  346. } else
  347. printk(KERN_ALERT "Unable to handle kernel paging request in mna handler");
  348. printk(KERN_ALERT " at virtual address %016lx\n",address);
  349. printk(KERN_ALERT "current->{mm,active_mm}->context = %016lx\n",
  350. (current->mm ? CTX_HWBITS(current->mm->context) :
  351. CTX_HWBITS(current->active_mm->context)));
  352. printk(KERN_ALERT "current->{mm,active_mm}->pgd = %016lx\n",
  353. (current->mm ? (unsigned long) current->mm->pgd :
  354. (unsigned long) current->active_mm->pgd));
  355. die_if_kernel("Oops", regs);
  356. /* Not reached */
  357. }
  358. regs->tpc = fixup;
  359. regs->tnpc = regs->tpc + 4;
  360. regs->u_regs [UREG_G2] = g2;
  361. regs->tstate &= ~TSTATE_ASI;
  362. regs->tstate |= (ASI_AIUS << 24UL);
  363. }
  364. asmlinkage void kernel_unaligned_trap(struct pt_regs *regs, unsigned int insn, unsigned long sfar, unsigned long sfsr)
  365. {
  366. enum direction dir = decode_direction(insn);
  367. int size = decode_access_size(insn);
  368. if (!ok_for_kernel(insn) || dir == both) {
  369. printk("Unsupported unaligned load/store trap for kernel at <%016lx>.\n",
  370. regs->tpc);
  371. unaligned_panic("Kernel does fpu/atomic unaligned load/store.", regs);
  372. __asm__ __volatile__ ("\n"
  373. "kernel_unaligned_trap_fault:\n\t"
  374. "mov %0, %%o0\n\t"
  375. "call kernel_mna_trap_fault\n\t"
  376. " mov %1, %%o1\n\t"
  377. :
  378. : "r" (regs), "r" (insn)
  379. : "o0", "o1", "o2", "o3", "o4", "o5", "o7",
  380. "g1", "g2", "g3", "g4", "g7", "cc");
  381. } else {
  382. unsigned long addr = compute_effective_address(regs, insn, ((insn >> 25) & 0x1f));
  383. #ifdef DEBUG_MNA
  384. printk("KMNA: pc=%016lx [dir=%s addr=%016lx size=%d] retpc[%016lx]\n",
  385. regs->tpc, dirstrings[dir], addr, size, regs->u_regs[UREG_RETPC]);
  386. #endif
  387. switch (dir) {
  388. case load:
  389. do_integer_load(fetch_reg_addr(((insn>>25)&0x1f), regs),
  390. size, (unsigned long *) addr,
  391. decode_signedness(insn), decode_asi(insn, regs),
  392. kernel_unaligned_trap_fault);
  393. break;
  394. case store:
  395. do_integer_store(((insn>>25)&0x1f), size,
  396. (unsigned long *) addr, regs,
  397. decode_asi(insn, regs),
  398. kernel_unaligned_trap_fault);
  399. break;
  400. #if 0 /* unsupported */
  401. case both:
  402. do_atomic(fetch_reg_addr(((insn>>25)&0x1f), regs),
  403. (unsigned long *) addr,
  404. kernel_unaligned_trap_fault);
  405. break;
  406. #endif
  407. default:
  408. panic("Impossible kernel unaligned trap.");
  409. /* Not reached... */
  410. }
  411. advance(regs);
  412. }
  413. }
  414. static char popc_helper[] = {
  415. 0, 1, 1, 2, 1, 2, 2, 3,
  416. 1, 2, 2, 3, 2, 3, 3, 4,
  417. };
  418. int handle_popc(u32 insn, struct pt_regs *regs)
  419. {
  420. u64 value;
  421. int ret, i, rd = ((insn >> 25) & 0x1f);
  422. int from_kernel = (regs->tstate & TSTATE_PRIV) != 0;
  423. if (insn & 0x2000) {
  424. maybe_flush_windows(0, 0, rd, from_kernel);
  425. value = sign_extend_imm13(insn);
  426. } else {
  427. maybe_flush_windows(0, insn & 0x1f, rd, from_kernel);
  428. value = fetch_reg(insn & 0x1f, regs);
  429. }
  430. for (ret = 0, i = 0; i < 16; i++) {
  431. ret += popc_helper[value & 0xf];
  432. value >>= 4;
  433. }
  434. if (rd < 16) {
  435. if (rd)
  436. regs->u_regs[rd] = ret;
  437. } else {
  438. if (test_thread_flag(TIF_32BIT)) {
  439. struct reg_window32 __user *win32;
  440. win32 = (struct reg_window32 __user *)((unsigned long)((u32)regs->u_regs[UREG_FP]));
  441. put_user(ret, &win32->locals[rd - 16]);
  442. } else {
  443. struct reg_window __user *win;
  444. win = (struct reg_window __user *)(regs->u_regs[UREG_FP] + STACK_BIAS);
  445. put_user(ret, &win->locals[rd - 16]);
  446. }
  447. }
  448. advance(regs);
  449. return 1;
  450. }
  451. extern void do_fpother(struct pt_regs *regs);
  452. extern void do_privact(struct pt_regs *regs);
  453. extern void data_access_exception(struct pt_regs *regs,
  454. unsigned long sfsr,
  455. unsigned long sfar);
  456. int handle_ldf_stq(u32 insn, struct pt_regs *regs)
  457. {
  458. unsigned long addr = compute_effective_address(regs, insn, 0);
  459. int freg = ((insn >> 25) & 0x1e) | ((insn >> 20) & 0x20);
  460. struct fpustate *f = FPUSTATE;
  461. int asi = decode_asi(insn, regs);
  462. int flag = (freg < 32) ? FPRS_DL : FPRS_DU;
  463. save_and_clear_fpu();
  464. current_thread_info()->xfsr[0] &= ~0x1c000;
  465. if (freg & 3) {
  466. current_thread_info()->xfsr[0] |= (6 << 14) /* invalid_fp_register */;
  467. do_fpother(regs);
  468. return 0;
  469. }
  470. if (insn & 0x200000) {
  471. /* STQ */
  472. u64 first = 0, second = 0;
  473. if (current_thread_info()->fpsaved[0] & flag) {
  474. first = *(u64 *)&f->regs[freg];
  475. second = *(u64 *)&f->regs[freg+2];
  476. }
  477. if (asi < 0x80) {
  478. do_privact(regs);
  479. return 1;
  480. }
  481. switch (asi) {
  482. case ASI_P:
  483. case ASI_S: break;
  484. case ASI_PL:
  485. case ASI_SL:
  486. {
  487. /* Need to convert endians */
  488. u64 tmp = __swab64p(&first);
  489. first = __swab64p(&second);
  490. second = tmp;
  491. break;
  492. }
  493. default:
  494. data_access_exception(regs, 0, addr);
  495. return 1;
  496. }
  497. if (put_user (first >> 32, (u32 __user *)addr) ||
  498. __put_user ((u32)first, (u32 __user *)(addr + 4)) ||
  499. __put_user (second >> 32, (u32 __user *)(addr + 8)) ||
  500. __put_user ((u32)second, (u32 __user *)(addr + 12))) {
  501. data_access_exception(regs, 0, addr);
  502. return 1;
  503. }
  504. } else {
  505. /* LDF, LDDF, LDQF */
  506. u32 data[4] __attribute__ ((aligned(8)));
  507. int size, i;
  508. int err;
  509. if (asi < 0x80) {
  510. do_privact(regs);
  511. return 1;
  512. } else if (asi > ASI_SNFL) {
  513. data_access_exception(regs, 0, addr);
  514. return 1;
  515. }
  516. switch (insn & 0x180000) {
  517. case 0x000000: size = 1; break;
  518. case 0x100000: size = 4; break;
  519. default: size = 2; break;
  520. }
  521. for (i = 0; i < size; i++)
  522. data[i] = 0;
  523. err = get_user (data[0], (u32 __user *) addr);
  524. if (!err) {
  525. for (i = 1; i < size; i++)
  526. err |= __get_user (data[i], (u32 __user *)(addr + 4*i));
  527. }
  528. if (err && !(asi & 0x2 /* NF */)) {
  529. data_access_exception(regs, 0, addr);
  530. return 1;
  531. }
  532. if (asi & 0x8) /* Little */ {
  533. u64 tmp;
  534. switch (size) {
  535. case 1: data[0] = le32_to_cpup(data + 0); break;
  536. default:*(u64 *)(data + 0) = le64_to_cpup((u64 *)(data + 0));
  537. break;
  538. case 4: tmp = le64_to_cpup((u64 *)(data + 0));
  539. *(u64 *)(data + 0) = le64_to_cpup((u64 *)(data + 2));
  540. *(u64 *)(data + 2) = tmp;
  541. break;
  542. }
  543. }
  544. if (!(current_thread_info()->fpsaved[0] & FPRS_FEF)) {
  545. current_thread_info()->fpsaved[0] = FPRS_FEF;
  546. current_thread_info()->gsr[0] = 0;
  547. }
  548. if (!(current_thread_info()->fpsaved[0] & flag)) {
  549. if (freg < 32)
  550. memset(f->regs, 0, 32*sizeof(u32));
  551. else
  552. memset(f->regs+32, 0, 32*sizeof(u32));
  553. }
  554. memcpy(f->regs + freg, data, size * 4);
  555. current_thread_info()->fpsaved[0] |= flag;
  556. }
  557. advance(regs);
  558. return 1;
  559. }
  560. void handle_ld_nf(u32 insn, struct pt_regs *regs)
  561. {
  562. int rd = ((insn >> 25) & 0x1f);
  563. int from_kernel = (regs->tstate & TSTATE_PRIV) != 0;
  564. unsigned long *reg;
  565. maybe_flush_windows(0, 0, rd, from_kernel);
  566. reg = fetch_reg_addr(rd, regs);
  567. if (from_kernel || rd < 16) {
  568. reg[0] = 0;
  569. if ((insn & 0x780000) == 0x180000)
  570. reg[1] = 0;
  571. } else if (test_thread_flag(TIF_32BIT)) {
  572. put_user(0, (int __user *) reg);
  573. if ((insn & 0x780000) == 0x180000)
  574. put_user(0, ((int __user *) reg) + 1);
  575. } else {
  576. put_user(0, (unsigned long __user *) reg);
  577. if ((insn & 0x780000) == 0x180000)
  578. put_user(0, (unsigned long __user *) reg + 1);
  579. }
  580. advance(regs);
  581. }
  582. void handle_lddfmna(struct pt_regs *regs, unsigned long sfar, unsigned long sfsr)
  583. {
  584. unsigned long pc = regs->tpc;
  585. unsigned long tstate = regs->tstate;
  586. u32 insn;
  587. u32 first, second;
  588. u64 value;
  589. u8 asi, freg;
  590. int flag;
  591. struct fpustate *f = FPUSTATE;
  592. if (tstate & TSTATE_PRIV)
  593. die_if_kernel("lddfmna from kernel", regs);
  594. if (test_thread_flag(TIF_32BIT))
  595. pc = (u32)pc;
  596. if (get_user(insn, (u32 __user *) pc) != -EFAULT) {
  597. asi = sfsr >> 16;
  598. if ((asi > ASI_SNFL) ||
  599. (asi < ASI_P))
  600. goto daex;
  601. if (get_user(first, (u32 __user *)sfar) ||
  602. get_user(second, (u32 __user *)(sfar + 4))) {
  603. if (asi & 0x2) /* NF */ {
  604. first = 0; second = 0;
  605. } else
  606. goto daex;
  607. }
  608. save_and_clear_fpu();
  609. freg = ((insn >> 25) & 0x1e) | ((insn >> 20) & 0x20);
  610. value = (((u64)first) << 32) | second;
  611. if (asi & 0x8) /* Little */
  612. value = __swab64p(&value);
  613. flag = (freg < 32) ? FPRS_DL : FPRS_DU;
  614. if (!(current_thread_info()->fpsaved[0] & FPRS_FEF)) {
  615. current_thread_info()->fpsaved[0] = FPRS_FEF;
  616. current_thread_info()->gsr[0] = 0;
  617. }
  618. if (!(current_thread_info()->fpsaved[0] & flag)) {
  619. if (freg < 32)
  620. memset(f->regs, 0, 32*sizeof(u32));
  621. else
  622. memset(f->regs+32, 0, 32*sizeof(u32));
  623. }
  624. *(u64 *)(f->regs + freg) = value;
  625. current_thread_info()->fpsaved[0] |= flag;
  626. } else {
  627. daex: data_access_exception(regs, sfsr, sfar);
  628. return;
  629. }
  630. advance(regs);
  631. return;
  632. }
  633. void handle_stdfmna(struct pt_regs *regs, unsigned long sfar, unsigned long sfsr)
  634. {
  635. unsigned long pc = regs->tpc;
  636. unsigned long tstate = regs->tstate;
  637. u32 insn;
  638. u64 value;
  639. u8 asi, freg;
  640. int flag;
  641. struct fpustate *f = FPUSTATE;
  642. if (tstate & TSTATE_PRIV)
  643. die_if_kernel("stdfmna from kernel", regs);
  644. if (test_thread_flag(TIF_32BIT))
  645. pc = (u32)pc;
  646. if (get_user(insn, (u32 __user *) pc) != -EFAULT) {
  647. freg = ((insn >> 25) & 0x1e) | ((insn >> 20) & 0x20);
  648. asi = sfsr >> 16;
  649. value = 0;
  650. flag = (freg < 32) ? FPRS_DL : FPRS_DU;
  651. if ((asi > ASI_SNFL) ||
  652. (asi < ASI_P))
  653. goto daex;
  654. save_and_clear_fpu();
  655. if (current_thread_info()->fpsaved[0] & flag)
  656. value = *(u64 *)&f->regs[freg];
  657. switch (asi) {
  658. case ASI_P:
  659. case ASI_S: break;
  660. case ASI_PL:
  661. case ASI_SL:
  662. value = __swab64p(&value); break;
  663. default: goto daex;
  664. }
  665. if (put_user (value >> 32, (u32 __user *) sfar) ||
  666. __put_user ((u32)value, (u32 __user *)(sfar + 4)))
  667. goto daex;
  668. } else {
  669. daex: data_access_exception(regs, sfsr, sfar);
  670. return;
  671. }
  672. advance(regs);
  673. return;
  674. }