/* aes_asm.S */
  1. #include <linux/linkage.h>
  2. #include <asm/visasm.h>
  /*
   * Bit-field helpers used to hand-assemble instruction words.
   *
   * F3F(op, op3, opf) places its arguments at bit 30, bit 19 and bit 5
   * of the word (presumably the op/op3/opf fields of a SPARC format-3
   * instruction -- the shift amounts are all this file establishes).
   *
   * FPD_ENCODE(reg) folds bit 5 of a register number into bit 0 and
   * clears bit 5, so 0..31 pass through unchanged, 32 becomes 1 and
   * 62 becomes 31.  RS1/RS2/RS3/RD place that 5-bit value at bit 14,
   * bit 0, bit 9 and bit 25.  IMM5 places a raw (un-encoded) value at
   * bit 9, i.e. in the same position RS3 uses.
   */
  #define F3F(op, op3, opf)       (((opf) << 5) | ((op3) << 19) | ((op) << 30))
  #define FPD_ENCODE(reg)         (((reg) & ~(0x20)) | ((reg) >> 5))
  #define RS1(reg)                (FPD_ENCODE(reg) << 14)
  #define RS2(reg)                (FPD_ENCODE(reg) << 0)
  #define RS3(reg)                (FPD_ENCODE(reg) << 9)
  #define RD(reg)                 (FPD_ENCODE(reg) << 25)
  #define IMM5(val)               ((val) << 9)
  /*
   * Raw encodings of the AES instructions, emitted as .word so the file
   * does not depend on assembler support for the mnemonics.
   *
   * All register arguments are floating-point register numbers; they
   * are run through RS1/RS2/RS3/RD (and therefore FPD_ENCODE).
   *
   * AES_OP3_19(opf, a, b, c, d): word with F3F(2, 0x19, opf) and four
   *     register fields (a -> RS1, b -> RS2, c -> RS3, d -> RD).
   * AES_OP3_36(opf, a, b, c):    word with F3F(2, 0x36, opf) and three
   *     register fields (a -> RS1, b -> RS2, c -> RD).
   *
   * The E/D prefixes and the _L suffix presumably stand for encrypt,
   * decrypt and "last round"; only the opf values (0..7) differ.
   * AES_KEXPAND1 shares op3 0x19 (opf 8) but carries a 5-bit immediate
   * (IMM5) where the others carry RS3, so it is spelled out in full.
   */
  #define AES_OP3_19(opf, a, b, c, d) \
          .word (F3F(2, 0x19, opf)|RS1(a)|RS2(b)|RS3(c)|RD(d));
  #define AES_OP3_36(opf, a, b, c) \
          .word (F3F(2, 0x36, opf)|RS1(a)|RS2(b)|RD(c));

  #define AES_EROUND01(a,b,c,d)           AES_OP3_19(0, a, b, c, d)
  #define AES_EROUND23(a,b,c,d)           AES_OP3_19(1, a, b, c, d)
  #define AES_DROUND01(a,b,c,d)           AES_OP3_19(2, a, b, c, d)
  #define AES_DROUND23(a,b,c,d)           AES_OP3_19(3, a, b, c, d)
  #define AES_EROUND01_L(a,b,c,d)         AES_OP3_19(4, a, b, c, d)
  #define AES_EROUND23_L(a,b,c,d)         AES_OP3_19(5, a, b, c, d)
  #define AES_DROUND01_L(a,b,c,d)         AES_OP3_19(6, a, b, c, d)
  #define AES_DROUND23_L(a,b,c,d)         AES_OP3_19(7, a, b, c, d)

  #define AES_KEXPAND1(a,b,c,d) \
          .word (F3F(2, 0x19, 8)|RS1(a)|RS2(b)|IMM5(c)|RD(d));
  #define AES_KEXPAND0(a,b,c)             AES_OP3_36(0x130, a, b, c)
  #define AES_KEXPAND2(a,b,c)             AES_OP3_36(0x131, a, b, c)
  /*
   * Hand-encoded integer-register -> double-FP-register moves (the
   * macro names spell source and destination, e.g. G3_F4 = %g3 -> %f4).
   *
   * Every word shares the base pattern 0x81b02300; the destination FP
   * register number sits at bit 25 and the source integer register
   * number at bit 0 (%g3 = 3, %g7 = 7, %o0 = 8, %o1 = 9).  The
   * resulting words are:
   *
   *      MOVXTOD_G3_F4   0x89b02303
   *      MOVXTOD_G7_F6   0x8db02307
   *      MOVXTOD_G3_F0   0x81b02303
   *      MOVXTOD_G7_F2   0x85b02307
   *      MOVXTOD_O0_F0   0x81b02308
   *      MOVXTOD_O1_F2   0x85b02309
   *
   * MOVXTOD_WORD only handles destinations below %f32 (no FPD_ENCODE
   * folding is applied), which covers every use in this file.
   */
  #define MOVXTOD_WORD(rs2, rd) \
          .word (0x81b02300 | ((rd) << 25) | (rs2));

  #define MOVXTOD_G3_F4           MOVXTOD_WORD(3, 4)
  #define MOVXTOD_G7_F6           MOVXTOD_WORD(7, 6)
  #define MOVXTOD_G3_F0           MOVXTOD_WORD(3, 0)
  #define MOVXTOD_G7_F2           MOVXTOD_WORD(7, 2)
  #define MOVXTOD_O0_F0           MOVXTOD_WORD(8, 0)
  #define MOVXTOD_O1_F2           MOVXTOD_WORD(9, 2)
  /*
   * Encryption round sequences.
   *
   * KEY_BASE is the number of the first floating-point register that
   * holds round-key material; each two-round group consumes the four
   * doubles KEY_BASE+0, +2, +4 and +6.  I0/I1 hold the 128-bit state
   * on entry and on exit; T0/T1 are scratch registers that receive the
   * intermediate state after the first round of each pair.
   *
   * KEY_BASE is parenthesized wherever it is combined with an offset
   * so that an argument containing an operator that binds looser than
   * '+' (for example a shift or a bitwise OR) still yields the intended
   * register number.
   *
   * ENCRYPT_TWO_ROUNDS_LAST differs only in using the _L opcodes for
   * the second round of the pair.
   */
  #define ENCRYPT_TWO_ROUNDS(KEY_BASE, I0, I1, T0, T1) \
          AES_EROUND01((KEY_BASE) + 0, I0, I1, T0) \
          AES_EROUND23((KEY_BASE) + 2, I0, I1, T1) \
          AES_EROUND01((KEY_BASE) + 4, T0, T1, I0) \
          AES_EROUND23((KEY_BASE) + 6, T0, T1, I1)

  #define ENCRYPT_TWO_ROUNDS_LAST(KEY_BASE, I0, I1, T0, T1) \
          AES_EROUND01((KEY_BASE) + 0, I0, I1, T0) \
          AES_EROUND23((KEY_BASE) + 2, I0, I1, T1) \
          AES_EROUND01_L((KEY_BASE) + 4, T0, T1, I0) \
          AES_EROUND23_L((KEY_BASE) + 6, T0, T1, I1)

  /* 10 rounds: key material in registers KEY_BASE .. KEY_BASE + 38 */
  #define ENCRYPT_128(KEY_BASE, I0, I1, T0, T1) \
          ENCRYPT_TWO_ROUNDS((KEY_BASE) +  0, I0, I1, T0, T1) \
          ENCRYPT_TWO_ROUNDS((KEY_BASE) +  8, I0, I1, T0, T1) \
          ENCRYPT_TWO_ROUNDS((KEY_BASE) + 16, I0, I1, T0, T1) \
          ENCRYPT_TWO_ROUNDS((KEY_BASE) + 24, I0, I1, T0, T1) \
          ENCRYPT_TWO_ROUNDS_LAST((KEY_BASE) + 32, I0, I1, T0, T1)

  /* 12 rounds: key material in registers KEY_BASE .. KEY_BASE + 46 */
  #define ENCRYPT_192(KEY_BASE, I0, I1, T0, T1) \
          ENCRYPT_TWO_ROUNDS((KEY_BASE) +  0, I0, I1, T0, T1) \
          ENCRYPT_TWO_ROUNDS((KEY_BASE) +  8, I0, I1, T0, T1) \
          ENCRYPT_TWO_ROUNDS((KEY_BASE) + 16, I0, I1, T0, T1) \
          ENCRYPT_TWO_ROUNDS((KEY_BASE) + 24, I0, I1, T0, T1) \
          ENCRYPT_TWO_ROUNDS((KEY_BASE) + 32, I0, I1, T0, T1) \
          ENCRYPT_TWO_ROUNDS_LAST((KEY_BASE) + 40, I0, I1, T0, T1)

  /* 14 rounds: key material in registers KEY_BASE .. KEY_BASE + 54 */
  #define ENCRYPT_256(KEY_BASE, I0, I1, T0, T1) \
          ENCRYPT_TWO_ROUNDS((KEY_BASE) +  0, I0, I1, T0, T1) \
          ENCRYPT_TWO_ROUNDS((KEY_BASE) +  8, I0, I1, T0, T1) \
          ENCRYPT_TWO_ROUNDS((KEY_BASE) + 16, I0, I1, T0, T1) \
          ENCRYPT_TWO_ROUNDS((KEY_BASE) + 24, I0, I1, T0, T1) \
          ENCRYPT_TWO_ROUNDS((KEY_BASE) + 32, I0, I1, T0, T1) \
          ENCRYPT_TWO_ROUNDS((KEY_BASE) + 40, I0, I1, T0, T1) \
          ENCRYPT_TWO_ROUNDS_LAST((KEY_BASE) + 48, I0, I1, T0, T1)
  /*
   * Decryption round sequences.
   *
   * KEY_TOP is one double past the highest floating-point register
   * holding round-key material: each two-round group consumes the four
   * doubles KEY_TOP-2, -4, -6 and -8, walking downwards.  I0/I1 hold
   * the 128-bit state on entry and on exit; T0/T1 are scratch.
   *
   * KEY_TOP is parenthesized wherever it is combined with an offset so
   * that an argument containing an operator that binds looser than '-'
   * still yields the intended register number.
   *
   * DECRYPT_TWO_ROUNDS_LAST differs only in using the _L opcodes for
   * the second round of the pair.
   */
  #define DECRYPT_TWO_ROUNDS(KEY_TOP, I0, I1, T0, T1) \
          AES_DROUND23((KEY_TOP) - 2, I0, I1, T1) \
          AES_DROUND01((KEY_TOP) - 4, I0, I1, T0) \
          AES_DROUND23((KEY_TOP) - 6, T0, T1, I1) \
          AES_DROUND01((KEY_TOP) - 8, T0, T1, I0)

  #define DECRYPT_TWO_ROUNDS_LAST(KEY_TOP, I0, I1, T0, T1) \
          AES_DROUND23((KEY_TOP) - 2, I0, I1, T1) \
          AES_DROUND01((KEY_TOP) - 4, I0, I1, T0) \
          AES_DROUND23_L((KEY_TOP) - 6, T0, T1, I1) \
          AES_DROUND01_L((KEY_TOP) - 8, T0, T1, I0)

  /* 10 rounds: key material in registers KEY_TOP - 40 .. KEY_TOP - 2 */
  #define DECRYPT_128(KEY_TOP, I0, I1, T0, T1) \
          DECRYPT_TWO_ROUNDS((KEY_TOP) -  0, I0, I1, T0, T1) \
          DECRYPT_TWO_ROUNDS((KEY_TOP) -  8, I0, I1, T0, T1) \
          DECRYPT_TWO_ROUNDS((KEY_TOP) - 16, I0, I1, T0, T1) \
          DECRYPT_TWO_ROUNDS((KEY_TOP) - 24, I0, I1, T0, T1) \
          DECRYPT_TWO_ROUNDS_LAST((KEY_TOP) - 32, I0, I1, T0, T1)

  /* 12 rounds: key material in registers KEY_TOP - 48 .. KEY_TOP - 2 */
  #define DECRYPT_192(KEY_TOP, I0, I1, T0, T1) \
          DECRYPT_TWO_ROUNDS((KEY_TOP) -  0, I0, I1, T0, T1) \
          DECRYPT_TWO_ROUNDS((KEY_TOP) -  8, I0, I1, T0, T1) \
          DECRYPT_TWO_ROUNDS((KEY_TOP) - 16, I0, I1, T0, T1) \
          DECRYPT_TWO_ROUNDS((KEY_TOP) - 24, I0, I1, T0, T1) \
          DECRYPT_TWO_ROUNDS((KEY_TOP) - 32, I0, I1, T0, T1) \
          DECRYPT_TWO_ROUNDS_LAST((KEY_TOP) - 40, I0, I1, T0, T1)

  /* 14 rounds: key material in registers KEY_TOP - 56 .. KEY_TOP - 2 */
  #define DECRYPT_256(KEY_TOP, I0, I1, T0, T1) \
          DECRYPT_TWO_ROUNDS((KEY_TOP) -  0, I0, I1, T0, T1) \
          DECRYPT_TWO_ROUNDS((KEY_TOP) -  8, I0, I1, T0, T1) \
          DECRYPT_TWO_ROUNDS((KEY_TOP) - 16, I0, I1, T0, T1) \
          DECRYPT_TWO_ROUNDS((KEY_TOP) - 24, I0, I1, T0, T1) \
          DECRYPT_TWO_ROUNDS((KEY_TOP) - 32, I0, I1, T0, T1) \
          DECRYPT_TWO_ROUNDS((KEY_TOP) - 40, I0, I1, T0, T1) \
          DECRYPT_TWO_ROUNDS_LAST((KEY_TOP) - 48, I0, I1, T0, T1)
  /*
   * aes_sparc64_key_expand - expand a raw AES key into a key schedule.
   *
   *      %o0 = input_key   raw key, read with 32-bit loads
   *      %o1 = output_key  destination for the schedule, written with
   *                        64-bit stores
   *      %o2 = key_len     compared against 24: below selects the
   *                        128-bit path, equal the 192-bit path, above
   *                        the 256-bit path
   *
   * The raw key is copied to the start of the output first; the
   * expanded words are then generated entirely in floating-point
   * registers and stored behind it.  Total bytes written: 176 for
   * 128-bit, 208 for 192-bit and 240 for 256-bit keys.
   *
   * Runs between VISEntry and VISExit; %o1 is advanced as a side
   * effect.
   */
  ENTRY(aes_sparc64_key_expand)
          /* %o0=input_key, %o1=output_key, %o2=key_len */
          VISEntry

          /* First 16 key bytes are common to every key size. */
          ld              [%o0 + 0x00], %f0
          ld              [%o0 + 0x04], %f1
          ld              [%o0 + 0x08], %f2
          ld              [%o0 + 0x0c], %f3

          std             %f0, [%o1 + 0x00]
          std             %f2, [%o1 + 0x08]
          add             %o1, 0x10, %o1

          cmp             %o2, 24
          bl              .Lkexp_128
           nop

          be              .Lkexp_192
           nop

          /* 256-bit key expansion: 16 more raw key bytes in %f4-%f7 */
          ld              [%o0 + 0x10], %f4
          ld              [%o0 + 0x14], %f5
          ld              [%o0 + 0x18], %f6
          ld              [%o0 + 0x1c], %f7

          std             %f4, [%o1 + 0x00]
          std             %f6, [%o1 + 0x08]
          add             %o1, 0x10, %o1

          AES_KEXPAND1(0, 6, 0x0, 8)
          AES_KEXPAND2(2, 8, 10)
          AES_KEXPAND0(4, 10, 12)
          AES_KEXPAND2(6, 12, 14)
          AES_KEXPAND1(8, 14, 0x1, 16)
          AES_KEXPAND2(10, 16, 18)
          AES_KEXPAND0(12, 18, 20)
          AES_KEXPAND2(14, 20, 22)
          AES_KEXPAND1(16, 22, 0x2, 24)
          AES_KEXPAND2(18, 24, 26)
          AES_KEXPAND0(20, 26, 28)
          AES_KEXPAND2(22, 28, 30)
          AES_KEXPAND1(24, 30, 0x3, 32)
          AES_KEXPAND2(26, 32, 34)
          AES_KEXPAND0(28, 34, 36)
          AES_KEXPAND2(30, 36, 38)
          AES_KEXPAND1(32, 38, 0x4, 40)
          AES_KEXPAND2(34, 40, 42)
          AES_KEXPAND0(36, 42, 44)
          AES_KEXPAND2(38, 44, 46)
          AES_KEXPAND1(40, 46, 0x5, 48)
          AES_KEXPAND2(42, 48, 50)
          AES_KEXPAND0(44, 50, 52)
          AES_KEXPAND2(46, 52, 54)
          AES_KEXPAND1(48, 54, 0x6, 56)
          AES_KEXPAND2(50, 56, 58)

          std             %f8, [%o1 + 0x00]
          std             %f10, [%o1 + 0x08]
          std             %f12, [%o1 + 0x10]
          std             %f14, [%o1 + 0x18]
          std             %f16, [%o1 + 0x20]
          std             %f18, [%o1 + 0x28]
          std             %f20, [%o1 + 0x30]
          std             %f22, [%o1 + 0x38]
          std             %f24, [%o1 + 0x40]
          std             %f26, [%o1 + 0x48]
          std             %f28, [%o1 + 0x50]
          std             %f30, [%o1 + 0x58]
          std             %f32, [%o1 + 0x60]
          std             %f34, [%o1 + 0x68]
          std             %f36, [%o1 + 0x70]
          std             %f38, [%o1 + 0x78]
          std             %f40, [%o1 + 0x80]
          std             %f42, [%o1 + 0x88]
          std             %f44, [%o1 + 0x90]
          std             %f46, [%o1 + 0x98]
          std             %f48, [%o1 + 0xa0]
          std             %f50, [%o1 + 0xa8]
          std             %f52, [%o1 + 0xb0]
          std             %f54, [%o1 + 0xb8]
          std             %f56, [%o1 + 0xc0]
          ba,pt           %xcc, .Lkexp_done
           std            %f58, [%o1 + 0xc8]      /* last store rides in the delay slot */

  .Lkexp_192:
          /* 192-bit key expansion: 8 more raw key bytes in %f4/%f5 */
          ld              [%o0 + 0x10], %f4
          ld              [%o0 + 0x14], %f5

          std             %f4, [%o1 + 0x00]
          add             %o1, 0x08, %o1

          AES_KEXPAND1(0, 4, 0x0, 6)
          AES_KEXPAND2(2, 6, 8)
          AES_KEXPAND2(4, 8, 10)
          AES_KEXPAND1(6, 10, 0x1, 12)
          AES_KEXPAND2(8, 12, 14)
          AES_KEXPAND2(10, 14, 16)
          AES_KEXPAND1(12, 16, 0x2, 18)
          AES_KEXPAND2(14, 18, 20)
          AES_KEXPAND2(16, 20, 22)
          AES_KEXPAND1(18, 22, 0x3, 24)
          AES_KEXPAND2(20, 24, 26)
          AES_KEXPAND2(22, 26, 28)
          AES_KEXPAND1(24, 28, 0x4, 30)
          AES_KEXPAND2(26, 30, 32)
          AES_KEXPAND2(28, 32, 34)
          AES_KEXPAND1(30, 34, 0x5, 36)
          AES_KEXPAND2(32, 36, 38)
          AES_KEXPAND2(34, 38, 40)
          AES_KEXPAND1(36, 40, 0x6, 42)
          AES_KEXPAND2(38, 42, 44)
          AES_KEXPAND2(40, 44, 46)
          AES_KEXPAND1(42, 46, 0x7, 48)
          AES_KEXPAND2(44, 48, 50)

          std             %f6, [%o1 + 0x00]
          std             %f8, [%o1 + 0x08]
          std             %f10, [%o1 + 0x10]
          std             %f12, [%o1 + 0x18]
          std             %f14, [%o1 + 0x20]
          std             %f16, [%o1 + 0x28]
          std             %f18, [%o1 + 0x30]
          std             %f20, [%o1 + 0x38]
          std             %f22, [%o1 + 0x40]
          std             %f24, [%o1 + 0x48]
          std             %f26, [%o1 + 0x50]
          std             %f28, [%o1 + 0x58]
          std             %f30, [%o1 + 0x60]
          std             %f32, [%o1 + 0x68]
          std             %f34, [%o1 + 0x70]
          std             %f36, [%o1 + 0x78]
          std             %f38, [%o1 + 0x80]
          std             %f40, [%o1 + 0x88]
          std             %f42, [%o1 + 0x90]
          std             %f44, [%o1 + 0x98]
          std             %f46, [%o1 + 0xa0]
          std             %f48, [%o1 + 0xa8]
          ba,pt           %xcc, .Lkexp_done
           std            %f50, [%o1 + 0xb0]      /* last store rides in the delay slot */

  .Lkexp_128:
          /* 128-bit key expansion: the whole raw key is already in %f0-%f3 */
          AES_KEXPAND1(0, 2, 0x0, 4)
          AES_KEXPAND2(2, 4, 6)
          AES_KEXPAND1(4, 6, 0x1, 8)
          AES_KEXPAND2(6, 8, 10)
          AES_KEXPAND1(8, 10, 0x2, 12)
          AES_KEXPAND2(10, 12, 14)
          AES_KEXPAND1(12, 14, 0x3, 16)
          AES_KEXPAND2(14, 16, 18)
          AES_KEXPAND1(16, 18, 0x4, 20)
          AES_KEXPAND2(18, 20, 22)
          AES_KEXPAND1(20, 22, 0x5, 24)
          AES_KEXPAND2(22, 24, 26)
          AES_KEXPAND1(24, 26, 0x6, 28)
          AES_KEXPAND2(26, 28, 30)
          AES_KEXPAND1(28, 30, 0x7, 32)
          AES_KEXPAND2(30, 32, 34)
          AES_KEXPAND1(32, 34, 0x8, 36)
          AES_KEXPAND2(34, 36, 38)
          AES_KEXPAND1(36, 38, 0x9, 40)
          AES_KEXPAND2(38, 40, 42)

          std             %f4, [%o1 + 0x00]
          std             %f6, [%o1 + 0x08]
          std             %f8, [%o1 + 0x10]
          std             %f10, [%o1 + 0x18]
          std             %f12, [%o1 + 0x20]
          std             %f14, [%o1 + 0x28]
          std             %f16, [%o1 + 0x30]
          std             %f18, [%o1 + 0x38]
          std             %f20, [%o1 + 0x40]
          std             %f22, [%o1 + 0x48]
          std             %f24, [%o1 + 0x50]
          std             %f26, [%o1 + 0x58]
          std             %f28, [%o1 + 0x60]
          std             %f30, [%o1 + 0x68]
          std             %f32, [%o1 + 0x70]
          std             %f34, [%o1 + 0x78]
          std             %f36, [%o1 + 0x80]
          std             %f38, [%o1 + 0x88]
          std             %f40, [%o1 + 0x90]
          std             %f42, [%o1 + 0x98]

  .Lkexp_done:
          retl
           VISExit
  ENDPROC(aes_sparc64_key_expand)
  /*
   * aes_sparc64_encrypt - encrypt one 16-byte block.
   *
   *      %o0 = key      expanded key schedule (advanced internally for
   *                     192- and 256-bit keys)
   *      %o1 = input    16 bytes, read with 32-bit loads
   *      %o2 = output   16 bytes, written with 32-bit stores
   *      %o3 = key_len  compared against 24 to select the key size
   *
   * The first 16 schedule bytes are XORed into the block.  256-bit keys
   * then run four extra rounds and 192-bit keys two extra rounds (each
   * step consumes 0x20 bytes of schedule and bumps %o0) before all
   * sizes fall into the shared 10-round tail.
   *
   * Runs between VISEntry and VISExit.
   */
  ENTRY(aes_sparc64_encrypt)
          /* %o0=key, %o1=input, %o2=output, %o3=key_len */
          VISEntry

          ld              [%o1 + 0x00], %f4
          ld              [%o1 + 0x04], %f5
          ld              [%o1 + 0x08], %f6
          ld              [%o1 + 0x0c], %f7

          ldd             [%o0 + 0x00], %f8
          ldd             [%o0 + 0x08], %f10
          cmp             %o3, 24
          fxor            %f8, %f4, %f4
          bl              .Lenc_128
           fxor           %f10, %f6, %f6

          /*
           * The delay-slot load below executes on both paths, so %f8 is
           * already filled when the 192-bit entry point is reached.
           */
          be              .Lenc_192
           ldd            [%o0 + 0x10], %f8

          /* 256-bit only: two extra rounds */
          ldd             [%o0 + 0x18], %f10
          ldd             [%o0 + 0x20], %f12
          ldd             [%o0 + 0x28], %f14
          add             %o0, 0x20, %o0

          ENCRYPT_TWO_ROUNDS(8, 4, 6, 0, 2)

          ldd             [%o0 + 0x10], %f8

  .Lenc_192:
          /* 192- and 256-bit: two more rounds */
          ldd             [%o0 + 0x18], %f10
          ldd             [%o0 + 0x20], %f12
          ldd             [%o0 + 0x28], %f14
          add             %o0, 0x20, %o0

          ENCRYPT_TWO_ROUNDS(8, 4, 6, 0, 2)

  .Lenc_128:
          /* Common tail: 20 doubles of key material, 10 rounds */
          ldd             [%o0 + 0x10], %f12
          ldd             [%o0 + 0x18], %f14
          ldd             [%o0 + 0x20], %f16
          ldd             [%o0 + 0x28], %f18
          ldd             [%o0 + 0x30], %f20
          ldd             [%o0 + 0x38], %f22
          ldd             [%o0 + 0x40], %f24
          ldd             [%o0 + 0x48], %f26
          ldd             [%o0 + 0x50], %f28
          ldd             [%o0 + 0x58], %f30
          ldd             [%o0 + 0x60], %f32
          ldd             [%o0 + 0x68], %f34
          ldd             [%o0 + 0x70], %f36
          ldd             [%o0 + 0x78], %f38
          ldd             [%o0 + 0x80], %f40
          ldd             [%o0 + 0x88], %f42
          ldd             [%o0 + 0x90], %f44
          ldd             [%o0 + 0x98], %f46
          ldd             [%o0 + 0xa0], %f48
          ldd             [%o0 + 0xa8], %f50

          ENCRYPT_128(12, 4, 6, 0, 2)

          st              %f4, [%o2 + 0x00]
          st              %f5, [%o2 + 0x04]
          st              %f6, [%o2 + 0x08]
          st              %f7, [%o2 + 0x0c]

          retl
           VISExit
  ENDPROC(aes_sparc64_encrypt)
  /*
   * aes_sparc64_decrypt - decrypt one 16-byte block.
   *
   *      %o0 = key          start of the expanded key schedule
   *      %o1 = input        16 bytes, read with 32-bit loads
   *      %o2 = output       16 bytes, written with 32-bit stores
   *      %o3 = key_len      compared against 24 to select the key size
   *      %o4 = exp_key_len  added to %o0, so that %o0 points just past
   *                         the end of the schedule
   *
   * The schedule is consumed from its end towards its start.  The last
   * 16 bytes are XORed into the block; 256-bit keys then run four extra
   * rounds and 192-bit keys two extra rounds (each step moves %o0 down
   * by 0x20) before all sizes fall into the shared 10-round tail.
   *
   * Runs between VISEntry and VISExit.
   */
  ENTRY(aes_sparc64_decrypt)
          /* %o0=key, %o1=input, %o2=output, %o3=key_len, %o4=exp_key_len */
          VISEntry

          ld              [%o1 + 0x00], %f4
          add             %o0, %o4, %o0           /* %o0 = end of schedule */
          ld              [%o1 + 0x04], %f5
          ld              [%o1 + 0x08], %f6
          ld              [%o1 + 0x0c], %f7

          ldd             [%o0 - 0x08], %f8
          ldd             [%o0 - 0x10], %f10

          cmp             %o3, 24
          fxor            %f10, %f4, %f4
          bl              .Ldec_128
           fxor           %f8, %f6, %f6

          /*
           * The delay-slot load below executes on both paths, so %f8 is
           * already filled when the 192-bit entry point is reached.
           */
          be              .Ldec_192
           ldd            [%o0 - 0x30], %f8

          /* 256-bit only: two extra rounds */
          ldd             [%o0 - 0x28], %f10
          ldd             [%o0 - 0x20], %f12
          ldd             [%o0 - 0x18], %f14
          sub             %o0, 0x20, %o0

          DECRYPT_TWO_ROUNDS(16, 4, 6, 0, 2)

          ldd             [%o0 - 0x30], %f8

  .Ldec_192:
          /* 192- and 256-bit: two more rounds */
          ldd             [%o0 - 0x28], %f10
          ldd             [%o0 - 0x20], %f12
          ldd             [%o0 - 0x18], %f14
          sub             %o0, 0x20, %o0

          DECRYPT_TWO_ROUNDS(16, 4, 6, 0, 2)

  .Ldec_128:
          /* Common tail: 20 doubles of key material, 10 rounds */
          ldd             [%o0 - 0xb0], %f12
          ldd             [%o0 - 0xa8], %f14
          ldd             [%o0 - 0xa0], %f16
          ldd             [%o0 - 0x98], %f18
          ldd             [%o0 - 0x90], %f20
          ldd             [%o0 - 0x88], %f22
          ldd             [%o0 - 0x80], %f24
          ldd             [%o0 - 0x78], %f26
          ldd             [%o0 - 0x70], %f28
          ldd             [%o0 - 0x68], %f30
          ldd             [%o0 - 0x60], %f32
          ldd             [%o0 - 0x58], %f34
          ldd             [%o0 - 0x50], %f36
          ldd             [%o0 - 0x48], %f38
          ldd             [%o0 - 0x40], %f40
          ldd             [%o0 - 0x38], %f42
          ldd             [%o0 - 0x30], %f44
          ldd             [%o0 - 0x28], %f46
          ldd             [%o0 - 0x20], %f48
          ldd             [%o0 - 0x18], %f50

          DECRYPT_128(52, 4, 6, 0, 2)

          st              %f4, [%o2 + 0x00]
          st              %f5, [%o2 + 0x04]
          st              %f6, [%o2 + 0x08]
          st              %f7, [%o2 + 0x0c]

          retl
           VISExit
  ENDPROC(aes_sparc64_decrypt)
  /*
   * aes_sparc64_load_decrypt_keys - preload key material for the bulk
   * decrypt routines.
   *
   *      %o0 = key
   *
   * Tail-branches into aes_sparc64_load_encrypt_keys with %o0 lowered
   * by 0x10 (done in the branch delay slot).  That routine loads from
   * [%o0 + 0x10] upwards, so the net effect is that %f8-%f62 are filled
   * from key + 0x00 .. key + 0xdf instead of key + 0x10 .. key + 0xef.
   */
  ENTRY(aes_sparc64_load_decrypt_keys)
          /* %o0=key */
          ba,pt           %xcc, aes_sparc64_load_encrypt_keys
           sub            %o0, 0x10, %o0
  ENDPROC(aes_sparc64_load_decrypt_keys)
  /*
   * aes_sparc64_load_encrypt_keys - preload key material into the
   * floating-point register file.
   *
   *      %o0 = key
   *
   * Loads the 28 doubles at key + 0x10 .. key + 0xef into %f8-%f62,
   * regardless of key size.  VISEntry is executed here but there is no
   * matching VISExit in this routine; presumably the caller restores
   * the FPU state once the bulk operation is finished -- confirm
   * against the C glue code.
   */
  ENTRY(aes_sparc64_load_encrypt_keys)
          /* %o0=key */
          VISEntry

          ldd             [%o0 + 0x10], %f8
          ldd             [%o0 + 0x18], %f10
          ldd             [%o0 + 0x20], %f12
          ldd             [%o0 + 0x28], %f14
          ldd             [%o0 + 0x30], %f16
          ldd             [%o0 + 0x38], %f18
          ldd             [%o0 + 0x40], %f20
          ldd             [%o0 + 0x48], %f22
          ldd             [%o0 + 0x50], %f24
          ldd             [%o0 + 0x58], %f26
          ldd             [%o0 + 0x60], %f28
          ldd             [%o0 + 0x68], %f30
          ldd             [%o0 + 0x70], %f32
          ldd             [%o0 + 0x78], %f34
          ldd             [%o0 + 0x80], %f36
          ldd             [%o0 + 0x88], %f38
          ldd             [%o0 + 0x90], %f40
          ldd             [%o0 + 0x98], %f42
          ldd             [%o0 + 0xa0], %f44
          ldd             [%o0 + 0xa8], %f46
          ldd             [%o0 + 0xb0], %f48
          ldd             [%o0 + 0xb8], %f50
          ldd             [%o0 + 0xc0], %f52
          ldd             [%o0 + 0xc8], %f54
          ldd             [%o0 + 0xd0], %f56
          ldd             [%o0 + 0xd8], %f58
          ldd             [%o0 + 0xe0], %f60
          retl
           ldd            [%o0 + 0xe8], %f62      /* final load rides in the delay slot */
  ENDPROC(aes_sparc64_load_encrypt_keys)
  /*
   * aes_sparc64_ecb_encrypt - ECB-encrypt a run of 16-byte blocks.
   *
   *      %o0 = key      expanded key schedule; only its first 16 bytes
   *                     are read here (into %g1/%g2)
   *      %o1 = input    advanced by 16 per block
   *      %o2 = output   advanced by 16 per block
   *      %o3 = key_len  compared against 24 to select the key size
   *      %o4 = len      byte count
   *
   * The remaining round keys are taken from %f8 upwards and are not
   * loaded here; presumably the caller has run
   * aes_sparc64_load_encrypt_keys first -- confirm against the caller.
   *
   * len == 0 returns immediately.  Each loop is a do-while that exits
   * only when the count reaches exactly zero, so without this check a
   * zero length would wrap the counter and run off the buffers.  For
   * the same reason len must be a multiple of 16.
   *
   * Uses %g1, %g2, %g3, %g7 and %f0-%f6 as scratch.
   */
  ENTRY(aes_sparc64_ecb_encrypt)
          /* %o0=key, %o1=input, %o2=output, %o3=key_len, %o4=len */
          brz,pn          %o4, .Lecb_enc_done     /* nothing to do */
           nop
          ldx             [%o0 + 0x00], %g1
          ldx             [%o0 + 0x08], %g2
          cmp             %o3, 24
          bl              .Lecb_enc_128
           nop
          be              .Lecb_enc_192
           nop

  .Lecb_enc_256:
          /* 256-bit key */
          ldx             [%o1 + 0x00], %g3
          ldx             [%o1 + 0x08], %g7
          add             %o1, 0x10, %o1
          xor             %g1, %g3, %g3           /* initial key XOR in integer regs */
          xor             %g2, %g7, %g7
          MOVXTOD_G3_F4
          MOVXTOD_G7_F6

          ENCRYPT_256(8, 4, 6, 0, 2)

          std             %f4, [%o2 + 0x00]
          std             %f6, [%o2 + 0x08]
          subcc           %o4, 0x10, %o4
          bne,pt          %xcc, .Lecb_enc_256
           add            %o2, 0x10, %o2

          retl
           nop

  .Lecb_enc_192:
          /* 192-bit key */
          ldx             [%o1 + 0x00], %g3
          ldx             [%o1 + 0x08], %g7
          add             %o1, 0x10, %o1
          xor             %g1, %g3, %g3
          xor             %g2, %g7, %g7
          MOVXTOD_G3_F4
          MOVXTOD_G7_F6

          ENCRYPT_192(8, 4, 6, 0, 2)

          std             %f4, [%o2 + 0x00]
          std             %f6, [%o2 + 0x08]
          subcc           %o4, 0x10, %o4
          bne,pt          %xcc, .Lecb_enc_192
           add            %o2, 0x10, %o2

          retl
           nop

  .Lecb_enc_128:
          /* 128-bit key */
          ldx             [%o1 + 0x00], %g3
          ldx             [%o1 + 0x08], %g7
          add             %o1, 0x10, %o1
          xor             %g1, %g3, %g3
          xor             %g2, %g7, %g7
          MOVXTOD_G3_F4
          MOVXTOD_G7_F6

          ENCRYPT_128(8, 4, 6, 0, 2)

          std             %f4, [%o2 + 0x00]
          std             %f6, [%o2 + 0x08]
          subcc           %o4, 0x10, %o4
          bne,pt          %xcc, .Lecb_enc_128
           add            %o2, 0x10, %o2

  .Lecb_enc_done:
          retl
           nop
  ENDPROC(aes_sparc64_ecb_encrypt)
  /*
   * aes_sparc64_ecb_decrypt - ECB-decrypt a run of 16-byte blocks.
   *
   *      %o0 = &key[key_len]  pointer just past the key material; only
   *                           the 16 bytes immediately below it are
   *                           read here (into %g1/%g2)
   *      %o1 = input          advanced by 16 per block
   *      %o2 = output         advanced by 16 per block
   *      %o3 = key_len        compared against 24 to select the key size
   *      %o4 = len            byte count
   *
   * %o5 is not used by this routine.
   *
   * The remaining round keys are taken from %f8 upwards and are not
   * loaded here; presumably the caller has run
   * aes_sparc64_load_decrypt_keys first -- confirm against the caller.
   *
   * len == 0 returns immediately.  Each loop is a do-while that exits
   * only when the count reaches exactly zero, so without this check a
   * zero length would wrap the counter and run off the buffers.  For
   * the same reason len must be a multiple of 16.
   *
   * Uses %g1, %g2, %g3, %g7 and %f0-%f6 as scratch.
   */
  ENTRY(aes_sparc64_ecb_decrypt)
          /* %o0=&key[key_len], %o1=input, %o2=output, %o3=key_len, %o4=len */
          brz,pn          %o4, .Lecb_dec_done     /* nothing to do */
           nop
          ldx             [%o0 - 0x10], %g1
          ldx             [%o0 - 0x08], %g2
          cmp             %o3, 24
          bl              .Lecb_dec_128
           nop
          be              .Lecb_dec_192
           nop

  .Lecb_dec_256:
          /* 256-bit key */
          ldx             [%o1 + 0x00], %g3
          ldx             [%o1 + 0x08], %g7
          add             %o1, 0x10, %o1
          xor             %g1, %g3, %g3           /* initial key XOR in integer regs */
          xor             %g2, %g7, %g7
          MOVXTOD_G3_F4
          MOVXTOD_G7_F6

          DECRYPT_256(64, 4, 6, 0, 2)

          std             %f4, [%o2 + 0x00]
          std             %f6, [%o2 + 0x08]
          subcc           %o4, 0x10, %o4
          bne,pt          %xcc, .Lecb_dec_256
           add            %o2, 0x10, %o2

          retl
           nop

  .Lecb_dec_192:
          /* 192-bit key */
          ldx             [%o1 + 0x00], %g3
          ldx             [%o1 + 0x08], %g7
          add             %o1, 0x10, %o1
          xor             %g1, %g3, %g3
          xor             %g2, %g7, %g7
          MOVXTOD_G3_F4
          MOVXTOD_G7_F6

          DECRYPT_192(56, 4, 6, 0, 2)

          std             %f4, [%o2 + 0x00]
          std             %f6, [%o2 + 0x08]
          subcc           %o4, 0x10, %o4
          bne,pt          %xcc, .Lecb_dec_192
           add            %o2, 0x10, %o2

          retl
           nop

  .Lecb_dec_128:
          /* 128-bit key */
          ldx             [%o1 + 0x00], %g3
          ldx             [%o1 + 0x08], %g7
          add             %o1, 0x10, %o1
          xor             %g1, %g3, %g3
          xor             %g2, %g7, %g7
          MOVXTOD_G3_F4
          MOVXTOD_G7_F6

          DECRYPT_128(48, 4, 6, 0, 2)

          std             %f4, [%o2 + 0x00]
          std             %f6, [%o2 + 0x08]
          subcc           %o4, 0x10, %o4
          bne,pt          %xcc, .Lecb_dec_128
           add            %o2, 0x10, %o2

  .Lecb_dec_done:
          retl
           nop
  ENDPROC(aes_sparc64_ecb_decrypt)
  /*
   * aes_sparc64_cbc_encrypt - CBC-encrypt a run of 16-byte blocks.
   *
   *      %o0 = key      expanded key schedule; only its first 16 bytes
   *                     are read here (into %g1/%g2)
   *      %o1 = input    advanced by 16 per block
   *      %o2 = output   advanced by 16 per block
   *      %o3 = key_len  compared against 24 to select the key size
   *      %o4 = len      byte count
   *      %o5 = iv       16-byte chaining value: read on entry, and
   *                     overwritten with the last ciphertext block on
   *                     exit
   *
   * The remaining round keys are taken from %f8 upwards and are not
   * loaded here; presumably the caller has run
   * aes_sparc64_load_encrypt_keys first -- confirm against the caller.
   *
   * %f4/%f6 carry the chaining value across iterations: each block is
   * XORed with the first round key in integer registers, moved to
   * %f0/%f2, XORed into %f4/%f6 and encrypted in place.
   *
   * len == 0 returns immediately and leaves the IV untouched.  Each
   * loop is a do-while that exits only when the count reaches exactly
   * zero, so without this check a zero length would wrap the counter
   * and run off the buffers.  For the same reason len must be a
   * multiple of 16.
   */
  ENTRY(aes_sparc64_cbc_encrypt)
          /* %o0=key, %o1=input, %o2=output, %o3=key_len, %o4=len, %o5=iv */
          brz,pn          %o4, .Lcbc_enc_done     /* nothing to do */
           nop
          ldd             [%o5 + 0x00], %f4
          ldd             [%o5 + 0x08], %f6
          ldx             [%o0 + 0x00], %g1
          ldx             [%o0 + 0x08], %g2
          cmp             %o3, 24
          bl              .Lcbc_enc_128
           nop
          be              .Lcbc_enc_192
           nop

  .Lcbc_enc_256:
          /* 256-bit key */
          ldx             [%o1 + 0x00], %g3
          ldx             [%o1 + 0x08], %g7
          add             %o1, 0x10, %o1
          xor             %g1, %g3, %g3
          xor             %g2, %g7, %g7
          MOVXTOD_G3_F0
          MOVXTOD_G7_F2
          fxor            %f4, %f0, %f4           /* chain in previous block / IV */
          fxor            %f6, %f2, %f6

          ENCRYPT_256(8, 4, 6, 0, 2)

          std             %f4, [%o2 + 0x00]
          std             %f6, [%o2 + 0x08]
          subcc           %o4, 0x10, %o4
          bne,pt          %xcc, .Lcbc_enc_256
           add            %o2, 0x10, %o2

          std             %f4, [%o5 + 0x00]
          std             %f6, [%o5 + 0x08]

          retl
           nop

  .Lcbc_enc_192:
          /* 192-bit key */
          ldx             [%o1 + 0x00], %g3
          ldx             [%o1 + 0x08], %g7
          add             %o1, 0x10, %o1
          xor             %g1, %g3, %g3
          xor             %g2, %g7, %g7
          MOVXTOD_G3_F0
          MOVXTOD_G7_F2
          fxor            %f4, %f0, %f4
          fxor            %f6, %f2, %f6

          ENCRYPT_192(8, 4, 6, 0, 2)

          std             %f4, [%o2 + 0x00]
          std             %f6, [%o2 + 0x08]
          subcc           %o4, 0x10, %o4
          bne,pt          %xcc, .Lcbc_enc_192
           add            %o2, 0x10, %o2

          std             %f4, [%o5 + 0x00]
          std             %f6, [%o5 + 0x08]

          retl
           nop

  .Lcbc_enc_128:
          /* 128-bit key */
          ldx             [%o1 + 0x00], %g3
          ldx             [%o1 + 0x08], %g7
          add             %o1, 0x10, %o1
          xor             %g1, %g3, %g3
          xor             %g2, %g7, %g7
          MOVXTOD_G3_F0
          MOVXTOD_G7_F2
          fxor            %f4, %f0, %f4
          fxor            %f6, %f2, %f6

          ENCRYPT_128(8, 4, 6, 0, 2)

          std             %f4, [%o2 + 0x00]
          std             %f6, [%o2 + 0x08]
          subcc           %o4, 0x10, %o4
          bne,pt          %xcc, .Lcbc_enc_128
           add            %o2, 0x10, %o2

          std             %f4, [%o5 + 0x00]
          std             %f6, [%o5 + 0x08]

  .Lcbc_enc_done:
          retl
           nop
  ENDPROC(aes_sparc64_cbc_encrypt)
  /*
   * aes_sparc64_cbc_decrypt - CBC-decrypt a run of 16-byte blocks.
   *
   *      %o0 = &key[key_len]  pointer just past the key material; only
   *                           the 16 bytes immediately below it are
   *                           read (into %g1/%g2)
   *      %o1 = key_len        compared against 24 to select the key size
   *      %o2 = input          advanced by 16 per block
   *      %o3 = output         advanced by 16 per block
   *      %o4 = len            byte count
   *      %o5 = iv             16-byte chaining value: read on entry,
   *                           and overwritten with the last ciphertext
   *                           block on exit
   *
   * Note the argument order differs from the other bulk routines
   * (key_len is in %o1 here).  Once the key words and key_len have been
   * consumed, %o0/%o1 are reused to carry the chaining value.
   *
   * The remaining round keys are taken from %f8 upwards and are not
   * loaded here; presumably the caller has run
   * aes_sparc64_load_decrypt_keys first -- confirm against the caller.
   *
   * Per block: the ciphertext is XORed with %g1/%g2 into %g3/%g7 and
   * decrypted in %f4/%f6.  The previous chaining value is moved from
   * %o0/%o1 to %f0/%f2 and XORed into the result, while %o0/%o1 are
   * refilled with the current ciphertext (XORing %g3/%g7 with %g1/%g2
   * again undoes the first XOR).
   *
   * len == 0 returns immediately and leaves the IV untouched.  Each
   * loop is a do-while that exits only when the count reaches exactly
   * zero, so without this check a zero length would wrap the counter
   * and run off the buffers.  For the same reason len must be a
   * multiple of 16.
   */
  ENTRY(aes_sparc64_cbc_decrypt)
          /* %o0=&key[key_len], %o1=key_len, %o2=input, %o3=output, %o4=len, %o5=iv */
          brz,pn          %o4, .Lcbc_dec_done     /* nothing to do */
           nop
          ldx             [%o0 - 0x10], %g1
          ldx             [%o0 - 0x08], %g2
          cmp             %o1, 24
          ldx             [%o5 + 0x00], %o0       /* %o0/%o1 now hold the IV */
          bl              .Lcbc_dec_128
           ldx            [%o5 + 0x08], %o1
          be              .Lcbc_dec_192
           nop

  .Lcbc_dec_256:
          /* 256-bit key */
          ldx             [%o2 + 0x00], %g3
          ldx             [%o2 + 0x08], %g7
          add             %o2, 0x10, %o2
          xor             %g1, %g3, %g3
          xor             %g2, %g7, %g7
          MOVXTOD_G3_F4
          MOVXTOD_G7_F6

          DECRYPT_256(64, 4, 6, 0, 2)

          MOVXTOD_O0_F0
          MOVXTOD_O1_F2
          xor             %g1, %g3, %o0           /* recover ciphertext as next chain value */
          xor             %g2, %g7, %o1
          fxor            %f4, %f0, %f4
          fxor            %f6, %f2, %f6
          std             %f4, [%o3 + 0x00]
          std             %f6, [%o3 + 0x08]
          subcc           %o4, 0x10, %o4
          bne,pt          %xcc, .Lcbc_dec_256
           add            %o3, 0x10, %o3

          stx             %o0, [%o5 + 0x00]
          stx             %o1, [%o5 + 0x08]

          retl
           nop

  .Lcbc_dec_192:
          /* 192-bit key */
          ldx             [%o2 + 0x00], %g3
          ldx             [%o2 + 0x08], %g7
          add             %o2, 0x10, %o2
          xor             %g1, %g3, %g3
          xor             %g2, %g7, %g7
          MOVXTOD_G3_F4
          MOVXTOD_G7_F6

          DECRYPT_192(56, 4, 6, 0, 2)

          MOVXTOD_O0_F0
          MOVXTOD_O1_F2
          xor             %g1, %g3, %o0
          xor             %g2, %g7, %o1
          fxor            %f4, %f0, %f4
          fxor            %f6, %f2, %f6
          std             %f4, [%o3 + 0x00]
          std             %f6, [%o3 + 0x08]
          subcc           %o4, 0x10, %o4
          bne,pt          %xcc, .Lcbc_dec_192
           add            %o3, 0x10, %o3

          stx             %o0, [%o5 + 0x00]
          stx             %o1, [%o5 + 0x08]

          retl
           nop

  .Lcbc_dec_128:
          /* 128-bit key */
          ldx             [%o2 + 0x00], %g3
          ldx             [%o2 + 0x08], %g7
          add             %o2, 0x10, %o2
          xor             %g1, %g3, %g3
          xor             %g2, %g7, %g7
          MOVXTOD_G3_F4
          MOVXTOD_G7_F6

          DECRYPT_128(48, 4, 6, 0, 2)

          MOVXTOD_O0_F0
          MOVXTOD_O1_F2
          xor             %g1, %g3, %o0
          xor             %g2, %g7, %o1
          fxor            %f4, %f0, %f4
          fxor            %f6, %f2, %f6
          std             %f4, [%o3 + 0x00]
          std             %f6, [%o3 + 0x08]
          subcc           %o4, 0x10, %o4
          bne,pt          %xcc, .Lcbc_dec_128
           add            %o3, 0x10, %o3

          stx             %o0, [%o5 + 0x00]
          stx             %o1, [%o5 + 0x08]

  .Lcbc_dec_done:
          retl
           nop
  ENDPROC(aes_sparc64_cbc_decrypt)