aes_asm.S 38 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
7127812791280128112821283128412851286128712881289129012911292129312941295129612971298129913001301130213031304130513061307130813091310131113121313131413151316131713181319132013211322132313241325132613271328132913301331133213331334133513361337133813391340134113421343134413451346134713481349135013511352135313541355135613571358135913601361136213631364136513661367136813691370137113721373137413751376137713781379138013811382138313841385138613871388138913901391139213931394139513961397139813991400140114021403140414051406140714081409141014111412141314141415141614171418141914201421142214231424142514261427142814291430143114321433143414351436143714381439144014411442144314441445144614471448144914501451145214531454145514561457145814591460146114621463146414651466146714681469147014711472147314741475147614771478147914801481148214831484148514861487148814891490149114921493149414951496149714981499150015011502150315041505150615071508150915101511151215131514151515161517151815191520152115221523152415251526152715281529
  1. #include <linux/linkage.h>
  2. #include <asm/visasm.h>
  3. #include "opcodes.h"
  /*
   * ENCRYPT_TWO_ROUNDS - two consecutive AES encryption rounds on one block.
   *
   * KEY_BASE: number of the first of the key registers used; the first round
   *           takes KEY_BASE + 0 and + 2, the second KEY_BASE + 4 and + 6.
   * I0, I1:   register pair holding the block; overwritten with the result.
   * T0, T1:   scratch pair that carries the state between the two rounds.
   *
   * The arguments are handed unchanged to the AES_EROUND01/23 helpers from
   * "opcodes.h"; the callers in this file pass floating-point register
   * numbers (for example keys from 12 upward, data in 4/6, scratch in 0/2).
   */
  #define ENCRYPT_TWO_ROUNDS(KEY_BASE, I0, I1, T0, T1) \
	AES_EROUND01(KEY_BASE +  0, I0, I1, T0) \
	AES_EROUND23(KEY_BASE +  2, I0, I1, T1) \
	AES_EROUND01(KEY_BASE +  4, T0, T1, I0) \
	AES_EROUND23(KEY_BASE +  6, T0, T1, I1)
  /*
   * ENCRYPT_TWO_ROUNDS_2 - two AES encryption rounds on two blocks at once.
   *
   * Same key registers as ENCRYPT_TWO_ROUNDS (KEY_BASE + 0 .. + 6), applied
   * to block A in I0/I1 (scratch T0/T1) and block B in I2/I3 (scratch T2/T3).
   * The round-one operations of both blocks are issued before any round-two
   * operation, so the two independent blocks are interleaved.
   */
  #define ENCRYPT_TWO_ROUNDS_2(KEY_BASE, I0, I1, I2, I3, T0, T1, T2, T3) \
	AES_EROUND01(KEY_BASE +  0, I0, I1, T0) \
	AES_EROUND23(KEY_BASE +  2, I0, I1, T1) \
	AES_EROUND01(KEY_BASE +  0, I2, I3, T2) \
	AES_EROUND23(KEY_BASE +  2, I2, I3, T3) \
	AES_EROUND01(KEY_BASE +  4, T0, T1, I0) \
	AES_EROUND23(KEY_BASE +  6, T0, T1, I1) \
	AES_EROUND01(KEY_BASE +  4, T2, T3, I2) \
	AES_EROUND23(KEY_BASE +  6, T2, T3, I3)
  /*
   * ENCRYPT_TWO_ROUNDS_LAST - the closing two encryption rounds of one block.
   *
   * Identical in shape to ENCRYPT_TWO_ROUNDS, except that the second round is
   * issued with the _L ("last") variants of the round helpers.  The result
   * ends up in I0/I1; T0/T1 are scratch.
   */
  #define ENCRYPT_TWO_ROUNDS_LAST(KEY_BASE, I0, I1, T0, T1) \
	AES_EROUND01(KEY_BASE +  0, I0, I1, T0) \
	AES_EROUND23(KEY_BASE +  2, I0, I1, T1) \
	AES_EROUND01_L(KEY_BASE +  4, T0, T1, I0) \
	AES_EROUND23_L(KEY_BASE +  6, T0, T1, I1)
  /*
   * ENCRYPT_TWO_ROUNDS_LAST_2 - the closing two encryption rounds of two
   * blocks at once.
   *
   * Two-block counterpart of ENCRYPT_TWO_ROUNDS_LAST: block A lives in I0/I1
   * (scratch T0/T1), block B in I2/I3 (scratch T2/T3), and both use the key
   * registers KEY_BASE + 0 .. + 6.  The second round uses the _L helpers.
   */
  #define ENCRYPT_TWO_ROUNDS_LAST_2(KEY_BASE, I0, I1, I2, I3, T0, T1, T2, T3) \
	AES_EROUND01(KEY_BASE +  0, I0, I1, T0) \
	AES_EROUND23(KEY_BASE +  2, I0, I1, T1) \
	AES_EROUND01(KEY_BASE +  0, I2, I3, T2) \
	AES_EROUND23(KEY_BASE +  2, I2, I3, T3) \
	AES_EROUND01_L(KEY_BASE +  4, T0, T1, I0) \
	AES_EROUND23_L(KEY_BASE +  6, T0, T1, I1) \
	AES_EROUND01_L(KEY_BASE +  4, T2, T3, I2) \
	AES_EROUND23_L(KEY_BASE +  6, T2, T3, I3)
  /*
   * ENCRYPT_128 - 10 rounds: four ordinary round pairs followed by the
   * closing pair.  Key registers KEY_BASE + 0 .. KEY_BASE + 38 are consumed
   * in ascending order; the block is transformed in place in I0/I1 with
   * T0/T1 as scratch.
   */
  #define ENCRYPT_128(KEY_BASE, I0, I1, T0, T1) \
	ENCRYPT_TWO_ROUNDS(KEY_BASE +  0, I0, I1, T0, T1) \
	ENCRYPT_TWO_ROUNDS(KEY_BASE +  8, I0, I1, T0, T1) \
	ENCRYPT_TWO_ROUNDS(KEY_BASE + 16, I0, I1, T0, T1) \
	ENCRYPT_TWO_ROUNDS(KEY_BASE + 24, I0, I1, T0, T1) \
	ENCRYPT_TWO_ROUNDS_LAST(KEY_BASE + 32, I0, I1, T0, T1)
  /*
   * ENCRYPT_128_2 - the 10-round sequence of ENCRYPT_128 applied to two
   * blocks at once (I0/I1 and I2/I3), with scratch registers T0..T3.
   */
  #define ENCRYPT_128_2(KEY_BASE, I0, I1, I2, I3, T0, T1, T2, T3) \
	ENCRYPT_TWO_ROUNDS_2(KEY_BASE +  0, I0, I1, I2, I3, T0, T1, T2, T3) \
	ENCRYPT_TWO_ROUNDS_2(KEY_BASE +  8, I0, I1, I2, I3, T0, T1, T2, T3) \
	ENCRYPT_TWO_ROUNDS_2(KEY_BASE + 16, I0, I1, I2, I3, T0, T1, T2, T3) \
	ENCRYPT_TWO_ROUNDS_2(KEY_BASE + 24, I0, I1, I2, I3, T0, T1, T2, T3) \
	ENCRYPT_TWO_ROUNDS_LAST_2(KEY_BASE + 32, I0, I1, I2, I3, T0, T1, T2, T3)
  /*
   * ENCRYPT_192 - 12 rounds: five ordinary round pairs followed by the
   * closing pair.  Key registers KEY_BASE + 0 .. KEY_BASE + 46 are consumed
   * in ascending order; the block is transformed in place in I0/I1 with
   * T0/T1 as scratch.
   */
  #define ENCRYPT_192(KEY_BASE, I0, I1, T0, T1) \
	ENCRYPT_TWO_ROUNDS(KEY_BASE +  0, I0, I1, T0, T1) \
	ENCRYPT_TWO_ROUNDS(KEY_BASE +  8, I0, I1, T0, T1) \
	ENCRYPT_TWO_ROUNDS(KEY_BASE + 16, I0, I1, T0, T1) \
	ENCRYPT_TWO_ROUNDS(KEY_BASE + 24, I0, I1, T0, T1) \
	ENCRYPT_TWO_ROUNDS(KEY_BASE + 32, I0, I1, T0, T1) \
	ENCRYPT_TWO_ROUNDS_LAST(KEY_BASE + 40, I0, I1, T0, T1)
  /*
   * ENCRYPT_192_2 - the 12-round sequence of ENCRYPT_192 applied to two
   * blocks at once (I0/I1 and I2/I3), with scratch registers T0..T3.
   */
  #define ENCRYPT_192_2(KEY_BASE, I0, I1, I2, I3, T0, T1, T2, T3) \
	ENCRYPT_TWO_ROUNDS_2(KEY_BASE +  0, I0, I1, I2, I3, T0, T1, T2, T3) \
	ENCRYPT_TWO_ROUNDS_2(KEY_BASE +  8, I0, I1, I2, I3, T0, T1, T2, T3) \
	ENCRYPT_TWO_ROUNDS_2(KEY_BASE + 16, I0, I1, I2, I3, T0, T1, T2, T3) \
	ENCRYPT_TWO_ROUNDS_2(KEY_BASE + 24, I0, I1, I2, I3, T0, T1, T2, T3) \
	ENCRYPT_TWO_ROUNDS_2(KEY_BASE + 32, I0, I1, I2, I3, T0, T1, T2, T3) \
	ENCRYPT_TWO_ROUNDS_LAST_2(KEY_BASE + 40, I0, I1, I2, I3, T0, T1, T2, T3)
  /*
   * ENCRYPT_256 - 14 rounds: six ordinary round pairs followed by the
   * closing pair.  Key registers KEY_BASE + 0 .. KEY_BASE + 54 are consumed
   * in ascending order; the block is transformed in place in I0/I1 with
   * T0/T1 as scratch.
   */
  #define ENCRYPT_256(KEY_BASE, I0, I1, T0, T1) \
	ENCRYPT_TWO_ROUNDS(KEY_BASE +  0, I0, I1, T0, T1) \
	ENCRYPT_TWO_ROUNDS(KEY_BASE +  8, I0, I1, T0, T1) \
	ENCRYPT_TWO_ROUNDS(KEY_BASE + 16, I0, I1, T0, T1) \
	ENCRYPT_TWO_ROUNDS(KEY_BASE + 24, I0, I1, T0, T1) \
	ENCRYPT_TWO_ROUNDS(KEY_BASE + 32, I0, I1, T0, T1) \
	ENCRYPT_TWO_ROUNDS(KEY_BASE + 40, I0, I1, T0, T1) \
	ENCRYPT_TWO_ROUNDS_LAST(KEY_BASE + 48, I0, I1, T0, T1)
  /*
   * ENCRYPT_256_TWO_ROUNDS_2 - ENCRYPT_TWO_ROUNDS_2 with its four scratch
   * registers given as one base: TMP_BASE + 0, + 2, + 4 and + 6.
   */
  #define ENCRYPT_256_TWO_ROUNDS_2(KEY_BASE, I0, I1, I2, I3, TMP_BASE) \
	ENCRYPT_TWO_ROUNDS_2(KEY_BASE, I0, I1, I2, I3, \
			     TMP_BASE + 0, TMP_BASE + 2, TMP_BASE + 4, TMP_BASE + 6)
  /*
   * ENCRYPT_256_2 - all 14 AES-256 encryption rounds on two blocks at once
   * (I0/I1 and I2/I3), borrowing key registers as scratch.
   *
   * No separate scratch registers are passed in:
   *  - The first round pair uses KEY_BASE + 48 .. + 54 as scratch.  Those
   *    registers are needed again as keys for the final rounds, so %f56-%f62
   *    are reloaded from [%o0 + 0xd0 .. 0xe8] right afterwards.
   *  - Every later round pair uses KEY_BASE + 0 .. + 6 as scratch, which
   *    destroys the first four key registers; %f8-%f14 are reloaded from
   *    [%o0 + 0x10 .. 0x28] at the end so the macro can be expanded again.
   *
   * The reloads name %f8-%f14 and %f56-%f62 literally, so the macro is only
   * self-consistent when KEY_BASE is 8 and %o0 points at the expanded key
   * with the layout set up by aes_sparc64_load_encrypt_keys_256.
   */
  #define ENCRYPT_256_2(KEY_BASE, I0, I1, I2, I3) \
	ENCRYPT_256_TWO_ROUNDS_2(KEY_BASE +  0, I0, I1, I2, I3, KEY_BASE + 48) \
	ldd	[%o0 + 0xd0], %f56; \
	ldd	[%o0 + 0xd8], %f58; \
	ENCRYPT_256_TWO_ROUNDS_2(KEY_BASE +  8, I0, I1, I2, I3, KEY_BASE +  0) \
	ldd	[%o0 + 0xe0], %f60; \
	ldd	[%o0 + 0xe8], %f62; \
	ENCRYPT_256_TWO_ROUNDS_2(KEY_BASE + 16, I0, I1, I2, I3, KEY_BASE +  0) \
	ENCRYPT_256_TWO_ROUNDS_2(KEY_BASE + 24, I0, I1, I2, I3, KEY_BASE +  0) \
	ENCRYPT_256_TWO_ROUNDS_2(KEY_BASE + 32, I0, I1, I2, I3, KEY_BASE +  0) \
	ENCRYPT_256_TWO_ROUNDS_2(KEY_BASE + 40, I0, I1, I2, I3, KEY_BASE +  0) \
	AES_EROUND01(KEY_BASE +  48, I0, I1, KEY_BASE + 0) \
	AES_EROUND23(KEY_BASE +  50, I0, I1, KEY_BASE + 2) \
	AES_EROUND01(KEY_BASE +  48, I2, I3, KEY_BASE + 4) \
	AES_EROUND23(KEY_BASE +  50, I2, I3, KEY_BASE + 6) \
	AES_EROUND01_L(KEY_BASE +  52, KEY_BASE + 0, KEY_BASE + 2, I0) \
	AES_EROUND23_L(KEY_BASE +  54, KEY_BASE + 0, KEY_BASE + 2, I1) \
	ldd	[%o0 + 0x10], %f8; \
	ldd	[%o0 + 0x18], %f10; \
	AES_EROUND01_L(KEY_BASE +  52, KEY_BASE + 4, KEY_BASE + 6, I2) \
	AES_EROUND23_L(KEY_BASE +  54, KEY_BASE + 4, KEY_BASE + 6, I3) \
	ldd	[%o0 + 0x20], %f12; \
	ldd	[%o0 + 0x28], %f14;
  /*
   * DECRYPT_TWO_ROUNDS - two consecutive AES decryption rounds on one block.
   *
   * KEY_BASE: number of the first of the key registers used; the first round
   *           takes KEY_BASE + 0 and + 2, the second KEY_BASE + 4 and + 6.
   * I0, I1:   register pair holding the block; overwritten with the result.
   * T0, T1:   scratch pair that carries the state between the two rounds.
   *
   * Unlike the encryption macros, each round issues the "23" helper before
   * the "01" helper, so the odd half (T1, then I1) is written first.
   */
  #define DECRYPT_TWO_ROUNDS(KEY_BASE, I0, I1, T0, T1) \
	AES_DROUND23(KEY_BASE +  0, I0, I1, T1) \
	AES_DROUND01(KEY_BASE +  2, I0, I1, T0) \
	AES_DROUND23(KEY_BASE +  4, T0, T1, I1) \
	AES_DROUND01(KEY_BASE +  6, T0, T1, I0)
  /*
   * DECRYPT_TWO_ROUNDS_2 - two AES decryption rounds on two blocks at once.
   *
   * Same key registers as DECRYPT_TWO_ROUNDS (KEY_BASE + 0 .. + 6), applied
   * to block A in I0/I1 (scratch T0/T1) and block B in I2/I3 (scratch T2/T3).
   * The round-one operations of both blocks are issued before any round-two
   * operation.
   */
  #define DECRYPT_TWO_ROUNDS_2(KEY_BASE, I0, I1, I2, I3, T0, T1, T2, T3) \
	AES_DROUND23(KEY_BASE +  0, I0, I1, T1) \
	AES_DROUND01(KEY_BASE +  2, I0, I1, T0) \
	AES_DROUND23(KEY_BASE +  0, I2, I3, T3) \
	AES_DROUND01(KEY_BASE +  2, I2, I3, T2) \
	AES_DROUND23(KEY_BASE +  4, T0, T1, I1) \
	AES_DROUND01(KEY_BASE +  6, T0, T1, I0) \
	AES_DROUND23(KEY_BASE +  4, T2, T3, I3) \
	AES_DROUND01(KEY_BASE +  6, T2, T3, I2)
  /*
   * DECRYPT_TWO_ROUNDS_LAST - the closing two decryption rounds of one block.
   *
   * Identical in shape to DECRYPT_TWO_ROUNDS, except that the second round is
   * issued with the _L ("last") variants of the round helpers.  The result
   * ends up in I0/I1; T0/T1 are scratch.
   */
  #define DECRYPT_TWO_ROUNDS_LAST(KEY_BASE, I0, I1, T0, T1) \
	AES_DROUND23(KEY_BASE +  0, I0, I1, T1) \
	AES_DROUND01(KEY_BASE +  2, I0, I1, T0) \
	AES_DROUND23_L(KEY_BASE +  4, T0, T1, I1) \
	AES_DROUND01_L(KEY_BASE +  6, T0, T1, I0)
  /*
   * DECRYPT_TWO_ROUNDS_LAST_2 - the closing two decryption rounds of two
   * blocks at once.
   *
   * Two-block counterpart of DECRYPT_TWO_ROUNDS_LAST: block A lives in I0/I1
   * (scratch T0/T1), block B in I2/I3 (scratch T2/T3), and both use the key
   * registers KEY_BASE + 0 .. + 6.  The second round uses the _L helpers.
   */
  #define DECRYPT_TWO_ROUNDS_LAST_2(KEY_BASE, I0, I1, I2, I3, T0, T1, T2, T3) \
	AES_DROUND23(KEY_BASE +  0, I0, I1, T1) \
	AES_DROUND01(KEY_BASE +  2, I0, I1, T0) \
	AES_DROUND23(KEY_BASE +  0, I2, I3, T3) \
	AES_DROUND01(KEY_BASE +  2, I2, I3, T2) \
	AES_DROUND23_L(KEY_BASE +  4, T0, T1, I1) \
	AES_DROUND01_L(KEY_BASE +  6, T0, T1, I0) \
	AES_DROUND23_L(KEY_BASE +  4, T2, T3, I3) \
	AES_DROUND01_L(KEY_BASE +  6, T2, T3, I2)
  /*
   * DECRYPT_128 - 10 rounds: four ordinary round pairs followed by the
   * closing pair.  Key registers KEY_BASE + 0 .. KEY_BASE + 38 are consumed
   * in ascending register order; the block is transformed in place in I0/I1
   * with T0/T1 as scratch.
   */
  #define DECRYPT_128(KEY_BASE, I0, I1, T0, T1) \
	DECRYPT_TWO_ROUNDS(KEY_BASE +  0, I0, I1, T0, T1) \
	DECRYPT_TWO_ROUNDS(KEY_BASE +  8, I0, I1, T0, T1) \
	DECRYPT_TWO_ROUNDS(KEY_BASE + 16, I0, I1, T0, T1) \
	DECRYPT_TWO_ROUNDS(KEY_BASE + 24, I0, I1, T0, T1) \
	DECRYPT_TWO_ROUNDS_LAST(KEY_BASE + 32, I0, I1, T0, T1)
  /*
   * DECRYPT_128_2 - the 10-round sequence of DECRYPT_128 applied to two
   * blocks at once (I0/I1 and I2/I3), with scratch registers T0..T3.
   */
  #define DECRYPT_128_2(KEY_BASE, I0, I1, I2, I3, T0, T1, T2, T3) \
	DECRYPT_TWO_ROUNDS_2(KEY_BASE +  0, I0, I1, I2, I3, T0, T1, T2, T3) \
	DECRYPT_TWO_ROUNDS_2(KEY_BASE +  8, I0, I1, I2, I3, T0, T1, T2, T3) \
	DECRYPT_TWO_ROUNDS_2(KEY_BASE + 16, I0, I1, I2, I3, T0, T1, T2, T3) \
	DECRYPT_TWO_ROUNDS_2(KEY_BASE + 24, I0, I1, I2, I3, T0, T1, T2, T3) \
	DECRYPT_TWO_ROUNDS_LAST_2(KEY_BASE + 32, I0, I1, I2, I3, T0, T1, T2, T3)
  /*
   * DECRYPT_192 - 12 rounds: five ordinary round pairs followed by the
   * closing pair.  Key registers KEY_BASE + 0 .. KEY_BASE + 46 are consumed
   * in ascending register order; the block is transformed in place in I0/I1
   * with T0/T1 as scratch.
   */
  #define DECRYPT_192(KEY_BASE, I0, I1, T0, T1) \
	DECRYPT_TWO_ROUNDS(KEY_BASE +  0, I0, I1, T0, T1) \
	DECRYPT_TWO_ROUNDS(KEY_BASE +  8, I0, I1, T0, T1) \
	DECRYPT_TWO_ROUNDS(KEY_BASE + 16, I0, I1, T0, T1) \
	DECRYPT_TWO_ROUNDS(KEY_BASE + 24, I0, I1, T0, T1) \
	DECRYPT_TWO_ROUNDS(KEY_BASE + 32, I0, I1, T0, T1) \
	DECRYPT_TWO_ROUNDS_LAST(KEY_BASE + 40, I0, I1, T0, T1)
  /*
   * DECRYPT_192_2 - the 12-round sequence of DECRYPT_192 applied to two
   * blocks at once (I0/I1 and I2/I3), with scratch registers T0..T3.
   */
  #define DECRYPT_192_2(KEY_BASE, I0, I1, I2, I3, T0, T1, T2, T3) \
	DECRYPT_TWO_ROUNDS_2(KEY_BASE +  0, I0, I1, I2, I3, T0, T1, T2, T3) \
	DECRYPT_TWO_ROUNDS_2(KEY_BASE +  8, I0, I1, I2, I3, T0, T1, T2, T3) \
	DECRYPT_TWO_ROUNDS_2(KEY_BASE + 16, I0, I1, I2, I3, T0, T1, T2, T3) \
	DECRYPT_TWO_ROUNDS_2(KEY_BASE + 24, I0, I1, I2, I3, T0, T1, T2, T3) \
	DECRYPT_TWO_ROUNDS_2(KEY_BASE + 32, I0, I1, I2, I3, T0, T1, T2, T3) \
	DECRYPT_TWO_ROUNDS_LAST_2(KEY_BASE + 40, I0, I1, I2, I3, T0, T1, T2, T3)
  /*
   * DECRYPT_256 - 14 rounds: six ordinary round pairs followed by the
   * closing pair.  Key registers KEY_BASE + 0 .. KEY_BASE + 54 are consumed
   * in ascending register order; the block is transformed in place in I0/I1
   * with T0/T1 as scratch.
   */
  #define DECRYPT_256(KEY_BASE, I0, I1, T0, T1) \
	DECRYPT_TWO_ROUNDS(KEY_BASE +  0, I0, I1, T0, T1) \
	DECRYPT_TWO_ROUNDS(KEY_BASE +  8, I0, I1, T0, T1) \
	DECRYPT_TWO_ROUNDS(KEY_BASE + 16, I0, I1, T0, T1) \
	DECRYPT_TWO_ROUNDS(KEY_BASE + 24, I0, I1, T0, T1) \
	DECRYPT_TWO_ROUNDS(KEY_BASE + 32, I0, I1, T0, T1) \
	DECRYPT_TWO_ROUNDS(KEY_BASE + 40, I0, I1, T0, T1) \
	DECRYPT_TWO_ROUNDS_LAST(KEY_BASE + 48, I0, I1, T0, T1)
  /*
   * DECRYPT_256_TWO_ROUNDS_2 - DECRYPT_TWO_ROUNDS_2 with its four scratch
   * registers given as one base: TMP_BASE + 0, + 2, + 4 and + 6.
   */
  #define DECRYPT_256_TWO_ROUNDS_2(KEY_BASE, I0, I1, I2, I3, TMP_BASE) \
	DECRYPT_TWO_ROUNDS_2(KEY_BASE, I0, I1, I2, I3, \
			     TMP_BASE + 0, TMP_BASE + 2, TMP_BASE + 4, TMP_BASE + 6)
  /*
   * DECRYPT_256_2 - all 14 AES-256 decryption rounds on two blocks at once
   * (I0/I1 and I2/I3), borrowing key registers as scratch.
   *
   * No separate scratch registers are passed in:
   *  - The first round pair uses KEY_BASE + 48 .. + 54 as scratch.  Those
   *    four registers are needed again as keys for the final rounds, so all
   *    of %f56, %f58, %f60 and %f62 must be reloaded afterwards, from
   *    [%o0 + 0x18], [%o0 + 0x10], [%o0 + 0x08] and [%o0 + 0x00].  The decrypt
   *    key registers are filled from descending addresses, one doubleword
   *    per even register.
   *  - Every later round pair uses KEY_BASE + 0 .. + 6 as scratch, which
   *    destroys the first four key registers; %f8-%f14 are reloaded from
   *    [%o0 + 0xd8 .. 0xc0] at the end so the macro can be expanded again.
   *
   * The reloads name %f8-%f14 and %f56-%f62 literally, so the macro is only
   * self-consistent when KEY_BASE is 8 and %o0 points at the expanded key.
   *
   * Two defects of the earlier definition are fixed here:
   *  - %f60/%f62 were never reloaded, so the final _L round used leftover
   *    scratch data as its round key (ENCRYPT_256_2 reloads all four).
   *  - The last AES_DROUND01_L line had no trailing backslash, which ended
   *    the macro early and left the %f12/%f14 reloads outside of it.
   */
  #define DECRYPT_256_2(KEY_BASE, I0, I1, I2, I3) \
	DECRYPT_256_TWO_ROUNDS_2(KEY_BASE +  0, I0, I1, I2, I3, KEY_BASE + 48) \
	ldd	[%o0 + 0x18], %f56; \
	ldd	[%o0 + 0x10], %f58; \
	DECRYPT_256_TWO_ROUNDS_2(KEY_BASE +  8, I0, I1, I2, I3, KEY_BASE +  0) \
	ldd	[%o0 + 0x08], %f60; \
	ldd	[%o0 + 0x00], %f62; \
	DECRYPT_256_TWO_ROUNDS_2(KEY_BASE + 16, I0, I1, I2, I3, KEY_BASE +  0) \
	DECRYPT_256_TWO_ROUNDS_2(KEY_BASE + 24, I0, I1, I2, I3, KEY_BASE +  0) \
	DECRYPT_256_TWO_ROUNDS_2(KEY_BASE + 32, I0, I1, I2, I3, KEY_BASE +  0) \
	DECRYPT_256_TWO_ROUNDS_2(KEY_BASE + 40, I0, I1, I2, I3, KEY_BASE +  0) \
	AES_DROUND23(KEY_BASE +  48, I0, I1, KEY_BASE + 2) \
	AES_DROUND01(KEY_BASE +  50, I0, I1, KEY_BASE + 0) \
	AES_DROUND23(KEY_BASE +  48, I2, I3, KEY_BASE + 6) \
	AES_DROUND01(KEY_BASE +  50, I2, I3, KEY_BASE + 4) \
	AES_DROUND23_L(KEY_BASE +  52, KEY_BASE + 0, KEY_BASE + 2, I1) \
	AES_DROUND01_L(KEY_BASE +  54, KEY_BASE + 0, KEY_BASE + 2, I0) \
	ldd	[%o0 + 0xd8], %f8; \
	ldd	[%o0 + 0xd0], %f10; \
	AES_DROUND23_L(KEY_BASE +  52, KEY_BASE + 4, KEY_BASE + 6, I3) \
	AES_DROUND01_L(KEY_BASE +  54, KEY_BASE + 4, KEY_BASE + 6, I2) \
	ldd	[%o0 + 0xc8], %f12; \
	ldd	[%o0 + 0xc0], %f14;
  /*
   * aes_sparc64_key_expand - expand a raw AES key into its key schedule.
   *
   * In:  %o0 = input key, %o1 = output buffer, %o2 = key length in bytes.
   *      A length below 24 selects the 128-bit path, exactly 24 the 192-bit
   *      path, anything else the 256-bit path.
   * Out: the raw key is copied to the start of the buffer, followed by the
   *      doublewords produced by the AES_KEXPAND* helpers from "opcodes.h":
   *      176 bytes in total for 128-bit keys, 208 for 192-bit and 240 for
   *      256-bit keys.
   *
   * %o1 is advanced past the raw key while running.  VISEntry/VISExit come
   * from asm/visasm.h and bracket the floating-point register usage.
   * Instructions indented by one extra space sit in a branch delay slot.
   */
	.align	32
  ENTRY(aes_sparc64_key_expand)
	/* %o0=input_key, %o1=output_key, %o2=key_len */
	VISEntry

	/* First 16 key bytes are common to all key sizes. */
	ld	[%o0 + 0x00], %f0
	ld	[%o0 + 0x04], %f1
	ld	[%o0 + 0x08], %f2
	ld	[%o0 + 0x0c], %f3

	std	%f0, [%o1 + 0x00]
	std	%f2, [%o1 + 0x08]
	add	%o1, 0x10, %o1

	/* Dispatch on key length: <24 -> 128-bit, ==24 -> 192-bit. */
	cmp	%o2, 24
	bl	.Lkey_expand_128
	 nop

	be	.Lkey_expand_192
	 nop

	/* 256-bit key expansion */
	ld	[%o0 + 0x10], %f4
	ld	[%o0 + 0x14], %f5
	ld	[%o0 + 0x18], %f6
	ld	[%o0 + 0x1c], %f7

	std	%f4, [%o1 + 0x00]
	std	%f6, [%o1 + 0x08]
	add	%o1, 0x10, %o1

	AES_KEXPAND1(0, 6, 0x0, 8)
	AES_KEXPAND2(2, 8, 10)
	AES_KEXPAND0(4, 10, 12)
	AES_KEXPAND2(6, 12, 14)
	AES_KEXPAND1(8, 14, 0x1, 16)
	AES_KEXPAND2(10, 16, 18)
	AES_KEXPAND0(12, 18, 20)
	AES_KEXPAND2(14, 20, 22)
	AES_KEXPAND1(16, 22, 0x2, 24)
	AES_KEXPAND2(18, 24, 26)
	AES_KEXPAND0(20, 26, 28)
	AES_KEXPAND2(22, 28, 30)
	AES_KEXPAND1(24, 30, 0x3, 32)
	AES_KEXPAND2(26, 32, 34)
	AES_KEXPAND0(28, 34, 36)
	AES_KEXPAND2(30, 36, 38)
	AES_KEXPAND1(32, 38, 0x4, 40)
	AES_KEXPAND2(34, 40, 42)
	AES_KEXPAND0(36, 42, 44)
	AES_KEXPAND2(38, 44, 46)
	AES_KEXPAND1(40, 46, 0x5, 48)
	AES_KEXPAND2(42, 48, 50)
	AES_KEXPAND0(44, 50, 52)
	AES_KEXPAND2(46, 52, 54)
	AES_KEXPAND1(48, 54, 0x6, 56)
	AES_KEXPAND2(50, 56, 58)

	std	%f8, [%o1 + 0x00]
	std	%f10, [%o1 + 0x08]
	std	%f12, [%o1 + 0x10]
	std	%f14, [%o1 + 0x18]
	std	%f16, [%o1 + 0x20]
	std	%f18, [%o1 + 0x28]
	std	%f20, [%o1 + 0x30]
	std	%f22, [%o1 + 0x38]
	std	%f24, [%o1 + 0x40]
	std	%f26, [%o1 + 0x48]
	std	%f28, [%o1 + 0x50]
	std	%f30, [%o1 + 0x58]
	std	%f32, [%o1 + 0x60]
	std	%f34, [%o1 + 0x68]
	std	%f36, [%o1 + 0x70]
	std	%f38, [%o1 + 0x78]
	std	%f40, [%o1 + 0x80]
	std	%f42, [%o1 + 0x88]
	std	%f44, [%o1 + 0x90]
	std	%f46, [%o1 + 0x98]
	std	%f48, [%o1 + 0xa0]
	std	%f50, [%o1 + 0xa8]
	std	%f52, [%o1 + 0xb0]
	std	%f54, [%o1 + 0xb8]
	std	%f56, [%o1 + 0xc0]
	ba,pt	%xcc, .Lkey_expand_done
	 std	%f58, [%o1 + 0xc8]

  .Lkey_expand_192:
	/* 192-bit key expansion */
	ld	[%o0 + 0x10], %f4
	ld	[%o0 + 0x14], %f5

	std	%f4, [%o1 + 0x00]
	add	%o1, 0x08, %o1

	AES_KEXPAND1(0, 4, 0x0, 6)
	AES_KEXPAND2(2, 6, 8)
	AES_KEXPAND2(4, 8, 10)
	AES_KEXPAND1(6, 10, 0x1, 12)
	AES_KEXPAND2(8, 12, 14)
	AES_KEXPAND2(10, 14, 16)
	AES_KEXPAND1(12, 16, 0x2, 18)
	AES_KEXPAND2(14, 18, 20)
	AES_KEXPAND2(16, 20, 22)
	AES_KEXPAND1(18, 22, 0x3, 24)
	AES_KEXPAND2(20, 24, 26)
	AES_KEXPAND2(22, 26, 28)
	AES_KEXPAND1(24, 28, 0x4, 30)
	AES_KEXPAND2(26, 30, 32)
	AES_KEXPAND2(28, 32, 34)
	AES_KEXPAND1(30, 34, 0x5, 36)
	AES_KEXPAND2(32, 36, 38)
	AES_KEXPAND2(34, 38, 40)
	AES_KEXPAND1(36, 40, 0x6, 42)
	AES_KEXPAND2(38, 42, 44)
	AES_KEXPAND2(40, 44, 46)
	AES_KEXPAND1(42, 46, 0x7, 48)
	AES_KEXPAND2(44, 48, 50)

	std	%f6, [%o1 + 0x00]
	std	%f8, [%o1 + 0x08]
	std	%f10, [%o1 + 0x10]
	std	%f12, [%o1 + 0x18]
	std	%f14, [%o1 + 0x20]
	std	%f16, [%o1 + 0x28]
	std	%f18, [%o1 + 0x30]
	std	%f20, [%o1 + 0x38]
	std	%f22, [%o1 + 0x40]
	std	%f24, [%o1 + 0x48]
	std	%f26, [%o1 + 0x50]
	std	%f28, [%o1 + 0x58]
	std	%f30, [%o1 + 0x60]
	std	%f32, [%o1 + 0x68]
	std	%f34, [%o1 + 0x70]
	std	%f36, [%o1 + 0x78]
	std	%f38, [%o1 + 0x80]
	std	%f40, [%o1 + 0x88]
	std	%f42, [%o1 + 0x90]
	std	%f44, [%o1 + 0x98]
	std	%f46, [%o1 + 0xa0]
	std	%f48, [%o1 + 0xa8]
	ba,pt	%xcc, .Lkey_expand_done
	 std	%f50, [%o1 + 0xb0]

  .Lkey_expand_128:
	/* 128-bit key expansion */
	AES_KEXPAND1(0, 2, 0x0, 4)
	AES_KEXPAND2(2, 4, 6)
	AES_KEXPAND1(4, 6, 0x1, 8)
	AES_KEXPAND2(6, 8, 10)
	AES_KEXPAND1(8, 10, 0x2, 12)
	AES_KEXPAND2(10, 12, 14)
	AES_KEXPAND1(12, 14, 0x3, 16)
	AES_KEXPAND2(14, 16, 18)
	AES_KEXPAND1(16, 18, 0x4, 20)
	AES_KEXPAND2(18, 20, 22)
	AES_KEXPAND1(20, 22, 0x5, 24)
	AES_KEXPAND2(22, 24, 26)
	AES_KEXPAND1(24, 26, 0x6, 28)
	AES_KEXPAND2(26, 28, 30)
	AES_KEXPAND1(28, 30, 0x7, 32)
	AES_KEXPAND2(30, 32, 34)
	AES_KEXPAND1(32, 34, 0x8, 36)
	AES_KEXPAND2(34, 36, 38)
	AES_KEXPAND1(36, 38, 0x9, 40)
	AES_KEXPAND2(38, 40, 42)

	std	%f4, [%o1 + 0x00]
	std	%f6, [%o1 + 0x08]
	std	%f8, [%o1 + 0x10]
	std	%f10, [%o1 + 0x18]
	std	%f12, [%o1 + 0x20]
	std	%f14, [%o1 + 0x28]
	std	%f16, [%o1 + 0x30]
	std	%f18, [%o1 + 0x38]
	std	%f20, [%o1 + 0x40]
	std	%f22, [%o1 + 0x48]
	std	%f24, [%o1 + 0x50]
	std	%f26, [%o1 + 0x58]
	std	%f28, [%o1 + 0x60]
	std	%f30, [%o1 + 0x68]
	std	%f32, [%o1 + 0x70]
	std	%f34, [%o1 + 0x78]
	std	%f36, [%o1 + 0x80]
	std	%f38, [%o1 + 0x88]
	std	%f40, [%o1 + 0x90]
	std	%f42, [%o1 + 0x98]

  .Lkey_expand_done:
	retl
	 VISExit
  ENDPROC(aes_sparc64_key_expand)
  /*
   * aes_sparc64_encrypt_128 - encrypt one 16-byte block with a 128-bit key.
   *
   * In:  %o0 = expanded key, %o1 = input block, %o2 = output block.
   *
   * The block is read as four 32-bit words into %f4-%f7 and the 22 key
   * doublewords at [%o0 + 0x00 .. 0xa8] into %f8-%f50.  The first two key
   * doublewords are XORed into the block, then ENCRYPT_128 runs the ten
   * rounds with keys from %f12 upward and %f0/%f2 as scratch.
   */
	.align	32
  ENTRY(aes_sparc64_encrypt_128)
	/* %o0=key, %o1=input, %o2=output */
	VISEntry

	ld	[%o1 + 0x00], %f4
	ld	[%o1 + 0x04], %f5
	ld	[%o1 + 0x08], %f6
	ld	[%o1 + 0x0c], %f7

	ldd	[%o0 + 0x00], %f8
	ldd	[%o0 + 0x08], %f10
	ldd	[%o0 + 0x10], %f12
	ldd	[%o0 + 0x18], %f14
	ldd	[%o0 + 0x20], %f16
	ldd	[%o0 + 0x28], %f18
	ldd	[%o0 + 0x30], %f20
	ldd	[%o0 + 0x38], %f22
	ldd	[%o0 + 0x40], %f24
	ldd	[%o0 + 0x48], %f26
	ldd	[%o0 + 0x50], %f28
	ldd	[%o0 + 0x58], %f30
	ldd	[%o0 + 0x60], %f32
	ldd	[%o0 + 0x68], %f34
	ldd	[%o0 + 0x70], %f36
	ldd	[%o0 + 0x78], %f38
	ldd	[%o0 + 0x80], %f40
	ldd	[%o0 + 0x88], %f42
	ldd	[%o0 + 0x90], %f44
	ldd	[%o0 + 0x98], %f46
	ldd	[%o0 + 0xa0], %f48
	ldd	[%o0 + 0xa8], %f50

	/* Initial key addition. */
	fxor	%f8, %f4, %f4
	fxor	%f10, %f6, %f6

	ENCRYPT_128(12, 4, 6, 0, 2)

	st	%f4, [%o2 + 0x00]
	st	%f5, [%o2 + 0x04]
	st	%f6, [%o2 + 0x08]
	st	%f7, [%o2 + 0x0c]

	retl
	 VISExit
  ENDPROC(aes_sparc64_encrypt_128)
  /*
   * aes_sparc64_encrypt_192 - encrypt one 16-byte block with a 192-bit key.
   *
   * In:  %o0 = expanded key, %o1 = input block, %o2 = output block.
   *
   * After the initial key addition, the first two rounds run with keys
   * loaded into %f8-%f14.  %o0 is then advanced by 0x20 so that the
   * remaining ten rounds can reuse the ENCRYPT_128 sequence with keys in
   * %f12-%f50 (2 + 10 = 12 rounds).  %o0 is modified.
   */
	.align	32
  ENTRY(aes_sparc64_encrypt_192)
	/* %o0=key, %o1=input, %o2=output */
	VISEntry

	ld	[%o1 + 0x00], %f4
	ld	[%o1 + 0x04], %f5
	ld	[%o1 + 0x08], %f6
	ld	[%o1 + 0x0c], %f7

	/* Initial key addition. */
	ldd	[%o0 + 0x00], %f8
	ldd	[%o0 + 0x08], %f10
	fxor	%f8, %f4, %f4
	fxor	%f10, %f6, %f6

	/* Rounds 1-2. */
	ldd	[%o0 + 0x10], %f8
	ldd	[%o0 + 0x18], %f10
	ldd	[%o0 + 0x20], %f12
	ldd	[%o0 + 0x28], %f14
	add	%o0, 0x20, %o0

	ENCRYPT_TWO_ROUNDS(8, 4, 6, 0, 2)

	/* Rounds 3-12, offsets relative to the advanced %o0. */
	ldd	[%o0 + 0x10], %f12
	ldd	[%o0 + 0x18], %f14
	ldd	[%o0 + 0x20], %f16
	ldd	[%o0 + 0x28], %f18
	ldd	[%o0 + 0x30], %f20
	ldd	[%o0 + 0x38], %f22
	ldd	[%o0 + 0x40], %f24
	ldd	[%o0 + 0x48], %f26
	ldd	[%o0 + 0x50], %f28
	ldd	[%o0 + 0x58], %f30
	ldd	[%o0 + 0x60], %f32
	ldd	[%o0 + 0x68], %f34
	ldd	[%o0 + 0x70], %f36
	ldd	[%o0 + 0x78], %f38
	ldd	[%o0 + 0x80], %f40
	ldd	[%o0 + 0x88], %f42
	ldd	[%o0 + 0x90], %f44
	ldd	[%o0 + 0x98], %f46
	ldd	[%o0 + 0xa0], %f48
	ldd	[%o0 + 0xa8], %f50

	ENCRYPT_128(12, 4, 6, 0, 2)

	st	%f4, [%o2 + 0x00]
	st	%f5, [%o2 + 0x04]
	st	%f6, [%o2 + 0x08]
	st	%f7, [%o2 + 0x0c]

	retl
	 VISExit
  ENDPROC(aes_sparc64_encrypt_192)
  /*
   * aes_sparc64_encrypt_256 - encrypt one 16-byte block with a 256-bit key.
   *
   * In:  %o0 = expanded key, %o1 = input block, %o2 = output block.
   *
   * After the initial key addition, two round pairs run with keys loaded
   * into %f8-%f14, each followed by advancing %o0 by 0x20.  The remaining
   * ten rounds reuse the ENCRYPT_128 sequence with keys in %f12-%f50
   * (2 + 2 + 10 = 14 rounds).  %o0 is modified.
   */
	.align	32
  ENTRY(aes_sparc64_encrypt_256)
	/* %o0=key, %o1=input, %o2=output */
	VISEntry

	ld	[%o1 + 0x00], %f4
	ld	[%o1 + 0x04], %f5
	ld	[%o1 + 0x08], %f6
	ld	[%o1 + 0x0c], %f7

	/* Initial key addition. */
	ldd	[%o0 + 0x00], %f8
	ldd	[%o0 + 0x08], %f10
	fxor	%f8, %f4, %f4
	fxor	%f10, %f6, %f6

	/* Rounds 1-2. */
	ldd	[%o0 + 0x10], %f8
	ldd	[%o0 + 0x18], %f10
	ldd	[%o0 + 0x20], %f12
	ldd	[%o0 + 0x28], %f14
	add	%o0, 0x20, %o0

	ENCRYPT_TWO_ROUNDS(8, 4, 6, 0, 2)

	/* Rounds 3-4. */
	ldd	[%o0 + 0x10], %f8
	ldd	[%o0 + 0x18], %f10
	ldd	[%o0 + 0x20], %f12
	ldd	[%o0 + 0x28], %f14
	add	%o0, 0x20, %o0

	ENCRYPT_TWO_ROUNDS(8, 4, 6, 0, 2)

	/* Rounds 5-14, offsets relative to the advanced %o0. */
	ldd	[%o0 + 0x10], %f12
	ldd	[%o0 + 0x18], %f14
	ldd	[%o0 + 0x20], %f16
	ldd	[%o0 + 0x28], %f18
	ldd	[%o0 + 0x30], %f20
	ldd	[%o0 + 0x38], %f22
	ldd	[%o0 + 0x40], %f24
	ldd	[%o0 + 0x48], %f26
	ldd	[%o0 + 0x50], %f28
	ldd	[%o0 + 0x58], %f30
	ldd	[%o0 + 0x60], %f32
	ldd	[%o0 + 0x68], %f34
	ldd	[%o0 + 0x70], %f36
	ldd	[%o0 + 0x78], %f38
	ldd	[%o0 + 0x80], %f40
	ldd	[%o0 + 0x88], %f42
	ldd	[%o0 + 0x90], %f44
	ldd	[%o0 + 0x98], %f46
	ldd	[%o0 + 0xa0], %f48
	ldd	[%o0 + 0xa8], %f50

	ENCRYPT_128(12, 4, 6, 0, 2)

	st	%f4, [%o2 + 0x00]
	st	%f5, [%o2 + 0x04]
	st	%f6, [%o2 + 0x08]
	st	%f7, [%o2 + 0x0c]

	retl
	 VISExit
  ENDPROC(aes_sparc64_encrypt_256)
  /*
   * aes_sparc64_decrypt_128 - decrypt one 16-byte block with a 128-bit key.
   *
   * In:  %o0 = expanded key, %o1 = input block, %o2 = output block.
   *
   * The key schedule is consumed back to front: %f8/%f10 take the last two
   * doublewords (0xa0, 0xa8) for the initial key addition, and %f12-%f50
   * are filled from descending addresses 0x98 down to 0x00.  DECRYPT_128
   * then runs the ten rounds with %f0/%f2 as scratch.
   */
	.align	32
  ENTRY(aes_sparc64_decrypt_128)
	/* %o0=key, %o1=input, %o2=output */
	VISEntry

	ld	[%o1 + 0x00], %f4
	ld	[%o1 + 0x04], %f5
	ld	[%o1 + 0x08], %f6
	ld	[%o1 + 0x0c], %f7

	ldd	[%o0 + 0xa0], %f8
	ldd	[%o0 + 0xa8], %f10
	ldd	[%o0 + 0x98], %f12
	ldd	[%o0 + 0x90], %f14
	ldd	[%o0 + 0x88], %f16
	ldd	[%o0 + 0x80], %f18
	ldd	[%o0 + 0x78], %f20
	ldd	[%o0 + 0x70], %f22
	ldd	[%o0 + 0x68], %f24
	ldd	[%o0 + 0x60], %f26
	ldd	[%o0 + 0x58], %f28
	ldd	[%o0 + 0x50], %f30
	ldd	[%o0 + 0x48], %f32
	ldd	[%o0 + 0x40], %f34
	ldd	[%o0 + 0x38], %f36
	ldd	[%o0 + 0x30], %f38
	ldd	[%o0 + 0x28], %f40
	ldd	[%o0 + 0x20], %f42
	ldd	[%o0 + 0x18], %f44
	ldd	[%o0 + 0x10], %f46
	ldd	[%o0 + 0x08], %f48
	ldd	[%o0 + 0x00], %f50

	/* Initial key addition. */
	fxor	%f8, %f4, %f4
	fxor	%f10, %f6, %f6

	DECRYPT_128(12, 4, 6, 0, 2)

	st	%f4, [%o2 + 0x00]
	st	%f5, [%o2 + 0x04]
	st	%f6, [%o2 + 0x08]
	st	%f7, [%o2 + 0x0c]

	retl
	 VISExit
  ENDPROC(aes_sparc64_decrypt_128)
  /*
   * aes_sparc64_decrypt_192 - decrypt one 16-byte block with a 192-bit key.
   *
   * In:  %o0 = expanded key, %o1 = input block, %o2 = output block.
   *
   * The key schedule is consumed back to front: %f8/%f10 take the last two
   * doublewords (0xc0, 0xc8) for the initial key addition, and %f12-%f58
   * are filled from descending addresses 0xb8 down to 0x00.  The first two
   * rounds use keys %f12-%f18; the remaining ten reuse the DECRYPT_128
   * sequence with keys from %f20 upward.  %f0/%f2 are scratch.
   */
	.align	32
  ENTRY(aes_sparc64_decrypt_192)
	/* %o0=key, %o1=input, %o2=output */
	VISEntry

	ld	[%o1 + 0x00], %f4
	ld	[%o1 + 0x04], %f5
	ld	[%o1 + 0x08], %f6
	ld	[%o1 + 0x0c], %f7

	ldd	[%o0 + 0xc0], %f8
	ldd	[%o0 + 0xc8], %f10
	ldd	[%o0 + 0xb8], %f12
	ldd	[%o0 + 0xb0], %f14
	ldd	[%o0 + 0xa8], %f16
	ldd	[%o0 + 0xa0], %f18

	/* Initial key addition. */
	fxor	%f8, %f4, %f4
	fxor	%f10, %f6, %f6

	ldd	[%o0 + 0x98], %f20
	ldd	[%o0 + 0x90], %f22
	ldd	[%o0 + 0x88], %f24
	ldd	[%o0 + 0x80], %f26

	/* Rounds 1-2. */
	DECRYPT_TWO_ROUNDS(12, 4, 6, 0, 2)

	ldd	[%o0 + 0x78], %f28
	ldd	[%o0 + 0x70], %f30
	ldd	[%o0 + 0x68], %f32
	ldd	[%o0 + 0x60], %f34
	ldd	[%o0 + 0x58], %f36
	ldd	[%o0 + 0x50], %f38
	ldd	[%o0 + 0x48], %f40
	ldd	[%o0 + 0x40], %f42
	ldd	[%o0 + 0x38], %f44
	ldd	[%o0 + 0x30], %f46
	ldd	[%o0 + 0x28], %f48
	ldd	[%o0 + 0x20], %f50
	ldd	[%o0 + 0x18], %f52
	ldd	[%o0 + 0x10], %f54
	ldd	[%o0 + 0x08], %f56
	ldd	[%o0 + 0x00], %f58

	/* Rounds 3-12. */
	DECRYPT_128(20, 4, 6, 0, 2)

	st	%f4, [%o2 + 0x00]
	st	%f5, [%o2 + 0x04]
	st	%f6, [%o2 + 0x08]
	st	%f7, [%o2 + 0x0c]

	retl
	 VISExit
  ENDPROC(aes_sparc64_decrypt_192)
  /*
   * aes_sparc64_decrypt_256 - decrypt one 16-byte block with a 256-bit key.
   *
   * In:  %o0 = expanded key, %o1 = input block, %o2 = output block.
   *
   * The key schedule is consumed back to front, starting with the last two
   * doublewords (0xe0, 0xe8) for the initial key addition.  The 14 rounds
   * are written out explicitly, with the key loads interleaved between the
   * round operations.  Key registers %f12-%f26 are used for the first four
   * rounds and then refilled, each one after its last use, with the keys
   * for the next four rounds; %f28-%f50 hold the keys for the remaining
   * six.  The block alternates between %f4/%f6 and the scratch pair
   * %f0/%f2 and finishes in %f4/%f6.
   *
   * The load/round interleaving is deliberate; keep the order when editing.
   */
	.align	32
  ENTRY(aes_sparc64_decrypt_256)
	/* %o0=key, %o1=input, %o2=output */
	VISEntry

	ld	[%o1 + 0x00], %f4
	ld	[%o1 + 0x04], %f5
	ld	[%o1 + 0x08], %f6
	ld	[%o1 + 0x0c], %f7

	ldd	[%o0 + 0xe0], %f8
	ldd	[%o0 + 0xe8], %f10
	ldd	[%o0 + 0xd8], %f12
	ldd	[%o0 + 0xd0], %f14
	ldd	[%o0 + 0xc8], %f16
	fxor	%f8, %f4, %f4
	ldd	[%o0 + 0xc0], %f18
	fxor	%f10, %f6, %f6
	ldd	[%o0 + 0xb8], %f20

	/* Rounds 1-4: keys %f12-%f26, first fill. */
	AES_DROUND23(12, 4, 6, 2)
	ldd	[%o0 + 0xb0], %f22
	AES_DROUND01(14, 4, 6, 0)
	ldd	[%o0 + 0xa8], %f24
	AES_DROUND23(16, 0, 2, 6)
	ldd	[%o0 + 0xa0], %f26
	AES_DROUND01(18, 0, 2, 4)
	ldd	[%o0 + 0x98], %f12
	AES_DROUND23(20, 4, 6, 2)
	ldd	[%o0 + 0x90], %f14
	AES_DROUND01(22, 4, 6, 0)
	ldd	[%o0 + 0x88], %f16
	AES_DROUND23(24, 0, 2, 6)
	ldd	[%o0 + 0x80], %f18
	AES_DROUND01(26, 0, 2, 4)
	ldd	[%o0 + 0x78], %f20

	/* Rounds 5-8: keys %f12-%f26, second fill. */
	AES_DROUND23(12, 4, 6, 2)
	ldd	[%o0 + 0x70], %f22
	AES_DROUND01(14, 4, 6, 0)
	ldd	[%o0 + 0x68], %f24
	AES_DROUND23(16, 0, 2, 6)
	ldd	[%o0 + 0x60], %f26
	AES_DROUND01(18, 0, 2, 4)
	ldd	[%o0 + 0x58], %f28
	AES_DROUND23(20, 4, 6, 2)
	ldd	[%o0 + 0x50], %f30
	AES_DROUND01(22, 4, 6, 0)
	ldd	[%o0 + 0x48], %f32
	AES_DROUND23(24, 0, 2, 6)
	ldd	[%o0 + 0x40], %f34
	AES_DROUND01(26, 0, 2, 4)
	ldd	[%o0 + 0x38], %f36

	/* Rounds 9-14: keys %f28-%f50. */
	AES_DROUND23(28, 4, 6, 2)
	ldd	[%o0 + 0x30], %f38
	AES_DROUND01(30, 4, 6, 0)
	ldd	[%o0 + 0x28], %f40
	AES_DROUND23(32, 0, 2, 6)
	ldd	[%o0 + 0x20], %f42
	AES_DROUND01(34, 0, 2, 4)
	ldd	[%o0 + 0x18], %f44
	AES_DROUND23(36, 4, 6, 2)
	ldd	[%o0 + 0x10], %f46
	AES_DROUND01(38, 4, 6, 0)
	ldd	[%o0 + 0x08], %f48
	AES_DROUND23(40, 0, 2, 6)
	ldd	[%o0 + 0x00], %f50
	AES_DROUND01(42, 0, 2, 4)
	AES_DROUND23(44, 4, 6, 2)
	AES_DROUND01(46, 4, 6, 0)
	AES_DROUND23_L(48, 0, 2, 6)
	AES_DROUND01_L(50, 0, 2, 4)

	st	%f4, [%o2 + 0x00]
	st	%f5, [%o2 + 0x04]
	st	%f6, [%o2 + 0x08]
	st	%f7, [%o2 + 0x0c]

	retl
	 VISExit
  ENDPROC(aes_sparc64_decrypt_256)
  /*
   * aes_sparc64_load_encrypt_keys_128 - preload 128-bit encryption keys.
   *
   * In:  %o0 = expanded key.
   * Out: %f8-%f46 hold the 20 doublewords at [%o0 + 0x10 .. 0xa8], in
   *      ascending address order.  The first 16 bytes are not loaded.
   *
   * There is no VISExit on the return path, so the loaded registers are
   * left in place; presumably a later routine in this file consumes them
   * (not visible in this part of the file - confirm against the callers).
   * The last load sits in the delay slot of retl.
   */
	.align	32
  ENTRY(aes_sparc64_load_encrypt_keys_128)
	/* %o0=key */
	VISEntry

	ldd	[%o0 + 0x10], %f8
	ldd	[%o0 + 0x18], %f10
	ldd	[%o0 + 0x20], %f12
	ldd	[%o0 + 0x28], %f14
	ldd	[%o0 + 0x30], %f16
	ldd	[%o0 + 0x38], %f18
	ldd	[%o0 + 0x40], %f20
	ldd	[%o0 + 0x48], %f22
	ldd	[%o0 + 0x50], %f24
	ldd	[%o0 + 0x58], %f26
	ldd	[%o0 + 0x60], %f28
	ldd	[%o0 + 0x68], %f30
	ldd	[%o0 + 0x70], %f32
	ldd	[%o0 + 0x78], %f34
	ldd	[%o0 + 0x80], %f36
	ldd	[%o0 + 0x88], %f38
	ldd	[%o0 + 0x90], %f40
	ldd	[%o0 + 0x98], %f42
	ldd	[%o0 + 0xa0], %f44

	retl
	 ldd	[%o0 + 0xa8], %f46
  ENDPROC(aes_sparc64_load_encrypt_keys_128)
  /*
   * aes_sparc64_load_encrypt_keys_192 - preload 192-bit encryption keys.
   *
   * In:  %o0 = expanded key.
   * Out: %f8-%f54 hold the 24 doublewords at [%o0 + 0x10 .. 0xc8], in
   *      ascending address order.  The first 16 bytes are not loaded.
   *
   * There is no VISExit on the return path, so the loaded registers are
   * left in place; presumably a later routine in this file consumes them
   * (not visible in this part of the file - confirm against the callers).
   * The last load sits in the delay slot of retl.
   */
	.align	32
  ENTRY(aes_sparc64_load_encrypt_keys_192)
	/* %o0=key */
	VISEntry

	ldd	[%o0 + 0x10], %f8
	ldd	[%o0 + 0x18], %f10
	ldd	[%o0 + 0x20], %f12
	ldd	[%o0 + 0x28], %f14
	ldd	[%o0 + 0x30], %f16
	ldd	[%o0 + 0x38], %f18
	ldd	[%o0 + 0x40], %f20
	ldd	[%o0 + 0x48], %f22
	ldd	[%o0 + 0x50], %f24
	ldd	[%o0 + 0x58], %f26
	ldd	[%o0 + 0x60], %f28
	ldd	[%o0 + 0x68], %f30
	ldd	[%o0 + 0x70], %f32
	ldd	[%o0 + 0x78], %f34
	ldd	[%o0 + 0x80], %f36
	ldd	[%o0 + 0x88], %f38
	ldd	[%o0 + 0x90], %f40
	ldd	[%o0 + 0x98], %f42
	ldd	[%o0 + 0xa0], %f44
	ldd	[%o0 + 0xa8], %f46
	ldd	[%o0 + 0xb0], %f48
	ldd	[%o0 + 0xb8], %f50
	ldd	[%o0 + 0xc0], %f52

	retl
	 ldd	[%o0 + 0xc8], %f54
  ENDPROC(aes_sparc64_load_encrypt_keys_192)
  /*
   * aes_sparc64_load_encrypt_keys_256 - preload 256-bit encryption keys.
   *
   * In:  %o0 = expanded key.
   * Out: %f8-%f62 hold the 28 doublewords at [%o0 + 0x10 .. 0xe8], in
   *      ascending address order.  The first 16 bytes are not loaded.
   *      This is the register layout that ENCRYPT_256_2 restores with its
   *      %f8-%f14 and %f56-%f62 reloads.
   *
   * There is no VISExit on the return path, so the loaded registers are
   * left in place; presumably a later routine in this file consumes them
   * (not visible in this part of the file - confirm against the callers).
   * The last load sits in the delay slot of retl.
   */
	.align	32
  ENTRY(aes_sparc64_load_encrypt_keys_256)
	/* %o0=key */
	VISEntry

	ldd	[%o0 + 0x10], %f8
	ldd	[%o0 + 0x18], %f10
	ldd	[%o0 + 0x20], %f12
	ldd	[%o0 + 0x28], %f14
	ldd	[%o0 + 0x30], %f16
	ldd	[%o0 + 0x38], %f18
	ldd	[%o0 + 0x40], %f20
	ldd	[%o0 + 0x48], %f22
	ldd	[%o0 + 0x50], %f24
	ldd	[%o0 + 0x58], %f26
	ldd	[%o0 + 0x60], %f28
	ldd	[%o0 + 0x68], %f30
	ldd	[%o0 + 0x70], %f32
	ldd	[%o0 + 0x78], %f34
	ldd	[%o0 + 0x80], %f36
	ldd	[%o0 + 0x88], %f38
	ldd	[%o0 + 0x90], %f40
	ldd	[%o0 + 0x98], %f42
	ldd	[%o0 + 0xa0], %f44
	ldd	[%o0 + 0xa8], %f46
	ldd	[%o0 + 0xb0], %f48
	ldd	[%o0 + 0xb8], %f50
	ldd	[%o0 + 0xc0], %f52
	ldd	[%o0 + 0xc8], %f54
	ldd	[%o0 + 0xd0], %f56
	ldd	[%o0 + 0xd8], %f58
	ldd	[%o0 + 0xe0], %f60

	retl
	 ldd	[%o0 + 0xe8], %f62
  ENDPROC(aes_sparc64_load_encrypt_keys_256)
  748. .align 32
  749. ENTRY(aes_sparc64_load_decrypt_keys_128)
  750. /* %o0=key */
  751. VISEntry
  752. ldd [%o0 + 0x98], %f8
  753. ldd [%o0 + 0x90], %f10
  754. ldd [%o0 + 0x88], %f12
  755. ldd [%o0 + 0x80], %f14
  756. ldd [%o0 + 0x78], %f16
  757. ldd [%o0 + 0x70], %f18
  758. ldd [%o0 + 0x68], %f20
  759. ldd [%o0 + 0x60], %f22
  760. ldd [%o0 + 0x58], %f24
  761. ldd [%o0 + 0x50], %f26
  762. ldd [%o0 + 0x48], %f28
  763. ldd [%o0 + 0x40], %f30
  764. ldd [%o0 + 0x38], %f32
  765. ldd [%o0 + 0x30], %f34
  766. ldd [%o0 + 0x28], %f36
  767. ldd [%o0 + 0x20], %f38
  768. ldd [%o0 + 0x18], %f40
  769. ldd [%o0 + 0x10], %f42
  770. ldd [%o0 + 0x08], %f44
  771. retl
  772. ldd [%o0 + 0x00], %f46
  773. ENDPROC(aes_sparc64_load_decrypt_keys_128)
  774. .align 32
  775. ENTRY(aes_sparc64_load_decrypt_keys_192)
  776. /* %o0=key */
  777. VISEntry
  778. ldd [%o0 + 0xb8], %f8
  779. ldd [%o0 + 0xb0], %f10
  780. ldd [%o0 + 0xa8], %f12
  781. ldd [%o0 + 0xa0], %f14
  782. ldd [%o0 + 0x98], %f16
  783. ldd [%o0 + 0x90], %f18
  784. ldd [%o0 + 0x88], %f20
  785. ldd [%o0 + 0x80], %f22
  786. ldd [%o0 + 0x78], %f24
  787. ldd [%o0 + 0x70], %f26
  788. ldd [%o0 + 0x68], %f28
  789. ldd [%o0 + 0x60], %f30
  790. ldd [%o0 + 0x58], %f32
  791. ldd [%o0 + 0x50], %f34
  792. ldd [%o0 + 0x48], %f36
  793. ldd [%o0 + 0x40], %f38
  794. ldd [%o0 + 0x38], %f40
  795. ldd [%o0 + 0x30], %f42
  796. ldd [%o0 + 0x28], %f44
  797. ldd [%o0 + 0x20], %f46
  798. ldd [%o0 + 0x18], %f48
  799. ldd [%o0 + 0x10], %f50
  800. ldd [%o0 + 0x08], %f52
  801. retl
  802. ldd [%o0 + 0x00], %f54
  803. ENDPROC(aes_sparc64_load_decrypt_keys_192)
  804. .align 32
  805. ENTRY(aes_sparc64_load_decrypt_keys_256)
  806. /* %o0=key */
  807. VISEntry
  808. ldd [%o0 + 0xd8], %f8
  809. ldd [%o0 + 0xd0], %f10
  810. ldd [%o0 + 0xc8], %f12
  811. ldd [%o0 + 0xc0], %f14
  812. ldd [%o0 + 0xb8], %f16
  813. ldd [%o0 + 0xb0], %f18
  814. ldd [%o0 + 0xa8], %f20
  815. ldd [%o0 + 0xa0], %f22
  816. ldd [%o0 + 0x98], %f24
  817. ldd [%o0 + 0x90], %f26
  818. ldd [%o0 + 0x88], %f28
  819. ldd [%o0 + 0x80], %f30
  820. ldd [%o0 + 0x78], %f32
  821. ldd [%o0 + 0x70], %f34
  822. ldd [%o0 + 0x68], %f36
  823. ldd [%o0 + 0x60], %f38
  824. ldd [%o0 + 0x58], %f40
  825. ldd [%o0 + 0x50], %f42
  826. ldd [%o0 + 0x48], %f44
  827. ldd [%o0 + 0x40], %f46
  828. ldd [%o0 + 0x38], %f48
  829. ldd [%o0 + 0x30], %f50
  830. ldd [%o0 + 0x28], %f52
  831. ldd [%o0 + 0x20], %f54
  832. ldd [%o0 + 0x18], %f56
  833. ldd [%o0 + 0x10], %f58
  834. ldd [%o0 + 0x08], %f60
  835. retl
  836. ldd [%o0 + 0x00], %f62
  837. ENDPROC(aes_sparc64_load_decrypt_keys_256)
  838. .align 32
  839. ENTRY(aes_sparc64_ecb_encrypt_128)
  840. /* %o0=key, %o1=input, %o2=output, %o3=len */
  841. ldx [%o0 + 0x00], %g1
  842. subcc %o3, 0x10, %o3
  843. be 10f
  844. ldx [%o0 + 0x08], %g2
  845. 1: ldx [%o1 + 0x00], %g3
  846. ldx [%o1 + 0x08], %g7
  847. ldx [%o1 + 0x10], %o4
  848. ldx [%o1 + 0x18], %o5
  849. xor %g1, %g3, %g3
  850. xor %g2, %g7, %g7
  851. MOVXTOD_G3_F4
  852. MOVXTOD_G7_F6
  853. xor %g1, %o4, %g3
  854. xor %g2, %o5, %g7
  855. MOVXTOD_G3_F60
  856. MOVXTOD_G7_F62
  857. ENCRYPT_128_2(8, 4, 6, 60, 62, 0, 2, 56, 58)
  858. std %f4, [%o2 + 0x00]
  859. std %f6, [%o2 + 0x08]
  860. std %f60, [%o2 + 0x10]
  861. std %f62, [%o2 + 0x18]
  862. sub %o3, 0x20, %o3
  863. add %o1, 0x20, %o1
  864. brgz %o3, 1b
  865. add %o2, 0x20, %o2
  866. brlz,pt %o3, 11f
  867. nop
  868. 10: ldx [%o1 + 0x00], %g3
  869. ldx [%o1 + 0x08], %g7
  870. xor %g1, %g3, %g3
  871. xor %g2, %g7, %g7
  872. MOVXTOD_G3_F4
  873. MOVXTOD_G7_F6
  874. ENCRYPT_128(8, 4, 6, 0, 2)
  875. std %f4, [%o2 + 0x00]
  876. std %f6, [%o2 + 0x08]
  877. 11: retl
  878. nop
  879. ENDPROC(aes_sparc64_ecb_encrypt_128)
  880. .align 32
  881. ENTRY(aes_sparc64_ecb_encrypt_192)
  882. /* %o0=key, %o1=input, %o2=output, %o3=len */
  883. ldx [%o0 + 0x00], %g1
  884. subcc %o3, 0x10, %o3
  885. be 10f
  886. ldx [%o0 + 0x08], %g2
  887. 1: ldx [%o1 + 0x00], %g3
  888. ldx [%o1 + 0x08], %g7
  889. ldx [%o1 + 0x10], %o4
  890. ldx [%o1 + 0x18], %o5
  891. xor %g1, %g3, %g3
  892. xor %g2, %g7, %g7
  893. MOVXTOD_G3_F4
  894. MOVXTOD_G7_F6
  895. xor %g1, %o4, %g3
  896. xor %g2, %o5, %g7
  897. MOVXTOD_G3_F60
  898. MOVXTOD_G7_F62
  899. ENCRYPT_192_2(8, 4, 6, 60, 62, 0, 2, 56, 58)
  900. std %f4, [%o2 + 0x00]
  901. std %f6, [%o2 + 0x08]
  902. std %f60, [%o2 + 0x10]
  903. std %f62, [%o2 + 0x18]
  904. sub %o3, 0x20, %o3
  905. add %o1, 0x20, %o1
  906. brgz %o3, 1b
  907. add %o2, 0x20, %o2
  908. brlz,pt %o3, 11f
  909. nop
  910. 10: ldx [%o1 + 0x00], %g3
  911. ldx [%o1 + 0x08], %g7
  912. xor %g1, %g3, %g3
  913. xor %g2, %g7, %g7
  914. MOVXTOD_G3_F4
  915. MOVXTOD_G7_F6
  916. ENCRYPT_192(8, 4, 6, 0, 2)
  917. std %f4, [%o2 + 0x00]
  918. std %f6, [%o2 + 0x08]
  919. 11: retl
  920. nop
  921. ENDPROC(aes_sparc64_ecb_encrypt_192)
  922. .align 32
  923. ENTRY(aes_sparc64_ecb_encrypt_256)
  924. /* %o0=key, %o1=input, %o2=output, %o3=len */
  925. ldx [%o0 + 0x00], %g1
  926. subcc %o3, 0x10, %o3
  927. be 10f
  928. ldx [%o0 + 0x08], %g2
  929. 1: ldx [%o1 + 0x00], %g3
  930. ldx [%o1 + 0x08], %g7
  931. ldx [%o1 + 0x10], %o4
  932. ldx [%o1 + 0x18], %o5
  933. xor %g1, %g3, %g3
  934. xor %g2, %g7, %g7
  935. MOVXTOD_G3_F4
  936. MOVXTOD_G7_F6
  937. xor %g1, %o4, %g3
  938. xor %g2, %o5, %g7
  939. MOVXTOD_G3_F0
  940. MOVXTOD_G7_F2
  941. ENCRYPT_256_2(8, 4, 6, 0, 2)
  942. std %f4, [%o2 + 0x00]
  943. std %f6, [%o2 + 0x08]
  944. std %f0, [%o2 + 0x10]
  945. std %f2, [%o2 + 0x18]
  946. sub %o3, 0x20, %o3
  947. add %o1, 0x20, %o1
  948. brgz %o3, 1b
  949. add %o2, 0x20, %o2
  950. brlz,pt %o3, 11f
  951. nop
  952. 10: ldx [%o1 + 0x00], %g3
  953. ldx [%o1 + 0x08], %g7
  954. xor %g1, %g3, %g3
  955. xor %g2, %g7, %g7
  956. MOVXTOD_G3_F4
  957. MOVXTOD_G7_F6
  958. ENCRYPT_256(8, 4, 6, 0, 2)
  959. std %f4, [%o2 + 0x00]
  960. std %f6, [%o2 + 0x08]
  961. 11: retl
  962. nop
  963. ENDPROC(aes_sparc64_ecb_encrypt_256)
  964. .align 32
  965. ENTRY(aes_sparc64_ecb_decrypt_128)
  966. /* %o0=&key[key_len], %o1=input, %o2=output, %o3=len */
  967. ldx [%o0 - 0x10], %g1
  968. subcc %o3, 0x10, %o3
  969. be 10f
  970. ldx [%o0 - 0x08], %g2
  971. 1: ldx [%o1 + 0x00], %g3
  972. ldx [%o1 + 0x08], %g7
  973. ldx [%o1 + 0x10], %o4
  974. ldx [%o1 + 0x18], %o5
  975. xor %g1, %g3, %g3
  976. xor %g2, %g7, %g7
  977. MOVXTOD_G3_F4
  978. MOVXTOD_G7_F6
  979. xor %g1, %o4, %g3
  980. xor %g2, %o5, %g7
  981. MOVXTOD_G3_F60
  982. MOVXTOD_G7_F62
  983. DECRYPT_128_2(8, 4, 6, 60, 62, 0, 2, 56, 58)
  984. std %f4, [%o2 + 0x00]
  985. std %f6, [%o2 + 0x08]
  986. std %f60, [%o2 + 0x10]
  987. std %f62, [%o2 + 0x18]
  988. sub %o3, 0x20, %o3
  989. add %o1, 0x20, %o1
  990. brgz,pt %o3, 1b
  991. add %o2, 0x20, %o2
  992. brlz,pt %o3, 11f
  993. nop
  994. 10: ldx [%o1 + 0x00], %g3
  995. ldx [%o1 + 0x08], %g7
  996. xor %g1, %g3, %g3
  997. xor %g2, %g7, %g7
  998. MOVXTOD_G3_F4
  999. MOVXTOD_G7_F6
  1000. DECRYPT_128(8, 4, 6, 0, 2)
  1001. std %f4, [%o2 + 0x00]
  1002. std %f6, [%o2 + 0x08]
  1003. 11: retl
  1004. nop
  1005. ENDPROC(aes_sparc64_ecb_decrypt_128)
  1006. .align 32
  1007. ENTRY(aes_sparc64_ecb_decrypt_192)
  1008. /* %o0=&key[key_len], %o1=input, %o2=output, %o3=len */
  1009. ldx [%o0 - 0x10], %g1
  1010. subcc %o3, 0x10, %o3
  1011. be 10f
  1012. ldx [%o0 - 0x08], %g2
  1013. 1: ldx [%o1 + 0x00], %g3
  1014. ldx [%o1 + 0x08], %g7
  1015. ldx [%o1 + 0x10], %o4
  1016. ldx [%o1 + 0x18], %o5
  1017. xor %g1, %g3, %g3
  1018. xor %g2, %g7, %g7
  1019. MOVXTOD_G3_F4
  1020. MOVXTOD_G7_F6
  1021. xor %g1, %o4, %g3
  1022. xor %g2, %o5, %g7
  1023. MOVXTOD_G3_F60
  1024. MOVXTOD_G7_F62
  1025. DECRYPT_192_2(8, 4, 6, 60, 62, 0, 2, 56, 58)
  1026. std %f4, [%o2 + 0x00]
  1027. std %f6, [%o2 + 0x08]
  1028. std %f60, [%o2 + 0x10]
  1029. std %f62, [%o2 + 0x18]
  1030. sub %o3, 0x20, %o3
  1031. add %o1, 0x20, %o1
  1032. brgz,pt %o3, 1b
  1033. add %o2, 0x20, %o2
  1034. brlz,pt %o3, 11f
  1035. nop
  1036. 10: ldx [%o1 + 0x00], %g3
  1037. ldx [%o1 + 0x08], %g7
  1038. xor %g1, %g3, %g3
  1039. xor %g2, %g7, %g7
  1040. MOVXTOD_G3_F4
  1041. MOVXTOD_G7_F6
  1042. DECRYPT_192(8, 4, 6, 0, 2)
  1043. std %f4, [%o2 + 0x00]
  1044. std %f6, [%o2 + 0x08]
  1045. 11: retl
  1046. nop
  1047. ENDPROC(aes_sparc64_ecb_decrypt_192)
  1048. .align 32
  1049. ENTRY(aes_sparc64_ecb_decrypt_256)
  1050. /* %o0=&key[key_len], %o1=input, %o2=output, %o3=len */
  1051. ldx [%o0 - 0x10], %g1
  1052. subcc %o3, 0x10, %o3
  1053. be 10f
  1054. ldx [%o0 - 0x08], %g2
  1055. sub %o0, 0xf0, %o0
  1056. 1: ldx [%o1 + 0x00], %g3
  1057. ldx [%o1 + 0x08], %g7
  1058. ldx [%o1 + 0x10], %o4
  1059. ldx [%o1 + 0x18], %o5
  1060. xor %g1, %g3, %g3
  1061. xor %g2, %g7, %g7
  1062. MOVXTOD_G3_F4
  1063. MOVXTOD_G7_F6
  1064. xor %g1, %o4, %g3
  1065. xor %g2, %o5, %g7
  1066. MOVXTOD_G3_F0
  1067. MOVXTOD_G7_F2
  1068. DECRYPT_256_2(8, 4, 6, 0, 2)
  1069. std %f4, [%o2 + 0x00]
  1070. std %f6, [%o2 + 0x08]
  1071. std %f60, [%o2 + 0x10]
  1072. std %f62, [%o2 + 0x18]
  1073. sub %o3, 0x20, %o3
  1074. add %o1, 0x20, %o1
  1075. brgz,pt %o3, 1b
  1076. add %o2, 0x20, %o2
  1077. brlz,pt %o3, 11f
  1078. nop
  1079. 10: ldx [%o1 + 0x00], %g3
  1080. ldx [%o1 + 0x08], %g7
  1081. xor %g1, %g3, %g3
  1082. xor %g2, %g7, %g7
  1083. MOVXTOD_G3_F4
  1084. MOVXTOD_G7_F6
  1085. DECRYPT_256(8, 4, 6, 0, 2)
  1086. std %f4, [%o2 + 0x00]
  1087. std %f6, [%o2 + 0x08]
  1088. 11: retl
  1089. nop
  1090. ENDPROC(aes_sparc64_ecb_decrypt_256)
  1091. .align 32
  1092. ENTRY(aes_sparc64_cbc_encrypt_128)
  1093. /* %o0=key, %o1=input, %o2=output, %o3=len, %o4=IV */
  1094. ldd [%o4 + 0x00], %f4
  1095. ldd [%o4 + 0x08], %f6
  1096. ldx [%o0 + 0x00], %g1
  1097. ldx [%o0 + 0x08], %g2
  1098. 1: ldx [%o1 + 0x00], %g3
  1099. ldx [%o1 + 0x08], %g7
  1100. add %o1, 0x10, %o1
  1101. xor %g1, %g3, %g3
  1102. xor %g2, %g7, %g7
  1103. MOVXTOD_G3_F0
  1104. MOVXTOD_G7_F2
  1105. fxor %f4, %f0, %f4
  1106. fxor %f6, %f2, %f6
  1107. ENCRYPT_128(8, 4, 6, 0, 2)
  1108. std %f4, [%o2 + 0x00]
  1109. std %f6, [%o2 + 0x08]
  1110. subcc %o3, 0x10, %o3
  1111. bne,pt %xcc, 1b
  1112. add %o2, 0x10, %o2
  1113. std %f4, [%o4 + 0x00]
  1114. std %f6, [%o4 + 0x08]
  1115. retl
  1116. nop
  1117. ENDPROC(aes_sparc64_cbc_encrypt_128)
  1118. .align 32
  1119. ENTRY(aes_sparc64_cbc_encrypt_192)
  1120. /* %o0=key, %o1=input, %o2=output, %o3=len, %o4=IV */
  1121. ldd [%o4 + 0x00], %f4
  1122. ldd [%o4 + 0x08], %f6
  1123. ldx [%o0 + 0x00], %g1
  1124. ldx [%o0 + 0x08], %g2
  1125. 1: ldx [%o1 + 0x00], %g3
  1126. ldx [%o1 + 0x08], %g7
  1127. add %o1, 0x10, %o1
  1128. xor %g1, %g3, %g3
  1129. xor %g2, %g7, %g7
  1130. MOVXTOD_G3_F0
  1131. MOVXTOD_G7_F2
  1132. fxor %f4, %f0, %f4
  1133. fxor %f6, %f2, %f6
  1134. ENCRYPT_192(8, 4, 6, 0, 2)
  1135. std %f4, [%o2 + 0x00]
  1136. std %f6, [%o2 + 0x08]
  1137. subcc %o3, 0x10, %o3
  1138. bne,pt %xcc, 1b
  1139. add %o2, 0x10, %o2
  1140. std %f4, [%o4 + 0x00]
  1141. std %f6, [%o4 + 0x08]
  1142. retl
  1143. nop
  1144. ENDPROC(aes_sparc64_cbc_encrypt_192)
  1145. .align 32
  1146. ENTRY(aes_sparc64_cbc_encrypt_256)
  1147. /* %o0=key, %o1=input, %o2=output, %o3=len, %o4=IV */
  1148. ldd [%o4 + 0x00], %f4
  1149. ldd [%o4 + 0x08], %f6
  1150. ldx [%o0 + 0x00], %g1
  1151. ldx [%o0 + 0x08], %g2
  1152. 1: ldx [%o1 + 0x00], %g3
  1153. ldx [%o1 + 0x08], %g7
  1154. add %o1, 0x10, %o1
  1155. xor %g1, %g3, %g3
  1156. xor %g2, %g7, %g7
  1157. MOVXTOD_G3_F0
  1158. MOVXTOD_G7_F2
  1159. fxor %f4, %f0, %f4
  1160. fxor %f6, %f2, %f6
  1161. ENCRYPT_256(8, 4, 6, 0, 2)
  1162. std %f4, [%o2 + 0x00]
  1163. std %f6, [%o2 + 0x08]
  1164. subcc %o3, 0x10, %o3
  1165. bne,pt %xcc, 1b
  1166. add %o2, 0x10, %o2
  1167. std %f4, [%o4 + 0x00]
  1168. std %f6, [%o4 + 0x08]
  1169. retl
  1170. nop
  1171. ENDPROC(aes_sparc64_cbc_encrypt_256)
  1172. .align 32
  1173. ENTRY(aes_sparc64_cbc_decrypt_128)
  1174. /* %o0=&key[key_len], %o1=input, %o2=output, %o3=len, %o4=iv */
  1175. ldx [%o0 - 0x10], %g1
  1176. ldx [%o0 - 0x08], %g2
  1177. ldx [%o4 + 0x00], %o0
  1178. ldx [%o4 + 0x08], %o5
  1179. 1: ldx [%o1 + 0x00], %g3
  1180. ldx [%o1 + 0x08], %g7
  1181. add %o1, 0x10, %o1
  1182. xor %g1, %g3, %g3
  1183. xor %g2, %g7, %g7
  1184. MOVXTOD_G3_F4
  1185. MOVXTOD_G7_F6
  1186. DECRYPT_128(8, 4, 6, 0, 2)
  1187. MOVXTOD_O0_F0
  1188. MOVXTOD_O5_F2
  1189. xor %g1, %g3, %o0
  1190. xor %g2, %g7, %o5
  1191. fxor %f4, %f0, %f4
  1192. fxor %f6, %f2, %f6
  1193. std %f4, [%o2 + 0x00]
  1194. std %f6, [%o2 + 0x08]
  1195. subcc %o3, 0x10, %o3
  1196. bne,pt %xcc, 1b
  1197. add %o2, 0x10, %o2
  1198. stx %o0, [%o4 + 0x00]
  1199. stx %o5, [%o4 + 0x08]
  1200. retl
  1201. nop
  1202. ENDPROC(aes_sparc64_cbc_decrypt_128)
  1203. .align 32
  1204. ENTRY(aes_sparc64_cbc_decrypt_192)
  1205. /* %o0=&key[key_len], %o1=input, %o2=output, %o3=len, %o4=iv */
  1206. ldx [%o0 - 0x10], %g1
  1207. ldx [%o0 - 0x08], %g2
  1208. ldx [%o4 + 0x00], %o0
  1209. ldx [%o4 + 0x08], %o5
  1210. 1: ldx [%o1 + 0x00], %g3
  1211. ldx [%o1 + 0x08], %g7
  1212. add %o1, 0x10, %o1
  1213. xor %g1, %g3, %g3
  1214. xor %g2, %g7, %g7
  1215. MOVXTOD_G3_F4
  1216. MOVXTOD_G7_F6
  1217. DECRYPT_192(8, 4, 6, 0, 2)
  1218. MOVXTOD_O0_F0
  1219. MOVXTOD_O5_F2
  1220. xor %g1, %g3, %o0
  1221. xor %g2, %g7, %o5
  1222. fxor %f4, %f0, %f4
  1223. fxor %f6, %f2, %f6
  1224. std %f4, [%o2 + 0x00]
  1225. std %f6, [%o2 + 0x08]
  1226. subcc %o3, 0x10, %o3
  1227. bne,pt %xcc, 1b
  1228. add %o2, 0x10, %o2
  1229. stx %o0, [%o4 + 0x00]
  1230. stx %o5, [%o4 + 0x08]
  1231. retl
  1232. nop
  1233. ENDPROC(aes_sparc64_cbc_decrypt_192)
  1234. .align 32
  1235. ENTRY(aes_sparc64_cbc_decrypt_256)
  1236. /* %o0=&key[key_len], %o1=input, %o2=output, %o3=len, %o4=iv */
  1237. ldx [%o0 - 0x10], %g1
  1238. ldx [%o0 - 0x08], %g2
  1239. ldx [%o4 + 0x00], %o0
  1240. ldx [%o4 + 0x08], %o5
  1241. 1: ldx [%o1 + 0x00], %g3
  1242. ldx [%o1 + 0x08], %g7
  1243. add %o1, 0x10, %o1
  1244. xor %g1, %g3, %g3
  1245. xor %g2, %g7, %g7
  1246. MOVXTOD_G3_F4
  1247. MOVXTOD_G7_F6
  1248. DECRYPT_256(8, 4, 6, 0, 2)
  1249. MOVXTOD_O0_F0
  1250. MOVXTOD_O5_F2
  1251. xor %g1, %g3, %o0
  1252. xor %g2, %g7, %o5
  1253. fxor %f4, %f0, %f4
  1254. fxor %f6, %f2, %f6
  1255. std %f4, [%o2 + 0x00]
  1256. std %f6, [%o2 + 0x08]
  1257. subcc %o3, 0x10, %o3
  1258. bne,pt %xcc, 1b
  1259. add %o2, 0x10, %o2
  1260. stx %o0, [%o4 + 0x00]
  1261. stx %o5, [%o4 + 0x08]
  1262. retl
  1263. nop
  1264. ENDPROC(aes_sparc64_cbc_decrypt_256)
  1265. .align 32
  1266. ENTRY(aes_sparc64_ctr_crypt_128)
  1267. /* %o0=key, %o1=input, %o2=output, %o3=len, %o4=IV */
  1268. ldx [%o4 + 0x00], %g3
  1269. ldx [%o4 + 0x08], %g7
  1270. subcc %o3, 0x10, %o3
  1271. ldx [%o0 + 0x00], %g1
  1272. be 10f
  1273. ldx [%o0 + 0x08], %g2
  1274. 1: xor %g1, %g3, %o5
  1275. MOVXTOD_O5_F0
  1276. xor %g2, %g7, %o5
  1277. MOVXTOD_O5_F2
  1278. add %g7, 1, %g7
  1279. add %g3, 1, %o5
  1280. movrz %g7, %o5, %g3
  1281. xor %g1, %g3, %o5
  1282. MOVXTOD_O5_F4
  1283. xor %g2, %g7, %o5
  1284. MOVXTOD_O5_F6
  1285. add %g7, 1, %g7
  1286. add %g3, 1, %o5
  1287. movrz %g7, %o5, %g3
  1288. ENCRYPT_128_2(8, 0, 2, 4, 6, 56, 58, 60, 62)
  1289. ldd [%o1 + 0x00], %f56
  1290. ldd [%o1 + 0x08], %f58
  1291. ldd [%o1 + 0x10], %f60
  1292. ldd [%o1 + 0x18], %f62
  1293. fxor %f56, %f0, %f56
  1294. fxor %f58, %f2, %f58
  1295. fxor %f60, %f4, %f60
  1296. fxor %f62, %f6, %f62
  1297. std %f56, [%o2 + 0x00]
  1298. std %f58, [%o2 + 0x08]
  1299. std %f60, [%o2 + 0x10]
  1300. std %f62, [%o2 + 0x18]
  1301. subcc %o3, 0x20, %o3
  1302. add %o1, 0x20, %o1
  1303. brgz %o3, 1b
  1304. add %o2, 0x20, %o2
  1305. brlz,pt %o3, 11f
  1306. nop
  1307. 10: xor %g1, %g3, %o5
  1308. MOVXTOD_O5_F0
  1309. xor %g2, %g7, %o5
  1310. MOVXTOD_O5_F2
  1311. add %g7, 1, %g7
  1312. add %g3, 1, %o5
  1313. movrz %g7, %o5, %g3
  1314. ENCRYPT_128(8, 0, 2, 4, 6)
  1315. ldd [%o1 + 0x00], %f4
  1316. ldd [%o1 + 0x08], %f6
  1317. fxor %f4, %f0, %f4
  1318. fxor %f6, %f2, %f6
  1319. std %f4, [%o2 + 0x00]
  1320. std %f6, [%o2 + 0x08]
  1321. 11: stx %g3, [%o4 + 0x00]
  1322. retl
  1323. stx %g7, [%o4 + 0x08]
  1324. ENDPROC(aes_sparc64_ctr_crypt_128)
  1325. .align 32
  1326. ENTRY(aes_sparc64_ctr_crypt_192)
  1327. /* %o0=key, %o1=input, %o2=output, %o3=len, %o4=IV */
  1328. ldx [%o4 + 0x00], %g3
  1329. ldx [%o4 + 0x08], %g7
  1330. subcc %o3, 0x10, %o3
  1331. ldx [%o0 + 0x00], %g1
  1332. be 10f
  1333. ldx [%o0 + 0x08], %g2
  1334. 1: xor %g1, %g3, %o5
  1335. MOVXTOD_O5_F0
  1336. xor %g2, %g7, %o5
  1337. MOVXTOD_O5_F2
  1338. add %g7, 1, %g7
  1339. add %g3, 1, %o5
  1340. movrz %g7, %o5, %g3
  1341. xor %g1, %g3, %o5
  1342. MOVXTOD_O5_F4
  1343. xor %g2, %g7, %o5
  1344. MOVXTOD_O5_F6
  1345. add %g7, 1, %g7
  1346. add %g3, 1, %o5
  1347. movrz %g7, %o5, %g3
  1348. ENCRYPT_192_2(8, 0, 2, 4, 6, 56, 58, 60, 62)
  1349. ldd [%o1 + 0x00], %f56
  1350. ldd [%o1 + 0x08], %f58
  1351. ldd [%o1 + 0x10], %f60
  1352. ldd [%o1 + 0x18], %f62
  1353. fxor %f56, %f0, %f56
  1354. fxor %f58, %f2, %f58
  1355. fxor %f60, %f4, %f60
  1356. fxor %f62, %f6, %f62
  1357. std %f56, [%o2 + 0x00]
  1358. std %f58, [%o2 + 0x08]
  1359. std %f60, [%o2 + 0x10]
  1360. std %f62, [%o2 + 0x18]
  1361. subcc %o3, 0x20, %o3
  1362. add %o1, 0x20, %o1
  1363. brgz %o3, 1b
  1364. add %o2, 0x20, %o2
  1365. brlz,pt %o3, 11f
  1366. nop
  1367. 10: xor %g1, %g3, %o5
  1368. MOVXTOD_O5_F0
  1369. xor %g2, %g7, %o5
  1370. MOVXTOD_O5_F2
  1371. add %g7, 1, %g7
  1372. add %g3, 1, %o5
  1373. movrz %g7, %o5, %g3
  1374. ENCRYPT_192(8, 0, 2, 4, 6)
  1375. ldd [%o1 + 0x00], %f4
  1376. ldd [%o1 + 0x08], %f6
  1377. fxor %f4, %f0, %f4
  1378. fxor %f6, %f2, %f6
  1379. std %f4, [%o2 + 0x00]
  1380. std %f6, [%o2 + 0x08]
  1381. 11: stx %g3, [%o4 + 0x00]
  1382. retl
  1383. stx %g7, [%o4 + 0x08]
  1384. ENDPROC(aes_sparc64_ctr_crypt_192)
  1385. .align 32
  1386. ENTRY(aes_sparc64_ctr_crypt_256)
  1387. /* %o0=key, %o1=input, %o2=output, %o3=len, %o4=IV */
  1388. ldx [%o4 + 0x00], %g3
  1389. ldx [%o4 + 0x08], %g7
  1390. subcc %o3, 0x10, %o3
  1391. ldx [%o0 + 0x00], %g1
  1392. be 10f
  1393. ldx [%o0 + 0x08], %g2
  1394. 1: xor %g1, %g3, %o5
  1395. MOVXTOD_O5_F0
  1396. xor %g2, %g7, %o5
  1397. MOVXTOD_O5_F2
  1398. add %g7, 1, %g7
  1399. add %g3, 1, %o5
  1400. movrz %g7, %o5, %g3
  1401. xor %g1, %g3, %o5
  1402. MOVXTOD_O5_F4
  1403. xor %g2, %g7, %o5
  1404. MOVXTOD_O5_F6
  1405. add %g7, 1, %g7
  1406. add %g3, 1, %o5
  1407. movrz %g7, %o5, %g3
  1408. ENCRYPT_256_2(8, 0, 2, 4, 6)
  1409. ldd [%o1 + 0x00], %f56
  1410. ldd [%o1 + 0x08], %f58
  1411. ldd [%o1 + 0x10], %f60
  1412. ldd [%o1 + 0x18], %f62
  1413. fxor %f56, %f0, %f56
  1414. fxor %f58, %f2, %f58
  1415. fxor %f60, %f4, %f60
  1416. fxor %f62, %f6, %f62
  1417. std %f56, [%o2 + 0x00]
  1418. std %f58, [%o2 + 0x08]
  1419. std %f60, [%o2 + 0x10]
  1420. std %f62, [%o2 + 0x18]
  1421. subcc %o3, 0x20, %o3
  1422. add %o1, 0x20, %o1
  1423. brgz %o3, 1b
  1424. add %o2, 0x20, %o2
  1425. brlz,pt %o3, 11f
  1426. nop
  1427. 10: xor %g1, %g3, %o5
  1428. MOVXTOD_O5_F0
  1429. xor %g2, %g7, %o5
  1430. MOVXTOD_O5_F2
  1431. add %g7, 1, %g7
  1432. add %g3, 1, %o5
  1433. movrz %g7, %o5, %g3
  1434. ENCRYPT_256(8, 0, 2, 4, 6)
  1435. ldd [%o1 + 0x00], %f4
  1436. ldd [%o1 + 0x08], %f6
  1437. fxor %f4, %f0, %f4
  1438. fxor %f6, %f2, %f6
  1439. std %f4, [%o2 + 0x00]
  1440. std %f6, [%o2 + 0x08]
  1441. 11: stx %g3, [%o4 + 0x00]
  1442. retl
  1443. stx %g7, [%o4 + 0x08]
  1444. ENDPROC(aes_sparc64_ctr_crypt_256)