serpent_avx2_glue.c 16 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562
  1. /*
  2. * Glue Code for x86_64/AVX2 assembler optimized version of Serpent
  3. *
  4. * Copyright © 2012-2013 Jussi Kivilinna <jussi.kivilinna@mbnet.fi>
  5. *
  6. * This program is free software; you can redistribute it and/or modify
  7. * it under the terms of the GNU General Public License as published by
  8. * the Free Software Foundation; either version 2 of the License, or
  9. * (at your option) any later version.
  10. *
  11. */
  12. #include <linux/module.h>
  13. #include <linux/types.h>
  14. #include <linux/crypto.h>
  15. #include <linux/err.h>
  16. #include <crypto/algapi.h>
  17. #include <crypto/ctr.h>
  18. #include <crypto/lrw.h>
  19. #include <crypto/xts.h>
  20. #include <crypto/serpent.h>
  21. #include <asm/xcr.h>
  22. #include <asm/xsave.h>
  23. #include <asm/crypto/serpent-avx.h>
  24. #include <asm/crypto/ablk_helper.h>
  25. #include <asm/crypto/glue_helper.h>
  26. #define SERPENT_AVX2_PARALLEL_BLOCKS 16
  27. /* 16-way AVX2 parallel cipher functions */
  28. asmlinkage void serpent_ecb_enc_16way(struct serpent_ctx *ctx, u8 *dst,
  29. const u8 *src);
  30. asmlinkage void serpent_ecb_dec_16way(struct serpent_ctx *ctx, u8 *dst,
  31. const u8 *src);
  32. asmlinkage void serpent_cbc_dec_16way(void *ctx, u128 *dst, const u128 *src);
  33. asmlinkage void serpent_ctr_16way(void *ctx, u128 *dst, const u128 *src,
  34. le128 *iv);
  35. asmlinkage void serpent_xts_enc_16way(struct serpent_ctx *ctx, u8 *dst,
  36. const u8 *src, le128 *iv);
  37. asmlinkage void serpent_xts_dec_16way(struct serpent_ctx *ctx, u8 *dst,
  38. const u8 *src, le128 *iv);
  39. static const struct common_glue_ctx serpent_enc = {
  40. .num_funcs = 3,
  41. .fpu_blocks_limit = 8,
  42. .funcs = { {
  43. .num_blocks = 16,
  44. .fn_u = { .ecb = GLUE_FUNC_CAST(serpent_ecb_enc_16way) }
  45. }, {
  46. .num_blocks = 8,
  47. .fn_u = { .ecb = GLUE_FUNC_CAST(serpent_ecb_enc_8way_avx) }
  48. }, {
  49. .num_blocks = 1,
  50. .fn_u = { .ecb = GLUE_FUNC_CAST(__serpent_encrypt) }
  51. } }
  52. };
  53. static const struct common_glue_ctx serpent_ctr = {
  54. .num_funcs = 3,
  55. .fpu_blocks_limit = 8,
  56. .funcs = { {
  57. .num_blocks = 16,
  58. .fn_u = { .ctr = GLUE_CTR_FUNC_CAST(serpent_ctr_16way) }
  59. }, {
  60. .num_blocks = 8,
  61. .fn_u = { .ctr = GLUE_CTR_FUNC_CAST(serpent_ctr_8way_avx) }
  62. }, {
  63. .num_blocks = 1,
  64. .fn_u = { .ctr = GLUE_CTR_FUNC_CAST(__serpent_crypt_ctr) }
  65. } }
  66. };
  67. static const struct common_glue_ctx serpent_enc_xts = {
  68. .num_funcs = 3,
  69. .fpu_blocks_limit = 8,
  70. .funcs = { {
  71. .num_blocks = 16,
  72. .fn_u = { .xts = GLUE_XTS_FUNC_CAST(serpent_xts_enc_16way) }
  73. }, {
  74. .num_blocks = 8,
  75. .fn_u = { .xts = GLUE_XTS_FUNC_CAST(serpent_xts_enc_8way_avx) }
  76. }, {
  77. .num_blocks = 1,
  78. .fn_u = { .xts = GLUE_XTS_FUNC_CAST(serpent_xts_enc) }
  79. } }
  80. };
  81. static const struct common_glue_ctx serpent_dec = {
  82. .num_funcs = 3,
  83. .fpu_blocks_limit = 8,
  84. .funcs = { {
  85. .num_blocks = 16,
  86. .fn_u = { .ecb = GLUE_FUNC_CAST(serpent_ecb_dec_16way) }
  87. }, {
  88. .num_blocks = 8,
  89. .fn_u = { .ecb = GLUE_FUNC_CAST(serpent_ecb_dec_8way_avx) }
  90. }, {
  91. .num_blocks = 1,
  92. .fn_u = { .ecb = GLUE_FUNC_CAST(__serpent_decrypt) }
  93. } }
  94. };
  95. static const struct common_glue_ctx serpent_dec_cbc = {
  96. .num_funcs = 3,
  97. .fpu_blocks_limit = 8,
  98. .funcs = { {
  99. .num_blocks = 16,
  100. .fn_u = { .cbc = GLUE_CBC_FUNC_CAST(serpent_cbc_dec_16way) }
  101. }, {
  102. .num_blocks = 8,
  103. .fn_u = { .cbc = GLUE_CBC_FUNC_CAST(serpent_cbc_dec_8way_avx) }
  104. }, {
  105. .num_blocks = 1,
  106. .fn_u = { .cbc = GLUE_CBC_FUNC_CAST(__serpent_decrypt) }
  107. } }
  108. };
  109. static const struct common_glue_ctx serpent_dec_xts = {
  110. .num_funcs = 3,
  111. .fpu_blocks_limit = 8,
  112. .funcs = { {
  113. .num_blocks = 16,
  114. .fn_u = { .xts = GLUE_XTS_FUNC_CAST(serpent_xts_dec_16way) }
  115. }, {
  116. .num_blocks = 8,
  117. .fn_u = { .xts = GLUE_XTS_FUNC_CAST(serpent_xts_dec_8way_avx) }
  118. }, {
  119. .num_blocks = 1,
  120. .fn_u = { .xts = GLUE_XTS_FUNC_CAST(serpent_xts_dec) }
  121. } }
  122. };
  123. static int ecb_encrypt(struct blkcipher_desc *desc, struct scatterlist *dst,
  124. struct scatterlist *src, unsigned int nbytes)
  125. {
  126. return glue_ecb_crypt_128bit(&serpent_enc, desc, dst, src, nbytes);
  127. }
  128. static int ecb_decrypt(struct blkcipher_desc *desc, struct scatterlist *dst,
  129. struct scatterlist *src, unsigned int nbytes)
  130. {
  131. return glue_ecb_crypt_128bit(&serpent_dec, desc, dst, src, nbytes);
  132. }
  133. static int cbc_encrypt(struct blkcipher_desc *desc, struct scatterlist *dst,
  134. struct scatterlist *src, unsigned int nbytes)
  135. {
  136. return glue_cbc_encrypt_128bit(GLUE_FUNC_CAST(__serpent_encrypt), desc,
  137. dst, src, nbytes);
  138. }
  139. static int cbc_decrypt(struct blkcipher_desc *desc, struct scatterlist *dst,
  140. struct scatterlist *src, unsigned int nbytes)
  141. {
  142. return glue_cbc_decrypt_128bit(&serpent_dec_cbc, desc, dst, src,
  143. nbytes);
  144. }
  145. static int ctr_crypt(struct blkcipher_desc *desc, struct scatterlist *dst,
  146. struct scatterlist *src, unsigned int nbytes)
  147. {
  148. return glue_ctr_crypt_128bit(&serpent_ctr, desc, dst, src, nbytes);
  149. }
  150. static inline bool serpent_fpu_begin(bool fpu_enabled, unsigned int nbytes)
  151. {
  152. /* since reusing AVX functions, starts using FPU at 8 parallel blocks */
  153. return glue_fpu_begin(SERPENT_BLOCK_SIZE, 8, NULL, fpu_enabled, nbytes);
  154. }
  155. static inline void serpent_fpu_end(bool fpu_enabled)
  156. {
  157. glue_fpu_end(fpu_enabled);
  158. }
  159. struct crypt_priv {
  160. struct serpent_ctx *ctx;
  161. bool fpu_enabled;
  162. };
  163. static void encrypt_callback(void *priv, u8 *srcdst, unsigned int nbytes)
  164. {
  165. const unsigned int bsize = SERPENT_BLOCK_SIZE;
  166. struct crypt_priv *ctx = priv;
  167. int i;
  168. ctx->fpu_enabled = serpent_fpu_begin(ctx->fpu_enabled, nbytes);
  169. if (nbytes >= SERPENT_AVX2_PARALLEL_BLOCKS * bsize) {
  170. serpent_ecb_enc_16way(ctx->ctx, srcdst, srcdst);
  171. srcdst += bsize * SERPENT_AVX2_PARALLEL_BLOCKS;
  172. nbytes -= bsize * SERPENT_AVX2_PARALLEL_BLOCKS;
  173. }
  174. while (nbytes >= SERPENT_PARALLEL_BLOCKS * bsize) {
  175. serpent_ecb_enc_8way_avx(ctx->ctx, srcdst, srcdst);
  176. srcdst += bsize * SERPENT_PARALLEL_BLOCKS;
  177. nbytes -= bsize * SERPENT_PARALLEL_BLOCKS;
  178. }
  179. for (i = 0; i < nbytes / bsize; i++, srcdst += bsize)
  180. __serpent_encrypt(ctx->ctx, srcdst, srcdst);
  181. }
  182. static void decrypt_callback(void *priv, u8 *srcdst, unsigned int nbytes)
  183. {
  184. const unsigned int bsize = SERPENT_BLOCK_SIZE;
  185. struct crypt_priv *ctx = priv;
  186. int i;
  187. ctx->fpu_enabled = serpent_fpu_begin(ctx->fpu_enabled, nbytes);
  188. if (nbytes >= SERPENT_AVX2_PARALLEL_BLOCKS * bsize) {
  189. serpent_ecb_dec_16way(ctx->ctx, srcdst, srcdst);
  190. srcdst += bsize * SERPENT_AVX2_PARALLEL_BLOCKS;
  191. nbytes -= bsize * SERPENT_AVX2_PARALLEL_BLOCKS;
  192. }
  193. while (nbytes >= SERPENT_PARALLEL_BLOCKS * bsize) {
  194. serpent_ecb_dec_8way_avx(ctx->ctx, srcdst, srcdst);
  195. srcdst += bsize * SERPENT_PARALLEL_BLOCKS;
  196. nbytes -= bsize * SERPENT_PARALLEL_BLOCKS;
  197. }
  198. for (i = 0; i < nbytes / bsize; i++, srcdst += bsize)
  199. __serpent_decrypt(ctx->ctx, srcdst, srcdst);
  200. }
  201. static int lrw_encrypt(struct blkcipher_desc *desc, struct scatterlist *dst,
  202. struct scatterlist *src, unsigned int nbytes)
  203. {
  204. struct serpent_lrw_ctx *ctx = crypto_blkcipher_ctx(desc->tfm);
  205. be128 buf[SERPENT_AVX2_PARALLEL_BLOCKS];
  206. struct crypt_priv crypt_ctx = {
  207. .ctx = &ctx->serpent_ctx,
  208. .fpu_enabled = false,
  209. };
  210. struct lrw_crypt_req req = {
  211. .tbuf = buf,
  212. .tbuflen = sizeof(buf),
  213. .table_ctx = &ctx->lrw_table,
  214. .crypt_ctx = &crypt_ctx,
  215. .crypt_fn = encrypt_callback,
  216. };
  217. int ret;
  218. desc->flags &= ~CRYPTO_TFM_REQ_MAY_SLEEP;
  219. ret = lrw_crypt(desc, dst, src, nbytes, &req);
  220. serpent_fpu_end(crypt_ctx.fpu_enabled);
  221. return ret;
  222. }
  223. static int lrw_decrypt(struct blkcipher_desc *desc, struct scatterlist *dst,
  224. struct scatterlist *src, unsigned int nbytes)
  225. {
  226. struct serpent_lrw_ctx *ctx = crypto_blkcipher_ctx(desc->tfm);
  227. be128 buf[SERPENT_AVX2_PARALLEL_BLOCKS];
  228. struct crypt_priv crypt_ctx = {
  229. .ctx = &ctx->serpent_ctx,
  230. .fpu_enabled = false,
  231. };
  232. struct lrw_crypt_req req = {
  233. .tbuf = buf,
  234. .tbuflen = sizeof(buf),
  235. .table_ctx = &ctx->lrw_table,
  236. .crypt_ctx = &crypt_ctx,
  237. .crypt_fn = decrypt_callback,
  238. };
  239. int ret;
  240. desc->flags &= ~CRYPTO_TFM_REQ_MAY_SLEEP;
  241. ret = lrw_crypt(desc, dst, src, nbytes, &req);
  242. serpent_fpu_end(crypt_ctx.fpu_enabled);
  243. return ret;
  244. }
  245. static int xts_encrypt(struct blkcipher_desc *desc, struct scatterlist *dst,
  246. struct scatterlist *src, unsigned int nbytes)
  247. {
  248. struct serpent_xts_ctx *ctx = crypto_blkcipher_ctx(desc->tfm);
  249. return glue_xts_crypt_128bit(&serpent_enc_xts, desc, dst, src, nbytes,
  250. XTS_TWEAK_CAST(__serpent_encrypt),
  251. &ctx->tweak_ctx, &ctx->crypt_ctx);
  252. }
  253. static int xts_decrypt(struct blkcipher_desc *desc, struct scatterlist *dst,
  254. struct scatterlist *src, unsigned int nbytes)
  255. {
  256. struct serpent_xts_ctx *ctx = crypto_blkcipher_ctx(desc->tfm);
  257. return glue_xts_crypt_128bit(&serpent_dec_xts, desc, dst, src, nbytes,
  258. XTS_TWEAK_CAST(__serpent_encrypt),
  259. &ctx->tweak_ctx, &ctx->crypt_ctx);
  260. }
  261. static struct crypto_alg srp_algs[10] = { {
  262. .cra_name = "__ecb-serpent-avx2",
  263. .cra_driver_name = "__driver-ecb-serpent-avx2",
  264. .cra_priority = 0,
  265. .cra_flags = CRYPTO_ALG_TYPE_BLKCIPHER,
  266. .cra_blocksize = SERPENT_BLOCK_SIZE,
  267. .cra_ctxsize = sizeof(struct serpent_ctx),
  268. .cra_alignmask = 0,
  269. .cra_type = &crypto_blkcipher_type,
  270. .cra_module = THIS_MODULE,
  271. .cra_list = LIST_HEAD_INIT(srp_algs[0].cra_list),
  272. .cra_u = {
  273. .blkcipher = {
  274. .min_keysize = SERPENT_MIN_KEY_SIZE,
  275. .max_keysize = SERPENT_MAX_KEY_SIZE,
  276. .setkey = serpent_setkey,
  277. .encrypt = ecb_encrypt,
  278. .decrypt = ecb_decrypt,
  279. },
  280. },
  281. }, {
  282. .cra_name = "__cbc-serpent-avx2",
  283. .cra_driver_name = "__driver-cbc-serpent-avx2",
  284. .cra_priority = 0,
  285. .cra_flags = CRYPTO_ALG_TYPE_BLKCIPHER,
  286. .cra_blocksize = SERPENT_BLOCK_SIZE,
  287. .cra_ctxsize = sizeof(struct serpent_ctx),
  288. .cra_alignmask = 0,
  289. .cra_type = &crypto_blkcipher_type,
  290. .cra_module = THIS_MODULE,
  291. .cra_list = LIST_HEAD_INIT(srp_algs[1].cra_list),
  292. .cra_u = {
  293. .blkcipher = {
  294. .min_keysize = SERPENT_MIN_KEY_SIZE,
  295. .max_keysize = SERPENT_MAX_KEY_SIZE,
  296. .setkey = serpent_setkey,
  297. .encrypt = cbc_encrypt,
  298. .decrypt = cbc_decrypt,
  299. },
  300. },
  301. }, {
  302. .cra_name = "__ctr-serpent-avx2",
  303. .cra_driver_name = "__driver-ctr-serpent-avx2",
  304. .cra_priority = 0,
  305. .cra_flags = CRYPTO_ALG_TYPE_BLKCIPHER,
  306. .cra_blocksize = 1,
  307. .cra_ctxsize = sizeof(struct serpent_ctx),
  308. .cra_alignmask = 0,
  309. .cra_type = &crypto_blkcipher_type,
  310. .cra_module = THIS_MODULE,
  311. .cra_list = LIST_HEAD_INIT(srp_algs[2].cra_list),
  312. .cra_u = {
  313. .blkcipher = {
  314. .min_keysize = SERPENT_MIN_KEY_SIZE,
  315. .max_keysize = SERPENT_MAX_KEY_SIZE,
  316. .ivsize = SERPENT_BLOCK_SIZE,
  317. .setkey = serpent_setkey,
  318. .encrypt = ctr_crypt,
  319. .decrypt = ctr_crypt,
  320. },
  321. },
  322. }, {
  323. .cra_name = "__lrw-serpent-avx2",
  324. .cra_driver_name = "__driver-lrw-serpent-avx2",
  325. .cra_priority = 0,
  326. .cra_flags = CRYPTO_ALG_TYPE_BLKCIPHER,
  327. .cra_blocksize = SERPENT_BLOCK_SIZE,
  328. .cra_ctxsize = sizeof(struct serpent_lrw_ctx),
  329. .cra_alignmask = 0,
  330. .cra_type = &crypto_blkcipher_type,
  331. .cra_module = THIS_MODULE,
  332. .cra_list = LIST_HEAD_INIT(srp_algs[3].cra_list),
  333. .cra_exit = lrw_serpent_exit_tfm,
  334. .cra_u = {
  335. .blkcipher = {
  336. .min_keysize = SERPENT_MIN_KEY_SIZE +
  337. SERPENT_BLOCK_SIZE,
  338. .max_keysize = SERPENT_MAX_KEY_SIZE +
  339. SERPENT_BLOCK_SIZE,
  340. .ivsize = SERPENT_BLOCK_SIZE,
  341. .setkey = lrw_serpent_setkey,
  342. .encrypt = lrw_encrypt,
  343. .decrypt = lrw_decrypt,
  344. },
  345. },
  346. }, {
  347. .cra_name = "__xts-serpent-avx2",
  348. .cra_driver_name = "__driver-xts-serpent-avx2",
  349. .cra_priority = 0,
  350. .cra_flags = CRYPTO_ALG_TYPE_BLKCIPHER,
  351. .cra_blocksize = SERPENT_BLOCK_SIZE,
  352. .cra_ctxsize = sizeof(struct serpent_xts_ctx),
  353. .cra_alignmask = 0,
  354. .cra_type = &crypto_blkcipher_type,
  355. .cra_module = THIS_MODULE,
  356. .cra_list = LIST_HEAD_INIT(srp_algs[4].cra_list),
  357. .cra_u = {
  358. .blkcipher = {
  359. .min_keysize = SERPENT_MIN_KEY_SIZE * 2,
  360. .max_keysize = SERPENT_MAX_KEY_SIZE * 2,
  361. .ivsize = SERPENT_BLOCK_SIZE,
  362. .setkey = xts_serpent_setkey,
  363. .encrypt = xts_encrypt,
  364. .decrypt = xts_decrypt,
  365. },
  366. },
  367. }, {
  368. .cra_name = "ecb(serpent)",
  369. .cra_driver_name = "ecb-serpent-avx2",
  370. .cra_priority = 600,
  371. .cra_flags = CRYPTO_ALG_TYPE_ABLKCIPHER | CRYPTO_ALG_ASYNC,
  372. .cra_blocksize = SERPENT_BLOCK_SIZE,
  373. .cra_ctxsize = sizeof(struct async_helper_ctx),
  374. .cra_alignmask = 0,
  375. .cra_type = &crypto_ablkcipher_type,
  376. .cra_module = THIS_MODULE,
  377. .cra_list = LIST_HEAD_INIT(srp_algs[5].cra_list),
  378. .cra_init = ablk_init,
  379. .cra_exit = ablk_exit,
  380. .cra_u = {
  381. .ablkcipher = {
  382. .min_keysize = SERPENT_MIN_KEY_SIZE,
  383. .max_keysize = SERPENT_MAX_KEY_SIZE,
  384. .setkey = ablk_set_key,
  385. .encrypt = ablk_encrypt,
  386. .decrypt = ablk_decrypt,
  387. },
  388. },
  389. }, {
  390. .cra_name = "cbc(serpent)",
  391. .cra_driver_name = "cbc-serpent-avx2",
  392. .cra_priority = 600,
  393. .cra_flags = CRYPTO_ALG_TYPE_ABLKCIPHER | CRYPTO_ALG_ASYNC,
  394. .cra_blocksize = SERPENT_BLOCK_SIZE,
  395. .cra_ctxsize = sizeof(struct async_helper_ctx),
  396. .cra_alignmask = 0,
  397. .cra_type = &crypto_ablkcipher_type,
  398. .cra_module = THIS_MODULE,
  399. .cra_list = LIST_HEAD_INIT(srp_algs[6].cra_list),
  400. .cra_init = ablk_init,
  401. .cra_exit = ablk_exit,
  402. .cra_u = {
  403. .ablkcipher = {
  404. .min_keysize = SERPENT_MIN_KEY_SIZE,
  405. .max_keysize = SERPENT_MAX_KEY_SIZE,
  406. .ivsize = SERPENT_BLOCK_SIZE,
  407. .setkey = ablk_set_key,
  408. .encrypt = __ablk_encrypt,
  409. .decrypt = ablk_decrypt,
  410. },
  411. },
  412. }, {
  413. .cra_name = "ctr(serpent)",
  414. .cra_driver_name = "ctr-serpent-avx2",
  415. .cra_priority = 600,
  416. .cra_flags = CRYPTO_ALG_TYPE_ABLKCIPHER | CRYPTO_ALG_ASYNC,
  417. .cra_blocksize = 1,
  418. .cra_ctxsize = sizeof(struct async_helper_ctx),
  419. .cra_alignmask = 0,
  420. .cra_type = &crypto_ablkcipher_type,
  421. .cra_module = THIS_MODULE,
  422. .cra_list = LIST_HEAD_INIT(srp_algs[7].cra_list),
  423. .cra_init = ablk_init,
  424. .cra_exit = ablk_exit,
  425. .cra_u = {
  426. .ablkcipher = {
  427. .min_keysize = SERPENT_MIN_KEY_SIZE,
  428. .max_keysize = SERPENT_MAX_KEY_SIZE,
  429. .ivsize = SERPENT_BLOCK_SIZE,
  430. .setkey = ablk_set_key,
  431. .encrypt = ablk_encrypt,
  432. .decrypt = ablk_encrypt,
  433. .geniv = "chainiv",
  434. },
  435. },
  436. }, {
  437. .cra_name = "lrw(serpent)",
  438. .cra_driver_name = "lrw-serpent-avx2",
  439. .cra_priority = 600,
  440. .cra_flags = CRYPTO_ALG_TYPE_ABLKCIPHER | CRYPTO_ALG_ASYNC,
  441. .cra_blocksize = SERPENT_BLOCK_SIZE,
  442. .cra_ctxsize = sizeof(struct async_helper_ctx),
  443. .cra_alignmask = 0,
  444. .cra_type = &crypto_ablkcipher_type,
  445. .cra_module = THIS_MODULE,
  446. .cra_list = LIST_HEAD_INIT(srp_algs[8].cra_list),
  447. .cra_init = ablk_init,
  448. .cra_exit = ablk_exit,
  449. .cra_u = {
  450. .ablkcipher = {
  451. .min_keysize = SERPENT_MIN_KEY_SIZE +
  452. SERPENT_BLOCK_SIZE,
  453. .max_keysize = SERPENT_MAX_KEY_SIZE +
  454. SERPENT_BLOCK_SIZE,
  455. .ivsize = SERPENT_BLOCK_SIZE,
  456. .setkey = ablk_set_key,
  457. .encrypt = ablk_encrypt,
  458. .decrypt = ablk_decrypt,
  459. },
  460. },
  461. }, {
  462. .cra_name = "xts(serpent)",
  463. .cra_driver_name = "xts-serpent-avx2",
  464. .cra_priority = 600,
  465. .cra_flags = CRYPTO_ALG_TYPE_ABLKCIPHER | CRYPTO_ALG_ASYNC,
  466. .cra_blocksize = SERPENT_BLOCK_SIZE,
  467. .cra_ctxsize = sizeof(struct async_helper_ctx),
  468. .cra_alignmask = 0,
  469. .cra_type = &crypto_ablkcipher_type,
  470. .cra_module = THIS_MODULE,
  471. .cra_list = LIST_HEAD_INIT(srp_algs[9].cra_list),
  472. .cra_init = ablk_init,
  473. .cra_exit = ablk_exit,
  474. .cra_u = {
  475. .ablkcipher = {
  476. .min_keysize = SERPENT_MIN_KEY_SIZE * 2,
  477. .max_keysize = SERPENT_MAX_KEY_SIZE * 2,
  478. .ivsize = SERPENT_BLOCK_SIZE,
  479. .setkey = ablk_set_key,
  480. .encrypt = ablk_encrypt,
  481. .decrypt = ablk_decrypt,
  482. },
  483. },
  484. } };
  485. static int __init init(void)
  486. {
  487. u64 xcr0;
  488. if (!cpu_has_avx2 || !cpu_has_osxsave) {
  489. pr_info("AVX2 instructions are not detected.\n");
  490. return -ENODEV;
  491. }
  492. xcr0 = xgetbv(XCR_XFEATURE_ENABLED_MASK);
  493. if ((xcr0 & (XSTATE_SSE | XSTATE_YMM)) != (XSTATE_SSE | XSTATE_YMM)) {
  494. pr_info("AVX detected but unusable.\n");
  495. return -ENODEV;
  496. }
  497. return crypto_register_algs(srp_algs, ARRAY_SIZE(srp_algs));
  498. }
  499. static void __exit fini(void)
  500. {
  501. crypto_unregister_algs(srp_algs, ARRAY_SIZE(srp_algs));
  502. }
  503. module_init(init);
  504. module_exit(fini);
  505. MODULE_LICENSE("GPL");
  506. MODULE_DESCRIPTION("Serpent Cipher Algorithm, AVX2 optimized");
  507. MODULE_ALIAS("serpent");
  508. MODULE_ALIAS("serpent-asm");