sha512_ssse3_glue.c 8.9 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347
  1. /*
  2. * Cryptographic API.
  3. *
  4. * Glue code for the SHA512 Secure Hash Algorithm assembler
  5. * implementation using supplemental SSE3 / AVX / AVX2 instructions.
  6. *
  7. * This file is based on sha512_generic.c
  8. *
  9. * Copyright (C) 2013 Intel Corporation
  10. * Author: Tim Chen <[email protected]>
  11. *
  12. * This program is free software; you can redistribute it and/or modify it
  13. * under the terms of the GNU General Public License as published by the Free
  14. * Software Foundation; either version 2 of the License, or (at your option)
  15. * any later version.
  16. *
  17. * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
  18. * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
  19. * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
  20. * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
  21. * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
  22. * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
  23. * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
  24. * SOFTWARE.
  25. *
  26. */
  27. #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
  28. #include <crypto/internal/hash.h>
  29. #include <crypto/internal/simd.h>
  30. #include <linux/init.h>
  31. #include <linux/module.h>
  32. #include <linux/mm.h>
  33. #include <linux/string.h>
  34. #include <linux/types.h>
  35. #include <crypto/sha2.h>
  36. #include <crypto/sha512_base.h>
  37. #include <asm/cpu_device_id.h>
  38. #include <asm/simd.h>
  39. asmlinkage void sha512_transform_ssse3(struct sha512_state *state,
  40. const u8 *data, int blocks);
  41. static int sha512_update(struct shash_desc *desc, const u8 *data,
  42. unsigned int len, sha512_block_fn *sha512_xform)
  43. {
  44. struct sha512_state *sctx = shash_desc_ctx(desc);
  45. if (!crypto_simd_usable() ||
  46. (sctx->count[0] % SHA512_BLOCK_SIZE) + len < SHA512_BLOCK_SIZE)
  47. return crypto_sha512_update(desc, data, len);
  48. /*
  49. * Make sure struct sha512_state begins directly with the SHA512
  50. * 512-bit internal state, as this is what the asm functions expect.
  51. */
  52. BUILD_BUG_ON(offsetof(struct sha512_state, state) != 0);
  53. kernel_fpu_begin();
  54. sha512_base_do_update(desc, data, len, sha512_xform);
  55. kernel_fpu_end();
  56. return 0;
  57. }
  58. static int sha512_finup(struct shash_desc *desc, const u8 *data,
  59. unsigned int len, u8 *out, sha512_block_fn *sha512_xform)
  60. {
  61. if (!crypto_simd_usable())
  62. return crypto_sha512_finup(desc, data, len, out);
  63. kernel_fpu_begin();
  64. if (len)
  65. sha512_base_do_update(desc, data, len, sha512_xform);
  66. sha512_base_do_finalize(desc, sha512_xform);
  67. kernel_fpu_end();
  68. return sha512_base_finish(desc, out);
  69. }
  70. static int sha512_ssse3_update(struct shash_desc *desc, const u8 *data,
  71. unsigned int len)
  72. {
  73. return sha512_update(desc, data, len, sha512_transform_ssse3);
  74. }
  75. static int sha512_ssse3_finup(struct shash_desc *desc, const u8 *data,
  76. unsigned int len, u8 *out)
  77. {
  78. return sha512_finup(desc, data, len, out, sha512_transform_ssse3);
  79. }
  80. /* Add padding and return the message digest. */
  81. static int sha512_ssse3_final(struct shash_desc *desc, u8 *out)
  82. {
  83. return sha512_ssse3_finup(desc, NULL, 0, out);
  84. }
  85. static struct shash_alg sha512_ssse3_algs[] = { {
  86. .digestsize = SHA512_DIGEST_SIZE,
  87. .init = sha512_base_init,
  88. .update = sha512_ssse3_update,
  89. .final = sha512_ssse3_final,
  90. .finup = sha512_ssse3_finup,
  91. .descsize = sizeof(struct sha512_state),
  92. .base = {
  93. .cra_name = "sha512",
  94. .cra_driver_name = "sha512-ssse3",
  95. .cra_priority = 150,
  96. .cra_blocksize = SHA512_BLOCK_SIZE,
  97. .cra_module = THIS_MODULE,
  98. }
  99. }, {
  100. .digestsize = SHA384_DIGEST_SIZE,
  101. .init = sha384_base_init,
  102. .update = sha512_ssse3_update,
  103. .final = sha512_ssse3_final,
  104. .finup = sha512_ssse3_finup,
  105. .descsize = sizeof(struct sha512_state),
  106. .base = {
  107. .cra_name = "sha384",
  108. .cra_driver_name = "sha384-ssse3",
  109. .cra_priority = 150,
  110. .cra_blocksize = SHA384_BLOCK_SIZE,
  111. .cra_module = THIS_MODULE,
  112. }
  113. } };
  114. static int register_sha512_ssse3(void)
  115. {
  116. if (boot_cpu_has(X86_FEATURE_SSSE3))
  117. return crypto_register_shashes(sha512_ssse3_algs,
  118. ARRAY_SIZE(sha512_ssse3_algs));
  119. return 0;
  120. }
  121. static void unregister_sha512_ssse3(void)
  122. {
  123. if (boot_cpu_has(X86_FEATURE_SSSE3))
  124. crypto_unregister_shashes(sha512_ssse3_algs,
  125. ARRAY_SIZE(sha512_ssse3_algs));
  126. }
  127. asmlinkage void sha512_transform_avx(struct sha512_state *state,
  128. const u8 *data, int blocks);
  129. static bool avx_usable(void)
  130. {
  131. if (!cpu_has_xfeatures(XFEATURE_MASK_SSE | XFEATURE_MASK_YMM, NULL)) {
  132. if (boot_cpu_has(X86_FEATURE_AVX))
  133. pr_info("AVX detected but unusable.\n");
  134. return false;
  135. }
  136. return true;
  137. }
  138. static int sha512_avx_update(struct shash_desc *desc, const u8 *data,
  139. unsigned int len)
  140. {
  141. return sha512_update(desc, data, len, sha512_transform_avx);
  142. }
  143. static int sha512_avx_finup(struct shash_desc *desc, const u8 *data,
  144. unsigned int len, u8 *out)
  145. {
  146. return sha512_finup(desc, data, len, out, sha512_transform_avx);
  147. }
  148. /* Add padding and return the message digest. */
  149. static int sha512_avx_final(struct shash_desc *desc, u8 *out)
  150. {
  151. return sha512_avx_finup(desc, NULL, 0, out);
  152. }
  153. static struct shash_alg sha512_avx_algs[] = { {
  154. .digestsize = SHA512_DIGEST_SIZE,
  155. .init = sha512_base_init,
  156. .update = sha512_avx_update,
  157. .final = sha512_avx_final,
  158. .finup = sha512_avx_finup,
  159. .descsize = sizeof(struct sha512_state),
  160. .base = {
  161. .cra_name = "sha512",
  162. .cra_driver_name = "sha512-avx",
  163. .cra_priority = 160,
  164. .cra_blocksize = SHA512_BLOCK_SIZE,
  165. .cra_module = THIS_MODULE,
  166. }
  167. }, {
  168. .digestsize = SHA384_DIGEST_SIZE,
  169. .init = sha384_base_init,
  170. .update = sha512_avx_update,
  171. .final = sha512_avx_final,
  172. .finup = sha512_avx_finup,
  173. .descsize = sizeof(struct sha512_state),
  174. .base = {
  175. .cra_name = "sha384",
  176. .cra_driver_name = "sha384-avx",
  177. .cra_priority = 160,
  178. .cra_blocksize = SHA384_BLOCK_SIZE,
  179. .cra_module = THIS_MODULE,
  180. }
  181. } };
  182. static int register_sha512_avx(void)
  183. {
  184. if (avx_usable())
  185. return crypto_register_shashes(sha512_avx_algs,
  186. ARRAY_SIZE(sha512_avx_algs));
  187. return 0;
  188. }
  189. static void unregister_sha512_avx(void)
  190. {
  191. if (avx_usable())
  192. crypto_unregister_shashes(sha512_avx_algs,
  193. ARRAY_SIZE(sha512_avx_algs));
  194. }
  195. asmlinkage void sha512_transform_rorx(struct sha512_state *state,
  196. const u8 *data, int blocks);
  197. static int sha512_avx2_update(struct shash_desc *desc, const u8 *data,
  198. unsigned int len)
  199. {
  200. return sha512_update(desc, data, len, sha512_transform_rorx);
  201. }
  202. static int sha512_avx2_finup(struct shash_desc *desc, const u8 *data,
  203. unsigned int len, u8 *out)
  204. {
  205. return sha512_finup(desc, data, len, out, sha512_transform_rorx);
  206. }
  207. /* Add padding and return the message digest. */
  208. static int sha512_avx2_final(struct shash_desc *desc, u8 *out)
  209. {
  210. return sha512_avx2_finup(desc, NULL, 0, out);
  211. }
  212. static struct shash_alg sha512_avx2_algs[] = { {
  213. .digestsize = SHA512_DIGEST_SIZE,
  214. .init = sha512_base_init,
  215. .update = sha512_avx2_update,
  216. .final = sha512_avx2_final,
  217. .finup = sha512_avx2_finup,
  218. .descsize = sizeof(struct sha512_state),
  219. .base = {
  220. .cra_name = "sha512",
  221. .cra_driver_name = "sha512-avx2",
  222. .cra_priority = 170,
  223. .cra_blocksize = SHA512_BLOCK_SIZE,
  224. .cra_module = THIS_MODULE,
  225. }
  226. }, {
  227. .digestsize = SHA384_DIGEST_SIZE,
  228. .init = sha384_base_init,
  229. .update = sha512_avx2_update,
  230. .final = sha512_avx2_final,
  231. .finup = sha512_avx2_finup,
  232. .descsize = sizeof(struct sha512_state),
  233. .base = {
  234. .cra_name = "sha384",
  235. .cra_driver_name = "sha384-avx2",
  236. .cra_priority = 170,
  237. .cra_blocksize = SHA384_BLOCK_SIZE,
  238. .cra_module = THIS_MODULE,
  239. }
  240. } };
  241. static bool avx2_usable(void)
  242. {
  243. if (avx_usable() && boot_cpu_has(X86_FEATURE_AVX2) &&
  244. boot_cpu_has(X86_FEATURE_BMI2))
  245. return true;
  246. return false;
  247. }
  248. static int register_sha512_avx2(void)
  249. {
  250. if (avx2_usable())
  251. return crypto_register_shashes(sha512_avx2_algs,
  252. ARRAY_SIZE(sha512_avx2_algs));
  253. return 0;
  254. }
  255. static const struct x86_cpu_id module_cpu_ids[] = {
  256. X86_MATCH_FEATURE(X86_FEATURE_AVX2, NULL),
  257. X86_MATCH_FEATURE(X86_FEATURE_AVX, NULL),
  258. X86_MATCH_FEATURE(X86_FEATURE_SSSE3, NULL),
  259. {}
  260. };
  261. MODULE_DEVICE_TABLE(x86cpu, module_cpu_ids);
  262. static void unregister_sha512_avx2(void)
  263. {
  264. if (avx2_usable())
  265. crypto_unregister_shashes(sha512_avx2_algs,
  266. ARRAY_SIZE(sha512_avx2_algs));
  267. }
  268. static int __init sha512_ssse3_mod_init(void)
  269. {
  270. if (!x86_match_cpu(module_cpu_ids))
  271. return -ENODEV;
  272. if (register_sha512_ssse3())
  273. goto fail;
  274. if (register_sha512_avx()) {
  275. unregister_sha512_ssse3();
  276. goto fail;
  277. }
  278. if (register_sha512_avx2()) {
  279. unregister_sha512_avx();
  280. unregister_sha512_ssse3();
  281. goto fail;
  282. }
  283. return 0;
  284. fail:
  285. return -ENODEV;
  286. }
  287. static void __exit sha512_ssse3_mod_fini(void)
  288. {
  289. unregister_sha512_avx2();
  290. unregister_sha512_avx();
  291. unregister_sha512_ssse3();
  292. }
  293. module_init(sha512_ssse3_mod_init);
  294. module_exit(sha512_ssse3_mod_fini);
  295. MODULE_LICENSE("GPL");
  296. MODULE_DESCRIPTION("SHA512 Secure Hash Algorithm, Supplemental SSE3 accelerated");
  297. MODULE_ALIAS_CRYPTO("sha512");
  298. MODULE_ALIAS_CRYPTO("sha512-ssse3");
  299. MODULE_ALIAS_CRYPTO("sha512-avx");
  300. MODULE_ALIAS_CRYPTO("sha512-avx2");
  301. MODULE_ALIAS_CRYPTO("sha384");
  302. MODULE_ALIAS_CRYPTO("sha384-ssse3");
  303. MODULE_ALIAS_CRYPTO("sha384-avx");
  304. MODULE_ALIAS_CRYPTO("sha384-avx2");