162306a36Sopenharmony_ci/* 262306a36Sopenharmony_ci * Cryptographic API. 362306a36Sopenharmony_ci * 462306a36Sopenharmony_ci * Glue code for the SHA512 Secure Hash Algorithm assembler 562306a36Sopenharmony_ci * implementation using supplemental SSE3 / AVX / AVX2 instructions. 662306a36Sopenharmony_ci * 762306a36Sopenharmony_ci * This file is based on sha512_generic.c 862306a36Sopenharmony_ci * 962306a36Sopenharmony_ci * Copyright (C) 2013 Intel Corporation 1062306a36Sopenharmony_ci * Author: Tim Chen <tim.c.chen@linux.intel.com> 1162306a36Sopenharmony_ci * 1262306a36Sopenharmony_ci * This program is free software; you can redistribute it and/or modify it 1362306a36Sopenharmony_ci * under the terms of the GNU General Public License as published by the Free 1462306a36Sopenharmony_ci * Software Foundation; either version 2 of the License, or (at your option) 1562306a36Sopenharmony_ci * any later version. 1662306a36Sopenharmony_ci * 1762306a36Sopenharmony_ci * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, 1862306a36Sopenharmony_ci * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF 1962306a36Sopenharmony_ci * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND 2062306a36Sopenharmony_ci * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS 2162306a36Sopenharmony_ci * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN 2262306a36Sopenharmony_ci * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN 2362306a36Sopenharmony_ci * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE 2462306a36Sopenharmony_ci * SOFTWARE. 2562306a36Sopenharmony_ci * 2662306a36Sopenharmony_ci */ 2762306a36Sopenharmony_ci 2862306a36Sopenharmony_ci#define pr_fmt(fmt) KBUILD_MODNAME ": " fmt 2962306a36Sopenharmony_ci 3062306a36Sopenharmony_ci#include <crypto/internal/hash.h> 3162306a36Sopenharmony_ci#include <crypto/internal/simd.h> 3262306a36Sopenharmony_ci#include <linux/init.h> 3362306a36Sopenharmony_ci#include <linux/module.h> 3462306a36Sopenharmony_ci#include <linux/mm.h> 3562306a36Sopenharmony_ci#include <linux/string.h> 3662306a36Sopenharmony_ci#include <linux/types.h> 3762306a36Sopenharmony_ci#include <crypto/sha2.h> 3862306a36Sopenharmony_ci#include <crypto/sha512_base.h> 3962306a36Sopenharmony_ci#include <asm/cpu_device_id.h> 4062306a36Sopenharmony_ci#include <asm/simd.h> 4162306a36Sopenharmony_ci 4262306a36Sopenharmony_ciasmlinkage void sha512_transform_ssse3(struct sha512_state *state, 4362306a36Sopenharmony_ci const u8 *data, int blocks); 4462306a36Sopenharmony_ci 4562306a36Sopenharmony_cistatic int sha512_update(struct shash_desc *desc, const u8 *data, 4662306a36Sopenharmony_ci unsigned int len, sha512_block_fn *sha512_xform) 4762306a36Sopenharmony_ci{ 4862306a36Sopenharmony_ci struct sha512_state *sctx = shash_desc_ctx(desc); 4962306a36Sopenharmony_ci 5062306a36Sopenharmony_ci if (!crypto_simd_usable() || 5162306a36Sopenharmony_ci (sctx->count[0] % SHA512_BLOCK_SIZE) + len < SHA512_BLOCK_SIZE) 5262306a36Sopenharmony_ci return crypto_sha512_update(desc, data, len); 5362306a36Sopenharmony_ci 5462306a36Sopenharmony_ci /* 5562306a36Sopenharmony_ci * Make sure struct sha512_state begins directly with the SHA512 5662306a36Sopenharmony_ci * 512-bit internal state, as this is what the asm functions expect. 5762306a36Sopenharmony_ci */ 5862306a36Sopenharmony_ci BUILD_BUG_ON(offsetof(struct sha512_state, state) != 0); 5962306a36Sopenharmony_ci 6062306a36Sopenharmony_ci kernel_fpu_begin(); 6162306a36Sopenharmony_ci sha512_base_do_update(desc, data, len, sha512_xform); 6262306a36Sopenharmony_ci kernel_fpu_end(); 6362306a36Sopenharmony_ci 6462306a36Sopenharmony_ci return 0; 6562306a36Sopenharmony_ci} 6662306a36Sopenharmony_ci 6762306a36Sopenharmony_cistatic int sha512_finup(struct shash_desc *desc, const u8 *data, 6862306a36Sopenharmony_ci unsigned int len, u8 *out, sha512_block_fn *sha512_xform) 6962306a36Sopenharmony_ci{ 7062306a36Sopenharmony_ci if (!crypto_simd_usable()) 7162306a36Sopenharmony_ci return crypto_sha512_finup(desc, data, len, out); 7262306a36Sopenharmony_ci 7362306a36Sopenharmony_ci kernel_fpu_begin(); 7462306a36Sopenharmony_ci if (len) 7562306a36Sopenharmony_ci sha512_base_do_update(desc, data, len, sha512_xform); 7662306a36Sopenharmony_ci sha512_base_do_finalize(desc, sha512_xform); 7762306a36Sopenharmony_ci kernel_fpu_end(); 7862306a36Sopenharmony_ci 7962306a36Sopenharmony_ci return sha512_base_finish(desc, out); 8062306a36Sopenharmony_ci} 8162306a36Sopenharmony_ci 8262306a36Sopenharmony_cistatic int sha512_ssse3_update(struct shash_desc *desc, const u8 *data, 8362306a36Sopenharmony_ci unsigned int len) 8462306a36Sopenharmony_ci{ 8562306a36Sopenharmony_ci return sha512_update(desc, data, len, sha512_transform_ssse3); 8662306a36Sopenharmony_ci} 8762306a36Sopenharmony_ci 8862306a36Sopenharmony_cistatic int sha512_ssse3_finup(struct shash_desc *desc, const u8 *data, 8962306a36Sopenharmony_ci unsigned int len, u8 *out) 9062306a36Sopenharmony_ci{ 9162306a36Sopenharmony_ci return sha512_finup(desc, data, len, out, sha512_transform_ssse3); 9262306a36Sopenharmony_ci} 9362306a36Sopenharmony_ci 9462306a36Sopenharmony_ci/* Add padding and return the message digest. */ 9562306a36Sopenharmony_cistatic int sha512_ssse3_final(struct shash_desc *desc, u8 *out) 9662306a36Sopenharmony_ci{ 9762306a36Sopenharmony_ci return sha512_ssse3_finup(desc, NULL, 0, out); 9862306a36Sopenharmony_ci} 9962306a36Sopenharmony_ci 10062306a36Sopenharmony_cistatic struct shash_alg sha512_ssse3_algs[] = { { 10162306a36Sopenharmony_ci .digestsize = SHA512_DIGEST_SIZE, 10262306a36Sopenharmony_ci .init = sha512_base_init, 10362306a36Sopenharmony_ci .update = sha512_ssse3_update, 10462306a36Sopenharmony_ci .final = sha512_ssse3_final, 10562306a36Sopenharmony_ci .finup = sha512_ssse3_finup, 10662306a36Sopenharmony_ci .descsize = sizeof(struct sha512_state), 10762306a36Sopenharmony_ci .base = { 10862306a36Sopenharmony_ci .cra_name = "sha512", 10962306a36Sopenharmony_ci .cra_driver_name = "sha512-ssse3", 11062306a36Sopenharmony_ci .cra_priority = 150, 11162306a36Sopenharmony_ci .cra_blocksize = SHA512_BLOCK_SIZE, 11262306a36Sopenharmony_ci .cra_module = THIS_MODULE, 11362306a36Sopenharmony_ci } 11462306a36Sopenharmony_ci}, { 11562306a36Sopenharmony_ci .digestsize = SHA384_DIGEST_SIZE, 11662306a36Sopenharmony_ci .init = sha384_base_init, 11762306a36Sopenharmony_ci .update = sha512_ssse3_update, 11862306a36Sopenharmony_ci .final = sha512_ssse3_final, 11962306a36Sopenharmony_ci .finup = sha512_ssse3_finup, 12062306a36Sopenharmony_ci .descsize = sizeof(struct sha512_state), 12162306a36Sopenharmony_ci .base = { 12262306a36Sopenharmony_ci .cra_name = "sha384", 12362306a36Sopenharmony_ci .cra_driver_name = "sha384-ssse3", 12462306a36Sopenharmony_ci .cra_priority = 150, 12562306a36Sopenharmony_ci .cra_blocksize = SHA384_BLOCK_SIZE, 12662306a36Sopenharmony_ci .cra_module = THIS_MODULE, 12762306a36Sopenharmony_ci } 12862306a36Sopenharmony_ci} }; 12962306a36Sopenharmony_ci 13062306a36Sopenharmony_cistatic int register_sha512_ssse3(void) 13162306a36Sopenharmony_ci{ 13262306a36Sopenharmony_ci if (boot_cpu_has(X86_FEATURE_SSSE3)) 13362306a36Sopenharmony_ci return crypto_register_shashes(sha512_ssse3_algs, 13462306a36Sopenharmony_ci ARRAY_SIZE(sha512_ssse3_algs)); 13562306a36Sopenharmony_ci return 0; 13662306a36Sopenharmony_ci} 13762306a36Sopenharmony_ci 13862306a36Sopenharmony_cistatic void unregister_sha512_ssse3(void) 13962306a36Sopenharmony_ci{ 14062306a36Sopenharmony_ci if (boot_cpu_has(X86_FEATURE_SSSE3)) 14162306a36Sopenharmony_ci crypto_unregister_shashes(sha512_ssse3_algs, 14262306a36Sopenharmony_ci ARRAY_SIZE(sha512_ssse3_algs)); 14362306a36Sopenharmony_ci} 14462306a36Sopenharmony_ci 14562306a36Sopenharmony_ciasmlinkage void sha512_transform_avx(struct sha512_state *state, 14662306a36Sopenharmony_ci const u8 *data, int blocks); 14762306a36Sopenharmony_cistatic bool avx_usable(void) 14862306a36Sopenharmony_ci{ 14962306a36Sopenharmony_ci if (!cpu_has_xfeatures(XFEATURE_MASK_SSE | XFEATURE_MASK_YMM, NULL)) { 15062306a36Sopenharmony_ci if (boot_cpu_has(X86_FEATURE_AVX)) 15162306a36Sopenharmony_ci pr_info("AVX detected but unusable.\n"); 15262306a36Sopenharmony_ci return false; 15362306a36Sopenharmony_ci } 15462306a36Sopenharmony_ci 15562306a36Sopenharmony_ci return true; 15662306a36Sopenharmony_ci} 15762306a36Sopenharmony_ci 15862306a36Sopenharmony_cistatic int sha512_avx_update(struct shash_desc *desc, const u8 *data, 15962306a36Sopenharmony_ci unsigned int len) 16062306a36Sopenharmony_ci{ 16162306a36Sopenharmony_ci return sha512_update(desc, data, len, sha512_transform_avx); 16262306a36Sopenharmony_ci} 16362306a36Sopenharmony_ci 16462306a36Sopenharmony_cistatic int sha512_avx_finup(struct shash_desc *desc, const u8 *data, 16562306a36Sopenharmony_ci unsigned int len, u8 *out) 16662306a36Sopenharmony_ci{ 16762306a36Sopenharmony_ci return sha512_finup(desc, data, len, out, sha512_transform_avx); 16862306a36Sopenharmony_ci} 16962306a36Sopenharmony_ci 17062306a36Sopenharmony_ci/* Add padding and return the message digest. */ 17162306a36Sopenharmony_cistatic int sha512_avx_final(struct shash_desc *desc, u8 *out) 17262306a36Sopenharmony_ci{ 17362306a36Sopenharmony_ci return sha512_avx_finup(desc, NULL, 0, out); 17462306a36Sopenharmony_ci} 17562306a36Sopenharmony_ci 17662306a36Sopenharmony_cistatic struct shash_alg sha512_avx_algs[] = { { 17762306a36Sopenharmony_ci .digestsize = SHA512_DIGEST_SIZE, 17862306a36Sopenharmony_ci .init = sha512_base_init, 17962306a36Sopenharmony_ci .update = sha512_avx_update, 18062306a36Sopenharmony_ci .final = sha512_avx_final, 18162306a36Sopenharmony_ci .finup = sha512_avx_finup, 18262306a36Sopenharmony_ci .descsize = sizeof(struct sha512_state), 18362306a36Sopenharmony_ci .base = { 18462306a36Sopenharmony_ci .cra_name = "sha512", 18562306a36Sopenharmony_ci .cra_driver_name = "sha512-avx", 18662306a36Sopenharmony_ci .cra_priority = 160, 18762306a36Sopenharmony_ci .cra_blocksize = SHA512_BLOCK_SIZE, 18862306a36Sopenharmony_ci .cra_module = THIS_MODULE, 18962306a36Sopenharmony_ci } 19062306a36Sopenharmony_ci}, { 19162306a36Sopenharmony_ci .digestsize = SHA384_DIGEST_SIZE, 19262306a36Sopenharmony_ci .init = sha384_base_init, 19362306a36Sopenharmony_ci .update = sha512_avx_update, 19462306a36Sopenharmony_ci .final = sha512_avx_final, 19562306a36Sopenharmony_ci .finup = sha512_avx_finup, 19662306a36Sopenharmony_ci .descsize = sizeof(struct sha512_state), 19762306a36Sopenharmony_ci .base = { 19862306a36Sopenharmony_ci .cra_name = "sha384", 19962306a36Sopenharmony_ci .cra_driver_name = "sha384-avx", 20062306a36Sopenharmony_ci .cra_priority = 160, 20162306a36Sopenharmony_ci .cra_blocksize = SHA384_BLOCK_SIZE, 20262306a36Sopenharmony_ci .cra_module = THIS_MODULE, 20362306a36Sopenharmony_ci } 20462306a36Sopenharmony_ci} }; 20562306a36Sopenharmony_ci 20662306a36Sopenharmony_cistatic int register_sha512_avx(void) 20762306a36Sopenharmony_ci{ 20862306a36Sopenharmony_ci if (avx_usable()) 20962306a36Sopenharmony_ci return crypto_register_shashes(sha512_avx_algs, 21062306a36Sopenharmony_ci ARRAY_SIZE(sha512_avx_algs)); 21162306a36Sopenharmony_ci return 0; 21262306a36Sopenharmony_ci} 21362306a36Sopenharmony_ci 21462306a36Sopenharmony_cistatic void unregister_sha512_avx(void) 21562306a36Sopenharmony_ci{ 21662306a36Sopenharmony_ci if (avx_usable()) 21762306a36Sopenharmony_ci crypto_unregister_shashes(sha512_avx_algs, 21862306a36Sopenharmony_ci ARRAY_SIZE(sha512_avx_algs)); 21962306a36Sopenharmony_ci} 22062306a36Sopenharmony_ci 22162306a36Sopenharmony_ciasmlinkage void sha512_transform_rorx(struct sha512_state *state, 22262306a36Sopenharmony_ci const u8 *data, int blocks); 22362306a36Sopenharmony_ci 22462306a36Sopenharmony_cistatic int sha512_avx2_update(struct shash_desc *desc, const u8 *data, 22562306a36Sopenharmony_ci unsigned int len) 22662306a36Sopenharmony_ci{ 22762306a36Sopenharmony_ci return sha512_update(desc, data, len, sha512_transform_rorx); 22862306a36Sopenharmony_ci} 22962306a36Sopenharmony_ci 23062306a36Sopenharmony_cistatic int sha512_avx2_finup(struct shash_desc *desc, const u8 *data, 23162306a36Sopenharmony_ci unsigned int len, u8 *out) 23262306a36Sopenharmony_ci{ 23362306a36Sopenharmony_ci return sha512_finup(desc, data, len, out, sha512_transform_rorx); 23462306a36Sopenharmony_ci} 23562306a36Sopenharmony_ci 23662306a36Sopenharmony_ci/* Add padding and return the message digest. */ 23762306a36Sopenharmony_cistatic int sha512_avx2_final(struct shash_desc *desc, u8 *out) 23862306a36Sopenharmony_ci{ 23962306a36Sopenharmony_ci return sha512_avx2_finup(desc, NULL, 0, out); 24062306a36Sopenharmony_ci} 24162306a36Sopenharmony_ci 24262306a36Sopenharmony_cistatic struct shash_alg sha512_avx2_algs[] = { { 24362306a36Sopenharmony_ci .digestsize = SHA512_DIGEST_SIZE, 24462306a36Sopenharmony_ci .init = sha512_base_init, 24562306a36Sopenharmony_ci .update = sha512_avx2_update, 24662306a36Sopenharmony_ci .final = sha512_avx2_final, 24762306a36Sopenharmony_ci .finup = sha512_avx2_finup, 24862306a36Sopenharmony_ci .descsize = sizeof(struct sha512_state), 24962306a36Sopenharmony_ci .base = { 25062306a36Sopenharmony_ci .cra_name = "sha512", 25162306a36Sopenharmony_ci .cra_driver_name = "sha512-avx2", 25262306a36Sopenharmony_ci .cra_priority = 170, 25362306a36Sopenharmony_ci .cra_blocksize = SHA512_BLOCK_SIZE, 25462306a36Sopenharmony_ci .cra_module = THIS_MODULE, 25562306a36Sopenharmony_ci } 25662306a36Sopenharmony_ci}, { 25762306a36Sopenharmony_ci .digestsize = SHA384_DIGEST_SIZE, 25862306a36Sopenharmony_ci .init = sha384_base_init, 25962306a36Sopenharmony_ci .update = sha512_avx2_update, 26062306a36Sopenharmony_ci .final = sha512_avx2_final, 26162306a36Sopenharmony_ci .finup = sha512_avx2_finup, 26262306a36Sopenharmony_ci .descsize = sizeof(struct sha512_state), 26362306a36Sopenharmony_ci .base = { 26462306a36Sopenharmony_ci .cra_name = "sha384", 26562306a36Sopenharmony_ci .cra_driver_name = "sha384-avx2", 26662306a36Sopenharmony_ci .cra_priority = 170, 26762306a36Sopenharmony_ci .cra_blocksize = SHA384_BLOCK_SIZE, 26862306a36Sopenharmony_ci .cra_module = THIS_MODULE, 26962306a36Sopenharmony_ci } 27062306a36Sopenharmony_ci} }; 27162306a36Sopenharmony_ci 27262306a36Sopenharmony_cistatic bool avx2_usable(void) 27362306a36Sopenharmony_ci{ 27462306a36Sopenharmony_ci if (avx_usable() && boot_cpu_has(X86_FEATURE_AVX2) && 27562306a36Sopenharmony_ci boot_cpu_has(X86_FEATURE_BMI2)) 27662306a36Sopenharmony_ci return true; 27762306a36Sopenharmony_ci 27862306a36Sopenharmony_ci return false; 27962306a36Sopenharmony_ci} 28062306a36Sopenharmony_ci 28162306a36Sopenharmony_cistatic int register_sha512_avx2(void) 28262306a36Sopenharmony_ci{ 28362306a36Sopenharmony_ci if (avx2_usable()) 28462306a36Sopenharmony_ci return crypto_register_shashes(sha512_avx2_algs, 28562306a36Sopenharmony_ci ARRAY_SIZE(sha512_avx2_algs)); 28662306a36Sopenharmony_ci return 0; 28762306a36Sopenharmony_ci} 28862306a36Sopenharmony_cistatic const struct x86_cpu_id module_cpu_ids[] = { 28962306a36Sopenharmony_ci X86_MATCH_FEATURE(X86_FEATURE_AVX2, NULL), 29062306a36Sopenharmony_ci X86_MATCH_FEATURE(X86_FEATURE_AVX, NULL), 29162306a36Sopenharmony_ci X86_MATCH_FEATURE(X86_FEATURE_SSSE3, NULL), 29262306a36Sopenharmony_ci {} 29362306a36Sopenharmony_ci}; 29462306a36Sopenharmony_ciMODULE_DEVICE_TABLE(x86cpu, module_cpu_ids); 29562306a36Sopenharmony_ci 29662306a36Sopenharmony_cistatic void unregister_sha512_avx2(void) 29762306a36Sopenharmony_ci{ 29862306a36Sopenharmony_ci if (avx2_usable()) 29962306a36Sopenharmony_ci crypto_unregister_shashes(sha512_avx2_algs, 30062306a36Sopenharmony_ci ARRAY_SIZE(sha512_avx2_algs)); 30162306a36Sopenharmony_ci} 30262306a36Sopenharmony_ci 30362306a36Sopenharmony_cistatic int __init sha512_ssse3_mod_init(void) 30462306a36Sopenharmony_ci{ 30562306a36Sopenharmony_ci if (!x86_match_cpu(module_cpu_ids)) 30662306a36Sopenharmony_ci return -ENODEV; 30762306a36Sopenharmony_ci 30862306a36Sopenharmony_ci if (register_sha512_ssse3()) 30962306a36Sopenharmony_ci goto fail; 31062306a36Sopenharmony_ci 31162306a36Sopenharmony_ci if (register_sha512_avx()) { 31262306a36Sopenharmony_ci unregister_sha512_ssse3(); 31362306a36Sopenharmony_ci goto fail; 31462306a36Sopenharmony_ci } 31562306a36Sopenharmony_ci 31662306a36Sopenharmony_ci if (register_sha512_avx2()) { 31762306a36Sopenharmony_ci unregister_sha512_avx(); 31862306a36Sopenharmony_ci unregister_sha512_ssse3(); 31962306a36Sopenharmony_ci goto fail; 32062306a36Sopenharmony_ci } 32162306a36Sopenharmony_ci 32262306a36Sopenharmony_ci return 0; 32362306a36Sopenharmony_cifail: 32462306a36Sopenharmony_ci return -ENODEV; 32562306a36Sopenharmony_ci} 32662306a36Sopenharmony_ci 32762306a36Sopenharmony_cistatic void __exit sha512_ssse3_mod_fini(void) 32862306a36Sopenharmony_ci{ 32962306a36Sopenharmony_ci unregister_sha512_avx2(); 33062306a36Sopenharmony_ci unregister_sha512_avx(); 33162306a36Sopenharmony_ci unregister_sha512_ssse3(); 33262306a36Sopenharmony_ci} 33362306a36Sopenharmony_ci 33462306a36Sopenharmony_cimodule_init(sha512_ssse3_mod_init); 33562306a36Sopenharmony_cimodule_exit(sha512_ssse3_mod_fini); 33662306a36Sopenharmony_ci 33762306a36Sopenharmony_ciMODULE_LICENSE("GPL"); 33862306a36Sopenharmony_ciMODULE_DESCRIPTION("SHA512 Secure Hash Algorithm, Supplemental SSE3 accelerated"); 33962306a36Sopenharmony_ci 34062306a36Sopenharmony_ciMODULE_ALIAS_CRYPTO("sha512"); 34162306a36Sopenharmony_ciMODULE_ALIAS_CRYPTO("sha512-ssse3"); 34262306a36Sopenharmony_ciMODULE_ALIAS_CRYPTO("sha512-avx"); 34362306a36Sopenharmony_ciMODULE_ALIAS_CRYPTO("sha512-avx2"); 34462306a36Sopenharmony_ciMODULE_ALIAS_CRYPTO("sha384"); 34562306a36Sopenharmony_ciMODULE_ALIAS_CRYPTO("sha384-ssse3"); 34662306a36Sopenharmony_ciMODULE_ALIAS_CRYPTO("sha384-avx"); 34762306a36Sopenharmony_ciMODULE_ALIAS_CRYPTO("sha384-avx2"); 348