162306a36Sopenharmony_ci// SPDX-License-Identifier: GPL-2.0-or-later 262306a36Sopenharmony_ci/* 362306a36Sopenharmony_ci * Glue code for SHA-256 implementation for SPE instructions (PPC) 462306a36Sopenharmony_ci * 562306a36Sopenharmony_ci * Based on generic implementation. The assembler module takes care 662306a36Sopenharmony_ci * about the SPE registers so it can run from interrupt context. 762306a36Sopenharmony_ci * 862306a36Sopenharmony_ci * Copyright (c) 2015 Markus Stockhausen <stockhausen@collogia.de> 962306a36Sopenharmony_ci */ 1062306a36Sopenharmony_ci 1162306a36Sopenharmony_ci#include <crypto/internal/hash.h> 1262306a36Sopenharmony_ci#include <linux/init.h> 1362306a36Sopenharmony_ci#include <linux/module.h> 1462306a36Sopenharmony_ci#include <linux/mm.h> 1562306a36Sopenharmony_ci#include <linux/types.h> 1662306a36Sopenharmony_ci#include <crypto/sha2.h> 1762306a36Sopenharmony_ci#include <crypto/sha256_base.h> 1862306a36Sopenharmony_ci#include <asm/byteorder.h> 1962306a36Sopenharmony_ci#include <asm/switch_to.h> 2062306a36Sopenharmony_ci#include <linux/hardirq.h> 2162306a36Sopenharmony_ci 2262306a36Sopenharmony_ci/* 2362306a36Sopenharmony_ci * MAX_BYTES defines the number of bytes that are allowed to be processed 2462306a36Sopenharmony_ci * between preempt_disable() and preempt_enable(). SHA256 takes ~2,000 2562306a36Sopenharmony_ci * operations per 64 bytes. e500 cores can issue two arithmetic instructions 2662306a36Sopenharmony_ci * per clock cycle using one 32/64 bit unit (SU1) and one 32 bit unit (SU2). 2762306a36Sopenharmony_ci * Thus 1KB of input data will need an estimated maximum of 18,000 cycles. 2862306a36Sopenharmony_ci * Headroom for cache misses included. Even with the low end model clocked 2962306a36Sopenharmony_ci * at 667 MHz this equals to a critical time window of less than 27us. 3062306a36Sopenharmony_ci * 3162306a36Sopenharmony_ci */ 3262306a36Sopenharmony_ci#define MAX_BYTES 1024 3362306a36Sopenharmony_ci 3462306a36Sopenharmony_ciextern void ppc_spe_sha256_transform(u32 *state, const u8 *src, u32 blocks); 3562306a36Sopenharmony_ci 3662306a36Sopenharmony_cistatic void spe_begin(void) 3762306a36Sopenharmony_ci{ 3862306a36Sopenharmony_ci /* We just start SPE operations and will save SPE registers later. */ 3962306a36Sopenharmony_ci preempt_disable(); 4062306a36Sopenharmony_ci enable_kernel_spe(); 4162306a36Sopenharmony_ci} 4262306a36Sopenharmony_ci 4362306a36Sopenharmony_cistatic void spe_end(void) 4462306a36Sopenharmony_ci{ 4562306a36Sopenharmony_ci disable_kernel_spe(); 4662306a36Sopenharmony_ci /* reenable preemption */ 4762306a36Sopenharmony_ci preempt_enable(); 4862306a36Sopenharmony_ci} 4962306a36Sopenharmony_ci 5062306a36Sopenharmony_cistatic inline void ppc_sha256_clear_context(struct sha256_state *sctx) 5162306a36Sopenharmony_ci{ 5262306a36Sopenharmony_ci int count = sizeof(struct sha256_state) >> 2; 5362306a36Sopenharmony_ci u32 *ptr = (u32 *)sctx; 5462306a36Sopenharmony_ci 5562306a36Sopenharmony_ci /* make sure we can clear the fast way */ 5662306a36Sopenharmony_ci BUILD_BUG_ON(sizeof(struct sha256_state) % 4); 5762306a36Sopenharmony_ci do { *ptr++ = 0; } while (--count); 5862306a36Sopenharmony_ci} 5962306a36Sopenharmony_ci 6062306a36Sopenharmony_cistatic int ppc_spe_sha256_update(struct shash_desc *desc, const u8 *data, 6162306a36Sopenharmony_ci unsigned int len) 6262306a36Sopenharmony_ci{ 6362306a36Sopenharmony_ci struct sha256_state *sctx = shash_desc_ctx(desc); 6462306a36Sopenharmony_ci const unsigned int offset = sctx->count & 0x3f; 6562306a36Sopenharmony_ci const unsigned int avail = 64 - offset; 6662306a36Sopenharmony_ci unsigned int bytes; 6762306a36Sopenharmony_ci const u8 *src = data; 6862306a36Sopenharmony_ci 6962306a36Sopenharmony_ci if (avail > len) { 7062306a36Sopenharmony_ci sctx->count += len; 7162306a36Sopenharmony_ci memcpy((char *)sctx->buf + offset, src, len); 7262306a36Sopenharmony_ci return 0; 7362306a36Sopenharmony_ci } 7462306a36Sopenharmony_ci 7562306a36Sopenharmony_ci sctx->count += len; 7662306a36Sopenharmony_ci 7762306a36Sopenharmony_ci if (offset) { 7862306a36Sopenharmony_ci memcpy((char *)sctx->buf + offset, src, avail); 7962306a36Sopenharmony_ci 8062306a36Sopenharmony_ci spe_begin(); 8162306a36Sopenharmony_ci ppc_spe_sha256_transform(sctx->state, (const u8 *)sctx->buf, 1); 8262306a36Sopenharmony_ci spe_end(); 8362306a36Sopenharmony_ci 8462306a36Sopenharmony_ci len -= avail; 8562306a36Sopenharmony_ci src += avail; 8662306a36Sopenharmony_ci } 8762306a36Sopenharmony_ci 8862306a36Sopenharmony_ci while (len > 63) { 8962306a36Sopenharmony_ci /* cut input data into smaller blocks */ 9062306a36Sopenharmony_ci bytes = (len > MAX_BYTES) ? MAX_BYTES : len; 9162306a36Sopenharmony_ci bytes = bytes & ~0x3f; 9262306a36Sopenharmony_ci 9362306a36Sopenharmony_ci spe_begin(); 9462306a36Sopenharmony_ci ppc_spe_sha256_transform(sctx->state, src, bytes >> 6); 9562306a36Sopenharmony_ci spe_end(); 9662306a36Sopenharmony_ci 9762306a36Sopenharmony_ci src += bytes; 9862306a36Sopenharmony_ci len -= bytes; 9962306a36Sopenharmony_ci } 10062306a36Sopenharmony_ci 10162306a36Sopenharmony_ci memcpy((char *)sctx->buf, src, len); 10262306a36Sopenharmony_ci return 0; 10362306a36Sopenharmony_ci} 10462306a36Sopenharmony_ci 10562306a36Sopenharmony_cistatic int ppc_spe_sha256_final(struct shash_desc *desc, u8 *out) 10662306a36Sopenharmony_ci{ 10762306a36Sopenharmony_ci struct sha256_state *sctx = shash_desc_ctx(desc); 10862306a36Sopenharmony_ci const unsigned int offset = sctx->count & 0x3f; 10962306a36Sopenharmony_ci char *p = (char *)sctx->buf + offset; 11062306a36Sopenharmony_ci int padlen; 11162306a36Sopenharmony_ci __be64 *pbits = (__be64 *)(((char *)&sctx->buf) + 56); 11262306a36Sopenharmony_ci __be32 *dst = (__be32 *)out; 11362306a36Sopenharmony_ci 11462306a36Sopenharmony_ci padlen = 55 - offset; 11562306a36Sopenharmony_ci *p++ = 0x80; 11662306a36Sopenharmony_ci 11762306a36Sopenharmony_ci spe_begin(); 11862306a36Sopenharmony_ci 11962306a36Sopenharmony_ci if (padlen < 0) { 12062306a36Sopenharmony_ci memset(p, 0x00, padlen + sizeof (u64)); 12162306a36Sopenharmony_ci ppc_spe_sha256_transform(sctx->state, sctx->buf, 1); 12262306a36Sopenharmony_ci p = (char *)sctx->buf; 12362306a36Sopenharmony_ci padlen = 56; 12462306a36Sopenharmony_ci } 12562306a36Sopenharmony_ci 12662306a36Sopenharmony_ci memset(p, 0, padlen); 12762306a36Sopenharmony_ci *pbits = cpu_to_be64(sctx->count << 3); 12862306a36Sopenharmony_ci ppc_spe_sha256_transform(sctx->state, sctx->buf, 1); 12962306a36Sopenharmony_ci 13062306a36Sopenharmony_ci spe_end(); 13162306a36Sopenharmony_ci 13262306a36Sopenharmony_ci dst[0] = cpu_to_be32(sctx->state[0]); 13362306a36Sopenharmony_ci dst[1] = cpu_to_be32(sctx->state[1]); 13462306a36Sopenharmony_ci dst[2] = cpu_to_be32(sctx->state[2]); 13562306a36Sopenharmony_ci dst[3] = cpu_to_be32(sctx->state[3]); 13662306a36Sopenharmony_ci dst[4] = cpu_to_be32(sctx->state[4]); 13762306a36Sopenharmony_ci dst[5] = cpu_to_be32(sctx->state[5]); 13862306a36Sopenharmony_ci dst[6] = cpu_to_be32(sctx->state[6]); 13962306a36Sopenharmony_ci dst[7] = cpu_to_be32(sctx->state[7]); 14062306a36Sopenharmony_ci 14162306a36Sopenharmony_ci ppc_sha256_clear_context(sctx); 14262306a36Sopenharmony_ci return 0; 14362306a36Sopenharmony_ci} 14462306a36Sopenharmony_ci 14562306a36Sopenharmony_cistatic int ppc_spe_sha224_final(struct shash_desc *desc, u8 *out) 14662306a36Sopenharmony_ci{ 14762306a36Sopenharmony_ci __be32 D[SHA256_DIGEST_SIZE >> 2]; 14862306a36Sopenharmony_ci __be32 *dst = (__be32 *)out; 14962306a36Sopenharmony_ci 15062306a36Sopenharmony_ci ppc_spe_sha256_final(desc, (u8 *)D); 15162306a36Sopenharmony_ci 15262306a36Sopenharmony_ci /* avoid bytewise memcpy */ 15362306a36Sopenharmony_ci dst[0] = D[0]; 15462306a36Sopenharmony_ci dst[1] = D[1]; 15562306a36Sopenharmony_ci dst[2] = D[2]; 15662306a36Sopenharmony_ci dst[3] = D[3]; 15762306a36Sopenharmony_ci dst[4] = D[4]; 15862306a36Sopenharmony_ci dst[5] = D[5]; 15962306a36Sopenharmony_ci dst[6] = D[6]; 16062306a36Sopenharmony_ci 16162306a36Sopenharmony_ci /* clear sensitive data */ 16262306a36Sopenharmony_ci memzero_explicit(D, SHA256_DIGEST_SIZE); 16362306a36Sopenharmony_ci return 0; 16462306a36Sopenharmony_ci} 16562306a36Sopenharmony_ci 16662306a36Sopenharmony_cistatic int ppc_spe_sha256_export(struct shash_desc *desc, void *out) 16762306a36Sopenharmony_ci{ 16862306a36Sopenharmony_ci struct sha256_state *sctx = shash_desc_ctx(desc); 16962306a36Sopenharmony_ci 17062306a36Sopenharmony_ci memcpy(out, sctx, sizeof(*sctx)); 17162306a36Sopenharmony_ci return 0; 17262306a36Sopenharmony_ci} 17362306a36Sopenharmony_ci 17462306a36Sopenharmony_cistatic int ppc_spe_sha256_import(struct shash_desc *desc, const void *in) 17562306a36Sopenharmony_ci{ 17662306a36Sopenharmony_ci struct sha256_state *sctx = shash_desc_ctx(desc); 17762306a36Sopenharmony_ci 17862306a36Sopenharmony_ci memcpy(sctx, in, sizeof(*sctx)); 17962306a36Sopenharmony_ci return 0; 18062306a36Sopenharmony_ci} 18162306a36Sopenharmony_ci 18262306a36Sopenharmony_cistatic struct shash_alg algs[2] = { { 18362306a36Sopenharmony_ci .digestsize = SHA256_DIGEST_SIZE, 18462306a36Sopenharmony_ci .init = sha256_base_init, 18562306a36Sopenharmony_ci .update = ppc_spe_sha256_update, 18662306a36Sopenharmony_ci .final = ppc_spe_sha256_final, 18762306a36Sopenharmony_ci .export = ppc_spe_sha256_export, 18862306a36Sopenharmony_ci .import = ppc_spe_sha256_import, 18962306a36Sopenharmony_ci .descsize = sizeof(struct sha256_state), 19062306a36Sopenharmony_ci .statesize = sizeof(struct sha256_state), 19162306a36Sopenharmony_ci .base = { 19262306a36Sopenharmony_ci .cra_name = "sha256", 19362306a36Sopenharmony_ci .cra_driver_name= "sha256-ppc-spe", 19462306a36Sopenharmony_ci .cra_priority = 300, 19562306a36Sopenharmony_ci .cra_blocksize = SHA256_BLOCK_SIZE, 19662306a36Sopenharmony_ci .cra_module = THIS_MODULE, 19762306a36Sopenharmony_ci } 19862306a36Sopenharmony_ci}, { 19962306a36Sopenharmony_ci .digestsize = SHA224_DIGEST_SIZE, 20062306a36Sopenharmony_ci .init = sha224_base_init, 20162306a36Sopenharmony_ci .update = ppc_spe_sha256_update, 20262306a36Sopenharmony_ci .final = ppc_spe_sha224_final, 20362306a36Sopenharmony_ci .export = ppc_spe_sha256_export, 20462306a36Sopenharmony_ci .import = ppc_spe_sha256_import, 20562306a36Sopenharmony_ci .descsize = sizeof(struct sha256_state), 20662306a36Sopenharmony_ci .statesize = sizeof(struct sha256_state), 20762306a36Sopenharmony_ci .base = { 20862306a36Sopenharmony_ci .cra_name = "sha224", 20962306a36Sopenharmony_ci .cra_driver_name= "sha224-ppc-spe", 21062306a36Sopenharmony_ci .cra_priority = 300, 21162306a36Sopenharmony_ci .cra_blocksize = SHA224_BLOCK_SIZE, 21262306a36Sopenharmony_ci .cra_module = THIS_MODULE, 21362306a36Sopenharmony_ci } 21462306a36Sopenharmony_ci} }; 21562306a36Sopenharmony_ci 21662306a36Sopenharmony_cistatic int __init ppc_spe_sha256_mod_init(void) 21762306a36Sopenharmony_ci{ 21862306a36Sopenharmony_ci return crypto_register_shashes(algs, ARRAY_SIZE(algs)); 21962306a36Sopenharmony_ci} 22062306a36Sopenharmony_ci 22162306a36Sopenharmony_cistatic void __exit ppc_spe_sha256_mod_fini(void) 22262306a36Sopenharmony_ci{ 22362306a36Sopenharmony_ci crypto_unregister_shashes(algs, ARRAY_SIZE(algs)); 22462306a36Sopenharmony_ci} 22562306a36Sopenharmony_ci 22662306a36Sopenharmony_cimodule_init(ppc_spe_sha256_mod_init); 22762306a36Sopenharmony_cimodule_exit(ppc_spe_sha256_mod_fini); 22862306a36Sopenharmony_ci 22962306a36Sopenharmony_ciMODULE_LICENSE("GPL"); 23062306a36Sopenharmony_ciMODULE_DESCRIPTION("SHA-224 and SHA-256 Secure Hash Algorithm, SPE optimized"); 23162306a36Sopenharmony_ci 23262306a36Sopenharmony_ciMODULE_ALIAS_CRYPTO("sha224"); 23362306a36Sopenharmony_ciMODULE_ALIAS_CRYPTO("sha224-ppc-spe"); 23462306a36Sopenharmony_ciMODULE_ALIAS_CRYPTO("sha256"); 23562306a36Sopenharmony_ciMODULE_ALIAS_CRYPTO("sha256-ppc-spe"); 236