162306a36Sopenharmony_ci// SPDX-License-Identifier: GPL-2.0-or-later 262306a36Sopenharmony_ci/* 362306a36Sopenharmony_ci * Glue code for SHA-1 implementation for SPE instructions (PPC) 462306a36Sopenharmony_ci * 562306a36Sopenharmony_ci * Based on generic implementation. 662306a36Sopenharmony_ci * 762306a36Sopenharmony_ci * Copyright (c) 2015 Markus Stockhausen <stockhausen@collogia.de> 862306a36Sopenharmony_ci */ 962306a36Sopenharmony_ci 1062306a36Sopenharmony_ci#include <crypto/internal/hash.h> 1162306a36Sopenharmony_ci#include <linux/init.h> 1262306a36Sopenharmony_ci#include <linux/module.h> 1362306a36Sopenharmony_ci#include <linux/mm.h> 1462306a36Sopenharmony_ci#include <linux/types.h> 1562306a36Sopenharmony_ci#include <crypto/sha1.h> 1662306a36Sopenharmony_ci#include <crypto/sha1_base.h> 1762306a36Sopenharmony_ci#include <asm/byteorder.h> 1862306a36Sopenharmony_ci#include <asm/switch_to.h> 1962306a36Sopenharmony_ci#include <linux/hardirq.h> 2062306a36Sopenharmony_ci 2162306a36Sopenharmony_ci/* 2262306a36Sopenharmony_ci * MAX_BYTES defines the number of bytes that are allowed to be processed 2362306a36Sopenharmony_ci * between preempt_disable() and preempt_enable(). SHA1 takes ~1000 2462306a36Sopenharmony_ci * operations per 64 bytes. e500 cores can issue two arithmetic instructions 2562306a36Sopenharmony_ci * per clock cycle using one 32/64 bit unit (SU1) and one 32 bit unit (SU2). 2662306a36Sopenharmony_ci * Thus 2KB of input data will need an estimated maximum of 18,000 cycles. 2762306a36Sopenharmony_ci * Headroom for cache misses included. Even with the low end model clocked 2862306a36Sopenharmony_ci * at 667 MHz this equals to a critical time window of less than 27us. 2962306a36Sopenharmony_ci * 3062306a36Sopenharmony_ci */ 3162306a36Sopenharmony_ci#define MAX_BYTES 2048 3262306a36Sopenharmony_ci 3362306a36Sopenharmony_ciextern void ppc_spe_sha1_transform(u32 *state, const u8 *src, u32 blocks); 3462306a36Sopenharmony_ci 3562306a36Sopenharmony_cistatic void spe_begin(void) 3662306a36Sopenharmony_ci{ 3762306a36Sopenharmony_ci /* We just start SPE operations and will save SPE registers later. */ 3862306a36Sopenharmony_ci preempt_disable(); 3962306a36Sopenharmony_ci enable_kernel_spe(); 4062306a36Sopenharmony_ci} 4162306a36Sopenharmony_ci 4262306a36Sopenharmony_cistatic void spe_end(void) 4362306a36Sopenharmony_ci{ 4462306a36Sopenharmony_ci disable_kernel_spe(); 4562306a36Sopenharmony_ci /* reenable preemption */ 4662306a36Sopenharmony_ci preempt_enable(); 4762306a36Sopenharmony_ci} 4862306a36Sopenharmony_ci 4962306a36Sopenharmony_cistatic inline void ppc_sha1_clear_context(struct sha1_state *sctx) 5062306a36Sopenharmony_ci{ 5162306a36Sopenharmony_ci int count = sizeof(struct sha1_state) >> 2; 5262306a36Sopenharmony_ci u32 *ptr = (u32 *)sctx; 5362306a36Sopenharmony_ci 5462306a36Sopenharmony_ci /* make sure we can clear the fast way */ 5562306a36Sopenharmony_ci BUILD_BUG_ON(sizeof(struct sha1_state) % 4); 5662306a36Sopenharmony_ci do { *ptr++ = 0; } while (--count); 5762306a36Sopenharmony_ci} 5862306a36Sopenharmony_ci 5962306a36Sopenharmony_cistatic int ppc_spe_sha1_update(struct shash_desc *desc, const u8 *data, 6062306a36Sopenharmony_ci unsigned int len) 6162306a36Sopenharmony_ci{ 6262306a36Sopenharmony_ci struct sha1_state *sctx = shash_desc_ctx(desc); 6362306a36Sopenharmony_ci const unsigned int offset = sctx->count & 0x3f; 6462306a36Sopenharmony_ci const unsigned int avail = 64 - offset; 6562306a36Sopenharmony_ci unsigned int bytes; 6662306a36Sopenharmony_ci const u8 *src = data; 6762306a36Sopenharmony_ci 6862306a36Sopenharmony_ci if (avail > len) { 6962306a36Sopenharmony_ci sctx->count += len; 7062306a36Sopenharmony_ci memcpy((char *)sctx->buffer + offset, src, len); 7162306a36Sopenharmony_ci return 0; 7262306a36Sopenharmony_ci } 7362306a36Sopenharmony_ci 7462306a36Sopenharmony_ci sctx->count += len; 7562306a36Sopenharmony_ci 7662306a36Sopenharmony_ci if (offset) { 7762306a36Sopenharmony_ci memcpy((char *)sctx->buffer + offset, src, avail); 7862306a36Sopenharmony_ci 7962306a36Sopenharmony_ci spe_begin(); 8062306a36Sopenharmony_ci ppc_spe_sha1_transform(sctx->state, (const u8 *)sctx->buffer, 1); 8162306a36Sopenharmony_ci spe_end(); 8262306a36Sopenharmony_ci 8362306a36Sopenharmony_ci len -= avail; 8462306a36Sopenharmony_ci src += avail; 8562306a36Sopenharmony_ci } 8662306a36Sopenharmony_ci 8762306a36Sopenharmony_ci while (len > 63) { 8862306a36Sopenharmony_ci bytes = (len > MAX_BYTES) ? MAX_BYTES : len; 8962306a36Sopenharmony_ci bytes = bytes & ~0x3f; 9062306a36Sopenharmony_ci 9162306a36Sopenharmony_ci spe_begin(); 9262306a36Sopenharmony_ci ppc_spe_sha1_transform(sctx->state, src, bytes >> 6); 9362306a36Sopenharmony_ci spe_end(); 9462306a36Sopenharmony_ci 9562306a36Sopenharmony_ci src += bytes; 9662306a36Sopenharmony_ci len -= bytes; 9762306a36Sopenharmony_ci } 9862306a36Sopenharmony_ci 9962306a36Sopenharmony_ci memcpy((char *)sctx->buffer, src, len); 10062306a36Sopenharmony_ci return 0; 10162306a36Sopenharmony_ci} 10262306a36Sopenharmony_ci 10362306a36Sopenharmony_cistatic int ppc_spe_sha1_final(struct shash_desc *desc, u8 *out) 10462306a36Sopenharmony_ci{ 10562306a36Sopenharmony_ci struct sha1_state *sctx = shash_desc_ctx(desc); 10662306a36Sopenharmony_ci const unsigned int offset = sctx->count & 0x3f; 10762306a36Sopenharmony_ci char *p = (char *)sctx->buffer + offset; 10862306a36Sopenharmony_ci int padlen; 10962306a36Sopenharmony_ci __be64 *pbits = (__be64 *)(((char *)&sctx->buffer) + 56); 11062306a36Sopenharmony_ci __be32 *dst = (__be32 *)out; 11162306a36Sopenharmony_ci 11262306a36Sopenharmony_ci padlen = 55 - offset; 11362306a36Sopenharmony_ci *p++ = 0x80; 11462306a36Sopenharmony_ci 11562306a36Sopenharmony_ci spe_begin(); 11662306a36Sopenharmony_ci 11762306a36Sopenharmony_ci if (padlen < 0) { 11862306a36Sopenharmony_ci memset(p, 0x00, padlen + sizeof (u64)); 11962306a36Sopenharmony_ci ppc_spe_sha1_transform(sctx->state, sctx->buffer, 1); 12062306a36Sopenharmony_ci p = (char *)sctx->buffer; 12162306a36Sopenharmony_ci padlen = 56; 12262306a36Sopenharmony_ci } 12362306a36Sopenharmony_ci 12462306a36Sopenharmony_ci memset(p, 0, padlen); 12562306a36Sopenharmony_ci *pbits = cpu_to_be64(sctx->count << 3); 12662306a36Sopenharmony_ci ppc_spe_sha1_transform(sctx->state, sctx->buffer, 1); 12762306a36Sopenharmony_ci 12862306a36Sopenharmony_ci spe_end(); 12962306a36Sopenharmony_ci 13062306a36Sopenharmony_ci dst[0] = cpu_to_be32(sctx->state[0]); 13162306a36Sopenharmony_ci dst[1] = cpu_to_be32(sctx->state[1]); 13262306a36Sopenharmony_ci dst[2] = cpu_to_be32(sctx->state[2]); 13362306a36Sopenharmony_ci dst[3] = cpu_to_be32(sctx->state[3]); 13462306a36Sopenharmony_ci dst[4] = cpu_to_be32(sctx->state[4]); 13562306a36Sopenharmony_ci 13662306a36Sopenharmony_ci ppc_sha1_clear_context(sctx); 13762306a36Sopenharmony_ci return 0; 13862306a36Sopenharmony_ci} 13962306a36Sopenharmony_ci 14062306a36Sopenharmony_cistatic int ppc_spe_sha1_export(struct shash_desc *desc, void *out) 14162306a36Sopenharmony_ci{ 14262306a36Sopenharmony_ci struct sha1_state *sctx = shash_desc_ctx(desc); 14362306a36Sopenharmony_ci 14462306a36Sopenharmony_ci memcpy(out, sctx, sizeof(*sctx)); 14562306a36Sopenharmony_ci return 0; 14662306a36Sopenharmony_ci} 14762306a36Sopenharmony_ci 14862306a36Sopenharmony_cistatic int ppc_spe_sha1_import(struct shash_desc *desc, const void *in) 14962306a36Sopenharmony_ci{ 15062306a36Sopenharmony_ci struct sha1_state *sctx = shash_desc_ctx(desc); 15162306a36Sopenharmony_ci 15262306a36Sopenharmony_ci memcpy(sctx, in, sizeof(*sctx)); 15362306a36Sopenharmony_ci return 0; 15462306a36Sopenharmony_ci} 15562306a36Sopenharmony_ci 15662306a36Sopenharmony_cistatic struct shash_alg alg = { 15762306a36Sopenharmony_ci .digestsize = SHA1_DIGEST_SIZE, 15862306a36Sopenharmony_ci .init = sha1_base_init, 15962306a36Sopenharmony_ci .update = ppc_spe_sha1_update, 16062306a36Sopenharmony_ci .final = ppc_spe_sha1_final, 16162306a36Sopenharmony_ci .export = ppc_spe_sha1_export, 16262306a36Sopenharmony_ci .import = ppc_spe_sha1_import, 16362306a36Sopenharmony_ci .descsize = sizeof(struct sha1_state), 16462306a36Sopenharmony_ci .statesize = sizeof(struct sha1_state), 16562306a36Sopenharmony_ci .base = { 16662306a36Sopenharmony_ci .cra_name = "sha1", 16762306a36Sopenharmony_ci .cra_driver_name= "sha1-ppc-spe", 16862306a36Sopenharmony_ci .cra_priority = 300, 16962306a36Sopenharmony_ci .cra_blocksize = SHA1_BLOCK_SIZE, 17062306a36Sopenharmony_ci .cra_module = THIS_MODULE, 17162306a36Sopenharmony_ci } 17262306a36Sopenharmony_ci}; 17362306a36Sopenharmony_ci 17462306a36Sopenharmony_cistatic int __init ppc_spe_sha1_mod_init(void) 17562306a36Sopenharmony_ci{ 17662306a36Sopenharmony_ci return crypto_register_shash(&alg); 17762306a36Sopenharmony_ci} 17862306a36Sopenharmony_ci 17962306a36Sopenharmony_cistatic void __exit ppc_spe_sha1_mod_fini(void) 18062306a36Sopenharmony_ci{ 18162306a36Sopenharmony_ci crypto_unregister_shash(&alg); 18262306a36Sopenharmony_ci} 18362306a36Sopenharmony_ci 18462306a36Sopenharmony_cimodule_init(ppc_spe_sha1_mod_init); 18562306a36Sopenharmony_cimodule_exit(ppc_spe_sha1_mod_fini); 18662306a36Sopenharmony_ci 18762306a36Sopenharmony_ciMODULE_LICENSE("GPL"); 18862306a36Sopenharmony_ciMODULE_DESCRIPTION("SHA1 Secure Hash Algorithm, SPE optimized"); 18962306a36Sopenharmony_ci 19062306a36Sopenharmony_ciMODULE_ALIAS_CRYPTO("sha1"); 19162306a36Sopenharmony_ciMODULE_ALIAS_CRYPTO("sha1-ppc-spe"); 192