162306a36Sopenharmony_ci// SPDX-License-Identifier: GPL-2.0-or-later
262306a36Sopenharmony_ci/*
362306a36Sopenharmony_ci * Glue code for SHA-256 implementation for SPE instructions (PPC)
462306a36Sopenharmony_ci *
562306a36Sopenharmony_ci * Based on generic implementation. The assembler module takes care
662306a36Sopenharmony_ci * about the SPE registers so it can run from interrupt context.
762306a36Sopenharmony_ci *
862306a36Sopenharmony_ci * Copyright (c) 2015 Markus Stockhausen <stockhausen@collogia.de>
962306a36Sopenharmony_ci */
1062306a36Sopenharmony_ci
1162306a36Sopenharmony_ci#include <crypto/internal/hash.h>
1262306a36Sopenharmony_ci#include <linux/init.h>
1362306a36Sopenharmony_ci#include <linux/module.h>
1462306a36Sopenharmony_ci#include <linux/mm.h>
1562306a36Sopenharmony_ci#include <linux/types.h>
1662306a36Sopenharmony_ci#include <crypto/sha2.h>
1762306a36Sopenharmony_ci#include <crypto/sha256_base.h>
1862306a36Sopenharmony_ci#include <asm/byteorder.h>
1962306a36Sopenharmony_ci#include <asm/switch_to.h>
2062306a36Sopenharmony_ci#include <linux/hardirq.h>
2162306a36Sopenharmony_ci
2262306a36Sopenharmony_ci/*
2362306a36Sopenharmony_ci * MAX_BYTES defines the number of bytes that are allowed to be processed
2462306a36Sopenharmony_ci * between preempt_disable() and preempt_enable(). SHA256 takes ~2,000
2562306a36Sopenharmony_ci * operations per 64 bytes. e500 cores can issue two arithmetic instructions
2662306a36Sopenharmony_ci * per clock cycle using one 32/64 bit unit (SU1) and one 32 bit unit (SU2).
2762306a36Sopenharmony_ci * Thus 1KB of input data will need an estimated maximum of 18,000 cycles.
2862306a36Sopenharmony_ci * Headroom for cache misses included. Even with the low end model clocked
2962306a36Sopenharmony_ci * at 667 MHz this equals to a critical time window of less than 27us.
3062306a36Sopenharmony_ci *
3162306a36Sopenharmony_ci */
3262306a36Sopenharmony_ci#define MAX_BYTES 1024
3362306a36Sopenharmony_ci
3462306a36Sopenharmony_ciextern void ppc_spe_sha256_transform(u32 *state, const u8 *src, u32 blocks);
3562306a36Sopenharmony_ci
3662306a36Sopenharmony_cistatic void spe_begin(void)
3762306a36Sopenharmony_ci{
3862306a36Sopenharmony_ci	/* We just start SPE operations and will save SPE registers later. */
3962306a36Sopenharmony_ci	preempt_disable();
4062306a36Sopenharmony_ci	enable_kernel_spe();
4162306a36Sopenharmony_ci}
4262306a36Sopenharmony_ci
4362306a36Sopenharmony_cistatic void spe_end(void)
4462306a36Sopenharmony_ci{
4562306a36Sopenharmony_ci	disable_kernel_spe();
4662306a36Sopenharmony_ci	/* reenable preemption */
4762306a36Sopenharmony_ci	preempt_enable();
4862306a36Sopenharmony_ci}
4962306a36Sopenharmony_ci
5062306a36Sopenharmony_cistatic inline void ppc_sha256_clear_context(struct sha256_state *sctx)
5162306a36Sopenharmony_ci{
5262306a36Sopenharmony_ci	int count = sizeof(struct sha256_state) >> 2;
5362306a36Sopenharmony_ci	u32 *ptr = (u32 *)sctx;
5462306a36Sopenharmony_ci
5562306a36Sopenharmony_ci	/* make sure we can clear the fast way */
5662306a36Sopenharmony_ci	BUILD_BUG_ON(sizeof(struct sha256_state) % 4);
5762306a36Sopenharmony_ci	do { *ptr++ = 0; } while (--count);
5862306a36Sopenharmony_ci}
5962306a36Sopenharmony_ci
6062306a36Sopenharmony_cistatic int ppc_spe_sha256_update(struct shash_desc *desc, const u8 *data,
6162306a36Sopenharmony_ci			unsigned int len)
6262306a36Sopenharmony_ci{
6362306a36Sopenharmony_ci	struct sha256_state *sctx = shash_desc_ctx(desc);
6462306a36Sopenharmony_ci	const unsigned int offset = sctx->count & 0x3f;
6562306a36Sopenharmony_ci	const unsigned int avail = 64 - offset;
6662306a36Sopenharmony_ci	unsigned int bytes;
6762306a36Sopenharmony_ci	const u8 *src = data;
6862306a36Sopenharmony_ci
6962306a36Sopenharmony_ci	if (avail > len) {
7062306a36Sopenharmony_ci		sctx->count += len;
7162306a36Sopenharmony_ci		memcpy((char *)sctx->buf + offset, src, len);
7262306a36Sopenharmony_ci		return 0;
7362306a36Sopenharmony_ci	}
7462306a36Sopenharmony_ci
7562306a36Sopenharmony_ci	sctx->count += len;
7662306a36Sopenharmony_ci
7762306a36Sopenharmony_ci	if (offset) {
7862306a36Sopenharmony_ci		memcpy((char *)sctx->buf + offset, src, avail);
7962306a36Sopenharmony_ci
8062306a36Sopenharmony_ci		spe_begin();
8162306a36Sopenharmony_ci		ppc_spe_sha256_transform(sctx->state, (const u8 *)sctx->buf, 1);
8262306a36Sopenharmony_ci		spe_end();
8362306a36Sopenharmony_ci
8462306a36Sopenharmony_ci		len -= avail;
8562306a36Sopenharmony_ci		src += avail;
8662306a36Sopenharmony_ci	}
8762306a36Sopenharmony_ci
8862306a36Sopenharmony_ci	while (len > 63) {
8962306a36Sopenharmony_ci		/* cut input data into smaller blocks */
9062306a36Sopenharmony_ci		bytes = (len > MAX_BYTES) ? MAX_BYTES : len;
9162306a36Sopenharmony_ci		bytes = bytes & ~0x3f;
9262306a36Sopenharmony_ci
9362306a36Sopenharmony_ci		spe_begin();
9462306a36Sopenharmony_ci		ppc_spe_sha256_transform(sctx->state, src, bytes >> 6);
9562306a36Sopenharmony_ci		spe_end();
9662306a36Sopenharmony_ci
9762306a36Sopenharmony_ci		src += bytes;
9862306a36Sopenharmony_ci		len -= bytes;
9962306a36Sopenharmony_ci	}
10062306a36Sopenharmony_ci
10162306a36Sopenharmony_ci	memcpy((char *)sctx->buf, src, len);
10262306a36Sopenharmony_ci	return 0;
10362306a36Sopenharmony_ci}
10462306a36Sopenharmony_ci
10562306a36Sopenharmony_cistatic int ppc_spe_sha256_final(struct shash_desc *desc, u8 *out)
10662306a36Sopenharmony_ci{
10762306a36Sopenharmony_ci	struct sha256_state *sctx = shash_desc_ctx(desc);
10862306a36Sopenharmony_ci	const unsigned int offset = sctx->count & 0x3f;
10962306a36Sopenharmony_ci	char *p = (char *)sctx->buf + offset;
11062306a36Sopenharmony_ci	int padlen;
11162306a36Sopenharmony_ci	__be64 *pbits = (__be64 *)(((char *)&sctx->buf) + 56);
11262306a36Sopenharmony_ci	__be32 *dst = (__be32 *)out;
11362306a36Sopenharmony_ci
11462306a36Sopenharmony_ci	padlen = 55 - offset;
11562306a36Sopenharmony_ci	*p++ = 0x80;
11662306a36Sopenharmony_ci
11762306a36Sopenharmony_ci	spe_begin();
11862306a36Sopenharmony_ci
11962306a36Sopenharmony_ci	if (padlen < 0) {
12062306a36Sopenharmony_ci		memset(p, 0x00, padlen + sizeof (u64));
12162306a36Sopenharmony_ci		ppc_spe_sha256_transform(sctx->state, sctx->buf, 1);
12262306a36Sopenharmony_ci		p = (char *)sctx->buf;
12362306a36Sopenharmony_ci		padlen = 56;
12462306a36Sopenharmony_ci	}
12562306a36Sopenharmony_ci
12662306a36Sopenharmony_ci	memset(p, 0, padlen);
12762306a36Sopenharmony_ci	*pbits = cpu_to_be64(sctx->count << 3);
12862306a36Sopenharmony_ci	ppc_spe_sha256_transform(sctx->state, sctx->buf, 1);
12962306a36Sopenharmony_ci
13062306a36Sopenharmony_ci	spe_end();
13162306a36Sopenharmony_ci
13262306a36Sopenharmony_ci	dst[0] = cpu_to_be32(sctx->state[0]);
13362306a36Sopenharmony_ci	dst[1] = cpu_to_be32(sctx->state[1]);
13462306a36Sopenharmony_ci	dst[2] = cpu_to_be32(sctx->state[2]);
13562306a36Sopenharmony_ci	dst[3] = cpu_to_be32(sctx->state[3]);
13662306a36Sopenharmony_ci	dst[4] = cpu_to_be32(sctx->state[4]);
13762306a36Sopenharmony_ci	dst[5] = cpu_to_be32(sctx->state[5]);
13862306a36Sopenharmony_ci	dst[6] = cpu_to_be32(sctx->state[6]);
13962306a36Sopenharmony_ci	dst[7] = cpu_to_be32(sctx->state[7]);
14062306a36Sopenharmony_ci
14162306a36Sopenharmony_ci	ppc_sha256_clear_context(sctx);
14262306a36Sopenharmony_ci	return 0;
14362306a36Sopenharmony_ci}
14462306a36Sopenharmony_ci
14562306a36Sopenharmony_cistatic int ppc_spe_sha224_final(struct shash_desc *desc, u8 *out)
14662306a36Sopenharmony_ci{
14762306a36Sopenharmony_ci	__be32 D[SHA256_DIGEST_SIZE >> 2];
14862306a36Sopenharmony_ci	__be32 *dst = (__be32 *)out;
14962306a36Sopenharmony_ci
15062306a36Sopenharmony_ci	ppc_spe_sha256_final(desc, (u8 *)D);
15162306a36Sopenharmony_ci
15262306a36Sopenharmony_ci	/* avoid bytewise memcpy */
15362306a36Sopenharmony_ci	dst[0] = D[0];
15462306a36Sopenharmony_ci	dst[1] = D[1];
15562306a36Sopenharmony_ci	dst[2] = D[2];
15662306a36Sopenharmony_ci	dst[3] = D[3];
15762306a36Sopenharmony_ci	dst[4] = D[4];
15862306a36Sopenharmony_ci	dst[5] = D[5];
15962306a36Sopenharmony_ci	dst[6] = D[6];
16062306a36Sopenharmony_ci
16162306a36Sopenharmony_ci	/* clear sensitive data */
16262306a36Sopenharmony_ci	memzero_explicit(D, SHA256_DIGEST_SIZE);
16362306a36Sopenharmony_ci	return 0;
16462306a36Sopenharmony_ci}
16562306a36Sopenharmony_ci
16662306a36Sopenharmony_cistatic int ppc_spe_sha256_export(struct shash_desc *desc, void *out)
16762306a36Sopenharmony_ci{
16862306a36Sopenharmony_ci	struct sha256_state *sctx = shash_desc_ctx(desc);
16962306a36Sopenharmony_ci
17062306a36Sopenharmony_ci	memcpy(out, sctx, sizeof(*sctx));
17162306a36Sopenharmony_ci	return 0;
17262306a36Sopenharmony_ci}
17362306a36Sopenharmony_ci
17462306a36Sopenharmony_cistatic int ppc_spe_sha256_import(struct shash_desc *desc, const void *in)
17562306a36Sopenharmony_ci{
17662306a36Sopenharmony_ci	struct sha256_state *sctx = shash_desc_ctx(desc);
17762306a36Sopenharmony_ci
17862306a36Sopenharmony_ci	memcpy(sctx, in, sizeof(*sctx));
17962306a36Sopenharmony_ci	return 0;
18062306a36Sopenharmony_ci}
18162306a36Sopenharmony_ci
18262306a36Sopenharmony_cistatic struct shash_alg algs[2] = { {
18362306a36Sopenharmony_ci	.digestsize	=	SHA256_DIGEST_SIZE,
18462306a36Sopenharmony_ci	.init		=	sha256_base_init,
18562306a36Sopenharmony_ci	.update		=	ppc_spe_sha256_update,
18662306a36Sopenharmony_ci	.final		=	ppc_spe_sha256_final,
18762306a36Sopenharmony_ci	.export		=	ppc_spe_sha256_export,
18862306a36Sopenharmony_ci	.import		=	ppc_spe_sha256_import,
18962306a36Sopenharmony_ci	.descsize	=	sizeof(struct sha256_state),
19062306a36Sopenharmony_ci	.statesize	=	sizeof(struct sha256_state),
19162306a36Sopenharmony_ci	.base		=	{
19262306a36Sopenharmony_ci		.cra_name	=	"sha256",
19362306a36Sopenharmony_ci		.cra_driver_name=	"sha256-ppc-spe",
19462306a36Sopenharmony_ci		.cra_priority	=	300,
19562306a36Sopenharmony_ci		.cra_blocksize	=	SHA256_BLOCK_SIZE,
19662306a36Sopenharmony_ci		.cra_module	=	THIS_MODULE,
19762306a36Sopenharmony_ci	}
19862306a36Sopenharmony_ci}, {
19962306a36Sopenharmony_ci	.digestsize	=	SHA224_DIGEST_SIZE,
20062306a36Sopenharmony_ci	.init		=	sha224_base_init,
20162306a36Sopenharmony_ci	.update		=	ppc_spe_sha256_update,
20262306a36Sopenharmony_ci	.final		=	ppc_spe_sha224_final,
20362306a36Sopenharmony_ci	.export		=	ppc_spe_sha256_export,
20462306a36Sopenharmony_ci	.import		=	ppc_spe_sha256_import,
20562306a36Sopenharmony_ci	.descsize	=	sizeof(struct sha256_state),
20662306a36Sopenharmony_ci	.statesize	=	sizeof(struct sha256_state),
20762306a36Sopenharmony_ci	.base		=	{
20862306a36Sopenharmony_ci		.cra_name	=	"sha224",
20962306a36Sopenharmony_ci		.cra_driver_name=	"sha224-ppc-spe",
21062306a36Sopenharmony_ci		.cra_priority	=	300,
21162306a36Sopenharmony_ci		.cra_blocksize	=	SHA224_BLOCK_SIZE,
21262306a36Sopenharmony_ci		.cra_module	=	THIS_MODULE,
21362306a36Sopenharmony_ci	}
21462306a36Sopenharmony_ci} };
21562306a36Sopenharmony_ci
21662306a36Sopenharmony_cistatic int __init ppc_spe_sha256_mod_init(void)
21762306a36Sopenharmony_ci{
21862306a36Sopenharmony_ci	return crypto_register_shashes(algs, ARRAY_SIZE(algs));
21962306a36Sopenharmony_ci}
22062306a36Sopenharmony_ci
22162306a36Sopenharmony_cistatic void __exit ppc_spe_sha256_mod_fini(void)
22262306a36Sopenharmony_ci{
22362306a36Sopenharmony_ci	crypto_unregister_shashes(algs, ARRAY_SIZE(algs));
22462306a36Sopenharmony_ci}
22562306a36Sopenharmony_ci
22662306a36Sopenharmony_cimodule_init(ppc_spe_sha256_mod_init);
22762306a36Sopenharmony_cimodule_exit(ppc_spe_sha256_mod_fini);
22862306a36Sopenharmony_ci
22962306a36Sopenharmony_ciMODULE_LICENSE("GPL");
23062306a36Sopenharmony_ciMODULE_DESCRIPTION("SHA-224 and SHA-256 Secure Hash Algorithm, SPE optimized");
23162306a36Sopenharmony_ci
23262306a36Sopenharmony_ciMODULE_ALIAS_CRYPTO("sha224");
23362306a36Sopenharmony_ciMODULE_ALIAS_CRYPTO("sha224-ppc-spe");
23462306a36Sopenharmony_ciMODULE_ALIAS_CRYPTO("sha256");
23562306a36Sopenharmony_ciMODULE_ALIAS_CRYPTO("sha256-ppc-spe");
236