/* SPDX-License-Identifier: GPL-2.0-only */
/*
 * SM3 secure hash, as specified by OSCCA GM/T 0004-2012 SM3 and described
 * at https://datatracker.ietf.org/doc/html/draft-sca-cfrg-sm3-02
 *
 * Copyright (C) 2017 ARM Limited or its affiliates.
 * Copyright (C) 2017 Gilad Ben-Yossef <gilad@benyossef.com>
 * Copyright (C) 2021 Tianjia Zhang <tianjia.zhang@linux.alibaba.com>
 */

#include <linux/module.h>
#include <linux/types.h>
#include <asm/unaligned.h>
#include <crypto/sm3.h>

1562306a36Sopenharmony_cistatic const u32 ____cacheline_aligned K[64] = {
1662306a36Sopenharmony_ci	0x79cc4519, 0xf3988a32, 0xe7311465, 0xce6228cb,
1762306a36Sopenharmony_ci	0x9cc45197, 0x3988a32f, 0x7311465e, 0xe6228cbc,
1862306a36Sopenharmony_ci	0xcc451979, 0x988a32f3, 0x311465e7, 0x6228cbce,
1962306a36Sopenharmony_ci	0xc451979c, 0x88a32f39, 0x11465e73, 0x228cbce6,
2062306a36Sopenharmony_ci	0x9d8a7a87, 0x3b14f50f, 0x7629ea1e, 0xec53d43c,
2162306a36Sopenharmony_ci	0xd8a7a879, 0xb14f50f3, 0x629ea1e7, 0xc53d43ce,
2262306a36Sopenharmony_ci	0x8a7a879d, 0x14f50f3b, 0x29ea1e76, 0x53d43cec,
2362306a36Sopenharmony_ci	0xa7a879d8, 0x4f50f3b1, 0x9ea1e762, 0x3d43cec5,
2462306a36Sopenharmony_ci	0x7a879d8a, 0xf50f3b14, 0xea1e7629, 0xd43cec53,
2562306a36Sopenharmony_ci	0xa879d8a7, 0x50f3b14f, 0xa1e7629e, 0x43cec53d,
2662306a36Sopenharmony_ci	0x879d8a7a, 0x0f3b14f5, 0x1e7629ea, 0x3cec53d4,
2762306a36Sopenharmony_ci	0x79d8a7a8, 0xf3b14f50, 0xe7629ea1, 0xcec53d43,
2862306a36Sopenharmony_ci	0x9d8a7a87, 0x3b14f50f, 0x7629ea1e, 0xec53d43c,
2962306a36Sopenharmony_ci	0xd8a7a879, 0xb14f50f3, 0x629ea1e7, 0xc53d43ce,
3062306a36Sopenharmony_ci	0x8a7a879d, 0x14f50f3b, 0x29ea1e76, 0x53d43cec,
3162306a36Sopenharmony_ci	0xa7a879d8, 0x4f50f3b1, 0x9ea1e762, 0x3d43cec5
3262306a36Sopenharmony_ci};
3362306a36Sopenharmony_ci
/*
 * Helpers used to transform one message block X, which consists of
 * 16 32-bit words.  See GM/T 0004-2012 for details.
 *
 * These macros are written to be expanded inside sm3_transform():
 * R() assigns to variables named ss1 and ss2, I() reads from a byte
 * pointer named data, and I()/W1()/W2() index an array named W.  All of
 * those names must exist at the point of expansion.
 */

/*
 * One round.  @i selects the boolean functions (FF<i>/GG<i>), @t is the
 * round constant, @w1 and @w2 are message-schedule words.
 *
 * Only d, h, b and f are updated; callers obtain the per-round register
 * rotation by permuting the argument order from one round to the next.
 * @w1 is expanded twice and @w2 once, so @w2 may carry the schedule
 * update while @w1 must be safe to evaluate repeatedly.
 */
#define R(i, a, b, c, d, e, f, g, h, t, w1, w2)			\
	do {							\
		ss1 = rol32((rol32((a), 12) + (e) + (t)), 7);	\
		ss2 = ss1 ^ rol32((a), 12);			\
		d += FF ## i(a, b, c) + ss2 + ((w1) ^ (w2));	\
		h += GG ## i(e, f, g) + ss1 + (w1);		\
		b = rol32((b), 9);				\
		f = rol32((f), 19);				\
		h = P0((h));					\
	} while (0)

/* Round using FF1/GG1 (plain XOR). */
#define R1(a, b, c, d, e, f, g, h, t, w1, w2) \
	R(1, a, b, c, d, e, f, g, h, t, w1, w2)
/* Round using FF2 (majority) and GG2 (choose). */
#define R2(a, b, c, d, e, f, g, h, t, w1, w2) \
	R(2, a, b, c, d, e, f, g, h, t, w1, w2)

/* Arguments are parenthesised so that expression arguments group safely. */
#define FF1(x, y, z)  ((x) ^ (y) ^ (z))
#define FF2(x, y, z)  (((x) & (y)) | ((x) & (z)) | ((y) & (z)))

#define GG1(x, y, z)  FF1(x, y, z)
#define GG2(x, y, z)  (((x) & (y)) | (~(x) & (z)))

/* Message expansion */
#define P0(x) ((x) ^ rol32((x), 9) ^ rol32((x), 17))
#define P1(x) ((x) ^ rol32((x), 15) ^ rol32((x), 23))
/* Load big-endian input word i from data into W[i] and yield it. */
#define I(i)  (W[(i)] = get_unaligned_be32(data + (i) * 4))
/* Schedule word i, read from the 16-entry circular window. */
#define W1(i) (W[(i) & 0x0f])
/*
 * Compute schedule word i from the words 16, 9, 3, 13 and 6 positions
 * behind it, store it over the slot of word i-16 and yield it.
 */
#define W2(i) (W[(i) & 0x0f] =				\
		P1(W[(i) & 0x0f]			\
			^ W[((i)-9) & 0x0f]		\
			^ rol32(W[((i)-3) & 0x0f], 15))	\
		^ rol32(W[((i)-13) & 0x0f], 7)		\
		^ W[((i)-6) & 0x0f])

7262306a36Sopenharmony_cistatic void sm3_transform(struct sm3_state *sctx, u8 const *data, u32 W[16])
7362306a36Sopenharmony_ci{
7462306a36Sopenharmony_ci	u32 a, b, c, d, e, f, g, h, ss1, ss2;
7562306a36Sopenharmony_ci
7662306a36Sopenharmony_ci	a = sctx->state[0];
7762306a36Sopenharmony_ci	b = sctx->state[1];
7862306a36Sopenharmony_ci	c = sctx->state[2];
7962306a36Sopenharmony_ci	d = sctx->state[3];
8062306a36Sopenharmony_ci	e = sctx->state[4];
8162306a36Sopenharmony_ci	f = sctx->state[5];
8262306a36Sopenharmony_ci	g = sctx->state[6];
8362306a36Sopenharmony_ci	h = sctx->state[7];
8462306a36Sopenharmony_ci
8562306a36Sopenharmony_ci	R1(a, b, c, d, e, f, g, h, K[0], I(0), I(4));
8662306a36Sopenharmony_ci	R1(d, a, b, c, h, e, f, g, K[1], I(1), I(5));
8762306a36Sopenharmony_ci	R1(c, d, a, b, g, h, e, f, K[2], I(2), I(6));
8862306a36Sopenharmony_ci	R1(b, c, d, a, f, g, h, e, K[3], I(3), I(7));
8962306a36Sopenharmony_ci	R1(a, b, c, d, e, f, g, h, K[4], W1(4), I(8));
9062306a36Sopenharmony_ci	R1(d, a, b, c, h, e, f, g, K[5], W1(5), I(9));
9162306a36Sopenharmony_ci	R1(c, d, a, b, g, h, e, f, K[6], W1(6), I(10));
9262306a36Sopenharmony_ci	R1(b, c, d, a, f, g, h, e, K[7], W1(7), I(11));
9362306a36Sopenharmony_ci	R1(a, b, c, d, e, f, g, h, K[8], W1(8), I(12));
9462306a36Sopenharmony_ci	R1(d, a, b, c, h, e, f, g, K[9], W1(9), I(13));
9562306a36Sopenharmony_ci	R1(c, d, a, b, g, h, e, f, K[10], W1(10), I(14));
9662306a36Sopenharmony_ci	R1(b, c, d, a, f, g, h, e, K[11], W1(11), I(15));
9762306a36Sopenharmony_ci	R1(a, b, c, d, e, f, g, h, K[12], W1(12), W2(16));
9862306a36Sopenharmony_ci	R1(d, a, b, c, h, e, f, g, K[13], W1(13), W2(17));
9962306a36Sopenharmony_ci	R1(c, d, a, b, g, h, e, f, K[14], W1(14), W2(18));
10062306a36Sopenharmony_ci	R1(b, c, d, a, f, g, h, e, K[15], W1(15), W2(19));
10162306a36Sopenharmony_ci
10262306a36Sopenharmony_ci	R2(a, b, c, d, e, f, g, h, K[16], W1(16), W2(20));
10362306a36Sopenharmony_ci	R2(d, a, b, c, h, e, f, g, K[17], W1(17), W2(21));
10462306a36Sopenharmony_ci	R2(c, d, a, b, g, h, e, f, K[18], W1(18), W2(22));
10562306a36Sopenharmony_ci	R2(b, c, d, a, f, g, h, e, K[19], W1(19), W2(23));
10662306a36Sopenharmony_ci	R2(a, b, c, d, e, f, g, h, K[20], W1(20), W2(24));
10762306a36Sopenharmony_ci	R2(d, a, b, c, h, e, f, g, K[21], W1(21), W2(25));
10862306a36Sopenharmony_ci	R2(c, d, a, b, g, h, e, f, K[22], W1(22), W2(26));
10962306a36Sopenharmony_ci	R2(b, c, d, a, f, g, h, e, K[23], W1(23), W2(27));
11062306a36Sopenharmony_ci	R2(a, b, c, d, e, f, g, h, K[24], W1(24), W2(28));
11162306a36Sopenharmony_ci	R2(d, a, b, c, h, e, f, g, K[25], W1(25), W2(29));
11262306a36Sopenharmony_ci	R2(c, d, a, b, g, h, e, f, K[26], W1(26), W2(30));
11362306a36Sopenharmony_ci	R2(b, c, d, a, f, g, h, e, K[27], W1(27), W2(31));
11462306a36Sopenharmony_ci	R2(a, b, c, d, e, f, g, h, K[28], W1(28), W2(32));
11562306a36Sopenharmony_ci	R2(d, a, b, c, h, e, f, g, K[29], W1(29), W2(33));
11662306a36Sopenharmony_ci	R2(c, d, a, b, g, h, e, f, K[30], W1(30), W2(34));
11762306a36Sopenharmony_ci	R2(b, c, d, a, f, g, h, e, K[31], W1(31), W2(35));
11862306a36Sopenharmony_ci
11962306a36Sopenharmony_ci	R2(a, b, c, d, e, f, g, h, K[32], W1(32), W2(36));
12062306a36Sopenharmony_ci	R2(d, a, b, c, h, e, f, g, K[33], W1(33), W2(37));
12162306a36Sopenharmony_ci	R2(c, d, a, b, g, h, e, f, K[34], W1(34), W2(38));
12262306a36Sopenharmony_ci	R2(b, c, d, a, f, g, h, e, K[35], W1(35), W2(39));
12362306a36Sopenharmony_ci	R2(a, b, c, d, e, f, g, h, K[36], W1(36), W2(40));
12462306a36Sopenharmony_ci	R2(d, a, b, c, h, e, f, g, K[37], W1(37), W2(41));
12562306a36Sopenharmony_ci	R2(c, d, a, b, g, h, e, f, K[38], W1(38), W2(42));
12662306a36Sopenharmony_ci	R2(b, c, d, a, f, g, h, e, K[39], W1(39), W2(43));
12762306a36Sopenharmony_ci	R2(a, b, c, d, e, f, g, h, K[40], W1(40), W2(44));
12862306a36Sopenharmony_ci	R2(d, a, b, c, h, e, f, g, K[41], W1(41), W2(45));
12962306a36Sopenharmony_ci	R2(c, d, a, b, g, h, e, f, K[42], W1(42), W2(46));
13062306a36Sopenharmony_ci	R2(b, c, d, a, f, g, h, e, K[43], W1(43), W2(47));
13162306a36Sopenharmony_ci	R2(a, b, c, d, e, f, g, h, K[44], W1(44), W2(48));
13262306a36Sopenharmony_ci	R2(d, a, b, c, h, e, f, g, K[45], W1(45), W2(49));
13362306a36Sopenharmony_ci	R2(c, d, a, b, g, h, e, f, K[46], W1(46), W2(50));
13462306a36Sopenharmony_ci	R2(b, c, d, a, f, g, h, e, K[47], W1(47), W2(51));
13562306a36Sopenharmony_ci
13662306a36Sopenharmony_ci	R2(a, b, c, d, e, f, g, h, K[48], W1(48), W2(52));
13762306a36Sopenharmony_ci	R2(d, a, b, c, h, e, f, g, K[49], W1(49), W2(53));
13862306a36Sopenharmony_ci	R2(c, d, a, b, g, h, e, f, K[50], W1(50), W2(54));
13962306a36Sopenharmony_ci	R2(b, c, d, a, f, g, h, e, K[51], W1(51), W2(55));
14062306a36Sopenharmony_ci	R2(a, b, c, d, e, f, g, h, K[52], W1(52), W2(56));
14162306a36Sopenharmony_ci	R2(d, a, b, c, h, e, f, g, K[53], W1(53), W2(57));
14262306a36Sopenharmony_ci	R2(c, d, a, b, g, h, e, f, K[54], W1(54), W2(58));
14362306a36Sopenharmony_ci	R2(b, c, d, a, f, g, h, e, K[55], W1(55), W2(59));
14462306a36Sopenharmony_ci	R2(a, b, c, d, e, f, g, h, K[56], W1(56), W2(60));
14562306a36Sopenharmony_ci	R2(d, a, b, c, h, e, f, g, K[57], W1(57), W2(61));
14662306a36Sopenharmony_ci	R2(c, d, a, b, g, h, e, f, K[58], W1(58), W2(62));
14762306a36Sopenharmony_ci	R2(b, c, d, a, f, g, h, e, K[59], W1(59), W2(63));
14862306a36Sopenharmony_ci	R2(a, b, c, d, e, f, g, h, K[60], W1(60), W2(64));
14962306a36Sopenharmony_ci	R2(d, a, b, c, h, e, f, g, K[61], W1(61), W2(65));
15062306a36Sopenharmony_ci	R2(c, d, a, b, g, h, e, f, K[62], W1(62), W2(66));
15162306a36Sopenharmony_ci	R2(b, c, d, a, f, g, h, e, K[63], W1(63), W2(67));
15262306a36Sopenharmony_ci
15362306a36Sopenharmony_ci	sctx->state[0] ^= a;
15462306a36Sopenharmony_ci	sctx->state[1] ^= b;
15562306a36Sopenharmony_ci	sctx->state[2] ^= c;
15662306a36Sopenharmony_ci	sctx->state[3] ^= d;
15762306a36Sopenharmony_ci	sctx->state[4] ^= e;
15862306a36Sopenharmony_ci	sctx->state[5] ^= f;
15962306a36Sopenharmony_ci	sctx->state[6] ^= g;
16062306a36Sopenharmony_ci	sctx->state[7] ^= h;
16162306a36Sopenharmony_ci}
16262306a36Sopenharmony_ci#undef R
16362306a36Sopenharmony_ci#undef R1
16462306a36Sopenharmony_ci#undef R2
16562306a36Sopenharmony_ci#undef I
16662306a36Sopenharmony_ci#undef W1
16762306a36Sopenharmony_ci#undef W2
16862306a36Sopenharmony_ci
16962306a36Sopenharmony_cistatic inline void sm3_block(struct sm3_state *sctx,
17062306a36Sopenharmony_ci		u8 const *data, int blocks, u32 W[16])
17162306a36Sopenharmony_ci{
17262306a36Sopenharmony_ci	while (blocks--) {
17362306a36Sopenharmony_ci		sm3_transform(sctx, data, W);
17462306a36Sopenharmony_ci		data += SM3_BLOCK_SIZE;
17562306a36Sopenharmony_ci	}
17662306a36Sopenharmony_ci}
17762306a36Sopenharmony_ci
17862306a36Sopenharmony_civoid sm3_update(struct sm3_state *sctx, const u8 *data, unsigned int len)
17962306a36Sopenharmony_ci{
18062306a36Sopenharmony_ci	unsigned int partial = sctx->count % SM3_BLOCK_SIZE;
18162306a36Sopenharmony_ci	u32 W[16];
18262306a36Sopenharmony_ci
18362306a36Sopenharmony_ci	sctx->count += len;
18462306a36Sopenharmony_ci
18562306a36Sopenharmony_ci	if ((partial + len) >= SM3_BLOCK_SIZE) {
18662306a36Sopenharmony_ci		int blocks;
18762306a36Sopenharmony_ci
18862306a36Sopenharmony_ci		if (partial) {
18962306a36Sopenharmony_ci			int p = SM3_BLOCK_SIZE - partial;
19062306a36Sopenharmony_ci
19162306a36Sopenharmony_ci			memcpy(sctx->buffer + partial, data, p);
19262306a36Sopenharmony_ci			data += p;
19362306a36Sopenharmony_ci			len -= p;
19462306a36Sopenharmony_ci
19562306a36Sopenharmony_ci			sm3_block(sctx, sctx->buffer, 1, W);
19662306a36Sopenharmony_ci		}
19762306a36Sopenharmony_ci
19862306a36Sopenharmony_ci		blocks = len / SM3_BLOCK_SIZE;
19962306a36Sopenharmony_ci		len %= SM3_BLOCK_SIZE;
20062306a36Sopenharmony_ci
20162306a36Sopenharmony_ci		if (blocks) {
20262306a36Sopenharmony_ci			sm3_block(sctx, data, blocks, W);
20362306a36Sopenharmony_ci			data += blocks * SM3_BLOCK_SIZE;
20462306a36Sopenharmony_ci		}
20562306a36Sopenharmony_ci
20662306a36Sopenharmony_ci		memzero_explicit(W, sizeof(W));
20762306a36Sopenharmony_ci
20862306a36Sopenharmony_ci		partial = 0;
20962306a36Sopenharmony_ci	}
21062306a36Sopenharmony_ci	if (len)
21162306a36Sopenharmony_ci		memcpy(sctx->buffer + partial, data, len);
21262306a36Sopenharmony_ci}
21362306a36Sopenharmony_ciEXPORT_SYMBOL_GPL(sm3_update);
21462306a36Sopenharmony_ci
21562306a36Sopenharmony_civoid sm3_final(struct sm3_state *sctx, u8 *out)
21662306a36Sopenharmony_ci{
21762306a36Sopenharmony_ci	const int bit_offset = SM3_BLOCK_SIZE - sizeof(u64);
21862306a36Sopenharmony_ci	__be64 *bits = (__be64 *)(sctx->buffer + bit_offset);
21962306a36Sopenharmony_ci	__be32 *digest = (__be32 *)out;
22062306a36Sopenharmony_ci	unsigned int partial = sctx->count % SM3_BLOCK_SIZE;
22162306a36Sopenharmony_ci	u32 W[16];
22262306a36Sopenharmony_ci	int i;
22362306a36Sopenharmony_ci
22462306a36Sopenharmony_ci	sctx->buffer[partial++] = 0x80;
22562306a36Sopenharmony_ci	if (partial > bit_offset) {
22662306a36Sopenharmony_ci		memset(sctx->buffer + partial, 0, SM3_BLOCK_SIZE - partial);
22762306a36Sopenharmony_ci		partial = 0;
22862306a36Sopenharmony_ci
22962306a36Sopenharmony_ci		sm3_block(sctx, sctx->buffer, 1, W);
23062306a36Sopenharmony_ci	}
23162306a36Sopenharmony_ci
23262306a36Sopenharmony_ci	memset(sctx->buffer + partial, 0, bit_offset - partial);
23362306a36Sopenharmony_ci	*bits = cpu_to_be64(sctx->count << 3);
23462306a36Sopenharmony_ci	sm3_block(sctx, sctx->buffer, 1, W);
23562306a36Sopenharmony_ci
23662306a36Sopenharmony_ci	for (i = 0; i < 8; i++)
23762306a36Sopenharmony_ci		put_unaligned_be32(sctx->state[i], digest++);
23862306a36Sopenharmony_ci
23962306a36Sopenharmony_ci	/* Zeroize sensitive information. */
24062306a36Sopenharmony_ci	memzero_explicit(W, sizeof(W));
24162306a36Sopenharmony_ci	memzero_explicit(sctx, sizeof(*sctx));
24262306a36Sopenharmony_ci}
24362306a36Sopenharmony_ciEXPORT_SYMBOL_GPL(sm3_final);
24462306a36Sopenharmony_ci
24562306a36Sopenharmony_ciMODULE_DESCRIPTION("Generic SM3 library");
24662306a36Sopenharmony_ciMODULE_LICENSE("GPL v2");
247