162306a36Sopenharmony_ci// SPDX-License-Identifier: GPL-2.0-only
262306a36Sopenharmony_ci/*
362306a36Sopenharmony_ci * Accelerated CRC-T10DIF using arm64 NEON and Crypto Extensions instructions
462306a36Sopenharmony_ci *
562306a36Sopenharmony_ci * Copyright (C) 2016 - 2017 Linaro Ltd <ard.biesheuvel@linaro.org>
662306a36Sopenharmony_ci */
762306a36Sopenharmony_ci
862306a36Sopenharmony_ci#include <linux/cpufeature.h>
962306a36Sopenharmony_ci#include <linux/crc-t10dif.h>
1062306a36Sopenharmony_ci#include <linux/init.h>
1162306a36Sopenharmony_ci#include <linux/kernel.h>
1262306a36Sopenharmony_ci#include <linux/module.h>
1362306a36Sopenharmony_ci#include <linux/string.h>
1462306a36Sopenharmony_ci
1562306a36Sopenharmony_ci#include <crypto/internal/hash.h>
1662306a36Sopenharmony_ci#include <crypto/internal/simd.h>
1762306a36Sopenharmony_ci
1862306a36Sopenharmony_ci#include <asm/neon.h>
1962306a36Sopenharmony_ci#include <asm/simd.h>
2062306a36Sopenharmony_ci
/*
 * Length threshold, in bytes, used by the update handlers in this file:
 * inputs shorter than this are passed to crc_t10dif_generic(), and the same
 * value is the slack added to SZ_4K when deciding whether to split the input.
 */
#define CRC_T10DIF_PMULL_CHUNK_SIZE	16U

/*
 * CRC routines defined outside this file (asmlinkage - presumably the
 * accompanying assembly source; confirm). Each takes the running CRC, a
 * buffer and its length, and returns the updated CRC. The update handlers
 * in this file only call them with len >= CRC_T10DIF_PMULL_CHUNK_SIZE and
 * between kernel_neon_begin() and kernel_neon_end().
 */
asmlinkage u16 crc_t10dif_pmull_p8(u16 init_crc, const u8 *buf, size_t len);
asmlinkage u16 crc_t10dif_pmull_p64(u16 init_crc, const u8 *buf, size_t len);
2562306a36Sopenharmony_ci
2662306a36Sopenharmony_cistatic int crct10dif_init(struct shash_desc *desc)
2762306a36Sopenharmony_ci{
2862306a36Sopenharmony_ci	u16 *crc = shash_desc_ctx(desc);
2962306a36Sopenharmony_ci
3062306a36Sopenharmony_ci	*crc = 0;
3162306a36Sopenharmony_ci	return 0;
3262306a36Sopenharmony_ci}
3362306a36Sopenharmony_ci
3462306a36Sopenharmony_cistatic int crct10dif_update_pmull_p8(struct shash_desc *desc, const u8 *data,
3562306a36Sopenharmony_ci			    unsigned int length)
3662306a36Sopenharmony_ci{
3762306a36Sopenharmony_ci	u16 *crc = shash_desc_ctx(desc);
3862306a36Sopenharmony_ci
3962306a36Sopenharmony_ci	if (length >= CRC_T10DIF_PMULL_CHUNK_SIZE && crypto_simd_usable()) {
4062306a36Sopenharmony_ci		do {
4162306a36Sopenharmony_ci			unsigned int chunk = length;
4262306a36Sopenharmony_ci
4362306a36Sopenharmony_ci			if (chunk > SZ_4K + CRC_T10DIF_PMULL_CHUNK_SIZE)
4462306a36Sopenharmony_ci				chunk = SZ_4K;
4562306a36Sopenharmony_ci
4662306a36Sopenharmony_ci			kernel_neon_begin();
4762306a36Sopenharmony_ci			*crc = crc_t10dif_pmull_p8(*crc, data, chunk);
4862306a36Sopenharmony_ci			kernel_neon_end();
4962306a36Sopenharmony_ci			data += chunk;
5062306a36Sopenharmony_ci			length -= chunk;
5162306a36Sopenharmony_ci		} while (length);
5262306a36Sopenharmony_ci	} else {
5362306a36Sopenharmony_ci		*crc = crc_t10dif_generic(*crc, data, length);
5462306a36Sopenharmony_ci	}
5562306a36Sopenharmony_ci
5662306a36Sopenharmony_ci	return 0;
5762306a36Sopenharmony_ci}
5862306a36Sopenharmony_ci
5962306a36Sopenharmony_cistatic int crct10dif_update_pmull_p64(struct shash_desc *desc, const u8 *data,
6062306a36Sopenharmony_ci			    unsigned int length)
6162306a36Sopenharmony_ci{
6262306a36Sopenharmony_ci	u16 *crc = shash_desc_ctx(desc);
6362306a36Sopenharmony_ci
6462306a36Sopenharmony_ci	if (length >= CRC_T10DIF_PMULL_CHUNK_SIZE && crypto_simd_usable()) {
6562306a36Sopenharmony_ci		do {
6662306a36Sopenharmony_ci			unsigned int chunk = length;
6762306a36Sopenharmony_ci
6862306a36Sopenharmony_ci			if (chunk > SZ_4K + CRC_T10DIF_PMULL_CHUNK_SIZE)
6962306a36Sopenharmony_ci				chunk = SZ_4K;
7062306a36Sopenharmony_ci
7162306a36Sopenharmony_ci			kernel_neon_begin();
7262306a36Sopenharmony_ci			*crc = crc_t10dif_pmull_p64(*crc, data, chunk);
7362306a36Sopenharmony_ci			kernel_neon_end();
7462306a36Sopenharmony_ci			data += chunk;
7562306a36Sopenharmony_ci			length -= chunk;
7662306a36Sopenharmony_ci		} while (length);
7762306a36Sopenharmony_ci	} else {
7862306a36Sopenharmony_ci		*crc = crc_t10dif_generic(*crc, data, length);
7962306a36Sopenharmony_ci	}
8062306a36Sopenharmony_ci
8162306a36Sopenharmony_ci	return 0;
8262306a36Sopenharmony_ci}
8362306a36Sopenharmony_ci
8462306a36Sopenharmony_cistatic int crct10dif_final(struct shash_desc *desc, u8 *out)
8562306a36Sopenharmony_ci{
8662306a36Sopenharmony_ci	u16 *crc = shash_desc_ctx(desc);
8762306a36Sopenharmony_ci
8862306a36Sopenharmony_ci	*(u16 *)out = *crc;
8962306a36Sopenharmony_ci	return 0;
9062306a36Sopenharmony_ci}
9162306a36Sopenharmony_ci
9262306a36Sopenharmony_cistatic struct shash_alg crc_t10dif_alg[] = {{
9362306a36Sopenharmony_ci	.digestsize		= CRC_T10DIF_DIGEST_SIZE,
9462306a36Sopenharmony_ci	.init			= crct10dif_init,
9562306a36Sopenharmony_ci	.update			= crct10dif_update_pmull_p8,
9662306a36Sopenharmony_ci	.final			= crct10dif_final,
9762306a36Sopenharmony_ci	.descsize		= CRC_T10DIF_DIGEST_SIZE,
9862306a36Sopenharmony_ci
9962306a36Sopenharmony_ci	.base.cra_name		= "crct10dif",
10062306a36Sopenharmony_ci	.base.cra_driver_name	= "crct10dif-arm64-neon",
10162306a36Sopenharmony_ci	.base.cra_priority	= 100,
10262306a36Sopenharmony_ci	.base.cra_blocksize	= CRC_T10DIF_BLOCK_SIZE,
10362306a36Sopenharmony_ci	.base.cra_module	= THIS_MODULE,
10462306a36Sopenharmony_ci}, {
10562306a36Sopenharmony_ci	.digestsize		= CRC_T10DIF_DIGEST_SIZE,
10662306a36Sopenharmony_ci	.init			= crct10dif_init,
10762306a36Sopenharmony_ci	.update			= crct10dif_update_pmull_p64,
10862306a36Sopenharmony_ci	.final			= crct10dif_final,
10962306a36Sopenharmony_ci	.descsize		= CRC_T10DIF_DIGEST_SIZE,
11062306a36Sopenharmony_ci
11162306a36Sopenharmony_ci	.base.cra_name		= "crct10dif",
11262306a36Sopenharmony_ci	.base.cra_driver_name	= "crct10dif-arm64-ce",
11362306a36Sopenharmony_ci	.base.cra_priority	= 200,
11462306a36Sopenharmony_ci	.base.cra_blocksize	= CRC_T10DIF_BLOCK_SIZE,
11562306a36Sopenharmony_ci	.base.cra_module	= THIS_MODULE,
11662306a36Sopenharmony_ci}};
11762306a36Sopenharmony_ci
11862306a36Sopenharmony_cistatic int __init crc_t10dif_mod_init(void)
11962306a36Sopenharmony_ci{
12062306a36Sopenharmony_ci	if (cpu_have_named_feature(PMULL))
12162306a36Sopenharmony_ci		return crypto_register_shashes(crc_t10dif_alg,
12262306a36Sopenharmony_ci					       ARRAY_SIZE(crc_t10dif_alg));
12362306a36Sopenharmony_ci	else
12462306a36Sopenharmony_ci		/* only register the first array element */
12562306a36Sopenharmony_ci		return crypto_register_shash(crc_t10dif_alg);
12662306a36Sopenharmony_ci}
12762306a36Sopenharmony_ci
12862306a36Sopenharmony_cistatic void __exit crc_t10dif_mod_exit(void)
12962306a36Sopenharmony_ci{
13062306a36Sopenharmony_ci	if (cpu_have_named_feature(PMULL))
13162306a36Sopenharmony_ci		crypto_unregister_shashes(crc_t10dif_alg,
13262306a36Sopenharmony_ci					  ARRAY_SIZE(crc_t10dif_alg));
13362306a36Sopenharmony_ci	else
13462306a36Sopenharmony_ci		crypto_unregister_shash(crc_t10dif_alg);
13562306a36Sopenharmony_ci}
13662306a36Sopenharmony_ci
13762306a36Sopenharmony_cimodule_cpu_feature_match(ASIMD, crc_t10dif_mod_init);
13862306a36Sopenharmony_cimodule_exit(crc_t10dif_mod_exit);
13962306a36Sopenharmony_ci
14062306a36Sopenharmony_ciMODULE_AUTHOR("Ard Biesheuvel <ard.biesheuvel@linaro.org>");
14162306a36Sopenharmony_ciMODULE_LICENSE("GPL v2");
14262306a36Sopenharmony_ciMODULE_ALIAS_CRYPTO("crct10dif");
14362306a36Sopenharmony_ciMODULE_ALIAS_CRYPTO("crct10dif-arm64-ce");
144