162306a36Sopenharmony_ci// SPDX-License-Identifier: GPL-2.0-or-later
262306a36Sopenharmony_ci/*
362306a36Sopenharmony_ci * Glue Code for 3-way parallel assembler optimized version of Twofish
462306a36Sopenharmony_ci *
562306a36Sopenharmony_ci * Copyright (c) 2011 Jussi Kivilinna <jussi.kivilinna@mbnet.fi>
662306a36Sopenharmony_ci */
762306a36Sopenharmony_ci
862306a36Sopenharmony_ci#include <crypto/algapi.h>
962306a36Sopenharmony_ci#include <crypto/twofish.h>
1062306a36Sopenharmony_ci#include <linux/crypto.h>
1162306a36Sopenharmony_ci#include <linux/init.h>
1262306a36Sopenharmony_ci#include <linux/module.h>
1362306a36Sopenharmony_ci#include <linux/types.h>
1462306a36Sopenharmony_ci
1562306a36Sopenharmony_ci#include "twofish.h"
1662306a36Sopenharmony_ci#include "ecb_cbc_helpers.h"
1762306a36Sopenharmony_ci
/*
 * Export the 3-way encrypt/decrypt primitives to other GPL modules.
 * Neither symbol is defined in this file; presumably both live in the
 * accompanying assembler source -- confirm against twofish.h.
 */
EXPORT_SYMBOL_GPL(__twofish_enc_blk_3way);
EXPORT_SYMBOL_GPL(twofish_dec_blk_3way);
2062306a36Sopenharmony_ci
/*
 * skcipher .setkey adapter: forwards the key to twofish_setkey(), passing
 * the base transform embedded in @tfm.
 *
 * @tfm:    skcipher transform whose embedded base tfm is handed on
 * @key:    key material
 * @keylen: length of @key in bytes
 *
 * Returns whatever twofish_setkey() returns.
 */
static int twofish_setkey_skcipher(struct crypto_skcipher *tfm,
				   const u8 *key, unsigned int keylen)
{
	return twofish_setkey(&tfm->base, key, keylen);
}
2662306a36Sopenharmony_ci
/*
 * Three-argument front end for __twofish_enc_blk_3way() with its fourth
 * argument fixed to false. This gives the encrypt routine the same
 * (ctx, dst, src) shape as twofish_dec_blk_3way(), which is how both are
 * handed to ECB_BLOCK() below.
 *
 * NOTE(review): the fourth argument presumably selects an "XOR into dst"
 * mode -- confirm against the prototype in twofish.h.
 */
static inline void twofish_enc_blk_3way(const void *ctx, u8 *dst, const u8 *src)
{
	__twofish_enc_blk_3way(ctx, dst, src, false);
}
3162306a36Sopenharmony_ci
3262306a36Sopenharmony_civoid twofish_dec_blk_cbc_3way(const void *ctx, u8 *dst, const u8 *src)
3362306a36Sopenharmony_ci{
3462306a36Sopenharmony_ci	u8 buf[2][TF_BLOCK_SIZE];
3562306a36Sopenharmony_ci	const u8 *s = src;
3662306a36Sopenharmony_ci
3762306a36Sopenharmony_ci	if (dst == src)
3862306a36Sopenharmony_ci		s = memcpy(buf, src, sizeof(buf));
3962306a36Sopenharmony_ci	twofish_dec_blk_3way(ctx, dst, src);
4062306a36Sopenharmony_ci	crypto_xor(dst + TF_BLOCK_SIZE, s, sizeof(buf));
4162306a36Sopenharmony_ci
4262306a36Sopenharmony_ci}
4362306a36Sopenharmony_ciEXPORT_SYMBOL_GPL(twofish_dec_blk_cbc_3way);
4462306a36Sopenharmony_ci
/*
 * .encrypt handler of the "ecb(twofish)" entry in tf_skciphers[].
 *
 * The whole body is assembled from the ECB_* helper macros, which are not
 * defined in this file (presumably in ecb_cbc_helpers.h). The macros are
 * expected to supply the walk loop and the return statement, so the order
 * of the statements below must be preserved.
 */
static int ecb_encrypt(struct skcipher_request *req)
{
	/* NOTE(review): the -1 presumably means "no FPU section needed" -- confirm in the macro. */
	ECB_WALK_START(req, TF_BLOCK_SIZE, -1);
	/* 3-block routine first, then the single-block routine (presumably for the remainder). */
	ECB_BLOCK(3, twofish_enc_blk_3way);
	ECB_BLOCK(1, twofish_enc_blk);
	ECB_WALK_END();
}
5262306a36Sopenharmony_ci
/*
 * .decrypt handler of the "ecb(twofish)" entry in tf_skciphers[].
 *
 * Same macro-built structure as the encrypt path, with the decrypt routines
 * plugged in. The ECB_* macros are defined outside this file (presumably in
 * ecb_cbc_helpers.h) and are expected to supply the return statement.
 */
static int ecb_decrypt(struct skcipher_request *req)
{
	/* NOTE(review): the -1 presumably means "no FPU section needed" -- confirm in the macro. */
	ECB_WALK_START(req, TF_BLOCK_SIZE, -1);
	/* 3-block routine first, then the single-block routine (presumably for the remainder). */
	ECB_BLOCK(3, twofish_dec_blk_3way);
	ECB_BLOCK(1, twofish_dec_blk);
	ECB_WALK_END();
}
6062306a36Sopenharmony_ci
/*
 * .encrypt handler of the "cbc(twofish)" entry in tf_skciphers[].
 *
 * Only the single-block routine is used: in CBC mode each plaintext block
 * is chained to the previous ciphertext block before encryption, so the
 * blocks cannot be encrypted in parallel. The CBC_* macros are defined
 * outside this file (presumably in ecb_cbc_helpers.h) and are expected to
 * supply the walk loop and the return statement.
 */
static int cbc_encrypt(struct skcipher_request *req)
{
	/* NOTE(review): the -1 presumably means "no FPU section needed" -- confirm in the macro. */
	CBC_WALK_START(req, TF_BLOCK_SIZE, -1);
	CBC_ENC_BLOCK(twofish_enc_blk);
	CBC_WALK_END();
}
6762306a36Sopenharmony_ci
/*
 * .decrypt handler of the "cbc(twofish)" entry in tf_skciphers[].
 *
 * Groups of three blocks go through twofish_dec_blk_cbc_3way(); the
 * single-block routine is listed second, presumably to handle whatever is
 * left over. The CBC_* macros are defined outside this file (presumably in
 * ecb_cbc_helpers.h) and are expected to supply the walk loop and the
 * return statement.
 */
static int cbc_decrypt(struct skcipher_request *req)
{
	/* NOTE(review): the -1 presumably means "no FPU section needed" -- confirm in the macro. */
	CBC_WALK_START(req, TF_BLOCK_SIZE, -1);
	CBC_DEC_BLOCK(3, twofish_dec_blk_cbc_3way);
	CBC_DEC_BLOCK(1, twofish_dec_blk);
	CBC_WALK_END();
}
7562306a36Sopenharmony_ci
/*
 * skcipher algorithms provided by this module: Twofish in ECB and in CBC
 * mode. Both entries share the key setup routine, key size limits, block
 * size and context size; they differ in name, handlers and IV size.
 * The array is registered in twofish_3way_init() and unregistered in
 * twofish_3way_fini().
 */
static struct skcipher_alg tf_skciphers[] = {
	{
		/* ECB mode: no .ivsize is set for this entry. */
		.base.cra_name		= "ecb(twofish)",
		.base.cra_driver_name	= "ecb-twofish-3way",
		.base.cra_priority	= 300,
		.base.cra_blocksize	= TF_BLOCK_SIZE,
		.base.cra_ctxsize	= sizeof(struct twofish_ctx),
		.base.cra_module	= THIS_MODULE,
		.min_keysize		= TF_MIN_KEY_SIZE,
		.max_keysize		= TF_MAX_KEY_SIZE,
		.setkey			= twofish_setkey_skcipher,
		.encrypt		= ecb_encrypt,
		.decrypt		= ecb_decrypt,
	}, {
		/* CBC mode: the IV is one cipher block long. */
		.base.cra_name		= "cbc(twofish)",
		.base.cra_driver_name	= "cbc-twofish-3way",
		.base.cra_priority	= 300,
		.base.cra_blocksize	= TF_BLOCK_SIZE,
		.base.cra_ctxsize	= sizeof(struct twofish_ctx),
		.base.cra_module	= THIS_MODULE,
		.min_keysize		= TF_MIN_KEY_SIZE,
		.max_keysize		= TF_MAX_KEY_SIZE,
		.ivsize			= TF_BLOCK_SIZE,
		.setkey			= twofish_setkey_skcipher,
		.encrypt		= cbc_encrypt,
		.decrypt		= cbc_decrypt,
	},
};
10462306a36Sopenharmony_ci
10562306a36Sopenharmony_cistatic bool is_blacklisted_cpu(void)
10662306a36Sopenharmony_ci{
10762306a36Sopenharmony_ci	if (boot_cpu_data.x86_vendor != X86_VENDOR_INTEL)
10862306a36Sopenharmony_ci		return false;
10962306a36Sopenharmony_ci
11062306a36Sopenharmony_ci	if (boot_cpu_data.x86 == 0x06 &&
11162306a36Sopenharmony_ci		(boot_cpu_data.x86_model == 0x1c ||
11262306a36Sopenharmony_ci		 boot_cpu_data.x86_model == 0x26 ||
11362306a36Sopenharmony_ci		 boot_cpu_data.x86_model == 0x36)) {
11462306a36Sopenharmony_ci		/*
11562306a36Sopenharmony_ci		 * On Atom, twofish-3way is slower than original assembler
11662306a36Sopenharmony_ci		 * implementation. Twofish-3way trades off some performance in
11762306a36Sopenharmony_ci		 * storing blocks in 64bit registers to allow three blocks to
11862306a36Sopenharmony_ci		 * be processed parallel. Parallel operation then allows gaining
11962306a36Sopenharmony_ci		 * more performance than was trade off, on out-of-order CPUs.
12062306a36Sopenharmony_ci		 * However Atom does not benefit from this parallelism and
12162306a36Sopenharmony_ci		 * should be blacklisted.
12262306a36Sopenharmony_ci		 */
12362306a36Sopenharmony_ci		return true;
12462306a36Sopenharmony_ci	}
12562306a36Sopenharmony_ci
12662306a36Sopenharmony_ci	if (boot_cpu_data.x86 == 0x0f) {
12762306a36Sopenharmony_ci		/*
12862306a36Sopenharmony_ci		 * On Pentium 4, twofish-3way is slower than original assembler
12962306a36Sopenharmony_ci		 * implementation because excessive uses of 64bit rotate and
13062306a36Sopenharmony_ci		 * left-shifts (which are really slow on P4) needed to store and
13162306a36Sopenharmony_ci		 * handle 128bit block in two 64bit registers.
13262306a36Sopenharmony_ci		 */
13362306a36Sopenharmony_ci		return true;
13462306a36Sopenharmony_ci	}
13562306a36Sopenharmony_ci
13662306a36Sopenharmony_ci	return false;
13762306a36Sopenharmony_ci}
13862306a36Sopenharmony_ci
/*
 * Module parameter "force": when non-zero, twofish_3way_init() skips the
 * CPU blacklist check and registers the algorithms regardless. It is
 * declared with permission bits 0.
 */
static int force;
module_param(force, int, 0);
MODULE_PARM_DESC(force, "Force module load, ignore CPU blacklist");
14262306a36Sopenharmony_ci
14362306a36Sopenharmony_cistatic int __init twofish_3way_init(void)
14462306a36Sopenharmony_ci{
14562306a36Sopenharmony_ci	if (!force && is_blacklisted_cpu()) {
14662306a36Sopenharmony_ci		printk(KERN_INFO
14762306a36Sopenharmony_ci			"twofish-x86_64-3way: performance on this CPU "
14862306a36Sopenharmony_ci			"would be suboptimal: disabling "
14962306a36Sopenharmony_ci			"twofish-x86_64-3way.\n");
15062306a36Sopenharmony_ci		return -ENODEV;
15162306a36Sopenharmony_ci	}
15262306a36Sopenharmony_ci
15362306a36Sopenharmony_ci	return crypto_register_skciphers(tf_skciphers,
15462306a36Sopenharmony_ci					 ARRAY_SIZE(tf_skciphers));
15562306a36Sopenharmony_ci}
15662306a36Sopenharmony_ci
/*
 * Module exit: unregister every algorithm in tf_skciphers[], i.e. the same
 * array and count that twofish_3way_init() passes to the register call.
 */
static void __exit twofish_3way_fini(void)
{
	crypto_unregister_skciphers(tf_skciphers, ARRAY_SIZE(tf_skciphers));
}
16162306a36Sopenharmony_ci
/* Module entry and exit points. */
module_init(twofish_3way_init);
module_exit(twofish_3way_fini);

/* Module metadata and the crypto aliases this module answers to. */
MODULE_LICENSE("GPL");
MODULE_DESCRIPTION("Twofish Cipher Algorithm, 3-way parallel asm optimized");
MODULE_ALIAS_CRYPTO("twofish");
MODULE_ALIAS_CRYPTO("twofish-asm");
169