18c2ecf20Sopenharmony_ci// SPDX-License-Identifier: GPL-2.0-or-later 28c2ecf20Sopenharmony_ci/* 38c2ecf20Sopenharmony_ci * Calculate a CRC T10-DIF with vpmsum acceleration 48c2ecf20Sopenharmony_ci * 58c2ecf20Sopenharmony_ci * Copyright 2017, Daniel Axtens, IBM Corporation. 68c2ecf20Sopenharmony_ci * [based on crc32c-vpmsum_glue.c] 78c2ecf20Sopenharmony_ci */ 88c2ecf20Sopenharmony_ci 98c2ecf20Sopenharmony_ci#include <linux/crc-t10dif.h> 108c2ecf20Sopenharmony_ci#include <crypto/internal/hash.h> 118c2ecf20Sopenharmony_ci#include <crypto/internal/simd.h> 128c2ecf20Sopenharmony_ci#include <linux/init.h> 138c2ecf20Sopenharmony_ci#include <linux/module.h> 148c2ecf20Sopenharmony_ci#include <linux/string.h> 158c2ecf20Sopenharmony_ci#include <linux/kernel.h> 168c2ecf20Sopenharmony_ci#include <linux/cpufeature.h> 178c2ecf20Sopenharmony_ci#include <asm/simd.h> 188c2ecf20Sopenharmony_ci#include <asm/switch_to.h> 198c2ecf20Sopenharmony_ci 208c2ecf20Sopenharmony_ci#define VMX_ALIGN 16 218c2ecf20Sopenharmony_ci#define VMX_ALIGN_MASK (VMX_ALIGN-1) 228c2ecf20Sopenharmony_ci 238c2ecf20Sopenharmony_ci#define VECTOR_BREAKPOINT 64 248c2ecf20Sopenharmony_ci 258c2ecf20Sopenharmony_ciu32 __crct10dif_vpmsum(u32 crc, unsigned char const *p, size_t len); 268c2ecf20Sopenharmony_ci 278c2ecf20Sopenharmony_cistatic u16 crct10dif_vpmsum(u16 crci, unsigned char const *p, size_t len) 288c2ecf20Sopenharmony_ci{ 298c2ecf20Sopenharmony_ci unsigned int prealign; 308c2ecf20Sopenharmony_ci unsigned int tail; 318c2ecf20Sopenharmony_ci u32 crc = crci; 328c2ecf20Sopenharmony_ci 338c2ecf20Sopenharmony_ci if (len < (VECTOR_BREAKPOINT + VMX_ALIGN) || !crypto_simd_usable()) 348c2ecf20Sopenharmony_ci return crc_t10dif_generic(crc, p, len); 358c2ecf20Sopenharmony_ci 368c2ecf20Sopenharmony_ci if ((unsigned long)p & VMX_ALIGN_MASK) { 378c2ecf20Sopenharmony_ci prealign = VMX_ALIGN - ((unsigned long)p & VMX_ALIGN_MASK); 388c2ecf20Sopenharmony_ci crc = crc_t10dif_generic(crc, p, prealign); 398c2ecf20Sopenharmony_ci len -= prealign; 408c2ecf20Sopenharmony_ci p += prealign; 418c2ecf20Sopenharmony_ci } 428c2ecf20Sopenharmony_ci 438c2ecf20Sopenharmony_ci if (len & ~VMX_ALIGN_MASK) { 448c2ecf20Sopenharmony_ci crc <<= 16; 458c2ecf20Sopenharmony_ci preempt_disable(); 468c2ecf20Sopenharmony_ci pagefault_disable(); 478c2ecf20Sopenharmony_ci enable_kernel_altivec(); 488c2ecf20Sopenharmony_ci crc = __crct10dif_vpmsum(crc, p, len & ~VMX_ALIGN_MASK); 498c2ecf20Sopenharmony_ci disable_kernel_altivec(); 508c2ecf20Sopenharmony_ci pagefault_enable(); 518c2ecf20Sopenharmony_ci preempt_enable(); 528c2ecf20Sopenharmony_ci crc >>= 16; 538c2ecf20Sopenharmony_ci } 548c2ecf20Sopenharmony_ci 558c2ecf20Sopenharmony_ci tail = len & VMX_ALIGN_MASK; 568c2ecf20Sopenharmony_ci if (tail) { 578c2ecf20Sopenharmony_ci p += len & ~VMX_ALIGN_MASK; 588c2ecf20Sopenharmony_ci crc = crc_t10dif_generic(crc, p, tail); 598c2ecf20Sopenharmony_ci } 608c2ecf20Sopenharmony_ci 618c2ecf20Sopenharmony_ci return crc & 0xffff; 628c2ecf20Sopenharmony_ci} 638c2ecf20Sopenharmony_ci 648c2ecf20Sopenharmony_cistatic int crct10dif_vpmsum_init(struct shash_desc *desc) 658c2ecf20Sopenharmony_ci{ 668c2ecf20Sopenharmony_ci u16 *crc = shash_desc_ctx(desc); 678c2ecf20Sopenharmony_ci 688c2ecf20Sopenharmony_ci *crc = 0; 698c2ecf20Sopenharmony_ci return 0; 708c2ecf20Sopenharmony_ci} 718c2ecf20Sopenharmony_ci 728c2ecf20Sopenharmony_cistatic int crct10dif_vpmsum_update(struct shash_desc *desc, const u8 *data, 738c2ecf20Sopenharmony_ci unsigned int length) 748c2ecf20Sopenharmony_ci{ 758c2ecf20Sopenharmony_ci u16 *crc = shash_desc_ctx(desc); 768c2ecf20Sopenharmony_ci 778c2ecf20Sopenharmony_ci *crc = crct10dif_vpmsum(*crc, data, length); 788c2ecf20Sopenharmony_ci 798c2ecf20Sopenharmony_ci return 0; 808c2ecf20Sopenharmony_ci} 818c2ecf20Sopenharmony_ci 828c2ecf20Sopenharmony_ci 838c2ecf20Sopenharmony_cistatic int crct10dif_vpmsum_final(struct shash_desc *desc, u8 *out) 848c2ecf20Sopenharmony_ci{ 858c2ecf20Sopenharmony_ci u16 *crcp = shash_desc_ctx(desc); 868c2ecf20Sopenharmony_ci 878c2ecf20Sopenharmony_ci *(u16 *)out = *crcp; 888c2ecf20Sopenharmony_ci return 0; 898c2ecf20Sopenharmony_ci} 908c2ecf20Sopenharmony_ci 918c2ecf20Sopenharmony_cistatic struct shash_alg alg = { 928c2ecf20Sopenharmony_ci .init = crct10dif_vpmsum_init, 938c2ecf20Sopenharmony_ci .update = crct10dif_vpmsum_update, 948c2ecf20Sopenharmony_ci .final = crct10dif_vpmsum_final, 958c2ecf20Sopenharmony_ci .descsize = CRC_T10DIF_DIGEST_SIZE, 968c2ecf20Sopenharmony_ci .digestsize = CRC_T10DIF_DIGEST_SIZE, 978c2ecf20Sopenharmony_ci .base = { 988c2ecf20Sopenharmony_ci .cra_name = "crct10dif", 998c2ecf20Sopenharmony_ci .cra_driver_name = "crct10dif-vpmsum", 1008c2ecf20Sopenharmony_ci .cra_priority = 200, 1018c2ecf20Sopenharmony_ci .cra_blocksize = CRC_T10DIF_BLOCK_SIZE, 1028c2ecf20Sopenharmony_ci .cra_module = THIS_MODULE, 1038c2ecf20Sopenharmony_ci } 1048c2ecf20Sopenharmony_ci}; 1058c2ecf20Sopenharmony_ci 1068c2ecf20Sopenharmony_cistatic int __init crct10dif_vpmsum_mod_init(void) 1078c2ecf20Sopenharmony_ci{ 1088c2ecf20Sopenharmony_ci if (!cpu_has_feature(CPU_FTR_ARCH_207S)) 1098c2ecf20Sopenharmony_ci return -ENODEV; 1108c2ecf20Sopenharmony_ci 1118c2ecf20Sopenharmony_ci return crypto_register_shash(&alg); 1128c2ecf20Sopenharmony_ci} 1138c2ecf20Sopenharmony_ci 1148c2ecf20Sopenharmony_cistatic void __exit crct10dif_vpmsum_mod_fini(void) 1158c2ecf20Sopenharmony_ci{ 1168c2ecf20Sopenharmony_ci crypto_unregister_shash(&alg); 1178c2ecf20Sopenharmony_ci} 1188c2ecf20Sopenharmony_ci 1198c2ecf20Sopenharmony_cimodule_cpu_feature_match(PPC_MODULE_FEATURE_VEC_CRYPTO, crct10dif_vpmsum_mod_init); 1208c2ecf20Sopenharmony_cimodule_exit(crct10dif_vpmsum_mod_fini); 1218c2ecf20Sopenharmony_ci 1228c2ecf20Sopenharmony_ciMODULE_AUTHOR("Daniel Axtens <dja@axtens.net>"); 1238c2ecf20Sopenharmony_ciMODULE_DESCRIPTION("CRCT10DIF using vector polynomial multiply-sum instructions"); 1248c2ecf20Sopenharmony_ciMODULE_LICENSE("GPL"); 1258c2ecf20Sopenharmony_ciMODULE_ALIAS_CRYPTO("crct10dif"); 1268c2ecf20Sopenharmony_ciMODULE_ALIAS_CRYPTO("crct10dif-vpmsum"); 127