162306a36Sopenharmony_ci// SPDX-License-Identifier: GPL-2.0-or-later 262306a36Sopenharmony_ci/* 362306a36Sopenharmony_ci * Cryptographic API for the NX-842 hardware compression. 462306a36Sopenharmony_ci * 562306a36Sopenharmony_ci * Copyright (C) IBM Corporation, 2011-2015 662306a36Sopenharmony_ci * 762306a36Sopenharmony_ci * Designer of the Power data compression engine: 862306a36Sopenharmony_ci * Bulent Abali <abali@us.ibm.com> 962306a36Sopenharmony_ci * 1062306a36Sopenharmony_ci * Original Authors: Robert Jennings <rcj@linux.vnet.ibm.com> 1162306a36Sopenharmony_ci * Seth Jennings <sjenning@linux.vnet.ibm.com> 1262306a36Sopenharmony_ci * 1362306a36Sopenharmony_ci * Rewrite: Dan Streetman <ddstreet@ieee.org> 1462306a36Sopenharmony_ci * 1562306a36Sopenharmony_ci * This is an interface to the NX-842 compression hardware in PowerPC 1662306a36Sopenharmony_ci * processors. Most of the complexity of this drvier is due to the fact that 1762306a36Sopenharmony_ci * the NX-842 compression hardware requires the input and output data buffers 1862306a36Sopenharmony_ci * to be specifically aligned, to be a specific multiple in length, and within 1962306a36Sopenharmony_ci * specific minimum and maximum lengths. Those restrictions, provided by the 2062306a36Sopenharmony_ci * nx-842 driver via nx842_constraints, mean this driver must use bounce 2162306a36Sopenharmony_ci * buffers and headers to correct misaligned in or out buffers, and to split 2262306a36Sopenharmony_ci * input buffers that are too large. 2362306a36Sopenharmony_ci * 2462306a36Sopenharmony_ci * This driver will fall back to software decompression if the hardware 2562306a36Sopenharmony_ci * decompression fails, so this driver's decompression should never fail as 2662306a36Sopenharmony_ci * long as the provided compressed buffer is valid. Any compressed buffer 2762306a36Sopenharmony_ci * created by this driver will have a header (except ones where the input 2862306a36Sopenharmony_ci * perfectly matches the constraints); so users of this driver cannot simply 2962306a36Sopenharmony_ci * pass a compressed buffer created by this driver over to the 842 software 3062306a36Sopenharmony_ci * decompression library. Instead, users must use this driver to decompress; 3162306a36Sopenharmony_ci * if the hardware fails or is unavailable, the compressed buffer will be 3262306a36Sopenharmony_ci * parsed and the header removed, and the raw 842 buffer(s) passed to the 842 3362306a36Sopenharmony_ci * software decompression library. 3462306a36Sopenharmony_ci * 3562306a36Sopenharmony_ci * This does not fall back to software compression, however, since the caller 3662306a36Sopenharmony_ci * of this function is specifically requesting hardware compression; if the 3762306a36Sopenharmony_ci * hardware compression fails, the caller can fall back to software 3862306a36Sopenharmony_ci * compression, and the raw 842 compressed buffer that the software compressor 3962306a36Sopenharmony_ci * creates can be passed to this driver for hardware decompression; any 4062306a36Sopenharmony_ci * buffer without our specific header magic is assumed to be a raw 842 buffer 4162306a36Sopenharmony_ci * and passed directly to the hardware. Note that the software compression 4262306a36Sopenharmony_ci * library will produce a compressed buffer that is incompatible with the 4362306a36Sopenharmony_ci * hardware decompressor if the original input buffer length is not a multiple 4462306a36Sopenharmony_ci * of 8; if such a compressed buffer is passed to this driver for 4562306a36Sopenharmony_ci * decompression, the hardware will reject it and this driver will then pass 4662306a36Sopenharmony_ci * it over to the software library for decompression. 4762306a36Sopenharmony_ci */ 4862306a36Sopenharmony_ci 4962306a36Sopenharmony_ci#define pr_fmt(fmt) KBUILD_MODNAME ": " fmt 5062306a36Sopenharmony_ci 5162306a36Sopenharmony_ci#include <linux/vmalloc.h> 5262306a36Sopenharmony_ci#include <linux/sw842.h> 5362306a36Sopenharmony_ci#include <linux/spinlock.h> 5462306a36Sopenharmony_ci 5562306a36Sopenharmony_ci#include "nx-842.h" 5662306a36Sopenharmony_ci 5762306a36Sopenharmony_ci/* The first 5 bits of this magic are 0x1f, which is an invalid 842 5-bit 5862306a36Sopenharmony_ci * template (see lib/842/842.h), so this magic number will never appear at 5962306a36Sopenharmony_ci * the start of a raw 842 compressed buffer. That is important, as any buffer 6062306a36Sopenharmony_ci * passed to us without this magic is assumed to be a raw 842 compressed 6162306a36Sopenharmony_ci * buffer, and passed directly to the hardware to decompress. 6262306a36Sopenharmony_ci */ 6362306a36Sopenharmony_ci#define NX842_CRYPTO_MAGIC (0xf842) 6462306a36Sopenharmony_ci#define NX842_CRYPTO_HEADER_SIZE(g) \ 6562306a36Sopenharmony_ci (sizeof(struct nx842_crypto_header) + \ 6662306a36Sopenharmony_ci sizeof(struct nx842_crypto_header_group) * (g)) 6762306a36Sopenharmony_ci#define NX842_CRYPTO_HEADER_MAX_SIZE \ 6862306a36Sopenharmony_ci NX842_CRYPTO_HEADER_SIZE(NX842_CRYPTO_GROUP_MAX) 6962306a36Sopenharmony_ci 7062306a36Sopenharmony_ci/* bounce buffer size */ 7162306a36Sopenharmony_ci#define BOUNCE_BUFFER_ORDER (2) 7262306a36Sopenharmony_ci#define BOUNCE_BUFFER_SIZE \ 7362306a36Sopenharmony_ci ((unsigned int)(PAGE_SIZE << BOUNCE_BUFFER_ORDER)) 7462306a36Sopenharmony_ci 7562306a36Sopenharmony_ci/* try longer on comp because we can fallback to sw decomp if hw is busy */ 7662306a36Sopenharmony_ci#define COMP_BUSY_TIMEOUT (250) /* ms */ 7762306a36Sopenharmony_ci#define DECOMP_BUSY_TIMEOUT (50) /* ms */ 7862306a36Sopenharmony_ci 7962306a36Sopenharmony_cistruct nx842_crypto_param { 8062306a36Sopenharmony_ci u8 *in; 8162306a36Sopenharmony_ci unsigned int iremain; 8262306a36Sopenharmony_ci u8 *out; 8362306a36Sopenharmony_ci unsigned int oremain; 8462306a36Sopenharmony_ci unsigned int ototal; 8562306a36Sopenharmony_ci}; 8662306a36Sopenharmony_ci 8762306a36Sopenharmony_cistatic int update_param(struct nx842_crypto_param *p, 8862306a36Sopenharmony_ci unsigned int slen, unsigned int dlen) 8962306a36Sopenharmony_ci{ 9062306a36Sopenharmony_ci if (p->iremain < slen) 9162306a36Sopenharmony_ci return -EOVERFLOW; 9262306a36Sopenharmony_ci if (p->oremain < dlen) 9362306a36Sopenharmony_ci return -ENOSPC; 9462306a36Sopenharmony_ci 9562306a36Sopenharmony_ci p->in += slen; 9662306a36Sopenharmony_ci p->iremain -= slen; 9762306a36Sopenharmony_ci p->out += dlen; 9862306a36Sopenharmony_ci p->oremain -= dlen; 9962306a36Sopenharmony_ci p->ototal += dlen; 10062306a36Sopenharmony_ci 10162306a36Sopenharmony_ci return 0; 10262306a36Sopenharmony_ci} 10362306a36Sopenharmony_ci 10462306a36Sopenharmony_ciint nx842_crypto_init(struct crypto_tfm *tfm, struct nx842_driver *driver) 10562306a36Sopenharmony_ci{ 10662306a36Sopenharmony_ci struct nx842_crypto_ctx *ctx = crypto_tfm_ctx(tfm); 10762306a36Sopenharmony_ci 10862306a36Sopenharmony_ci spin_lock_init(&ctx->lock); 10962306a36Sopenharmony_ci ctx->driver = driver; 11062306a36Sopenharmony_ci ctx->wmem = kmalloc(driver->workmem_size, GFP_KERNEL); 11162306a36Sopenharmony_ci ctx->sbounce = (u8 *)__get_free_pages(GFP_KERNEL, BOUNCE_BUFFER_ORDER); 11262306a36Sopenharmony_ci ctx->dbounce = (u8 *)__get_free_pages(GFP_KERNEL, BOUNCE_BUFFER_ORDER); 11362306a36Sopenharmony_ci if (!ctx->wmem || !ctx->sbounce || !ctx->dbounce) { 11462306a36Sopenharmony_ci kfree(ctx->wmem); 11562306a36Sopenharmony_ci free_page((unsigned long)ctx->sbounce); 11662306a36Sopenharmony_ci free_page((unsigned long)ctx->dbounce); 11762306a36Sopenharmony_ci return -ENOMEM; 11862306a36Sopenharmony_ci } 11962306a36Sopenharmony_ci 12062306a36Sopenharmony_ci return 0; 12162306a36Sopenharmony_ci} 12262306a36Sopenharmony_ciEXPORT_SYMBOL_GPL(nx842_crypto_init); 12362306a36Sopenharmony_ci 12462306a36Sopenharmony_civoid nx842_crypto_exit(struct crypto_tfm *tfm) 12562306a36Sopenharmony_ci{ 12662306a36Sopenharmony_ci struct nx842_crypto_ctx *ctx = crypto_tfm_ctx(tfm); 12762306a36Sopenharmony_ci 12862306a36Sopenharmony_ci kfree(ctx->wmem); 12962306a36Sopenharmony_ci free_page((unsigned long)ctx->sbounce); 13062306a36Sopenharmony_ci free_page((unsigned long)ctx->dbounce); 13162306a36Sopenharmony_ci} 13262306a36Sopenharmony_ciEXPORT_SYMBOL_GPL(nx842_crypto_exit); 13362306a36Sopenharmony_ci 13462306a36Sopenharmony_cistatic void check_constraints(struct nx842_constraints *c) 13562306a36Sopenharmony_ci{ 13662306a36Sopenharmony_ci /* limit maximum, to always have enough bounce buffer to decompress */ 13762306a36Sopenharmony_ci if (c->maximum > BOUNCE_BUFFER_SIZE) 13862306a36Sopenharmony_ci c->maximum = BOUNCE_BUFFER_SIZE; 13962306a36Sopenharmony_ci} 14062306a36Sopenharmony_ci 14162306a36Sopenharmony_cistatic int nx842_crypto_add_header(struct nx842_crypto_header *hdr, u8 *buf) 14262306a36Sopenharmony_ci{ 14362306a36Sopenharmony_ci int s = NX842_CRYPTO_HEADER_SIZE(hdr->groups); 14462306a36Sopenharmony_ci 14562306a36Sopenharmony_ci /* compress should have added space for header */ 14662306a36Sopenharmony_ci if (s > be16_to_cpu(hdr->group[0].padding)) { 14762306a36Sopenharmony_ci pr_err("Internal error: no space for header\n"); 14862306a36Sopenharmony_ci return -EINVAL; 14962306a36Sopenharmony_ci } 15062306a36Sopenharmony_ci 15162306a36Sopenharmony_ci memcpy(buf, hdr, s); 15262306a36Sopenharmony_ci 15362306a36Sopenharmony_ci print_hex_dump_debug("header ", DUMP_PREFIX_OFFSET, 16, 1, buf, s, 0); 15462306a36Sopenharmony_ci 15562306a36Sopenharmony_ci return 0; 15662306a36Sopenharmony_ci} 15762306a36Sopenharmony_ci 15862306a36Sopenharmony_cistatic int compress(struct nx842_crypto_ctx *ctx, 15962306a36Sopenharmony_ci struct nx842_crypto_param *p, 16062306a36Sopenharmony_ci struct nx842_crypto_header_group *g, 16162306a36Sopenharmony_ci struct nx842_constraints *c, 16262306a36Sopenharmony_ci u16 *ignore, 16362306a36Sopenharmony_ci unsigned int hdrsize) 16462306a36Sopenharmony_ci{ 16562306a36Sopenharmony_ci unsigned int slen = p->iremain, dlen = p->oremain, tmplen; 16662306a36Sopenharmony_ci unsigned int adj_slen = slen; 16762306a36Sopenharmony_ci u8 *src = p->in, *dst = p->out; 16862306a36Sopenharmony_ci int ret, dskip = 0; 16962306a36Sopenharmony_ci ktime_t timeout; 17062306a36Sopenharmony_ci 17162306a36Sopenharmony_ci if (p->iremain == 0) 17262306a36Sopenharmony_ci return -EOVERFLOW; 17362306a36Sopenharmony_ci 17462306a36Sopenharmony_ci if (p->oremain == 0 || hdrsize + c->minimum > dlen) 17562306a36Sopenharmony_ci return -ENOSPC; 17662306a36Sopenharmony_ci 17762306a36Sopenharmony_ci if (slen % c->multiple) 17862306a36Sopenharmony_ci adj_slen = round_up(slen, c->multiple); 17962306a36Sopenharmony_ci if (slen < c->minimum) 18062306a36Sopenharmony_ci adj_slen = c->minimum; 18162306a36Sopenharmony_ci if (slen > c->maximum) 18262306a36Sopenharmony_ci adj_slen = slen = c->maximum; 18362306a36Sopenharmony_ci if (adj_slen > slen || (u64)src % c->alignment) { 18462306a36Sopenharmony_ci adj_slen = min(adj_slen, BOUNCE_BUFFER_SIZE); 18562306a36Sopenharmony_ci slen = min(slen, BOUNCE_BUFFER_SIZE); 18662306a36Sopenharmony_ci if (adj_slen > slen) 18762306a36Sopenharmony_ci memset(ctx->sbounce + slen, 0, adj_slen - slen); 18862306a36Sopenharmony_ci memcpy(ctx->sbounce, src, slen); 18962306a36Sopenharmony_ci src = ctx->sbounce; 19062306a36Sopenharmony_ci slen = adj_slen; 19162306a36Sopenharmony_ci pr_debug("using comp sbounce buffer, len %x\n", slen); 19262306a36Sopenharmony_ci } 19362306a36Sopenharmony_ci 19462306a36Sopenharmony_ci dst += hdrsize; 19562306a36Sopenharmony_ci dlen -= hdrsize; 19662306a36Sopenharmony_ci 19762306a36Sopenharmony_ci if ((u64)dst % c->alignment) { 19862306a36Sopenharmony_ci dskip = (int)(PTR_ALIGN(dst, c->alignment) - dst); 19962306a36Sopenharmony_ci dst += dskip; 20062306a36Sopenharmony_ci dlen -= dskip; 20162306a36Sopenharmony_ci } 20262306a36Sopenharmony_ci if (dlen % c->multiple) 20362306a36Sopenharmony_ci dlen = round_down(dlen, c->multiple); 20462306a36Sopenharmony_ci if (dlen < c->minimum) { 20562306a36Sopenharmony_cinospc: 20662306a36Sopenharmony_ci dst = ctx->dbounce; 20762306a36Sopenharmony_ci dlen = min(p->oremain, BOUNCE_BUFFER_SIZE); 20862306a36Sopenharmony_ci dlen = round_down(dlen, c->multiple); 20962306a36Sopenharmony_ci dskip = 0; 21062306a36Sopenharmony_ci pr_debug("using comp dbounce buffer, len %x\n", dlen); 21162306a36Sopenharmony_ci } 21262306a36Sopenharmony_ci if (dlen > c->maximum) 21362306a36Sopenharmony_ci dlen = c->maximum; 21462306a36Sopenharmony_ci 21562306a36Sopenharmony_ci tmplen = dlen; 21662306a36Sopenharmony_ci timeout = ktime_add_ms(ktime_get(), COMP_BUSY_TIMEOUT); 21762306a36Sopenharmony_ci do { 21862306a36Sopenharmony_ci dlen = tmplen; /* reset dlen, if we're retrying */ 21962306a36Sopenharmony_ci ret = ctx->driver->compress(src, slen, dst, &dlen, ctx->wmem); 22062306a36Sopenharmony_ci /* possibly we should reduce the slen here, instead of 22162306a36Sopenharmony_ci * retrying with the dbounce buffer? 22262306a36Sopenharmony_ci */ 22362306a36Sopenharmony_ci if (ret == -ENOSPC && dst != ctx->dbounce) 22462306a36Sopenharmony_ci goto nospc; 22562306a36Sopenharmony_ci } while (ret == -EBUSY && ktime_before(ktime_get(), timeout)); 22662306a36Sopenharmony_ci if (ret) 22762306a36Sopenharmony_ci return ret; 22862306a36Sopenharmony_ci 22962306a36Sopenharmony_ci dskip += hdrsize; 23062306a36Sopenharmony_ci 23162306a36Sopenharmony_ci if (dst == ctx->dbounce) 23262306a36Sopenharmony_ci memcpy(p->out + dskip, dst, dlen); 23362306a36Sopenharmony_ci 23462306a36Sopenharmony_ci g->padding = cpu_to_be16(dskip); 23562306a36Sopenharmony_ci g->compressed_length = cpu_to_be32(dlen); 23662306a36Sopenharmony_ci g->uncompressed_length = cpu_to_be32(slen); 23762306a36Sopenharmony_ci 23862306a36Sopenharmony_ci if (p->iremain < slen) { 23962306a36Sopenharmony_ci *ignore = slen - p->iremain; 24062306a36Sopenharmony_ci slen = p->iremain; 24162306a36Sopenharmony_ci } 24262306a36Sopenharmony_ci 24362306a36Sopenharmony_ci pr_debug("compress slen %x ignore %x dlen %x padding %x\n", 24462306a36Sopenharmony_ci slen, *ignore, dlen, dskip); 24562306a36Sopenharmony_ci 24662306a36Sopenharmony_ci return update_param(p, slen, dskip + dlen); 24762306a36Sopenharmony_ci} 24862306a36Sopenharmony_ci 24962306a36Sopenharmony_ciint nx842_crypto_compress(struct crypto_tfm *tfm, 25062306a36Sopenharmony_ci const u8 *src, unsigned int slen, 25162306a36Sopenharmony_ci u8 *dst, unsigned int *dlen) 25262306a36Sopenharmony_ci{ 25362306a36Sopenharmony_ci struct nx842_crypto_ctx *ctx = crypto_tfm_ctx(tfm); 25462306a36Sopenharmony_ci struct nx842_crypto_header *hdr = &ctx->header; 25562306a36Sopenharmony_ci struct nx842_crypto_param p; 25662306a36Sopenharmony_ci struct nx842_constraints c = *ctx->driver->constraints; 25762306a36Sopenharmony_ci unsigned int groups, hdrsize, h; 25862306a36Sopenharmony_ci int ret, n; 25962306a36Sopenharmony_ci bool add_header; 26062306a36Sopenharmony_ci u16 ignore = 0; 26162306a36Sopenharmony_ci 26262306a36Sopenharmony_ci check_constraints(&c); 26362306a36Sopenharmony_ci 26462306a36Sopenharmony_ci p.in = (u8 *)src; 26562306a36Sopenharmony_ci p.iremain = slen; 26662306a36Sopenharmony_ci p.out = dst; 26762306a36Sopenharmony_ci p.oremain = *dlen; 26862306a36Sopenharmony_ci p.ototal = 0; 26962306a36Sopenharmony_ci 27062306a36Sopenharmony_ci *dlen = 0; 27162306a36Sopenharmony_ci 27262306a36Sopenharmony_ci groups = min_t(unsigned int, NX842_CRYPTO_GROUP_MAX, 27362306a36Sopenharmony_ci DIV_ROUND_UP(p.iremain, c.maximum)); 27462306a36Sopenharmony_ci hdrsize = NX842_CRYPTO_HEADER_SIZE(groups); 27562306a36Sopenharmony_ci 27662306a36Sopenharmony_ci spin_lock_bh(&ctx->lock); 27762306a36Sopenharmony_ci 27862306a36Sopenharmony_ci /* skip adding header if the buffers meet all constraints */ 27962306a36Sopenharmony_ci add_header = (p.iremain % c.multiple || 28062306a36Sopenharmony_ci p.iremain < c.minimum || 28162306a36Sopenharmony_ci p.iremain > c.maximum || 28262306a36Sopenharmony_ci (u64)p.in % c.alignment || 28362306a36Sopenharmony_ci p.oremain % c.multiple || 28462306a36Sopenharmony_ci p.oremain < c.minimum || 28562306a36Sopenharmony_ci p.oremain > c.maximum || 28662306a36Sopenharmony_ci (u64)p.out % c.alignment); 28762306a36Sopenharmony_ci 28862306a36Sopenharmony_ci hdr->magic = cpu_to_be16(NX842_CRYPTO_MAGIC); 28962306a36Sopenharmony_ci hdr->groups = 0; 29062306a36Sopenharmony_ci hdr->ignore = 0; 29162306a36Sopenharmony_ci 29262306a36Sopenharmony_ci while (p.iremain > 0) { 29362306a36Sopenharmony_ci n = hdr->groups++; 29462306a36Sopenharmony_ci ret = -ENOSPC; 29562306a36Sopenharmony_ci if (hdr->groups > NX842_CRYPTO_GROUP_MAX) 29662306a36Sopenharmony_ci goto unlock; 29762306a36Sopenharmony_ci 29862306a36Sopenharmony_ci /* header goes before first group */ 29962306a36Sopenharmony_ci h = !n && add_header ? hdrsize : 0; 30062306a36Sopenharmony_ci 30162306a36Sopenharmony_ci if (ignore) 30262306a36Sopenharmony_ci pr_warn("internal error, ignore is set %x\n", ignore); 30362306a36Sopenharmony_ci 30462306a36Sopenharmony_ci ret = compress(ctx, &p, &hdr->group[n], &c, &ignore, h); 30562306a36Sopenharmony_ci if (ret) 30662306a36Sopenharmony_ci goto unlock; 30762306a36Sopenharmony_ci } 30862306a36Sopenharmony_ci 30962306a36Sopenharmony_ci if (!add_header && hdr->groups > 1) { 31062306a36Sopenharmony_ci pr_err("Internal error: No header but multiple groups\n"); 31162306a36Sopenharmony_ci ret = -EINVAL; 31262306a36Sopenharmony_ci goto unlock; 31362306a36Sopenharmony_ci } 31462306a36Sopenharmony_ci 31562306a36Sopenharmony_ci /* ignore indicates the input stream needed to be padded */ 31662306a36Sopenharmony_ci hdr->ignore = cpu_to_be16(ignore); 31762306a36Sopenharmony_ci if (ignore) 31862306a36Sopenharmony_ci pr_debug("marked %d bytes as ignore\n", ignore); 31962306a36Sopenharmony_ci 32062306a36Sopenharmony_ci if (add_header) 32162306a36Sopenharmony_ci ret = nx842_crypto_add_header(hdr, dst); 32262306a36Sopenharmony_ci if (ret) 32362306a36Sopenharmony_ci goto unlock; 32462306a36Sopenharmony_ci 32562306a36Sopenharmony_ci *dlen = p.ototal; 32662306a36Sopenharmony_ci 32762306a36Sopenharmony_ci pr_debug("compress total slen %x dlen %x\n", slen, *dlen); 32862306a36Sopenharmony_ci 32962306a36Sopenharmony_ciunlock: 33062306a36Sopenharmony_ci spin_unlock_bh(&ctx->lock); 33162306a36Sopenharmony_ci return ret; 33262306a36Sopenharmony_ci} 33362306a36Sopenharmony_ciEXPORT_SYMBOL_GPL(nx842_crypto_compress); 33462306a36Sopenharmony_ci 33562306a36Sopenharmony_cistatic int decompress(struct nx842_crypto_ctx *ctx, 33662306a36Sopenharmony_ci struct nx842_crypto_param *p, 33762306a36Sopenharmony_ci struct nx842_crypto_header_group *g, 33862306a36Sopenharmony_ci struct nx842_constraints *c, 33962306a36Sopenharmony_ci u16 ignore) 34062306a36Sopenharmony_ci{ 34162306a36Sopenharmony_ci unsigned int slen = be32_to_cpu(g->compressed_length); 34262306a36Sopenharmony_ci unsigned int required_len = be32_to_cpu(g->uncompressed_length); 34362306a36Sopenharmony_ci unsigned int dlen = p->oremain, tmplen; 34462306a36Sopenharmony_ci unsigned int adj_slen = slen; 34562306a36Sopenharmony_ci u8 *src = p->in, *dst = p->out; 34662306a36Sopenharmony_ci u16 padding = be16_to_cpu(g->padding); 34762306a36Sopenharmony_ci int ret, spadding = 0; 34862306a36Sopenharmony_ci ktime_t timeout; 34962306a36Sopenharmony_ci 35062306a36Sopenharmony_ci if (!slen || !required_len) 35162306a36Sopenharmony_ci return -EINVAL; 35262306a36Sopenharmony_ci 35362306a36Sopenharmony_ci if (p->iremain <= 0 || padding + slen > p->iremain) 35462306a36Sopenharmony_ci return -EOVERFLOW; 35562306a36Sopenharmony_ci 35662306a36Sopenharmony_ci if (p->oremain <= 0 || required_len - ignore > p->oremain) 35762306a36Sopenharmony_ci return -ENOSPC; 35862306a36Sopenharmony_ci 35962306a36Sopenharmony_ci src += padding; 36062306a36Sopenharmony_ci 36162306a36Sopenharmony_ci if (slen % c->multiple) 36262306a36Sopenharmony_ci adj_slen = round_up(slen, c->multiple); 36362306a36Sopenharmony_ci if (slen < c->minimum) 36462306a36Sopenharmony_ci adj_slen = c->minimum; 36562306a36Sopenharmony_ci if (slen > c->maximum) 36662306a36Sopenharmony_ci goto usesw; 36762306a36Sopenharmony_ci if (slen < adj_slen || (u64)src % c->alignment) { 36862306a36Sopenharmony_ci /* we can append padding bytes because the 842 format defines 36962306a36Sopenharmony_ci * an "end" template (see lib/842/842_decompress.c) and will 37062306a36Sopenharmony_ci * ignore any bytes following it. 37162306a36Sopenharmony_ci */ 37262306a36Sopenharmony_ci if (slen < adj_slen) 37362306a36Sopenharmony_ci memset(ctx->sbounce + slen, 0, adj_slen - slen); 37462306a36Sopenharmony_ci memcpy(ctx->sbounce, src, slen); 37562306a36Sopenharmony_ci src = ctx->sbounce; 37662306a36Sopenharmony_ci spadding = adj_slen - slen; 37762306a36Sopenharmony_ci slen = adj_slen; 37862306a36Sopenharmony_ci pr_debug("using decomp sbounce buffer, len %x\n", slen); 37962306a36Sopenharmony_ci } 38062306a36Sopenharmony_ci 38162306a36Sopenharmony_ci if (dlen % c->multiple) 38262306a36Sopenharmony_ci dlen = round_down(dlen, c->multiple); 38362306a36Sopenharmony_ci if (dlen < required_len || (u64)dst % c->alignment) { 38462306a36Sopenharmony_ci dst = ctx->dbounce; 38562306a36Sopenharmony_ci dlen = min(required_len, BOUNCE_BUFFER_SIZE); 38662306a36Sopenharmony_ci pr_debug("using decomp dbounce buffer, len %x\n", dlen); 38762306a36Sopenharmony_ci } 38862306a36Sopenharmony_ci if (dlen < c->minimum) 38962306a36Sopenharmony_ci goto usesw; 39062306a36Sopenharmony_ci if (dlen > c->maximum) 39162306a36Sopenharmony_ci dlen = c->maximum; 39262306a36Sopenharmony_ci 39362306a36Sopenharmony_ci tmplen = dlen; 39462306a36Sopenharmony_ci timeout = ktime_add_ms(ktime_get(), DECOMP_BUSY_TIMEOUT); 39562306a36Sopenharmony_ci do { 39662306a36Sopenharmony_ci dlen = tmplen; /* reset dlen, if we're retrying */ 39762306a36Sopenharmony_ci ret = ctx->driver->decompress(src, slen, dst, &dlen, ctx->wmem); 39862306a36Sopenharmony_ci } while (ret == -EBUSY && ktime_before(ktime_get(), timeout)); 39962306a36Sopenharmony_ci if (ret) { 40062306a36Sopenharmony_ciusesw: 40162306a36Sopenharmony_ci /* reset everything, sw doesn't have constraints */ 40262306a36Sopenharmony_ci src = p->in + padding; 40362306a36Sopenharmony_ci slen = be32_to_cpu(g->compressed_length); 40462306a36Sopenharmony_ci spadding = 0; 40562306a36Sopenharmony_ci dst = p->out; 40662306a36Sopenharmony_ci dlen = p->oremain; 40762306a36Sopenharmony_ci if (dlen < required_len) { /* have ignore bytes */ 40862306a36Sopenharmony_ci dst = ctx->dbounce; 40962306a36Sopenharmony_ci dlen = BOUNCE_BUFFER_SIZE; 41062306a36Sopenharmony_ci } 41162306a36Sopenharmony_ci pr_info_ratelimited("using software 842 decompression\n"); 41262306a36Sopenharmony_ci ret = sw842_decompress(src, slen, dst, &dlen); 41362306a36Sopenharmony_ci } 41462306a36Sopenharmony_ci if (ret) 41562306a36Sopenharmony_ci return ret; 41662306a36Sopenharmony_ci 41762306a36Sopenharmony_ci slen -= spadding; 41862306a36Sopenharmony_ci 41962306a36Sopenharmony_ci dlen -= ignore; 42062306a36Sopenharmony_ci if (ignore) 42162306a36Sopenharmony_ci pr_debug("ignoring last %x bytes\n", ignore); 42262306a36Sopenharmony_ci 42362306a36Sopenharmony_ci if (dst == ctx->dbounce) 42462306a36Sopenharmony_ci memcpy(p->out, dst, dlen); 42562306a36Sopenharmony_ci 42662306a36Sopenharmony_ci pr_debug("decompress slen %x padding %x dlen %x ignore %x\n", 42762306a36Sopenharmony_ci slen, padding, dlen, ignore); 42862306a36Sopenharmony_ci 42962306a36Sopenharmony_ci return update_param(p, slen + padding, dlen); 43062306a36Sopenharmony_ci} 43162306a36Sopenharmony_ci 43262306a36Sopenharmony_ciint nx842_crypto_decompress(struct crypto_tfm *tfm, 43362306a36Sopenharmony_ci const u8 *src, unsigned int slen, 43462306a36Sopenharmony_ci u8 *dst, unsigned int *dlen) 43562306a36Sopenharmony_ci{ 43662306a36Sopenharmony_ci struct nx842_crypto_ctx *ctx = crypto_tfm_ctx(tfm); 43762306a36Sopenharmony_ci struct nx842_crypto_header *hdr; 43862306a36Sopenharmony_ci struct nx842_crypto_param p; 43962306a36Sopenharmony_ci struct nx842_constraints c = *ctx->driver->constraints; 44062306a36Sopenharmony_ci int n, ret, hdr_len; 44162306a36Sopenharmony_ci u16 ignore = 0; 44262306a36Sopenharmony_ci 44362306a36Sopenharmony_ci check_constraints(&c); 44462306a36Sopenharmony_ci 44562306a36Sopenharmony_ci p.in = (u8 *)src; 44662306a36Sopenharmony_ci p.iremain = slen; 44762306a36Sopenharmony_ci p.out = dst; 44862306a36Sopenharmony_ci p.oremain = *dlen; 44962306a36Sopenharmony_ci p.ototal = 0; 45062306a36Sopenharmony_ci 45162306a36Sopenharmony_ci *dlen = 0; 45262306a36Sopenharmony_ci 45362306a36Sopenharmony_ci hdr = (struct nx842_crypto_header *)src; 45462306a36Sopenharmony_ci 45562306a36Sopenharmony_ci spin_lock_bh(&ctx->lock); 45662306a36Sopenharmony_ci 45762306a36Sopenharmony_ci /* If it doesn't start with our header magic number, assume it's a raw 45862306a36Sopenharmony_ci * 842 compressed buffer and pass it directly to the hardware driver 45962306a36Sopenharmony_ci */ 46062306a36Sopenharmony_ci if (be16_to_cpu(hdr->magic) != NX842_CRYPTO_MAGIC) { 46162306a36Sopenharmony_ci struct nx842_crypto_header_group g = { 46262306a36Sopenharmony_ci .padding = 0, 46362306a36Sopenharmony_ci .compressed_length = cpu_to_be32(p.iremain), 46462306a36Sopenharmony_ci .uncompressed_length = cpu_to_be32(p.oremain), 46562306a36Sopenharmony_ci }; 46662306a36Sopenharmony_ci 46762306a36Sopenharmony_ci ret = decompress(ctx, &p, &g, &c, 0); 46862306a36Sopenharmony_ci if (ret) 46962306a36Sopenharmony_ci goto unlock; 47062306a36Sopenharmony_ci 47162306a36Sopenharmony_ci goto success; 47262306a36Sopenharmony_ci } 47362306a36Sopenharmony_ci 47462306a36Sopenharmony_ci if (!hdr->groups) { 47562306a36Sopenharmony_ci pr_err("header has no groups\n"); 47662306a36Sopenharmony_ci ret = -EINVAL; 47762306a36Sopenharmony_ci goto unlock; 47862306a36Sopenharmony_ci } 47962306a36Sopenharmony_ci if (hdr->groups > NX842_CRYPTO_GROUP_MAX) { 48062306a36Sopenharmony_ci pr_err("header has too many groups %x, max %x\n", 48162306a36Sopenharmony_ci hdr->groups, NX842_CRYPTO_GROUP_MAX); 48262306a36Sopenharmony_ci ret = -EINVAL; 48362306a36Sopenharmony_ci goto unlock; 48462306a36Sopenharmony_ci } 48562306a36Sopenharmony_ci 48662306a36Sopenharmony_ci hdr_len = NX842_CRYPTO_HEADER_SIZE(hdr->groups); 48762306a36Sopenharmony_ci if (hdr_len > slen) { 48862306a36Sopenharmony_ci ret = -EOVERFLOW; 48962306a36Sopenharmony_ci goto unlock; 49062306a36Sopenharmony_ci } 49162306a36Sopenharmony_ci 49262306a36Sopenharmony_ci memcpy(&ctx->header, src, hdr_len); 49362306a36Sopenharmony_ci hdr = &ctx->header; 49462306a36Sopenharmony_ci 49562306a36Sopenharmony_ci for (n = 0; n < hdr->groups; n++) { 49662306a36Sopenharmony_ci /* ignore applies to last group */ 49762306a36Sopenharmony_ci if (n + 1 == hdr->groups) 49862306a36Sopenharmony_ci ignore = be16_to_cpu(hdr->ignore); 49962306a36Sopenharmony_ci 50062306a36Sopenharmony_ci ret = decompress(ctx, &p, &hdr->group[n], &c, ignore); 50162306a36Sopenharmony_ci if (ret) 50262306a36Sopenharmony_ci goto unlock; 50362306a36Sopenharmony_ci } 50462306a36Sopenharmony_ci 50562306a36Sopenharmony_cisuccess: 50662306a36Sopenharmony_ci *dlen = p.ototal; 50762306a36Sopenharmony_ci 50862306a36Sopenharmony_ci pr_debug("decompress total slen %x dlen %x\n", slen, *dlen); 50962306a36Sopenharmony_ci 51062306a36Sopenharmony_ci ret = 0; 51162306a36Sopenharmony_ci 51262306a36Sopenharmony_ciunlock: 51362306a36Sopenharmony_ci spin_unlock_bh(&ctx->lock); 51462306a36Sopenharmony_ci 51562306a36Sopenharmony_ci return ret; 51662306a36Sopenharmony_ci} 51762306a36Sopenharmony_ciEXPORT_SYMBOL_GPL(nx842_crypto_decompress); 51862306a36Sopenharmony_ci 51962306a36Sopenharmony_ciMODULE_LICENSE("GPL"); 52062306a36Sopenharmony_ciMODULE_DESCRIPTION("IBM PowerPC Nest (NX) 842 Hardware Compression Driver"); 52162306a36Sopenharmony_ciMODULE_AUTHOR("Dan Streetman <ddstreet@ieee.org>"); 522