162306a36Sopenharmony_ci// SPDX-License-Identifier: GPL-2.0-or-later
262306a36Sopenharmony_ci/*
362306a36Sopenharmony_ci * Cryptographic API for the NX-842 hardware compression.
462306a36Sopenharmony_ci *
562306a36Sopenharmony_ci * Copyright (C) IBM Corporation, 2011-2015
662306a36Sopenharmony_ci *
762306a36Sopenharmony_ci * Designer of the Power data compression engine:
862306a36Sopenharmony_ci *   Bulent Abali <abali@us.ibm.com>
962306a36Sopenharmony_ci *
1062306a36Sopenharmony_ci * Original Authors: Robert Jennings <rcj@linux.vnet.ibm.com>
1162306a36Sopenharmony_ci *                   Seth Jennings <sjenning@linux.vnet.ibm.com>
1262306a36Sopenharmony_ci *
1362306a36Sopenharmony_ci * Rewrite: Dan Streetman <ddstreet@ieee.org>
1462306a36Sopenharmony_ci *
1562306a36Sopenharmony_ci * This is an interface to the NX-842 compression hardware in PowerPC
 * processors.  Most of the complexity of this driver is due to the fact that
1762306a36Sopenharmony_ci * the NX-842 compression hardware requires the input and output data buffers
1862306a36Sopenharmony_ci * to be specifically aligned, to be a specific multiple in length, and within
1962306a36Sopenharmony_ci * specific minimum and maximum lengths.  Those restrictions, provided by the
2062306a36Sopenharmony_ci * nx-842 driver via nx842_constraints, mean this driver must use bounce
2162306a36Sopenharmony_ci * buffers and headers to correct misaligned in or out buffers, and to split
2262306a36Sopenharmony_ci * input buffers that are too large.
2362306a36Sopenharmony_ci *
2462306a36Sopenharmony_ci * This driver will fall back to software decompression if the hardware
2562306a36Sopenharmony_ci * decompression fails, so this driver's decompression should never fail as
2662306a36Sopenharmony_ci * long as the provided compressed buffer is valid.  Any compressed buffer
2762306a36Sopenharmony_ci * created by this driver will have a header (except ones where the input
2862306a36Sopenharmony_ci * perfectly matches the constraints); so users of this driver cannot simply
2962306a36Sopenharmony_ci * pass a compressed buffer created by this driver over to the 842 software
3062306a36Sopenharmony_ci * decompression library.  Instead, users must use this driver to decompress;
3162306a36Sopenharmony_ci * if the hardware fails or is unavailable, the compressed buffer will be
3262306a36Sopenharmony_ci * parsed and the header removed, and the raw 842 buffer(s) passed to the 842
3362306a36Sopenharmony_ci * software decompression library.
3462306a36Sopenharmony_ci *
3562306a36Sopenharmony_ci * This does not fall back to software compression, however, since the caller
3662306a36Sopenharmony_ci * of this function is specifically requesting hardware compression; if the
3762306a36Sopenharmony_ci * hardware compression fails, the caller can fall back to software
3862306a36Sopenharmony_ci * compression, and the raw 842 compressed buffer that the software compressor
3962306a36Sopenharmony_ci * creates can be passed to this driver for hardware decompression; any
4062306a36Sopenharmony_ci * buffer without our specific header magic is assumed to be a raw 842 buffer
4162306a36Sopenharmony_ci * and passed directly to the hardware.  Note that the software compression
4262306a36Sopenharmony_ci * library will produce a compressed buffer that is incompatible with the
4362306a36Sopenharmony_ci * hardware decompressor if the original input buffer length is not a multiple
4462306a36Sopenharmony_ci * of 8; if such a compressed buffer is passed to this driver for
4562306a36Sopenharmony_ci * decompression, the hardware will reject it and this driver will then pass
4662306a36Sopenharmony_ci * it over to the software library for decompression.
4762306a36Sopenharmony_ci */
4862306a36Sopenharmony_ci
4962306a36Sopenharmony_ci#define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
5062306a36Sopenharmony_ci
5162306a36Sopenharmony_ci#include <linux/vmalloc.h>
5262306a36Sopenharmony_ci#include <linux/sw842.h>
5362306a36Sopenharmony_ci#include <linux/spinlock.h>
5462306a36Sopenharmony_ci
5562306a36Sopenharmony_ci#include "nx-842.h"
5662306a36Sopenharmony_ci
/* The first 5 bits of this magic are 0x1f, which is an invalid 842 5-bit
 * template (see lib/842/842.h), so this magic number will never appear at
 * the start of a raw 842 compressed buffer.  That is important, as any buffer
 * passed to us without this magic is assumed to be a raw 842 compressed
 * buffer, and passed directly to the hardware to decompress.
 */
#define NX842_CRYPTO_MAGIC	(0xf842)
/* size, in bytes, of a header describing g groups */
#define NX842_CRYPTO_HEADER_SIZE(g)				\
	(sizeof(struct nx842_crypto_header) +			\
	 sizeof(struct nx842_crypto_header_group) * (g))
/* size, in bytes, of a header describing NX842_CRYPTO_GROUP_MAX groups */
#define NX842_CRYPTO_HEADER_MAX_SIZE				\
	NX842_CRYPTO_HEADER_SIZE(NX842_CRYPTO_GROUP_MAX)

/* bounce buffer size: each bounce buffer is a (1 << BOUNCE_BUFFER_ORDER)
 * page allocation, so the order used to allocate and to free must match.
 */
#define BOUNCE_BUFFER_ORDER	(2)
#define BOUNCE_BUFFER_SIZE					\
	((unsigned int)(PAGE_SIZE << BOUNCE_BUFFER_ORDER))

/* How long to keep retrying while the hardware reports -EBUSY.  Wait longer
 * when compressing: decompression falls back to the software library if the
 * hardware does not succeed, compression has no such fallback.
 */
#define COMP_BUSY_TIMEOUT	(250) /* ms */
#define DECOMP_BUSY_TIMEOUT	(50) /* ms */
7862306a36Sopenharmony_ci
/* Cursor over the caller's input and output buffers; advanced by
 * update_param() after each group is processed.
 */
struct nx842_crypto_param {
	u8 *in;			/* current position in the input buffer */
	unsigned int iremain;	/* input bytes not yet consumed */
	u8 *out;		/* current position in the output buffer */
	unsigned int oremain;	/* output bytes still available */
	unsigned int ototal;	/* output bytes accounted for so far */
};
8662306a36Sopenharmony_ci
8762306a36Sopenharmony_cistatic int update_param(struct nx842_crypto_param *p,
8862306a36Sopenharmony_ci			unsigned int slen, unsigned int dlen)
8962306a36Sopenharmony_ci{
9062306a36Sopenharmony_ci	if (p->iremain < slen)
9162306a36Sopenharmony_ci		return -EOVERFLOW;
9262306a36Sopenharmony_ci	if (p->oremain < dlen)
9362306a36Sopenharmony_ci		return -ENOSPC;
9462306a36Sopenharmony_ci
9562306a36Sopenharmony_ci	p->in += slen;
9662306a36Sopenharmony_ci	p->iremain -= slen;
9762306a36Sopenharmony_ci	p->out += dlen;
9862306a36Sopenharmony_ci	p->oremain -= dlen;
9962306a36Sopenharmony_ci	p->ototal += dlen;
10062306a36Sopenharmony_ci
10162306a36Sopenharmony_ci	return 0;
10262306a36Sopenharmony_ci}
10362306a36Sopenharmony_ci
10462306a36Sopenharmony_ciint nx842_crypto_init(struct crypto_tfm *tfm, struct nx842_driver *driver)
10562306a36Sopenharmony_ci{
10662306a36Sopenharmony_ci	struct nx842_crypto_ctx *ctx = crypto_tfm_ctx(tfm);
10762306a36Sopenharmony_ci
10862306a36Sopenharmony_ci	spin_lock_init(&ctx->lock);
10962306a36Sopenharmony_ci	ctx->driver = driver;
11062306a36Sopenharmony_ci	ctx->wmem = kmalloc(driver->workmem_size, GFP_KERNEL);
11162306a36Sopenharmony_ci	ctx->sbounce = (u8 *)__get_free_pages(GFP_KERNEL, BOUNCE_BUFFER_ORDER);
11262306a36Sopenharmony_ci	ctx->dbounce = (u8 *)__get_free_pages(GFP_KERNEL, BOUNCE_BUFFER_ORDER);
11362306a36Sopenharmony_ci	if (!ctx->wmem || !ctx->sbounce || !ctx->dbounce) {
11462306a36Sopenharmony_ci		kfree(ctx->wmem);
11562306a36Sopenharmony_ci		free_page((unsigned long)ctx->sbounce);
11662306a36Sopenharmony_ci		free_page((unsigned long)ctx->dbounce);
11762306a36Sopenharmony_ci		return -ENOMEM;
11862306a36Sopenharmony_ci	}
11962306a36Sopenharmony_ci
12062306a36Sopenharmony_ci	return 0;
12162306a36Sopenharmony_ci}
12262306a36Sopenharmony_ciEXPORT_SYMBOL_GPL(nx842_crypto_init);
12362306a36Sopenharmony_ci
12462306a36Sopenharmony_civoid nx842_crypto_exit(struct crypto_tfm *tfm)
12562306a36Sopenharmony_ci{
12662306a36Sopenharmony_ci	struct nx842_crypto_ctx *ctx = crypto_tfm_ctx(tfm);
12762306a36Sopenharmony_ci
12862306a36Sopenharmony_ci	kfree(ctx->wmem);
12962306a36Sopenharmony_ci	free_page((unsigned long)ctx->sbounce);
13062306a36Sopenharmony_ci	free_page((unsigned long)ctx->dbounce);
13162306a36Sopenharmony_ci}
13262306a36Sopenharmony_ciEXPORT_SYMBOL_GPL(nx842_crypto_exit);
13362306a36Sopenharmony_ci
13462306a36Sopenharmony_cistatic void check_constraints(struct nx842_constraints *c)
13562306a36Sopenharmony_ci{
13662306a36Sopenharmony_ci	/* limit maximum, to always have enough bounce buffer to decompress */
13762306a36Sopenharmony_ci	if (c->maximum > BOUNCE_BUFFER_SIZE)
13862306a36Sopenharmony_ci		c->maximum = BOUNCE_BUFFER_SIZE;
13962306a36Sopenharmony_ci}
14062306a36Sopenharmony_ci
14162306a36Sopenharmony_cistatic int nx842_crypto_add_header(struct nx842_crypto_header *hdr, u8 *buf)
14262306a36Sopenharmony_ci{
14362306a36Sopenharmony_ci	int s = NX842_CRYPTO_HEADER_SIZE(hdr->groups);
14462306a36Sopenharmony_ci
14562306a36Sopenharmony_ci	/* compress should have added space for header */
14662306a36Sopenharmony_ci	if (s > be16_to_cpu(hdr->group[0].padding)) {
14762306a36Sopenharmony_ci		pr_err("Internal error: no space for header\n");
14862306a36Sopenharmony_ci		return -EINVAL;
14962306a36Sopenharmony_ci	}
15062306a36Sopenharmony_ci
15162306a36Sopenharmony_ci	memcpy(buf, hdr, s);
15262306a36Sopenharmony_ci
15362306a36Sopenharmony_ci	print_hex_dump_debug("header ", DUMP_PREFIX_OFFSET, 16, 1, buf, s, 0);
15462306a36Sopenharmony_ci
15562306a36Sopenharmony_ci	return 0;
15662306a36Sopenharmony_ci}
15762306a36Sopenharmony_ci
15862306a36Sopenharmony_cistatic int compress(struct nx842_crypto_ctx *ctx,
15962306a36Sopenharmony_ci		    struct nx842_crypto_param *p,
16062306a36Sopenharmony_ci		    struct nx842_crypto_header_group *g,
16162306a36Sopenharmony_ci		    struct nx842_constraints *c,
16262306a36Sopenharmony_ci		    u16 *ignore,
16362306a36Sopenharmony_ci		    unsigned int hdrsize)
16462306a36Sopenharmony_ci{
16562306a36Sopenharmony_ci	unsigned int slen = p->iremain, dlen = p->oremain, tmplen;
16662306a36Sopenharmony_ci	unsigned int adj_slen = slen;
16762306a36Sopenharmony_ci	u8 *src = p->in, *dst = p->out;
16862306a36Sopenharmony_ci	int ret, dskip = 0;
16962306a36Sopenharmony_ci	ktime_t timeout;
17062306a36Sopenharmony_ci
17162306a36Sopenharmony_ci	if (p->iremain == 0)
17262306a36Sopenharmony_ci		return -EOVERFLOW;
17362306a36Sopenharmony_ci
17462306a36Sopenharmony_ci	if (p->oremain == 0 || hdrsize + c->minimum > dlen)
17562306a36Sopenharmony_ci		return -ENOSPC;
17662306a36Sopenharmony_ci
17762306a36Sopenharmony_ci	if (slen % c->multiple)
17862306a36Sopenharmony_ci		adj_slen = round_up(slen, c->multiple);
17962306a36Sopenharmony_ci	if (slen < c->minimum)
18062306a36Sopenharmony_ci		adj_slen = c->minimum;
18162306a36Sopenharmony_ci	if (slen > c->maximum)
18262306a36Sopenharmony_ci		adj_slen = slen = c->maximum;
18362306a36Sopenharmony_ci	if (adj_slen > slen || (u64)src % c->alignment) {
18462306a36Sopenharmony_ci		adj_slen = min(adj_slen, BOUNCE_BUFFER_SIZE);
18562306a36Sopenharmony_ci		slen = min(slen, BOUNCE_BUFFER_SIZE);
18662306a36Sopenharmony_ci		if (adj_slen > slen)
18762306a36Sopenharmony_ci			memset(ctx->sbounce + slen, 0, adj_slen - slen);
18862306a36Sopenharmony_ci		memcpy(ctx->sbounce, src, slen);
18962306a36Sopenharmony_ci		src = ctx->sbounce;
19062306a36Sopenharmony_ci		slen = adj_slen;
19162306a36Sopenharmony_ci		pr_debug("using comp sbounce buffer, len %x\n", slen);
19262306a36Sopenharmony_ci	}
19362306a36Sopenharmony_ci
19462306a36Sopenharmony_ci	dst += hdrsize;
19562306a36Sopenharmony_ci	dlen -= hdrsize;
19662306a36Sopenharmony_ci
19762306a36Sopenharmony_ci	if ((u64)dst % c->alignment) {
19862306a36Sopenharmony_ci		dskip = (int)(PTR_ALIGN(dst, c->alignment) - dst);
19962306a36Sopenharmony_ci		dst += dskip;
20062306a36Sopenharmony_ci		dlen -= dskip;
20162306a36Sopenharmony_ci	}
20262306a36Sopenharmony_ci	if (dlen % c->multiple)
20362306a36Sopenharmony_ci		dlen = round_down(dlen, c->multiple);
20462306a36Sopenharmony_ci	if (dlen < c->minimum) {
20562306a36Sopenharmony_cinospc:
20662306a36Sopenharmony_ci		dst = ctx->dbounce;
20762306a36Sopenharmony_ci		dlen = min(p->oremain, BOUNCE_BUFFER_SIZE);
20862306a36Sopenharmony_ci		dlen = round_down(dlen, c->multiple);
20962306a36Sopenharmony_ci		dskip = 0;
21062306a36Sopenharmony_ci		pr_debug("using comp dbounce buffer, len %x\n", dlen);
21162306a36Sopenharmony_ci	}
21262306a36Sopenharmony_ci	if (dlen > c->maximum)
21362306a36Sopenharmony_ci		dlen = c->maximum;
21462306a36Sopenharmony_ci
21562306a36Sopenharmony_ci	tmplen = dlen;
21662306a36Sopenharmony_ci	timeout = ktime_add_ms(ktime_get(), COMP_BUSY_TIMEOUT);
21762306a36Sopenharmony_ci	do {
21862306a36Sopenharmony_ci		dlen = tmplen; /* reset dlen, if we're retrying */
21962306a36Sopenharmony_ci		ret = ctx->driver->compress(src, slen, dst, &dlen, ctx->wmem);
22062306a36Sopenharmony_ci		/* possibly we should reduce the slen here, instead of
22162306a36Sopenharmony_ci		 * retrying with the dbounce buffer?
22262306a36Sopenharmony_ci		 */
22362306a36Sopenharmony_ci		if (ret == -ENOSPC && dst != ctx->dbounce)
22462306a36Sopenharmony_ci			goto nospc;
22562306a36Sopenharmony_ci	} while (ret == -EBUSY && ktime_before(ktime_get(), timeout));
22662306a36Sopenharmony_ci	if (ret)
22762306a36Sopenharmony_ci		return ret;
22862306a36Sopenharmony_ci
22962306a36Sopenharmony_ci	dskip += hdrsize;
23062306a36Sopenharmony_ci
23162306a36Sopenharmony_ci	if (dst == ctx->dbounce)
23262306a36Sopenharmony_ci		memcpy(p->out + dskip, dst, dlen);
23362306a36Sopenharmony_ci
23462306a36Sopenharmony_ci	g->padding = cpu_to_be16(dskip);
23562306a36Sopenharmony_ci	g->compressed_length = cpu_to_be32(dlen);
23662306a36Sopenharmony_ci	g->uncompressed_length = cpu_to_be32(slen);
23762306a36Sopenharmony_ci
23862306a36Sopenharmony_ci	if (p->iremain < slen) {
23962306a36Sopenharmony_ci		*ignore = slen - p->iremain;
24062306a36Sopenharmony_ci		slen = p->iremain;
24162306a36Sopenharmony_ci	}
24262306a36Sopenharmony_ci
24362306a36Sopenharmony_ci	pr_debug("compress slen %x ignore %x dlen %x padding %x\n",
24462306a36Sopenharmony_ci		 slen, *ignore, dlen, dskip);
24562306a36Sopenharmony_ci
24662306a36Sopenharmony_ci	return update_param(p, slen, dskip + dlen);
24762306a36Sopenharmony_ci}
24862306a36Sopenharmony_ci
24962306a36Sopenharmony_ciint nx842_crypto_compress(struct crypto_tfm *tfm,
25062306a36Sopenharmony_ci			  const u8 *src, unsigned int slen,
25162306a36Sopenharmony_ci			  u8 *dst, unsigned int *dlen)
25262306a36Sopenharmony_ci{
25362306a36Sopenharmony_ci	struct nx842_crypto_ctx *ctx = crypto_tfm_ctx(tfm);
25462306a36Sopenharmony_ci	struct nx842_crypto_header *hdr = &ctx->header;
25562306a36Sopenharmony_ci	struct nx842_crypto_param p;
25662306a36Sopenharmony_ci	struct nx842_constraints c = *ctx->driver->constraints;
25762306a36Sopenharmony_ci	unsigned int groups, hdrsize, h;
25862306a36Sopenharmony_ci	int ret, n;
25962306a36Sopenharmony_ci	bool add_header;
26062306a36Sopenharmony_ci	u16 ignore = 0;
26162306a36Sopenharmony_ci
26262306a36Sopenharmony_ci	check_constraints(&c);
26362306a36Sopenharmony_ci
26462306a36Sopenharmony_ci	p.in = (u8 *)src;
26562306a36Sopenharmony_ci	p.iremain = slen;
26662306a36Sopenharmony_ci	p.out = dst;
26762306a36Sopenharmony_ci	p.oremain = *dlen;
26862306a36Sopenharmony_ci	p.ototal = 0;
26962306a36Sopenharmony_ci
27062306a36Sopenharmony_ci	*dlen = 0;
27162306a36Sopenharmony_ci
27262306a36Sopenharmony_ci	groups = min_t(unsigned int, NX842_CRYPTO_GROUP_MAX,
27362306a36Sopenharmony_ci		       DIV_ROUND_UP(p.iremain, c.maximum));
27462306a36Sopenharmony_ci	hdrsize = NX842_CRYPTO_HEADER_SIZE(groups);
27562306a36Sopenharmony_ci
27662306a36Sopenharmony_ci	spin_lock_bh(&ctx->lock);
27762306a36Sopenharmony_ci
27862306a36Sopenharmony_ci	/* skip adding header if the buffers meet all constraints */
27962306a36Sopenharmony_ci	add_header = (p.iremain % c.multiple	||
28062306a36Sopenharmony_ci		      p.iremain < c.minimum	||
28162306a36Sopenharmony_ci		      p.iremain > c.maximum	||
28262306a36Sopenharmony_ci		      (u64)p.in % c.alignment	||
28362306a36Sopenharmony_ci		      p.oremain % c.multiple	||
28462306a36Sopenharmony_ci		      p.oremain < c.minimum	||
28562306a36Sopenharmony_ci		      p.oremain > c.maximum	||
28662306a36Sopenharmony_ci		      (u64)p.out % c.alignment);
28762306a36Sopenharmony_ci
28862306a36Sopenharmony_ci	hdr->magic = cpu_to_be16(NX842_CRYPTO_MAGIC);
28962306a36Sopenharmony_ci	hdr->groups = 0;
29062306a36Sopenharmony_ci	hdr->ignore = 0;
29162306a36Sopenharmony_ci
29262306a36Sopenharmony_ci	while (p.iremain > 0) {
29362306a36Sopenharmony_ci		n = hdr->groups++;
29462306a36Sopenharmony_ci		ret = -ENOSPC;
29562306a36Sopenharmony_ci		if (hdr->groups > NX842_CRYPTO_GROUP_MAX)
29662306a36Sopenharmony_ci			goto unlock;
29762306a36Sopenharmony_ci
29862306a36Sopenharmony_ci		/* header goes before first group */
29962306a36Sopenharmony_ci		h = !n && add_header ? hdrsize : 0;
30062306a36Sopenharmony_ci
30162306a36Sopenharmony_ci		if (ignore)
30262306a36Sopenharmony_ci			pr_warn("internal error, ignore is set %x\n", ignore);
30362306a36Sopenharmony_ci
30462306a36Sopenharmony_ci		ret = compress(ctx, &p, &hdr->group[n], &c, &ignore, h);
30562306a36Sopenharmony_ci		if (ret)
30662306a36Sopenharmony_ci			goto unlock;
30762306a36Sopenharmony_ci	}
30862306a36Sopenharmony_ci
30962306a36Sopenharmony_ci	if (!add_header && hdr->groups > 1) {
31062306a36Sopenharmony_ci		pr_err("Internal error: No header but multiple groups\n");
31162306a36Sopenharmony_ci		ret = -EINVAL;
31262306a36Sopenharmony_ci		goto unlock;
31362306a36Sopenharmony_ci	}
31462306a36Sopenharmony_ci
31562306a36Sopenharmony_ci	/* ignore indicates the input stream needed to be padded */
31662306a36Sopenharmony_ci	hdr->ignore = cpu_to_be16(ignore);
31762306a36Sopenharmony_ci	if (ignore)
31862306a36Sopenharmony_ci		pr_debug("marked %d bytes as ignore\n", ignore);
31962306a36Sopenharmony_ci
32062306a36Sopenharmony_ci	if (add_header)
32162306a36Sopenharmony_ci		ret = nx842_crypto_add_header(hdr, dst);
32262306a36Sopenharmony_ci	if (ret)
32362306a36Sopenharmony_ci		goto unlock;
32462306a36Sopenharmony_ci
32562306a36Sopenharmony_ci	*dlen = p.ototal;
32662306a36Sopenharmony_ci
32762306a36Sopenharmony_ci	pr_debug("compress total slen %x dlen %x\n", slen, *dlen);
32862306a36Sopenharmony_ci
32962306a36Sopenharmony_ciunlock:
33062306a36Sopenharmony_ci	spin_unlock_bh(&ctx->lock);
33162306a36Sopenharmony_ci	return ret;
33262306a36Sopenharmony_ci}
33362306a36Sopenharmony_ciEXPORT_SYMBOL_GPL(nx842_crypto_compress);
33462306a36Sopenharmony_ci
33562306a36Sopenharmony_cistatic int decompress(struct nx842_crypto_ctx *ctx,
33662306a36Sopenharmony_ci		      struct nx842_crypto_param *p,
33762306a36Sopenharmony_ci		      struct nx842_crypto_header_group *g,
33862306a36Sopenharmony_ci		      struct nx842_constraints *c,
33962306a36Sopenharmony_ci		      u16 ignore)
34062306a36Sopenharmony_ci{
34162306a36Sopenharmony_ci	unsigned int slen = be32_to_cpu(g->compressed_length);
34262306a36Sopenharmony_ci	unsigned int required_len = be32_to_cpu(g->uncompressed_length);
34362306a36Sopenharmony_ci	unsigned int dlen = p->oremain, tmplen;
34462306a36Sopenharmony_ci	unsigned int adj_slen = slen;
34562306a36Sopenharmony_ci	u8 *src = p->in, *dst = p->out;
34662306a36Sopenharmony_ci	u16 padding = be16_to_cpu(g->padding);
34762306a36Sopenharmony_ci	int ret, spadding = 0;
34862306a36Sopenharmony_ci	ktime_t timeout;
34962306a36Sopenharmony_ci
35062306a36Sopenharmony_ci	if (!slen || !required_len)
35162306a36Sopenharmony_ci		return -EINVAL;
35262306a36Sopenharmony_ci
35362306a36Sopenharmony_ci	if (p->iremain <= 0 || padding + slen > p->iremain)
35462306a36Sopenharmony_ci		return -EOVERFLOW;
35562306a36Sopenharmony_ci
35662306a36Sopenharmony_ci	if (p->oremain <= 0 || required_len - ignore > p->oremain)
35762306a36Sopenharmony_ci		return -ENOSPC;
35862306a36Sopenharmony_ci
35962306a36Sopenharmony_ci	src += padding;
36062306a36Sopenharmony_ci
36162306a36Sopenharmony_ci	if (slen % c->multiple)
36262306a36Sopenharmony_ci		adj_slen = round_up(slen, c->multiple);
36362306a36Sopenharmony_ci	if (slen < c->minimum)
36462306a36Sopenharmony_ci		adj_slen = c->minimum;
36562306a36Sopenharmony_ci	if (slen > c->maximum)
36662306a36Sopenharmony_ci		goto usesw;
36762306a36Sopenharmony_ci	if (slen < adj_slen || (u64)src % c->alignment) {
36862306a36Sopenharmony_ci		/* we can append padding bytes because the 842 format defines
36962306a36Sopenharmony_ci		 * an "end" template (see lib/842/842_decompress.c) and will
37062306a36Sopenharmony_ci		 * ignore any bytes following it.
37162306a36Sopenharmony_ci		 */
37262306a36Sopenharmony_ci		if (slen < adj_slen)
37362306a36Sopenharmony_ci			memset(ctx->sbounce + slen, 0, adj_slen - slen);
37462306a36Sopenharmony_ci		memcpy(ctx->sbounce, src, slen);
37562306a36Sopenharmony_ci		src = ctx->sbounce;
37662306a36Sopenharmony_ci		spadding = adj_slen - slen;
37762306a36Sopenharmony_ci		slen = adj_slen;
37862306a36Sopenharmony_ci		pr_debug("using decomp sbounce buffer, len %x\n", slen);
37962306a36Sopenharmony_ci	}
38062306a36Sopenharmony_ci
38162306a36Sopenharmony_ci	if (dlen % c->multiple)
38262306a36Sopenharmony_ci		dlen = round_down(dlen, c->multiple);
38362306a36Sopenharmony_ci	if (dlen < required_len || (u64)dst % c->alignment) {
38462306a36Sopenharmony_ci		dst = ctx->dbounce;
38562306a36Sopenharmony_ci		dlen = min(required_len, BOUNCE_BUFFER_SIZE);
38662306a36Sopenharmony_ci		pr_debug("using decomp dbounce buffer, len %x\n", dlen);
38762306a36Sopenharmony_ci	}
38862306a36Sopenharmony_ci	if (dlen < c->minimum)
38962306a36Sopenharmony_ci		goto usesw;
39062306a36Sopenharmony_ci	if (dlen > c->maximum)
39162306a36Sopenharmony_ci		dlen = c->maximum;
39262306a36Sopenharmony_ci
39362306a36Sopenharmony_ci	tmplen = dlen;
39462306a36Sopenharmony_ci	timeout = ktime_add_ms(ktime_get(), DECOMP_BUSY_TIMEOUT);
39562306a36Sopenharmony_ci	do {
39662306a36Sopenharmony_ci		dlen = tmplen; /* reset dlen, if we're retrying */
39762306a36Sopenharmony_ci		ret = ctx->driver->decompress(src, slen, dst, &dlen, ctx->wmem);
39862306a36Sopenharmony_ci	} while (ret == -EBUSY && ktime_before(ktime_get(), timeout));
39962306a36Sopenharmony_ci	if (ret) {
40062306a36Sopenharmony_ciusesw:
40162306a36Sopenharmony_ci		/* reset everything, sw doesn't have constraints */
40262306a36Sopenharmony_ci		src = p->in + padding;
40362306a36Sopenharmony_ci		slen = be32_to_cpu(g->compressed_length);
40462306a36Sopenharmony_ci		spadding = 0;
40562306a36Sopenharmony_ci		dst = p->out;
40662306a36Sopenharmony_ci		dlen = p->oremain;
40762306a36Sopenharmony_ci		if (dlen < required_len) { /* have ignore bytes */
40862306a36Sopenharmony_ci			dst = ctx->dbounce;
40962306a36Sopenharmony_ci			dlen = BOUNCE_BUFFER_SIZE;
41062306a36Sopenharmony_ci		}
41162306a36Sopenharmony_ci		pr_info_ratelimited("using software 842 decompression\n");
41262306a36Sopenharmony_ci		ret = sw842_decompress(src, slen, dst, &dlen);
41362306a36Sopenharmony_ci	}
41462306a36Sopenharmony_ci	if (ret)
41562306a36Sopenharmony_ci		return ret;
41662306a36Sopenharmony_ci
41762306a36Sopenharmony_ci	slen -= spadding;
41862306a36Sopenharmony_ci
41962306a36Sopenharmony_ci	dlen -= ignore;
42062306a36Sopenharmony_ci	if (ignore)
42162306a36Sopenharmony_ci		pr_debug("ignoring last %x bytes\n", ignore);
42262306a36Sopenharmony_ci
42362306a36Sopenharmony_ci	if (dst == ctx->dbounce)
42462306a36Sopenharmony_ci		memcpy(p->out, dst, dlen);
42562306a36Sopenharmony_ci
42662306a36Sopenharmony_ci	pr_debug("decompress slen %x padding %x dlen %x ignore %x\n",
42762306a36Sopenharmony_ci		 slen, padding, dlen, ignore);
42862306a36Sopenharmony_ci
42962306a36Sopenharmony_ci	return update_param(p, slen + padding, dlen);
43062306a36Sopenharmony_ci}
43162306a36Sopenharmony_ci
43262306a36Sopenharmony_ciint nx842_crypto_decompress(struct crypto_tfm *tfm,
43362306a36Sopenharmony_ci			    const u8 *src, unsigned int slen,
43462306a36Sopenharmony_ci			    u8 *dst, unsigned int *dlen)
43562306a36Sopenharmony_ci{
43662306a36Sopenharmony_ci	struct nx842_crypto_ctx *ctx = crypto_tfm_ctx(tfm);
43762306a36Sopenharmony_ci	struct nx842_crypto_header *hdr;
43862306a36Sopenharmony_ci	struct nx842_crypto_param p;
43962306a36Sopenharmony_ci	struct nx842_constraints c = *ctx->driver->constraints;
44062306a36Sopenharmony_ci	int n, ret, hdr_len;
44162306a36Sopenharmony_ci	u16 ignore = 0;
44262306a36Sopenharmony_ci
44362306a36Sopenharmony_ci	check_constraints(&c);
44462306a36Sopenharmony_ci
44562306a36Sopenharmony_ci	p.in = (u8 *)src;
44662306a36Sopenharmony_ci	p.iremain = slen;
44762306a36Sopenharmony_ci	p.out = dst;
44862306a36Sopenharmony_ci	p.oremain = *dlen;
44962306a36Sopenharmony_ci	p.ototal = 0;
45062306a36Sopenharmony_ci
45162306a36Sopenharmony_ci	*dlen = 0;
45262306a36Sopenharmony_ci
45362306a36Sopenharmony_ci	hdr = (struct nx842_crypto_header *)src;
45462306a36Sopenharmony_ci
45562306a36Sopenharmony_ci	spin_lock_bh(&ctx->lock);
45662306a36Sopenharmony_ci
45762306a36Sopenharmony_ci	/* If it doesn't start with our header magic number, assume it's a raw
45862306a36Sopenharmony_ci	 * 842 compressed buffer and pass it directly to the hardware driver
45962306a36Sopenharmony_ci	 */
46062306a36Sopenharmony_ci	if (be16_to_cpu(hdr->magic) != NX842_CRYPTO_MAGIC) {
46162306a36Sopenharmony_ci		struct nx842_crypto_header_group g = {
46262306a36Sopenharmony_ci			.padding =		0,
46362306a36Sopenharmony_ci			.compressed_length =	cpu_to_be32(p.iremain),
46462306a36Sopenharmony_ci			.uncompressed_length =	cpu_to_be32(p.oremain),
46562306a36Sopenharmony_ci		};
46662306a36Sopenharmony_ci
46762306a36Sopenharmony_ci		ret = decompress(ctx, &p, &g, &c, 0);
46862306a36Sopenharmony_ci		if (ret)
46962306a36Sopenharmony_ci			goto unlock;
47062306a36Sopenharmony_ci
47162306a36Sopenharmony_ci		goto success;
47262306a36Sopenharmony_ci	}
47362306a36Sopenharmony_ci
47462306a36Sopenharmony_ci	if (!hdr->groups) {
47562306a36Sopenharmony_ci		pr_err("header has no groups\n");
47662306a36Sopenharmony_ci		ret = -EINVAL;
47762306a36Sopenharmony_ci		goto unlock;
47862306a36Sopenharmony_ci	}
47962306a36Sopenharmony_ci	if (hdr->groups > NX842_CRYPTO_GROUP_MAX) {
48062306a36Sopenharmony_ci		pr_err("header has too many groups %x, max %x\n",
48162306a36Sopenharmony_ci		       hdr->groups, NX842_CRYPTO_GROUP_MAX);
48262306a36Sopenharmony_ci		ret = -EINVAL;
48362306a36Sopenharmony_ci		goto unlock;
48462306a36Sopenharmony_ci	}
48562306a36Sopenharmony_ci
48662306a36Sopenharmony_ci	hdr_len = NX842_CRYPTO_HEADER_SIZE(hdr->groups);
48762306a36Sopenharmony_ci	if (hdr_len > slen) {
48862306a36Sopenharmony_ci		ret = -EOVERFLOW;
48962306a36Sopenharmony_ci		goto unlock;
49062306a36Sopenharmony_ci	}
49162306a36Sopenharmony_ci
49262306a36Sopenharmony_ci	memcpy(&ctx->header, src, hdr_len);
49362306a36Sopenharmony_ci	hdr = &ctx->header;
49462306a36Sopenharmony_ci
49562306a36Sopenharmony_ci	for (n = 0; n < hdr->groups; n++) {
49662306a36Sopenharmony_ci		/* ignore applies to last group */
49762306a36Sopenharmony_ci		if (n + 1 == hdr->groups)
49862306a36Sopenharmony_ci			ignore = be16_to_cpu(hdr->ignore);
49962306a36Sopenharmony_ci
50062306a36Sopenharmony_ci		ret = decompress(ctx, &p, &hdr->group[n], &c, ignore);
50162306a36Sopenharmony_ci		if (ret)
50262306a36Sopenharmony_ci			goto unlock;
50362306a36Sopenharmony_ci	}
50462306a36Sopenharmony_ci
50562306a36Sopenharmony_cisuccess:
50662306a36Sopenharmony_ci	*dlen = p.ototal;
50762306a36Sopenharmony_ci
50862306a36Sopenharmony_ci	pr_debug("decompress total slen %x dlen %x\n", slen, *dlen);
50962306a36Sopenharmony_ci
51062306a36Sopenharmony_ci	ret = 0;
51162306a36Sopenharmony_ci
51262306a36Sopenharmony_ciunlock:
51362306a36Sopenharmony_ci	spin_unlock_bh(&ctx->lock);
51462306a36Sopenharmony_ci
51562306a36Sopenharmony_ci	return ret;
51662306a36Sopenharmony_ci}
51762306a36Sopenharmony_ciEXPORT_SYMBOL_GPL(nx842_crypto_decompress);
51862306a36Sopenharmony_ci
51962306a36Sopenharmony_ciMODULE_LICENSE("GPL");
52062306a36Sopenharmony_ciMODULE_DESCRIPTION("IBM PowerPC Nest (NX) 842 Hardware Compression Driver");
52162306a36Sopenharmony_ciMODULE_AUTHOR("Dan Streetman <ddstreet@ieee.org>");
522