162306a36Sopenharmony_ci// SPDX-License-Identifier: GPL-2.0-only
262306a36Sopenharmony_ci/*
362306a36Sopenharmony_ci * Scaler library
462306a36Sopenharmony_ci *
562306a36Sopenharmony_ci * Copyright (c) 2013 Texas Instruments Inc.
662306a36Sopenharmony_ci *
762306a36Sopenharmony_ci * David Griego, <dagriego@biglakesoftware.com>
862306a36Sopenharmony_ci * Dale Farnsworth, <dale@farnsworth.org>
962306a36Sopenharmony_ci * Archit Taneja, <archit@ti.com>
1062306a36Sopenharmony_ci */
1162306a36Sopenharmony_ci
1262306a36Sopenharmony_ci#include <linux/err.h>
1362306a36Sopenharmony_ci#include <linux/io.h>
1462306a36Sopenharmony_ci#include <linux/module.h>
1562306a36Sopenharmony_ci#include <linux/platform_device.h>
1662306a36Sopenharmony_ci#include <linux/slab.h>
1762306a36Sopenharmony_ci
1862306a36Sopenharmony_ci#include "sc.h"
1962306a36Sopenharmony_ci#include "sc_coeff.h"
2062306a36Sopenharmony_ci
2162306a36Sopenharmony_civoid sc_dump_regs(struct sc_data *sc)
2262306a36Sopenharmony_ci{
2362306a36Sopenharmony_ci	struct device *dev = &sc->pdev->dev;
2462306a36Sopenharmony_ci
2562306a36Sopenharmony_ci#define DUMPREG(r) dev_dbg(dev, "%-35s %08x\n", #r, \
2662306a36Sopenharmony_ci	ioread32(sc->base + CFG_##r))
2762306a36Sopenharmony_ci
2862306a36Sopenharmony_ci	dev_dbg(dev, "SC Registers @ %pa:\n", &sc->res->start);
2962306a36Sopenharmony_ci
3062306a36Sopenharmony_ci	DUMPREG(SC0);
3162306a36Sopenharmony_ci	DUMPREG(SC1);
3262306a36Sopenharmony_ci	DUMPREG(SC2);
3362306a36Sopenharmony_ci	DUMPREG(SC3);
3462306a36Sopenharmony_ci	DUMPREG(SC4);
3562306a36Sopenharmony_ci	DUMPREG(SC5);
3662306a36Sopenharmony_ci	DUMPREG(SC6);
3762306a36Sopenharmony_ci	DUMPREG(SC8);
3862306a36Sopenharmony_ci	DUMPREG(SC9);
3962306a36Sopenharmony_ci	DUMPREG(SC10);
4062306a36Sopenharmony_ci	DUMPREG(SC11);
4162306a36Sopenharmony_ci	DUMPREG(SC12);
4262306a36Sopenharmony_ci	DUMPREG(SC13);
4362306a36Sopenharmony_ci	DUMPREG(SC17);
4462306a36Sopenharmony_ci	DUMPREG(SC18);
4562306a36Sopenharmony_ci	DUMPREG(SC19);
4662306a36Sopenharmony_ci	DUMPREG(SC20);
4762306a36Sopenharmony_ci	DUMPREG(SC21);
4862306a36Sopenharmony_ci	DUMPREG(SC22);
4962306a36Sopenharmony_ci	DUMPREG(SC23);
5062306a36Sopenharmony_ci	DUMPREG(SC24);
5162306a36Sopenharmony_ci	DUMPREG(SC25);
5262306a36Sopenharmony_ci
5362306a36Sopenharmony_ci#undef DUMPREG
5462306a36Sopenharmony_ci}
5562306a36Sopenharmony_ciEXPORT_SYMBOL(sc_dump_regs);
5662306a36Sopenharmony_ci
5762306a36Sopenharmony_ci/*
5862306a36Sopenharmony_ci * set the horizontal scaler coefficients according to the ratio of output to
5962306a36Sopenharmony_ci * input widths, after accounting for up to two levels of decimation
6062306a36Sopenharmony_ci */
6162306a36Sopenharmony_civoid sc_set_hs_coeffs(struct sc_data *sc, void *addr, unsigned int src_w,
6262306a36Sopenharmony_ci		unsigned int dst_w)
6362306a36Sopenharmony_ci{
6462306a36Sopenharmony_ci	int sixteenths;
6562306a36Sopenharmony_ci	int idx;
6662306a36Sopenharmony_ci	int i, j;
6762306a36Sopenharmony_ci	u16 *coeff_h = addr;
6862306a36Sopenharmony_ci	const u16 *cp;
6962306a36Sopenharmony_ci
7062306a36Sopenharmony_ci	if (dst_w > src_w) {
7162306a36Sopenharmony_ci		idx = HS_UP_SCALE;
7262306a36Sopenharmony_ci	} else {
7362306a36Sopenharmony_ci		if ((dst_w << 1) < src_w)
7462306a36Sopenharmony_ci			dst_w <<= 1;	/* first level decimation */
7562306a36Sopenharmony_ci		if ((dst_w << 1) < src_w)
7662306a36Sopenharmony_ci			dst_w <<= 1;	/* second level decimation */
7762306a36Sopenharmony_ci
7862306a36Sopenharmony_ci		if (dst_w == src_w) {
7962306a36Sopenharmony_ci			idx = HS_LE_16_16_SCALE;
8062306a36Sopenharmony_ci		} else {
8162306a36Sopenharmony_ci			sixteenths = (dst_w << 4) / src_w;
8262306a36Sopenharmony_ci			if (sixteenths < 8)
8362306a36Sopenharmony_ci				sixteenths = 8;
8462306a36Sopenharmony_ci			idx = HS_LT_9_16_SCALE + sixteenths - 8;
8562306a36Sopenharmony_ci		}
8662306a36Sopenharmony_ci	}
8762306a36Sopenharmony_ci
8862306a36Sopenharmony_ci	cp = scaler_hs_coeffs[idx];
8962306a36Sopenharmony_ci
9062306a36Sopenharmony_ci	for (i = 0; i < SC_NUM_PHASES * 2; i++) {
9162306a36Sopenharmony_ci		for (j = 0; j < SC_H_NUM_TAPS; j++)
9262306a36Sopenharmony_ci			*coeff_h++ = *cp++;
9362306a36Sopenharmony_ci		/*
9462306a36Sopenharmony_ci		 * for each phase, the scaler expects space for 8 coefficients
9562306a36Sopenharmony_ci		 * in it's memory. For the horizontal scaler, we copy the first
9662306a36Sopenharmony_ci		 * 7 coefficients and skip the last slot to move to the next
9762306a36Sopenharmony_ci		 * row to hold coefficients for the next phase
9862306a36Sopenharmony_ci		 */
9962306a36Sopenharmony_ci		coeff_h += SC_NUM_TAPS_MEM_ALIGN - SC_H_NUM_TAPS;
10062306a36Sopenharmony_ci	}
10162306a36Sopenharmony_ci
10262306a36Sopenharmony_ci	sc->load_coeff_h = true;
10362306a36Sopenharmony_ci}
10462306a36Sopenharmony_ciEXPORT_SYMBOL(sc_set_hs_coeffs);
10562306a36Sopenharmony_ci
10662306a36Sopenharmony_ci/*
10762306a36Sopenharmony_ci * set the vertical scaler coefficients according to the ratio of output to
10862306a36Sopenharmony_ci * input heights
10962306a36Sopenharmony_ci */
11062306a36Sopenharmony_civoid sc_set_vs_coeffs(struct sc_data *sc, void *addr, unsigned int src_h,
11162306a36Sopenharmony_ci		unsigned int dst_h)
11262306a36Sopenharmony_ci{
11362306a36Sopenharmony_ci	int sixteenths;
11462306a36Sopenharmony_ci	int idx;
11562306a36Sopenharmony_ci	int i, j;
11662306a36Sopenharmony_ci	u16 *coeff_v = addr;
11762306a36Sopenharmony_ci	const u16 *cp;
11862306a36Sopenharmony_ci
11962306a36Sopenharmony_ci	if (dst_h > src_h) {
12062306a36Sopenharmony_ci		idx = VS_UP_SCALE;
12162306a36Sopenharmony_ci	} else if (dst_h == src_h) {
12262306a36Sopenharmony_ci		idx = VS_1_TO_1_SCALE;
12362306a36Sopenharmony_ci	} else {
12462306a36Sopenharmony_ci		sixteenths = (dst_h << 4) / src_h;
12562306a36Sopenharmony_ci		if (sixteenths < 8)
12662306a36Sopenharmony_ci			sixteenths = 8;
12762306a36Sopenharmony_ci		idx = VS_LT_9_16_SCALE + sixteenths - 8;
12862306a36Sopenharmony_ci	}
12962306a36Sopenharmony_ci
13062306a36Sopenharmony_ci	cp = scaler_vs_coeffs[idx];
13162306a36Sopenharmony_ci
13262306a36Sopenharmony_ci	for (i = 0; i < SC_NUM_PHASES * 2; i++) {
13362306a36Sopenharmony_ci		for (j = 0; j < SC_V_NUM_TAPS; j++)
13462306a36Sopenharmony_ci			*coeff_v++ = *cp++;
13562306a36Sopenharmony_ci		/*
13662306a36Sopenharmony_ci		 * for the vertical scaler, we copy the first 5 coefficients and
13762306a36Sopenharmony_ci		 * skip the last 3 slots to move to the next row to hold
13862306a36Sopenharmony_ci		 * coefficients for the next phase
13962306a36Sopenharmony_ci		 */
14062306a36Sopenharmony_ci		coeff_v += SC_NUM_TAPS_MEM_ALIGN - SC_V_NUM_TAPS;
14162306a36Sopenharmony_ci	}
14262306a36Sopenharmony_ci
14362306a36Sopenharmony_ci	sc->load_coeff_v = true;
14462306a36Sopenharmony_ci}
14562306a36Sopenharmony_ciEXPORT_SYMBOL(sc_set_vs_coeffs);
14662306a36Sopenharmony_ci
14762306a36Sopenharmony_civoid sc_config_scaler(struct sc_data *sc, u32 *sc_reg0, u32 *sc_reg8,
14862306a36Sopenharmony_ci		u32 *sc_reg17, unsigned int src_w, unsigned int src_h,
14962306a36Sopenharmony_ci		unsigned int dst_w, unsigned int dst_h)
15062306a36Sopenharmony_ci{
15162306a36Sopenharmony_ci	struct device *dev = &sc->pdev->dev;
15262306a36Sopenharmony_ci	u32 val;
15362306a36Sopenharmony_ci	int dcm_x, dcm_shift;
15462306a36Sopenharmony_ci	bool use_rav;
15562306a36Sopenharmony_ci	unsigned long lltmp;
15662306a36Sopenharmony_ci	u32 lin_acc_inc, lin_acc_inc_u;
15762306a36Sopenharmony_ci	u32 col_acc_offset;
15862306a36Sopenharmony_ci	u16 factor = 0;
15962306a36Sopenharmony_ci	int row_acc_init_rav = 0, row_acc_init_rav_b = 0;
16062306a36Sopenharmony_ci	u32 row_acc_inc = 0, row_acc_offset = 0, row_acc_offset_b = 0;
16162306a36Sopenharmony_ci	/*
16262306a36Sopenharmony_ci	 * location of SC register in payload memory with respect to the first
16362306a36Sopenharmony_ci	 * register in the mmr address data block
16462306a36Sopenharmony_ci	 */
16562306a36Sopenharmony_ci	u32 *sc_reg9 = sc_reg8 + 1;
16662306a36Sopenharmony_ci	u32 *sc_reg12 = sc_reg8 + 4;
16762306a36Sopenharmony_ci	u32 *sc_reg13 = sc_reg8 + 5;
16862306a36Sopenharmony_ci	u32 *sc_reg24 = sc_reg17 + 7;
16962306a36Sopenharmony_ci
17062306a36Sopenharmony_ci	val = sc_reg0[0];
17162306a36Sopenharmony_ci
17262306a36Sopenharmony_ci	/* clear all the features(they may get enabled elsewhere later) */
17362306a36Sopenharmony_ci	val &= ~(CFG_SELFGEN_FID | CFG_TRIM | CFG_ENABLE_SIN2_VER_INTP |
17462306a36Sopenharmony_ci		CFG_INTERLACE_I | CFG_DCM_4X | CFG_DCM_2X | CFG_AUTO_HS |
17562306a36Sopenharmony_ci		CFG_ENABLE_EV | CFG_USE_RAV | CFG_INVT_FID | CFG_SC_BYPASS |
17662306a36Sopenharmony_ci		CFG_INTERLACE_O | CFG_Y_PK_EN | CFG_HP_BYPASS | CFG_LINEAR);
17762306a36Sopenharmony_ci
17862306a36Sopenharmony_ci	if (src_w == dst_w && src_h == dst_h) {
17962306a36Sopenharmony_ci		val |= CFG_SC_BYPASS;
18062306a36Sopenharmony_ci		sc_reg0[0] = val;
18162306a36Sopenharmony_ci		return;
18262306a36Sopenharmony_ci	}
18362306a36Sopenharmony_ci
18462306a36Sopenharmony_ci	/* we only support linear scaling for now */
18562306a36Sopenharmony_ci	val |= CFG_LINEAR;
18662306a36Sopenharmony_ci
18762306a36Sopenharmony_ci	/* configure horizontal scaler */
18862306a36Sopenharmony_ci
18962306a36Sopenharmony_ci	/* enable 2X or 4X decimation */
19062306a36Sopenharmony_ci	dcm_x = src_w / dst_w;
19162306a36Sopenharmony_ci	if (dcm_x > 4) {
19262306a36Sopenharmony_ci		val |= CFG_DCM_4X;
19362306a36Sopenharmony_ci		dcm_shift = 2;
19462306a36Sopenharmony_ci	} else if (dcm_x > 2) {
19562306a36Sopenharmony_ci		val |= CFG_DCM_2X;
19662306a36Sopenharmony_ci		dcm_shift = 1;
19762306a36Sopenharmony_ci	} else {
19862306a36Sopenharmony_ci		dcm_shift = 0;
19962306a36Sopenharmony_ci	}
20062306a36Sopenharmony_ci
20162306a36Sopenharmony_ci	lltmp = dst_w - 1;
20262306a36Sopenharmony_ci	lin_acc_inc = div64_u64(((u64)(src_w >> dcm_shift) - 1) << 24, lltmp);
20362306a36Sopenharmony_ci	lin_acc_inc_u = 0;
20462306a36Sopenharmony_ci	col_acc_offset = 0;
20562306a36Sopenharmony_ci
20662306a36Sopenharmony_ci	dev_dbg(dev, "hs config: src_w = %d, dst_w = %d, decimation = %s, lin_acc_inc = %08x\n",
20762306a36Sopenharmony_ci		src_w, dst_w, dcm_shift == 2 ? "4x" :
20862306a36Sopenharmony_ci		(dcm_shift == 1 ? "2x" : "none"), lin_acc_inc);
20962306a36Sopenharmony_ci
21062306a36Sopenharmony_ci	/* configure vertical scaler */
21162306a36Sopenharmony_ci
21262306a36Sopenharmony_ci	/* use RAV for vertical scaler if vertical downscaling is > 4x */
21362306a36Sopenharmony_ci	if (dst_h < (src_h >> 2)) {
21462306a36Sopenharmony_ci		use_rav = true;
21562306a36Sopenharmony_ci		val |= CFG_USE_RAV;
21662306a36Sopenharmony_ci	} else {
21762306a36Sopenharmony_ci		use_rav = false;
21862306a36Sopenharmony_ci	}
21962306a36Sopenharmony_ci
22062306a36Sopenharmony_ci	if (use_rav) {
22162306a36Sopenharmony_ci		/* use RAV */
22262306a36Sopenharmony_ci		factor = (u16) ((dst_h << 10) / src_h);
22362306a36Sopenharmony_ci
22462306a36Sopenharmony_ci		row_acc_init_rav = factor + ((1 + factor) >> 1);
22562306a36Sopenharmony_ci		if (row_acc_init_rav >= 1024)
22662306a36Sopenharmony_ci			row_acc_init_rav -= 1024;
22762306a36Sopenharmony_ci
22862306a36Sopenharmony_ci		row_acc_init_rav_b = row_acc_init_rav +
22962306a36Sopenharmony_ci				(1 + (row_acc_init_rav >> 1)) -
23062306a36Sopenharmony_ci				(1024 >> 1);
23162306a36Sopenharmony_ci
23262306a36Sopenharmony_ci		if (row_acc_init_rav_b < 0) {
23362306a36Sopenharmony_ci			row_acc_init_rav_b += row_acc_init_rav;
23462306a36Sopenharmony_ci			row_acc_init_rav *= 2;
23562306a36Sopenharmony_ci		}
23662306a36Sopenharmony_ci
23762306a36Sopenharmony_ci		dev_dbg(dev, "vs config(RAV): src_h = %d, dst_h = %d, factor = %d, acc_init = %08x, acc_init_b = %08x\n",
23862306a36Sopenharmony_ci			src_h, dst_h, factor, row_acc_init_rav,
23962306a36Sopenharmony_ci			row_acc_init_rav_b);
24062306a36Sopenharmony_ci	} else {
24162306a36Sopenharmony_ci		/* use polyphase */
24262306a36Sopenharmony_ci		row_acc_inc = ((src_h - 1) << 16) / (dst_h - 1);
24362306a36Sopenharmony_ci		row_acc_offset = 0;
24462306a36Sopenharmony_ci		row_acc_offset_b = 0;
24562306a36Sopenharmony_ci
24662306a36Sopenharmony_ci		dev_dbg(dev, "vs config(POLY): src_h = %d, dst_h = %d,row_acc_inc = %08x\n",
24762306a36Sopenharmony_ci			src_h, dst_h, row_acc_inc);
24862306a36Sopenharmony_ci	}
24962306a36Sopenharmony_ci
25062306a36Sopenharmony_ci
25162306a36Sopenharmony_ci	sc_reg0[0] = val;
25262306a36Sopenharmony_ci	sc_reg0[1] = row_acc_inc;
25362306a36Sopenharmony_ci	sc_reg0[2] = row_acc_offset;
25462306a36Sopenharmony_ci	sc_reg0[3] = row_acc_offset_b;
25562306a36Sopenharmony_ci
25662306a36Sopenharmony_ci	sc_reg0[4] = ((lin_acc_inc_u & CFG_LIN_ACC_INC_U_MASK) <<
25762306a36Sopenharmony_ci			CFG_LIN_ACC_INC_U_SHIFT) | (dst_w << CFG_TAR_W_SHIFT) |
25862306a36Sopenharmony_ci			(dst_h << CFG_TAR_H_SHIFT);
25962306a36Sopenharmony_ci
26062306a36Sopenharmony_ci	sc_reg0[5] = (src_w << CFG_SRC_W_SHIFT) | (src_h << CFG_SRC_H_SHIFT);
26162306a36Sopenharmony_ci
26262306a36Sopenharmony_ci	sc_reg0[6] = (row_acc_init_rav_b << CFG_ROW_ACC_INIT_RAV_B_SHIFT) |
26362306a36Sopenharmony_ci		(row_acc_init_rav << CFG_ROW_ACC_INIT_RAV_SHIFT);
26462306a36Sopenharmony_ci
26562306a36Sopenharmony_ci	*sc_reg9 = lin_acc_inc;
26662306a36Sopenharmony_ci
26762306a36Sopenharmony_ci	*sc_reg12 = col_acc_offset << CFG_COL_ACC_OFFSET_SHIFT;
26862306a36Sopenharmony_ci
26962306a36Sopenharmony_ci	*sc_reg13 = factor;
27062306a36Sopenharmony_ci
27162306a36Sopenharmony_ci	*sc_reg24 = (src_w << CFG_ORG_W_SHIFT) | (src_h << CFG_ORG_H_SHIFT);
27262306a36Sopenharmony_ci}
27362306a36Sopenharmony_ciEXPORT_SYMBOL(sc_config_scaler);
27462306a36Sopenharmony_ci
27562306a36Sopenharmony_cistruct sc_data *sc_create(struct platform_device *pdev, const char *res_name)
27662306a36Sopenharmony_ci{
27762306a36Sopenharmony_ci	struct sc_data *sc;
27862306a36Sopenharmony_ci
27962306a36Sopenharmony_ci	dev_dbg(&pdev->dev, "sc_create\n");
28062306a36Sopenharmony_ci
28162306a36Sopenharmony_ci	sc = devm_kzalloc(&pdev->dev, sizeof(*sc), GFP_KERNEL);
28262306a36Sopenharmony_ci	if (!sc) {
28362306a36Sopenharmony_ci		dev_err(&pdev->dev, "couldn't alloc sc_data\n");
28462306a36Sopenharmony_ci		return ERR_PTR(-ENOMEM);
28562306a36Sopenharmony_ci	}
28662306a36Sopenharmony_ci
28762306a36Sopenharmony_ci	sc->pdev = pdev;
28862306a36Sopenharmony_ci
28962306a36Sopenharmony_ci	sc->res = platform_get_resource_byname(pdev, IORESOURCE_MEM, res_name);
29062306a36Sopenharmony_ci	if (!sc->res) {
29162306a36Sopenharmony_ci		dev_err(&pdev->dev, "missing '%s' platform resources data\n",
29262306a36Sopenharmony_ci			res_name);
29362306a36Sopenharmony_ci		return ERR_PTR(-ENODEV);
29462306a36Sopenharmony_ci	}
29562306a36Sopenharmony_ci
29662306a36Sopenharmony_ci	sc->base = devm_ioremap_resource(&pdev->dev, sc->res);
29762306a36Sopenharmony_ci	if (IS_ERR(sc->base))
29862306a36Sopenharmony_ci		return ERR_CAST(sc->base);
29962306a36Sopenharmony_ci
30062306a36Sopenharmony_ci	return sc;
30162306a36Sopenharmony_ci}
30262306a36Sopenharmony_ciEXPORT_SYMBOL(sc_create);
30362306a36Sopenharmony_ci
30462306a36Sopenharmony_ciMODULE_DESCRIPTION("TI VIP/VPE Scaler");
30562306a36Sopenharmony_ciMODULE_AUTHOR("Texas Instruments Inc.");
30662306a36Sopenharmony_ciMODULE_LICENSE("GPL v2");
307