162306a36Sopenharmony_ci// SPDX-License-Identifier: GPL-2.0-only 262306a36Sopenharmony_ci/* 362306a36Sopenharmony_ci * Scaler library 462306a36Sopenharmony_ci * 562306a36Sopenharmony_ci * Copyright (c) 2013 Texas Instruments Inc. 662306a36Sopenharmony_ci * 762306a36Sopenharmony_ci * David Griego, <dagriego@biglakesoftware.com> 862306a36Sopenharmony_ci * Dale Farnsworth, <dale@farnsworth.org> 962306a36Sopenharmony_ci * Archit Taneja, <archit@ti.com> 1062306a36Sopenharmony_ci */ 1162306a36Sopenharmony_ci 1262306a36Sopenharmony_ci#include <linux/err.h> 1362306a36Sopenharmony_ci#include <linux/io.h> 1462306a36Sopenharmony_ci#include <linux/module.h> 1562306a36Sopenharmony_ci#include <linux/platform_device.h> 1662306a36Sopenharmony_ci#include <linux/slab.h> 1762306a36Sopenharmony_ci 1862306a36Sopenharmony_ci#include "sc.h" 1962306a36Sopenharmony_ci#include "sc_coeff.h" 2062306a36Sopenharmony_ci 2162306a36Sopenharmony_civoid sc_dump_regs(struct sc_data *sc) 2262306a36Sopenharmony_ci{ 2362306a36Sopenharmony_ci struct device *dev = &sc->pdev->dev; 2462306a36Sopenharmony_ci 2562306a36Sopenharmony_ci#define DUMPREG(r) dev_dbg(dev, "%-35s %08x\n", #r, \ 2662306a36Sopenharmony_ci ioread32(sc->base + CFG_##r)) 2762306a36Sopenharmony_ci 2862306a36Sopenharmony_ci dev_dbg(dev, "SC Registers @ %pa:\n", &sc->res->start); 2962306a36Sopenharmony_ci 3062306a36Sopenharmony_ci DUMPREG(SC0); 3162306a36Sopenharmony_ci DUMPREG(SC1); 3262306a36Sopenharmony_ci DUMPREG(SC2); 3362306a36Sopenharmony_ci DUMPREG(SC3); 3462306a36Sopenharmony_ci DUMPREG(SC4); 3562306a36Sopenharmony_ci DUMPREG(SC5); 3662306a36Sopenharmony_ci DUMPREG(SC6); 3762306a36Sopenharmony_ci DUMPREG(SC8); 3862306a36Sopenharmony_ci DUMPREG(SC9); 3962306a36Sopenharmony_ci DUMPREG(SC10); 4062306a36Sopenharmony_ci DUMPREG(SC11); 4162306a36Sopenharmony_ci DUMPREG(SC12); 4262306a36Sopenharmony_ci DUMPREG(SC13); 4362306a36Sopenharmony_ci DUMPREG(SC17); 4462306a36Sopenharmony_ci DUMPREG(SC18); 4562306a36Sopenharmony_ci DUMPREG(SC19); 4662306a36Sopenharmony_ci DUMPREG(SC20); 4762306a36Sopenharmony_ci DUMPREG(SC21); 4862306a36Sopenharmony_ci DUMPREG(SC22); 4962306a36Sopenharmony_ci DUMPREG(SC23); 5062306a36Sopenharmony_ci DUMPREG(SC24); 5162306a36Sopenharmony_ci DUMPREG(SC25); 5262306a36Sopenharmony_ci 5362306a36Sopenharmony_ci#undef DUMPREG 5462306a36Sopenharmony_ci} 5562306a36Sopenharmony_ciEXPORT_SYMBOL(sc_dump_regs); 5662306a36Sopenharmony_ci 5762306a36Sopenharmony_ci/* 5862306a36Sopenharmony_ci * set the horizontal scaler coefficients according to the ratio of output to 5962306a36Sopenharmony_ci * input widths, after accounting for up to two levels of decimation 6062306a36Sopenharmony_ci */ 6162306a36Sopenharmony_civoid sc_set_hs_coeffs(struct sc_data *sc, void *addr, unsigned int src_w, 6262306a36Sopenharmony_ci unsigned int dst_w) 6362306a36Sopenharmony_ci{ 6462306a36Sopenharmony_ci int sixteenths; 6562306a36Sopenharmony_ci int idx; 6662306a36Sopenharmony_ci int i, j; 6762306a36Sopenharmony_ci u16 *coeff_h = addr; 6862306a36Sopenharmony_ci const u16 *cp; 6962306a36Sopenharmony_ci 7062306a36Sopenharmony_ci if (dst_w > src_w) { 7162306a36Sopenharmony_ci idx = HS_UP_SCALE; 7262306a36Sopenharmony_ci } else { 7362306a36Sopenharmony_ci if ((dst_w << 1) < src_w) 7462306a36Sopenharmony_ci dst_w <<= 1; /* first level decimation */ 7562306a36Sopenharmony_ci if ((dst_w << 1) < src_w) 7662306a36Sopenharmony_ci dst_w <<= 1; /* second level decimation */ 7762306a36Sopenharmony_ci 7862306a36Sopenharmony_ci if (dst_w == src_w) { 7962306a36Sopenharmony_ci idx = HS_LE_16_16_SCALE; 8062306a36Sopenharmony_ci } else { 8162306a36Sopenharmony_ci sixteenths = (dst_w << 4) / src_w; 8262306a36Sopenharmony_ci if (sixteenths < 8) 8362306a36Sopenharmony_ci sixteenths = 8; 8462306a36Sopenharmony_ci idx = HS_LT_9_16_SCALE + sixteenths - 8; 8562306a36Sopenharmony_ci } 8662306a36Sopenharmony_ci } 8762306a36Sopenharmony_ci 8862306a36Sopenharmony_ci cp = scaler_hs_coeffs[idx]; 8962306a36Sopenharmony_ci 9062306a36Sopenharmony_ci for (i = 0; i < SC_NUM_PHASES * 2; i++) { 9162306a36Sopenharmony_ci for (j = 0; j < SC_H_NUM_TAPS; j++) 9262306a36Sopenharmony_ci *coeff_h++ = *cp++; 9362306a36Sopenharmony_ci /* 9462306a36Sopenharmony_ci * for each phase, the scaler expects space for 8 coefficients 9562306a36Sopenharmony_ci * in it's memory. For the horizontal scaler, we copy the first 9662306a36Sopenharmony_ci * 7 coefficients and skip the last slot to move to the next 9762306a36Sopenharmony_ci * row to hold coefficients for the next phase 9862306a36Sopenharmony_ci */ 9962306a36Sopenharmony_ci coeff_h += SC_NUM_TAPS_MEM_ALIGN - SC_H_NUM_TAPS; 10062306a36Sopenharmony_ci } 10162306a36Sopenharmony_ci 10262306a36Sopenharmony_ci sc->load_coeff_h = true; 10362306a36Sopenharmony_ci} 10462306a36Sopenharmony_ciEXPORT_SYMBOL(sc_set_hs_coeffs); 10562306a36Sopenharmony_ci 10662306a36Sopenharmony_ci/* 10762306a36Sopenharmony_ci * set the vertical scaler coefficients according to the ratio of output to 10862306a36Sopenharmony_ci * input heights 10962306a36Sopenharmony_ci */ 11062306a36Sopenharmony_civoid sc_set_vs_coeffs(struct sc_data *sc, void *addr, unsigned int src_h, 11162306a36Sopenharmony_ci unsigned int dst_h) 11262306a36Sopenharmony_ci{ 11362306a36Sopenharmony_ci int sixteenths; 11462306a36Sopenharmony_ci int idx; 11562306a36Sopenharmony_ci int i, j; 11662306a36Sopenharmony_ci u16 *coeff_v = addr; 11762306a36Sopenharmony_ci const u16 *cp; 11862306a36Sopenharmony_ci 11962306a36Sopenharmony_ci if (dst_h > src_h) { 12062306a36Sopenharmony_ci idx = VS_UP_SCALE; 12162306a36Sopenharmony_ci } else if (dst_h == src_h) { 12262306a36Sopenharmony_ci idx = VS_1_TO_1_SCALE; 12362306a36Sopenharmony_ci } else { 12462306a36Sopenharmony_ci sixteenths = (dst_h << 4) / src_h; 12562306a36Sopenharmony_ci if (sixteenths < 8) 12662306a36Sopenharmony_ci sixteenths = 8; 12762306a36Sopenharmony_ci idx = VS_LT_9_16_SCALE + sixteenths - 8; 12862306a36Sopenharmony_ci } 12962306a36Sopenharmony_ci 13062306a36Sopenharmony_ci cp = scaler_vs_coeffs[idx]; 13162306a36Sopenharmony_ci 13262306a36Sopenharmony_ci for (i = 0; i < SC_NUM_PHASES * 2; i++) { 13362306a36Sopenharmony_ci for (j = 0; j < SC_V_NUM_TAPS; j++) 13462306a36Sopenharmony_ci *coeff_v++ = *cp++; 13562306a36Sopenharmony_ci /* 13662306a36Sopenharmony_ci * for the vertical scaler, we copy the first 5 coefficients and 13762306a36Sopenharmony_ci * skip the last 3 slots to move to the next row to hold 13862306a36Sopenharmony_ci * coefficients for the next phase 13962306a36Sopenharmony_ci */ 14062306a36Sopenharmony_ci coeff_v += SC_NUM_TAPS_MEM_ALIGN - SC_V_NUM_TAPS; 14162306a36Sopenharmony_ci } 14262306a36Sopenharmony_ci 14362306a36Sopenharmony_ci sc->load_coeff_v = true; 14462306a36Sopenharmony_ci} 14562306a36Sopenharmony_ciEXPORT_SYMBOL(sc_set_vs_coeffs); 14662306a36Sopenharmony_ci 14762306a36Sopenharmony_civoid sc_config_scaler(struct sc_data *sc, u32 *sc_reg0, u32 *sc_reg8, 14862306a36Sopenharmony_ci u32 *sc_reg17, unsigned int src_w, unsigned int src_h, 14962306a36Sopenharmony_ci unsigned int dst_w, unsigned int dst_h) 15062306a36Sopenharmony_ci{ 15162306a36Sopenharmony_ci struct device *dev = &sc->pdev->dev; 15262306a36Sopenharmony_ci u32 val; 15362306a36Sopenharmony_ci int dcm_x, dcm_shift; 15462306a36Sopenharmony_ci bool use_rav; 15562306a36Sopenharmony_ci unsigned long lltmp; 15662306a36Sopenharmony_ci u32 lin_acc_inc, lin_acc_inc_u; 15762306a36Sopenharmony_ci u32 col_acc_offset; 15862306a36Sopenharmony_ci u16 factor = 0; 15962306a36Sopenharmony_ci int row_acc_init_rav = 0, row_acc_init_rav_b = 0; 16062306a36Sopenharmony_ci u32 row_acc_inc = 0, row_acc_offset = 0, row_acc_offset_b = 0; 16162306a36Sopenharmony_ci /* 16262306a36Sopenharmony_ci * location of SC register in payload memory with respect to the first 16362306a36Sopenharmony_ci * register in the mmr address data block 16462306a36Sopenharmony_ci */ 16562306a36Sopenharmony_ci u32 *sc_reg9 = sc_reg8 + 1; 16662306a36Sopenharmony_ci u32 *sc_reg12 = sc_reg8 + 4; 16762306a36Sopenharmony_ci u32 *sc_reg13 = sc_reg8 + 5; 16862306a36Sopenharmony_ci u32 *sc_reg24 = sc_reg17 + 7; 16962306a36Sopenharmony_ci 17062306a36Sopenharmony_ci val = sc_reg0[0]; 17162306a36Sopenharmony_ci 17262306a36Sopenharmony_ci /* clear all the features(they may get enabled elsewhere later) */ 17362306a36Sopenharmony_ci val &= ~(CFG_SELFGEN_FID | CFG_TRIM | CFG_ENABLE_SIN2_VER_INTP | 17462306a36Sopenharmony_ci CFG_INTERLACE_I | CFG_DCM_4X | CFG_DCM_2X | CFG_AUTO_HS | 17562306a36Sopenharmony_ci CFG_ENABLE_EV | CFG_USE_RAV | CFG_INVT_FID | CFG_SC_BYPASS | 17662306a36Sopenharmony_ci CFG_INTERLACE_O | CFG_Y_PK_EN | CFG_HP_BYPASS | CFG_LINEAR); 17762306a36Sopenharmony_ci 17862306a36Sopenharmony_ci if (src_w == dst_w && src_h == dst_h) { 17962306a36Sopenharmony_ci val |= CFG_SC_BYPASS; 18062306a36Sopenharmony_ci sc_reg0[0] = val; 18162306a36Sopenharmony_ci return; 18262306a36Sopenharmony_ci } 18362306a36Sopenharmony_ci 18462306a36Sopenharmony_ci /* we only support linear scaling for now */ 18562306a36Sopenharmony_ci val |= CFG_LINEAR; 18662306a36Sopenharmony_ci 18762306a36Sopenharmony_ci /* configure horizontal scaler */ 18862306a36Sopenharmony_ci 18962306a36Sopenharmony_ci /* enable 2X or 4X decimation */ 19062306a36Sopenharmony_ci dcm_x = src_w / dst_w; 19162306a36Sopenharmony_ci if (dcm_x > 4) { 19262306a36Sopenharmony_ci val |= CFG_DCM_4X; 19362306a36Sopenharmony_ci dcm_shift = 2; 19462306a36Sopenharmony_ci } else if (dcm_x > 2) { 19562306a36Sopenharmony_ci val |= CFG_DCM_2X; 19662306a36Sopenharmony_ci dcm_shift = 1; 19762306a36Sopenharmony_ci } else { 19862306a36Sopenharmony_ci dcm_shift = 0; 19962306a36Sopenharmony_ci } 20062306a36Sopenharmony_ci 20162306a36Sopenharmony_ci lltmp = dst_w - 1; 20262306a36Sopenharmony_ci lin_acc_inc = div64_u64(((u64)(src_w >> dcm_shift) - 1) << 24, lltmp); 20362306a36Sopenharmony_ci lin_acc_inc_u = 0; 20462306a36Sopenharmony_ci col_acc_offset = 0; 20562306a36Sopenharmony_ci 20662306a36Sopenharmony_ci dev_dbg(dev, "hs config: src_w = %d, dst_w = %d, decimation = %s, lin_acc_inc = %08x\n", 20762306a36Sopenharmony_ci src_w, dst_w, dcm_shift == 2 ? "4x" : 20862306a36Sopenharmony_ci (dcm_shift == 1 ? "2x" : "none"), lin_acc_inc); 20962306a36Sopenharmony_ci 21062306a36Sopenharmony_ci /* configure vertical scaler */ 21162306a36Sopenharmony_ci 21262306a36Sopenharmony_ci /* use RAV for vertical scaler if vertical downscaling is > 4x */ 21362306a36Sopenharmony_ci if (dst_h < (src_h >> 2)) { 21462306a36Sopenharmony_ci use_rav = true; 21562306a36Sopenharmony_ci val |= CFG_USE_RAV; 21662306a36Sopenharmony_ci } else { 21762306a36Sopenharmony_ci use_rav = false; 21862306a36Sopenharmony_ci } 21962306a36Sopenharmony_ci 22062306a36Sopenharmony_ci if (use_rav) { 22162306a36Sopenharmony_ci /* use RAV */ 22262306a36Sopenharmony_ci factor = (u16) ((dst_h << 10) / src_h); 22362306a36Sopenharmony_ci 22462306a36Sopenharmony_ci row_acc_init_rav = factor + ((1 + factor) >> 1); 22562306a36Sopenharmony_ci if (row_acc_init_rav >= 1024) 22662306a36Sopenharmony_ci row_acc_init_rav -= 1024; 22762306a36Sopenharmony_ci 22862306a36Sopenharmony_ci row_acc_init_rav_b = row_acc_init_rav + 22962306a36Sopenharmony_ci (1 + (row_acc_init_rav >> 1)) - 23062306a36Sopenharmony_ci (1024 >> 1); 23162306a36Sopenharmony_ci 23262306a36Sopenharmony_ci if (row_acc_init_rav_b < 0) { 23362306a36Sopenharmony_ci row_acc_init_rav_b += row_acc_init_rav; 23462306a36Sopenharmony_ci row_acc_init_rav *= 2; 23562306a36Sopenharmony_ci } 23662306a36Sopenharmony_ci 23762306a36Sopenharmony_ci dev_dbg(dev, "vs config(RAV): src_h = %d, dst_h = %d, factor = %d, acc_init = %08x, acc_init_b = %08x\n", 23862306a36Sopenharmony_ci src_h, dst_h, factor, row_acc_init_rav, 23962306a36Sopenharmony_ci row_acc_init_rav_b); 24062306a36Sopenharmony_ci } else { 24162306a36Sopenharmony_ci /* use polyphase */ 24262306a36Sopenharmony_ci row_acc_inc = ((src_h - 1) << 16) / (dst_h - 1); 24362306a36Sopenharmony_ci row_acc_offset = 0; 24462306a36Sopenharmony_ci row_acc_offset_b = 0; 24562306a36Sopenharmony_ci 24662306a36Sopenharmony_ci dev_dbg(dev, "vs config(POLY): src_h = %d, dst_h = %d,row_acc_inc = %08x\n", 24762306a36Sopenharmony_ci src_h, dst_h, row_acc_inc); 24862306a36Sopenharmony_ci } 24962306a36Sopenharmony_ci 25062306a36Sopenharmony_ci 25162306a36Sopenharmony_ci sc_reg0[0] = val; 25262306a36Sopenharmony_ci sc_reg0[1] = row_acc_inc; 25362306a36Sopenharmony_ci sc_reg0[2] = row_acc_offset; 25462306a36Sopenharmony_ci sc_reg0[3] = row_acc_offset_b; 25562306a36Sopenharmony_ci 25662306a36Sopenharmony_ci sc_reg0[4] = ((lin_acc_inc_u & CFG_LIN_ACC_INC_U_MASK) << 25762306a36Sopenharmony_ci CFG_LIN_ACC_INC_U_SHIFT) | (dst_w << CFG_TAR_W_SHIFT) | 25862306a36Sopenharmony_ci (dst_h << CFG_TAR_H_SHIFT); 25962306a36Sopenharmony_ci 26062306a36Sopenharmony_ci sc_reg0[5] = (src_w << CFG_SRC_W_SHIFT) | (src_h << CFG_SRC_H_SHIFT); 26162306a36Sopenharmony_ci 26262306a36Sopenharmony_ci sc_reg0[6] = (row_acc_init_rav_b << CFG_ROW_ACC_INIT_RAV_B_SHIFT) | 26362306a36Sopenharmony_ci (row_acc_init_rav << CFG_ROW_ACC_INIT_RAV_SHIFT); 26462306a36Sopenharmony_ci 26562306a36Sopenharmony_ci *sc_reg9 = lin_acc_inc; 26662306a36Sopenharmony_ci 26762306a36Sopenharmony_ci *sc_reg12 = col_acc_offset << CFG_COL_ACC_OFFSET_SHIFT; 26862306a36Sopenharmony_ci 26962306a36Sopenharmony_ci *sc_reg13 = factor; 27062306a36Sopenharmony_ci 27162306a36Sopenharmony_ci *sc_reg24 = (src_w << CFG_ORG_W_SHIFT) | (src_h << CFG_ORG_H_SHIFT); 27262306a36Sopenharmony_ci} 27362306a36Sopenharmony_ciEXPORT_SYMBOL(sc_config_scaler); 27462306a36Sopenharmony_ci 27562306a36Sopenharmony_cistruct sc_data *sc_create(struct platform_device *pdev, const char *res_name) 27662306a36Sopenharmony_ci{ 27762306a36Sopenharmony_ci struct sc_data *sc; 27862306a36Sopenharmony_ci 27962306a36Sopenharmony_ci dev_dbg(&pdev->dev, "sc_create\n"); 28062306a36Sopenharmony_ci 28162306a36Sopenharmony_ci sc = devm_kzalloc(&pdev->dev, sizeof(*sc), GFP_KERNEL); 28262306a36Sopenharmony_ci if (!sc) { 28362306a36Sopenharmony_ci dev_err(&pdev->dev, "couldn't alloc sc_data\n"); 28462306a36Sopenharmony_ci return ERR_PTR(-ENOMEM); 28562306a36Sopenharmony_ci } 28662306a36Sopenharmony_ci 28762306a36Sopenharmony_ci sc->pdev = pdev; 28862306a36Sopenharmony_ci 28962306a36Sopenharmony_ci sc->res = platform_get_resource_byname(pdev, IORESOURCE_MEM, res_name); 29062306a36Sopenharmony_ci if (!sc->res) { 29162306a36Sopenharmony_ci dev_err(&pdev->dev, "missing '%s' platform resources data\n", 29262306a36Sopenharmony_ci res_name); 29362306a36Sopenharmony_ci return ERR_PTR(-ENODEV); 29462306a36Sopenharmony_ci } 29562306a36Sopenharmony_ci 29662306a36Sopenharmony_ci sc->base = devm_ioremap_resource(&pdev->dev, sc->res); 29762306a36Sopenharmony_ci if (IS_ERR(sc->base)) 29862306a36Sopenharmony_ci return ERR_CAST(sc->base); 29962306a36Sopenharmony_ci 30062306a36Sopenharmony_ci return sc; 30162306a36Sopenharmony_ci} 30262306a36Sopenharmony_ciEXPORT_SYMBOL(sc_create); 30362306a36Sopenharmony_ci 30462306a36Sopenharmony_ciMODULE_DESCRIPTION("TI VIP/VPE Scaler"); 30562306a36Sopenharmony_ciMODULE_AUTHOR("Texas Instruments Inc."); 30662306a36Sopenharmony_ciMODULE_LICENSE("GPL v2"); 307