xref: /OK3568_Linux_fs/kernel/drivers/media/platform/ti-vpe/sc.c (revision 4882a59341e53eb6f0b4789bf948001014eff981)
1*4882a593Smuzhiyun // SPDX-License-Identifier: GPL-2.0-only
2*4882a593Smuzhiyun /*
3*4882a593Smuzhiyun  * Scaler library
4*4882a593Smuzhiyun  *
5*4882a593Smuzhiyun  * Copyright (c) 2013 Texas Instruments Inc.
6*4882a593Smuzhiyun  *
7*4882a593Smuzhiyun  * David Griego, <dagriego@biglakesoftware.com>
8*4882a593Smuzhiyun  * Dale Farnsworth, <dale@farnsworth.org>
9*4882a593Smuzhiyun  * Archit Taneja, <archit@ti.com>
10*4882a593Smuzhiyun  */
11*4882a593Smuzhiyun 
12*4882a593Smuzhiyun #include <linux/err.h>
13*4882a593Smuzhiyun #include <linux/io.h>
14*4882a593Smuzhiyun #include <linux/module.h>
15*4882a593Smuzhiyun #include <linux/platform_device.h>
16*4882a593Smuzhiyun #include <linux/slab.h>
17*4882a593Smuzhiyun 
18*4882a593Smuzhiyun #include "sc.h"
19*4882a593Smuzhiyun #include "sc_coeff.h"
20*4882a593Smuzhiyun 
sc_dump_regs(struct sc_data * sc)21*4882a593Smuzhiyun void sc_dump_regs(struct sc_data *sc)
22*4882a593Smuzhiyun {
23*4882a593Smuzhiyun 	struct device *dev = &sc->pdev->dev;
24*4882a593Smuzhiyun 
25*4882a593Smuzhiyun #define DUMPREG(r) dev_dbg(dev, "%-35s %08x\n", #r, \
26*4882a593Smuzhiyun 	ioread32(sc->base + CFG_##r))
27*4882a593Smuzhiyun 
28*4882a593Smuzhiyun 	dev_dbg(dev, "SC Registers @ %pa:\n", &sc->res->start);
29*4882a593Smuzhiyun 
30*4882a593Smuzhiyun 	DUMPREG(SC0);
31*4882a593Smuzhiyun 	DUMPREG(SC1);
32*4882a593Smuzhiyun 	DUMPREG(SC2);
33*4882a593Smuzhiyun 	DUMPREG(SC3);
34*4882a593Smuzhiyun 	DUMPREG(SC4);
35*4882a593Smuzhiyun 	DUMPREG(SC5);
36*4882a593Smuzhiyun 	DUMPREG(SC6);
37*4882a593Smuzhiyun 	DUMPREG(SC8);
38*4882a593Smuzhiyun 	DUMPREG(SC9);
39*4882a593Smuzhiyun 	DUMPREG(SC10);
40*4882a593Smuzhiyun 	DUMPREG(SC11);
41*4882a593Smuzhiyun 	DUMPREG(SC12);
42*4882a593Smuzhiyun 	DUMPREG(SC13);
43*4882a593Smuzhiyun 	DUMPREG(SC17);
44*4882a593Smuzhiyun 	DUMPREG(SC18);
45*4882a593Smuzhiyun 	DUMPREG(SC19);
46*4882a593Smuzhiyun 	DUMPREG(SC20);
47*4882a593Smuzhiyun 	DUMPREG(SC21);
48*4882a593Smuzhiyun 	DUMPREG(SC22);
49*4882a593Smuzhiyun 	DUMPREG(SC23);
50*4882a593Smuzhiyun 	DUMPREG(SC24);
51*4882a593Smuzhiyun 	DUMPREG(SC25);
52*4882a593Smuzhiyun 
53*4882a593Smuzhiyun #undef DUMPREG
54*4882a593Smuzhiyun }
55*4882a593Smuzhiyun EXPORT_SYMBOL(sc_dump_regs);
56*4882a593Smuzhiyun 
57*4882a593Smuzhiyun /*
58*4882a593Smuzhiyun  * set the horizontal scaler coefficients according to the ratio of output to
59*4882a593Smuzhiyun  * input widths, after accounting for up to two levels of decimation
60*4882a593Smuzhiyun  */
sc_set_hs_coeffs(struct sc_data * sc,void * addr,unsigned int src_w,unsigned int dst_w)61*4882a593Smuzhiyun void sc_set_hs_coeffs(struct sc_data *sc, void *addr, unsigned int src_w,
62*4882a593Smuzhiyun 		unsigned int dst_w)
63*4882a593Smuzhiyun {
64*4882a593Smuzhiyun 	int sixteenths;
65*4882a593Smuzhiyun 	int idx;
66*4882a593Smuzhiyun 	int i, j;
67*4882a593Smuzhiyun 	u16 *coeff_h = addr;
68*4882a593Smuzhiyun 	const u16 *cp;
69*4882a593Smuzhiyun 
70*4882a593Smuzhiyun 	if (dst_w > src_w) {
71*4882a593Smuzhiyun 		idx = HS_UP_SCALE;
72*4882a593Smuzhiyun 	} else {
73*4882a593Smuzhiyun 		if ((dst_w << 1) < src_w)
74*4882a593Smuzhiyun 			dst_w <<= 1;	/* first level decimation */
75*4882a593Smuzhiyun 		if ((dst_w << 1) < src_w)
76*4882a593Smuzhiyun 			dst_w <<= 1;	/* second level decimation */
77*4882a593Smuzhiyun 
78*4882a593Smuzhiyun 		if (dst_w == src_w) {
79*4882a593Smuzhiyun 			idx = HS_LE_16_16_SCALE;
80*4882a593Smuzhiyun 		} else {
81*4882a593Smuzhiyun 			sixteenths = (dst_w << 4) / src_w;
82*4882a593Smuzhiyun 			if (sixteenths < 8)
83*4882a593Smuzhiyun 				sixteenths = 8;
84*4882a593Smuzhiyun 			idx = HS_LT_9_16_SCALE + sixteenths - 8;
85*4882a593Smuzhiyun 		}
86*4882a593Smuzhiyun 	}
87*4882a593Smuzhiyun 
88*4882a593Smuzhiyun 	cp = scaler_hs_coeffs[idx];
89*4882a593Smuzhiyun 
90*4882a593Smuzhiyun 	for (i = 0; i < SC_NUM_PHASES * 2; i++) {
91*4882a593Smuzhiyun 		for (j = 0; j < SC_H_NUM_TAPS; j++)
92*4882a593Smuzhiyun 			*coeff_h++ = *cp++;
93*4882a593Smuzhiyun 		/*
94*4882a593Smuzhiyun 		 * for each phase, the scaler expects space for 8 coefficients
95*4882a593Smuzhiyun 		 * in it's memory. For the horizontal scaler, we copy the first
96*4882a593Smuzhiyun 		 * 7 coefficients and skip the last slot to move to the next
97*4882a593Smuzhiyun 		 * row to hold coefficients for the next phase
98*4882a593Smuzhiyun 		 */
99*4882a593Smuzhiyun 		coeff_h += SC_NUM_TAPS_MEM_ALIGN - SC_H_NUM_TAPS;
100*4882a593Smuzhiyun 	}
101*4882a593Smuzhiyun 
102*4882a593Smuzhiyun 	sc->load_coeff_h = true;
103*4882a593Smuzhiyun }
104*4882a593Smuzhiyun EXPORT_SYMBOL(sc_set_hs_coeffs);
105*4882a593Smuzhiyun 
106*4882a593Smuzhiyun /*
107*4882a593Smuzhiyun  * set the vertical scaler coefficients according to the ratio of output to
108*4882a593Smuzhiyun  * input heights
109*4882a593Smuzhiyun  */
sc_set_vs_coeffs(struct sc_data * sc,void * addr,unsigned int src_h,unsigned int dst_h)110*4882a593Smuzhiyun void sc_set_vs_coeffs(struct sc_data *sc, void *addr, unsigned int src_h,
111*4882a593Smuzhiyun 		unsigned int dst_h)
112*4882a593Smuzhiyun {
113*4882a593Smuzhiyun 	int sixteenths;
114*4882a593Smuzhiyun 	int idx;
115*4882a593Smuzhiyun 	int i, j;
116*4882a593Smuzhiyun 	u16 *coeff_v = addr;
117*4882a593Smuzhiyun 	const u16 *cp;
118*4882a593Smuzhiyun 
119*4882a593Smuzhiyun 	if (dst_h > src_h) {
120*4882a593Smuzhiyun 		idx = VS_UP_SCALE;
121*4882a593Smuzhiyun 	} else if (dst_h == src_h) {
122*4882a593Smuzhiyun 		idx = VS_1_TO_1_SCALE;
123*4882a593Smuzhiyun 	} else {
124*4882a593Smuzhiyun 		sixteenths = (dst_h << 4) / src_h;
125*4882a593Smuzhiyun 		if (sixteenths < 8)
126*4882a593Smuzhiyun 			sixteenths = 8;
127*4882a593Smuzhiyun 		idx = VS_LT_9_16_SCALE + sixteenths - 8;
128*4882a593Smuzhiyun 	}
129*4882a593Smuzhiyun 
130*4882a593Smuzhiyun 	cp = scaler_vs_coeffs[idx];
131*4882a593Smuzhiyun 
132*4882a593Smuzhiyun 	for (i = 0; i < SC_NUM_PHASES * 2; i++) {
133*4882a593Smuzhiyun 		for (j = 0; j < SC_V_NUM_TAPS; j++)
134*4882a593Smuzhiyun 			*coeff_v++ = *cp++;
135*4882a593Smuzhiyun 		/*
136*4882a593Smuzhiyun 		 * for the vertical scaler, we copy the first 5 coefficients and
137*4882a593Smuzhiyun 		 * skip the last 3 slots to move to the next row to hold
138*4882a593Smuzhiyun 		 * coefficients for the next phase
139*4882a593Smuzhiyun 		 */
140*4882a593Smuzhiyun 		coeff_v += SC_NUM_TAPS_MEM_ALIGN - SC_V_NUM_TAPS;
141*4882a593Smuzhiyun 	}
142*4882a593Smuzhiyun 
143*4882a593Smuzhiyun 	sc->load_coeff_v = true;
144*4882a593Smuzhiyun }
145*4882a593Smuzhiyun EXPORT_SYMBOL(sc_set_vs_coeffs);
146*4882a593Smuzhiyun 
sc_config_scaler(struct sc_data * sc,u32 * sc_reg0,u32 * sc_reg8,u32 * sc_reg17,unsigned int src_w,unsigned int src_h,unsigned int dst_w,unsigned int dst_h)147*4882a593Smuzhiyun void sc_config_scaler(struct sc_data *sc, u32 *sc_reg0, u32 *sc_reg8,
148*4882a593Smuzhiyun 		u32 *sc_reg17, unsigned int src_w, unsigned int src_h,
149*4882a593Smuzhiyun 		unsigned int dst_w, unsigned int dst_h)
150*4882a593Smuzhiyun {
151*4882a593Smuzhiyun 	struct device *dev = &sc->pdev->dev;
152*4882a593Smuzhiyun 	u32 val;
153*4882a593Smuzhiyun 	int dcm_x, dcm_shift;
154*4882a593Smuzhiyun 	bool use_rav;
155*4882a593Smuzhiyun 	unsigned long lltmp;
156*4882a593Smuzhiyun 	u32 lin_acc_inc, lin_acc_inc_u;
157*4882a593Smuzhiyun 	u32 col_acc_offset;
158*4882a593Smuzhiyun 	u16 factor = 0;
159*4882a593Smuzhiyun 	int row_acc_init_rav = 0, row_acc_init_rav_b = 0;
160*4882a593Smuzhiyun 	u32 row_acc_inc = 0, row_acc_offset = 0, row_acc_offset_b = 0;
161*4882a593Smuzhiyun 	/*
162*4882a593Smuzhiyun 	 * location of SC register in payload memory with respect to the first
163*4882a593Smuzhiyun 	 * register in the mmr address data block
164*4882a593Smuzhiyun 	 */
165*4882a593Smuzhiyun 	u32 *sc_reg9 = sc_reg8 + 1;
166*4882a593Smuzhiyun 	u32 *sc_reg12 = sc_reg8 + 4;
167*4882a593Smuzhiyun 	u32 *sc_reg13 = sc_reg8 + 5;
168*4882a593Smuzhiyun 	u32 *sc_reg24 = sc_reg17 + 7;
169*4882a593Smuzhiyun 
170*4882a593Smuzhiyun 	val = sc_reg0[0];
171*4882a593Smuzhiyun 
172*4882a593Smuzhiyun 	/* clear all the features(they may get enabled elsewhere later) */
173*4882a593Smuzhiyun 	val &= ~(CFG_SELFGEN_FID | CFG_TRIM | CFG_ENABLE_SIN2_VER_INTP |
174*4882a593Smuzhiyun 		CFG_INTERLACE_I | CFG_DCM_4X | CFG_DCM_2X | CFG_AUTO_HS |
175*4882a593Smuzhiyun 		CFG_ENABLE_EV | CFG_USE_RAV | CFG_INVT_FID | CFG_SC_BYPASS |
176*4882a593Smuzhiyun 		CFG_INTERLACE_O | CFG_Y_PK_EN | CFG_HP_BYPASS | CFG_LINEAR);
177*4882a593Smuzhiyun 
178*4882a593Smuzhiyun 	if (src_w == dst_w && src_h == dst_h) {
179*4882a593Smuzhiyun 		val |= CFG_SC_BYPASS;
180*4882a593Smuzhiyun 		sc_reg0[0] = val;
181*4882a593Smuzhiyun 		return;
182*4882a593Smuzhiyun 	}
183*4882a593Smuzhiyun 
184*4882a593Smuzhiyun 	/* we only support linear scaling for now */
185*4882a593Smuzhiyun 	val |= CFG_LINEAR;
186*4882a593Smuzhiyun 
187*4882a593Smuzhiyun 	/* configure horizontal scaler */
188*4882a593Smuzhiyun 
189*4882a593Smuzhiyun 	/* enable 2X or 4X decimation */
190*4882a593Smuzhiyun 	dcm_x = src_w / dst_w;
191*4882a593Smuzhiyun 	if (dcm_x > 4) {
192*4882a593Smuzhiyun 		val |= CFG_DCM_4X;
193*4882a593Smuzhiyun 		dcm_shift = 2;
194*4882a593Smuzhiyun 	} else if (dcm_x > 2) {
195*4882a593Smuzhiyun 		val |= CFG_DCM_2X;
196*4882a593Smuzhiyun 		dcm_shift = 1;
197*4882a593Smuzhiyun 	} else {
198*4882a593Smuzhiyun 		dcm_shift = 0;
199*4882a593Smuzhiyun 	}
200*4882a593Smuzhiyun 
201*4882a593Smuzhiyun 	lltmp = dst_w - 1;
202*4882a593Smuzhiyun 	lin_acc_inc = div64_u64(((u64)(src_w >> dcm_shift) - 1) << 24, lltmp);
203*4882a593Smuzhiyun 	lin_acc_inc_u = 0;
204*4882a593Smuzhiyun 	col_acc_offset = 0;
205*4882a593Smuzhiyun 
206*4882a593Smuzhiyun 	dev_dbg(dev, "hs config: src_w = %d, dst_w = %d, decimation = %s, lin_acc_inc = %08x\n",
207*4882a593Smuzhiyun 		src_w, dst_w, dcm_shift == 2 ? "4x" :
208*4882a593Smuzhiyun 		(dcm_shift == 1 ? "2x" : "none"), lin_acc_inc);
209*4882a593Smuzhiyun 
210*4882a593Smuzhiyun 	/* configure vertical scaler */
211*4882a593Smuzhiyun 
212*4882a593Smuzhiyun 	/* use RAV for vertical scaler if vertical downscaling is > 4x */
213*4882a593Smuzhiyun 	if (dst_h < (src_h >> 2)) {
214*4882a593Smuzhiyun 		use_rav = true;
215*4882a593Smuzhiyun 		val |= CFG_USE_RAV;
216*4882a593Smuzhiyun 	} else {
217*4882a593Smuzhiyun 		use_rav = false;
218*4882a593Smuzhiyun 	}
219*4882a593Smuzhiyun 
220*4882a593Smuzhiyun 	if (use_rav) {
221*4882a593Smuzhiyun 		/* use RAV */
222*4882a593Smuzhiyun 		factor = (u16) ((dst_h << 10) / src_h);
223*4882a593Smuzhiyun 
224*4882a593Smuzhiyun 		row_acc_init_rav = factor + ((1 + factor) >> 1);
225*4882a593Smuzhiyun 		if (row_acc_init_rav >= 1024)
226*4882a593Smuzhiyun 			row_acc_init_rav -= 1024;
227*4882a593Smuzhiyun 
228*4882a593Smuzhiyun 		row_acc_init_rav_b = row_acc_init_rav +
229*4882a593Smuzhiyun 				(1 + (row_acc_init_rav >> 1)) -
230*4882a593Smuzhiyun 				(1024 >> 1);
231*4882a593Smuzhiyun 
232*4882a593Smuzhiyun 		if (row_acc_init_rav_b < 0) {
233*4882a593Smuzhiyun 			row_acc_init_rav_b += row_acc_init_rav;
234*4882a593Smuzhiyun 			row_acc_init_rav *= 2;
235*4882a593Smuzhiyun 		}
236*4882a593Smuzhiyun 
237*4882a593Smuzhiyun 		dev_dbg(dev, "vs config(RAV): src_h = %d, dst_h = %d, factor = %d, acc_init = %08x, acc_init_b = %08x\n",
238*4882a593Smuzhiyun 			src_h, dst_h, factor, row_acc_init_rav,
239*4882a593Smuzhiyun 			row_acc_init_rav_b);
240*4882a593Smuzhiyun 	} else {
241*4882a593Smuzhiyun 		/* use polyphase */
242*4882a593Smuzhiyun 		row_acc_inc = ((src_h - 1) << 16) / (dst_h - 1);
243*4882a593Smuzhiyun 		row_acc_offset = 0;
244*4882a593Smuzhiyun 		row_acc_offset_b = 0;
245*4882a593Smuzhiyun 
246*4882a593Smuzhiyun 		dev_dbg(dev, "vs config(POLY): src_h = %d, dst_h = %d,row_acc_inc = %08x\n",
247*4882a593Smuzhiyun 			src_h, dst_h, row_acc_inc);
248*4882a593Smuzhiyun 	}
249*4882a593Smuzhiyun 
250*4882a593Smuzhiyun 
251*4882a593Smuzhiyun 	sc_reg0[0] = val;
252*4882a593Smuzhiyun 	sc_reg0[1] = row_acc_inc;
253*4882a593Smuzhiyun 	sc_reg0[2] = row_acc_offset;
254*4882a593Smuzhiyun 	sc_reg0[3] = row_acc_offset_b;
255*4882a593Smuzhiyun 
256*4882a593Smuzhiyun 	sc_reg0[4] = ((lin_acc_inc_u & CFG_LIN_ACC_INC_U_MASK) <<
257*4882a593Smuzhiyun 			CFG_LIN_ACC_INC_U_SHIFT) | (dst_w << CFG_TAR_W_SHIFT) |
258*4882a593Smuzhiyun 			(dst_h << CFG_TAR_H_SHIFT);
259*4882a593Smuzhiyun 
260*4882a593Smuzhiyun 	sc_reg0[5] = (src_w << CFG_SRC_W_SHIFT) | (src_h << CFG_SRC_H_SHIFT);
261*4882a593Smuzhiyun 
262*4882a593Smuzhiyun 	sc_reg0[6] = (row_acc_init_rav_b << CFG_ROW_ACC_INIT_RAV_B_SHIFT) |
263*4882a593Smuzhiyun 		(row_acc_init_rav << CFG_ROW_ACC_INIT_RAV_SHIFT);
264*4882a593Smuzhiyun 
265*4882a593Smuzhiyun 	*sc_reg9 = lin_acc_inc;
266*4882a593Smuzhiyun 
267*4882a593Smuzhiyun 	*sc_reg12 = col_acc_offset << CFG_COL_ACC_OFFSET_SHIFT;
268*4882a593Smuzhiyun 
269*4882a593Smuzhiyun 	*sc_reg13 = factor;
270*4882a593Smuzhiyun 
271*4882a593Smuzhiyun 	*sc_reg24 = (src_w << CFG_ORG_W_SHIFT) | (src_h << CFG_ORG_H_SHIFT);
272*4882a593Smuzhiyun }
273*4882a593Smuzhiyun EXPORT_SYMBOL(sc_config_scaler);
274*4882a593Smuzhiyun 
sc_create(struct platform_device * pdev,const char * res_name)275*4882a593Smuzhiyun struct sc_data *sc_create(struct platform_device *pdev, const char *res_name)
276*4882a593Smuzhiyun {
277*4882a593Smuzhiyun 	struct sc_data *sc;
278*4882a593Smuzhiyun 
279*4882a593Smuzhiyun 	dev_dbg(&pdev->dev, "sc_create\n");
280*4882a593Smuzhiyun 
281*4882a593Smuzhiyun 	sc = devm_kzalloc(&pdev->dev, sizeof(*sc), GFP_KERNEL);
282*4882a593Smuzhiyun 	if (!sc) {
283*4882a593Smuzhiyun 		dev_err(&pdev->dev, "couldn't alloc sc_data\n");
284*4882a593Smuzhiyun 		return ERR_PTR(-ENOMEM);
285*4882a593Smuzhiyun 	}
286*4882a593Smuzhiyun 
287*4882a593Smuzhiyun 	sc->pdev = pdev;
288*4882a593Smuzhiyun 
289*4882a593Smuzhiyun 	sc->res = platform_get_resource_byname(pdev, IORESOURCE_MEM, res_name);
290*4882a593Smuzhiyun 	if (!sc->res) {
291*4882a593Smuzhiyun 		dev_err(&pdev->dev, "missing '%s' platform resources data\n",
292*4882a593Smuzhiyun 			res_name);
293*4882a593Smuzhiyun 		return ERR_PTR(-ENODEV);
294*4882a593Smuzhiyun 	}
295*4882a593Smuzhiyun 
296*4882a593Smuzhiyun 	sc->base = devm_ioremap_resource(&pdev->dev, sc->res);
297*4882a593Smuzhiyun 	if (IS_ERR(sc->base)) {
298*4882a593Smuzhiyun 		dev_err(&pdev->dev, "failed to ioremap\n");
299*4882a593Smuzhiyun 		return ERR_CAST(sc->base);
300*4882a593Smuzhiyun 	}
301*4882a593Smuzhiyun 
302*4882a593Smuzhiyun 	return sc;
303*4882a593Smuzhiyun }
304*4882a593Smuzhiyun EXPORT_SYMBOL(sc_create);
305*4882a593Smuzhiyun 
306*4882a593Smuzhiyun MODULE_DESCRIPTION("TI VIP/VPE Scaler");
307*4882a593Smuzhiyun MODULE_AUTHOR("Texas Instruments Inc.");
308*4882a593Smuzhiyun MODULE_LICENSE("GPL v2");
309