xref: /OK3568_Linux_fs/kernel/drivers/media/platform/coda/coda-jpeg.c (revision 4882a59341e53eb6f0b4789bf948001014eff981)
1*4882a593Smuzhiyun // SPDX-License-Identifier: GPL-2.0-or-later
2*4882a593Smuzhiyun /*
3*4882a593Smuzhiyun  * Coda multi-standard codec IP - JPEG support functions
4*4882a593Smuzhiyun  *
5*4882a593Smuzhiyun  * Copyright (C) 2014 Philipp Zabel, Pengutronix
6*4882a593Smuzhiyun  */
7*4882a593Smuzhiyun 
8*4882a593Smuzhiyun #include <asm/unaligned.h>
9*4882a593Smuzhiyun #include <linux/irqreturn.h>
10*4882a593Smuzhiyun #include <linux/kernel.h>
11*4882a593Smuzhiyun #include <linux/ktime.h>
12*4882a593Smuzhiyun #include <linux/slab.h>
13*4882a593Smuzhiyun #include <linux/swab.h>
14*4882a593Smuzhiyun #include <linux/videodev2.h>
15*4882a593Smuzhiyun 
16*4882a593Smuzhiyun #include <media/v4l2-common.h>
17*4882a593Smuzhiyun #include <media/v4l2-fh.h>
18*4882a593Smuzhiyun #include <media/v4l2-jpeg.h>
19*4882a593Smuzhiyun #include <media/v4l2-mem2mem.h>
20*4882a593Smuzhiyun #include <media/videobuf2-core.h>
21*4882a593Smuzhiyun #include <media/videobuf2-dma-contig.h>
22*4882a593Smuzhiyun 
23*4882a593Smuzhiyun #include "coda.h"
24*4882a593Smuzhiyun #include "trace.h"
25*4882a593Smuzhiyun 
/*
 * Two-byte JPEG marker codes. SOI_MARKER and EOI_MARKER are compared
 * against big-endian 16-bit reads from the start and end of the bitstream
 * buffer in coda_jpeg_check_buffer().
 */
26*4882a593Smuzhiyun #define SOI_MARKER	0xffd8
27*4882a593Smuzhiyun #define APP9_MARKER	0xffe9
28*4882a593Smuzhiyun #define DRI_MARKER	0xffdd
29*4882a593Smuzhiyun #define DQT_MARKER	0xffdb
30*4882a593Smuzhiyun #define DHT_MARKER	0xffc4
31*4882a593Smuzhiyun #define SOF_MARKER	0xffc0
32*4882a593Smuzhiyun #define SOS_MARKER	0xffda
33*4882a593Smuzhiyun #define EOI_MARKER	0xffd9
34*4882a593Smuzhiyun 
/*
 * Chroma format indices. The values are used as array indices for the
 * per-format lookup tables in this file (width_align, height_align,
 * bus_req_num and mcu_info) and are returned by
 * coda9_jpeg_chroma_format().
 */
35*4882a593Smuzhiyun enum {
36*4882a593Smuzhiyun 	CODA9_JPEG_FORMAT_420,
37*4882a593Smuzhiyun 	CODA9_JPEG_FORMAT_422,
38*4882a593Smuzhiyun 	CODA9_JPEG_FORMAT_224,
39*4882a593Smuzhiyun 	CODA9_JPEG_FORMAT_444,
40*4882a593Smuzhiyun 	CODA9_JPEG_FORMAT_400,
41*4882a593Smuzhiyun };
42*4882a593Smuzhiyun 
/*
 * Huffman tables used for JPEG decoding.
 *
 * The four u8 arrays each hold 16 code-length counts ("bits") followed by
 * the symbol values: up to 12 for the DC tables and up to 162 for the AC
 * tables. coda_jpeg_decode_header() fills them from the tables found in
 * the stream header.
 *
 * min, max and ptr each hold 16 entries per table and are written to the
 * Huffman registers by coda9_jpeg_dec_huff_setup().
 * NOTE(review): they are presumably filled by
 * coda9_jpeg_gen_dec_huff_tab(), which is not visible here - confirm.
 */
43*4882a593Smuzhiyun struct coda_huff_tab {
44*4882a593Smuzhiyun 	u8 luma_dc[16 + 12];
45*4882a593Smuzhiyun 	u8 chroma_dc[16 + 12];
46*4882a593Smuzhiyun 	u8 luma_ac[16 + 162];
47*4882a593Smuzhiyun 	u8 chroma_ac[16 + 162];
48*4882a593Smuzhiyun 
49*4882a593Smuzhiyun 	/* DC Luma, DC Chroma, AC Luma, AC Chroma */
50*4882a593Smuzhiyun 	s16	min[4 * 16];
51*4882a593Smuzhiyun 	s16	max[4 * 16];
52*4882a593Smuzhiyun 	s8	ptr[4 * 16];
53*4882a593Smuzhiyun };
54*4882a593Smuzhiyun 
55*4882a593Smuzhiyun #define CODA9_JPEG_ENC_HUFF_DATA_SIZE	(256 + 256 + 16 + 16)
56*4882a593Smuzhiyun 
57*4882a593Smuzhiyun /*
58*4882a593Smuzhiyun  * Typical Huffman tables for 8-bit precision luminance and
59*4882a593Smuzhiyun  * chrominance from JPEG ITU-T.81 (ISO/IEC 10918-1) Annex K.3
60*4882a593Smuzhiyun  */
61*4882a593Smuzhiyun 
/*
 * Default luminance DC Huffman table: 16 code-length counts followed by
 * 12 symbol values.
 */
62*4882a593Smuzhiyun static const unsigned char luma_dc[16 + 12] = {
63*4882a593Smuzhiyun 	/* bits */
64*4882a593Smuzhiyun 	0x00, 0x01, 0x05, 0x01, 0x01, 0x01, 0x01, 0x01,
65*4882a593Smuzhiyun 	0x01, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
66*4882a593Smuzhiyun 	/* values */
67*4882a593Smuzhiyun 	0x00, 0x01, 0x02, 0x03, 0x04, 0x05, 0x06, 0x07,
68*4882a593Smuzhiyun 	0x08, 0x09, 0x0a, 0x0b,
69*4882a593Smuzhiyun };
70*4882a593Smuzhiyun 
/*
 * Default chrominance DC Huffman table: 16 code-length counts followed by
 * 12 symbol values.
 */
71*4882a593Smuzhiyun static const unsigned char chroma_dc[16 + 12] = {
72*4882a593Smuzhiyun 	/* bits */
73*4882a593Smuzhiyun 	0x00, 0x03, 0x01, 0x01, 0x01, 0x01, 0x01, 0x01,
74*4882a593Smuzhiyun 	0x01, 0x01, 0x01, 0x00, 0x00, 0x00, 0x00, 0x00,
75*4882a593Smuzhiyun 	/* values */
76*4882a593Smuzhiyun 	0x00, 0x01, 0x02, 0x03, 0x04, 0x05, 0x06, 0x07,
77*4882a593Smuzhiyun 	0x08, 0x09, 0x0a, 0x0b,
78*4882a593Smuzhiyun };
79*4882a593Smuzhiyun 
/*
 * Default luminance AC Huffman table: 16 code-length counts followed by
 * 162 symbol values. The array is declared two bytes larger than the
 * initializer so that its size is a multiple of four; the two trailing
 * bytes are implicitly zero.
 */
80*4882a593Smuzhiyun static const unsigned char luma_ac[16 + 162 + 2] = {
81*4882a593Smuzhiyun 	/* bits */
82*4882a593Smuzhiyun 	0x00, 0x02, 0x01, 0x03, 0x03, 0x02, 0x04, 0x03,
83*4882a593Smuzhiyun 	0x05, 0x05, 0x04, 0x04, 0x00, 0x00, 0x01, 0x7d,
84*4882a593Smuzhiyun 	/* values */
85*4882a593Smuzhiyun 	0x01, 0x02, 0x03, 0x00, 0x04, 0x11, 0x05, 0x12,
86*4882a593Smuzhiyun 	0x21, 0x31, 0x41, 0x06, 0x13, 0x51, 0x61, 0x07,
87*4882a593Smuzhiyun 	0x22, 0x71, 0x14, 0x32, 0x81, 0x91, 0xa1, 0x08,
88*4882a593Smuzhiyun 	0x23, 0x42, 0xb1, 0xc1, 0x15, 0x52, 0xd1, 0xf0,
89*4882a593Smuzhiyun 	0x24, 0x33, 0x62, 0x72, 0x82, 0x09, 0x0a, 0x16,
90*4882a593Smuzhiyun 	0x17, 0x18, 0x19, 0x1a, 0x25, 0x26, 0x27, 0x28,
91*4882a593Smuzhiyun 	0x29, 0x2a, 0x34, 0x35, 0x36, 0x37, 0x38, 0x39,
92*4882a593Smuzhiyun 	0x3a, 0x43, 0x44, 0x45, 0x46, 0x47, 0x48, 0x49,
93*4882a593Smuzhiyun 	0x4a, 0x53, 0x54, 0x55, 0x56, 0x57, 0x58, 0x59,
94*4882a593Smuzhiyun 	0x5a, 0x63, 0x64, 0x65, 0x66, 0x67, 0x68, 0x69,
95*4882a593Smuzhiyun 	0x6a, 0x73, 0x74, 0x75, 0x76, 0x77, 0x78, 0x79,
96*4882a593Smuzhiyun 	0x7a, 0x83, 0x84, 0x85, 0x86, 0x87, 0x88, 0x89,
97*4882a593Smuzhiyun 	0x8a, 0x92, 0x93, 0x94, 0x95, 0x96, 0x97, 0x98,
98*4882a593Smuzhiyun 	0x99, 0x9a, 0xa2, 0xa3, 0xa4, 0xa5, 0xa6, 0xa7,
99*4882a593Smuzhiyun 	0xa8, 0xa9, 0xaa, 0xb2, 0xb3, 0xb4, 0xb5, 0xb6,
100*4882a593Smuzhiyun 	0xb7, 0xb8, 0xb9, 0xba, 0xc2, 0xc3, 0xc4, 0xc5,
101*4882a593Smuzhiyun 	0xc6, 0xc7, 0xc8, 0xc9, 0xca, 0xd2, 0xd3, 0xd4,
102*4882a593Smuzhiyun 	0xd5, 0xd6, 0xd7, 0xd8, 0xd9, 0xda, 0xe1, 0xe2,
103*4882a593Smuzhiyun 	0xe3, 0xe4, 0xe5, 0xe6, 0xe7, 0xe8, 0xe9, 0xea,
104*4882a593Smuzhiyun 	0xf1, 0xf2, 0xf3, 0xf4, 0xf5, 0xf6, 0xf7, 0xf8,
105*4882a593Smuzhiyun 	0xf9, 0xfa, /* padded to 32-bit */
106*4882a593Smuzhiyun };
107*4882a593Smuzhiyun 
/*
 * Default chrominance AC Huffman table: 16 code-length counts followed by
 * 162 symbol values. The array is declared two bytes larger than the
 * initializer so that its size is a multiple of four; the two trailing
 * bytes are implicitly zero.
 */
108*4882a593Smuzhiyun static const unsigned char chroma_ac[16 + 162 + 2] = {
109*4882a593Smuzhiyun 	/* bits */
110*4882a593Smuzhiyun 	0x00, 0x02, 0x01, 0x02, 0x04, 0x04, 0x03, 0x04,
111*4882a593Smuzhiyun 	0x07, 0x05, 0x04, 0x04, 0x00, 0x01, 0x02, 0x77,
112*4882a593Smuzhiyun 	/* values */
113*4882a593Smuzhiyun 	0x00, 0x01, 0x02, 0x03, 0x11, 0x04, 0x05, 0x21,
114*4882a593Smuzhiyun 	0x31, 0x06, 0x12, 0x41, 0x51, 0x07, 0x61, 0x71,
115*4882a593Smuzhiyun 	0x13, 0x22, 0x32, 0x81, 0x08, 0x14, 0x42, 0x91,
116*4882a593Smuzhiyun 	0xa1, 0xb1, 0xc1, 0x09, 0x23, 0x33, 0x52, 0xf0,
117*4882a593Smuzhiyun 	0x15, 0x62, 0x72, 0xd1, 0x0a, 0x16, 0x24, 0x34,
118*4882a593Smuzhiyun 	0xe1, 0x25, 0xf1, 0x17, 0x18, 0x19, 0x1a, 0x26,
119*4882a593Smuzhiyun 	0x27, 0x28, 0x29, 0x2a, 0x35, 0x36, 0x37, 0x38,
120*4882a593Smuzhiyun 	0x39, 0x3a, 0x43, 0x44, 0x45, 0x46, 0x47, 0x48,
121*4882a593Smuzhiyun 	0x49, 0x4a, 0x53, 0x54, 0x55, 0x56, 0x57, 0x58,
122*4882a593Smuzhiyun 	0x59, 0x5a, 0x63, 0x64, 0x65, 0x66, 0x67, 0x68,
123*4882a593Smuzhiyun 	0x69, 0x6a, 0x73, 0x74, 0x75, 0x76, 0x77, 0x78,
124*4882a593Smuzhiyun 	0x79, 0x7a, 0x82, 0x83, 0x84, 0x85, 0x86, 0x87,
125*4882a593Smuzhiyun 	0x88, 0x89, 0x8a, 0x92, 0x93, 0x94, 0x95, 0x96,
126*4882a593Smuzhiyun 	0x97, 0x98, 0x99, 0x9a, 0xa2, 0xa3, 0xa4, 0xa5,
127*4882a593Smuzhiyun 	0xa6, 0xa7, 0xa8, 0xa9, 0xaa, 0xb2, 0xb3, 0xb4,
128*4882a593Smuzhiyun 	0xb5, 0xb6, 0xb7, 0xb8, 0xb9, 0xba, 0xc2, 0xc3,
129*4882a593Smuzhiyun 	0xc4, 0xc5, 0xc6, 0xc7, 0xc8, 0xc9, 0xca, 0xd2,
130*4882a593Smuzhiyun 	0xd3, 0xd4, 0xd5, 0xd6, 0xd7, 0xd8, 0xd9, 0xda,
131*4882a593Smuzhiyun 	0xe2, 0xe3, 0xe4, 0xe5, 0xe6, 0xe7, 0xe8, 0xe9,
132*4882a593Smuzhiyun 	0xea, 0xf2, 0xf3, 0xf4, 0xf5, 0xf6, 0xf7, 0xf8,
133*4882a593Smuzhiyun 	0xf9, 0xfa, /* padded to 32-bit */
134*4882a593Smuzhiyun };
135*4882a593Smuzhiyun 
136*4882a593Smuzhiyun /*
137*4882a593Smuzhiyun  * Quantization tables for luminance and chrominance components in
138*4882a593Smuzhiyun  * zig-zag scan order from the Freescale i.MX VPU libraries
139*4882a593Smuzhiyun  */
140*4882a593Smuzhiyun 
/* Default 64-entry luminance quantization table, in zig-zag scan order */
141*4882a593Smuzhiyun static unsigned char luma_q[64] = {
142*4882a593Smuzhiyun 	0x06, 0x04, 0x04, 0x04, 0x05, 0x04, 0x06, 0x05,
143*4882a593Smuzhiyun 	0x05, 0x06, 0x09, 0x06, 0x05, 0x06, 0x09, 0x0b,
144*4882a593Smuzhiyun 	0x08, 0x06, 0x06, 0x08, 0x0b, 0x0c, 0x0a, 0x0a,
145*4882a593Smuzhiyun 	0x0b, 0x0a, 0x0a, 0x0c, 0x10, 0x0c, 0x0c, 0x0c,
146*4882a593Smuzhiyun 	0x0c, 0x0c, 0x0c, 0x10, 0x0c, 0x0c, 0x0c, 0x0c,
147*4882a593Smuzhiyun 	0x0c, 0x0c, 0x0c, 0x0c, 0x0c, 0x0c, 0x0c, 0x0c,
148*4882a593Smuzhiyun 	0x0c, 0x0c, 0x0c, 0x0c, 0x0c, 0x0c, 0x0c, 0x0c,
149*4882a593Smuzhiyun 	0x0c, 0x0c, 0x0c, 0x0c, 0x0c, 0x0c, 0x0c, 0x0c,
150*4882a593Smuzhiyun };
151*4882a593Smuzhiyun 
/* Default 64-entry chrominance quantization table, in zig-zag scan order */
152*4882a593Smuzhiyun static unsigned char chroma_q[64] = {
153*4882a593Smuzhiyun 	0x07, 0x07, 0x07, 0x0d, 0x0c, 0x0d, 0x18, 0x10,
154*4882a593Smuzhiyun 	0x10, 0x18, 0x14, 0x0e, 0x0e, 0x0e, 0x14, 0x14,
155*4882a593Smuzhiyun 	0x0e, 0x0e, 0x0e, 0x0e, 0x14, 0x11, 0x0c, 0x0c,
156*4882a593Smuzhiyun 	0x0c, 0x0c, 0x0c, 0x11, 0x11, 0x0c, 0x0c, 0x0c,
157*4882a593Smuzhiyun 	0x0c, 0x0c, 0x0c, 0x11, 0x0c, 0x0c, 0x0c, 0x0c,
158*4882a593Smuzhiyun 	0x0c, 0x0c, 0x0c, 0x0c, 0x0c, 0x0c, 0x0c, 0x0c,
159*4882a593Smuzhiyun 	0x0c, 0x0c, 0x0c, 0x0c, 0x0c, 0x0c, 0x0c, 0x0c,
160*4882a593Smuzhiyun 	0x0c, 0x0c, 0x0c, 0x0c, 0x0c, 0x0c, 0x0c, 0x0c,
161*4882a593Smuzhiyun };
162*4882a593Smuzhiyun 
/*
 * Width alignment value per chroma format, indexed by CODA9_JPEG_FORMAT_*.
 * NOTE(review): presumably the MCU width in pixels - confirm against the
 * users of this table.
 */
163*4882a593Smuzhiyun static const unsigned char width_align[] = {
164*4882a593Smuzhiyun 	[CODA9_JPEG_FORMAT_420] = 16,
165*4882a593Smuzhiyun 	[CODA9_JPEG_FORMAT_422] = 16,
166*4882a593Smuzhiyun 	[CODA9_JPEG_FORMAT_224] = 8,
167*4882a593Smuzhiyun 	[CODA9_JPEG_FORMAT_444] = 8,
168*4882a593Smuzhiyun 	[CODA9_JPEG_FORMAT_400] = 8,
169*4882a593Smuzhiyun };
170*4882a593Smuzhiyun 
/*
 * Height alignment value per chroma format, indexed by CODA9_JPEG_FORMAT_*.
 * NOTE(review): presumably the MCU height in pixels - confirm against the
 * users of this table.
 */
171*4882a593Smuzhiyun static const unsigned char height_align[] = {
172*4882a593Smuzhiyun 	[CODA9_JPEG_FORMAT_420] = 16,
173*4882a593Smuzhiyun 	[CODA9_JPEG_FORMAT_422] = 8,
174*4882a593Smuzhiyun 	[CODA9_JPEG_FORMAT_224] = 16,
175*4882a593Smuzhiyun 	[CODA9_JPEG_FORMAT_444] = 8,
176*4882a593Smuzhiyun 	[CODA9_JPEG_FORMAT_400] = 8,
177*4882a593Smuzhiyun };
178*4882a593Smuzhiyun 
/*
 * Translate a V4L2 pixel format into the corresponding
 * CODA9_JPEG_FORMAT_* chroma format index.
 *
 * Returns the chroma format index, or -EINVAL if the pixel format is not
 * one of the formats handled here.
 */
static int coda9_jpeg_chroma_format(u32 pixfmt)
{
	/* Planar and semi-planar 4:2:0 share the same chroma format */
	if (pixfmt == V4L2_PIX_FMT_YUV420 || pixfmt == V4L2_PIX_FMT_NV12)
		return CODA9_JPEG_FORMAT_420;

	if (pixfmt == V4L2_PIX_FMT_YUV422P)
		return CODA9_JPEG_FORMAT_422;

	if (pixfmt == V4L2_PIX_FMT_YUV444)
		return CODA9_JPEG_FORMAT_444;

	if (pixfmt == V4L2_PIX_FMT_GREY)
		return CODA9_JPEG_FORMAT_400;

	return -EINVAL;
}
194*4882a593Smuzhiyun 
195*4882a593Smuzhiyun struct coda_memcpy_desc {
196*4882a593Smuzhiyun 	int offset;
197*4882a593Smuzhiyun 	const void *src;
198*4882a593Smuzhiyun 	size_t len;
199*4882a593Smuzhiyun };
200*4882a593Smuzhiyun 
coda_memcpy_parabuf(void * parabuf,const struct coda_memcpy_desc * desc)201*4882a593Smuzhiyun static void coda_memcpy_parabuf(void *parabuf,
202*4882a593Smuzhiyun 				const struct coda_memcpy_desc *desc)
203*4882a593Smuzhiyun {
204*4882a593Smuzhiyun 	u32 *dst = parabuf + desc->offset;
205*4882a593Smuzhiyun 	const u32 *src = desc->src;
206*4882a593Smuzhiyun 	int len = desc->len / 4;
207*4882a593Smuzhiyun 	int i;
208*4882a593Smuzhiyun 
209*4882a593Smuzhiyun 	for (i = 0; i < len; i += 2) {
210*4882a593Smuzhiyun 		dst[i + 1] = swab32(src[i]);
211*4882a593Smuzhiyun 		dst[i] = swab32(src[i + 1]);
212*4882a593Smuzhiyun 	}
213*4882a593Smuzhiyun }
214*4882a593Smuzhiyun 
coda_jpeg_write_tables(struct coda_ctx * ctx)215*4882a593Smuzhiyun int coda_jpeg_write_tables(struct coda_ctx *ctx)
216*4882a593Smuzhiyun {
217*4882a593Smuzhiyun 	int i;
218*4882a593Smuzhiyun 	static const struct coda_memcpy_desc huff[8] = {
219*4882a593Smuzhiyun 		{ 0,   luma_dc,    sizeof(luma_dc)    },
220*4882a593Smuzhiyun 		{ 32,  luma_ac,    sizeof(luma_ac)    },
221*4882a593Smuzhiyun 		{ 216, chroma_dc,  sizeof(chroma_dc)  },
222*4882a593Smuzhiyun 		{ 248, chroma_ac,  sizeof(chroma_ac)  },
223*4882a593Smuzhiyun 	};
224*4882a593Smuzhiyun 	struct coda_memcpy_desc qmat[3] = {
225*4882a593Smuzhiyun 		{ 512, ctx->params.jpeg_qmat_tab[0], 64 },
226*4882a593Smuzhiyun 		{ 576, ctx->params.jpeg_qmat_tab[1], 64 },
227*4882a593Smuzhiyun 		{ 640, ctx->params.jpeg_qmat_tab[1], 64 },
228*4882a593Smuzhiyun 	};
229*4882a593Smuzhiyun 
230*4882a593Smuzhiyun 	/* Write huffman tables to parameter memory */
231*4882a593Smuzhiyun 	for (i = 0; i < ARRAY_SIZE(huff); i++)
232*4882a593Smuzhiyun 		coda_memcpy_parabuf(ctx->parabuf.vaddr, huff + i);
233*4882a593Smuzhiyun 
234*4882a593Smuzhiyun 	/* Write Q-matrix to parameter memory */
235*4882a593Smuzhiyun 	for (i = 0; i < ARRAY_SIZE(qmat); i++)
236*4882a593Smuzhiyun 		coda_memcpy_parabuf(ctx->parabuf.vaddr, qmat + i);
237*4882a593Smuzhiyun 
238*4882a593Smuzhiyun 	return 0;
239*4882a593Smuzhiyun }
240*4882a593Smuzhiyun 
coda_jpeg_check_buffer(struct coda_ctx * ctx,struct vb2_buffer * vb)241*4882a593Smuzhiyun bool coda_jpeg_check_buffer(struct coda_ctx *ctx, struct vb2_buffer *vb)
242*4882a593Smuzhiyun {
243*4882a593Smuzhiyun 	void *vaddr = vb2_plane_vaddr(vb, 0);
244*4882a593Smuzhiyun 	u16 soi, eoi;
245*4882a593Smuzhiyun 	int len, i;
246*4882a593Smuzhiyun 
247*4882a593Smuzhiyun 	soi = be16_to_cpup((__be16 *)vaddr);
248*4882a593Smuzhiyun 	if (soi != SOI_MARKER)
249*4882a593Smuzhiyun 		return false;
250*4882a593Smuzhiyun 
251*4882a593Smuzhiyun 	len = vb2_get_plane_payload(vb, 0);
252*4882a593Smuzhiyun 	vaddr += len - 2;
253*4882a593Smuzhiyun 	for (i = 0; i < 32; i++) {
254*4882a593Smuzhiyun 		eoi = be16_to_cpup((__be16 *)(vaddr - i));
255*4882a593Smuzhiyun 		if (eoi == EOI_MARKER) {
256*4882a593Smuzhiyun 			if (i > 0)
257*4882a593Smuzhiyun 				vb2_set_plane_payload(vb, 0, len - i);
258*4882a593Smuzhiyun 			return true;
259*4882a593Smuzhiyun 		}
260*4882a593Smuzhiyun 	}
261*4882a593Smuzhiyun 
262*4882a593Smuzhiyun 	return false;
263*4882a593Smuzhiyun }
264*4882a593Smuzhiyun 
265*4882a593Smuzhiyun static int coda9_jpeg_gen_dec_huff_tab(struct coda_ctx *ctx, int tab_num);
266*4882a593Smuzhiyun 
coda_jpeg_decode_header(struct coda_ctx * ctx,struct vb2_buffer * vb)267*4882a593Smuzhiyun int coda_jpeg_decode_header(struct coda_ctx *ctx, struct vb2_buffer *vb)
268*4882a593Smuzhiyun {
269*4882a593Smuzhiyun 	struct coda_dev *dev = ctx->dev;
270*4882a593Smuzhiyun 	u8 *buf = vb2_plane_vaddr(vb, 0);
271*4882a593Smuzhiyun 	size_t len = vb2_get_plane_payload(vb, 0);
272*4882a593Smuzhiyun 	struct v4l2_jpeg_scan_header scan_header;
273*4882a593Smuzhiyun 	struct v4l2_jpeg_reference quantization_tables[4] = { };
274*4882a593Smuzhiyun 	struct v4l2_jpeg_reference huffman_tables[4] = { };
275*4882a593Smuzhiyun 	struct v4l2_jpeg_header header = {
276*4882a593Smuzhiyun 		.scan = &scan_header,
277*4882a593Smuzhiyun 		.quantization_tables = quantization_tables,
278*4882a593Smuzhiyun 		.huffman_tables = huffman_tables,
279*4882a593Smuzhiyun 	};
280*4882a593Smuzhiyun 	struct coda_q_data *q_data_src;
281*4882a593Smuzhiyun 	struct coda_huff_tab *huff_tab;
282*4882a593Smuzhiyun 	int i, j, ret;
283*4882a593Smuzhiyun 
284*4882a593Smuzhiyun 	ret = v4l2_jpeg_parse_header(buf, len, &header);
285*4882a593Smuzhiyun 	if (ret < 0) {
286*4882a593Smuzhiyun 		v4l2_err(&dev->v4l2_dev, "failed to parse header\n");
287*4882a593Smuzhiyun 		return ret;
288*4882a593Smuzhiyun 	}
289*4882a593Smuzhiyun 
290*4882a593Smuzhiyun 	ctx->params.jpeg_restart_interval = header.restart_interval;
291*4882a593Smuzhiyun 
292*4882a593Smuzhiyun 	/* check frame header */
293*4882a593Smuzhiyun 	if (header.frame.height > ctx->codec->max_h ||
294*4882a593Smuzhiyun 	    header.frame.width > ctx->codec->max_w) {
295*4882a593Smuzhiyun 		v4l2_err(&dev->v4l2_dev, "invalid dimensions: %dx%d\n",
296*4882a593Smuzhiyun 			 header.frame.width, header.frame.height);
297*4882a593Smuzhiyun 		return -EINVAL;
298*4882a593Smuzhiyun 	}
299*4882a593Smuzhiyun 
300*4882a593Smuzhiyun 	q_data_src = get_q_data(ctx, V4L2_BUF_TYPE_VIDEO_OUTPUT);
301*4882a593Smuzhiyun 	if (header.frame.height != q_data_src->height ||
302*4882a593Smuzhiyun 	    header.frame.width != q_data_src->width) {
303*4882a593Smuzhiyun 		v4l2_err(&dev->v4l2_dev,
304*4882a593Smuzhiyun 			 "dimensions don't match format: %dx%d\n",
305*4882a593Smuzhiyun 			 header.frame.width, header.frame.height);
306*4882a593Smuzhiyun 		return -EINVAL;
307*4882a593Smuzhiyun 	}
308*4882a593Smuzhiyun 
309*4882a593Smuzhiyun 	if (header.frame.num_components != 3) {
310*4882a593Smuzhiyun 		v4l2_err(&dev->v4l2_dev,
311*4882a593Smuzhiyun 			 "unsupported number of components: %d\n",
312*4882a593Smuzhiyun 			 header.frame.num_components);
313*4882a593Smuzhiyun 		return -EINVAL;
314*4882a593Smuzhiyun 	}
315*4882a593Smuzhiyun 
316*4882a593Smuzhiyun 	/* install quantization tables */
317*4882a593Smuzhiyun 	if (quantization_tables[3].start) {
318*4882a593Smuzhiyun 		v4l2_err(&dev->v4l2_dev,
319*4882a593Smuzhiyun 			 "only 3 quantization tables supported\n");
320*4882a593Smuzhiyun 		return -EINVAL;
321*4882a593Smuzhiyun 	}
322*4882a593Smuzhiyun 	for (i = 0; i < 3; i++) {
323*4882a593Smuzhiyun 		if (!quantization_tables[i].start)
324*4882a593Smuzhiyun 			continue;
325*4882a593Smuzhiyun 		if (quantization_tables[i].length != 64) {
326*4882a593Smuzhiyun 			v4l2_err(&dev->v4l2_dev,
327*4882a593Smuzhiyun 				 "only 8-bit quantization tables supported\n");
328*4882a593Smuzhiyun 			continue;
329*4882a593Smuzhiyun 		}
330*4882a593Smuzhiyun 		if (!ctx->params.jpeg_qmat_tab[i]) {
331*4882a593Smuzhiyun 			ctx->params.jpeg_qmat_tab[i] = kmalloc(64, GFP_KERNEL);
332*4882a593Smuzhiyun 			if (!ctx->params.jpeg_qmat_tab[i])
333*4882a593Smuzhiyun 				return -ENOMEM;
334*4882a593Smuzhiyun 		}
335*4882a593Smuzhiyun 		memcpy(ctx->params.jpeg_qmat_tab[i],
336*4882a593Smuzhiyun 		       quantization_tables[i].start, 64);
337*4882a593Smuzhiyun 	}
338*4882a593Smuzhiyun 
339*4882a593Smuzhiyun 	/* install Huffman tables */
340*4882a593Smuzhiyun 	for (i = 0; i < 4; i++) {
341*4882a593Smuzhiyun 		if (!huffman_tables[i].start) {
342*4882a593Smuzhiyun 			v4l2_err(&dev->v4l2_dev, "missing Huffman table\n");
343*4882a593Smuzhiyun 			return -EINVAL;
344*4882a593Smuzhiyun 		}
345*4882a593Smuzhiyun 		/* AC tables should be between 17 -> 178, DC between 17 -> 28 */
346*4882a593Smuzhiyun 		if (huffman_tables[i].length < 17 ||
347*4882a593Smuzhiyun 		    huffman_tables[i].length > 178 ||
348*4882a593Smuzhiyun 		    ((i & 2) == 0 && huffman_tables[i].length > 28)) {
349*4882a593Smuzhiyun 			v4l2_err(&dev->v4l2_dev,
350*4882a593Smuzhiyun 				 "invalid Huffman table %d length: %zu\n",
351*4882a593Smuzhiyun 				 i, huffman_tables[i].length);
352*4882a593Smuzhiyun 			return -EINVAL;
353*4882a593Smuzhiyun 		}
354*4882a593Smuzhiyun 	}
355*4882a593Smuzhiyun 	huff_tab = ctx->params.jpeg_huff_tab;
356*4882a593Smuzhiyun 	if (!huff_tab) {
357*4882a593Smuzhiyun 		huff_tab = kzalloc(sizeof(struct coda_huff_tab), GFP_KERNEL);
358*4882a593Smuzhiyun 		if (!huff_tab)
359*4882a593Smuzhiyun 			return -ENOMEM;
360*4882a593Smuzhiyun 		ctx->params.jpeg_huff_tab = huff_tab;
361*4882a593Smuzhiyun 	}
362*4882a593Smuzhiyun 
363*4882a593Smuzhiyun 	memset(huff_tab, 0, sizeof(*huff_tab));
364*4882a593Smuzhiyun 	memcpy(huff_tab->luma_dc, huffman_tables[0].start, huffman_tables[0].length);
365*4882a593Smuzhiyun 	memcpy(huff_tab->chroma_dc, huffman_tables[1].start, huffman_tables[1].length);
366*4882a593Smuzhiyun 	memcpy(huff_tab->luma_ac, huffman_tables[2].start, huffman_tables[2].length);
367*4882a593Smuzhiyun 	memcpy(huff_tab->chroma_ac, huffman_tables[3].start, huffman_tables[3].length);
368*4882a593Smuzhiyun 
369*4882a593Smuzhiyun 	/* check scan header */
370*4882a593Smuzhiyun 	for (i = 0; i < scan_header.num_components; i++) {
371*4882a593Smuzhiyun 		struct v4l2_jpeg_scan_component_spec *scan_component;
372*4882a593Smuzhiyun 
373*4882a593Smuzhiyun 		scan_component = &scan_header.component[i];
374*4882a593Smuzhiyun 		for (j = 0; j < header.frame.num_components; j++) {
375*4882a593Smuzhiyun 			if (header.frame.component[j].component_identifier ==
376*4882a593Smuzhiyun 			    scan_component->component_selector)
377*4882a593Smuzhiyun 				break;
378*4882a593Smuzhiyun 		}
379*4882a593Smuzhiyun 		if (j == header.frame.num_components)
380*4882a593Smuzhiyun 			continue;
381*4882a593Smuzhiyun 
382*4882a593Smuzhiyun 		ctx->params.jpeg_huff_dc_index[j] =
383*4882a593Smuzhiyun 			scan_component->dc_entropy_coding_table_selector;
384*4882a593Smuzhiyun 		ctx->params.jpeg_huff_ac_index[j] =
385*4882a593Smuzhiyun 			scan_component->ac_entropy_coding_table_selector;
386*4882a593Smuzhiyun 	}
387*4882a593Smuzhiyun 
388*4882a593Smuzhiyun 	/* Generate Huffman table information */
389*4882a593Smuzhiyun 	for (i = 0; i < 4; i++)
390*4882a593Smuzhiyun 		coda9_jpeg_gen_dec_huff_tab(ctx, i);
391*4882a593Smuzhiyun 
392*4882a593Smuzhiyun 	/* start of entropy coded segment */
393*4882a593Smuzhiyun 	ctx->jpeg_ecs_offset = header.ecs_offset;
394*4882a593Smuzhiyun 
395*4882a593Smuzhiyun 	switch (header.frame.subsampling) {
396*4882a593Smuzhiyun 	case V4L2_JPEG_CHROMA_SUBSAMPLING_420:
397*4882a593Smuzhiyun 	case V4L2_JPEG_CHROMA_SUBSAMPLING_422:
398*4882a593Smuzhiyun 		ctx->params.jpeg_chroma_subsampling = header.frame.subsampling;
399*4882a593Smuzhiyun 		break;
400*4882a593Smuzhiyun 	default:
401*4882a593Smuzhiyun 		v4l2_err(&dev->v4l2_dev, "chroma subsampling not supported: %d",
402*4882a593Smuzhiyun 			 header.frame.subsampling);
403*4882a593Smuzhiyun 		return -EINVAL;
404*4882a593Smuzhiyun 	}
405*4882a593Smuzhiyun 
406*4882a593Smuzhiyun 	return 0;
407*4882a593Smuzhiyun }
408*4882a593Smuzhiyun 
/*
 * Write the symbol values of one Huffman table to the HUFF_DATA register.
 *
 * @bits points to the 16 code-length counts of the table, directly
 * followed by its symbol values. The number of symbols in use is the sum
 * of the counts; value slots beyond that, up to @num_values, are
 * overwritten with -1 in place before all @num_values entries are written
 * to the register as sign-extended 32-bit values.
 */
static inline void coda9_jpeg_write_huff_values(struct coda_dev *dev, u8 *bits,
						int num_values)
{
	s8 *symbols = (s8 *)&bits[16];
	int used = 0;
	int n;

	for (n = 0; n < 16; n++)
		used += bits[n];

	/* Mark the unused tail of the value array */
	n = used;
	while (n < num_values)
		symbols[n++] = -1;

	for (n = 0; n < num_values; n++)
		coda_write(dev, (s32)symbols[n], CODA9_REG_JPEG_HUFF_DATA);
}
422*4882a593Smuzhiyun 
coda9_jpeg_dec_huff_setup(struct coda_ctx * ctx)423*4882a593Smuzhiyun static int coda9_jpeg_dec_huff_setup(struct coda_ctx *ctx)
424*4882a593Smuzhiyun {
425*4882a593Smuzhiyun 	struct coda_huff_tab *huff_tab = ctx->params.jpeg_huff_tab;
426*4882a593Smuzhiyun 	struct coda_dev *dev = ctx->dev;
427*4882a593Smuzhiyun 	s16 *huff_min = huff_tab->min;
428*4882a593Smuzhiyun 	s16 *huff_max = huff_tab->max;
429*4882a593Smuzhiyun 	s8 *huff_ptr = huff_tab->ptr;
430*4882a593Smuzhiyun 	int i;
431*4882a593Smuzhiyun 
432*4882a593Smuzhiyun 	/* MIN Tables */
433*4882a593Smuzhiyun 	coda_write(dev, 0x003, CODA9_REG_JPEG_HUFF_CTRL);
434*4882a593Smuzhiyun 	coda_write(dev, 0x000, CODA9_REG_JPEG_HUFF_ADDR);
435*4882a593Smuzhiyun 	for (i = 0; i < 4 * 16; i++)
436*4882a593Smuzhiyun 		coda_write(dev, (s32)huff_min[i], CODA9_REG_JPEG_HUFF_DATA);
437*4882a593Smuzhiyun 
438*4882a593Smuzhiyun 	/* MAX Tables */
439*4882a593Smuzhiyun 	coda_write(dev, 0x403, CODA9_REG_JPEG_HUFF_CTRL);
440*4882a593Smuzhiyun 	coda_write(dev, 0x440, CODA9_REG_JPEG_HUFF_ADDR);
441*4882a593Smuzhiyun 	for (i = 0; i < 4 * 16; i++)
442*4882a593Smuzhiyun 		coda_write(dev, (s32)huff_max[i], CODA9_REG_JPEG_HUFF_DATA);
443*4882a593Smuzhiyun 
444*4882a593Smuzhiyun 	/* PTR Tables */
445*4882a593Smuzhiyun 	coda_write(dev, 0x803, CODA9_REG_JPEG_HUFF_CTRL);
446*4882a593Smuzhiyun 	coda_write(dev, 0x880, CODA9_REG_JPEG_HUFF_ADDR);
447*4882a593Smuzhiyun 	for (i = 0; i < 4 * 16; i++)
448*4882a593Smuzhiyun 		coda_write(dev, (s32)huff_ptr[i], CODA9_REG_JPEG_HUFF_DATA);
449*4882a593Smuzhiyun 
450*4882a593Smuzhiyun 	/* VAL Tables: DC Luma, DC Chroma, AC Luma, AC Chroma */
451*4882a593Smuzhiyun 	coda_write(dev, 0xc03, CODA9_REG_JPEG_HUFF_CTRL);
452*4882a593Smuzhiyun 	coda9_jpeg_write_huff_values(dev, huff_tab->luma_dc, 12);
453*4882a593Smuzhiyun 	coda9_jpeg_write_huff_values(dev, huff_tab->chroma_dc, 12);
454*4882a593Smuzhiyun 	coda9_jpeg_write_huff_values(dev, huff_tab->luma_ac, 162);
455*4882a593Smuzhiyun 	coda9_jpeg_write_huff_values(dev, huff_tab->chroma_ac, 162);
456*4882a593Smuzhiyun 	coda_write(dev, 0x000, CODA9_REG_JPEG_HUFF_CTRL);
457*4882a593Smuzhiyun 	return 0;
458*4882a593Smuzhiyun }
459*4882a593Smuzhiyun 
/*
 * Write one 64-entry quantization table to the JPEG unit.
 *
 * QMAT_CTRL is set to @index with the two lowest bits set, the 64 table
 * entries are written to QMAT_DATA one by one, and QMAT_CTRL is cleared
 * again afterwards.
 */
static inline void coda9_jpeg_write_qmat_tab(struct coda_dev *dev,
					     u8 *qmat, int index)
{
	const u8 *entry = qmat;
	const u8 *end = qmat + 64;

	coda_write(dev, index | 0x3, CODA9_REG_JPEG_QMAT_CTRL);
	while (entry < end)
		coda_write(dev, *entry++, CODA9_REG_JPEG_QMAT_DATA);
	coda_write(dev, 0, CODA9_REG_JPEG_QMAT_CTRL);
}
470*4882a593Smuzhiyun 
coda9_jpeg_qmat_setup(struct coda_ctx * ctx)471*4882a593Smuzhiyun static void coda9_jpeg_qmat_setup(struct coda_ctx *ctx)
472*4882a593Smuzhiyun {
473*4882a593Smuzhiyun 	struct coda_dev *dev = ctx->dev;
474*4882a593Smuzhiyun 	int *qmat_index = ctx->params.jpeg_qmat_index;
475*4882a593Smuzhiyun 	u8 **qmat_tab = ctx->params.jpeg_qmat_tab;
476*4882a593Smuzhiyun 
477*4882a593Smuzhiyun 	coda9_jpeg_write_qmat_tab(dev, qmat_tab[qmat_index[0]], 0x00);
478*4882a593Smuzhiyun 	coda9_jpeg_write_qmat_tab(dev, qmat_tab[qmat_index[1]], 0x40);
479*4882a593Smuzhiyun 	coda9_jpeg_write_qmat_tab(dev, qmat_tab[qmat_index[2]], 0x80);
480*4882a593Smuzhiyun }
481*4882a593Smuzhiyun 
/*
 * Program the BBC and GBU register blocks so that decoding starts at
 * @ecs_offset bytes into plane 0 of @buf.
 *
 * The offset is split into a 256-byte page number, a 32-bit word index
 * within a pair of pages (rounded down to an even word) and a bit
 * position within the resulting 64-bit unit. The two pages starting at
 * the page that contains the offset are loaded one after the other,
 * waiting for the BBC to go idle after each load, before the GBU read
 * position is set up.
 */
static void coda9_jpeg_dec_bbc_gbu_setup(struct coda_ctx *ctx,
					 struct vb2_buffer *buf, u32 ecs_offset)
{
	struct coda_dev *dev = ctx->dev;
	u32 base = vb2_dma_contig_plane_dma_addr(buf, 0);
	u32 end = base + vb2_get_plane_payload(buf, 0);
	int page = ecs_offset / 256;
	/* Odd pages occupy the upper 64 words */
	int word = (ecs_offset % 256) / 4 + ((page & 1) ? 64 : 0);
	/* An odd word is the upper half of its 64-bit unit */
	int bit = (ecs_offset % 4) * 8 + ((word & 1) ? 32 : 0);
	int gbu_half = (page & 1) ? 0 : 64;
	int cur_pos = page;
	int strm_pages;
	int n;

	word &= ~0x1;

	coda_write(dev, end, CODA9_REG_JPEG_BBC_WR_PTR);
	coda_write(dev, base, CODA9_REG_JPEG_BBC_BAS_ADDR);

	/* Place the end address beyond the payload to avoid a BBC interrupt */
	coda_write(dev, end + 256 * 3 + 256, CODA9_REG_JPEG_BBC_END_ADDR);
	strm_pages = DIV_ROUND_UP(vb2_plane_size(buf, 0), 256) + 3;
	coda_write(dev, BIT(31) | strm_pages, CODA9_REG_JPEG_BBC_STRM_CTRL);

	/* Load two consecutive pages, one at a time */
	for (n = 0; n < 2; n++, cur_pos++) {
		coda_write(dev, cur_pos, CODA9_REG_JPEG_BBC_CUR_POS);
		coda_write(dev, base + (cur_pos << 8),
			   CODA9_REG_JPEG_BBC_EXT_ADDR);
		coda_write(dev, (cur_pos & 1) << 6,
			   CODA9_REG_JPEG_BBC_INT_ADDR);
		coda_write(dev, 64, CODA9_REG_JPEG_BBC_DATA_CNT);
		coda_write(dev, 0, CODA9_REG_JPEG_BBC_COMMAND);

		/* Wait until the BBC is no longer busy */
		while (coda_read(dev, CODA9_REG_JPEG_BBC_BUSY) == 1)
			;
	}

	coda_write(dev, cur_pos, CODA9_REG_JPEG_BBC_CUR_POS);
	coda_write(dev, 1, CODA9_REG_JPEG_BBC_CTRL);

	coda_write(dev, 0, CODA9_REG_JPEG_GBU_TT_CNT);
	coda_write(dev, word, CODA9_REG_JPEG_GBU_WD_PTR);
	coda_write(dev, 0, CODA9_REG_JPEG_GBU_BBSR);
	coda_write(dev, 127, CODA9_REG_JPEG_GBU_BBER);
	coda_write(dev, gbu_half, CODA9_REG_JPEG_GBU_BBIR);
	coda_write(dev, gbu_half, CODA9_REG_JPEG_GBU_BBHR);
	coda_write(dev, 4, CODA9_REG_JPEG_GBU_CTRL);
	coda_write(dev, bit, CODA9_REG_JPEG_GBU_FF_RPTR);
	coda_write(dev, 3, CODA9_REG_JPEG_GBU_CTRL);
}
552*4882a593Smuzhiyun 
/*
 * Per chroma format value, indexed by CODA9_JPEG_FORMAT_*.
 * NOTE(review): going by the name this is a bus request count programmed
 * into the JPEG unit - confirm against the users of this table.
 */
553*4882a593Smuzhiyun static const int bus_req_num[] = {
554*4882a593Smuzhiyun 	[CODA9_JPEG_FORMAT_420] = 2,
555*4882a593Smuzhiyun 	[CODA9_JPEG_FORMAT_422] = 3,
556*4882a593Smuzhiyun 	[CODA9_JPEG_FORMAT_224] = 3,
557*4882a593Smuzhiyun 	[CODA9_JPEG_FORMAT_444] = 4,
558*4882a593Smuzhiyun 	[CODA9_JPEG_FORMAT_400] = 4,
559*4882a593Smuzhiyun };
560*4882a593Smuzhiyun 
/*
 * Pack the number of blocks per MCU, the number of components and one
 * info value per component into a single word, each field shifted to its
 * CODA9_JPEG_*_OFFSET bit position.
 */
561*4882a593Smuzhiyun #define MCU_INFO(mcu_block_num, comp_num, comp0_info, comp1_info, comp2_info) \
562*4882a593Smuzhiyun 	(((mcu_block_num) << CODA9_JPEG_MCU_BLOCK_NUM_OFFSET) | \
563*4882a593Smuzhiyun 	 ((comp_num) << CODA9_JPEG_COMP_NUM_OFFSET) | \
564*4882a593Smuzhiyun 	 ((comp0_info) << CODA9_JPEG_COMP0_INFO_OFFSET) | \
565*4882a593Smuzhiyun 	 ((comp1_info) << CODA9_JPEG_COMP1_INFO_OFFSET) | \
566*4882a593Smuzhiyun 	 ((comp2_info) << CODA9_JPEG_COMP2_INFO_OFFSET))
567*4882a593Smuzhiyun 
/*
 * Packed MCU description per chroma format, indexed by
 * CODA9_JPEG_FORMAT_* and built with MCU_INFO(): blocks per MCU, number
 * of components and one info value per component.
 */
568*4882a593Smuzhiyun static const u32 mcu_info[] = {
569*4882a593Smuzhiyun 	[CODA9_JPEG_FORMAT_420] = MCU_INFO(6, 3, 10, 5, 5),
570*4882a593Smuzhiyun 	[CODA9_JPEG_FORMAT_422] = MCU_INFO(4, 3, 9, 5, 5),
571*4882a593Smuzhiyun 	[CODA9_JPEG_FORMAT_224] = MCU_INFO(4, 3, 6, 5, 5),
572*4882a593Smuzhiyun 	[CODA9_JPEG_FORMAT_444] = MCU_INFO(3, 3, 5, 5, 5),
573*4882a593Smuzhiyun 	[CODA9_JPEG_FORMAT_400] = MCU_INFO(1, 1, 5, 0, 0),
574*4882a593Smuzhiyun };
575*4882a593Smuzhiyun 
576*4882a593Smuzhiyun /*
577*4882a593Smuzhiyun  * Convert Huffman table specifications to tables of codes and code lengths.
578*4882a593Smuzhiyun  * For reference, see JPEG ITU-T.81 (ISO/IEC 10918-1) [1]
579*4882a593Smuzhiyun  *
580*4882a593Smuzhiyun  * [1] https://www.w3.org/Graphics/JPEG/itu-t81.pdf
581*4882a593Smuzhiyun  */
coda9_jpeg_gen_enc_huff_tab(struct coda_ctx * ctx,int tab_num,int * ehufsi,int * ehufco)582*4882a593Smuzhiyun static int coda9_jpeg_gen_enc_huff_tab(struct coda_ctx *ctx, int tab_num,
583*4882a593Smuzhiyun 				       int *ehufsi, int *ehufco)
584*4882a593Smuzhiyun {
585*4882a593Smuzhiyun 	int i, j, k, lastk, si, code, maxsymbol;
586*4882a593Smuzhiyun 	const u8 *bits, *huffval;
587*4882a593Smuzhiyun 	struct {
588*4882a593Smuzhiyun 		int size[256];
589*4882a593Smuzhiyun 		int code[256];
590*4882a593Smuzhiyun 	} *huff;
591*4882a593Smuzhiyun 	static const unsigned char *huff_tabs[4] = {
592*4882a593Smuzhiyun 		luma_dc, luma_ac, chroma_dc, chroma_ac,
593*4882a593Smuzhiyun 	};
594*4882a593Smuzhiyun 	int ret = -EINVAL;
595*4882a593Smuzhiyun 
596*4882a593Smuzhiyun 	huff = kzalloc(sizeof(*huff), GFP_KERNEL);
597*4882a593Smuzhiyun 	if (!huff)
598*4882a593Smuzhiyun 		return -ENOMEM;
599*4882a593Smuzhiyun 
600*4882a593Smuzhiyun 	bits = huff_tabs[tab_num];
601*4882a593Smuzhiyun 	huffval = huff_tabs[tab_num] + 16;
602*4882a593Smuzhiyun 
603*4882a593Smuzhiyun 	maxsymbol = tab_num & 1 ? 256 : 16;
604*4882a593Smuzhiyun 
605*4882a593Smuzhiyun 	/* Figure C.1 - Generation of table of Huffman code sizes */
606*4882a593Smuzhiyun 	k = 0;
607*4882a593Smuzhiyun 	for (i = 1; i <= 16; i++) {
608*4882a593Smuzhiyun 		j = bits[i - 1];
609*4882a593Smuzhiyun 		if (k + j > maxsymbol)
610*4882a593Smuzhiyun 			goto out;
611*4882a593Smuzhiyun 		while (j--)
612*4882a593Smuzhiyun 			huff->size[k++] = i;
613*4882a593Smuzhiyun 	}
614*4882a593Smuzhiyun 	lastk = k;
615*4882a593Smuzhiyun 
616*4882a593Smuzhiyun 	/* Figure C.2 - Generation of table of Huffman codes */
617*4882a593Smuzhiyun 	k = 0;
618*4882a593Smuzhiyun 	code = 0;
619*4882a593Smuzhiyun 	si = huff->size[0];
620*4882a593Smuzhiyun 	while (k < lastk) {
621*4882a593Smuzhiyun 		while (huff->size[k] == si) {
622*4882a593Smuzhiyun 			huff->code[k++] = code;
623*4882a593Smuzhiyun 			code++;
624*4882a593Smuzhiyun 		}
625*4882a593Smuzhiyun 		if (code >= (1 << si))
626*4882a593Smuzhiyun 			goto out;
627*4882a593Smuzhiyun 		code <<= 1;
628*4882a593Smuzhiyun 		si++;
629*4882a593Smuzhiyun 	}
630*4882a593Smuzhiyun 
631*4882a593Smuzhiyun 	/* Figure C.3 - Ordering procedure for encoding procedure code tables */
632*4882a593Smuzhiyun 	for (k = 0; k < lastk; k++) {
633*4882a593Smuzhiyun 		i = huffval[k];
634*4882a593Smuzhiyun 		if (i >= maxsymbol || ehufsi[i])
635*4882a593Smuzhiyun 			goto out;
636*4882a593Smuzhiyun 		ehufco[i] = huff->code[k];
637*4882a593Smuzhiyun 		ehufsi[i] = huff->size[k];
638*4882a593Smuzhiyun 	}
639*4882a593Smuzhiyun 
640*4882a593Smuzhiyun 	ret = 0;
641*4882a593Smuzhiyun out:
642*4882a593Smuzhiyun 	kfree(huff);
643*4882a593Smuzhiyun 	return ret;
644*4882a593Smuzhiyun }
645*4882a593Smuzhiyun 
646*4882a593Smuzhiyun #define DC_TABLE_INDEX0		    0
647*4882a593Smuzhiyun #define AC_TABLE_INDEX0		    1
648*4882a593Smuzhiyun #define DC_TABLE_INDEX1		    2
649*4882a593Smuzhiyun #define AC_TABLE_INDEX1		    3
650*4882a593Smuzhiyun 
coda9_jpeg_get_huff_bits(struct coda_ctx * ctx,int tab_num)651*4882a593Smuzhiyun static u8 *coda9_jpeg_get_huff_bits(struct coda_ctx *ctx, int tab_num)
652*4882a593Smuzhiyun {
653*4882a593Smuzhiyun 	struct coda_huff_tab *huff_tab = ctx->params.jpeg_huff_tab;
654*4882a593Smuzhiyun 
655*4882a593Smuzhiyun 	if (!huff_tab)
656*4882a593Smuzhiyun 		return NULL;
657*4882a593Smuzhiyun 
658*4882a593Smuzhiyun 	switch (tab_num) {
659*4882a593Smuzhiyun 	case DC_TABLE_INDEX0: return huff_tab->luma_dc;
660*4882a593Smuzhiyun 	case AC_TABLE_INDEX0: return huff_tab->luma_ac;
661*4882a593Smuzhiyun 	case DC_TABLE_INDEX1: return huff_tab->chroma_dc;
662*4882a593Smuzhiyun 	case AC_TABLE_INDEX1: return huff_tab->chroma_ac;
663*4882a593Smuzhiyun 	}
664*4882a593Smuzhiyun 
665*4882a593Smuzhiyun 	return NULL;
666*4882a593Smuzhiyun }
667*4882a593Smuzhiyun 
coda9_jpeg_gen_dec_huff_tab(struct coda_ctx * ctx,int tab_num)668*4882a593Smuzhiyun static int coda9_jpeg_gen_dec_huff_tab(struct coda_ctx *ctx, int tab_num)
669*4882a593Smuzhiyun {
670*4882a593Smuzhiyun 	int ptr_cnt = 0, huff_code = 0, zero_flag = 0, data_flag = 0;
671*4882a593Smuzhiyun 	u8 *huff_bits;
672*4882a593Smuzhiyun 	s16 *huff_max;
673*4882a593Smuzhiyun 	s16 *huff_min;
674*4882a593Smuzhiyun 	s8 *huff_ptr;
675*4882a593Smuzhiyun 	int ofs;
676*4882a593Smuzhiyun 	int i;
677*4882a593Smuzhiyun 
678*4882a593Smuzhiyun 	huff_bits = coda9_jpeg_get_huff_bits(ctx, tab_num);
679*4882a593Smuzhiyun 	if (!huff_bits)
680*4882a593Smuzhiyun 		return -EINVAL;
681*4882a593Smuzhiyun 
682*4882a593Smuzhiyun 	/* DC/AC Luma, DC/AC Chroma -> DC Luma/Chroma, AC Luma/Chroma */
683*4882a593Smuzhiyun 	ofs = ((tab_num & 1) << 1) | ((tab_num >> 1) & 1);
684*4882a593Smuzhiyun 	ofs *= 16;
685*4882a593Smuzhiyun 
686*4882a593Smuzhiyun 	huff_ptr = ctx->params.jpeg_huff_tab->ptr + ofs;
687*4882a593Smuzhiyun 	huff_max = ctx->params.jpeg_huff_tab->max + ofs;
688*4882a593Smuzhiyun 	huff_min = ctx->params.jpeg_huff_tab->min + ofs;
689*4882a593Smuzhiyun 
690*4882a593Smuzhiyun 	for (i = 0; i < 16; i++) {
691*4882a593Smuzhiyun 		if (huff_bits[i]) {
692*4882a593Smuzhiyun 			huff_ptr[i] = ptr_cnt;
693*4882a593Smuzhiyun 			ptr_cnt += huff_bits[i];
694*4882a593Smuzhiyun 			huff_min[i] = huff_code;
695*4882a593Smuzhiyun 			huff_max[i] = huff_code + (huff_bits[i] - 1);
696*4882a593Smuzhiyun 			data_flag = 1;
697*4882a593Smuzhiyun 			zero_flag = 0;
698*4882a593Smuzhiyun 		} else {
699*4882a593Smuzhiyun 			huff_ptr[i] = -1;
700*4882a593Smuzhiyun 			huff_min[i] = -1;
701*4882a593Smuzhiyun 			huff_max[i] = -1;
702*4882a593Smuzhiyun 			zero_flag = 1;
703*4882a593Smuzhiyun 		}
704*4882a593Smuzhiyun 
705*4882a593Smuzhiyun 		if (data_flag == 1) {
706*4882a593Smuzhiyun 			if (zero_flag == 1)
707*4882a593Smuzhiyun 				huff_code <<= 1;
708*4882a593Smuzhiyun 			else
709*4882a593Smuzhiyun 				huff_code = (huff_max[i] + 1) << 1;
710*4882a593Smuzhiyun 		}
711*4882a593Smuzhiyun 	}
712*4882a593Smuzhiyun 
713*4882a593Smuzhiyun 	return 0;
714*4882a593Smuzhiyun }
715*4882a593Smuzhiyun 
coda9_jpeg_load_huff_tab(struct coda_ctx * ctx)716*4882a593Smuzhiyun static int coda9_jpeg_load_huff_tab(struct coda_ctx *ctx)
717*4882a593Smuzhiyun {
718*4882a593Smuzhiyun 	struct {
719*4882a593Smuzhiyun 		int size[4][256];
720*4882a593Smuzhiyun 		int code[4][256];
721*4882a593Smuzhiyun 	} *huff;
722*4882a593Smuzhiyun 	u32 *huff_data;
723*4882a593Smuzhiyun 	int i, j;
724*4882a593Smuzhiyun 	int ret;
725*4882a593Smuzhiyun 
726*4882a593Smuzhiyun 	huff = kzalloc(sizeof(*huff), GFP_KERNEL);
727*4882a593Smuzhiyun 	if (!huff)
728*4882a593Smuzhiyun 		return -ENOMEM;
729*4882a593Smuzhiyun 
730*4882a593Smuzhiyun 	/* Generate all four (luma/chroma DC/AC) code/size lookup tables */
731*4882a593Smuzhiyun 	for (i = 0; i < 4; i++) {
732*4882a593Smuzhiyun 		ret = coda9_jpeg_gen_enc_huff_tab(ctx, i, huff->size[i],
733*4882a593Smuzhiyun 						  huff->code[i]);
734*4882a593Smuzhiyun 		if (ret)
735*4882a593Smuzhiyun 			goto out;
736*4882a593Smuzhiyun 	}
737*4882a593Smuzhiyun 
738*4882a593Smuzhiyun 	if (!ctx->params.jpeg_huff_data) {
739*4882a593Smuzhiyun 		ctx->params.jpeg_huff_data =
740*4882a593Smuzhiyun 			kzalloc(sizeof(u32) * CODA9_JPEG_ENC_HUFF_DATA_SIZE,
741*4882a593Smuzhiyun 				GFP_KERNEL);
742*4882a593Smuzhiyun 		if (!ctx->params.jpeg_huff_data) {
743*4882a593Smuzhiyun 			ret = -ENOMEM;
744*4882a593Smuzhiyun 			goto out;
745*4882a593Smuzhiyun 		}
746*4882a593Smuzhiyun 	}
747*4882a593Smuzhiyun 	huff_data = ctx->params.jpeg_huff_data;
748*4882a593Smuzhiyun 
749*4882a593Smuzhiyun 	for (j = 0; j < 4; j++) {
750*4882a593Smuzhiyun 		/* Store Huffman lookup tables in AC0, AC1, DC0, DC1 order */
751*4882a593Smuzhiyun 		int t = (j == 0) ? AC_TABLE_INDEX0 :
752*4882a593Smuzhiyun 			(j == 1) ? AC_TABLE_INDEX1 :
753*4882a593Smuzhiyun 			(j == 2) ? DC_TABLE_INDEX0 :
754*4882a593Smuzhiyun 				   DC_TABLE_INDEX1;
755*4882a593Smuzhiyun 		/* DC tables only have 16 entries */
756*4882a593Smuzhiyun 		int len = (j < 2) ? 256 : 16;
757*4882a593Smuzhiyun 
758*4882a593Smuzhiyun 		for (i = 0; i < len; i++) {
759*4882a593Smuzhiyun 			if (huff->size[t][i] == 0 && huff->code[t][i] == 0)
760*4882a593Smuzhiyun 				*(huff_data++) = 0;
761*4882a593Smuzhiyun 			else
762*4882a593Smuzhiyun 				*(huff_data++) =
763*4882a593Smuzhiyun 					((huff->size[t][i] - 1) << 16) |
764*4882a593Smuzhiyun 					huff->code[t][i];
765*4882a593Smuzhiyun 		}
766*4882a593Smuzhiyun 	}
767*4882a593Smuzhiyun 
768*4882a593Smuzhiyun 	ret = 0;
769*4882a593Smuzhiyun out:
770*4882a593Smuzhiyun 	kfree(huff);
771*4882a593Smuzhiyun 	return ret;
772*4882a593Smuzhiyun }
773*4882a593Smuzhiyun 
coda9_jpeg_write_huff_tab(struct coda_ctx * ctx)774*4882a593Smuzhiyun static void coda9_jpeg_write_huff_tab(struct coda_ctx *ctx)
775*4882a593Smuzhiyun {
776*4882a593Smuzhiyun 	struct coda_dev *dev = ctx->dev;
777*4882a593Smuzhiyun 	u32 *huff_data = ctx->params.jpeg_huff_data;
778*4882a593Smuzhiyun 	int i;
779*4882a593Smuzhiyun 
780*4882a593Smuzhiyun 	/* Write Huffman size/code lookup tables in AC0, AC1, DC0, DC1 order */
781*4882a593Smuzhiyun 	coda_write(dev, 0x3, CODA9_REG_JPEG_HUFF_CTRL);
782*4882a593Smuzhiyun 	for (i = 0; i < CODA9_JPEG_ENC_HUFF_DATA_SIZE; i++)
783*4882a593Smuzhiyun 		coda_write(dev, *(huff_data++), CODA9_REG_JPEG_HUFF_DATA);
784*4882a593Smuzhiyun 	coda_write(dev, 0x0, CODA9_REG_JPEG_HUFF_CTRL);
785*4882a593Smuzhiyun }
786*4882a593Smuzhiyun 
/*
 * Write one 64 entry quantization table to the JPEG unit. The value written
 * for each entry is 0x80000 divided by the quantizer, so no entry of qmat
 * may be zero.
 */
static inline void coda9_jpeg_write_qmat_quotients(struct coda_dev *dev,
						   u8 *qmat, int index)
{
	const u8 *entry;

	coda_write(dev, index | 0x3, CODA9_REG_JPEG_QMAT_CTRL);
	for (entry = qmat; entry < qmat + 64; entry++)
		coda_write(dev, 0x80000 / *entry, CODA9_REG_JPEG_QMAT_DATA);
	coda_write(dev, index, CODA9_REG_JPEG_QMAT_CTRL);
}
797*4882a593Smuzhiyun 
coda9_jpeg_load_qmat_tab(struct coda_ctx * ctx)798*4882a593Smuzhiyun static void coda9_jpeg_load_qmat_tab(struct coda_ctx *ctx)
799*4882a593Smuzhiyun {
800*4882a593Smuzhiyun 	struct coda_dev *dev = ctx->dev;
801*4882a593Smuzhiyun 	u8 *luma_tab;
802*4882a593Smuzhiyun 	u8 *chroma_tab;
803*4882a593Smuzhiyun 
804*4882a593Smuzhiyun 	luma_tab = ctx->params.jpeg_qmat_tab[0];
805*4882a593Smuzhiyun 	if (!luma_tab)
806*4882a593Smuzhiyun 		luma_tab = luma_q;
807*4882a593Smuzhiyun 
808*4882a593Smuzhiyun 	chroma_tab = ctx->params.jpeg_qmat_tab[1];
809*4882a593Smuzhiyun 	if (!chroma_tab)
810*4882a593Smuzhiyun 		chroma_tab = chroma_q;
811*4882a593Smuzhiyun 
812*4882a593Smuzhiyun 	coda9_jpeg_write_qmat_quotients(dev, luma_tab, 0x00);
813*4882a593Smuzhiyun 	coda9_jpeg_write_qmat_quotients(dev, chroma_tab, 0x40);
814*4882a593Smuzhiyun 	coda9_jpeg_write_qmat_quotients(dev, chroma_tab, 0x80);
815*4882a593Smuzhiyun }
816*4882a593Smuzhiyun 
817*4882a593Smuzhiyun struct coda_jpeg_stream {
818*4882a593Smuzhiyun 	u8 *curr;
819*4882a593Smuzhiyun 	u8 *end;
820*4882a593Smuzhiyun };
821*4882a593Smuzhiyun 
/*
 * Append a single byte to the stream.
 *
 * Returns 0 on success or -EINVAL if the stream is already full.
 */
static inline int coda_jpeg_put_byte(u8 byte, struct coda_jpeg_stream *stream)
{
	u8 *dst = stream->curr;

	if (dst >= stream->end)
		return -EINVAL;

	*dst = byte;
	stream->curr = dst + 1;

	return 0;
}
831*4882a593Smuzhiyun 
/*
 * Append a 16-bit value to the stream in big endian byte order.
 *
 * Returns 0 on success or -EINVAL if fewer than two bytes are left.
 */
static inline int coda_jpeg_put_word(u16 word, struct coda_jpeg_stream *stream)
{
	u8 *next = stream->curr + sizeof(__be16);

	if (next > stream->end)
		return -EINVAL;

	put_unaligned_be16(word, stream->curr);
	stream->curr = next;

	return 0;
}
842*4882a593Smuzhiyun 
/*
 * Append a table segment to the stream: the marker, a 16-bit segment length
 * of 3 + len, the index byte and then len bytes of table data.
 *
 * Returns 0 on success or -EINVAL if the stream runs out of space.
 */
static int coda_jpeg_put_table(u16 marker, u8 index, const u8 *table,
			       size_t len, struct coda_jpeg_stream *stream)
{
	size_t pos;
	int err;

	err = coda_jpeg_put_word(marker, stream);
	if (err < 0)
		return err;

	err = coda_jpeg_put_word(3 + len, stream);
	if (err < 0)
		return err;

	err = coda_jpeg_put_byte(index, stream);
	if (err)
		return err;

	for (pos = 0; pos < len; pos++) {
		err = coda_jpeg_put_byte(table[pos], stream);
		if (err)
			return err;
	}

	return 0;
}
860*4882a593Smuzhiyun 
/*
 * Append a DQT segment for quantization table @index (0 = luma, otherwise
 * chroma) to the stream.
 *
 * Returns 0 on success or -EINVAL if the stream runs out of space.
 */
static int coda_jpeg_define_quantization_table(struct coda_ctx *ctx, u8 index,
					       struct coda_jpeg_stream *stream)
{
	const u8 *table = ctx->params.jpeg_qmat_tab[index];

	/*
	 * Use the same default tables as coda9_jpeg_load_qmat_tab() if the
	 * context has none, so that the header never dereferences a NULL
	 * table and always describes the tables programmed into the hardware.
	 */
	if (!table)
		table = index ? chroma_q : luma_q;

	return coda_jpeg_put_table(DQT_MARKER, index, table, 64, stream);
}
868*4882a593Smuzhiyun 
/*
 * Append a DHT segment carrying @len bytes of @table to the stream, tagged
 * with the table identifier byte @index.
 *
 * Returns 0 on success or -EINVAL if the stream runs out of space.
 */
static int coda_jpeg_define_huffman_table(u8 index, const u8 *table, size_t len,
					  struct coda_jpeg_stream *stream)
{
	const u16 marker = DHT_MARKER;

	return coda_jpeg_put_table(marker, index, table, len, stream);
}
874*4882a593Smuzhiyun 
/*
 * Write the JPEG header for the current output queue format into @buf.
 *
 * The header consists of SOI, an optional DRI segment, the quantization and
 * Huffman tables and the SOF segment, followed by zero padding up to a
 * multiple of 8 bytes. Chroma tables are left out for greyscale (4:0:0).
 *
 * @ctx: encoder context
 * @len: size of @buf in bytes
 * @buf: destination buffer
 *
 * Returns the number of bytes written, -EINVAL if @buf is too small, or the
 * negative value returned by coda9_jpeg_chroma_format() for an unsupported
 * pixel format.
 */
static int coda9_jpeg_encode_header(struct coda_ctx *ctx, int len, u8 *buf)
{
	/* Sampling factors per component, indexed by chroma format */
	static const unsigned char subsampling[5][3] = {
		[CODA9_JPEG_FORMAT_420] = { 0x22, 0x11, 0x11 },
		[CODA9_JPEG_FORMAT_422] = { 0x21, 0x11, 0x11 },
		[CODA9_JPEG_FORMAT_224] = { 0x12, 0x11, 0x11 },
		[CODA9_JPEG_FORMAT_444] = { 0x11, 0x11, 0x11 },
		[CODA9_JPEG_FORMAT_400] = { 0x11 },
	};
	struct coda_jpeg_stream stream = { buf, buf + len };
	struct coda_q_data *q_data_src;
	int chroma_format, comp_num;
	int i, ret, pad;

	q_data_src = get_q_data(ctx, V4L2_BUF_TYPE_VIDEO_OUTPUT);
	chroma_format = coda9_jpeg_chroma_format(q_data_src->fourcc);
	/* Report the failure instead of claiming an empty header */
	if (chroma_format < 0)
		return chroma_format;

	/* Start Of Image */
	ret = coda_jpeg_put_word(SOI_MARKER, &stream);
	if (ret < 0)
		return ret;

	/* Define Restart Interval */
	if (ctx->params.jpeg_restart_interval) {
		ret = coda_jpeg_put_word(DRI_MARKER, &stream);
		if (ret < 0)
			return ret;
		ret = coda_jpeg_put_word(4, &stream);
		if (ret < 0)
			return ret;
		ret = coda_jpeg_put_word(ctx->params.jpeg_restart_interval,
					 &stream);
		if (ret < 0)
			return ret;
	}

	/* Define Quantization Tables */
	ret = coda_jpeg_define_quantization_table(ctx, 0x00, &stream);
	if (ret < 0)
		return ret;
	if (chroma_format != CODA9_JPEG_FORMAT_400) {
		ret = coda_jpeg_define_quantization_table(ctx, 0x01, &stream);
		if (ret < 0)
			return ret;
	}

	/* Define Huffman Tables */
	ret = coda_jpeg_define_huffman_table(0x00, luma_dc, 16 + 12, &stream);
	if (ret < 0)
		return ret;
	ret = coda_jpeg_define_huffman_table(0x10, luma_ac, 16 + 162, &stream);
	if (ret < 0)
		return ret;
	if (chroma_format != CODA9_JPEG_FORMAT_400) {
		ret = coda_jpeg_define_huffman_table(0x01, chroma_dc, 16 + 12,
						     &stream);
		if (ret < 0)
			return ret;
		ret = coda_jpeg_define_huffman_table(0x11, chroma_ac, 16 + 162,
						     &stream);
		if (ret < 0)
			return ret;
	}

	/* Start Of Frame */
	ret = coda_jpeg_put_word(SOF_MARKER, &stream);
	if (ret < 0)
		return ret;
	comp_num = (chroma_format == CODA9_JPEG_FORMAT_400) ? 1 : 3;
	/* Segment length: 8 fixed bytes plus 3 bytes per component */
	ret = coda_jpeg_put_word(8 + comp_num * 3, &stream);
	if (ret < 0)
		return ret;
	/* Sample precision in bits */
	ret = coda_jpeg_put_byte(0x08, &stream);
	if (ret < 0)
		return ret;
	ret = coda_jpeg_put_word(q_data_src->height, &stream);
	if (ret < 0)
		return ret;
	ret = coda_jpeg_put_word(q_data_src->width, &stream);
	if (ret < 0)
		return ret;
	ret = coda_jpeg_put_byte(comp_num, &stream);
	if (ret < 0)
		return ret;
	for (i = 0; i < comp_num; i++) {
		/* Component identifier, matches SOS */
		ret = coda_jpeg_put_byte(i + 1, &stream);
		if (ret < 0)
			return ret;
		ret = coda_jpeg_put_byte(subsampling[chroma_format][i],
					 &stream);
		if (ret < 0)
			return ret;
		/* Table index: 0 for the first component, 1 for the others */
		ret = coda_jpeg_put_byte((i == 0) ? 0 : 1, &stream);
		if (ret < 0)
			return ret;
	}

	/* Pad to multiple of 8 bytes */
	pad = (stream.curr - buf) % 8;
	if (pad) {
		pad = 8 - pad;
		while (pad--) {
			ret = coda_jpeg_put_byte(0x00, &stream);
			if (ret < 0)
				return ret;
		}
	}

	return stream.curr - buf;
}
990*4882a593Smuzhiyun 
991*4882a593Smuzhiyun /*
992*4882a593Smuzhiyun  * Scale quantization table using nonlinear scaling factor
993*4882a593Smuzhiyun  * u8 qtab[64], scale [50,190]
994*4882a593Smuzhiyun  */
coda_scale_quant_table(u8 * q_tab,int scale)995*4882a593Smuzhiyun static void coda_scale_quant_table(u8 *q_tab, int scale)
996*4882a593Smuzhiyun {
997*4882a593Smuzhiyun 	unsigned int temp;
998*4882a593Smuzhiyun 	int i;
999*4882a593Smuzhiyun 
1000*4882a593Smuzhiyun 	for (i = 0; i < 64; i++) {
1001*4882a593Smuzhiyun 		temp = DIV_ROUND_CLOSEST((unsigned int)q_tab[i] * scale, 100);
1002*4882a593Smuzhiyun 		if (temp <= 0)
1003*4882a593Smuzhiyun 			temp = 1;
1004*4882a593Smuzhiyun 		if (temp > 255)
1005*4882a593Smuzhiyun 			temp = 255;
1006*4882a593Smuzhiyun 		q_tab[i] = (unsigned char)temp;
1007*4882a593Smuzhiyun 	}
1008*4882a593Smuzhiyun }
1009*4882a593Smuzhiyun 
coda_set_jpeg_compression_quality(struct coda_ctx * ctx,int quality)1010*4882a593Smuzhiyun void coda_set_jpeg_compression_quality(struct coda_ctx *ctx, int quality)
1011*4882a593Smuzhiyun {
1012*4882a593Smuzhiyun 	unsigned int scale;
1013*4882a593Smuzhiyun 
1014*4882a593Smuzhiyun 	ctx->params.jpeg_quality = quality;
1015*4882a593Smuzhiyun 
1016*4882a593Smuzhiyun 	/* Clip quality setting to [5,100] interval */
1017*4882a593Smuzhiyun 	if (quality > 100)
1018*4882a593Smuzhiyun 		quality = 100;
1019*4882a593Smuzhiyun 	if (quality < 5)
1020*4882a593Smuzhiyun 		quality = 5;
1021*4882a593Smuzhiyun 
1022*4882a593Smuzhiyun 	/*
1023*4882a593Smuzhiyun 	 * Non-linear scaling factor:
1024*4882a593Smuzhiyun 	 * [5,50] -> [1000..100], [51,100] -> [98..0]
1025*4882a593Smuzhiyun 	 */
1026*4882a593Smuzhiyun 	if (quality < 50)
1027*4882a593Smuzhiyun 		scale = 5000 / quality;
1028*4882a593Smuzhiyun 	else
1029*4882a593Smuzhiyun 		scale = 200 - 2 * quality;
1030*4882a593Smuzhiyun 
1031*4882a593Smuzhiyun 	if (ctx->params.jpeg_qmat_tab[0]) {
1032*4882a593Smuzhiyun 		memcpy(ctx->params.jpeg_qmat_tab[0], luma_q, 64);
1033*4882a593Smuzhiyun 		coda_scale_quant_table(ctx->params.jpeg_qmat_tab[0], scale);
1034*4882a593Smuzhiyun 	}
1035*4882a593Smuzhiyun 	if (ctx->params.jpeg_qmat_tab[1]) {
1036*4882a593Smuzhiyun 		memcpy(ctx->params.jpeg_qmat_tab[1], chroma_q, 64);
1037*4882a593Smuzhiyun 		coda_scale_quant_table(ctx->params.jpeg_qmat_tab[1], scale);
1038*4882a593Smuzhiyun 	}
1039*4882a593Smuzhiyun }
1040*4882a593Smuzhiyun 
1041*4882a593Smuzhiyun /*
1042*4882a593Smuzhiyun  * Encoder context operations
1043*4882a593Smuzhiyun  */
1044*4882a593Smuzhiyun 
coda9_jpeg_start_encoding(struct coda_ctx * ctx)1045*4882a593Smuzhiyun static int coda9_jpeg_start_encoding(struct coda_ctx *ctx)
1046*4882a593Smuzhiyun {
1047*4882a593Smuzhiyun 	struct coda_dev *dev = ctx->dev;
1048*4882a593Smuzhiyun 	int ret;
1049*4882a593Smuzhiyun 
1050*4882a593Smuzhiyun 	ret = coda9_jpeg_load_huff_tab(ctx);
1051*4882a593Smuzhiyun 	if (ret < 0) {
1052*4882a593Smuzhiyun 		v4l2_err(&dev->v4l2_dev, "error loading Huffman tables\n");
1053*4882a593Smuzhiyun 		return ret;
1054*4882a593Smuzhiyun 	}
1055*4882a593Smuzhiyun 	if (!ctx->params.jpeg_qmat_tab[0])
1056*4882a593Smuzhiyun 		ctx->params.jpeg_qmat_tab[0] = kmalloc(64, GFP_KERNEL);
1057*4882a593Smuzhiyun 	if (!ctx->params.jpeg_qmat_tab[1])
1058*4882a593Smuzhiyun 		ctx->params.jpeg_qmat_tab[1] = kmalloc(64, GFP_KERNEL);
1059*4882a593Smuzhiyun 	coda_set_jpeg_compression_quality(ctx, ctx->params.jpeg_quality);
1060*4882a593Smuzhiyun 
1061*4882a593Smuzhiyun 	return 0;
1062*4882a593Smuzhiyun }
1063*4882a593Smuzhiyun 
coda9_jpeg_prepare_encode(struct coda_ctx * ctx)1064*4882a593Smuzhiyun static int coda9_jpeg_prepare_encode(struct coda_ctx *ctx)
1065*4882a593Smuzhiyun {
1066*4882a593Smuzhiyun 	struct coda_q_data *q_data_src;
1067*4882a593Smuzhiyun 	struct vb2_v4l2_buffer *src_buf, *dst_buf;
1068*4882a593Smuzhiyun 	struct coda_dev *dev = ctx->dev;
1069*4882a593Smuzhiyun 	u32 start_addr, end_addr;
1070*4882a593Smuzhiyun 	u16 aligned_width, aligned_height;
1071*4882a593Smuzhiyun 	bool chroma_interleave;
1072*4882a593Smuzhiyun 	int chroma_format;
1073*4882a593Smuzhiyun 	int header_len;
1074*4882a593Smuzhiyun 	int ret;
1075*4882a593Smuzhiyun 	ktime_t timeout;
1076*4882a593Smuzhiyun 
1077*4882a593Smuzhiyun 	src_buf = v4l2_m2m_next_src_buf(ctx->fh.m2m_ctx);
1078*4882a593Smuzhiyun 	dst_buf = v4l2_m2m_next_dst_buf(ctx->fh.m2m_ctx);
1079*4882a593Smuzhiyun 	q_data_src = get_q_data(ctx, V4L2_BUF_TYPE_VIDEO_OUTPUT);
1080*4882a593Smuzhiyun 
1081*4882a593Smuzhiyun 	if (vb2_get_plane_payload(&src_buf->vb2_buf, 0) == 0)
1082*4882a593Smuzhiyun 		vb2_set_plane_payload(&src_buf->vb2_buf, 0,
1083*4882a593Smuzhiyun 				      vb2_plane_size(&src_buf->vb2_buf, 0));
1084*4882a593Smuzhiyun 
1085*4882a593Smuzhiyun 	src_buf->sequence = ctx->osequence;
1086*4882a593Smuzhiyun 	dst_buf->sequence = ctx->osequence;
1087*4882a593Smuzhiyun 	ctx->osequence++;
1088*4882a593Smuzhiyun 
1089*4882a593Smuzhiyun 	src_buf->flags |= V4L2_BUF_FLAG_KEYFRAME;
1090*4882a593Smuzhiyun 	src_buf->flags &= ~V4L2_BUF_FLAG_PFRAME;
1091*4882a593Smuzhiyun 
1092*4882a593Smuzhiyun 	coda_set_gdi_regs(ctx);
1093*4882a593Smuzhiyun 
1094*4882a593Smuzhiyun 	start_addr = vb2_dma_contig_plane_dma_addr(&dst_buf->vb2_buf, 0);
1095*4882a593Smuzhiyun 	end_addr = start_addr + vb2_plane_size(&dst_buf->vb2_buf, 0);
1096*4882a593Smuzhiyun 
1097*4882a593Smuzhiyun 	chroma_format = coda9_jpeg_chroma_format(q_data_src->fourcc);
1098*4882a593Smuzhiyun 	if (chroma_format < 0)
1099*4882a593Smuzhiyun 		return chroma_format;
1100*4882a593Smuzhiyun 
1101*4882a593Smuzhiyun 	/* Round image dimensions to multiple of MCU size */
1102*4882a593Smuzhiyun 	aligned_width = round_up(q_data_src->width, width_align[chroma_format]);
1103*4882a593Smuzhiyun 	aligned_height = round_up(q_data_src->height,
1104*4882a593Smuzhiyun 				  height_align[chroma_format]);
1105*4882a593Smuzhiyun 	if (aligned_width != q_data_src->bytesperline) {
1106*4882a593Smuzhiyun 		v4l2_err(&dev->v4l2_dev, "wrong stride: %d instead of %d\n",
1107*4882a593Smuzhiyun 			 aligned_width, q_data_src->bytesperline);
1108*4882a593Smuzhiyun 	}
1109*4882a593Smuzhiyun 
1110*4882a593Smuzhiyun 	header_len =
1111*4882a593Smuzhiyun 		coda9_jpeg_encode_header(ctx,
1112*4882a593Smuzhiyun 					 vb2_plane_size(&dst_buf->vb2_buf, 0),
1113*4882a593Smuzhiyun 					 vb2_plane_vaddr(&dst_buf->vb2_buf, 0));
1114*4882a593Smuzhiyun 	if (header_len < 0)
1115*4882a593Smuzhiyun 		return header_len;
1116*4882a593Smuzhiyun 
1117*4882a593Smuzhiyun 	coda_write(dev, start_addr + header_len, CODA9_REG_JPEG_BBC_BAS_ADDR);
1118*4882a593Smuzhiyun 	coda_write(dev, end_addr, CODA9_REG_JPEG_BBC_END_ADDR);
1119*4882a593Smuzhiyun 	coda_write(dev, start_addr + header_len, CODA9_REG_JPEG_BBC_WR_PTR);
1120*4882a593Smuzhiyun 	coda_write(dev, start_addr + header_len, CODA9_REG_JPEG_BBC_RD_PTR);
1121*4882a593Smuzhiyun 	coda_write(dev, 0, CODA9_REG_JPEG_BBC_CUR_POS);
1122*4882a593Smuzhiyun 	/* 64 words per 256-byte page */
1123*4882a593Smuzhiyun 	coda_write(dev, 64, CODA9_REG_JPEG_BBC_DATA_CNT);
1124*4882a593Smuzhiyun 	coda_write(dev, start_addr, CODA9_REG_JPEG_BBC_EXT_ADDR);
1125*4882a593Smuzhiyun 	coda_write(dev, 0, CODA9_REG_JPEG_BBC_INT_ADDR);
1126*4882a593Smuzhiyun 
1127*4882a593Smuzhiyun 	coda_write(dev, 0, CODA9_REG_JPEG_GBU_BT_PTR);
1128*4882a593Smuzhiyun 	coda_write(dev, 0, CODA9_REG_JPEG_GBU_WD_PTR);
1129*4882a593Smuzhiyun 	coda_write(dev, 0, CODA9_REG_JPEG_GBU_BBSR);
1130*4882a593Smuzhiyun 	coda_write(dev, BIT(31) | ((end_addr - start_addr - header_len) / 256),
1131*4882a593Smuzhiyun 		   CODA9_REG_JPEG_BBC_STRM_CTRL);
1132*4882a593Smuzhiyun 	coda_write(dev, 0, CODA9_REG_JPEG_GBU_CTRL);
1133*4882a593Smuzhiyun 	coda_write(dev, 0, CODA9_REG_JPEG_GBU_FF_RPTR);
1134*4882a593Smuzhiyun 	coda_write(dev, 127, CODA9_REG_JPEG_GBU_BBER);
1135*4882a593Smuzhiyun 	coda_write(dev, 64, CODA9_REG_JPEG_GBU_BBIR);
1136*4882a593Smuzhiyun 	coda_write(dev, 64, CODA9_REG_JPEG_GBU_BBHR);
1137*4882a593Smuzhiyun 
1138*4882a593Smuzhiyun 	chroma_interleave = (q_data_src->fourcc == V4L2_PIX_FMT_NV12);
1139*4882a593Smuzhiyun 	coda_write(dev, CODA9_JPEG_PIC_CTRL_TC_DIRECTION |
1140*4882a593Smuzhiyun 		   CODA9_JPEG_PIC_CTRL_ENCODER_EN, CODA9_REG_JPEG_PIC_CTRL);
1141*4882a593Smuzhiyun 	coda_write(dev, 0, CODA9_REG_JPEG_SCL_INFO);
1142*4882a593Smuzhiyun 	coda_write(dev, chroma_interleave, CODA9_REG_JPEG_DPB_CONFIG);
1143*4882a593Smuzhiyun 	coda_write(dev, ctx->params.jpeg_restart_interval,
1144*4882a593Smuzhiyun 		   CODA9_REG_JPEG_RST_INTVAL);
1145*4882a593Smuzhiyun 	coda_write(dev, 1, CODA9_REG_JPEG_BBC_CTRL);
1146*4882a593Smuzhiyun 
1147*4882a593Smuzhiyun 	coda_write(dev, bus_req_num[chroma_format], CODA9_REG_JPEG_OP_INFO);
1148*4882a593Smuzhiyun 
1149*4882a593Smuzhiyun 	coda9_jpeg_write_huff_tab(ctx);
1150*4882a593Smuzhiyun 	coda9_jpeg_load_qmat_tab(ctx);
1151*4882a593Smuzhiyun 
1152*4882a593Smuzhiyun 	if (ctx->params.rot_mode & CODA_ROT_90) {
1153*4882a593Smuzhiyun 		aligned_width = aligned_height;
1154*4882a593Smuzhiyun 		aligned_height = q_data_src->bytesperline;
1155*4882a593Smuzhiyun 		if (chroma_format == CODA9_JPEG_FORMAT_422)
1156*4882a593Smuzhiyun 			chroma_format = CODA9_JPEG_FORMAT_224;
1157*4882a593Smuzhiyun 		else if (chroma_format == CODA9_JPEG_FORMAT_224)
1158*4882a593Smuzhiyun 			chroma_format = CODA9_JPEG_FORMAT_422;
1159*4882a593Smuzhiyun 	}
1160*4882a593Smuzhiyun 	/* These need to be multiples of MCU size */
1161*4882a593Smuzhiyun 	coda_write(dev, aligned_width << 16 | aligned_height,
1162*4882a593Smuzhiyun 		   CODA9_REG_JPEG_PIC_SIZE);
1163*4882a593Smuzhiyun 	coda_write(dev, ctx->params.rot_mode ?
1164*4882a593Smuzhiyun 		   (CODA_ROT_MIR_ENABLE | ctx->params.rot_mode) : 0,
1165*4882a593Smuzhiyun 		   CODA9_REG_JPEG_ROT_INFO);
1166*4882a593Smuzhiyun 
1167*4882a593Smuzhiyun 	coda_write(dev, mcu_info[chroma_format], CODA9_REG_JPEG_MCU_INFO);
1168*4882a593Smuzhiyun 
1169*4882a593Smuzhiyun 	coda_write(dev, 1, CODA9_GDI_CONTROL);
1170*4882a593Smuzhiyun 	timeout = ktime_add_us(ktime_get(), 100000);
1171*4882a593Smuzhiyun 	do {
1172*4882a593Smuzhiyun 		ret = coda_read(dev, CODA9_GDI_STATUS);
1173*4882a593Smuzhiyun 		if (ktime_compare(ktime_get(), timeout) > 0) {
1174*4882a593Smuzhiyun 			v4l2_err(&dev->v4l2_dev, "timeout waiting for GDI\n");
1175*4882a593Smuzhiyun 			return -ETIMEDOUT;
1176*4882a593Smuzhiyun 		}
1177*4882a593Smuzhiyun 	} while (!ret);
1178*4882a593Smuzhiyun 
1179*4882a593Smuzhiyun 	coda_write(dev, (chroma_format << 17) | (chroma_interleave << 16) |
1180*4882a593Smuzhiyun 		   q_data_src->bytesperline, CODA9_GDI_INFO_CONTROL);
1181*4882a593Smuzhiyun 	/* The content of this register seems to be irrelevant: */
1182*4882a593Smuzhiyun 	coda_write(dev, aligned_width << 16 | aligned_height,
1183*4882a593Smuzhiyun 		   CODA9_GDI_INFO_PIC_SIZE);
1184*4882a593Smuzhiyun 
1185*4882a593Smuzhiyun 	coda_write_base(ctx, q_data_src, src_buf, CODA9_GDI_INFO_BASE_Y);
1186*4882a593Smuzhiyun 
1187*4882a593Smuzhiyun 	coda_write(dev, 0, CODA9_REG_JPEG_DPB_BASE00);
1188*4882a593Smuzhiyun 	coda_write(dev, 0, CODA9_GDI_CONTROL);
1189*4882a593Smuzhiyun 	coda_write(dev, 1, CODA9_GDI_PIC_INIT_HOST);
1190*4882a593Smuzhiyun 
1191*4882a593Smuzhiyun 	coda_write(dev, 1, CODA9_GDI_WPROT_ERR_CLR);
1192*4882a593Smuzhiyun 	coda_write(dev, 0, CODA9_GDI_WPROT_RGN_EN);
1193*4882a593Smuzhiyun 
1194*4882a593Smuzhiyun 	trace_coda_jpeg_run(ctx, src_buf);
1195*4882a593Smuzhiyun 
1196*4882a593Smuzhiyun 	coda_write(dev, 1, CODA9_REG_JPEG_PIC_START);
1197*4882a593Smuzhiyun 
1198*4882a593Smuzhiyun 	return 0;
1199*4882a593Smuzhiyun }
1200*4882a593Smuzhiyun 
coda9_jpeg_finish_encode(struct coda_ctx * ctx)1201*4882a593Smuzhiyun static void coda9_jpeg_finish_encode(struct coda_ctx *ctx)
1202*4882a593Smuzhiyun {
1203*4882a593Smuzhiyun 	struct vb2_v4l2_buffer *src_buf, *dst_buf;
1204*4882a593Smuzhiyun 	struct coda_dev *dev = ctx->dev;
1205*4882a593Smuzhiyun 	u32 wr_ptr, start_ptr;
1206*4882a593Smuzhiyun 	u32 err_mb;
1207*4882a593Smuzhiyun 
1208*4882a593Smuzhiyun 	if (ctx->aborting) {
1209*4882a593Smuzhiyun 		coda_write(ctx->dev, 0, CODA9_REG_JPEG_BBC_FLUSH_CMD);
1210*4882a593Smuzhiyun 		return;
1211*4882a593Smuzhiyun 	}
1212*4882a593Smuzhiyun 
1213*4882a593Smuzhiyun 	/*
1214*4882a593Smuzhiyun 	 * Lock to make sure that an encoder stop command running in parallel
1215*4882a593Smuzhiyun 	 * will either already have marked src_buf as last, or it will wake up
1216*4882a593Smuzhiyun 	 * the capture queue after the buffers are returned.
1217*4882a593Smuzhiyun 	 */
1218*4882a593Smuzhiyun 	mutex_lock(&ctx->wakeup_mutex);
1219*4882a593Smuzhiyun 	src_buf = v4l2_m2m_src_buf_remove(ctx->fh.m2m_ctx);
1220*4882a593Smuzhiyun 	dst_buf = v4l2_m2m_dst_buf_remove(ctx->fh.m2m_ctx);
1221*4882a593Smuzhiyun 
1222*4882a593Smuzhiyun 	trace_coda_jpeg_done(ctx, dst_buf);
1223*4882a593Smuzhiyun 
1224*4882a593Smuzhiyun 	/*
1225*4882a593Smuzhiyun 	 * Set plane payload to the number of bytes written out
1226*4882a593Smuzhiyun 	 * by the JPEG processing unit
1227*4882a593Smuzhiyun 	 */
1228*4882a593Smuzhiyun 	start_ptr = vb2_dma_contig_plane_dma_addr(&dst_buf->vb2_buf, 0);
1229*4882a593Smuzhiyun 	wr_ptr = coda_read(dev, CODA9_REG_JPEG_BBC_WR_PTR);
1230*4882a593Smuzhiyun 	vb2_set_plane_payload(&dst_buf->vb2_buf, 0, wr_ptr - start_ptr);
1231*4882a593Smuzhiyun 
1232*4882a593Smuzhiyun 	err_mb = coda_read(dev, CODA9_REG_JPEG_PIC_ERRMB);
1233*4882a593Smuzhiyun 	if (err_mb)
1234*4882a593Smuzhiyun 		coda_dbg(1, ctx, "ERRMB: 0x%x\n", err_mb);
1235*4882a593Smuzhiyun 
1236*4882a593Smuzhiyun 	coda_write(dev, 0, CODA9_REG_JPEG_BBC_FLUSH_CMD);
1237*4882a593Smuzhiyun 
1238*4882a593Smuzhiyun 	dst_buf->flags &= ~(V4L2_BUF_FLAG_PFRAME | V4L2_BUF_FLAG_LAST);
1239*4882a593Smuzhiyun 	dst_buf->flags |= V4L2_BUF_FLAG_KEYFRAME;
1240*4882a593Smuzhiyun 	dst_buf->flags |= src_buf->flags & V4L2_BUF_FLAG_LAST;
1241*4882a593Smuzhiyun 
1242*4882a593Smuzhiyun 	v4l2_m2m_buf_copy_metadata(src_buf, dst_buf, false);
1243*4882a593Smuzhiyun 
1244*4882a593Smuzhiyun 	v4l2_m2m_buf_done(src_buf, VB2_BUF_STATE_DONE);
1245*4882a593Smuzhiyun 	coda_m2m_buf_done(ctx, dst_buf, err_mb ? VB2_BUF_STATE_ERROR :
1246*4882a593Smuzhiyun 						 VB2_BUF_STATE_DONE);
1247*4882a593Smuzhiyun 	mutex_unlock(&ctx->wakeup_mutex);
1248*4882a593Smuzhiyun 
1249*4882a593Smuzhiyun 	coda_dbg(1, ctx, "job finished: encoded frame (%u)%s\n",
1250*4882a593Smuzhiyun 		 dst_buf->sequence,
1251*4882a593Smuzhiyun 		 (dst_buf->flags & V4L2_BUF_FLAG_LAST) ? " (last)" : "");
1252*4882a593Smuzhiyun 
1253*4882a593Smuzhiyun 	/*
1254*4882a593Smuzhiyun 	 * Reset JPEG processing unit after each encode run to work
1255*4882a593Smuzhiyun 	 * around hangups when switching context between encoder and
1256*4882a593Smuzhiyun 	 * decoder.
1257*4882a593Smuzhiyun 	 */
1258*4882a593Smuzhiyun 	coda_hw_reset(ctx);
1259*4882a593Smuzhiyun }
1260*4882a593Smuzhiyun 
coda9_jpeg_encode_timeout(struct coda_ctx * ctx)1261*4882a593Smuzhiyun static void coda9_jpeg_encode_timeout(struct coda_ctx *ctx)
1262*4882a593Smuzhiyun {
1263*4882a593Smuzhiyun 	struct coda_dev *dev = ctx->dev;
1264*4882a593Smuzhiyun 	u32 end_addr, wr_ptr;
1265*4882a593Smuzhiyun 
1266*4882a593Smuzhiyun 	/* Handle missing BBC overflow interrupt via timeout */
1267*4882a593Smuzhiyun 	end_addr = coda_read(dev, CODA9_REG_JPEG_BBC_END_ADDR);
1268*4882a593Smuzhiyun 	wr_ptr = coda_read(dev, CODA9_REG_JPEG_BBC_WR_PTR);
1269*4882a593Smuzhiyun 	if (wr_ptr >= end_addr - 256) {
1270*4882a593Smuzhiyun 		v4l2_err(&dev->v4l2_dev, "JPEG too large for capture buffer\n");
1271*4882a593Smuzhiyun 		coda9_jpeg_finish_encode(ctx);
1272*4882a593Smuzhiyun 		return;
1273*4882a593Smuzhiyun 	}
1274*4882a593Smuzhiyun 
1275*4882a593Smuzhiyun 	coda_hw_reset(ctx);
1276*4882a593Smuzhiyun }
1277*4882a593Smuzhiyun 
coda9_jpeg_release(struct coda_ctx * ctx)1278*4882a593Smuzhiyun static void coda9_jpeg_release(struct coda_ctx *ctx)
1279*4882a593Smuzhiyun {
1280*4882a593Smuzhiyun 	int i;
1281*4882a593Smuzhiyun 
1282*4882a593Smuzhiyun 	if (ctx->params.jpeg_qmat_tab[0] == luma_q)
1283*4882a593Smuzhiyun 		ctx->params.jpeg_qmat_tab[0] = NULL;
1284*4882a593Smuzhiyun 	if (ctx->params.jpeg_qmat_tab[1] == chroma_q)
1285*4882a593Smuzhiyun 		ctx->params.jpeg_qmat_tab[1] = NULL;
1286*4882a593Smuzhiyun 	for (i = 0; i < 3; i++)
1287*4882a593Smuzhiyun 		kfree(ctx->params.jpeg_qmat_tab[i]);
1288*4882a593Smuzhiyun 	kfree(ctx->params.jpeg_huff_data);
1289*4882a593Smuzhiyun 	kfree(ctx->params.jpeg_huff_tab);
1290*4882a593Smuzhiyun }
1291*4882a593Smuzhiyun 
1292*4882a593Smuzhiyun const struct coda_context_ops coda9_jpeg_encode_ops = {
1293*4882a593Smuzhiyun 	.queue_init = coda_encoder_queue_init,
1294*4882a593Smuzhiyun 	.start_streaming = coda9_jpeg_start_encoding,
1295*4882a593Smuzhiyun 	.prepare_run = coda9_jpeg_prepare_encode,
1296*4882a593Smuzhiyun 	.finish_run = coda9_jpeg_finish_encode,
1297*4882a593Smuzhiyun 	.run_timeout = coda9_jpeg_encode_timeout,
1298*4882a593Smuzhiyun 	.release = coda9_jpeg_release,
1299*4882a593Smuzhiyun };
1300*4882a593Smuzhiyun 
1301*4882a593Smuzhiyun /*
1302*4882a593Smuzhiyun  * Decoder context operations
1303*4882a593Smuzhiyun  */
1304*4882a593Smuzhiyun 
coda9_jpeg_start_decoding(struct coda_ctx * ctx)1305*4882a593Smuzhiyun static int coda9_jpeg_start_decoding(struct coda_ctx *ctx)
1306*4882a593Smuzhiyun {
1307*4882a593Smuzhiyun 	ctx->params.jpeg_qmat_index[0] = 0;
1308*4882a593Smuzhiyun 	ctx->params.jpeg_qmat_index[1] = 1;
1309*4882a593Smuzhiyun 	ctx->params.jpeg_qmat_index[2] = 1;
1310*4882a593Smuzhiyun 	ctx->params.jpeg_qmat_tab[0] = luma_q;
1311*4882a593Smuzhiyun 	ctx->params.jpeg_qmat_tab[1] = chroma_q;
1312*4882a593Smuzhiyun 	/* nothing more to do here */
1313*4882a593Smuzhiyun 
1314*4882a593Smuzhiyun 	/* TODO: we could already scan the first header to get the chroma
1315*4882a593Smuzhiyun 	 * format.
1316*4882a593Smuzhiyun 	 */
1317*4882a593Smuzhiyun 
1318*4882a593Smuzhiyun 	return 0;
1319*4882a593Smuzhiyun }
1320*4882a593Smuzhiyun 
coda9_jpeg_prepare_decode(struct coda_ctx * ctx)1321*4882a593Smuzhiyun static int coda9_jpeg_prepare_decode(struct coda_ctx *ctx)
1322*4882a593Smuzhiyun {
1323*4882a593Smuzhiyun 	struct coda_dev *dev = ctx->dev;
1324*4882a593Smuzhiyun 	int aligned_width, aligned_height;
1325*4882a593Smuzhiyun 	int chroma_format;
1326*4882a593Smuzhiyun 	int ret;
1327*4882a593Smuzhiyun 	u32 val, dst_fourcc;
1328*4882a593Smuzhiyun 	struct coda_q_data *q_data_src, *q_data_dst;
1329*4882a593Smuzhiyun 	struct vb2_v4l2_buffer *src_buf, *dst_buf;
1330*4882a593Smuzhiyun 	int chroma_interleave;
1331*4882a593Smuzhiyun 
1332*4882a593Smuzhiyun 	src_buf = v4l2_m2m_next_src_buf(ctx->fh.m2m_ctx);
1333*4882a593Smuzhiyun 	dst_buf = v4l2_m2m_next_dst_buf(ctx->fh.m2m_ctx);
1334*4882a593Smuzhiyun 	q_data_src = get_q_data(ctx, V4L2_BUF_TYPE_VIDEO_OUTPUT);
1335*4882a593Smuzhiyun 	q_data_dst = get_q_data(ctx, V4L2_BUF_TYPE_VIDEO_CAPTURE);
1336*4882a593Smuzhiyun 	dst_fourcc = q_data_dst->fourcc;
1337*4882a593Smuzhiyun 
1338*4882a593Smuzhiyun 	if (vb2_get_plane_payload(&src_buf->vb2_buf, 0) == 0)
1339*4882a593Smuzhiyun 		vb2_set_plane_payload(&src_buf->vb2_buf, 0,
1340*4882a593Smuzhiyun 				      vb2_plane_size(&src_buf->vb2_buf, 0));
1341*4882a593Smuzhiyun 
1342*4882a593Smuzhiyun 	chroma_format = coda9_jpeg_chroma_format(q_data_dst->fourcc);
1343*4882a593Smuzhiyun 	if (chroma_format < 0) {
1344*4882a593Smuzhiyun 		v4l2_m2m_job_finish(ctx->dev->m2m_dev, ctx->fh.m2m_ctx);
1345*4882a593Smuzhiyun 		return chroma_format;
1346*4882a593Smuzhiyun 	}
1347*4882a593Smuzhiyun 
1348*4882a593Smuzhiyun 	ret = coda_jpeg_decode_header(ctx, &src_buf->vb2_buf);
1349*4882a593Smuzhiyun 	if (ret < 0) {
1350*4882a593Smuzhiyun 		v4l2_err(&dev->v4l2_dev, "failed to decode JPEG header: %d\n",
1351*4882a593Smuzhiyun 			 ret);
1352*4882a593Smuzhiyun 
1353*4882a593Smuzhiyun 		src_buf = v4l2_m2m_src_buf_remove(ctx->fh.m2m_ctx);
1354*4882a593Smuzhiyun 		dst_buf = v4l2_m2m_dst_buf_remove(ctx->fh.m2m_ctx);
1355*4882a593Smuzhiyun 		v4l2_m2m_buf_done(src_buf, VB2_BUF_STATE_DONE);
1356*4882a593Smuzhiyun 		v4l2_m2m_buf_done(dst_buf, VB2_BUF_STATE_DONE);
1357*4882a593Smuzhiyun 
1358*4882a593Smuzhiyun 		v4l2_m2m_job_finish(ctx->dev->m2m_dev, ctx->fh.m2m_ctx);
1359*4882a593Smuzhiyun 		return ret;
1360*4882a593Smuzhiyun 	}
1361*4882a593Smuzhiyun 
1362*4882a593Smuzhiyun 	/* Round image dimensions to multiple of MCU size */
1363*4882a593Smuzhiyun 	aligned_width = round_up(q_data_src->width, width_align[chroma_format]);
1364*4882a593Smuzhiyun 	aligned_height = round_up(q_data_src->height, height_align[chroma_format]);
1365*4882a593Smuzhiyun 	if (aligned_width != q_data_dst->bytesperline) {
1366*4882a593Smuzhiyun 		v4l2_err(&dev->v4l2_dev, "stride mismatch: %d != %d\n",
1367*4882a593Smuzhiyun 			 aligned_width, q_data_dst->bytesperline);
1368*4882a593Smuzhiyun 	}
1369*4882a593Smuzhiyun 
1370*4882a593Smuzhiyun 	coda_set_gdi_regs(ctx);
1371*4882a593Smuzhiyun 
1372*4882a593Smuzhiyun 	val = ctx->params.jpeg_huff_ac_index[0] << 12 |
1373*4882a593Smuzhiyun 	      ctx->params.jpeg_huff_ac_index[1] << 11 |
1374*4882a593Smuzhiyun 	      ctx->params.jpeg_huff_ac_index[2] << 10 |
1375*4882a593Smuzhiyun 	      ctx->params.jpeg_huff_dc_index[0] << 9 |
1376*4882a593Smuzhiyun 	      ctx->params.jpeg_huff_dc_index[1] << 8 |
1377*4882a593Smuzhiyun 	      ctx->params.jpeg_huff_dc_index[2] << 7;
1378*4882a593Smuzhiyun 	if (ctx->params.jpeg_huff_tab)
1379*4882a593Smuzhiyun 		val |= CODA9_JPEG_PIC_CTRL_USER_HUFFMAN_EN;
1380*4882a593Smuzhiyun 	coda_write(dev, val, CODA9_REG_JPEG_PIC_CTRL);
1381*4882a593Smuzhiyun 
1382*4882a593Smuzhiyun 	coda_write(dev, aligned_width << 16 | aligned_height,
1383*4882a593Smuzhiyun 			CODA9_REG_JPEG_PIC_SIZE);
1384*4882a593Smuzhiyun 
1385*4882a593Smuzhiyun 	chroma_interleave = (dst_fourcc == V4L2_PIX_FMT_NV12);
1386*4882a593Smuzhiyun 	coda_write(dev, 0, CODA9_REG_JPEG_ROT_INFO);
1387*4882a593Smuzhiyun 	coda_write(dev, bus_req_num[chroma_format], CODA9_REG_JPEG_OP_INFO);
1388*4882a593Smuzhiyun 	coda_write(dev, mcu_info[chroma_format], CODA9_REG_JPEG_MCU_INFO);
1389*4882a593Smuzhiyun 	coda_write(dev, 0, CODA9_REG_JPEG_SCL_INFO);
1390*4882a593Smuzhiyun 	coda_write(dev, chroma_interleave, CODA9_REG_JPEG_DPB_CONFIG);
1391*4882a593Smuzhiyun 	coda_write(dev, ctx->params.jpeg_restart_interval,
1392*4882a593Smuzhiyun 			CODA9_REG_JPEG_RST_INTVAL);
1393*4882a593Smuzhiyun 
1394*4882a593Smuzhiyun 	if (ctx->params.jpeg_huff_tab) {
1395*4882a593Smuzhiyun 		ret = coda9_jpeg_dec_huff_setup(ctx);
1396*4882a593Smuzhiyun 		if (ret < 0) {
1397*4882a593Smuzhiyun 			v4l2_err(&dev->v4l2_dev,
1398*4882a593Smuzhiyun 				 "failed to set up Huffman tables: %d\n", ret);
1399*4882a593Smuzhiyun 			v4l2_m2m_job_finish(ctx->dev->m2m_dev, ctx->fh.m2m_ctx);
1400*4882a593Smuzhiyun 			return ret;
1401*4882a593Smuzhiyun 		}
1402*4882a593Smuzhiyun 	}
1403*4882a593Smuzhiyun 
1404*4882a593Smuzhiyun 	coda9_jpeg_qmat_setup(ctx);
1405*4882a593Smuzhiyun 
1406*4882a593Smuzhiyun 	coda9_jpeg_dec_bbc_gbu_setup(ctx, &src_buf->vb2_buf,
1407*4882a593Smuzhiyun 				     ctx->jpeg_ecs_offset);
1408*4882a593Smuzhiyun 
1409*4882a593Smuzhiyun 	coda_write(dev, 0, CODA9_REG_JPEG_RST_INDEX);
1410*4882a593Smuzhiyun 	coda_write(dev, 0, CODA9_REG_JPEG_RST_COUNT);
1411*4882a593Smuzhiyun 
1412*4882a593Smuzhiyun 	coda_write(dev, 0, CODA9_REG_JPEG_DPCM_DIFF_Y);
1413*4882a593Smuzhiyun 	coda_write(dev, 0, CODA9_REG_JPEG_DPCM_DIFF_CB);
1414*4882a593Smuzhiyun 	coda_write(dev, 0, CODA9_REG_JPEG_DPCM_DIFF_CR);
1415*4882a593Smuzhiyun 
1416*4882a593Smuzhiyun 	coda_write(dev, 0, CODA9_REG_JPEG_ROT_INFO);
1417*4882a593Smuzhiyun 
1418*4882a593Smuzhiyun 	coda_write(dev, 1, CODA9_GDI_CONTROL);
1419*4882a593Smuzhiyun 	do {
1420*4882a593Smuzhiyun 		ret = coda_read(dev, CODA9_GDI_STATUS);
1421*4882a593Smuzhiyun 	} while (!ret);
1422*4882a593Smuzhiyun 
1423*4882a593Smuzhiyun 	val = (chroma_format << 17) | (chroma_interleave << 16) |
1424*4882a593Smuzhiyun 	      q_data_dst->bytesperline;
1425*4882a593Smuzhiyun 	if (ctx->tiled_map_type == GDI_TILED_FRAME_MB_RASTER_MAP)
1426*4882a593Smuzhiyun 		val |= 3 << 20;
1427*4882a593Smuzhiyun 	coda_write(dev, val, CODA9_GDI_INFO_CONTROL);
1428*4882a593Smuzhiyun 
1429*4882a593Smuzhiyun 	coda_write(dev, aligned_width << 16 | aligned_height,
1430*4882a593Smuzhiyun 			CODA9_GDI_INFO_PIC_SIZE);
1431*4882a593Smuzhiyun 
1432*4882a593Smuzhiyun 	coda_write_base(ctx, q_data_dst, dst_buf, CODA9_GDI_INFO_BASE_Y);
1433*4882a593Smuzhiyun 
1434*4882a593Smuzhiyun 	coda_write(dev, 0, CODA9_REG_JPEG_DPB_BASE00);
1435*4882a593Smuzhiyun 	coda_write(dev, 0, CODA9_GDI_CONTROL);
1436*4882a593Smuzhiyun 	coda_write(dev, 1, CODA9_GDI_PIC_INIT_HOST);
1437*4882a593Smuzhiyun 
1438*4882a593Smuzhiyun 	trace_coda_jpeg_run(ctx, src_buf);
1439*4882a593Smuzhiyun 
1440*4882a593Smuzhiyun 	coda_write(dev, 1, CODA9_REG_JPEG_PIC_START);
1441*4882a593Smuzhiyun 
1442*4882a593Smuzhiyun 	return 0;
1443*4882a593Smuzhiyun }
1444*4882a593Smuzhiyun 
coda9_jpeg_finish_decode(struct coda_ctx * ctx)1445*4882a593Smuzhiyun static void coda9_jpeg_finish_decode(struct coda_ctx *ctx)
1446*4882a593Smuzhiyun {
1447*4882a593Smuzhiyun 	struct coda_dev *dev = ctx->dev;
1448*4882a593Smuzhiyun 	struct vb2_v4l2_buffer *dst_buf, *src_buf;
1449*4882a593Smuzhiyun 	struct coda_q_data *q_data_dst;
1450*4882a593Smuzhiyun 	u32 err_mb;
1451*4882a593Smuzhiyun 
1452*4882a593Smuzhiyun 	err_mb = coda_read(dev, CODA9_REG_JPEG_PIC_ERRMB);
1453*4882a593Smuzhiyun 	if (err_mb)
1454*4882a593Smuzhiyun 		v4l2_err(&dev->v4l2_dev, "ERRMB: 0x%x\n", err_mb);
1455*4882a593Smuzhiyun 
1456*4882a593Smuzhiyun 	coda_write(dev, 0, CODA9_REG_JPEG_BBC_FLUSH_CMD);
1457*4882a593Smuzhiyun 
1458*4882a593Smuzhiyun 	/*
1459*4882a593Smuzhiyun 	 * Lock to make sure that a decoder stop command running in parallel
1460*4882a593Smuzhiyun 	 * will either already have marked src_buf as last, or it will wake up
1461*4882a593Smuzhiyun 	 * the capture queue after the buffers are returned.
1462*4882a593Smuzhiyun 	 */
1463*4882a593Smuzhiyun 	mutex_lock(&ctx->wakeup_mutex);
1464*4882a593Smuzhiyun 	src_buf = v4l2_m2m_src_buf_remove(ctx->fh.m2m_ctx);
1465*4882a593Smuzhiyun 	dst_buf = v4l2_m2m_dst_buf_remove(ctx->fh.m2m_ctx);
1466*4882a593Smuzhiyun 	dst_buf->sequence = ctx->osequence++;
1467*4882a593Smuzhiyun 
1468*4882a593Smuzhiyun 	trace_coda_jpeg_done(ctx, dst_buf);
1469*4882a593Smuzhiyun 
1470*4882a593Smuzhiyun 	dst_buf->flags &= ~(V4L2_BUF_FLAG_PFRAME | V4L2_BUF_FLAG_LAST);
1471*4882a593Smuzhiyun 	dst_buf->flags |= V4L2_BUF_FLAG_KEYFRAME;
1472*4882a593Smuzhiyun 	dst_buf->flags |= src_buf->flags & V4L2_BUF_FLAG_LAST;
1473*4882a593Smuzhiyun 
1474*4882a593Smuzhiyun 	v4l2_m2m_buf_copy_metadata(src_buf, dst_buf, false);
1475*4882a593Smuzhiyun 
1476*4882a593Smuzhiyun 	q_data_dst = get_q_data(ctx, V4L2_BUF_TYPE_VIDEO_CAPTURE);
1477*4882a593Smuzhiyun 	vb2_set_plane_payload(&dst_buf->vb2_buf, 0, q_data_dst->sizeimage);
1478*4882a593Smuzhiyun 
1479*4882a593Smuzhiyun 	v4l2_m2m_buf_done(src_buf, VB2_BUF_STATE_DONE);
1480*4882a593Smuzhiyun 	coda_m2m_buf_done(ctx, dst_buf, err_mb ? VB2_BUF_STATE_ERROR :
1481*4882a593Smuzhiyun 						 VB2_BUF_STATE_DONE);
1482*4882a593Smuzhiyun 
1483*4882a593Smuzhiyun 	mutex_unlock(&ctx->wakeup_mutex);
1484*4882a593Smuzhiyun 
1485*4882a593Smuzhiyun 	coda_dbg(1, ctx, "job finished: decoded frame (%u)%s\n",
1486*4882a593Smuzhiyun 		 dst_buf->sequence,
1487*4882a593Smuzhiyun 		 (dst_buf->flags & V4L2_BUF_FLAG_LAST) ? " (last)" : "");
1488*4882a593Smuzhiyun 
1489*4882a593Smuzhiyun 	/*
1490*4882a593Smuzhiyun 	 * Reset JPEG processing unit after each decode run to work
1491*4882a593Smuzhiyun 	 * around hangups when switching context between encoder and
1492*4882a593Smuzhiyun 	 * decoder.
1493*4882a593Smuzhiyun 	 */
1494*4882a593Smuzhiyun 	coda_hw_reset(ctx);
1495*4882a593Smuzhiyun }
1496*4882a593Smuzhiyun 
1497*4882a593Smuzhiyun const struct coda_context_ops coda9_jpeg_decode_ops = {
1498*4882a593Smuzhiyun 	.queue_init = coda_encoder_queue_init, /* non-bitstream operation */
1499*4882a593Smuzhiyun 	.start_streaming = coda9_jpeg_start_decoding,
1500*4882a593Smuzhiyun 	.prepare_run = coda9_jpeg_prepare_decode,
1501*4882a593Smuzhiyun 	.finish_run = coda9_jpeg_finish_decode,
1502*4882a593Smuzhiyun 	.release = coda9_jpeg_release,
1503*4882a593Smuzhiyun };
1504*4882a593Smuzhiyun 
coda9_jpeg_irq_handler(int irq,void * data)1505*4882a593Smuzhiyun irqreturn_t coda9_jpeg_irq_handler(int irq, void *data)
1506*4882a593Smuzhiyun {
1507*4882a593Smuzhiyun 	struct coda_dev *dev = data;
1508*4882a593Smuzhiyun 	struct coda_ctx *ctx;
1509*4882a593Smuzhiyun 	int status;
1510*4882a593Smuzhiyun 	int err_mb;
1511*4882a593Smuzhiyun 
1512*4882a593Smuzhiyun 	status = coda_read(dev, CODA9_REG_JPEG_PIC_STATUS);
1513*4882a593Smuzhiyun 	if (status == 0)
1514*4882a593Smuzhiyun 		return IRQ_HANDLED;
1515*4882a593Smuzhiyun 	coda_write(dev, status, CODA9_REG_JPEG_PIC_STATUS);
1516*4882a593Smuzhiyun 
1517*4882a593Smuzhiyun 	if (status & CODA9_JPEG_STATUS_OVERFLOW)
1518*4882a593Smuzhiyun 		v4l2_err(&dev->v4l2_dev, "JPEG overflow\n");
1519*4882a593Smuzhiyun 
1520*4882a593Smuzhiyun 	if (status & CODA9_JPEG_STATUS_BBC_INT)
1521*4882a593Smuzhiyun 		v4l2_err(&dev->v4l2_dev, "JPEG BBC interrupt\n");
1522*4882a593Smuzhiyun 
1523*4882a593Smuzhiyun 	if (status & CODA9_JPEG_STATUS_ERROR) {
1524*4882a593Smuzhiyun 		v4l2_err(&dev->v4l2_dev, "JPEG error\n");
1525*4882a593Smuzhiyun 
1526*4882a593Smuzhiyun 		err_mb = coda_read(dev, CODA9_REG_JPEG_PIC_ERRMB);
1527*4882a593Smuzhiyun 		if (err_mb) {
1528*4882a593Smuzhiyun 			v4l2_err(&dev->v4l2_dev,
1529*4882a593Smuzhiyun 				 "ERRMB: 0x%x: rst idx %d, mcu pos (%d,%d)\n",
1530*4882a593Smuzhiyun 				 err_mb, err_mb >> 24, (err_mb >> 12) & 0xfff,
1531*4882a593Smuzhiyun 				 err_mb & 0xfff);
1532*4882a593Smuzhiyun 		}
1533*4882a593Smuzhiyun 	}
1534*4882a593Smuzhiyun 
1535*4882a593Smuzhiyun 	ctx = v4l2_m2m_get_curr_priv(dev->m2m_dev);
1536*4882a593Smuzhiyun 	if (!ctx) {
1537*4882a593Smuzhiyun 		v4l2_err(&dev->v4l2_dev,
1538*4882a593Smuzhiyun 			 "Instance released before the end of transaction\n");
1539*4882a593Smuzhiyun 		mutex_unlock(&dev->coda_mutex);
1540*4882a593Smuzhiyun 		return IRQ_HANDLED;
1541*4882a593Smuzhiyun 	}
1542*4882a593Smuzhiyun 
1543*4882a593Smuzhiyun 	complete(&ctx->completion);
1544*4882a593Smuzhiyun 
1545*4882a593Smuzhiyun 	return IRQ_HANDLED;
1546*4882a593Smuzhiyun }
1547