xref: /linux/drivers/media/platform/renesas/rcar_jpu.c (revision c8b90d40d5bba8e6fba457b8a7c10d3c0d467e37)
1 // SPDX-License-Identifier: GPL-2.0
2 /*
3  * Author: Mikhail Ulyanov
4  * Copyright (C) 2014-2015 Cogent Embedded, Inc.  <source@cogentembedded.com>
5  * Copyright (C) 2014-2015 Renesas Electronics Corporation
6  *
7  * This is based on the drivers/media/platform/samsung/s5p-jpeg driver by
8  * Andrzej Pietrasiewicz and Jacek Anaszewski.
9  * Some portions of code inspired by VSP1 driver by Laurent Pinchart.
10  *
11  * TODO in order of priority:
12  *      1) Rotation
13  *      2) Cropping
14  *      3) V4L2_CID_JPEG_ACTIVE_MARKER
15  */
16 
17 #include <linux/unaligned.h>
18 #include <linux/clk.h>
19 #include <linux/err.h>
20 #include <linux/interrupt.h>
21 #include <linux/io.h>
22 #include <linux/kernel.h>
23 #include <linux/module.h>
24 #include <linux/of.h>
25 #include <linux/platform_device.h>
26 #include <linux/slab.h>
27 #include <linux/spinlock.h>
28 #include <linux/string.h>
29 #include <linux/videodev2.h>
30 #include <media/jpeg.h>
31 #include <media/v4l2-ctrls.h>
32 #include <media/v4l2-device.h>
33 #include <media/v4l2-event.h>
34 #include <media/v4l2-fh.h>
35 #include <media/v4l2-mem2mem.h>
36 #include <media/v4l2-ioctl.h>
37 #include <media/videobuf2-v4l2.h>
38 #include <media/videobuf2-dma-contig.h>
39 
40 
41 #define DRV_NAME "rcar_jpu"
42 
43 /*
44  * Align JPEG header end to cache line to make sure we will not have any issues
45  * with cache; additionally to requirement (33.3.27 R01UH0501EJ0100 Rev.1.00)
46  */
47 #define JPU_JPEG_HDR_SIZE		(ALIGN(0x258, L1_CACHE_BYTES))
48 #define JPU_JPEG_MAX_BYTES_PER_PIXEL	2	/* 16 bit precision format */
49 #define JPU_JPEG_MIN_SIZE		25	/* SOI + SOF + EOI */
50 #define JPU_JPEG_QTBL_SIZE		0x40
51 #define JPU_JPEG_HDCTBL_SIZE		0x1c
52 #define JPU_JPEG_HACTBL_SIZE		0xb2
53 #define JPU_JPEG_HEIGHT_OFFSET		0x91
54 #define JPU_JPEG_WIDTH_OFFSET		0x93
55 #define JPU_JPEG_SUBS_OFFSET		0x97
56 #define JPU_JPEG_QTBL_LUM_OFFSET	0x07
57 #define JPU_JPEG_QTBL_CHR_OFFSET	0x4c
58 #define JPU_JPEG_HDCTBL_LUM_OFFSET	0xa4
59 #define JPU_JPEG_HACTBL_LUM_OFFSET	0xc5
60 #define JPU_JPEG_HDCTBL_CHR_OFFSET	0x17c
61 #define JPU_JPEG_HACTBL_CHR_OFFSET	0x19d
62 #define JPU_JPEG_PADDING_OFFSET		0x24f
63 #define JPU_JPEG_LUM 0x00
64 #define JPU_JPEG_CHR 0x01
65 #define JPU_JPEG_DC  0x00
66 #define JPU_JPEG_AC  0x10
67 
68 #define JPU_JPEG_422 0x21
69 #define JPU_JPEG_420 0x22
70 
71 #define JPU_JPEG_DEFAULT_422_PIX_FMT V4L2_PIX_FMT_NV16M
72 #define JPU_JPEG_DEFAULT_420_PIX_FMT V4L2_PIX_FMT_NV12M
73 
74 #define JPU_RESET_TIMEOUT	100 /* ms */
75 #define JPU_JOB_TIMEOUT		300 /* ms */
76 #define JPU_MAX_QUALITY		4
77 #define JPU_WIDTH_MIN		16
78 #define JPU_HEIGHT_MIN		16
79 #define JPU_WIDTH_MAX		4096
80 #define JPU_HEIGHT_MAX		4096
81 #define JPU_MEMALIGN		8
82 
83 /* Flags that indicate a format can be used for capture/output */
84 #define JPU_FMT_TYPE_OUTPUT	0
85 #define JPU_FMT_TYPE_CAPTURE	1
86 #define JPU_ENC_CAPTURE		(1 << 0)
87 #define JPU_ENC_OUTPUT		(1 << 1)
88 #define JPU_DEC_CAPTURE		(1 << 2)
89 #define JPU_DEC_OUTPUT		(1 << 3)
90 
91 /*
92  * JPEG registers and bits
93  */
94 
95 /* JPEG code mode register */
96 #define JCMOD	0x00
97 #define JCMOD_PCTR		(1 << 7)
98 #define JCMOD_MSKIP_ENABLE	(1 << 5)
99 #define JCMOD_DSP_ENC		(0 << 3)
100 #define JCMOD_DSP_DEC		(1 << 3)
101 #define JCMOD_REDU		(7 << 0)
102 #define JCMOD_REDU_422		(1 << 0)
103 #define JCMOD_REDU_420		(2 << 0)
104 
105 /* JPEG code command register */
106 #define JCCMD	0x04
107 #define JCCMD_SRST	(1 << 12)
108 #define JCCMD_JEND	(1 << 2)
109 #define JCCMD_JSRT	(1 << 0)
110 
111 /* JPEG code quantization table number register */
112 #define JCQTN	0x0c
113 #define JCQTN_SHIFT(t)		(((t) - 1) << 1)
114 
115 /* JPEG code Huffman table number register */
116 #define JCHTN	0x10
117 #define JCHTN_AC_SHIFT(t)	(((t) << 1) - 1)
118 #define JCHTN_DC_SHIFT(t)	(((t) - 1) << 1)
119 
120 #define JCVSZU	0x1c /* JPEG code vertical size upper register */
121 #define JCVSZD	0x20 /* JPEG code vertical size lower register */
122 #define JCHSZU	0x24 /* JPEG code horizontal size upper register */
123 #define JCHSZD	0x28 /* JPEG code horizontal size lower register */
124 #define JCSZ_MASK 0xff /* JPEG code h/v size register contains only 1 byte*/
125 
126 #define JCDTCU	0x2c /* JPEG code data count upper register */
127 #define JCDTCM	0x30 /* JPEG code data count middle register */
128 #define JCDTCD	0x34 /* JPEG code data count lower register */
129 
130 /* JPEG interrupt enable register */
131 #define JINTE	0x38
132 #define JINTE_ERR		(7 << 5) /* INT5 + INT6 + INT7 */
133 #define JINTE_TRANSF_COMPL	(1 << 10)
134 
135 /* JPEG interrupt status register */
136 #define JINTS	0x3c
137 #define JINTS_MASK	0x7c68
138 #define JINTS_ERR		(1 << 5)
139 #define JINTS_PROCESS_COMPL	(1 << 6)
140 #define JINTS_TRANSF_COMPL	(1 << 10)
141 
142 #define JCDERR	0x40 /* JPEG code decode error register */
143 #define JCDERR_MASK	0xf /* JPEG code decode error register mask*/
144 
145 /* JPEG interface encoding */
146 #define JIFECNT	0x70
147 #define JIFECNT_INFT_422	0
148 #define JIFECNT_INFT_420	1
149 #define JIFECNT_SWAP_WB		(3 << 4) /* to JPU */
150 
151 #define JIFESYA1	0x74	/* encode source Y address register 1 */
152 #define JIFESCA1	0x78	/* encode source C address register 1 */
153 #define JIFESYA2	0x7c	/* encode source Y address register 2 */
154 #define JIFESCA2	0x80	/* encode source C address register 2 */
155 #define JIFESMW		0x84	/* encode source memory width register */
156 #define JIFESVSZ	0x88	/* encode source vertical size register */
157 #define JIFESHSZ	0x8c	/* encode source horizontal size register */
158 #define JIFEDA1		0x90	/* encode destination address register 1 */
159 #define JIFEDA2		0x94	/* encode destination address register 2 */
160 
161 /* JPEG decoding control register */
162 #define JIFDCNT	0xa0
163 #define JIFDCNT_SWAP_WB		(3 << 1) /* from JPU */
164 
165 #define JIFDSA1		0xa4	/* decode source address register 1 */
166 #define JIFDDMW		0xb0	/* decode destination  memory width register */
167 #define JIFDDVSZ	0xb4	/* decode destination  vert. size register */
168 #define JIFDDHSZ	0xb8	/* decode destination  horiz. size register */
169 #define JIFDDYA1	0xbc	/* decode destination  Y address register 1 */
170 #define JIFDDCA1	0xc0	/* decode destination  C address register 1 */
171 
172 #define JCQTBL(n)	(0x10000 + (n) * 0x40)	/* quantization tables regs */
173 #define JCHTBD(n)	(0x10100 + (n) * 0x100)	/* Huffman table DC regs */
174 #define JCHTBA(n)	(0x10120 + (n) * 0x100)	/* Huffman table AC regs */
175 
176 /**
177  * struct jpu - JPEG IP abstraction
178  * @mutex: the mutex protecting this structure
179  * @lock: spinlock protecting the device contexts
180  * @v4l2_dev: v4l2 device for mem2mem mode
181  * @vfd_encoder: video device node for encoder mem2mem mode
182  * @vfd_decoder: video device node for decoder mem2mem mode
183  * @m2m_dev: v4l2 mem2mem device data
184  * @curr: pointer to current context
185  * @regs: JPEG IP registers mapping
186  * @irq: JPEG IP irq
187  * @clk: JPEG IP clock
188  * @dev: JPEG IP struct device
189  * @ref_count: reference counter
190  */
191 struct jpu {
192 	struct mutex	mutex;
193 	spinlock_t	lock;
194 	struct v4l2_device	v4l2_dev;
195 	struct video_device	vfd_encoder;
196 	struct video_device	vfd_decoder;
197 	struct v4l2_m2m_dev	*m2m_dev;
198 	struct jpu_ctx		*curr;
199 
200 	void __iomem		*regs;
201 	unsigned int		irq;
202 	struct clk		*clk;
203 	struct device		*dev;
204 	int			ref_count;
205 };
206 
207 /**
208  * struct jpu_buffer - driver's specific video buffer
209  * @buf: m2m buffer
210  * @compr_quality: destination image quality in compression mode
211  * @subsampling: source image subsampling in decompression mode
212  */
213 struct jpu_buffer {
214 	struct v4l2_m2m_buffer buf;
215 	unsigned short	compr_quality;
216 	unsigned char	subsampling;
217 };
218 
219 /**
220  * struct jpu_fmt - driver's internal format data
221  * @fourcc: the fourcc code, 0 if not applicable
222  * @colorspace: the colorspace specifier
223  * @bpp: number of bits per pixel per plane
224  * @h_align: horizontal alignment order (align to 2^h_align)
225  * @v_align: vertical alignment order (align to 2^v_align)
226  * @subsampling: (horizontal:4 | vertical:4) subsampling factor
227  * @num_planes: number of planes
228  * @types: types of queue this format is applicable to
229  */
230 struct jpu_fmt {
231 	u32 fourcc;
232 	u32 colorspace;
233 	u8 bpp[2];
234 	u8 h_align;
235 	u8 v_align;
236 	u8 subsampling;
237 	u8 num_planes;
238 	u16 types;
239 };
240 
241 /**
242  * struct jpu_q_data - parameters of one queue
243  * @fmtinfo: driver-specific format of this queue
244  * @format: multiplanar format of this queue
245  * @sequence: sequence number
246  */
247 struct jpu_q_data {
248 	struct jpu_fmt *fmtinfo;
249 	struct v4l2_pix_format_mplane format;
250 	unsigned int sequence;
251 };
252 
253 /**
254  * struct jpu_ctx - the device context data
255  * @jpu: JPEG IP device for this context
256  * @encoder: compression (encode) operation or decompression (decode)
257  * @compr_quality: destination image quality in compression (encode) mode
258  * @out_q: source (output) queue information
259  * @cap_q: destination (capture) queue information
260  * @fh: file handler
261  * @ctrl_handler: controls handler
262  */
263 struct jpu_ctx {
264 	struct jpu		*jpu;
265 	bool			encoder;
266 	unsigned short		compr_quality;
267 	struct jpu_q_data	out_q;
268 	struct jpu_q_data	cap_q;
269 	struct v4l2_fh		fh;
270 	struct v4l2_ctrl_handler ctrl_handler;
271 };
272 
273  /**
274  * jpeg_buffer - description of memory containing input JPEG data
275  * @end: end position in the buffer
276  * @curr: current position in the buffer
277  */
278 struct jpeg_buffer {
279 	void *end;
280 	void *curr;
281 };
282 
283 static struct jpu_fmt jpu_formats[] = {
284 	{ V4L2_PIX_FMT_JPEG, V4L2_COLORSPACE_JPEG,
285 	  {0, 0}, 0, 0, 0, 1, JPU_ENC_CAPTURE | JPU_DEC_OUTPUT },
286 	{ V4L2_PIX_FMT_NV16M, V4L2_COLORSPACE_SRGB,
287 	  {8, 8}, 2, 2, JPU_JPEG_422, 2, JPU_ENC_OUTPUT | JPU_DEC_CAPTURE },
288 	{ V4L2_PIX_FMT_NV12M, V4L2_COLORSPACE_SRGB,
289 	  {8, 4}, 2, 2, JPU_JPEG_420, 2, JPU_ENC_OUTPUT | JPU_DEC_CAPTURE },
290 	{ V4L2_PIX_FMT_NV16, V4L2_COLORSPACE_SRGB,
291 	  {16, 0}, 2, 2, JPU_JPEG_422, 1, JPU_ENC_OUTPUT | JPU_DEC_CAPTURE },
292 	{ V4L2_PIX_FMT_NV12, V4L2_COLORSPACE_SRGB,
293 	  {12, 0}, 2, 2, JPU_JPEG_420, 1, JPU_ENC_OUTPUT | JPU_DEC_CAPTURE },
294 };
295 
296 static const u8 zigzag[] = {
297 	0x03, 0x02, 0x0b, 0x13, 0x0a, 0x01, 0x00, 0x09,
298 	0x12, 0x1b, 0x23, 0x1a, 0x11, 0x08, 0x07, 0x06,
299 	0x0f, 0x10, 0x19, 0x22, 0x2b, 0x33, 0x2a, 0x21,
300 	0x18, 0x17, 0x0e, 0x05, 0x04, 0x0d, 0x16, 0x1f,
301 	0x20, 0x29, 0x32, 0x3b, 0x3a, 0x31, 0x28, 0x27,
302 	0x1e, 0x15, 0x0e, 0x14, 0x10, 0x26, 0x2f, 0x30,
303 	0x39, 0x38, 0x37, 0x2e, 0x25, 0x1c, 0x24, 0x2b,
304 	0x36, 0x3f, 0x3e, 0x35, 0x2c, 0x34, 0x3d, 0x3c
305 };
306 
307 #define QTBL_SIZE (ALIGN(JPU_JPEG_QTBL_SIZE, \
308 			  sizeof(unsigned int)) / sizeof(unsigned int))
309 #define HDCTBL_SIZE (ALIGN(JPU_JPEG_HDCTBL_SIZE, \
310 			  sizeof(unsigned int)) / sizeof(unsigned int))
311 #define HACTBL_SIZE (ALIGN(JPU_JPEG_HACTBL_SIZE, \
312 			  sizeof(unsigned int)) / sizeof(unsigned int))
313 /*
314  * Start of image; Quantization tables
315  * SOF0 (17 bytes payload) is Baseline DCT - Sample precision, height, width,
316  * Number of image components, (Ci:8 - Hi:4 - Vi:4 - Tq:8) * 3 - Y,Cb,Cr;
317  * Huffman tables; Padding with 0xff (33.3.27 R01UH0501EJ0100 Rev.1.00)
318  */
319 #define JPU_JPEG_HDR_BLOB {                                                    \
320 	0xff, JPEG_MARKER_SOI, 0xff, JPEG_MARKER_DQT, 0x00,		       \
321 	JPU_JPEG_QTBL_SIZE + 0x3, JPU_JPEG_LUM,				       \
322 	[JPU_JPEG_QTBL_LUM_OFFSET ...					       \
323 		JPU_JPEG_QTBL_LUM_OFFSET + JPU_JPEG_QTBL_SIZE - 1] = 0x00,     \
324 	0xff, JPEG_MARKER_DQT, 0x00, JPU_JPEG_QTBL_SIZE + 0x3, JPU_JPEG_CHR,   \
325 	[JPU_JPEG_QTBL_CHR_OFFSET ... JPU_JPEG_QTBL_CHR_OFFSET +               \
326 		JPU_JPEG_QTBL_SIZE - 1] = 0x00,				       \
327 	0xff, JPEG_MARKER_SOF0, 0x00, 0x11, 0x08,			       \
328 	[JPU_JPEG_HEIGHT_OFFSET ... JPU_JPEG_HEIGHT_OFFSET + 1] = 0x00,        \
329 	[JPU_JPEG_WIDTH_OFFSET ... JPU_JPEG_WIDTH_OFFSET + 1] = 0x00,          \
330 	0x03, 0x01, [JPU_JPEG_SUBS_OFFSET] = 0x00, JPU_JPEG_LUM,               \
331 	0x02, 0x11, JPU_JPEG_CHR, 0x03, 0x11, JPU_JPEG_CHR,                    \
332 	0xff, JPEG_MARKER_DHT, 0x00, JPU_JPEG_HDCTBL_SIZE + 0x3,	       \
333 	JPU_JPEG_LUM | JPU_JPEG_DC,					       \
334 	[JPU_JPEG_HDCTBL_LUM_OFFSET ...                                        \
335 		JPU_JPEG_HDCTBL_LUM_OFFSET + JPU_JPEG_HDCTBL_SIZE - 1] = 0x00, \
336 	0xff, JPEG_MARKER_DHT, 0x00, JPU_JPEG_HACTBL_SIZE + 0x3,	       \
337 	JPU_JPEG_LUM | JPU_JPEG_AC,					       \
338 	[JPU_JPEG_HACTBL_LUM_OFFSET ...                                        \
339 		JPU_JPEG_HACTBL_LUM_OFFSET + JPU_JPEG_HACTBL_SIZE - 1] = 0x00, \
340 	0xff, JPEG_MARKER_DHT, 0x00, JPU_JPEG_HDCTBL_SIZE + 0x3,	       \
341 	JPU_JPEG_CHR | JPU_JPEG_DC,					       \
342 	[JPU_JPEG_HDCTBL_CHR_OFFSET ...                                        \
343 		JPU_JPEG_HDCTBL_CHR_OFFSET + JPU_JPEG_HDCTBL_SIZE - 1] = 0x00, \
344 	0xff, JPEG_MARKER_DHT, 0x00, JPU_JPEG_HACTBL_SIZE + 0x3,	       \
345 	JPU_JPEG_CHR | JPU_JPEG_AC,					       \
346 	[JPU_JPEG_HACTBL_CHR_OFFSET ...                                        \
347 		JPU_JPEG_HACTBL_CHR_OFFSET + JPU_JPEG_HACTBL_SIZE - 1] = 0x00, \
348 	[JPU_JPEG_PADDING_OFFSET ... JPU_JPEG_HDR_SIZE - 1] = 0xff             \
349 }
350 
351 static unsigned char jpeg_hdrs[JPU_MAX_QUALITY][JPU_JPEG_HDR_SIZE] = {
352 	[0 ... JPU_MAX_QUALITY - 1] = JPU_JPEG_HDR_BLOB
353 };
354 
355 static const unsigned int qtbl_lum[JPU_MAX_QUALITY][QTBL_SIZE] = {
356 	{
357 		0x14101927, 0x322e3e44, 0x10121726, 0x26354144,
358 		0x19171f26, 0x35414444, 0x27262635, 0x41444444,
359 		0x32263541, 0x44444444, 0x2e354144, 0x44444444,
360 		0x3e414444, 0x44444444, 0x44444444, 0x44444444
361 	},
362 	{
363 		0x100b0b10, 0x171b1f1e, 0x0b0c0c0f, 0x1417171e,
364 		0x0b0c0d10, 0x171a232f, 0x100f1017, 0x1a252f40,
365 		0x1714171a, 0x27334040, 0x1b171a25, 0x33404040,
366 		0x1f17232f, 0x40404040, 0x1e1e2f40, 0x40404040
367 	},
368 	{
369 		0x0c08080c, 0x11151817, 0x0809090b, 0x0f131217,
370 		0x08090a0c, 0x13141b24, 0x0c0b0c15, 0x141c2435,
371 		0x110f1314, 0x1e27333b, 0x1513141c, 0x27333b3b,
372 		0x18121b24, 0x333b3b3b, 0x17172435, 0x3b3b3b3b
373 	},
374 	{
375 		0x08060608, 0x0c0e1011, 0x06060608, 0x0a0d0c0f,
376 		0x06060708, 0x0d0e1218, 0x0808080e, 0x0d131823,
377 		0x0c0a0d0d, 0x141a2227, 0x0e0d0e13, 0x1a222727,
378 		0x100c1318, 0x22272727, 0x110f1823, 0x27272727
379 	}
380 };
381 
382 static const unsigned int qtbl_chr[JPU_MAX_QUALITY][QTBL_SIZE] = {
383 	{
384 		0x15192026, 0x36444444, 0x191c1826, 0x36444444,
385 		0x2018202b, 0x42444444, 0x26262b35, 0x44444444,
386 		0x36424444, 0x44444444, 0x44444444, 0x44444444,
387 		0x44444444, 0x44444444, 0x44444444, 0x44444444
388 	},
389 	{
390 		0x110f1115, 0x141a2630, 0x0f131211, 0x141a232b,
391 		0x11121416, 0x1a1e2e35, 0x1511161c, 0x1e273540,
392 		0x14141a1e, 0x27304040, 0x1a1a1e27, 0x303f4040,
393 		0x26232e35, 0x40404040, 0x302b3540, 0x40404040
394 	},
395 	{
396 		0x0d0b0d10, 0x14141d25, 0x0b0e0e0e, 0x10141a20,
397 		0x0d0e0f11, 0x14172328, 0x100e1115, 0x171e2832,
398 		0x14101417, 0x1e25323b, 0x1414171e, 0x25303b3b,
399 		0x1d1a2328, 0x323b3b3b, 0x25202832, 0x3b3b3b3b
400 	},
401 	{
402 		0x0908090b, 0x0e111318, 0x080a090b, 0x0e0d1116,
403 		0x09090d0e, 0x0d0f171a, 0x0b0b0e0e, 0x0f141a21,
404 		0x0e0e0d0f, 0x14182127, 0x110d0f14, 0x18202727,
405 		0x1311171a, 0x21272727, 0x18161a21, 0x27272727
406 	}
407 };
408 
409 static const unsigned int hdctbl_lum[HDCTBL_SIZE] = {
410 	0x00010501, 0x01010101, 0x01000000, 0x00000000,
411 	0x00010203, 0x04050607, 0x08090a0b
412 };
413 
414 static const unsigned int hdctbl_chr[HDCTBL_SIZE] = {
415 	0x00010501, 0x01010101, 0x01000000, 0x00000000,
416 	0x00010203, 0x04050607, 0x08090a0b
417 };
418 
419 static const unsigned int hactbl_lum[HACTBL_SIZE] = {
420 	0x00020103, 0x03020403, 0x05050404, 0x0000017d, 0x01020300, 0x04110512,
421 	0x21314106, 0x13516107,	0x22711432, 0x8191a108, 0x2342b1c1, 0x1552d1f0,
422 	0x24336272, 0x82090a16, 0x1718191a, 0x25262728, 0x292a3435, 0x36373839,
423 	0x3a434445, 0x46474849, 0x4a535455, 0x56575859, 0x5a636465, 0x66676869,
424 	0x6a737475, 0x76777879, 0x7a838485, 0x86878889, 0x8a929394, 0x95969798,
425 	0x999aa2a3, 0xa4a5a6a7, 0xa8a9aab2, 0xb3b4b5b6, 0xb7b8b9ba, 0xc2c3c4c5,
426 	0xc6c7c8c9, 0xcad2d3d4, 0xd5d6d7d8, 0xd9dae1e2, 0xe3e4e5e6, 0xe7e8e9ea,
427 	0xf1f2f3f4, 0xf5f6f7f8, 0xf9fa0000
428 };
429 
430 static const unsigned int hactbl_chr[HACTBL_SIZE] = {
431 	0x00020103, 0x03020403, 0x05050404, 0x0000017d, 0x01020300, 0x04110512,
432 	0x21314106, 0x13516107,	0x22711432, 0x8191a108, 0x2342b1c1, 0x1552d1f0,
433 	0x24336272, 0x82090a16, 0x1718191a, 0x25262728, 0x292a3435, 0x36373839,
434 	0x3a434445, 0x46474849, 0x4a535455, 0x56575859, 0x5a636465, 0x66676869,
435 	0x6a737475, 0x76777879, 0x7a838485, 0x86878889, 0x8a929394, 0x95969798,
436 	0x999aa2a3, 0xa4a5a6a7, 0xa8a9aab2, 0xb3b4b5b6, 0xb7b8b9ba, 0xc2c3c4c5,
437 	0xc6c7c8c9, 0xcad2d3d4, 0xd5d6d7d8, 0xd9dae1e2, 0xe3e4e5e6, 0xe7e8e9ea,
438 	0xf1f2f3f4, 0xf5f6f7f8, 0xf9fa0000
439 };
440 
441 static const char *error_to_text[16] = {
442 	"Normal",
443 	"SOI not detected",
444 	"SOF1 to SOFF detected",
445 	"Subsampling not detected",
446 	"SOF accuracy error",
447 	"DQT accuracy error",
448 	"Component error 1",
449 	"Component error 2",
450 	"SOF0, DQT, and DHT not detected when SOS detected",
451 	"SOS not detected",
452 	"EOI not detected",
453 	"Restart interval data number error detected",
454 	"Image size error",
455 	"Last MCU data number error",
456 	"Block data number error",
457 	"Unknown"
458 };
459 
460 static struct jpu_buffer *vb2_to_jpu_buffer(struct vb2_v4l2_buffer *vb)
461 {
462 	struct v4l2_m2m_buffer *b =
463 		container_of(vb, struct v4l2_m2m_buffer, vb);
464 
465 	return container_of(b, struct jpu_buffer, buf);
466 }
467 
468 static u32 jpu_read(struct jpu *jpu, unsigned int reg)
469 {
470 	return ioread32(jpu->regs + reg);
471 }
472 
473 static void jpu_write(struct jpu *jpu, u32 val, unsigned int reg)
474 {
475 	iowrite32(val, jpu->regs + reg);
476 }
477 
478 static struct jpu_ctx *ctrl_to_ctx(struct v4l2_ctrl *c)
479 {
480 	return container_of(c->handler, struct jpu_ctx, ctrl_handler);
481 }
482 
483 static struct jpu_ctx *fh_to_ctx(struct v4l2_fh *fh)
484 {
485 	return container_of(fh, struct jpu_ctx, fh);
486 }
487 
488 static void jpu_set_tbl(struct jpu *jpu, u32 reg, const unsigned int *tbl,
489 			unsigned int len) {
490 	unsigned int i;
491 
492 	for (i = 0; i < len; i++)
493 		jpu_write(jpu, tbl[i], reg + (i << 2));
494 }
495 
496 static void jpu_set_qtbl(struct jpu *jpu, unsigned short quality)
497 {
498 	jpu_set_tbl(jpu, JCQTBL(0), qtbl_lum[quality], QTBL_SIZE);
499 	jpu_set_tbl(jpu, JCQTBL(1), qtbl_chr[quality], QTBL_SIZE);
500 }
501 
502 static void jpu_set_htbl(struct jpu *jpu)
503 {
504 	jpu_set_tbl(jpu, JCHTBD(0), hdctbl_lum, HDCTBL_SIZE);
505 	jpu_set_tbl(jpu, JCHTBA(0), hactbl_lum, HACTBL_SIZE);
506 	jpu_set_tbl(jpu, JCHTBD(1), hdctbl_chr, HDCTBL_SIZE);
507 	jpu_set_tbl(jpu, JCHTBA(1), hactbl_chr, HACTBL_SIZE);
508 }
509 
510 static int jpu_wait_reset(struct jpu *jpu)
511 {
512 	unsigned long timeout;
513 
514 	timeout = jiffies + msecs_to_jiffies(JPU_RESET_TIMEOUT);
515 
516 	while (jpu_read(jpu, JCCMD) & JCCMD_SRST) {
517 		if (time_after(jiffies, timeout)) {
518 			dev_err(jpu->dev, "timed out in reset\n");
519 			return -ETIMEDOUT;
520 		}
521 		schedule();
522 	}
523 
524 	return 0;
525 }
526 
527 static int jpu_reset(struct jpu *jpu)
528 {
529 	jpu_write(jpu, JCCMD_SRST, JCCMD);
530 	return jpu_wait_reset(jpu);
531 }
532 
533 /*
534  * ============================================================================
535  * video ioctl operations
536  * ============================================================================
537  */
538 static void put_qtbl(u8 *p, const u8 *qtbl)
539 {
540 	unsigned int i;
541 
542 	for (i = 0; i < ARRAY_SIZE(zigzag); i++)
543 		p[i] = *(qtbl + zigzag[i]);
544 }
545 
546 static void put_htbl(u8 *p, const u8 *htbl, unsigned int len)
547 {
548 	unsigned int i, j;
549 
550 	for (i = 0; i < len; i += 4)
551 		for (j = 0; j < 4 && (i + j) < len; ++j)
552 			p[i + j] = htbl[i + 3 - j];
553 }
554 
555 static void jpu_generate_hdr(unsigned short quality, unsigned char *p)
556 {
557 	put_qtbl(p + JPU_JPEG_QTBL_LUM_OFFSET, (const u8 *)qtbl_lum[quality]);
558 	put_qtbl(p + JPU_JPEG_QTBL_CHR_OFFSET, (const u8 *)qtbl_chr[quality]);
559 
560 	put_htbl(p + JPU_JPEG_HDCTBL_LUM_OFFSET, (const u8 *)hdctbl_lum,
561 		 JPU_JPEG_HDCTBL_SIZE);
562 	put_htbl(p + JPU_JPEG_HACTBL_LUM_OFFSET, (const u8 *)hactbl_lum,
563 		 JPU_JPEG_HACTBL_SIZE);
564 
565 	put_htbl(p + JPU_JPEG_HDCTBL_CHR_OFFSET, (const u8 *)hdctbl_chr,
566 		 JPU_JPEG_HDCTBL_SIZE);
567 	put_htbl(p + JPU_JPEG_HACTBL_CHR_OFFSET, (const u8 *)hactbl_chr,
568 		 JPU_JPEG_HACTBL_SIZE);
569 }
570 
571 static int get_byte(struct jpeg_buffer *buf)
572 {
573 	if (buf->curr >= buf->end)
574 		return -1;
575 
576 	return *(u8 *)buf->curr++;
577 }
578 
579 static int get_word_be(struct jpeg_buffer *buf, unsigned int *word)
580 {
581 	if (buf->end - buf->curr < 2)
582 		return -1;
583 
584 	*word = get_unaligned_be16(buf->curr);
585 	buf->curr += 2;
586 
587 	return 0;
588 }
589 
590 static void skip(struct jpeg_buffer *buf, unsigned long len)
591 {
592 	buf->curr += min((unsigned long)(buf->end - buf->curr), len);
593 }
594 
595 static u8 jpu_parse_hdr(void *buffer, unsigned long size, unsigned int *width,
596 			  unsigned int *height)
597 {
598 	struct jpeg_buffer jpeg_buffer;
599 	unsigned int word;
600 	bool soi = false;
601 
602 	jpeg_buffer.end = buffer + size;
603 	jpeg_buffer.curr = buffer;
604 
605 	/*
606 	 * basic size check and EOI - we don't want to let JPU cross
607 	 * buffer bounds in any case. Hope it's stopping by EOI.
608 	 */
609 	if (size < JPU_JPEG_MIN_SIZE ||
610 	    *(u8 *)(buffer + size - 1) != JPEG_MARKER_EOI)
611 		return 0;
612 
613 	for (;;) {
614 		int c;
615 
616 		/* skip preceding filler bytes */
617 		do
618 			c = get_byte(&jpeg_buffer);
619 		while (c == 0xff || c == 0);
620 
621 		if (!soi && c == JPEG_MARKER_SOI) {
622 			soi = true;
623 			continue;
624 		} else if (soi != (c != JPEG_MARKER_SOI))
625 			return 0;
626 
627 		switch (c) {
628 		case JPEG_MARKER_SOF0: /* SOF0: baseline JPEG */
629 			skip(&jpeg_buffer, 3); /* segment length and bpp */
630 			if (get_word_be(&jpeg_buffer, height) ||
631 			    get_word_be(&jpeg_buffer, width) ||
632 			    get_byte(&jpeg_buffer) != 3) /* YCbCr only */
633 				return 0;
634 
635 			skip(&jpeg_buffer, 1);
636 			return get_byte(&jpeg_buffer);
637 		case JPEG_MARKER_DHT:
638 		case JPEG_MARKER_DQT:
639 		case JPEG_MARKER_COM:
640 		case JPEG_MARKER_DRI:
641 		case JPEG_MARKER_APP0 ... JPEG_MARKER_APP0 + 0x0f:
642 			if (get_word_be(&jpeg_buffer, &word))
643 				return 0;
644 			skip(&jpeg_buffer, (long)word - 2);
645 			break;
646 		case 0:
647 			break;
648 		default:
649 			return 0;
650 		}
651 	}
652 
653 	return 0;
654 }
655 
656 static int jpu_querycap(struct file *file, void *priv,
657 			struct v4l2_capability *cap)
658 {
659 	struct jpu_ctx *ctx = fh_to_ctx(priv);
660 
661 	if (ctx->encoder)
662 		strscpy(cap->card, DRV_NAME " encoder", sizeof(cap->card));
663 	else
664 		strscpy(cap->card, DRV_NAME " decoder", sizeof(cap->card));
665 
666 	strscpy(cap->driver, DRV_NAME, sizeof(cap->driver));
667 	memset(cap->reserved, 0, sizeof(cap->reserved));
668 
669 	return 0;
670 }
671 
672 static struct jpu_fmt *jpu_find_format(bool encoder, u32 pixelformat,
673 				       unsigned int fmt_type)
674 {
675 	unsigned int i, fmt_flag;
676 
677 	if (encoder)
678 		fmt_flag = fmt_type == JPU_FMT_TYPE_OUTPUT ? JPU_ENC_OUTPUT :
679 							     JPU_ENC_CAPTURE;
680 	else
681 		fmt_flag = fmt_type == JPU_FMT_TYPE_OUTPUT ? JPU_DEC_OUTPUT :
682 							     JPU_DEC_CAPTURE;
683 
684 	for (i = 0; i < ARRAY_SIZE(jpu_formats); i++) {
685 		struct jpu_fmt *fmt = &jpu_formats[i];
686 
687 		if (fmt->fourcc == pixelformat && fmt->types & fmt_flag)
688 			return fmt;
689 	}
690 
691 	return NULL;
692 }
693 
694 static int jpu_enum_fmt(struct v4l2_fmtdesc *f, u32 type)
695 {
696 	unsigned int i, num = 0;
697 
698 	for (i = 0; i < ARRAY_SIZE(jpu_formats); ++i) {
699 		if (jpu_formats[i].types & type) {
700 			if (num == f->index)
701 				break;
702 			++num;
703 		}
704 	}
705 
706 	if (i >= ARRAY_SIZE(jpu_formats))
707 		return -EINVAL;
708 
709 	f->pixelformat = jpu_formats[i].fourcc;
710 
711 	return 0;
712 }
713 
714 static int jpu_enum_fmt_cap(struct file *file, void *priv,
715 			    struct v4l2_fmtdesc *f)
716 {
717 	struct jpu_ctx *ctx = fh_to_ctx(priv);
718 
719 	return jpu_enum_fmt(f, ctx->encoder ? JPU_ENC_CAPTURE :
720 			    JPU_DEC_CAPTURE);
721 }
722 
723 static int jpu_enum_fmt_out(struct file *file, void *priv,
724 			    struct v4l2_fmtdesc *f)
725 {
726 	struct jpu_ctx *ctx = fh_to_ctx(priv);
727 
728 	return jpu_enum_fmt(f, ctx->encoder ? JPU_ENC_OUTPUT : JPU_DEC_OUTPUT);
729 }
730 
731 static struct jpu_q_data *jpu_get_q_data(struct jpu_ctx *ctx,
732 					 enum v4l2_buf_type type)
733 {
734 	if (V4L2_TYPE_IS_OUTPUT(type))
735 		return &ctx->out_q;
736 	else
737 		return &ctx->cap_q;
738 }
739 
740 static void jpu_bound_align_image(u32 *w, unsigned int w_min,
741 				  unsigned int w_max, unsigned int w_align,
742 				  u32 *h, unsigned int h_min,
743 				  unsigned int h_max, unsigned int h_align)
744 {
745 	unsigned int width, height, w_step, h_step;
746 
747 	width = *w;
748 	height = *h;
749 
750 	w_step = 1U << w_align;
751 	h_step = 1U << h_align;
752 	v4l_bound_align_image(w, w_min, w_max, w_align, h, h_min, h_max,
753 			      h_align, 3);
754 
755 	if (*w < width && *w + w_step < w_max)
756 		*w += w_step;
757 	if (*h < height && *h + h_step < h_max)
758 		*h += h_step;
759 }
760 
761 static int __jpu_try_fmt(struct jpu_ctx *ctx, struct jpu_fmt **fmtinfo,
762 			 struct v4l2_pix_format_mplane *pix,
763 			 enum v4l2_buf_type type)
764 {
765 	struct jpu_fmt *fmt;
766 	unsigned int f_type, w, h;
767 
768 	f_type = V4L2_TYPE_IS_OUTPUT(type) ? JPU_FMT_TYPE_OUTPUT :
769 						JPU_FMT_TYPE_CAPTURE;
770 
771 	fmt = jpu_find_format(ctx->encoder, pix->pixelformat, f_type);
772 	if (!fmt) {
773 		unsigned int pixelformat;
774 
775 		dev_dbg(ctx->jpu->dev, "unknown format; set default format\n");
776 		if (ctx->encoder)
777 			pixelformat = f_type == JPU_FMT_TYPE_OUTPUT ?
778 				V4L2_PIX_FMT_NV16M : V4L2_PIX_FMT_JPEG;
779 		else
780 			pixelformat = f_type == JPU_FMT_TYPE_CAPTURE ?
781 				V4L2_PIX_FMT_NV16M : V4L2_PIX_FMT_JPEG;
782 		fmt = jpu_find_format(ctx->encoder, pixelformat, f_type);
783 	}
784 
785 	pix->pixelformat = fmt->fourcc;
786 	pix->colorspace = fmt->colorspace;
787 	pix->field = V4L2_FIELD_NONE;
788 	pix->num_planes = fmt->num_planes;
789 
790 	jpu_bound_align_image(&pix->width, JPU_WIDTH_MIN, JPU_WIDTH_MAX,
791 			      fmt->h_align, &pix->height, JPU_HEIGHT_MIN,
792 			      JPU_HEIGHT_MAX, fmt->v_align);
793 
794 	w = pix->width;
795 	h = pix->height;
796 
797 	if (fmt->fourcc == V4L2_PIX_FMT_JPEG) {
798 		/* ignore userspaces's sizeimage for encoding */
799 		if (pix->plane_fmt[0].sizeimage <= 0 || ctx->encoder)
800 			pix->plane_fmt[0].sizeimage = JPU_JPEG_HDR_SIZE +
801 				(JPU_JPEG_MAX_BYTES_PER_PIXEL * w * h);
802 		pix->plane_fmt[0].bytesperline = 0;
803 	} else {
804 		unsigned int i, bpl = 0;
805 
806 		for (i = 0; i < pix->num_planes; ++i)
807 			bpl = max(bpl, pix->plane_fmt[i].bytesperline);
808 
809 		bpl = clamp_t(unsigned int, bpl, w, JPU_WIDTH_MAX);
810 		bpl = round_up(bpl, JPU_MEMALIGN);
811 
812 		for (i = 0; i < pix->num_planes; ++i) {
813 			pix->plane_fmt[i].bytesperline = bpl;
814 			pix->plane_fmt[i].sizeimage = bpl * h * fmt->bpp[i] / 8;
815 		}
816 	}
817 
818 	if (fmtinfo)
819 		*fmtinfo = fmt;
820 
821 	return 0;
822 }
823 
824 static int jpu_try_fmt(struct file *file, void *priv, struct v4l2_format *f)
825 {
826 	struct jpu_ctx *ctx = fh_to_ctx(priv);
827 
828 	if (!v4l2_m2m_get_vq(ctx->fh.m2m_ctx, f->type))
829 		return -EINVAL;
830 
831 	return __jpu_try_fmt(ctx, NULL, &f->fmt.pix_mp, f->type);
832 }
833 
834 static int jpu_s_fmt(struct file *file, void *priv, struct v4l2_format *f)
835 {
836 	struct vb2_queue *vq;
837 	struct jpu_ctx *ctx = fh_to_ctx(priv);
838 	struct v4l2_m2m_ctx *m2m_ctx = ctx->fh.m2m_ctx;
839 	struct jpu_fmt *fmtinfo;
840 	struct jpu_q_data *q_data;
841 	int ret;
842 
843 	vq = v4l2_m2m_get_vq(m2m_ctx, f->type);
844 	if (!vq)
845 		return -EINVAL;
846 
847 	if (vb2_is_busy(vq)) {
848 		v4l2_err(&ctx->jpu->v4l2_dev, "%s queue busy\n", __func__);
849 		return -EBUSY;
850 	}
851 
852 	ret = __jpu_try_fmt(ctx, &fmtinfo, &f->fmt.pix_mp, f->type);
853 	if (ret < 0)
854 		return ret;
855 
856 	q_data = jpu_get_q_data(ctx, f->type);
857 
858 	q_data->format = f->fmt.pix_mp;
859 	q_data->fmtinfo = fmtinfo;
860 
861 	return 0;
862 }
863 
864 static int jpu_g_fmt(struct file *file, void *priv, struct v4l2_format *f)
865 {
866 	struct jpu_q_data *q_data;
867 	struct jpu_ctx *ctx = fh_to_ctx(priv);
868 
869 	if (!v4l2_m2m_get_vq(ctx->fh.m2m_ctx, f->type))
870 		return -EINVAL;
871 
872 	q_data = jpu_get_q_data(ctx, f->type);
873 	f->fmt.pix_mp = q_data->format;
874 
875 	return 0;
876 }
877 
878 /*
879  * V4L2 controls
880  */
881 static int jpu_s_ctrl(struct v4l2_ctrl *ctrl)
882 {
883 	struct jpu_ctx *ctx = ctrl_to_ctx(ctrl);
884 	unsigned long flags;
885 
886 	spin_lock_irqsave(&ctx->jpu->lock, flags);
887 	if (ctrl->id == V4L2_CID_JPEG_COMPRESSION_QUALITY)
888 		ctx->compr_quality = ctrl->val;
889 	spin_unlock_irqrestore(&ctx->jpu->lock, flags);
890 
891 	return 0;
892 }
893 
894 static const struct v4l2_ctrl_ops jpu_ctrl_ops = {
895 	.s_ctrl		= jpu_s_ctrl,
896 };
897 
898 static int jpu_streamon(struct file *file, void *priv, enum v4l2_buf_type type)
899 {
900 	struct jpu_ctx *ctx = fh_to_ctx(priv);
901 	struct jpu_q_data *src_q_data, *dst_q_data, *orig, adj, *ref;
902 	enum v4l2_buf_type adj_type;
903 
904 	src_q_data = jpu_get_q_data(ctx, V4L2_BUF_TYPE_VIDEO_OUTPUT_MPLANE);
905 	dst_q_data = jpu_get_q_data(ctx, V4L2_BUF_TYPE_VIDEO_CAPTURE_MPLANE);
906 
907 	if (ctx->encoder) {
908 		adj = *src_q_data;
909 		orig = src_q_data;
910 		ref = dst_q_data;
911 		adj_type = V4L2_BUF_TYPE_VIDEO_OUTPUT_MPLANE;
912 	} else {
913 		adj = *dst_q_data;
914 		orig = dst_q_data;
915 		ref = src_q_data;
916 		adj_type = V4L2_BUF_TYPE_VIDEO_CAPTURE_MPLANE;
917 	}
918 
919 	adj.format.width = ref->format.width;
920 	adj.format.height = ref->format.height;
921 
922 	__jpu_try_fmt(ctx, NULL, &adj.format, adj_type);
923 
924 	if (adj.format.width != orig->format.width ||
925 	    adj.format.height != orig->format.height) {
926 		dev_err(ctx->jpu->dev, "src and dst formats do not match.\n");
927 		/* maybe we can return -EPIPE here? */
928 		return -EINVAL;
929 	}
930 
931 	return v4l2_m2m_streamon(file, ctx->fh.m2m_ctx, type);
932 }
933 
934 static const struct v4l2_ioctl_ops jpu_ioctl_ops = {
935 	.vidioc_querycap		= jpu_querycap,
936 
937 	.vidioc_enum_fmt_vid_cap	= jpu_enum_fmt_cap,
938 	.vidioc_enum_fmt_vid_out	= jpu_enum_fmt_out,
939 	.vidioc_g_fmt_vid_cap_mplane	= jpu_g_fmt,
940 	.vidioc_g_fmt_vid_out_mplane	= jpu_g_fmt,
941 	.vidioc_try_fmt_vid_cap_mplane	= jpu_try_fmt,
942 	.vidioc_try_fmt_vid_out_mplane	= jpu_try_fmt,
943 	.vidioc_s_fmt_vid_cap_mplane	= jpu_s_fmt,
944 	.vidioc_s_fmt_vid_out_mplane	= jpu_s_fmt,
945 
946 	.vidioc_reqbufs			= v4l2_m2m_ioctl_reqbufs,
947 	.vidioc_create_bufs             = v4l2_m2m_ioctl_create_bufs,
948 	.vidioc_querybuf		= v4l2_m2m_ioctl_querybuf,
949 	.vidioc_qbuf			= v4l2_m2m_ioctl_qbuf,
950 	.vidioc_dqbuf			= v4l2_m2m_ioctl_dqbuf,
951 	.vidioc_expbuf			= v4l2_m2m_ioctl_expbuf,
952 
953 	.vidioc_streamon		= jpu_streamon,
954 	.vidioc_streamoff		= v4l2_m2m_ioctl_streamoff,
955 
956 	.vidioc_subscribe_event		= v4l2_ctrl_subscribe_event,
957 	.vidioc_unsubscribe_event	= v4l2_event_unsubscribe
958 };
959 
960 static int jpu_controls_create(struct jpu_ctx *ctx)
961 {
962 	struct v4l2_ctrl *ctrl;
963 	int ret;
964 
965 	v4l2_ctrl_handler_init(&ctx->ctrl_handler, 1);
966 
967 	ctrl = v4l2_ctrl_new_std(&ctx->ctrl_handler, &jpu_ctrl_ops,
968 				 V4L2_CID_JPEG_COMPRESSION_QUALITY,
969 				 0, JPU_MAX_QUALITY - 1, 1, 0);
970 
971 	if (ctx->ctrl_handler.error) {
972 		ret = ctx->ctrl_handler.error;
973 		goto error_free;
974 	}
975 
976 	if (!ctx->encoder)
977 		ctrl->flags |= V4L2_CTRL_FLAG_VOLATILE |
978 				V4L2_CTRL_FLAG_READ_ONLY;
979 
980 	ret = v4l2_ctrl_handler_setup(&ctx->ctrl_handler);
981 	if (ret < 0)
982 		goto error_free;
983 
984 	return 0;
985 
986 error_free:
987 	v4l2_ctrl_handler_free(&ctx->ctrl_handler);
988 	return ret;
989 }
990 
991 /*
992  * ============================================================================
993  * Queue operations
994  * ============================================================================
995  */
996 static int jpu_queue_setup(struct vb2_queue *vq,
997 			   unsigned int *nbuffers, unsigned int *nplanes,
998 			   unsigned int sizes[], struct device *alloc_devs[])
999 {
1000 	struct jpu_ctx *ctx = vb2_get_drv_priv(vq);
1001 	struct jpu_q_data *q_data;
1002 	unsigned int i;
1003 
1004 	q_data = jpu_get_q_data(ctx, vq->type);
1005 
1006 	if (*nplanes) {
1007 		if (*nplanes != q_data->format.num_planes)
1008 			return -EINVAL;
1009 
1010 		for (i = 0; i < *nplanes; i++) {
1011 			unsigned int q_size = q_data->format.plane_fmt[i].sizeimage;
1012 
1013 			if (sizes[i] < q_size)
1014 				return -EINVAL;
1015 		}
1016 		return 0;
1017 	}
1018 
1019 	*nplanes = q_data->format.num_planes;
1020 
1021 	for (i = 0; i < *nplanes; i++)
1022 		sizes[i] = q_data->format.plane_fmt[i].sizeimage;
1023 
1024 	return 0;
1025 }
1026 
1027 static int jpu_buf_prepare(struct vb2_buffer *vb)
1028 {
1029 	struct vb2_v4l2_buffer *vbuf = to_vb2_v4l2_buffer(vb);
1030 	struct jpu_ctx *ctx = vb2_get_drv_priv(vb->vb2_queue);
1031 	struct jpu_q_data *q_data;
1032 	unsigned int i;
1033 
1034 	q_data = jpu_get_q_data(ctx, vb->vb2_queue->type);
1035 
1036 	if (V4L2_TYPE_IS_OUTPUT(vb->vb2_queue->type)) {
1037 		if (vbuf->field == V4L2_FIELD_ANY)
1038 			vbuf->field = V4L2_FIELD_NONE;
1039 		if (vbuf->field != V4L2_FIELD_NONE) {
1040 			dev_err(ctx->jpu->dev, "%s field isn't supported\n",
1041 					__func__);
1042 			return -EINVAL;
1043 		}
1044 	}
1045 
1046 	for (i = 0; i < q_data->format.num_planes; i++) {
1047 		unsigned long size = q_data->format.plane_fmt[i].sizeimage;
1048 
1049 		if (vb2_plane_size(vb, i) < size) {
1050 			dev_err(ctx->jpu->dev,
1051 				"%s: data will not fit into plane (%lu < %lu)\n",
1052 			       __func__, vb2_plane_size(vb, i), size);
1053 			return -EINVAL;
1054 		}
1055 
1056 		/* decoder capture queue */
1057 		if (!ctx->encoder && V4L2_TYPE_IS_CAPTURE(vb->vb2_queue->type))
1058 			vb2_set_plane_payload(vb, i, size);
1059 	}
1060 
1061 	return 0;
1062 }
1063 
1064 static void jpu_buf_queue(struct vb2_buffer *vb)
1065 {
1066 	struct vb2_v4l2_buffer *vbuf = to_vb2_v4l2_buffer(vb);
1067 	struct jpu_ctx *ctx = vb2_get_drv_priv(vb->vb2_queue);
1068 
1069 	if (!ctx->encoder && V4L2_TYPE_IS_OUTPUT(vb->vb2_queue->type)) {
1070 		struct jpu_buffer *jpu_buf = vb2_to_jpu_buffer(vbuf);
1071 		struct jpu_q_data *q_data, adjust;
1072 		void *buffer = vb2_plane_vaddr(vb, 0);
1073 		unsigned long buf_size = vb2_get_plane_payload(vb, 0);
1074 		unsigned int width, height;
1075 
1076 		u8 subsampling = jpu_parse_hdr(buffer, buf_size, &width,
1077 						 &height);
1078 
1079 		/* check if JPEG data basic parsing was successful */
1080 		if (subsampling != JPU_JPEG_422 && subsampling != JPU_JPEG_420)
1081 			goto format_error;
1082 
1083 		q_data = &ctx->out_q;
1084 
1085 		adjust = *q_data;
1086 		adjust.format.width = width;
1087 		adjust.format.height = height;
1088 
1089 		__jpu_try_fmt(ctx, &adjust.fmtinfo, &adjust.format,
1090 			      V4L2_BUF_TYPE_VIDEO_OUTPUT_MPLANE);
1091 
1092 		if (adjust.format.width != q_data->format.width ||
1093 		    adjust.format.height != q_data->format.height)
1094 			goto format_error;
1095 
1096 		/*
1097 		 * keep subsampling in buffer to check it
1098 		 * for compatibility in device_run
1099 		 */
1100 		jpu_buf->subsampling = subsampling;
1101 	}
1102 
1103 	if (ctx->fh.m2m_ctx)
1104 		v4l2_m2m_buf_queue(ctx->fh.m2m_ctx, vbuf);
1105 
1106 	return;
1107 
1108 format_error:
1109 	dev_err(ctx->jpu->dev, "incompatible or corrupted JPEG data\n");
1110 	vb2_buffer_done(vb, VB2_BUF_STATE_ERROR);
1111 }
1112 
1113 static void jpu_buf_finish(struct vb2_buffer *vb)
1114 {
1115 	struct vb2_v4l2_buffer *vbuf = to_vb2_v4l2_buffer(vb);
1116 	struct jpu_buffer *jpu_buf = vb2_to_jpu_buffer(vbuf);
1117 	struct jpu_ctx *ctx = vb2_get_drv_priv(vb->vb2_queue);
1118 	struct jpu_q_data *q_data = &ctx->out_q;
1119 	enum v4l2_buf_type type = vb->vb2_queue->type;
1120 	u8 *buffer;
1121 
1122 	if (vb->state == VB2_BUF_STATE_DONE)
1123 		vbuf->sequence = jpu_get_q_data(ctx, type)->sequence++;
1124 
1125 	if (!ctx->encoder || vb->state != VB2_BUF_STATE_DONE ||
1126 	    V4L2_TYPE_IS_OUTPUT(type))
1127 		return;
1128 
1129 	buffer = vb2_plane_vaddr(vb, 0);
1130 
1131 	memcpy(buffer, jpeg_hdrs[jpu_buf->compr_quality], JPU_JPEG_HDR_SIZE);
1132 	*(__be16 *)(buffer + JPU_JPEG_HEIGHT_OFFSET) =
1133 					cpu_to_be16(q_data->format.height);
1134 	*(__be16 *)(buffer + JPU_JPEG_WIDTH_OFFSET) =
1135 					cpu_to_be16(q_data->format.width);
1136 	*(buffer + JPU_JPEG_SUBS_OFFSET) = q_data->fmtinfo->subsampling;
1137 }
1138 
1139 static int jpu_start_streaming(struct vb2_queue *vq, unsigned count)
1140 {
1141 	struct jpu_ctx *ctx = vb2_get_drv_priv(vq);
1142 	struct jpu_q_data *q_data = jpu_get_q_data(ctx, vq->type);
1143 
1144 	q_data->sequence = 0;
1145 	return 0;
1146 }
1147 
1148 static void jpu_stop_streaming(struct vb2_queue *vq)
1149 {
1150 	struct jpu_ctx *ctx = vb2_get_drv_priv(vq);
1151 	struct vb2_v4l2_buffer *vb;
1152 	unsigned long flags;
1153 
1154 	for (;;) {
1155 		if (V4L2_TYPE_IS_OUTPUT(vq->type))
1156 			vb = v4l2_m2m_src_buf_remove(ctx->fh.m2m_ctx);
1157 		else
1158 			vb = v4l2_m2m_dst_buf_remove(ctx->fh.m2m_ctx);
1159 		if (vb == NULL)
1160 			return;
1161 		spin_lock_irqsave(&ctx->jpu->lock, flags);
1162 		v4l2_m2m_buf_done(vb, VB2_BUF_STATE_ERROR);
1163 		spin_unlock_irqrestore(&ctx->jpu->lock, flags);
1164 	}
1165 }
1166 
1167 static const struct vb2_ops jpu_qops = {
1168 	.queue_setup		= jpu_queue_setup,
1169 	.buf_prepare		= jpu_buf_prepare,
1170 	.buf_queue		= jpu_buf_queue,
1171 	.buf_finish		= jpu_buf_finish,
1172 	.start_streaming	= jpu_start_streaming,
1173 	.stop_streaming		= jpu_stop_streaming,
1174 };
1175 
1176 static int jpu_queue_init(void *priv, struct vb2_queue *src_vq,
1177 			  struct vb2_queue *dst_vq)
1178 {
1179 	struct jpu_ctx *ctx = priv;
1180 	int ret;
1181 
1182 	memset(src_vq, 0, sizeof(*src_vq));
1183 	src_vq->type = V4L2_BUF_TYPE_VIDEO_OUTPUT_MPLANE;
1184 	src_vq->io_modes = VB2_MMAP | VB2_DMABUF;
1185 	src_vq->drv_priv = ctx;
1186 	src_vq->buf_struct_size = sizeof(struct jpu_buffer);
1187 	src_vq->ops = &jpu_qops;
1188 	src_vq->mem_ops = &vb2_dma_contig_memops;
1189 	src_vq->timestamp_flags = V4L2_BUF_FLAG_TIMESTAMP_COPY;
1190 	src_vq->lock = &ctx->jpu->mutex;
1191 	src_vq->dev = ctx->jpu->v4l2_dev.dev;
1192 
1193 	ret = vb2_queue_init(src_vq);
1194 	if (ret)
1195 		return ret;
1196 
1197 	memset(dst_vq, 0, sizeof(*dst_vq));
1198 	dst_vq->type = V4L2_BUF_TYPE_VIDEO_CAPTURE_MPLANE;
1199 	dst_vq->io_modes = VB2_MMAP | VB2_DMABUF;
1200 	dst_vq->drv_priv = ctx;
1201 	dst_vq->buf_struct_size = sizeof(struct jpu_buffer);
1202 	dst_vq->ops = &jpu_qops;
1203 	dst_vq->mem_ops = &vb2_dma_contig_memops;
1204 	dst_vq->timestamp_flags = V4L2_BUF_FLAG_TIMESTAMP_COPY;
1205 	dst_vq->lock = &ctx->jpu->mutex;
1206 	dst_vq->dev = ctx->jpu->v4l2_dev.dev;
1207 
1208 	return vb2_queue_init(dst_vq);
1209 }
1210 
1211 /*
1212  * ============================================================================
1213  * Device file operations
1214  * ============================================================================
1215  */
1216 static int jpu_open(struct file *file)
1217 {
1218 	struct jpu *jpu = video_drvdata(file);
1219 	struct video_device *vfd = video_devdata(file);
1220 	struct jpu_ctx *ctx;
1221 	int ret;
1222 
1223 	ctx = kzalloc(sizeof(*ctx), GFP_KERNEL);
1224 	if (!ctx)
1225 		return -ENOMEM;
1226 
1227 	v4l2_fh_init(&ctx->fh, vfd);
1228 	ctx->fh.ctrl_handler = &ctx->ctrl_handler;
1229 	file->private_data = &ctx->fh;
1230 	v4l2_fh_add(&ctx->fh);
1231 
1232 	ctx->jpu = jpu;
1233 	ctx->encoder = vfd == &jpu->vfd_encoder;
1234 
1235 	__jpu_try_fmt(ctx, &ctx->out_q.fmtinfo, &ctx->out_q.format,
1236 		      V4L2_BUF_TYPE_VIDEO_OUTPUT_MPLANE);
1237 	__jpu_try_fmt(ctx, &ctx->cap_q.fmtinfo, &ctx->cap_q.format,
1238 		      V4L2_BUF_TYPE_VIDEO_CAPTURE_MPLANE);
1239 
1240 	ctx->fh.m2m_ctx = v4l2_m2m_ctx_init(jpu->m2m_dev, ctx, jpu_queue_init);
1241 	if (IS_ERR(ctx->fh.m2m_ctx)) {
1242 		ret = PTR_ERR(ctx->fh.m2m_ctx);
1243 		goto v4l_prepare_rollback;
1244 	}
1245 
1246 	ret = jpu_controls_create(ctx);
1247 	if (ret < 0)
1248 		goto v4l_prepare_rollback;
1249 
1250 	if (mutex_lock_interruptible(&jpu->mutex)) {
1251 		ret = -ERESTARTSYS;
1252 		goto v4l_prepare_rollback;
1253 	}
1254 
1255 	if (jpu->ref_count == 0) {
1256 		ret = clk_prepare_enable(jpu->clk);
1257 		if (ret < 0)
1258 			goto device_prepare_rollback;
1259 		/* ...issue software reset */
1260 		ret = jpu_reset(jpu);
1261 		if (ret)
1262 			goto jpu_reset_rollback;
1263 	}
1264 
1265 	jpu->ref_count++;
1266 
1267 	mutex_unlock(&jpu->mutex);
1268 	return 0;
1269 
1270 jpu_reset_rollback:
1271 	clk_disable_unprepare(jpu->clk);
1272 device_prepare_rollback:
1273 	mutex_unlock(&jpu->mutex);
1274 v4l_prepare_rollback:
1275 	v4l2_fh_del(&ctx->fh);
1276 	v4l2_fh_exit(&ctx->fh);
1277 	kfree(ctx);
1278 	return ret;
1279 }
1280 
1281 static int jpu_release(struct file *file)
1282 {
1283 	struct jpu *jpu = video_drvdata(file);
1284 	struct jpu_ctx *ctx = fh_to_ctx(file->private_data);
1285 
1286 	v4l2_m2m_ctx_release(ctx->fh.m2m_ctx);
1287 	v4l2_ctrl_handler_free(&ctx->ctrl_handler);
1288 	v4l2_fh_del(&ctx->fh);
1289 	v4l2_fh_exit(&ctx->fh);
1290 	kfree(ctx);
1291 
1292 	mutex_lock(&jpu->mutex);
1293 	if (--jpu->ref_count == 0)
1294 		clk_disable_unprepare(jpu->clk);
1295 	mutex_unlock(&jpu->mutex);
1296 
1297 	return 0;
1298 }
1299 
1300 static const struct v4l2_file_operations jpu_fops = {
1301 	.owner		= THIS_MODULE,
1302 	.open		= jpu_open,
1303 	.release	= jpu_release,
1304 	.unlocked_ioctl	= video_ioctl2,
1305 	.poll		= v4l2_m2m_fop_poll,
1306 	.mmap		= v4l2_m2m_fop_mmap,
1307 };
1308 
1309 /*
1310  * ============================================================================
1311  * mem2mem callbacks
1312  * ============================================================================
1313  */
1314 static void jpu_cleanup(struct jpu_ctx *ctx, bool reset)
1315 {
1316 	/* remove current buffers and finish job */
1317 	struct vb2_v4l2_buffer *src_buf, *dst_buf;
1318 	unsigned long flags;
1319 
1320 	spin_lock_irqsave(&ctx->jpu->lock, flags);
1321 
1322 	src_buf = v4l2_m2m_src_buf_remove(ctx->fh.m2m_ctx);
1323 	dst_buf = v4l2_m2m_dst_buf_remove(ctx->fh.m2m_ctx);
1324 
1325 	v4l2_m2m_buf_done(src_buf, VB2_BUF_STATE_ERROR);
1326 	v4l2_m2m_buf_done(dst_buf, VB2_BUF_STATE_ERROR);
1327 
1328 	/* ...and give it a chance on next run */
1329 	if (reset)
1330 		jpu_write(ctx->jpu, JCCMD_SRST, JCCMD);
1331 
1332 	spin_unlock_irqrestore(&ctx->jpu->lock, flags);
1333 
1334 	v4l2_m2m_job_finish(ctx->jpu->m2m_dev, ctx->fh.m2m_ctx);
1335 }
1336 
1337 static void jpu_device_run(void *priv)
1338 {
1339 	struct jpu_ctx *ctx = priv;
1340 	struct jpu *jpu = ctx->jpu;
1341 	struct jpu_buffer *jpu_buf;
1342 	struct jpu_q_data *q_data;
1343 	struct vb2_v4l2_buffer *src_buf, *dst_buf;
1344 	unsigned int w, h, bpl;
1345 	unsigned char num_planes, subsampling;
1346 	unsigned long flags;
1347 
1348 	/* ...wait until module reset completes; we have mutex locked here */
1349 	if (jpu_wait_reset(jpu)) {
1350 		jpu_cleanup(ctx, true);
1351 		return;
1352 	}
1353 
1354 	spin_lock_irqsave(&ctx->jpu->lock, flags);
1355 
1356 	jpu->curr = ctx;
1357 
1358 	src_buf = v4l2_m2m_next_src_buf(ctx->fh.m2m_ctx);
1359 	dst_buf = v4l2_m2m_next_dst_buf(ctx->fh.m2m_ctx);
1360 
1361 	if (ctx->encoder) {
1362 		jpu_buf = vb2_to_jpu_buffer(dst_buf);
1363 		q_data = &ctx->out_q;
1364 	} else {
1365 		jpu_buf = vb2_to_jpu_buffer(src_buf);
1366 		q_data = &ctx->cap_q;
1367 	}
1368 
1369 	w = q_data->format.width;
1370 	h = q_data->format.height;
1371 	bpl = q_data->format.plane_fmt[0].bytesperline;
1372 	num_planes = q_data->fmtinfo->num_planes;
1373 	subsampling = q_data->fmtinfo->subsampling;
1374 
1375 	if (ctx->encoder) {
1376 		unsigned long src_1_addr, src_2_addr, dst_addr;
1377 		unsigned int redu, inft;
1378 
1379 		dst_addr = vb2_dma_contig_plane_dma_addr(&dst_buf->vb2_buf, 0);
1380 		src_1_addr =
1381 			vb2_dma_contig_plane_dma_addr(&src_buf->vb2_buf, 0);
1382 		if (num_planes > 1)
1383 			src_2_addr = vb2_dma_contig_plane_dma_addr(
1384 					&src_buf->vb2_buf, 1);
1385 		else
1386 			src_2_addr = src_1_addr + w * h;
1387 
1388 		jpu_buf->compr_quality = ctx->compr_quality;
1389 
1390 		if (subsampling == JPU_JPEG_420) {
1391 			redu = JCMOD_REDU_420;
1392 			inft = JIFECNT_INFT_420;
1393 		} else {
1394 			redu = JCMOD_REDU_422;
1395 			inft = JIFECNT_INFT_422;
1396 		}
1397 
1398 		/* only no marker mode works for encoding */
1399 		jpu_write(jpu, JCMOD_DSP_ENC | JCMOD_PCTR | redu |
1400 			  JCMOD_MSKIP_ENABLE, JCMOD);
1401 
1402 		jpu_write(jpu, JIFECNT_SWAP_WB | inft, JIFECNT);
1403 		jpu_write(jpu, JIFDCNT_SWAP_WB, JIFDCNT);
1404 		jpu_write(jpu, JINTE_TRANSF_COMPL, JINTE);
1405 
1406 		/* Y and C components source addresses */
1407 		jpu_write(jpu, src_1_addr, JIFESYA1);
1408 		jpu_write(jpu, src_2_addr, JIFESCA1);
1409 
1410 		/* memory width */
1411 		jpu_write(jpu, bpl, JIFESMW);
1412 
1413 		jpu_write(jpu, (w >> 8) & JCSZ_MASK, JCHSZU);
1414 		jpu_write(jpu, w & JCSZ_MASK, JCHSZD);
1415 
1416 		jpu_write(jpu, (h >> 8) & JCSZ_MASK, JCVSZU);
1417 		jpu_write(jpu, h & JCSZ_MASK, JCVSZD);
1418 
1419 		jpu_write(jpu, w, JIFESHSZ);
1420 		jpu_write(jpu, h, JIFESVSZ);
1421 
1422 		jpu_write(jpu, dst_addr + JPU_JPEG_HDR_SIZE, JIFEDA1);
1423 
1424 		jpu_write(jpu, 0 << JCQTN_SHIFT(1) | 1 << JCQTN_SHIFT(2) |
1425 			  1 << JCQTN_SHIFT(3), JCQTN);
1426 
1427 		jpu_write(jpu, 0 << JCHTN_AC_SHIFT(1) | 0 << JCHTN_DC_SHIFT(1) |
1428 			  1 << JCHTN_AC_SHIFT(2) | 1 << JCHTN_DC_SHIFT(2) |
1429 			  1 << JCHTN_AC_SHIFT(3) | 1 << JCHTN_DC_SHIFT(3),
1430 			  JCHTN);
1431 
1432 		jpu_set_qtbl(jpu, ctx->compr_quality);
1433 		jpu_set_htbl(jpu);
1434 	} else {
1435 		unsigned long src_addr, dst_1_addr, dst_2_addr;
1436 
1437 		if (jpu_buf->subsampling != subsampling) {
1438 			dev_err(ctx->jpu->dev,
1439 				"src and dst formats do not match.\n");
1440 			spin_unlock_irqrestore(&ctx->jpu->lock, flags);
1441 			jpu_cleanup(ctx, false);
1442 			return;
1443 		}
1444 
1445 		src_addr = vb2_dma_contig_plane_dma_addr(&src_buf->vb2_buf, 0);
1446 		dst_1_addr =
1447 			vb2_dma_contig_plane_dma_addr(&dst_buf->vb2_buf, 0);
1448 		if (q_data->fmtinfo->num_planes > 1)
1449 			dst_2_addr = vb2_dma_contig_plane_dma_addr(
1450 					&dst_buf->vb2_buf, 1);
1451 		else
1452 			dst_2_addr = dst_1_addr + w * h;
1453 
1454 		/* ...set up decoder operation */
1455 		jpu_write(jpu, JCMOD_DSP_DEC | JCMOD_PCTR, JCMOD);
1456 		jpu_write(jpu, JIFECNT_SWAP_WB, JIFECNT);
1457 		jpu_write(jpu, JIFDCNT_SWAP_WB, JIFDCNT);
1458 
1459 		/* ...enable interrupts on transfer completion and d-g error */
1460 		jpu_write(jpu, JINTE_TRANSF_COMPL | JINTE_ERR, JINTE);
1461 
1462 		/* ...set source/destination addresses of encoded data */
1463 		jpu_write(jpu, src_addr, JIFDSA1);
1464 		jpu_write(jpu, dst_1_addr, JIFDDYA1);
1465 		jpu_write(jpu, dst_2_addr, JIFDDCA1);
1466 
1467 		jpu_write(jpu, bpl, JIFDDMW);
1468 	}
1469 
1470 	/* ...start encoder/decoder operation */
1471 	jpu_write(jpu, JCCMD_JSRT, JCCMD);
1472 
1473 	spin_unlock_irqrestore(&ctx->jpu->lock, flags);
1474 }
1475 
1476 static const struct v4l2_m2m_ops jpu_m2m_ops = {
1477 	.device_run	= jpu_device_run,
1478 };
1479 
1480 /*
1481  * ============================================================================
1482  * IRQ handler
1483  * ============================================================================
1484  */
1485 static irqreturn_t jpu_irq_handler(int irq, void *dev_id)
1486 {
1487 	struct jpu *jpu = dev_id;
1488 	struct jpu_ctx *curr_ctx;
1489 	struct vb2_v4l2_buffer *src_buf, *dst_buf;
1490 	unsigned int int_status;
1491 
1492 	int_status = jpu_read(jpu, JINTS);
1493 
1494 	/* ...spurious interrupt */
1495 	if (!((JINTS_TRANSF_COMPL | JINTS_PROCESS_COMPL | JINTS_ERR) &
1496 	    int_status))
1497 		return IRQ_NONE;
1498 
1499 	/* ...clear interrupts */
1500 	jpu_write(jpu, ~(int_status & JINTS_MASK), JINTS);
1501 	if (int_status & (JINTS_ERR | JINTS_PROCESS_COMPL))
1502 		jpu_write(jpu, JCCMD_JEND, JCCMD);
1503 
1504 	spin_lock(&jpu->lock);
1505 
1506 	if ((int_status & JINTS_PROCESS_COMPL) &&
1507 	   !(int_status & JINTS_TRANSF_COMPL))
1508 		goto handled;
1509 
1510 	curr_ctx = v4l2_m2m_get_curr_priv(jpu->m2m_dev);
1511 	if (!curr_ctx) {
1512 		/* ...instance is not running */
1513 		dev_err(jpu->dev, "no active context for m2m\n");
1514 		goto handled;
1515 	}
1516 
1517 	src_buf = v4l2_m2m_src_buf_remove(curr_ctx->fh.m2m_ctx);
1518 	dst_buf = v4l2_m2m_dst_buf_remove(curr_ctx->fh.m2m_ctx);
1519 
1520 	if (int_status & JINTS_TRANSF_COMPL) {
1521 		if (curr_ctx->encoder) {
1522 			unsigned long payload_size = jpu_read(jpu, JCDTCU) << 16
1523 						   | jpu_read(jpu, JCDTCM) << 8
1524 						   | jpu_read(jpu, JCDTCD);
1525 			vb2_set_plane_payload(&dst_buf->vb2_buf, 0,
1526 				payload_size + JPU_JPEG_HDR_SIZE);
1527 		}
1528 
1529 		dst_buf->field = src_buf->field;
1530 		dst_buf->vb2_buf.timestamp = src_buf->vb2_buf.timestamp;
1531 		if (src_buf->flags & V4L2_BUF_FLAG_TIMECODE)
1532 			dst_buf->timecode = src_buf->timecode;
1533 		dst_buf->flags = src_buf->flags &
1534 			(V4L2_BUF_FLAG_TIMECODE | V4L2_BUF_FLAG_KEYFRAME |
1535 			 V4L2_BUF_FLAG_PFRAME | V4L2_BUF_FLAG_BFRAME |
1536 			 V4L2_BUF_FLAG_TSTAMP_SRC_MASK);
1537 
1538 		v4l2_m2m_buf_done(src_buf, VB2_BUF_STATE_DONE);
1539 		v4l2_m2m_buf_done(dst_buf, VB2_BUF_STATE_DONE);
1540 	} else if (int_status & JINTS_ERR) {
1541 		unsigned char error = jpu_read(jpu, JCDERR) & JCDERR_MASK;
1542 
1543 		dev_dbg(jpu->dev, "processing error: %#X: %s\n", error,
1544 			error_to_text[error]);
1545 
1546 		v4l2_m2m_buf_done(src_buf, VB2_BUF_STATE_ERROR);
1547 		v4l2_m2m_buf_done(dst_buf, VB2_BUF_STATE_ERROR);
1548 	}
1549 
1550 	jpu->curr = NULL;
1551 
1552 	/* ...reset JPU after completion */
1553 	jpu_write(jpu, JCCMD_SRST, JCCMD);
1554 	spin_unlock(&jpu->lock);
1555 
1556 	v4l2_m2m_job_finish(jpu->m2m_dev, curr_ctx->fh.m2m_ctx);
1557 
1558 	return IRQ_HANDLED;
1559 
1560 handled:
1561 	spin_unlock(&jpu->lock);
1562 	return IRQ_HANDLED;
1563 }
1564 
1565 /*
1566  * ============================================================================
1567  * Driver basic infrastructure
1568  * ============================================================================
1569  */
1570 static const struct of_device_id jpu_dt_ids[] = {
1571 	{ .compatible = "renesas,jpu-r8a7790" }, /* H2 */
1572 	{ .compatible = "renesas,jpu-r8a7791" }, /* M2-W */
1573 	{ .compatible = "renesas,jpu-r8a7792" }, /* V2H */
1574 	{ .compatible = "renesas,jpu-r8a7793" }, /* M2-N */
1575 	{ .compatible = "renesas,rcar-gen2-jpu" },
1576 	{ },
1577 };
1578 MODULE_DEVICE_TABLE(of, jpu_dt_ids);
1579 
1580 static int jpu_probe(struct platform_device *pdev)
1581 {
1582 	struct jpu *jpu;
1583 	int ret;
1584 	unsigned int i;
1585 
1586 	jpu = devm_kzalloc(&pdev->dev, sizeof(*jpu), GFP_KERNEL);
1587 	if (!jpu)
1588 		return -ENOMEM;
1589 
1590 	mutex_init(&jpu->mutex);
1591 	spin_lock_init(&jpu->lock);
1592 	jpu->dev = &pdev->dev;
1593 
1594 	/* memory-mapped registers */
1595 	jpu->regs = devm_platform_ioremap_resource(pdev, 0);
1596 	if (IS_ERR(jpu->regs))
1597 		return PTR_ERR(jpu->regs);
1598 
1599 	/* interrupt service routine registration */
1600 	jpu->irq = ret = platform_get_irq(pdev, 0);
1601 	if (ret < 0)
1602 		return ret;
1603 
1604 	ret = devm_request_irq(&pdev->dev, jpu->irq, jpu_irq_handler, 0,
1605 			       dev_name(&pdev->dev), jpu);
1606 	if (ret) {
1607 		dev_err(&pdev->dev, "cannot claim IRQ %d\n", jpu->irq);
1608 		return ret;
1609 	}
1610 
1611 	/* clocks */
1612 	jpu->clk = devm_clk_get(&pdev->dev, NULL);
1613 	if (IS_ERR(jpu->clk)) {
1614 		dev_err(&pdev->dev, "cannot get clock\n");
1615 		return PTR_ERR(jpu->clk);
1616 	}
1617 
1618 	/* v4l2 device */
1619 	ret = v4l2_device_register(&pdev->dev, &jpu->v4l2_dev);
1620 	if (ret) {
1621 		dev_err(&pdev->dev, "Failed to register v4l2 device\n");
1622 		return ret;
1623 	}
1624 
1625 	/* mem2mem device */
1626 	jpu->m2m_dev = v4l2_m2m_init(&jpu_m2m_ops);
1627 	if (IS_ERR(jpu->m2m_dev)) {
1628 		v4l2_err(&jpu->v4l2_dev, "Failed to init mem2mem device\n");
1629 		ret = PTR_ERR(jpu->m2m_dev);
1630 		goto device_register_rollback;
1631 	}
1632 
1633 	/* fill in quantization and Huffman tables for encoder */
1634 	for (i = 0; i < JPU_MAX_QUALITY; i++)
1635 		jpu_generate_hdr(i, (unsigned char *)jpeg_hdrs[i]);
1636 
1637 	strscpy(jpu->vfd_encoder.name, DRV_NAME, sizeof(jpu->vfd_encoder.name));
1638 	jpu->vfd_encoder.fops		= &jpu_fops;
1639 	jpu->vfd_encoder.ioctl_ops	= &jpu_ioctl_ops;
1640 	jpu->vfd_encoder.minor		= -1;
1641 	jpu->vfd_encoder.release	= video_device_release_empty;
1642 	jpu->vfd_encoder.lock		= &jpu->mutex;
1643 	jpu->vfd_encoder.v4l2_dev	= &jpu->v4l2_dev;
1644 	jpu->vfd_encoder.vfl_dir	= VFL_DIR_M2M;
1645 	jpu->vfd_encoder.device_caps	= V4L2_CAP_STREAMING |
1646 					  V4L2_CAP_VIDEO_M2M_MPLANE;
1647 
1648 	ret = video_register_device(&jpu->vfd_encoder, VFL_TYPE_VIDEO, -1);
1649 	if (ret) {
1650 		v4l2_err(&jpu->v4l2_dev, "Failed to register video device\n");
1651 		goto m2m_init_rollback;
1652 	}
1653 
1654 	video_set_drvdata(&jpu->vfd_encoder, jpu);
1655 
1656 	strscpy(jpu->vfd_decoder.name, DRV_NAME, sizeof(jpu->vfd_decoder.name));
1657 	jpu->vfd_decoder.fops		= &jpu_fops;
1658 	jpu->vfd_decoder.ioctl_ops	= &jpu_ioctl_ops;
1659 	jpu->vfd_decoder.minor		= -1;
1660 	jpu->vfd_decoder.release	= video_device_release_empty;
1661 	jpu->vfd_decoder.lock		= &jpu->mutex;
1662 	jpu->vfd_decoder.v4l2_dev	= &jpu->v4l2_dev;
1663 	jpu->vfd_decoder.vfl_dir	= VFL_DIR_M2M;
1664 	jpu->vfd_decoder.device_caps	= V4L2_CAP_STREAMING |
1665 					  V4L2_CAP_VIDEO_M2M_MPLANE;
1666 
1667 	ret = video_register_device(&jpu->vfd_decoder, VFL_TYPE_VIDEO, -1);
1668 	if (ret) {
1669 		v4l2_err(&jpu->v4l2_dev, "Failed to register video device\n");
1670 		goto enc_vdev_register_rollback;
1671 	}
1672 
1673 	video_set_drvdata(&jpu->vfd_decoder, jpu);
1674 	platform_set_drvdata(pdev, jpu);
1675 
1676 	v4l2_info(&jpu->v4l2_dev, "encoder device registered as /dev/video%d\n",
1677 		  jpu->vfd_encoder.num);
1678 	v4l2_info(&jpu->v4l2_dev, "decoder device registered as /dev/video%d\n",
1679 		  jpu->vfd_decoder.num);
1680 
1681 	return 0;
1682 
1683 enc_vdev_register_rollback:
1684 	video_unregister_device(&jpu->vfd_encoder);
1685 
1686 m2m_init_rollback:
1687 	v4l2_m2m_release(jpu->m2m_dev);
1688 
1689 device_register_rollback:
1690 	v4l2_device_unregister(&jpu->v4l2_dev);
1691 
1692 	return ret;
1693 }
1694 
1695 static void jpu_remove(struct platform_device *pdev)
1696 {
1697 	struct jpu *jpu = platform_get_drvdata(pdev);
1698 
1699 	video_unregister_device(&jpu->vfd_decoder);
1700 	video_unregister_device(&jpu->vfd_encoder);
1701 	v4l2_m2m_release(jpu->m2m_dev);
1702 	v4l2_device_unregister(&jpu->v4l2_dev);
1703 }
1704 
1705 #ifdef CONFIG_PM_SLEEP
1706 static int jpu_suspend(struct device *dev)
1707 {
1708 	struct jpu *jpu = dev_get_drvdata(dev);
1709 
1710 	if (jpu->ref_count == 0)
1711 		return 0;
1712 
1713 	clk_disable_unprepare(jpu->clk);
1714 
1715 	return 0;
1716 }
1717 
1718 static int jpu_resume(struct device *dev)
1719 {
1720 	struct jpu *jpu = dev_get_drvdata(dev);
1721 
1722 	if (jpu->ref_count == 0)
1723 		return 0;
1724 
1725 	clk_prepare_enable(jpu->clk);
1726 
1727 	return 0;
1728 }
1729 #endif
1730 
1731 static const struct dev_pm_ops jpu_pm_ops = {
1732 	SET_SYSTEM_SLEEP_PM_OPS(jpu_suspend, jpu_resume)
1733 };
1734 
1735 static struct platform_driver jpu_driver = {
1736 	.probe = jpu_probe,
1737 	.remove = jpu_remove,
1738 	.driver = {
1739 		.of_match_table = jpu_dt_ids,
1740 		.name = DRV_NAME,
1741 		.pm = &jpu_pm_ops,
1742 	},
1743 };
1744 
1745 module_platform_driver(jpu_driver);
1746 
1747 MODULE_ALIAS("platform:" DRV_NAME);
1748 MODULE_AUTHOR("Mikhail Ulianov <mikhail.ulyanov@cogentembedded.com>");
1749 MODULE_DESCRIPTION("Renesas R-Car JPEG processing unit driver");
1750 MODULE_LICENSE("GPL v2");
1751