1 // SPDX-License-Identifier: GPL-2.0+
2 /*
3 * Copyright (C) Collabora, Ltd.
4 *
5 * Based on GSPCA and CODA drivers:
6 * Copyright (C) Jean-Francois Moine (http://moinejf.free.fr)
7 * Copyright (C) 2014 Philipp Zabel, Pengutronix
8 */
9
10 #include <linux/align.h>
11 #include <linux/build_bug.h>
12 #include <linux/kernel.h>
13 #include <linux/string.h>
14 #include "hantro_jpeg.h"
15 #include "hantro.h"
16
17 #define LUMA_QUANT_OFF 25
18 #define CHROMA_QUANT_OFF 90
19 #define HEIGHT_OFF 159
20 #define WIDTH_OFF 161
21
22 #define HUFF_LUMA_DC_OFF 178
23 #define HUFF_LUMA_AC_OFF 211
24 #define HUFF_CHROMA_DC_OFF 394
25 #define HUFF_CHROMA_AC_OFF 427
26
27 /* Default tables from JPEG ITU-T.81
28 * (ISO/IEC 10918-1) Annex K, tables K.1 and K.2
29 */
30 static const unsigned char luma_q_table[] = {
31 0x10, 0x0b, 0x0a, 0x10, 0x18, 0x28, 0x33, 0x3d,
32 0x0c, 0x0c, 0x0e, 0x13, 0x1a, 0x3a, 0x3c, 0x37,
33 0x0e, 0x0d, 0x10, 0x18, 0x28, 0x39, 0x45, 0x38,
34 0x0e, 0x11, 0x16, 0x1d, 0x33, 0x57, 0x50, 0x3e,
35 0x12, 0x16, 0x25, 0x38, 0x44, 0x6d, 0x67, 0x4d,
36 0x18, 0x23, 0x37, 0x40, 0x51, 0x68, 0x71, 0x5c,
37 0x31, 0x40, 0x4e, 0x57, 0x67, 0x79, 0x78, 0x65,
38 0x48, 0x5c, 0x5f, 0x62, 0x70, 0x64, 0x67, 0x63
39 };
40
41 static const unsigned char chroma_q_table[] = {
42 0x11, 0x12, 0x18, 0x2f, 0x63, 0x63, 0x63, 0x63,
43 0x12, 0x15, 0x1a, 0x42, 0x63, 0x63, 0x63, 0x63,
44 0x18, 0x1a, 0x38, 0x63, 0x63, 0x63, 0x63, 0x63,
45 0x2f, 0x42, 0x63, 0x63, 0x63, 0x63, 0x63, 0x63,
46 0x63, 0x63, 0x63, 0x63, 0x63, 0x63, 0x63, 0x63,
47 0x63, 0x63, 0x63, 0x63, 0x63, 0x63, 0x63, 0x63,
48 0x63, 0x63, 0x63, 0x63, 0x63, 0x63, 0x63, 0x63,
49 0x63, 0x63, 0x63, 0x63, 0x63, 0x63, 0x63, 0x63
50 };
51
52 static const unsigned char zigzag[] = {
53 0, 1, 8, 16, 9, 2, 3, 10,
54 17, 24, 32, 25, 18, 11, 4, 5,
55 12, 19, 26, 33, 40, 48, 41, 34,
56 27, 20, 13, 6, 7, 14, 21, 28,
57 35, 42, 49, 56, 57, 50, 43, 36,
58 29, 22, 15, 23, 30, 37, 44, 51,
59 58, 59, 52, 45, 38, 31, 39, 46,
60 53, 60, 61, 54, 47, 55, 62, 63
61 };
62
63 static const u32 hw_reorder[] = {
64 0, 8, 16, 24, 1, 9, 17, 25,
65 32, 40, 48, 56, 33, 41, 49, 57,
66 2, 10, 18, 26, 3, 11, 19, 27,
67 34, 42, 50, 58, 35, 43, 51, 59,
68 4, 12, 20, 28, 5, 13, 21, 29,
69 36, 44, 52, 60, 37, 45, 53, 61,
70 6, 14, 22, 30, 7, 15, 23, 31,
71 38, 46, 54, 62, 39, 47, 55, 63
72 };
73
74 /* Huffman tables are shared with CODA */
75 static const unsigned char luma_dc_table[] = {
76 0x00, 0x01, 0x05, 0x01, 0x01, 0x01, 0x01, 0x01,
77 0x01, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
78 0x00, 0x01, 0x02, 0x03, 0x04, 0x05, 0x06, 0x07,
79 0x08, 0x09, 0x0a, 0x0b,
80 };
81
82 static const unsigned char chroma_dc_table[] = {
83 0x00, 0x03, 0x01, 0x01, 0x01, 0x01, 0x01, 0x01,
84 0x01, 0x01, 0x01, 0x00, 0x00, 0x00, 0x00, 0x00,
85 0x00, 0x01, 0x02, 0x03, 0x04, 0x05, 0x06, 0x07,
86 0x08, 0x09, 0x0a, 0x0b,
87 };
88
89 static const unsigned char luma_ac_table[] = {
90 0x00, 0x02, 0x01, 0x03, 0x03, 0x02, 0x04, 0x03,
91 0x05, 0x05, 0x04, 0x04, 0x00, 0x00, 0x01, 0x7d,
92 0x01, 0x02, 0x03, 0x00, 0x04, 0x11, 0x05, 0x12,
93 0x21, 0x31, 0x41, 0x06, 0x13, 0x51, 0x61, 0x07,
94 0x22, 0x71, 0x14, 0x32, 0x81, 0x91, 0xa1, 0x08,
95 0x23, 0x42, 0xb1, 0xc1, 0x15, 0x52, 0xd1, 0xf0,
96 0x24, 0x33, 0x62, 0x72, 0x82, 0x09, 0x0a, 0x16,
97 0x17, 0x18, 0x19, 0x1a, 0x25, 0x26, 0x27, 0x28,
98 0x29, 0x2a, 0x34, 0x35, 0x36, 0x37, 0x38, 0x39,
99 0x3a, 0x43, 0x44, 0x45, 0x46, 0x47, 0x48, 0x49,
100 0x4a, 0x53, 0x54, 0x55, 0x56, 0x57, 0x58, 0x59,
101 0x5a, 0x63, 0x64, 0x65, 0x66, 0x67, 0x68, 0x69,
102 0x6a, 0x73, 0x74, 0x75, 0x76, 0x77, 0x78, 0x79,
103 0x7a, 0x83, 0x84, 0x85, 0x86, 0x87, 0x88, 0x89,
104 0x8a, 0x92, 0x93, 0x94, 0x95, 0x96, 0x97, 0x98,
105 0x99, 0x9a, 0xa2, 0xa3, 0xa4, 0xa5, 0xa6, 0xa7,
106 0xa8, 0xa9, 0xaa, 0xb2, 0xb3, 0xb4, 0xb5, 0xb6,
107 0xb7, 0xb8, 0xb9, 0xba, 0xc2, 0xc3, 0xc4, 0xc5,
108 0xc6, 0xc7, 0xc8, 0xc9, 0xca, 0xd2, 0xd3, 0xd4,
109 0xd5, 0xd6, 0xd7, 0xd8, 0xd9, 0xda, 0xe1, 0xe2,
110 0xe3, 0xe4, 0xe5, 0xe6, 0xe7, 0xe8, 0xe9, 0xea,
111 0xf1, 0xf2, 0xf3, 0xf4, 0xf5, 0xf6, 0xf7, 0xf8,
112 0xf9, 0xfa,
113 };
114
115 static const unsigned char chroma_ac_table[] = {
116 0x00, 0x02, 0x01, 0x02, 0x04, 0x04, 0x03, 0x04,
117 0x07, 0x05, 0x04, 0x04, 0x00, 0x01, 0x02, 0x77,
118 0x00, 0x01, 0x02, 0x03, 0x11, 0x04, 0x05, 0x21,
119 0x31, 0x06, 0x12, 0x41, 0x51, 0x07, 0x61, 0x71,
120 0x13, 0x22, 0x32, 0x81, 0x08, 0x14, 0x42, 0x91,
121 0xa1, 0xb1, 0xc1, 0x09, 0x23, 0x33, 0x52, 0xf0,
122 0x15, 0x62, 0x72, 0xd1, 0x0a, 0x16, 0x24, 0x34,
123 0xe1, 0x25, 0xf1, 0x17, 0x18, 0x19, 0x1a, 0x26,
124 0x27, 0x28, 0x29, 0x2a, 0x35, 0x36, 0x37, 0x38,
125 0x39, 0x3a, 0x43, 0x44, 0x45, 0x46, 0x47, 0x48,
126 0x49, 0x4a, 0x53, 0x54, 0x55, 0x56, 0x57, 0x58,
127 0x59, 0x5a, 0x63, 0x64, 0x65, 0x66, 0x67, 0x68,
128 0x69, 0x6a, 0x73, 0x74, 0x75, 0x76, 0x77, 0x78,
129 0x79, 0x7a, 0x82, 0x83, 0x84, 0x85, 0x86, 0x87,
130 0x88, 0x89, 0x8a, 0x92, 0x93, 0x94, 0x95, 0x96,
131 0x97, 0x98, 0x99, 0x9a, 0xa2, 0xa3, 0xa4, 0xa5,
132 0xa6, 0xa7, 0xa8, 0xa9, 0xaa, 0xb2, 0xb3, 0xb4,
133 0xb5, 0xb6, 0xb7, 0xb8, 0xb9, 0xba, 0xc2, 0xc3,
134 0xc4, 0xc5, 0xc6, 0xc7, 0xc8, 0xc9, 0xca, 0xd2,
135 0xd3, 0xd4, 0xd5, 0xd6, 0xd7, 0xd8, 0xd9, 0xda,
136 0xe2, 0xe3, 0xe4, 0xe5, 0xe6, 0xe7, 0xe8, 0xe9,
137 0xea, 0xf2, 0xf3, 0xf4, 0xf5, 0xf6, 0xf7, 0xf8,
138 0xf9, 0xfa,
139 };
140
141 /* For simplicity, we keep a pre-formatted JPEG header,
142 * and we'll use fixed offsets to change the width, height
143 * quantization tables, etc.
144 */
145 static const unsigned char hantro_jpeg_header[] = {
146 /* SOI */
147 0xff, 0xd8,
148
149 /* JFIF-APP0 */
150 0xff, 0xe0, 0x00, 0x10, 0x4a, 0x46, 0x49, 0x46,
151 0x00, 0x01, 0x01, 0x00, 0x00, 0x01, 0x00, 0x01,
152 0x00, 0x00,
153
154 /* DQT */
155 0xff, 0xdb, 0x00, 0x84,
156
157 0x00,
158 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
159 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
160 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
161 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
162 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
163 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
164 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
165 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
166
167 0x01,
168 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
169 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
170 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
171 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
172 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
173 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
174 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
175 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
176
177 /* SOF */
178 0xff, 0xc0, 0x00, 0x11, 0x08, 0x00, 0xf0, 0x01,
179 0x40, 0x03, 0x01, 0x22, 0x00, 0x02, 0x11, 0x01,
180 0x03, 0x11, 0x01,
181
182 /* DHT */
183 0xff, 0xc4, 0x00, 0x1f, 0x00,
184
185 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
186 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
187 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
188 0x00, 0x00, 0x00, 0x00,
189
190 /* DHT */
191 0xff, 0xc4, 0x00, 0xb5, 0x10,
192
193 0x00, 0x00,
194 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
195 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
196 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
197 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
198 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
199 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
200 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
201 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
202 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
203 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
204 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
205 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
206 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
207 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
208 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
209 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
210 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
211 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
212 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
213 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
214 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
215 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
216
217 /* DHT */
218 0xff, 0xc4, 0x00, 0x1f, 0x01,
219
220 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
221 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
222 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
223 0x00, 0x00, 0x00, 0x00,
224
225 /* DHT */
226 0xff, 0xc4, 0x00, 0xb5, 0x11,
227
228 0x00, 0x00,
229 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
230 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
231 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
232 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
233 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
234 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
235 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
236 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
237 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
238 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
239 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
240 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
241 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
242 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
243 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
244 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
245 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
246 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
247 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
248 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
249 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
250 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
251
252 /* COM */
253 0xff, 0xfe, 0x00, 0x03, 0x00,
254
255 /* SOS */
256 0xff, 0xda, 0x00, 0x0c, 0x03, 0x01, 0x00, 0x02,
257 0x11, 0x03, 0x11, 0x00, 0x3f, 0x00,
258 };
259
260 /*
261 * JPEG_HEADER_SIZE is used in other parts of the driver in lieu of
262 * "sizeof(hantro_jpeg_header)". The two must be equal.
263 */
264 static_assert(sizeof(hantro_jpeg_header) == JPEG_HEADER_SIZE);
265
266 /*
267 * hantro_jpeg_header is padded with a COM segment, so that the payload
268 * of the SOS segment (the entropy-encoded image scan), which should
269 * trail the whole header, is 8-byte aligned for the hardware to write
270 * to directly.
271 */
272 static_assert(IS_ALIGNED(sizeof(hantro_jpeg_header), 8),
273 "Hantro JPEG header size needs to be 8-byte aligned.");
274
jpeg_scale_qp(const unsigned char qp,int scale)275 static unsigned char jpeg_scale_qp(const unsigned char qp, int scale)
276 {
277 unsigned int temp;
278
279 temp = DIV_ROUND_CLOSEST((unsigned int)qp * scale, 100);
280 if (temp <= 0)
281 temp = 1;
282 if (temp > 255)
283 temp = 255;
284
285 return (unsigned char)temp;
286 }
287
288 static void
jpeg_scale_quant_table(unsigned char * file_q_tab,unsigned char * reordered_q_tab,const unsigned char * tab,int scale)289 jpeg_scale_quant_table(unsigned char *file_q_tab,
290 unsigned char *reordered_q_tab,
291 const unsigned char *tab, int scale)
292 {
293 int i;
294
295 BUILD_BUG_ON(ARRAY_SIZE(zigzag) != JPEG_QUANT_SIZE);
296 BUILD_BUG_ON(ARRAY_SIZE(hw_reorder) != JPEG_QUANT_SIZE);
297
298 for (i = 0; i < JPEG_QUANT_SIZE; i++) {
299 file_q_tab[i] = jpeg_scale_qp(tab[zigzag[i]], scale);
300 reordered_q_tab[i] = jpeg_scale_qp(tab[hw_reorder[i]], scale);
301 }
302 }
303
jpeg_set_quality(struct hantro_jpeg_ctx * ctx)304 static void jpeg_set_quality(struct hantro_jpeg_ctx *ctx)
305 {
306 int scale;
307
308 /*
309 * Non-linear scaling factor:
310 * [5,50] -> [1000..100], [51,100] -> [98..0]
311 */
312 if (ctx->quality < 50)
313 scale = 5000 / ctx->quality;
314 else
315 scale = 200 - 2 * ctx->quality;
316
317 BUILD_BUG_ON(ARRAY_SIZE(luma_q_table) != JPEG_QUANT_SIZE);
318 BUILD_BUG_ON(ARRAY_SIZE(chroma_q_table) != JPEG_QUANT_SIZE);
319 BUILD_BUG_ON(ARRAY_SIZE(ctx->hw_luma_qtable) != JPEG_QUANT_SIZE);
320 BUILD_BUG_ON(ARRAY_SIZE(ctx->hw_chroma_qtable) != JPEG_QUANT_SIZE);
321
322 jpeg_scale_quant_table(ctx->buffer + LUMA_QUANT_OFF,
323 ctx->hw_luma_qtable, luma_q_table, scale);
324 jpeg_scale_quant_table(ctx->buffer + CHROMA_QUANT_OFF,
325 ctx->hw_chroma_qtable, chroma_q_table, scale);
326 }
327
hantro_jpeg_header_assemble(struct hantro_jpeg_ctx * ctx)328 void hantro_jpeg_header_assemble(struct hantro_jpeg_ctx *ctx)
329 {
330 char *buf = ctx->buffer;
331
332 memcpy(buf, hantro_jpeg_header,
333 sizeof(hantro_jpeg_header));
334
335 buf[HEIGHT_OFF + 0] = ctx->height >> 8;
336 buf[HEIGHT_OFF + 1] = ctx->height;
337 buf[WIDTH_OFF + 0] = ctx->width >> 8;
338 buf[WIDTH_OFF + 1] = ctx->width;
339
340 memcpy(buf + HUFF_LUMA_DC_OFF, luma_dc_table, sizeof(luma_dc_table));
341 memcpy(buf + HUFF_LUMA_AC_OFF, luma_ac_table, sizeof(luma_ac_table));
342 memcpy(buf + HUFF_CHROMA_DC_OFF, chroma_dc_table,
343 sizeof(chroma_dc_table));
344 memcpy(buf + HUFF_CHROMA_AC_OFF, chroma_ac_table,
345 sizeof(chroma_ac_table));
346
347 jpeg_set_quality(ctx);
348 }
349