Line | Branch | Exec | Source |
---|---|---|---|
1 | /* | ||
2 | * NewTek SpeedHQ codec | ||
3 | * Copyright 2017 Steinar H. Gunderson | ||
4 | * | ||
5 | * This file is part of FFmpeg. | ||
6 | * | ||
7 | * FFmpeg is free software; you can redistribute it and/or | ||
8 | * modify it under the terms of the GNU Lesser General Public | ||
9 | * License as published by the Free Software Foundation; either | ||
10 | * version 2.1 of the License, or (at your option) any later version. | ||
11 | * | ||
12 | * FFmpeg is distributed in the hope that it will be useful, | ||
13 | * but WITHOUT ANY WARRANTY; without even the implied warranty of | ||
14 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU | ||
15 | * Lesser General Public License for more details. | ||
16 | * | ||
17 | * You should have received a copy of the GNU Lesser General Public | ||
18 | * License along with FFmpeg; if not, write to the Free Software | ||
19 | * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA | ||
20 | */ | ||
21 | |||
22 | /** | ||
23 | * @file | ||
24 | * NewTek SpeedHQ decoder. | ||
25 | */ | ||
26 | |||
27 | #define BITSTREAM_READER_LE | ||
28 | |||
29 | #include "libavutil/attributes.h" | ||
30 | #include "libavutil/mem_internal.h" | ||
31 | |||
32 | #include "avcodec.h" | ||
33 | #include "blockdsp.h" | ||
34 | #include "codec_internal.h" | ||
35 | #include "decode.h" | ||
36 | #include "get_bits.h" | ||
37 | #include "idctdsp.h" | ||
38 | #include "libavutil/thread.h" | ||
39 | #include "mathops.h" | ||
40 | #include "mpeg12data.h" | ||
41 | #include "mpeg12vlc.h" | ||
42 | #include "speedhq.h" | ||
43 | #include "thread.h" | ||
44 | |||
45 | #define MAX_INDEX (64 - 1) | ||
46 | |||
47 | /* | ||
48 | * 5 bits makes for very small tables, with no more than two lookups needed | ||
49 | * for the longest (10-bit) codes. | ||
50 | */ | ||
51 | #define ALPHA_VLC_BITS 5 | ||
52 | |||
53 | typedef struct SHQContext { | ||
54 | BlockDSPContext bdsp; | ||
55 | IDCTDSPContext idsp; | ||
56 | uint8_t permutated_intra_scantable[64]; | ||
57 | int quant_matrix[64]; | ||
58 | enum { SHQ_SUBSAMPLING_420, SHQ_SUBSAMPLING_422, SHQ_SUBSAMPLING_444 } | ||
59 | subsampling; | ||
60 | enum { SHQ_NO_ALPHA, SHQ_RLE_ALPHA, SHQ_DCT_ALPHA } alpha_type; | ||
61 | AVPacket *avpkt; | ||
62 | uint32_t second_field_offset; | ||
63 | } SHQContext; | ||
64 | |||
65 | /* NOTE: The first element is always 16, unscaled. */ | ||
66 | static const uint8_t unscaled_quant_matrix[64] = { | ||
67 | 16, 16, 19, 22, 26, 27, 29, 34, | ||
68 | 16, 16, 22, 24, 27, 29, 34, 37, | ||
69 | 19, 22, 26, 27, 29, 34, 34, 38, | ||
70 | 22, 22, 26, 27, 29, 34, 37, 40, | ||
71 | 22, 26, 27, 29, 32, 35, 40, 48, | ||
72 | 26, 27, 29, 32, 35, 40, 48, 58, | ||
73 | 26, 27, 29, 34, 38, 46, 56, 69, | ||
74 | 27, 29, 35, 38, 46, 56, 69, 83 | ||
75 | }; | ||
76 | |||
77 | static VLCElem dc_lum_vlc_le[512]; | ||
78 | static VLCElem dc_chroma_vlc_le[514]; | ||
79 | static VLCElem dc_alpha_run_vlc_le[160]; | ||
80 | static VLCElem dc_alpha_level_vlc_le[288]; | ||
81 | |||
82 | static RL_VLC_ELEM speedhq_rl_vlc[674]; | ||
83 | |||
84 | 1544736 | static inline int decode_dc_le(GetBitContext *gb, int component) | |
85 | { | ||
86 | int code, diff; | ||
87 | |||
88 |
3/4✓ Branch 0 taken 831768 times.
✓ Branch 1 taken 712968 times.
✗ Branch 2 not taken.
✓ Branch 3 taken 831768 times.
|
1544736 | if (component == 0 || component == 3) { |
89 | 712968 | code = get_vlc2(gb, dc_lum_vlc_le, DC_VLC_BITS, 2); | |
90 | } else { | ||
91 | 831768 | code = get_vlc2(gb, dc_chroma_vlc_le, DC_VLC_BITS, 2); | |
92 | } | ||
93 |
2/2✓ Branch 0 taken 9976 times.
✓ Branch 1 taken 1534760 times.
|
1544736 | if (!code) { |
94 | 9976 | diff = 0; | |
95 | } else { | ||
96 | 1534760 | diff = get_xbits_le(gb, code); | |
97 | } | ||
98 | 1544736 | return diff; | |
99 | } | ||
100 | |||
101 | ✗ | static inline int decode_alpha_block(const SHQContext *s, GetBitContext *gb, uint8_t last_alpha[16], uint8_t *dest, int linesize) | |
102 | { | ||
103 | uint8_t block[128]; | ||
104 | ✗ | int i = 0, x, y; | |
105 | |||
106 | ✗ | memset(block, 0, sizeof(block)); | |
107 | |||
108 | { | ||
109 | ✗ | OPEN_READER(re, gb); | |
110 | |||
111 | ✗ | for ( ;; ) { | |
112 | int run, level; | ||
113 | |||
114 | ✗ | UPDATE_CACHE_LE(re, gb); | |
115 | ✗ | GET_VLC(run, re, gb, dc_alpha_run_vlc_le, ALPHA_VLC_BITS, 2); | |
116 | |||
117 | ✗ | if (run < 0) break; | |
118 | ✗ | i += run; | |
119 | ✗ | if (i >= 128) | |
120 | ✗ | return AVERROR_INVALIDDATA; | |
121 | |||
122 | ✗ | UPDATE_CACHE_LE(re, gb); | |
123 | ✗ | GET_VLC(level, re, gb, dc_alpha_level_vlc_le, ALPHA_VLC_BITS, 2); | |
124 | ✗ | block[i++] = level; | |
125 | } | ||
126 | |||
127 | ✗ | CLOSE_READER(re, gb); | |
128 | } | ||
129 | |||
130 | ✗ | for (y = 0; y < 8; y++) { | |
131 | ✗ | for (x = 0; x < 16; x++) { | |
132 | ✗ | last_alpha[x] -= block[y * 16 + x]; | |
133 | } | ||
134 | ✗ | memcpy(dest, last_alpha, 16); | |
135 | ✗ | dest += linesize; | |
136 | } | ||
137 | |||
138 | ✗ | return 0; | |
139 | } | ||
140 | |||
141 | 1544736 | static inline int decode_dct_block(const SHQContext *s, GetBitContext *gb, int last_dc[4], int component, uint8_t *dest, int linesize) | |
142 | { | ||
143 | 1544736 | const int *quant_matrix = s->quant_matrix; | |
144 | 1544736 | const uint8_t *scantable = s->permutated_intra_scantable; | |
145 | 1544736 | LOCAL_ALIGNED_32(int16_t, block, [64]); | |
146 | int dc_offset; | ||
147 | |||
148 | 1544736 | s->bdsp.clear_block(block); | |
149 | |||
150 | 1544736 | dc_offset = decode_dc_le(gb, component); | |
151 | 1544736 | last_dc[component] -= dc_offset; /* Note: Opposite of most codecs. */ | |
152 | 1544736 | block[scantable[0]] = last_dc[component]; /* quant_matrix[0] is always 16. */ | |
153 | |||
154 | /* Read AC coefficients. */ | ||
155 | { | ||
156 | 1544736 | int i = 0; | |
157 | 1544736 | OPEN_READER(re, gb); | |
158 | 5781637 | for ( ;; ) { | |
159 | int level, run; | ||
160 | 7326373 | UPDATE_CACHE_LE(re, gb); | |
161 |
2/2✓ Branch 0 taken 152486 times.
✓ Branch 1 taken 7173887 times.
|
7326373 | GET_RL_VLC(level, run, re, gb, speedhq_rl_vlc, |
162 | TEX_VLC_BITS, 2, 0); | ||
163 |
2/2✓ Branch 0 taken 1544736 times.
✓ Branch 1 taken 5781637 times.
|
7326373 | if (level == 127) { |
164 | 1544736 | break; | |
165 |
2/2✓ Branch 0 taken 5755452 times.
✓ Branch 1 taken 26185 times.
|
5781637 | } else if (level) { |
166 | 5755452 | i += run; | |
167 |
1/2✗ Branch 0 not taken.
✓ Branch 1 taken 5755452 times.
|
5755452 | if (i > MAX_INDEX) |
168 | ✗ | return AVERROR_INVALIDDATA; | |
169 | /* If next bit is 1, level = -level */ | ||
170 | 5755452 | level = (level ^ SHOW_SBITS(re, gb, 1)) - | |
171 | 5755452 | SHOW_SBITS(re, gb, 1); | |
172 | 5755452 | LAST_SKIP_BITS(re, gb, 1); | |
173 | } else { | ||
174 | /* Escape. */ | ||
175 | #if MIN_CACHE_BITS < 6 + 6 + 12 | ||
176 | #error MIN_CACHE_BITS is too small for the escape code, add UPDATE_CACHE | ||
177 | #endif | ||
178 | 26185 | run = SHOW_UBITS(re, gb, 6) + 1; | |
179 | 26185 | SKIP_BITS(re, gb, 6); | |
180 | 26185 | level = SHOW_UBITS(re, gb, 12) - 2048; | |
181 | 26185 | LAST_SKIP_BITS(re, gb, 12); | |
182 | |||
183 | 26185 | i += run; | |
184 |
1/2✗ Branch 0 not taken.
✓ Branch 1 taken 26185 times.
|
26185 | if (i > MAX_INDEX) |
185 | ✗ | return AVERROR_INVALIDDATA; | |
186 | } | ||
187 | |||
188 | 5781637 | block[scantable[i]] = (level * quant_matrix[i]) >> 4; | |
189 | } | ||
190 | 1544736 | CLOSE_READER(re, gb); | |
191 | } | ||
192 | |||
193 | 1544736 | s->idsp.idct_put(dest, linesize, block); | |
194 | |||
195 | 1544736 | return 0; | |
196 | } | ||
197 | |||
198 | ✗ | static int decode_speedhq_border(const SHQContext *s, GetBitContext *gb, AVFrame *frame, int field_number, int line_stride) | |
199 | { | ||
200 | ✗ | int linesize_y = frame->linesize[0] * line_stride; | |
201 | ✗ | int linesize_cb = frame->linesize[1] * line_stride; | |
202 | ✗ | int linesize_cr = frame->linesize[2] * line_stride; | |
203 | int linesize_a; | ||
204 | int ret; | ||
205 | |||
206 | ✗ | if (s->alpha_type != SHQ_NO_ALPHA) | |
207 | ✗ | linesize_a = frame->linesize[3] * line_stride; | |
208 | |||
209 | ✗ | for (int y = 0; y < frame->height; y += 16 * line_stride) { | |
210 | ✗ | int last_dc[4] = { 1024, 1024, 1024, 1024 }; | |
211 | uint8_t *dest_y, *dest_cb, *dest_cr, *dest_a; | ||
212 | uint8_t last_alpha[16]; | ||
213 | ✗ | int x = frame->width - 8; | |
214 | |||
215 | ✗ | dest_y = frame->data[0] + frame->linesize[0] * (y + field_number) + x; | |
216 | ✗ | if (s->subsampling == SHQ_SUBSAMPLING_420) { | |
217 | ✗ | dest_cb = frame->data[1] + frame->linesize[1] * (y/2 + field_number) + x / 2; | |
218 | ✗ | dest_cr = frame->data[2] + frame->linesize[2] * (y/2 + field_number) + x / 2; | |
219 | } else { | ||
220 | av_assert2(s->subsampling == SHQ_SUBSAMPLING_422); | ||
221 | ✗ | dest_cb = frame->data[1] + frame->linesize[1] * (y + field_number) + x / 2; | |
222 | ✗ | dest_cr = frame->data[2] + frame->linesize[2] * (y + field_number) + x / 2; | |
223 | } | ||
224 | ✗ | if (s->alpha_type != SHQ_NO_ALPHA) { | |
225 | ✗ | memset(last_alpha, 255, sizeof(last_alpha)); | |
226 | ✗ | dest_a = frame->data[3] + frame->linesize[3] * (y + field_number) + x; | |
227 | } | ||
228 | |||
229 | ✗ | if ((ret = decode_dct_block(s, gb, last_dc, 0, dest_y, linesize_y)) < 0) | |
230 | ✗ | return ret; | |
231 | ✗ | if ((ret = decode_dct_block(s, gb, last_dc, 0, dest_y + 8, linesize_y)) < 0) | |
232 | ✗ | return ret; | |
233 | ✗ | if ((ret = decode_dct_block(s, gb, last_dc, 0, dest_y + 8 * linesize_y, linesize_y)) < 0) | |
234 | ✗ | return ret; | |
235 | ✗ | if ((ret = decode_dct_block(s, gb, last_dc, 0, dest_y + 8 * linesize_y + 8, linesize_y)) < 0) | |
236 | ✗ | return ret; | |
237 | ✗ | if ((ret = decode_dct_block(s, gb, last_dc, 1, dest_cb, linesize_cb)) < 0) | |
238 | ✗ | return ret; | |
239 | ✗ | if ((ret = decode_dct_block(s, gb, last_dc, 2, dest_cr, linesize_cr)) < 0) | |
240 | ✗ | return ret; | |
241 | |||
242 | ✗ | if (s->subsampling != SHQ_SUBSAMPLING_420) { | |
243 | ✗ | if ((ret = decode_dct_block(s, gb, last_dc, 1, dest_cb + 8 * linesize_cb, linesize_cb)) < 0) | |
244 | ✗ | return ret; | |
245 | ✗ | if ((ret = decode_dct_block(s, gb, last_dc, 2, dest_cr + 8 * linesize_cr, linesize_cr)) < 0) | |
246 | ✗ | return ret; | |
247 | } | ||
248 | |||
249 | ✗ | if (s->alpha_type == SHQ_RLE_ALPHA) { | |
250 | /* Alpha coded using 16x8 RLE blocks. */ | ||
251 | ✗ | if ((ret = decode_alpha_block(s, gb, last_alpha, dest_a, linesize_a)) < 0) | |
252 | ✗ | return ret; | |
253 | ✗ | if ((ret = decode_alpha_block(s, gb, last_alpha, dest_a + 8 * linesize_a, linesize_a)) < 0) | |
254 | ✗ | return ret; | |
255 | ✗ | } else if (s->alpha_type == SHQ_DCT_ALPHA) { | |
256 | /* Alpha encoded exactly like luma. */ | ||
257 | ✗ | if ((ret = decode_dct_block(s, gb, last_dc, 3, dest_a, linesize_a)) < 0) | |
258 | ✗ | return ret; | |
259 | ✗ | if ((ret = decode_dct_block(s, gb, last_dc, 3, dest_a + 8, linesize_a)) < 0) | |
260 | ✗ | return ret; | |
261 | ✗ | if ((ret = decode_dct_block(s, gb, last_dc, 3, dest_a + 8 * linesize_a, linesize_a)) < 0) | |
262 | ✗ | return ret; | |
263 | ✗ | if ((ret = decode_dct_block(s, gb, last_dc, 3, dest_a + 8 * linesize_a + 8, linesize_a)) < 0) | |
264 | ✗ | return ret; | |
265 | } | ||
266 | } | ||
267 | |||
268 | ✗ | return 0; | |
269 | } | ||
270 | |||
271 | 1812 | static int decode_speedhq_field(const SHQContext *s, const uint8_t *buf, int buf_size, AVFrame *frame, int field_number, int start, int end, int line_stride, int slice_number) | |
272 | { | ||
273 | int ret, x, y, slice_offsets[5]; | ||
274 | uint32_t slice_begin, slice_end; | ||
275 | 1812 | int linesize_y = frame->linesize[0] * line_stride; | |
276 | 1812 | int linesize_cb = frame->linesize[1] * line_stride; | |
277 | 1812 | int linesize_cr = frame->linesize[2] * line_stride; | |
278 | int linesize_a; | ||
279 | GetBitContext gb; | ||
280 | |||
281 |
1/2✗ Branch 0 not taken.
✓ Branch 1 taken 1812 times.
|
1812 | if (s->alpha_type != SHQ_NO_ALPHA) |
282 | ✗ | linesize_a = frame->linesize[3] * line_stride; | |
283 | |||
284 |
3/6✓ Branch 0 taken 1812 times.
✗ Branch 1 not taken.
✓ Branch 2 taken 1812 times.
✗ Branch 3 not taken.
✗ Branch 4 not taken.
✓ Branch 5 taken 1812 times.
|
1812 | if (end < start || end - start < 3 || end > buf_size) |
285 | ✗ | return AVERROR_INVALIDDATA; | |
286 | |||
287 | 1812 | slice_offsets[0] = start; | |
288 | 1812 | slice_offsets[4] = end; | |
289 |
2/2✓ Branch 0 taken 5436 times.
✓ Branch 1 taken 1812 times.
|
7248 | for (x = 1; x < 4; x++) { |
290 | uint32_t last_offset, slice_len; | ||
291 | |||
292 | 5436 | last_offset = slice_offsets[x - 1]; | |
293 | 5436 | slice_len = AV_RL24(buf + last_offset); | |
294 | 5436 | slice_offsets[x] = last_offset + slice_len; | |
295 | |||
296 |
2/4✓ Branch 0 taken 5436 times.
✗ Branch 1 not taken.
✗ Branch 2 not taken.
✓ Branch 3 taken 5436 times.
|
5436 | if (slice_len < 3 || slice_offsets[x] > end - 3) |
297 | ✗ | return AVERROR_INVALIDDATA; | |
298 | } | ||
299 | |||
300 | 1812 | slice_begin = slice_offsets[slice_number]; | |
301 | 1812 | slice_end = slice_offsets[slice_number + 1]; | |
302 | |||
303 |
1/2✗ Branch 1 not taken.
✓ Branch 2 taken 1812 times.
|
1812 | if ((ret = init_get_bits8(&gb, buf + slice_begin + 3, slice_end - slice_begin - 3)) < 0) |
304 | ✗ | return ret; | |
305 | |||
306 |
2/2✓ Branch 0 taken 8106 times.
✓ Branch 1 taken 1812 times.
|
9918 | for (y = slice_number * 16 * line_stride; y < frame->height; y += line_stride * 64) { |
307 | uint8_t *dest_y, *dest_cb, *dest_cr, *dest_a; | ||
308 | 8106 | int last_dc[4] = { 1024, 1024, 1024, 1024 }; | |
309 | uint8_t last_alpha[16]; | ||
310 | |||
311 | 8106 | memset(last_alpha, 255, sizeof(last_alpha)); | |
312 | |||
313 | 8106 | dest_y = frame->data[0] + frame->linesize[0] * (y + field_number); | |
314 |
2/2✓ Branch 0 taken 2700 times.
✓ Branch 1 taken 5406 times.
|
8106 | if (s->subsampling == SHQ_SUBSAMPLING_420) { |
315 | 2700 | dest_cb = frame->data[1] + frame->linesize[1] * (y/2 + field_number); | |
316 | 2700 | dest_cr = frame->data[2] + frame->linesize[2] * (y/2 + field_number); | |
317 | } else { | ||
318 | 5406 | dest_cb = frame->data[1] + frame->linesize[1] * (y + field_number); | |
319 | 5406 | dest_cr = frame->data[2] + frame->linesize[2] * (y + field_number); | |
320 | } | ||
321 |
1/2✗ Branch 0 not taken.
✓ Branch 1 taken 8106 times.
|
8106 | if (s->alpha_type != SHQ_NO_ALPHA) { |
322 | ✗ | dest_a = frame->data[3] + frame->linesize[3] * (y + field_number); | |
323 | } | ||
324 | |||
325 |
4/4✓ Branch 0 taken 124248 times.
✓ Branch 1 taken 62100 times.
✓ Branch 2 taken 178242 times.
✓ Branch 3 taken 8106 times.
|
186348 | for (x = 0; x < frame->width - 8 * (s->subsampling != SHQ_SUBSAMPLING_444); x += 16) { |
326 | /* Decode the four luma blocks. */ | ||
327 |
1/2✗ Branch 1 not taken.
✓ Branch 2 taken 178242 times.
|
178242 | if ((ret = decode_dct_block(s, &gb, last_dc, 0, dest_y, linesize_y)) < 0) |
328 | ✗ | return ret; | |
329 |
1/2✗ Branch 1 not taken.
✓ Branch 2 taken 178242 times.
|
178242 | if ((ret = decode_dct_block(s, &gb, last_dc, 0, dest_y + 8, linesize_y)) < 0) |
330 | ✗ | return ret; | |
331 |
1/2✗ Branch 1 not taken.
✓ Branch 2 taken 178242 times.
|
178242 | if ((ret = decode_dct_block(s, &gb, last_dc, 0, dest_y + 8 * linesize_y, linesize_y)) < 0) |
332 | ✗ | return ret; | |
333 |
1/2✗ Branch 1 not taken.
✓ Branch 2 taken 178242 times.
|
178242 | if ((ret = decode_dct_block(s, &gb, last_dc, 0, dest_y + 8 * linesize_y + 8, linesize_y)) < 0) |
334 | ✗ | return ret; | |
335 | |||
336 | /* | ||
337 | * Decode the first chroma block. For 4:2:0, this is the only one; | ||
338 | * for 4:2:2, it's the top block; for 4:4:4, it's the top-left block. | ||
339 | */ | ||
340 |
1/2✗ Branch 1 not taken.
✓ Branch 2 taken 178242 times.
|
178242 | if ((ret = decode_dct_block(s, &gb, last_dc, 1, dest_cb, linesize_cb)) < 0) |
341 | ✗ | return ret; | |
342 |
1/2✗ Branch 1 not taken.
✓ Branch 2 taken 178242 times.
|
178242 | if ((ret = decode_dct_block(s, &gb, last_dc, 2, dest_cr, linesize_cr)) < 0) |
343 | ✗ | return ret; | |
344 | |||
345 |
2/2✓ Branch 0 taken 118842 times.
✓ Branch 1 taken 59400 times.
|
178242 | if (s->subsampling != SHQ_SUBSAMPLING_420) { |
346 | /* For 4:2:2, this is the bottom block; for 4:4:4, it's the bottom-left block. */ | ||
347 |
1/2✗ Branch 1 not taken.
✓ Branch 2 taken 118842 times.
|
118842 | if ((ret = decode_dct_block(s, &gb, last_dc, 1, dest_cb + 8 * linesize_cb, linesize_cb)) < 0) |
348 | ✗ | return ret; | |
349 |
1/2✗ Branch 1 not taken.
✓ Branch 2 taken 118842 times.
|
118842 | if ((ret = decode_dct_block(s, &gb, last_dc, 2, dest_cr + 8 * linesize_cr, linesize_cr)) < 0) |
350 | ✗ | return ret; | |
351 | |||
352 |
2/2✓ Branch 0 taken 59400 times.
✓ Branch 1 taken 59442 times.
|
118842 | if (s->subsampling == SHQ_SUBSAMPLING_444) { |
353 | /* Top-right and bottom-right blocks. */ | ||
354 |
1/2✗ Branch 1 not taken.
✓ Branch 2 taken 59400 times.
|
59400 | if ((ret = decode_dct_block(s, &gb, last_dc, 1, dest_cb + 8, linesize_cb)) < 0) |
355 | ✗ | return ret; | |
356 |
1/2✗ Branch 1 not taken.
✓ Branch 2 taken 59400 times.
|
59400 | if ((ret = decode_dct_block(s, &gb, last_dc, 2, dest_cr + 8, linesize_cr)) < 0) |
357 | ✗ | return ret; | |
358 |
1/2✗ Branch 1 not taken.
✓ Branch 2 taken 59400 times.
|
59400 | if ((ret = decode_dct_block(s, &gb, last_dc, 1, dest_cb + 8 * linesize_cb + 8, linesize_cb)) < 0) |
359 | ✗ | return ret; | |
360 |
1/2✗ Branch 1 not taken.
✓ Branch 2 taken 59400 times.
|
59400 | if ((ret = decode_dct_block(s, &gb, last_dc, 2, dest_cr + 8 * linesize_cr + 8, linesize_cr)) < 0) |
361 | ✗ | return ret; | |
362 | |||
363 | 59400 | dest_cb += 8; | |
364 | 59400 | dest_cr += 8; | |
365 | } | ||
366 | } | ||
367 | 178242 | dest_y += 16; | |
368 | 178242 | dest_cb += 8; | |
369 | 178242 | dest_cr += 8; | |
370 | |||
371 |
1/2✗ Branch 0 not taken.
✓ Branch 1 taken 178242 times.
|
178242 | if (s->alpha_type == SHQ_RLE_ALPHA) { |
372 | /* Alpha coded using 16x8 RLE blocks. */ | ||
373 | ✗ | if ((ret = decode_alpha_block(s, &gb, last_alpha, dest_a, linesize_a)) < 0) | |
374 | ✗ | return ret; | |
375 | ✗ | if ((ret = decode_alpha_block(s, &gb, last_alpha, dest_a + 8 * linesize_a, linesize_a)) < 0) | |
376 | ✗ | return ret; | |
377 | ✗ | dest_a += 16; | |
378 |
1/2✗ Branch 0 not taken.
✓ Branch 1 taken 178242 times.
|
178242 | } else if (s->alpha_type == SHQ_DCT_ALPHA) { |
379 | /* Alpha encoded exactly like luma. */ | ||
380 | ✗ | if ((ret = decode_dct_block(s, &gb, last_dc, 3, dest_a, linesize_a)) < 0) | |
381 | ✗ | return ret; | |
382 | ✗ | if ((ret = decode_dct_block(s, &gb, last_dc, 3, dest_a + 8, linesize_a)) < 0) | |
383 | ✗ | return ret; | |
384 | ✗ | if ((ret = decode_dct_block(s, &gb, last_dc, 3, dest_a + 8 * linesize_a, linesize_a)) < 0) | |
385 | ✗ | return ret; | |
386 | ✗ | if ((ret = decode_dct_block(s, &gb, last_dc, 3, dest_a + 8 * linesize_a + 8, linesize_a)) < 0) | |
387 | ✗ | return ret; | |
388 | ✗ | dest_a += 16; | |
389 | } | ||
390 | } | ||
391 | } | ||
392 | |||
393 |
3/6✓ Branch 0 taken 1212 times.
✓ Branch 1 taken 600 times.
✗ Branch 2 not taken.
✓ Branch 3 taken 1212 times.
✗ Branch 4 not taken.
✗ Branch 5 not taken.
|
1812 | if (s->subsampling != SHQ_SUBSAMPLING_444 && (frame->width & 15) && slice_number == 3) |
394 | ✗ | return decode_speedhq_border(s, &gb, frame, field_number, line_stride); | |
395 | |||
396 | 1812 | return 0; | |
397 | } | ||
398 | |||
399 | 1804 | static int decode_slice_progressive(AVCodecContext *avctx, void *arg, int jobnr, int threadnr) | |
400 | { | ||
401 | 1804 | SHQContext *s = avctx->priv_data; | |
402 | (void)threadnr; | ||
403 | |||
404 | 1804 | return decode_speedhq_field(avctx->priv_data, s->avpkt->data, s->avpkt->size, arg, 0, 4, s->avpkt->size, 1, jobnr); | |
405 | } | ||
406 | |||
407 | 8 | static int decode_slice_interlaced(AVCodecContext *avctx, void *arg, int jobnr, int threadnr) | |
408 | { | ||
409 | 8 | SHQContext *s = avctx->priv_data; | |
410 | 8 | int field_number = jobnr / 4; | |
411 | 8 | int slice_number = jobnr % 4; | |
412 | (void)threadnr; | ||
413 | |||
414 |
2/2✓ Branch 0 taken 4 times.
✓ Branch 1 taken 4 times.
|
8 | if (field_number == 0) |
415 | 4 | return decode_speedhq_field(avctx->priv_data, s->avpkt->data, s->avpkt->size, arg, 0, 4, s->second_field_offset, 2, slice_number); | |
416 | else | ||
417 | 4 | return decode_speedhq_field(avctx->priv_data, s->avpkt->data, s->avpkt->size, arg, 1, s->second_field_offset, s->avpkt->size, 2, slice_number); | |
418 | } | ||
419 | |||
420 | 452 | static void compute_quant_matrix(int *output, int qscale) | |
421 | { | ||
422 | int i; | ||
423 |
2/2✓ Branch 0 taken 28928 times.
✓ Branch 1 taken 452 times.
|
29380 | for (i = 0; i < 64; i++) output[i] = unscaled_quant_matrix[ff_zigzag_direct[i]] * qscale; |
424 | 452 | } | |
425 | |||
426 | 452 | static int speedhq_decode_frame(AVCodecContext *avctx, AVFrame *frame, | |
427 | int *got_frame, AVPacket *avpkt) | ||
428 | { | ||
429 | 452 | SHQContext * const s = avctx->priv_data; | |
430 | 452 | const uint8_t *buf = avpkt->data; | |
431 | 452 | int buf_size = avpkt->size; | |
432 | uint8_t quality; | ||
433 | int ret; | ||
434 | |||
435 |
3/6✓ Branch 0 taken 452 times.
✗ Branch 1 not taken.
✓ Branch 2 taken 452 times.
✗ Branch 3 not taken.
✗ Branch 4 not taken.
✓ Branch 5 taken 452 times.
|
452 | if (buf_size < 4 || avctx->width < 8 || avctx->width % 8 != 0) |
436 | ✗ | return AVERROR_INVALIDDATA; | |
437 |
1/2✗ Branch 0 not taken.
✓ Branch 1 taken 452 times.
|
452 | if (buf_size < avctx->width*avctx->height / 64 / 4) |
438 | ✗ | return AVERROR_INVALIDDATA; | |
439 | |||
440 | 452 | quality = buf[0]; | |
441 |
1/2✗ Branch 0 not taken.
✓ Branch 1 taken 452 times.
|
452 | if (quality >= 100) { |
442 | ✗ | return AVERROR_INVALIDDATA; | |
443 | } | ||
444 | |||
445 |
1/2✗ Branch 0 not taken.
✓ Branch 1 taken 452 times.
|
452 | if (avctx->skip_frame >= AVDISCARD_ALL) |
446 | ✗ | return avpkt->size; | |
447 | |||
448 | 452 | compute_quant_matrix(s->quant_matrix, 100 - quality); | |
449 | |||
450 | 452 | s->second_field_offset = AV_RL24(buf + 1); | |
451 |
1/2✗ Branch 0 not taken.
✓ Branch 1 taken 452 times.
|
452 | if (s->second_field_offset >= buf_size - 3) { |
452 | ✗ | return AVERROR_INVALIDDATA; | |
453 | } | ||
454 | |||
455 | 452 | avctx->coded_width = FFALIGN(avctx->width, 16); | |
456 | 452 | avctx->coded_height = FFALIGN(avctx->height, 16); | |
457 | |||
458 |
1/2✗ Branch 1 not taken.
✓ Branch 2 taken 452 times.
|
452 | if ((ret = ff_thread_get_buffer(avctx, frame, 0)) < 0) { |
459 | ✗ | return ret; | |
460 | } | ||
461 | |||
462 | 452 | s->avpkt = avpkt; | |
463 | |||
464 |
3/4✓ Branch 0 taken 1 times.
✓ Branch 1 taken 451 times.
✗ Branch 2 not taken.
✓ Branch 3 taken 1 times.
|
452 | if (s->second_field_offset == 4 || s->second_field_offset == (buf_size-4)) { |
465 | /* | ||
466 | * Overlapping first and second fields is used to signal | ||
467 | * encoding only a single field. In this case, "height" | ||
468 | * is ambiguous; it could mean either the height of the | ||
469 | * frame as a whole, or of the field. The former would make | ||
470 | * more sense for compatibility with legacy decoders, | ||
471 | * but this matches the convention used in NDI, which is | ||
472 | * the primary user of this trick. | ||
473 | */ | ||
474 |
1/2✗ Branch 1 not taken.
✓ Branch 2 taken 451 times.
|
451 | if ((ret = avctx->execute2(avctx, decode_slice_progressive, frame, NULL, 4)) < 0) |
475 | ✗ | return ret; | |
476 | } else { | ||
477 |
1/2✗ Branch 1 not taken.
✓ Branch 2 taken 1 times.
|
1 | if ((ret = avctx->execute2(avctx, decode_slice_interlaced, frame, NULL, 8)) < 0) |
478 | ✗ | return ret; | |
479 | } | ||
480 | |||
481 | 452 | *got_frame = 1; | |
482 | 452 | return buf_size; | |
483 | } | ||
484 | |||
485 | /* | ||
486 | * Alpha VLC. Run and level are independently coded, and would be | ||
487 | * outside the default limits for MAX_RUN/MAX_LEVEL, so we don't | ||
488 | * bother with combining them into one table. | ||
489 | */ | ||
490 | 11 | static av_cold void compute_alpha_vlcs(void) | |
491 | { | ||
492 | uint16_t run_code[134], level_code[266]; | ||
493 | uint8_t run_bits[134], level_bits[266]; | ||
494 | int16_t run_symbols[134], level_symbols[266]; | ||
495 | int entry, i, sign; | ||
496 | |||
497 | /* Initialize VLC for alpha run. */ | ||
498 | 11 | entry = 0; | |
499 | |||
500 | /* 0 -> 0. */ | ||
501 | 11 | run_code[entry] = 0; | |
502 | 11 | run_bits[entry] = 1; | |
503 | 11 | run_symbols[entry] = 0; | |
504 | 11 | ++entry; | |
505 | |||
506 | /* 10xx -> xx plus 1. */ | ||
507 |
2/2✓ Branch 0 taken 44 times.
✓ Branch 1 taken 11 times.
|
55 | for (i = 0; i < 4; ++i) { |
508 | 44 | run_code[entry] = (i << 2) | 1; | |
509 | 44 | run_bits[entry] = 4; | |
510 | 44 | run_symbols[entry] = i + 1; | |
511 | 44 | ++entry; | |
512 | } | ||
513 | |||
514 | /* 111xxxxxxx -> xxxxxxx. */ | ||
515 |
2/2✓ Branch 0 taken 1408 times.
✓ Branch 1 taken 11 times.
|
1419 | for (i = 0; i < 128; ++i) { |
516 | 1408 | run_code[entry] = (i << 3) | 7; | |
517 | 1408 | run_bits[entry] = 10; | |
518 | 1408 | run_symbols[entry] = i; | |
519 | 1408 | ++entry; | |
520 | } | ||
521 | |||
522 | /* 110 -> EOB. */ | ||
523 | 11 | run_code[entry] = 3; | |
524 | 11 | run_bits[entry] = 3; | |
525 | 11 | run_symbols[entry] = -1; | |
526 | 11 | ++entry; | |
527 | |||
528 |
1/2✗ Branch 0 not taken.
✓ Branch 1 taken 11 times.
|
11 | av_assert0(entry == FF_ARRAY_ELEMS(run_code)); |
529 | |||
530 | 11 | VLC_INIT_STATIC_SPARSE_TABLE(dc_alpha_run_vlc_le, ALPHA_VLC_BITS, | |
531 | FF_ARRAY_ELEMS(run_code), | ||
532 | run_bits, 1, 1, | ||
533 | run_code, 2, 2, | ||
534 | run_symbols, 2, 2, VLC_INIT_LE); | ||
535 | |||
536 | /* Initialize VLC for alpha level. */ | ||
537 | 11 | entry = 0; | |
538 | |||
539 |
2/2✓ Branch 0 taken 22 times.
✓ Branch 1 taken 11 times.
|
33 | for (sign = 0; sign <= 1; ++sign) { |
540 | /* 1s -> -1 or +1 (depending on sign bit). */ | ||
541 | 22 | level_code[entry] = (sign << 1) | 1; | |
542 | 22 | level_bits[entry] = 2; | |
543 |
2/2✓ Branch 0 taken 11 times.
✓ Branch 1 taken 11 times.
|
22 | level_symbols[entry] = sign ? -1 : 1; |
544 | 22 | ++entry; | |
545 | |||
546 | /* 01sxx -> xx plus 2 (2..5 or -2..-5, depending on sign bit). */ | ||
547 |
2/2✓ Branch 0 taken 88 times.
✓ Branch 1 taken 22 times.
|
110 | for (i = 0; i < 4; ++i) { |
548 | 88 | level_code[entry] = (i << 3) | (sign << 2) | 2; | |
549 | 88 | level_bits[entry] = 5; | |
550 |
2/2✓ Branch 0 taken 44 times.
✓ Branch 1 taken 44 times.
|
88 | level_symbols[entry] = sign ? -(i + 2) : (i + 2); |
551 | 88 | ++entry; | |
552 | } | ||
553 | } | ||
554 | |||
555 | /* | ||
556 | * 00xxxxxxxx -> xxxxxxxx, in two's complement. There are many codes | ||
557 | * here that would better be encoded in other ways (e.g. 0 would be | ||
558 | * encoded by increasing run, and +/- 1 would be encoded with a | ||
559 | * shorter code), but it doesn't hurt to allow everything. | ||
560 | */ | ||
561 |
2/2✓ Branch 0 taken 2816 times.
✓ Branch 1 taken 11 times.
|
2827 | for (i = 0; i < 256; ++i) { |
562 | 2816 | level_code[entry] = i << 2; | |
563 | 2816 | level_bits[entry] = 10; | |
564 | 2816 | level_symbols[entry] = i; | |
565 | 2816 | ++entry; | |
566 | } | ||
567 | |||
568 |
1/2✗ Branch 0 not taken.
✓ Branch 1 taken 11 times.
|
11 | av_assert0(entry == FF_ARRAY_ELEMS(level_code)); |
569 | |||
570 | 11 | VLC_INIT_STATIC_SPARSE_TABLE(dc_alpha_level_vlc_le, ALPHA_VLC_BITS, | |
571 | FF_ARRAY_ELEMS(level_code), | ||
572 | level_bits, 1, 1, | ||
573 | level_code, 2, 2, | ||
574 | level_symbols, 2, 2, VLC_INIT_LE); | ||
575 | 11 | } | |
576 | |||
577 | 11 | static av_cold void speedhq_static_init(void) | |
578 | { | ||
579 | /* Exactly the same as MPEG-2, except for a little-endian reader. */ | ||
580 | 11 | VLC_INIT_STATIC_TABLE(dc_lum_vlc_le, DC_VLC_BITS, 12, | |
581 | ff_mpeg12_vlc_dc_lum_bits, 1, 1, | ||
582 | ff_mpeg12_vlc_dc_lum_code, 2, 2, | ||
583 | VLC_INIT_OUTPUT_LE); | ||
584 | 11 | VLC_INIT_STATIC_TABLE(dc_chroma_vlc_le, DC_VLC_BITS, 12, | |
585 | ff_mpeg12_vlc_dc_chroma_bits, 1, 1, | ||
586 | ff_mpeg12_vlc_dc_chroma_code, 2, 2, | ||
587 | VLC_INIT_OUTPUT_LE); | ||
588 | |||
589 | 11 | ff_init_2d_vlc_rl(ff_speedhq_vlc_table, speedhq_rl_vlc, ff_speedhq_run, | |
590 | ff_speedhq_level, SPEEDHQ_RL_NB_ELEMS, | ||
591 | FF_ARRAY_ELEMS(speedhq_rl_vlc), VLC_INIT_LE); | ||
592 | |||
593 | 11 | compute_alpha_vlcs(); | |
594 | 11 | } | |
595 | |||
596 | 22 | static av_cold int speedhq_decode_init(AVCodecContext *avctx) | |
597 | { | ||
598 | int ret; | ||
599 | static AVOnce init_once = AV_ONCE_INIT; | ||
600 | 22 | SHQContext * const s = avctx->priv_data; | |
601 | |||
602 | 22 | ret = ff_thread_once(&init_once, speedhq_static_init); | |
603 |
1/2✗ Branch 0 not taken.
✓ Branch 1 taken 22 times.
|
22 | if (ret) |
604 | ✗ | return AVERROR_UNKNOWN; | |
605 | |||
606 | 22 | ff_blockdsp_init(&s->bdsp); | |
607 | 22 | ff_idctdsp_init(&s->idsp, avctx); | |
608 | 22 | ff_permute_scantable(s->permutated_intra_scantable, ff_zigzag_direct, | |
609 | 22 | s->idsp.idct_permutation); | |
610 | |||
611 |
4/9✓ Branch 0 taken 6 times.
✗ Branch 1 not taken.
✓ Branch 2 taken 8 times.
✗ Branch 3 not taken.
✓ Branch 4 taken 6 times.
✗ Branch 5 not taken.
✗ Branch 6 not taken.
✗ Branch 7 not taken.
✓ Branch 8 taken 2 times.
|
22 | switch (avctx->codec_tag) { |
612 | 6 | case MKTAG('S', 'H', 'Q', '0'): | |
613 | 6 | s->subsampling = SHQ_SUBSAMPLING_420; | |
614 | 6 | s->alpha_type = SHQ_NO_ALPHA; | |
615 | 6 | avctx->pix_fmt = AV_PIX_FMT_YUV420P; | |
616 | 6 | break; | |
617 | ✗ | case MKTAG('S', 'H', 'Q', '1'): | |
618 | ✗ | s->subsampling = SHQ_SUBSAMPLING_420; | |
619 | ✗ | s->alpha_type = SHQ_RLE_ALPHA; | |
620 | ✗ | avctx->pix_fmt = AV_PIX_FMT_YUVA420P; | |
621 | ✗ | break; | |
622 | 8 | case MKTAG('S', 'H', 'Q', '2'): | |
623 | 8 | s->subsampling = SHQ_SUBSAMPLING_422; | |
624 | 8 | s->alpha_type = SHQ_NO_ALPHA; | |
625 | 8 | avctx->pix_fmt = AV_PIX_FMT_YUV422P; | |
626 | 8 | break; | |
627 | ✗ | case MKTAG('S', 'H', 'Q', '3'): | |
628 | ✗ | s->subsampling = SHQ_SUBSAMPLING_422; | |
629 | ✗ | s->alpha_type = SHQ_RLE_ALPHA; | |
630 | ✗ | avctx->pix_fmt = AV_PIX_FMT_YUVA422P; | |
631 | ✗ | break; | |
632 | 6 | case MKTAG('S', 'H', 'Q', '4'): | |
633 | 6 | s->subsampling = SHQ_SUBSAMPLING_444; | |
634 | 6 | s->alpha_type = SHQ_NO_ALPHA; | |
635 | 6 | avctx->pix_fmt = AV_PIX_FMT_YUV444P; | |
636 | 6 | break; | |
637 | ✗ | case MKTAG('S', 'H', 'Q', '5'): | |
638 | ✗ | s->subsampling = SHQ_SUBSAMPLING_444; | |
639 | ✗ | s->alpha_type = SHQ_RLE_ALPHA; | |
640 | ✗ | avctx->pix_fmt = AV_PIX_FMT_YUVA444P; | |
641 | ✗ | break; | |
642 | ✗ | case MKTAG('S', 'H', 'Q', '7'): | |
643 | ✗ | s->subsampling = SHQ_SUBSAMPLING_422; | |
644 | ✗ | s->alpha_type = SHQ_DCT_ALPHA; | |
645 | ✗ | avctx->pix_fmt = AV_PIX_FMT_YUVA422P; | |
646 | ✗ | break; | |
647 | ✗ | case MKTAG('S', 'H', 'Q', '9'): | |
648 | ✗ | s->subsampling = SHQ_SUBSAMPLING_444; | |
649 | ✗ | s->alpha_type = SHQ_DCT_ALPHA; | |
650 | ✗ | avctx->pix_fmt = AV_PIX_FMT_YUVA444P; | |
651 | ✗ | break; | |
652 | 2 | default: | |
653 | 2 | av_log(avctx, AV_LOG_ERROR, "Unknown NewTek SpeedHQ FOURCC provided (%08X)\n", | |
654 | avctx->codec_tag); | ||
655 | 2 | return AVERROR_INVALIDDATA; | |
656 | } | ||
657 | |||
658 | /* This matches what NDI's RGB -> Y'CbCr 4:2:2 converter uses. */ | ||
659 | 20 | avctx->colorspace = AVCOL_SPC_BT470BG; | |
660 | 20 | avctx->chroma_sample_location = AVCHROMA_LOC_CENTER; | |
661 | |||
662 | 20 | return 0; | |
663 | } | ||
664 | |||
665 | const FFCodec ff_speedhq_decoder = { | ||
666 | .p.name = "speedhq", | ||
667 | CODEC_LONG_NAME("NewTek SpeedHQ"), | ||
668 | .p.type = AVMEDIA_TYPE_VIDEO, | ||
669 | .p.id = AV_CODEC_ID_SPEEDHQ, | ||
670 | .priv_data_size = sizeof(SHQContext), | ||
671 | .init = speedhq_decode_init, | ||
672 | FF_CODEC_DECODE_CB(speedhq_decode_frame), | ||
673 | .p.capabilities = AV_CODEC_CAP_DR1 | AV_CODEC_CAP_FRAME_THREADS | AV_CODEC_CAP_SLICE_THREADS, | ||
674 | }; | ||
675 |