| Line | Branch | Exec | Source |
|---|---|---|---|
| 1 | /* | ||
| 2 | * NewTek SpeedHQ codec | ||
| 3 | * Copyright 2017 Steinar H. Gunderson | ||
| 4 | * | ||
| 5 | * This file is part of FFmpeg. | ||
| 6 | * | ||
| 7 | * FFmpeg is free software; you can redistribute it and/or | ||
| 8 | * modify it under the terms of the GNU Lesser General Public | ||
| 9 | * License as published by the Free Software Foundation; either | ||
| 10 | * version 2.1 of the License, or (at your option) any later version. | ||
| 11 | * | ||
| 12 | * FFmpeg is distributed in the hope that it will be useful, | ||
| 13 | * but WITHOUT ANY WARRANTY; without even the implied warranty of | ||
| 14 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU | ||
| 15 | * Lesser General Public License for more details. | ||
| 16 | * | ||
| 17 | * You should have received a copy of the GNU Lesser General Public | ||
| 18 | * License along with FFmpeg; if not, write to the Free Software | ||
| 19 | * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA | ||
| 20 | */ | ||
| 21 | |||
| 22 | /** | ||
| 23 | * @file | ||
| 24 | * NewTek SpeedHQ decoder. | ||
| 25 | */ | ||
| 26 | |||
| 27 | #define BITSTREAM_READER_LE | ||
| 28 | |||
| 29 | #include "libavutil/attributes.h" | ||
| 30 | #include "libavutil/mem_internal.h" | ||
| 31 | |||
| 32 | #include "avcodec.h" | ||
| 33 | #include "blockdsp.h" | ||
| 34 | #include "codec_internal.h" | ||
| 35 | #include "decode.h" | ||
| 36 | #include "get_bits.h" | ||
| 37 | #include "idctdsp.h" | ||
| 38 | #include "libavutil/thread.h" | ||
| 39 | #include "mathops.h" | ||
| 40 | #include "mpeg12data.h" | ||
| 41 | #include "mpeg12vlc.h" | ||
| 42 | #include "speedhq.h" | ||
| 43 | #include "thread.h" | ||
| 44 | |||
| 45 | #define MAX_INDEX (64 - 1) | ||
| 46 | |||
| 47 | /* | ||
| 48 | * 5 bits makes for very small tables, with no more than two lookups needed | ||
| 49 | * for the longest (10-bit) codes. | ||
| 50 | */ | ||
| 51 | #define ALPHA_VLC_BITS 5 | ||
| 52 | |||
/** Private state of one SpeedHQ decoder instance. */
typedef struct SHQContext {
    BlockDSPContext bdsp;   /* supplies clear_block() for the coefficient buffer */
    IDCTDSPContext idsp;    /* supplies idct_put() and the IDCT permutation */
    uint8_t permutated_intra_scantable[64]; /* zigzag scan permuted for the selected IDCT */
    int quant_matrix[64];   /* rebuilt for every packet from its quality byte */
    enum { SHQ_SUBSAMPLING_420, SHQ_SUBSAMPLING_422, SHQ_SUBSAMPLING_444 }
        subsampling;        /* chroma layout, selected from the FOURCC at init */
    enum { SHQ_NO_ALPHA, SHQ_RLE_ALPHA, SHQ_DCT_ALPHA } alpha_type; /* alpha coding, selected from the FOURCC at init */
    AVPacket *avpkt;        /* packet being decoded; read by the slice jobs */
    uint32_t second_field_offset; /* 24-bit little-endian value read from packet bytes 1..3 */
} SHQContext;
| 64 | |||
/*
 * Base quantization matrix. compute_quant_matrix() reads it through
 * ff_zigzag_direct and multiplies every entry by the frame's qscale.
 *
 * NOTE: The first element is always 16, unscaled.
 */
static const uint8_t unscaled_quant_matrix[64] = {
    16, 16, 19, 22, 26, 27, 29, 34,
    16, 16, 22, 24, 27, 29, 34, 37,
    19, 22, 26, 27, 29, 34, 34, 38,
    22, 22, 26, 27, 29, 34, 37, 40,
    22, 26, 27, 29, 32, 35, 40, 48,
    26, 27, 29, 32, 35, 40, 48, 58,
    26, 27, 29, 34, 38, 46, 56, 69,
    27, 29, 35, 38, 46, 56, 69, 83
};
| 76 | |||
/* Little-endian DC size tables, filled by speedhq_static_init(). */
static VLCElem dc_lum_vlc_le[512];
static VLCElem dc_chroma_vlc_le[514];
/* Alpha run/level tables, filled by compute_alpha_vlcs(). */
static VLCElem dc_alpha_run_vlc_le[160];
static VLCElem dc_alpha_level_vlc_le[288];

/* Combined run/level table for AC coefficients, filled by speedhq_static_init(). */
static RL_VLC_ELEM speedhq_rl_vlc[674];
| 83 | |||
| 84 | 1544736 | static inline int decode_dc_le(GetBitContext *gb, int component) | |
| 85 | { | ||
| 86 | int code, diff; | ||
| 87 | |||
| 88 |
3/4✓ Branch 0 taken 831768 times.
✓ Branch 1 taken 712968 times.
✗ Branch 2 not taken.
✓ Branch 3 taken 831768 times.
|
1544736 | if (component == 0 || component == 3) { |
| 89 | 712968 | code = get_vlc2(gb, dc_lum_vlc_le, DC_VLC_BITS, 2); | |
| 90 | } else { | ||
| 91 | 831768 | code = get_vlc2(gb, dc_chroma_vlc_le, DC_VLC_BITS, 2); | |
| 92 | } | ||
| 93 |
2/2✓ Branch 0 taken 9976 times.
✓ Branch 1 taken 1534760 times.
|
1544736 | if (!code) { |
| 94 | 9976 | diff = 0; | |
| 95 | } else { | ||
| 96 | 1534760 | diff = get_xbits_le(gb, code); | |
| 97 | } | ||
| 98 | 1544736 | return diff; | |
| 99 | } | ||
| 100 | |||
| 101 | ✗ | static inline int decode_alpha_block(const SHQContext *s, GetBitContext *gb, uint8_t last_alpha[16], uint8_t *dest, int linesize) | |
| 102 | { | ||
| 103 | uint8_t block[128]; | ||
| 104 | ✗ | int i = 0, x, y; | |
| 105 | |||
| 106 | ✗ | memset(block, 0, sizeof(block)); | |
| 107 | |||
| 108 | { | ||
| 109 | ✗ | OPEN_READER(re, gb); | |
| 110 | |||
| 111 | ✗ | for ( ;; ) { | |
| 112 | int run, level; | ||
| 113 | |||
| 114 | ✗ | UPDATE_CACHE_LE(re, gb); | |
| 115 | ✗ | GET_VLC(run, re, gb, dc_alpha_run_vlc_le, ALPHA_VLC_BITS, 2); | |
| 116 | |||
| 117 | ✗ | if (run < 0) break; | |
| 118 | ✗ | i += run; | |
| 119 | ✗ | if (i >= 128) | |
| 120 | ✗ | return AVERROR_INVALIDDATA; | |
| 121 | |||
| 122 | ✗ | UPDATE_CACHE_LE(re, gb); | |
| 123 | ✗ | GET_VLC(level, re, gb, dc_alpha_level_vlc_le, ALPHA_VLC_BITS, 2); | |
| 124 | ✗ | block[i++] = level; | |
| 125 | } | ||
| 126 | |||
| 127 | ✗ | CLOSE_READER(re, gb); | |
| 128 | } | ||
| 129 | |||
| 130 | ✗ | for (y = 0; y < 8; y++) { | |
| 131 | ✗ | for (x = 0; x < 16; x++) { | |
| 132 | ✗ | last_alpha[x] -= block[y * 16 + x]; | |
| 133 | } | ||
| 134 | ✗ | memcpy(dest, last_alpha, 16); | |
| 135 | ✗ | dest += linesize; | |
| 136 | } | ||
| 137 | |||
| 138 | ✗ | return 0; | |
| 139 | } | ||
| 140 | |||
| 141 | 1544736 | static inline int decode_dct_block(const SHQContext *s, GetBitContext *gb, int last_dc[4], int component, uint8_t *dest, int linesize) | |
| 142 | { | ||
| 143 | 1544736 | const int *quant_matrix = s->quant_matrix; | |
| 144 | 1544736 | const uint8_t *scantable = s->permutated_intra_scantable; | |
| 145 | 1544736 | LOCAL_ALIGNED_32(int16_t, block, [64]); | |
| 146 | int dc_offset; | ||
| 147 | |||
| 148 | 1544736 | s->bdsp.clear_block(block); | |
| 149 | |||
| 150 | 1544736 | dc_offset = decode_dc_le(gb, component); | |
| 151 | 1544736 | last_dc[component] -= dc_offset; /* Note: Opposite of most codecs. */ | |
| 152 | 1544736 | block[scantable[0]] = last_dc[component]; /* quant_matrix[0] is always 16. */ | |
| 153 | |||
| 154 | /* Read AC coefficients. */ | ||
| 155 | { | ||
| 156 | 1544736 | int i = 0; | |
| 157 | 1544736 | OPEN_READER(re, gb); | |
| 158 | 5781637 | for ( ;; ) { | |
| 159 | int level, run; | ||
| 160 | 7326373 | UPDATE_CACHE_LE(re, gb); | |
| 161 |
2/2✓ Branch 0 taken 152486 times.
✓ Branch 1 taken 7173887 times.
|
7326373 | GET_RL_VLC(level, run, re, gb, speedhq_rl_vlc, |
| 162 | TEX_VLC_BITS, 2, 0); | ||
| 163 |
2/2✓ Branch 0 taken 1544736 times.
✓ Branch 1 taken 5781637 times.
|
7326373 | if (level == 127) { |
| 164 | 1544736 | break; | |
| 165 |
2/2✓ Branch 0 taken 5755452 times.
✓ Branch 1 taken 26185 times.
|
5781637 | } else if (level) { |
| 166 | 5755452 | i += run; | |
| 167 |
1/2✗ Branch 0 not taken.
✓ Branch 1 taken 5755452 times.
|
5755452 | if (i > MAX_INDEX) |
| 168 | ✗ | return AVERROR_INVALIDDATA; | |
| 169 | /* If next bit is 1, level = -level */ | ||
| 170 | 5755452 | level = (level ^ SHOW_SBITS(re, gb, 1)) - | |
| 171 | 5755452 | SHOW_SBITS(re, gb, 1); | |
| 172 | 5755452 | LAST_SKIP_BITS(re, gb, 1); | |
| 173 | } else { | ||
| 174 | /* Escape. */ | ||
| 175 | #if MIN_CACHE_BITS < 6 + 6 + 12 | ||
| 176 | #error MIN_CACHE_BITS is too small for the escape code, add UPDATE_CACHE | ||
| 177 | #endif | ||
| 178 | 26185 | run = SHOW_UBITS(re, gb, 6) + 1; | |
| 179 | 26185 | SKIP_BITS(re, gb, 6); | |
| 180 | 26185 | level = SHOW_UBITS(re, gb, 12) - 2048; | |
| 181 | 26185 | LAST_SKIP_BITS(re, gb, 12); | |
| 182 | |||
| 183 | 26185 | i += run; | |
| 184 |
1/2✗ Branch 0 not taken.
✓ Branch 1 taken 26185 times.
|
26185 | if (i > MAX_INDEX) |
| 185 | ✗ | return AVERROR_INVALIDDATA; | |
| 186 | } | ||
| 187 | |||
| 188 | 5781637 | block[scantable[i]] = (level * quant_matrix[i]) >> 4; | |
| 189 | } | ||
| 190 | 1544736 | CLOSE_READER(re, gb); | |
| 191 | } | ||
| 192 | |||
| 193 | 1544736 | s->idsp.idct_put(dest, linesize, block); | |
| 194 | |||
| 195 | 1544736 | return 0; | |
| 196 | } | ||
| 197 | |||
| 198 | ✗ | static int decode_speedhq_border(const SHQContext *s, GetBitContext *gb, AVFrame *frame, int field_number, int line_stride) | |
| 199 | { | ||
| 200 | ✗ | int linesize_y = frame->linesize[0] * line_stride; | |
| 201 | ✗ | int linesize_cb = frame->linesize[1] * line_stride; | |
| 202 | ✗ | int linesize_cr = frame->linesize[2] * line_stride; | |
| 203 | int linesize_a; | ||
| 204 | int ret; | ||
| 205 | |||
| 206 | ✗ | if (s->alpha_type != SHQ_NO_ALPHA) | |
| 207 | ✗ | linesize_a = frame->linesize[3] * line_stride; | |
| 208 | |||
| 209 | ✗ | for (int y = 0; y < frame->height; y += 16 * line_stride) { | |
| 210 | ✗ | int last_dc[4] = { 1024, 1024, 1024, 1024 }; | |
| 211 | uint8_t *dest_y, *dest_cb, *dest_cr, *dest_a; | ||
| 212 | uint8_t last_alpha[16]; | ||
| 213 | ✗ | int x = frame->width - 8; | |
| 214 | |||
| 215 | ✗ | dest_y = frame->data[0] + frame->linesize[0] * (y + field_number) + x; | |
| 216 | ✗ | if (s->subsampling == SHQ_SUBSAMPLING_420) { | |
| 217 | ✗ | dest_cb = frame->data[1] + frame->linesize[1] * (y/2 + field_number) + x / 2; | |
| 218 | ✗ | dest_cr = frame->data[2] + frame->linesize[2] * (y/2 + field_number) + x / 2; | |
| 219 | } else { | ||
| 220 | av_assert2(s->subsampling == SHQ_SUBSAMPLING_422); | ||
| 221 | ✗ | dest_cb = frame->data[1] + frame->linesize[1] * (y + field_number) + x / 2; | |
| 222 | ✗ | dest_cr = frame->data[2] + frame->linesize[2] * (y + field_number) + x / 2; | |
| 223 | } | ||
| 224 | ✗ | if (s->alpha_type != SHQ_NO_ALPHA) { | |
| 225 | ✗ | memset(last_alpha, 255, sizeof(last_alpha)); | |
| 226 | ✗ | dest_a = frame->data[3] + frame->linesize[3] * (y + field_number) + x; | |
| 227 | } | ||
| 228 | |||
| 229 | ✗ | if ((ret = decode_dct_block(s, gb, last_dc, 0, dest_y, linesize_y)) < 0) | |
| 230 | ✗ | return ret; | |
| 231 | ✗ | if ((ret = decode_dct_block(s, gb, last_dc, 0, dest_y + 8, linesize_y)) < 0) | |
| 232 | ✗ | return ret; | |
| 233 | ✗ | if ((ret = decode_dct_block(s, gb, last_dc, 0, dest_y + 8 * linesize_y, linesize_y)) < 0) | |
| 234 | ✗ | return ret; | |
| 235 | ✗ | if ((ret = decode_dct_block(s, gb, last_dc, 0, dest_y + 8 * linesize_y + 8, linesize_y)) < 0) | |
| 236 | ✗ | return ret; | |
| 237 | ✗ | if ((ret = decode_dct_block(s, gb, last_dc, 1, dest_cb, linesize_cb)) < 0) | |
| 238 | ✗ | return ret; | |
| 239 | ✗ | if ((ret = decode_dct_block(s, gb, last_dc, 2, dest_cr, linesize_cr)) < 0) | |
| 240 | ✗ | return ret; | |
| 241 | |||
| 242 | ✗ | if (s->subsampling != SHQ_SUBSAMPLING_420) { | |
| 243 | ✗ | if ((ret = decode_dct_block(s, gb, last_dc, 1, dest_cb + 8 * linesize_cb, linesize_cb)) < 0) | |
| 244 | ✗ | return ret; | |
| 245 | ✗ | if ((ret = decode_dct_block(s, gb, last_dc, 2, dest_cr + 8 * linesize_cr, linesize_cr)) < 0) | |
| 246 | ✗ | return ret; | |
| 247 | } | ||
| 248 | |||
| 249 | ✗ | if (s->alpha_type == SHQ_RLE_ALPHA) { | |
| 250 | /* Alpha coded using 16x8 RLE blocks. */ | ||
| 251 | ✗ | if ((ret = decode_alpha_block(s, gb, last_alpha, dest_a, linesize_a)) < 0) | |
| 252 | ✗ | return ret; | |
| 253 | ✗ | if ((ret = decode_alpha_block(s, gb, last_alpha, dest_a + 8 * linesize_a, linesize_a)) < 0) | |
| 254 | ✗ | return ret; | |
| 255 | ✗ | } else if (s->alpha_type == SHQ_DCT_ALPHA) { | |
| 256 | /* Alpha encoded exactly like luma. */ | ||
| 257 | ✗ | if ((ret = decode_dct_block(s, gb, last_dc, 3, dest_a, linesize_a)) < 0) | |
| 258 | ✗ | return ret; | |
| 259 | ✗ | if ((ret = decode_dct_block(s, gb, last_dc, 3, dest_a + 8, linesize_a)) < 0) | |
| 260 | ✗ | return ret; | |
| 261 | ✗ | if ((ret = decode_dct_block(s, gb, last_dc, 3, dest_a + 8 * linesize_a, linesize_a)) < 0) | |
| 262 | ✗ | return ret; | |
| 263 | ✗ | if ((ret = decode_dct_block(s, gb, last_dc, 3, dest_a + 8 * linesize_a + 8, linesize_a)) < 0) | |
| 264 | ✗ | return ret; | |
| 265 | } | ||
| 266 | } | ||
| 267 | |||
| 268 | ✗ | return 0; | |
| 269 | } | ||
| 270 | |||
| 271 | 1812 | static int decode_speedhq_field(const SHQContext *s, const uint8_t *buf, int buf_size, AVFrame *frame, int field_number, int start, int end, int line_stride, int slice_number) | |
| 272 | { | ||
| 273 | int ret, x, y, slice_offsets[5]; | ||
| 274 | uint32_t slice_begin, slice_end; | ||
| 275 | 1812 | int linesize_y = frame->linesize[0] * line_stride; | |
| 276 | 1812 | int linesize_cb = frame->linesize[1] * line_stride; | |
| 277 | 1812 | int linesize_cr = frame->linesize[2] * line_stride; | |
| 278 | int linesize_a; | ||
| 279 | GetBitContext gb; | ||
| 280 | |||
| 281 |
1/2✗ Branch 0 not taken.
✓ Branch 1 taken 1812 times.
|
1812 | if (s->alpha_type != SHQ_NO_ALPHA) |
| 282 | ✗ | linesize_a = frame->linesize[3] * line_stride; | |
| 283 | |||
| 284 |
3/6✓ Branch 0 taken 1812 times.
✗ Branch 1 not taken.
✓ Branch 2 taken 1812 times.
✗ Branch 3 not taken.
✗ Branch 4 not taken.
✓ Branch 5 taken 1812 times.
|
1812 | if (end < start || end - start < 3 || end > buf_size) |
| 285 | ✗ | return AVERROR_INVALIDDATA; | |
| 286 | |||
| 287 | 1812 | slice_offsets[0] = start; | |
| 288 | 1812 | slice_offsets[4] = end; | |
| 289 |
2/2✓ Branch 0 taken 5436 times.
✓ Branch 1 taken 1812 times.
|
7248 | for (x = 1; x < 4; x++) { |
| 290 | uint32_t last_offset, slice_len; | ||
| 291 | |||
| 292 | 5436 | last_offset = slice_offsets[x - 1]; | |
| 293 | 5436 | slice_len = AV_RL24(buf + last_offset); | |
| 294 | 5436 | slice_offsets[x] = last_offset + slice_len; | |
| 295 | |||
| 296 |
2/4✓ Branch 0 taken 5436 times.
✗ Branch 1 not taken.
✗ Branch 2 not taken.
✓ Branch 3 taken 5436 times.
|
5436 | if (slice_len < 3 || slice_offsets[x] > end - 3) |
| 297 | ✗ | return AVERROR_INVALIDDATA; | |
| 298 | } | ||
| 299 | |||
| 300 | 1812 | slice_begin = slice_offsets[slice_number]; | |
| 301 | 1812 | slice_end = slice_offsets[slice_number + 1]; | |
| 302 | |||
| 303 |
1/2✗ Branch 1 not taken.
✓ Branch 2 taken 1812 times.
|
1812 | if ((ret = init_get_bits8(&gb, buf + slice_begin + 3, slice_end - slice_begin - 3)) < 0) |
| 304 | ✗ | return ret; | |
| 305 | |||
| 306 |
2/2✓ Branch 0 taken 8106 times.
✓ Branch 1 taken 1812 times.
|
9918 | for (y = slice_number * 16 * line_stride; y < frame->height; y += line_stride * 64) { |
| 307 | uint8_t *dest_y, *dest_cb, *dest_cr, *dest_a; | ||
| 308 | 8106 | int last_dc[4] = { 1024, 1024, 1024, 1024 }; | |
| 309 | uint8_t last_alpha[16]; | ||
| 310 | |||
| 311 | 8106 | memset(last_alpha, 255, sizeof(last_alpha)); | |
| 312 | |||
| 313 | 8106 | dest_y = frame->data[0] + frame->linesize[0] * (y + field_number); | |
| 314 |
2/2✓ Branch 0 taken 2700 times.
✓ Branch 1 taken 5406 times.
|
8106 | if (s->subsampling == SHQ_SUBSAMPLING_420) { |
| 315 | 2700 | dest_cb = frame->data[1] + frame->linesize[1] * (y/2 + field_number); | |
| 316 | 2700 | dest_cr = frame->data[2] + frame->linesize[2] * (y/2 + field_number); | |
| 317 | } else { | ||
| 318 | 5406 | dest_cb = frame->data[1] + frame->linesize[1] * (y + field_number); | |
| 319 | 5406 | dest_cr = frame->data[2] + frame->linesize[2] * (y + field_number); | |
| 320 | } | ||
| 321 |
1/2✗ Branch 0 not taken.
✓ Branch 1 taken 8106 times.
|
8106 | if (s->alpha_type != SHQ_NO_ALPHA) { |
| 322 | ✗ | dest_a = frame->data[3] + frame->linesize[3] * (y + field_number); | |
| 323 | } | ||
| 324 | |||
| 325 |
4/4✓ Branch 0 taken 124248 times.
✓ Branch 1 taken 62100 times.
✓ Branch 2 taken 178242 times.
✓ Branch 3 taken 8106 times.
|
186348 | for (x = 0; x < frame->width - 8 * (s->subsampling != SHQ_SUBSAMPLING_444); x += 16) { |
| 326 | /* Decode the four luma blocks. */ | ||
| 327 |
1/2✗ Branch 1 not taken.
✓ Branch 2 taken 178242 times.
|
178242 | if ((ret = decode_dct_block(s, &gb, last_dc, 0, dest_y, linesize_y)) < 0) |
| 328 | ✗ | return ret; | |
| 329 |
1/2✗ Branch 1 not taken.
✓ Branch 2 taken 178242 times.
|
178242 | if ((ret = decode_dct_block(s, &gb, last_dc, 0, dest_y + 8, linesize_y)) < 0) |
| 330 | ✗ | return ret; | |
| 331 |
1/2✗ Branch 1 not taken.
✓ Branch 2 taken 178242 times.
|
178242 | if ((ret = decode_dct_block(s, &gb, last_dc, 0, dest_y + 8 * linesize_y, linesize_y)) < 0) |
| 332 | ✗ | return ret; | |
| 333 |
1/2✗ Branch 1 not taken.
✓ Branch 2 taken 178242 times.
|
178242 | if ((ret = decode_dct_block(s, &gb, last_dc, 0, dest_y + 8 * linesize_y + 8, linesize_y)) < 0) |
| 334 | ✗ | return ret; | |
| 335 | |||
| 336 | /* | ||
| 337 | * Decode the first chroma block. For 4:2:0, this is the only one; | ||
| 338 | * for 4:2:2, it's the top block; for 4:4:4, it's the top-left block. | ||
| 339 | */ | ||
| 340 |
1/2✗ Branch 1 not taken.
✓ Branch 2 taken 178242 times.
|
178242 | if ((ret = decode_dct_block(s, &gb, last_dc, 1, dest_cb, linesize_cb)) < 0) |
| 341 | ✗ | return ret; | |
| 342 |
1/2✗ Branch 1 not taken.
✓ Branch 2 taken 178242 times.
|
178242 | if ((ret = decode_dct_block(s, &gb, last_dc, 2, dest_cr, linesize_cr)) < 0) |
| 343 | ✗ | return ret; | |
| 344 | |||
| 345 |
2/2✓ Branch 0 taken 118842 times.
✓ Branch 1 taken 59400 times.
|
178242 | if (s->subsampling != SHQ_SUBSAMPLING_420) { |
| 346 | /* For 4:2:2, this is the bottom block; for 4:4:4, it's the bottom-left block. */ | ||
| 347 |
1/2✗ Branch 1 not taken.
✓ Branch 2 taken 118842 times.
|
118842 | if ((ret = decode_dct_block(s, &gb, last_dc, 1, dest_cb + 8 * linesize_cb, linesize_cb)) < 0) |
| 348 | ✗ | return ret; | |
| 349 |
1/2✗ Branch 1 not taken.
✓ Branch 2 taken 118842 times.
|
118842 | if ((ret = decode_dct_block(s, &gb, last_dc, 2, dest_cr + 8 * linesize_cr, linesize_cr)) < 0) |
| 350 | ✗ | return ret; | |
| 351 | |||
| 352 |
2/2✓ Branch 0 taken 59400 times.
✓ Branch 1 taken 59442 times.
|
118842 | if (s->subsampling == SHQ_SUBSAMPLING_444) { |
| 353 | /* Top-right and bottom-right blocks. */ | ||
| 354 |
1/2✗ Branch 1 not taken.
✓ Branch 2 taken 59400 times.
|
59400 | if ((ret = decode_dct_block(s, &gb, last_dc, 1, dest_cb + 8, linesize_cb)) < 0) |
| 355 | ✗ | return ret; | |
| 356 |
1/2✗ Branch 1 not taken.
✓ Branch 2 taken 59400 times.
|
59400 | if ((ret = decode_dct_block(s, &gb, last_dc, 2, dest_cr + 8, linesize_cr)) < 0) |
| 357 | ✗ | return ret; | |
| 358 |
1/2✗ Branch 1 not taken.
✓ Branch 2 taken 59400 times.
|
59400 | if ((ret = decode_dct_block(s, &gb, last_dc, 1, dest_cb + 8 * linesize_cb + 8, linesize_cb)) < 0) |
| 359 | ✗ | return ret; | |
| 360 |
1/2✗ Branch 1 not taken.
✓ Branch 2 taken 59400 times.
|
59400 | if ((ret = decode_dct_block(s, &gb, last_dc, 2, dest_cr + 8 * linesize_cr + 8, linesize_cr)) < 0) |
| 361 | ✗ | return ret; | |
| 362 | |||
| 363 | 59400 | dest_cb += 8; | |
| 364 | 59400 | dest_cr += 8; | |
| 365 | } | ||
| 366 | } | ||
| 367 | 178242 | dest_y += 16; | |
| 368 | 178242 | dest_cb += 8; | |
| 369 | 178242 | dest_cr += 8; | |
| 370 | |||
| 371 |
1/2✗ Branch 0 not taken.
✓ Branch 1 taken 178242 times.
|
178242 | if (s->alpha_type == SHQ_RLE_ALPHA) { |
| 372 | /* Alpha coded using 16x8 RLE blocks. */ | ||
| 373 | ✗ | if ((ret = decode_alpha_block(s, &gb, last_alpha, dest_a, linesize_a)) < 0) | |
| 374 | ✗ | return ret; | |
| 375 | ✗ | if ((ret = decode_alpha_block(s, &gb, last_alpha, dest_a + 8 * linesize_a, linesize_a)) < 0) | |
| 376 | ✗ | return ret; | |
| 377 | ✗ | dest_a += 16; | |
| 378 |
1/2✗ Branch 0 not taken.
✓ Branch 1 taken 178242 times.
|
178242 | } else if (s->alpha_type == SHQ_DCT_ALPHA) { |
| 379 | /* Alpha encoded exactly like luma. */ | ||
| 380 | ✗ | if ((ret = decode_dct_block(s, &gb, last_dc, 3, dest_a, linesize_a)) < 0) | |
| 381 | ✗ | return ret; | |
| 382 | ✗ | if ((ret = decode_dct_block(s, &gb, last_dc, 3, dest_a + 8, linesize_a)) < 0) | |
| 383 | ✗ | return ret; | |
| 384 | ✗ | if ((ret = decode_dct_block(s, &gb, last_dc, 3, dest_a + 8 * linesize_a, linesize_a)) < 0) | |
| 385 | ✗ | return ret; | |
| 386 | ✗ | if ((ret = decode_dct_block(s, &gb, last_dc, 3, dest_a + 8 * linesize_a + 8, linesize_a)) < 0) | |
| 387 | ✗ | return ret; | |
| 388 | ✗ | dest_a += 16; | |
| 389 | } | ||
| 390 | } | ||
| 391 | } | ||
| 392 | |||
| 393 |
3/6✓ Branch 0 taken 1212 times.
✓ Branch 1 taken 600 times.
✗ Branch 2 not taken.
✓ Branch 3 taken 1212 times.
✗ Branch 4 not taken.
✗ Branch 5 not taken.
|
1812 | if (s->subsampling != SHQ_SUBSAMPLING_444 && (frame->width & 15) && slice_number == 3) |
| 394 | ✗ | return decode_speedhq_border(s, &gb, frame, field_number, line_stride); | |
| 395 | |||
| 396 | 1812 | return 0; | |
| 397 | } | ||
| 398 | |||
| 399 | 1804 | static int decode_slice_progressive(AVCodecContext *avctx, void *arg, int jobnr, int threadnr) | |
| 400 | { | ||
| 401 | 1804 | SHQContext *s = avctx->priv_data; | |
| 402 | (void)threadnr; | ||
| 403 | |||
| 404 | 1804 | return decode_speedhq_field(avctx->priv_data, s->avpkt->data, s->avpkt->size, arg, 0, 4, s->avpkt->size, 1, jobnr); | |
| 405 | } | ||
| 406 | |||
| 407 | 8 | static int decode_slice_interlaced(AVCodecContext *avctx, void *arg, int jobnr, int threadnr) | |
| 408 | { | ||
| 409 | 8 | SHQContext *s = avctx->priv_data; | |
| 410 | 8 | int field_number = jobnr / 4; | |
| 411 | 8 | int slice_number = jobnr % 4; | |
| 412 | (void)threadnr; | ||
| 413 | |||
| 414 |
2/2✓ Branch 0 taken 4 times.
✓ Branch 1 taken 4 times.
|
8 | if (field_number == 0) |
| 415 | 4 | return decode_speedhq_field(avctx->priv_data, s->avpkt->data, s->avpkt->size, arg, 0, 4, s->second_field_offset, 2, slice_number); | |
| 416 | else | ||
| 417 | 4 | return decode_speedhq_field(avctx->priv_data, s->avpkt->data, s->avpkt->size, arg, 1, s->second_field_offset, s->avpkt->size, 2, slice_number); | |
| 418 | } | ||
| 419 | |||
| 420 | 452 | static void compute_quant_matrix(int *output, int qscale) | |
| 421 | { | ||
| 422 | int i; | ||
| 423 |
2/2✓ Branch 0 taken 28928 times.
✓ Branch 1 taken 452 times.
|
29380 | for (i = 0; i < 64; i++) output[i] = unscaled_quant_matrix[ff_zigzag_direct[i]] * qscale; |
| 424 | 452 | } | |
| 425 | |||
| 426 | 452 | static int speedhq_decode_frame(AVCodecContext *avctx, AVFrame *frame, | |
| 427 | int *got_frame, AVPacket *avpkt) | ||
| 428 | { | ||
| 429 | 452 | SHQContext * const s = avctx->priv_data; | |
| 430 | 452 | const uint8_t *buf = avpkt->data; | |
| 431 | 452 | int buf_size = avpkt->size; | |
| 432 | uint8_t quality; | ||
| 433 | int ret; | ||
| 434 | |||
| 435 |
3/6✓ Branch 0 taken 452 times.
✗ Branch 1 not taken.
✓ Branch 2 taken 452 times.
✗ Branch 3 not taken.
✗ Branch 4 not taken.
✓ Branch 5 taken 452 times.
|
452 | if (buf_size < 4 || avctx->width < 8 || avctx->width % 8 != 0) |
| 436 | ✗ | return AVERROR_INVALIDDATA; | |
| 437 |
1/2✗ Branch 0 not taken.
✓ Branch 1 taken 452 times.
|
452 | if (buf_size < avctx->width*avctx->height / 64 / 4) |
| 438 | ✗ | return AVERROR_INVALIDDATA; | |
| 439 | |||
| 440 | 452 | quality = buf[0]; | |
| 441 |
1/2✗ Branch 0 not taken.
✓ Branch 1 taken 452 times.
|
452 | if (quality >= 100) { |
| 442 | ✗ | return AVERROR_INVALIDDATA; | |
| 443 | } | ||
| 444 | |||
| 445 |
1/2✗ Branch 0 not taken.
✓ Branch 1 taken 452 times.
|
452 | if (avctx->skip_frame >= AVDISCARD_ALL) |
| 446 | ✗ | return avpkt->size; | |
| 447 | |||
| 448 | 452 | compute_quant_matrix(s->quant_matrix, 100 - quality); | |
| 449 | |||
| 450 | 452 | s->second_field_offset = AV_RL24(buf + 1); | |
| 451 |
1/2✗ Branch 0 not taken.
✓ Branch 1 taken 452 times.
|
452 | if (s->second_field_offset >= buf_size - 3) { |
| 452 | ✗ | return AVERROR_INVALIDDATA; | |
| 453 | } | ||
| 454 | |||
| 455 | 452 | avctx->coded_width = FFALIGN(avctx->width, 16); | |
| 456 | 452 | avctx->coded_height = FFALIGN(avctx->height, 16); | |
| 457 | |||
| 458 |
1/2✗ Branch 1 not taken.
✓ Branch 2 taken 452 times.
|
452 | if ((ret = ff_thread_get_buffer(avctx, frame, 0)) < 0) { |
| 459 | ✗ | return ret; | |
| 460 | } | ||
| 461 | |||
| 462 | 452 | s->avpkt = avpkt; | |
| 463 | |||
| 464 |
3/4✓ Branch 0 taken 1 times.
✓ Branch 1 taken 451 times.
✗ Branch 2 not taken.
✓ Branch 3 taken 1 times.
|
452 | if (s->second_field_offset == 4 || s->second_field_offset == (buf_size-4)) { |
| 465 | /* | ||
| 466 | * Overlapping first and second fields is used to signal | ||
| 467 | * encoding only a single field. In this case, "height" | ||
| 468 | * is ambiguous; it could mean either the height of the | ||
| 469 | * frame as a whole, or of the field. The former would make | ||
| 470 | * more sense for compatibility with legacy decoders, | ||
| 471 | * but this matches the convention used in NDI, which is | ||
| 472 | * the primary user of this trick. | ||
| 473 | */ | ||
| 474 |
1/2✗ Branch 1 not taken.
✓ Branch 2 taken 451 times.
|
451 | if ((ret = avctx->execute2(avctx, decode_slice_progressive, frame, NULL, 4)) < 0) |
| 475 | ✗ | return ret; | |
| 476 | } else { | ||
| 477 |
1/2✗ Branch 1 not taken.
✓ Branch 2 taken 1 times.
|
1 | if ((ret = avctx->execute2(avctx, decode_slice_interlaced, frame, NULL, 8)) < 0) |
| 478 | ✗ | return ret; | |
| 479 | } | ||
| 480 | |||
| 481 | 452 | *got_frame = 1; | |
| 482 | 452 | return buf_size; | |
| 483 | } | ||
| 484 | |||
| 485 | /* | ||
| 486 | * Alpha VLC. Run and level are independently coded, and would be | ||
| 487 | * outside the default limits for MAX_RUN/MAX_LEVEL, so we don't | ||
| 488 | * bother with combining them into one table. | ||
| 489 | */ | ||
| 490 | 11 | static av_cold void compute_alpha_vlcs(void) | |
| 491 | { | ||
| 492 | uint16_t run_code[134], level_code[266]; | ||
| 493 | uint8_t run_bits[134], level_bits[266]; | ||
| 494 | int16_t run_symbols[134], level_symbols[266]; | ||
| 495 | int entry, i, sign; | ||
| 496 | |||
| 497 | /* Initialize VLC for alpha run. */ | ||
| 498 | 11 | entry = 0; | |
| 499 | |||
| 500 | /* 0 -> 0. */ | ||
| 501 | 11 | run_code[entry] = 0; | |
| 502 | 11 | run_bits[entry] = 1; | |
| 503 | 11 | run_symbols[entry] = 0; | |
| 504 | 11 | ++entry; | |
| 505 | |||
| 506 | /* 10xx -> xx plus 1. */ | ||
| 507 |
2/2✓ Branch 0 taken 44 times.
✓ Branch 1 taken 11 times.
|
55 | for (i = 0; i < 4; ++i) { |
| 508 | 44 | run_code[entry] = (i << 2) | 1; | |
| 509 | 44 | run_bits[entry] = 4; | |
| 510 | 44 | run_symbols[entry] = i + 1; | |
| 511 | 44 | ++entry; | |
| 512 | } | ||
| 513 | |||
| 514 | /* 111xxxxxxx -> xxxxxxx. */ | ||
| 515 |
2/2✓ Branch 0 taken 1408 times.
✓ Branch 1 taken 11 times.
|
1419 | for (i = 0; i < 128; ++i) { |
| 516 | 1408 | run_code[entry] = (i << 3) | 7; | |
| 517 | 1408 | run_bits[entry] = 10; | |
| 518 | 1408 | run_symbols[entry] = i; | |
| 519 | 1408 | ++entry; | |
| 520 | } | ||
| 521 | |||
| 522 | /* 110 -> EOB. */ | ||
| 523 | 11 | run_code[entry] = 3; | |
| 524 | 11 | run_bits[entry] = 3; | |
| 525 | 11 | run_symbols[entry] = -1; | |
| 526 | 11 | ++entry; | |
| 527 | |||
| 528 |
1/2✗ Branch 0 not taken.
✓ Branch 1 taken 11 times.
|
11 | av_assert0(entry == FF_ARRAY_ELEMS(run_code)); |
| 529 | |||
| 530 | 11 | VLC_INIT_STATIC_SPARSE_TABLE(dc_alpha_run_vlc_le, ALPHA_VLC_BITS, | |
| 531 | FF_ARRAY_ELEMS(run_code), | ||
| 532 | run_bits, 1, 1, | ||
| 533 | run_code, 2, 2, | ||
| 534 | run_symbols, 2, 2, VLC_INIT_LE); | ||
| 535 | |||
| 536 | /* Initialize VLC for alpha level. */ | ||
| 537 | 11 | entry = 0; | |
| 538 | |||
| 539 |
2/2✓ Branch 0 taken 22 times.
✓ Branch 1 taken 11 times.
|
33 | for (sign = 0; sign <= 1; ++sign) { |
| 540 | /* 1s -> -1 or +1 (depending on sign bit). */ | ||
| 541 | 22 | level_code[entry] = (sign << 1) | 1; | |
| 542 | 22 | level_bits[entry] = 2; | |
| 543 |
2/2✓ Branch 0 taken 11 times.
✓ Branch 1 taken 11 times.
|
22 | level_symbols[entry] = sign ? -1 : 1; |
| 544 | 22 | ++entry; | |
| 545 | |||
| 546 | /* 01sxx -> xx plus 2 (2..5 or -2..-5, depending on sign bit). */ | ||
| 547 |
2/2✓ Branch 0 taken 88 times.
✓ Branch 1 taken 22 times.
|
110 | for (i = 0; i < 4; ++i) { |
| 548 | 88 | level_code[entry] = (i << 3) | (sign << 2) | 2; | |
| 549 | 88 | level_bits[entry] = 5; | |
| 550 |
2/2✓ Branch 0 taken 44 times.
✓ Branch 1 taken 44 times.
|
88 | level_symbols[entry] = sign ? -(i + 2) : (i + 2); |
| 551 | 88 | ++entry; | |
| 552 | } | ||
| 553 | } | ||
| 554 | |||
| 555 | /* | ||
| 556 | * 00xxxxxxxx -> xxxxxxxx, in two's complement. There are many codes | ||
| 557 | * here that would better be encoded in other ways (e.g. 0 would be | ||
| 558 | * encoded by increasing run, and +/- 1 would be encoded with a | ||
| 559 | * shorter code), but it doesn't hurt to allow everything. | ||
| 560 | */ | ||
| 561 |
2/2✓ Branch 0 taken 2816 times.
✓ Branch 1 taken 11 times.
|
2827 | for (i = 0; i < 256; ++i) { |
| 562 | 2816 | level_code[entry] = i << 2; | |
| 563 | 2816 | level_bits[entry] = 10; | |
| 564 | 2816 | level_symbols[entry] = i; | |
| 565 | 2816 | ++entry; | |
| 566 | } | ||
| 567 | |||
| 568 |
1/2✗ Branch 0 not taken.
✓ Branch 1 taken 11 times.
|
11 | av_assert0(entry == FF_ARRAY_ELEMS(level_code)); |
| 569 | |||
| 570 | 11 | VLC_INIT_STATIC_SPARSE_TABLE(dc_alpha_level_vlc_le, ALPHA_VLC_BITS, | |
| 571 | FF_ARRAY_ELEMS(level_code), | ||
| 572 | level_bits, 1, 1, | ||
| 573 | level_code, 2, 2, | ||
| 574 | level_symbols, 2, 2, VLC_INIT_LE); | ||
| 575 | 11 | } | |
| 576 | |||
/**
 * Fill every static VLC table of the decoder: the two DC tables, the AC
 * run/level table and (through compute_alpha_vlcs()) the alpha tables.
 * Run through ff_thread_once() from speedhq_decode_init().
 */
static av_cold void speedhq_static_init(void)
{
    /* Exactly the same as MPEG-2, except for a little-endian reader. */
    VLC_INIT_STATIC_TABLE(dc_lum_vlc_le, DC_VLC_BITS, 12,
                          ff_mpeg12_vlc_dc_lum_bits, 1, 1,
                          ff_mpeg12_vlc_dc_lum_code, 2, 2,
                          VLC_INIT_OUTPUT_LE);
    VLC_INIT_STATIC_TABLE(dc_chroma_vlc_le, DC_VLC_BITS, 12,
                          ff_mpeg12_vlc_dc_chroma_bits, 1, 1,
                          ff_mpeg12_vlc_dc_chroma_code, 2, 2,
                          VLC_INIT_OUTPUT_LE);

    /* AC coefficients use the SpeedHQ run/level table. */
    ff_init_2d_vlc_rl(ff_speedhq_vlc_table, speedhq_rl_vlc, ff_speedhq_run,
                      ff_speedhq_level, SPEEDHQ_RL_NB_ELEMS,
                      FF_ARRAY_ELEMS(speedhq_rl_vlc), VLC_INIT_LE);

    compute_alpha_vlcs();
}
| 595 | |||
| 596 | 22 | static av_cold int speedhq_decode_init(AVCodecContext *avctx) | |
| 597 | { | ||
| 598 | int ret; | ||
| 599 | static AVOnce init_once = AV_ONCE_INIT; | ||
| 600 | 22 | SHQContext * const s = avctx->priv_data; | |
| 601 | |||
| 602 | 22 | ret = ff_thread_once(&init_once, speedhq_static_init); | |
| 603 |
1/2✗ Branch 0 not taken.
✓ Branch 1 taken 22 times.
|
22 | if (ret) |
| 604 | ✗ | return AVERROR_UNKNOWN; | |
| 605 | |||
| 606 | 22 | ff_blockdsp_init(&s->bdsp); | |
| 607 | 22 | ff_idctdsp_init(&s->idsp, avctx); | |
| 608 | 22 | ff_permute_scantable(s->permutated_intra_scantable, ff_zigzag_direct, | |
| 609 | 22 | s->idsp.idct_permutation); | |
| 610 | |||
| 611 |
4/9✓ Branch 0 taken 6 times.
✗ Branch 1 not taken.
✓ Branch 2 taken 8 times.
✗ Branch 3 not taken.
✓ Branch 4 taken 6 times.
✗ Branch 5 not taken.
✗ Branch 6 not taken.
✗ Branch 7 not taken.
✓ Branch 8 taken 2 times.
|
22 | switch (avctx->codec_tag) { |
| 612 | 6 | case MKTAG('S', 'H', 'Q', '0'): | |
| 613 | 6 | s->subsampling = SHQ_SUBSAMPLING_420; | |
| 614 | 6 | s->alpha_type = SHQ_NO_ALPHA; | |
| 615 | 6 | avctx->pix_fmt = AV_PIX_FMT_YUV420P; | |
| 616 | 6 | break; | |
| 617 | ✗ | case MKTAG('S', 'H', 'Q', '1'): | |
| 618 | ✗ | s->subsampling = SHQ_SUBSAMPLING_420; | |
| 619 | ✗ | s->alpha_type = SHQ_RLE_ALPHA; | |
| 620 | ✗ | avctx->pix_fmt = AV_PIX_FMT_YUVA420P; | |
| 621 | ✗ | break; | |
| 622 | 8 | case MKTAG('S', 'H', 'Q', '2'): | |
| 623 | 8 | s->subsampling = SHQ_SUBSAMPLING_422; | |
| 624 | 8 | s->alpha_type = SHQ_NO_ALPHA; | |
| 625 | 8 | avctx->pix_fmt = AV_PIX_FMT_YUV422P; | |
| 626 | 8 | break; | |
| 627 | ✗ | case MKTAG('S', 'H', 'Q', '3'): | |
| 628 | ✗ | s->subsampling = SHQ_SUBSAMPLING_422; | |
| 629 | ✗ | s->alpha_type = SHQ_RLE_ALPHA; | |
| 630 | ✗ | avctx->pix_fmt = AV_PIX_FMT_YUVA422P; | |
| 631 | ✗ | break; | |
| 632 | 6 | case MKTAG('S', 'H', 'Q', '4'): | |
| 633 | 6 | s->subsampling = SHQ_SUBSAMPLING_444; | |
| 634 | 6 | s->alpha_type = SHQ_NO_ALPHA; | |
| 635 | 6 | avctx->pix_fmt = AV_PIX_FMT_YUV444P; | |
| 636 | 6 | break; | |
| 637 | ✗ | case MKTAG('S', 'H', 'Q', '5'): | |
| 638 | ✗ | s->subsampling = SHQ_SUBSAMPLING_444; | |
| 639 | ✗ | s->alpha_type = SHQ_RLE_ALPHA; | |
| 640 | ✗ | avctx->pix_fmt = AV_PIX_FMT_YUVA444P; | |
| 641 | ✗ | break; | |
| 642 | ✗ | case MKTAG('S', 'H', 'Q', '7'): | |
| 643 | ✗ | s->subsampling = SHQ_SUBSAMPLING_422; | |
| 644 | ✗ | s->alpha_type = SHQ_DCT_ALPHA; | |
| 645 | ✗ | avctx->pix_fmt = AV_PIX_FMT_YUVA422P; | |
| 646 | ✗ | break; | |
| 647 | ✗ | case MKTAG('S', 'H', 'Q', '9'): | |
| 648 | ✗ | s->subsampling = SHQ_SUBSAMPLING_444; | |
| 649 | ✗ | s->alpha_type = SHQ_DCT_ALPHA; | |
| 650 | ✗ | avctx->pix_fmt = AV_PIX_FMT_YUVA444P; | |
| 651 | ✗ | break; | |
| 652 | 2 | default: | |
| 653 | 2 | av_log(avctx, AV_LOG_ERROR, "Unknown NewTek SpeedHQ FOURCC provided (%08X)\n", | |
| 654 | avctx->codec_tag); | ||
| 655 | 2 | return AVERROR_INVALIDDATA; | |
| 656 | } | ||
| 657 | |||
| 658 | /* This matches what NDI's RGB -> Y'CbCr 4:2:2 converter uses. */ | ||
| 659 | 20 | avctx->colorspace = AVCOL_SPC_BT470BG; | |
| 660 | 20 | avctx->chroma_sample_location = AVCHROMA_LOC_CENTER; | |
| 661 | |||
| 662 | 20 | return 0; | |
| 663 | } | ||
| 664 | |||
/* Codec registration entry for the SpeedHQ video decoder. */
const FFCodec ff_speedhq_decoder = {
    .p.name         = "speedhq",
    CODEC_LONG_NAME("NewTek SpeedHQ"),
    .p.type         = AVMEDIA_TYPE_VIDEO,
    .p.id           = AV_CODEC_ID_SPEEDHQ,
    .priv_data_size = sizeof(SHQContext),
    .init           = speedhq_decode_init,
    FF_CODEC_DECODE_CB(speedhq_decode_frame),
    /* Advertises direct rendering plus frame- and slice-level threading. */
    .p.capabilities = AV_CODEC_CAP_DR1 | AV_CODEC_CAP_FRAME_THREADS | AV_CODEC_CAP_SLICE_THREADS,
};
| 675 |