Line | Branch | Exec | Source |
---|---|---|---|
1 | /* | ||
2 | * SpeedHQ encoder | ||
3 | * Copyright (c) 2000, 2001 Fabrice Bellard | ||
4 | * Copyright (c) 2003 Alex Beregszaszi | ||
5 | * Copyright (c) 2003-2004 Michael Niedermayer | ||
6 | * Copyright (c) 2020 FFmpeg | ||
7 | * | ||
8 | * This file is part of FFmpeg. | ||
9 | * | ||
10 | * FFmpeg is free software; you can redistribute it and/or | ||
11 | * modify it under the terms of the GNU Lesser General Public | ||
12 | * License as published by the Free Software Foundation; either | ||
13 | * version 2.1 of the License, or (at your option) any later version. | ||
14 | * | ||
15 | * FFmpeg is distributed in the hope that it will be useful, | ||
16 | * but WITHOUT ANY WARRANTY; without even the implied warranty of | ||
17 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU | ||
18 | * Lesser General Public License for more details. | ||
19 | * | ||
20 | * You should have received a copy of the GNU Lesser General Public | ||
21 | * License along with FFmpeg; if not, write to the Free Software | ||
22 | * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA | ||
23 | */ | ||
24 | |||
25 | /** | ||
26 | * @file | ||
27 | * SpeedHQ encoder. | ||
28 | */ | ||
29 | |||
30 | #include "libavutil/avassert.h" | ||
31 | #include "libavutil/thread.h" | ||
32 | |||
33 | #include "avcodec.h" | ||
34 | #include "codec_internal.h" | ||
35 | #include "mpeg12data.h" | ||
36 | #include "mpeg12vlc.h" | ||
37 | #include "mpegvideo.h" | ||
38 | #include "mpegvideodata.h" | ||
39 | #include "mpegvideoenc.h" | ||
40 | #include "put_bits.h" | ||
41 | #include "rl.h" | ||
42 | #include "speedhq.h" | ||
43 | #include "speedhqenc.h" | ||
44 | |||
45 | static uint8_t speedhq_max_level[MAX_LEVEL + 1]; | ||
46 | static uint8_t speedhq_index_run[MAX_RUN + 1]; | ||
47 | |||
48 | /* Exactly the same as MPEG-2, except little-endian. */ | ||
49 | static const uint16_t mpeg12_vlc_dc_lum_code_reversed[12] = { | ||
50 | 0x1, 0x0, 0x2, 0x5, 0x3, 0x7, 0xF, 0x1F, 0x3F, 0x7F, 0xFF, 0x1FF | ||
51 | }; | ||
52 | static const uint16_t mpeg12_vlc_dc_chroma_code_reversed[12] = { | ||
53 | 0x0, 0x2, 0x1, 0x3, 0x7, 0xF, 0x1F, 0x3F, 0x7F, 0xFF, 0x1FF, 0x3FF | ||
54 | }; | ||
55 | |||
56 | /* simple include everything table for dc, first byte is bits | ||
57 | * number next 3 are code */ | ||
58 | static uint32_t speedhq_lum_dc_uni[512]; | ||
59 | static uint32_t speedhq_chr_dc_uni[512]; | ||
60 | |||
61 | static uint8_t uni_speedhq_ac_vlc_len[64 * 64 * 2]; | ||
62 | |||
63 | typedef struct SpeedHQEncContext { | ||
64 | MPVMainEncContext m; | ||
65 | |||
66 | int slice_start; | ||
67 | } SpeedHQEncContext; | ||
68 | |||
69 | 9 | static av_cold void speedhq_init_static_data(void) | |
70 | { | ||
71 | 9 | ff_rl_init_level_run(speedhq_max_level, speedhq_index_run, | |
72 | ff_speedhq_run, ff_speedhq_level, SPEEDHQ_RL_NB_ELEMS); | ||
73 | |||
74 | /* build unified dc encoding tables */ | ||
75 |
2/2✓ Branch 0 taken 4599 times.
✓ Branch 1 taken 9 times.
|
4608 | for (int i = -255; i < 256; i++) { |
76 | int adiff, index; | ||
77 | int bits, code; | ||
78 | 4599 | int diff = i; | |
79 | |||
80 | 4599 | adiff = FFABS(diff); | |
81 |
2/2✓ Branch 0 taken 2295 times.
✓ Branch 1 taken 2304 times.
|
4599 | if (diff < 0) |
82 | 2295 | diff--; | |
83 | 4599 | index = av_log2(2 * adiff); | |
84 | |||
85 | 4599 | bits = ff_mpeg12_vlc_dc_lum_bits[index] + index; | |
86 | 4599 | code = mpeg12_vlc_dc_lum_code_reversed[index] + | |
87 | 4599 | (av_zero_extend(diff, index) << ff_mpeg12_vlc_dc_lum_bits[index]); | |
88 | 4599 | speedhq_lum_dc_uni[i + 255] = bits + (code << 8); | |
89 | |||
90 | 4599 | bits = ff_mpeg12_vlc_dc_chroma_bits[index] + index; | |
91 | 4599 | code = mpeg12_vlc_dc_chroma_code_reversed[index] + | |
92 | 4599 | (av_zero_extend(diff, index) << ff_mpeg12_vlc_dc_chroma_bits[index]); | |
93 | 4599 | speedhq_chr_dc_uni[i + 255] = bits + (code << 8); | |
94 | } | ||
95 | |||
96 | 9 | ff_mpeg1_init_uni_ac_vlc(speedhq_max_level, speedhq_index_run, | |
97 | ff_speedhq_vlc_table, uni_speedhq_ac_vlc_len); | ||
98 | 9 | } | |
99 | |||
100 | 450 | static int speedhq_encode_picture_header(MPVMainEncContext *const m) | |
101 | { | ||
102 | 450 | SpeedHQEncContext *const ctx = (SpeedHQEncContext*)m; | |
103 | 450 | MPVEncContext *const s = &m->s; | |
104 | |||
105 | 450 | put_bits_assume_flushed(&s->pb); | |
106 | |||
107 | 450 | put_bits_le(&s->pb, 8, 100 - s->c.qscale * 2); /* FIXME why doubled */ | |
108 | 450 | put_bits_le(&s->pb, 24, 4); /* no second field */ | |
109 | |||
110 | 450 | ctx->slice_start = 4; | |
111 | /* length of first slice, will be filled out later */ | ||
112 | 450 | put_bits_le(&s->pb, 24, 0); | |
113 | |||
114 | 450 | return 0; | |
115 | } | ||
116 | |||
117 | 1800 | void ff_speedhq_end_slice(MPVEncContext *const s) | |
118 | { | ||
119 | 1800 | SpeedHQEncContext *ctx = (SpeedHQEncContext*)s; | |
120 | int slice_len; | ||
121 | |||
122 | 1800 | flush_put_bits_le(&s->pb); | |
123 | 1800 | slice_len = put_bytes_output(&s->pb) - ctx->slice_start; | |
124 | 1800 | AV_WL24(s->pb.buf + ctx->slice_start, slice_len); | |
125 | |||
126 | /* length of next slice, will be filled out later */ | ||
127 | 1800 | ctx->slice_start = put_bytes_output(&s->pb); | |
128 | 1800 | put_bits_le(&s->pb, 24, 0); | |
129 | 1800 | } | |
130 | |||
131 | 1544400 | static inline void encode_dc(PutBitContext *pb, int diff, int component) | |
132 | { | ||
133 | 1544400 | unsigned int diff_u = diff + 255; | |
134 |
2/2✓ Branch 0 taken 329487 times.
✓ Branch 1 taken 1214913 times.
|
1544400 | if (diff_u >= 511) { |
135 | int index; | ||
136 | |||
137 |
2/2✓ Branch 0 taken 169357 times.
✓ Branch 1 taken 160130 times.
|
329487 | if (diff < 0) { |
138 | 169357 | index = av_log2_16bit(-2 * diff); | |
139 | 169357 | diff--; | |
140 | } else { | ||
141 | 160130 | index = av_log2_16bit(2 * diff); | |
142 | } | ||
143 |
2/2✓ Branch 0 taken 239838 times.
✓ Branch 1 taken 89649 times.
|
329487 | if (component == 0) |
144 | 239838 | put_bits_le(pb, | |
145 | 239838 | ff_mpeg12_vlc_dc_lum_bits[index] + index, | |
146 | 239838 | mpeg12_vlc_dc_lum_code_reversed[index] + | |
147 | 239838 | (av_zero_extend(diff, index) << ff_mpeg12_vlc_dc_lum_bits[index])); | |
148 | else | ||
149 | 89649 | put_bits_le(pb, | |
150 | 89649 | ff_mpeg12_vlc_dc_chroma_bits[index] + index, | |
151 | 89649 | mpeg12_vlc_dc_chroma_code_reversed[index] + | |
152 | 89649 | (av_zero_extend(diff, index) << ff_mpeg12_vlc_dc_chroma_bits[index])); | |
153 | } else { | ||
154 |
2/2✓ Branch 0 taken 472962 times.
✓ Branch 1 taken 741951 times.
|
1214913 | if (component == 0) |
155 | 472962 | put_bits_le(pb, | |
156 | 472962 | speedhq_lum_dc_uni[diff + 255] & 0xFF, | |
157 | 472962 | speedhq_lum_dc_uni[diff + 255] >> 8); | |
158 | else | ||
159 | 741951 | put_bits_le(pb, | |
160 | 741951 | speedhq_chr_dc_uni[diff + 255] & 0xFF, | |
161 | 741951 | speedhq_chr_dc_uni[diff + 255] >> 8); | |
162 | } | ||
163 | 1544400 | } | |
164 | |||
165 | 1544400 | static void encode_block(MPVEncContext *const s, const int16_t block[], int n) | |
166 | { | ||
167 | int alevel, level, last_non_zero, dc, i, j, run, last_index, sign; | ||
168 | int code; | ||
169 | int component, val; | ||
170 | |||
171 | /* DC coef */ | ||
172 |
2/2✓ Branch 0 taken 831600 times.
✓ Branch 1 taken 712800 times.
|
1544400 | component = (n <= 3 ? 0 : (n&1) + 1); |
173 | 1544400 | dc = block[0]; /* overflow is impossible */ | |
174 | 1544400 | val = s->c.last_dc[component] - dc; /* opposite of most codecs */ | |
175 | 1544400 | encode_dc(&s->pb, val, component); | |
176 | 1544400 | s->c.last_dc[component] = dc; | |
177 | |||
178 | /* now quantify & encode AC coefs */ | ||
179 | 1544400 | last_non_zero = 0; | |
180 | 1544400 | last_index = s->c.block_last_index[n]; | |
181 | |||
182 |
2/2✓ Branch 0 taken 11960496 times.
✓ Branch 1 taken 1544400 times.
|
13504896 | for (i = 1; i <= last_index; i++) { |
183 | 11960496 | j = s->c.intra_scantable.permutated[i]; | |
184 | 11960496 | level = block[j]; | |
185 | |||
186 | /* encode using VLC */ | ||
187 |
2/2✓ Branch 0 taken 5766974 times.
✓ Branch 1 taken 6193522 times.
|
11960496 | if (level != 0) { |
188 | 5766974 | run = i - last_non_zero - 1; | |
189 | |||
190 | 5766974 | alevel = level; | |
191 | 5766974 | MASK_ABS(sign, alevel); | |
192 | 5766974 | sign &= 1; | |
193 | |||
194 |
2/2✓ Branch 0 taken 5741265 times.
✓ Branch 1 taken 25709 times.
|
5766974 | if (alevel <= speedhq_max_level[run]) { |
195 | 5741265 | code = speedhq_index_run[run] + alevel - 1; | |
196 | /* store the VLC & sign at once */ | ||
197 | 5741265 | put_bits_le(&s->pb, ff_speedhq_vlc_table[code][1] + 1, | |
198 | 5741265 | ff_speedhq_vlc_table[code][0] | (sign << ff_speedhq_vlc_table[code][1])); | |
199 | } else { | ||
200 | /* escape seems to be pretty rare <5% so I do not optimize it; | ||
201 | * The following encodes the escape value 100000b together with | ||
202 | * run and level. */ | ||
203 | 25709 | put_bits_le(&s->pb, 6 + 6 + 12, 0x20 | run << 6 | | |
204 | 25709 | (level + 2048) << 12); | |
205 | } | ||
206 | 5766974 | last_non_zero = i; | |
207 | } | ||
208 | } | ||
209 | /* end of block; the values correspond to ff_speedhq_vlc_table[122] */ | ||
210 | 1544400 | put_bits_le(&s->pb, 4, 6); | |
211 | 1544400 | } | |
212 | |||
213 | 178200 | static void speedhq_encode_mb(MPVEncContext *const s, int16_t block[12][64], | |
214 | int unused_x, int unused_y) | ||
215 | { | ||
216 | int i; | ||
217 |
2/2✓ Branch 0 taken 1069200 times.
✓ Branch 1 taken 178200 times.
|
1247400 | for(i=0;i<6;i++) { |
218 | 1069200 | encode_block(s, block[i], i); | |
219 | } | ||
220 |
2/2✓ Branch 0 taken 59400 times.
✓ Branch 1 taken 118800 times.
|
178200 | if (s->c.chroma_format == CHROMA_444) { |
221 | 59400 | encode_block(s, block[8], 8); | |
222 | 59400 | encode_block(s, block[9], 9); | |
223 | |||
224 | 59400 | encode_block(s, block[6], 6); | |
225 | 59400 | encode_block(s, block[7], 7); | |
226 | |||
227 | 59400 | encode_block(s, block[10], 10); | |
228 | 59400 | encode_block(s, block[11], 11); | |
229 |
2/2✓ Branch 0 taken 59400 times.
✓ Branch 1 taken 59400 times.
|
118800 | } else if (s->c.chroma_format == CHROMA_422) { |
230 | 59400 | encode_block(s, block[6], 6); | |
231 | 59400 | encode_block(s, block[7], 7); | |
232 | } | ||
233 | |||
234 | 178200 | s->i_tex_bits += get_bits_diff(s); | |
235 | 178200 | } | |
236 | |||
237 | 9 | static av_cold int speedhq_encode_init(AVCodecContext *avctx) | |
238 | { | ||
239 | static AVOnce init_static_once = AV_ONCE_INIT; | ||
240 | 9 | MPVMainEncContext *const m = avctx->priv_data; | |
241 | 9 | MPVEncContext *const s = &m->s; | |
242 | int ret; | ||
243 | |||
244 |
2/4✓ Branch 0 taken 9 times.
✗ Branch 1 not taken.
✗ Branch 2 not taken.
✓ Branch 3 taken 9 times.
|
9 | if (avctx->width > 65500 || avctx->height > 65500) { |
245 | ✗ | av_log(avctx, AV_LOG_ERROR, "SpeedHQ does not support resolutions above 65500x65500\n"); | |
246 | ✗ | return AVERROR(EINVAL); | |
247 | } | ||
248 | |||
249 | // border is not implemented correctly at the moment, see ticket #10078 | ||
250 |
1/2✗ Branch 0 not taken.
✓ Branch 1 taken 9 times.
|
9 | if (avctx->width % 16) { |
251 | ✗ | av_log(avctx, AV_LOG_ERROR, "width must be a multiple of 16\n"); | |
252 | ✗ | return AVERROR_PATCHWELCOME; | |
253 | } | ||
254 | |||
255 |
3/4✓ Branch 0 taken 3 times.
✓ Branch 1 taken 3 times.
✓ Branch 2 taken 3 times.
✗ Branch 3 not taken.
|
9 | switch (avctx->pix_fmt) { |
256 | 3 | case AV_PIX_FMT_YUV420P: | |
257 | 3 | avctx->codec_tag = MKTAG('S','H','Q','0'); | |
258 | 3 | break; | |
259 | 3 | case AV_PIX_FMT_YUV422P: | |
260 | 3 | avctx->codec_tag = MKTAG('S','H','Q','2'); | |
261 | 3 | break; | |
262 | 3 | case AV_PIX_FMT_YUV444P: | |
263 | 3 | avctx->codec_tag = MKTAG('S','H','Q','4'); | |
264 | 3 | break; | |
265 | ✗ | default: | |
266 | ✗ | av_unreachable("Already checked via CODEC_PIXFMTS"); | |
267 | } | ||
268 | |||
269 | 9 | m->encode_picture_header = speedhq_encode_picture_header; | |
270 | 9 | s->encode_mb = speedhq_encode_mb; | |
271 | |||
272 | 9 | s->min_qcoeff = -2048; | |
273 | 9 | s->max_qcoeff = 2047; | |
274 | |||
275 | 9 | s->intra_ac_vlc_length = | |
276 | 9 | s->intra_ac_vlc_last_length = | |
277 | 9 | s->intra_chroma_ac_vlc_length = | |
278 | 9 | s->intra_chroma_ac_vlc_last_length = uni_speedhq_ac_vlc_len; | |
279 | |||
280 | 9 | s->c.y_dc_scale_table = | |
281 | 9 | s->c.c_dc_scale_table = ff_mpeg12_dc_scale_table[3]; | |
282 | |||
283 | 9 | ret = ff_mpv_encode_init(avctx); | |
284 |
1/2✗ Branch 0 not taken.
✓ Branch 1 taken 9 times.
|
9 | if (ret < 0) |
285 | ✗ | return ret; | |
286 | |||
287 | 9 | ff_thread_once(&init_static_once, speedhq_init_static_data); | |
288 | |||
289 | 9 | return 0; | |
290 | } | ||
291 | |||
292 | const FFCodec ff_speedhq_encoder = { | ||
293 | .p.name = "speedhq", | ||
294 | CODEC_LONG_NAME("NewTek SpeedHQ"), | ||
295 | .p.type = AVMEDIA_TYPE_VIDEO, | ||
296 | .p.id = AV_CODEC_ID_SPEEDHQ, | ||
297 | .p.priv_class = &ff_mpv_enc_class, | ||
298 | .p.capabilities = AV_CODEC_CAP_DR1 | AV_CODEC_CAP_ENCODER_REORDERED_OPAQUE, | ||
299 | .priv_data_size = sizeof(SpeedHQEncContext), | ||
300 | .init = speedhq_encode_init, | ||
301 | FF_CODEC_ENCODE_CB(ff_mpv_encode_picture), | ||
302 | .close = ff_mpv_encode_end, | ||
303 | .caps_internal = FF_CODEC_CAP_INIT_CLEANUP, | ||
304 | .color_ranges = AVCOL_RANGE_MPEG, | ||
305 | CODEC_PIXFMTS(AV_PIX_FMT_YUV420P, AV_PIX_FMT_YUV422P, AV_PIX_FMT_YUV444P), | ||
306 | }; | ||
307 |