FFmpeg coverage


Directory: ../../../ffmpeg/
File: src/libavcodec/svq1enc.c
Date: 2024-04-19 07:31:02
Exec Total Coverage
Lines: 363 383 94.8%
Functions: 8 8 100.0%
Branches: 166 194 85.6%

Line Branch Exec Source
1 /*
2 * SVQ1 Encoder
3 * Copyright (C) 2004 Mike Melanson <melanson@pcisys.net>
4 *
5 * This file is part of FFmpeg.
6 *
7 * FFmpeg is free software; you can redistribute it and/or
8 * modify it under the terms of the GNU Lesser General Public
9 * License as published by the Free Software Foundation; either
10 * version 2.1 of the License, or (at your option) any later version.
11 *
12 * FFmpeg is distributed in the hope that it will be useful,
13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
15 * Lesser General Public License for more details.
16 *
17 * You should have received a copy of the GNU Lesser General Public
18 * License along with FFmpeg; if not, write to the Free Software
19 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
20 */
21
22 /**
23 * @file
24 * Sorenson Vector Quantizer #1 (SVQ1) video codec.
25 * For more information of the SVQ1 algorithm, visit:
26 * http://www.pcisys.net/~melanson/codecs/
27 */
28
29 #include "libavutil/emms.h"
30 #include "libavutil/mem.h"
31 #include "avcodec.h"
32 #include "codec_internal.h"
33 #include "encode.h"
34 #include "hpeldsp.h"
35 #include "me_cmp.h"
36 #include "mpegvideo.h"
37 #include "h263.h"
38 #include "h263enc.h"
39 #include "internal.h"
40 #include "mpegutils.h"
41 #include "packet_internal.h"
42 #include "put_bits.h"
43 #include "svq1.h"
44 #include "svq1encdsp.h"
45 #include "svq1enc_cb.h"
46 #include "version.h"
47
48 #include "libavutil/avassert.h"
49 #include "libavutil/frame.h"
50 #include "libavutil/mem_internal.h"
51
52 // Workaround for GCC bug 102513
53 #if AV_GCC_VERSION_AT_LEAST(10, 0) && AV_GCC_VERSION_AT_MOST(12, 0) \
54 && !defined(__clang__) && !defined(__INTEL_COMPILER)
55 #pragma GCC optimize ("no-ipa-cp-clone")
56 #endif
57
58 typedef struct SVQ1EncContext {
59 /* FIXME: Needed for motion estimation, should not be used for anything
60 * else, the idea is to make the motion estimation eventually independent
61 * of MpegEncContext, so this will be removed then. */
62 MpegEncContext m;
63 AVCodecContext *avctx;
64 MECmpContext mecc;
65 HpelDSPContext hdsp;
66 AVFrame *current_picture;
67 AVFrame *last_picture;
68
69 /* Some compression statistics */
70 enum AVPictureType pict_type;
71 int quality;
72
73 /* why ooh why this sick breadth first order,
74 * everything is slower and more complex */
75 PutBitContext reorder_pb[6];
76
77 int frame_width;
78 int frame_height;
79
80 /* Y plane block dimensions */
81 int y_block_width;
82 int y_block_height;
83
84 /* U & V plane (C planes) block dimensions */
85 int c_block_width;
86 int c_block_height;
87
88 DECLARE_ALIGNED(16, int16_t, encoded_block_levels)[6][7][256];
89
90 uint16_t *mb_type;
91 uint32_t *dummy;
92 int16_t (*motion_val8[3])[2];
93 int16_t (*motion_val16[3])[2];
94
95 int64_t rd_total;
96
97 uint8_t *scratchbuf;
98
99 int motion_est;
100
101 SVQ1EncDSPContext svq1encdsp;
102 } SVQ1EncContext;
103
104 200 static void svq1_write_header(SVQ1EncContext *s, PutBitContext *pb, int frame_type)
105 {
106 int i;
107
108 /* frame code */
109 200 put_bits(pb, 22, 0x20);
110
111 /* temporal reference (sure hope this is a "don't care") */
112 200 put_bits(pb, 8, 0x00);
113
114 /* frame type */
115 200 put_bits(pb, 2, frame_type - 1);
116
117
2/2
✓ Branch 0 taken 20 times.
✓ Branch 1 taken 180 times.
200 if (frame_type == AV_PICTURE_TYPE_I) {
118 /* no checksum since frame code is 0x20 */
119 /* no embedded string either */
120 /* output 5 unknown bits (2 + 2 + 1) */
121 20 put_bits(pb, 5, 2); /* 2 needed by quicktime decoder */
122
123 20 i = ff_match_2uint16(ff_svq1_frame_size_table,
124 FF_ARRAY_ELEMS(ff_svq1_frame_size_table),
125 s->frame_width, s->frame_height);
126 20 put_bits(pb, 3, i);
127
128
2/2
✓ Branch 0 taken 5 times.
✓ Branch 1 taken 15 times.
20 if (i == 7) {
129 5 put_bits(pb, 12, s->frame_width);
130 5 put_bits(pb, 12, s->frame_height);
131 }
132 }
133
134 /* no checksum or extra data (next 2 bits get 0) */
135 200 put_bits(pb, 2, 0);
136 200 }
137
138 #define QUALITY_THRESHOLD 100
139 #define THRESHOLD_MULTIPLIER 0.6
140
141 4302522 static int encode_block(SVQ1EncContext *s, uint8_t *src, uint8_t *ref,
142 uint8_t *decoded, int stride, unsigned level,
143 int threshold, int lambda, int intra)
144 {
145 int count, y, x, i, j, split, best_mean, best_score, best_count;
146 int best_vector[6];
147 4302522 int block_sum[7] = { 0, 0, 0, 0, 0, 0 };
148 4302522 int w = 2 << (level + 2 >> 1);
149 4302522 int h = 2 << (level + 1 >> 1);
150 4302522 int size = w * h;
151 4302522 int16_t (*block)[256] = s->encoded_block_levels[level];
152 const int8_t *codebook_sum, *codebook;
153 const uint16_t(*mean_vlc)[2];
154 const uint8_t(*multistage_vlc)[2];
155
156 4302522 best_score = 0;
157 // FIXME: Optimize, this does not need to be done multiple times.
158
2/2
✓ Branch 0 taken 643715 times.
✓ Branch 1 taken 3658807 times.
4302522 if (intra) {
159 // level is 5 when encode_block is called from svq1_encode_plane
160 // and always < 4 when called recursively from this function.
161
2/2
✓ Branch 0 taken 612686 times.
✓ Branch 1 taken 31029 times.
643715 codebook_sum = level < 4 ? svq1_intra_codebook_sum[level] : NULL;
162 643715 codebook = ff_svq1_intra_codebooks[level];
163 643715 mean_vlc = ff_svq1_intra_mean_vlc;
164 643715 multistage_vlc = ff_svq1_intra_multistage_vlc[level];
165
2/2
✓ Branch 0 taken 2296676 times.
✓ Branch 1 taken 643715 times.
2940391 for (y = 0; y < h; y++) {
166
2/2
✓ Branch 0 taken 15798160 times.
✓ Branch 1 taken 2296676 times.
18094836 for (x = 0; x < w; x++) {
167 15798160 int v = src[x + y * stride];
168 15798160 block[0][x + w * y] = v;
169 15798160 best_score += v * v;
170 15798160 block_sum[0] += v;
171 }
172 }
173 } else {
174 // level is 5 or < 4, see above for details.
175
2/2
✓ Branch 0 taken 3483018 times.
✓ Branch 1 taken 175789 times.
3658807 codebook_sum = level < 4 ? svq1_inter_codebook_sum[level] : NULL;
176 3658807 codebook = ff_svq1_inter_codebooks[level];
177 3658807 mean_vlc = ff_svq1_inter_mean_vlc + 256;
178 3658807 multistage_vlc = ff_svq1_inter_multistage_vlc[level];
179
2/2
✓ Branch 0 taken 13044696 times.
✓ Branch 1 taken 3658807 times.
16703503 for (y = 0; y < h; y++) {
180
2/2
✓ Branch 0 taken 89655008 times.
✓ Branch 1 taken 13044696 times.
102699704 for (x = 0; x < w; x++) {
181 89655008 int v = src[x + y * stride] - ref[x + y * stride];
182 89655008 block[0][x + w * y] = v;
183 89655008 best_score += v * v;
184 89655008 block_sum[0] += v;
185 }
186 }
187 }
188
189 4302522 best_count = 0;
190 4302522 best_score -= (int)((unsigned)block_sum[0] * block_sum[0] >> (level + 3));
191 4302522 best_mean = block_sum[0] + (size >> 1) >> (level + 3);
192
193
2/2
✓ Branch 0 taken 4095704 times.
✓ Branch 1 taken 206818 times.
4302522 if (level < 4) {
194
2/2
✓ Branch 0 taken 24574224 times.
✓ Branch 1 taken 4095704 times.
28669928 for (count = 1; count < 7; count++) {
195 24574224 int best_vector_score = INT_MAX;
196 24574224 int best_vector_sum = -999, best_vector_mean = -999;
197 24574224 const int stage = count - 1;
198 const int8_t *vector;
199
200
2/2
✓ Branch 0 taken 393187584 times.
✓ Branch 1 taken 24574224 times.
417761808 for (i = 0; i < 16; i++) {
201 393187584 int sum = codebook_sum[stage * 16 + i];
202 int sqr, diff, score;
203
204 393187584 vector = codebook + stage * size * 16 + i * size;
205 393187584 sqr = s->svq1encdsp.ssd_int8_vs_int16(vector, block[stage], size);
206 393187584 diff = block_sum[stage] - sum;
207 393187584 score = sqr - (diff * (int64_t)diff >> (level + 3)); // FIXME: 64 bits slooow
208
2/2
✓ Branch 0 taken 65426753 times.
✓ Branch 1 taken 327760831 times.
393187584 if (score < best_vector_score) {
209 65426753 int mean = diff + (size >> 1) >> (level + 3);
210 av_assert2(mean > -300 && mean < 300);
211
2/2
✓ Branch 0 taken 9912177 times.
✓ Branch 1 taken 55514576 times.
65426753 mean = av_clip(mean, intra ? 0 : -256, 255);
212 65426753 best_vector_score = score;
213 65426753 best_vector[stage] = i;
214 65426753 best_vector_sum = sum;
215 65426753 best_vector_mean = mean;
216 }
217 }
218
1/2
✗ Branch 0 not taken.
✓ Branch 1 taken 24574224 times.
24574224 av_assert0(best_vector_mean != -999);
219 24574224 vector = codebook + stage * size * 16 + best_vector[stage] * size;
220
2/2
✓ Branch 0 taken 420929184 times.
✓ Branch 1 taken 24574224 times.
445503408 for (j = 0; j < size; j++)
221 420929184 block[stage + 1][j] = block[stage][j] - vector[j];
222 24574224 block_sum[stage + 1] = block_sum[stage] - best_vector_sum;
223 24574224 best_vector_score += lambda *
224 24574224 (+1 + 4 * count +
225 24574224 multistage_vlc[1 + count][1]
226 24574224 + mean_vlc[best_vector_mean][1]);
227
228
2/2
✓ Branch 0 taken 5416629 times.
✓ Branch 1 taken 19157595 times.
24574224 if (best_vector_score < best_score) {
229 5416629 best_score = best_vector_score;
230 5416629 best_count = count;
231 5416629 best_mean = best_vector_mean;
232 }
233 }
234 }
235
236
2/2
✓ Branch 0 taken 12 times.
✓ Branch 1 taken 4302510 times.
4302522 if (best_mean == -128)
237 12 best_mean = -127;
238
2/2
✓ Branch 0 taken 6210 times.
✓ Branch 1 taken 4296300 times.
4302510 else if (best_mean == 128)
239 6210 best_mean = 127;
240
241 4302522 split = 0;
242
4/4
✓ Branch 0 taken 4243230 times.
✓ Branch 1 taken 59292 times.
✓ Branch 2 taken 2116786 times.
✓ Branch 3 taken 2126444 times.
4302522 if (best_score > threshold && level) {
243 2116786 int score = 0;
244
2/2
✓ Branch 0 taken 1431267 times.
✓ Branch 1 taken 685519 times.
2116786 int offset = level & 1 ? stride * h / 2 : w / 2;
245 PutBitContext backup[6];
246
247
2/2
✓ Branch 0 taken 3903357 times.
✓ Branch 1 taken 2116786 times.
6020143 for (i = level - 1; i >= 0; i--)
248 3903357 backup[i] = s->reorder_pb[i];
249 2116786 score += encode_block(s, src, ref, decoded, stride, level - 1,
250 threshold >> 1, lambda, intra);
251 2116786 score += encode_block(s, src + offset, ref + offset, decoded + offset,
252 stride, level - 1, threshold >> 1, lambda, intra);
253 2116786 score += lambda;
254
255
2/2
✓ Branch 0 taken 1359243 times.
✓ Branch 1 taken 757543 times.
2116786 if (score < best_score) {
256 1359243 best_score = score;
257 1359243 split = 1;
258 } else {
259
2/2
✓ Branch 0 taken 1046147 times.
✓ Branch 1 taken 757543 times.
1803690 for (i = level - 1; i >= 0; i--)
260 1046147 s->reorder_pb[i] = backup[i];
261 }
262 }
263
2/2
✓ Branch 0 taken 2127616 times.
✓ Branch 1 taken 2174906 times.
4302522 if (level > 0)
264 2127616 put_bits(&s->reorder_pb[level], 1, split);
265
266
2/2
✓ Branch 0 taken 2943279 times.
✓ Branch 1 taken 1359243 times.
4302522 if (!split) {
267 av_assert1(best_mean >= 0 && best_mean < 256 || !intra);
268 av_assert1(best_mean >= -256 && best_mean < 256);
269 av_assert1(best_count >= 0 && best_count < 7);
270 av_assert1(level < 4 || best_count == 0);
271
272 /* output the encoding */
273 2943279 put_bits(&s->reorder_pb[level],
274 2943279 multistage_vlc[1 + best_count][1],
275 2943279 multistage_vlc[1 + best_count][0]);
276 2943279 put_bits(&s->reorder_pb[level], mean_vlc[best_mean][1],
277 2943279 mean_vlc[best_mean][0]);
278
279
2/2
✓ Branch 0 taken 3649044 times.
✓ Branch 1 taken 2943279 times.
6592323 for (i = 0; i < best_count; i++) {
280 av_assert2(best_vector[i] >= 0 && best_vector[i] < 16);
281 3649044 put_bits(&s->reorder_pb[level], 4, best_vector[i]);
282 }
283
284
2/2
✓ Branch 0 taken 7680728 times.
✓ Branch 1 taken 2943279 times.
10624007 for (y = 0; y < h; y++)
285
2/2
✓ Branch 0 taken 36196848 times.
✓ Branch 1 taken 7680728 times.
43877576 for (x = 0; x < w; x++)
286 36196848 decoded[x + y * stride] = src[x + y * stride] -
287 36196848 block[best_count][x + w * y] +
288 best_mean;
289 }
290
291 4302522 return best_score;
292 }
293
294 131005 static void init_block_index(MpegEncContext *s){
295 131005 s->block_index[0]= s->b8_stride*(s->mb_y*2 ) + s->mb_x*2;
296 131005 s->block_index[1]= s->b8_stride*(s->mb_y*2 ) + 1 + s->mb_x*2;
297 131005 s->block_index[2]= s->b8_stride*(s->mb_y*2 + 1) + s->mb_x*2;
298 131005 s->block_index[3]= s->b8_stride*(s->mb_y*2 + 1) + 1 + s->mb_x*2;
299 131005 s->block_index[4]= s->mb_stride*(s->mb_y + 1) + s->b8_stride*s->mb_height*2 + s->mb_x;
300 131005 s->block_index[5]= s->mb_stride*(s->mb_y + s->mb_height + 2) + s->b8_stride*s->mb_height*2 + s->mb_x;
301 131005 }
302
303 600 static int svq1_encode_plane(SVQ1EncContext *s, int plane,
304 PutBitContext *pb,
305 const unsigned char *src_plane,
306 unsigned char *ref_plane,
307 unsigned char *decoded_plane,
308 int width, int height, int src_stride, int stride)
309 {
310 int x, y;
311 int i;
312 int block_width, block_height;
313 int level;
314 int threshold[6];
315 600 uint8_t *src = s->scratchbuf + stride * 32;
316 600 const int lambda = (s->quality * s->quality) >>
317 (2 * FF_LAMBDA_SHIFT);
318
319 /* figure out the acceptable level thresholds in advance */
320 600 threshold[5] = QUALITY_THRESHOLD;
321
2/2
✓ Branch 0 taken 3000 times.
✓ Branch 1 taken 600 times.
3600 for (level = 4; level >= 0; level--)
322 3000 threshold[level] = threshold[level + 1] * THRESHOLD_MULTIPLIER;
323
324 600 block_width = (width + 15) / 16;
325 600 block_height = (height + 15) / 16;
326
327
2/2
✓ Branch 0 taken 540 times.
✓ Branch 1 taken 60 times.
600 if (s->pict_type == AV_PICTURE_TYPE_P) {
328 540 s->m.avctx = s->avctx;
329 540 s->m.current_picture_ptr = &s->m.current_picture;
330 540 s->m.last_picture_ptr = &s->m.last_picture;
331 540 s->m.last_picture.f->data[0] = ref_plane;
332 540 s->m.linesize =
333 540 s->m.last_picture.f->linesize[0] =
334 540 s->m.new_picture->linesize[0] =
335 540 s->m.current_picture.f->linesize[0] = stride;
336 540 s->m.width = width;
337 540 s->m.height = height;
338 540 s->m.mb_width = block_width;
339 540 s->m.mb_height = block_height;
340 540 s->m.mb_stride = s->m.mb_width + 1;
341 540 s->m.b8_stride = 2 * s->m.mb_width + 1;
342 540 s->m.f_code = 1;
343 540 s->m.pict_type = s->pict_type;
344 540 s->m.motion_est = s->motion_est;
345 540 s->m.me.scene_change_score = 0;
346 // s->m.out_format = FMT_H263;
347 // s->m.unrestricted_mv = 1;
348 540 s->m.lambda = s->quality;
349 540 s->m.qscale = s->m.lambda * 139 +
350 540 FF_LAMBDA_SCALE * 64 >>
351 FF_LAMBDA_SHIFT + 7;
352 540 s->m.lambda2 = s->m.lambda * s->m.lambda +
353 540 FF_LAMBDA_SCALE / 2 >>
354 FF_LAMBDA_SHIFT;
355
356
2/2
✓ Branch 0 taken 12 times.
✓ Branch 1 taken 528 times.
540 if (!s->motion_val8[plane]) {
357 24 s->motion_val8[plane] = av_mallocz((s->m.b8_stride *
358 12 block_height * 2 + 2) *
359 2 * sizeof(int16_t));
360 24 s->motion_val16[plane] = av_mallocz((s->m.mb_stride *
361 12 (block_height + 2) + 1) *
362 2 * sizeof(int16_t));
363
2/4
✓ Branch 0 taken 12 times.
✗ Branch 1 not taken.
✗ Branch 2 not taken.
✓ Branch 3 taken 12 times.
12 if (!s->motion_val8[plane] || !s->motion_val16[plane])
364 return AVERROR(ENOMEM);
365 }
366
367 540 s->m.mb_type = s->mb_type;
368
369 // dummies, to avoid segfaults
370 540 s->m.mb_mean = (uint8_t *)s->dummy;
371 540 s->m.mb_var = (uint16_t *)s->dummy;
372 540 s->m.mc_mb_var = (uint16_t *)s->dummy;
373 540 s->m.current_picture.mb_type = s->dummy;
374
375 540 s->m.current_picture.motion_val[0] = s->motion_val8[plane] + 2;
376 540 s->m.p_mv_table = s->motion_val16[plane] +
377 540 s->m.mb_stride + 1;
378 540 s->m.mecc = s->mecc; // move
379 540 ff_init_me(&s->m);
380
381 540 s->m.me.dia_size = s->avctx->dia_size;
382 540 s->m.first_slice_line = 1;
383
2/2
✓ Branch 0 taken 4005 times.
✓ Branch 1 taken 540 times.
4545 for (y = 0; y < block_height; y++) {
384 4005 s->m.new_picture->data[0] = src - y * 16 * stride; // ugly
385 4005 s->m.mb_y = y;
386
387
4/4
✓ Branch 0 taken 60975 times.
✓ Branch 1 taken 3600 times.
✓ Branch 2 taken 60570 times.
✓ Branch 3 taken 405 times.
64575 for (i = 0; i < 16 && i + 16 * y < height; i++) {
388 60570 memcpy(&src[i * stride], &src_plane[(i + 16 * y) * src_stride],
389 width);
390
2/2
✓ Branch 0 taken 182700 times.
✓ Branch 1 taken 60570 times.
243270 for (x = width; x < 16 * block_width; x++)
391 182700 src[i * stride + x] = src[i * stride + x - 1];
392 }
393
3/4
✓ Branch 0 taken 3510 times.
✓ Branch 1 taken 4005 times.
✓ Branch 2 taken 3510 times.
✗ Branch 3 not taken.
7515 for (; i < 16 && i + 16 * y < 16 * block_height; i++)
394 3510 memcpy(&src[i * stride], &src[(i - 1) * stride],
395 3510 16 * block_width);
396
397
2/2
✓ Branch 0 taken 62055 times.
✓ Branch 1 taken 4005 times.
66060 for (x = 0; x < block_width; x++) {
398 62055 s->m.mb_x = x;
399 62055 init_block_index(&s->m);
400
401 62055 ff_estimate_p_frame_motion(&s->m, x, y);
402 }
403 4005 s->m.first_slice_line = 0;
404 }
405
406 540 ff_fix_long_p_mvs(&s->m, CANDIDATE_MB_TYPE_INTRA);
407 540 ff_fix_long_mvs(&s->m, NULL, 0, s->m.p_mv_table, s->m.f_code,
408 CANDIDATE_MB_TYPE_INTER, 0);
409 }
410
411 600 s->m.first_slice_line = 1;
412
2/2
✓ Branch 0 taken 4450 times.
✓ Branch 1 taken 600 times.
5050 for (y = 0; y < block_height; y++) {
413
4/4
✓ Branch 0 taken 67750 times.
✓ Branch 1 taken 4000 times.
✓ Branch 2 taken 67300 times.
✓ Branch 3 taken 450 times.
71750 for (i = 0; i < 16 && i + 16 * y < height; i++) {
414 67300 memcpy(&src[i * stride], &src_plane[(i + 16 * y) * src_stride],
415 width);
416
2/2
✓ Branch 0 taken 203000 times.
✓ Branch 1 taken 67300 times.
270300 for (x = width; x < 16 * block_width; x++)
417 203000 src[i * stride + x] = src[i * stride + x - 1];
418 }
419
3/4
✓ Branch 0 taken 3900 times.
✓ Branch 1 taken 4450 times.
✓ Branch 2 taken 3900 times.
✗ Branch 3 not taken.
8350 for (; i < 16 && i + 16 * y < 16 * block_height; i++)
420 3900 memcpy(&src[i * stride], &src[(i - 1) * stride], 16 * block_width);
421
422 4450 s->m.mb_y = y;
423
2/2
✓ Branch 0 taken 68950 times.
✓ Branch 1 taken 4450 times.
73400 for (x = 0; x < block_width; x++) {
424 uint8_t reorder_buffer[2][6][7 * 32];
425 int count[2][6];
426 68950 int offset = y * 16 * stride + x * 16;
427 68950 uint8_t *decoded = decoded_plane + offset;
428 68950 const uint8_t *ref = ref_plane + offset;
429 68950 int score[4] = { 0, 0, 0, 0 }, best;
430 68950 uint8_t *temp = s->scratchbuf;
431
432
1/2
✗ Branch 1 not taken.
✓ Branch 2 taken 68950 times.
68950 if (put_bytes_left(pb, 0) < 3000) { // FIXME: check size
433 av_log(s->avctx, AV_LOG_ERROR, "encoded frame too large\n");
434 return -1;
435 }
436
437 68950 s->m.mb_x = x;
438 68950 init_block_index(&s->m);
439
440
2/2
✓ Branch 0 taken 62055 times.
✓ Branch 1 taken 6895 times.
68950 if (s->pict_type == AV_PICTURE_TYPE_I ||
441
2/2
✓ Branch 0 taken 3450 times.
✓ Branch 1 taken 58605 times.
62055 (s->m.mb_type[x + y * s->m.mb_stride] &
442 CANDIDATE_MB_TYPE_INTRA)) {
443
2/2
✓ Branch 0 taken 62070 times.
✓ Branch 1 taken 10345 times.
72415 for (i = 0; i < 6; i++)
444 62070 init_put_bits(&s->reorder_pb[i], reorder_buffer[0][i],
445 7 * 32);
446
2/2
✓ Branch 0 taken 3450 times.
✓ Branch 1 taken 6895 times.
10345 if (s->pict_type == AV_PICTURE_TYPE_P) {
447 3450 put_bits(&s->reorder_pb[5], SVQ1_BLOCK_INTRA_LEN, SVQ1_BLOCK_INTRA_CODE);
448 3450 score[0] = SVQ1_BLOCK_INTRA_LEN * lambda;
449 }
450 10345 score[0] += encode_block(s, src + 16 * x, NULL, temp, stride,
451 5, 64, lambda, 1);
452
2/2
✓ Branch 0 taken 62070 times.
✓ Branch 1 taken 10345 times.
72415 for (i = 0; i < 6; i++) {
453 62070 count[0][i] = put_bits_count(&s->reorder_pb[i]);
454 62070 flush_put_bits(&s->reorder_pb[i]);
455 }
456 } else
457 58605 score[0] = INT_MAX;
458
459 68950 best = 0;
460
461
2/2
✓ Branch 0 taken 62055 times.
✓ Branch 1 taken 6895 times.
68950 if (s->pict_type == AV_PICTURE_TYPE_P) {
462 int mx, my, pred_x, pred_y, dxy;
463 int16_t *motion_ptr;
464
465 62055 motion_ptr = ff_h263_pred_motion(&s->m, 0, 0, &pred_x, &pred_y);
466
2/2
✓ Branch 0 taken 58605 times.
✓ Branch 1 taken 3450 times.
62055 if (s->m.mb_type[x + y * s->m.mb_stride] &
467 CANDIDATE_MB_TYPE_INTER) {
468
2/2
✓ Branch 0 taken 351630 times.
✓ Branch 1 taken 58605 times.
410235 for (i = 0; i < 6; i++)
469 351630 init_put_bits(&s->reorder_pb[i], reorder_buffer[1][i],
470 7 * 32);
471
472 58605 put_bits(&s->reorder_pb[5], SVQ1_BLOCK_INTER_LEN, SVQ1_BLOCK_INTER_CODE);
473
474 58605 s->m.pb = s->reorder_pb[5];
475 58605 mx = motion_ptr[0];
476 58605 my = motion_ptr[1];
477 av_assert1(mx >= -32 && mx <= 31);
478 av_assert1(my >= -32 && my <= 31);
479 av_assert1(pred_x >= -32 && pred_x <= 31);
480 av_assert1(pred_y >= -32 && pred_y <= 31);
481 58605 ff_h263_encode_motion(&s->m.pb, mx - pred_x, 1);
482 58605 ff_h263_encode_motion(&s->m.pb, my - pred_y, 1);
483 58605 s->reorder_pb[5] = s->m.pb;
484 58605 score[1] += lambda * put_bits_count(&s->reorder_pb[5]);
485
486 58605 dxy = (mx & 1) + 2 * (my & 1);
487
488 58605 s->hdsp.put_pixels_tab[0][dxy](temp + 16*stride,
489 58605 ref + (mx >> 1) +
490 58605 stride * (my >> 1),
491 stride, 16);
492
493 58605 score[1] += encode_block(s, src + 16 * x, temp + 16*stride,
494 decoded, stride, 5, 64, lambda, 0);
495 58605 best = score[1] <= score[0];
496
497 58605 score[2] = s->mecc.sse[0](NULL, src + 16 * x, ref,
498 stride, 16);
499 58605 score[2] += SVQ1_BLOCK_SKIP_LEN * lambda;
500
6/6
✓ Branch 0 taken 119 times.
✓ Branch 1 taken 58486 times.
✓ Branch 2 taken 88 times.
✓ Branch 3 taken 31 times.
✓ Branch 4 taken 83 times.
✓ Branch 5 taken 5 times.
58605 if (score[2] < score[best] && mx == 0 && my == 0) {
501 83 best = 2;
502 83 s->hdsp.put_pixels_tab[0][0](decoded, ref, stride, 16);
503 83 put_bits(pb, SVQ1_BLOCK_SKIP_LEN, SVQ1_BLOCK_SKIP_CODE);
504 }
505 }
506
507
2/2
✓ Branch 0 taken 58522 times.
✓ Branch 1 taken 3533 times.
62055 if (best == 1) {
508
2/2
✓ Branch 0 taken 351132 times.
✓ Branch 1 taken 58522 times.
409654 for (i = 0; i < 6; i++) {
509 351132 count[1][i] = put_bits_count(&s->reorder_pb[i]);
510 351132 flush_put_bits(&s->reorder_pb[i]);
511 }
512 } else {
513 3533 motion_ptr[0] =
514 3533 motion_ptr[1] =
515 3533 motion_ptr[2] =
516 3533 motion_ptr[3] =
517 3533 motion_ptr[0 + 2 * s->m.b8_stride] =
518 3533 motion_ptr[1 + 2 * s->m.b8_stride] =
519 3533 motion_ptr[2 + 2 * s->m.b8_stride] =
520 3533 motion_ptr[3 + 2 * s->m.b8_stride] = 0;
521 }
522 }
523
524 68950 s->rd_total += score[best];
525
526
2/2
✓ Branch 0 taken 68867 times.
✓ Branch 1 taken 83 times.
68950 if (best != 2)
527
2/2
✓ Branch 0 taken 413202 times.
✓ Branch 1 taken 68867 times.
482069 for (i = 5; i >= 0; i--)
528 413202 ff_copy_bits(pb, reorder_buffer[best][i],
529 count[best][i]);
530
2/2
✓ Branch 0 taken 10345 times.
✓ Branch 1 taken 58605 times.
68950 if (best == 0)
531 10345 s->hdsp.put_pixels_tab[0][0](decoded, temp, stride, 16);
532 }
533 4450 s->m.first_slice_line = 0;
534 }
535 600 return 0;
536 }
537
538 4 static av_cold int svq1_encode_end(AVCodecContext *avctx)
539 {
540 4 SVQ1EncContext *const s = avctx->priv_data;
541 int i;
542
543
1/2
✓ Branch 0 taken 4 times.
✗ Branch 1 not taken.
4 if (avctx->frame_num)
544 4 av_log(avctx, AV_LOG_DEBUG, "RD: %f\n",
545 4 s->rd_total / (double)(avctx->width * avctx->height *
546 4 avctx->frame_num));
547
548 4 s->m.mb_type = NULL;
549 4 ff_mpv_common_end(&s->m);
550
551 4 av_freep(&s->m.me.scratchpad);
552 4 av_freep(&s->m.me.map);
553 4 av_freep(&s->mb_type);
554 4 av_freep(&s->dummy);
555 4 av_freep(&s->scratchbuf);
556
557
2/2
✓ Branch 0 taken 12 times.
✓ Branch 1 taken 4 times.
16 for (i = 0; i < 3; i++) {
558 12 av_freep(&s->motion_val8[i]);
559 12 av_freep(&s->motion_val16[i]);
560 }
561
562 4 av_frame_free(&s->current_picture);
563 4 av_frame_free(&s->last_picture);
564 4 av_frame_free(&s->m.new_picture);
565
566 4 return 0;
567 }
568
569 4 static av_cold int write_ident(AVCodecContext *avctx, const char *ident)
570 {
571 4 int size = strlen(ident);
572 4 avctx->extradata = av_malloc(size + 8);
573
1/2
✗ Branch 0 not taken.
✓ Branch 1 taken 4 times.
4 if (!avctx->extradata)
574 return AVERROR(ENOMEM);
575 4 AV_WB32(avctx->extradata, size + 8);
576 4 AV_WL32(avctx->extradata + 4, MKTAG('S', 'V', 'Q', '1'));
577 4 memcpy(avctx->extradata + 8, ident, size);
578 4 avctx->extradata_size = size + 8;
579 4 return 0;
580 }
581
582 4 static av_cold int svq1_encode_init(AVCodecContext *avctx)
583 {
584 4 SVQ1EncContext *const s = avctx->priv_data;
585 int ret;
586
587
2/4
✓ Branch 0 taken 4 times.
✗ Branch 1 not taken.
✗ Branch 2 not taken.
✓ Branch 3 taken 4 times.
4 if (avctx->width >= 4096 || avctx->height >= 4096) {
588 av_log(avctx, AV_LOG_ERROR, "Dimensions too large, maximum is 4095x4095\n");
589 return AVERROR(EINVAL);
590 }
591
592 4 ff_hpeldsp_init(&s->hdsp, avctx->flags);
593 4 ff_me_cmp_init(&s->mecc, avctx);
594 4 ff_mpegvideoencdsp_init(&s->m.mpvencdsp, avctx);
595
596 4 s->current_picture = av_frame_alloc();
597 4 s->last_picture = av_frame_alloc();
598
2/4
✓ Branch 0 taken 4 times.
✗ Branch 1 not taken.
✗ Branch 2 not taken.
✓ Branch 3 taken 4 times.
4 if (!s->current_picture || !s->last_picture) {
599 return AVERROR(ENOMEM);
600 }
601
602 4 s->frame_width = avctx->width;
603 4 s->frame_height = avctx->height;
604
605 4 s->y_block_width = (s->frame_width + 15) / 16;
606 4 s->y_block_height = (s->frame_height + 15) / 16;
607
608 4 s->c_block_width = (s->frame_width / 4 + 15) / 16;
609 4 s->c_block_height = (s->frame_height / 4 + 15) / 16;
610
611 4 s->avctx = avctx;
612 4 s->m.avctx = avctx;
613
614
1/2
✗ Branch 1 not taken.
✓ Branch 2 taken 4 times.
4 if ((ret = ff_mpv_common_init(&s->m)) < 0) {
615 return ret;
616 }
617
618 4 s->m.picture_structure = PICT_FRAME;
619 4 s->m.me.temp =
620 8 s->m.me.scratchpad = av_mallocz((avctx->width + 64) *
621 4 2 * 16 * 2 * sizeof(uint8_t));
622 8 s->mb_type = av_mallocz((s->y_block_width + 1) *
623 4 s->y_block_height * sizeof(int16_t));
624 8 s->dummy = av_mallocz((s->y_block_width + 1) *
625 4 s->y_block_height * sizeof(int32_t));
626 4 s->m.me.map = av_mallocz(2 * ME_MAP_SIZE * sizeof(*s->m.me.map));
627 4 s->m.new_picture = av_frame_alloc();
628
629
2/4
✓ Branch 0 taken 4 times.
✗ Branch 1 not taken.
✓ Branch 2 taken 4 times.
✗ Branch 3 not taken.
4 if (!s->m.me.scratchpad || !s->m.me.map ||
630
3/6
✓ Branch 0 taken 4 times.
✗ Branch 1 not taken.
✓ Branch 2 taken 4 times.
✗ Branch 3 not taken.
✗ Branch 4 not taken.
✓ Branch 5 taken 4 times.
4 !s->mb_type || !s->dummy || !s->m.new_picture)
631 return AVERROR(ENOMEM);
632 4 s->m.me.score_map = s->m.me.map + ME_MAP_SIZE;
633
634 4 ff_svq1enc_init(&s->svq1encdsp);
635
636 4 ff_h263_encode_init(&s->m); // mv_penalty
637
638
1/2
✓ Branch 0 taken 4 times.
✗ Branch 1 not taken.
4 return write_ident(avctx, s->avctx->flags & AV_CODEC_FLAG_BITEXACT ? "Lavc" : LIBAVCODEC_IDENT);
639 }
640
641 200 static int svq1_encode_frame(AVCodecContext *avctx, AVPacket *pkt,
642 const AVFrame *pict, int *got_packet)
643 {
644 200 SVQ1EncContext *const s = avctx->priv_data;
645 PutBitContext pb;
646 int i, ret;
647
648 200 ret = ff_alloc_packet(avctx, pkt, s->y_block_width * s->y_block_height *
649 200 MAX_MB_BYTES * 3 + FF_INPUT_BUFFER_MIN_SIZE);
650
1/2
✗ Branch 0 not taken.
✓ Branch 1 taken 200 times.
200 if (ret < 0)
651 return ret;
652
653
1/2
✗ Branch 0 not taken.
✓ Branch 1 taken 200 times.
200 if (avctx->pix_fmt != AV_PIX_FMT_YUV410P) {
654 av_log(avctx, AV_LOG_ERROR, "unsupported pixel format\n");
655 return -1;
656 }
657
658
2/2
✓ Branch 0 taken 4 times.
✓ Branch 1 taken 196 times.
200 if (!s->current_picture->data[0]) {
659
1/2
✗ Branch 1 not taken.
✓ Branch 2 taken 4 times.
4 if ((ret = ff_encode_alloc_frame(avctx, s->current_picture)) < 0) {
660 return ret;
661 }
662 }
663
2/2
✓ Branch 0 taken 4 times.
✓ Branch 1 taken 196 times.
200 if (!s->last_picture->data[0]) {
664 4 ret = ff_encode_alloc_frame(avctx, s->last_picture);
665
1/2
✗ Branch 0 not taken.
✓ Branch 1 taken 4 times.
4 if (ret < 0)
666 return ret;
667 }
668
2/2
✓ Branch 0 taken 4 times.
✓ Branch 1 taken 196 times.
200 if (!s->scratchbuf) {
669 4 s->scratchbuf = av_malloc_array(s->current_picture->linesize[0], 16 * 3);
670
1/2
✗ Branch 0 not taken.
✓ Branch 1 taken 4 times.
4 if (!s->scratchbuf)
671 return AVERROR(ENOMEM);
672 }
673
674 200 FFSWAP(AVFrame*, s->current_picture, s->last_picture);
675
676
3/4
✓ Branch 0 taken 200 times.
✗ Branch 1 not taken.
✓ Branch 2 taken 180 times.
✓ Branch 3 taken 20 times.
200 if (avctx->gop_size && (avctx->frame_num % avctx->gop_size))
677 180 s->pict_type = AV_PICTURE_TYPE_P;
678 else
679 20 s->pict_type = AV_PICTURE_TYPE_I;
680 200 s->quality = pict->quality;
681
682 200 ff_side_data_set_encoder_stats(pkt, pict->quality, NULL, 0, s->pict_type);
683
684 200 init_put_bits(&pb, pkt->data, pkt->size);
685 200 svq1_write_header(s, &pb, s->pict_type);
686
2/2
✓ Branch 0 taken 600 times.
✓ Branch 1 taken 200 times.
800 for (i = 0; i < 3; i++) {
687 1800 int ret = svq1_encode_plane(s, i, &pb,
688 600 pict->data[i],
689 600 s->last_picture->data[i],
690 600 s->current_picture->data[i],
691
2/2
✓ Branch 0 taken 400 times.
✓ Branch 1 taken 200 times.
600 s->frame_width / (i ? 4 : 1),
692 600 s->frame_height / (i ? 4 : 1),
693 600 pict->linesize[i],
694
2/2
✓ Branch 0 taken 400 times.
✓ Branch 1 taken 200 times.
600 s->current_picture->linesize[i]);
695 600 emms_c();
696
1/2
✗ Branch 0 not taken.
✓ Branch 1 taken 600 times.
600 if (ret < 0) {
697 int j;
698 for (j = 0; j < i; j++) {
699 av_freep(&s->motion_val8[j]);
700 av_freep(&s->motion_val16[j]);
701 }
702 av_freep(&s->scratchbuf);
703 return -1;
704 }
705 }
706
707 // align_put_bits(&pb);
708
2/2
✓ Branch 1 taken 3154 times.
✓ Branch 2 taken 200 times.
3354 while (put_bits_count(&pb) & 31)
709 3154 put_bits(&pb, 1, 0);
710
711 200 flush_put_bits(&pb);
712
713 200 pkt->size = put_bytes_output(&pb);
714
2/2
✓ Branch 0 taken 20 times.
✓ Branch 1 taken 180 times.
200 if (s->pict_type == AV_PICTURE_TYPE_I)
715 20 pkt->flags |= AV_PKT_FLAG_KEY;
716 200 *got_packet = 1;
717
718 200 return 0;
719 }
720
721 #define OFFSET(x) offsetof(struct SVQ1EncContext, x)
722 #define VE AV_OPT_FLAG_VIDEO_PARAM | AV_OPT_FLAG_ENCODING_PARAM
723 static const AVOption options[] = {
724 { "motion-est", "Motion estimation algorithm", OFFSET(motion_est), AV_OPT_TYPE_INT, { .i64 = FF_ME_EPZS }, FF_ME_ZERO, FF_ME_XONE, VE, .unit = "motion-est"},
725 { "zero", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = FF_ME_ZERO }, 0, 0, FF_MPV_OPT_FLAGS, .unit = "motion-est" },
726 { "epzs", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = FF_ME_EPZS }, 0, 0, FF_MPV_OPT_FLAGS, .unit = "motion-est" },
727 { "xone", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = FF_ME_XONE }, 0, 0, FF_MPV_OPT_FLAGS, .unit = "motion-est" },
728
729 { NULL },
730 };
731
732 static const AVClass svq1enc_class = {
733 .class_name = "svq1enc",
734 .item_name = av_default_item_name,
735 .option = options,
736 .version = LIBAVUTIL_VERSION_INT,
737 };
738
739 const FFCodec ff_svq1_encoder = {
740 .p.name = "svq1",
741 CODEC_LONG_NAME("Sorenson Vector Quantizer 1 / Sorenson Video 1 / SVQ1"),
742 .p.type = AVMEDIA_TYPE_VIDEO,
743 .p.id = AV_CODEC_ID_SVQ1,
744 .p.capabilities = AV_CODEC_CAP_DR1 | AV_CODEC_CAP_ENCODER_REORDERED_OPAQUE,
745 .priv_data_size = sizeof(SVQ1EncContext),
746 .p.priv_class = &svq1enc_class,
747 .init = svq1_encode_init,
748 FF_CODEC_ENCODE_CB(svq1_encode_frame),
749 .close = svq1_encode_end,
750 .p.pix_fmts = (const enum AVPixelFormat[]) { AV_PIX_FMT_YUV410P,
751 AV_PIX_FMT_NONE },
752 .caps_internal = FF_CODEC_CAP_INIT_CLEANUP,
753 };
754