FFmpeg coverage


Directory: ../../../ffmpeg/
File: src/libavcodec/svq1enc.c
Date: 2024-07-26 21:54:09
Exec Total Coverage
Lines: 360 381 94.5%
Functions: 8 8 100.0%
Branches: 167 196 85.2%

Line Branch Exec Source
1 /*
2 * SVQ1 Encoder
3 * Copyright (C) 2004 Mike Melanson <melanson@pcisys.net>
4 *
5 * This file is part of FFmpeg.
6 *
7 * FFmpeg is free software; you can redistribute it and/or
8 * modify it under the terms of the GNU Lesser General Public
9 * License as published by the Free Software Foundation; either
10 * version 2.1 of the License, or (at your option) any later version.
11 *
12 * FFmpeg is distributed in the hope that it will be useful,
13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
15 * Lesser General Public License for more details.
16 *
17 * You should have received a copy of the GNU Lesser General Public
18 * License along with FFmpeg; if not, write to the Free Software
19 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
20 */
21
22 /**
23 * @file
24 * Sorenson Vector Quantizer #1 (SVQ1) video codec.
25 * For more information of the SVQ1 algorithm, visit:
26 * http://www.pcisys.net/~melanson/codecs/
27 */
28
29 #include "libavutil/emms.h"
30 #include "libavutil/mem.h"
31 #include "avcodec.h"
32 #include "codec_internal.h"
33 #include "encode.h"
34 #include "hpeldsp.h"
35 #include "me_cmp.h"
36 #include "mpegvideo.h"
37 #include "h263.h"
38 #include "h263enc.h"
39 #include "internal.h"
40 #include "mpegutils.h"
41 #include "packet_internal.h"
42 #include "put_bits.h"
43 #include "svq1.h"
44 #include "svq1encdsp.h"
45 #include "svq1enc_cb.h"
46 #include "version.h"
47
48 #include "libavutil/avassert.h"
49 #include "libavutil/frame.h"
50 #include "libavutil/mem_internal.h"
51
52 // Workaround for GCC bug 102513
53 #if AV_GCC_VERSION_AT_LEAST(10, 0) && AV_GCC_VERSION_AT_MOST(12, 0) \
54 && !defined(__clang__) && !defined(__INTEL_COMPILER)
55 #pragma GCC optimize ("no-ipa-cp-clone")
56 #endif
57
58 typedef struct SVQ1EncContext {
59 /* FIXME: Needed for motion estimation, should not be used for anything
60 * else, the idea is to make the motion estimation eventually independent
61 * of MpegEncContext, so this will be removed then. */
62 MpegEncContext m;
63 AVCodecContext *avctx;
64 MECmpContext mecc;
65 HpelDSPContext hdsp;
66 AVFrame *current_picture;
67 AVFrame *last_picture;
68
69 /* Some compression statistics */
70 enum AVPictureType pict_type;
71 int quality;
72
73 /* why ooh why this sick breadth first order,
74 * everything is slower and more complex */
75 PutBitContext reorder_pb[6];
76
77 int frame_width;
78 int frame_height;
79
80 /* Y plane block dimensions */
81 int y_block_width;
82 int y_block_height;
83
84 /* U & V plane (C planes) block dimensions */
85 int c_block_width;
86 int c_block_height;
87
88 DECLARE_ALIGNED(16, int16_t, encoded_block_levels)[6][7][256];
89
90 uint16_t *mb_type;
91 uint32_t *dummy;
92 int16_t (*motion_val8[3])[2];
93 int16_t (*motion_val16[3])[2];
94
95 int64_t rd_total;
96
97 uint8_t *scratchbuf;
98
99 int motion_est;
100
101 SVQ1EncDSPContext svq1encdsp;
102 } SVQ1EncContext;
103
104 200 static void svq1_write_header(SVQ1EncContext *s, PutBitContext *pb, int frame_type)
105 {
106 int i;
107
108 /* frame code */
109 200 put_bits(pb, 22, 0x20);
110
111 /* temporal reference (sure hope this is a "don't care") */
112 200 put_bits(pb, 8, 0x00);
113
114 /* frame type */
115 200 put_bits(pb, 2, frame_type - 1);
116
117
2/2
✓ Branch 0 taken 20 times.
✓ Branch 1 taken 180 times.
200 if (frame_type == AV_PICTURE_TYPE_I) {
118 /* no checksum since frame code is 0x20 */
119 /* no embedded string either */
120 /* output 5 unknown bits (2 + 2 + 1) */
121 20 put_bits(pb, 5, 2); /* 2 needed by quicktime decoder */
122
123 20 i = ff_match_2uint16(ff_svq1_frame_size_table,
124 FF_ARRAY_ELEMS(ff_svq1_frame_size_table),
125 s->frame_width, s->frame_height);
126 20 put_bits(pb, 3, i);
127
128
2/2
✓ Branch 0 taken 5 times.
✓ Branch 1 taken 15 times.
20 if (i == 7) {
129 5 put_bits(pb, 12, s->frame_width);
130 5 put_bits(pb, 12, s->frame_height);
131 }
132 }
133
134 /* no checksum or extra data (next 2 bits get 0) */
135 200 put_bits(pb, 2, 0);
136 200 }
137
138 #define QUALITY_THRESHOLD 100
139 #define THRESHOLD_MULTIPLIER 0.6
140
141 4302522 static int encode_block(SVQ1EncContext *s, uint8_t *src, uint8_t *ref,
142 uint8_t *decoded, int stride, unsigned level,
143 int threshold, int lambda, int intra)
144 {
145 int count, y, x, i, j, split, best_mean, best_score, best_count;
146 int best_vector[6];
147 4302522 int block_sum[7] = { 0, 0, 0, 0, 0, 0 };
148 4302522 int w = 2 << (level + 2 >> 1);
149 4302522 int h = 2 << (level + 1 >> 1);
150 4302522 int size = w * h;
151 4302522 int16_t (*block)[256] = s->encoded_block_levels[level];
152 const int8_t *codebook_sum, *codebook;
153 const uint16_t(*mean_vlc)[2];
154 const uint8_t(*multistage_vlc)[2];
155
156 4302522 best_score = 0;
157 // FIXME: Optimize, this does not need to be done multiple times.
158
2/2
✓ Branch 0 taken 643715 times.
✓ Branch 1 taken 3658807 times.
4302522 if (intra) {
159 // level is 5 when encode_block is called from svq1_encode_plane
160 // and always < 4 when called recursively from this function.
161
2/2
✓ Branch 0 taken 612686 times.
✓ Branch 1 taken 31029 times.
643715 codebook_sum = level < 4 ? svq1_intra_codebook_sum[level] : NULL;
162 643715 codebook = ff_svq1_intra_codebooks[level];
163 643715 mean_vlc = ff_svq1_intra_mean_vlc;
164 643715 multistage_vlc = ff_svq1_intra_multistage_vlc[level];
165
2/2
✓ Branch 0 taken 2296676 times.
✓ Branch 1 taken 643715 times.
2940391 for (y = 0; y < h; y++) {
166
2/2
✓ Branch 0 taken 15798160 times.
✓ Branch 1 taken 2296676 times.
18094836 for (x = 0; x < w; x++) {
167 15798160 int v = src[x + y * stride];
168 15798160 block[0][x + w * y] = v;
169 15798160 best_score += v * v;
170 15798160 block_sum[0] += v;
171 }
172 }
173 } else {
174 // level is 5 or < 4, see above for details.
175
2/2
✓ Branch 0 taken 3483018 times.
✓ Branch 1 taken 175789 times.
3658807 codebook_sum = level < 4 ? svq1_inter_codebook_sum[level] : NULL;
176 3658807 codebook = ff_svq1_inter_codebooks[level];
177 3658807 mean_vlc = ff_svq1_inter_mean_vlc + 256;
178 3658807 multistage_vlc = ff_svq1_inter_multistage_vlc[level];
179
2/2
✓ Branch 0 taken 13044696 times.
✓ Branch 1 taken 3658807 times.
16703503 for (y = 0; y < h; y++) {
180
2/2
✓ Branch 0 taken 89655008 times.
✓ Branch 1 taken 13044696 times.
102699704 for (x = 0; x < w; x++) {
181 89655008 int v = src[x + y * stride] - ref[x + y * stride];
182 89655008 block[0][x + w * y] = v;
183 89655008 best_score += v * v;
184 89655008 block_sum[0] += v;
185 }
186 }
187 }
188
189 4302522 best_count = 0;
190 4302522 best_score -= (int)((unsigned)block_sum[0] * block_sum[0] >> (level + 3));
191 4302522 best_mean = block_sum[0] + (size >> 1) >> (level + 3);
192
193
2/2
✓ Branch 0 taken 4095704 times.
✓ Branch 1 taken 206818 times.
4302522 if (level < 4) {
194
2/2
✓ Branch 0 taken 24574224 times.
✓ Branch 1 taken 4095704 times.
28669928 for (count = 1; count < 7; count++) {
195 24574224 int best_vector_score = INT_MAX;
196 24574224 int best_vector_sum = -999, best_vector_mean = -999;
197 24574224 const int stage = count - 1;
198 const int8_t *vector;
199
200
2/2
✓ Branch 0 taken 393187584 times.
✓ Branch 1 taken 24574224 times.
417761808 for (i = 0; i < 16; i++) {
201 393187584 int sum = codebook_sum[stage * 16 + i];
202 int sqr, diff, score;
203
204 393187584 vector = codebook + stage * size * 16 + i * size;
205 393187584 sqr = s->svq1encdsp.ssd_int8_vs_int16(vector, block[stage], size);
206 393187584 diff = block_sum[stage] - sum;
207 393187584 score = sqr - (diff * (int64_t)diff >> (level + 3)); // FIXME: 64 bits slooow
208
2/2
✓ Branch 0 taken 65426753 times.
✓ Branch 1 taken 327760831 times.
393187584 if (score < best_vector_score) {
209 65426753 int mean = diff + (size >> 1) >> (level + 3);
210 av_assert2(mean > -300 && mean < 300);
211
2/2
✓ Branch 0 taken 9912177 times.
✓ Branch 1 taken 55514576 times.
65426753 mean = av_clip(mean, intra ? 0 : -256, 255);
212 65426753 best_vector_score = score;
213 65426753 best_vector[stage] = i;
214 65426753 best_vector_sum = sum;
215 65426753 best_vector_mean = mean;
216 }
217 }
218
1/2
✗ Branch 0 not taken.
✓ Branch 1 taken 24574224 times.
24574224 av_assert0(best_vector_mean != -999);
219 24574224 vector = codebook + stage * size * 16 + best_vector[stage] * size;
220
2/2
✓ Branch 0 taken 420929184 times.
✓ Branch 1 taken 24574224 times.
445503408 for (j = 0; j < size; j++)
221 420929184 block[stage + 1][j] = block[stage][j] - vector[j];
222 24574224 block_sum[stage + 1] = block_sum[stage] - best_vector_sum;
223 24574224 best_vector_score += lambda *
224 24574224 (+1 + 4 * count +
225 24574224 multistage_vlc[1 + count][1]
226 24574224 + mean_vlc[best_vector_mean][1]);
227
228
2/2
✓ Branch 0 taken 5416629 times.
✓ Branch 1 taken 19157595 times.
24574224 if (best_vector_score < best_score) {
229 5416629 best_score = best_vector_score;
230 5416629 best_count = count;
231 5416629 best_mean = best_vector_mean;
232 }
233 }
234 }
235
236
2/2
✓ Branch 0 taken 12 times.
✓ Branch 1 taken 4302510 times.
4302522 if (best_mean == -128)
237 12 best_mean = -127;
238
2/2
✓ Branch 0 taken 6210 times.
✓ Branch 1 taken 4296300 times.
4302510 else if (best_mean == 128)
239 6210 best_mean = 127;
240
241 4302522 split = 0;
242
4/4
✓ Branch 0 taken 4243230 times.
✓ Branch 1 taken 59292 times.
✓ Branch 2 taken 2116786 times.
✓ Branch 3 taken 2126444 times.
4302522 if (best_score > threshold && level) {
243 2116786 int score = 0;
244
2/2
✓ Branch 0 taken 1431267 times.
✓ Branch 1 taken 685519 times.
2116786 int offset = level & 1 ? stride * h / 2 : w / 2;
245 PutBitContext backup[6];
246
247
2/2
✓ Branch 0 taken 3903357 times.
✓ Branch 1 taken 2116786 times.
6020143 for (i = level - 1; i >= 0; i--)
248 3903357 backup[i] = s->reorder_pb[i];
249 2116786 score += encode_block(s, src, ref, decoded, stride, level - 1,
250 threshold >> 1, lambda, intra);
251 2116786 score += encode_block(s, src + offset, ref + offset, decoded + offset,
252 stride, level - 1, threshold >> 1, lambda, intra);
253 2116786 score += lambda;
254
255
2/2
✓ Branch 0 taken 1359243 times.
✓ Branch 1 taken 757543 times.
2116786 if (score < best_score) {
256 1359243 best_score = score;
257 1359243 split = 1;
258 } else {
259
2/2
✓ Branch 0 taken 1046147 times.
✓ Branch 1 taken 757543 times.
1803690 for (i = level - 1; i >= 0; i--)
260 1046147 s->reorder_pb[i] = backup[i];
261 }
262 }
263
2/2
✓ Branch 0 taken 2127616 times.
✓ Branch 1 taken 2174906 times.
4302522 if (level > 0)
264 2127616 put_bits(&s->reorder_pb[level], 1, split);
265
266
2/2
✓ Branch 0 taken 2943279 times.
✓ Branch 1 taken 1359243 times.
4302522 if (!split) {
267 av_assert1(best_mean >= 0 && best_mean < 256 || !intra);
268 av_assert1(best_mean >= -256 && best_mean < 256);
269 av_assert1(best_count >= 0 && best_count < 7);
270 av_assert1(level < 4 || best_count == 0);
271
272 /* output the encoding */
273 2943279 put_bits(&s->reorder_pb[level],
274 2943279 multistage_vlc[1 + best_count][1],
275 2943279 multistage_vlc[1 + best_count][0]);
276 2943279 put_bits(&s->reorder_pb[level], mean_vlc[best_mean][1],
277 2943279 mean_vlc[best_mean][0]);
278
279
2/2
✓ Branch 0 taken 3649044 times.
✓ Branch 1 taken 2943279 times.
6592323 for (i = 0; i < best_count; i++) {
280 av_assert2(best_vector[i] >= 0 && best_vector[i] < 16);
281 3649044 put_bits(&s->reorder_pb[level], 4, best_vector[i]);
282 }
283
284
2/2
✓ Branch 0 taken 7680728 times.
✓ Branch 1 taken 2943279 times.
10624007 for (y = 0; y < h; y++)
285
2/2
✓ Branch 0 taken 36196848 times.
✓ Branch 1 taken 7680728 times.
43877576 for (x = 0; x < w; x++)
286 36196848 decoded[x + y * stride] = src[x + y * stride] -
287 36196848 block[best_count][x + w * y] +
288 best_mean;
289 }
290
291 4302522 return best_score;
292 }
293
294 131005 static void init_block_index(MpegEncContext *s){
295 131005 s->block_index[0]= s->b8_stride*(s->mb_y*2 ) + s->mb_x*2;
296 131005 s->block_index[1]= s->b8_stride*(s->mb_y*2 ) + 1 + s->mb_x*2;
297 131005 s->block_index[2]= s->b8_stride*(s->mb_y*2 + 1) + s->mb_x*2;
298 131005 s->block_index[3]= s->b8_stride*(s->mb_y*2 + 1) + 1 + s->mb_x*2;
299 131005 s->block_index[4]= s->mb_stride*(s->mb_y + 1) + s->b8_stride*s->mb_height*2 + s->mb_x;
300 131005 s->block_index[5]= s->mb_stride*(s->mb_y + s->mb_height + 2) + s->b8_stride*s->mb_height*2 + s->mb_x;
301 131005 }
302
303 600 static int svq1_encode_plane(SVQ1EncContext *s, int plane,
304 PutBitContext *pb,
305 const unsigned char *src_plane,
306 unsigned char *ref_plane,
307 unsigned char *decoded_plane,
308 int width, int height, int src_stride, int stride)
309 {
310 int x, y;
311 int i;
312 int block_width, block_height;
313 int level;
314 int threshold[6];
315 600 uint8_t *src = s->scratchbuf + stride * 32;
316 600 const int lambda = (s->quality * s->quality) >>
317 (2 * FF_LAMBDA_SHIFT);
318
319 /* figure out the acceptable level thresholds in advance */
320 600 threshold[5] = QUALITY_THRESHOLD;
321
2/2
✓ Branch 0 taken 3000 times.
✓ Branch 1 taken 600 times.
3600 for (level = 4; level >= 0; level--)
322 3000 threshold[level] = threshold[level + 1] * THRESHOLD_MULTIPLIER;
323
324 600 block_width = (width + 15) / 16;
325 600 block_height = (height + 15) / 16;
326
327
2/2
✓ Branch 0 taken 540 times.
✓ Branch 1 taken 60 times.
600 if (s->pict_type == AV_PICTURE_TYPE_P) {
328 540 s->m.avctx = s->avctx;
329 540 s->m.last_pic.data[0] = ref_plane;
330 540 s->m.linesize =
331 540 s->m.last_pic.linesize[0] =
332 540 s->m.new_pic->linesize[0] =
333 540 s->m.cur_pic.linesize[0] = stride;
334 540 s->m.width = width;
335 540 s->m.height = height;
336 540 s->m.mb_width = block_width;
337 540 s->m.mb_height = block_height;
338 540 s->m.mb_stride = s->m.mb_width + 1;
339 540 s->m.b8_stride = 2 * s->m.mb_width + 1;
340 540 s->m.f_code = 1;
341 540 s->m.pict_type = s->pict_type;
342 540 s->m.motion_est = s->motion_est;
343 540 s->m.me.scene_change_score = 0;
344 // s->m.out_format = FMT_H263;
345 // s->m.unrestricted_mv = 1;
346 540 s->m.lambda = s->quality;
347 540 s->m.qscale = s->m.lambda * 139 +
348 540 FF_LAMBDA_SCALE * 64 >>
349 FF_LAMBDA_SHIFT + 7;
350 540 s->m.lambda2 = s->m.lambda * s->m.lambda +
351 540 FF_LAMBDA_SCALE / 2 >>
352 FF_LAMBDA_SHIFT;
353
354
2/2
✓ Branch 0 taken 12 times.
✓ Branch 1 taken 528 times.
540 if (!s->motion_val8[plane]) {
355 24 s->motion_val8[plane] = av_mallocz((s->m.b8_stride *
356 12 block_height * 2 + 2) *
357 2 * sizeof(int16_t));
358 24 s->motion_val16[plane] = av_mallocz((s->m.mb_stride *
359 12 (block_height + 2) + 1) *
360 2 * sizeof(int16_t));
361
2/4
✓ Branch 0 taken 12 times.
✗ Branch 1 not taken.
✗ Branch 2 not taken.
✓ Branch 3 taken 12 times.
12 if (!s->motion_val8[plane] || !s->motion_val16[plane])
362 return AVERROR(ENOMEM);
363 }
364
365 540 s->m.mb_type = s->mb_type;
366
367 // dummies, to avoid segfaults
368 540 s->m.mb_mean = (uint8_t *)s->dummy;
369 540 s->m.mb_var = (uint16_t *)s->dummy;
370 540 s->m.mc_mb_var = (uint16_t *)s->dummy;
371 540 s->m.cur_pic.mb_type = s->dummy;
372
373 540 s->m.cur_pic.motion_val[0] = s->motion_val8[plane] + 2;
374 540 s->m.p_mv_table = s->motion_val16[plane] +
375 540 s->m.mb_stride + 1;
376 540 ff_me_init_pic(&s->m);
377
378 540 s->m.me.dia_size = s->avctx->dia_size;
379 540 s->m.first_slice_line = 1;
380
2/2
✓ Branch 0 taken 4005 times.
✓ Branch 1 taken 540 times.
4545 for (y = 0; y < block_height; y++) {
381 4005 s->m.new_pic->data[0] = src - y * 16 * stride; // ugly
382 4005 s->m.mb_y = y;
383
384
4/4
✓ Branch 0 taken 60975 times.
✓ Branch 1 taken 3600 times.
✓ Branch 2 taken 60570 times.
✓ Branch 3 taken 405 times.
64575 for (i = 0; i < 16 && i + 16 * y < height; i++) {
385 60570 memcpy(&src[i * stride], &src_plane[(i + 16 * y) * src_stride],
386 width);
387
2/2
✓ Branch 0 taken 182700 times.
✓ Branch 1 taken 60570 times.
243270 for (x = width; x < 16 * block_width; x++)
388 182700 src[i * stride + x] = src[i * stride + x - 1];
389 }
390
3/4
✓ Branch 0 taken 3510 times.
✓ Branch 1 taken 4005 times.
✓ Branch 2 taken 3510 times.
✗ Branch 3 not taken.
7515 for (; i < 16 && i + 16 * y < 16 * block_height; i++)
391 3510 memcpy(&src[i * stride], &src[(i - 1) * stride],
392 3510 16 * block_width);
393
394
2/2
✓ Branch 0 taken 62055 times.
✓ Branch 1 taken 4005 times.
66060 for (x = 0; x < block_width; x++) {
395 62055 s->m.mb_x = x;
396 62055 init_block_index(&s->m);
397
398 62055 ff_estimate_p_frame_motion(&s->m, x, y);
399 }
400 4005 s->m.first_slice_line = 0;
401 }
402
403 540 ff_fix_long_p_mvs(&s->m, CANDIDATE_MB_TYPE_INTRA);
404 540 ff_fix_long_mvs(&s->m, NULL, 0, s->m.p_mv_table, s->m.f_code,
405 CANDIDATE_MB_TYPE_INTER, 0);
406 }
407
408 600 s->m.first_slice_line = 1;
409
2/2
✓ Branch 0 taken 4450 times.
✓ Branch 1 taken 600 times.
5050 for (y = 0; y < block_height; y++) {
410
4/4
✓ Branch 0 taken 67750 times.
✓ Branch 1 taken 4000 times.
✓ Branch 2 taken 67300 times.
✓ Branch 3 taken 450 times.
71750 for (i = 0; i < 16 && i + 16 * y < height; i++) {
411 67300 memcpy(&src[i * stride], &src_plane[(i + 16 * y) * src_stride],
412 width);
413
2/2
✓ Branch 0 taken 203000 times.
✓ Branch 1 taken 67300 times.
270300 for (x = width; x < 16 * block_width; x++)
414 203000 src[i * stride + x] = src[i * stride + x - 1];
415 }
416
3/4
✓ Branch 0 taken 3900 times.
✓ Branch 1 taken 4450 times.
✓ Branch 2 taken 3900 times.
✗ Branch 3 not taken.
8350 for (; i < 16 && i + 16 * y < 16 * block_height; i++)
417 3900 memcpy(&src[i * stride], &src[(i - 1) * stride], 16 * block_width);
418
419 4450 s->m.mb_y = y;
420
2/2
✓ Branch 0 taken 68950 times.
✓ Branch 1 taken 4450 times.
73400 for (x = 0; x < block_width; x++) {
421 uint8_t reorder_buffer[2][6][7 * 32];
422 int count[2][6];
423 68950 int offset = y * 16 * stride + x * 16;
424 68950 uint8_t *decoded = decoded_plane + offset;
425 68950 const uint8_t *ref = ref_plane + offset;
426 68950 int score[4] = { 0, 0, 0, 0 }, best;
427 68950 uint8_t *temp = s->scratchbuf;
428
429
1/2
✗ Branch 1 not taken.
✓ Branch 2 taken 68950 times.
68950 if (put_bytes_left(pb, 0) < 3000) { // FIXME: check size
430 av_log(s->avctx, AV_LOG_ERROR, "encoded frame too large\n");
431 return -1;
432 }
433
434 68950 s->m.mb_x = x;
435 68950 init_block_index(&s->m);
436
437
2/2
✓ Branch 0 taken 62055 times.
✓ Branch 1 taken 6895 times.
68950 if (s->pict_type == AV_PICTURE_TYPE_I ||
438
2/2
✓ Branch 0 taken 3450 times.
✓ Branch 1 taken 58605 times.
62055 (s->m.mb_type[x + y * s->m.mb_stride] &
439 CANDIDATE_MB_TYPE_INTRA)) {
440
2/2
✓ Branch 0 taken 62070 times.
✓ Branch 1 taken 10345 times.
72415 for (i = 0; i < 6; i++)
441 62070 init_put_bits(&s->reorder_pb[i], reorder_buffer[0][i],
442 7 * 32);
443
2/2
✓ Branch 0 taken 3450 times.
✓ Branch 1 taken 6895 times.
10345 if (s->pict_type == AV_PICTURE_TYPE_P) {
444 3450 put_bits(&s->reorder_pb[5], SVQ1_BLOCK_INTRA_LEN, SVQ1_BLOCK_INTRA_CODE);
445 3450 score[0] = SVQ1_BLOCK_INTRA_LEN * lambda;
446 }
447 10345 score[0] += encode_block(s, src + 16 * x, NULL, temp, stride,
448 5, 64, lambda, 1);
449
2/2
✓ Branch 0 taken 62070 times.
✓ Branch 1 taken 10345 times.
72415 for (i = 0; i < 6; i++) {
450 62070 count[0][i] = put_bits_count(&s->reorder_pb[i]);
451 62070 flush_put_bits(&s->reorder_pb[i]);
452 }
453 } else
454 58605 score[0] = INT_MAX;
455
456 68950 best = 0;
457
458
2/2
✓ Branch 0 taken 62055 times.
✓ Branch 1 taken 6895 times.
68950 if (s->pict_type == AV_PICTURE_TYPE_P) {
459 int mx, my, pred_x, pred_y, dxy;
460 int16_t *motion_ptr;
461
462 62055 motion_ptr = ff_h263_pred_motion(&s->m, 0, 0, &pred_x, &pred_y);
463
2/2
✓ Branch 0 taken 58605 times.
✓ Branch 1 taken 3450 times.
62055 if (s->m.mb_type[x + y * s->m.mb_stride] &
464 CANDIDATE_MB_TYPE_INTER) {
465
2/2
✓ Branch 0 taken 351630 times.
✓ Branch 1 taken 58605 times.
410235 for (i = 0; i < 6; i++)
466 351630 init_put_bits(&s->reorder_pb[i], reorder_buffer[1][i],
467 7 * 32);
468
469 58605 put_bits(&s->reorder_pb[5], SVQ1_BLOCK_INTER_LEN, SVQ1_BLOCK_INTER_CODE);
470
471 58605 mx = motion_ptr[0];
472 58605 my = motion_ptr[1];
473 av_assert1(mx >= -32 && mx <= 31);
474 av_assert1(my >= -32 && my <= 31);
475 av_assert1(pred_x >= -32 && pred_x <= 31);
476 av_assert1(pred_y >= -32 && pred_y <= 31);
477 58605 ff_h263_encode_motion(&s->reorder_pb[5], mx - pred_x, 1);
478 58605 ff_h263_encode_motion(&s->reorder_pb[5], my - pred_y, 1);
479 58605 score[1] += lambda * put_bits_count(&s->reorder_pb[5]);
480
481 58605 dxy = (mx & 1) + 2 * (my & 1);
482
483 58605 s->hdsp.put_pixels_tab[0][dxy](temp + 16*stride,
484 58605 ref + (mx >> 1) +
485 58605 stride * (my >> 1),
486 stride, 16);
487
488 58605 score[1] += encode_block(s, src + 16 * x, temp + 16*stride,
489 decoded, stride, 5, 64, lambda, 0);
490 58605 best = score[1] <= score[0];
491
492 58605 score[2] = s->mecc.sse[0](NULL, src + 16 * x, ref,
493 stride, 16);
494 58605 score[2] += SVQ1_BLOCK_SKIP_LEN * lambda;
495
6/6
✓ Branch 0 taken 119 times.
✓ Branch 1 taken 58486 times.
✓ Branch 2 taken 88 times.
✓ Branch 3 taken 31 times.
✓ Branch 4 taken 83 times.
✓ Branch 5 taken 5 times.
58605 if (score[2] < score[best] && mx == 0 && my == 0) {
496 83 best = 2;
497 83 s->hdsp.put_pixels_tab[0][0](decoded, ref, stride, 16);
498 83 put_bits(pb, SVQ1_BLOCK_SKIP_LEN, SVQ1_BLOCK_SKIP_CODE);
499 }
500 }
501
502
2/2
✓ Branch 0 taken 58522 times.
✓ Branch 1 taken 3533 times.
62055 if (best == 1) {
503
2/2
✓ Branch 0 taken 351132 times.
✓ Branch 1 taken 58522 times.
409654 for (i = 0; i < 6; i++) {
504 351132 count[1][i] = put_bits_count(&s->reorder_pb[i]);
505 351132 flush_put_bits(&s->reorder_pb[i]);
506 }
507 } else {
508 3533 motion_ptr[0] =
509 3533 motion_ptr[1] =
510 3533 motion_ptr[2] =
511 3533 motion_ptr[3] =
512 3533 motion_ptr[0 + 2 * s->m.b8_stride] =
513 3533 motion_ptr[1 + 2 * s->m.b8_stride] =
514 3533 motion_ptr[2 + 2 * s->m.b8_stride] =
515 3533 motion_ptr[3 + 2 * s->m.b8_stride] = 0;
516 }
517 }
518
519 68950 s->rd_total += score[best];
520
521
2/2
✓ Branch 0 taken 68867 times.
✓ Branch 1 taken 83 times.
68950 if (best != 2)
522
2/2
✓ Branch 0 taken 413202 times.
✓ Branch 1 taken 68867 times.
482069 for (i = 5; i >= 0; i--)
523 413202 ff_copy_bits(pb, reorder_buffer[best][i],
524 count[best][i]);
525
2/2
✓ Branch 0 taken 10345 times.
✓ Branch 1 taken 58605 times.
68950 if (best == 0)
526 10345 s->hdsp.put_pixels_tab[0][0](decoded, temp, stride, 16);
527 }
528 4450 s->m.first_slice_line = 0;
529 }
530 600 return 0;
531 }
532
533 4 static av_cold int svq1_encode_end(AVCodecContext *avctx)
534 {
535 4 SVQ1EncContext *const s = avctx->priv_data;
536 int i;
537
538
1/2
✓ Branch 0 taken 4 times.
✗ Branch 1 not taken.
4 if (avctx->frame_num)
539 4 av_log(avctx, AV_LOG_DEBUG, "RD: %f\n",
540 4 s->rd_total / (double)(avctx->width * avctx->height *
541 4 avctx->frame_num));
542
543 4 av_freep(&s->m.me.scratchpad);
544 4 av_freep(&s->m.me.map);
545 4 av_freep(&s->mb_type);
546 4 av_freep(&s->dummy);
547 4 av_freep(&s->scratchbuf);
548
549 4 s->m.mb_type = NULL;
550 4 ff_mpv_common_end(&s->m);
551
552
2/2
✓ Branch 0 taken 12 times.
✓ Branch 1 taken 4 times.
16 for (i = 0; i < 3; i++) {
553 12 av_freep(&s->motion_val8[i]);
554 12 av_freep(&s->motion_val16[i]);
555 }
556
557 4 av_frame_free(&s->current_picture);
558 4 av_frame_free(&s->last_picture);
559 4 av_frame_free(&s->m.new_pic);
560
561 4 return 0;
562 }
563
564 4 static av_cold int write_ident(AVCodecContext *avctx, const char *ident)
565 {
566 4 int size = strlen(ident);
567 4 avctx->extradata = av_malloc(size + 8);
568
1/2
✗ Branch 0 not taken.
✓ Branch 1 taken 4 times.
4 if (!avctx->extradata)
569 return AVERROR(ENOMEM);
570 4 AV_WB32(avctx->extradata, size + 8);
571 4 AV_WL32(avctx->extradata + 4, MKTAG('S', 'V', 'Q', '1'));
572 4 memcpy(avctx->extradata + 8, ident, size);
573 4 avctx->extradata_size = size + 8;
574 4 return 0;
575 }
576
577 4 static av_cold int svq1_encode_init(AVCodecContext *avctx)
578 {
579 4 SVQ1EncContext *const s = avctx->priv_data;
580 int ret;
581
582
2/4
✓ Branch 0 taken 4 times.
✗ Branch 1 not taken.
✗ Branch 2 not taken.
✓ Branch 3 taken 4 times.
4 if (avctx->width >= 4096 || avctx->height >= 4096) {
583 av_log(avctx, AV_LOG_ERROR, "Dimensions too large, maximum is 4095x4095\n");
584 return AVERROR(EINVAL);
585 }
586
587 4 ff_hpeldsp_init(&s->hdsp, avctx->flags);
588 4 ff_me_cmp_init(&s->mecc, avctx);
589 4 ret = ff_me_init(&s->m.me, avctx, &s->mecc, 0);
590
1/2
✗ Branch 0 not taken.
✓ Branch 1 taken 4 times.
4 if (ret < 0)
591 return ret;
592 4 ff_mpegvideoencdsp_init(&s->m.mpvencdsp, avctx);
593
594 4 s->current_picture = av_frame_alloc();
595 4 s->last_picture = av_frame_alloc();
596
2/4
✓ Branch 0 taken 4 times.
✗ Branch 1 not taken.
✗ Branch 2 not taken.
✓ Branch 3 taken 4 times.
4 if (!s->current_picture || !s->last_picture) {
597 return AVERROR(ENOMEM);
598 }
599
600 4 s->frame_width = avctx->width;
601 4 s->frame_height = avctx->height;
602
603 4 s->y_block_width = (s->frame_width + 15) / 16;
604 4 s->y_block_height = (s->frame_height + 15) / 16;
605
606 4 s->c_block_width = (s->frame_width / 4 + 15) / 16;
607 4 s->c_block_height = (s->frame_height / 4 + 15) / 16;
608
609 4 s->avctx = avctx;
610 4 s->m.avctx = avctx;
611
612
1/2
✗ Branch 1 not taken.
✓ Branch 2 taken 4 times.
4 if ((ret = ff_mpv_common_init(&s->m)) < 0) {
613 return ret;
614 }
615
616 4 s->m.picture_structure = PICT_FRAME;
617 4 s->m.me.temp =
618 8 s->m.me.scratchpad = av_mallocz((avctx->width + 64) *
619 4 2 * 16 * 2 * sizeof(uint8_t));
620 8 s->mb_type = av_mallocz((s->y_block_width + 1) *
621 4 s->y_block_height * sizeof(int16_t));
622 8 s->dummy = av_mallocz((s->y_block_width + 1) *
623 4 s->y_block_height * sizeof(int32_t));
624 4 s->m.me.map = av_mallocz(2 * ME_MAP_SIZE * sizeof(*s->m.me.map));
625 4 s->m.new_pic = av_frame_alloc();
626
627
2/4
✓ Branch 0 taken 4 times.
✗ Branch 1 not taken.
✓ Branch 2 taken 4 times.
✗ Branch 3 not taken.
4 if (!s->m.me.scratchpad || !s->m.me.map ||
628
3/6
✓ Branch 0 taken 4 times.
✗ Branch 1 not taken.
✓ Branch 2 taken 4 times.
✗ Branch 3 not taken.
✗ Branch 4 not taken.
✓ Branch 5 taken 4 times.
4 !s->mb_type || !s->dummy || !s->m.new_pic)
629 return AVERROR(ENOMEM);
630 4 s->m.me.score_map = s->m.me.map + ME_MAP_SIZE;
631
632 4 ff_svq1enc_init(&s->svq1encdsp);
633
634 4 ff_h263_encode_init(&s->m); // mv_penalty
635
636
1/2
✓ Branch 0 taken 4 times.
✗ Branch 1 not taken.
4 return write_ident(avctx, s->avctx->flags & AV_CODEC_FLAG_BITEXACT ? "Lavc" : LIBAVCODEC_IDENT);
637 }
638
639 200 static int svq1_encode_frame(AVCodecContext *avctx, AVPacket *pkt,
640 const AVFrame *pict, int *got_packet)
641 {
642 200 SVQ1EncContext *const s = avctx->priv_data;
643 PutBitContext pb;
644 int i, ret;
645
646 200 ret = ff_alloc_packet(avctx, pkt, s->y_block_width * s->y_block_height *
647 200 MAX_MB_BYTES * 3 + FF_INPUT_BUFFER_MIN_SIZE);
648
1/2
✗ Branch 0 not taken.
✓ Branch 1 taken 200 times.
200 if (ret < 0)
649 return ret;
650
651
1/2
✗ Branch 0 not taken.
✓ Branch 1 taken 200 times.
200 if (avctx->pix_fmt != AV_PIX_FMT_YUV410P) {
652 av_log(avctx, AV_LOG_ERROR, "unsupported pixel format\n");
653 return -1;
654 }
655
656
2/2
✓ Branch 0 taken 4 times.
✓ Branch 1 taken 196 times.
200 if (!s->current_picture->data[0]) {
657
1/2
✗ Branch 1 not taken.
✓ Branch 2 taken 4 times.
4 if ((ret = ff_encode_alloc_frame(avctx, s->current_picture)) < 0) {
658 return ret;
659 }
660 }
661
2/2
✓ Branch 0 taken 4 times.
✓ Branch 1 taken 196 times.
200 if (!s->last_picture->data[0]) {
662 4 ret = ff_encode_alloc_frame(avctx, s->last_picture);
663
1/2
✗ Branch 0 not taken.
✓ Branch 1 taken 4 times.
4 if (ret < 0)
664 return ret;
665 }
666
2/2
✓ Branch 0 taken 4 times.
✓ Branch 1 taken 196 times.
200 if (!s->scratchbuf) {
667 4 s->scratchbuf = av_malloc_array(s->current_picture->linesize[0], 16 * 3);
668
1/2
✗ Branch 0 not taken.
✓ Branch 1 taken 4 times.
4 if (!s->scratchbuf)
669 return AVERROR(ENOMEM);
670 }
671
672 200 FFSWAP(AVFrame*, s->current_picture, s->last_picture);
673
674
3/4
✓ Branch 0 taken 200 times.
✗ Branch 1 not taken.
✓ Branch 2 taken 180 times.
✓ Branch 3 taken 20 times.
200 if (avctx->gop_size && (avctx->frame_num % avctx->gop_size))
675 180 s->pict_type = AV_PICTURE_TYPE_P;
676 else
677 20 s->pict_type = AV_PICTURE_TYPE_I;
678 200 s->quality = pict->quality;
679
680 200 ff_side_data_set_encoder_stats(pkt, pict->quality, NULL, 0, s->pict_type);
681
682 200 init_put_bits(&pb, pkt->data, pkt->size);
683 200 svq1_write_header(s, &pb, s->pict_type);
684
2/2
✓ Branch 0 taken 600 times.
✓ Branch 1 taken 200 times.
800 for (i = 0; i < 3; i++) {
685 1800 int ret = svq1_encode_plane(s, i, &pb,
686 600 pict->data[i],
687 600 s->last_picture->data[i],
688 600 s->current_picture->data[i],
689
2/2
✓ Branch 0 taken 400 times.
✓ Branch 1 taken 200 times.
600 s->frame_width / (i ? 4 : 1),
690 600 s->frame_height / (i ? 4 : 1),
691 600 pict->linesize[i],
692
2/2
✓ Branch 0 taken 400 times.
✓ Branch 1 taken 200 times.
600 s->current_picture->linesize[i]);
693 600 emms_c();
694
1/2
✗ Branch 0 not taken.
✓ Branch 1 taken 600 times.
600 if (ret < 0) {
695 int j;
696 for (j = 0; j < i; j++) {
697 av_freep(&s->motion_val8[j]);
698 av_freep(&s->motion_val16[j]);
699 }
700 av_freep(&s->scratchbuf);
701 return -1;
702 }
703 }
704
705 // align_put_bits(&pb);
706
2/2
✓ Branch 1 taken 3154 times.
✓ Branch 2 taken 200 times.
3354 while (put_bits_count(&pb) & 31)
707 3154 put_bits(&pb, 1, 0);
708
709 200 flush_put_bits(&pb);
710
711 200 pkt->size = put_bytes_output(&pb);
712
2/2
✓ Branch 0 taken 20 times.
✓ Branch 1 taken 180 times.
200 if (s->pict_type == AV_PICTURE_TYPE_I)
713 20 pkt->flags |= AV_PKT_FLAG_KEY;
714 200 *got_packet = 1;
715
716 200 return 0;
717 }
718
719 #define OFFSET(x) offsetof(struct SVQ1EncContext, x)
720 #define VE AV_OPT_FLAG_VIDEO_PARAM | AV_OPT_FLAG_ENCODING_PARAM
721 static const AVOption options[] = {
722 { "motion-est", "Motion estimation algorithm", OFFSET(motion_est), AV_OPT_TYPE_INT, { .i64 = FF_ME_EPZS }, FF_ME_ZERO, FF_ME_XONE, VE, .unit = "motion-est"},
723 { "zero", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = FF_ME_ZERO }, 0, 0, FF_MPV_OPT_FLAGS, .unit = "motion-est" },
724 { "epzs", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = FF_ME_EPZS }, 0, 0, FF_MPV_OPT_FLAGS, .unit = "motion-est" },
725 { "xone", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = FF_ME_XONE }, 0, 0, FF_MPV_OPT_FLAGS, .unit = "motion-est" },
726
727 { NULL },
728 };
729
730 static const AVClass svq1enc_class = {
731 .class_name = "svq1enc",
732 .item_name = av_default_item_name,
733 .option = options,
734 .version = LIBAVUTIL_VERSION_INT,
735 };
736
737 const FFCodec ff_svq1_encoder = {
738 .p.name = "svq1",
739 CODEC_LONG_NAME("Sorenson Vector Quantizer 1 / Sorenson Video 1 / SVQ1"),
740 .p.type = AVMEDIA_TYPE_VIDEO,
741 .p.id = AV_CODEC_ID_SVQ1,
742 .p.capabilities = AV_CODEC_CAP_DR1 | AV_CODEC_CAP_ENCODER_REORDERED_OPAQUE,
743 .priv_data_size = sizeof(SVQ1EncContext),
744 .p.priv_class = &svq1enc_class,
745 .init = svq1_encode_init,
746 FF_CODEC_ENCODE_CB(svq1_encode_frame),
747 .close = svq1_encode_end,
748 .p.pix_fmts = (const enum AVPixelFormat[]) { AV_PIX_FMT_YUV410P,
749 AV_PIX_FMT_NONE },
750 .caps_internal = FF_CODEC_CAP_INIT_CLEANUP,
751 };
752