FFmpeg coverage


Directory: ../../../ffmpeg/
File: src/libavcodec/svq1enc.c
Date: 2024-03-28 04:31:58
Exec Total Coverage
Lines: 363 383 94.8%
Functions: 8 8 100.0%
Branches: 166 194 85.6%

Line Branch Exec Source
1 /*
2 * SVQ1 Encoder
3 * Copyright (C) 2004 Mike Melanson <melanson@pcisys.net>
4 *
5 * This file is part of FFmpeg.
6 *
7 * FFmpeg is free software; you can redistribute it and/or
8 * modify it under the terms of the GNU Lesser General Public
9 * License as published by the Free Software Foundation; either
10 * version 2.1 of the License, or (at your option) any later version.
11 *
12 * FFmpeg is distributed in the hope that it will be useful,
13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
15 * Lesser General Public License for more details.
16 *
17 * You should have received a copy of the GNU Lesser General Public
18 * License along with FFmpeg; if not, write to the Free Software
19 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
20 */
21
22 /**
23 * @file
24 * Sorenson Vector Quantizer #1 (SVQ1) video codec.
25 * For more information on the SVQ1 algorithm, visit:
26 * http://www.pcisys.net/~melanson/codecs/
27 */
28
29 #include "libavutil/emms.h"
30 #include "avcodec.h"
31 #include "codec_internal.h"
32 #include "encode.h"
33 #include "hpeldsp.h"
34 #include "me_cmp.h"
35 #include "mpegvideo.h"
36 #include "h263.h"
37 #include "h263enc.h"
38 #include "internal.h"
39 #include "mpegutils.h"
40 #include "packet_internal.h"
41 #include "put_bits.h"
42 #include "svq1.h"
43 #include "svq1encdsp.h"
44 #include "svq1enc_cb.h"
45 #include "version.h"
46
47 #include "libavutil/avassert.h"
48 #include "libavutil/frame.h"
49 #include "libavutil/mem_internal.h"
50
51 // Workaround for GCC bug 102513
52 #if AV_GCC_VERSION_AT_LEAST(10, 0) && AV_GCC_VERSION_AT_MOST(12, 0) \
53 && !defined(__clang__) && !defined(__INTEL_COMPILER)
54 #pragma GCC optimize ("no-ipa-cp-clone")
55 #endif
56
/**
 * Private state of the SVQ1 encoder (used as AVCodecContext.priv_data).
 */
57 typedef struct SVQ1EncContext {
58 /* FIXME: Needed for motion estimation, should not be used for anything
59 * else, the idea is to make the motion estimation eventually independent
60 * of MpegEncContext, so this will be removed then. */
61 MpegEncContext m;
/* Owning codec context; assigned in svq1_encode_init(). */
62 AVCodecContext *avctx;
/* Comparison functions; sse[0] is used to score skipped blocks. */
63 MECmpContext mecc;
/* Half-pel copy routines used for motion compensation and block copies. */
64 HpelDSPContext hdsp;
/* Reconstruction of the frame being encoded and of the previous frame.
 * The two pointers are swapped at the start of every svq1_encode_frame(). */
65 AVFrame *current_picture;
66 AVFrame *last_picture;
67
68 /* Some compression statistics */
/* Type (I or P) chosen for the frame currently being encoded. */
69 enum AVPictureType pict_type;
/* Copy of the input frame's quality field; lambda is derived from it. */
70 int quality;
71
72 /* why ooh why this sick breadth first order,
73 * everything is slower and more complex */
/* One bit writer per block level (0..5); encode_block() writes into
 * reorder_pb[level] and svq1_encode_plane() concatenates them from
 * level 5 down to level 0. */
74 PutBitContext reorder_pb[6];
75
/* Luma dimensions, copied from avctx->width / avctx->height. */
76 int frame_width;
77 int frame_height;
78
79 /* Y plane block dimensions */
/* Computed as (frame dimension + 15) / 16. */
80 int y_block_width;
81 int y_block_height;
82
83 /* U & V plane (C planes) block dimensions */
/* Computed as (frame dimension / 4 + 15) / 16. */
84 int c_block_width;
85 int c_block_height;
86
/* Work area of encode_block(): indexed [level][stage][sample], where
 * stage 0 holds the input (or residual) block and stage k+1 holds it
 * after subtracting the k-th selected codebook vector. */
87 DECLARE_ALIGNED(16, int16_t, encoded_block_levels)[6][7][256];
88
/* Per-block candidate type flags, handed to the motion estimator through
 * m.mb_type and tested against CANDIDATE_MB_TYPE_INTRA / _INTER. */
89 uint16_t *mb_type;
/* Placeholder buffer assigned to several MpegEncContext tables
 * (mb_mean, mb_var, mc_mb_var, current_picture.mb_type). */
90 uint32_t *dummy;
/* Per-plane motion vector tables, allocated on the first P-frame
 * in svq1_encode_plane() and released in svq1_encode_end(). */
91 int16_t (*motion_val8[3])[2];
92 int16_t (*motion_val16[3])[2];
93
/* Running sum of the chosen per-block scores; logged at close time. */
94 int64_t rd_total;
95
/* Scratch area of 3 * 16 rows of current_picture->linesize[0] bytes:
 * rows 0-15 intra reconstruction, rows 16-31 motion-compensated
 * prediction, rows 32-47 edge-padded copy of the source block row. */
96 uint8_t *scratchbuf;
97
/* Value of the "motion-est" option; forwarded to m.motion_est. */
98 int motion_est;
99
/* DSP helpers; ssd_int8_vs_int16 is used by the codebook search. */
100 SVQ1EncDSPContext svq1encdsp;
101 } SVQ1EncContext;
102
/**
 * Write the SVQ1 frame header.
 *
 * Layout, in bit order: 22-bit frame code 0x20, 8-bit temporal reference
 * (always 0), 2-bit frame type (frame_type - 1). Intra frames additionally
 * carry 5 bits with value 2, a 3-bit frame size index and, when that index
 * is 7, explicit 12-bit width and height. The header always ends with two
 * zero bits.
 *
 * @param s          encoder context (frame_width / frame_height are read)
 * @param pb         destination bit writer
 * @param frame_type picture type of the frame (an AV_PICTURE_TYPE_* value)
 */
103 200 static void svq1_write_header(SVQ1EncContext *s, PutBitContext *pb, int frame_type)
104 {
105 int i;
106
107 /* frame code */
108 200 put_bits(pb, 22, 0x20);
109
110 /* temporal reference (sure hope this is a "don't care") */
111 200 put_bits(pb, 8, 0x00);
112
113 /* frame type */
114 200 put_bits(pb, 2, frame_type - 1);
115
116
2/2
✓ Branch 0 taken 20 times.
✓ Branch 1 taken 180 times.
200 if (frame_type == AV_PICTURE_TYPE_I) {
117 /* no checksum since frame code is 0x20 */
118 /* no embedded string either */
119 /* output 5 unknown bits (2 + 2 + 1) */
120 20 put_bits(pb, 5, 2); /* 2 needed by quicktime decoder */
121
/* Look the frame dimensions up in the table of predefined sizes. */
122 20 i = ff_match_2uint16(ff_svq1_frame_size_table,
123 FF_ARRAY_ELEMS(ff_svq1_frame_size_table),
124 s->frame_width, s->frame_height);
125 20 put_bits(pb, 3, i);
126
127
/* Index 7 is followed by explicit dimensions
 * (presumably it means "no table entry matched" -- TODO confirm). */
2/2
✓ Branch 0 taken 5 times.
✓ Branch 1 taken 15 times.
20 if (i == 7) {
128 5 put_bits(pb, 12, s->frame_width);
129 5 put_bits(pb, 12, s->frame_height);
130 }
131 }
132
133 /* no checksum or extra data (next 2 bits get 0) */
134 200 put_bits(pb, 2, 0);
135 200 }
136
137 #define QUALITY_THRESHOLD 100
138 #define THRESHOLD_MULTIPLIER 0.6
139
/**
 * Encode one block at the given level, recursively trying to split it.
 *
 * The block is w x h samples with w = 2 << ((level + 2) >> 1) and
 * h = 2 << ((level + 1) >> 1), i.e. 4x2 at level 0 up to 16x16 at level 5,
 * so that w * h == 1 << (level + 3).
 *
 * Steps:
 *  1. Load the source block (intra) or the source minus reference (inter)
 *     into stage 0 and compute its energy after mean removal.
 *  2. For levels below 4, greedily add up to six codebook vectors, one per
 *     stage, keeping the stage count with the lowest score
 *     (distortion + lambda * bits).
 *  3. If the score still exceeds threshold and level > 0, encode the two
 *     halves at level - 1 and keep the split when it scores lower.
 *  4. Emit the split flag and, when not split, the stage count, the mean
 *     and the vector indices into s->reorder_pb[level]; write the
 *     reconstruction to decoded.
 *
 * @param s         encoder context
 * @param src       top-left sample of the source block
 * @param ref       top-left sample of the prediction; only read when
 *                  intra is 0
 * @param decoded   destination of the reconstructed block
 * @param stride    line stride shared by src, ref and decoded
 * @param level     block level, 0..5
 * @param threshold score above which a split is attempted
 * @param lambda    rate multiplier of the score
 * @param intra     nonzero for intra coding, 0 for inter coding
 * @return the score of the chosen encoding
 */
140 4302522 static int encode_block(SVQ1EncContext *s, uint8_t *src, uint8_t *ref,
141 uint8_t *decoded, int stride, unsigned level,
142 int threshold, int lambda, int intra)
143 {
144 int count, y, x, i, j, split, best_mean, best_score, best_count;
145 int best_vector[6];
/* NOTE(review): six initializers for seven elements; the last element is
 * still zero because the remainder of an initialized array is zeroed. */
146 4302522 int block_sum[7] = { 0, 0, 0, 0, 0, 0 };
147 4302522 int w = 2 << (level + 2 >> 1);
148 4302522 int h = 2 << (level + 1 >> 1);
149 4302522 int size = w * h;
150 4302522 int16_t (*block)[256] = s->encoded_block_levels[level];
151 const int8_t *codebook_sum, *codebook;
152 const uint16_t(*mean_vlc)[2];
153 const uint8_t(*multistage_vlc)[2];
154
155 4302522 best_score = 0;
156 // FIXME: Optimize, this does not need to be done multiple times.
157
2/2
✓ Branch 0 taken 643715 times.
✓ Branch 1 taken 3658807 times.
4302522 if (intra) {
158 // level is 5 when encode_block is called from svq1_encode_plane
159 // and always < 4 when called recursively from this function.
160
2/2
✓ Branch 0 taken 612686 times.
✓ Branch 1 taken 31029 times.
643715 codebook_sum = level < 4 ? svq1_intra_codebook_sum[level] : NULL;
161 643715 codebook = ff_svq1_intra_codebooks[level];
162 643715 mean_vlc = ff_svq1_intra_mean_vlc;
163 643715 multistage_vlc = ff_svq1_intra_multistage_vlc[level];
164
/* Stage 0 is the raw source block; accumulate its sum and energy. */
2/2
✓ Branch 0 taken 2296676 times.
✓ Branch 1 taken 643715 times.
2940391 for (y = 0; y < h; y++) {
165
2/2
✓ Branch 0 taken 15798160 times.
✓ Branch 1 taken 2296676 times.
18094836 for (x = 0; x < w; x++) {
166 15798160 int v = src[x + y * stride];
167 15798160 block[0][x + w * y] = v;
168 15798160 best_score += v * v;
169 15798160 block_sum[0] += v;
170 }
171 }
172 } else {
173 // level is 5 or < 4, see above for details.
174
2/2
✓ Branch 0 taken 3483018 times.
✓ Branch 1 taken 175789 times.
3658807 codebook_sum = level < 4 ? svq1_inter_codebook_sum[level] : NULL;
175 3658807 codebook = ff_svq1_inter_codebooks[level];
/* Offset by 256 so the table can be indexed with means in -256..255. */
176 3658807 mean_vlc = ff_svq1_inter_mean_vlc + 256;
177 3658807 multistage_vlc = ff_svq1_inter_multistage_vlc[level];
178
/* Stage 0 is the prediction residual (source minus reference). */
2/2
✓ Branch 0 taken 13044696 times.
✓ Branch 1 taken 3658807 times.
16703503 for (y = 0; y < h; y++) {
179
2/2
✓ Branch 0 taken 89655008 times.
✓ Branch 1 taken 13044696 times.
102699704 for (x = 0; x < w; x++) {
180 89655008 int v = src[x + y * stride] - ref[x + y * stride];
181 89655008 block[0][x + w * y] = v;
182 89655008 best_score += v * v;
183 89655008 block_sum[0] += v;
184 }
185 }
186 }
187
/* Baseline candidate: mean only, no codebook vectors. Its distortion is
 * the block energy minus sum^2 / size (size == 1 << (level + 3)); the
 * mean is the rounded average. */
188 4302522 best_count = 0;
189 4302522 best_score -= (int)((unsigned)block_sum[0] * block_sum[0] >> (level + 3));
190 4302522 best_mean = block_sum[0] + (size >> 1) >> (level + 3);
191
192
2/2
✓ Branch 0 taken 4095704 times.
✓ Branch 1 taken 206818 times.
4302522 if (level < 4) {
193
/* Greedy multistage search: each stage picks the best of 16 vectors
 * for the residual left by the previous stage. */
2/2
✓ Branch 0 taken 24574224 times.
✓ Branch 1 taken 4095704 times.
28669928 for (count = 1; count < 7; count++) {
194 24574224 int best_vector_score = INT_MAX;
195 24574224 int best_vector_sum = -999, best_vector_mean = -999;
196 24574224 const int stage = count - 1;
197 const int8_t *vector;
198
199
2/2
✓ Branch 0 taken 393187584 times.
✓ Branch 1 taken 24574224 times.
417761808 for (i = 0; i < 16; i++) {
200 393187584 int sum = codebook_sum[stage * 16 + i];
201 int sqr, diff, score;
202
203 393187584 vector = codebook + stage * size * 16 + i * size;
204 393187584 sqr = s->svq1encdsp.ssd_int8_vs_int16(vector, block[stage], size);
205 393187584 diff = block_sum[stage] - sum;
206 393187584 score = sqr - (diff * (int64_t)diff >> (level + 3)); // FIXME: 64 bits slooow
207
2/2
✓ Branch 0 taken 65426753 times.
✓ Branch 1 taken 327760831 times.
393187584 if (score < best_vector_score) {
208 65426753 int mean = diff + (size >> 1) >> (level + 3);
209 av_assert2(mean > -300 && mean < 300);
210
/* Clamp the mean to 0..255 for intra and -256..255 for inter. */
2/2
✓ Branch 0 taken 9912177 times.
✓ Branch 1 taken 55514576 times.
65426753 mean = av_clip(mean, intra ? 0 : -256, 255);
211 65426753 best_vector_score = score;
212 65426753 best_vector[stage] = i;
213 65426753 best_vector_sum = sum;
214 65426753 best_vector_mean = mean;
215 }
216 }
217
1/2
✗ Branch 0 not taken.
✓ Branch 1 taken 24574224 times.
24574224 av_assert0(best_vector_mean != -999);
218 24574224 vector = codebook + stage * size * 16 + best_vector[stage] * size;
219
/* Residual for the next stage: subtract the selected vector. */
2/2
✓ Branch 0 taken 420929184 times.
✓ Branch 1 taken 24574224 times.
445503408 for (j = 0; j < size; j++)
220 420929184 block[stage + 1][j] = block[stage][j] - vector[j];
221 24574224 block_sum[stage + 1] = block_sum[stage] - best_vector_sum;
/* Add the rate term: 4 bits per vector index, the stage-count code
 * length, the mean code length, plus 1. */
222 24574224 best_vector_score += lambda *
223 24574224 (+1 + 4 * count +
224 24574224 multistage_vlc[1 + count][1]
225 24574224 + mean_vlc[best_vector_mean][1]);
226
227
2/2
✓ Branch 0 taken 5416629 times.
✓ Branch 1 taken 19157595 times.
24574224 if (best_vector_score < best_score) {
228 5416629 best_score = best_vector_score;
229 5416629 best_count = count;
230 5416629 best_mean = best_vector_mean;
231 }
232 }
233 }
234
235
/* The mean values -128 and 128 are never emitted; they are replaced by
 * -127 and 127 respectively. */
2/2
✓ Branch 0 taken 12 times.
✓ Branch 1 taken 4302510 times.
4302522 if (best_mean == -128)
236 12 best_mean = -127;
237
2/2
✓ Branch 0 taken 6210 times.
✓ Branch 1 taken 4296300 times.
4302510 else if (best_mean == 128)
238 6210 best_mean = 127;
239
240 4302522 split = 0;
241
4/4
✓ Branch 0 taken 4243230 times.
✓ Branch 1 taken 59292 times.
✓ Branch 2 taken 2116786 times.
✓ Branch 3 taken 2126444 times.
4302522 if (best_score > threshold && level) {
242 2116786 int score = 0;
243
/* Odd levels are halved vertically (second half h / 2 rows below),
 * even levels horizontally (second half w / 2 samples to the right). */
2/2
✓ Branch 0 taken 1431267 times.
✓ Branch 1 taken 685519 times.
2116786 int offset = level & 1 ? stride * h / 2 : w / 2;
244 PutBitContext backup[6];
245
246
/* Save the lower-level bit writers so a rejected split can be undone. */
2/2
✓ Branch 0 taken 3903357 times.
✓ Branch 1 taken 2116786 times.
6020143 for (i = level - 1; i >= 0; i--)
247 3903357 backup[i] = s->reorder_pb[i];
248 2116786 score += encode_block(s, src, ref, decoded, stride, level - 1,
249 threshold >> 1, lambda, intra);
250 2116786 score += encode_block(s, src + offset, ref + offset, decoded + offset,
251 stride, level - 1, threshold >> 1, lambda, intra);
252 2116786 score += lambda;
253
254
2/2
✓ Branch 0 taken 1359243 times.
✓ Branch 1 taken 757543 times.
2116786 if (score < best_score) {
255 1359243 best_score = score;
256 1359243 split = 1;
257 } else {
258
2/2
✓ Branch 0 taken 1046147 times.
✓ Branch 1 taken 757543 times.
1803690 for (i = level - 1; i >= 0; i--)
259 1046147 s->reorder_pb[i] = backup[i];
260 }
261 }
262
/* Level 0 cannot be split, so it carries no split flag. */
2/2
✓ Branch 0 taken 2127616 times.
✓ Branch 1 taken 2174906 times.
4302522 if (level > 0)
263 2127616 put_bits(&s->reorder_pb[level], 1, split);
264
265
2/2
✓ Branch 0 taken 2943279 times.
✓ Branch 1 taken 1359243 times.
4302522 if (!split) {
266 av_assert1(best_mean >= 0 && best_mean < 256 || !intra);
267 av_assert1(best_mean >= -256 && best_mean < 256);
268 av_assert1(best_count >= 0 && best_count < 7);
269 av_assert1(level < 4 || best_count == 0);
270
271 /* output the encoding */
272 2943279 put_bits(&s->reorder_pb[level],
273 2943279 multistage_vlc[1 + best_count][1],
274 2943279 multistage_vlc[1 + best_count][0]);
275 2943279 put_bits(&s->reorder_pb[level], mean_vlc[best_mean][1],
276 2943279 mean_vlc[best_mean][0]);
277
278
2/2
✓ Branch 0 taken 3649044 times.
✓ Branch 1 taken 2943279 times.
6592323 for (i = 0; i < best_count; i++) {
279 av_assert2(best_vector[i] >= 0 && best_vector[i] < 16);
280 3649044 put_bits(&s->reorder_pb[level], 4, best_vector[i]);
281 }
282
283
/* Reconstruction: source minus the residual left after best_count
 * stages, plus the coded mean. This overwrites anything a rejected
 * split wrote to decoded. */
2/2
✓ Branch 0 taken 7680728 times.
✓ Branch 1 taken 2943279 times.
10624007 for (y = 0; y < h; y++)
284
2/2
✓ Branch 0 taken 36196848 times.
✓ Branch 1 taken 7680728 times.
43877576 for (x = 0; x < w; x++)
285 36196848 decoded[x + y * stride] = src[x + y * stride] -
286 36196848 block[best_count][x + w * y] +
287 best_mean;
288 }
289
290 4302522 return best_score;
291 }
292
/**
 * Compute s->block_index[0..5] for the block at (s->mb_x, s->mb_y).
 *
 * Entries 0-3 address the 2x2 group of positions belonging to the block in
 * a grid with s->b8_stride entries per row. Entries 4 and 5 use
 * s->mb_stride and are placed after the b8_stride * mb_height * 2 entries
 * of that grid (presumably the two chroma blocks -- TODO confirm).
 */
293 131005 static void init_block_index(MpegEncContext *s){
294 131005 s->block_index[0]= s->b8_stride*(s->mb_y*2 ) + s->mb_x*2;
295 131005 s->block_index[1]= s->b8_stride*(s->mb_y*2 ) + 1 + s->mb_x*2;
296 131005 s->block_index[2]= s->b8_stride*(s->mb_y*2 + 1) + s->mb_x*2;
297 131005 s->block_index[3]= s->b8_stride*(s->mb_y*2 + 1) + 1 + s->mb_x*2;
298 131005 s->block_index[4]= s->mb_stride*(s->mb_y + 1) + s->b8_stride*s->mb_height*2 + s->mb_x;
299 131005 s->block_index[5]= s->mb_stride*(s->mb_y + s->mb_height + 2) + s->b8_stride*s->mb_height*2 + s->mb_x;
300 131005 }
301
/**
 * Encode one plane of the current frame into pb.
 *
 * For P-frames a first pass runs motion estimation for every 16x16 block
 * through the embedded MpegEncContext. The second pass visits every block
 * and evaluates up to three candidates:
 *   - score[0]: intra coding (I-frames, or blocks flagged
 *               CANDIDATE_MB_TYPE_INTRA),
 *   - score[1]: inter coding with the estimated motion vector (blocks
 *               flagged CANDIDATE_MB_TYPE_INTER),
 *   - score[2]: skip (copy from the reference), considered only when the
 *               motion vector is zero.
 * The candidate with the lowest score is written to pb and its
 * reconstruction ends up in decoded_plane.
 *
 * @param s             encoder context
 * @param plane         plane index, selects the motion vector tables
 * @param pb            output bit writer
 * @param src_plane     input samples of the plane
 * @param ref_plane     reconstructed previous frame (prediction reference)
 * @param decoded_plane destination of the reconstruction
 * @param width         plane width in samples
 * @param height        plane height in samples
 * @param src_stride    line stride of src_plane
 * @param stride        line stride of ref_plane, decoded_plane and the
 *                      scratch buffer
 * @return 0 on success, AVERROR(ENOMEM) if a motion vector table cannot be
 *         allocated, -1 if fewer than 3000 bytes remain in pb
 */
302 600 static int svq1_encode_plane(SVQ1EncContext *s, int plane,
303 PutBitContext *pb,
304 const unsigned char *src_plane,
305 unsigned char *ref_plane,
306 unsigned char *decoded_plane,
307 int width, int height, int src_stride, int stride)
308 {
309 int x, y;
310 int i;
311 int block_width, block_height;
312 int level;
313 int threshold[6];
/* Rows 32..47 of the scratch buffer hold the padded source block row. */
314 600 uint8_t *src = s->scratchbuf + stride * 32;
315 600 const int lambda = (s->quality * s->quality) >>
316 (2 * FF_LAMBDA_SHIFT);
317
318 /* figure out the acceptable level thresholds in advance */
/* NOTE(review): threshold[] is filled here but never read in this
 * function; encode_block() is called with the literal threshold 64. */
319 600 threshold[5] = QUALITY_THRESHOLD;
320
2/2
✓ Branch 0 taken 3000 times.
✓ Branch 1 taken 600 times.
3600 for (level = 4; level >= 0; level--)
321 3000 threshold[level] = threshold[level + 1] * THRESHOLD_MULTIPLIER;
322
/* Plane size in 16x16 blocks, rounded up. */
323 600 block_width = (width + 15) / 16;
324 600 block_height = (height + 15) / 16;
325
326
/* ---- Pass 1 (P-frames only): motion estimation ---- */
2/2
✓ Branch 0 taken 540 times.
✓ Branch 1 taken 60 times.
600 if (s->pict_type == AV_PICTURE_TYPE_P) {
/* Configure the embedded MpegEncContext for this plane. */
327 540 s->m.avctx = s->avctx;
328 540 s->m.current_picture_ptr = &s->m.current_picture;
329 540 s->m.last_picture_ptr = &s->m.last_picture;
330 540 s->m.last_picture.f->data[0] = ref_plane;
331 540 s->m.linesize =
332 540 s->m.last_picture.f->linesize[0] =
333 540 s->m.new_picture->linesize[0] =
334 540 s->m.current_picture.f->linesize[0] = stride;
335 540 s->m.width = width;
336 540 s->m.height = height;
337 540 s->m.mb_width = block_width;
338 540 s->m.mb_height = block_height;
339 540 s->m.mb_stride = s->m.mb_width + 1;
340 540 s->m.b8_stride = 2 * s->m.mb_width + 1;
341 540 s->m.f_code = 1;
342 540 s->m.pict_type = s->pict_type;
343 540 s->m.motion_est = s->motion_est;
344 540 s->m.me.scene_change_score = 0;
345 // s->m.out_format = FMT_H263;
346 // s->m.unrestricted_mv = 1;
347 540 s->m.lambda = s->quality;
348 540 s->m.qscale = s->m.lambda * 139 +
349 540 FF_LAMBDA_SCALE * 64 >>
350 FF_LAMBDA_SHIFT + 7;
351 540 s->m.lambda2 = s->m.lambda * s->m.lambda +
352 540 FF_LAMBDA_SCALE / 2 >>
353 FF_LAMBDA_SHIFT;
354
355
/* Allocate this plane's motion vector tables on first use. */
2/2
✓ Branch 0 taken 12 times.
✓ Branch 1 taken 528 times.
540 if (!s->motion_val8[plane]) {
356 24 s->motion_val8[plane] = av_mallocz((s->m.b8_stride *
357 12 block_height * 2 + 2) *
358 2 * sizeof(int16_t));
359 24 s->motion_val16[plane] = av_mallocz((s->m.mb_stride *
360 12 (block_height + 2) + 1) *
361 2 * sizeof(int16_t));
362
2/4
✓ Branch 0 taken 12 times.
✗ Branch 1 not taken.
✗ Branch 2 not taken.
✓ Branch 3 taken 12 times.
12 if (!s->motion_val8[plane] || !s->motion_val16[plane])
363 return AVERROR(ENOMEM);
364 }
365
366 540 s->m.mb_type = s->mb_type;
367
368 // dummies, to avoid segfaults
369 540 s->m.mb_mean = (uint8_t *)s->dummy;
370 540 s->m.mb_var = (uint16_t *)s->dummy;
371 540 s->m.mc_mb_var = (uint16_t *)s->dummy;
372 540 s->m.current_picture.mb_type = s->dummy;
373
374 540 s->m.current_picture.motion_val[0] = s->motion_val8[plane] + 2;
375 540 s->m.p_mv_table = s->motion_val16[plane] +
376 540 s->m.mb_stride + 1;
377 540 s->m.mecc = s->mecc; // move
378 540 ff_init_me(&s->m);
379
380 540 s->m.me.dia_size = s->avctx->dia_size;
381 540 s->m.first_slice_line = 1;
382
2/2
✓ Branch 0 taken 4005 times.
✓ Branch 1 taken 540 times.
4545 for (y = 0; y < block_height; y++) {
/* Only one block row of source is buffered; bias the picture pointer
 * so that picture row 16 * y maps onto the start of src. */
383 4005 s->m.new_picture->data[0] = src - y * 16 * stride; // ugly
384 4005 s->m.mb_y = y;
385
386
/* Copy the block row from the input and replicate the last sample of
 * each line up to the padded width. */
4/4
✓ Branch 0 taken 60975 times.
✓ Branch 1 taken 3600 times.
✓ Branch 2 taken 60570 times.
✓ Branch 3 taken 405 times.
64575 for (i = 0; i < 16 && i + 16 * y < height; i++) {
387 60570 memcpy(&src[i * stride], &src_plane[(i + 16 * y) * src_stride],
388 width);
389
2/2
✓ Branch 0 taken 182700 times.
✓ Branch 1 taken 60570 times.
243270 for (x = width; x < 16 * block_width; x++)
390 182700 src[i * stride + x] = src[i * stride + x - 1];
391 }
392
/* Below the picture: repeat the previous buffered line. */
3/4
✓ Branch 0 taken 3510 times.
✓ Branch 1 taken 4005 times.
✓ Branch 2 taken 3510 times.
✗ Branch 3 not taken.
7515 for (; i < 16 && i + 16 * y < 16 * block_height; i++)
393 3510 memcpy(&src[i * stride], &src[(i - 1) * stride],
394 3510 16 * block_width);
395
396
2/2
✓ Branch 0 taken 62055 times.
✓ Branch 1 taken 4005 times.
66060 for (x = 0; x < block_width; x++) {
397 62055 s->m.mb_x = x;
398 62055 init_block_index(&s->m);
399
400 62055 ff_estimate_p_frame_motion(&s->m, x, y);
401 }
402 4005 s->m.first_slice_line = 0;
403 }
404
405 540 ff_fix_long_p_mvs(&s->m, CANDIDATE_MB_TYPE_INTRA);
406 540 ff_fix_long_mvs(&s->m, NULL, 0, s->m.p_mv_table, s->m.f_code,
407 CANDIDATE_MB_TYPE_INTER, 0);
408 }
409
/* ---- Pass 2: mode decision and bitstream output ---- */
410 600 s->m.first_slice_line = 1;
411
2/2
✓ Branch 0 taken 4450 times.
✓ Branch 1 taken 600 times.
5050 for (y = 0; y < block_height; y++) {
412
/* Refill the padded source block row (same procedure as in pass 1). */
4/4
✓ Branch 0 taken 67750 times.
✓ Branch 1 taken 4000 times.
✓ Branch 2 taken 67300 times.
✓ Branch 3 taken 450 times.
71750 for (i = 0; i < 16 && i + 16 * y < height; i++) {
413 67300 memcpy(&src[i * stride], &src_plane[(i + 16 * y) * src_stride],
414 width);
415
2/2
✓ Branch 0 taken 203000 times.
✓ Branch 1 taken 67300 times.
270300 for (x = width; x < 16 * block_width; x++)
416 203000 src[i * stride + x] = src[i * stride + x - 1];
417 }
418
3/4
✓ Branch 0 taken 3900 times.
✓ Branch 1 taken 4450 times.
✓ Branch 2 taken 3900 times.
✗ Branch 3 not taken.
8350 for (; i < 16 && i + 16 * y < 16 * block_height; i++)
419 3900 memcpy(&src[i * stride], &src[(i - 1) * stride], 16 * block_width);
420
421 4450 s->m.mb_y = y;
422
2/2
✓ Branch 0 taken 68950 times.
✓ Branch 1 taken 4450 times.
73400 for (x = 0; x < block_width; x++) {
/* Index 0 of reorder_buffer / count / score belongs to the intra
 * candidate, index 1 to the inter candidate; score[2] is the skip. */
423 uint8_t reorder_buffer[2][6][7 * 32];
424 int count[2][6];
425 68950 int offset = y * 16 * stride + x * 16;
426 68950 uint8_t *decoded = decoded_plane + offset;
427 68950 const uint8_t *ref = ref_plane + offset;
428 68950 int score[4] = { 0, 0, 0, 0 }, best;
429 68950 uint8_t *temp = s->scratchbuf;
430
431
1/2
✗ Branch 1 not taken.
✓ Branch 2 taken 68950 times.
68950 if (put_bytes_left(pb, 0) < 3000) { // FIXME: check size
432 av_log(s->avctx, AV_LOG_ERROR, "encoded frame too large\n");
433 return -1;
434 }
435
436 68950 s->m.mb_x = x;
437 68950 init_block_index(&s->m);
438
439
/* Intra candidate: reconstructed into temp, not into decoded. */
2/2
✓ Branch 0 taken 62055 times.
✓ Branch 1 taken 6895 times.
68950 if (s->pict_type == AV_PICTURE_TYPE_I ||
440
2/2
✓ Branch 0 taken 3450 times.
✓ Branch 1 taken 58605 times.
62055 (s->m.mb_type[x + y * s->m.mb_stride] &
441 CANDIDATE_MB_TYPE_INTRA)) {
442
2/2
✓ Branch 0 taken 62070 times.
✓ Branch 1 taken 10345 times.
72415 for (i = 0; i < 6; i++)
443 62070 init_put_bits(&s->reorder_pb[i], reorder_buffer[0][i],
444 7 * 32);
445
/* In P-frames an intra block is announced by a block type code. */
2/2
✓ Branch 0 taken 3450 times.
✓ Branch 1 taken 6895 times.
10345 if (s->pict_type == AV_PICTURE_TYPE_P) {
446 3450 put_bits(&s->reorder_pb[5], SVQ1_BLOCK_INTRA_LEN, SVQ1_BLOCK_INTRA_CODE);
447 3450 score[0] = SVQ1_BLOCK_INTRA_LEN * lambda;
448 }
449 10345 score[0] += encode_block(s, src + 16 * x, NULL, temp, stride,
450 5, 64, lambda, 1);
451
2/2
✓ Branch 0 taken 62070 times.
✓ Branch 1 taken 10345 times.
72415 for (i = 0; i < 6; i++) {
452 62070 count[0][i] = put_bits_count(&s->reorder_pb[i]);
453 62070 flush_put_bits(&s->reorder_pb[i]);
454 }
455 } else
456 58605 score[0] = INT_MAX;
457
458 68950 best = 0;
459
460
2/2
✓ Branch 0 taken 62055 times.
✓ Branch 1 taken 6895 times.
68950 if (s->pict_type == AV_PICTURE_TYPE_P) {
461 int mx, my, pred_x, pred_y, dxy;
462 int16_t *motion_ptr;
463
464 62055 motion_ptr = ff_h263_pred_motion(&s->m, 0, 0, &pred_x, &pred_y);
465
/* Inter candidate. */
2/2
✓ Branch 0 taken 58605 times.
✓ Branch 1 taken 3450 times.
62055 if (s->m.mb_type[x + y * s->m.mb_stride] &
466 CANDIDATE_MB_TYPE_INTER) {
467
2/2
✓ Branch 0 taken 351630 times.
✓ Branch 1 taken 58605 times.
410235 for (i = 0; i < 6; i++)
468 351630 init_put_bits(&s->reorder_pb[i], reorder_buffer[1][i],
469 7 * 32);
470
471 58605 put_bits(&s->reorder_pb[5], SVQ1_BLOCK_INTER_LEN, SVQ1_BLOCK_INTER_CODE);
472
/* The motion vector difference is written through a temporary copy
 * of the level-5 bit writer, which is copied back afterwards. */
473 58605 s->m.pb = s->reorder_pb[5];
474 58605 mx = motion_ptr[0];
475 58605 my = motion_ptr[1];
476 av_assert1(mx >= -32 && mx <= 31);
477 av_assert1(my >= -32 && my <= 31);
478 av_assert1(pred_x >= -32 && pred_x <= 31);
479 av_assert1(pred_y >= -32 && pred_y <= 31);
480 58605 ff_h263_encode_motion(&s->m.pb, mx - pred_x, 1);
481 58605 ff_h263_encode_motion(&s->m.pb, my - pred_y, 1);
482 58605 s->reorder_pb[5] = s->m.pb;
483 58605 score[1] += lambda * put_bits_count(&s->reorder_pb[5]);
484
/* The low bit of each vector component selects the half-pel
 * interpolation variant; the remaining bits are the full-pel offset. */
485 58605 dxy = (mx & 1) + 2 * (my & 1);
486
/* Build the motion-compensated prediction in scratch rows 16..31. */
487 58605 s->hdsp.put_pixels_tab[0][dxy](temp + 16*stride,
488 58605 ref + (mx >> 1) +
489 58605 stride * (my >> 1),
490 stride, 16);
491
492 58605 score[1] += encode_block(s, src + 16 * x, temp + 16*stride,
493 decoded, stride, 5, 64, lambda, 0);
494 58605 best = score[1] <= score[0];
495
/* Skip candidate: distortion of the co-located reference block plus
 * the cost of the skip code. */
496 58605 score[2] = s->mecc.sse[0](NULL, src + 16 * x, ref,
497 stride, 16);
498 58605 score[2] += SVQ1_BLOCK_SKIP_LEN * lambda;
499
6/6
✓ Branch 0 taken 119 times.
✓ Branch 1 taken 58486 times.
✓ Branch 2 taken 88 times.
✓ Branch 3 taken 31 times.
✓ Branch 4 taken 83 times.
✓ Branch 5 taken 5 times.
58605 if (score[2] < score[best] && mx == 0 && my == 0) {
500 83 best = 2;
501 83 s->hdsp.put_pixels_tab[0][0](decoded, ref, stride, 16);
502 83 put_bits(pb, SVQ1_BLOCK_SKIP_LEN, SVQ1_BLOCK_SKIP_CODE);
503 }
504 }
505
506
2/2
✓ Branch 0 taken 58522 times.
✓ Branch 1 taken 3533 times.
62055 if (best == 1) {
507
2/2
✓ Branch 0 taken 351132 times.
✓ Branch 1 taken 58522 times.
409654 for (i = 0; i < 6; i++) {
508 351132 count[1][i] = put_bits_count(&s->reorder_pb[i]);
509 351132 flush_put_bits(&s->reorder_pb[i]);
510 }
511 } else {
/* Block is not inter coded: zero its 2x2 group of stored motion
 * vectors (two vectors on this row, two on the next). */
512 3533 motion_ptr[0] =
513 3533 motion_ptr[1] =
514 3533 motion_ptr[2] =
515 3533 motion_ptr[3] =
516 3533 motion_ptr[0 + 2 * s->m.b8_stride] =
517 3533 motion_ptr[1 + 2 * s->m.b8_stride] =
518 3533 motion_ptr[2 + 2 * s->m.b8_stride] =
519 3533 motion_ptr[3 + 2 * s->m.b8_stride] = 0;
520 }
521 }
522
523 68950 s->rd_total += score[best];
524
525
/* Emit the winning candidate's bits, highest level first. The skip
 * code was already written directly to pb. */
2/2
✓ Branch 0 taken 68867 times.
✓ Branch 1 taken 83 times.
68950 if (best != 2)
526
2/2
✓ Branch 0 taken 413202 times.
✓ Branch 1 taken 68867 times.
482069 for (i = 5; i >= 0; i--)
527 413202 ff_copy_bits(pb, reorder_buffer[best][i],
528 count[best][i]);
529
/* The intra reconstruction lives in temp; move it into the picture. */
2/2
✓ Branch 0 taken 10345 times.
✓ Branch 1 taken 58605 times.
68950 if (best == 0)
530 10345 s->hdsp.put_pixels_tab[0][0](decoded, temp, stride, 16);
531 }
532 4450 s->m.first_slice_line = 0;
533 }
534 600 return 0;
535 }
536
/**
 * Encoder close callback: log the accumulated score and free everything
 * the encoder allocated.
 *
 * @param avctx codec context
 * @return always 0
 */
537 4 static av_cold int svq1_encode_end(AVCodecContext *avctx)
538 {
539 4 SVQ1EncContext *const s = avctx->priv_data;
540 int i;
541
542
/* Average score per pixel and frame; skipped when no frame was counted
 * so the divisor cannot be zero for that reason. */
1/2
✓ Branch 0 taken 4 times.
✗ Branch 1 not taken.
4 if (avctx->frame_num)
543 4 av_log(avctx, AV_LOG_DEBUG, "RD: %f\n",
544 4 s->rd_total / (double)(avctx->width * avctx->height *
545 4 avctx->frame_num));
546
/* m.mb_type aliases s->mb_type, which is freed below; it is cleared
 * first (presumably so ff_mpv_common_end() does not free it as well --
 * TODO confirm). */
547 4 s->m.mb_type = NULL;
548 4 ff_mpv_common_end(&s->m);
549
550 4 av_freep(&s->m.me.scratchpad);
551 4 av_freep(&s->m.me.map);
552 4 av_freep(&s->mb_type);
553 4 av_freep(&s->dummy);
554 4 av_freep(&s->scratchbuf);
555
556
2/2
✓ Branch 0 taken 12 times.
✓ Branch 1 taken 4 times.
16 for (i = 0; i < 3; i++) {
557 12 av_freep(&s->motion_val8[i]);
558 12 av_freep(&s->motion_val16[i]);
559 }
560
561 4 av_frame_free(&s->current_picture);
562 4 av_frame_free(&s->last_picture);
563 4 av_frame_free(&s->m.new_picture);
564
565 4 return 0;
566 }
567
/**
 * Build the codec extradata from an identification string.
 *
 * Resulting layout (size = strlen(ident)):
 *   bytes 0-3   total length, size + 8, big-endian
 *   bytes 4-7   MKTAG('S', 'V', 'Q', '1'), stored little-endian
 *   bytes 8-    the ident characters, without a terminating NUL
 *
 * @param avctx codec context whose extradata / extradata_size are set
 * @param ident NUL-terminated identification string
 * @return 0 on success, AVERROR(ENOMEM) if the allocation fails
 */
568 4 static av_cold int write_ident(AVCodecContext *avctx, const char *ident)
569 {
570 4 int size = strlen(ident);
571 4 avctx->extradata = av_malloc(size + 8);
572
1/2
✗ Branch 0 not taken.
✓ Branch 1 taken 4 times.
4 if (!avctx->extradata)
573 return AVERROR(ENOMEM);
574 4 AV_WB32(avctx->extradata, size + 8);
575 4 AV_WL32(avctx->extradata + 4, MKTAG('S', 'V', 'Q', '1'));
576 4 memcpy(avctx->extradata + 8, ident, size);
577 4 avctx->extradata_size = size + 8;
578 4 return 0;
579 }
580
/**
 * Encoder init callback.
 *
 * Rejects dimensions of 4096 or more, initialises the DSP contexts and the
 * embedded MpegEncContext, allocates the picture and work buffers and
 * writes the identification extradata.
 *
 * The error paths return without freeing what was already allocated; the
 * codec is registered with FF_CODEC_CAP_INIT_CLEANUP (presumably so that
 * svq1_encode_end() runs after a failed init -- TODO confirm).
 *
 * @param avctx codec context
 * @return 0 on success, AVERROR(EINVAL) for oversized frames,
 *         AVERROR(ENOMEM) on allocation failure, or the error returned by
 *         ff_mpv_common_init()
 */
581 4 static av_cold int svq1_encode_init(AVCodecContext *avctx)
582 {
583 4 SVQ1EncContext *const s = avctx->priv_data;
584 int ret;
585
586
/* The frame header stores explicit dimensions in 12 bits each. */
2/4
✓ Branch 0 taken 4 times.
✗ Branch 1 not taken.
✗ Branch 2 not taken.
✓ Branch 3 taken 4 times.
4 if (avctx->width >= 4096 || avctx->height >= 4096) {
587 av_log(avctx, AV_LOG_ERROR, "Dimensions too large, maximum is 4095x4095\n");
588 return AVERROR(EINVAL);
589 }
590
591 4 ff_hpeldsp_init(&s->hdsp, avctx->flags);
592 4 ff_me_cmp_init(&s->mecc, avctx);
593 4 ff_mpegvideoencdsp_init(&s->m.mpvencdsp, avctx);
594
595 4 s->current_picture = av_frame_alloc();
596 4 s->last_picture = av_frame_alloc();
597
2/4
✓ Branch 0 taken 4 times.
✗ Branch 1 not taken.
✗ Branch 2 not taken.
✓ Branch 3 taken 4 times.
4 if (!s->current_picture || !s->last_picture) {
598 return AVERROR(ENOMEM);
599 }
600
601 4 s->frame_width = avctx->width;
602 4 s->frame_height = avctx->height;
603
/* Plane sizes in 16x16 blocks; chroma planes are a quarter of the luma
 * size in each direction. */
604 4 s->y_block_width = (s->frame_width + 15) / 16;
605 4 s->y_block_height = (s->frame_height + 15) / 16;
606
607 4 s->c_block_width = (s->frame_width / 4 + 15) / 16;
608 4 s->c_block_height = (s->frame_height / 4 + 15) / 16;
609
610 4 s->avctx = avctx;
611 4 s->m.avctx = avctx;
612
613
1/2
✗ Branch 1 not taken.
✓ Branch 2 taken 4 times.
4 if ((ret = ff_mpv_common_init(&s->m)) < 0) {
614 return ret;
615 }
616
617 4 s->m.picture_structure = PICT_FRAME;
/* me.temp and me.scratchpad share one allocation. */
618 4 s->m.me.temp =
619 8 s->m.me.scratchpad = av_mallocz((avctx->width + 64) *
620 4 2 * 16 * 2 * sizeof(uint8_t));
/* One entry per luma block plus one extra column per block row. */
621 8 s->mb_type = av_mallocz((s->y_block_width + 1) *
622 4 s->y_block_height * sizeof(int16_t));
623 8 s->dummy = av_mallocz((s->y_block_width + 1) *
624 4 s->y_block_height * sizeof(int32_t));
/* Twice ME_MAP_SIZE: the second half is used as score_map below. */
625 4 s->m.me.map = av_mallocz(2 * ME_MAP_SIZE * sizeof(*s->m.me.map));
626 4 s->m.new_picture = av_frame_alloc();
627
628
2/4
✓ Branch 0 taken 4 times.
✗ Branch 1 not taken.
✓ Branch 2 taken 4 times.
✗ Branch 3 not taken.
4 if (!s->m.me.scratchpad || !s->m.me.map ||
629
3/6
✓ Branch 0 taken 4 times.
✗ Branch 1 not taken.
✓ Branch 2 taken 4 times.
✗ Branch 3 not taken.
✗ Branch 4 not taken.
✓ Branch 5 taken 4 times.
4 !s->mb_type || !s->dummy || !s->m.new_picture)
630 return AVERROR(ENOMEM);
631 4 s->m.me.score_map = s->m.me.map + ME_MAP_SIZE;
632
633 4 ff_svq1enc_init(&s->svq1encdsp);
634
635 4 ff_h263_encode_init(&s->m); // mv_penalty
636
637
/* With AV_CODEC_FLAG_BITEXACT the version-independent string "Lavc" is
 * used instead of LIBAVCODEC_IDENT. */
1/2
✓ Branch 0 taken 4 times.
✗ Branch 1 not taken.
4 return write_ident(avctx, s->avctx->flags & AV_CODEC_FLAG_BITEXACT ? "Lavc" : LIBAVCODEC_IDENT);
638 }
639
/**
 * Encode callback: encode one input frame into one packet.
 *
 * Allocates the packet, lazily allocates the reconstruction frames and the
 * scratch buffer, swaps current/last picture, chooses the frame type from
 * gop_size, writes the frame header, encodes the three planes and pads the
 * bitstream with zero bits to a multiple of 32 bits.
 *
 * @param avctx      codec context
 * @param pkt        output packet
 * @param pict       input frame; pict->quality is used as quality
 * @param got_packet set to 1 when a packet was produced
 * @return 0 on success, a negative value on failure
 */
640 200 static int svq1_encode_frame(AVCodecContext *avctx, AVPacket *pkt,
641 const AVFrame *pict, int *got_packet)
642 {
643 200 SVQ1EncContext *const s = avctx->priv_data;
644 PutBitContext pb;
645 int i, ret;
646
647 200 ret = ff_alloc_packet(avctx, pkt, s->y_block_width * s->y_block_height *
648 200 MAX_MB_BYTES * 3 + FF_INPUT_BUFFER_MIN_SIZE);
649
1/2
✗ Branch 0 not taken.
✓ Branch 1 taken 200 times.
200 if (ret < 0)
650 return ret;
651
652
/* NOTE(review): returns a bare -1 rather than an AVERROR code. */
1/2
✗ Branch 0 not taken.
✓ Branch 1 taken 200 times.
200 if (avctx->pix_fmt != AV_PIX_FMT_YUV410P) {
653 av_log(avctx, AV_LOG_ERROR, "unsupported pixel format\n");
654 return -1;
655 }
656
657
/* First call: allocate both reconstruction frames and the scratch
 * buffer (48 lines of the luma linesize). */
2/2
✓ Branch 0 taken 4 times.
✓ Branch 1 taken 196 times.
200 if (!s->current_picture->data[0]) {
658
1/2
✗ Branch 1 not taken.
✓ Branch 2 taken 4 times.
4 if ((ret = ff_encode_alloc_frame(avctx, s->current_picture)) < 0) {
659 return ret;
660 }
661 }
662
2/2
✓ Branch 0 taken 4 times.
✓ Branch 1 taken 196 times.
200 if (!s->last_picture->data[0]) {
663 4 ret = ff_encode_alloc_frame(avctx, s->last_picture);
664
1/2
✗ Branch 0 not taken.
✓ Branch 1 taken 4 times.
4 if (ret < 0)
665 return ret;
666 }
667
2/2
✓ Branch 0 taken 4 times.
✓ Branch 1 taken 196 times.
200 if (!s->scratchbuf) {
668 4 s->scratchbuf = av_malloc_array(s->current_picture->linesize[0], 16 * 3);
669
1/2
✗ Branch 0 not taken.
✓ Branch 1 taken 4 times.
4 if (!s->scratchbuf)
670 return AVERROR(ENOMEM);
671 }
672
/* The previous reconstruction becomes the reference for this frame. */
673 200 FFSWAP(AVFrame*, s->current_picture, s->last_picture);
674
675
/* P-frame unless gop_size is 0 or frame_num is a multiple of gop_size. */
3/4
✓ Branch 0 taken 200 times.
✗ Branch 1 not taken.
✓ Branch 2 taken 180 times.
✓ Branch 3 taken 20 times.
200 if (avctx->gop_size && (avctx->frame_num % avctx->gop_size))
676 180 s->pict_type = AV_PICTURE_TYPE_P;
677 else
678 20 s->pict_type = AV_PICTURE_TYPE_I;
679 200 s->quality = pict->quality;
680
681 200 ff_side_data_set_encoder_stats(pkt, pict->quality, NULL, 0, s->pict_type);
682
683 200 init_put_bits(&pb, pkt->data, pkt->size);
684 200 svq1_write_header(s, &pb, s->pict_type);
685
/* Plane 0 uses the full frame size, planes 1 and 2 a quarter of it in
 * each direction. */
2/2
✓ Branch 0 taken 600 times.
✓ Branch 1 taken 200 times.
800 for (i = 0; i < 3; i++) {
/* NOTE(review): this declaration shadows the outer ret. */
686 1800 int ret = svq1_encode_plane(s, i, &pb,
687 600 pict->data[i],
688 600 s->last_picture->data[i],
689 600 s->current_picture->data[i],
690
2/2
✓ Branch 0 taken 400 times.
✓ Branch 1 taken 200 times.
600 s->frame_width / (i ? 4 : 1),
691 600 s->frame_height / (i ? 4 : 1),
692 600 pict->linesize[i],
693
2/2
✓ Branch 0 taken 400 times.
✓ Branch 1 taken 200 times.
600 s->current_picture->linesize[i]);
694 600 emms_c();
695
/* NOTE(review): only the tables of planes before i are freed here (the
 * rest are released in svq1_encode_end()), and the specific error code
 * in ret is replaced by -1. */
1/2
✗ Branch 0 not taken.
✓ Branch 1 taken 600 times.
600 if (ret < 0) {
696 int j;
697 for (j = 0; j < i; j++) {
698 av_freep(&s->motion_val8[j]);
699 av_freep(&s->motion_val16[j]);
700 }
701 av_freep(&s->scratchbuf);
702 return -1;
703 }
704 }
705
706 // align_put_bits(&pb);
707
/* Pad with zero bits until the bit count is a multiple of 32. */
2/2
✓ Branch 1 taken 3154 times.
✓ Branch 2 taken 200 times.
3354 while (put_bits_count(&pb) & 31)
708 3154 put_bits(&pb, 1, 0);
709
710 200 flush_put_bits(&pb);
711
712 200 pkt->size = put_bytes_output(&pb);
713
2/2
✓ Branch 0 taken 20 times.
✓ Branch 1 taken 180 times.
200 if (s->pict_type == AV_PICTURE_TYPE_I)
714 20 pkt->flags |= AV_PKT_FLAG_KEY;
715 200 *got_packet = 1;
716
717 200 return 0;
718 }
719
/* OFFSET(x): byte offset of field x inside SVQ1EncContext.
 * VE: flag set marking an option as a video encoding parameter. */
720 #define OFFSET(x) offsetof(struct SVQ1EncContext, x)
721 #define VE AV_OPT_FLAG_VIDEO_PARAM | AV_OPT_FLAG_ENCODING_PARAM
/* Private options: "motion-est" selects the motion estimation algorithm
 * (default FF_ME_EPZS, range FF_ME_ZERO..FF_ME_XONE) and is stored in
 * SVQ1EncContext.motion_est; "zero", "epzs" and "xone" are its named values.
 * NOTE(review): the option itself uses VE while the named constants use
 * FF_MPV_OPT_FLAGS -- confirm whether the two are meant to differ. */
722 static const AVOption options[] = {
723 { "motion-est", "Motion estimation algorithm", OFFSET(motion_est), AV_OPT_TYPE_INT, { .i64 = FF_ME_EPZS }, FF_ME_ZERO, FF_ME_XONE, VE, .unit = "motion-est"},
724 { "zero", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = FF_ME_ZERO }, 0, 0, FF_MPV_OPT_FLAGS, .unit = "motion-est" },
725 { "epzs", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = FF_ME_EPZS }, 0, 0, FF_MPV_OPT_FLAGS, .unit = "motion-est" },
726 { "xone", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = FF_ME_XONE }, 0, 0, FF_MPV_OPT_FLAGS, .unit = "motion-est" },
727
728 { NULL },
729 };
730
/* AVClass of the encoder's private context; exposes the options table. */
731 static const AVClass svq1enc_class = {
732 .class_name = "svq1enc",
733 .item_name = av_default_item_name,
734 .option = options,
735 .version = LIBAVUTIL_VERSION_INT,
736 };
737
/* Codec registration entry for the SVQ1 encoder: wires up the init, encode
 * and close callbacks defined in this file and declares
 * AV_PIX_FMT_YUV410P as the only supported pixel format. */
738 const FFCodec ff_svq1_encoder = {
739 .p.name = "svq1",
740 CODEC_LONG_NAME("Sorenson Vector Quantizer 1 / Sorenson Video 1 / SVQ1"),
741 .p.type = AVMEDIA_TYPE_VIDEO,
742 .p.id = AV_CODEC_ID_SVQ1,
743 .p.capabilities = AV_CODEC_CAP_DR1 | AV_CODEC_CAP_ENCODER_REORDERED_OPAQUE,
744 .priv_data_size = sizeof(SVQ1EncContext),
745 .p.priv_class = &svq1enc_class,
746 .init = svq1_encode_init,
747 FF_CODEC_ENCODE_CB(svq1_encode_frame),
748 .close = svq1_encode_end,
749 .p.pix_fmts = (const enum AVPixelFormat[]) { AV_PIX_FMT_YUV410P,
750 AV_PIX_FMT_NONE },
751 .caps_internal = FF_CODEC_CAP_INIT_CLEANUP,
752 };
753