FFmpeg coverage


Directory: ../../../ffmpeg/
File: src/libavcodec/snow.h
Date: 2024-11-20 23:03:26
Exec Total Coverage
Lines: 149 156 95.5%
Functions: 6 6 100.0%
Branches: 92 96 95.8%

Line Branch Exec Source
1 /*
2 * Copyright (C) 2004 Michael Niedermayer <michaelni@gmx.at>
3 * Copyright (C) 2006 Robert Edele <yartrebo@earthlink.net>
4 *
5 * This file is part of FFmpeg.
6 *
7 * FFmpeg is free software; you can redistribute it and/or
8 * modify it under the terms of the GNU Lesser General Public
9 * License as published by the Free Software Foundation; either
10 * version 2.1 of the License, or (at your option) any later version.
11 *
12 * FFmpeg is distributed in the hope that it will be useful,
13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
15 * Lesser General Public License for more details.
16 *
17 * You should have received a copy of the GNU Lesser General Public
18 * License along with FFmpeg; if not, write to the Free Software
19 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
20 */
21
22 #ifndef AVCODEC_SNOW_H
23 #define AVCODEC_SNOW_H
24
25 #include "libavutil/motion_vector.h"
26
27 #include "avcodec.h"
28 #include "hpeldsp.h"
29 #include "snow_dwt.h"
30
31 #include "rangecoder.h"
32 #include "mathops.h"
33
34 #include "h264qpel.h"
35 #include "videodsp.h"
36
37 #define SNOW_MAX_PLANES 4
38
39 #define MID_STATE 128
40
41 #define MAX_PLANES 4
42 #define QSHIFT 5
43 #define QROOT (1<<QSHIFT)
44 #define LOSSLESS_QLOG -128
45 #define FRAC_BITS 4
46 #define MAX_REF_FRAMES 8
47
48 #define LOG2_OBMC_MAX 8
49 #define OBMC_MAX (1<<(LOG2_OBMC_MAX))
50 typedef struct BlockNode{
51 int16_t mx; ///< Motion vector component X, see mv_scale
52 int16_t my; ///< Motion vector component Y, see mv_scale
53 uint8_t ref; ///< Reference frame index
54 uint8_t color[3]; ///< Color for intra
55 uint8_t type; ///< Bitfield of BLOCK_*
56 //#define TYPE_SPLIT 1
57 #define BLOCK_INTRA 1 ///< Intra block, inter otherwise
58 #define BLOCK_OPT 2 ///< Block needs no checks in this round of iterative motion estimation
59 //#define TYPE_NOCOLOR 4
60 uint8_t level; //FIXME merge into type?
61 }BlockNode;
62
63 static const BlockNode null_block= { //FIXME add border maybe
64 .color= {128,128,128},
65 .mx= 0,
66 .my= 0,
67 .ref= 0,
68 .type= 0,
69 .level= 0,
70 };
71
72 #define LOG2_MB_SIZE 4
73 #define MB_SIZE (1<<LOG2_MB_SIZE)
74 #define ENCODER_EXTRA_BITS 4
75 #define HTAPS_MAX 8
76
77 typedef struct x_and_coeff{
78 int16_t x;
79 uint16_t coeff;
80 } x_and_coeff;
81
82 typedef struct SubBand{
83 int level;
84 int stride;
85 int width;
86 int height;
87 int qlog; ///< log(qscale)/log[2^(1/6)]
88 DWTELEM *buf;
89 IDWTELEM *ibuf;
90 int buf_x_offset;
91 int buf_y_offset;
92 int stride_line; ///< Stride measured in lines, not pixels.
93 x_and_coeff * x_coeff;
94 struct SubBand *parent;
95 uint8_t state[/*7*2*/ 7 + 512][32];
96 }SubBand;
97
98 typedef struct Plane{
99 int width;
100 int height;
101 SubBand band[MAX_DECOMPOSITIONS][4];
102
103 int htaps;
104 int8_t hcoeff[HTAPS_MAX/2];
105 int diag_mc;
106 int fast_mc;
107
108 int last_htaps;
109 int8_t last_hcoeff[HTAPS_MAX/2];
110 int last_diag_mc;
111 }Plane;
112
113 typedef struct SnowContext{
114 AVClass *class;
115 AVCodecContext *avctx;
116 RangeCoder c;
117 HpelDSPContext hdsp;
118 VideoDSPContext vdsp;
119 H264QpelContext h264qpel;
120 SnowDWTContext dwt;
121 AVFrame *input_picture; ///< new_picture with the internal linesizes
122 AVFrame *current_picture;
123 AVFrame *last_picture[MAX_REF_FRAMES];
124 AVFrame *mconly_picture;
125 // uint8_t q_context[16];
126 uint8_t header_state[32];
127 uint8_t block_state[128 + 32*128];
128 int keyframe;
129 int always_reset;
130 int version;
131 int spatial_decomposition_type;
132 int last_spatial_decomposition_type;
133 int temporal_decomposition_type;
134 int spatial_decomposition_count;
135 int last_spatial_decomposition_count;
136 int temporal_decomposition_count;
137 int max_ref_frames;
138 int ref_frames;
139 int16_t (*ref_mvs[MAX_REF_FRAMES])[2];
140 uint32_t *ref_scores[MAX_REF_FRAMES];
141 DWTELEM *spatial_dwt_buffer;
142 DWTELEM *temp_dwt_buffer;
143 IDWTELEM *spatial_idwt_buffer;
144 IDWTELEM *temp_idwt_buffer;
145 int *run_buffer;
146 int colorspace_type;
147 int chroma_h_shift;
148 int chroma_v_shift;
149 int spatial_scalability;
150 int qlog;
151 int last_qlog;
152 int mv_scale;
153 int last_mv_scale;
154 int qbias;
155 int last_qbias;
156 #define QBIAS_SHIFT 3
157 int b_width;
158 int b_height;
159 int block_max_depth;
160 int last_block_max_depth;
161 int nb_planes;
162 Plane plane[MAX_PLANES];
163 BlockNode *block;
164 slice_buffer sb;
165
166 uint8_t *scratchbuf;
167 uint8_t *emu_edge_buffer;
168
169 AVMotionVector *avmv;
170 unsigned avmv_size;
171 int avmv_index;
172 }SnowContext;
173
174 /* Tables */
175 extern const uint8_t * const ff_obmc_tab[4];
176 extern const uint8_t ff_qexp[QROOT];
177 extern int ff_scale_mv_ref[MAX_REF_FRAMES][MAX_REF_FRAMES];
178
179 /* common code */
180
181 int ff_snow_common_init(AVCodecContext *avctx);
182 int ff_snow_common_init_after_header(AVCodecContext *avctx);
183 void ff_snow_common_end(SnowContext *s);
184 void ff_snow_release_buffer(AVCodecContext *avctx);
185 void ff_snow_reset_contexts(SnowContext *s);
186 int ff_snow_alloc_blocks(SnowContext *s);
187 int ff_snow_frames_prepare(SnowContext *s);
188 void ff_snow_pred_block(SnowContext *s, uint8_t *dst, uint8_t *tmp, ptrdiff_t stride,
189 int sx, int sy, int b_w, int b_h, const BlockNode *block,
190 int plane_index, int w, int h);
191 /* common inline functions */
192 //XXX doublecheck all of them should stay inlined
193
194 1898120 static inline void pred_mv(SnowContext *s, int *mx, int *my, int ref,
195 const BlockNode *left, const BlockNode *top, const BlockNode *tr){
196
1/2
✓ Branch 0 taken 1898120 times.
✗ Branch 1 not taken.
1898120 if(s->ref_frames == 1){
197 1898120 *mx = mid_pred(left->mx, top->mx, tr->mx);
198 1898120 *my = mid_pred(left->my, top->my, tr->my);
199 }else{
200 const int *scale = ff_scale_mv_ref[ref];
201 *mx = mid_pred((left->mx * scale[left->ref] + 128) >>8,
202 (top ->mx * scale[top ->ref] + 128) >>8,
203 (tr ->mx * scale[tr ->ref] + 128) >>8);
204 *my = mid_pred((left->my * scale[left->ref] + 128) >>8,
205 (top ->my * scale[top ->ref] + 128) >>8,
206 (tr ->my * scale[tr ->ref] + 128) >>8);
207 }
208 1898120 }
209
210 16120402 static av_always_inline int same_block(BlockNode *a, BlockNode *b){
211
4/4
✓ Branch 0 taken 1856778 times.
✓ Branch 1 taken 14263624 times.
✓ Branch 2 taken 1027453 times.
✓ Branch 3 taken 829325 times.
16120402 if((a->type&BLOCK_INTRA) && (b->type&BLOCK_INTRA)){
212 1027453 return !((a->color[0] - b->color[0]) | (a->color[1] - b->color[1]) | (a->color[2] - b->color[2]));
213 }else{
214 15092949 return !((a->mx - b->mx) | (a->my - b->my) | (a->ref - b->ref) | ((a->type ^ b->type)&BLOCK_INTRA));
215 }
216 }
217
218 //FIXME name cleanup (b_w, block_w, b_width stuff)
219 //XXX should we really inline it?
220 3077196 static av_always_inline void add_yblock(SnowContext *s, int sliced, slice_buffer *sb, IDWTELEM *dst, uint8_t *dst8, const uint8_t *obmc, int src_x, int src_y, int b_w, int b_h, int w, int h, int dst_stride, int src_stride, int obmc_stride, int b_x, int b_y, int add, int offset_dst, int plane_index){
221 3077196 const int b_width = s->b_width << s->block_max_depth;
222 3077196 const int b_height= s->b_height << s->block_max_depth;
223 3077196 const int b_stride= b_width;
224 3077196 BlockNode *lt= &s->block[b_x + b_y*b_stride];
225 3077196 BlockNode *rt= lt+1;
226 3077196 BlockNode *lb= lt+b_stride;
227 3077196 BlockNode *rb= lb+1;
228 uint8_t *block[4];
229 // When src_stride is large enough, it is possible to interleave the blocks.
230 // Otherwise the blocks are written sequentially in the tmp buffer.
231
2/2
✓ Branch 0 taken 24300 times.
✓ Branch 1 taken 3052896 times.
3077196 int tmp_step= src_stride >= 7*MB_SIZE ? MB_SIZE : MB_SIZE*src_stride;
232 3077196 uint8_t *tmp = s->scratchbuf;
233 uint8_t *ptmp;
234 int x,y;
235
236
2/2
✓ Branch 0 taken 80121 times.
✓ Branch 1 taken 2997075 times.
3077196 if(b_x<0){
237 80121 lt= rt;
238 80121 lb= rb;
239
2/2
✓ Branch 0 taken 77253 times.
✓ Branch 1 taken 2919822 times.
2997075 }else if(b_x + 1 >= b_width){
240 77253 rt= lt;
241 77253 rb= lb;
242 }
243
2/2
✓ Branch 0 taken 118116 times.
✓ Branch 1 taken 2959080 times.
3077196 if(b_y<0){
244 118116 lt= lb;
245 118116 rt= rb;
246
2/2
✓ Branch 0 taken 109416 times.
✓ Branch 1 taken 2849664 times.
2959080 }else if(b_y + 1 >= b_height){
247 109416 lb= lt;
248 109416 rb= rt;
249 }
250
251
2/2
✓ Branch 0 taken 80121 times.
✓ Branch 1 taken 2997075 times.
3077196 if(src_x<0){ //FIXME merge with prev & always round internal width up to *16
252 80121 obmc -= src_x;
253 80121 b_w += src_x;
254
4/4
✓ Branch 0 taken 61086 times.
✓ Branch 1 taken 19035 times.
✓ Branch 2 taken 13446 times.
✓ Branch 3 taken 47640 times.
80121 if(!sliced && !offset_dst)
255 13446 dst -= src_x;
256 80121 src_x=0;
257 }
258
2/2
✓ Branch 0 taken 77253 times.
✓ Branch 1 taken 2999943 times.
3077196 if(src_x + b_w > w){
259 77253 b_w = w - src_x;
260 }
261
2/2
✓ Branch 0 taken 118116 times.
✓ Branch 1 taken 2959080 times.
3077196 if(src_y<0){
262 118116 obmc -= src_y*obmc_stride;
263 118116 b_h += src_y;
264
4/4
✓ Branch 0 taken 92601 times.
✓ Branch 1 taken 25515 times.
✓ Branch 2 taken 29652 times.
✓ Branch 3 taken 62949 times.
118116 if(!sliced && !offset_dst)
265 29652 dst -= src_y*dst_stride;
266 118116 src_y=0;
267 }
268
2/2
✓ Branch 0 taken 109416 times.
✓ Branch 1 taken 2967780 times.
3077196 if(src_y + b_h> h){
269 109416 b_h = h - src_y;
270 }
271
272
2/4
✓ Branch 0 taken 3077196 times.
✗ Branch 1 not taken.
✗ Branch 2 not taken.
✓ Branch 3 taken 3077196 times.
3077196 if(b_w<=0 || b_h<=0) return;
273
274
4/4
✓ Branch 0 taken 2366421 times.
✓ Branch 1 taken 710775 times.
✓ Branch 2 taken 2147565 times.
✓ Branch 3 taken 218856 times.
3077196 if(!sliced && offset_dst)
275 2147565 dst += src_x + src_y*dst_stride;
276 3077196 dst8+= src_x + src_y*src_stride;
277 // src += src_x + src_y*src_stride;
278
279 3077196 ptmp= tmp + 3*tmp_step;
280 3077196 block[0]= ptmp;
281 3077196 ptmp+=tmp_step;
282 3077196 ff_snow_pred_block(s, block[0], tmp, src_stride, src_x, src_y, b_w, b_h, lt, plane_index, w, h);
283
284
2/2
✓ Branch 1 taken 845676 times.
✓ Branch 2 taken 2231520 times.
3077196 if(same_block(lt, rt)){
285 845676 block[1]= block[0];
286 }else{
287 2231520 block[1]= ptmp;
288 2231520 ptmp+=tmp_step;
289 2231520 ff_snow_pred_block(s, block[1], tmp, src_stride, src_x, src_y, b_w, b_h, rt, plane_index, w, h);
290 }
291
292
2/2
✓ Branch 1 taken 871989 times.
✓ Branch 2 taken 2205207 times.
3077196 if(same_block(lt, lb)){
293 871989 block[2]= block[0];
294
2/2
✓ Branch 1 taken 208509 times.
✓ Branch 2 taken 1996698 times.
2205207 }else if(same_block(rt, lb)){
295 208509 block[2]= block[1];
296 }else{
297 1996698 block[2]= ptmp;
298 1996698 ptmp+=tmp_step;
299 1996698 ff_snow_pred_block(s, block[2], tmp, src_stride, src_x, src_y, b_w, b_h, lb, plane_index, w, h);
300 }
301
302
2/2
✓ Branch 1 taken 481413 times.
✓ Branch 2 taken 2595783 times.
3077196 if(same_block(lt, rb) ){
303 481413 block[3]= block[0];
304
2/2
✓ Branch 1 taken 526197 times.
✓ Branch 2 taken 2069586 times.
2595783 }else if(same_block(rt, rb)){
305 526197 block[3]= block[1];
306
2/2
✓ Branch 1 taken 396564 times.
✓ Branch 2 taken 1673022 times.
2069586 }else if(same_block(lb, rb)){
307 396564 block[3]= block[2];
308 }else{
309 1673022 block[3]= ptmp;
310 1673022 ff_snow_pred_block(s, block[3], tmp, src_stride, src_x, src_y, b_w, b_h, rb, plane_index, w, h);
311 }
312
2/2
✓ Branch 0 taken 710775 times.
✓ Branch 1 taken 2366421 times.
3077196 if(sliced){
313 710775 s->dwt.inner_add_yblock(obmc, obmc_stride, block, b_w, b_h, src_x,src_y, src_stride, sb, add, dst8);
314 }else{
315
2/2
✓ Branch 0 taken 14261952 times.
✓ Branch 1 taken 2366421 times.
16628373 for(y=0; y<b_h; y++){
316 //FIXME ugly misuse of obmc_stride
317 14261952 const uint8_t *obmc1= obmc + y*obmc_stride;
318 14261952 const uint8_t *obmc2= obmc1+ (obmc_stride>>1);
319 14261952 const uint8_t *obmc3= obmc1+ obmc_stride*(obmc_stride>>1);
320 14261952 const uint8_t *obmc4= obmc3+ (obmc_stride>>1);
321
2/2
✓ Branch 0 taken 107184672 times.
✓ Branch 1 taken 14261952 times.
121446624 for(x=0; x<b_w; x++){
322 107184672 int v= obmc1[x] * block[3][x + y*src_stride]
323 107184672 +obmc2[x] * block[2][x + y*src_stride]
324 107184672 +obmc3[x] * block[1][x + y*src_stride]
325 107184672 +obmc4[x] * block[0][x + y*src_stride];
326
327 107184672 v <<= 8 - LOG2_OBMC_MAX;
328 if(FRAC_BITS != 8){
329 107184672 v >>= 8 - FRAC_BITS;
330 }
331
2/2
✓ Branch 0 taken 59927040 times.
✓ Branch 1 taken 47257632 times.
107184672 if(add){
332 59927040 v += dst[x + y*dst_stride];
333 59927040 v = (v + (1<<(FRAC_BITS-1))) >> FRAC_BITS;
334
2/2
✓ Branch 0 taken 1126 times.
✓ Branch 1 taken 59925914 times.
59927040 if(v&(~255)) v= ~(v>>31);
335 59927040 dst8[x + y*src_stride] = v;
336 }else{
337 47257632 dst[x + y*dst_stride] -= v;
338 }
339 }
340 }
341 }
342 }
343
344 51870 static av_always_inline void predict_slice(SnowContext *s, IDWTELEM *buf, int plane_index, int add, int mb_y){
345 51870 Plane *p= &s->plane[plane_index];
346 51870 const int mb_w= s->b_width << s->block_max_depth;
347 51870 const int mb_h= s->b_height << s->block_max_depth;
348 int x, y, mb_x;
349 51870 int block_size = MB_SIZE >> s->block_max_depth;
350
2/2
✓ Branch 0 taken 34580 times.
✓ Branch 1 taken 17290 times.
51870 int block_w = plane_index ? block_size>>s->chroma_h_shift : block_size;
351
2/2
✓ Branch 0 taken 34580 times.
✓ Branch 1 taken 17290 times.
51870 int block_h = plane_index ? block_size>>s->chroma_v_shift : block_size;
352
2/2
✓ Branch 0 taken 34580 times.
✓ Branch 1 taken 17290 times.
51870 const uint8_t *obmc = plane_index ? ff_obmc_tab[s->block_max_depth+s->chroma_h_shift] : ff_obmc_tab[s->block_max_depth];
353
2/2
✓ Branch 0 taken 34580 times.
✓ Branch 1 taken 17290 times.
51870 const int obmc_stride= plane_index ? (2*block_size)>>s->chroma_h_shift : 2*block_size;
354 51870 int ref_stride= s->current_picture->linesize[plane_index];
355 51870 uint8_t *dst8= s->current_picture->data[plane_index];
356 51870 int w= p->width;
357 51870 int h= p->height;
358 av_assert2(s->chroma_h_shift == s->chroma_v_shift); // obmc params assume squares
359
3/4
✓ Branch 0 taken 47640 times.
✓ Branch 1 taken 4230 times.
✗ Branch 2 not taken.
✓ Branch 3 taken 47640 times.
51870 if(s->keyframe || (s->avctx->debug&512)){
360
2/2
✓ Branch 0 taken 270 times.
✓ Branch 1 taken 3960 times.
4230 if(mb_y==mb_h)
361 270 return;
362
363
2/2
✓ Branch 0 taken 1980 times.
✓ Branch 1 taken 1980 times.
3960 if(add){
364
2/2
✓ Branch 0 taken 12480 times.
✓ Branch 1 taken 1980 times.
14460 for(y=block_h*mb_y; y<FFMIN(h,block_h*(mb_y+1)); y++){
365
2/2
✓ Branch 0 taken 2649600 times.
✓ Branch 1 taken 12480 times.
2662080 for(x=0; x<w; x++){
366 2649600 int v= buf[x + y*w] + (128<<FRAC_BITS) + (1<<(FRAC_BITS-1));
367 2649600 v >>= FRAC_BITS;
368
2/2
✓ Branch 0 taken 104 times.
✓ Branch 1 taken 2649496 times.
2649600 if(v&(~255)) v= ~(v>>31);
369 2649600 dst8[x + y*ref_stride]= v;
370 }
371 }
372 }else{
373
2/2
✓ Branch 0 taken 12480 times.
✓ Branch 1 taken 1980 times.
14460 for(y=block_h*mb_y; y<FFMIN(h,block_h*(mb_y+1)); y++){
374
2/2
✓ Branch 0 taken 2649600 times.
✓ Branch 1 taken 12480 times.
2662080 for(x=0; x<w; x++){
375 2649600 buf[x + y*w]-= 128<<FRAC_BITS;
376 }
377 }
378 }
379
380 3960 return;
381 }
382
383
2/2
✓ Branch 0 taken 2147565 times.
✓ Branch 1 taken 47640 times.
2195205 for(mb_x=0; mb_x<=mb_w; mb_x++){
384 2147565 add_yblock(s, 0, NULL, buf, dst8, obmc,
385 2147565 block_w*mb_x - block_w/2,
386 2147565 block_h*mb_y - block_h/2,
387 block_w, block_h,
388 w, h,
389 w, ref_stride, obmc_stride,
390 mb_x - 1, mb_y - 1,
391 add, 1, plane_index);
392 }
393 }
394
395 2874 static av_always_inline void predict_plane(SnowContext *s, IDWTELEM *buf, int plane_index, int add){
396 2874 const int mb_h= s->b_height << s->block_max_depth;
397 int mb_y;
398
2/2
✓ Branch 0 taken 51870 times.
✓ Branch 1 taken 2874 times.
54744 for(mb_y=0; mb_y<=mb_h; mb_y++)
399 51870 predict_slice(s, buf, plane_index, add, mb_y);
400 2874 }
401
402 693867 static inline void set_blocks(SnowContext *s, int level, int x, int y, int l, int cb, int cr, int mx, int my, int ref, int type){
403 693867 const int w= s->b_width << s->block_max_depth;
404 693867 const int rem_depth= s->block_max_depth - level;
405 693867 const int index= (x + y*w) << rem_depth;
406 693867 const int block_w= 1<<rem_depth;
407 693867 const int block_h= 1<<rem_depth; //FIXME "w!=h"
408 BlockNode block;
409 int i,j;
410
411 693867 block.color[0]= l;
412 693867 block.color[1]= cb;
413 693867 block.color[2]= cr;
414 693867 block.mx= mx;
415 693867 block.my= my;
416 693867 block.ref= ref;
417 693867 block.type= type;
418 693867 block.level= level;
419
420
2/2
✓ Branch 0 taken 729258 times.
✓ Branch 1 taken 693867 times.
1423125 for(j=0; j<block_h; j++){
421
2/2
✓ Branch 0 taken 800040 times.
✓ Branch 1 taken 729258 times.
1529298 for(i=0; i<block_w; i++){
422 800040 s->block[index + i + j*w]= block;
423 }
424 }
425 693867 }
426
427 extern const int8_t ff_quant3bA[256];
428
429 #define QEXPSHIFT (7-FRAC_BITS+8) //FIXME try to change this to 0
430
431 #endif /* AVCODEC_SNOW_H */
432