Directory: | ../../../ffmpeg/ |
---|---|
File: | src/libavcodec/h264_direct.c |
Date: | 2022-07-07 01:21:54 |
Exec | Total | Coverage | |
---|---|---|---|
Lines: | 439 | 445 | 98.7% |
Branches: | 300 | 316 | 94.9% |
Line | Branch | Exec | Source |
---|---|---|---|
1 | /* | ||
2 | * H.26L/H.264/AVC/JVT/14496-10/... direct mb/block decoding | ||
3 | * Copyright (c) 2003 Michael Niedermayer <michaelni@gmx.at> | ||
4 | * | ||
5 | * This file is part of FFmpeg. | ||
6 | * | ||
7 | * FFmpeg is free software; you can redistribute it and/or | ||
8 | * modify it under the terms of the GNU Lesser General Public | ||
9 | * License as published by the Free Software Foundation; either | ||
10 | * version 2.1 of the License, or (at your option) any later version. | ||
11 | * | ||
12 | * FFmpeg is distributed in the hope that it will be useful, | ||
13 | * but WITHOUT ANY WARRANTY; without even the implied warranty of | ||
14 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU | ||
15 | * Lesser General Public License for more details. | ||
16 | * | ||
17 | * You should have received a copy of the GNU Lesser General Public | ||
18 | * License along with FFmpeg; if not, write to the Free Software | ||
19 | * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA | ||
20 | */ | ||
21 | |||
22 | /** | ||
23 | * @file | ||
24 | * H.264 / AVC / MPEG-4 part10 direct mb/block decoding. | ||
25 | * @author Michael Niedermayer <michaelni@gmx.at> | ||
26 | */ | ||
27 | |||
28 | #include "avcodec.h" | ||
29 | #include "h264dec.h" | ||
30 | #include "h264_ps.h" | ||
31 | #include "mpegutils.h" | ||
32 | #include "rectangle.h" | ||
33 | #include "threadframe.h" | ||
34 | |||
35 | #include <assert.h> | ||
36 | |||
37 | 27501 | static int get_scale_factor(H264SliceContext *sl, | |
38 | int poc, int poc1, int i) | ||
39 | { | ||
40 | 27501 | int poc0 = sl->ref_list[0][i].poc; | |
41 | 27501 | int64_t pocdiff = poc1 - (int64_t)poc0; | |
42 | 27501 | int td = av_clip_int8(pocdiff); | |
43 | |||
44 |
1/2✗ Branch 0 not taken.
✓ Branch 1 taken 27501 times.
|
27501 | if (pocdiff != (int)pocdiff) |
45 | ✗ | avpriv_request_sample(sl->h264->avctx, "pocdiff overflow"); | |
46 | |||
47 |
4/4✓ Branch 0 taken 19905 times.
✓ Branch 1 taken 7596 times.
✓ Branch 2 taken 531 times.
✓ Branch 3 taken 19374 times.
|
27501 | if (td == 0 || sl->ref_list[0][i].parent->long_ref) { |
48 | 8127 | return 256; | |
49 | } else { | ||
50 | 19374 | int64_t pocdiff0 = poc - (int64_t)poc0; | |
51 | 19374 | int tb = av_clip_int8(pocdiff0); | |
52 | 19374 | int tx = (16384 + (FFABS(td) >> 1)) / td; | |
53 | |||
54 |
1/2✗ Branch 0 not taken.
✓ Branch 1 taken 19374 times.
|
19374 | if (pocdiff0 != (int)pocdiff0) |
55 | ✗ | av_log(sl->h264->avctx, AV_LOG_DEBUG, "pocdiff0 overflow\n"); | |
56 | |||
57 | 19374 | return av_clip_intp2((tb * tx + 32) >> 6, 10); | |
58 | } | ||
59 | } | ||
60 | |||
61 | 7703 | void ff_h264_direct_dist_scale_factor(const H264Context *const h, | |
62 | H264SliceContext *sl) | ||
63 | { | ||
64 | 18790 | const int poc = FIELD_PICTURE(h) ? h->cur_pic_ptr->field_poc[h->picture_structure == PICT_BOTTOM_FIELD] | |
65 |
2/2✓ Branch 0 taken 3384 times.
✓ Branch 1 taken 4319 times.
|
7703 | : h->cur_pic_ptr->poc; |
66 | 7703 | const int poc1 = sl->ref_list[1][0].poc; | |
67 | int i, field; | ||
68 | |||
69 |
2/2✓ Branch 0 taken 513 times.
✓ Branch 1 taken 7190 times.
|
7703 | if (FRAME_MBAFF(h)) |
70 |
2/2✓ Branch 0 taken 1026 times.
✓ Branch 1 taken 513 times.
|
1539 | for (field = 0; field < 2; field++) { |
71 | 1026 | const int poc = h->cur_pic_ptr->field_poc[field]; | |
72 | 1026 | const int poc1 = sl->ref_list[1][0].parent->field_poc[field]; | |
73 |
2/2✓ Branch 0 taken 6572 times.
✓ Branch 1 taken 1026 times.
|
7598 | for (i = 0; i < 2 * sl->ref_count[0]; i++) |
74 | 6572 | sl->dist_scale_factor_field[field][i ^ field] = | |
75 | 6572 | get_scale_factor(sl, poc, poc1, i + 16); | |
76 | } | ||
77 | |||
78 |
2/2✓ Branch 0 taken 20929 times.
✓ Branch 1 taken 7703 times.
|
28632 | for (i = 0; i < sl->ref_count[0]; i++) |
79 | 20929 | sl->dist_scale_factor[i] = get_scale_factor(sl, poc, poc1, i); | |
80 | 7703 | } | |
81 | |||
82 | 17458 | static void fill_colmap(const H264Context *h, H264SliceContext *sl, | |
83 | int map[2][16 + 32], int list, | ||
84 | int field, int colfield, int mbafi) | ||
85 | { | ||
86 | 17458 | H264Picture *const ref1 = sl->ref_list[1][0].parent; | |
87 | int j, old_ref, rfield; | ||
88 |
2/2✓ Branch 0 taken 2052 times.
✓ Branch 1 taken 15406 times.
|
17458 | int start = mbafi ? 16 : 0; |
89 |
2/2✓ Branch 0 taken 2052 times.
✓ Branch 1 taken 15406 times.
|
17458 | int end = mbafi ? 16 + 2 * sl->ref_count[0] : sl->ref_count[0]; |
90 |
4/4✓ Branch 0 taken 15406 times.
✓ Branch 1 taken 2052 times.
✓ Branch 2 taken 6768 times.
✓ Branch 3 taken 8638 times.
|
17458 | int interl = mbafi || h->picture_structure != PICT_FRAME; |
91 | |||
92 | /* bogus; fills in for missing frames */ | ||
93 | 17458 | memset(map[list], 0, sizeof(map[list])); | |
94 | |||
95 |
2/2✓ Branch 0 taken 34916 times.
✓ Branch 1 taken 17458 times.
|
52374 | for (rfield = 0; rfield < 2; rfield++) { |
96 |
2/2✓ Branch 0 taken 37168 times.
✓ Branch 1 taken 34916 times.
|
72084 | for (old_ref = 0; old_ref < ref1->ref_count[colfield][list]; old_ref++) { |
97 | 37168 | int poc = ref1->ref_poc[colfield][list][old_ref]; | |
98 | |||
99 |
2/2✓ Branch 0 taken 16796 times.
✓ Branch 1 taken 20372 times.
|
37168 | if (!interl) |
100 | 16796 | poc |= 3; | |
101 | // FIXME: store all MBAFF references so this is not needed | ||
102 |
3/4✓ Branch 0 taken 20372 times.
✗ Branch 1 not taken.
✓ Branch 2 taken 5396 times.
✓ Branch 3 taken 14976 times.
|
20372 | else if (interl && (poc & 3) == 3) |
103 | 5396 | poc = (poc & ~3) + rfield + 1; | |
104 | |||
105 |
2/2✓ Branch 0 taken 101132 times.
✓ Branch 1 taken 7392 times.
|
108524 | for (j = start; j < end; j++) { |
106 | 101132 | if (4 * sl->ref_list[0][j].parent->frame_num + | |
107 |
2/2✓ Branch 0 taken 29776 times.
✓ Branch 1 taken 71356 times.
|
101132 | (sl->ref_list[0][j].reference & 3) == poc) { |
108 |
2/2✓ Branch 0 taken 4168 times.
✓ Branch 1 taken 25608 times.
|
29776 | int cur_ref = mbafi ? (j - 16) ^ field : j; |
109 |
2/2✓ Branch 0 taken 5736 times.
✓ Branch 1 taken 24040 times.
|
29776 | if (ref1->mbaff) |
110 | 5736 | map[list][2 * old_ref + (rfield ^ field) + 16] = cur_ref; | |
111 |
4/4✓ Branch 0 taken 14888 times.
✓ Branch 1 taken 14888 times.
✓ Branch 2 taken 6574 times.
✓ Branch 3 taken 8314 times.
|
29776 | if (rfield == field || !interl) |
112 | 21462 | map[list][old_ref] = cur_ref; | |
113 | 29776 | break; | |
114 | } | ||
115 | } | ||
116 | } | ||
117 | } | ||
118 | 17458 | } | |
119 | |||
120 | 34401 | void ff_h264_direct_ref_list_init(const H264Context *const h, H264SliceContext *sl) | |
121 | { | ||
122 | 34401 | H264Ref *const ref1 = &sl->ref_list[1][0]; | |
123 | 34401 | H264Picture *const cur = h->cur_pic_ptr; | |
124 | int list, j, field; | ||
125 | 34401 | int sidx = (h->picture_structure & 1) ^ 1; | |
126 | 34401 | int ref1sidx = (ref1->reference & 1) ^ 1; | |
127 | |||
128 |
2/2✓ Branch 0 taken 42193 times.
✓ Branch 1 taken 34401 times.
|
76594 | for (list = 0; list < sl->list_count; list++) { |
129 | 42193 | cur->ref_count[sidx][list] = sl->ref_count[list]; | |
130 |
2/2✓ Branch 0 taken 134619 times.
✓ Branch 1 taken 42193 times.
|
176812 | for (j = 0; j < sl->ref_count[list]; j++) |
131 | 134619 | cur->ref_poc[sidx][list][j] = 4 * sl->ref_list[list][j].parent->frame_num + | |
132 | 134619 | (sl->ref_list[list][j].reference & 3); | |
133 | } | ||
134 | |||
135 |
2/2✓ Branch 0 taken 25805 times.
✓ Branch 1 taken 8596 times.
|
34401 | if (h->picture_structure == PICT_FRAME) { |
136 | 25805 | memcpy(cur->ref_count[1], cur->ref_count[0], sizeof(cur->ref_count[0])); | |
137 | 25805 | memcpy(cur->ref_poc[1], cur->ref_poc[0], sizeof(cur->ref_poc[0])); | |
138 | } | ||
139 | |||
140 |
2/2✓ Branch 0 taken 26296 times.
✓ Branch 1 taken 8105 times.
|
34401 | if (h->current_slice == 0) { |
141 | 26296 | cur->mbaff = FRAME_MBAFF(h); | |
142 | } else { | ||
143 |
1/2✗ Branch 0 not taken.
✓ Branch 1 taken 8105 times.
|
8105 | av_assert0(cur->mbaff == FRAME_MBAFF(h)); |
144 | } | ||
145 | |||
146 | 34401 | sl->col_fieldoff = 0; | |
147 | |||
148 |
3/4✓ Branch 0 taken 12032 times.
✓ Branch 1 taken 22369 times.
✗ Branch 2 not taken.
✓ Branch 3 taken 12032 times.
|
34401 | if (sl->list_count != 2 || !sl->ref_count[1]) |
149 | 22369 | return; | |
150 | |||
151 |
2/2✓ Branch 0 taken 7453 times.
✓ Branch 1 taken 4579 times.
|
12032 | if (h->picture_structure == PICT_FRAME) { |
152 | 7453 | int cur_poc = h->cur_pic_ptr->poc; | |
153 | 7453 | int *col_poc = sl->ref_list[1][0].parent->field_poc; | |
154 |
3/4✓ Branch 0 taken 4 times.
✓ Branch 1 taken 7449 times.
✓ Branch 2 taken 4 times.
✗ Branch 3 not taken.
|
7453 | if (col_poc[0] == INT_MAX && col_poc[1] == INT_MAX) { |
155 | 4 | av_log(h->avctx, AV_LOG_ERROR, "co located POCs unavailable\n"); | |
156 | 4 | sl->col_parity = 1; | |
157 | } else | ||
158 | 7449 | sl->col_parity = (FFABS(col_poc[0] - (int64_t)cur_poc) >= | |
159 | 7449 | FFABS(col_poc[1] - (int64_t)cur_poc)); | |
160 | 7453 | ref1sidx = | |
161 | 7453 | sidx = sl->col_parity; | |
162 | // FL -> FL & differ parity | ||
163 |
2/2✓ Branch 0 taken 1866 times.
✓ Branch 1 taken 2713 times.
|
4579 | } else if (!(h->picture_structure & sl->ref_list[1][0].reference) && |
164 |
2/2✓ Branch 0 taken 1728 times.
✓ Branch 1 taken 138 times.
|
1866 | !sl->ref_list[1][0].parent->mbaff) { |
165 | 1728 | sl->col_fieldoff = 2 * sl->ref_list[1][0].reference - 3; | |
166 | } | ||
167 | |||
168 |
3/4✓ Branch 0 taken 12032 times.
✗ Branch 1 not taken.
✓ Branch 2 taken 4329 times.
✓ Branch 3 taken 7703 times.
|
12032 | if (sl->slice_type_nos != AV_PICTURE_TYPE_B || sl->direct_spatial_mv_pred) |
169 | 4329 | return; | |
170 | |||
171 |
2/2✓ Branch 0 taken 15406 times.
✓ Branch 1 taken 7703 times.
|
23109 | for (list = 0; list < 2; list++) { |
172 | 15406 | fill_colmap(h, sl, sl->map_col_to_list0, list, sidx, ref1sidx, 0); | |
173 |
2/2✓ Branch 0 taken 1026 times.
✓ Branch 1 taken 14380 times.
|
15406 | if (FRAME_MBAFF(h)) |
174 |
2/2✓ Branch 0 taken 2052 times.
✓ Branch 1 taken 1026 times.
|
3078 | for (field = 0; field < 2; field++) |
175 | 2052 | fill_colmap(h, sl, sl->map_col_to_list0_field[field], list, field, | |
176 | field, 1); | ||
177 | } | ||
178 | } | ||
179 | |||
180 | 4096924 | static void await_reference_mb_row(const H264Context *const h, H264Ref *ref, | |
181 | int mb_y) | ||
182 | { | ||
183 | 4096924 | int ref_field = ref->reference - 1; | |
184 | 4096924 | int ref_field_picture = ref->parent->field_picture; | |
185 | 4096924 | int ref_height = 16 * h->mb_height >> ref_field_picture; | |
186 | |||
187 |
2/2✓ Branch 0 taken 4080106 times.
✓ Branch 1 taken 16818 times.
|
4096924 | if (!HAVE_THREADS || !(h->avctx->active_thread_type & FF_THREAD_FRAME)) |
188 | 4080106 | return; | |
189 | |||
190 | /* FIXME: It can be safe to access mb stuff | ||
191 | * even if pixels aren't deblocked yet. */ | ||
192 | |||
193 |
1/4✗ Branch 0 not taken.
✓ Branch 1 taken 16818 times.
✗ Branch 2 not taken.
✗ Branch 3 not taken.
|
33636 | ff_thread_await_progress(&ref->parent->tf, |
194 |
1/2✗ Branch 0 not taken.
✓ Branch 1 taken 16818 times.
|
16818 | FFMIN(16 * mb_y >> ref_field_picture, |
195 | ref_height - 1), | ||
196 | ref_field_picture && ref_field); | ||
197 | } | ||
198 | |||
/**
 * Derive reference indices and motion vectors for a spatial-direct
 * macroblock and store them in sl->ref_cache / sl->mv_cache.
 *
 * The reference index per list is the minimum of the left, top and
 * top-right (or top-left as fallback) neighbours; the motion vector is
 * predicted from the same neighbours. The co-located macroblock of the first
 * list-1 reference is then inspected to decide the partitioning and whether
 * individual blocks get a zero vector instead ("col_zero_flag").
 *
 * @param h       decoder context
 * @param sl      slice context; caches and sub_mb_type[] are updated
 * @param mb_type in/out macroblock type; partition and direct flags are
 *                updated in place
 */
static void pred_spatial_direct_motion(const H264Context *const h, H264SliceContext *sl,
                                       int *mb_type)
{
    int b8_stride = 2;
    int b4_stride = h->b_stride;
    int mb_xy = sl->mb_xy, mb_y = sl->mb_y;
    int mb_type_col[2];
    const int16_t (*l1mv0)[2], (*l1mv1)[2];
    const int8_t *l1ref0, *l1ref1;
    const int is_b8x8 = IS_8X8(*mb_type);
    unsigned int sub_mb_type = MB_TYPE_L0L1;
    int i8, i4;
    int ref[2];
    int mv[2];
    int list;

    assert(sl->ref_list[1][0].reference & 3);

    /* First wait: the row of the co-located MB at the unadjusted position
     * (one row further when the current MB is interlaced). */
    await_reference_mb_row(h, &sl->ref_list[1][0],
                           sl->mb_y + !!IS_INTERLACED(*mb_type));

#define MB_TYPE_16x16_OR_INTRA (MB_TYPE_16x16 | MB_TYPE_INTRA4x4 | \
                                MB_TYPE_INTRA16x16 | MB_TYPE_INTRA_PCM)

    /* ref = min(neighbors) */
    for (list = 0; list < 2; list++) {
        int left_ref     = sl->ref_cache[list][scan8[0] - 1];
        int top_ref      = sl->ref_cache[list][scan8[0] - 8];
        int refc         = sl->ref_cache[list][scan8[0] - 8 + 4];
        const int16_t *C = sl->mv_cache[list][scan8[0] - 8 + 4];
        /* Fall back to the top-left neighbour when top-right is missing. */
        if (refc == PART_NOT_AVAILABLE) {
            refc = sl->ref_cache[list][scan8[0] - 8 - 1];
            C    = sl->mv_cache[list][scan8[0] - 8 - 1];
        }
        /* The unsigned casts make negative indices compare as very large
         * values, so the minimum is the smallest non-negative index if any
         * exists; the result is negative only if all three are negative. */
        ref[list] = FFMIN3((unsigned)left_ref,
                           (unsigned)top_ref,
                           (unsigned)refc);
        if (ref[list] >= 0) {
            /* This is just pred_motion() but with the cases removed that
             * cannot happen for direct blocks. */
            const int16_t *const A = sl->mv_cache[list][scan8[0] - 1];
            const int16_t *const B = sl->mv_cache[list][scan8[0] - 8];

            int match_count = (left_ref == ref[list]) +
                              (top_ref  == ref[list]) +
                              (refc     == ref[list]);

            if (match_count > 1) { // most common
                mv[list] = pack16to32(mid_pred(A[0], B[0], C[0]),
                                      mid_pred(A[1], B[1], C[1]));
            } else {
                /* Exactly one neighbour uses the chosen reference: copy
                 * its vector unchanged. */
                assert(match_count == 1);
                if (left_ref == ref[list])
                    mv[list] = AV_RN32A(A);
                else if (top_ref == ref[list])
                    mv[list] = AV_RN32A(B);
                else
                    mv[list] = AV_RN32A(C);
            }
            av_assert2(ref[list] < (sl->ref_count[list] << !!FRAME_MBAFF(h)));
        } else {
            /* No usable neighbour for this list: mark the list unused in the
             * MB / sub-MB type. */
            int mask = ~(MB_TYPE_L0 << (2 * list));
            mv[list]  = 0;
            ref[list] = -1;
            if (!is_b8x8)
                *mb_type &= mask;
            sub_mb_type &= mask;
        }
    }
    /* Neither list had a usable neighbour: use reference 0 of both lists
     * (the vectors were already set to 0 above). */
    if (ref[0] < 0 && ref[1] < 0) {
        ref[0] = ref[1] = 0;
        if (!is_b8x8)
            *mb_type |= MB_TYPE_L0L1;
        sub_mb_type |= MB_TYPE_L0L1;
    }

    /* Fast path: not an 8x8 MB and both predicted vectors are zero, so the
     * co-located data cannot change anything; emit a 16x16 direct MB. */
    if (!(is_b8x8 | mv[0] | mv[1])) {
        fill_rectangle(&sl->ref_cache[0][scan8[0]], 4, 4, 8, (uint8_t)ref[0], 1);
        fill_rectangle(&sl->ref_cache[1][scan8[0]], 4, 4, 8, (uint8_t)ref[1], 1);
        fill_rectangle(&sl->mv_cache[0][scan8[0]], 4, 4, 8, 0, 4);
        fill_rectangle(&sl->mv_cache[1][scan8[0]], 4, 4, 8, 0, 4);
        *mb_type = (*mb_type & ~(MB_TYPE_8x8 | MB_TYPE_16x8 | MB_TYPE_8x16 |
                                 MB_TYPE_P1L0 | MB_TYPE_P1L1)) |
                   MB_TYPE_16x16 | MB_TYPE_DIRECT2;
        return;
    }

    /* Locate the co-located macroblock(s); mb_xy / mb_y are adjusted when the
     * interlacing of the current and the co-located MB differ. */
    if (IS_INTERLACED(sl->ref_list[1][0].parent->mb_type[mb_xy])) { // AFL/AFR/FR/FL -> AFL/FL
        if (!IS_INTERLACED(*mb_type)) {                    //     AFR/FR    -> AFL/FL
            mb_y  = (sl->mb_y & ~1) + sl->col_parity;
            mb_xy = sl->mb_x +
                    ((sl->mb_y & ~1) + sl->col_parity) * h->mb_stride;
            /* b8_stride == 0 doubles as a marker for this case below. */
            b8_stride = 0;
        } else {
            mb_y  += sl->col_fieldoff;
            mb_xy += h->mb_stride * sl->col_fieldoff; // non-zero for FL -> FL & differ parity
        }
        goto single_col;
    } else {                                             // AFL/AFR/FR/FL -> AFR/FR
        if (IS_INTERLACED(*mb_type)) {                   // AFL       /FL -> AFR/FR
            /* The co-located data comes from the two MBs of the pair
             * starting at the even row. */
            mb_y  =  sl->mb_y & ~1;
            mb_xy = (sl->mb_y & ~1) * h->mb_stride + sl->mb_x;
            mb_type_col[0] = sl->ref_list[1][0].parent->mb_type[mb_xy];
            mb_type_col[1] = sl->ref_list[1][0].parent->mb_type[mb_xy + h->mb_stride];
            b8_stride      = 2 + 4 * h->mb_stride;
            b4_stride     *= 6;
            if (IS_INTERLACED(mb_type_col[0]) !=
                IS_INTERLACED(mb_type_col[1])) {
                mb_type_col[0] &= ~MB_TYPE_INTERLACED;
                mb_type_col[1] &= ~MB_TYPE_INTERLACED;
            }

            sub_mb_type |= MB_TYPE_16x16 | MB_TYPE_DIRECT2; /* B_SUB_8x8 */
            if ((mb_type_col[0] & MB_TYPE_16x16_OR_INTRA) &&
                (mb_type_col[1] & MB_TYPE_16x16_OR_INTRA) &&
                !is_b8x8) {
                *mb_type |= MB_TYPE_16x8 | MB_TYPE_DIRECT2;  /* B_16x8 */
            } else {
                *mb_type |= MB_TYPE_8x8;
            }
        } else {                                         //     AFR/FR    -> AFR/FR
single_col:
            /* A single co-located MB serves both halves. */
            mb_type_col[0] =
            mb_type_col[1] = sl->ref_list[1][0].parent->mb_type[mb_xy];

            sub_mb_type |= MB_TYPE_16x16 | MB_TYPE_DIRECT2; /* B_SUB_8x8 */
            if (!is_b8x8 && (mb_type_col[0] & MB_TYPE_16x16_OR_INTRA)) {
                *mb_type |= MB_TYPE_16x16 | MB_TYPE_DIRECT2; /* B_16x16 */
            } else if (!is_b8x8 &&
                       (mb_type_col[0] & (MB_TYPE_16x8 | MB_TYPE_8x16))) {
                /* Inherit the 16x8 / 8x16 split of the co-located MB. */
                *mb_type |= MB_TYPE_DIRECT2 |
                            (mb_type_col[0] & (MB_TYPE_16x8 | MB_TYPE_8x16));
            } else {
                if (!h->ps.sps->direct_8x8_inference_flag) {
                    /* FIXME: Save sub mb types from previous frames (or derive
                     * from MVs) so we know exactly what block size to use. */
                    sub_mb_type += (MB_TYPE_8x8 - MB_TYPE_16x16); /* B_SUB_4x4 */
                }
                *mb_type |= MB_TYPE_8x8;
            }
        }
    }

    /* Second wait: mb_y may have changed above. */
    await_reference_mb_row(h, &sl->ref_list[1][0], mb_y);

    /* Motion vectors and reference indices of the co-located MB. */
    l1mv0  = (void*)&sl->ref_list[1][0].parent->motion_val[0][h->mb2b_xy[mb_xy]];
    l1mv1  = (void*)&sl->ref_list[1][0].parent->motion_val[1][h->mb2b_xy[mb_xy]];
    l1ref0 = &sl->ref_list[1][0].parent->ref_index[0][4 * mb_xy];
    l1ref1 = &sl->ref_list[1][0].parent->ref_index[1][4 * mb_xy];
    if (!b8_stride) {
        /* Frame MB over a field co-located MB: an odd current row reads the
         * lower half of the co-located MB. */
        if (sl->mb_y & 1) {
            l1ref0 += 2;
            l1ref1 += 2;
            l1mv0  += 2 * b4_stride;
            l1mv1  += 2 * b4_stride;
        }
    }

    if (IS_INTERLACED(*mb_type) != IS_INTERLACED(mb_type_col[0])) {
        /* n counts the 8x8 blocks for which the co-located block triggered
         * the zero-vector rule. */
        int n = 0;
        for (i8 = 0; i8 < 4; i8++) {
            int x8  = i8 & 1;
            int y8  = i8 >> 1;
            int xy8 = x8     + y8 * b8_stride;
            int xy4 = x8 * 3 + y8 * b4_stride;
            int a, b;

            /* In an 8x8 MB only the sub-blocks coded as direct are filled. */
            if (is_b8x8 && !IS_DIRECT(sl->sub_mb_type[i8]))
                continue;
            sl->sub_mb_type[i8] = sub_mb_type;

            fill_rectangle(&sl->ref_cache[0][scan8[i8 * 4]], 2, 2, 8,
                           (uint8_t)ref[0], 1);
            fill_rectangle(&sl->ref_cache[1][scan8[i8 * 4]], 2, 2, 8,
                           (uint8_t)ref[1], 1);
            if (!IS_INTRA(mb_type_col[y8]) && !sl->ref_list[1][0].parent->long_ref &&
                ((l1ref0[xy8] == 0 &&
                  FFABS(l1mv0[xy4][0]) <= 1 &&
                  FFABS(l1mv0[xy4][1]) <= 1) ||
                 (l1ref0[xy8] < 0 &&
                  l1ref1[xy8] == 0 &&
                  FFABS(l1mv1[xy4][0]) <= 1 &&
                  FFABS(l1mv1[xy4][1]) <= 1))) {
                /* Zero the vector of each list whose chosen reference is 0;
                 * lists with ref > 0 keep the predicted vector. */
                a =
                b = 0;
                if (ref[0] > 0)
                    a = mv[0];
                if (ref[1] > 0)
                    b = mv[1];
                n++;
            } else {
                a = mv[0];
                b = mv[1];
            }
            fill_rectangle(&sl->mv_cache[0][scan8[i8 * 4]], 2, 2, 8, a, 4);
            fill_rectangle(&sl->mv_cache[1][scan8[i8 * 4]], 2, 2, 8, b, 4);
        }
        /* n is 0 or 4 here, i.e. all four blocks were treated alike:
         * collapse the MB to 16x16 direct. */
        if (!is_b8x8 && !(n & 3))
            *mb_type = (*mb_type & ~(MB_TYPE_8x8 | MB_TYPE_16x8 | MB_TYPE_8x16 |
                                     MB_TYPE_P1L0 | MB_TYPE_P1L1)) |
                       MB_TYPE_16x16 | MB_TYPE_DIRECT2;
    } else if (IS_16X16(*mb_type)) {
        int a, b;

        fill_rectangle(&sl->ref_cache[0][scan8[0]], 4, 4, 8, (uint8_t)ref[0], 1);
        fill_rectangle(&sl->ref_cache[1][scan8[0]], 4, 4, 8, (uint8_t)ref[1], 1);
        /* Same zero-vector rule as above, evaluated once for the whole MB.
         * The list-1 alternative is additionally gated on x264_build. */
        if (!IS_INTRA(mb_type_col[0]) && !sl->ref_list[1][0].parent->long_ref &&
            ((l1ref0[0] == 0 &&
              FFABS(l1mv0[0][0]) <= 1 &&
              FFABS(l1mv0[0][1]) <= 1) ||
             (l1ref0[0] < 0 && !l1ref1[0] &&
              FFABS(l1mv1[0][0]) <= 1 &&
              FFABS(l1mv1[0][1]) <= 1 &&
              h->x264_build > 33U))) {
            a = b = 0;
            if (ref[0] > 0)
                a = mv[0];
            if (ref[1] > 0)
                b = mv[1];
        } else {
            a = mv[0];
            b = mv[1];
        }
        fill_rectangle(&sl->mv_cache[0][scan8[0]], 4, 4, 8, a, 4);
        fill_rectangle(&sl->mv_cache[1][scan8[0]], 4, 4, 8, b, 4);
    } else {
        /* n accumulates 4 per zeroed 8x8 block or 1 per zeroed 4x4 block. */
        int n = 0;
        for (i8 = 0; i8 < 4; i8++) {
            const int x8 = i8 & 1;
            const int y8 = i8 >> 1;

            if (is_b8x8 && !IS_DIRECT(sl->sub_mb_type[i8]))
                continue;
            sl->sub_mb_type[i8] = sub_mb_type;

            /* Start from the predicted vectors; individual blocks may be
             * zeroed below. */
            fill_rectangle(&sl->mv_cache[0][scan8[i8 * 4]], 2, 2, 8, mv[0], 4);
            fill_rectangle(&sl->mv_cache[1][scan8[i8 * 4]], 2, 2, 8, mv[1], 4);
            fill_rectangle(&sl->ref_cache[0][scan8[i8 * 4]], 2, 2, 8,
                           (uint8_t)ref[0], 1);
            fill_rectangle(&sl->ref_cache[1][scan8[i8 * 4]], 2, 2, 8,
                           (uint8_t)ref[1], 1);

            assert(b8_stride == 2);
            /* col_zero_flag */
            if (!IS_INTRA(mb_type_col[0]) && !sl->ref_list[1][0].parent->long_ref &&
                (l1ref0[i8] == 0 ||
                 (l1ref0[i8] < 0 &&
                  l1ref1[i8] == 0 &&
                  h->x264_build > 33U))) {
                /* Use the co-located list-0 vectors when its list-0 ref is 0,
                 * otherwise its list-1 vectors. */
                const int16_t (*l1mv)[2] = l1ref0[i8] == 0 ? l1mv0 : l1mv1;
                if (IS_SUB_8X8(sub_mb_type)) {
                    const int16_t *mv_col = l1mv[x8 * 3 + y8 * 3 * b4_stride];
                    if (FFABS(mv_col[0]) <= 1 && FFABS(mv_col[1]) <= 1) {
                        if (ref[0] == 0)
                            fill_rectangle(&sl->mv_cache[0][scan8[i8 * 4]], 2, 2,
                                           8, 0, 4);
                        if (ref[1] == 0)
                            fill_rectangle(&sl->mv_cache[1][scan8[i8 * 4]], 2, 2,
                                           8, 0, 4);
                        n += 4;
                    }
                } else {
                    /* m counts the zeroed 4x4 blocks of this 8x8 block. */
                    int m = 0;
                    for (i4 = 0; i4 < 4; i4++) {
                        const int16_t *mv_col = l1mv[x8 * 2 + (i4 & 1) +
                                                     (y8 * 2 + (i4 >> 1)) * b4_stride];
                        if (FFABS(mv_col[0]) <= 1 && FFABS(mv_col[1]) <= 1) {
                            if (ref[0] == 0)
                                AV_ZERO32(sl->mv_cache[0][scan8[i8 * 4 + i4]]);
                            if (ref[1] == 0)
                                AV_ZERO32(sl->mv_cache[1][scan8[i8 * 4 + i4]]);
                            m++;
                        }
                    }
                    /* m is 0 or 4: all 4x4 blocks alike, so undo the
                     * B_SUB_4x4 adjustment and treat the block as 8x8. */
                    if (!(m & 3))
                        sl->sub_mb_type[i8] += MB_TYPE_16x16 - MB_TYPE_8x8;
                    n += m;
                }
            }
        }
        /* n is 0 or 16: every block was treated alike, collapse to 16x16. */
        if (!is_b8x8 && !(n & 15))
            *mb_type = (*mb_type & ~(MB_TYPE_8x8 | MB_TYPE_16x8 | MB_TYPE_8x16 |
                                     MB_TYPE_P1L0 | MB_TYPE_P1L1)) |
                       MB_TYPE_16x16 | MB_TYPE_DIRECT2;
    }
}
485 | |||
486 | 251816 | static void pred_temp_direct_motion(const H264Context *const h, H264SliceContext *sl, | |
487 | int *mb_type) | ||
488 | { | ||
489 | 251816 | int b8_stride = 2; | |
490 | 251816 | int b4_stride = h->b_stride; | |
491 | 251816 | int mb_xy = sl->mb_xy, mb_y = sl->mb_y; | |
492 | int mb_type_col[2]; | ||
493 | const int16_t (*l1mv0)[2], (*l1mv1)[2]; | ||
494 | const int8_t *l1ref0, *l1ref1; | ||
495 | 251816 | const int is_b8x8 = IS_8X8(*mb_type); | |
496 | unsigned int sub_mb_type; | ||
497 | int i8, i4; | ||
498 | |||
499 | assert(sl->ref_list[1][0].reference & 3); | ||
500 | |||
501 | 251816 | await_reference_mb_row(h, &sl->ref_list[1][0], | |
502 | 251816 | sl->mb_y + !!IS_INTERLACED(*mb_type)); | |
503 | |||
504 |
2/2✓ Branch 0 taken 88777 times.
✓ Branch 1 taken 163039 times.
|
251816 | if (IS_INTERLACED(sl->ref_list[1][0].parent->mb_type[mb_xy])) { // AFL/AFR/FR/FL -> AFL/FL |
505 |
2/2✓ Branch 0 taken 15611 times.
✓ Branch 1 taken 73166 times.
|
88777 | if (!IS_INTERLACED(*mb_type)) { // AFR/FR -> AFL/FL |
506 | 15611 | mb_y = (sl->mb_y & ~1) + sl->col_parity; | |
507 | 15611 | mb_xy = sl->mb_x + | |
508 | 15611 | ((sl->mb_y & ~1) + sl->col_parity) * h->mb_stride; | |
509 | 15611 | b8_stride = 0; | |
510 | } else { | ||
511 | 73166 | mb_y += sl->col_fieldoff; | |
512 | 73166 | mb_xy += h->mb_stride * sl->col_fieldoff; // non-zero for FL -> FL & differ parity | |
513 | } | ||
514 | 88777 | goto single_col; | |
515 | } else { // AFL/AFR/FR/FL -> AFR/FR | ||
516 |
2/2✓ Branch 0 taken 16549 times.
✓ Branch 1 taken 146490 times.
|
163039 | if (IS_INTERLACED(*mb_type)) { // AFL /FL -> AFR/FR |
517 | 16549 | mb_y = sl->mb_y & ~1; | |
518 | 16549 | mb_xy = sl->mb_x + (sl->mb_y & ~1) * h->mb_stride; | |
519 | 16549 | mb_type_col[0] = sl->ref_list[1][0].parent->mb_type[mb_xy]; | |
520 | 16549 | mb_type_col[1] = sl->ref_list[1][0].parent->mb_type[mb_xy + h->mb_stride]; | |
521 | 16549 | b8_stride = 2 + 4 * h->mb_stride; | |
522 | 16549 | b4_stride *= 6; | |
523 | 16549 | if (IS_INTERLACED(mb_type_col[0]) != | |
524 |
1/2✗ Branch 0 not taken.
✓ Branch 1 taken 16549 times.
|
16549 | IS_INTERLACED(mb_type_col[1])) { |
525 | ✗ | mb_type_col[0] &= ~MB_TYPE_INTERLACED; | |
526 | ✗ | mb_type_col[1] &= ~MB_TYPE_INTERLACED; | |
527 | } | ||
528 | |||
529 | 16549 | sub_mb_type = MB_TYPE_16x16 | MB_TYPE_P0L0 | MB_TYPE_P0L1 | | |
530 | MB_TYPE_DIRECT2; /* B_SUB_8x8 */ | ||
531 | |||
532 |
2/2✓ Branch 0 taken 9887 times.
✓ Branch 1 taken 6662 times.
|
16549 | if ((mb_type_col[0] & MB_TYPE_16x16_OR_INTRA) && |
533 |
4/4✓ Branch 0 taken 7209 times.
✓ Branch 1 taken 2678 times.
✓ Branch 2 taken 5873 times.
✓ Branch 3 taken 1336 times.
|
9887 | (mb_type_col[1] & MB_TYPE_16x16_OR_INTRA) && |
534 | !is_b8x8) { | ||
535 | 5873 | *mb_type |= MB_TYPE_16x8 | MB_TYPE_L0L1 | | |
536 | MB_TYPE_DIRECT2; /* B_16x8 */ | ||
537 | } else { | ||
538 | 10676 | *mb_type |= MB_TYPE_8x8 | MB_TYPE_L0L1; | |
539 | } | ||
540 | } else { // AFR/FR -> AFR/FR | ||
541 | 146490 | single_col: | |
542 | 235267 | mb_type_col[0] = | |
543 | 235267 | mb_type_col[1] = sl->ref_list[1][0].parent->mb_type[mb_xy]; | |
544 | |||
545 | 235267 | sub_mb_type = MB_TYPE_16x16 | MB_TYPE_P0L0 | MB_TYPE_P0L1 | | |
546 | MB_TYPE_DIRECT2; /* B_SUB_8x8 */ | ||
547 |
4/4✓ Branch 0 taken 189694 times.
✓ Branch 1 taken 45573 times.
✓ Branch 2 taken 134937 times.
✓ Branch 3 taken 54757 times.
|
235267 | if (!is_b8x8 && (mb_type_col[0] & MB_TYPE_16x16_OR_INTRA)) { |
548 | 134937 | *mb_type |= MB_TYPE_16x16 | MB_TYPE_P0L0 | MB_TYPE_P0L1 | | |
549 | MB_TYPE_DIRECT2; /* B_16x16 */ | ||
550 |
2/2✓ Branch 0 taken 54757 times.
✓ Branch 1 taken 45573 times.
|
100330 | } else if (!is_b8x8 && |
551 |
2/2✓ Branch 0 taken 34983 times.
✓ Branch 1 taken 19774 times.
|
54757 | (mb_type_col[0] & (MB_TYPE_16x8 | MB_TYPE_8x16))) { |
552 | 34983 | *mb_type |= MB_TYPE_L0L1 | MB_TYPE_DIRECT2 | | |
553 | 34983 | (mb_type_col[0] & (MB_TYPE_16x8 | MB_TYPE_8x16)); | |
554 | } else { | ||
555 |
2/2✓ Branch 0 taken 10593 times.
✓ Branch 1 taken 54754 times.
|
65347 | if (!h->ps.sps->direct_8x8_inference_flag) { |
556 | /* FIXME: save sub mb types from previous frames (or derive | ||
557 | * from MVs) so we know exactly what block size to use */ | ||
558 | 10593 | sub_mb_type = MB_TYPE_8x8 | MB_TYPE_P0L0 | MB_TYPE_P0L1 | | |
559 | MB_TYPE_DIRECT2; /* B_SUB_4x4 */ | ||
560 | } | ||
561 | 65347 | *mb_type |= MB_TYPE_8x8 | MB_TYPE_L0L1; | |
562 | } | ||
563 | } | ||
564 | } | ||
565 | |||
566 | 251816 | await_reference_mb_row(h, &sl->ref_list[1][0], mb_y); | |
567 | |||
568 | 251816 | l1mv0 = (void*)&sl->ref_list[1][0].parent->motion_val[0][h->mb2b_xy[mb_xy]]; | |
569 | 251816 | l1mv1 = (void*)&sl->ref_list[1][0].parent->motion_val[1][h->mb2b_xy[mb_xy]]; | |
570 | 251816 | l1ref0 = &sl->ref_list[1][0].parent->ref_index[0][4 * mb_xy]; | |
571 | 251816 | l1ref1 = &sl->ref_list[1][0].parent->ref_index[1][4 * mb_xy]; | |
572 |
2/2✓ Branch 0 taken 15611 times.
✓ Branch 1 taken 236205 times.
|
251816 | if (!b8_stride) { |
573 |
2/2✓ Branch 0 taken 7720 times.
✓ Branch 1 taken 7891 times.
|
15611 | if (sl->mb_y & 1) { |
574 | 7720 | l1ref0 += 2; | |
575 | 7720 | l1ref1 += 2; | |
576 | 7720 | l1mv0 += 2 * b4_stride; | |
577 | 7720 | l1mv1 += 2 * b4_stride; | |
578 | } | ||
579 | } | ||
580 | |||
581 | { | ||
582 | 251816 | const int *map_col_to_list0[2] = { sl->map_col_to_list0[0], | |
583 | 251816 | sl->map_col_to_list0[1] }; | |
584 | 251816 | const int *dist_scale_factor = sl->dist_scale_factor; | |
585 | int ref_offset; | ||
586 | |||
587 |
4/4✓ Branch 0 taken 42213 times.
✓ Branch 1 taken 209603 times.
✓ Branch 2 taken 20032 times.
✓ Branch 3 taken 22181 times.
|
251816 | if (FRAME_MBAFF(h) && IS_INTERLACED(*mb_type)) { |
588 | 20032 | map_col_to_list0[0] = sl->map_col_to_list0_field[sl->mb_y & 1][0]; | |
589 | 20032 | map_col_to_list0[1] = sl->map_col_to_list0_field[sl->mb_y & 1][1]; | |
590 | 20032 | dist_scale_factor = sl->dist_scale_factor_field[sl->mb_y & 1]; | |
591 | } | ||
592 | 251816 | ref_offset = (sl->ref_list[1][0].parent->mbaff << 4) & (mb_type_col[0] >> 3); | |
593 | |||
594 |
2/2✓ Branch 0 taken 32160 times.
✓ Branch 1 taken 219656 times.
|
251816 | if (IS_INTERLACED(*mb_type) != IS_INTERLACED(mb_type_col[0])) { |
595 |
2/2✓ Branch 0 taken 15611 times.
✓ Branch 1 taken 16549 times.
|
32160 | int y_shift = 2 * !IS_INTERLACED(*mb_type); |
596 | assert(h->ps.sps->direct_8x8_inference_flag); | ||
597 | |||
598 |
2/2✓ Branch 0 taken 128640 times.
✓ Branch 1 taken 32160 times.
|
160800 | for (i8 = 0; i8 < 4; i8++) { |
599 | 128640 | const int x8 = i8 & 1; | |
600 | 128640 | const int y8 = i8 >> 1; | |
601 | int ref0, scale; | ||
602 | 128640 | const int16_t (*l1mv)[2] = l1mv0; | |
603 | |||
604 |
4/4✓ Branch 0 taken 43260 times.
✓ Branch 1 taken 85380 times.
✓ Branch 2 taken 22674 times.
✓ Branch 3 taken 20586 times.
|
128640 | if (is_b8x8 && !IS_DIRECT(sl->sub_mb_type[i8])) |
605 | 22674 | continue; | |
606 | 105966 | sl->sub_mb_type[i8] = sub_mb_type; | |
607 | |||
608 | 105966 | fill_rectangle(&sl->ref_cache[1][scan8[i8 * 4]], 2, 2, 8, 0, 1); | |
609 |
2/2✓ Branch 0 taken 25496 times.
✓ Branch 1 taken 80470 times.
|
105966 | if (IS_INTRA(mb_type_col[y8])) { |
610 | 25496 | fill_rectangle(&sl->ref_cache[0][scan8[i8 * 4]], 2, 2, 8, 0, 1); | |
611 | 25496 | fill_rectangle(&sl->mv_cache[0][scan8[i8 * 4]], 2, 2, 8, 0, 4); | |
612 | 25496 | fill_rectangle(&sl->mv_cache[1][scan8[i8 * 4]], 2, 2, 8, 0, 4); | |
613 | 25496 | continue; | |
614 | } | ||
615 | |||
616 | 80470 | ref0 = l1ref0[x8 + y8 * b8_stride]; | |
617 |
2/2✓ Branch 0 taken 80277 times.
✓ Branch 1 taken 193 times.
|
80470 | if (ref0 >= 0) |
618 | 80277 | ref0 = map_col_to_list0[0][ref0 + ref_offset]; | |
619 | else { | ||
620 | 193 | ref0 = map_col_to_list0[1][l1ref1[x8 + y8 * b8_stride] + | |
621 | ref_offset]; | ||
622 | 193 | l1mv = l1mv1; | |
623 | } | ||
624 | 80470 | scale = dist_scale_factor[ref0]; | |
625 | 80470 | fill_rectangle(&sl->ref_cache[0][scan8[i8 * 4]], 2, 2, 8, | |
626 | ref0, 1); | ||
627 | |||
628 | { | ||
629 | 80470 | const int16_t *mv_col = l1mv[x8 * 3 + y8 * b4_stride]; | |
630 | 80470 | int my_col = (mv_col[1] * (1 << y_shift)) / 2; | |
631 | 80470 | int mx = (scale * mv_col[0] + 128) >> 8; | |
632 | 80470 | int my = (scale * my_col + 128) >> 8; | |
633 | 80470 | fill_rectangle(&sl->mv_cache[0][scan8[i8 * 4]], 2, 2, 8, | |
634 | pack16to32(mx, my), 4); | ||
635 | 80470 | fill_rectangle(&sl->mv_cache[1][scan8[i8 * 4]], 2, 2, 8, | |
636 | 80470 | pack16to32(mx - mv_col[0], my - my_col), 4); | |
637 | } | ||
638 | } | ||
639 | 32160 | return; | |
640 | } | ||
641 | |||
642 | /* one-to-one mv scaling */ | ||
643 | |||
644 |
2/2✓ Branch 0 taken 127333 times.
✓ Branch 1 taken 92323 times.
|
219656 | if (IS_16X16(*mb_type)) { |
645 | int ref, mv0, mv1; | ||
646 | |||
647 | 127333 | fill_rectangle(&sl->ref_cache[1][scan8[0]], 4, 4, 8, 0, 1); | |
648 |
2/2✓ Branch 0 taken 60991 times.
✓ Branch 1 taken 66342 times.
|
127333 | if (IS_INTRA(mb_type_col[0])) { |
649 | 60991 | ref = mv0 = mv1 = 0; | |
650 | } else { | ||
651 | 198975 | const int ref0 = l1ref0[0] >= 0 ? map_col_to_list0[0][l1ref0[0] + ref_offset] | |
652 |
2/2✓ Branch 0 taken 66291 times.
✓ Branch 1 taken 51 times.
|
66342 | : map_col_to_list0[1][l1ref1[0] + ref_offset]; |
653 | 66342 | const int scale = dist_scale_factor[ref0]; | |
654 |
2/2✓ Branch 0 taken 66291 times.
✓ Branch 1 taken 51 times.
|
66342 | const int16_t *mv_col = l1ref0[0] >= 0 ? l1mv0[0] : l1mv1[0]; |
655 | int mv_l0[2]; | ||
656 | 66342 | mv_l0[0] = (scale * mv_col[0] + 128) >> 8; | |
657 | 66342 | mv_l0[1] = (scale * mv_col[1] + 128) >> 8; | |
658 | 66342 | ref = ref0; | |
659 | 66342 | mv0 = pack16to32(mv_l0[0], mv_l0[1]); | |
660 | 66342 | mv1 = pack16to32(mv_l0[0] - mv_col[0], mv_l0[1] - mv_col[1]); | |
661 | } | ||
662 | 127333 | fill_rectangle(&sl->ref_cache[0][scan8[0]], 4, 4, 8, ref, 1); | |
663 | 127333 | fill_rectangle(&sl->mv_cache[0][scan8[0]], 4, 4, 8, mv0, 4); | |
664 | 127333 | fill_rectangle(&sl->mv_cache[1][scan8[0]], 4, 4, 8, mv1, 4); | |
665 | } else { | ||
666 |
2/2✓ Branch 0 taken 369292 times.
✓ Branch 1 taken 92323 times.
|
461615 | for (i8 = 0; i8 < 4; i8++) { |
667 | 369292 | const int x8 = i8 & 1; | |
668 | 369292 | const int y8 = i8 >> 1; | |
669 | int ref0, scale; | ||
670 | 369292 | const int16_t (*l1mv)[2] = l1mv0; | |
671 | |||
672 |
4/4✓ Branch 0 taken 163900 times.
✓ Branch 1 taken 205392 times.
✓ Branch 2 taken 92460 times.
✓ Branch 3 taken 71440 times.
|
369292 | if (is_b8x8 && !IS_DIRECT(sl->sub_mb_type[i8])) |
673 | 92460 | continue; | |
674 | 276832 | sl->sub_mb_type[i8] = sub_mb_type; | |
675 | 276832 | fill_rectangle(&sl->ref_cache[1][scan8[i8 * 4]], 2, 2, 8, 0, 1); | |
676 |
2/2✓ Branch 0 taken 22293 times.
✓ Branch 1 taken 254539 times.
|
276832 | if (IS_INTRA(mb_type_col[0])) { |
677 | 22293 | fill_rectangle(&sl->ref_cache[0][scan8[i8 * 4]], 2, 2, 8, 0, 1); | |
678 | 22293 | fill_rectangle(&sl->mv_cache[0][scan8[i8 * 4]], 2, 2, 8, 0, 4); | |
679 | 22293 | fill_rectangle(&sl->mv_cache[1][scan8[i8 * 4]], 2, 2, 8, 0, 4); | |
680 | 22293 | continue; | |
681 | } | ||
682 | |||
683 | assert(b8_stride == 2); | ||
684 | 254539 | ref0 = l1ref0[i8]; | |
685 |
2/2✓ Branch 0 taken 254519 times.
✓ Branch 1 taken 20 times.
|
254539 | if (ref0 >= 0) |
686 | 254519 | ref0 = map_col_to_list0[0][ref0 + ref_offset]; | |
687 | else { | ||
688 | 20 | ref0 = map_col_to_list0[1][l1ref1[i8] + ref_offset]; | |
689 | 20 | l1mv = l1mv1; | |
690 | } | ||
691 | 254539 | scale = dist_scale_factor[ref0]; | |
692 | |||
693 | 254539 | fill_rectangle(&sl->ref_cache[0][scan8[i8 * 4]], 2, 2, 8, | |
694 | ref0, 1); | ||
695 |
2/2✓ Branch 0 taken 229231 times.
✓ Branch 1 taken 25308 times.
|
254539 | if (IS_SUB_8X8(sub_mb_type)) { |
696 | 229231 | const int16_t *mv_col = l1mv[x8 * 3 + y8 * 3 * b4_stride]; | |
697 | 229231 | int mx = (scale * mv_col[0] + 128) >> 8; | |
698 | 229231 | int my = (scale * mv_col[1] + 128) >> 8; | |
699 | 229231 | fill_rectangle(&sl->mv_cache[0][scan8[i8 * 4]], 2, 2, 8, | |
700 | pack16to32(mx, my), 4); | ||
701 | 229231 | fill_rectangle(&sl->mv_cache[1][scan8[i8 * 4]], 2, 2, 8, | |
702 | 229231 | pack16to32(mx - mv_col[0], my - mv_col[1]), 4); | |
703 | } else { | ||
704 |
2/2✓ Branch 0 taken 101232 times.
✓ Branch 1 taken 25308 times.
|
126540 | for (i4 = 0; i4 < 4; i4++) { |
705 | 101232 | const int16_t *mv_col = l1mv[x8 * 2 + (i4 & 1) + | |
706 | 101232 | (y8 * 2 + (i4 >> 1)) * b4_stride]; | |
707 | 101232 | int16_t *mv_l0 = sl->mv_cache[0][scan8[i8 * 4 + i4]]; | |
708 | 101232 | mv_l0[0] = (scale * mv_col[0] + 128) >> 8; | |
709 | 101232 | mv_l0[1] = (scale * mv_col[1] + 128) >> 8; | |
710 | 101232 | AV_WN32A(sl->mv_cache[1][scan8[i8 * 4 + i4]], | |
711 | pack16to32(mv_l0[0] - mv_col[0], | ||
712 | mv_l0[1] - mv_col[1])); | ||
713 | } | ||
714 | } | ||
715 | } | ||
716 | } | ||
717 | } | ||
718 | } | ||
719 | |||
/**
 * Predict direct-mode motion for the current macroblock by dispatching to
 * one of the two direct prediction routines of this file.
 *
 * @param h        decoder context, forwarded unchanged to the selected routine
 * @param sl       slice context; its direct_spatial_mv_pred field selects the
 *                 routine (non-zero: spatial, zero: temporal)
 * @param mb_type  pointer to the macroblock type, forwarded unchanged; the
 *                 temporal routine ORs partition/direct flags into *mb_type
 *                 and fills sl->ref_cache, sl->mv_cache and sl->sub_mb_type
 *                 (the spatial routine is presumably analogous; its body is
 *                 not shown here, so confirm there)
 */
720 | 2859977 | void ff_h264_pred_direct_motion(const H264Context *const h, H264SliceContext *sl, | |
721 | int *mb_type) | ||
722 | { | ||
723 |
2/2✓ Branch 0 taken 2608161 times.
✓ Branch 1 taken 251816 times.
|
2859977 | if (sl->direct_spatial_mv_pred) /* non-zero selects spatial direct prediction */ |
724 | 2608161 | pred_spatial_direct_motion(h, sl, mb_type); | |
725 | else /* zero selects temporal direct prediction */ | ||
726 | 251816 | pred_temp_direct_motion(h, sl, mb_type); | |
727 | 2859977 | } | |
728 |