FFmpeg coverage


Directory: ../../../ffmpeg/
File: src/libavutil/tx.c
Date: 2026-04-24 19:58:39
Exec Total Coverage
Lines: 432 496 87.1%
Functions: 24 25 96.0%
Branches: 466 612 76.1%

Line Branch Exec Source
1 /*
2 * This file is part of FFmpeg.
3 *
4 * FFmpeg is free software; you can redistribute it and/or
5 * modify it under the terms of the GNU Lesser General Public
6 * License as published by the Free Software Foundation; either
7 * version 2.1 of the License, or (at your option) any later version.
8 *
9 * FFmpeg is distributed in the hope that it will be useful,
10 * but WITHOUT ANY WARRANTY; without even the implied warranty of
11 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
12 * Lesser General Public License for more details.
13 *
14 * You should have received a copy of the GNU Lesser General Public
15 * License along with FFmpeg; if not, write to the Free Software
16 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
17 */
18
19 #include "avassert.h"
20 #include "intmath.h"
21 #include "cpu.h"
22 #include "mem.h"
23 #include "qsort.h"
24 #include "bprint.h"
25
26 #include "tx_priv.h"
27
28 #define TYPE_IS(type, x) \
29 (((x) == AV_TX_FLOAT_ ## type) || \
30 ((x) == AV_TX_DOUBLE_ ## type) || \
31 ((x) == AV_TX_INT32_ ## type))
32
33 /* Calculates the modular multiplicative inverse */
34 4458 static av_always_inline int mulinv(int n, int m)
35 {
36 4458 n = n % m;
37
1/2
✓ Branch 0 taken 45406 times.
✗ Branch 1 not taken.
45406 for (int x = 1; x < m; x++)
38
2/2
✓ Branch 0 taken 4458 times.
✓ Branch 1 taken 40948 times.
45406 if (((n * x) % m) == 1)
39 4458 return x;
40 av_assert0(0); /* Never reached */
41 return 0;
42 }
43
44 81 int ff_tx_gen_pfa_input_map(AVTXContext *s, FFTXCodeletOptions *opts,
45 int d1, int d2)
46 {
47 81 const int sl = d1*d2;
48
49 81 s->map = av_malloc(s->len*sizeof(*s->map));
50
1/2
✗ Branch 0 not taken.
✓ Branch 1 taken 81 times.
81 if (!s->map)
51 return AVERROR(ENOMEM);
52
53
2/2
✓ Branch 0 taken 81 times.
✓ Branch 1 taken 81 times.
162 for (int k = 0; k < s->len; k += sl) {
54
3/6
✓ Branch 0 taken 81 times.
✗ Branch 1 not taken.
✓ Branch 2 taken 81 times.
✗ Branch 3 not taken.
✗ Branch 4 not taken.
✓ Branch 5 taken 81 times.
81 if (s->inv || (opts && opts->map_dir == FF_TX_MAP_SCATTER)) {
55 for (int m = 0; m < d2; m++)
56 for (int n = 0; n < d1; n++)
57 s->map[k + ((m*d1 + n*d2) % (sl))] = m*d1 + n;
58 } else {
59
2/2
✓ Branch 0 taken 405 times.
✓ Branch 1 taken 81 times.
486 for (int m = 0; m < d2; m++)
60
2/2
✓ Branch 0 taken 1215 times.
✓ Branch 1 taken 405 times.
1620 for (int n = 0; n < d1; n++)
61 1215 s->map[k + m*d1 + n] = (m*d1 + n*d2) % (sl);
62 }
63
64
1/2
✗ Branch 0 not taken.
✓ Branch 1 taken 81 times.
81 if (s->inv)
65 for (int w = 1; w <= ((sl) >> 1); w++)
66 FFSWAP(int, s->map[k + w], s->map[k + sl - w]);
67 }
68
69
1/2
✓ Branch 0 taken 81 times.
✗ Branch 1 not taken.
81 s->map_dir = opts ? opts->map_dir : FF_TX_MAP_GATHER;
70
71 81 return 0;
72 }
73
74 /* Guaranteed to work for any n, m where gcd(n, m) == 1 */
75 2229 int ff_tx_gen_compound_mapping(AVTXContext *s, FFTXCodeletOptions *opts,
76 int inv, int n, int m)
77 {
78 int *in_map, *out_map;
79 2229 const int len = n*m; /* Will not be equal to s->len for MDCTs */
80 int m_inv, n_inv;
81
82 /* Make sure the numbers are coprime */
83
1/2
✗ Branch 0 not taken.
✓ Branch 1 taken 2229 times.
2229 if (av_gcd(n, m) != 1)
84 return AVERROR(EINVAL);
85
86 2229 m_inv = mulinv(m, n);
87 2229 n_inv = mulinv(n, m);
88
89
1/2
✗ Branch 1 not taken.
✓ Branch 2 taken 2229 times.
2229 if (!(s->map = av_malloc(2*len*sizeof(*s->map))))
90 return AVERROR(ENOMEM);
91
92 2229 in_map = s->map;
93 2229 out_map = s->map + len;
94
95 /* Ruritanian map for input, CRT map for output, can be swapped */
96
3/4
✓ Branch 0 taken 417 times.
✓ Branch 1 taken 1812 times.
✗ Branch 2 not taken.
✓ Branch 3 taken 417 times.
2229 if (opts && opts->map_dir == FF_TX_MAP_SCATTER) {
97 for (int j = 0; j < m; j++) {
98 for (int i = 0; i < n; i++) {
99 in_map[(i*m + j*n) % len] = j*n + i;
100 out_map[(i*m*m_inv + j*n*n_inv) % len] = i*m + j;
101 }
102 }
103 } else {
104
2/2
✓ Branch 0 taken 75840 times.
✓ Branch 1 taken 2229 times.
78069 for (int j = 0; j < m; j++) {
105
2/2
✓ Branch 0 taken 602352 times.
✓ Branch 1 taken 75840 times.
678192 for (int i = 0; i < n; i++) {
106 602352 in_map[j*n + i] = (i*m + j*n) % len;
107 602352 out_map[(i*m*m_inv + j*n*n_inv) % len] = i*m + j;
108 }
109 }
110 }
111
112
2/2
✓ Branch 0 taken 2129 times.
✓ Branch 1 taken 100 times.
2229 if (inv) {
113
2/2
✓ Branch 0 taken 70128 times.
✓ Branch 1 taken 2129 times.
72257 for (int i = 0; i < m; i++) {
114 70128 int *in = &in_map[i*n + 1]; /* Skip the DC */
115
2/2
✓ Branch 0 taken 223600 times.
✓ Branch 1 taken 70128 times.
293728 for (int j = 0; j < ((n - 1) >> 1); j++)
116 223600 FFSWAP(int, in[j], in[n - j - 2]);
117 }
118 }
119
120
2/2
✓ Branch 0 taken 417 times.
✓ Branch 1 taken 1812 times.
2229 s->map_dir = opts ? opts->map_dir : FF_TX_MAP_GATHER;
121
122 2229 return 0;
123 }
124
125 11074950 static inline int split_radix_permutation(int i, int len, int inv)
126 {
127 11074950 len >>= 1;
128
2/2
✓ Branch 0 taken 1419474 times.
✓ Branch 1 taken 9655476 times.
11074950 if (len <= 1)
129 1419474 return i & 1;
130
2/2
✓ Branch 0 taken 4827738 times.
✓ Branch 1 taken 4827738 times.
9655476 if (!(i & len))
131 4827738 return split_radix_permutation(i, len, inv) * 2;
132 4827738 len >>= 1;
133 4827738 return split_radix_permutation(i, len, inv) * 4 + 1 - 2*(!(i & len) ^ inv);
134 }
135
136 4361 int ff_tx_gen_ptwo_revtab(AVTXContext *s, FFTXCodeletOptions *opts)
137 {
138 4361 int len = s->len;
139
140
1/2
✗ Branch 1 not taken.
✓ Branch 2 taken 4361 times.
4361 if (!(s->map = av_malloc(len*sizeof(*s->map))))
141 return AVERROR(ENOMEM);
142
143
3/4
✓ Branch 0 taken 4361 times.
✗ Branch 1 not taken.
✓ Branch 2 taken 1958 times.
✓ Branch 3 taken 2403 times.
4361 if (opts && opts->map_dir == FF_TX_MAP_SCATTER) {
144
2/2
✓ Branch 0 taken 201548 times.
✓ Branch 1 taken 1958 times.
203506 for (int i = 0; i < s->len; i++)
145 201548 s->map[-split_radix_permutation(i, len, s->inv) & (len - 1)] = i;
146 } else {
147
2/2
✓ Branch 0 taken 1021610 times.
✓ Branch 1 taken 2403 times.
1024013 for (int i = 0; i < s->len; i++)
148 1021610 s->map[i] = -split_radix_permutation(i, len, s->inv) & (len - 1);
149 }
150
151
1/2
✓ Branch 0 taken 4361 times.
✗ Branch 1 not taken.
4361 s->map_dir = opts ? opts->map_dir : FF_TX_MAP_GATHER;
152
153 4361 return 0;
154 }
155
156 int ff_tx_gen_inplace_map(AVTXContext *s, int len)
157 {
158 int *src_map, out_map_idx = 0;
159
160 if (!s->sub || !s->sub->map)
161 return AVERROR(EINVAL);
162
163 if (!(s->map = av_mallocz(len*sizeof(*s->map))))
164 return AVERROR(ENOMEM);
165
166 src_map = s->sub->map;
167
168 /* The first coefficient is always already in-place */
169 for (int src = 1; src < s->len; src++) {
170 int dst = src_map[src];
171 int found = 0;
172
173 if (dst <= src)
174 continue;
175
176 /* This just checks if a closed loop has been encountered before,
177 * and if so, skips it, since to fully permute a loop we must only
178 * enter it once. */
179 do {
180 for (int j = 0; j < out_map_idx; j++) {
181 if (dst == s->map[j]) {
182 found = 1;
183 break;
184 }
185 }
186 dst = src_map[dst];
187 } while (dst != src && !found);
188
189 if (!found)
190 s->map[out_map_idx++] = src;
191 }
192
193 s->map[out_map_idx++] = 0;
194
195 return 0;
196 }
197
198 48442 static void parity_revtab_generator(int *revtab, int n, int inv, int offset,
199 int is_dual, int dual_high, int len,
200 int basis, int dual_stride, int inv_lookup)
201 {
202 48442 len >>= 1;
203
204
2/2
✓ Branch 0 taken 32689 times.
✓ Branch 1 taken 15753 times.
48442 if (len <= basis) {
205 int k1, k2, stride, even_idx, odd_idx;
206
207
3/4
✓ Branch 0 taken 24370 times.
✓ Branch 1 taken 8319 times.
✓ Branch 2 taken 24370 times.
✗ Branch 3 not taken.
32689 is_dual = is_dual && dual_stride;
208 32689 dual_high = is_dual & dual_high;
209
2/2
✓ Branch 0 taken 24370 times.
✓ Branch 1 taken 8319 times.
32689 stride = is_dual ? FFMIN(dual_stride, len) : 0;
210
211 32689 even_idx = offset + dual_high*(stride - 2*len);
212
4/4
✓ Branch 0 taken 24370 times.
✓ Branch 1 taken 8319 times.
✓ Branch 2 taken 12185 times.
✓ Branch 3 taken 12185 times.
32689 odd_idx = even_idx + len + (is_dual && !dual_high)*len + dual_high*len;
213
214
2/2
✓ Branch 0 taken 98158 times.
✓ Branch 1 taken 32689 times.
130847 for (int i = 0; i < len; i++) {
215 98158 k1 = -split_radix_permutation(offset + i*2 + 0, n, inv) & (n - 1);
216 98158 k2 = -split_radix_permutation(offset + i*2 + 1, n, inv) & (n - 1);
217
2/2
✓ Branch 0 taken 76628 times.
✓ Branch 1 taken 21530 times.
98158 if (inv_lookup) {
218 76628 revtab[even_idx++] = k1;
219 76628 revtab[odd_idx++] = k2;
220 } else {
221 21530 revtab[k1] = even_idx++;
222 21530 revtab[k2] = odd_idx++;
223 }
224
4/4
✓ Branch 0 taken 65156 times.
✓ Branch 1 taken 33002 times.
✓ Branch 2 taken 32578 times.
✓ Branch 3 taken 32578 times.
98158 if (stride && !((i + 1) % stride)) {
225 32578 even_idx += stride;
226 32578 odd_idx += stride;
227 }
228 }
229
230 32689 return;
231 }
232
233 15753 parity_revtab_generator(revtab, n, inv, offset,
234 0, 0, len >> 0, basis, dual_stride, inv_lookup);
235 15753 parity_revtab_generator(revtab, n, inv, offset + (len >> 0),
236 1, 0, len >> 1, basis, dual_stride, inv_lookup);
237 15753 parity_revtab_generator(revtab, n, inv, offset + (len >> 0) + (len >> 1),
238 1, 1, len >> 1, basis, dual_stride, inv_lookup);
239 }
240
241 1183 int ff_tx_gen_split_radix_parity_revtab(AVTXContext *s, int len, int inv,
242 FFTXCodeletOptions *opts,
243 int basis, int dual_stride)
244 {
245 1183 basis >>= 1;
246
1/2
✗ Branch 0 not taken.
✓ Branch 1 taken 1183 times.
1183 if (len < basis)
247 return AVERROR(EINVAL);
248
249
1/2
✗ Branch 1 not taken.
✓ Branch 2 taken 1183 times.
1183 if (!(s->map = av_mallocz(len*sizeof(*s->map))))
250 return AVERROR(ENOMEM);
251
252
3/4
✓ Branch 0 taken 945 times.
✓ Branch 1 taken 238 times.
✗ Branch 2 not taken.
✓ Branch 3 taken 945 times.
1183 av_assert0(!dual_stride || !(dual_stride & (dual_stride - 1)));
253
1/2
✗ Branch 0 not taken.
✓ Branch 1 taken 1183 times.
1183 av_assert0(dual_stride <= basis);
254
255
2/2
✓ Branch 0 taken 1159 times.
✓ Branch 1 taken 24 times.
2342 parity_revtab_generator(s->map, len, inv, 0, 0, 0, len,
256 basis, dual_stride,
257
2/2
✓ Branch 0 taken 543 times.
✓ Branch 1 taken 616 times.
1159 opts ? opts->map_dir == FF_TX_MAP_GATHER : FF_TX_MAP_GATHER);
258
259
2/2
✓ Branch 0 taken 1159 times.
✓ Branch 1 taken 24 times.
1183 s->map_dir = opts ? opts->map_dir : FF_TX_MAP_GATHER;
260
261 1183 return 0;
262 }
263
264 34458 static void reset_ctx(AVTXContext *s, int free_sub)
265 {
266
1/2
✗ Branch 0 not taken.
✓ Branch 1 taken 34458 times.
34458 if (!s)
267 return;
268
269
2/2
✓ Branch 0 taken 6115 times.
✓ Branch 1 taken 28343 times.
34458 if (s->sub)
270
2/2
✓ Branch 0 taken 24460 times.
✓ Branch 1 taken 6115 times.
30575 for (int i = 0; i < TX_MAX_SUB; i++)
271 24460 reset_ctx(&s->sub[i], free_sub + 1);
272
273
3/4
✓ Branch 0 taken 16210 times.
✓ Branch 1 taken 18248 times.
✗ Branch 2 not taken.
✓ Branch 3 taken 16210 times.
34458 if (s->cd_self && s->cd_self->uninit)
274 s->cd_self->uninit(s);
275
276
2/2
✓ Branch 0 taken 30053 times.
✓ Branch 1 taken 4405 times.
34458 if (free_sub)
277 30053 av_freep(&s->sub);
278
279 34458 av_freep(&s->map);
280 34458 av_freep(&s->exp);
281 34458 av_freep(&s->tmp);
282
283 /* Nothing else needs to be reset, it gets overwritten if another
284 * ff_tx_init_subtx() call is made. */
285 34458 s->nb_sub = 0;
286 34458 s->opaque = NULL;
287 34458 memset(s->fn, 0, sizeof(s->fn));
288 }
289
290 97 void ff_tx_clear_ctx(AVTXContext *s)
291 {
292 97 reset_ctx(s, 0);
293 97 }
294
295 6236 av_cold void av_tx_uninit(AVTXContext **ctx)
296 {
297
2/2
✓ Branch 0 taken 643 times.
✓ Branch 1 taken 5593 times.
6236 if (!(*ctx))
298 643 return;
299
300 5593 reset_ctx(*ctx, 1);
301 5593 av_freep(ctx);
302 }
303
304 14 static av_cold int ff_tx_null_init(AVTXContext *s, const FFTXCodelet *cd,
305 uint64_t flags, FFTXCodeletOptions *opts,
306 int len, int inv, const void *scale)
307 {
308 /* Can only handle one sample+type to one sample+type transforms */
309
6/12
✓ Branch 0 taken 14 times.
✗ Branch 1 not taken.
✓ Branch 2 taken 14 times.
✗ Branch 3 not taken.
✓ Branch 4 taken 14 times.
✗ Branch 5 not taken.
✓ Branch 6 taken 14 times.
✗ Branch 7 not taken.
✓ Branch 8 taken 14 times.
✗ Branch 9 not taken.
✗ Branch 10 not taken.
✓ Branch 11 taken 14 times.
14 if (TYPE_IS(MDCT, s->type) || TYPE_IS(RDFT, s->type))
310 return AVERROR(EINVAL);
311 14 return 0;
312 }
313
314 /* Null transform when the length is 1 */
315 2 static void ff_tx_null(AVTXContext *s, void *_out, void *_in, ptrdiff_t stride)
316 {
317 2 memcpy(_out, _in, stride);
318 2 }
319
320 static const FFTXCodelet ff_tx_null_def = {
321 .name = NULL_IF_CONFIG_SMALL("null"),
322 .function = ff_tx_null,
323 .type = TX_TYPE_ANY,
324 .flags = AV_TX_UNALIGNED | FF_TX_ALIGNED |
325 FF_TX_OUT_OF_PLACE | AV_TX_INPLACE,
326 .factors[0] = TX_FACTOR_ANY,
327 .min_len = 1,
328 .max_len = 1,
329 .init = ff_tx_null_init,
330 .cpu_flags = FF_TX_CPU_FLAGS_ALL,
331 .prio = FF_TX_PRIO_MAX,
332 };
333
334 static const FFTXCodelet * const ff_tx_null_list[] = {
335 &ff_tx_null_def,
336 NULL,
337 };
338
339 /* Array of all compiled codelet lists. Order is irrelevant. */
340 static const FFTXCodelet * const * const codelet_list[] = {
341 ff_tx_codelet_list_float_c,
342 ff_tx_codelet_list_double_c,
343 ff_tx_codelet_list_int32_c,
344 ff_tx_null_list,
345 #if HAVE_X86ASM
346 ff_tx_codelet_list_float_x86,
347 #endif
348 #if ARCH_AARCH64
349 ff_tx_codelet_list_float_aarch64,
350 #endif
351 };
352 static const int codelet_list_num = FF_ARRAY_ELEMS(codelet_list);
353
354 static const int cpu_slow_mask = AV_CPU_FLAG_SSE2SLOW | AV_CPU_FLAG_SSE3SLOW |
355 AV_CPU_FLAG_ATOM | AV_CPU_FLAG_SSSE3SLOW |
356 AV_CPU_FLAG_AVXSLOW | AV_CPU_FLAG_SLOW_GATHER;
357
358 static const int cpu_slow_penalties[][2] = {
359 { AV_CPU_FLAG_SSE2SLOW, 1 + 64 },
360 { AV_CPU_FLAG_SSE3SLOW, 1 + 64 },
361 { AV_CPU_FLAG_SSSE3SLOW, 1 + 64 },
362 { AV_CPU_FLAG_ATOM, 1 + 128 },
363 { AV_CPU_FLAG_AVXSLOW, 1 + 128 },
364 { AV_CPU_FLAG_SLOW_GATHER, 1 + 32 },
365 };
366
367 31521 static int get_codelet_prio(const FFTXCodelet *cd, int cpu_flags, int len)
368 {
369 31521 int prio = cd->prio;
370 31521 int max_factor = 0;
371
372 /* If the CPU has a SLOW flag, and the instruction is also flagged
373 * as being slow for such, reduce its priority */
374
2/2
✓ Branch 0 taken 189126 times.
✓ Branch 1 taken 31521 times.
220647 for (int i = 0; i < FF_ARRAY_ELEMS(cpu_slow_penalties); i++) {
375
2/2
✓ Branch 0 taken 1820 times.
✓ Branch 1 taken 187306 times.
189126 if ((cpu_flags & cd->cpu_flags) & cpu_slow_penalties[i][0])
376 1820 prio -= cpu_slow_penalties[i][1];
377 }
378
379 /* Prioritize aligned-only codelets */
380
4/4
✓ Branch 0 taken 4124 times.
✓ Branch 1 taken 27397 times.
✓ Branch 2 taken 4110 times.
✓ Branch 3 taken 14 times.
31521 if ((cd->flags & FF_TX_ALIGNED) && !(cd->flags & AV_TX_UNALIGNED))
381 4110 prio += 64;
382
383 /* Codelets for specific lengths are generally faster */
384
4/4
✓ Branch 0 taken 7315 times.
✓ Branch 1 taken 24206 times.
✓ Branch 2 taken 6702 times.
✓ Branch 3 taken 613 times.
31521 if ((len == cd->min_len) && (len == cd->max_len))
385 6702 prio += 64;
386
387 /* Forward-only or inverse-only transforms are generally better */
388
2/2
✓ Branch 0 taken 16872 times.
✓ Branch 1 taken 14649 times.
31521 if ((cd->flags & (FF_TX_FORWARD_ONLY | FF_TX_INVERSE_ONLY)))
389 16872 prio += 64;
390
391 /* Larger factors are generally better */
392
2/2
✓ Branch 0 taken 126084 times.
✓ Branch 1 taken 31521 times.
157605 for (int i = 0; i < TX_MAX_SUB; i++)
393 126084 max_factor = FFMAX(cd->factors[i], max_factor);
394
2/2
✓ Branch 0 taken 29635 times.
✓ Branch 1 taken 1886 times.
31521 if (max_factor)
395 29635 prio += 16*max_factor;
396
397 31521 return prio;
398 }
399
400 typedef struct FFTXLenDecomp {
401 int len;
402 int len2;
403 int prio;
404 const FFTXCodelet *cd;
405 } FFTXLenDecomp;
406
407 475 static int cmp_decomp(FFTXLenDecomp *a, FFTXLenDecomp *b)
408 {
409 475 return FFDIFFSIGN(b->prio, a->prio);
410 }
411
412 4273 int ff_tx_decompose_length(int dst[TX_MAX_DECOMPOSITIONS], enum AVTXType type,
413 int len, int inv)
414 {
415 4273 int nb_decomp = 0;
416 FFTXLenDecomp ld[TX_MAX_DECOMPOSITIONS];
417 4273 int codelet_list_idx = codelet_list_num;
418
419 4273 const int cpu_flags = av_get_cpu_flags();
420
421 /* Loop through all codelets in all codelet lists to find matches
422 * to the requirements */
423
2/2
✓ Branch 0 taken 21365 times.
✓ Branch 1 taken 4273 times.
25638 while (codelet_list_idx--) {
424 21365 const FFTXCodelet * const * list = codelet_list[codelet_list_idx];
425 21365 const FFTXCodelet *cd = NULL;
426
427
2/2
✓ Branch 0 taken 922968 times.
✓ Branch 1 taken 21365 times.
944333 while ((cd = *list++)) {
428 922968 int fl = len;
429 922968 int skip = 0, prio;
430 922968 int factors_product = 1, factors_mod = 0;
431
432
1/2
✗ Branch 0 not taken.
✓ Branch 1 taken 922968 times.
922968 if (nb_decomp >= TX_MAX_DECOMPOSITIONS)
433 goto sort;
434
435 /* Check if the type matches */
436
4/4
✓ Branch 0 taken 918695 times.
✓ Branch 1 taken 4273 times.
✓ Branch 2 taken 627766 times.
✓ Branch 3 taken 290929 times.
922968 if (cd->type != TX_TYPE_ANY && type != cd->type)
437 627766 continue;
438
439 /* Check direction for non-orthogonal codelets */
440
4/4
✓ Branch 0 taken 20840 times.
✓ Branch 1 taken 274362 times.
✓ Branch 2 taken 3694 times.
✓ Branch 3 taken 17146 times.
295202 if (((cd->flags & FF_TX_FORWARD_ONLY) && inv) ||
441
4/4
✓ Branch 0 taken 7496 times.
✓ Branch 1 taken 270560 times.
✓ Branch 2 taken 6476 times.
✓ Branch 3 taken 1020 times.
278056 ((cd->flags & (FF_TX_INVERSE_ONLY | AV_TX_FULL_IMDCT)) && !inv) ||
442
3/4
✓ Branch 0 taken 3694 times.
✓ Branch 1 taken 273342 times.
✓ Branch 2 taken 3694 times.
✗ Branch 3 not taken.
277036 ((cd->flags & (FF_TX_FORWARD_ONLY | AV_TX_REAL_TO_REAL)) && inv) ||
443
3/4
✓ Branch 0 taken 3694 times.
✓ Branch 1 taken 273342 times.
✗ Branch 2 not taken.
✓ Branch 3 taken 3694 times.
277036 ((cd->flags & (FF_TX_FORWARD_ONLY | AV_TX_REAL_TO_IMAGINARY)) && inv))
444 18166 continue;
445
446 /* Check if the CPU supports the required ISA */
447
2/2
✓ Branch 0 taken 145662 times.
✓ Branch 1 taken 131374 times.
277036 if (cd->cpu_flags != FF_TX_CPU_FLAGS_ALL &&
448
2/2
✓ Branch 0 taken 144254 times.
✓ Branch 1 taken 1408 times.
145662 !(cpu_flags & (cd->cpu_flags & ~cpu_slow_mask)))
449 144254 continue;
450
451
1/2
✓ Branch 0 taken 291202 times.
✗ Branch 1 not taken.
291202 for (int i = 0; i < TX_MAX_FACTORS; i++) {
452
4/4
✓ Branch 0 taken 166950 times.
✓ Branch 1 taken 124252 times.
✓ Branch 2 taken 158420 times.
✓ Branch 3 taken 8530 times.
291202 if (!cd->factors[i] || (fl == 1))
453 break;
454
455
2/2
✓ Branch 0 taken 25654 times.
✓ Branch 1 taken 132766 times.
158420 if (cd->factors[i] == TX_FACTOR_ANY) {
456 25654 factors_mod++;
457 25654 factors_product *= fl;
458
2/2
✓ Branch 0 taken 83132 times.
✓ Branch 1 taken 49634 times.
132766 } else if (!(fl % cd->factors[i])) {
459 83132 factors_mod++;
460
2/2
✓ Branch 0 taken 82291 times.
✓ Branch 1 taken 841 times.
83132 if (cd->factors[i] == 2) {
461 82291 int b = ff_ctz(fl);
462 82291 fl >>= b;
463 82291 factors_product <<= b;
464 } else {
465 do {
466 873 fl /= cd->factors[i];
467 873 factors_product *= cd->factors[i];
468
2/2
✓ Branch 0 taken 32 times.
✓ Branch 1 taken 841 times.
873 } while (!(fl % cd->factors[i]));
469 }
470 }
471 }
472
473 /* Disqualify if factor requirements are not satisfied or if trivial */
474
4/4
✓ Branch 0 taken 100078 times.
✓ Branch 1 taken 32704 times.
✓ Branch 2 taken 97908 times.
✓ Branch 3 taken 2170 times.
132782 if ((factors_mod < cd->nb_factors) || (len == factors_product))
475 130612 continue;
476
477
1/2
✗ Branch 0 not taken.
✓ Branch 1 taken 2170 times.
2170 if (av_gcd(factors_product, fl) != 1)
478 continue;
479
480 /* Check if length is supported and factorization was successful */
481
2/2
✓ Branch 0 taken 1198 times.
✓ Branch 1 taken 972 times.
2170 if ((factors_product < cd->min_len) ||
482
3/4
✓ Branch 0 taken 1198 times.
✗ Branch 1 not taken.
✓ Branch 2 taken 616 times.
✓ Branch 3 taken 582 times.
1198 (cd->max_len != TX_LEN_UNLIMITED && (factors_product > cd->max_len)))
483 1588 continue;
484
485 582 prio = get_codelet_prio(cd, cpu_flags, factors_product) * factors_product;
486
487 /* Check for duplicates */
488
2/2
✓ Branch 0 taken 979 times.
✓ Branch 1 taken 348 times.
1327 for (int i = 0; i < nb_decomp; i++) {
489
2/2
✓ Branch 0 taken 234 times.
✓ Branch 1 taken 745 times.
979 if (factors_product == ld[i].len) {
490 /* Update priority if new one is higher */
491
2/2
✓ Branch 0 taken 204 times.
✓ Branch 1 taken 30 times.
234 if (prio > ld[i].prio)
492 204 ld[i].prio = prio;
493 234 skip = 1;
494 234 break;
495 }
496 }
497
498 /* Add decomposition if unique */
499
2/2
✓ Branch 0 taken 348 times.
✓ Branch 1 taken 234 times.
582 if (!skip) {
500 348 ld[nb_decomp].cd = cd;
501 348 ld[nb_decomp].len = factors_product;
502 348 ld[nb_decomp].len2 = fl;
503 348 ld[nb_decomp].prio = prio;
504 348 nb_decomp++;
505 }
506 }
507 }
508
509
2/2
✓ Branch 0 taken 4176 times.
✓ Branch 1 taken 97 times.
4273 if (!nb_decomp)
510 4176 return AVERROR(EINVAL);
511
512 97 sort:
513
27/44
✓ Branch 0 taken 81 times.
✓ Branch 1 taken 89 times.
✓ Branch 3 taken 27 times.
✓ Branch 4 taken 54 times.
✗ Branch 6 not taken.
✓ Branch 7 taken 27 times.
✗ Branch 9 not taken.
✓ Branch 10 taken 54 times.
✓ Branch 12 taken 81 times.
✗ Branch 13 not taken.
✗ Branch 14 not taken.
✓ Branch 15 taken 81 times.
✓ Branch 16 taken 81 times.
✓ Branch 17 taken 19 times.
✓ Branch 19 taken 19 times.
✓ Branch 20 taken 62 times.
✓ Branch 21 taken 62 times.
✓ Branch 22 taken 81 times.
✓ Branch 24 taken 62 times.
✗ Branch 25 not taken.
✗ Branch 26 not taken.
✓ Branch 27 taken 81 times.
✓ Branch 28 taken 81 times.
✓ Branch 29 taken 81 times.
✗ Branch 30 not taken.
✓ Branch 31 taken 81 times.
✗ Branch 32 not taken.
✗ Branch 33 not taken.
✗ Branch 34 not taken.
✗ Branch 35 not taken.
✗ Branch 36 not taken.
✗ Branch 37 not taken.
✗ Branch 39 not taken.
✗ Branch 40 not taken.
✗ Branch 41 not taken.
✗ Branch 42 not taken.
✓ Branch 43 taken 19 times.
✓ Branch 44 taken 62 times.
✓ Branch 46 taken 8 times.
✓ Branch 47 taken 81 times.
✓ Branch 48 taken 170 times.
✓ Branch 49 taken 89 times.
✓ Branch 50 taken 178 times.
✓ Branch 51 taken 97 times.
599 AV_QSORT(ld, nb_decomp, FFTXLenDecomp, cmp_decomp);
514
515
2/2
✓ Branch 0 taken 348 times.
✓ Branch 1 taken 97 times.
445 for (int i = 0; i < nb_decomp; i++) {
516
1/2
✗ Branch 0 not taken.
✓ Branch 1 taken 348 times.
348 if (ld[i].cd->nb_factors > 1)
517 dst[i] = ld[i].len2;
518 else
519 348 dst[i] = ld[i].len;
520 }
521
522 97 return nb_decomp;
523 }
524
525 24 int ff_tx_gen_default_map(AVTXContext *s, FFTXCodeletOptions *opts)
526 {
527 24 s->map = av_malloc(s->len*sizeof(*s->map));
528
1/2
✗ Branch 0 not taken.
✓ Branch 1 taken 24 times.
24 if (!s->map)
529 return AVERROR(ENOMEM);
530
531 24 s->map[0] = 0; /* DC is always at the start */
532
1/2
✗ Branch 0 not taken.
✓ Branch 1 taken 24 times.
24 if (s->inv) /* Reversing the ACs flips the transform direction */
533 for (int i = 1; i < s->len; i++)
534 s->map[i] = s->len - i;
535 else
536
2/2
✓ Branch 0 taken 144 times.
✓ Branch 1 taken 24 times.
168 for (int i = 1; i < s->len; i++)
537 144 s->map[i] = i;
538
539 24 s->map_dir = FF_TX_MAP_GATHER;
540
541 24 return 0;
542 }
543
544 #if !CONFIG_SMALL
545 54703 static void print_flags(AVBPrint *bp, uint64_t f)
546 {
547 54703 int prev = 0;
548 54703 const char *sep = ", ";
549 54703 av_bprintf(bp, "flags: [");
550
3/4
✓ Branch 0 taken 18614 times.
✓ Branch 1 taken 36089 times.
✓ Branch 2 taken 18614 times.
✗ Branch 3 not taken.
54703 if ((f & FF_TX_ALIGNED) && ++prev)
551 18614 av_bprintf(bp, "aligned");
552
3/4
✓ Branch 0 taken 36117 times.
✓ Branch 1 taken 18586 times.
✓ Branch 2 taken 36117 times.
✗ Branch 3 not taken.
54703 if ((f & AV_TX_UNALIGNED) && ++prev)
553
2/2
✓ Branch 0 taken 28 times.
✓ Branch 1 taken 36089 times.
36117 av_bprintf(bp, "%sunaligned", prev > 1 ? sep : "");
554
3/4
✓ Branch 0 taken 25665 times.
✓ Branch 1 taken 29038 times.
✓ Branch 2 taken 25665 times.
✗ Branch 3 not taken.
54703 if ((f & AV_TX_INPLACE) && ++prev)
555
1/2
✓ Branch 0 taken 25665 times.
✗ Branch 1 not taken.
25665 av_bprintf(bp, "%sinplace", prev > 1 ? sep : "");
556
3/4
✓ Branch 0 taken 48590 times.
✓ Branch 1 taken 6113 times.
✓ Branch 2 taken 48590 times.
✗ Branch 3 not taken.
54703 if ((f & FF_TX_OUT_OF_PLACE) && ++prev)
557
1/2
✓ Branch 0 taken 48590 times.
✗ Branch 1 not taken.
48590 av_bprintf(bp, "%sout_of_place", prev > 1 ? sep : "");
558
3/4
✓ Branch 0 taken 1163 times.
✓ Branch 1 taken 53540 times.
✓ Branch 2 taken 1163 times.
✗ Branch 3 not taken.
54703 if ((f & FF_TX_FORWARD_ONLY) && ++prev)
559
1/2
✓ Branch 0 taken 1163 times.
✗ Branch 1 not taken.
1163 av_bprintf(bp, "%sfwd_only", prev > 1 ? sep : "");
560
3/4
✓ Branch 0 taken 20808 times.
✓ Branch 1 taken 33895 times.
✓ Branch 2 taken 20808 times.
✗ Branch 3 not taken.
54703 if ((f & FF_TX_INVERSE_ONLY) && ++prev)
561
1/2
✓ Branch 0 taken 20808 times.
✗ Branch 1 not taken.
20808 av_bprintf(bp, "%sinv_only", prev > 1 ? sep : "");
562
3/4
✓ Branch 0 taken 24143 times.
✓ Branch 1 taken 30560 times.
✓ Branch 2 taken 24143 times.
✗ Branch 3 not taken.
54703 if ((f & FF_TX_PRESHUFFLE) && ++prev)
563
1/2
✓ Branch 0 taken 24143 times.
✗ Branch 1 not taken.
24143 av_bprintf(bp, "%spreshuf", prev > 1 ? sep : "");
564
3/4
✓ Branch 0 taken 207 times.
✓ Branch 1 taken 54496 times.
✓ Branch 2 taken 207 times.
✗ Branch 3 not taken.
54703 if ((f & AV_TX_FULL_IMDCT) && ++prev)
565
1/2
✓ Branch 0 taken 207 times.
✗ Branch 1 not taken.
207 av_bprintf(bp, "%simdct_full", prev > 1 ? sep : "");
566
3/4
✓ Branch 0 taken 24 times.
✓ Branch 1 taken 54679 times.
✓ Branch 2 taken 24 times.
✗ Branch 3 not taken.
54703 if ((f & AV_TX_REAL_TO_REAL) && ++prev)
567
1/2
✓ Branch 0 taken 24 times.
✗ Branch 1 not taken.
24 av_bprintf(bp, "%sreal_to_real", prev > 1 ? sep : "");
568
3/4
✓ Branch 0 taken 24 times.
✓ Branch 1 taken 54679 times.
✓ Branch 2 taken 24 times.
✗ Branch 3 not taken.
54703 if ((f & AV_TX_REAL_TO_IMAGINARY) && ++prev)
569
1/2
✓ Branch 0 taken 24 times.
✗ Branch 1 not taken.
24 av_bprintf(bp, "%sreal_to_imaginary", prev > 1 ? sep : "");
570
3/4
✓ Branch 0 taken 5258 times.
✓ Branch 1 taken 49445 times.
✓ Branch 2 taken 5258 times.
✗ Branch 3 not taken.
54703 if ((f & FF_TX_ASM_CALL) && ++prev)
571
1/2
✓ Branch 0 taken 5258 times.
✗ Branch 1 not taken.
5258 av_bprintf(bp, "%sasm_call", prev > 1 ? sep : "");
572 54703 av_bprintf(bp, "]");
573 54703 }
574
575 54703 static void print_type(AVBPrint *bp, enum AVTXType type)
576 {
577
2/2
✓ Branch 0 taken 54675 times.
✓ Branch 1 taken 28 times.
109378 av_bprintf(bp, "%s",
578 type == TX_TYPE_ANY ? "any" :
579
2/2
✓ Branch 0 taken 30574 times.
✓ Branch 1 taken 24101 times.
85249 type == AV_TX_FLOAT_FFT ? "fft_float" :
580
2/2
✓ Branch 0 taken 4767 times.
✓ Branch 1 taken 25807 times.
35341 type == AV_TX_FLOAT_MDCT ? "mdct_float" :
581
2/2
✓ Branch 0 taken 4590 times.
✓ Branch 1 taken 177 times.
9357 type == AV_TX_FLOAT_RDFT ? "rdft_float" :
582
2/2
✓ Branch 0 taken 4566 times.
✓ Branch 1 taken 24 times.
9156 type == AV_TX_FLOAT_DCT_I ? "dctI_float" :
583
2/2
✓ Branch 0 taken 4542 times.
✓ Branch 1 taken 24 times.
9108 type == AV_TX_FLOAT_DST_I ? "dstI_float" :
584
2/2
✓ Branch 0 taken 2610 times.
✓ Branch 1 taken 1932 times.
7152 type == AV_TX_DOUBLE_FFT ? "fft_double" :
585
1/2
✓ Branch 0 taken 2610 times.
✗ Branch 1 not taken.
5220 type == AV_TX_DOUBLE_MDCT ? "mdct_double" :
586
1/2
✓ Branch 0 taken 2610 times.
✗ Branch 1 not taken.
5220 type == AV_TX_DOUBLE_RDFT ? "rdft_double" :
587
1/2
✓ Branch 0 taken 2610 times.
✗ Branch 1 not taken.
5220 type == AV_TX_DOUBLE_DCT_I ? "dctI_double" :
588
1/2
✓ Branch 0 taken 2610 times.
✗ Branch 1 not taken.
5220 type == AV_TX_DOUBLE_DST_I ? "dstI_double" :
589
2/2
✓ Branch 0 taken 1449 times.
✓ Branch 1 taken 1161 times.
4059 type == AV_TX_INT32_FFT ? "fft_int32" :
590
2/2
✓ Branch 0 taken 12 times.
✓ Branch 1 taken 1437 times.
1461 type == AV_TX_INT32_MDCT ? "mdct_int32" :
591
1/2
✓ Branch 0 taken 12 times.
✗ Branch 1 not taken.
24 type == AV_TX_INT32_RDFT ? "rdft_int32" :
592
1/2
✓ Branch 0 taken 12 times.
✗ Branch 1 not taken.
24 type == AV_TX_INT32_DCT_I ? "dctI_int32" :
593
1/2
✗ Branch 0 not taken.
✓ Branch 1 taken 12 times.
12 type == AV_TX_INT32_DST_I ? "dstI_int32" :
594 "unknown");
595 54703 }
596
597 42744 static void print_cd_info(const FFTXCodelet *cd, int prio, int len, int print_prio,
598 int log_level)
599 {
600 AVBPrint bp;
601 42744 av_bprint_init(&bp, 0, AV_BPRINT_SIZE_AUTOMATIC);
602
603 42744 av_bprintf(&bp, "%s - type: ", cd->name);
604
605 42744 print_type(&bp, cd->type);
606
607 42744 av_bprintf(&bp, ", len: ");
608
2/2
✓ Branch 0 taken 30939 times.
✓ Branch 1 taken 11805 times.
42744 if (!len) {
609
2/2
✓ Branch 0 taken 24801 times.
✓ Branch 1 taken 6138 times.
30939 if (cd->min_len != cd->max_len)
610 24801 av_bprintf(&bp, "[%i, ", cd->min_len);
611
612
2/2
✓ Branch 0 taken 22932 times.
✓ Branch 1 taken 8007 times.
30939 if (cd->max_len == TX_LEN_UNLIMITED)
613 22932 av_bprintf(&bp, "∞");
614 else
615 8007 av_bprintf(&bp, "%i", cd->max_len);
616 } else {
617 11805 av_bprintf(&bp, "%i", len);
618 }
619
620
2/2
✓ Branch 0 taken 27642 times.
✓ Branch 1 taken 15102 times.
42744 if (cd->factors[1]) {
621
3/4
✓ Branch 0 taken 21765 times.
✓ Branch 1 taken 5877 times.
✓ Branch 2 taken 21765 times.
✗ Branch 3 not taken.
27642 av_bprintf(&bp, "%s, factors", !len && cd->min_len != cd->max_len ? "]" : "");
622
2/2
✓ Branch 0 taken 8 times.
✓ Branch 1 taken 27634 times.
27642 if (!cd->nb_factors)
623 8 av_bprintf(&bp, ": [");
624 else
625 27634 av_bprintf(&bp, "[%i]: [", cd->nb_factors);
626
627
1/2
✓ Branch 0 taken 96969 times.
✗ Branch 1 not taken.
96969 for (int i = 0; i < TX_MAX_FACTORS; i++) {
628
4/4
✓ Branch 0 taken 69327 times.
✓ Branch 1 taken 27642 times.
✓ Branch 2 taken 41685 times.
✓ Branch 3 taken 27642 times.
96969 if (i && cd->factors[i])
629 41685 av_bprintf(&bp, ", ");
630
2/2
✓ Branch 0 taken 26802 times.
✓ Branch 1 taken 70167 times.
96969 if (cd->factors[i] == TX_FACTOR_ANY)
631 26802 av_bprintf(&bp, "any");
632
2/2
✓ Branch 0 taken 42525 times.
✓ Branch 1 taken 27642 times.
70167 else if (cd->factors[i])
633 42525 av_bprintf(&bp, "%i", cd->factors[i]);
634 else
635 27642 break;
636 }
637
638 27642 av_bprintf(&bp, "], ");
639 } else {
640 15102 av_bprintf(&bp, "%s, factor: %i, ",
641
4/4
✓ Branch 0 taken 9174 times.
✓ Branch 1 taken 5928 times.
✓ Branch 2 taken 3036 times.
✓ Branch 3 taken 6138 times.
15102 !len && cd->min_len != cd->max_len ? "]" : "", cd->factors[0]);
642 }
643 42744 print_flags(&bp, cd->flags);
644
645
2/2
✓ Branch 0 taken 30939 times.
✓ Branch 1 taken 11805 times.
42744 if (print_prio)
646 30939 av_bprintf(&bp, ", prio: %i", prio);
647
648 42744 av_log(NULL, log_level, "%s\n", bp.str);
649 42744 }
650
651 11805 static void print_tx_structure(AVTXContext *s, int depth)
652 {
653 11805 const FFTXCodelet *cd = s->cd_self;
654
655
2/2
✓ Branch 0 taken 18634 times.
✓ Branch 1 taken 11805 times.
30439 for (int i = 0; i <= depth; i++)
656 18634 av_log(NULL, AV_LOG_DEBUG, " ");
657
658 11805 print_cd_info(cd, cd->prio, s->len, 0, AV_LOG_DEBUG);
659
660
2/2
✓ Branch 0 taken 6212 times.
✓ Branch 1 taken 11805 times.
18017 for (int i = 0; i < s->nb_sub; i++)
661 6212 print_tx_structure(&s->sub[i], depth + 1);
662 11805 }
663 #endif /* CONFIG_SMALL */
664
665 typedef struct TXCodeletMatch {
666 const FFTXCodelet *cd;
667 int prio;
668 } TXCodeletMatch;
669
670 31392 static int cmp_matches(TXCodeletMatch *a, TXCodeletMatch *b)
671 {
672 31392 return FFDIFFSIGN(b->prio, a->prio);
673 }
674
675 /* We want all factors to completely cover the length */
676 53167 static inline int check_cd_factors(const FFTXCodelet *cd, int len)
677 {
678 53167 int matches = 0, any_flag = 0;
679
680
1/2
✓ Branch 0 taken 162944 times.
✗ Branch 1 not taken.
162944 for (int i = 0; i < TX_MAX_FACTORS; i++) {
681 162944 int factor = cd->factors[i];
682
683
2/2
✓ Branch 0 taken 43843 times.
✓ Branch 1 taken 119101 times.
162944 if (factor == TX_FACTOR_ANY) {
684 43843 any_flag = 1;
685 43843 matches++;
686 43843 continue;
687
4/4
✓ Branch 0 taken 99622 times.
✓ Branch 1 taken 19479 times.
✓ Branch 2 taken 65934 times.
✓ Branch 3 taken 33688 times.
119101 } else if (len <= 1 || !factor) {
688 break;
689
2/2
✓ Branch 0 taken 25220 times.
✓ Branch 1 taken 40714 times.
65934 } else if (factor == 2) { /* Fast path */
690 25220 int bits_2 = ff_ctz(len);
691
2/2
✓ Branch 0 taken 48 times.
✓ Branch 1 taken 25172 times.
25220 if (!bits_2)
692 48 continue; /* Factor not supported */
693
694 25172 len >>= bits_2;
695 25172 matches++;
696 } else {
697 40714 int res = len % factor;
698
2/2
✓ Branch 0 taken 34629 times.
✓ Branch 1 taken 6085 times.
40714 if (res)
699 34629 continue; /* Factor not supported */
700
701
2/2
✓ Branch 0 taken 6259 times.
✓ Branch 1 taken 6085 times.
12344 while (!res) {
702 6259 len /= factor;
703 6259 res = len % factor;
704 }
705 6085 matches++;
706 }
707 }
708
709
6/6
✓ Branch 0 taken 32016 times.
✓ Branch 1 taken 21151 times.
✓ Branch 2 taken 8874 times.
✓ Branch 3 taken 23142 times.
✓ Branch 4 taken 7797 times.
✓ Branch 5 taken 1077 times.
53167 return (cd->nb_factors <= matches) && (any_flag || len == 1);
710 }
711
712 11959 av_cold int ff_tx_init_subtx(AVTXContext *s, enum AVTXType type,
713 uint64_t flags, FFTXCodeletOptions *opts,
714 int len, int inv, const void *scale)
715 {
716 11959 int ret = 0;
717 11959 AVTXContext *sub = NULL;
718 11959 TXCodeletMatch *cd_tmp, *cd_matches = NULL;
719 11959 unsigned int cd_matches_size = 0;
720 11959 int codelet_list_idx = codelet_list_num;
721 11959 int nb_cd_matches = 0;
722 #if !CONFIG_SMALL
723 AVBPrint bp;
724 #endif
725
726 /* We still accept functions marked with SLOW, even if the CPU is
727 * marked with the same flag, but we give them lower priority. */
728 11959 const int cpu_flags = av_get_cpu_flags();
729
730 /* Flags the transform wants */
731 11959 uint64_t req_flags = flags;
732
733 /* Flags the codelet may require to be present */
734 11959 uint64_t inv_req_mask = AV_TX_FULL_IMDCT |
735 AV_TX_REAL_TO_REAL |
736 AV_TX_REAL_TO_IMAGINARY |
737 FF_TX_PRESHUFFLE |
738 FF_TX_ASM_CALL;
739
740 /* Unaligned codelets are compatible with the aligned flag */
741
1/2
✓ Branch 0 taken 11959 times.
✗ Branch 1 not taken.
11959 if (req_flags & FF_TX_ALIGNED)
742 11959 req_flags |= AV_TX_UNALIGNED;
743
744 /* If either flag is set, both are okay, so don't check for an exact match */
745
3/4
✓ Branch 0 taken 6113 times.
✓ Branch 1 taken 5846 times.
✗ Branch 2 not taken.
✓ Branch 3 taken 6113 times.
11959 if ((req_flags & AV_TX_INPLACE) && (req_flags & FF_TX_OUT_OF_PLACE))
746 req_flags &= ~(AV_TX_INPLACE | FF_TX_OUT_OF_PLACE);
747
2/4
✓ Branch 0 taken 11959 times.
✗ Branch 1 not taken.
✓ Branch 2 taken 11959 times.
✗ Branch 3 not taken.
11959 if ((req_flags & FF_TX_ALIGNED) && (req_flags & AV_TX_UNALIGNED))
748 11959 req_flags &= ~(FF_TX_ALIGNED | AV_TX_UNALIGNED);
749
750 /* Loop through all codelets in all codelet lists to find matches
751 * to the requirements */
752
2/2
✓ Branch 0 taken 59795 times.
✓ Branch 1 taken 11959 times.
71754 while (codelet_list_idx--) {
753 59795 const FFTXCodelet * const * list = codelet_list[codelet_list_idx];
754 59795 const FFTXCodelet *cd = NULL;
755
756
2/2
✓ Branch 0 taken 2583144 times.
✓ Branch 1 taken 59795 times.
2642939 while ((cd = *list++)) {
757 /* Check if the type matches */
758
4/4
✓ Branch 0 taken 2571185 times.
✓ Branch 1 taken 11959 times.
✓ Branch 2 taken 2030720 times.
✓ Branch 3 taken 540465 times.
2583144 if (cd->type != TX_TYPE_ANY && type != cd->type)
759 2030720 continue;
760
761 /* Check direction for non-orthogonal codelets */
762
4/4
✓ Branch 0 taken 69615 times.
✓ Branch 1 taken 482809 times.
✓ Branch 2 taken 7988 times.
✓ Branch 3 taken 61627 times.
552424 if (((cd->flags & FF_TX_FORWARD_ONLY) && inv) ||
763
4/4
✓ Branch 0 taken 59202 times.
✓ Branch 1 taken 431595 times.
✓ Branch 2 taken 54447 times.
✓ Branch 3 taken 4755 times.
490797 ((cd->flags & (FF_TX_INVERSE_ONLY | AV_TX_FULL_IMDCT)) && !inv) ||
764
3/4
✓ Branch 0 taken 7988 times.
✓ Branch 1 taken 478054 times.
✓ Branch 2 taken 7988 times.
✗ Branch 3 not taken.
486042 ((cd->flags & (FF_TX_FORWARD_ONLY | AV_TX_REAL_TO_REAL)) && inv) ||
765
3/4
✓ Branch 0 taken 7988 times.
✓ Branch 1 taken 478054 times.
✗ Branch 2 not taken.
✓ Branch 3 taken 7988 times.
486042 ((cd->flags & (FF_TX_FORWARD_ONLY | AV_TX_REAL_TO_IMAGINARY)) && inv))
766 66382 continue;
767
768 /* Check if the requested flags match from both sides */
769
2/2
✓ Branch 0 taken 306828 times.
✓ Branch 1 taken 179214 times.
486042 if (((req_flags & cd->flags) != (req_flags)) ||
770
2/2
✓ Branch 0 taken 71354 times.
✓ Branch 1 taken 235474 times.
306828 ((inv_req_mask & cd->flags) != (req_flags & inv_req_mask)))
771 250568 continue;
772
773 /* Check if length is supported */
774
6/6
✓ Branch 0 taken 158579 times.
✓ Branch 1 taken 76895 times.
✓ Branch 2 taken 109086 times.
✓ Branch 3 taken 49493 times.
✓ Branch 4 taken 90223 times.
✓ Branch 5 taken 18863 times.
235474 if ((len < cd->min_len) || (cd->max_len != -1 && (len > cd->max_len)))
775 167118 continue;
776
777 /* Check if the CPU supports the required ISA */
778
2/2
✓ Branch 0 taken 20762 times.
✓ Branch 1 taken 47594 times.
68356 if (cd->cpu_flags != FF_TX_CPU_FLAGS_ALL &&
779
2/2
✓ Branch 0 taken 15189 times.
✓ Branch 1 taken 5573 times.
20762 !(cpu_flags & (cd->cpu_flags & ~cpu_slow_mask)))
780 15189 continue;
781
782 /* Check for factors */
783
2/2
✓ Branch 1 taken 22228 times.
✓ Branch 2 taken 30939 times.
53167 if (!check_cd_factors(cd, len))
784 22228 continue;
785
786 /* Realloc array and append */
787 30939 cd_tmp = av_fast_realloc(cd_matches, &cd_matches_size,
788 30939 sizeof(*cd_tmp) * (nb_cd_matches + 1));
789
1/2
✗ Branch 0 not taken.
✓ Branch 1 taken 30939 times.
30939 if (!cd_tmp) {
790 av_free(cd_matches);
791 return AVERROR(ENOMEM);
792 }
793
794 30939 cd_matches = cd_tmp;
795 30939 cd_matches[nb_cd_matches].cd = cd;
796 30939 cd_matches[nb_cd_matches].prio = get_codelet_prio(cd, cpu_flags, len);
797 30939 nb_cd_matches++;
798 }
799 }
800
801 #if !CONFIG_SMALL
802 /* Print debugging info */
803 11959 av_bprint_init(&bp, 0, AV_BPRINT_SIZE_AUTOMATIC);
804
2/2
✓ Branch 0 taken 10413 times.
✓ Branch 1 taken 1546 times.
11959 av_bprintf(&bp, "For transform of length %i, %s, ", len,
805 inv ? "inverse" : "forward");
806 11959 print_type(&bp, type);
807 11959 av_bprintf(&bp, ", ");
808 11959 print_flags(&bp, flags);
809
2/2
✓ Branch 0 taken 11805 times.
✓ Branch 1 taken 154 times.
11959 av_bprintf(&bp, ", found %i matches%s", nb_cd_matches,
810 nb_cd_matches ? ":" : ".");
811 #endif
812
813 /* No matches found */
814
2/2
✓ Branch 0 taken 154 times.
✓ Branch 1 taken 11805 times.
11959 if (!nb_cd_matches)
815 154 return AVERROR(ENOSYS);
816
817 /* Sort the list */
818
44/44
✓ Branch 0 taken 5361 times.
✓ Branch 1 taken 8302 times.
✓ Branch 3 taken 1406 times.
✓ Branch 4 taken 3955 times.
✓ Branch 6 taken 309 times.
✓ Branch 7 taken 1097 times.
✓ Branch 9 taken 1796 times.
✓ Branch 10 taken 2159 times.
✓ Branch 12 taken 2097 times.
✓ Branch 13 taken 3264 times.
✓ Branch 14 taken 3163 times.
✓ Branch 15 taken 2198 times.
✓ Branch 16 taken 4144 times.
✓ Branch 17 taken 1644 times.
✓ Branch 19 taken 2921 times.
✓ Branch 20 taken 1223 times.
✓ Branch 21 taken 1271 times.
✓ Branch 22 taken 2110 times.
✓ Branch 24 taken 514 times.
✓ Branch 25 taken 757 times.
✓ Branch 26 taken 2110 times.
✓ Branch 27 taken 757 times.
✓ Branch 28 taken 2867 times.
✓ Branch 29 taken 2198 times.
✓ Branch 30 taken 926 times.
✓ Branch 31 taken 1272 times.
✓ Branch 32 taken 369 times.
✓ Branch 33 taken 557 times.
✓ Branch 34 taken 310 times.
✓ Branch 35 taken 59 times.
✓ Branch 36 taken 1592 times.
✓ Branch 37 taken 110 times.
✓ Branch 39 taken 835 times.
✓ Branch 40 taken 757 times.
✓ Branch 41 taken 110 times.
✓ Branch 42 taken 757 times.
✓ Branch 43 taken 1554 times.
✓ Branch 44 taken 534 times.
✓ Branch 46 taken 5139 times.
✓ Branch 47 taken 3163 times.
✓ Branch 48 taken 13663 times.
✓ Branch 49 taken 2318 times.
✓ Branch 50 taken 13893 times.
✓ Branch 51 taken 11805 times.
37121 AV_QSORT(cd_matches, nb_cd_matches, TXCodeletMatch, cmp_matches);
819
820 #if !CONFIG_SMALL
821 11805 av_log(NULL, AV_LOG_TRACE, "%s\n", bp.str);
822
823
2/2
✓ Branch 0 taken 30939 times.
✓ Branch 1 taken 11805 times.
42744 for (int i = 0; i < nb_cd_matches; i++) {
824 30939 av_log(NULL, AV_LOG_TRACE, " %i: ", i + 1);
825 30939 print_cd_info(cd_matches[i].cd, cd_matches[i].prio, 0, 1, AV_LOG_TRACE);
826 }
827 #endif
828
829
2/2
✓ Branch 0 taken 11708 times.
✓ Branch 1 taken 97 times.
11805 if (!s->sub) {
830 11708 s->sub = sub = av_mallocz(TX_MAX_SUB*sizeof(*sub));
831
1/2
✗ Branch 0 not taken.
✓ Branch 1 taken 11708 times.
11708 if (!sub) {
832 ret = AVERROR(ENOMEM);
833 goto end;
834 }
835 }
836
837 /* Attempt to initialize each */
838
1/2
✓ Branch 0 taken 16113 times.
✗ Branch 1 not taken.
16113 for (int i = 0; i < nb_cd_matches; i++) {
839 16113 const FFTXCodelet *cd = cd_matches[i].cd;
840 16113 AVTXContext *sctx = &s->sub[s->nb_sub];
841
842 16113 sctx->len = len;
843 16113 sctx->inv = inv;
844 16113 sctx->type = type;
845 16113 sctx->flags = cd->flags | flags;
846 16113 sctx->cd_self = cd;
847
848 16113 s->fn[s->nb_sub] = cd->function;
849 16113 s->cd[s->nb_sub] = cd;
850
851 16113 ret = 0;
852
2/2
✓ Branch 0 taken 16094 times.
✓ Branch 1 taken 19 times.
16113 if (cd->init)
853 16094 ret = cd->init(sctx, cd, flags, opts, len, inv, scale);
854
855
2/2
✓ Branch 0 taken 11805 times.
✓ Branch 1 taken 4308 times.
16113 if (ret >= 0) {
856
3/4
✓ Branch 0 taken 6064 times.
✓ Branch 1 taken 5741 times.
✓ Branch 2 taken 6064 times.
✗ Branch 3 not taken.
11805 if (opts && opts->map_dir != FF_TX_MAP_NONE &&
857
2/2
✓ Branch 0 taken 22 times.
✓ Branch 1 taken 6042 times.
6064 sctx->map_dir == FF_TX_MAP_NONE) {
858 /* If a specific map direction was requested, and it doesn't
859 * exist, create one.*/
860 22 sctx->map = av_malloc(len*sizeof(*sctx->map));
861
1/2
✗ Branch 0 not taken.
✓ Branch 1 taken 22 times.
22 if (!sctx->map) {
862 ret = AVERROR(ENOMEM);
863 goto end;
864 }
865
866
2/2
✓ Branch 0 taken 118 times.
✓ Branch 1 taken 22 times.
140 for (int i = 0; i < len; i++)
867 118 sctx->map[i] = i;
868
4/4
✓ Branch 0 taken 6042 times.
✓ Branch 1 taken 5741 times.
✓ Branch 2 taken 16 times.
✓ Branch 3 taken 6026 times.
11783 } else if (opts && (opts->map_dir != sctx->map_dir)) {
869 16 int *tmp = av_malloc(len*sizeof(*sctx->map));
870
1/2
✗ Branch 0 not taken.
✓ Branch 1 taken 16 times.
16 if (!tmp) {
871 ret = AVERROR(ENOMEM);
872 goto end;
873 }
874
875 16 memcpy(tmp, sctx->map, len*sizeof(*sctx->map));
876
877
2/2
✓ Branch 0 taken 112 times.
✓ Branch 1 taken 16 times.
128 for (int i = 0; i < len; i++)
878 112 sctx->map[tmp[i]] = i;
879
880 16 av_free(tmp);
881 }
882
883 11805 s->nb_sub++;
884 11805 goto end;
885 }
886
887 4308 s->fn[s->nb_sub] = NULL;
888 4308 s->cd[s->nb_sub] = NULL;
889
890 4308 reset_ctx(sctx, 0);
891
1/2
✗ Branch 0 not taken.
✓ Branch 1 taken 4308 times.
4308 if (ret == AVERROR(ENOMEM))
892 break;
893 }
894
895 if (!s->nb_sub)
896 av_freep(&s->sub);
897
898 end:
899 11805 av_free(cd_matches);
900 11805 return ret;
901 }
902
903 5593 av_cold int av_tx_init(AVTXContext **ctx, av_tx_fn *tx, enum AVTXType type,
904 int inv, int len, const void *scale, uint64_t flags)
905 {
906 int ret;
907 5593 AVTXContext tmp = { 0 };
908 5593 const double default_scale_d = 1.0;
909 5593 const float default_scale_f = 1.0f;
910
911
4/8
✓ Branch 0 taken 5593 times.
✗ Branch 1 not taken.
✓ Branch 2 taken 5593 times.
✗ Branch 3 not taken.
✓ Branch 4 taken 5593 times.
✗ Branch 5 not taken.
✗ Branch 6 not taken.
✓ Branch 7 taken 5593 times.
5593 if (!len || type >= AV_TX_NB || !ctx || !tx)
912 return AVERROR(EINVAL);
913
914
1/2
✓ Branch 0 taken 5593 times.
✗ Branch 1 not taken.
5593 if (!(flags & AV_TX_UNALIGNED))
915 5593 flags |= FF_TX_ALIGNED;
916
1/2
✓ Branch 0 taken 5593 times.
✗ Branch 1 not taken.
5593 if (!(flags & AV_TX_INPLACE))
917 5593 flags |= FF_TX_OUT_OF_PLACE;
918
919
5/8
✓ Branch 0 taken 12 times.
✓ Branch 1 taken 5581 times.
✓ Branch 2 taken 12 times.
✗ Branch 3 not taken.
✓ Branch 4 taken 12 times.
✗ Branch 5 not taken.
✓ Branch 6 taken 12 times.
✗ Branch 7 not taken.
5593 if (!scale && ((type == AV_TX_DOUBLE_MDCT) || (type == AV_TX_DOUBLE_DCT) ||
920
2/4
✓ Branch 0 taken 12 times.
✗ Branch 1 not taken.
✗ Branch 2 not taken.
✓ Branch 3 taken 12 times.
12 (type == AV_TX_DOUBLE_DCT_I) || (type == AV_TX_DOUBLE_DST_I) ||
921 (type == AV_TX_DOUBLE_RDFT)))
922 scale = &default_scale_d;
923
3/8
✓ Branch 0 taken 12 times.
✓ Branch 1 taken 5581 times.
✗ Branch 2 not taken.
✓ Branch 3 taken 12 times.
✗ Branch 4 not taken.
✗ Branch 5 not taken.
✗ Branch 6 not taken.
✗ Branch 7 not taken.
5593 else if (!scale && !TYPE_IS(FFT, type))
924 scale = &default_scale_f;
925
926 5593 ret = ff_tx_init_subtx(&tmp, type, flags, NULL, len, inv, scale);
927
1/2
✗ Branch 0 not taken.
✓ Branch 1 taken 5593 times.
5593 if (ret < 0)
928 return ret;
929
930 5593 *ctx = &tmp.sub[0];
931 5593 *tx = tmp.fn[0];
932
933 #if !CONFIG_SMALL
934 5593 av_log(NULL, AV_LOG_DEBUG, "Transform tree:\n");
935 5593 print_tx_structure(*ctx, 0);
936 #endif
937
938 5593 return ret;
939 }
940