Line | Branch | Exec | Source |
---|---|---|---|
1 | /** | ||
2 | * Copyright (C) 2025 Niklas Haas | ||
3 | * | ||
4 | * This file is part of FFmpeg. | ||
5 | * | ||
6 | * FFmpeg is free software; you can redistribute it and/or | ||
7 | * modify it under the terms of the GNU Lesser General Public | ||
8 | * License as published by the Free Software Foundation; either | ||
9 | * version 2.1 of the License, or (at your option) any later version. | ||
10 | * | ||
11 | * FFmpeg is distributed in the hope that it will be useful, | ||
12 | * but WITHOUT ANY WARRANTY; without even the implied warranty of | ||
13 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU | ||
14 | * Lesser General Public License for more details. | ||
15 | * | ||
16 | * You should have received a copy of the GNU Lesser General Public | ||
17 | * License along with FFmpeg; if not, write to the Free Software | ||
18 | * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA | ||
19 | */ | ||
20 | |||
21 | #ifndef SWSCALE_OPS_BACKEND_H | ||
22 | #define SWSCALE_OPS_BACKEND_H | ||
23 | |||
24 | /** | ||
25 | * Helper macros for the C-based backend. | ||
26 | * | ||
27 | * To use these macros, the following macros and types must be defined: | ||
28 | * - PIXEL_TYPE should be one of SWS_PIXEL_* (FMT_CHAR and BIT_DEPTH must also be defined; they form the fn() name suffix) | ||
29 | * - pixel_t should be the type of pixels | ||
30 | * - block_t should be the type of blocks (groups of pixels) | ||
31 | */ | ||
32 | |||
33 | #include <assert.h> | ||
34 | #include <float.h> | ||
35 | #include <stdint.h> | ||
36 | |||
37 | #include "libavutil/attributes.h" | ||
38 | #include "libavutil/mem.h" | ||
39 | |||
40 | #include "ops_chain.h" | ||
41 | |||
42 | /** | ||
43 | * Internal context holding per-iteration execution data. The data pointers will be | ||
44 | * directly incremented by the corresponding read/write functions. | ||
45 | */ | ||
46 | typedef struct SwsOpIter { | ||
47 | const uint8_t *in[4]; /* input byte pointers; CALL_READ passes them on as const pixel_t * */ | ||
48 | uint8_t *out[4]; /* output byte pointers; CALL_WRITE passes them on as pixel_t * */ | ||
49 | int x, y; /* NOTE(review): presumably the current position; not used within this header - confirm */ | ||
50 | } SwsOpIter; | ||
51 | |||
52 | #ifdef __clang__ /* SWS_FUNC / SWS_LOOP: compiler-specific vectorization hints; clang is tested first since it also defines __GNUC__ */ | ||
53 | # define SWS_FUNC /* empty: no function-level attribute under clang */ | ||
54 | # define SWS_LOOP AV_PRAGMA(clang loop vectorize(assume_safety)) /* per-loop pragma, placed before a loop */ | ||
55 | #elif defined(__GNUC__) | ||
56 | # define SWS_FUNC __attribute__((optimize("tree-vectorize"))) /* function attribute requesting tree-vectorize */ | ||
57 | # define SWS_LOOP AV_PRAGMA(GCC ivdep) /* per-loop pragma, placed before a loop */ | ||
58 | #else /* any other compiler: both macros expand to nothing */ | ||
59 | # define SWS_FUNC | ||
60 | # define SWS_LOOP | ||
61 | #endif | ||
62 | |||
63 | /* Miscellaneous helpers: token pasting for per-format function names, and rational-to-pixel conversion */ | ||
64 | #define bitfn2(name, ext) name ## _ ## ext /* pastes name, an underscore and ext into one identifier */ | ||
65 | #define bitfn(name, ext) bitfn2(name, ext) /* extra level so that ext is macro-expanded before pasting */ | ||
66 | |||
67 | #define FN_SUFFIX AV_JOIN(FMT_CHAR, BIT_DEPTH) /* FMT_CHAR and BIT_DEPTH are not defined here; the includer must provide them */ | ||
68 | #define fn(name) bitfn(name, FN_SUFFIX) /* fn(foo) names the FN_SUFFIX-specific variant: foo_<FN_SUFFIX> */ | ||
69 | |||
70 | #define av_q2pixel(q) ((q).den ? (pixel_t) (q).num / (q).den : 0) /* num is cast to pixel_t before dividing; yields 0 when den is 0; q is evaluated more than once */ | ||
71 | |||
72 | /* Helper macros to make writing common function signatures less painful. __VA_ARGS__ follows a comma in each, so at least one extra parameter must be given. */ | ||
73 | #define DECL_FUNC(NAME, ...) /* always-inline helper fn(NAME): iter, impl, four blocks x/y/z/w, then the extra parameters */ \ | ||
74 | static av_always_inline void fn(NAME)(SwsOpIter *restrict iter, \ | ||
75 | const SwsOpImpl *restrict impl, \ | ||
76 | block_t x, block_t y, \ | ||
77 | block_t z, block_t w, \ | ||
78 | __VA_ARGS__) | ||
79 | |||
80 | #define DECL_READ(NAME, ...) /* like DECL_FUNC, but with four const pixel_t input pointers in place of the blocks */ \ | ||
81 | static av_always_inline void fn(NAME)(SwsOpIter *restrict iter, \ | ||
82 | const SwsOpImpl *restrict impl, \ | ||
83 | const pixel_t *restrict in0, \ | ||
84 | const pixel_t *restrict in1, \ | ||
85 | const pixel_t *restrict in2, \ | ||
86 | const pixel_t *restrict in3, \ | ||
87 | __VA_ARGS__) | ||
88 | |||
89 | #define DECL_WRITE(NAME, ...) /* DECL_FUNC with four pixel_t output pointers inserted before the extra parameters */ \ | ||
90 | DECL_FUNC(NAME, pixel_t *restrict out0, pixel_t *restrict out1, \ | ||
91 | pixel_t *restrict out2, pixel_t *restrict out3, \ | ||
92 | __VA_ARGS__) | ||
93 | |||
94 | /* Helper macros to call into functions declared with DECL_FUNC, DECL_READ and DECL_WRITE; they rely on `iter` and `impl` (and, for CALL, x/y/z/w) being in scope */ | ||
95 | #define CALL(FUNC, ...) /* forwards iter, impl and the blocks x, y, z, w, then the extra arguments */ \ | ||
96 | fn(FUNC)(iter, impl, x, y, z, w, __VA_ARGS__) | ||
97 | |||
98 | #define CALL_READ(FUNC, ...) /* passes iter->in[0..3] cast to const pixel_t *, then the extra arguments */ \ | ||
99 | fn(FUNC)(iter, impl, (const pixel_t *) iter->in[0], \ | ||
100 | (const pixel_t *) iter->in[1], \ | ||
101 | (const pixel_t *) iter->in[2], \ | ||
102 | (const pixel_t *) iter->in[3], __VA_ARGS__) | ||
103 | |||
104 | #define CALL_WRITE(FUNC, ...) /* CALL with iter->out[0..3] cast to pixel_t * inserted before the extra arguments */ \ | ||
105 | CALL(FUNC, (pixel_t *) iter->out[0], (pixel_t *) iter->out[1], \ | ||
106 | (pixel_t *) iter->out[2], (pixel_t *) iter->out[3], __VA_ARGS__) | ||
107 | |||
108 | /* Helper macro to declare a continuation function: static, marked SWS_FUNC, returning void and taking iter, impl and four blocks x/y/z/w */ | ||
109 | #define DECL_IMPL(NAME) \ | ||
110 | static SWS_FUNC void fn(NAME)(SwsOpIter *restrict iter, \ | ||
111 | const SwsOpImpl *restrict impl, \ | ||
112 | block_t x, block_t y, \ | ||
113 | block_t z, block_t w) \ | ||
114 | |||
115 | /* Helper macro to call into the next continuation with a given type: casts impl->cont to a function taking four TYPE blocks and calls it with iter, &impl[1] and the given arguments */ | ||
116 | #define CONTINUE(TYPE, ...) \ | ||
117 | ((void (*)(SwsOpIter *, const SwsOpImpl *, \ | ||
118 | TYPE x, TYPE y, TYPE z, TYPE w)) impl->cont) \ | ||
119 | (iter, &impl[1], __VA_ARGS__) | ||
120 | |||
121 | /* Helper macros for common op setup code. NOTE(review): who releases out->ptr is not visible in this header - confirm against the caller. */ | ||
122 | #define DECL_SETUP(NAME) /* signature of a setup function fn(NAME): takes the op and the SwsOpPriv to fill, returns int */ \ | ||
123 | static int fn(NAME)(const SwsOp *op, SwsOpPriv *out) | ||
124 | |||
125 | #define SETUP_MEMDUP(c) ff_setup_memdup(&(c), sizeof(c), out) /* duplicates the object c; expects a variable named `out` in scope */ | ||
126 | 273 | static inline int ff_setup_memdup(const void *c, size_t size, SwsOpPriv *out) /* stores an av_memdup() copy of the size bytes at c in out->ptr */ | |
127 | { | ||
128 | 273 | out->ptr = av_memdup(c, size); | |
129 |
1/2✓ Branch 0 taken 273 times.
✗ Branch 1 not taken.
|
273 | return out->ptr ? 0 : AVERROR(ENOMEM); /* 0 on success; a NULL result from av_memdup is reported as ENOMEM */ |
130 | } | ||
131 | |||
132 | /* Helper macro for declaring op table entries: defines a static const SwsOpEntry named fn(op_NAME) whose .func is fn(NAME) cast to SwsFuncPtr and whose .type is PIXEL_TYPE; further designated initializers are passed via __VA_ARGS__ */ | ||
133 | #define DECL_ENTRY(NAME, ...) \ | ||
134 | static const SwsOpEntry fn(op_##NAME) = { \ | ||
135 | .func = (SwsFuncPtr) fn(NAME), \ | ||
136 | .type = PIXEL_TYPE, \ | ||
137 | __VA_ARGS__ \ | ||
138 | } | ||
139 | |||
140 | /* Helpers to define functions for common subsets of components; X/Y/Z/W are 0/1 flags, one per component */ | ||
141 | #define DECL_PATTERN(NAME) /* DECL_FUNC helper that takes the four flags as const bool parameters */ \ | ||
142 | DECL_FUNC(NAME, const bool X, const bool Y, const bool Z, const bool W) | ||
143 | |||
144 | #define WRAP_PATTERN(FUNC, X, Y, Z, W, ...) /* defines continuation FUNC_XYZW calling FUNC with constant flags, plus its op entry with .unused set to the negated flags */ \ | ||
145 | DECL_IMPL(FUNC##_##X##Y##Z##W) \ | ||
146 | { \ | ||
147 | CALL(FUNC, X, Y, Z, W); \ | ||
148 | } \ | ||
149 | \ | ||
150 | DECL_ENTRY(FUNC##_##X##Y##Z##W, \ | ||
151 | .unused = { !X, !Y, !Z, !W }, \ | ||
152 | __VA_ARGS__ \ | ||
153 | ) | ||
154 | |||
155 | #define WRAP_COMMON_PATTERNS(FUNC, ...) /* instantiates WRAP_PATTERN for the flag sets 1000, 1001, 1110 and 1111 */ \ | ||
156 | WRAP_PATTERN(FUNC, 1, 0, 0, 0, __VA_ARGS__); \ | ||
157 | WRAP_PATTERN(FUNC, 1, 0, 0, 1, __VA_ARGS__); \ | ||
158 | WRAP_PATTERN(FUNC, 1, 1, 1, 0, __VA_ARGS__); \ | ||
159 | WRAP_PATTERN(FUNC, 1, 1, 1, 1, __VA_ARGS__) | ||
160 | |||
161 | #define REF_COMMON_PATTERNS(NAME) /* comma-separated addresses of the four entries defined by WRAP_COMMON_PATTERNS(NAME, ...) */ \ | ||
162 | &fn(op_##NAME##_1000), \ | ||
163 | &fn(op_##NAME##_1001), \ | ||
164 | &fn(op_##NAME##_1110), \ | ||
165 | &fn(op_##NAME##_1111) | ||
166 | |||
167 | #endif | ||
168 |