Line | Branch | Exec | Source |
---|---|---|---|
1 | /* | ||
2 | * RV40 decoder motion compensation functions | ||
3 | * Copyright (c) 2008 Konstantin Shishkov | ||
4 | * | ||
5 | * This file is part of FFmpeg. | ||
6 | * | ||
7 | * FFmpeg is free software; you can redistribute it and/or | ||
8 | * modify it under the terms of the GNU Lesser General Public | ||
9 | * License as published by the Free Software Foundation; either | ||
10 | * version 2.1 of the License, or (at your option) any later version. | ||
11 | * | ||
12 | * FFmpeg is distributed in the hope that it will be useful, | ||
13 | * but WITHOUT ANY WARRANTY; without even the implied warranty of | ||
14 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU | ||
15 | * Lesser General Public License for more details. | ||
16 | * | ||
17 | * You should have received a copy of the GNU Lesser General Public | ||
18 | * License along with FFmpeg; if not, write to the Free Software | ||
19 | * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA | ||
20 | */ | ||
21 | |||
22 | /** | ||
23 | * @file | ||
24 | * RV40 decoder motion compensation functions | ||
25 | */ | ||
26 | |||
27 | #include "libavutil/common.h" | ||
28 | #include "libavutil/intreadwrite.h" | ||
29 | #include "h264qpel.h" | ||
30 | #include "mathops.h" | ||
31 | #include "pixels.h" | ||
32 | #include "rnd_avg.h" | ||
33 | #include "rv34dsp.h" | ||
34 | #include "libavutil/avassert.h" | ||
35 | |||
36 | #define RV40_LOWPASS(OPNAME, OP) \ | ||
37 | static void OPNAME ## rv40_qpel8_h_lowpass(uint8_t *dst, const uint8_t *src, int dstStride, int srcStride,\ | ||
38 | const int h, const int C1, const int C2, const int SHIFT){\ | ||
39 | const uint8_t *cm = ff_crop_tab + MAX_NEG_CROP;\ | ||
40 | int i;\ | ||
41 | for(i = 0; i < h; i++)\ | ||
42 | {\ | ||
43 | OP(dst[0], (src[-2] + src[ 3] - 5*(src[-1]+src[2]) + src[0]*C1 + src[1]*C2 + (1<<(SHIFT-1))) >> SHIFT);\ | ||
44 | OP(dst[1], (src[-1] + src[ 4] - 5*(src[ 0]+src[3]) + src[1]*C1 + src[2]*C2 + (1<<(SHIFT-1))) >> SHIFT);\ | ||
45 | OP(dst[2], (src[ 0] + src[ 5] - 5*(src[ 1]+src[4]) + src[2]*C1 + src[3]*C2 + (1<<(SHIFT-1))) >> SHIFT);\ | ||
46 | OP(dst[3], (src[ 1] + src[ 6] - 5*(src[ 2]+src[5]) + src[3]*C1 + src[4]*C2 + (1<<(SHIFT-1))) >> SHIFT);\ | ||
47 | OP(dst[4], (src[ 2] + src[ 7] - 5*(src[ 3]+src[6]) + src[4]*C1 + src[5]*C2 + (1<<(SHIFT-1))) >> SHIFT);\ | ||
48 | OP(dst[5], (src[ 3] + src[ 8] - 5*(src[ 4]+src[7]) + src[5]*C1 + src[6]*C2 + (1<<(SHIFT-1))) >> SHIFT);\ | ||
49 | OP(dst[6], (src[ 4] + src[ 9] - 5*(src[ 5]+src[8]) + src[6]*C1 + src[7]*C2 + (1<<(SHIFT-1))) >> SHIFT);\ | ||
50 | OP(dst[7], (src[ 5] + src[10] - 5*(src[ 6]+src[9]) + src[7]*C1 + src[8]*C2 + (1<<(SHIFT-1))) >> SHIFT);\ | ||
51 | dst += dstStride;\ | ||
52 | src += srcStride;\ | ||
53 | }\ | ||
54 | }\ | ||
55 | \ | ||
56 | static void OPNAME ## rv40_qpel8_v_lowpass(uint8_t *dst, const uint8_t *src, int dstStride, int srcStride,\ | ||
57 | const int w, const int C1, const int C2, const int SHIFT){\ | ||
58 | const uint8_t *cm = ff_crop_tab + MAX_NEG_CROP;\ | ||
59 | int i;\ | ||
60 | for(i = 0; i < w; i++)\ | ||
61 | {\ | ||
62 | const int srcB = src[-2*srcStride];\ | ||
63 | const int srcA = src[-1*srcStride];\ | ||
64 | const int src0 = src[0 *srcStride];\ | ||
65 | const int src1 = src[1 *srcStride];\ | ||
66 | const int src2 = src[2 *srcStride];\ | ||
67 | const int src3 = src[3 *srcStride];\ | ||
68 | const int src4 = src[4 *srcStride];\ | ||
69 | const int src5 = src[5 *srcStride];\ | ||
70 | const int src6 = src[6 *srcStride];\ | ||
71 | const int src7 = src[7 *srcStride];\ | ||
72 | const int src8 = src[8 *srcStride];\ | ||
73 | const int src9 = src[9 *srcStride];\ | ||
74 | const int src10 = src[10*srcStride];\ | ||
75 | OP(dst[0*dstStride], (srcB + src3 - 5*(srcA+src2) + src0*C1 + src1*C2 + (1<<(SHIFT-1))) >> SHIFT);\ | ||
76 | OP(dst[1*dstStride], (srcA + src4 - 5*(src0+src3) + src1*C1 + src2*C2 + (1<<(SHIFT-1))) >> SHIFT);\ | ||
77 | OP(dst[2*dstStride], (src0 + src5 - 5*(src1+src4) + src2*C1 + src3*C2 + (1<<(SHIFT-1))) >> SHIFT);\ | ||
78 | OP(dst[3*dstStride], (src1 + src6 - 5*(src2+src5) + src3*C1 + src4*C2 + (1<<(SHIFT-1))) >> SHIFT);\ | ||
79 | OP(dst[4*dstStride], (src2 + src7 - 5*(src3+src6) + src4*C1 + src5*C2 + (1<<(SHIFT-1))) >> SHIFT);\ | ||
80 | OP(dst[5*dstStride], (src3 + src8 - 5*(src4+src7) + src5*C1 + src6*C2 + (1<<(SHIFT-1))) >> SHIFT);\ | ||
81 | OP(dst[6*dstStride], (src4 + src9 - 5*(src5+src8) + src6*C1 + src7*C2 + (1<<(SHIFT-1))) >> SHIFT);\ | ||
82 | OP(dst[7*dstStride], (src5 + src10 - 5*(src6+src9) + src7*C1 + src8*C2 + (1<<(SHIFT-1))) >> SHIFT);\ | ||
83 | dst++;\ | ||
84 | src++;\ | ||
85 | }\ | ||
86 | }\ | ||
87 | \ | ||
88 | static void OPNAME ## rv40_qpel16_v_lowpass(uint8_t *dst, const uint8_t *src, int dstStride, int srcStride,\ | ||
89 | const int w, const int C1, const int C2, const int SHIFT){\ | ||
90 | OPNAME ## rv40_qpel8_v_lowpass(dst , src , dstStride, srcStride, 8, C1, C2, SHIFT);\ | ||
91 | OPNAME ## rv40_qpel8_v_lowpass(dst+8, src+8, dstStride, srcStride, 8, C1, C2, SHIFT);\ | ||
92 | src += 8*srcStride;\ | ||
93 | dst += 8*dstStride;\ | ||
94 | OPNAME ## rv40_qpel8_v_lowpass(dst , src , dstStride, srcStride, w-8, C1, C2, SHIFT);\ | ||
95 | OPNAME ## rv40_qpel8_v_lowpass(dst+8, src+8, dstStride, srcStride, w-8, C1, C2, SHIFT);\ | ||
96 | }\ | ||
97 | \ | ||
98 | static void OPNAME ## rv40_qpel16_h_lowpass(uint8_t *dst, const uint8_t *src, int dstStride, int srcStride,\ | ||
99 | const int h, const int C1, const int C2, const int SHIFT){\ | ||
100 | OPNAME ## rv40_qpel8_h_lowpass(dst , src , dstStride, srcStride, 8, C1, C2, SHIFT);\ | ||
101 | OPNAME ## rv40_qpel8_h_lowpass(dst+8, src+8, dstStride, srcStride, 8, C1, C2, SHIFT);\ | ||
102 | src += 8*srcStride;\ | ||
103 | dst += 8*dstStride;\ | ||
104 | OPNAME ## rv40_qpel8_h_lowpass(dst , src , dstStride, srcStride, h-8, C1, C2, SHIFT);\ | ||
105 | OPNAME ## rv40_qpel8_h_lowpass(dst+8, src+8, dstStride, srcStride, h-8, C1, C2, SHIFT);\ | ||
106 | }\ | ||
107 | \ | ||
108 | |||
109 | #define RV40_MC(OPNAME, SIZE) \ | ||
110 | static void OPNAME ## rv40_qpel ## SIZE ## _mc10_c(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)\ | ||
111 | {\ | ||
112 | OPNAME ## rv40_qpel ## SIZE ## _h_lowpass(dst, src, stride, stride, SIZE, 52, 20, 6);\ | ||
113 | }\ | ||
114 | \ | ||
115 | static void OPNAME ## rv40_qpel ## SIZE ## _mc30_c(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)\ | ||
116 | {\ | ||
117 | OPNAME ## rv40_qpel ## SIZE ## _h_lowpass(dst, src, stride, stride, SIZE, 20, 52, 6);\ | ||
118 | }\ | ||
119 | \ | ||
120 | static void OPNAME ## rv40_qpel ## SIZE ## _mc01_c(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)\ | ||
121 | {\ | ||
122 | OPNAME ## rv40_qpel ## SIZE ## _v_lowpass(dst, src, stride, stride, SIZE, 52, 20, 6);\ | ||
123 | }\ | ||
124 | \ | ||
125 | static void OPNAME ## rv40_qpel ## SIZE ## _mc11_c(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)\ | ||
126 | {\ | ||
127 | uint8_t full[SIZE*(SIZE+5)];\ | ||
128 | uint8_t * const full_mid = full + SIZE*2;\ | ||
129 | put_rv40_qpel ## SIZE ## _h_lowpass(full, src - 2*stride, SIZE, stride, SIZE+5, 52, 20, 6);\ | ||
130 | OPNAME ## rv40_qpel ## SIZE ## _v_lowpass(dst, full_mid, stride, SIZE, SIZE, 52, 20, 6);\ | ||
131 | }\ | ||
132 | \ | ||
133 | static void OPNAME ## rv40_qpel ## SIZE ## _mc21_c(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)\ | ||
134 | {\ | ||
135 | uint8_t full[SIZE*(SIZE+5)];\ | ||
136 | uint8_t * const full_mid = full + SIZE*2;\ | ||
137 | put_rv40_qpel ## SIZE ## _h_lowpass(full, src - 2*stride, SIZE, stride, SIZE+5, 20, 20, 5);\ | ||
138 | OPNAME ## rv40_qpel ## SIZE ## _v_lowpass(dst, full_mid, stride, SIZE, SIZE, 52, 20, 6);\ | ||
139 | }\ | ||
140 | \ | ||
141 | static void OPNAME ## rv40_qpel ## SIZE ## _mc31_c(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)\ | ||
142 | {\ | ||
143 | uint8_t full[SIZE*(SIZE+5)];\ | ||
144 | uint8_t * const full_mid = full + SIZE*2;\ | ||
145 | put_rv40_qpel ## SIZE ## _h_lowpass(full, src - 2*stride, SIZE, stride, SIZE+5, 20, 52, 6);\ | ||
146 | OPNAME ## rv40_qpel ## SIZE ## _v_lowpass(dst, full_mid, stride, SIZE, SIZE, 52, 20, 6);\ | ||
147 | }\ | ||
148 | \ | ||
149 | static void OPNAME ## rv40_qpel ## SIZE ## _mc12_c(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)\ | ||
150 | {\ | ||
151 | uint8_t full[SIZE*(SIZE+5)];\ | ||
152 | uint8_t * const full_mid = full + SIZE*2;\ | ||
153 | put_rv40_qpel ## SIZE ## _h_lowpass(full, src - 2*stride, SIZE, stride, SIZE+5, 52, 20, 6);\ | ||
154 | OPNAME ## rv40_qpel ## SIZE ## _v_lowpass(dst, full_mid, stride, SIZE, SIZE, 20, 20, 5);\ | ||
155 | }\ | ||
156 | \ | ||
157 | static void OPNAME ## rv40_qpel ## SIZE ## _mc22_c(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)\ | ||
158 | {\ | ||
159 | uint8_t full[SIZE*(SIZE+5)];\ | ||
160 | uint8_t * const full_mid = full + SIZE*2;\ | ||
161 | put_rv40_qpel ## SIZE ## _h_lowpass(full, src - 2*stride, SIZE, stride, SIZE+5, 20, 20, 5);\ | ||
162 | OPNAME ## rv40_qpel ## SIZE ## _v_lowpass(dst, full_mid, stride, SIZE, SIZE, 20, 20, 5);\ | ||
163 | }\ | ||
164 | \ | ||
165 | static void OPNAME ## rv40_qpel ## SIZE ## _mc32_c(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)\ | ||
166 | {\ | ||
167 | uint8_t full[SIZE*(SIZE+5)];\ | ||
168 | uint8_t * const full_mid = full + SIZE*2;\ | ||
169 | put_rv40_qpel ## SIZE ## _h_lowpass(full, src - 2*stride, SIZE, stride, SIZE+5, 20, 52, 6);\ | ||
170 | OPNAME ## rv40_qpel ## SIZE ## _v_lowpass(dst, full_mid, stride, SIZE, SIZE, 20, 20, 5);\ | ||
171 | }\ | ||
172 | \ | ||
173 | static void OPNAME ## rv40_qpel ## SIZE ## _mc03_c(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)\ | ||
174 | {\ | ||
175 | OPNAME ## rv40_qpel ## SIZE ## _v_lowpass(dst, src, stride, stride, SIZE, 20, 52, 6);\ | ||
176 | }\ | ||
177 | \ | ||
178 | static void OPNAME ## rv40_qpel ## SIZE ## _mc13_c(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)\ | ||
179 | {\ | ||
180 | uint8_t full[SIZE*(SIZE+5)];\ | ||
181 | uint8_t * const full_mid = full + SIZE*2;\ | ||
182 | put_rv40_qpel ## SIZE ## _h_lowpass(full, src - 2*stride, SIZE, stride, SIZE+5, 52, 20, 6);\ | ||
183 | OPNAME ## rv40_qpel ## SIZE ## _v_lowpass(dst, full_mid, stride, SIZE, SIZE, 20, 52, 6);\ | ||
184 | }\ | ||
185 | \ | ||
186 | static void OPNAME ## rv40_qpel ## SIZE ## _mc23_c(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)\ | ||
187 | {\ | ||
188 | uint8_t full[SIZE*(SIZE+5)];\ | ||
189 | uint8_t * const full_mid = full + SIZE*2;\ | ||
190 | put_rv40_qpel ## SIZE ## _h_lowpass(full, src - 2*stride, SIZE, stride, SIZE+5, 20, 20, 5);\ | ||
191 | OPNAME ## rv40_qpel ## SIZE ## _v_lowpass(dst, full_mid, stride, SIZE, SIZE, 20, 52, 6);\ | ||
192 | }\ | ||
193 | \ | ||
194 | |||
195 | #define op_avg(a, b) a = (((a)+cm[b]+1)>>1) | ||
196 | #define op_put(a, b) a = cm[b] | ||
197 | |||
198 |
2/2✓ Branch 0 taken 2368794 times.
✓ Branch 1 taken 253673 times.
|
5323912 | RV40_LOWPASS(put_ , op_put) |
199 |
2/2✓ Branch 0 taken 122688 times.
✓ Branch 1 taken 15336 times.
|
283716 | RV40_LOWPASS(avg_ , op_avg) |
200 | |||
201 | #undef op_avg | ||
202 | #undef op_put | ||
203 | |||
204 | 119314 | RV40_MC(put_, 8) | |
205 | 47156 | RV40_MC(put_, 16) | |
206 | ✗ | RV40_MC(avg_, 8) | |
207 | 7668 | RV40_MC(avg_, 16) | |
208 | |||
209 | #define PIXOP2(OPNAME, OP) \ | ||
210 | static inline void OPNAME ## _pixels8_xy2_8_c(uint8_t *block, \ | ||
211 | const uint8_t *pixels, \ | ||
212 | ptrdiff_t line_size, \ | ||
213 | int h) \ | ||
214 | { \ | ||
215 | /* FIXME HIGH BIT DEPTH */ \ | ||
216 | int j; \ | ||
217 | \ | ||
218 | for (j = 0; j < 2; j++) { \ | ||
219 | int i; \ | ||
220 | const uint32_t a = AV_RN32(pixels); \ | ||
221 | const uint32_t b = AV_RN32(pixels + 1); \ | ||
222 | uint32_t l0 = (a & 0x03030303UL) + \ | ||
223 | (b & 0x03030303UL) + \ | ||
224 | 0x02020202UL; \ | ||
225 | uint32_t h0 = ((a & 0xFCFCFCFCUL) >> 2) + \ | ||
226 | ((b & 0xFCFCFCFCUL) >> 2); \ | ||
227 | uint32_t l1, h1; \ | ||
228 | \ | ||
229 | pixels += line_size; \ | ||
230 | for (i = 0; i < h; i += 2) { \ | ||
231 | uint32_t a = AV_RN32(pixels); \ | ||
232 | uint32_t b = AV_RN32(pixels + 1); \ | ||
233 | l1 = (a & 0x03030303UL) + \ | ||
234 | (b & 0x03030303UL); \ | ||
235 | h1 = ((a & 0xFCFCFCFCUL) >> 2) + \ | ||
236 | ((b & 0xFCFCFCFCUL) >> 2); \ | ||
237 | OP(*((uint32_t *) block), \ | ||
238 | h0 + h1 + (((l0 + l1) >> 2) & 0x0F0F0F0FUL)); \ | ||
239 | pixels += line_size; \ | ||
240 | block += line_size; \ | ||
241 | a = AV_RN32(pixels); \ | ||
242 | b = AV_RN32(pixels + 1); \ | ||
243 | l0 = (a & 0x03030303UL) + \ | ||
244 | (b & 0x03030303UL) + \ | ||
245 | 0x02020202UL; \ | ||
246 | h0 = ((a & 0xFCFCFCFCUL) >> 2) + \ | ||
247 | ((b & 0xFCFCFCFCUL) >> 2); \ | ||
248 | OP(*((uint32_t *) block), \ | ||
249 | h0 + h1 + (((l0 + l1) >> 2) & 0x0F0F0F0FUL)); \ | ||
250 | pixels += line_size; \ | ||
251 | block += line_size; \ | ||
252 | } \ | ||
253 | pixels += 4 - line_size * (h + 1); \ | ||
254 | block += 4 - line_size * h; \ | ||
255 | } \ | ||
256 | } \ | ||
257 | \ | ||
258 | CALL_2X_PIXELS(OPNAME ## _pixels16_xy2_8_c, \ | ||
259 | OPNAME ## _pixels8_xy2_8_c, \ | ||
260 | 8) \ | ||
261 | |||
262 | #define op_avg(a, b) a = rnd_avg32(a, b) | ||
263 | #define op_put(a, b) a = b | ||
264 |
4/4✓ Branch 2 taken 155008 times.
✓ Branch 3 taken 19376 times.
✓ Branch 4 taken 19376 times.
✓ Branch 5 taken 9688 times.
|
377832 | PIXOP2(avg, op_avg) |
265 |
4/4✓ Branch 0 taken 808424 times.
✓ Branch 1 taken 118070 times.
✓ Branch 2 taken 118070 times.
✓ Branch 3 taken 59035 times.
|
2013076 | PIXOP2(put, op_put) |
266 | #undef op_avg | ||
267 | #undef op_put | ||
268 | |||
269 | 21009 | static void put_rv40_qpel16_mc33_c(uint8_t *dst, const uint8_t *src, ptrdiff_t stride) | |
270 | { | ||
271 | 21009 | put_pixels16_xy2_8_c(dst, src, stride, 16); | |
272 | 21009 | } | |
273 | 4844 | static void avg_rv40_qpel16_mc33_c(uint8_t *dst, const uint8_t *src, ptrdiff_t stride) | |
274 | { | ||
275 | 4844 | avg_pixels16_xy2_8_c(dst, src, stride, 16); | |
276 | 4844 | } | |
277 | 17017 | static void put_rv40_qpel8_mc33_c(uint8_t *dst, const uint8_t *src, ptrdiff_t stride) | |
278 | { | ||
279 | 17017 | put_pixels8_xy2_8_c(dst, src, stride, 8); | |
280 | 17017 | } | |
281 | ✗ | static void avg_rv40_qpel8_mc33_c(uint8_t *dst, const uint8_t *src, ptrdiff_t stride) | |
282 | { | ||
283 | ✗ | avg_pixels8_xy2_8_c(dst, src, stride, 8); | |
284 | ✗ | } | |
285 | |||
286 | static const int rv40_bias[4][4] = { | ||
287 | { 0, 16, 32, 16 }, | ||
288 | { 32, 28, 32, 28 }, | ||
289 | { 0, 32, 16, 32 }, | ||
290 | { 32, 28, 32, 28 } | ||
291 | }; | ||
292 | |||
293 | #define RV40_CHROMA_MC(OPNAME, OP)\ | ||
294 | static void OPNAME ## rv40_chroma_mc4_c(uint8_t *dst /*align 8*/,\ | ||
295 | const uint8_t *src /*align 1*/,\ | ||
296 | ptrdiff_t stride, int h, int x, int y)\ | ||
297 | {\ | ||
298 | const int A = (8-x) * (8-y);\ | ||
299 | const int B = ( x) * (8-y);\ | ||
300 | const int C = (8-x) * ( y);\ | ||
301 | const int D = ( x) * ( y);\ | ||
302 | int i;\ | ||
303 | int bias = rv40_bias[y>>1][x>>1];\ | ||
304 | \ | ||
305 | av_assert2(x<8 && y<8 && x>=0 && y>=0);\ | ||
306 | \ | ||
307 | if(D){\ | ||
308 | for(i = 0; i < h; i++){\ | ||
309 | OP(dst[0], (A*src[0] + B*src[1] + C*src[stride+0] + D*src[stride+1] + bias));\ | ||
310 | OP(dst[1], (A*src[1] + B*src[2] + C*src[stride+1] + D*src[stride+2] + bias));\ | ||
311 | OP(dst[2], (A*src[2] + B*src[3] + C*src[stride+2] + D*src[stride+3] + bias));\ | ||
312 | OP(dst[3], (A*src[3] + B*src[4] + C*src[stride+3] + D*src[stride+4] + bias));\ | ||
313 | dst += stride;\ | ||
314 | src += stride;\ | ||
315 | }\ | ||
316 | }else{\ | ||
317 | const int E = B + C;\ | ||
318 | const ptrdiff_t step = C ? stride : 1;\ | ||
319 | for(i = 0; i < h; i++){\ | ||
320 | OP(dst[0], (A*src[0] + E*src[step+0] + bias));\ | ||
321 | OP(dst[1], (A*src[1] + E*src[step+1] + bias));\ | ||
322 | OP(dst[2], (A*src[2] + E*src[step+2] + bias));\ | ||
323 | OP(dst[3], (A*src[3] + E*src[step+3] + bias));\ | ||
324 | dst += stride;\ | ||
325 | src += stride;\ | ||
326 | }\ | ||
327 | }\ | ||
328 | }\ | ||
329 | \ | ||
330 | static void OPNAME ## rv40_chroma_mc8_c(uint8_t *dst/*align 8*/,\ | ||
331 | const uint8_t *src/*align 1*/,\ | ||
332 | ptrdiff_t stride, int h, int x, int y)\ | ||
333 | {\ | ||
334 | const int A = (8-x) * (8-y);\ | ||
335 | const int B = ( x) * (8-y);\ | ||
336 | const int C = (8-x) * ( y);\ | ||
337 | const int D = ( x) * ( y);\ | ||
338 | int i;\ | ||
339 | int bias = rv40_bias[y>>1][x>>1];\ | ||
340 | \ | ||
341 | av_assert2(x<8 && y<8 && x>=0 && y>=0);\ | ||
342 | \ | ||
343 | if(D){\ | ||
344 | for(i = 0; i < h; i++){\ | ||
345 | OP(dst[0], (A*src[0] + B*src[1] + C*src[stride+0] + D*src[stride+1] + bias));\ | ||
346 | OP(dst[1], (A*src[1] + B*src[2] + C*src[stride+1] + D*src[stride+2] + bias));\ | ||
347 | OP(dst[2], (A*src[2] + B*src[3] + C*src[stride+2] + D*src[stride+3] + bias));\ | ||
348 | OP(dst[3], (A*src[3] + B*src[4] + C*src[stride+3] + D*src[stride+4] + bias));\ | ||
349 | OP(dst[4], (A*src[4] + B*src[5] + C*src[stride+4] + D*src[stride+5] + bias));\ | ||
350 | OP(dst[5], (A*src[5] + B*src[6] + C*src[stride+5] + D*src[stride+6] + bias));\ | ||
351 | OP(dst[6], (A*src[6] + B*src[7] + C*src[stride+6] + D*src[stride+7] + bias));\ | ||
352 | OP(dst[7], (A*src[7] + B*src[8] + C*src[stride+7] + D*src[stride+8] + bias));\ | ||
353 | dst += stride;\ | ||
354 | src += stride;\ | ||
355 | }\ | ||
356 | }else{\ | ||
357 | const int E = B + C;\ | ||
358 | const ptrdiff_t step = C ? stride : 1;\ | ||
359 | for(i = 0; i < h; i++){\ | ||
360 | OP(dst[0], (A*src[0] + E*src[step+0] + bias));\ | ||
361 | OP(dst[1], (A*src[1] + E*src[step+1] + bias));\ | ||
362 | OP(dst[2], (A*src[2] + E*src[step+2] + bias));\ | ||
363 | OP(dst[3], (A*src[3] + E*src[step+3] + bias));\ | ||
364 | OP(dst[4], (A*src[4] + E*src[step+4] + bias));\ | ||
365 | OP(dst[5], (A*src[5] + E*src[step+5] + bias));\ | ||
366 | OP(dst[6], (A*src[6] + E*src[step+6] + bias));\ | ||
367 | OP(dst[7], (A*src[7] + E*src[step+7] + bias));\ | ||
368 | dst += stride;\ | ||
369 | src += stride;\ | ||
370 | }\ | ||
371 | }\ | ||
372 | } | ||
373 | |||
374 | #define op_avg(a, b) a = (((a)+((b)>>6)+1)>>1) | ||
375 | #define op_put(a, b) a = ((b)>>6) | ||
376 | |||
377 |
8/8✓ Branch 0 taken 131614 times.
✓ Branch 1 taken 623566 times.
✓ Branch 2 taken 736016 times.
✓ Branch 3 taken 131614 times.
✓ Branch 4 taken 52374 times.
✓ Branch 5 taken 571192 times.
✓ Branch 6 taken 4652624 times.
✓ Branch 7 taken 623566 times.
|
12287640 | RV40_CHROMA_MC(put_, op_put) |
378 |
8/8✓ Branch 0 taken 7550 times.
✓ Branch 1 taken 11092 times.
✓ Branch 2 taken 60448 times.
✓ Branch 3 taken 7550 times.
✓ Branch 4 taken 2808 times.
✓ Branch 5 taken 8284 times.
✓ Branch 6 taken 88880 times.
✓ Branch 7 taken 11092 times.
|
335940 | RV40_CHROMA_MC(avg_, op_avg) |
379 | |||
380 | #define RV40_WEIGHT_FUNC(size) \ | ||
381 | static void rv40_weight_func_rnd_ ## size (uint8_t *dst, uint8_t *src1, uint8_t *src2, int w1, int w2, ptrdiff_t stride)\ | ||
382 | {\ | ||
383 | int i, j;\ | ||
384 | \ | ||
385 | for (j = 0; j < size; j++) {\ | ||
386 | for (i = 0; i < size; i++)\ | ||
387 | dst[i] = ((((unsigned)w2 * src1[i]) >> 9) + (((unsigned)w1 * src2[i]) >> 9) + 0x10) >> 5;\ | ||
388 | src1 += stride;\ | ||
389 | src2 += stride;\ | ||
390 | dst += stride;\ | ||
391 | }\ | ||
392 | }\ | ||
393 | static void rv40_weight_func_nornd_ ## size (uint8_t *dst, uint8_t *src1, uint8_t *src2, int w1, int w2, ptrdiff_t stride)\ | ||
394 | {\ | ||
395 | int i, j;\ | ||
396 | \ | ||
397 | for (j = 0; j < size; j++) {\ | ||
398 | for (i = 0; i < size; i++)\ | ||
399 | dst[i] = ((unsigned)w2 * src1[i] + (unsigned)w1 * src2[i] + 0x10) >> 5;\ | ||
400 | src1 += stride;\ | ||
401 | src2 += stride;\ | ||
402 | dst += stride;\ | ||
403 | }\ | ||
404 | } | ||
405 | |||
406 |
4/4✓ Branch 0 taken 29802752 times.
✓ Branch 1 taken 1862672 times.
✓ Branch 2 taken 1862672 times.
✓ Branch 3 taken 116417 times.
|
63563682 | RV40_WEIGHT_FUNC(16) |
407 |
4/4✓ Branch 0 taken 14901376 times.
✓ Branch 1 taken 1862672 times.
✓ Branch 2 taken 1862672 times.
✓ Branch 3 taken 232834 times.
|
33993764 | RV40_WEIGHT_FUNC(8) |
408 | |||
409 | /** | ||
410 | * dither values for deblocking filter - left/top values | ||
411 | */ | ||
412 | static const uint8_t rv40_dither_l[16] = { | ||
413 | 0x40, 0x50, 0x20, 0x60, 0x30, 0x50, 0x40, 0x30, | ||
414 | 0x50, 0x40, 0x50, 0x30, 0x60, 0x20, 0x50, 0x40 | ||
415 | }; | ||
416 | |||
417 | /** | ||
418 | * dither values for deblocking filter - right/bottom values | ||
419 | */ | ||
420 | static const uint8_t rv40_dither_r[16] = { | ||
421 | 0x40, 0x30, 0x60, 0x20, 0x50, 0x30, 0x30, 0x40, | ||
422 | 0x40, 0x40, 0x50, 0x30, 0x20, 0x60, 0x30, 0x40 | ||
423 | }; | ||
424 | |||
425 | #define CLIP_SYMM(a, b) av_clip(a, -(b), b) | ||
426 | /** | ||
427 | * weaker deblocking very similar to the one described in 4.4.2 of JVT-A003r1 | ||
428 | */ | ||
429 | 1493706 | static av_always_inline void rv40_weak_loop_filter(uint8_t *src, | |
430 | const int step, | ||
431 | const ptrdiff_t stride, | ||
432 | const int filter_p1, | ||
433 | const int filter_q1, | ||
434 | const int alpha, | ||
435 | const int beta, | ||
436 | const int lim_p0q0, | ||
437 | const int lim_q1, | ||
438 | const int lim_p1) | ||
439 | { | ||
440 | 1493706 | const uint8_t *cm = ff_crop_tab + MAX_NEG_CROP; | |
441 | int i, t, u, diff; | ||
442 | |||
443 |
2/2✓ Branch 0 taken 5974824 times.
✓ Branch 1 taken 1493706 times.
|
7468530 | for (i = 0; i < 4; i++, src += stride) { |
444 | 5974824 | int diff_p1p0 = src[-2*step] - src[-1*step]; | |
445 | 5974824 | int diff_q1q0 = src[ 1*step] - src[ 0*step]; | |
446 | 5974824 | int diff_p1p2 = src[-2*step] - src[-3*step]; | |
447 | 5974824 | int diff_q1q2 = src[ 1*step] - src[ 2*step]; | |
448 | |||
449 | 5974824 | t = src[0*step] - src[-1*step]; | |
450 |
2/2✓ Branch 0 taken 1310272 times.
✓ Branch 1 taken 4664552 times.
|
5974824 | if (!t) |
451 | 1310272 | continue; | |
452 | |||
453 | 4664552 | u = (alpha * FFABS(t)) >> 7; | |
454 |
6/6✓ Branch 0 taken 4208918 times.
✓ Branch 1 taken 455634 times.
✓ Branch 2 taken 3751971 times.
✓ Branch 3 taken 456947 times.
✓ Branch 4 taken 515980 times.
✓ Branch 5 taken 4148572 times.
|
4664552 | if (u > 3 - (filter_p1 && filter_q1)) |
455 | 515980 | continue; | |
456 | |||
457 | 4148572 | t *= 1 << 2; | |
458 |
4/4✓ Branch 0 taken 3793325 times.
✓ Branch 1 taken 355247 times.
✓ Branch 2 taken 3442555 times.
✓ Branch 3 taken 350770 times.
|
4148572 | if (filter_p1 && filter_q1) |
459 | 3442555 | t += src[-2*step] - src[1*step]; | |
460 | |||
461 | 4148572 | diff = CLIP_SYMM((t + 4) >> 3, lim_p0q0); | |
462 | 4148572 | src[-1*step] = cm[src[-1*step] + diff]; | |
463 | 4148572 | src[ 0*step] = cm[src[ 0*step] - diff]; | |
464 | |||
465 |
4/4✓ Branch 0 taken 3793325 times.
✓ Branch 1 taken 355247 times.
✓ Branch 2 taken 3578515 times.
✓ Branch 3 taken 214810 times.
|
4148572 | if (filter_p1 && FFABS(diff_p1p2) <= beta) { |
466 | 3578515 | t = (diff_p1p0 + diff_p1p2 - diff) >> 1; | |
467 | 3578515 | src[-2*step] = cm[src[-2*step] - CLIP_SYMM(t, lim_p1)]; | |
468 | } | ||
469 | |||
470 |
4/4✓ Branch 0 taken 3797802 times.
✓ Branch 1 taken 350770 times.
✓ Branch 2 taken 3580816 times.
✓ Branch 3 taken 216986 times.
|
4148572 | if (filter_q1 && FFABS(diff_q1q2) <= beta) { |
471 | 3580816 | t = (diff_q1q0 + diff_q1q2 + diff) >> 1; | |
472 | 3580816 | src[ 1*step] = cm[src[ 1*step] - CLIP_SYMM(t, lim_q1)]; | |
473 | } | ||
474 | } | ||
475 | 1493706 | } | |
476 | |||
477 | 749410 | static void rv40_h_weak_loop_filter(uint8_t *src, const ptrdiff_t stride, | |
478 | const int filter_p1, const int filter_q1, | ||
479 | const int alpha, const int beta, | ||
480 | const int lim_p0q0, const int lim_q1, | ||
481 | const int lim_p1) | ||
482 | { | ||
483 | 749410 | rv40_weak_loop_filter(src, stride, 1, filter_p1, filter_q1, | |
484 | alpha, beta, lim_p0q0, lim_q1, lim_p1); | ||
485 | 749410 | } | |
486 | |||
487 | 744296 | static void rv40_v_weak_loop_filter(uint8_t *src, const ptrdiff_t stride, | |
488 | const int filter_p1, const int filter_q1, | ||
489 | const int alpha, const int beta, | ||
490 | const int lim_p0q0, const int lim_q1, | ||
491 | const int lim_p1) | ||
492 | { | ||
493 | 744296 | rv40_weak_loop_filter(src, 1, stride, filter_p1, filter_q1, | |
494 | alpha, beta, lim_p0q0, lim_q1, lim_p1); | ||
495 | 744296 | } | |
496 | |||
497 | 329538 | static av_always_inline void rv40_strong_loop_filter(uint8_t *src, | |
498 | const int step, | ||
499 | const ptrdiff_t stride, | ||
500 | const int alpha, | ||
501 | const int lims, | ||
502 | const int dmode, | ||
503 | const int chroma) | ||
504 | { | ||
505 | int i; | ||
506 | |||
507 |
2/2✓ Branch 0 taken 1318152 times.
✓ Branch 1 taken 329538 times.
|
1647690 | for(i = 0; i < 4; i++, src += stride){ |
508 | int sflag, p0, q0, p1, q1; | ||
509 | 1318152 | int t = src[0*step] - src[-1*step]; | |
510 | |||
511 |
2/2✓ Branch 0 taken 444696 times.
✓ Branch 1 taken 873456 times.
|
1318152 | if (!t) |
512 | 444696 | continue; | |
513 | |||
514 | 873456 | sflag = (alpha * FFABS(t)) >> 7; | |
515 |
2/2✓ Branch 0 taken 128844 times.
✓ Branch 1 taken 744612 times.
|
873456 | if (sflag > 1) |
516 | 128844 | continue; | |
517 | |||
518 | 744612 | p0 = (25*src[-3*step] + 26*src[-2*step] + 26*src[-1*step] + | |
519 | 744612 | 26*src[ 0*step] + 25*src[ 1*step] + | |
520 | 744612 | rv40_dither_l[dmode + i]) >> 7; | |
521 | |||
522 | 744612 | q0 = (25*src[-2*step] + 26*src[-1*step] + 26*src[ 0*step] + | |
523 | 744612 | 26*src[ 1*step] + 25*src[ 2*step] + | |
524 | 744612 | rv40_dither_r[dmode + i]) >> 7; | |
525 | |||
526 |
2/2✓ Branch 0 taken 193811 times.
✓ Branch 1 taken 550801 times.
|
744612 | if (sflag) { |
527 | 193811 | p0 = av_clip(p0, src[-1*step] - lims, src[-1*step] + lims); | |
528 | 193811 | q0 = av_clip(q0, src[ 0*step] - lims, src[ 0*step] + lims); | |
529 | } | ||
530 | |||
531 | 744612 | p1 = (25*src[-4*step] + 26*src[-3*step] + 26*src[-2*step] + 26*p0 + | |
532 | 744612 | 25*src[ 0*step] + rv40_dither_l[dmode + i]) >> 7; | |
533 | 744612 | q1 = (25*src[-1*step] + 26*q0 + 26*src[ 1*step] + 26*src[ 2*step] + | |
534 | 744612 | 25*src[ 3*step] + rv40_dither_r[dmode + i]) >> 7; | |
535 | |||
536 |
2/2✓ Branch 0 taken 193811 times.
✓ Branch 1 taken 550801 times.
|
744612 | if (sflag) { |
537 | 193811 | p1 = av_clip(p1, src[-2*step] - lims, src[-2*step] + lims); | |
538 | 193811 | q1 = av_clip(q1, src[ 1*step] - lims, src[ 1*step] + lims); | |
539 | } | ||
540 | |||
541 | 744612 | src[-2*step] = p1; | |
542 | 744612 | src[-1*step] = p0; | |
543 | 744612 | src[ 0*step] = q0; | |
544 | 744612 | src[ 1*step] = q1; | |
545 | |||
546 |
2/2✓ Branch 0 taken 333000 times.
✓ Branch 1 taken 411612 times.
|
744612 | if(!chroma){ |
547 | 333000 | src[-3*step] = (25*src[-1*step] + 26*src[-2*step] + | |
548 | 333000 | 51*src[-3*step] + 26*src[-4*step] + 64) >> 7; | |
549 | 333000 | src[ 2*step] = (25*src[ 0*step] + 26*src[ 1*step] + | |
550 | 333000 | 51*src[ 2*step] + 26*src[ 3*step] + 64) >> 7; | |
551 | } | ||
552 | } | ||
553 | 329538 | } | |
554 | |||
555 | 174243 | static void rv40_h_strong_loop_filter(uint8_t *src, const ptrdiff_t stride, | |
556 | const int alpha, const int lims, | ||
557 | const int dmode, const int chroma) | ||
558 | { | ||
559 | 174243 | rv40_strong_loop_filter(src, stride, 1, alpha, lims, dmode, chroma); | |
560 | 174243 | } | |
561 | |||
562 | 155295 | static void rv40_v_strong_loop_filter(uint8_t *src, const ptrdiff_t stride, | |
563 | const int alpha, const int lims, | ||
564 | const int dmode, const int chroma) | ||
565 | { | ||
566 | 155295 | rv40_strong_loop_filter(src, 1, stride, alpha, lims, dmode, chroma); | |
567 | 155295 | } | |
568 | |||
569 | 2330845 | static av_always_inline int rv40_loop_filter_strength(uint8_t *src, | |
570 | int step, ptrdiff_t stride, | ||
571 | int beta, int beta2, | ||
572 | int edge, | ||
573 | int *p1, int *q1) | ||
574 | { | ||
575 | 2330845 | int sum_p1p0 = 0, sum_q1q0 = 0, sum_p1p2 = 0, sum_q1q2 = 0; | |
576 | 2330845 | int strong0 = 0, strong1 = 0; | |
577 | uint8_t *ptr; | ||
578 | int i; | ||
579 | |||
580 |
2/2✓ Branch 0 taken 9323380 times.
✓ Branch 1 taken 2330845 times.
|
11654225 | for (i = 0, ptr = src; i < 4; i++, ptr += stride) { |
581 | 9323380 | sum_p1p0 += ptr[-2*step] - ptr[-1*step]; | |
582 | 9323380 | sum_q1q0 += ptr[ 1*step] - ptr[ 0*step]; | |
583 | } | ||
584 | |||
585 | 2330845 | *p1 = FFABS(sum_p1p0) < (beta << 2); | |
586 | 2330845 | *q1 = FFABS(sum_q1q0) < (beta << 2); | |
587 | |||
588 |
4/4✓ Branch 0 taken 629010 times.
✓ Branch 1 taken 1701835 times.
✓ Branch 2 taken 507601 times.
✓ Branch 3 taken 121409 times.
|
2330845 | if(!*p1 && !*q1) |
589 | 507601 | return 0; | |
590 | |||
591 |
2/2✓ Branch 0 taken 1427718 times.
✓ Branch 1 taken 395526 times.
|
1823244 | if (!edge) |
592 | 1427718 | return 0; | |
593 | |||
594 |
2/2✓ Branch 0 taken 1582104 times.
✓ Branch 1 taken 395526 times.
|
1977630 | for (i = 0, ptr = src; i < 4; i++, ptr += stride) { |
595 | 1582104 | sum_p1p2 += ptr[-2*step] - ptr[-3*step]; | |
596 | 1582104 | sum_q1q2 += ptr[ 1*step] - ptr[ 2*step]; | |
597 | } | ||
598 | |||
599 |
4/4✓ Branch 0 taken 380941 times.
✓ Branch 1 taken 14585 times.
✓ Branch 2 taken 358938 times.
✓ Branch 3 taken 22003 times.
|
395526 | strong0 = *p1 && (FFABS(sum_p1p2) < beta2); |
600 |
4/4✓ Branch 0 taken 378085 times.
✓ Branch 1 taken 17441 times.
✓ Branch 2 taken 354901 times.
✓ Branch 3 taken 23184 times.
|
395526 | strong1 = *q1 && (FFABS(sum_q1q2) < beta2); |
601 | |||
602 |
4/4✓ Branch 0 taken 358938 times.
✓ Branch 1 taken 36588 times.
✓ Branch 2 taken 329538 times.
✓ Branch 3 taken 29400 times.
|
395526 | return strong0 && strong1; |
603 | } | ||
604 | |||
605 | 1178527 | static int rv40_h_loop_filter_strength(uint8_t *src, ptrdiff_t stride, | |
606 | int beta, int beta2, int edge, | ||
607 | int *p1, int *q1) | ||
608 | { | ||
609 | 1178527 | return rv40_loop_filter_strength(src, stride, 1, beta, beta2, edge, p1, q1); | |
610 | } | ||
611 | |||
612 | 1152318 | static int rv40_v_loop_filter_strength(uint8_t *src, ptrdiff_t stride, | |
613 | int beta, int beta2, int edge, | ||
614 | int *p1, int *q1) | ||
615 | { | ||
616 | 1152318 | return rv40_loop_filter_strength(src, 1, stride, beta, beta2, edge, p1, q1); | |
617 | } | ||
618 | |||
619 | 17 | av_cold void ff_rv40dsp_init(RV34DSPContext *c) | |
620 | { | ||
621 | H264QpelContext qpel; | ||
622 | |||
623 | 17 | ff_rv34dsp_init(c); | |
624 | 17 | ff_h264qpel_init(&qpel, 8); | |
625 | |||
626 | 17 | c->put_pixels_tab[0][ 0] = qpel.put_h264_qpel_pixels_tab[0][0]; | |
627 | 17 | c->put_pixels_tab[0][ 1] = put_rv40_qpel16_mc10_c; | |
628 | 17 | c->put_pixels_tab[0][ 2] = qpel.put_h264_qpel_pixels_tab[0][2]; | |
629 | 17 | c->put_pixels_tab[0][ 3] = put_rv40_qpel16_mc30_c; | |
630 | 17 | c->put_pixels_tab[0][ 4] = put_rv40_qpel16_mc01_c; | |
631 | 17 | c->put_pixels_tab[0][ 5] = put_rv40_qpel16_mc11_c; | |
632 | 17 | c->put_pixels_tab[0][ 6] = put_rv40_qpel16_mc21_c; | |
633 | 17 | c->put_pixels_tab[0][ 7] = put_rv40_qpel16_mc31_c; | |
634 | 17 | c->put_pixels_tab[0][ 8] = qpel.put_h264_qpel_pixels_tab[0][8]; | |
635 | 17 | c->put_pixels_tab[0][ 9] = put_rv40_qpel16_mc12_c; | |
636 | 17 | c->put_pixels_tab[0][10] = put_rv40_qpel16_mc22_c; | |
637 | 17 | c->put_pixels_tab[0][11] = put_rv40_qpel16_mc32_c; | |
638 | 17 | c->put_pixels_tab[0][12] = put_rv40_qpel16_mc03_c; | |
639 | 17 | c->put_pixels_tab[0][13] = put_rv40_qpel16_mc13_c; | |
640 | 17 | c->put_pixels_tab[0][14] = put_rv40_qpel16_mc23_c; | |
641 | 17 | c->put_pixels_tab[0][15] = put_rv40_qpel16_mc33_c; | |
642 | 17 | c->avg_pixels_tab[0][ 0] = qpel.avg_h264_qpel_pixels_tab[0][0]; | |
643 | 17 | c->avg_pixels_tab[0][ 1] = avg_rv40_qpel16_mc10_c; | |
644 | 17 | c->avg_pixels_tab[0][ 2] = qpel.avg_h264_qpel_pixels_tab[0][2]; | |
645 | 17 | c->avg_pixels_tab[0][ 3] = avg_rv40_qpel16_mc30_c; | |
646 | 17 | c->avg_pixels_tab[0][ 4] = avg_rv40_qpel16_mc01_c; | |
647 | 17 | c->avg_pixels_tab[0][ 5] = avg_rv40_qpel16_mc11_c; | |
648 | 17 | c->avg_pixels_tab[0][ 6] = avg_rv40_qpel16_mc21_c; | |
649 | 17 | c->avg_pixels_tab[0][ 7] = avg_rv40_qpel16_mc31_c; | |
650 | 17 | c->avg_pixels_tab[0][ 8] = qpel.avg_h264_qpel_pixels_tab[0][8]; | |
651 | 17 | c->avg_pixels_tab[0][ 9] = avg_rv40_qpel16_mc12_c; | |
652 | 17 | c->avg_pixels_tab[0][10] = avg_rv40_qpel16_mc22_c; | |
653 | 17 | c->avg_pixels_tab[0][11] = avg_rv40_qpel16_mc32_c; | |
654 | 17 | c->avg_pixels_tab[0][12] = avg_rv40_qpel16_mc03_c; | |
655 | 17 | c->avg_pixels_tab[0][13] = avg_rv40_qpel16_mc13_c; | |
656 | 17 | c->avg_pixels_tab[0][14] = avg_rv40_qpel16_mc23_c; | |
657 | 17 | c->avg_pixels_tab[0][15] = avg_rv40_qpel16_mc33_c; | |
658 | 17 | c->put_pixels_tab[1][ 0] = qpel.put_h264_qpel_pixels_tab[1][0]; | |
659 | 17 | c->put_pixels_tab[1][ 1] = put_rv40_qpel8_mc10_c; | |
660 | 17 | c->put_pixels_tab[1][ 2] = qpel.put_h264_qpel_pixels_tab[1][2]; | |
661 | 17 | c->put_pixels_tab[1][ 3] = put_rv40_qpel8_mc30_c; | |
662 | 17 | c->put_pixels_tab[1][ 4] = put_rv40_qpel8_mc01_c; | |
663 | 17 | c->put_pixels_tab[1][ 5] = put_rv40_qpel8_mc11_c; | |
664 | 17 | c->put_pixels_tab[1][ 6] = put_rv40_qpel8_mc21_c; | |
665 | 17 | c->put_pixels_tab[1][ 7] = put_rv40_qpel8_mc31_c; | |
666 | 17 | c->put_pixels_tab[1][ 8] = qpel.put_h264_qpel_pixels_tab[1][8]; | |
667 | 17 | c->put_pixels_tab[1][ 9] = put_rv40_qpel8_mc12_c; | |
668 | 17 | c->put_pixels_tab[1][10] = put_rv40_qpel8_mc22_c; | |
669 | 17 | c->put_pixels_tab[1][11] = put_rv40_qpel8_mc32_c; | |
670 | 17 | c->put_pixels_tab[1][12] = put_rv40_qpel8_mc03_c; | |
671 | 17 | c->put_pixels_tab[1][13] = put_rv40_qpel8_mc13_c; | |
672 | 17 | c->put_pixels_tab[1][14] = put_rv40_qpel8_mc23_c; | |
673 | 17 | c->put_pixels_tab[1][15] = put_rv40_qpel8_mc33_c; | |
674 | 17 | c->avg_pixels_tab[1][ 0] = qpel.avg_h264_qpel_pixels_tab[1][0]; | |
675 | 17 | c->avg_pixels_tab[1][ 1] = avg_rv40_qpel8_mc10_c; | |
676 | 17 | c->avg_pixels_tab[1][ 2] = qpel.avg_h264_qpel_pixels_tab[1][2]; | |
677 | 17 | c->avg_pixels_tab[1][ 3] = avg_rv40_qpel8_mc30_c; | |
678 | 17 | c->avg_pixels_tab[1][ 4] = avg_rv40_qpel8_mc01_c; | |
679 | 17 | c->avg_pixels_tab[1][ 5] = avg_rv40_qpel8_mc11_c; | |
680 | 17 | c->avg_pixels_tab[1][ 6] = avg_rv40_qpel8_mc21_c; | |
681 | 17 | c->avg_pixels_tab[1][ 7] = avg_rv40_qpel8_mc31_c; | |
682 | 17 | c->avg_pixels_tab[1][ 8] = qpel.avg_h264_qpel_pixels_tab[1][8]; | |
683 | 17 | c->avg_pixels_tab[1][ 9] = avg_rv40_qpel8_mc12_c; | |
684 | 17 | c->avg_pixels_tab[1][10] = avg_rv40_qpel8_mc22_c; | |
685 | 17 | c->avg_pixels_tab[1][11] = avg_rv40_qpel8_mc32_c; | |
686 | 17 | c->avg_pixels_tab[1][12] = avg_rv40_qpel8_mc03_c; | |
687 | 17 | c->avg_pixels_tab[1][13] = avg_rv40_qpel8_mc13_c; | |
688 | 17 | c->avg_pixels_tab[1][14] = avg_rv40_qpel8_mc23_c; | |
689 | 17 | c->avg_pixels_tab[1][15] = avg_rv40_qpel8_mc33_c; | |
690 | |||
691 | 17 | c->put_chroma_pixels_tab[0] = put_rv40_chroma_mc8_c; | |
692 | 17 | c->put_chroma_pixels_tab[1] = put_rv40_chroma_mc4_c; | |
693 | 17 | c->avg_chroma_pixels_tab[0] = avg_rv40_chroma_mc8_c; | |
694 | 17 | c->avg_chroma_pixels_tab[1] = avg_rv40_chroma_mc4_c; | |
695 | |||
696 | 17 | c->rv40_weight_pixels_tab[0][0] = rv40_weight_func_rnd_16; | |
697 | 17 | c->rv40_weight_pixels_tab[0][1] = rv40_weight_func_rnd_8; | |
698 | 17 | c->rv40_weight_pixels_tab[1][0] = rv40_weight_func_nornd_16; | |
699 | 17 | c->rv40_weight_pixels_tab[1][1] = rv40_weight_func_nornd_8; | |
700 | |||
701 | 17 | c->rv40_weak_loop_filter[0] = rv40_h_weak_loop_filter; | |
702 | 17 | c->rv40_weak_loop_filter[1] = rv40_v_weak_loop_filter; | |
703 | 17 | c->rv40_strong_loop_filter[0] = rv40_h_strong_loop_filter; | |
704 | 17 | c->rv40_strong_loop_filter[1] = rv40_v_strong_loop_filter; | |
705 | 17 | c->rv40_loop_filter_strength[0] = rv40_h_loop_filter_strength; | |
706 | 17 | c->rv40_loop_filter_strength[1] = rv40_v_loop_filter_strength; | |
707 | |||
708 | #if ARCH_AARCH64 | ||
709 | ff_rv40dsp_init_aarch64(c); | ||
710 | #elif ARCH_ARM | ||
711 | ff_rv40dsp_init_arm(c); | ||
712 | #elif ARCH_RISCV | ||
713 | ff_rv40dsp_init_riscv(c); | ||
714 | #elif ARCH_X86 | ||
715 | 17 | ff_rv40dsp_init_x86(c); | |
716 | #endif | ||
717 | 17 | } | |
718 |