Line | Branch | Exec | Source |
---|---|---|---|
1 | /* | ||
2 | * Canopus HQ/HQA decoder | ||
3 | * | ||
4 | * This file is part of FFmpeg. | ||
5 | * | ||
6 | * FFmpeg is free software; you can redistribute it and/or | ||
7 | * modify it under the terms of the GNU Lesser General Public | ||
8 | * License as published by the Free Software Foundation; either | ||
9 | * version 2.1 of the License, or (at your option) any later version. | ||
10 | * | ||
11 | * FFmpeg is distributed in the hope that it will be useful, | ||
12 | * but WITHOUT ANY WARRANTY; without even the implied warranty of | ||
13 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU | ||
14 | * Lesser General Public License for more details. | ||
15 | * | ||
16 | * You should have received a copy of the GNU Lesser General Public | ||
17 | * License along with FFmpeg; if not, write to the Free Software | ||
18 | * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA | ||
19 | */ | ||
20 | |||
21 | #include <stdint.h> | ||
22 | |||
23 | #include "libavutil/attributes.h" | ||
24 | #include "libavutil/common.h" | ||
25 | |||
26 | #include "hq_hqadsp.h" | ||
27 | |||
/*
 * Fixed-point multipliers for the inverse DCT.
 *
 * Each name spells the real-valued factor it approximates. The stored value
 * is that factor scaled by 2^14, except FIX_2_613, which is scaled by 2^13
 * so that it still fits in 15 bits; code using it doubles the product.
 */
#define FIX_1_082  17734
#define FIX_1_847  30274
#define FIX_1_414  23170
#define FIX_2_613  21407 // divided by two to fit the range

/*
 * Multiply a by the fixed-point constant b and drop the low 16 bits.
 *
 * The product is formed in unsigned arithmetic so that it wraps instead of
 * overflowing a signed int; it is then converted back to int and shifted
 * right, which relies on the compiler shifting negative values
 * arithmetically.
 */
#define IDCTMUL(a, b) ((int)((a) * (unsigned)(b)) >> 16)
34 | |||
35 | 3544320 | static inline void idct_row(int16_t *blk) | |
36 | { | ||
37 | int tmp0, tmp1, tmp2, tmp3, tmp4, tmp5, tmp6, tmp7, tmp8, tmp9, tmpA; | ||
38 | int tmpB, tmpC, tmpD, tmpE, tmpF, tmp10, tmp11, tmp12, tmp13, tmp14; | ||
39 | |||
40 | 3544320 | tmp0 = blk[5] - blk[3]; | |
41 | 3544320 | tmp1 = blk[5] + blk[3]; | |
42 | 3544320 | tmp2 = blk[1] - blk[7]; | |
43 | 3544320 | tmp3 = blk[1] + blk[7]; | |
44 | 3544320 | tmp4 = tmp3 - tmp1; | |
45 | 3544320 | tmp5 = IDCTMUL(tmp0 + tmp2, FIX_1_847); | |
46 | 3544320 | tmp6 = IDCTMUL(tmp2, FIX_1_082) - tmp5; | |
47 | 3544320 | tmp7 = tmp5 - IDCTMUL(tmp0, FIX_2_613) * 2; | |
48 | 3544320 | tmp8 = tmp3 + tmp1; | |
49 | 3544320 | tmp9 = tmp7 * 4 - tmp8; | |
50 | 3544320 | tmpA = IDCTMUL(tmp4, FIX_1_414) * 4 - tmp9; | |
51 | 3544320 | tmpB = tmp6 * 4 + tmpA; | |
52 | 3544320 | tmpC = blk[2] + blk[6]; | |
53 | 3544320 | tmpD = blk[2] - blk[6]; | |
54 | 3544320 | tmpE = blk[0] - blk[4]; | |
55 | 3544320 | tmpF = blk[0] + blk[4]; | |
56 | |||
57 | 3544320 | tmp10 = IDCTMUL(tmpD, FIX_1_414) * 4 - tmpC; | |
58 | 3544320 | tmp11 = tmpE - tmp10; | |
59 | 3544320 | tmp12 = tmpF - tmpC; | |
60 | 3544320 | tmp13 = tmpE + tmp10; | |
61 | 3544320 | tmp14 = tmpF + tmpC; | |
62 | |||
63 | 3544320 | blk[0] = tmp14 + tmp8; | |
64 | 3544320 | blk[1] = tmp13 + tmp9; | |
65 | 3544320 | blk[2] = tmp11 + tmpA; | |
66 | 3544320 | blk[3] = tmp12 - tmpB; | |
67 | 3544320 | blk[4] = tmp12 + tmpB; | |
68 | 3544320 | blk[5] = tmp11 - tmpA; | |
69 | 3544320 | blk[6] = tmp13 - tmp9; | |
70 | 3544320 | blk[7] = tmp14 - tmp8; | |
71 | 3544320 | } | |
72 | |||
73 | 3544320 | static inline void idct_col(int16_t *blk) | |
74 | { | ||
75 | int tmp0, tmp1, tmp2, tmp3, tmp4, tmp5, tmp6, tmp7, tmp8, tmp9, tmpA; | ||
76 | int tmpB, tmpC, tmpD, tmpE, tmpF, tmp10, tmp11, tmp12, tmp13, tmp14; | ||
77 | |||
78 | 3544320 | tmp0 = blk[5 * 8] - blk[3 * 8]; | |
79 | 3544320 | tmp1 = blk[5 * 8] + blk[3 * 8]; | |
80 | 3544320 | tmp2 = blk[1 * 8] * 2 - (blk[7 * 8] >> 2); | |
81 | 3544320 | tmp3 = blk[1 * 8] * 2 + (blk[7 * 8] >> 2); | |
82 | 3544320 | tmp4 = tmp3 - tmp1; | |
83 | 3544320 | tmp5 = IDCTMUL(tmp0 + tmp2, FIX_1_847); | |
84 | 3544320 | tmp6 = IDCTMUL(tmp2, FIX_1_082) - tmp5; | |
85 | 3544320 | tmp7 = tmp5 - IDCTMUL(tmp0, FIX_2_613) * 2; | |
86 | 3544320 | tmp8 = (tmp3 + tmp1) >> 1; | |
87 | 3544320 | tmp9 = tmp7 * 2 - tmp8; | |
88 | 3544320 | tmpA = IDCTMUL(tmp4, FIX_1_414) * 2 - tmp9; | |
89 | 3544320 | tmpB = tmp6 * 2 + tmpA; | |
90 | 3544320 | tmpC = blk[2 * 8] + (blk[6 * 8] >> 1) >> 1; | |
91 | 3544320 | tmpD = blk[2 * 8] - (blk[6 * 8] >> 1); | |
92 | 3544320 | tmpE = (blk[0 * 8] >> 1) - (blk[4 * 8] >> 1) + 0x2020; | |
93 | 3544320 | tmpF = (blk[0 * 8] >> 1) + (blk[4 * 8] >> 1) + 0x2020; | |
94 | |||
95 | 3544320 | tmp10 = IDCTMUL(tmpD, FIX_1_414) * 2 - tmpC; | |
96 | 3544320 | tmp11 = tmpE - tmp10; | |
97 | 3544320 | tmp12 = tmpF - tmpC; | |
98 | 3544320 | tmp13 = tmpE + tmp10; | |
99 | 3544320 | tmp14 = tmpF + tmpC; | |
100 | |||
101 | 3544320 | blk[0 * 8] = (tmp14 + tmp8) >> 6; | |
102 | 3544320 | blk[1 * 8] = (tmp13 + tmp9) >> 6; | |
103 | 3544320 | blk[2 * 8] = (tmp11 + tmpA) >> 6; | |
104 | 3544320 | blk[3 * 8] = (tmp12 - tmpB) >> 6; | |
105 | 3544320 | blk[4 * 8] = (tmp12 + tmpB) >> 6; | |
106 | 3544320 | blk[5 * 8] = (tmp11 - tmpA) >> 6; | |
107 | 3544320 | blk[6 * 8] = (tmp13 - tmp9) >> 6; | |
108 | 3544320 | blk[7 * 8] = (tmp14 - tmp8) >> 6; | |
109 | 3544320 | } | |
110 | |||
/**
 * Inverse-transform an 8x8 coefficient block and store it as 8-bit samples.
 *
 * The block is transformed in place (all rows first, then all columns), so
 * its contents are overwritten. Each result is clipped with av_clip_uint8()
 * before being written to the destination.
 *
 * @param dst    destination of the top-left output sample
 * @param stride distance between the starts of consecutive output rows,
 *               in bytes
 * @param block  64 coefficients stored row by row; modified by the call
 */
static void hq_idct_put(uint8_t *dst, int stride, int16_t *block)
{
    const int16_t *src = block;
    int row, col;

    for (row = 0; row < 8; row++)
        idct_row(&block[row * 8]);

    for (col = 0; col < 8; col++)
        idct_col(&block[col]);

    for (row = 0; row < 8; row++) {
        for (col = 0; col < 8; col++)
            dst[col] = av_clip_uint8(src[col]);
        src += 8;
        dst += stride;
    }
}
126 | |||
127 | 6 | av_cold void ff_hqdsp_init(HQDSPContext *c) | |
128 | { | ||
129 | 6 | c->idct_put = hq_idct_put; | |
130 | 6 | } | |
131 |