| Line | Branch | Exec | Source |
|---|---|---|---|
| 1 | /* | ||
| 2 | * Canopus HQ/HQA decoder | ||
| 3 | * | ||
| 4 | * This file is part of FFmpeg. | ||
| 5 | * | ||
| 6 | * FFmpeg is free software; you can redistribute it and/or | ||
| 7 | * modify it under the terms of the GNU Lesser General Public | ||
| 8 | * License as published by the Free Software Foundation; either | ||
| 9 | * version 2.1 of the License, or (at your option) any later version. | ||
| 10 | * | ||
| 11 | * FFmpeg is distributed in the hope that it will be useful, | ||
| 12 | * but WITHOUT ANY WARRANTY; without even the implied warranty of | ||
| 13 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU | ||
| 14 | * Lesser General Public License for more details. | ||
| 15 | * | ||
| 16 | * You should have received a copy of the GNU Lesser General Public | ||
| 17 | * License along with FFmpeg; if not, write to the Free Software | ||
| 18 | * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA | ||
| 19 | */ | ||
| 20 | |||
| 21 | #include <stdint.h> | ||
| 22 | |||
| 23 | #include "libavutil/attributes.h" | ||
| 24 | #include "libavutil/common.h" | ||
| 25 | |||
| 26 | #include "hq_hqadsp.h" | ||
| 27 | |||
/*
 * Fixed-point multipliers used by the IDCT butterflies.
 * The first three are the named constants scaled by 2^14
 * (e.g. 1.414 * 16384 ~= 23170).
 */
#define FIX_1_082 17734
#define FIX_1_847 30274
#define FIX_1_414 23170
#define FIX_2_613 21407 // divided by two to fit the range

/*
 * Multiply a by the fixed-point constant b and drop the low 16 bits.
 * The product is formed in unsigned arithmetic (so it wraps instead of
 * overflowing a signed int), converted back to int, then shifted right.
 */
#define IDCTMUL(a, b) (((int)((a) * (unsigned)(b))) >> 16)
| 34 | |||
| 35 | 3544320 | static inline void idct_row(int16_t *blk) | |
| 36 | { | ||
| 37 | int tmp0, tmp1, tmp2, tmp3, tmp4, tmp5, tmp6, tmp7, tmp8, tmp9, tmpA; | ||
| 38 | int tmpB, tmpC, tmpD, tmpE, tmpF, tmp10, tmp11, tmp12, tmp13, tmp14; | ||
| 39 | |||
| 40 | 3544320 | tmp0 = blk[5] - blk[3]; | |
| 41 | 3544320 | tmp1 = blk[5] + blk[3]; | |
| 42 | 3544320 | tmp2 = blk[1] - blk[7]; | |
| 43 | 3544320 | tmp3 = blk[1] + blk[7]; | |
| 44 | 3544320 | tmp4 = tmp3 - tmp1; | |
| 45 | 3544320 | tmp5 = IDCTMUL(tmp0 + tmp2, FIX_1_847); | |
| 46 | 3544320 | tmp6 = IDCTMUL(tmp2, FIX_1_082) - tmp5; | |
| 47 | 3544320 | tmp7 = tmp5 - IDCTMUL(tmp0, FIX_2_613) * 2; | |
| 48 | 3544320 | tmp8 = tmp3 + tmp1; | |
| 49 | 3544320 | tmp9 = tmp7 * 4 - tmp8; | |
| 50 | 3544320 | tmpA = IDCTMUL(tmp4, FIX_1_414) * 4 - tmp9; | |
| 51 | 3544320 | tmpB = tmp6 * 4 + tmpA; | |
| 52 | 3544320 | tmpC = blk[2] + blk[6]; | |
| 53 | 3544320 | tmpD = blk[2] - blk[6]; | |
| 54 | 3544320 | tmpE = blk[0] - blk[4]; | |
| 55 | 3544320 | tmpF = blk[0] + blk[4]; | |
| 56 | |||
| 57 | 3544320 | tmp10 = IDCTMUL(tmpD, FIX_1_414) * 4 - tmpC; | |
| 58 | 3544320 | tmp11 = tmpE - tmp10; | |
| 59 | 3544320 | tmp12 = tmpF - tmpC; | |
| 60 | 3544320 | tmp13 = tmpE + tmp10; | |
| 61 | 3544320 | tmp14 = tmpF + tmpC; | |
| 62 | |||
| 63 | 3544320 | blk[0] = tmp14 + tmp8; | |
| 64 | 3544320 | blk[1] = tmp13 + tmp9; | |
| 65 | 3544320 | blk[2] = tmp11 + tmpA; | |
| 66 | 3544320 | blk[3] = tmp12 - tmpB; | |
| 67 | 3544320 | blk[4] = tmp12 + tmpB; | |
| 68 | 3544320 | blk[5] = tmp11 - tmpA; | |
| 69 | 3544320 | blk[6] = tmp13 - tmp9; | |
| 70 | 3544320 | blk[7] = tmp14 - tmp8; | |
| 71 | 3544320 | } | |
| 72 | |||
| 73 | 3544320 | static inline void idct_col(int16_t *blk) | |
| 74 | { | ||
| 75 | int tmp0, tmp1, tmp2, tmp3, tmp4, tmp5, tmp6, tmp7, tmp8, tmp9, tmpA; | ||
| 76 | int tmpB, tmpC, tmpD, tmpE, tmpF, tmp10, tmp11, tmp12, tmp13, tmp14; | ||
| 77 | |||
| 78 | 3544320 | tmp0 = blk[5 * 8] - blk[3 * 8]; | |
| 79 | 3544320 | tmp1 = blk[5 * 8] + blk[3 * 8]; | |
| 80 | 3544320 | tmp2 = blk[1 * 8] * 2 - (blk[7 * 8] >> 2); | |
| 81 | 3544320 | tmp3 = blk[1 * 8] * 2 + (blk[7 * 8] >> 2); | |
| 82 | 3544320 | tmp4 = tmp3 - tmp1; | |
| 83 | 3544320 | tmp5 = IDCTMUL(tmp0 + tmp2, FIX_1_847); | |
| 84 | 3544320 | tmp6 = IDCTMUL(tmp2, FIX_1_082) - tmp5; | |
| 85 | 3544320 | tmp7 = tmp5 - IDCTMUL(tmp0, FIX_2_613) * 2; | |
| 86 | 3544320 | tmp8 = (tmp3 + tmp1) >> 1; | |
| 87 | 3544320 | tmp9 = tmp7 * 2 - tmp8; | |
| 88 | 3544320 | tmpA = IDCTMUL(tmp4, FIX_1_414) * 2 - tmp9; | |
| 89 | 3544320 | tmpB = tmp6 * 2 + tmpA; | |
| 90 | 3544320 | tmpC = blk[2 * 8] + (blk[6 * 8] >> 1) >> 1; | |
| 91 | 3544320 | tmpD = blk[2 * 8] - (blk[6 * 8] >> 1); | |
| 92 | 3544320 | tmpE = (blk[0 * 8] >> 1) - (blk[4 * 8] >> 1) + 0x2020; | |
| 93 | 3544320 | tmpF = (blk[0 * 8] >> 1) + (blk[4 * 8] >> 1) + 0x2020; | |
| 94 | |||
| 95 | 3544320 | tmp10 = IDCTMUL(tmpD, FIX_1_414) * 2 - tmpC; | |
| 96 | 3544320 | tmp11 = tmpE - tmp10; | |
| 97 | 3544320 | tmp12 = tmpF - tmpC; | |
| 98 | 3544320 | tmp13 = tmpE + tmp10; | |
| 99 | 3544320 | tmp14 = tmpF + tmpC; | |
| 100 | |||
| 101 | 3544320 | blk[0 * 8] = (tmp14 + tmp8) >> 6; | |
| 102 | 3544320 | blk[1 * 8] = (tmp13 + tmp9) >> 6; | |
| 103 | 3544320 | blk[2 * 8] = (tmp11 + tmpA) >> 6; | |
| 104 | 3544320 | blk[3 * 8] = (tmp12 - tmpB) >> 6; | |
| 105 | 3544320 | blk[4 * 8] = (tmp12 + tmpB) >> 6; | |
| 106 | 3544320 | blk[5 * 8] = (tmp11 - tmpA) >> 6; | |
| 107 | 3544320 | blk[6 * 8] = (tmp13 - tmp9) >> 6; | |
| 108 | 3544320 | blk[7 * 8] = (tmp14 - tmp8) >> 6; | |
| 109 | 3544320 | } | |
| 110 | |||
/**
 * Inverse-transform an 8x8 coefficient block and store it as pixels.
 *
 * The block is transformed in place (all rows first, then all columns),
 * after which each value is clipped with av_clip_uint8() and written out.
 *
 * @param dst    destination of the top-left output byte
 * @param stride distance in bytes between consecutive output rows
 * @param block  64 coefficients, 8 per row; overwritten by the transform
 */
static void hq_idct_put(uint8_t *dst, int stride, int16_t *block)
{
    const int16_t *src = block;

    /* The column pass needs every row finished, so run two full sweeps. */
    for (int row = 0; row < 8; row++) {
        idct_row(&block[row * 8]);
    }
    for (int col = 0; col < 8; col++) {
        idct_col(&block[col]);
    }

    for (int y = 0; y < 8; y++) {
        for (int x = 0; x < 8; x++) {
            dst[x] = av_clip_uint8(src[x]);
        }
        src += 8;
        dst += stride;
    }
}
| 126 | |||
| 127 | 6 | av_cold void ff_hqdsp_init(HQDSPContext *c) | |
| 128 | { | ||
| 129 | 6 | c->idct_put = hq_idct_put; | |
| 130 | 6 | } | |
| 131 |