| Line | Branch | Exec | Source |
|---|---|---|---|
| 1 | /* | ||
| 2 | * Copyright (C) 2012 Michael Niedermayer (michaelni@gmx.at) | ||
| 3 | * | ||
| 4 | * This file is part of libswresample | ||
| 5 | * | ||
| 6 | * libswresample is free software; you can redistribute it and/or | ||
| 7 | * modify it under the terms of the GNU Lesser General Public | ||
| 8 | * License as published by the Free Software Foundation; either | ||
| 9 | * version 2.1 of the License, or (at your option) any later version. | ||
| 10 | * | ||
| 11 | * libswresample is distributed in the hope that it will be useful, | ||
| 12 | * but WITHOUT ANY WARRANTY; without even the implied warranty of | ||
| 13 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU | ||
| 14 | * Lesser General Public License for more details. | ||
| 15 | * | ||
| 16 | * You should have received a copy of the GNU Lesser General Public | ||
| 17 | * License along with libswresample; if not, write to the Free Software | ||
| 18 | * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA | ||
| 19 | */ | ||
| 20 | |||
| 21 | #include "libavutil/attributes.h" | ||
| 22 | #include "libavutil/mem.h" | ||
| 23 | #include "libavutil/x86/cpu.h" | ||
| 24 | #include "libswresample/swresample_internal.h" | ||
| 25 | |||
| 26 | #define D(type, simd) \ | ||
| 27 | mix_1_1_func_type ff_mix_1_1_a_## type ## _ ## simd;\ | ||
| 28 | mix_2_1_func_type ff_mix_2_1_a_## type ## _ ## simd; | ||
| 29 | |||
| 30 | D(float, sse) | ||
| 31 | D(float, avx) | ||
| 32 | D(int16, sse2) | ||
| 33 | |||
| 34 | 27 | av_cold int swri_rematrix_init_x86(struct SwrContext *s){ | |
| 35 | #if HAVE_X86ASM | ||
| 36 | 27 | int mm_flags = av_get_cpu_flags(); | |
| 37 | 27 | int nb_in = s->used_ch_layout.nb_channels; | |
| 38 | 27 | int nb_out = s->out.ch_count; | |
| 39 | 27 | int num = nb_in * nb_out; | |
| 40 | int i,j; | ||
| 41 | |||
| 42 | 27 | s->mix_1_1_simd = NULL; | |
| 43 | 27 | s->mix_2_1_simd = NULL; | |
| 44 | |||
| 45 |
2/2✓ Branch 0 taken 19 times.
✓ Branch 1 taken 8 times.
|
27 | if (s->midbuf.fmt == AV_SAMPLE_FMT_S16P){ |
| 46 |
1/2✗ Branch 0 not taken.
✓ Branch 1 taken 19 times.
|
19 | if(EXTERNAL_SSE2(mm_flags)) { |
| 47 | ✗ | s->mix_1_1_simd = ff_mix_1_1_a_int16_sse2; | |
| 48 | ✗ | s->mix_2_1_simd = ff_mix_2_1_a_int16_sse2; | |
| 49 | } | ||
| 50 | 19 | s->native_simd_matrix = av_calloc(num, 2 * sizeof(int16_t)); | |
| 51 |
1/2✗ Branch 0 not taken.
✓ Branch 1 taken 19 times.
|
19 | if (!s->native_simd_matrix) |
| 52 | ✗ | return AVERROR(ENOMEM); | |
| 53 | |||
| 54 |
2/2✓ Branch 0 taken 42 times.
✓ Branch 1 taken 19 times.
|
61 | for(i=0; i<nb_out; i++){ |
| 55 | 42 | int sh = 0; | |
| 56 |
2/2✓ Branch 0 taken 166 times.
✓ Branch 1 taken 42 times.
|
208 | for(j=0; j<nb_in; j++) |
| 57 | 166 | sh = FFMAX(sh, FFABS(((int*)s->native_matrix)[i * nb_in + j])); | |
| 58 | 42 | sh = FFMAX(av_log2(sh) - 14, 0); | |
| 59 |
2/2✓ Branch 0 taken 166 times.
✓ Branch 1 taken 42 times.
|
208 | for(j=0; j<nb_in; j++) { |
| 60 | 166 | ((int16_t*)s->native_simd_matrix)[2*(i * nb_in + j)+1] = 15 - sh; | |
| 61 | 166 | ((int16_t*)s->native_simd_matrix)[2*(i * nb_in + j)] = | |
| 62 | 166 | ((((int*)s->native_matrix)[i * nb_in + j]) + (1<<sh>>1)) >> sh; | |
| 63 | } | ||
| 64 | } | ||
| 65 | 19 | s->native_simd_one.i16[1] = 14; | |
| 66 | 19 | s->native_simd_one.i16[0] = 16384; | |
| 67 |
1/2✓ Branch 0 taken 8 times.
✗ Branch 1 not taken.
|
8 | } else if(s->midbuf.fmt == AV_SAMPLE_FMT_FLTP){ |
| 68 |
2/2✓ Branch 0 taken 1 times.
✓ Branch 1 taken 7 times.
|
8 | if(EXTERNAL_SSE(mm_flags)) { |
| 69 | 1 | s->mix_1_1_simd = ff_mix_1_1_a_float_sse; | |
| 70 | 1 | s->mix_2_1_simd = ff_mix_2_1_a_float_sse; | |
| 71 | } | ||
| 72 |
3/4✓ Branch 0 taken 1 times.
✓ Branch 1 taken 7 times.
✓ Branch 2 taken 1 times.
✗ Branch 3 not taken.
|
8 | if(EXTERNAL_AVX_FAST(mm_flags)) { |
| 73 | 1 | s->mix_1_1_simd = ff_mix_1_1_a_float_avx; | |
| 74 | 1 | s->mix_2_1_simd = ff_mix_2_1_a_float_avx; | |
| 75 | } | ||
| 76 | 8 | s->native_simd_matrix = av_calloc(num, sizeof(float)); | |
| 77 |
1/2✗ Branch 0 not taken.
✓ Branch 1 taken 8 times.
|
8 | if (!s->native_simd_matrix) |
| 78 | ✗ | return AVERROR(ENOMEM); | |
| 79 | 8 | memcpy(s->native_simd_matrix, s->native_matrix, num * sizeof(float)); | |
| 80 | 8 | s->native_simd_one.f = s->native_one.f; | |
| 81 | } | ||
| 82 | #endif | ||
| 83 | |||
| 84 | 27 | return 0; | |
| 85 | } | ||
| 86 |