| Line | Branch | Exec | Source |
|---|---|---|---|
| 1 | /* | ||
| 2 | * Copyright (c) 2012 Nicolas George | ||
| 3 | * | ||
| 4 | * This file is part of FFmpeg. | ||
| 5 | * | ||
| 6 | * FFmpeg is free software; you can redistribute it and/or | ||
| 7 | * modify it under the terms of the GNU Lesser General Public License | ||
| 8 | * as published by the Free Software Foundation; either | ||
| 9 | * version 2.1 of the License, or (at your option) any later version. | ||
| 10 | * | ||
| 11 | * FFmpeg is distributed in the hope that it will be useful, | ||
| 12 | * but WITHOUT ANY WARRANTY; without even the implied warranty of | ||
| 13 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | ||
| 14 | * GNU Lesser General Public License for more details. | ||
| 15 | * | ||
| 16 | * You should have received a copy of the GNU Lesser General Public License | ||
| 17 | * along with FFmpeg; if not, write to the Free Software Foundation, Inc., | ||
| 18 | * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA | ||
| 19 | */ | ||
| 20 | |||
| 21 | #include "libavutil/channel_layout.h" | ||
| 22 | #include "libavutil/avassert.h" | ||
| 23 | #include "audio.h" | ||
| 24 | #include "avfilter.h" | ||
| 25 | #include "filters.h" | ||
| 26 | |||
| 27 | typedef struct VolDetectContext { | ||
| 28 | /** | ||
| 29 | * Number of samples at each PCM value. | ||
| 30 | * histogram[0x8000 + i] is the number of samples at value i. | ||
| 31 | * The extra element is there for symmetry. | ||
| 32 | */ | ||
| 33 | uint64_t histogram[0x10001]; | ||
| 34 | } VolDetectContext; | ||
| 35 | |||
| 36 | ✗ | static int filter_frame(AVFilterLink *inlink, AVFrame *samples) | |
| 37 | { | ||
| 38 | ✗ | AVFilterContext *ctx = inlink->dst; | |
| 39 | ✗ | VolDetectContext *vd = ctx->priv; | |
| 40 | ✗ | int nb_samples = samples->nb_samples; | |
| 41 | ✗ | int nb_channels = samples->ch_layout.nb_channels; | |
| 42 | ✗ | int nb_planes = nb_channels; | |
| 43 | int plane, i; | ||
| 44 | int16_t *pcm; | ||
| 45 | |||
| 46 | ✗ | if (!av_sample_fmt_is_planar(samples->format)) { | |
| 47 | ✗ | nb_samples *= nb_channels; | |
| 48 | ✗ | nb_planes = 1; | |
| 49 | } | ||
| 50 | ✗ | for (plane = 0; plane < nb_planes; plane++) { | |
| 51 | ✗ | pcm = (int16_t *)samples->extended_data[plane]; | |
| 52 | ✗ | for (i = 0; i < nb_samples; i++) | |
| 53 | ✗ | vd->histogram[pcm[i] + 0x8000]++; | |
| 54 | } | ||
| 55 | |||
| 56 | ✗ | return ff_filter_frame(inlink->dst->outputs[0], samples); | |
| 57 | } | ||
| 58 | |||
| 59 | #define MAX_DB 91 | ||
| 60 | |||
| 61 | ✗ | static inline double logdb(uint64_t v) | |
| 62 | { | ||
| 63 | ✗ | double d = v / (double)(0x8000 * 0x8000); | |
| 64 | ✗ | if (!v) | |
| 65 | ✗ | return MAX_DB; | |
| 66 | ✗ | return -log10(d) * 10; | |
| 67 | } | ||
| 68 | |||
| 69 | ✗ | static void print_stats(AVFilterContext *ctx) | |
| 70 | { | ||
| 71 | ✗ | VolDetectContext *vd = ctx->priv; | |
| 72 | int i, max_volume, shift; | ||
| 73 | ✗ | uint64_t nb_samples = 0, power = 0, nb_samples_shift = 0, sum = 0; | |
| 74 | ✗ | uint64_t histdb[MAX_DB + 1] = { 0 }; | |
| 75 | |||
| 76 | ✗ | for (i = 0; i < 0x10000; i++) | |
| 77 | ✗ | nb_samples += vd->histogram[i]; | |
| 78 | ✗ | av_log(ctx, AV_LOG_INFO, "n_samples: %"PRId64"\n", nb_samples); | |
| 79 | ✗ | if (!nb_samples) | |
| 80 | ✗ | return; | |
| 81 | |||
| 82 | /* If nb_samples > 1<<34, there is a risk of overflow in the | ||
| 83 | multiplication or the sum: shift all histogram values to avoid that. | ||
| 84 | The total number of samples must be recomputed to avoid rounding | ||
| 85 | errors. */ | ||
| 86 | ✗ | shift = av_log2(nb_samples >> 33); | |
| 87 | ✗ | for (i = 0; i < 0x10000; i++) { | |
| 88 | ✗ | nb_samples_shift += vd->histogram[i] >> shift; | |
| 89 | ✗ | power += (i - 0x8000) * (i - 0x8000) * (vd->histogram[i] >> shift); | |
| 90 | } | ||
| 91 | ✗ | if (!nb_samples_shift) | |
| 92 | ✗ | return; | |
| 93 | ✗ | power = (power + nb_samples_shift / 2) / nb_samples_shift; | |
| 94 | ✗ | av_assert0(power <= 0x8000 * 0x8000); | |
| 95 | ✗ | av_log(ctx, AV_LOG_INFO, "mean_volume: %.1f dB\n", -logdb(power)); | |
| 96 | |||
| 97 | ✗ | max_volume = 0x8000; | |
| 98 | ✗ | while (max_volume > 0 && !vd->histogram[0x8000 + max_volume] && | |
| 99 | ✗ | !vd->histogram[0x8000 - max_volume]) | |
| 100 | ✗ | max_volume--; | |
| 101 | ✗ | av_log(ctx, AV_LOG_INFO, "max_volume: %.1f dB\n", -logdb(max_volume * max_volume)); | |
| 102 | |||
| 103 | ✗ | for (i = 0; i < 0x10000; i++) | |
| 104 | ✗ | histdb[(int)logdb((i - 0x8000) * (i - 0x8000))] += vd->histogram[i]; | |
| 105 | ✗ | for (i = 0; i <= MAX_DB && !histdb[i]; i++); | |
| 106 | ✗ | for (; i <= MAX_DB && sum < nb_samples / 1000; i++) { | |
| 107 | ✗ | av_log(ctx, AV_LOG_INFO, "histogram_%ddb: %"PRId64"\n", i, histdb[i]); | |
| 108 | ✗ | sum += histdb[i]; | |
| 109 | } | ||
| 110 | } | ||
| 111 | |||
| 112 | ✗ | static av_cold void uninit(AVFilterContext *ctx) | |
| 113 | { | ||
| 114 | ✗ | print_stats(ctx); | |
| 115 | ✗ | } | |
| 116 | |||
| 117 | static const AVFilterPad volumedetect_inputs[] = { | ||
| 118 | { | ||
| 119 | .name = "default", | ||
| 120 | .type = AVMEDIA_TYPE_AUDIO, | ||
| 121 | .filter_frame = filter_frame, | ||
| 122 | }, | ||
| 123 | }; | ||
| 124 | |||
| 125 | const FFFilter ff_af_volumedetect = { | ||
| 126 | .p.name = "volumedetect", | ||
| 127 | .p.description = NULL_IF_CONFIG_SMALL("Detect audio volume."), | ||
| 128 | .p.flags = AVFILTER_FLAG_METADATA_ONLY, | ||
| 129 | .priv_size = sizeof(VolDetectContext), | ||
| 130 | .uninit = uninit, | ||
| 131 | FILTER_INPUTS(volumedetect_inputs), | ||
| 132 | FILTER_OUTPUTS(ff_audio_default_filterpad), | ||
| 133 | FILTER_SAMPLEFMTS(AV_SAMPLE_FMT_S16, AV_SAMPLE_FMT_S16P), | ||
| 134 | }; | ||
| 135 |