diff options
Diffstat (limited to 'libavcodec/synth_filter.c')
-rw-r--r-- | libavcodec/synth_filter.c | 169 |
1 files changed, 142 insertions, 27 deletions
diff --git a/libavcodec/synth_filter.c b/libavcodec/synth_filter.c index 708bd4e..1c5dab5 100644 --- a/libavcodec/synth_filter.c +++ b/libavcodec/synth_filter.c @@ -1,64 +1,179 @@ /* * copyright (c) 2008 Michael Niedermayer <michaelni@gmx.at> + * Copyright (C) 2016 foo86 * - * This file is part of Libav. + * This file is part of FFmpeg. * - * Libav is free software; you can redistribute it and/or + * FFmpeg is free software; you can redistribute it and/or * modify it under the terms of the GNU Lesser General Public * License as published by the Free Software Foundation; either * version 2.1 of the License, or (at your option) any later version. * - * Libav is distributed in the hope that it will be useful, + * FFmpeg is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU * Lesser General Public License for more details. * * You should have received a copy of the GNU Lesser General Public - * License along with Libav; if not, write to the Free Software + * License along with FFmpeg; if not, write to the Free Software * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA */ #include "fft.h" +#include "dcadct.h" +#include "dcamath.h" #include "synth_filter.h" static void synth_filter_float(FFTContext *imdct, - float *synth_buf_ptr, int *synth_buf_offset, - float synth_buf2[32], const float window[512], - float out[32], const float in[32], float scale) + float *synth_buf_ptr, int *synth_buf_offset, + float synth_buf2[32], const float window[512], + float out[32], const float in[32], float scale) { - float *synth_buf= synth_buf_ptr + *synth_buf_offset; + float *synth_buf = synth_buf_ptr + *synth_buf_offset; int i, j; imdct->imdct_half(imdct, synth_buf, in); - for (i = 0; i < 16; i++){ - float a= synth_buf2[i ]; - float b= synth_buf2[i + 16]; - float c= 0; - float d= 0; - for (j = 0; j < 512 - *synth_buf_offset; j += 64){ - a += window[i + j ]*(-synth_buf[15 - i + j ]); - b += window[i + j + 16]*( synth_buf[ i + j ]); - c += window[i + j + 32]*( synth_buf[16 + i + j ]); - d += window[i + j + 48]*( synth_buf[31 - i + j ]); + for (i = 0; i < 16; i++) { + float a = synth_buf2[i ]; + float b = synth_buf2[i + 16]; + float c = 0; + float d = 0; + for (j = 0; j < 512 - *synth_buf_offset; j += 64) { + a += window[i + j ] * (-synth_buf[15 - i + j ]); + b += window[i + j + 16] * ( synth_buf[ i + j ]); + c += window[i + j + 32] * ( synth_buf[16 + i + j ]); + d += window[i + j + 48] * ( synth_buf[31 - i + j ]); } - for ( ; j < 512; j += 64){ - a += window[i + j ]*(-synth_buf[15 - i + j - 512]); - b += window[i + j + 16]*( synth_buf[ i + j - 512]); - c += window[i + j + 32]*( synth_buf[16 + i + j - 512]); - d += window[i + j + 48]*( synth_buf[31 - i + j - 512]); + for ( ; j < 512; j += 64) { + a += window[i + j ] * (-synth_buf[15 - i + j - 512]); + b += window[i + j + 16] * ( synth_buf[ i + j - 512]); + c += window[i + j + 32] * ( synth_buf[16 + i + j - 512]); + d += window[i + j + 48] * ( synth_buf[31 - i + j - 512]); } - out[i ] = a*scale; - out[i + 16] = b*scale; + out[i ] = a * scale; + out[i + 16] = b * scale; synth_buf2[i ] = c; synth_buf2[i + 16] = d; } - *synth_buf_offset= (*synth_buf_offset - 32)&511; + + *synth_buf_offset = (*synth_buf_offset - 32) & 511; +} + +static void synth_filter_float_64(FFTContext *imdct, + float *synth_buf_ptr, int *synth_buf_offset, + float synth_buf2[64], const float window[1024], + float out[64], const float in[64], float scale) +{ + float *synth_buf = synth_buf_ptr + *synth_buf_offset; + int i, j; + + imdct->imdct_half(imdct, synth_buf, in); + + for (i = 0; i < 32; i++) { + float a = synth_buf2[i ]; + float b = synth_buf2[i + 32]; + float c = 0; + float d = 0; + for (j = 0; j < 1024 - *synth_buf_offset; j += 128) { + a += window[i + j ] * (-synth_buf[31 - i + j ]); + b += window[i + j + 32] * ( synth_buf[ i + j ]); + c += window[i + j + 64] * ( synth_buf[32 + i + j ]); + d += window[i + j + 96] * ( synth_buf[63 - i + j ]); + } + for ( ; j < 1024; j += 128) { + a += window[i + j ] * (-synth_buf[31 - i + j - 1024]); + b += window[i + j + 32] * ( synth_buf[ i + j - 1024]); + c += window[i + j + 64] * ( synth_buf[32 + i + j - 1024]); + d += window[i + j + 96] * ( synth_buf[63 - i + j - 1024]); + } + out[i ] = a * scale; + out[i + 32] = b * scale; + synth_buf2[i ] = c; + synth_buf2[i + 32] = d; + } + + *synth_buf_offset = (*synth_buf_offset - 64) & 1023; +} + +static void synth_filter_fixed(DCADCTContext *imdct, + int32_t *synth_buf_ptr, int *synth_buf_offset, + int32_t synth_buf2[32], const int32_t window[512], + int32_t out[32], const int32_t in[32]) +{ + int32_t *synth_buf = synth_buf_ptr + *synth_buf_offset; + int i, j; + + imdct->imdct_half[0](synth_buf, in); + + for (i = 0; i < 16; i++) { + int64_t a = synth_buf2[i ] * (INT64_C(1) << 21); + int64_t b = synth_buf2[i + 16] * (INT64_C(1) << 21); + int64_t c = 0; + int64_t d = 0; + for (j = 0; j < 512 - *synth_buf_offset; j += 64) { + a += (int64_t)window[i + j ] * synth_buf[ i + j ]; + b += (int64_t)window[i + j + 16] * synth_buf[15 - i + j ]; + c += (int64_t)window[i + j + 32] * synth_buf[16 + i + j ]; + d += (int64_t)window[i + j + 48] * synth_buf[31 - i + j ]; + } + for ( ; j < 512; j += 64) { + a += (int64_t)window[i + j ] * synth_buf[ i + j - 512]; + b += (int64_t)window[i + j + 16] * synth_buf[15 - i + j - 512]; + c += (int64_t)window[i + j + 32] * synth_buf[16 + i + j - 512]; + d += (int64_t)window[i + j + 48] * synth_buf[31 - i + j - 512]; + } + out[i ] = clip23(norm21(a)); + out[i + 16] = clip23(norm21(b)); + synth_buf2[i ] = norm21(c); + synth_buf2[i + 16] = norm21(d); + } + + *synth_buf_offset = (*synth_buf_offset - 32) & 511; +} + +static void synth_filter_fixed_64(DCADCTContext *imdct, + int32_t *synth_buf_ptr, int *synth_buf_offset, + int32_t synth_buf2[64], const int32_t window[1024], + int32_t out[64], const int32_t in[64]) +{ + int32_t *synth_buf = synth_buf_ptr + *synth_buf_offset; + int i, j; + + imdct->imdct_half[1](synth_buf, in); + + for (i = 0; i < 32; i++) { + int64_t a = synth_buf2[i ] * (INT64_C(1) << 20); + int64_t b = synth_buf2[i + 32] * (INT64_C(1) << 20); + int64_t c = 0; + int64_t d = 0; + for (j = 0; j < 1024 - *synth_buf_offset; j += 128) { + a += (int64_t)window[i + j ] * synth_buf[ i + j ]; + b += (int64_t)window[i + j + 32] * synth_buf[31 - i + j ]; + c += (int64_t)window[i + j + 64] * synth_buf[32 + i + j ]; + d += (int64_t)window[i + j + 96] * synth_buf[63 - i + j ]; + } + for ( ; j < 1024; j += 128) { + a += (int64_t)window[i + j ] * synth_buf[ i + j - 1024]; + b += (int64_t)window[i + j + 32] * synth_buf[31 - i + j - 1024]; + c += (int64_t)window[i + j + 64] * synth_buf[32 + i + j - 1024]; + d += (int64_t)window[i + j + 96] * synth_buf[63 - i + j - 1024]; + } + out[i ] = clip23(norm20(a)); + out[i + 32] = clip23(norm20(b)); + synth_buf2[i ] = norm20(c); + synth_buf2[i + 32] = norm20(d); + } + + *synth_buf_offset = (*synth_buf_offset - 64) & 1023; } av_cold void ff_synth_filter_init(SynthFilterContext *c) { - c->synth_filter_float = synth_filter_float; + c->synth_filter_float = synth_filter_float; + c->synth_filter_float_64 = synth_filter_float_64; + c->synth_filter_fixed = synth_filter_fixed; + c->synth_filter_fixed_64 = synth_filter_fixed_64; if (ARCH_AARCH64) ff_synth_filter_init_aarch64(c); |