summaryrefslogtreecommitdiff
path: root/libavcodec/synth_filter.c
diff options
context:
space:
mode:
Diffstat (limited to 'libavcodec/synth_filter.c')
-rw-r--r--libavcodec/synth_filter.c169
1 files changed, 142 insertions, 27 deletions
diff --git a/libavcodec/synth_filter.c b/libavcodec/synth_filter.c
index 708bd4e00c..1c5dab5c5a 100644
--- a/libavcodec/synth_filter.c
+++ b/libavcodec/synth_filter.c
@@ -1,64 +1,179 @@
/*
* copyright (c) 2008 Michael Niedermayer <michaelni@gmx.at>
+ * Copyright (C) 2016 foo86
*
- * This file is part of Libav.
+ * This file is part of FFmpeg.
*
- * Libav is free software; you can redistribute it and/or
+ * FFmpeg is free software; you can redistribute it and/or
* modify it under the terms of the GNU Lesser General Public
* License as published by the Free Software Foundation; either
* version 2.1 of the License, or (at your option) any later version.
*
- * Libav is distributed in the hope that it will be useful,
+ * FFmpeg is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
* Lesser General Public License for more details.
*
* You should have received a copy of the GNU Lesser General Public
- * License along with Libav; if not, write to the Free Software
+ * License along with FFmpeg; if not, write to the Free Software
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
*/
#include "fft.h"
+#include "dcadct.h"
+#include "dcamath.h"
#include "synth_filter.h"
static void synth_filter_float(FFTContext *imdct,
- float *synth_buf_ptr, int *synth_buf_offset,
- float synth_buf2[32], const float window[512],
- float out[32], const float in[32], float scale)
+ float *synth_buf_ptr, int *synth_buf_offset,
+ float synth_buf2[32], const float window[512],
+ float out[32], const float in[32], float scale)
{
- float *synth_buf= synth_buf_ptr + *synth_buf_offset;
+ float *synth_buf = synth_buf_ptr + *synth_buf_offset;
int i, j;
imdct->imdct_half(imdct, synth_buf, in);
- for (i = 0; i < 16; i++){
- float a= synth_buf2[i ];
- float b= synth_buf2[i + 16];
- float c= 0;
- float d= 0;
- for (j = 0; j < 512 - *synth_buf_offset; j += 64){
- a += window[i + j ]*(-synth_buf[15 - i + j ]);
- b += window[i + j + 16]*( synth_buf[ i + j ]);
- c += window[i + j + 32]*( synth_buf[16 + i + j ]);
- d += window[i + j + 48]*( synth_buf[31 - i + j ]);
+ for (i = 0; i < 16; i++) {
+ float a = synth_buf2[i ];
+ float b = synth_buf2[i + 16];
+ float c = 0;
+ float d = 0;
+ for (j = 0; j < 512 - *synth_buf_offset; j += 64) {
+ a += window[i + j ] * (-synth_buf[15 - i + j ]);
+ b += window[i + j + 16] * ( synth_buf[ i + j ]);
+ c += window[i + j + 32] * ( synth_buf[16 + i + j ]);
+ d += window[i + j + 48] * ( synth_buf[31 - i + j ]);
}
- for ( ; j < 512; j += 64){
- a += window[i + j ]*(-synth_buf[15 - i + j - 512]);
- b += window[i + j + 16]*( synth_buf[ i + j - 512]);
- c += window[i + j + 32]*( synth_buf[16 + i + j - 512]);
- d += window[i + j + 48]*( synth_buf[31 - i + j - 512]);
+ for ( ; j < 512; j += 64) {
+ a += window[i + j ] * (-synth_buf[15 - i + j - 512]);
+ b += window[i + j + 16] * ( synth_buf[ i + j - 512]);
+ c += window[i + j + 32] * ( synth_buf[16 + i + j - 512]);
+ d += window[i + j + 48] * ( synth_buf[31 - i + j - 512]);
}
- out[i ] = a*scale;
- out[i + 16] = b*scale;
+ out[i ] = a * scale;
+ out[i + 16] = b * scale;
synth_buf2[i ] = c;
synth_buf2[i + 16] = d;
}
- *synth_buf_offset= (*synth_buf_offset - 32)&511;
+
+ *synth_buf_offset = (*synth_buf_offset - 32) & 511;
+}
+
+static void synth_filter_float_64(FFTContext *imdct,
+ float *synth_buf_ptr, int *synth_buf_offset,
+ float synth_buf2[64], const float window[1024],
+ float out[64], const float in[64], float scale)
+{
+ float *synth_buf = synth_buf_ptr + *synth_buf_offset;
+ int i, j;
+
+ imdct->imdct_half(imdct, synth_buf, in);
+
+ for (i = 0; i < 32; i++) {
+ float a = synth_buf2[i ];
+ float b = synth_buf2[i + 32];
+ float c = 0;
+ float d = 0;
+ for (j = 0; j < 1024 - *synth_buf_offset; j += 128) {
+ a += window[i + j ] * (-synth_buf[31 - i + j ]);
+ b += window[i + j + 32] * ( synth_buf[ i + j ]);
+ c += window[i + j + 64] * ( synth_buf[32 + i + j ]);
+ d += window[i + j + 96] * ( synth_buf[63 - i + j ]);
+ }
+ for ( ; j < 1024; j += 128) {
+ a += window[i + j ] * (-synth_buf[31 - i + j - 1024]);
+ b += window[i + j + 32] * ( synth_buf[ i + j - 1024]);
+ c += window[i + j + 64] * ( synth_buf[32 + i + j - 1024]);
+ d += window[i + j + 96] * ( synth_buf[63 - i + j - 1024]);
+ }
+ out[i ] = a * scale;
+ out[i + 32] = b * scale;
+ synth_buf2[i ] = c;
+ synth_buf2[i + 32] = d;
+ }
+
+ *synth_buf_offset = (*synth_buf_offset - 64) & 1023;
+}
+
+static void synth_filter_fixed(DCADCTContext *imdct,
+ int32_t *synth_buf_ptr, int *synth_buf_offset,
+ int32_t synth_buf2[32], const int32_t window[512],
+ int32_t out[32], const int32_t in[32])
+{
+ int32_t *synth_buf = synth_buf_ptr + *synth_buf_offset;
+ int i, j;
+
+ imdct->imdct_half[0](synth_buf, in);
+
+ for (i = 0; i < 16; i++) {
+ int64_t a = synth_buf2[i ] * (INT64_C(1) << 21);
+ int64_t b = synth_buf2[i + 16] * (INT64_C(1) << 21);
+ int64_t c = 0;
+ int64_t d = 0;
+ for (j = 0; j < 512 - *synth_buf_offset; j += 64) {
+ a += (int64_t)window[i + j ] * synth_buf[ i + j ];
+ b += (int64_t)window[i + j + 16] * synth_buf[15 - i + j ];
+ c += (int64_t)window[i + j + 32] * synth_buf[16 + i + j ];
+ d += (int64_t)window[i + j + 48] * synth_buf[31 - i + j ];
+ }
+ for ( ; j < 512; j += 64) {
+ a += (int64_t)window[i + j ] * synth_buf[ i + j - 512];
+ b += (int64_t)window[i + j + 16] * synth_buf[15 - i + j - 512];
+ c += (int64_t)window[i + j + 32] * synth_buf[16 + i + j - 512];
+ d += (int64_t)window[i + j + 48] * synth_buf[31 - i + j - 512];
+ }
+ out[i ] = clip23(norm21(a));
+ out[i + 16] = clip23(norm21(b));
+ synth_buf2[i ] = norm21(c);
+ synth_buf2[i + 16] = norm21(d);
+ }
+
+ *synth_buf_offset = (*synth_buf_offset - 32) & 511;
+}
+
+static void synth_filter_fixed_64(DCADCTContext *imdct,
+ int32_t *synth_buf_ptr, int *synth_buf_offset,
+ int32_t synth_buf2[64], const int32_t window[1024],
+ int32_t out[64], const int32_t in[64])
+{
+ int32_t *synth_buf = synth_buf_ptr + *synth_buf_offset;
+ int i, j;
+
+ imdct->imdct_half[1](synth_buf, in);
+
+ for (i = 0; i < 32; i++) {
+ int64_t a = synth_buf2[i ] * (INT64_C(1) << 20);
+ int64_t b = synth_buf2[i + 32] * (INT64_C(1) << 20);
+ int64_t c = 0;
+ int64_t d = 0;
+ for (j = 0; j < 1024 - *synth_buf_offset; j += 128) {
+ a += (int64_t)window[i + j ] * synth_buf[ i + j ];
+ b += (int64_t)window[i + j + 32] * synth_buf[31 - i + j ];
+ c += (int64_t)window[i + j + 64] * synth_buf[32 + i + j ];
+ d += (int64_t)window[i + j + 96] * synth_buf[63 - i + j ];
+ }
+ for ( ; j < 1024; j += 128) {
+ a += (int64_t)window[i + j ] * synth_buf[ i + j - 1024];
+ b += (int64_t)window[i + j + 32] * synth_buf[31 - i + j - 1024];
+ c += (int64_t)window[i + j + 64] * synth_buf[32 + i + j - 1024];
+ d += (int64_t)window[i + j + 96] * synth_buf[63 - i + j - 1024];
+ }
+ out[i ] = clip23(norm20(a));
+ out[i + 32] = clip23(norm20(b));
+ synth_buf2[i ] = norm20(c);
+ synth_buf2[i + 32] = norm20(d);
+ }
+
+ *synth_buf_offset = (*synth_buf_offset - 64) & 1023;
}
av_cold void ff_synth_filter_init(SynthFilterContext *c)
{
- c->synth_filter_float = synth_filter_float;
+ c->synth_filter_float = synth_filter_float;
+ c->synth_filter_float_64 = synth_filter_float_64;
+ c->synth_filter_fixed = synth_filter_fixed;
+ c->synth_filter_fixed_64 = synth_filter_fixed_64;
if (ARCH_AARCH64)
ff_synth_filter_init_aarch64(c);