| /* |
| * Copyright (c) 2011 The WebRTC project authors. All Rights Reserved. |
| * |
| * Use of this source code is governed by a BSD-style license |
| * that can be found in the LICENSE file in the root of the source |
| * tree. An additional intellectual property rights grant can be found |
| * in the file PATENTS. All contributing project authors may |
| * be found in the AUTHORS file in the root of the source tree. |
| */ |
| |
| |
| /* |
| * This file contains the function WebRtcSpl_ComplexFFT(). |
| * The description header can be found in signal_processing_library.h |
| * |
| */ |
| |
| #include "common_audio/signal_processing/complex_fft_tables.h" |
| #include "common_audio/signal_processing/include/signal_processing_library.h" |
| #include "rtc_base/system/arch.h" |
| |
| #define CFFTSFT 14 |
| #define CFFTRND 1 |
| #define CFFTRND2 16384 |
| |
| #define CIFFTSFT 14 |
| #define CIFFTRND 1 |
| |
| |
| int WebRtcSpl_ComplexFFT(int16_t frfi[], int stages, int mode) |
| { |
| int i, j, l, k, istep, n, m; |
| int16_t wr, wi; |
| int32_t tr32, ti32, qr32, qi32; |
| |
| /* The 1024-value is a constant given from the size of kSinTable1024[], |
| * and should not be changed depending on the input parameter 'stages' |
| */ |
| n = 1 << stages; |
| if (n > 1024) |
| return -1; |
| |
| l = 1; |
| k = 10 - 1; /* Constant for given kSinTable1024[]. Do not change |
| depending on the input parameter 'stages' */ |
| |
| if (mode == 0) |
| { |
| // mode==0: Low-complexity and Low-accuracy mode |
| while (l < n) |
| { |
| istep = l << 1; |
| |
| for (m = 0; m < l; ++m) |
| { |
| j = m << k; |
| |
| /* The 256-value is a constant given as 1/4 of the size of |
| * kSinTable1024[], and should not be changed depending on the input |
| * parameter 'stages'. It will result in 0 <= j < N_SINE_WAVE/2 |
| */ |
| wr = kSinTable1024[j + 256]; |
| wi = -kSinTable1024[j]; |
| |
| for (i = m; i < n; i += istep) |
| { |
| j = i + l; |
| |
| tr32 = (wr * frfi[2 * j] - wi * frfi[2 * j + 1]) >> 15; |
| |
| ti32 = (wr * frfi[2 * j + 1] + wi * frfi[2 * j]) >> 15; |
| |
| qr32 = (int32_t)frfi[2 * i]; |
| qi32 = (int32_t)frfi[2 * i + 1]; |
| frfi[2 * j] = (int16_t)((qr32 - tr32) >> 1); |
| frfi[2 * j + 1] = (int16_t)((qi32 - ti32) >> 1); |
| frfi[2 * i] = (int16_t)((qr32 + tr32) >> 1); |
| frfi[2 * i + 1] = (int16_t)((qi32 + ti32) >> 1); |
| } |
| } |
| |
| --k; |
| l = istep; |
| |
| } |
| |
| } else |
| { |
| // mode==1: High-complexity and High-accuracy mode |
| while (l < n) |
| { |
| istep = l << 1; |
| |
| for (m = 0; m < l; ++m) |
| { |
| j = m << k; |
| |
| /* The 256-value is a constant given as 1/4 of the size of |
| * kSinTable1024[], and should not be changed depending on the input |
| * parameter 'stages'. It will result in 0 <= j < N_SINE_WAVE/2 |
| */ |
| wr = kSinTable1024[j + 256]; |
| wi = -kSinTable1024[j]; |
| |
| #ifdef WEBRTC_ARCH_ARM_V7 |
| int32_t wri = 0; |
| __asm __volatile("pkhbt %0, %1, %2, lsl #16" : "=r"(wri) : |
| "r"((int32_t)wr), "r"((int32_t)wi)); |
| #endif |
| |
| for (i = m; i < n; i += istep) |
| { |
| j = i + l; |
| |
| #ifdef WEBRTC_ARCH_ARM_V7 |
| register int32_t frfi_r; |
| __asm __volatile( |
| "pkhbt %[frfi_r], %[frfi_even], %[frfi_odd]," |
| " lsl #16\n\t" |
| "smlsd %[tr32], %[wri], %[frfi_r], %[cfftrnd]\n\t" |
| "smladx %[ti32], %[wri], %[frfi_r], %[cfftrnd]\n\t" |
| :[frfi_r]"=&r"(frfi_r), |
| [tr32]"=&r"(tr32), |
| [ti32]"=r"(ti32) |
| :[frfi_even]"r"((int32_t)frfi[2*j]), |
| [frfi_odd]"r"((int32_t)frfi[2*j +1]), |
| [wri]"r"(wri), |
| [cfftrnd]"r"(CFFTRND)); |
| #else |
| tr32 = wr * frfi[2 * j] - wi * frfi[2 * j + 1] + CFFTRND; |
| |
| ti32 = wr * frfi[2 * j + 1] + wi * frfi[2 * j] + CFFTRND; |
| #endif |
| |
| tr32 >>= 15 - CFFTSFT; |
| ti32 >>= 15 - CFFTSFT; |
| |
| qr32 = ((int32_t)frfi[2 * i]) * (1 << CFFTSFT); |
| qi32 = ((int32_t)frfi[2 * i + 1]) * (1 << CFFTSFT); |
| |
| frfi[2 * j] = (int16_t)( |
| (qr32 - tr32 + CFFTRND2) >> (1 + CFFTSFT)); |
| frfi[2 * j + 1] = (int16_t)( |
| (qi32 - ti32 + CFFTRND2) >> (1 + CFFTSFT)); |
| frfi[2 * i] = (int16_t)( |
| (qr32 + tr32 + CFFTRND2) >> (1 + CFFTSFT)); |
| frfi[2 * i + 1] = (int16_t)( |
| (qi32 + ti32 + CFFTRND2) >> (1 + CFFTSFT)); |
| } |
| } |
| |
| --k; |
| l = istep; |
| } |
| } |
| return 0; |
| } |
| |
| int WebRtcSpl_ComplexIFFT(int16_t frfi[], int stages, int mode) |
| { |
| size_t i, j, l, istep, n, m; |
| int k, scale, shift; |
| int16_t wr, wi; |
| int32_t tr32, ti32, qr32, qi32; |
| int32_t tmp32, round2; |
| |
| /* The 1024-value is a constant given from the size of kSinTable1024[], |
| * and should not be changed depending on the input parameter 'stages' |
| */ |
| n = ((size_t)1) << stages; |
| if (n > 1024) |
| return -1; |
| |
| scale = 0; |
| |
| l = 1; |
| k = 10 - 1; /* Constant for given kSinTable1024[]. Do not change |
| depending on the input parameter 'stages' */ |
| |
| while (l < n) |
| { |
| // variable scaling, depending upon data |
| shift = 0; |
| round2 = 8192; |
| |
| tmp32 = WebRtcSpl_MaxAbsValueW16(frfi, 2 * n); |
| if (tmp32 > 13573) |
| { |
| shift++; |
| scale++; |
| round2 <<= 1; |
| } |
| if (tmp32 > 27146) |
| { |
| shift++; |
| scale++; |
| round2 <<= 1; |
| } |
| |
| istep = l << 1; |
| |
| if (mode == 0) |
| { |
| // mode==0: Low-complexity and Low-accuracy mode |
| for (m = 0; m < l; ++m) |
| { |
| j = m << k; |
| |
| /* The 256-value is a constant given as 1/4 of the size of |
| * kSinTable1024[], and should not be changed depending on the input |
| * parameter 'stages'. It will result in 0 <= j < N_SINE_WAVE/2 |
| */ |
| wr = kSinTable1024[j + 256]; |
| wi = kSinTable1024[j]; |
| |
| for (i = m; i < n; i += istep) |
| { |
| j = i + l; |
| |
| tr32 = (wr * frfi[2 * j] - wi * frfi[2 * j + 1]) >> 15; |
| |
| ti32 = (wr * frfi[2 * j + 1] + wi * frfi[2 * j]) >> 15; |
| |
| qr32 = (int32_t)frfi[2 * i]; |
| qi32 = (int32_t)frfi[2 * i + 1]; |
| frfi[2 * j] = (int16_t)((qr32 - tr32) >> shift); |
| frfi[2 * j + 1] = (int16_t)((qi32 - ti32) >> shift); |
| frfi[2 * i] = (int16_t)((qr32 + tr32) >> shift); |
| frfi[2 * i + 1] = (int16_t)((qi32 + ti32) >> shift); |
| } |
| } |
| } else |
| { |
| // mode==1: High-complexity and High-accuracy mode |
| |
| for (m = 0; m < l; ++m) |
| { |
| j = m << k; |
| |
| /* The 256-value is a constant given as 1/4 of the size of |
| * kSinTable1024[], and should not be changed depending on the input |
| * parameter 'stages'. It will result in 0 <= j < N_SINE_WAVE/2 |
| */ |
| wr = kSinTable1024[j + 256]; |
| wi = kSinTable1024[j]; |
| |
| #ifdef WEBRTC_ARCH_ARM_V7 |
| int32_t wri = 0; |
| __asm __volatile("pkhbt %0, %1, %2, lsl #16" : "=r"(wri) : |
| "r"((int32_t)wr), "r"((int32_t)wi)); |
| #endif |
| |
| for (i = m; i < n; i += istep) |
| { |
| j = i + l; |
| |
| #ifdef WEBRTC_ARCH_ARM_V7 |
| register int32_t frfi_r; |
| __asm __volatile( |
| "pkhbt %[frfi_r], %[frfi_even], %[frfi_odd], lsl #16\n\t" |
| "smlsd %[tr32], %[wri], %[frfi_r], %[cifftrnd]\n\t" |
| "smladx %[ti32], %[wri], %[frfi_r], %[cifftrnd]\n\t" |
| :[frfi_r]"=&r"(frfi_r), |
| [tr32]"=&r"(tr32), |
| [ti32]"=r"(ti32) |
| :[frfi_even]"r"((int32_t)frfi[2*j]), |
| [frfi_odd]"r"((int32_t)frfi[2*j +1]), |
| [wri]"r"(wri), |
| [cifftrnd]"r"(CIFFTRND) |
| ); |
| #else |
| |
| tr32 = wr * frfi[2 * j] - wi * frfi[2 * j + 1] + CIFFTRND; |
| |
| ti32 = wr * frfi[2 * j + 1] + wi * frfi[2 * j] + CIFFTRND; |
| #endif |
| tr32 >>= 15 - CIFFTSFT; |
| ti32 >>= 15 - CIFFTSFT; |
| |
| qr32 = ((int32_t)frfi[2 * i]) * (1 << CIFFTSFT); |
| qi32 = ((int32_t)frfi[2 * i + 1]) * (1 << CIFFTSFT); |
| |
| frfi[2 * j] = (int16_t)( |
| (qr32 - tr32 + round2) >> (shift + CIFFTSFT)); |
| frfi[2 * j + 1] = (int16_t)( |
| (qi32 - ti32 + round2) >> (shift + CIFFTSFT)); |
| frfi[2 * i] = (int16_t)( |
| (qr32 + tr32 + round2) >> (shift + CIFFTSFT)); |
| frfi[2 * i + 1] = (int16_t)( |
| (qi32 + ti32 + round2) >> (shift + CIFFTSFT)); |
| } |
| } |
| |
| } |
| --k; |
| l = istep; |
| } |
| return scale; |
| } |