blob: 58908d3aa2b1554e66c1568fbe0a51fdbdc59080 [file] [log] [blame]
/*
* Copyright (c) 2013 The WebRTC project authors. All Rights Reserved.
*
* Use of this source code is governed by a BSD-style license
* that can be found in the LICENSE file in the root of the source
* tree. An additional intellectual property rights grant can be found
* in the file PATENTS. All contributing project authors may
* be found in the AUTHORS file in the root of the source tree.
*
*/
#include "dl/api/omxtypes.h"
#include "dl/sp/src/x86/x86SP_SSE_Math.h"
/*
 * Radix-4 butterfly pass over a float buffer using the SSE helpers from
 * x86SP_SSE_Math.h. Judging by the name this is the first stage ("fs") of
 * the forward complex-to-complex FFT -- confirm against the callers.
 *
 * in  - source floats; read through four pointers spaced n/2 floats apart.
 * out - destination floats; written through four pointers spaced n/4
 *       floats apart.
 * n   - transform size, also forwarded to the store helper. Presumably the
 *       number of complex points -- TODO confirm.
 *
 * Every pass advances the input offset by 8 floats and the output cursor by
 * 4 floats. The loop body never runs when (n >> 1) <= 0.
 */
void x86SP_FFT_CToC_FC32_Fwd_Radix4_fs_sse(
    const OMX_F32 *in,
    OMX_F32 *out,
    OMX_INT n) {
  const OMX_INT half = n >> 1;
  const OMX_INT quarter = n >> 2;
  OMX_F32 *dst0 = out;
  OMX_INT offset = 0;

  while (offset < half) {
    /* Butterfly inputs (x*) and results (y*), each with .real/.imag parts. */
    VC x0;
    VC x1;
    VC x2;
    VC x3;
    VC y0;
    VC y1;
    VC y2;
    VC y3;

    /* Four read positions, one per input segment of n/2 floats. */
    const OMX_F32 *src0 = in + offset;
    const OMX_F32 *src1 = src0 + half;
    const OMX_F32 *src2 = src1 + half;
    const OMX_F32 *src3 = src2 + half;

    /* Four write positions, one per output segment of n/4 floats. */
    OMX_F32 *dst1 = dst0 + quarter;
    OMX_F32 *dst2 = dst1 + quarter;
    OMX_F32 *dst3 = dst2 + quarter;

    VC_LOAD_SHUFFLE(&(x0.real), &(x0.imag), src0);
    VC_LOAD_SHUFFLE(&(x1.real), &(x1.imag), src1);
    VC_LOAD_SHUFFLE(&(x2.real), &(x2.imag), src2);
    VC_LOAD_SHUFFLE(&(x3.real), &(x3.imag), src3);

    RADIX4_BUTTERFLY_FS(&y0, &y1, &y2, &y3,
                        &x0, &x1, &x2, &x3);

    RADIX4_FWD_BUTTERFLY_STORE(dst0, dst1, dst2, dst3,
                               &y0, &y1, &y2, &y3, n);

    dst0 += 4;
    offset += 8;
  }
}