1/*
2 *  Copyright (c) 2013 The WebRTC project authors. All Rights Reserved.
3 *
4 *  Use of this source code is governed by a BSD-style license
5 *  that can be found in the LICENSE file in the root of the source
6 *  tree. An additional intellectual property rights grant can be found
7 *  in the file PATENTS.  All contributing project authors may
8 *  be found in the AUTHORS file in the root of the source tree.
9 *
10 */
11
12#include "dl/api/omxtypes.h"
13#include "dl/sp/src/x86/x86SP_SSE_Math.h"
14
15void x86SP_FFT_CToC_FC32_Inv_Radix4_fs_sse(
16    const OMX_F32 *in,
17    OMX_F32 *out,
18    OMX_INT n) {
19  OMX_INT i;
20  OMX_INT n_by_4 = n >> 2;
21  OMX_F32 *out0 = out;
22
23  for (i = 0; i < n_by_4; i += 4) {
24    VC v_t0;
25    VC v_t1;
26    VC v_t2;
27    VC v_t3;
28    VC v_t4;
29    VC v_t5;
30    VC v_t6;
31    VC v_t7;
32
33    const OMX_F32 *in0 = in + i;
34    const OMX_F32 *in1 = in0 + n_by_4;
35    const OMX_F32 *in2 = in1 + n_by_4;
36    const OMX_F32 *in3 = in2 + n_by_4;
37
38    OMX_F32 *out1 = out0 + n_by_4;
39    OMX_F32 *out2 = out1 + n_by_4;
40    OMX_F32 *out3 = out2 + n_by_4;
41
42    VC_LOAD_SPLIT(&v_t0, in0, n);
43    VC_LOAD_SPLIT(&v_t1, in1, n);
44    VC_LOAD_SPLIT(&v_t2, in2, n);
45    VC_LOAD_SPLIT(&v_t3, in3, n);
46
47    RADIX4_BUTTERFLY_FS(&v_t4, &v_t5, &v_t6, &v_t7,
48                        &v_t0, &v_t1, &v_t2, &v_t3);
49
50    RADIX4_INV_BUTTERFLY_STORE(out0, out1, out2, out3,
51                               &v_t4, &v_t5, &v_t6, &v_t7, n);
52
53    out0 += 4;
54  }
55}
56