/*
 *  Copyright (c) 2013 The WebRTC project authors. All Rights Reserved.
 *
 *  Use of this source code is governed by a BSD-style license
 *  that can be found in the LICENSE file in the root of the source
 *  tree. An additional intellectual property rights grant can be found
 *  in the file PATENTS.  All contributing project authors may
 *  be found in the AUTHORS file in the root of the source tree.
 */
105dea86a9c0ad69135561667a6912b26be0de692bandrew@webrtc.org
// Modified from the Chromium original:
// src/media/base/sinc_resampler.cc
135dea86a9c0ad69135561667a6912b26be0de692bandrew@webrtc.org
145dea86a9c0ad69135561667a6912b26be0de692bandrew@webrtc.org#include "webrtc/common_audio/resampler/sinc_resampler.h"
155dea86a9c0ad69135561667a6912b26be0de692bandrew@webrtc.org
165dea86a9c0ad69135561667a6912b26be0de692bandrew@webrtc.org#include <arm_neon.h>
175dea86a9c0ad69135561667a6912b26be0de692bandrew@webrtc.org
185dea86a9c0ad69135561667a6912b26be0de692bandrew@webrtc.orgnamespace webrtc {
195dea86a9c0ad69135561667a6912b26be0de692bandrew@webrtc.org
205dea86a9c0ad69135561667a6912b26be0de692bandrew@webrtc.orgfloat SincResampler::Convolve_NEON(const float* input_ptr, const float* k1,
215dea86a9c0ad69135561667a6912b26be0de692bandrew@webrtc.org                                   const float* k2,
225dea86a9c0ad69135561667a6912b26be0de692bandrew@webrtc.org                                   double kernel_interpolation_factor) {
235dea86a9c0ad69135561667a6912b26be0de692bandrew@webrtc.org  float32x4_t m_input;
245dea86a9c0ad69135561667a6912b26be0de692bandrew@webrtc.org  float32x4_t m_sums1 = vmovq_n_f32(0);
255dea86a9c0ad69135561667a6912b26be0de692bandrew@webrtc.org  float32x4_t m_sums2 = vmovq_n_f32(0);
265dea86a9c0ad69135561667a6912b26be0de692bandrew@webrtc.org
275dea86a9c0ad69135561667a6912b26be0de692bandrew@webrtc.org  const float* upper = input_ptr + kKernelSize;
285dea86a9c0ad69135561667a6912b26be0de692bandrew@webrtc.org  for (; input_ptr < upper; ) {
295dea86a9c0ad69135561667a6912b26be0de692bandrew@webrtc.org    m_input = vld1q_f32(input_ptr);
305dea86a9c0ad69135561667a6912b26be0de692bandrew@webrtc.org    input_ptr += 4;
315dea86a9c0ad69135561667a6912b26be0de692bandrew@webrtc.org    m_sums1 = vmlaq_f32(m_sums1, m_input, vld1q_f32(k1));
325dea86a9c0ad69135561667a6912b26be0de692bandrew@webrtc.org    k1 += 4;
335dea86a9c0ad69135561667a6912b26be0de692bandrew@webrtc.org    m_sums2 = vmlaq_f32(m_sums2, m_input, vld1q_f32(k2));
345dea86a9c0ad69135561667a6912b26be0de692bandrew@webrtc.org    k2 += 4;
355dea86a9c0ad69135561667a6912b26be0de692bandrew@webrtc.org  }
365dea86a9c0ad69135561667a6912b26be0de692bandrew@webrtc.org
375dea86a9c0ad69135561667a6912b26be0de692bandrew@webrtc.org  // Linearly interpolate the two "convolutions".
385dea86a9c0ad69135561667a6912b26be0de692bandrew@webrtc.org  m_sums1 = vmlaq_f32(
395dea86a9c0ad69135561667a6912b26be0de692bandrew@webrtc.org      vmulq_f32(m_sums1, vmovq_n_f32(1.0 - kernel_interpolation_factor)),
405dea86a9c0ad69135561667a6912b26be0de692bandrew@webrtc.org      m_sums2, vmovq_n_f32(kernel_interpolation_factor));
415dea86a9c0ad69135561667a6912b26be0de692bandrew@webrtc.org
425dea86a9c0ad69135561667a6912b26be0de692bandrew@webrtc.org  // Sum components together.
435dea86a9c0ad69135561667a6912b26be0de692bandrew@webrtc.org  float32x2_t m_half = vadd_f32(vget_high_f32(m_sums1), vget_low_f32(m_sums1));
445dea86a9c0ad69135561667a6912b26be0de692bandrew@webrtc.org  return vget_lane_f32(vpadd_f32(m_half, m_half), 0);
455dea86a9c0ad69135561667a6912b26be0de692bandrew@webrtc.org}
465dea86a9c0ad69135561667a6912b26be0de692bandrew@webrtc.org
475dea86a9c0ad69135561667a6912b26be0de692bandrew@webrtc.org}  // namespace webrtc
48