198913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project/* Copyright (C) 2004 Jean-Marc Valin */ 298913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project/** 398913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project @file vq_sse.h 498913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project @brief SSE-optimized vq routine 598913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project*/ 698913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project/* 798913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project Redistribution and use in source and binary forms, with or without 898913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project modification, are permitted provided that the following conditions 998913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project are met: 1098913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project 1198913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project - Redistributions of source code must retain the above copyright 1298913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project notice, this list of conditions and the following disclaimer. 1398913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project 1498913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project - Redistributions in binary form must reproduce the above copyright 1598913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project notice, this list of conditions and the following disclaimer in the 1698913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project documentation and/or other materials provided with the distribution. 1798913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project 1898913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project - Neither the name of the Xiph.org Foundation nor the names of its 1998913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project contributors may be used to endorse or promote products derived from 2098913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project this software without specific prior written permission. 2198913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project 2298913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS 2398913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT 2498913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR 2598913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR 2698913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, 2798913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, 2898913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR 2998913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF 3098913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING 3198913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS 3298913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 3398913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project*/ 3498913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project 3598913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project#define OVERRIDE_VQ_NBEST 3698913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Projectvoid vq_nbest(spx_word16_t *_in, const __m128 *codebook, int len, int entries, __m128 *E, int N, int *nbest, spx_word32_t *best_dist, char *stack) 3798913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project{ 3898913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project int i,j,k,used; 3998913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project VARDECL(float *dist); 4098913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project VARDECL(__m128 *in); 4198913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project __m128 half; 4298913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project used = 0; 4398913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project ALLOC(dist, entries, float); 4498913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project half = _mm_set_ps1(.5f); 4598913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project ALLOC(in, len, __m128); 4698913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project for (i=0;i<len;i++) 4798913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project in[i] = _mm_set_ps1(_in[i]); 4898913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project for (i=0;i<entries>>2;i++) 4998913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project { 5098913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project __m128 d = _mm_mul_ps(E[i], half); 5198913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project for (j=0;j<len;j++) 5298913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project d = _mm_sub_ps(d, _mm_mul_ps(in[j], *codebook++)); 5398913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project _mm_storeu_ps(dist+4*i, d); 5498913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project } 5598913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project for (i=0;i<entries;i++) 5698913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project { 5798913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project if (i<N || dist[i]<best_dist[N-1]) 5898913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project { 5998913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project for (k=N-1; (k >= 1) && (k > used || dist[i] < best_dist[k-1]); k--) 6098913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project { 6198913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project best_dist[k]=best_dist[k-1]; 6298913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project nbest[k] = nbest[k-1]; 6398913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project } 6498913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project best_dist[k]=dist[i]; 6598913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project nbest[k]=i; 6698913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project used++; 6798913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project } 6898913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project } 6998913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project} 7098913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project 7198913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project 7298913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project 7398913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project 7498913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project#define OVERRIDE_VQ_NBEST_SIGN 7598913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Projectvoid vq_nbest_sign(spx_word16_t *_in, const __m128 *codebook, int len, int entries, __m128 *E, int N, int *nbest, spx_word32_t *best_dist, char *stack) 7698913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project{ 7798913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project int i,j,k,used; 7898913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project VARDECL(float *dist); 7998913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project VARDECL(__m128 *in); 8098913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project __m128 half; 8198913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project used = 0; 8298913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project ALLOC(dist, entries, float); 8398913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project half = _mm_set_ps1(.5f); 8498913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project ALLOC(in, len, __m128); 8598913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project for (i=0;i<len;i++) 8698913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project in[i] = _mm_set_ps1(_in[i]); 8798913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project for (i=0;i<entries>>2;i++) 8898913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project { 8998913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project __m128 d = _mm_setzero_ps(); 9098913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project for (j=0;j<len;j++) 9198913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project d = _mm_add_ps(d, _mm_mul_ps(in[j], *codebook++)); 9298913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project _mm_storeu_ps(dist+4*i, d); 9398913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project } 9498913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project for (i=0;i<entries;i++) 9598913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project { 9698913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project int sign; 9798913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project if (dist[i]>0) 9898913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project { 9998913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project sign=0; 10098913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project dist[i]=-dist[i]; 10198913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project } else 10298913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project { 10398913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project sign=1; 10498913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project } 10598913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project dist[i] += .5f*((float*)E)[i]; 10698913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project if (i<N || dist[i]<best_dist[N-1]) 10798913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project { 10898913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project for (k=N-1; (k >= 1) && (k > used || dist[i] < best_dist[k-1]); k--) 10998913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project { 11098913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project best_dist[k]=best_dist[k-1]; 11198913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project nbest[k] = nbest[k-1]; 11298913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project } 11398913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project best_dist[k]=dist[i]; 11498913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project nbest[k]=i; 11598913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project used++; 11698913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project if (sign) 11798913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project nbest[k]+=entries; 11898913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project } 11998913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project } 12098913fed6520d8849fb2e246be943e04474aefaThe Android Open Source Project} 121