/* Copyright (c) 2008-2011 Octasic Inc.
   Written by Jean-Marc Valin */
/*
   Redistribution and use in source and binary forms, with or without
   modification, are permitted provided that the following conditions
   are met:

   - Redistributions of source code must retain the above copyright
   notice, this list of conditions and the following disclaimer.

   - Redistributions in binary form must reproduce the above copyright
   notice, this list of conditions and the following disclaimer in the
   documentation and/or other materials provided with the distribution.

   THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
   ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
   LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
   A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR
   CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
   EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
   PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
   PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
   LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
   NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
   SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
262bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian*/ 272bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian 282bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian#ifdef HAVE_CONFIG_H 292bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian#include "config.h" 302bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian#endif 312bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian 322bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian#include "opus_types.h" 332bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian#include "opus_defines.h" 342bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian 352bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian#include <math.h> 362bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian#include "mlp.h" 372bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian#include "arch.h" 382bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian#include "tansig_table.h" 392bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian#define MAX_NEURONS 100 402bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian 412bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian#if 0 422bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanianstatic OPUS_INLINE opus_val16 tansig_approx(opus_val32 _x) /* Q19 */ 432bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian{ 44c91ee5b5642fcc4969150f73d5f6848f88bf1638flim int i; 45c91ee5b5642fcc4969150f73d5f6848f88bf1638flim opus_val16 xx; /* Q11 */ 46c91ee5b5642fcc4969150f73d5f6848f88bf1638flim /*double x, y;*/ 47c91ee5b5642fcc4969150f73d5f6848f88bf1638flim opus_val16 dy, yy; /* Q14 */ 48c91ee5b5642fcc4969150f73d5f6848f88bf1638flim /*x = 1.9073e-06*_x;*/ 49c91ee5b5642fcc4969150f73d5f6848f88bf1638flim if (_x>=QCONST32(8,19)) 50c91ee5b5642fcc4969150f73d5f6848f88bf1638flim return QCONST32(1.,14); 
51c91ee5b5642fcc4969150f73d5f6848f88bf1638flim if (_x<=-QCONST32(8,19)) 52c91ee5b5642fcc4969150f73d5f6848f88bf1638flim return -QCONST32(1.,14); 53c91ee5b5642fcc4969150f73d5f6848f88bf1638flim xx = EXTRACT16(SHR32(_x, 8)); 54c91ee5b5642fcc4969150f73d5f6848f88bf1638flim /*i = lrint(25*x);*/ 55c91ee5b5642fcc4969150f73d5f6848f88bf1638flim i = SHR32(ADD32(1024,MULT16_16(25, xx)),11); 56c91ee5b5642fcc4969150f73d5f6848f88bf1638flim /*x -= .04*i;*/ 57c91ee5b5642fcc4969150f73d5f6848f88bf1638flim xx -= EXTRACT16(SHR32(MULT16_16(20972,i),8)); 58c91ee5b5642fcc4969150f73d5f6848f88bf1638flim /*x = xx*(1./2048);*/ 59c91ee5b5642fcc4969150f73d5f6848f88bf1638flim /*y = tansig_table[250+i];*/ 60c91ee5b5642fcc4969150f73d5f6848f88bf1638flim yy = tansig_table[250+i]; 61c91ee5b5642fcc4969150f73d5f6848f88bf1638flim /*y = yy*(1./16384);*/ 62c91ee5b5642fcc4969150f73d5f6848f88bf1638flim dy = 16384-MULT16_16_Q14(yy,yy); 63c91ee5b5642fcc4969150f73d5f6848f88bf1638flim yy = yy + MULT16_16_Q14(MULT16_16_Q11(xx,dy),(16384 - MULT16_16_Q11(yy,xx))); 64c91ee5b5642fcc4969150f73d5f6848f88bf1638flim return yy; 652bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian} 662bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian#else 672bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian/*extern const float tansig_table[501];*/ 682bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanianstatic OPUS_INLINE float tansig_approx(float x) 692bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian{ 70c91ee5b5642fcc4969150f73d5f6848f88bf1638flim int i; 71c91ee5b5642fcc4969150f73d5f6848f88bf1638flim float y, dy; 72c91ee5b5642fcc4969150f73d5f6848f88bf1638flim float sign=1; 73c91ee5b5642fcc4969150f73d5f6848f88bf1638flim /* Tests are reversed to catch NaNs */ 742bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian if (!(x<8)) 752bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian return 1; 762bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh 
Venkatasubramanian if (!(x>-8)) 772bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian return -1; 78c91ee5b5642fcc4969150f73d5f6848f88bf1638flim#ifndef FIXED_POINT 79c91ee5b5642fcc4969150f73d5f6848f88bf1638flim /* Another check in case of -ffast-math */ 80c91ee5b5642fcc4969150f73d5f6848f88bf1638flim if (celt_isnan(x)) 81c91ee5b5642fcc4969150f73d5f6848f88bf1638flim return 0; 82c91ee5b5642fcc4969150f73d5f6848f88bf1638flim#endif 83c91ee5b5642fcc4969150f73d5f6848f88bf1638flim if (x<0) 84c91ee5b5642fcc4969150f73d5f6848f88bf1638flim { 85c91ee5b5642fcc4969150f73d5f6848f88bf1638flim x=-x; 86c91ee5b5642fcc4969150f73d5f6848f88bf1638flim sign=-1; 87c91ee5b5642fcc4969150f73d5f6848f88bf1638flim } 88c91ee5b5642fcc4969150f73d5f6848f88bf1638flim i = (int)floor(.5f+25*x); 89c91ee5b5642fcc4969150f73d5f6848f88bf1638flim x -= .04f*i; 90c91ee5b5642fcc4969150f73d5f6848f88bf1638flim y = tansig_table[i]; 91c91ee5b5642fcc4969150f73d5f6848f88bf1638flim dy = 1-y*y; 92c91ee5b5642fcc4969150f73d5f6848f88bf1638flim y = y + x*dy*(1 - y*x); 93c91ee5b5642fcc4969150f73d5f6848f88bf1638flim return sign*y; 942bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian} 952bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian#endif 962bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian 972bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian#if 0 982bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanianvoid mlp_process(const MLP *m, const opus_val16 *in, opus_val16 *out) 992bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian{ 100c91ee5b5642fcc4969150f73d5f6848f88bf1638flim int j; 101c91ee5b5642fcc4969150f73d5f6848f88bf1638flim opus_val16 hidden[MAX_NEURONS]; 102c91ee5b5642fcc4969150f73d5f6848f88bf1638flim const opus_val16 *W = m->weights; 103c91ee5b5642fcc4969150f73d5f6848f88bf1638flim /* Copy to tmp_in */ 104c91ee5b5642fcc4969150f73d5f6848f88bf1638flim for (j=0;j<m->topo[1];j++) 
105c91ee5b5642fcc4969150f73d5f6848f88bf1638flim { 106c91ee5b5642fcc4969150f73d5f6848f88bf1638flim int k; 107c91ee5b5642fcc4969150f73d5f6848f88bf1638flim opus_val32 sum = SHL32(EXTEND32(*W++),8); 108c91ee5b5642fcc4969150f73d5f6848f88bf1638flim for (k=0;k<m->topo[0];k++) 109c91ee5b5642fcc4969150f73d5f6848f88bf1638flim sum = MAC16_16(sum, in[k],*W++); 110c91ee5b5642fcc4969150f73d5f6848f88bf1638flim hidden[j] = tansig_approx(sum); 111c91ee5b5642fcc4969150f73d5f6848f88bf1638flim } 112c91ee5b5642fcc4969150f73d5f6848f88bf1638flim for (j=0;j<m->topo[2];j++) 113c91ee5b5642fcc4969150f73d5f6848f88bf1638flim { 114c91ee5b5642fcc4969150f73d5f6848f88bf1638flim int k; 115c91ee5b5642fcc4969150f73d5f6848f88bf1638flim opus_val32 sum = SHL32(EXTEND32(*W++),14); 116c91ee5b5642fcc4969150f73d5f6848f88bf1638flim for (k=0;k<m->topo[1];k++) 117c91ee5b5642fcc4969150f73d5f6848f88bf1638flim sum = MAC16_16(sum, hidden[k], *W++); 118c91ee5b5642fcc4969150f73d5f6848f88bf1638flim out[j] = tansig_approx(EXTRACT16(PSHR32(sum,17))); 119c91ee5b5642fcc4969150f73d5f6848f88bf1638flim } 1202bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian} 1212bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian#else 1222bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanianvoid mlp_process(const MLP *m, const float *in, float *out) 1232bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian{ 1242bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian int j; 1252bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian float hidden[MAX_NEURONS]; 1262bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian const float *W = m->weights; 1272bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian /* Copy to tmp_in */ 1282bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian for (j=0;j<m->topo[1];j++) 1292bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian { 1302bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh 
Venkatasubramanian int k; 1312bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian float sum = *W++; 1322bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian for (k=0;k<m->topo[0];k++) 1332bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian sum = sum + in[k]**W++; 1342bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian hidden[j] = tansig_approx(sum); 1352bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian } 1362bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian for (j=0;j<m->topo[2];j++) 1372bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian { 1382bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian int k; 1392bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian float sum = *W++; 1402bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian for (k=0;k<m->topo[1];k++) 1412bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian sum = sum + hidden[k]**W++; 1422bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian out[j] = tansig_approx(sum); 1432bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian } 1442bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian} 1452bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian#endif 146