12bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian/* Copyright (c) 2008-2011 Octasic Inc.
22bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian   Written by Jean-Marc Valin */
32bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian/*
42bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian   Redistribution and use in source and binary forms, with or without
52bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian   modification, are permitted provided that the following conditions
62bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian   are met:
72bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian
82bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian   - Redistributions of source code must retain the above copyright
92bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian   notice, this list of conditions and the following disclaimer.
102bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian
112bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian   - Redistributions in binary form must reproduce the above copyright
122bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian   notice, this list of conditions and the following disclaimer in the
132bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian   documentation and/or other materials provided with the distribution.
142bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian
152bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian   THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
162bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian   ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
172bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian   LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
182bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian   A PARTICULAR PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR
192bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian   CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
202bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian   EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
212bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian   PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
222bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian   PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
232bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian   LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
242bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian   NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
252bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian   SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
262bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian*/
272bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian
282bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian#ifdef HAVE_CONFIG_H
292bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian#include "config.h"
302bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian#endif
312bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian
322bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian#include "opus_types.h"
332bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian#include "opus_defines.h"
342bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian
352bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian#include <math.h>
362bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian#include "mlp.h"
372bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian#include "arch.h"
382bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian#include "tansig_table.h"
392bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian#define MAX_NEURONS 100
402bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian
412bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian#if 0
422bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanianstatic OPUS_INLINE opus_val16 tansig_approx(opus_val32 _x) /* Q19 */
432bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian{
44c91ee5b5642fcc4969150f73d5f6848f88bf1638flim    int i;
45c91ee5b5642fcc4969150f73d5f6848f88bf1638flim    opus_val16 xx; /* Q11 */
46c91ee5b5642fcc4969150f73d5f6848f88bf1638flim    /*double x, y;*/
47c91ee5b5642fcc4969150f73d5f6848f88bf1638flim    opus_val16 dy, yy; /* Q14 */
48c91ee5b5642fcc4969150f73d5f6848f88bf1638flim    /*x = 1.9073e-06*_x;*/
49c91ee5b5642fcc4969150f73d5f6848f88bf1638flim    if (_x>=QCONST32(8,19))
50c91ee5b5642fcc4969150f73d5f6848f88bf1638flim        return QCONST32(1.,14);
51c91ee5b5642fcc4969150f73d5f6848f88bf1638flim    if (_x<=-QCONST32(8,19))
52c91ee5b5642fcc4969150f73d5f6848f88bf1638flim        return -QCONST32(1.,14);
53c91ee5b5642fcc4969150f73d5f6848f88bf1638flim    xx = EXTRACT16(SHR32(_x, 8));
54c91ee5b5642fcc4969150f73d5f6848f88bf1638flim    /*i = lrint(25*x);*/
55c91ee5b5642fcc4969150f73d5f6848f88bf1638flim    i = SHR32(ADD32(1024,MULT16_16(25, xx)),11);
56c91ee5b5642fcc4969150f73d5f6848f88bf1638flim    /*x -= .04*i;*/
57c91ee5b5642fcc4969150f73d5f6848f88bf1638flim    xx -= EXTRACT16(SHR32(MULT16_16(20972,i),8));
58c91ee5b5642fcc4969150f73d5f6848f88bf1638flim    /*x = xx*(1./2048);*/
59c91ee5b5642fcc4969150f73d5f6848f88bf1638flim    /*y = tansig_table[250+i];*/
60c91ee5b5642fcc4969150f73d5f6848f88bf1638flim    yy = tansig_table[250+i];
61c91ee5b5642fcc4969150f73d5f6848f88bf1638flim    /*y = yy*(1./16384);*/
62c91ee5b5642fcc4969150f73d5f6848f88bf1638flim    dy = 16384-MULT16_16_Q14(yy,yy);
63c91ee5b5642fcc4969150f73d5f6848f88bf1638flim    yy = yy + MULT16_16_Q14(MULT16_16_Q11(xx,dy),(16384 - MULT16_16_Q11(yy,xx)));
64c91ee5b5642fcc4969150f73d5f6848f88bf1638flim    return yy;
652bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian}
662bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian#else
672bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian/*extern const float tansig_table[501];*/
682bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanianstatic OPUS_INLINE float tansig_approx(float x)
692bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian{
70c91ee5b5642fcc4969150f73d5f6848f88bf1638flim    int i;
71c91ee5b5642fcc4969150f73d5f6848f88bf1638flim    float y, dy;
72c91ee5b5642fcc4969150f73d5f6848f88bf1638flim    float sign=1;
73c91ee5b5642fcc4969150f73d5f6848f88bf1638flim    /* Tests are reversed to catch NaNs */
742bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian    if (!(x<8))
752bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian        return 1;
762bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian    if (!(x>-8))
772bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian        return -1;
78c91ee5b5642fcc4969150f73d5f6848f88bf1638flim#ifndef FIXED_POINT
79c91ee5b5642fcc4969150f73d5f6848f88bf1638flim    /* Another check in case of -ffast-math */
80c91ee5b5642fcc4969150f73d5f6848f88bf1638flim    if (celt_isnan(x))
81c91ee5b5642fcc4969150f73d5f6848f88bf1638flim       return 0;
82c91ee5b5642fcc4969150f73d5f6848f88bf1638flim#endif
83c91ee5b5642fcc4969150f73d5f6848f88bf1638flim    if (x<0)
84c91ee5b5642fcc4969150f73d5f6848f88bf1638flim    {
85c91ee5b5642fcc4969150f73d5f6848f88bf1638flim       x=-x;
86c91ee5b5642fcc4969150f73d5f6848f88bf1638flim       sign=-1;
87c91ee5b5642fcc4969150f73d5f6848f88bf1638flim    }
88c91ee5b5642fcc4969150f73d5f6848f88bf1638flim    i = (int)floor(.5f+25*x);
89c91ee5b5642fcc4969150f73d5f6848f88bf1638flim    x -= .04f*i;
90c91ee5b5642fcc4969150f73d5f6848f88bf1638flim    y = tansig_table[i];
91c91ee5b5642fcc4969150f73d5f6848f88bf1638flim    dy = 1-y*y;
92c91ee5b5642fcc4969150f73d5f6848f88bf1638flim    y = y + x*dy*(1 - y*x);
93c91ee5b5642fcc4969150f73d5f6848f88bf1638flim    return sign*y;
942bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian}
952bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian#endif
962bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian
972bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian#if 0
982bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanianvoid mlp_process(const MLP *m, const opus_val16 *in, opus_val16 *out)
992bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian{
100c91ee5b5642fcc4969150f73d5f6848f88bf1638flim    int j;
101c91ee5b5642fcc4969150f73d5f6848f88bf1638flim    opus_val16 hidden[MAX_NEURONS];
102c91ee5b5642fcc4969150f73d5f6848f88bf1638flim    const opus_val16 *W = m->weights;
103c91ee5b5642fcc4969150f73d5f6848f88bf1638flim    /* Copy to tmp_in */
104c91ee5b5642fcc4969150f73d5f6848f88bf1638flim    for (j=0;j<m->topo[1];j++)
105c91ee5b5642fcc4969150f73d5f6848f88bf1638flim    {
106c91ee5b5642fcc4969150f73d5f6848f88bf1638flim        int k;
107c91ee5b5642fcc4969150f73d5f6848f88bf1638flim        opus_val32 sum = SHL32(EXTEND32(*W++),8);
108c91ee5b5642fcc4969150f73d5f6848f88bf1638flim        for (k=0;k<m->topo[0];k++)
109c91ee5b5642fcc4969150f73d5f6848f88bf1638flim            sum = MAC16_16(sum, in[k],*W++);
110c91ee5b5642fcc4969150f73d5f6848f88bf1638flim        hidden[j] = tansig_approx(sum);
111c91ee5b5642fcc4969150f73d5f6848f88bf1638flim    }
112c91ee5b5642fcc4969150f73d5f6848f88bf1638flim    for (j=0;j<m->topo[2];j++)
113c91ee5b5642fcc4969150f73d5f6848f88bf1638flim    {
114c91ee5b5642fcc4969150f73d5f6848f88bf1638flim        int k;
115c91ee5b5642fcc4969150f73d5f6848f88bf1638flim        opus_val32 sum = SHL32(EXTEND32(*W++),14);
116c91ee5b5642fcc4969150f73d5f6848f88bf1638flim        for (k=0;k<m->topo[1];k++)
117c91ee5b5642fcc4969150f73d5f6848f88bf1638flim            sum = MAC16_16(sum, hidden[k], *W++);
118c91ee5b5642fcc4969150f73d5f6848f88bf1638flim        out[j] = tansig_approx(EXTRACT16(PSHR32(sum,17)));
119c91ee5b5642fcc4969150f73d5f6848f88bf1638flim    }
1202bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian}
1212bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian#else
1222bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanianvoid mlp_process(const MLP *m, const float *in, float *out)
1232bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian{
1242bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian    int j;
1252bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian    float hidden[MAX_NEURONS];
1262bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian    const float *W = m->weights;
1272bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian    /* Copy to tmp_in */
1282bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian    for (j=0;j<m->topo[1];j++)
1292bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian    {
1302bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian        int k;
1312bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian        float sum = *W++;
1322bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian        for (k=0;k<m->topo[0];k++)
1332bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian            sum = sum + in[k]**W++;
1342bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian        hidden[j] = tansig_approx(sum);
1352bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian    }
1362bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian    for (j=0;j<m->topo[2];j++)
1372bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian    {
1382bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian        int k;
1392bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian        float sum = *W++;
1402bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian        for (k=0;k<m->topo[1];k++)
1412bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian            sum = sum + hidden[k]**W++;
1422bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian        out[j] = tansig_approx(sum);
1432bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian    }
1442bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian}
1452bd8b54017b5320bc0c1df9bf86f4cdc9f8db242Vignesh Venkatasubramanian#endif
146