1*a58d3d2aSXin Li /* Copyright (c) 2023 Amazon */ 2*a58d3d2aSXin Li /* 3*a58d3d2aSXin Li Redistribution and use in source and binary forms, with or without 4*a58d3d2aSXin Li modification, are permitted provided that the following conditions 5*a58d3d2aSXin Li are met: 6*a58d3d2aSXin Li 7*a58d3d2aSXin Li - Redistributions of source code must retain the above copyright 8*a58d3d2aSXin Li notice, this list of conditions and the following disclaimer. 9*a58d3d2aSXin Li 10*a58d3d2aSXin Li - Redistributions in binary form must reproduce the above copyright 11*a58d3d2aSXin Li notice, this list of conditions and the following disclaimer in the 12*a58d3d2aSXin Li documentation and/or other materials provided with the distribution. 13*a58d3d2aSXin Li 14*a58d3d2aSXin Li THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS 15*a58d3d2aSXin Li ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT 16*a58d3d2aSXin Li LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR 17*a58d3d2aSXin Li A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER 18*a58d3d2aSXin Li OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, 19*a58d3d2aSXin Li EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, 20*a58d3d2aSXin Li PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR 21*a58d3d2aSXin Li PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF 22*a58d3d2aSXin Li LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING 23*a58d3d2aSXin Li NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS 24*a58d3d2aSXin Li SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 25*a58d3d2aSXin Li */ 26*a58d3d2aSXin Li 27*a58d3d2aSXin Li #ifndef FARGAN_H 28*a58d3d2aSXin Li #define FARGAN_H 29*a58d3d2aSXin Li 30*a58d3d2aSXin Li #include "freq.h" 31*a58d3d2aSXin Li #include "fargan_data.h" 32*a58d3d2aSXin Li #include "pitchdnn.h" 33*a58d3d2aSXin Li 34*a58d3d2aSXin Li #define FARGAN_CONT_SAMPLES 320 35*a58d3d2aSXin Li #define FARGAN_NB_SUBFRAMES 4 36*a58d3d2aSXin Li #define FARGAN_SUBFRAME_SIZE 40 37*a58d3d2aSXin Li #define FARGAN_FRAME_SIZE (FARGAN_NB_SUBFRAMES*FARGAN_SUBFRAME_SIZE) 38*a58d3d2aSXin Li #define FARGAN_COND_SIZE (COND_NET_FDENSE2_OUT_SIZE/FARGAN_NB_SUBFRAMES) 39*a58d3d2aSXin Li #define FARGAN_DEEMPHASIS 0.85f 40*a58d3d2aSXin Li 41*a58d3d2aSXin Li #define SIG_NET_INPUT_SIZE (FARGAN_COND_SIZE+2*FARGAN_SUBFRAME_SIZE+4) 42*a58d3d2aSXin Li #define SIG_NET_FWC0_STATE_SIZE (2*SIG_NET_INPUT_SIZE) 43*a58d3d2aSXin Li 44*a58d3d2aSXin Li #define FARGAN_MAX_RNN_NEURONS SIG_NET_GRU1_OUT_SIZE 45*a58d3d2aSXin Li typedef struct { 46*a58d3d2aSXin Li FARGAN model; 47*a58d3d2aSXin Li int arch; 48*a58d3d2aSXin Li int cont_initialized; 49*a58d3d2aSXin Li float deemph_mem; 50*a58d3d2aSXin Li float pitch_buf[PITCH_MAX_PERIOD]; 51*a58d3d2aSXin Li float cond_conv1_state[COND_NET_FCONV1_STATE_SIZE]; 52*a58d3d2aSXin Li float fwc0_mem[SIG_NET_FWC0_STATE_SIZE]; 53*a58d3d2aSXin Li float gru1_state[SIG_NET_GRU1_STATE_SIZE]; 54*a58d3d2aSXin Li float gru2_state[SIG_NET_GRU2_STATE_SIZE]; 55*a58d3d2aSXin Li float gru3_state[SIG_NET_GRU3_STATE_SIZE]; 56*a58d3d2aSXin Li int last_period; 57*a58d3d2aSXin Li } FARGANState; 58*a58d3d2aSXin Li 59*a58d3d2aSXin Li void fargan_init(FARGANState *st); 60*a58d3d2aSXin Li int fargan_load_model(FARGANState *st, const void *data, int len); 61*a58d3d2aSXin Li 62*a58d3d2aSXin Li void fargan_cont(FARGANState *st, const float *pcm0, const float *features0); 63*a58d3d2aSXin Li 64*a58d3d2aSXin Li void fargan_synthesize(FARGANState *st, float *pcm, const float *features); 65*a58d3d2aSXin Li void fargan_synthesize_int(FARGANState *st, opus_int16 *pcm, const float *features); 66*a58d3d2aSXin Li 67*a58d3d2aSXin Li 68*a58d3d2aSXin Li #endif /* FARGAN_H */ 69