xref: /aosp_15_r20/external/libopus/dnn/fargan.h (revision a58d3d2adb790c104798cd88c8a3aff4fa8b82cc)
1*a58d3d2aSXin Li /* Copyright (c) 2023 Amazon */
2*a58d3d2aSXin Li /*
3*a58d3d2aSXin Li    Redistribution and use in source and binary forms, with or without
4*a58d3d2aSXin Li    modification, are permitted provided that the following conditions
5*a58d3d2aSXin Li    are met:
6*a58d3d2aSXin Li 
7*a58d3d2aSXin Li    - Redistributions of source code must retain the above copyright
8*a58d3d2aSXin Li    notice, this list of conditions and the following disclaimer.
9*a58d3d2aSXin Li 
10*a58d3d2aSXin Li    - Redistributions in binary form must reproduce the above copyright
11*a58d3d2aSXin Li    notice, this list of conditions and the following disclaimer in the
12*a58d3d2aSXin Li    documentation and/or other materials provided with the distribution.
13*a58d3d2aSXin Li 
14*a58d3d2aSXin Li    THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
15*a58d3d2aSXin Li    ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
16*a58d3d2aSXin Li    LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
17*a58d3d2aSXin Li    A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER
18*a58d3d2aSXin Li    OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
19*a58d3d2aSXin Li    EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
20*a58d3d2aSXin Li    PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
21*a58d3d2aSXin Li    PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
22*a58d3d2aSXin Li    LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
23*a58d3d2aSXin Li    NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
24*a58d3d2aSXin Li    SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
25*a58d3d2aSXin Li */
26*a58d3d2aSXin Li 
27*a58d3d2aSXin Li #ifndef FARGAN_H
28*a58d3d2aSXin Li #define FARGAN_H
29*a58d3d2aSXin Li 
30*a58d3d2aSXin Li #include "freq.h"
31*a58d3d2aSXin Li #include "fargan_data.h"
32*a58d3d2aSXin Li #include "pitchdnn.h"
33*a58d3d2aSXin Li 
34*a58d3d2aSXin Li #define FARGAN_CONT_SAMPLES 320
35*a58d3d2aSXin Li #define FARGAN_NB_SUBFRAMES 4
36*a58d3d2aSXin Li #define FARGAN_SUBFRAME_SIZE 40
37*a58d3d2aSXin Li #define FARGAN_FRAME_SIZE (FARGAN_NB_SUBFRAMES*FARGAN_SUBFRAME_SIZE)
38*a58d3d2aSXin Li #define FARGAN_COND_SIZE (COND_NET_FDENSE2_OUT_SIZE/FARGAN_NB_SUBFRAMES)
39*a58d3d2aSXin Li #define FARGAN_DEEMPHASIS 0.85f
40*a58d3d2aSXin Li 
41*a58d3d2aSXin Li #define SIG_NET_INPUT_SIZE (FARGAN_COND_SIZE+2*FARGAN_SUBFRAME_SIZE+4)
42*a58d3d2aSXin Li #define SIG_NET_FWC0_STATE_SIZE (2*SIG_NET_INPUT_SIZE)
43*a58d3d2aSXin Li 
44*a58d3d2aSXin Li #define FARGAN_MAX_RNN_NEURONS SIG_NET_GRU1_OUT_SIZE
45*a58d3d2aSXin Li typedef struct {
46*a58d3d2aSXin Li   FARGAN model;
47*a58d3d2aSXin Li   int arch;
48*a58d3d2aSXin Li   int cont_initialized;
49*a58d3d2aSXin Li   float deemph_mem;
50*a58d3d2aSXin Li   float pitch_buf[PITCH_MAX_PERIOD];
51*a58d3d2aSXin Li   float cond_conv1_state[COND_NET_FCONV1_STATE_SIZE];
52*a58d3d2aSXin Li   float fwc0_mem[SIG_NET_FWC0_STATE_SIZE];
53*a58d3d2aSXin Li   float gru1_state[SIG_NET_GRU1_STATE_SIZE];
54*a58d3d2aSXin Li   float gru2_state[SIG_NET_GRU2_STATE_SIZE];
55*a58d3d2aSXin Li   float gru3_state[SIG_NET_GRU3_STATE_SIZE];
56*a58d3d2aSXin Li   int last_period;
57*a58d3d2aSXin Li } FARGANState;
58*a58d3d2aSXin Li 
59*a58d3d2aSXin Li void fargan_init(FARGANState *st);
60*a58d3d2aSXin Li int fargan_load_model(FARGANState *st, const void *data, int len);
61*a58d3d2aSXin Li 
62*a58d3d2aSXin Li void fargan_cont(FARGANState *st, const float *pcm0, const float *features0);
63*a58d3d2aSXin Li 
64*a58d3d2aSXin Li void fargan_synthesize(FARGANState *st, float *pcm, const float *features);
65*a58d3d2aSXin Li void fargan_synthesize_int(FARGANState *st, opus_int16 *pcm, const float *features);
66*a58d3d2aSXin Li 
67*a58d3d2aSXin Li 
68*a58d3d2aSXin Li #endif /* FARGAN_H */
69