xref: /aosp_15_r20/external/libopus/dnn/fwgan.h (revision a58d3d2adb790c104798cd88c8a3aff4fa8b82cc)
1*a58d3d2aSXin Li /* Copyright (c) 2023 Amazon */
2*a58d3d2aSXin Li /*
3*a58d3d2aSXin Li    Redistribution and use in source and binary forms, with or without
4*a58d3d2aSXin Li    modification, are permitted provided that the following conditions
5*a58d3d2aSXin Li    are met:
6*a58d3d2aSXin Li 
7*a58d3d2aSXin Li    - Redistributions of source code must retain the above copyright
8*a58d3d2aSXin Li    notice, this list of conditions and the following disclaimer.
9*a58d3d2aSXin Li 
10*a58d3d2aSXin Li    - Redistributions in binary form must reproduce the above copyright
11*a58d3d2aSXin Li    notice, this list of conditions and the following disclaimer in the
12*a58d3d2aSXin Li    documentation and/or other materials provided with the distribution.
13*a58d3d2aSXin Li 
14*a58d3d2aSXin Li    THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
15*a58d3d2aSXin Li    ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
16*a58d3d2aSXin Li    LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
17*a58d3d2aSXin Li    A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER
18*a58d3d2aSXin Li    OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
19*a58d3d2aSXin Li    EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
20*a58d3d2aSXin Li    PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
21*a58d3d2aSXin Li    PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
22*a58d3d2aSXin Li    LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
23*a58d3d2aSXin Li    NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
24*a58d3d2aSXin Li    SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
25*a58d3d2aSXin Li */
26*a58d3d2aSXin Li 
27*a58d3d2aSXin Li #ifndef FWGAN_H
28*a58d3d2aSXin Li #define FWGAN_H
29*a58d3d2aSXin Li 
30*a58d3d2aSXin Li #include "freq.h"
31*a58d3d2aSXin Li #include "fwgan_data.h"
32*a58d3d2aSXin Li 
33*a58d3d2aSXin Li #define FWGAN_CONT_SAMPLES 320
34*a58d3d2aSXin Li #define NB_SUBFRAMES 4
35*a58d3d2aSXin Li #define SUBFRAME_SIZE 40
36*a58d3d2aSXin Li #define FWGAN_FRAME_SIZE (NB_SUBFRAMES*SUBFRAME_SIZE)
37*a58d3d2aSXin Li #define CONT_PCM_INPUTS 320
38*a58d3d2aSXin Li #define MAX_CONT_SIZE CONT_NET_0_OUT_SIZE
39*a58d3d2aSXin Li #define FWGAN_GAMMA 0.92f
40*a58d3d2aSXin Li #define FWGAN_DEEMPHASIS 0.85f
41*a58d3d2aSXin Li 
42*a58d3d2aSXin Li /* FIXME: Derive those from the model rather than hardcoding. */
43*a58d3d2aSXin Li #define FWC1_STATE_SIZE 512
44*a58d3d2aSXin Li #define FWC2_STATE_SIZE 512
45*a58d3d2aSXin Li #define FWC3_STATE_SIZE 256
46*a58d3d2aSXin Li #define FWC4_STATE_SIZE 256
47*a58d3d2aSXin Li #define FWC5_STATE_SIZE 128
48*a58d3d2aSXin Li #define FWC6_STATE_SIZE 128
49*a58d3d2aSXin Li #define FWC7_STATE_SIZE 80
50*a58d3d2aSXin Li 
51*a58d3d2aSXin Li typedef struct {
52*a58d3d2aSXin Li   FWGAN model;
53*a58d3d2aSXin Li   int arch;
54*a58d3d2aSXin Li   int cont_initialized;
55*a58d3d2aSXin Li   float embed_phase[2];
56*a58d3d2aSXin Li   float last_gain;
57*a58d3d2aSXin Li   float last_lpc[LPC_ORDER];
58*a58d3d2aSXin Li   float syn_mem[LPC_ORDER];
59*a58d3d2aSXin Li   float preemph_mem;
60*a58d3d2aSXin Li   float deemph_mem;
61*a58d3d2aSXin Li   float pcm_buf[FWGAN_FRAME_SIZE];
62*a58d3d2aSXin Li   float cont[CONT_NET_10_OUT_SIZE];
63*a58d3d2aSXin Li   float cont_conv1_mem[FEAT_IN_CONV1_CONV_STATE_SIZE];
64*a58d3d2aSXin Li   float rnn_state[RNN_GRU_STATE_SIZE];
65*a58d3d2aSXin Li   float fwc1_state[FWC1_STATE_SIZE];
66*a58d3d2aSXin Li   float fwc2_state[FWC2_STATE_SIZE];
67*a58d3d2aSXin Li   float fwc3_state[FWC3_STATE_SIZE];
68*a58d3d2aSXin Li   float fwc4_state[FWC4_STATE_SIZE];
69*a58d3d2aSXin Li   float fwc5_state[FWC5_STATE_SIZE];
70*a58d3d2aSXin Li   float fwc6_state[FWC6_STATE_SIZE];
71*a58d3d2aSXin Li   float fwc7_state[FWC7_STATE_SIZE];
72*a58d3d2aSXin Li } FWGANState;
73*a58d3d2aSXin Li 
74*a58d3d2aSXin Li void fwgan_init(FWGANState *st);
75*a58d3d2aSXin Li int fwgan_load_model(FWGANState *st, const unsigned char *data, int len);
76*a58d3d2aSXin Li 
77*a58d3d2aSXin Li void fwgan_cont(FWGANState *st, const float *pcm0, const float *features0);
78*a58d3d2aSXin Li 
79*a58d3d2aSXin Li void fwgan_synthesize(FWGANState *st, float *pcm, const float *features);
80*a58d3d2aSXin Li void fwgan_synthesize_int(FWGANState *st, opus_int16 *pcm, const float *features);
81*a58d3d2aSXin Li 
82*a58d3d2aSXin Li 
83*a58d3d2aSXin Li #endif /* FWGAN_H */
84