1*a58d3d2aSXin Li /* Copyright (c) 2023 Amazon */ 2*a58d3d2aSXin Li /* 3*a58d3d2aSXin Li Redistribution and use in source and binary forms, with or without 4*a58d3d2aSXin Li modification, are permitted provided that the following conditions 5*a58d3d2aSXin Li are met: 6*a58d3d2aSXin Li 7*a58d3d2aSXin Li - Redistributions of source code must retain the above copyright 8*a58d3d2aSXin Li notice, this list of conditions and the following disclaimer. 9*a58d3d2aSXin Li 10*a58d3d2aSXin Li - Redistributions in binary form must reproduce the above copyright 11*a58d3d2aSXin Li notice, this list of conditions and the following disclaimer in the 12*a58d3d2aSXin Li documentation and/or other materials provided with the distribution. 13*a58d3d2aSXin Li 14*a58d3d2aSXin Li THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS 15*a58d3d2aSXin Li ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT 16*a58d3d2aSXin Li LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR 17*a58d3d2aSXin Li A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER 18*a58d3d2aSXin Li OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, 19*a58d3d2aSXin Li EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, 20*a58d3d2aSXin Li PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR 21*a58d3d2aSXin Li PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF 22*a58d3d2aSXin Li LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING 23*a58d3d2aSXin Li NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS 24*a58d3d2aSXin Li SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 25*a58d3d2aSXin Li */ 26*a58d3d2aSXin Li 27*a58d3d2aSXin Li #ifndef FWGAN_H 28*a58d3d2aSXin Li #define FWGAN_H 29*a58d3d2aSXin Li 30*a58d3d2aSXin Li #include "freq.h" 31*a58d3d2aSXin Li #include "fwgan_data.h" 32*a58d3d2aSXin Li 33*a58d3d2aSXin Li #define FWGAN_CONT_SAMPLES 320 34*a58d3d2aSXin Li #define NB_SUBFRAMES 4 35*a58d3d2aSXin Li #define SUBFRAME_SIZE 40 36*a58d3d2aSXin Li #define FWGAN_FRAME_SIZE (NB_SUBFRAMES*SUBFRAME_SIZE) 37*a58d3d2aSXin Li #define CONT_PCM_INPUTS 320 38*a58d3d2aSXin Li #define MAX_CONT_SIZE CONT_NET_0_OUT_SIZE 39*a58d3d2aSXin Li #define FWGAN_GAMMA 0.92f 40*a58d3d2aSXin Li #define FWGAN_DEEMPHASIS 0.85f 41*a58d3d2aSXin Li 42*a58d3d2aSXin Li /* FIXME: Derive those from the model rather than hardcoding. */ 43*a58d3d2aSXin Li #define FWC1_STATE_SIZE 512 44*a58d3d2aSXin Li #define FWC2_STATE_SIZE 512 45*a58d3d2aSXin Li #define FWC3_STATE_SIZE 256 46*a58d3d2aSXin Li #define FWC4_STATE_SIZE 256 47*a58d3d2aSXin Li #define FWC5_STATE_SIZE 128 48*a58d3d2aSXin Li #define FWC6_STATE_SIZE 128 49*a58d3d2aSXin Li #define FWC7_STATE_SIZE 80 50*a58d3d2aSXin Li 51*a58d3d2aSXin Li typedef struct { 52*a58d3d2aSXin Li FWGAN model; 53*a58d3d2aSXin Li int arch; 54*a58d3d2aSXin Li int cont_initialized; 55*a58d3d2aSXin Li float embed_phase[2]; 56*a58d3d2aSXin Li float last_gain; 57*a58d3d2aSXin Li float last_lpc[LPC_ORDER]; 58*a58d3d2aSXin Li float syn_mem[LPC_ORDER]; 59*a58d3d2aSXin Li float preemph_mem; 60*a58d3d2aSXin Li float deemph_mem; 61*a58d3d2aSXin Li float pcm_buf[FWGAN_FRAME_SIZE]; 62*a58d3d2aSXin Li float cont[CONT_NET_10_OUT_SIZE]; 63*a58d3d2aSXin Li float cont_conv1_mem[FEAT_IN_CONV1_CONV_STATE_SIZE]; 64*a58d3d2aSXin Li float rnn_state[RNN_GRU_STATE_SIZE]; 65*a58d3d2aSXin Li float fwc1_state[FWC1_STATE_SIZE]; 66*a58d3d2aSXin Li float fwc2_state[FWC2_STATE_SIZE]; 67*a58d3d2aSXin Li float fwc3_state[FWC3_STATE_SIZE]; 68*a58d3d2aSXin Li float fwc4_state[FWC4_STATE_SIZE]; 69*a58d3d2aSXin Li float fwc5_state[FWC5_STATE_SIZE]; 70*a58d3d2aSXin Li float fwc6_state[FWC6_STATE_SIZE]; 71*a58d3d2aSXin Li float fwc7_state[FWC7_STATE_SIZE]; 72*a58d3d2aSXin Li } FWGANState; 73*a58d3d2aSXin Li 74*a58d3d2aSXin Li void fwgan_init(FWGANState *st); 75*a58d3d2aSXin Li int fwgan_load_model(FWGANState *st, const unsigned char *data, int len); 76*a58d3d2aSXin Li 77*a58d3d2aSXin Li void fwgan_cont(FWGANState *st, const float *pcm0, const float *features0); 78*a58d3d2aSXin Li 79*a58d3d2aSXin Li void fwgan_synthesize(FWGANState *st, float *pcm, const float *features); 80*a58d3d2aSXin Li void fwgan_synthesize_int(FWGANState *st, opus_int16 *pcm, const float *features); 81*a58d3d2aSXin Li 82*a58d3d2aSXin Li 83*a58d3d2aSXin Li #endif /* FWGAN_H */ 84