/*
 *===================================================================
 *  3GPP AMR Wideband Floating-point Speech Codec
 *===================================================================
 */
#ifndef ENC_F_DTX_H
#define ENC_F_DTX_H

#include "typedef.h"

/* Sizing constants for the DTX and VAD state structures declared in this header. */
#define M               16       /* Order of LP filter; with DTX_HIST_SIZE, sizes mem_isf */
#define DTX_HIST_SIZE   8        /* Length of the DTX history buffers, in frames (8)      */
#define COMPLEN         12       /* Number of sub-bands used by VAD     */
#define F_5TH_CNT       5        /* Number of 5th order filters in VAD  */
#define F_3TH_CNT       6        /* Number of 3rd order filters in VAD  */

/*
 * Encoder-side DTX (discontinuous transmission) state.
 *
 * Holds the ISF and log-energy histories (DTX_HIST_SIZE frames each), the
 * distance bookkeeping derived from the ISF history, and the counters/seed
 * used by the DTX handler.
 */
typedef struct {
   Float32 mem_isf[M * DTX_HIST_SIZE]; /* ISF history, M * DTX_HIST_SIZE values */
   /*
    * ISF history distance matrix. The size is written in terms of
    * DTX_HIST_SIZE instead of a bare literal; it evaluates to 28 for the
    * 8-frame history, i.e. the number of distinct frame pairs.
    * NOTE(review): confirm the implementation indexes this as a pairwise
    * (triangular) matrix before ever changing DTX_HIST_SIZE.
    */
   Float32 mem_distance[DTX_HIST_SIZE * (DTX_HIST_SIZE - 1) / 2];
   Float32 mem_distance_sum[DTX_HIST_SIZE];/* Sum of ISF history distances   */
   Float32 mem_log_en[DTX_HIST_SIZE];  /* logarithmic frame energy history   */

   Word16 mem_hist_ptr;             /* pointer to the cyclic history vectors */
   Word16 mem_log_en_index;         /* Index for logarithmic energy          */
   Word16 mem_cng_seed;             /* Comfort noise excitation seed         */
   Word16 mem_dtx_hangover_count;   /* DTX hangover period                   */
   Word16 mem_dec_ana_elapsed_count;/* counter for elapsed speech frames     */
                                    /* in DTX                                */
} E_DTX_State;


/*
 * Voice activity detector (VAD) state carried from frame to frame.
 *
 * Per-sub-band arrays have COMPLEN entries; the filter bank memories are
 * sized by F_5TH_CNT and F_3TH_CNT.
 */
typedef struct {

   Float64 mem_pow_sum;             /* power of previous frame               */

   Float32 mem_bckr_est[COMPLEN];   /* background noise estimate             */
   Float32 mem_ave_level[COMPLEN];  /* averaged input components             */
                                    /* for stationary estimation             */
   Float32 mem_level[COMPLEN];      /* input levels of the previous frame    */
   Float32 mem_sub_level[COMPLEN];  /* input levels calculated at the end of */
                                    /* a frame (lookahead)                   */
   Float32 mem_a_data5[F_5TH_CNT][2];/* filter bank memory: two values per   */
                                    /* 5th order filter                      */
   Float32 mem_a_data3[F_3TH_CNT];  /* filter bank memory: one value per     */
                                    /* 3rd order filter                      */

   Float32 mem_sp_max;              /* maximum level                         */
   Float32 mem_speech_level;        /* estimated speech level                */

   Word16 mem_burst_count;          /* counts length of a speech burst       */
   Word16 mem_hang_count;           /* hangover counter                      */
   Word16 mem_stat_count;           /* stationary counter                    */
   Word16 mem_vadreg;               /* flags for intermediate VAD decisions  */
   Word16 mem_pitch_tone;           /* flags for pitch and tone detection    */
   Word16 mem_sp_est_cnt;           /* counter for speech level estimation   */
   Word16 mem_sp_max_cnt;           /* counts frames that contain speech     */

} E_DTX_Vad_State;

/*
 * DTX encoder state lifecycle.
 * NOTE(review): init/exit take E_DTX_State ** — presumably they allocate and
 * release the state and update the caller's pointer, with the Word32 result
 * of init/reset being a status code; confirm against the implementation.
 */
Word32 E_DTX_init(E_DTX_State **st);
Word32 E_DTX_reset(E_DTX_State *st);
void E_DTX_exit(E_DTX_State **st);

/*
 * DTX encoder processing.
 * NOTE(review): usedMode and pt_prms are passed by pointer, so they are
 * presumably updated by the callee (mode selection / parameter write
 * position); verify in the implementation before relying on this.
 */
void E_DTX_tx_handler(E_DTX_State *st, Word32 vad_flag, Word16 *usedMode);
void E_DTX_buffer(E_DTX_State *st, Float32 isf_new[], Float32 enr,
                  Word16 codec_mode);
void E_DTX_exe(E_DTX_State *st, Float32 *exc2, Word16 **pt_prms);

/*
 * VAD state lifecycle; signatures mirror the DTX state functions above.
 * NOTE(review): same allocation/status assumptions apply — confirm.
 */
Word32 E_DTX_vad_init(E_DTX_Vad_State **st);
Word32 E_DTX_vad_reset(E_DTX_Vad_State *st);
void E_DTX_vad_exit(E_DTX_Vad_State **st);

/*
 * VAD processing on an E_DTX_Vad_State.
 * NOTE(review): the meaning of the Word16 returned by E_DTX_vad and the
 * required length of in_buf are not visible in this header; confirm.
 */
void E_DTX_pitch_tone_detection(E_DTX_Vad_State *st, Float32 p_gain);
Word16 E_DTX_vad(E_DTX_Vad_State *st, Float32 in_buf[]);

#endif