gps/GPSResources/tcpmp 0.73/amr/26204/enc_dtx.h

73 lines
3.6 KiB
C
Raw Normal View History

2019-05-01 12:32:35 +00:00
/*
*===================================================================
* 3GPP AMR Wideband Floating-point Speech Codec
*===================================================================
*/
#ifndef ENC_F_DTX_H
#define ENC_F_DTX_H
#include "typedef.h"
/* Compile-time dimensions used by the DTX and VAD state structures below. */
#define M 16 /* Order of LP filter; with DTX_HIST_SIZE it sizes mem_isf */
#define DTX_HIST_SIZE 8 /* Length of the DTX history buffers, in frames */
#define COMPLEN 12 /* Number of sub-bands used by VAD; sizes the per-band level arrays */
#define F_5TH_CNT 5 /* Number of 5th order filters in VAD */
#define F_3TH_CNT 6 /* Number of 3rd order filters in VAD */
/*
 * DTX state of the encoder: per-frame histories dimensioned by
 * DTX_HIST_SIZE plus a set of 16-bit indices and counters.
 * How each field is updated is defined by the implementation, which is
 * not visible in this header.
 */
typedef struct {
/* M * DTX_HIST_SIZE values. NOTE(review): the original comment said "LSP */
/* history" while the field name says ISF - confirm which domain is stored. */
Float32 mem_isf[M * DTX_HIST_SIZE]; /* LSP history */
/* 28 == DTX_HIST_SIZE * (DTX_HIST_SIZE - 1) / 2; presumably one entry per */
/* pair of history frames - TODO confirm against the implementation. */
Float32 mem_distance[28]; /* ISF history distance matrix */
Float32 mem_distance_sum[DTX_HIST_SIZE];/* Sum of ISF history distances, one per history frame */
Float32 mem_log_en[DTX_HIST_SIZE]; /* logarithmic frame energy history, one per history frame */
Word16 mem_hist_ptr; /* pointer (index) to the cyclic history vectors */
Word16 mem_log_en_index; /* Index for logarithmic energy */
Word16 mem_cng_seed; /* Comfort noise excitation seed */
Word16 mem_dtx_hangover_count; /* DTX hangover period */
Word16 mem_dec_ana_elapsed_count;/* counter for elapsed speech frames in DTX */
} E_DTX_State;
/*
 * Voice activity detector (VAD) state carried between frames: per-sub-band
 * level estimates (COMPLEN entries each), filter-bank memories, speech
 * level tracking values and a set of 16-bit counters and flag words.
 */
typedef struct {
Float64 mem_pow_sum; /* power of previous frame (double precision) */
Float32 mem_bckr_est[COMPLEN]; /* background noise estimate, one per sub-band */
Float32 mem_ave_level[COMPLEN]; /* averaged input components for stationary estimation */
Float32 mem_level[COMPLEN]; /* input levels of the previous frame */
Float32 mem_sub_level[COMPLEN]; /* input levels calculated at the end of a frame (lookahead) */
Float32 mem_a_data5[F_5TH_CNT][2];/* filter bank memory: two values per 5th order filter */
Float32 mem_a_data3[F_3TH_CNT]; /* filter bank memory: one value per 3rd order filter */
Float32 mem_sp_max; /* maximum level */
Float32 mem_speech_level; /* estimated speech level */
Word16 mem_burst_count; /* counts length of a speech burst */
Word16 mem_hang_count; /* hangover counter */
Word16 mem_stat_count; /* stationary counter */
Word16 mem_vadreg; /* flags for intermediate VAD decisions */
Word16 mem_pitch_tone; /* flags for pitch and tone detection */
Word16 mem_sp_est_cnt; /* counter for speech level estimation */
Word16 mem_sp_max_cnt; /* counts frames that contain speech */
} E_DTX_Vad_State;
/*
 * DTX state life cycle and processing entry points.
 * NOTE(review): the definitions are not in this header. The descriptions
 * below are inferred from names and signatures - confirm against the
 * implementation file before relying on them.
 */

/* Presumably creates a DTX state and stores it in *st; the Word32 result is */
/* presumably a status code - TODO confirm its values. */
Word32 E_DTX_init(E_DTX_State **st);
/* Presumably puts an existing DTX state back to its initial values. */
Word32 E_DTX_reset(E_DTX_State *st);
/* Presumably releases the state referenced through st (takes E_DTX_State **). */
void E_DTX_exit(E_DTX_State **st);
/* Takes the VAD decision (vad_flag) and a pointer to the mode in use; */
/* usedMode is non-const, so it may be written - TODO confirm. */
void E_DTX_tx_handler(E_DTX_State *st, Word32 vad_flag, Word16 *usedMode);
/* Takes a new ISF vector and an energy value (enr) for the given codec mode; */
/* presumably stores them in the history buffers of st - TODO confirm. */
void E_DTX_buffer(E_DTX_State *st, Float32 isf_new[], Float32 enr,
Word16 codec_mode);
/* Takes an excitation buffer (exc2) and a pointer to a parameter pointer */
/* (pt_prms); the double indirection suggests the parameter pointer is */
/* advanced by the callee - TODO confirm. */
void E_DTX_exe(E_DTX_State *st, Float32 *exc2, Word16 **pt_prms);

/* VAD state counterparts of E_DTX_init / E_DTX_reset / E_DTX_exit. */
Word32 E_DTX_vad_init(E_DTX_Vad_State **st);
Word32 E_DTX_vad_reset(E_DTX_Vad_State *st);
void E_DTX_vad_exit(E_DTX_Vad_State **st);
/* Takes a pitch gain (p_gain); presumably updates the pitch/tone flags held */
/* in st (see mem_pitch_tone) - TODO confirm. */
void E_DTX_pitch_tone_detection(E_DTX_Vad_State *st, Float32 p_gain);
/* Runs the VAD on an input buffer and returns a Word16 result, presumably */
/* the voice activity decision - TODO confirm value range and in_buf length. */
Word16 E_DTX_vad(E_DTX_Vad_State *st, Float32 in_buf[]);
#endif