/* ** Copyright 2003-2010, VisualOn, Inc. ** ** Licensed under the Apache License, Version 2.0 (the "License"); ** you may not use this file except in compliance with the License. ** You may obtain a copy of the License at ** ** http://www.apache.org/licenses/LICENSE-2.0 ** ** Unless required by applicable law or agreed to in writing, software ** distributed under the License is distributed on an "AS IS" BASIS, ** WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. ** See the License for the specific language governing permissions and ** limitations under the License. */ /*-------------------------------------------------------------------* * WB_VAD.H * *-------------------------------------------------------------------* * Functions and static memory for Voice Activity Detection. * *-------------------------------------------------------------------*/ #ifndef __WB_VAD_H__ #define __WB_VAD_H__ /****************************************************************************** * INCLUDE FILES ******************************************************************************/ #include "typedef.h" #include "wb_vad_c.h" #include "voMem.h" /****************************************************************************** * DEFINITION OF DATA TYPES ******************************************************************************/ typedef struct { Word16 bckr_est[COMPLEN]; /* background noise estimate */ Word16 ave_level[COMPLEN]; /* averaged input components for stationary */ /* estimation */ Word16 old_level[COMPLEN]; /* input levels of the previous frame */ Word16 sub_level[COMPLEN]; /* input levels calculated at the end of a frame (lookahead) */ Word16 a_data5[F_5TH_CNT][2]; /* memory for the filter bank */ Word16 a_data3[F_3TH_CNT]; /* memory for the filter bank */ Word16 burst_count; /* counts length of a speech burst */ Word16 hang_count; /* hangover counter */ Word16 stat_count; /* stationary counter */ /* Note that each of the following two variables holds 15 flags. Each flag reserves 1 bit of the * variable. The newest flag is in the bit 15 (assuming that LSB is bit 1 and MSB is bit 16). */ Word16 vadreg; /* flags for intermediate VAD decisions */ Word16 tone_flag; /* tone detection flags */ Word16 sp_est_cnt; /* counter for speech level estimation */ Word16 sp_max; /* maximum level */ Word16 sp_max_cnt; /* counts frames that contains speech */ Word16 speech_level; /* estimated speech level */ Word32 prev_pow_sum; /* power of previous frame */ } VadVars; /******************************************************************************** * * DECLARATION OF PROTOTYPES ********************************************************************************/ Word16 wb_vad_init(VadVars ** st, VO_MEM_OPERATOR *pMemOP); Word16 wb_vad_reset(VadVars * st); void wb_vad_exit(VadVars ** st, VO_MEM_OPERATOR *pMemOP); void wb_vad_tone_detection(VadVars * st, Word16 p_gain); Word16 wb_vad(VadVars * st, Word16 in_buf[]); #endif //__WB_VAD_H__