1 /* 2 ** Copyright 2003-2010, VisualOn, Inc. 3 ** 4 ** Licensed under the Apache License, Version 2.0 (the "License"); 5 ** you may not use this file except in compliance with the License. 6 ** You may obtain a copy of the License at 7 ** 8 ** http://www.apache.org/licenses/LICENSE-2.0 9 ** 10 ** Unless required by applicable law or agreed to in writing, software 11 ** distributed under the License is distributed on an "AS IS" BASIS, 12 ** WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 13 ** See the License for the specific language governing permissions and 14 ** limitations under the License. 15 */ 16 17 18 /*-------------------------------------------------------------------* 19 * WB_VAD.H * 20 *-------------------------------------------------------------------* 21 * Functions and static memory for Voice Activity Detection. * 22 *-------------------------------------------------------------------*/ 23 24 #ifndef __WB_VAD_H__ 25 #define __WB_VAD_H__ 26 27 /****************************************************************************** 28 * INCLUDE FILES 29 ******************************************************************************/ 30 #include "typedef.h" 31 #include "wb_vad_c.h" 32 #include "voMem.h" 33 34 /****************************************************************************** 35 * DEFINITION OF DATA TYPES 36 ******************************************************************************/ 37 38 typedef struct 39 { 40 Word16 bckr_est[COMPLEN]; /* background noise estimate */ 41 Word16 ave_level[COMPLEN]; /* averaged input components for stationary */ 42 /* estimation */ 43 Word16 old_level[COMPLEN]; /* input levels of the previous frame */ 44 Word16 sub_level[COMPLEN]; /* input levels calculated at the end of a frame (lookahead) */ 45 Word16 a_data5[F_5TH_CNT][2]; /* memory for the filter bank */ 46 Word16 a_data3[F_3TH_CNT]; /* memory for the filter bank */ 47 48 Word16 burst_count; /* counts length of a speech burst */ 49 Word16 hang_count; /* hangover counter */ 50 Word16 stat_count; /* stationary counter */ 51 52 /* Note that each of the following two variables holds 15 flags. Each flag reserves 1 bit of the 53 * variable. The newest flag is in the bit 15 (assuming that LSB is bit 1 and MSB is bit 16). */ 54 Word16 vadreg; /* flags for intermediate VAD decisions */ 55 Word16 tone_flag; /* tone detection flags */ 56 57 Word16 sp_est_cnt; /* counter for speech level estimation */ 58 Word16 sp_max; /* maximum level */ 59 Word16 sp_max_cnt; /* counts frames that contains speech */ 60 Word16 speech_level; /* estimated speech level */ 61 Word32 prev_pow_sum; /* power of previous frame */ 62 63 } VadVars; 64 65 /******************************************************************************** 66 * 67 * DECLARATION OF PROTOTYPES 68 ********************************************************************************/ 69 70 Word16 wb_vad_init(VadVars ** st, VO_MEM_OPERATOR *pMemOP); 71 Word16 wb_vad_reset(VadVars * st); 72 void wb_vad_exit(VadVars ** st, VO_MEM_OPERATOR *pMemOP); 73 void wb_vad_tone_detection(VadVars * st, Word16 p_gain); 74 Word16 wb_vad(VadVars * st, Word16 in_buf[]); 75 76 #endif //__WB_VAD_H__ 77 78 79