| /* |
| ** Copyright 2003-2010, VisualOn, Inc. |
| ** |
| ** Licensed under the Apache License, Version 2.0 (the "License"); |
| ** you may not use this file except in compliance with the License. |
| ** You may obtain a copy of the License at |
| ** |
| ** http://www.apache.org/licenses/LICENSE-2.0 |
| ** |
| ** Unless required by applicable law or agreed to in writing, software |
| ** distributed under the License is distributed on an "AS IS" BASIS, |
| ** WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| ** See the License for the specific language governing permissions and |
| ** limitations under the License. |
| */ |
| |
| |
| /*-------------------------------------------------------------------* |
| * WB_VAD.H * |
| *-------------------------------------------------------------------* |
| * Functions and static memory for Voice Activity Detection. * |
| *-------------------------------------------------------------------*/ |
| |
| #ifndef __WB_VAD_H__ |
| #define __WB_VAD_H__ |
| |
| /****************************************************************************** |
| * INCLUDE FILES |
| ******************************************************************************/ |
| #include "typedef.h" |
| #include "wb_vad_c.h" |
| #include "voMem.h" |
| |
| /****************************************************************************** |
| * DEFINITION OF DATA TYPES |
| ******************************************************************************/ |
| |
| typedef struct |
| { |
| Word16 bckr_est[COMPLEN]; /* background noise estimate */ |
| Word16 ave_level[COMPLEN]; /* averaged input components for stationary */ |
| /* estimation */ |
| Word16 old_level[COMPLEN]; /* input levels of the previous frame */ |
| Word16 sub_level[COMPLEN]; /* input levels calculated at the end of a frame (lookahead) */ |
| Word16 a_data5[F_5TH_CNT][2]; /* memory for the filter bank */ |
| Word16 a_data3[F_3TH_CNT]; /* memory for the filter bank */ |
| |
| Word16 burst_count; /* counts length of a speech burst */ |
| Word16 hang_count; /* hangover counter */ |
| Word16 stat_count; /* stationary counter */ |
| |
| /* Note that each of the following two variables holds 15 flags. Each flag reserves 1 bit of the |
| * variable. The newest flag is in the bit 15 (assuming that LSB is bit 1 and MSB is bit 16). */ |
| Word16 vadreg; /* flags for intermediate VAD decisions */ |
| Word16 tone_flag; /* tone detection flags */ |
| |
| Word16 sp_est_cnt; /* counter for speech level estimation */ |
| Word16 sp_max; /* maximum level */ |
| Word16 sp_max_cnt; /* counts frames that contains speech */ |
| Word16 speech_level; /* estimated speech level */ |
| Word32 prev_pow_sum; /* power of previous frame */ |
| |
| } VadVars; |
| |
| /******************************************************************************** |
| * |
| * DECLARATION OF PROTOTYPES |
| ********************************************************************************/ |
| |
| Word16 wb_vad_init(VadVars ** st, VO_MEM_OPERATOR *pMemOP); |
| Word16 wb_vad_reset(VadVars * st); |
| void wb_vad_exit(VadVars ** st, VO_MEM_OPERATOR *pMemOP); |
| void wb_vad_tone_detection(VadVars * st, Word16 p_gain); |
| Word16 wb_vad(VadVars * st, Word16 in_buf[]); |
| |
| #endif //__WB_VAD_H__ |
| |
| |