1 /*
2  ** Copyright 2003-2010, VisualOn, Inc.
3  **
4  ** Licensed under the Apache License, Version 2.0 (the "License");
5  ** you may not use this file except in compliance with the License.
6  ** You may obtain a copy of the License at
7  **
8  **     http://www.apache.org/licenses/LICENSE-2.0
9  **
10  ** Unless required by applicable law or agreed to in writing, software
11  ** distributed under the License is distributed on an "AS IS" BASIS,
12  ** WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13  ** See the License for the specific language governing permissions and
14  ** limitations under the License.
15  */
16 
17 
18 /*-------------------------------------------------------------------*
19  *                         WB_VAD.H                                  *
20  *-------------------------------------------------------------------*
21  * Functions and static memory for Voice Activity Detection.         *
22  *-------------------------------------------------------------------*/
23 
24 #ifndef __WB_VAD_H__
25 #define __WB_VAD_H__
26 
27 /******************************************************************************
28  *                         INCLUDE FILES
29  ******************************************************************************/
30 #include "typedef.h"
31 #include "wb_vad_c.h"
32 #include "voMem.h"
33 
34 /******************************************************************************
35  *                         DEFINITION OF DATA TYPES
36  ******************************************************************************/
37 
38 typedef struct
39 {
40     Word16 bckr_est[COMPLEN];              /* background noise estimate                */
41     Word16 ave_level[COMPLEN];             /* averaged input components for stationary */
42     /* estimation                               */
43     Word16 old_level[COMPLEN];             /* input levels of the previous frame       */
44     Word16 sub_level[COMPLEN];             /* input levels calculated at the end of a frame (lookahead)  */
45     Word16 a_data5[F_5TH_CNT][2];          /* memory for the filter bank               */
46     Word16 a_data3[F_3TH_CNT];             /* memory for the filter bank               */
47 
48     Word16 burst_count;                    /* counts length of a speech burst          */
49     Word16 hang_count;                     /* hangover counter                         */
50     Word16 stat_count;                     /* stationary counter                       */
51 
52     /* Note that each of the following two variables holds 15 flags. Each flag reserves 1 bit of the
53      * variable. The newest flag is in the bit 15 (assuming that LSB is bit 1 and MSB is bit 16). */
54     Word16 vadreg;                         /* flags for intermediate VAD decisions     */
55     Word16 tone_flag;                      /* tone detection flags                     */
56 
57     Word16 sp_est_cnt;                     /* counter for speech level estimation      */
58     Word16 sp_max;                         /* maximum level                            */
59     Word16 sp_max_cnt;                     /* counts frames that contains speech       */
60     Word16 speech_level;                   /* estimated speech level                   */
61     Word32 prev_pow_sum;                   /* power of previous frame                  */
62 
63 } VadVars;
64 
65 /********************************************************************************
66  *
67  * DECLARATION OF PROTOTYPES
68  ********************************************************************************/
69 
70 Word16 wb_vad_init(VadVars ** st, VO_MEM_OPERATOR *pMemOP);
71 Word16 wb_vad_reset(VadVars * st);
72 void wb_vad_exit(VadVars ** st, VO_MEM_OPERATOR *pMemOP);
73 void wb_vad_tone_detection(VadVars * st, Word16 p_gain);
74 Word16 wb_vad(VadVars * st, Word16 in_buf[]);
75 
76 #endif  //__WB_VAD_H__
77 
78 
79