-
Notifications
You must be signed in to change notification settings - Fork 24
/
wb_vad.h
54 lines (45 loc) · 2.33 KB
/
wb_vad.h
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
#ifndef wb_vad_h
#define wb_vad_h
/******************************************************************************
* INCLUDE FILES
******************************************************************************/
#include "typedef.h"
#include "wb_vad_c.h"
/******************************************************************************
* DEFINITION OF DATA TYPES
******************************************************************************/
typedef struct
{
float bckr_est[COMPLEN]; /* background noise estimate */
float ave_level[COMPLEN]; /* averaged input components for stationary */
/* estimation */
float old_level[COMPLEN]; /* input levels of the previous frame */
float sub_level[COMPLEN]; /* input levels calculated at the end of a frame (lookahead) */
float a_data5[F_5TH_CNT][2]; /* memory for the filter bank */
float a_data3[F_3TH_CNT]; /* memory for the filter bank */
Word16 burst_count; /* counts length of a speech burst */
Word16 hang_count; /* hangover counter */
Word16 stat_count; /* stationary counter */
/* Note that each of the following two variables holds 15 flags. Each flag reserves 1 bit of the variable. The newest flag is
* in the bit 15 (assuming that LSB is bit 1 and MSB is bit 16). */
Word16 vadreg; /* flags for intermediate VAD decisions */
Word16 pitch_tone; /* flags for pitch and tone detection */
Word16 sp_est_cnt; /* counter for speech level estimation */
float sp_max; /* maximum level */
Word16 sp_max_cnt; /* counts frames that contains speech */
float speech_level; /* estimated speech level */
double prev_pow_sum; /* power of previous frame */
float level[COMPLEN];
float prevLevel[COMPLEN];
} VadVars;
/*
********************************************************************************
* DECLARATION OF PROTOTYPES
********************************************************************************
*/
int wb_vad_init(VadVars ** st);
int wb_vad_reset(VadVars * st);
void wb_vad_exit(VadVars ** st);
void wb_vad_pitch_tone_detection(VadVars * st, float p_gain);
Word16 wb_vad(VadVars * st, float in_buf[]);
#endif