79 lines
3.6 KiB
C
79 lines
3.6 KiB
C
|
/*
|
||
|
** Copyright 2003-2010, VisualOn, Inc.
|
||
|
**
|
||
|
** Licensed under the Apache License, Version 2.0 (the "License");
|
||
|
** you may not use this file except in compliance with the License.
|
||
|
** You may obtain a copy of the License at
|
||
|
**
|
||
|
** http://www.apache.org/licenses/LICENSE-2.0
|
||
|
**
|
||
|
** Unless required by applicable law or agreed to in writing, software
|
||
|
** distributed under the License is distributed on an "AS IS" BASIS,
|
||
|
** WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||
|
** See the License for the specific language governing permissions and
|
||
|
** limitations under the License.
|
||
|
*/
|
||
|
|
||
|
|
||
|
/*-------------------------------------------------------------------*
|
||
|
* WB_VAD.H *
|
||
|
*-------------------------------------------------------------------*
|
||
|
* Functions and static memory for Voice Activity Detection. *
|
||
|
*-------------------------------------------------------------------*/
|
||
|
|
||
|
#ifndef __WB_VAD_H__
|
||
|
#define __WB_VAD_H__
|
||
|
|
||
|
/******************************************************************************
|
||
|
* INCLUDE FILES
|
||
|
******************************************************************************/
|
||
|
#include "typedef.h"
|
||
|
#include "wb_vad_c.h"
|
||
|
#include "voMem.h"
|
||
|
|
||
|
/******************************************************************************
|
||
|
* DEFINITION OF DATA TYPES
|
||
|
******************************************************************************/
|
||
|
|
||
|
typedef struct
|
||
|
{
|
||
|
Word16 bckr_est[COMPLEN]; /* background noise estimate */
|
||
|
Word16 ave_level[COMPLEN]; /* averaged input components for stationary */
|
||
|
/* estimation */
|
||
|
Word16 old_level[COMPLEN]; /* input levels of the previous frame */
|
||
|
Word16 sub_level[COMPLEN]; /* input levels calculated at the end of a frame (lookahead) */
|
||
|
Word16 a_data5[F_5TH_CNT][2]; /* memory for the filter bank */
|
||
|
Word16 a_data3[F_3TH_CNT]; /* memory for the filter bank */
|
||
|
|
||
|
Word16 burst_count; /* counts length of a speech burst */
|
||
|
Word16 hang_count; /* hangover counter */
|
||
|
Word16 stat_count; /* stationary counter */
|
||
|
|
||
|
/* Note that each of the following two variables holds 15 flags. Each flag reserves 1 bit of the
|
||
|
* variable. The newest flag is in the bit 15 (assuming that LSB is bit 1 and MSB is bit 16). */
|
||
|
Word16 vadreg; /* flags for intermediate VAD decisions */
|
||
|
Word16 tone_flag; /* tone detection flags */
|
||
|
|
||
|
Word16 sp_est_cnt; /* counter for speech level estimation */
|
||
|
Word16 sp_max; /* maximum level */
|
||
|
Word16 sp_max_cnt; /* counts frames that contains speech */
|
||
|
Word16 speech_level; /* estimated speech level */
|
||
|
Word32 prev_pow_sum; /* power of previous frame */
|
||
|
|
||
|
} VadVars;
|
||
|
|
||
|
/********************************************************************************
|
||
|
*
|
||
|
* DECLARATION OF PROTOTYPES
|
||
|
********************************************************************************/
|
||
|
|
||
|
Word16 wb_vad_init(VadVars ** st, VO_MEM_OPERATOR *pMemOP);
|
||
|
Word16 wb_vad_reset(VadVars * st);
|
||
|
void wb_vad_exit(VadVars ** st, VO_MEM_OPERATOR *pMemOP);
|
||
|
void wb_vad_tone_detection(VadVars * st, Word16 p_gain);
|
||
|
Word16 wb_vad(VadVars * st, Word16 in_buf[]);
|
||
|
|
||
|
#endif //__WB_VAD_H__
|
||
|
|
||
|
|