134 lines
6.7 KiB
C
134 lines
6.7 KiB
C
/* ------------------------------------------------------------------
|
|
* Copyright (C) 1998-2009 PacketVideo
|
|
*
|
|
* Licensed under the Apache License, Version 2.0 (the "License");
|
|
* you may not use this file except in compliance with the License.
|
|
* You may obtain a copy of the License at
|
|
*
|
|
* http://www.apache.org/licenses/LICENSE-2.0
|
|
*
|
|
* Unless required by applicable law or agreed to in writing, software
|
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either
|
|
* express or implied.
|
|
* See the License for the specific language governing permissions
|
|
* and limitations under the License.
|
|
* -------------------------------------------------------------------
|
|
*/
|
|
/****************************************************************************************
|
|
Portions of this file are derived from the following 3GPP standard:
|
|
|
|
3GPP TS 26.073
|
|
ANSI-C code for the Adaptive Multi-Rate (AMR) speech codec
|
|
Available from http://www.3gpp.org
|
|
|
|
(C) 2004, 3GPP Organizational Partners (ARIB, ATIS, CCSA, ETSI, TTA, TTC)
|
|
Permission to distribute, modify and use this file under the standard license
|
|
terms listed above has been obtained from the copyright holder.
|
|
****************************************************************************************/
|
|
/*
|
|
********************************************************************************
|
|
**-------------------------------------------------------------------------**
|
|
** **
|
|
** GSM AMR-NB speech codec R98 Version 7.5.0 March 2, 2001 **
|
|
** R99 Version 3.2.0 **
|
|
** REL-4 Version 4.0.0 **
|
|
** **
|
|
**-------------------------------------------------------------------------**
|
|
********************************************************************************
|
|
*
|
|
* File : cnst_vad.h
|
|
* Purpose : Constants and definitions for VAD
|
|
*
|
|
********************************************************************************
|
|
*/
|
|
#ifndef cnst_vad_h
|
|
#define cnst_vad_h "$Id $"
|
|
|
|
#define FRAME_LEN 160 /* Length (samples) of the input frame */
|
|
#define COMPLEN 9 /* Number of sub-bands used by VAD */
|
|
#define INV_COMPLEN 3641 /* 1.0/COMPLEN*2^15 */
|
|
#define LOOKAHEAD 40 /* length of the lookahead used by speech coder */
|
|
|
|
#define UNITY 512 /* Scaling used with SNR calculation */
|
|
#define UNIRSHFT 6 /* = log2(MAX_16/UNITY) */
|
|
|
|
#define TONE_THR (Word16)(0.65*MAX_16) /* Threshold for tone detection */
|
|
|
|
/* Constants for background spectrum update */
|
|
#define ALPHA_UP1 (Word16)((1.0 - 0.95)*MAX_16) /* Normal update, upwards: */
|
|
#define ALPHA_DOWN1 (Word16)((1.0 - 0.936)*MAX_16) /* Normal update, downwards */
|
|
#define ALPHA_UP2 (Word16)((1.0 - 0.985)*MAX_16) /* Forced update, upwards */
|
|
#define ALPHA_DOWN2 (Word16)((1.0 - 0.943)*MAX_16) /* Forced update, downwards */
|
|
#define ALPHA3 (Word16)((1.0 - 0.95)*MAX_16) /* Update downwards */
|
|
#define ALPHA4 (Word16)((1.0 - 0.9)*MAX_16) /* For stationary estimation */
|
|
#define ALPHA5 (Word16)((1.0 - 0.5)*MAX_16) /* For stationary estimation */
|
|
|
|
/* Constants for VAD threshold */
|
|
#define VAD_THR_HIGH 1260 /* Highest threshold */
|
|
#define VAD_THR_LOW 720 /* Lowest threshold */
|
|
#define VAD_P1 0 /* Noise level for highest threshold */
|
|
#define VAD_P2 6300 /* Noise level for lowest threshold */
|
|
#define VAD_SLOPE (Word16)(MAX_16*(float)(VAD_THR_LOW-VAD_THR_HIGH)/(float)(VAD_P2-VAD_P1))
|
|
|
|
/* Parameters for background spectrum recovery function */
|
|
#define STAT_COUNT 20 /* threshold of stationary detection counter */
|
|
#define STAT_COUNT_BY_2 10 /* threshold of stationary detection counter */
|
|
#define CAD_MIN_STAT_COUNT 5 /* threshold of stationary detection counter */
|
|
|
|
#define STAT_THR_LEVEL 184 /* Threshold level for stationarity detection */
|
|
#define STAT_THR 1000 /* Threshold for stationarity detection */
|
|
|
|
/* Limits for background noise estimate */
|
|
#define NOISE_MIN 40 /* minimum */
|
|
#define NOISE_MAX 16000 /* maximum */
|
|
#define NOISE_INIT 150 /* initial */
|
|
|
|
/* Constants for VAD hangover addition */
|
|
#define HANG_NOISE_THR 100
|
|
#define BURST_LEN_HIGH_NOISE 4
|
|
#define HANG_LEN_HIGH_NOISE 7
|
|
#define BURST_LEN_LOW_NOISE 5
|
|
#define HANG_LEN_LOW_NOISE 4
|
|
|
|
/* Thresholds for signal power */
|
|
#define VAD_POW_LOW (Word32)15000 /* If input power is lower, */
|
|
/* VAD is set to 0 */
|
|
#define POW_PITCH_THR (Word32)343040 /* If input power is lower, pitch */
|
|
/* detection is ignored */
|
|
|
|
#define POW_COMPLEX_THR (Word32)15000 /* If input power is lower, complex */
|
|
/* flags value for previous frame is un-set */
|
|
|
|
|
|
/* Constants for the filter bank */
|
|
#define LEVEL_SHIFT 0 /* scaling */
|
|
#define COEFF3 13363 /* coefficient for the 3rd order filter */
|
|
#define COEFF5_1 21955 /* 1st coefficient the for 5th order filter */
|
|
#define COEFF5_2 6390 /* 2nd coefficient the for 5th order filter */
|
|
|
|
/* Constants for pitch detection */
|
|
#define LTHRESH 4
|
|
#define NTHRESH 4
|
|
|
|
/* Constants for complex signal VAD */
|
|
#define CVAD_THRESH_ADAPT_HIGH (Word16)(0.6 * MAX_16) /* threshold for adapt stopping high */
|
|
#define CVAD_THRESH_ADAPT_LOW (Word16)(0.5 * MAX_16) /* threshold for adapt stopping low */
|
|
#define CVAD_THRESH_IN_NOISE (Word16)(0.65 * MAX_16) /* threshold going into speech on */
|
|
/* a short term basis */
|
|
|
|
#define CVAD_THRESH_HANG (Word16)(0.70 * MAX_16) /* threshold */
|
|
#define CVAD_HANG_LIMIT (Word16)(100) /* 2 second estimation time */
|
|
#define CVAD_HANG_LENGTH (Word16)(250) /* 5 second hangover */
|
|
|
|
#define CVAD_LOWPOW_RESET (Word16) (0.40 * MAX_16) /* init in low power segment */
|
|
#define CVAD_MIN_CORR (Word16) (0.40 * MAX_16) /* lowest adaptation value */
|
|
|
|
#define CVAD_BURST 20 /* speech burst length for speech reset */
|
|
#define CVAD_ADAPT_SLOW (Word16)(( 1.0 - 0.98) * MAX_16) /* threshold for slow adaption */
|
|
#define CVAD_ADAPT_FAST (Word16)((1.0 - 0.92) * MAX_16) /* threshold for fast adaption */
|
|
#define CVAD_ADAPT_REALLY_FAST (Word16)((1.0 - 0.80) * MAX_16) /* threshold for really fast */
|
|
/* adaption */
|
|
|
|
#endif
|