/* path: root/media/libstagefright/codecs/amrnb/common/include/vad1.h
 * blob: c144ea0249ef9c4152713eb26904b8f6d446cf5e */
/* ------------------------------------------------------------------
 * Copyright (C) 1998-2009 PacketVideo
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either
 * express or implied.
 * See the License for the specific language governing permissions
 * and limitations under the License.
 * -------------------------------------------------------------------
 */
/****************************************************************************************
Portions of this file are derived from the following 3GPP standard:

    3GPP TS 26.073
    ANSI-C code for the Adaptive Multi-Rate (AMR) speech codec
    Available from http://www.3gpp.org

(C) 2004, 3GPP Organizational Partners (ARIB, ATIS, CCSA, ETSI, TTA, TTC)
Permission to distribute, modify and use this file under the standard license
terms listed above has been obtained from the copyright holder.
****************************************************************************************/
/*

 Filename: /audio/gsm_amr/c/include/vad_1.h

------------------------------------------------------------------------------
 REVISION HISTORY

 Description: Placed header file in the proper template format.  Added
 parameter pOverflow for the basic math ops.

 Description:  Replaced "int" and/or "char" with OSCL defined types.

 Description: Moved __cplusplus #ifdef after Include section.

 Description:

------------------------------------------------------------------------------
 INCLUDE DESCRIPTION

 This file contains all the constant definitions, prototypes and structure
 definitions needed by vad_1.c.

------------------------------------------------------------------------------
*/

/*----------------------------------------------------------------------------
; CONTINUE ONLY IF NOT ALREADY DEFINED
----------------------------------------------------------------------------*/
#ifndef vad_1_h
#define vad_1_h "$Id $"

/*----------------------------------------------------------------------------
; INCLUDES
----------------------------------------------------------------------------*/
#include "typedef.h"
#include "cnst_vad.h"

/*--------------------------------------------------------------------------*/
#ifdef __cplusplus
extern "C"
{
#endif

    /*----------------------------------------------------------------------------
    ; MACROS
    ; Define module specific macros here
    ----------------------------------------------------------------------------*/

    /*----------------------------------------------------------------------------
    ; DEFINES
    ; Include all pre-processor statements here.
    ----------------------------------------------------------------------------*/

    /*----------------------------------------------------------------------------
    ; EXTERNAL VARIABLES REFERENCES
    ; Declare variables used in this module but defined elsewhere
    ----------------------------------------------------------------------------*/

    /*----------------------------------------------------------------------------
    ; SIMPLE TYPEDEF'S
    ----------------------------------------------------------------------------*/

    /*----------------------------------------------------------------------------
    ; ENUMERATED TYPEDEF'S
    ----------------------------------------------------------------------------*/

    /*----------------------------------------------------------------------------
    ; STRUCTURES TYPEDEF'S
    ----------------------------------------------------------------------------*/
    /*
     * vadState1 -- state variables of one VAD instance.
     *
     * A pointer to this struct is the first argument of every function
     * declared in this header.
     */
    typedef struct
    {
        /* ---- per-component levels (COMPLEN entries each) ---- */

        /* background noise estimate */
        Word16 bckr_est[COMPLEN];
        /* averaged input components for stationary estimation */
        Word16 ave_level[COMPLEN];
        /* input levels of the previous frame */
        Word16 old_level[COMPLEN];
        /* input levels calculated at the end of a frame (lookahead) */
        Word16 sub_level[COMPLEN];

        /* ---- memory for the filter bank ---- */
        Word16 a_data5[3][2];
        Word16 a_data3[5];

        /* ---- counters ---- */

        /* counts length of a speech burst */
        Word16 burst_count;
        /* hangover counter */
        Word16 hang_count;
        /* stationary counter */
        Word16 stat_count;

        /* ---- flag registers ----
         * vadreg, pitch and tone each hold 15 flags, one bit per flag.
         * The newest flag sits in bit 15, counting the LSB as bit 1 and
         * the MSB as bit 16.
         */

        /* flags for intermediate VAD decisions */
        Word16 vadreg;
        /* flags for pitch detection */
        Word16 pitch;
        /* flags for tone detection */
        Word16 tone;
        /* flags for complex detection */
        Word16 complex_high;
        /* flags for complex detection */
        Word16 complex_low;

        /* ---- variables for pitch detection ---- */
        Word16 oldlag_count;
        Word16 oldlag;

        /* complex hangover counter, used by VAD */
        Word16 complex_hang_count;
        /* hangover initiator, used by CAD */
        Word16 complex_hang_timer;

        /* filtered value, Q15.
         * NOTE(review): the earlier comment read "FIP filtered value";
         * presumably a typo for "FIR" -- confirm. */
        Word16 best_corr_hp;

        /* final decision */
        Word16 speech_vad_decision;
        /* complex background warning */
        Word16 complex_warning;

        /* counts length of a speech burst incl ...
         * NOTE(review): the earlier comment stops after "incl"; what is
         * included is not stated in this header -- confirm. */
        Word16 sp_burst_count;
        /* filtered value */
        Word16 corr_hp_fast;
    } vadState1;
    /*----------------------------------------------------------------------------
    ; GLOBAL FUNCTION DEFINITIONS
    ; Function Prototype declaration
    ----------------------------------------------------------------------------*/
    /*
     * vad1_init -- initialize one instance of the state.
     *
     *   st : o : the pointer to the state struct is stored in *st; that
     *            pointer has to be passed to vad in each call.
     *
     * Returns 0 on success.
     *
     * NOTE(review): the earlier comment called this the "pre processing
     * state" and the "filter status struct"; presumably wording carried
     * over from another module's header -- confirm.
     */
    Word16 vad1_init(
        vadState1 **st
    );

    /*
     * vad1_reset -- reset the state, i.e. set the state memory to zero.
     *
     *   st : i/o : state struct to reset
     *
     * Returns 0 on success.
     */
    Word16 vad1_reset(
        vadState1 *st
    );

    /*
     * vad1_exit -- de-initialize the state, i.e. free the status struct.
     *
     *   st : i/o : address of the state pointer; NULL is stored in *st.
     */
    void vad1_exit(
        vadState1 **st
    );

    /*
     * vad_complex_detection_update
     *
     *   st           : i/o : State struct
     *   best_corr_hp : i   : best Corr, Q15
     *
     * The behaviour is not described in this header; see the definition.
     */
    void vad_complex_detection_update(
        vadState1 *st,
        Word16 best_corr_hp
    );

    /*
     * vad_tone_detection
     *
     *   st        : i/o : State struct
     *   t0        : i   : autocorrelation maxima
     *   t1        : i   : energy
     *   pOverflow :       overflow flag; per this file's revision history
     *                     it was added for the basic math ops. Direction
     *                     (in/out) is not stated here.
     */
    void vad_tone_detection(
        vadState1 *st,
        Word32 t0,
        Word32 t1,
        Flag *pOverflow
    );

    /*
     * vad_tone_detection_update
     *
     *   st                : i/o : State struct
     *   one_lag_per_frame : i   : 1 if one open-loop lag is calculated
     *                             per each frame, otherwise 0
     *   pOverflow         :       overflow flag; per this file's revision
     *                             history it was added for the basic math
     *                             ops. Direction is not stated here.
     */
    void vad_tone_detection_update(vadState1 *st,
                                   Word16 one_lag_per_frame,
                                   Flag *pOverflow);

    /*
     * vad_pitch_detection
     *
     *   st        : i/o : State struct
     *   lags      : i   : speech encoder open loop lags (the number of
     *                     entries is not stated in this header)
     *   pOverflow :       overflow flag; per this file's revision history
     *                     it was added for the basic math ops. Direction
     *                     is not stated here.
     */
    void vad_pitch_detection(
        vadState1 *st,
        Word16 lags[],
        Flag *pOverflow
    );

    /*
     * vad1
     *
     *   st        : i/o : State struct
     *   in_buf    : i   : samples of the input frame; in_buf[159] is the
     *                     very last sample, incl lookahead
     *   pOverflow :       overflow flag; per this file's revision history
     *                     it was added for the basic math ops. Direction
     *                     is not stated here.
     *
     * NOTE(review): the meaning of the Word16 return value is not
     * documented in this header -- presumably the VAD decision; confirm
     * against the definition.
     */
    Word16 vad1(
        vadState1 *st,
        Word16 in_buf[],
        Flag *pOverflow
    );

    /*----------------------------------------------------------------------------
    ; END
    ----------------------------------------------------------------------------*/
#ifdef __cplusplus
}
#endif

#endif /* vad_1_h */