/***********************************************************************
Copyright (c) 2006-2011, Skype Limited. All rights reserved.
Redistribution and use in source and binary forms, with or without
modification, are permitted provided that the following conditions
are met:
- Redistributions of source code must retain the above copyright notice,
this list of conditions and the following disclaimer.
- Redistributions in binary form must reproduce the above copyright
notice, this list of conditions and the following disclaimer in the
documentation and/or other materials provided with the distribution.
- Neither the name of Internet Society, IETF or IETF Trust, nor the
names of specific contributors, may be used to endorse or promote
products derived from this software without specific prior written
permission.
THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
POSSIBILITY OF SUCH DAMAGE.
***********************************************************************/

28#ifndef SILK_STRUCTS_H
29#define SILK_STRUCTS_H
30
Jean-Marc Valin1c2f5632011-09-16 01:16:53 -070031#include "typedef.h"
32#include "SigProc_FIX.h"
33#include "define.h"
Gregory Maxwellae231142011-07-30 08:18:48 -040034#include "entenc.h"
35#include "entdec.h"
36
37#ifdef __cplusplus
38extern "C"
39{
40#endif
41
42/************************************/
43/* Noise shaping quantization state */
44/************************************/
45typedef struct {
Koen Vosacc7a6c2011-10-28 19:44:26 -040046 opus_int16 xq[ 2 * MAX_FRAME_LENGTH ]; /* Buffer for quantized output signal */
Koen Vosa51ebd62011-12-14 11:39:29 -050047 opus_int32 sLTP_shp_Q14[ 2 * MAX_FRAME_LENGTH ];
Koen Vosacc7a6c2011-10-28 19:44:26 -040048 opus_int32 sLPC_Q14[ MAX_SUB_FRAME_LENGTH + NSQ_LPC_BUF_LENGTH ];
49 opus_int32 sAR2_Q14[ MAX_SHAPE_LPC_ORDER ];
Koen Vosa51ebd62011-12-14 11:39:29 -050050 opus_int32 sLF_AR_shp_Q14;
Koen Vos6e40eb52016-02-21 11:34:11 +080051 opus_int32 sDiff_shp_Q14;
Koen Vosacc7a6c2011-10-28 19:44:26 -040052 opus_int lagPrev;
53 opus_int sLTP_buf_idx;
54 opus_int sLTP_shp_buf_idx;
55 opus_int32 rand_seed;
Koen Vosa51ebd62011-12-14 11:39:29 -050056 opus_int32 prev_gain_Q16;
Koen Vosacc7a6c2011-10-28 19:44:26 -040057 opus_int rewhite_flag;
Gregory Maxwellae231142011-07-30 08:18:48 -040058} silk_nsq_state;
59
60/********************************/
61/* VAD state */
62/********************************/
63typedef struct {
Koen Vosacc7a6c2011-10-28 19:44:26 -040064 opus_int32 AnaState[ 2 ]; /* Analysis filterbank state: 0-8 kHz */
65 opus_int32 AnaState1[ 2 ]; /* Analysis filterbank state: 0-4 kHz */
66 opus_int32 AnaState2[ 2 ]; /* Analysis filterbank state: 0-2 kHz */
67 opus_int32 XnrgSubfr[ VAD_N_BANDS ]; /* Subframe energies */
68 opus_int32 NrgRatioSmth_Q8[ VAD_N_BANDS ]; /* Smoothed energy level in each band */
69 opus_int16 HPstate; /* State of differentiator in the lowest band */
70 opus_int32 NL[ VAD_N_BANDS ]; /* Noise energy level in each band */
71 opus_int32 inv_NL[ VAD_N_BANDS ]; /* Inverse noise energy level in each band */
72 opus_int32 NoiseLevelBias[ VAD_N_BANDS ]; /* Noise level estimator bias/offset */
73 opus_int32 counter; /* Frame counter used in the initial phase */
Gregory Maxwellae231142011-07-30 08:18:48 -040074} silk_VAD_state;
75
76/* Variable cut-off low-pass filter state */
77typedef struct {
78 opus_int32 In_LP_State[ 2 ]; /* Low pass filter state */
79 opus_int32 transition_frame_no; /* Counter which is mapped to a cut-off frequency */
Koen Vosacc7a6c2011-10-28 19:44:26 -040080 opus_int mode; /* Operating mode, <0: switch down, >0: switch up; 0: do nothing */
Gregory Maxwellae231142011-07-30 08:18:48 -040081} silk_LP_state;
82
83/* Structure containing NLSF codebook */
84typedef struct {
85 const opus_int16 nVectors;
86 const opus_int16 order;
87 const opus_int16 quantStepSize_Q16;
88 const opus_int16 invQuantStepSize_Q6;
89 const opus_uint8 *CB1_NLSF_Q8;
Koen Vos2955f682016-02-21 13:16:46 +080090 const opus_int16 *CB1_Wght_Q9;
Gregory Maxwellae231142011-07-30 08:18:48 -040091 const opus_uint8 *CB1_iCDF;
92 const opus_uint8 *pred_Q8;
93 const opus_uint8 *ec_sel;
94 const opus_uint8 *ec_iCDF;
95 const opus_uint8 *ec_Rates_Q5;
96 const opus_int16 *deltaMin_Q15;
97} silk_NLSF_CB_struct;
98
99typedef struct {
100 opus_int16 pred_prev_Q13[ 2 ];
101 opus_int16 sMid[ 2 ];
102 opus_int16 sSide[ 2 ];
103 opus_int32 mid_side_amp_Q0[ 4 ];
104 opus_int16 smth_width_Q14;
105 opus_int16 width_prev_Q14;
Jean-Marc Valinb24e5742011-10-11 21:09:14 -0400106 opus_int16 silent_side_len;
Koen Vos4e1ce382011-08-25 13:50:21 -0400107 opus_int8 predIx[ MAX_FRAMES_PER_PACKET ][ 2 ][ 3 ];
108 opus_int8 mid_only_flags[ MAX_FRAMES_PER_PACKET ];
Gregory Maxwellae231142011-07-30 08:18:48 -0400109} stereo_enc_state;
110
111typedef struct {
112 opus_int16 pred_prev_Q13[ 2 ];
113 opus_int16 sMid[ 2 ];
114 opus_int16 sSide[ 2 ];
115} stereo_dec_state;
116
117typedef struct {
118 opus_int8 GainsIndices[ MAX_NB_SUBFR ];
119 opus_int8 LTPIndex[ MAX_NB_SUBFR ];
120 opus_int8 NLSFIndices[ MAX_LPC_ORDER + 1 ];
121 opus_int16 lagIndex;
122 opus_int8 contourIndex;
123 opus_int8 signalType;
124 opus_int8 quantOffsetType;
125 opus_int8 NLSFInterpCoef_Q2;
126 opus_int8 PERIndex;
127 opus_int8 LTP_scaleIndex;
128 opus_int8 Seed;
129} SideInfoIndices;
130
131/********************************/
132/* Encoder state */
133/********************************/
134typedef struct {
Koen Vosacc7a6c2011-10-28 19:44:26 -0400135 opus_int32 In_HP_State[ 2 ]; /* High pass filter state */
136 opus_int32 variable_HP_smth1_Q15; /* State of first smoother */
137 opus_int32 variable_HP_smth2_Q15; /* State of second smoother */
138 silk_LP_state sLP; /* Low pass filter state */
139 silk_VAD_state sVAD; /* Voice activity detector state */
140 silk_nsq_state sNSQ; /* Noise Shape Quantizer State */
141 opus_int16 prev_NLSFq_Q15[ MAX_LPC_ORDER ]; /* Previously quantized NLSF vector */
142 opus_int speech_activity_Q8; /* Speech activity */
143 opus_int allow_bandwidth_switch; /* Flag indicating that switching of internal bandwidth is allowed */
144 opus_int8 LBRRprevLastGainIndex;
145 opus_int8 prevSignalType;
146 opus_int prevLag;
147 opus_int pitch_LPC_win_length;
148 opus_int max_pitch_lag; /* Highest possible pitch lag (samples) */
149 opus_int32 API_fs_Hz; /* API sampling frequency (Hz) */
150 opus_int32 prev_API_fs_Hz; /* Previous API sampling frequency (Hz) */
151 opus_int maxInternal_fs_Hz; /* Maximum internal sampling frequency (Hz) */
152 opus_int minInternal_fs_Hz; /* Minimum internal sampling frequency (Hz) */
153 opus_int desiredInternal_fs_Hz; /* Soft request for internal sampling frequency (Hz) */
154 opus_int fs_kHz; /* Internal sampling frequency (kHz) */
Koen Vosacc7a6c2011-10-28 19:44:26 -0400155 opus_int nb_subfr; /* Number of 5 ms subframes in a frame */
156 opus_int frame_length; /* Frame length (samples) */
157 opus_int subfr_length; /* Subframe length (samples) */
158 opus_int ltp_mem_length; /* Length of LTP memory */
159 opus_int la_pitch; /* Look-ahead for pitch analysis (samples) */
160 opus_int la_shape; /* Look-ahead for noise shape analysis (samples) */
161 opus_int shapeWinLength; /* Window length for noise shape analysis (samples) */
162 opus_int32 TargetRate_bps; /* Target bitrate (bps) */
163 opus_int PacketSize_ms; /* Number of milliseconds to put in each packet */
164 opus_int PacketLoss_perc; /* Packet loss rate measured by farend */
165 opus_int32 frameCounter;
166 opus_int Complexity; /* Complexity setting */
167 opus_int nStatesDelayedDecision; /* Number of states in delayed decision quantization */
168 opus_int useInterpolatedNLSFs; /* Flag for using NLSF interpolation */
169 opus_int shapingLPCOrder; /* Filter order for noise shaping filters */
170 opus_int predictLPCOrder; /* Filter order for prediction filters */
171 opus_int pitchEstimationComplexity; /* Complexity level for pitch estimator */
172 opus_int pitchEstimationLPCOrder; /* Whitening filter order for pitch estimator */
173 opus_int32 pitchEstimationThreshold_Q16; /* Threshold for pitch estimator */
Timothy B. Terriberry554b3492014-10-03 21:49:57 -0700174 opus_int32 sum_log_gain_Q7; /* Cumulative max prediction gain */
Koen Vosacc7a6c2011-10-28 19:44:26 -0400175 opus_int NLSF_MSVQ_Survivors; /* Number of survivors in NLSF MSVQ */
176 opus_int first_frame_after_reset; /* Flag for deactivating NLSF interpolation, pitch prediction */
177 opus_int controlled_since_last_payload; /* Flag for ensuring codec_control only runs once per packet */
178 opus_int warping_Q16; /* Warping parameter for warped noise shaping */
179 opus_int useCBR; /* Flag to enable constant bitrate */
180 opus_int prefillFlag; /* Flag to indicate that only buffers are prefilled, no coding */
181 const opus_uint8 *pitch_lag_low_bits_iCDF; /* Pointer to iCDF table for low bits of pitch lag index */
182 const opus_uint8 *pitch_contour_iCDF; /* Pointer to iCDF table for pitch contour index */
183 const silk_NLSF_CB_struct *psNLSF_CB; /* Pointer to NLSF codebook */
184 opus_int input_quality_bands_Q15[ VAD_N_BANDS ];
185 opus_int input_tilt_Q15;
186 opus_int SNR_dB_Q7; /* Quality setting */
Gregory Maxwellae231142011-07-30 08:18:48 -0400187
Koen Vosacc7a6c2011-10-28 19:44:26 -0400188 opus_int8 VAD_flags[ MAX_FRAMES_PER_PACKET ];
189 opus_int8 LBRR_flag;
190 opus_int LBRR_flags[ MAX_FRAMES_PER_PACKET ];
Gregory Maxwellae231142011-07-30 08:18:48 -0400191
Koen Vosacc7a6c2011-10-28 19:44:26 -0400192 SideInfoIndices indices;
193 opus_int8 pulses[ MAX_FRAME_LENGTH ];
Gregory Maxwellae231142011-07-30 08:18:48 -0400194
Timothy B. Terriberry39386e02013-11-18 13:30:13 -0500195 int arch;
196
Gregory Maxwellae231142011-07-30 08:18:48 -0400197 /* Input/output buffering */
Koen Vosacc7a6c2011-10-28 19:44:26 -0400198 opus_int16 inputBuf[ MAX_FRAME_LENGTH + 2 ]; /* Buffer containing input signal */
Koen Vosacc7a6c2011-10-28 19:44:26 -0400199 opus_int inputBufIx;
200 opus_int nFramesPerPacket;
201 opus_int nFramesEncoded; /* Number of frames analyzed in current packet */
Gregory Maxwellae231142011-07-30 08:18:48 -0400202
Koen Vosacc7a6c2011-10-28 19:44:26 -0400203 opus_int nChannelsAPI;
204 opus_int nChannelsInternal;
205 opus_int channelNb;
Gregory Maxwellae231142011-07-30 08:18:48 -0400206
207 /* Parameters For LTP scaling Control */
Koen Vosacc7a6c2011-10-28 19:44:26 -0400208 opus_int frames_since_onset;
Gregory Maxwellae231142011-07-30 08:18:48 -0400209
210 /* Specifically for entropy coding */
Koen Vosacc7a6c2011-10-28 19:44:26 -0400211 opus_int ec_prevSignalType;
212 opus_int16 ec_prevLagIndex;
Gregory Maxwellae231142011-07-30 08:18:48 -0400213
214 silk_resampler_state_struct resampler_state;
215
216 /* DTX */
Koen Vosacc7a6c2011-10-28 19:44:26 -0400217 opus_int useDTX; /* Flag to enable DTX */
218 opus_int inDTX; /* Flag to signal DTX period */
219 opus_int noSpeechCounter; /* Counts concecutive nonactive frames, used by DTX */
Gregory Maxwellae231142011-07-30 08:18:48 -0400220
221 /* Inband Low Bitrate Redundancy (LBRR) data */
Koen Vosacc7a6c2011-10-28 19:44:26 -0400222 opus_int useInBandFEC; /* Saves the API setting for query */
223 opus_int LBRR_enabled; /* Depends on useInBandFRC, bitrate and packet loss rate */
224 opus_int LBRR_GainIncreases; /* Gains increment for coding LBRR frames */
225 SideInfoIndices indices_LBRR[ MAX_FRAMES_PER_PACKET ];
226 opus_int8 pulses_LBRR[ MAX_FRAMES_PER_PACKET ][ MAX_FRAME_LENGTH ];
Gregory Maxwellae231142011-07-30 08:18:48 -0400227} silk_encoder_state;
228
229
230/* Struct for Packet Loss Concealment */
231typedef struct {
Koen Vosacc7a6c2011-10-28 19:44:26 -0400232 opus_int32 pitchL_Q8; /* Pitch lag to use for voiced concealment */
233 opus_int16 LTPCoef_Q14[ LTP_ORDER ]; /* LTP coeficients to use for voiced concealment */
234 opus_int16 prevLPC_Q12[ MAX_LPC_ORDER ];
235 opus_int last_frame_lost; /* Was previous frame lost */
236 opus_int32 rand_seed; /* Seed for unvoiced signal generation */
237 opus_int16 randScale_Q14; /* Scaling of unvoiced random signal */
238 opus_int32 conc_energy;
239 opus_int conc_energy_shift;
240 opus_int16 prevLTP_scale_Q14;
Koen Vos0dbd0ca2011-10-28 21:05:22 -0400241 opus_int32 prevGain_Q16[ 2 ];
Koen Vosacc7a6c2011-10-28 19:44:26 -0400242 opus_int fs_kHz;
Koen Vos0dbd0ca2011-10-28 21:05:22 -0400243 opus_int nb_subfr;
244 opus_int subfr_length;
Gregory Maxwellae231142011-07-30 08:18:48 -0400245} silk_PLC_struct;
246
247/* Struct for CNG */
248typedef struct {
Koen Vosa51ebd62011-12-14 11:39:29 -0500249 opus_int32 CNG_exc_buf_Q14[ MAX_FRAME_LENGTH ];
Koen Vosacc7a6c2011-10-28 19:44:26 -0400250 opus_int16 CNG_smth_NLSF_Q15[ MAX_LPC_ORDER ];
251 opus_int32 CNG_synth_state[ MAX_LPC_ORDER ];
252 opus_int32 CNG_smth_Gain_Q16;
253 opus_int32 rand_seed;
254 opus_int fs_kHz;
Gregory Maxwellae231142011-07-30 08:18:48 -0400255} silk_CNG_struct;
256
257/********************************/
258/* Decoder state */
259/********************************/
260typedef struct {
Koen Vosa51ebd62011-12-14 11:39:29 -0500261 opus_int32 prev_gain_Q16;
262 opus_int32 exc_Q14[ MAX_FRAME_LENGTH ];
Koen Vosacc7a6c2011-10-28 19:44:26 -0400263 opus_int32 sLPC_Q14_buf[ MAX_LPC_ORDER ];
264 opus_int16 outBuf[ MAX_FRAME_LENGTH + 2 * MAX_SUB_FRAME_LENGTH ]; /* Buffer for output signal */
Koen Vosacc7a6c2011-10-28 19:44:26 -0400265 opus_int lagPrev; /* Previous Lag */
266 opus_int8 LastGainIndex; /* Previous gain index */
267 opus_int fs_kHz; /* Sampling frequency in kHz */
268 opus_int32 fs_API_hz; /* API sample frequency (Hz) */
269 opus_int nb_subfr; /* Number of 5 ms subframes in a frame */
270 opus_int frame_length; /* Frame length (samples) */
271 opus_int subfr_length; /* Subframe length (samples) */
272 opus_int ltp_mem_length; /* Length of LTP memory */
273 opus_int LPC_order; /* LPC order */
274 opus_int16 prevNLSF_Q15[ MAX_LPC_ORDER ]; /* Used to interpolate LSFs */
275 opus_int first_frame_after_reset; /* Flag for deactivating NLSF interpolation */
276 const opus_uint8 *pitch_lag_low_bits_iCDF; /* Pointer to iCDF table for low bits of pitch lag index */
277 const opus_uint8 *pitch_contour_iCDF; /* Pointer to iCDF table for pitch contour index */
Gregory Maxwellae231142011-07-30 08:18:48 -0400278
279 /* For buffering payload in case of more frames per packet */
Koen Vosacc7a6c2011-10-28 19:44:26 -0400280 opus_int nFramesDecoded;
281 opus_int nFramesPerPacket;
Gregory Maxwellae231142011-07-30 08:18:48 -0400282
283 /* Specifically for entropy coding */
Koen Vosacc7a6c2011-10-28 19:44:26 -0400284 opus_int ec_prevSignalType;
285 opus_int16 ec_prevLagIndex;
Gregory Maxwellae231142011-07-30 08:18:48 -0400286
Koen Vosacc7a6c2011-10-28 19:44:26 -0400287 opus_int VAD_flags[ MAX_FRAMES_PER_PACKET ];
288 opus_int LBRR_flag;
289 opus_int LBRR_flags[ MAX_FRAMES_PER_PACKET ];
Gregory Maxwellae231142011-07-30 08:18:48 -0400290
291 silk_resampler_state_struct resampler_state;
292
Koen Vosacc7a6c2011-10-28 19:44:26 -0400293 const silk_NLSF_CB_struct *psNLSF_CB; /* Pointer to NLSF codebook */
Gregory Maxwellae231142011-07-30 08:18:48 -0400294
295 /* Quantization indices */
Koen Vosacc7a6c2011-10-28 19:44:26 -0400296 SideInfoIndices indices;
Gregory Maxwellae231142011-07-30 08:18:48 -0400297
298 /* CNG state */
Koen Vosacc7a6c2011-10-28 19:44:26 -0400299 silk_CNG_struct sCNG;
Gregory Maxwellae231142011-07-30 08:18:48 -0400300
301 /* Stuff used for PLC */
Koen Vosacc7a6c2011-10-28 19:44:26 -0400302 opus_int lossCnt;
303 opus_int prevSignalType;
Linfeng Zhang95d4c9f2016-07-13 17:25:49 -0700304 int arch;
Gregory Maxwellae231142011-07-30 08:18:48 -0400305
306 silk_PLC_struct sPLC;
307
308} silk_decoder_state;
309
310/************************/
311/* Decoder control */
312/************************/
313typedef struct {
Koen Vosacc7a6c2011-10-28 19:44:26 -0400314 /* Prediction and coding parameters */
315 opus_int pitchL[ MAX_NB_SUBFR ];
316 opus_int32 Gains_Q16[ MAX_NB_SUBFR ];
317 /* Holds interpolated and final coefficients, 4-byte aligned */
Jean-Marc Valinfb3a4372011-09-16 00:58:26 -0700318 silk_DWORD_ALIGN opus_int16 PredCoef_Q12[ 2 ][ MAX_LPC_ORDER ];
Koen Vosacc7a6c2011-10-28 19:44:26 -0400319 opus_int16 LTPCoef_Q14[ LTP_ORDER * MAX_NB_SUBFR ];
320 opus_int LTP_scale_Q14;
Gregory Maxwellae231142011-07-30 08:18:48 -0400321} silk_decoder_control;
322
323
324#ifdef __cplusplus
325}
326#endif
327
328#endif