| /*********************************************************************** |
| Copyright (c) 2006-2011, Skype Limited. All rights reserved. |
| Redistribution and use in source and binary forms, with or without |
| modification, (subject to the limitations in the disclaimer below) |
| are permitted provided that the following conditions are met: |
| - Redistributions of source code must retain the above copyright notice, |
| this list of conditions and the following disclaimer. |
| - Redistributions in binary form must reproduce the above copyright |
| notice, this list of conditions and the following disclaimer in the |
| documentation and/or other materials provided with the distribution. |
| - Neither the name of Skype Limited, nor the names of specific |
| contributors, may be used to endorse or promote products derived from |
| this software without specific prior written permission. |
| NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE GRANTED |
| BY THIS LICENSE. THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND |
| CONTRIBUTORS ''AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, |
| BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND |
| FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE |
| COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, |
| INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT |
| NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF |
| USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON |
| ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT |
| (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE |
| OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. |
| ***********************************************************************/ |
| |
| #ifdef HAVE_CONFIG_H |
| #include "config.h" |
| #endif |
| |
| #include "main_FIX.h" |
| #include "tuning_parameters.h" |
| |
| /****************/ |
| /* Encode frame */ |
| /****************/ |
| opus_int silk_encode_frame_FIX( |
| silk_encoder_state_FIX *psEnc, /* I/O Encoder state FIX */ |
| opus_int32 *pnBytesOut, /* O Number of payload bytes */ |
| ec_enc *psRangeEnc, /* I/O compressor data structure */ |
| opus_int condCoding /* I The type of conditional coding to use */ |
| ) |
| { |
| silk_encoder_control_FIX sEncCtrl; |
| opus_int ret = 0; |
| opus_int16 *x_frame, *res_pitch_frame; |
| opus_int16 xfw[ MAX_FRAME_LENGTH ]; |
| opus_int16 res_pitch[ 2 * MAX_FRAME_LENGTH + LA_PITCH_MAX ]; |
| |
| TIC(ENCODE_FRAME) |
| |
| psEnc->sCmn.indices.Seed = psEnc->sCmn.frameCounter++ & 3; |
| |
| /**************************************************************/ |
| /* Setup Input Pointers, and insert frame in input buffer */ |
| /*************************************************************/ |
| /* pointers aligned with start of frame to encode */ |
| x_frame = psEnc->x_buf + psEnc->sCmn.ltp_mem_length; /* start of frame to encode */ |
| res_pitch_frame = res_pitch + psEnc->sCmn.ltp_mem_length; /* start of pitch LPC residual frame */ |
| |
| /****************************/ |
| /* Voice Activity Detection */ |
| /****************************/ |
| TIC(VAD) |
| ret = silk_VAD_GetSA_Q8( &psEnc->sCmn, psEnc->sCmn.inputBuf + 1 ); |
| TOC(VAD) |
| |
| /**************************************************/ |
| /* Convert speech activity into VAD and DTX flags */ |
| /**************************************************/ |
| if( psEnc->sCmn.nFramesEncoded == 0 ) { |
| psEnc->sCmn.inDTX = psEnc->sCmn.useDTX; |
| } |
| if( psEnc->sCmn.speech_activity_Q8 < SILK_FIX_CONST( SPEECH_ACTIVITY_DTX_THRES, 8 ) ) { |
| psEnc->sCmn.indices.signalType = TYPE_NO_VOICE_ACTIVITY; |
| psEnc->sCmn.noSpeechCounter++; |
| if( psEnc->sCmn.noSpeechCounter < NB_SPEECH_FRAMES_BEFORE_DTX ) { |
| psEnc->sCmn.inDTX = 0; |
| } else if( psEnc->sCmn.noSpeechCounter > MAX_CONSECUTIVE_DTX + NB_SPEECH_FRAMES_BEFORE_DTX ) { |
| psEnc->sCmn.noSpeechCounter = NB_SPEECH_FRAMES_BEFORE_DTX; |
| psEnc->sCmn.inDTX = 0; |
| } |
| psEnc->sCmn.VAD_flags[ psEnc->sCmn.nFramesEncoded ] = 0; |
| } else { |
| psEnc->sCmn.noSpeechCounter = 0; |
| psEnc->sCmn.inDTX = 0; |
| psEnc->sCmn.indices.signalType = TYPE_UNVOICED; |
| psEnc->sCmn.VAD_flags[ psEnc->sCmn.nFramesEncoded ] = 1; |
| } |
| |
| /***************************************/ |
| /* Ensure smooth bandwidth transitions */ |
| /***************************************/ |
| silk_LP_variable_cutoff( &psEnc->sCmn.sLP, psEnc->sCmn.inputBuf + 1, psEnc->sCmn.frame_length ); |
| |
| /*******************************************/ |
| /* Copy new frame to front of input buffer */ |
| /*******************************************/ |
| silk_memcpy( x_frame + LA_SHAPE_MS * psEnc->sCmn.fs_kHz, psEnc->sCmn.inputBuf + 1, psEnc->sCmn.frame_length * sizeof( opus_int16 ) ); |
| |
| /*****************************************/ |
| /* Find pitch lags, initial LPC analysis */ |
| /*****************************************/ |
| TIC(FIND_PITCH) |
| silk_find_pitch_lags_FIX( psEnc, &sEncCtrl, res_pitch, x_frame ); |
| TOC(FIND_PITCH) |
| |
| /************************/ |
| /* Noise shape analysis */ |
| /************************/ |
| TIC(NOISE_SHAPE_ANALYSIS) |
| silk_noise_shape_analysis_FIX( psEnc, &sEncCtrl, res_pitch_frame, x_frame ); |
| TOC(NOISE_SHAPE_ANALYSIS) |
| |
| /***************************************************/ |
| /* Find linear prediction coefficients (LPC + LTP) */ |
| /***************************************************/ |
| TIC(FIND_PRED_COEF) |
| silk_find_pred_coefs_FIX( psEnc, &sEncCtrl, res_pitch, x_frame, condCoding ); |
| TOC(FIND_PRED_COEF) |
| |
| /****************************************/ |
| /* Process gains */ |
| /****************************************/ |
| TIC(PROCESS_GAINS) |
| silk_process_gains_FIX( psEnc, &sEncCtrl ); |
| TOC(PROCESS_GAINS) |
| |
| /*****************************************/ |
| /* Prefiltering for noise shaper */ |
| /*****************************************/ |
| TIC(PREFILTER) |
| silk_prefilter_FIX( psEnc, &sEncCtrl, xfw, x_frame ); |
| TOC(PREFILTER) |
| |
| /****************************************/ |
| /* Low Bitrate Redundant Encoding */ |
| /****************************************/ |
| TIC(LBRR) |
| silk_LBRR_encode_FIX( psEnc, &sEncCtrl, xfw, condCoding ); |
| TOC(LBRR) |
| |
| /*****************************************/ |
| /* Noise shaping quantization */ |
| /*****************************************/ |
| TIC(NSQ) |
| if( psEnc->sCmn.nStatesDelayedDecision > 1 || psEnc->sCmn.warping_Q16 > 0 ) { |
| silk_NSQ_del_dec( &psEnc->sCmn, &psEnc->sCmn.sNSQ, &psEnc->sCmn.indices, xfw, psEnc->sCmn.pulses, |
| sEncCtrl.PredCoef_Q12[ 0 ], sEncCtrl.LTPCoef_Q14, sEncCtrl.AR2_Q13, sEncCtrl.HarmShapeGain_Q14, |
| sEncCtrl.Tilt_Q14, sEncCtrl.LF_shp_Q14, sEncCtrl.Gains_Q16, sEncCtrl.pitchL, sEncCtrl.Lambda_Q10, sEncCtrl.LTP_scale_Q14 ); |
| } else { |
| silk_NSQ( &psEnc->sCmn, &psEnc->sCmn.sNSQ, &psEnc->sCmn.indices, xfw, psEnc->sCmn.pulses, |
| sEncCtrl.PredCoef_Q12[ 0 ], sEncCtrl.LTPCoef_Q14, sEncCtrl.AR2_Q13, sEncCtrl.HarmShapeGain_Q14, |
| sEncCtrl.Tilt_Q14, sEncCtrl.LF_shp_Q14, sEncCtrl.Gains_Q16, sEncCtrl.pitchL, sEncCtrl.Lambda_Q10, sEncCtrl.LTP_scale_Q14 ); |
| } |
| TOC(NSQ) |
| |
| /* Update input buffer */ |
| silk_memmove( psEnc->x_buf, &psEnc->x_buf[ psEnc->sCmn.frame_length ], |
| ( psEnc->sCmn.ltp_mem_length + LA_SHAPE_MS * psEnc->sCmn.fs_kHz ) * sizeof( opus_int16 ) ); |
| |
| /* Parameters needed for next frame */ |
| psEnc->sCmn.prevLag = sEncCtrl.pitchL[ psEnc->sCmn.nb_subfr - 1 ]; |
| psEnc->sCmn.prevSignalType = psEnc->sCmn.indices.signalType; |
| |
| /* Exit without entropy coding */ |
| if( psEnc->sCmn.prefillFlag ) { |
| /* No payload */ |
| *pnBytesOut = 0; |
| return ret; |
| } |
| |
| /****************************************/ |
| /* Encode Parameters */ |
| /****************************************/ |
| TIC(ENCODE_PARAMS) |
| silk_encode_indices( &psEnc->sCmn, psRangeEnc, psEnc->sCmn.nFramesEncoded, 0, condCoding ); |
| TOC(ENCODE_PARAMS) |
| |
| /****************************************/ |
| /* Encode Excitation Signal */ |
| /****************************************/ |
| TIC(ENCODE_PULSES) |
| silk_encode_pulses( psRangeEnc, psEnc->sCmn.indices.signalType, psEnc->sCmn.indices.quantOffsetType, |
| psEnc->sCmn.pulses, psEnc->sCmn.frame_length ); |
| TOC(ENCODE_PULSES) |
| |
| /****************************************/ |
| /* Finalize payload */ |
| /****************************************/ |
| psEnc->sCmn.first_frame_after_reset = 0; |
| /* Payload size */ |
| *pnBytesOut = silk_RSHIFT( ec_tell( psRangeEnc ) + 7, 3 ); |
| TOC(ENCODE_FRAME) |
| |
| #ifdef SAVE_ALL_INTERNAL_DATA |
| { |
| silk_float tmp[ MAX_NB_SUBFR * LTP_ORDER ]; |
| int i; |
| DEBUG_STORE_DATA( xf.dat, x_frame + LA_SHAPE_MS * psEnc->sCmn.fs_kHz, psEnc->sCmn.frame_length * sizeof( opus_int16 ) ); |
| DEBUG_STORE_DATA( xfw.dat, xfw, psEnc->sCmn.frame_length * sizeof( opus_int16 ) ); |
| DEBUG_STORE_DATA( pitchL.dat, sEncCtrl.pitchL, psEnc->sCmn.nb_subfr * sizeof( opus_int ) ); |
| for( i = 0; i < psEnc->sCmn.nb_subfr * LTP_ORDER; i++ ) { |
| tmp[ i ] = (silk_float)sEncCtrl.LTPCoef_Q14[ i ] / 16384.0f; |
| } |
| DEBUG_STORE_DATA( pitchG_quantized.dat, tmp, psEnc->sCmn.nb_subfr * LTP_ORDER * sizeof( silk_float ) ); |
| for( i = 0; i <psEnc->sCmn.predictLPCOrder; i++ ) { |
| tmp[ i ] = (silk_float)sEncCtrl.PredCoef_Q12[ 1 ][ i ] / 4096.0f; |
| } |
| DEBUG_STORE_DATA( PredCoef.dat, tmp, psEnc->sCmn.predictLPCOrder * sizeof( silk_float ) ); |
| |
| tmp[ 0 ] = (silk_float)sEncCtrl.LTPredCodGain_Q7 / 128.0f; |
| DEBUG_STORE_DATA( LTPredCodGain.dat, tmp, sizeof( silk_float ) ); |
| tmp[ 0 ] = (silk_float)psEnc->LTPCorr_Q15 / 32768.0f; |
| DEBUG_STORE_DATA( LTPcorr.dat, tmp, sizeof( silk_float ) ); |
| tmp[ 0 ] = (silk_float)psEnc->sCmn.input_tilt_Q15 / 32768.0f; |
| DEBUG_STORE_DATA( tilt.dat, tmp, sizeof( silk_float ) ); |
| for( i = 0; i < psEnc->sCmn.nb_subfr; i++ ) { |
| tmp[ i ] = (silk_float)sEncCtrl.Gains_Q16[ i ] / 65536.0f; |
| } |
| DEBUG_STORE_DATA( gains.dat, tmp, psEnc->sCmn.nb_subfr * sizeof( silk_float ) ); |
| DEBUG_STORE_DATA( gains_indices.dat, &psEnc->sCmn.indices.GainsIndices, psEnc->sCmn.nb_subfr * sizeof( opus_int ) ); |
| tmp[ 0 ] = (silk_float)sEncCtrl.current_SNR_dB_Q7 / 128.0f; |
| DEBUG_STORE_DATA( current_SNR_db.dat, tmp, sizeof( silk_float ) ); |
| DEBUG_STORE_DATA( quantOffsetType.dat, &psEnc->sCmn.indices.quantOffsetType, sizeof( opus_int ) ); |
| tmp[ 0 ] = (silk_float)psEnc->sCmn.speech_activity_Q8 / 256.0f; |
| DEBUG_STORE_DATA( speech_activity.dat, tmp, sizeof( silk_float ) ); |
| for( i = 0; i < VAD_N_BANDS; i++ ) { |
| tmp[ i ] = (silk_float)psEnc->sCmn.input_quality_bands_Q15[ i ] / 32768.0f; |
| } |
| DEBUG_STORE_DATA( input_quality_bands.dat, tmp, VAD_N_BANDS * sizeof( silk_float ) ); |
| DEBUG_STORE_DATA( signalType.dat, &psEnc->sCmn.indices.signalType, sizeof( opus_int8) ); |
| DEBUG_STORE_DATA( lag_index.dat, &psEnc->sCmn.indices.lagIndex, sizeof( opus_int16 ) ); |
| DEBUG_STORE_DATA( contour_index.dat, &psEnc->sCmn.indices.contourIndex, sizeof( opus_int8 ) ); |
| DEBUG_STORE_DATA( per_index.dat, &psEnc->sCmn.indices.PERIndex, sizeof( opus_int8) ); |
| } |
| #endif |
| return ret; |
| } |
| |
| /* Low-Bitrate Redundancy (LBRR) encoding. Reuse all parameters but encode excitation at lower bitrate */ |
| void silk_LBRR_encode_FIX( |
| silk_encoder_state_FIX *psEnc, /* I/O Pointer to Silk FIX encoder state */ |
| silk_encoder_control_FIX *psEncCtrl, /* I/O Pointer to Silk FIX encoder control struct */ |
| const opus_int16 xfw[], /* I Input signal */ |
| opus_int condCoding /* I The type of conditional coding used so far for this frame */ |
| ) |
| { |
| opus_int32 TempGains_Q16[ MAX_NB_SUBFR ]; |
| SideInfoIndices *psIndices_LBRR = &psEnc->sCmn.indices_LBRR[ psEnc->sCmn.nFramesEncoded ]; |
| silk_nsq_state sNSQ_LBRR; |
| |
| /*******************************************/ |
| /* Control use of inband LBRR */ |
| /*******************************************/ |
| if( psEnc->sCmn.LBRR_enabled && psEnc->sCmn.speech_activity_Q8 > SILK_FIX_CONST( LBRR_SPEECH_ACTIVITY_THRES, 8 ) ) { |
| psEnc->sCmn.LBRR_flags[ psEnc->sCmn.nFramesEncoded ] = 1; |
| |
| /* Copy noise shaping quantizer state and quantization indices from regular encoding */ |
| silk_memcpy( &sNSQ_LBRR, &psEnc->sCmn.sNSQ, sizeof( silk_nsq_state ) ); |
| silk_memcpy( psIndices_LBRR, &psEnc->sCmn.indices, sizeof( SideInfoIndices ) ); |
| |
| /* Save original gains */ |
| silk_memcpy( TempGains_Q16, psEncCtrl->Gains_Q16, psEnc->sCmn.nb_subfr * sizeof( opus_int32 ) ); |
| |
| if( psEnc->sCmn.nFramesEncoded == 0 || psEnc->sCmn.LBRR_flags[ psEnc->sCmn.nFramesEncoded - 1 ] == 0 ) { |
| /* First frame in packet or previous frame not LBRR coded */ |
| psEnc->sCmn.LBRRprevLastGainIndex = psEnc->sShape.LastGainIndex; |
| |
| /* Increase Gains to get target LBRR rate */ |
| psIndices_LBRR->GainsIndices[ 0 ] = psIndices_LBRR->GainsIndices[ 0 ] + psEnc->sCmn.LBRR_GainIncreases; |
| psIndices_LBRR->GainsIndices[ 0 ] = silk_min_int( psIndices_LBRR->GainsIndices[ 0 ], N_LEVELS_QGAIN - 1 ); |
| } |
| |
| /* Decode to get gains in sync with decoder */ |
| /* Overwrite unquantized gains with quantized gains */ |
| silk_gains_dequant( psEncCtrl->Gains_Q16, psIndices_LBRR->GainsIndices, |
| &psEnc->sCmn.LBRRprevLastGainIndex, condCoding == CODE_CONDITIONALLY, psEnc->sCmn.nb_subfr ); |
| |
| /*****************************************/ |
| /* Noise shaping quantization */ |
| /*****************************************/ |
| if( psEnc->sCmn.nStatesDelayedDecision > 1 || psEnc->sCmn.warping_Q16 > 0 ) { |
| silk_NSQ_del_dec( &psEnc->sCmn, &sNSQ_LBRR, psIndices_LBRR, xfw, |
| psEnc->sCmn.pulses_LBRR[ psEnc->sCmn.nFramesEncoded ], psEncCtrl->PredCoef_Q12[ 0 ], psEncCtrl->LTPCoef_Q14, |
| psEncCtrl->AR2_Q13, psEncCtrl->HarmShapeGain_Q14, psEncCtrl->Tilt_Q14, psEncCtrl->LF_shp_Q14, |
| psEncCtrl->Gains_Q16, psEncCtrl->pitchL, psEncCtrl->Lambda_Q10, psEncCtrl->LTP_scale_Q14 ); |
| } else { |
| silk_NSQ( &psEnc->sCmn, &sNSQ_LBRR, psIndices_LBRR, xfw, |
| psEnc->sCmn.pulses_LBRR[ psEnc->sCmn.nFramesEncoded ], psEncCtrl->PredCoef_Q12[ 0 ], psEncCtrl->LTPCoef_Q14, |
| psEncCtrl->AR2_Q13, psEncCtrl->HarmShapeGain_Q14, psEncCtrl->Tilt_Q14, psEncCtrl->LF_shp_Q14, |
| psEncCtrl->Gains_Q16, psEncCtrl->pitchL, psEncCtrl->Lambda_Q10, psEncCtrl->LTP_scale_Q14 ); |
| } |
| |
| /* Restore original gains */ |
| silk_memcpy( psEncCtrl->Gains_Q16, TempGains_Q16, psEnc->sCmn.nb_subfr * sizeof( opus_int32 ) ); |
| } |
| } |