Coverage Report

Created: 2025-08-28 07:12

/src/opus/silk/enc_API.c
Line
Count
Source (jump to first uncovered line)
1
/***********************************************************************
2
Copyright (c) 2006-2011, Skype Limited. All rights reserved.
3
Redistribution and use in source and binary forms, with or without
4
modification, are permitted provided that the following conditions
5
are met:
6
- Redistributions of source code must retain the above copyright notice,
7
this list of conditions and the following disclaimer.
8
- Redistributions in binary form must reproduce the above copyright
9
notice, this list of conditions and the following disclaimer in the
10
documentation and/or other materials provided with the distribution.
11
- Neither the name of Internet Society, IETF or IETF Trust, nor the
12
names of specific contributors, may be used to endorse or promote
13
products derived from this software without specific prior written
14
permission.
15
THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
16
AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
17
IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
18
ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
19
LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
20
CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
21
SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
22
INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
23
CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
24
ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
25
POSSIBILITY OF SUCH DAMAGE.
26
***********************************************************************/
27
28
#ifdef HAVE_CONFIG_H
29
#include "config.h"
30
#endif
31
#include "define.h"
32
#include "API.h"
33
#include "control.h"
34
#include "typedef.h"
35
#include "stack_alloc.h"
36
#include "structs.h"
37
#include "tuning_parameters.h"
38
#ifdef FIXED_POINT
39
#include "main_FIX.h"
40
#else
41
#include "main_FLP.h"
42
#endif
43
44
#ifdef ENABLE_DRED
45
#include "dred_encoder.h"
46
#endif
47
48
/***************************************/
49
/* Read control structure from encoder */
50
/***************************************/
51
/* Forward declaration: the definition appears further down in this file, after */
/* silk_InitEncoder(), which calls it.                                          */
static opus_int silk_QueryEncoder(                      /* O    Returns error code                              */
52
    const void                      *encState,          /* I    State (read only)                               */
53
    silk_EncControlStruct           *encStatus          /* O    Encoder Status, filled in from the state        */
54
);
55
56
/****************************************/
57
/* Encoder functions                    */
58
/****************************************/
59
60
opus_int silk_Get_Encoder_Size(                         /* O    Returns error code                              */
    opus_int                        *encSizeBytes       /* O    Number of bytes in SILK encoder state           */
)
{
    /* The encoder state used by the other entry points in this file is one */
    /* silk_encoder object, so its size is what gets reported.              */
    *encSizeBytes = sizeof( silk_encoder );

    /* There is no failure path in this function. */
    return SILK_NO_ERROR;
}
70
71
/*************************/
72
/* Init or Reset encoder */
73
/*************************/
74
opus_int silk_InitEncoder(                              /* O    Returns error code                              */
75
    void                            *encState,          /* I/O  State                                           */
76
    int                              arch,              /* I    Run-time architecture                           */
77
    silk_EncControlStruct           *encStatus          /* O    Encoder Status                                  */
78
)
79
0
{
80
0
    silk_encoder *psEnc;
81
0
    opus_int n, ret = SILK_NO_ERROR;
82
83
0
    psEnc = (silk_encoder *)encState;
84
85
    /* Reset encoder */
86
0
    silk_memset( psEnc, 0, sizeof( silk_encoder ) );
87
0
    for( n = 0; n < ENCODER_NUM_CHANNELS; n++ ) {
88
0
        if( ret += silk_init_encoder( &psEnc->state_Fxx[ n ], arch ) ) {
89
0
            celt_assert( 0 );
90
0
        }
91
0
    }
92
93
0
    psEnc->nChannelsAPI = 1;
94
0
    psEnc->nChannelsInternal = 1;
95
96
    /* Read control structure */
97
0
    if( ret += silk_QueryEncoder( encState, encStatus ) ) {
98
0
        celt_assert( 0 );
99
0
    }
100
101
0
    return ret;
102
0
}
103
104
/***************************************/
105
/* Read control structure from encoder */
106
/***************************************/
107
static opus_int silk_QueryEncoder(                      /* O    Returns error code                              */
108
    const void                      *encState,          /* I    State                                           */
109
    silk_EncControlStruct           *encStatus          /* O    Encoder Status                                  */
110
)
111
0
{
112
0
    opus_int ret = SILK_NO_ERROR;
113
0
    silk_encoder_state_Fxx *state_Fxx;
114
0
    silk_encoder *psEnc = (silk_encoder *)encState;
115
116
0
    state_Fxx = psEnc->state_Fxx;
117
118
0
    encStatus->nChannelsAPI              = psEnc->nChannelsAPI;
119
0
    encStatus->nChannelsInternal         = psEnc->nChannelsInternal;
120
0
    encStatus->API_sampleRate            = state_Fxx[ 0 ].sCmn.API_fs_Hz;
121
0
    encStatus->maxInternalSampleRate     = state_Fxx[ 0 ].sCmn.maxInternal_fs_Hz;
122
0
    encStatus->minInternalSampleRate     = state_Fxx[ 0 ].sCmn.minInternal_fs_Hz;
123
0
    encStatus->desiredInternalSampleRate = state_Fxx[ 0 ].sCmn.desiredInternal_fs_Hz;
124
0
    encStatus->payloadSize_ms            = state_Fxx[ 0 ].sCmn.PacketSize_ms;
125
0
    encStatus->bitRate                   = state_Fxx[ 0 ].sCmn.TargetRate_bps;
126
0
    encStatus->packetLossPercentage      = state_Fxx[ 0 ].sCmn.PacketLoss_perc;
127
0
    encStatus->complexity                = state_Fxx[ 0 ].sCmn.Complexity;
128
0
    encStatus->useInBandFEC              = state_Fxx[ 0 ].sCmn.useInBandFEC;
129
0
    encStatus->useDTX                    = state_Fxx[ 0 ].sCmn.useDTX;
130
0
    encStatus->useCBR                    = state_Fxx[ 0 ].sCmn.useCBR;
131
0
    encStatus->internalSampleRate        = silk_SMULBB( state_Fxx[ 0 ].sCmn.fs_kHz, 1000 );
132
0
    encStatus->allowBandwidthSwitch      = state_Fxx[ 0 ].sCmn.allow_bandwidth_switch;
133
0
    encStatus->inWBmodeWithoutVariableLP = state_Fxx[ 0 ].sCmn.fs_kHz == 16 && state_Fxx[ 0 ].sCmn.sLP.mode == 0;
134
135
0
    return ret;
136
0
}
137
138
139
/**************************/
140
/* Encode frame with Silk */
141
/**************************/
142
/* Note: if prefillFlag is set, the input must contain 10 ms of audio, irrespective of what                     */
143
/* encControl->payloadSize_ms is set to                                                                         */
144
opus_int silk_Encode(                                   /* O    Returns error code                              */
145
    void                            *encState,          /* I/O  State                                           */
146
    silk_EncControlStruct           *encControl,        /* I    Control status                                  */
147
    const opus_res                  *samplesIn,         /* I    Speech sample input vector                      */
148
    opus_int                        nSamplesIn,         /* I    Number of samples in input vector               */
149
    ec_enc                          *psRangeEnc,        /* I/O  Compressor data structure                       */
150
    opus_int32                      *nBytesOut,         /* I/O  Number of bytes in payload (input: Max bytes)   */
151
    const opus_int                  prefillFlag,        /* I    Flag to indicate prefilling buffers no coding   */
152
    opus_int                        activity            /* I    Decision of Opus voice activity detector        */
153
)
154
0
{
155
0
    opus_int   n, i, nBits, flags, tmp_payloadSize_ms = 0, tmp_complexity = 0, ret = 0;
156
0
    opus_int   nSamplesToBuffer, nSamplesToBufferMax, nBlocksOf10ms;
157
0
    opus_int   nSamplesFromInput = 0, nSamplesFromInputMax;
158
0
    opus_int   speech_act_thr_for_switch_Q8;
159
0
    opus_int32 TargetRate_bps, MStargetRates_bps[ 2 ], channelRate_bps, LBRR_symbol, sum;
160
0
    silk_encoder *psEnc = ( silk_encoder * )encState;
161
0
    VARDECL( opus_int16, buf );
162
0
    opus_int transition, curr_block, tot_blocks;
163
0
    SAVE_STACK;
164
165
0
    if (encControl->reducedDependency)
166
0
    {
167
0
       psEnc->state_Fxx[0].sCmn.first_frame_after_reset = 1;
168
0
       psEnc->state_Fxx[1].sCmn.first_frame_after_reset = 1;
169
0
    }
170
0
    psEnc->state_Fxx[ 0 ].sCmn.nFramesEncoded = psEnc->state_Fxx[ 1 ].sCmn.nFramesEncoded = 0;
171
172
    /* Check values in encoder control structure */
173
0
    if( ( ret = check_control_input( encControl ) ) != 0 ) {
174
0
        celt_assert( 0 );
175
0
        RESTORE_STACK;
176
0
        return ret;
177
0
    }
178
179
0
    encControl->switchReady = 0;
180
181
0
    if( encControl->nChannelsInternal > psEnc->nChannelsInternal ) {
182
        /* Mono -> Stereo transition: init state of second channel and stereo state */
183
0
        ret += silk_init_encoder( &psEnc->state_Fxx[ 1 ], psEnc->state_Fxx[ 0 ].sCmn.arch );
184
0
        silk_memset( psEnc->sStereo.pred_prev_Q13, 0, sizeof( psEnc->sStereo.pred_prev_Q13 ) );
185
0
        silk_memset( psEnc->sStereo.sSide, 0, sizeof( psEnc->sStereo.sSide ) );
186
0
        psEnc->sStereo.mid_side_amp_Q0[ 0 ] = 0;
187
0
        psEnc->sStereo.mid_side_amp_Q0[ 1 ] = 1;
188
0
        psEnc->sStereo.mid_side_amp_Q0[ 2 ] = 0;
189
0
        psEnc->sStereo.mid_side_amp_Q0[ 3 ] = 1;
190
0
        psEnc->sStereo.width_prev_Q14 = 0;
191
0
        psEnc->sStereo.smth_width_Q14 = SILK_FIX_CONST( 1, 14 );
192
0
        if( psEnc->nChannelsAPI == 2 ) {
193
0
            silk_memcpy( &psEnc->state_Fxx[ 1 ].sCmn.resampler_state, &psEnc->state_Fxx[ 0 ].sCmn.resampler_state, sizeof( silk_resampler_state_struct ) );
194
0
            silk_memcpy( &psEnc->state_Fxx[ 1 ].sCmn.In_HP_State,     &psEnc->state_Fxx[ 0 ].sCmn.In_HP_State,     sizeof( psEnc->state_Fxx[ 1 ].sCmn.In_HP_State ) );
195
0
        }
196
0
    }
197
198
0
    transition = (encControl->payloadSize_ms != psEnc->state_Fxx[ 0 ].sCmn.PacketSize_ms) || (psEnc->nChannelsInternal != encControl->nChannelsInternal);
199
200
0
    psEnc->nChannelsAPI = encControl->nChannelsAPI;
201
0
    psEnc->nChannelsInternal = encControl->nChannelsInternal;
202
203
0
    nBlocksOf10ms = silk_DIV32( 100 * nSamplesIn, encControl->API_sampleRate );
204
0
    tot_blocks = ( nBlocksOf10ms > 1 ) ? nBlocksOf10ms >> 1 : 1;
205
0
    curr_block = 0;
206
0
    if( prefillFlag ) {
207
0
        silk_LP_state save_LP;
208
        /* Only accept input length of 10 ms */
209
0
        if( nBlocksOf10ms != 1 ) {
210
0
            celt_assert( 0 );
211
0
            RESTORE_STACK;
212
0
            return SILK_ENC_INPUT_INVALID_NO_OF_SAMPLES;
213
0
        }
214
0
        if ( prefillFlag == 2 ) {
215
0
            save_LP = psEnc->state_Fxx[ 0 ].sCmn.sLP;
216
            /* Save the sampling rate so the bandwidth switching code can keep handling transitions. */
217
0
            save_LP.saved_fs_kHz = psEnc->state_Fxx[ 0 ].sCmn.fs_kHz;
218
0
        }
219
        /* Reset Encoder */
220
0
        for( n = 0; n < encControl->nChannelsInternal; n++ ) {
221
0
            ret = silk_init_encoder( &psEnc->state_Fxx[ n ], psEnc->state_Fxx[ n ].sCmn.arch );
222
            /* Restore the variable LP state. */
223
0
            if ( prefillFlag == 2 ) {
224
0
                psEnc->state_Fxx[ n ].sCmn.sLP = save_LP;
225
0
            }
226
0
            celt_assert( !ret );
227
0
        }
228
0
        tmp_payloadSize_ms = encControl->payloadSize_ms;
229
0
        encControl->payloadSize_ms = 10;
230
0
        tmp_complexity = encControl->complexity;
231
0
        encControl->complexity = 0;
232
0
        for( n = 0; n < encControl->nChannelsInternal; n++ ) {
233
0
            psEnc->state_Fxx[ n ].sCmn.controlled_since_last_payload = 0;
234
0
            psEnc->state_Fxx[ n ].sCmn.prefillFlag = 1;
235
0
        }
236
0
    } else {
237
        /* Only accept input lengths that are a multiple of 10 ms */
238
0
        if( nBlocksOf10ms * encControl->API_sampleRate != 100 * nSamplesIn || nSamplesIn < 0 ) {
239
0
            celt_assert( 0 );
240
0
            RESTORE_STACK;
241
0
            return SILK_ENC_INPUT_INVALID_NO_OF_SAMPLES;
242
0
        }
243
        /* Make sure no more than one packet can be produced */
244
0
        if( 1000 * (opus_int32)nSamplesIn > encControl->payloadSize_ms * encControl->API_sampleRate ) {
245
0
            celt_assert( 0 );
246
0
            RESTORE_STACK;
247
0
            return SILK_ENC_INPUT_INVALID_NO_OF_SAMPLES;
248
0
        }
249
0
    }
250
251
0
    for( n = 0; n < encControl->nChannelsInternal; n++ ) {
252
        /* Force the side channel to the same rate as the mid */
253
0
        opus_int force_fs_kHz = (n==1) ? psEnc->state_Fxx[0].sCmn.fs_kHz : 0;
254
0
        if( ( ret = silk_control_encoder( &psEnc->state_Fxx[ n ], encControl, psEnc->allowBandwidthSwitch, n, force_fs_kHz ) ) != 0 ) {
255
0
            silk_assert( 0 );
256
0
            RESTORE_STACK;
257
0
            return ret;
258
0
        }
259
0
        if( psEnc->state_Fxx[n].sCmn.first_frame_after_reset || transition ) {
260
0
            for( i = 0; i < psEnc->state_Fxx[ 0 ].sCmn.nFramesPerPacket; i++ ) {
261
0
                psEnc->state_Fxx[ n ].sCmn.LBRR_flags[ i ] = 0;
262
0
            }
263
0
        }
264
0
        psEnc->state_Fxx[ n ].sCmn.inDTX = psEnc->state_Fxx[ n ].sCmn.useDTX;
265
0
    }
266
0
    celt_assert( encControl->nChannelsInternal == 1 || psEnc->state_Fxx[ 0 ].sCmn.fs_kHz == psEnc->state_Fxx[ 1 ].sCmn.fs_kHz );
267
268
    /* Input buffering/resampling and encoding */
269
0
    nSamplesToBufferMax =
270
0
        10 * nBlocksOf10ms * psEnc->state_Fxx[ 0 ].sCmn.fs_kHz;
271
0
    nSamplesFromInputMax =
272
0
        silk_DIV32_16( nSamplesToBufferMax *
273
0
                           psEnc->state_Fxx[ 0 ].sCmn.API_fs_Hz,
274
0
                       psEnc->state_Fxx[ 0 ].sCmn.fs_kHz * 1000 );
275
0
    ALLOC( buf, nSamplesFromInputMax, opus_int16 );
276
0
    while( 1 ) {
277
0
        int curr_nBitsUsedLBRR = 0;
278
0
        nSamplesToBuffer  = psEnc->state_Fxx[ 0 ].sCmn.frame_length - psEnc->state_Fxx[ 0 ].sCmn.inputBufIx;
279
0
        nSamplesToBuffer  = silk_min( nSamplesToBuffer, nSamplesToBufferMax );
280
0
        nSamplesFromInput = silk_DIV32_16( nSamplesToBuffer * psEnc->state_Fxx[ 0 ].sCmn.API_fs_Hz, psEnc->state_Fxx[ 0 ].sCmn.fs_kHz * 1000 );
281
        /* Resample and write to buffer */
282
0
        if( encControl->nChannelsAPI == 2 && encControl->nChannelsInternal == 2 ) {
283
0
            opus_int id = psEnc->state_Fxx[ 0 ].sCmn.nFramesEncoded;
284
0
            for( n = 0; n < nSamplesFromInput; n++ ) {
285
0
                buf[ n ] = RES2INT16(samplesIn[ 2 * n ]);
286
0
            }
287
            /* Making sure to start both resamplers from the same state when switching from mono to stereo */
288
0
            if( psEnc->nPrevChannelsInternal == 1 && id==0 ) {
289
0
               silk_memcpy( &psEnc->state_Fxx[ 1 ].sCmn.resampler_state, &psEnc->state_Fxx[ 0 ].sCmn.resampler_state, sizeof(psEnc->state_Fxx[ 1 ].sCmn.resampler_state));
290
0
            }
291
292
0
            ret += silk_resampler( &psEnc->state_Fxx[ 0 ].sCmn.resampler_state,
293
0
                &psEnc->state_Fxx[ 0 ].sCmn.inputBuf[ psEnc->state_Fxx[ 0 ].sCmn.inputBufIx + 2 ], buf, nSamplesFromInput );
294
0
            psEnc->state_Fxx[ 0 ].sCmn.inputBufIx += nSamplesToBuffer;
295
296
0
            nSamplesToBuffer  = psEnc->state_Fxx[ 1 ].sCmn.frame_length - psEnc->state_Fxx[ 1 ].sCmn.inputBufIx;
297
0
            nSamplesToBuffer  = silk_min( nSamplesToBuffer, 10 * nBlocksOf10ms * psEnc->state_Fxx[ 1 ].sCmn.fs_kHz );
298
0
            for( n = 0; n < nSamplesFromInput; n++ ) {
299
0
                buf[ n ] = RES2INT16(samplesIn[ 2 * n + 1 ]);
300
0
            }
301
0
            ret += silk_resampler( &psEnc->state_Fxx[ 1 ].sCmn.resampler_state,
302
0
                &psEnc->state_Fxx[ 1 ].sCmn.inputBuf[ psEnc->state_Fxx[ 1 ].sCmn.inputBufIx + 2 ], buf, nSamplesFromInput );
303
304
0
            psEnc->state_Fxx[ 1 ].sCmn.inputBufIx += nSamplesToBuffer;
305
0
        } else if( encControl->nChannelsAPI == 2 && encControl->nChannelsInternal == 1 ) {
306
            /* Combine left and right channels before resampling */
307
0
            for( n = 0; n < nSamplesFromInput; n++ ) {
308
0
                sum = RES2INT16(samplesIn[ 2 * n ] + samplesIn[ 2 * n + 1 ]);
309
0
                buf[ n ] = (opus_int16)silk_RSHIFT_ROUND( sum,  1 );
310
0
            }
311
0
            ret += silk_resampler( &psEnc->state_Fxx[ 0 ].sCmn.resampler_state,
312
0
                &psEnc->state_Fxx[ 0 ].sCmn.inputBuf[ psEnc->state_Fxx[ 0 ].sCmn.inputBufIx + 2 ], buf, nSamplesFromInput );
313
            /* On the first mono frame, average the results for the two resampler states  */
314
0
            if( psEnc->nPrevChannelsInternal == 2 && psEnc->state_Fxx[ 0 ].sCmn.nFramesEncoded == 0 ) {
315
0
               ret += silk_resampler( &psEnc->state_Fxx[ 1 ].sCmn.resampler_state,
316
0
                   &psEnc->state_Fxx[ 1 ].sCmn.inputBuf[ psEnc->state_Fxx[ 1 ].sCmn.inputBufIx + 2 ], buf, nSamplesFromInput );
317
0
               for( n = 0; n < psEnc->state_Fxx[ 0 ].sCmn.frame_length; n++ ) {
318
0
                  psEnc->state_Fxx[ 0 ].sCmn.inputBuf[ psEnc->state_Fxx[ 0 ].sCmn.inputBufIx+n+2 ] =
319
0
                        silk_RSHIFT(psEnc->state_Fxx[ 0 ].sCmn.inputBuf[ psEnc->state_Fxx[ 0 ].sCmn.inputBufIx+n+2 ]
320
0
                                  + psEnc->state_Fxx[ 1 ].sCmn.inputBuf[ psEnc->state_Fxx[ 1 ].sCmn.inputBufIx+n+2 ], 1);
321
0
               }
322
0
            }
323
0
            psEnc->state_Fxx[ 0 ].sCmn.inputBufIx += nSamplesToBuffer;
324
0
        } else {
325
0
            celt_assert( encControl->nChannelsAPI == 1 && encControl->nChannelsInternal == 1 );
326
0
            for( n = 0; n < nSamplesFromInput; n++ ) {
327
0
                buf[n] = RES2INT16(samplesIn[n]);
328
0
            }
329
0
            ret += silk_resampler( &psEnc->state_Fxx[ 0 ].sCmn.resampler_state,
330
0
                &psEnc->state_Fxx[ 0 ].sCmn.inputBuf[ psEnc->state_Fxx[ 0 ].sCmn.inputBufIx + 2 ], buf, nSamplesFromInput );
331
0
            psEnc->state_Fxx[ 0 ].sCmn.inputBufIx += nSamplesToBuffer;
332
0
        }
333
334
0
        samplesIn  += nSamplesFromInput * encControl->nChannelsAPI;
335
0
        nSamplesIn -= nSamplesFromInput;
336
337
        /* Default */
338
0
        psEnc->allowBandwidthSwitch = 0;
339
340
        /* Silk encoder */
341
0
        if( psEnc->state_Fxx[ 0 ].sCmn.inputBufIx >= psEnc->state_Fxx[ 0 ].sCmn.frame_length ) {
342
            /* Enough data in input buffer, so encode */
343
0
            celt_assert( psEnc->state_Fxx[ 0 ].sCmn.inputBufIx == psEnc->state_Fxx[ 0 ].sCmn.frame_length );
344
0
            celt_assert( encControl->nChannelsInternal == 1 || psEnc->state_Fxx[ 1 ].sCmn.inputBufIx == psEnc->state_Fxx[ 1 ].sCmn.frame_length );
345
346
            /* Deal with LBRR data */
347
0
            if( psEnc->state_Fxx[ 0 ].sCmn.nFramesEncoded == 0 && !prefillFlag ) {
348
                /* Create space at start of payload for VAD and FEC flags */
349
0
                opus_uint8 iCDF[ 2 ] = { 0, 0 };
350
0
                iCDF[ 0 ] = 256 - silk_RSHIFT( 256, ( psEnc->state_Fxx[ 0 ].sCmn.nFramesPerPacket + 1 ) * encControl->nChannelsInternal );
351
0
                ec_enc_icdf( psRangeEnc, 0, iCDF, 8 );
352
0
                curr_nBitsUsedLBRR = ec_tell( psRangeEnc );
353
354
                /* Encode any LBRR data from previous packet */
355
                /* Encode LBRR flags */
356
0
                for( n = 0; n < encControl->nChannelsInternal; n++ ) {
357
0
                    LBRR_symbol = 0;
358
0
                    for( i = 0; i < psEnc->state_Fxx[ n ].sCmn.nFramesPerPacket; i++ ) {
359
0
                        LBRR_symbol |= silk_LSHIFT( psEnc->state_Fxx[ n ].sCmn.LBRR_flags[ i ], i );
360
0
                    }
361
0
                    psEnc->state_Fxx[ n ].sCmn.LBRR_flag = LBRR_symbol > 0 ? 1 : 0;
362
0
                    if( LBRR_symbol && psEnc->state_Fxx[ n ].sCmn.nFramesPerPacket > 1 ) {
363
0
                        ec_enc_icdf( psRangeEnc, LBRR_symbol - 1, silk_LBRR_flags_iCDF_ptr[ psEnc->state_Fxx[ n ].sCmn.nFramesPerPacket - 2 ], 8 );
364
0
                    }
365
0
                }
366
367
                /* Code LBRR indices and excitation signals */
368
0
                for( i = 0; i < psEnc->state_Fxx[ 0 ].sCmn.nFramesPerPacket; i++ ) {
369
0
                    for( n = 0; n < encControl->nChannelsInternal; n++ ) {
370
0
                        if( psEnc->state_Fxx[ n ].sCmn.LBRR_flags[ i ] ) {
371
0
                            opus_int condCoding;
372
373
0
                            if( encControl->nChannelsInternal == 2 && n == 0 ) {
374
0
                                silk_stereo_encode_pred( psRangeEnc, psEnc->sStereo.predIx[ i ] );
375
                                /* For LBRR data there's no need to code the mid-only flag if the side-channel LBRR flag is set */
376
0
                                if( psEnc->state_Fxx[ 1 ].sCmn.LBRR_flags[ i ] == 0 ) {
377
0
                                    silk_stereo_encode_mid_only( psRangeEnc, psEnc->sStereo.mid_only_flags[ i ] );
378
0
                                }
379
0
                            }
380
                            /* Use conditional coding if previous frame available */
381
0
                            if( i > 0 && psEnc->state_Fxx[ n ].sCmn.LBRR_flags[ i - 1 ] ) {
382
0
                                condCoding = CODE_CONDITIONALLY;
383
0
                            } else {
384
0
                                condCoding = CODE_INDEPENDENTLY;
385
0
                            }
386
0
                            silk_encode_indices( &psEnc->state_Fxx[ n ].sCmn, psRangeEnc, i, 1, condCoding );
387
0
                            silk_encode_pulses( psRangeEnc, psEnc->state_Fxx[ n ].sCmn.indices_LBRR[i].signalType, psEnc->state_Fxx[ n ].sCmn.indices_LBRR[i].quantOffsetType,
388
0
                                psEnc->state_Fxx[ n ].sCmn.pulses_LBRR[ i ], psEnc->state_Fxx[ n ].sCmn.frame_length );
389
0
                        }
390
0
                    }
391
0
                }
392
393
                /* Reset LBRR flags */
394
0
                for( n = 0; n < encControl->nChannelsInternal; n++ ) {
395
0
                    silk_memset( psEnc->state_Fxx[ n ].sCmn.LBRR_flags, 0, sizeof( psEnc->state_Fxx[ n ].sCmn.LBRR_flags ) );
396
0
                }
397
0
                curr_nBitsUsedLBRR = ec_tell( psRangeEnc ) - curr_nBitsUsedLBRR;
398
0
            }
399
400
0
            silk_HP_variable_cutoff( psEnc->state_Fxx );
401
402
            /* Total target bits for packet */
403
0
            nBits = silk_DIV32_16( silk_MUL( encControl->bitRate, encControl->payloadSize_ms ), 1000 );
404
            /* Subtract bits used for LBRR */
405
0
            if( !prefillFlag ) {
406
                /* psEnc->nBitsUsedLBRR is an exponential moving average of the LBRR usage,
407
                   except that for the first LBRR frame it does no averaging and for the first
408
                   frame after after LBRR, it goes back to zero immediately. */
409
0
                if ( curr_nBitsUsedLBRR < 10 ) {
410
0
                    psEnc->nBitsUsedLBRR = 0;
411
0
                } else if ( psEnc->nBitsUsedLBRR < 10) {
412
0
                    psEnc->nBitsUsedLBRR = curr_nBitsUsedLBRR;
413
0
                } else {
414
0
                    psEnc->nBitsUsedLBRR = ( psEnc->nBitsUsedLBRR + curr_nBitsUsedLBRR ) / 2;
415
0
                }
416
0
                nBits -= psEnc->nBitsUsedLBRR;
417
0
            }
418
            /* Divide by number of uncoded frames left in packet */
419
0
            nBits = silk_DIV32_16( nBits, psEnc->state_Fxx[ 0 ].sCmn.nFramesPerPacket );
420
            /* Convert to bits/second */
421
0
            if( encControl->payloadSize_ms == 10 ) {
422
0
                TargetRate_bps = silk_SMULBB( nBits, 100 );
423
0
            } else {
424
0
                TargetRate_bps = silk_SMULBB( nBits, 50 );
425
0
            }
426
            /* Subtract fraction of bits in excess of target in previous frames and packets */
427
0
            TargetRate_bps -= silk_DIV32_16( silk_MUL( psEnc->nBitsExceeded, 1000 ), BITRESERVOIR_DECAY_TIME_MS );
428
0
            if( !prefillFlag && psEnc->state_Fxx[ 0 ].sCmn.nFramesEncoded > 0 ) {
429
                /* Compare actual vs target bits so far in this packet */
430
0
                opus_int32 bitsBalance = ec_tell( psRangeEnc ) - psEnc->nBitsUsedLBRR - nBits * psEnc->state_Fxx[ 0 ].sCmn.nFramesEncoded;
431
0
                TargetRate_bps -= silk_DIV32_16( silk_MUL( bitsBalance, 1000 ), BITRESERVOIR_DECAY_TIME_MS );
432
0
            }
433
            /* Never exceed input bitrate */
434
0
            TargetRate_bps = silk_LIMIT( TargetRate_bps, encControl->bitRate, 5000 );
435
436
            /* Convert Left/Right to Mid/Side */
437
0
            if( encControl->nChannelsInternal == 2 ) {
438
0
                silk_stereo_LR_to_MS( &psEnc->sStereo, &psEnc->state_Fxx[ 0 ].sCmn.inputBuf[ 2 ], &psEnc->state_Fxx[ 1 ].sCmn.inputBuf[ 2 ],
439
0
                    psEnc->sStereo.predIx[ psEnc->state_Fxx[ 0 ].sCmn.nFramesEncoded ], &psEnc->sStereo.mid_only_flags[ psEnc->state_Fxx[ 0 ].sCmn.nFramesEncoded ],
440
0
                    MStargetRates_bps, TargetRate_bps, psEnc->state_Fxx[ 0 ].sCmn.speech_activity_Q8, encControl->toMono,
441
0
                    psEnc->state_Fxx[ 0 ].sCmn.fs_kHz, psEnc->state_Fxx[ 0 ].sCmn.frame_length );
442
0
                if( psEnc->sStereo.mid_only_flags[ psEnc->state_Fxx[ 0 ].sCmn.nFramesEncoded ] == 0 ) {
443
                    /* Reset side channel encoder memory for first frame with side coding */
444
0
                    if( psEnc->prev_decode_only_middle == 1 ) {
445
0
                        silk_memset( &psEnc->state_Fxx[ 1 ].sShape,               0, sizeof( psEnc->state_Fxx[ 1 ].sShape ) );
446
0
                        silk_memset( &psEnc->state_Fxx[ 1 ].sCmn.sNSQ,            0, sizeof( psEnc->state_Fxx[ 1 ].sCmn.sNSQ ) );
447
0
                        silk_memset( psEnc->state_Fxx[ 1 ].sCmn.prev_NLSFq_Q15,   0, sizeof( psEnc->state_Fxx[ 1 ].sCmn.prev_NLSFq_Q15 ) );
448
0
                        silk_memset( &psEnc->state_Fxx[ 1 ].sCmn.sLP.In_LP_State, 0, sizeof( psEnc->state_Fxx[ 1 ].sCmn.sLP.In_LP_State ) );
449
0
                        psEnc->state_Fxx[ 1 ].sCmn.prevLag                 = 100;
450
0
                        psEnc->state_Fxx[ 1 ].sCmn.sNSQ.lagPrev            = 100;
451
0
                        psEnc->state_Fxx[ 1 ].sShape.LastGainIndex         = 10;
452
0
                        psEnc->state_Fxx[ 1 ].sCmn.prevSignalType          = TYPE_NO_VOICE_ACTIVITY;
453
0
                        psEnc->state_Fxx[ 1 ].sCmn.sNSQ.prev_gain_Q16      = 65536;
454
0
                        psEnc->state_Fxx[ 1 ].sCmn.first_frame_after_reset = 1;
455
0
                    }
456
0
                    silk_encode_do_VAD_Fxx( &psEnc->state_Fxx[ 1 ], activity );
457
0
                } else {
458
0
                    psEnc->state_Fxx[ 1 ].sCmn.VAD_flags[ psEnc->state_Fxx[ 0 ].sCmn.nFramesEncoded ] = 0;
459
0
                }
460
0
                if( !prefillFlag ) {
461
0
                    silk_stereo_encode_pred( psRangeEnc, psEnc->sStereo.predIx[ psEnc->state_Fxx[ 0 ].sCmn.nFramesEncoded ] );
462
0
                    if( psEnc->state_Fxx[ 1 ].sCmn.VAD_flags[ psEnc->state_Fxx[ 0 ].sCmn.nFramesEncoded ] == 0 ) {
463
0
                        silk_stereo_encode_mid_only( psRangeEnc, psEnc->sStereo.mid_only_flags[ psEnc->state_Fxx[ 0 ].sCmn.nFramesEncoded ] );
464
0
                    }
465
0
                }
466
0
            } else {
467
                /* Buffering */
468
0
                silk_memcpy( psEnc->state_Fxx[ 0 ].sCmn.inputBuf, psEnc->sStereo.sMid, 2 * sizeof( opus_int16 ) );
469
0
                silk_memcpy( psEnc->sStereo.sMid, &psEnc->state_Fxx[ 0 ].sCmn.inputBuf[ psEnc->state_Fxx[ 0 ].sCmn.frame_length ], 2 * sizeof( opus_int16 ) );
470
0
            }
471
0
            silk_encode_do_VAD_Fxx( &psEnc->state_Fxx[ 0 ], activity );
472
473
            /* Encode */
474
0
            for( n = 0; n < encControl->nChannelsInternal; n++ ) {
475
0
                opus_int maxBits, useCBR;
476
477
                /* Handling rate constraints */
478
0
                maxBits = encControl->maxBits;
479
0
                if( tot_blocks == 2 && curr_block == 0 ) {
480
0
                    maxBits = maxBits * 3 / 5;
481
0
                } else if( tot_blocks == 3 ) {
482
0
                    if( curr_block == 0 ) {
483
0
                        maxBits = maxBits * 2 / 5;
484
0
                    } else if( curr_block == 1 ) {
485
0
                        maxBits = maxBits * 3 / 4;
486
0
                    }
487
0
                }
488
0
                useCBR = encControl->useCBR && curr_block == tot_blocks - 1;
489
490
0
                if( encControl->nChannelsInternal == 1 ) {
491
0
                    channelRate_bps = TargetRate_bps;
492
0
                } else {
493
0
                    channelRate_bps = MStargetRates_bps[ n ];
494
0
                    if( n == 0 && MStargetRates_bps[ 1 ] > 0 ) {
495
0
                        useCBR = 0;
496
                        /* Give mid up to 1/2 of the max bits for that frame */
497
0
                        maxBits -= encControl->maxBits / ( tot_blocks * 2 );
498
0
                    }
499
0
                }
500
501
0
                if( channelRate_bps > 0 ) {
502
0
                    opus_int condCoding;
503
504
0
                    silk_control_SNR( &psEnc->state_Fxx[ n ].sCmn, channelRate_bps );
505
506
                    /* Use independent coding if no previous frame available */
507
0
                    if( psEnc->state_Fxx[ 0 ].sCmn.nFramesEncoded - n <= 0 ) {
508
0
                        condCoding = CODE_INDEPENDENTLY;
509
0
                    } else if( n > 0 && psEnc->prev_decode_only_middle ) {
510
                        /* If we skipped a side frame in this packet, we don't
511
                           need LTP scaling; the LTP state is well-defined. */
512
0
                        condCoding = CODE_INDEPENDENTLY_NO_LTP_SCALING;
513
0
                    } else {
514
0
                        condCoding = CODE_CONDITIONALLY;
515
0
                    }
516
0
                    if( ( ret = silk_encode_frame_Fxx( &psEnc->state_Fxx[ n ], nBytesOut, psRangeEnc, condCoding, maxBits, useCBR ) ) != 0 ) {
517
0
                        silk_assert( 0 );
518
0
                    }
519
0
                }
520
0
                psEnc->state_Fxx[ n ].sCmn.controlled_since_last_payload = 0;
521
0
                psEnc->state_Fxx[ n ].sCmn.inputBufIx = 0;
522
0
                psEnc->state_Fxx[ n ].sCmn.nFramesEncoded++;
523
0
            }
524
0
            psEnc->prev_decode_only_middle = psEnc->sStereo.mid_only_flags[ psEnc->state_Fxx[ 0 ].sCmn.nFramesEncoded - 1 ];
525
526
            /* Insert VAD and FEC flags at beginning of bitstream */
527
0
            if( *nBytesOut > 0 && psEnc->state_Fxx[ 0 ].sCmn.nFramesEncoded == psEnc->state_Fxx[ 0 ].sCmn.nFramesPerPacket) {
528
0
                flags = 0;
529
0
                for( n = 0; n < encControl->nChannelsInternal; n++ ) {
530
0
                    for( i = 0; i < psEnc->state_Fxx[ n ].sCmn.nFramesPerPacket; i++ ) {
531
0
                        flags  = silk_LSHIFT( flags, 1 );
532
0
                        flags |= psEnc->state_Fxx[ n ].sCmn.VAD_flags[ i ];
533
0
                    }
534
0
                    flags  = silk_LSHIFT( flags, 1 );
535
0
                    flags |= psEnc->state_Fxx[ n ].sCmn.LBRR_flag;
536
0
                }
537
0
                if( !prefillFlag ) {
538
0
                    ec_enc_patch_initial_bits( psRangeEnc, flags, ( psEnc->state_Fxx[ 0 ].sCmn.nFramesPerPacket + 1 ) * encControl->nChannelsInternal );
539
0
                }
540
541
                /* Return zero bytes if all channels DTXed */
542
0
                if( psEnc->state_Fxx[ 0 ].sCmn.inDTX && ( encControl->nChannelsInternal == 1 || psEnc->state_Fxx[ 1 ].sCmn.inDTX ) ) {
543
0
                    *nBytesOut = 0;
544
0
                }
545
546
0
                psEnc->nBitsExceeded += *nBytesOut * 8;
547
0
                psEnc->nBitsExceeded -= silk_DIV32_16( silk_MUL( encControl->bitRate, encControl->payloadSize_ms ), 1000 );
548
0
                psEnc->nBitsExceeded  = silk_LIMIT( psEnc->nBitsExceeded, 0, 10000 );
549
550
                /* Update flag indicating if bandwidth switching is allowed */
551
0
                speech_act_thr_for_switch_Q8 = silk_SMLAWB( SILK_FIX_CONST( SPEECH_ACTIVITY_DTX_THRES, 8 ),
552
0
                    SILK_FIX_CONST( ( 1 - SPEECH_ACTIVITY_DTX_THRES ) / MAX_BANDWIDTH_SWITCH_DELAY_MS, 16 + 8 ), psEnc->timeSinceSwitchAllowed_ms );
553
0
                if( psEnc->state_Fxx[ 0 ].sCmn.speech_activity_Q8 < speech_act_thr_for_switch_Q8 ) {
554
0
                    psEnc->allowBandwidthSwitch = 1;
555
0
                    psEnc->timeSinceSwitchAllowed_ms = 0;
556
0
                } else {
557
0
                    psEnc->allowBandwidthSwitch = 0;
558
0
                    psEnc->timeSinceSwitchAllowed_ms += encControl->payloadSize_ms;
559
0
                }
560
0
            }
561
562
0
            if( nSamplesIn == 0 ) {
563
0
                break;
564
0
            }
565
0
        } else {
566
0
            break;
567
0
        }
568
0
        curr_block++;
569
0
    }
570
571
0
    psEnc->nPrevChannelsInternal = encControl->nChannelsInternal;
572
573
0
    encControl->allowBandwidthSwitch = psEnc->allowBandwidthSwitch;
574
0
    encControl->inWBmodeWithoutVariableLP = psEnc->state_Fxx[ 0 ].sCmn.fs_kHz == 16 && psEnc->state_Fxx[ 0 ].sCmn.sLP.mode == 0;
575
0
    encControl->internalSampleRate = silk_SMULBB( psEnc->state_Fxx[ 0 ].sCmn.fs_kHz, 1000 );
576
0
    encControl->stereoWidth_Q14 = encControl->toMono ? 0 : psEnc->sStereo.smth_width_Q14;
577
0
    if( prefillFlag ) {
578
0
        encControl->payloadSize_ms = tmp_payloadSize_ms;
579
0
        encControl->complexity = tmp_complexity;
580
0
        for( n = 0; n < encControl->nChannelsInternal; n++ ) {
581
0
            psEnc->state_Fxx[ n ].sCmn.controlled_since_last_payload = 0;
582
0
            psEnc->state_Fxx[ n ].sCmn.prefillFlag = 0;
583
0
        }
584
0
    }
585
586
0
    encControl->signalType = psEnc->state_Fxx[0].sCmn.indices.signalType;
587
0
    encControl->offset = silk_Quantization_Offsets_Q10
588
0
                         [ psEnc->state_Fxx[0].sCmn.indices.signalType >> 1 ]
589
0
                         [ psEnc->state_Fxx[0].sCmn.indices.quantOffsetType ];
590
0
    RESTORE_STACK;
591
0
    return ret;
592
0
}