Coverage Report

Created: 2025-11-16 07:20

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
/src/opus/silk/enc_API.c
Line
Count
Source
1
/***********************************************************************
2
Copyright (c) 2006-2011, Skype Limited. All rights reserved.
3
Redistribution and use in source and binary forms, with or without
4
modification, are permitted provided that the following conditions
5
are met:
6
- Redistributions of source code must retain the above copyright notice,
7
this list of conditions and the following disclaimer.
8
- Redistributions in binary form must reproduce the above copyright
9
notice, this list of conditions and the following disclaimer in the
10
documentation and/or other materials provided with the distribution.
11
- Neither the name of Internet Society, IETF or IETF Trust, nor the
12
names of specific contributors, may be used to endorse or promote
13
products derived from this software without specific prior written
14
permission.
15
THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
16
AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
17
IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
18
ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
19
LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
20
CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
21
SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
22
INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
23
CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
24
ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
25
POSSIBILITY OF SUCH DAMAGE.
26
***********************************************************************/
27
28
#ifdef HAVE_CONFIG_H
29
#include "config.h"
30
#endif
31
#include "define.h"
32
#include "API.h"
33
#include "control.h"
34
#include "typedef.h"
35
#include "stack_alloc.h"
36
#include "structs.h"
37
#include "tuning_parameters.h"
38
#ifdef FIXED_POINT
39
#include "main_FIX.h"
40
#else
41
#include "main_FLP.h"
42
#endif
43
44
#ifdef ENABLE_DRED
45
#include "dred_encoder.h"
46
#endif
47
48
/***************************************/
49
/* Read control structure from encoder */
50
/***************************************/
51
static opus_int silk_QueryEncoder(                      /* O    Returns error code                              */
52
    const void                      *encState,          /* I    State                                           */
53
    silk_EncControlStruct           *encStatus          /* O    Encoder Status                                  */
54
);
55
56
/****************************************/
57
/* Encoder functions                    */
58
/****************************************/
59
60
opus_int silk_Get_Encoder_Size(                         /* O    Returns error code                              */
61
    opus_int                        *encSizeBytes,      /* O    Number of bytes in SILK encoder state           */
62
    opus_int                         channels           /* I    Number of channels                              */
63
)
64
0
{
65
0
    opus_int ret = SILK_NO_ERROR;
66
67
0
    *encSizeBytes = sizeof( silk_encoder );
68
    /* Skip second encoder state for mono. */
69
0
    if ( channels == 1 ) {
70
0
        *encSizeBytes -= sizeof( silk_encoder_state_Fxx );
71
0
    }
72
73
0
    return ret;
74
0
}
75
76
/*************************/
77
/* Init or Reset encoder */
78
/*************************/
79
opus_int silk_InitEncoder(                              /* O    Returns error code                              */
80
    void                            *encState,          /* I/O  State                                           */
81
    int                              channels,          /* I    Number of channels                              */
82
    int                              arch,              /* I    Run-time architecture                           */
83
    silk_EncControlStruct           *encStatus          /* O    Encoder Status                                  */
84
)
85
0
{
86
0
    silk_encoder *psEnc;
87
0
    opus_int n, ret = SILK_NO_ERROR;
88
89
0
    psEnc = (silk_encoder *)encState;
90
91
    /* Reset encoder. Skip second encoder state for mono. */
92
0
    silk_memset( psEnc, 0, sizeof( silk_encoder ) - (channels==1)*sizeof( silk_encoder_state_Fxx ) );
93
0
    for( n = 0; n < channels; n++ ) {
94
0
        if( ret += silk_init_encoder( &psEnc->state_Fxx[ n ], arch ) ) {
95
0
            celt_assert( 0 );
96
0
        }
97
0
    }
98
99
0
    psEnc->nChannelsAPI = 1;
100
0
    psEnc->nChannelsInternal = 1;
101
102
    /* Read control structure */
103
0
    if( ret += silk_QueryEncoder( encState, encStatus ) ) {
104
0
        celt_assert( 0 );
105
0
    }
106
107
0
    return ret;
108
0
}
109
110
/***************************************/
111
/* Read control structure from encoder */
112
/***************************************/
113
static opus_int silk_QueryEncoder(                      /* O    Returns error code                              */
114
    const void                      *encState,          /* I    State                                           */
115
    silk_EncControlStruct           *encStatus          /* O    Encoder Status                                  */
116
)
117
0
{
118
0
    opus_int ret = SILK_NO_ERROR;
119
0
    silk_encoder_state_Fxx *state_Fxx;
120
0
    silk_encoder *psEnc = (silk_encoder *)encState;
121
122
0
    state_Fxx = psEnc->state_Fxx;
123
124
0
    encStatus->nChannelsAPI              = psEnc->nChannelsAPI;
125
0
    encStatus->nChannelsInternal         = psEnc->nChannelsInternal;
126
0
    encStatus->API_sampleRate            = state_Fxx[ 0 ].sCmn.API_fs_Hz;
127
0
    encStatus->maxInternalSampleRate     = state_Fxx[ 0 ].sCmn.maxInternal_fs_Hz;
128
0
    encStatus->minInternalSampleRate     = state_Fxx[ 0 ].sCmn.minInternal_fs_Hz;
129
0
    encStatus->desiredInternalSampleRate = state_Fxx[ 0 ].sCmn.desiredInternal_fs_Hz;
130
0
    encStatus->payloadSize_ms            = state_Fxx[ 0 ].sCmn.PacketSize_ms;
131
0
    encStatus->bitRate                   = state_Fxx[ 0 ].sCmn.TargetRate_bps;
132
0
    encStatus->packetLossPercentage      = state_Fxx[ 0 ].sCmn.PacketLoss_perc;
133
0
    encStatus->complexity                = state_Fxx[ 0 ].sCmn.Complexity;
134
0
    encStatus->useInBandFEC              = state_Fxx[ 0 ].sCmn.useInBandFEC;
135
0
    encStatus->useDTX                    = state_Fxx[ 0 ].sCmn.useDTX;
136
0
    encStatus->useCBR                    = state_Fxx[ 0 ].sCmn.useCBR;
137
0
    encStatus->internalSampleRate        = silk_SMULBB( state_Fxx[ 0 ].sCmn.fs_kHz, 1000 );
138
0
    encStatus->allowBandwidthSwitch      = state_Fxx[ 0 ].sCmn.allow_bandwidth_switch;
139
0
    encStatus->inWBmodeWithoutVariableLP = state_Fxx[ 0 ].sCmn.fs_kHz == 16 && state_Fxx[ 0 ].sCmn.sLP.mode == 0;
140
141
0
    return ret;
142
0
}
143
144
145
/**************************/
146
/* Encode frame with Silk */
147
/**************************/
148
/* Note: if prefillFlag is set, the input must contain 10 ms of audio, irrespective of what                     */
149
/* encControl->payloadSize_ms is set to                                                                         */
150
opus_int silk_Encode(                                   /* O    Returns error code                              */
151
    void                            *encState,          /* I/O  State                                           */
152
    silk_EncControlStruct           *encControl,        /* I    Control status                                  */
153
    const opus_res                  *samplesIn,         /* I    Speech sample input vector                      */
154
    opus_int                        nSamplesIn,         /* I    Number of samples in input vector               */
155
    ec_enc                          *psRangeEnc,        /* I/O  Compressor data structure                       */
156
    opus_int32                      *nBytesOut,         /* I/O  Number of bytes in payload (input: Max bytes)   */
157
    const opus_int                  prefillFlag,        /* I    Flag to indicate prefilling buffers no coding   */
158
    opus_int                        activity            /* I    Decision of Opus voice activity detector        */
159
)
160
0
{
161
0
    opus_int   n, i, nBits, flags, tmp_payloadSize_ms = 0, tmp_complexity = 0, ret = 0;
162
0
    opus_int   nSamplesToBuffer, nSamplesToBufferMax, nBlocksOf10ms;
163
0
    opus_int   nSamplesFromInput = 0, nSamplesFromInputMax;
164
0
    opus_int   speech_act_thr_for_switch_Q8;
165
0
    opus_int32 TargetRate_bps, MStargetRates_bps[ 2 ], channelRate_bps, LBRR_symbol, sum;
166
0
    silk_encoder *psEnc = ( silk_encoder * )encState;
167
0
    VARDECL( opus_int16, buf );
168
0
    opus_int transition, curr_block, tot_blocks;
169
0
    SAVE_STACK;
170
171
0
    celt_assert( encControl->nChannelsAPI >= encControl->nChannelsInternal && encControl->nChannelsAPI >= psEnc->nChannelsInternal );
172
0
    if (encControl->reducedDependency)
173
0
    {
174
0
       for( n = 0; n < encControl->nChannelsAPI; n++ ) {
175
0
           psEnc->state_Fxx[ n ].sCmn.first_frame_after_reset = 1;
176
0
       }
177
0
    }
178
0
    for( n = 0; n < encControl->nChannelsAPI; n++ ) {
179
0
        psEnc->state_Fxx[ n ].sCmn.nFramesEncoded = 0;
180
0
    }
181
    /* Check values in encoder control structure */
182
0
    if( ( ret = check_control_input( encControl ) ) != 0 ) {
183
0
        celt_assert( 0 );
184
0
        RESTORE_STACK;
185
0
        return ret;
186
0
    }
187
188
0
    encControl->switchReady = 0;
189
190
0
    if( encControl->nChannelsInternal > psEnc->nChannelsInternal ) {
191
        /* Mono -> Stereo transition: init state of second channel and stereo state */
192
0
        ret += silk_init_encoder( &psEnc->state_Fxx[ 1 ], psEnc->state_Fxx[ 0 ].sCmn.arch );
193
0
        silk_memset( psEnc->sStereo.pred_prev_Q13, 0, sizeof( psEnc->sStereo.pred_prev_Q13 ) );
194
0
        silk_memset( psEnc->sStereo.sSide, 0, sizeof( psEnc->sStereo.sSide ) );
195
0
        psEnc->sStereo.mid_side_amp_Q0[ 0 ] = 0;
196
0
        psEnc->sStereo.mid_side_amp_Q0[ 1 ] = 1;
197
0
        psEnc->sStereo.mid_side_amp_Q0[ 2 ] = 0;
198
0
        psEnc->sStereo.mid_side_amp_Q0[ 3 ] = 1;
199
0
        psEnc->sStereo.width_prev_Q14 = 0;
200
0
        psEnc->sStereo.smth_width_Q14 = SILK_FIX_CONST( 1, 14 );
201
0
        if( psEnc->nChannelsAPI == 2 ) {
202
0
            silk_memcpy( &psEnc->state_Fxx[ 1 ].sCmn.resampler_state, &psEnc->state_Fxx[ 0 ].sCmn.resampler_state, sizeof( silk_resampler_state_struct ) );
203
0
            silk_memcpy( &psEnc->state_Fxx[ 1 ].sCmn.In_HP_State,     &psEnc->state_Fxx[ 0 ].sCmn.In_HP_State,     sizeof( psEnc->state_Fxx[ 1 ].sCmn.In_HP_State ) );
204
0
        }
205
0
    }
206
207
0
    transition = (encControl->payloadSize_ms != psEnc->state_Fxx[ 0 ].sCmn.PacketSize_ms) || (psEnc->nChannelsInternal != encControl->nChannelsInternal);
208
209
0
    psEnc->nChannelsAPI = encControl->nChannelsAPI;
210
0
    psEnc->nChannelsInternal = encControl->nChannelsInternal;
211
212
0
    nBlocksOf10ms = silk_DIV32( 100 * nSamplesIn, encControl->API_sampleRate );
213
0
    tot_blocks = ( nBlocksOf10ms > 1 ) ? nBlocksOf10ms >> 1 : 1;
214
0
    curr_block = 0;
215
0
    if( prefillFlag ) {
216
0
        silk_LP_state save_LP;
217
        /* Only accept input length of 10 ms */
218
0
        if( nBlocksOf10ms != 1 ) {
219
0
            celt_assert( 0 );
220
0
            RESTORE_STACK;
221
0
            return SILK_ENC_INPUT_INVALID_NO_OF_SAMPLES;
222
0
        }
223
0
        if ( prefillFlag == 2 ) {
224
0
            save_LP = psEnc->state_Fxx[ 0 ].sCmn.sLP;
225
            /* Save the sampling rate so the bandwidth switching code can keep handling transitions. */
226
0
            save_LP.saved_fs_kHz = psEnc->state_Fxx[ 0 ].sCmn.fs_kHz;
227
0
        }
228
        /* Reset Encoder */
229
0
        for( n = 0; n < encControl->nChannelsInternal; n++ ) {
230
0
            ret = silk_init_encoder( &psEnc->state_Fxx[ n ], psEnc->state_Fxx[ n ].sCmn.arch );
231
            /* Restore the variable LP state. */
232
0
            if ( prefillFlag == 2 ) {
233
0
                psEnc->state_Fxx[ n ].sCmn.sLP = save_LP;
234
0
            }
235
0
            celt_assert( !ret );
236
0
        }
237
0
        tmp_payloadSize_ms = encControl->payloadSize_ms;
238
0
        encControl->payloadSize_ms = 10;
239
0
        tmp_complexity = encControl->complexity;
240
0
        encControl->complexity = 0;
241
0
        for( n = 0; n < encControl->nChannelsInternal; n++ ) {
242
0
            psEnc->state_Fxx[ n ].sCmn.controlled_since_last_payload = 0;
243
0
            psEnc->state_Fxx[ n ].sCmn.prefillFlag = 1;
244
0
        }
245
0
    } else {
246
        /* Only accept input lengths that are a multiple of 10 ms */
247
0
        if( nBlocksOf10ms * encControl->API_sampleRate != 100 * nSamplesIn || nSamplesIn < 0 ) {
248
0
            celt_assert( 0 );
249
0
            RESTORE_STACK;
250
0
            return SILK_ENC_INPUT_INVALID_NO_OF_SAMPLES;
251
0
        }
252
        /* Make sure no more than one packet can be produced */
253
0
        if( 1000 * (opus_int32)nSamplesIn > encControl->payloadSize_ms * encControl->API_sampleRate ) {
254
0
            celt_assert( 0 );
255
0
            RESTORE_STACK;
256
0
            return SILK_ENC_INPUT_INVALID_NO_OF_SAMPLES;
257
0
        }
258
0
    }
259
260
0
    for( n = 0; n < encControl->nChannelsInternal; n++ ) {
261
        /* Force the side channel to the same rate as the mid */
262
0
        opus_int force_fs_kHz = (n==1) ? psEnc->state_Fxx[0].sCmn.fs_kHz : 0;
263
0
        if( ( ret = silk_control_encoder( &psEnc->state_Fxx[ n ], encControl, psEnc->allowBandwidthSwitch, n, force_fs_kHz ) ) != 0 ) {
264
0
            silk_assert( 0 );
265
0
            RESTORE_STACK;
266
0
            return ret;
267
0
        }
268
0
        if( psEnc->state_Fxx[n].sCmn.first_frame_after_reset || transition ) {
269
0
            for( i = 0; i < psEnc->state_Fxx[ 0 ].sCmn.nFramesPerPacket; i++ ) {
270
0
                psEnc->state_Fxx[ n ].sCmn.LBRR_flags[ i ] = 0;
271
0
            }
272
0
        }
273
0
        psEnc->state_Fxx[ n ].sCmn.inDTX = psEnc->state_Fxx[ n ].sCmn.useDTX;
274
0
    }
275
0
    celt_assert( encControl->nChannelsInternal == 1 || psEnc->state_Fxx[ 0 ].sCmn.fs_kHz == psEnc->state_Fxx[ 1 ].sCmn.fs_kHz );
276
277
    /* Input buffering/resampling and encoding */
278
0
    nSamplesToBufferMax =
279
0
        10 * nBlocksOf10ms * psEnc->state_Fxx[ 0 ].sCmn.fs_kHz;
280
0
    nSamplesFromInputMax =
281
0
        silk_DIV32_16( nSamplesToBufferMax *
282
0
                           psEnc->state_Fxx[ 0 ].sCmn.API_fs_Hz,
283
0
                       psEnc->state_Fxx[ 0 ].sCmn.fs_kHz * 1000 );
284
0
    ALLOC( buf, nSamplesFromInputMax, opus_int16 );
285
0
    while( 1 ) {
286
0
        int curr_nBitsUsedLBRR = 0;
287
0
        nSamplesToBuffer  = psEnc->state_Fxx[ 0 ].sCmn.frame_length - psEnc->state_Fxx[ 0 ].sCmn.inputBufIx;
288
0
        nSamplesToBuffer  = silk_min( nSamplesToBuffer, nSamplesToBufferMax );
289
0
        nSamplesFromInput = silk_DIV32_16( nSamplesToBuffer * psEnc->state_Fxx[ 0 ].sCmn.API_fs_Hz, psEnc->state_Fxx[ 0 ].sCmn.fs_kHz * 1000 );
290
        /* Resample and write to buffer */
291
0
        if( encControl->nChannelsAPI == 2 && encControl->nChannelsInternal == 2 ) {
292
0
            opus_int id = psEnc->state_Fxx[ 0 ].sCmn.nFramesEncoded;
293
0
            for( n = 0; n < nSamplesFromInput; n++ ) {
294
0
                buf[ n ] = RES2INT16(samplesIn[ 2 * n ]);
295
0
            }
296
            /* Making sure to start both resamplers from the same state when switching from mono to stereo */
297
0
            if( psEnc->nPrevChannelsInternal == 1 && id==0 ) {
298
0
               silk_memcpy( &psEnc->state_Fxx[ 1 ].sCmn.resampler_state, &psEnc->state_Fxx[ 0 ].sCmn.resampler_state, sizeof(psEnc->state_Fxx[ 1 ].sCmn.resampler_state));
299
0
            }
300
301
0
            ret += silk_resampler( &psEnc->state_Fxx[ 0 ].sCmn.resampler_state,
302
0
                &psEnc->state_Fxx[ 0 ].sCmn.inputBuf[ psEnc->state_Fxx[ 0 ].sCmn.inputBufIx + 2 ], buf, nSamplesFromInput );
303
0
            psEnc->state_Fxx[ 0 ].sCmn.inputBufIx += nSamplesToBuffer;
304
305
0
            nSamplesToBuffer  = psEnc->state_Fxx[ 1 ].sCmn.frame_length - psEnc->state_Fxx[ 1 ].sCmn.inputBufIx;
306
0
            nSamplesToBuffer  = silk_min( nSamplesToBuffer, 10 * nBlocksOf10ms * psEnc->state_Fxx[ 1 ].sCmn.fs_kHz );
307
0
            for( n = 0; n < nSamplesFromInput; n++ ) {
308
0
                buf[ n ] = RES2INT16(samplesIn[ 2 * n + 1 ]);
309
0
            }
310
0
            ret += silk_resampler( &psEnc->state_Fxx[ 1 ].sCmn.resampler_state,
311
0
                &psEnc->state_Fxx[ 1 ].sCmn.inputBuf[ psEnc->state_Fxx[ 1 ].sCmn.inputBufIx + 2 ], buf, nSamplesFromInput );
312
313
0
            psEnc->state_Fxx[ 1 ].sCmn.inputBufIx += nSamplesToBuffer;
314
0
        } else if( encControl->nChannelsAPI == 2 && encControl->nChannelsInternal == 1 ) {
315
            /* Combine left and right channels before resampling */
316
0
            for( n = 0; n < nSamplesFromInput; n++ ) {
317
0
                sum = RES2INT16(samplesIn[ 2 * n ] + samplesIn[ 2 * n + 1 ]);
318
0
                buf[ n ] = (opus_int16)silk_RSHIFT_ROUND( sum,  1 );
319
0
            }
320
0
            ret += silk_resampler( &psEnc->state_Fxx[ 0 ].sCmn.resampler_state,
321
0
                &psEnc->state_Fxx[ 0 ].sCmn.inputBuf[ psEnc->state_Fxx[ 0 ].sCmn.inputBufIx + 2 ], buf, nSamplesFromInput );
322
            /* On the first mono frame, average the results for the two resampler states  */
323
0
            if( psEnc->nPrevChannelsInternal == 2 && psEnc->state_Fxx[ 0 ].sCmn.nFramesEncoded == 0 ) {
324
0
               ret += silk_resampler( &psEnc->state_Fxx[ 1 ].sCmn.resampler_state,
325
0
                   &psEnc->state_Fxx[ 1 ].sCmn.inputBuf[ psEnc->state_Fxx[ 1 ].sCmn.inputBufIx + 2 ], buf, nSamplesFromInput );
326
0
               for( n = 0; n < psEnc->state_Fxx[ 0 ].sCmn.frame_length; n++ ) {
327
0
                  psEnc->state_Fxx[ 0 ].sCmn.inputBuf[ psEnc->state_Fxx[ 0 ].sCmn.inputBufIx+n+2 ] =
328
0
                        silk_RSHIFT(psEnc->state_Fxx[ 0 ].sCmn.inputBuf[ psEnc->state_Fxx[ 0 ].sCmn.inputBufIx+n+2 ]
329
0
                                  + psEnc->state_Fxx[ 1 ].sCmn.inputBuf[ psEnc->state_Fxx[ 1 ].sCmn.inputBufIx+n+2 ], 1);
330
0
               }
331
0
            }
332
0
            psEnc->state_Fxx[ 0 ].sCmn.inputBufIx += nSamplesToBuffer;
333
0
        } else {
334
0
            celt_assert( encControl->nChannelsAPI == 1 && encControl->nChannelsInternal == 1 );
335
0
            for( n = 0; n < nSamplesFromInput; n++ ) {
336
0
                buf[n] = RES2INT16(samplesIn[n]);
337
0
            }
338
0
            ret += silk_resampler( &psEnc->state_Fxx[ 0 ].sCmn.resampler_state,
339
0
                &psEnc->state_Fxx[ 0 ].sCmn.inputBuf[ psEnc->state_Fxx[ 0 ].sCmn.inputBufIx + 2 ], buf, nSamplesFromInput );
340
0
            psEnc->state_Fxx[ 0 ].sCmn.inputBufIx += nSamplesToBuffer;
341
0
        }
342
343
0
        samplesIn  += nSamplesFromInput * encControl->nChannelsAPI;
344
0
        nSamplesIn -= nSamplesFromInput;
345
346
        /* Default */
347
0
        psEnc->allowBandwidthSwitch = 0;
348
349
        /* Silk encoder */
350
0
        if( psEnc->state_Fxx[ 0 ].sCmn.inputBufIx >= psEnc->state_Fxx[ 0 ].sCmn.frame_length ) {
351
            /* Enough data in input buffer, so encode */
352
0
            celt_assert( psEnc->state_Fxx[ 0 ].sCmn.inputBufIx == psEnc->state_Fxx[ 0 ].sCmn.frame_length );
353
0
            celt_assert( encControl->nChannelsInternal == 1 || psEnc->state_Fxx[ 1 ].sCmn.inputBufIx == psEnc->state_Fxx[ 1 ].sCmn.frame_length );
354
355
            /* Deal with LBRR data */
356
0
            if( psEnc->state_Fxx[ 0 ].sCmn.nFramesEncoded == 0 && !prefillFlag ) {
357
                /* Create space at start of payload for VAD and FEC flags */
358
0
                opus_uint8 iCDF[ 2 ] = { 0, 0 };
359
0
                iCDF[ 0 ] = 256 - silk_RSHIFT( 256, ( psEnc->state_Fxx[ 0 ].sCmn.nFramesPerPacket + 1 ) * encControl->nChannelsInternal );
360
0
                ec_enc_icdf( psRangeEnc, 0, iCDF, 8 );
361
0
                curr_nBitsUsedLBRR = ec_tell( psRangeEnc );
362
363
                /* Encode any LBRR data from previous packet */
364
                /* Encode LBRR flags */
365
0
                for( n = 0; n < encControl->nChannelsInternal; n++ ) {
366
0
                    LBRR_symbol = 0;
367
0
                    for( i = 0; i < psEnc->state_Fxx[ n ].sCmn.nFramesPerPacket; i++ ) {
368
0
                        LBRR_symbol |= silk_LSHIFT( psEnc->state_Fxx[ n ].sCmn.LBRR_flags[ i ], i );
369
0
                    }
370
0
                    psEnc->state_Fxx[ n ].sCmn.LBRR_flag = LBRR_symbol > 0 ? 1 : 0;
371
0
                    if( LBRR_symbol && psEnc->state_Fxx[ n ].sCmn.nFramesPerPacket > 1 ) {
372
0
                        ec_enc_icdf( psRangeEnc, LBRR_symbol - 1, silk_LBRR_flags_iCDF_ptr[ psEnc->state_Fxx[ n ].sCmn.nFramesPerPacket - 2 ], 8 );
373
0
                    }
374
0
                }
375
376
                /* Code LBRR indices and excitation signals */
377
0
                for( i = 0; i < psEnc->state_Fxx[ 0 ].sCmn.nFramesPerPacket; i++ ) {
378
0
                    for( n = 0; n < encControl->nChannelsInternal; n++ ) {
379
0
                        if( psEnc->state_Fxx[ n ].sCmn.LBRR_flags[ i ] ) {
380
0
                            opus_int condCoding;
381
382
0
                            if( encControl->nChannelsInternal == 2 && n == 0 ) {
383
0
                                silk_stereo_encode_pred( psRangeEnc, psEnc->sStereo.predIx[ i ] );
384
                                /* For LBRR data there's no need to code the mid-only flag if the side-channel LBRR flag is set */
385
0
                                if( psEnc->state_Fxx[ 1 ].sCmn.LBRR_flags[ i ] == 0 ) {
386
0
                                    silk_stereo_encode_mid_only( psRangeEnc, psEnc->sStereo.mid_only_flags[ i ] );
387
0
                                }
388
0
                            }
389
                            /* Use conditional coding if previous frame available */
390
0
                            if( i > 0 && psEnc->state_Fxx[ n ].sCmn.LBRR_flags[ i - 1 ] ) {
391
0
                                condCoding = CODE_CONDITIONALLY;
392
0
                            } else {
393
0
                                condCoding = CODE_INDEPENDENTLY;
394
0
                            }
395
0
                            silk_encode_indices( &psEnc->state_Fxx[ n ].sCmn, psRangeEnc, i, 1, condCoding );
396
0
                            silk_encode_pulses( psRangeEnc, psEnc->state_Fxx[ n ].sCmn.indices_LBRR[i].signalType, psEnc->state_Fxx[ n ].sCmn.indices_LBRR[i].quantOffsetType,
397
0
                                psEnc->state_Fxx[ n ].sCmn.pulses_LBRR[ i ], psEnc->state_Fxx[ n ].sCmn.frame_length );
398
0
                        }
399
0
                    }
400
0
                }
401
402
                /* Reset LBRR flags */
403
0
                for( n = 0; n < encControl->nChannelsInternal; n++ ) {
404
0
                    silk_memset( psEnc->state_Fxx[ n ].sCmn.LBRR_flags, 0, sizeof( psEnc->state_Fxx[ n ].sCmn.LBRR_flags ) );
405
0
                }
406
0
                curr_nBitsUsedLBRR = ec_tell( psRangeEnc ) - curr_nBitsUsedLBRR;
407
0
            }
408
409
0
            silk_HP_variable_cutoff( psEnc->state_Fxx );
410
411
            /* Total target bits for packet */
412
0
            nBits = silk_DIV32_16( silk_MUL( encControl->bitRate, encControl->payloadSize_ms ), 1000 );
413
            /* Subtract bits used for LBRR */
414
0
            if( !prefillFlag ) {
415
                /* psEnc->nBitsUsedLBRR is an exponential moving average of the LBRR usage,
416
                   except that for the first LBRR frame it does no averaging and for the first
417
                   frame after after LBRR, it goes back to zero immediately. */
418
0
                if ( curr_nBitsUsedLBRR < 10 ) {
419
0
                    psEnc->nBitsUsedLBRR = 0;
420
0
                } else if ( psEnc->nBitsUsedLBRR < 10) {
421
0
                    psEnc->nBitsUsedLBRR = curr_nBitsUsedLBRR;
422
0
                } else {
423
0
                    psEnc->nBitsUsedLBRR = ( psEnc->nBitsUsedLBRR + curr_nBitsUsedLBRR ) / 2;
424
0
                }
425
0
                nBits -= psEnc->nBitsUsedLBRR;
426
0
            }
427
            /* Divide by number of uncoded frames left in packet */
428
0
            nBits = silk_DIV32_16( nBits, psEnc->state_Fxx[ 0 ].sCmn.nFramesPerPacket );
429
            /* Convert to bits/second */
430
0
            if( encControl->payloadSize_ms == 10 ) {
431
0
                TargetRate_bps = silk_SMULBB( nBits, 100 );
432
0
            } else {
433
0
                TargetRate_bps = silk_SMULBB( nBits, 50 );
434
0
            }
435
            /* Subtract fraction of bits in excess of target in previous frames and packets */
436
0
            TargetRate_bps -= silk_DIV32_16( silk_MUL( psEnc->nBitsExceeded, 1000 ), BITRESERVOIR_DECAY_TIME_MS );
437
0
            if( !prefillFlag && psEnc->state_Fxx[ 0 ].sCmn.nFramesEncoded > 0 ) {
438
                /* Compare actual vs target bits so far in this packet */
439
0
                opus_int32 bitsBalance = ec_tell( psRangeEnc ) - psEnc->nBitsUsedLBRR - nBits * psEnc->state_Fxx[ 0 ].sCmn.nFramesEncoded;
440
0
                TargetRate_bps -= silk_DIV32_16( silk_MUL( bitsBalance, 1000 ), BITRESERVOIR_DECAY_TIME_MS );
441
0
            }
442
            /* Never exceed input bitrate */
443
0
            TargetRate_bps = silk_LIMIT( TargetRate_bps, encControl->bitRate, 5000 );
444
445
            /* Convert Left/Right to Mid/Side */
446
0
            if( encControl->nChannelsInternal == 2 ) {
447
0
                silk_stereo_LR_to_MS( &psEnc->sStereo, &psEnc->state_Fxx[ 0 ].sCmn.inputBuf[ 2 ], &psEnc->state_Fxx[ 1 ].sCmn.inputBuf[ 2 ],
448
0
                    psEnc->sStereo.predIx[ psEnc->state_Fxx[ 0 ].sCmn.nFramesEncoded ], &psEnc->sStereo.mid_only_flags[ psEnc->state_Fxx[ 0 ].sCmn.nFramesEncoded ],
449
0
                    MStargetRates_bps, TargetRate_bps, psEnc->state_Fxx[ 0 ].sCmn.speech_activity_Q8, encControl->toMono,
450
0
                    psEnc->state_Fxx[ 0 ].sCmn.fs_kHz, psEnc->state_Fxx[ 0 ].sCmn.frame_length );
451
0
                if( psEnc->sStereo.mid_only_flags[ psEnc->state_Fxx[ 0 ].sCmn.nFramesEncoded ] == 0 ) {
452
                    /* Reset side channel encoder memory for first frame with side coding */
453
0
                    if( psEnc->prev_decode_only_middle == 1 ) {
454
0
                        silk_memset( &psEnc->state_Fxx[ 1 ].sShape,               0, sizeof( psEnc->state_Fxx[ 1 ].sShape ) );
455
0
                        silk_memset( &psEnc->state_Fxx[ 1 ].sCmn.sNSQ,            0, sizeof( psEnc->state_Fxx[ 1 ].sCmn.sNSQ ) );
456
0
                        silk_memset( psEnc->state_Fxx[ 1 ].sCmn.prev_NLSFq_Q15,   0, sizeof( psEnc->state_Fxx[ 1 ].sCmn.prev_NLSFq_Q15 ) );
457
0
                        silk_memset( &psEnc->state_Fxx[ 1 ].sCmn.sLP.In_LP_State, 0, sizeof( psEnc->state_Fxx[ 1 ].sCmn.sLP.In_LP_State ) );
458
0
                        psEnc->state_Fxx[ 1 ].sCmn.prevLag                 = 100;
459
0
                        psEnc->state_Fxx[ 1 ].sCmn.sNSQ.lagPrev            = 100;
460
0
                        psEnc->state_Fxx[ 1 ].sShape.LastGainIndex         = 10;
461
0
                        psEnc->state_Fxx[ 1 ].sCmn.prevSignalType          = TYPE_NO_VOICE_ACTIVITY;
462
0
                        psEnc->state_Fxx[ 1 ].sCmn.sNSQ.prev_gain_Q16      = 65536;
463
0
                        psEnc->state_Fxx[ 1 ].sCmn.first_frame_after_reset = 1;
464
0
                    }
465
0
                    silk_encode_do_VAD_Fxx( &psEnc->state_Fxx[ 1 ], activity );
466
0
                } else {
467
0
                    psEnc->state_Fxx[ 1 ].sCmn.VAD_flags[ psEnc->state_Fxx[ 0 ].sCmn.nFramesEncoded ] = 0;
468
0
                }
469
0
                if( !prefillFlag ) {
470
0
                    silk_stereo_encode_pred( psRangeEnc, psEnc->sStereo.predIx[ psEnc->state_Fxx[ 0 ].sCmn.nFramesEncoded ] );
471
0
                    if( psEnc->state_Fxx[ 1 ].sCmn.VAD_flags[ psEnc->state_Fxx[ 0 ].sCmn.nFramesEncoded ] == 0 ) {
472
0
                        silk_stereo_encode_mid_only( psRangeEnc, psEnc->sStereo.mid_only_flags[ psEnc->state_Fxx[ 0 ].sCmn.nFramesEncoded ] );
473
0
                    }
474
0
                }
475
0
            } else {
476
                /* Buffering */
477
0
                silk_memcpy( psEnc->state_Fxx[ 0 ].sCmn.inputBuf, psEnc->sStereo.sMid, 2 * sizeof( opus_int16 ) );
478
0
                silk_memcpy( psEnc->sStereo.sMid, &psEnc->state_Fxx[ 0 ].sCmn.inputBuf[ psEnc->state_Fxx[ 0 ].sCmn.frame_length ], 2 * sizeof( opus_int16 ) );
479
0
            }
480
0
            silk_encode_do_VAD_Fxx( &psEnc->state_Fxx[ 0 ], activity );
481
482
            /* Encode */
483
0
            for( n = 0; n < encControl->nChannelsInternal; n++ ) {
484
0
                opus_int maxBits, useCBR;
485
486
                /* Handling rate constraints */
487
0
                maxBits = encControl->maxBits;
488
0
                if( tot_blocks == 2 && curr_block == 0 ) {
489
0
                    maxBits = maxBits * 3 / 5;
490
0
                } else if( tot_blocks == 3 ) {
491
0
                    if( curr_block == 0 ) {
492
0
                        maxBits = maxBits * 2 / 5;
493
0
                    } else if( curr_block == 1 ) {
494
0
                        maxBits = maxBits * 3 / 4;
495
0
                    }
496
0
                }
497
0
                useCBR = encControl->useCBR && curr_block == tot_blocks - 1;
498
499
0
                if( encControl->nChannelsInternal == 1 ) {
500
0
                    channelRate_bps = TargetRate_bps;
501
0
                } else {
502
0
                    channelRate_bps = MStargetRates_bps[ n ];
503
0
                    if( n == 0 && MStargetRates_bps[ 1 ] > 0 ) {
504
0
                        useCBR = 0;
505
                        /* Give mid up to 1/2 of the max bits for that frame */
506
0
                        maxBits -= encControl->maxBits / ( tot_blocks * 2 );
507
0
                    }
508
0
                }
509
510
0
                if( channelRate_bps > 0 ) {
511
0
                    opus_int condCoding;
512
513
0
                    silk_control_SNR( &psEnc->state_Fxx[ n ].sCmn, channelRate_bps );
514
515
                    /* Use independent coding if no previous frame available */
516
0
                    if( psEnc->state_Fxx[ 0 ].sCmn.nFramesEncoded - n <= 0 ) {
517
0
                        condCoding = CODE_INDEPENDENTLY;
518
0
                    } else if( n > 0 && psEnc->prev_decode_only_middle ) {
519
                        /* If we skipped a side frame in this packet, we don't
520
                           need LTP scaling; the LTP state is well-defined. */
521
0
                        condCoding = CODE_INDEPENDENTLY_NO_LTP_SCALING;
522
0
                    } else {
523
0
                        condCoding = CODE_CONDITIONALLY;
524
0
                    }
525
0
                    if( ( ret = silk_encode_frame_Fxx( &psEnc->state_Fxx[ n ], nBytesOut, psRangeEnc, condCoding, maxBits, useCBR ) ) != 0 ) {
526
0
                        silk_assert( 0 );
527
0
                    }
528
0
                }
529
0
                psEnc->state_Fxx[ n ].sCmn.controlled_since_last_payload = 0;
530
0
                psEnc->state_Fxx[ n ].sCmn.inputBufIx = 0;
531
0
                psEnc->state_Fxx[ n ].sCmn.nFramesEncoded++;
532
0
            }
533
0
            psEnc->prev_decode_only_middle = psEnc->sStereo.mid_only_flags[ psEnc->state_Fxx[ 0 ].sCmn.nFramesEncoded - 1 ];
534
535
            /* Insert VAD and FEC flags at beginning of bitstream */
536
0
            if( *nBytesOut > 0 && psEnc->state_Fxx[ 0 ].sCmn.nFramesEncoded == psEnc->state_Fxx[ 0 ].sCmn.nFramesPerPacket) {
537
0
                flags = 0;
538
0
                for( n = 0; n < encControl->nChannelsInternal; n++ ) {
539
0
                    for( i = 0; i < psEnc->state_Fxx[ n ].sCmn.nFramesPerPacket; i++ ) {
540
0
                        flags  = silk_LSHIFT( flags, 1 );
541
0
                        flags |= psEnc->state_Fxx[ n ].sCmn.VAD_flags[ i ];
542
0
                    }
543
0
                    flags  = silk_LSHIFT( flags, 1 );
544
0
                    flags |= psEnc->state_Fxx[ n ].sCmn.LBRR_flag;
545
0
                }
546
0
                if( !prefillFlag ) {
547
0
                    ec_enc_patch_initial_bits( psRangeEnc, flags, ( psEnc->state_Fxx[ 0 ].sCmn.nFramesPerPacket + 1 ) * encControl->nChannelsInternal );
548
0
                }
549
550
                /* Return zero bytes if all channels DTXed */
551
0
                if( psEnc->state_Fxx[ 0 ].sCmn.inDTX && ( encControl->nChannelsInternal == 1 || psEnc->state_Fxx[ 1 ].sCmn.inDTX ) ) {
552
0
                    *nBytesOut = 0;
553
0
                }
554
555
0
                psEnc->nBitsExceeded += *nBytesOut * 8;
556
0
                psEnc->nBitsExceeded -= silk_DIV32_16( silk_MUL( encControl->bitRate, encControl->payloadSize_ms ), 1000 );
557
0
                psEnc->nBitsExceeded  = silk_LIMIT( psEnc->nBitsExceeded, 0, 10000 );
558
559
                /* Update flag indicating if bandwidth switching is allowed */
560
0
                speech_act_thr_for_switch_Q8 = silk_SMLAWB( SILK_FIX_CONST( SPEECH_ACTIVITY_DTX_THRES, 8 ),
561
0
                    SILK_FIX_CONST( ( 1 - SPEECH_ACTIVITY_DTX_THRES ) / MAX_BANDWIDTH_SWITCH_DELAY_MS, 16 + 8 ), psEnc->timeSinceSwitchAllowed_ms );
562
0
                if( psEnc->state_Fxx[ 0 ].sCmn.speech_activity_Q8 < speech_act_thr_for_switch_Q8 ) {
563
0
                    psEnc->allowBandwidthSwitch = 1;
564
0
                    psEnc->timeSinceSwitchAllowed_ms = 0;
565
0
                } else {
566
0
                    psEnc->allowBandwidthSwitch = 0;
567
0
                    psEnc->timeSinceSwitchAllowed_ms += encControl->payloadSize_ms;
568
0
                }
569
0
            }
570
571
0
            if( nSamplesIn == 0 ) {
572
0
                break;
573
0
            }
574
0
        } else {
575
0
            break;
576
0
        }
577
0
        curr_block++;
578
0
    }
579
580
0
    psEnc->nPrevChannelsInternal = encControl->nChannelsInternal;
581
582
0
    encControl->allowBandwidthSwitch = psEnc->allowBandwidthSwitch;
583
0
    encControl->inWBmodeWithoutVariableLP = psEnc->state_Fxx[ 0 ].sCmn.fs_kHz == 16 && psEnc->state_Fxx[ 0 ].sCmn.sLP.mode == 0;
584
0
    encControl->internalSampleRate = silk_SMULBB( psEnc->state_Fxx[ 0 ].sCmn.fs_kHz, 1000 );
585
0
    encControl->stereoWidth_Q14 = encControl->toMono ? 0 : psEnc->sStereo.smth_width_Q14;
586
0
    if( prefillFlag ) {
587
0
        encControl->payloadSize_ms = tmp_payloadSize_ms;
588
0
        encControl->complexity = tmp_complexity;
589
0
        for( n = 0; n < encControl->nChannelsInternal; n++ ) {
590
0
            psEnc->state_Fxx[ n ].sCmn.controlled_since_last_payload = 0;
591
0
            psEnc->state_Fxx[ n ].sCmn.prefillFlag = 0;
592
0
        }
593
0
    }
594
595
0
    encControl->signalType = psEnc->state_Fxx[0].sCmn.indices.signalType;
596
0
    encControl->offset = silk_Quantization_Offsets_Q10
597
0
                         [ psEnc->state_Fxx[0].sCmn.indices.signalType >> 1 ]
598
0
                         [ psEnc->state_Fxx[0].sCmn.indices.quantOffsetType ];
599
0
    RESTORE_STACK;
600
0
    return ret;
601
0
}