Coverage Report

Created: 2026-02-26 07:37

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
/src/opus/celt/celt.c
Line
Count
Source
1
/* Copyright (c) 2007-2008 CSIRO
2
   Copyright (c) 2007-2010 Xiph.Org Foundation
3
   Copyright (c) 2008 Gregory Maxwell
4
   Written by Jean-Marc Valin and Gregory Maxwell */
5
/*
6
   Redistribution and use in source and binary forms, with or without
7
   modification, are permitted provided that the following conditions
8
   are met:
9
10
   - Redistributions of source code must retain the above copyright
11
   notice, this list of conditions and the following disclaimer.
12
13
   - Redistributions in binary form must reproduce the above copyright
14
   notice, this list of conditions and the following disclaimer in the
15
   documentation and/or other materials provided with the distribution.
16
17
   THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
18
   ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
19
   LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
20
   A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER
21
   OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
22
   EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
23
   PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
24
   PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
25
   LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
26
   NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
27
   SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
28
*/
29
30
#ifdef HAVE_CONFIG_H
31
#include "config.h"
32
#endif
33
34
#define CELT_C
35
36
#include "os_support.h"
37
#include "mdct.h"
38
#include <math.h>
39
#include "celt.h"
40
#include "pitch.h"
41
#include "bands.h"
42
#include "modes.h"
43
#include "entcode.h"
44
#include "quant_bands.h"
45
#include "rate.h"
46
#include "stack_alloc.h"
47
#include "mathops.h"
48
#include "float_cast.h"
49
#include <stdarg.h>
50
#include "celt_lpc.h"
51
#include "vq.h"
52
53
#ifndef PACKAGE_VERSION
54
#define PACKAGE_VERSION "unknown"
55
#endif
56
57
#if defined(FIXED_POINT) && defined(__mips)
58
#include "mips/celt_mipsr1.h"
59
#endif
60
61
62
int resampling_factor(opus_int32 rate)
63
4.31k
{
64
4.31k
   int ret;
65
4.31k
   switch (rate)
66
4.31k
   {
67
#ifdef ENABLE_QEXT
68
   case 96000:
69
#endif
70
742
   case 48000:
71
742
      ret = 1;
72
742
      break;
73
702
   case 24000:
74
702
      ret = 2;
75
702
      break;
76
849
   case 16000:
77
849
      ret = 3;
78
849
      break;
79
589
   case 12000:
80
589
      ret = 4;
81
589
      break;
82
1.43k
   case 8000:
83
1.43k
      ret = 6;
84
1.43k
      break;
85
0
   default:
86
0
#ifndef CUSTOM_MODES
87
0
      celt_assert(0);
88
0
#endif
89
0
      ret = 0;
90
0
      break;
91
4.31k
   }
92
4.31k
   return ret;
93
4.31k
}
94
95
96
#if !defined(OVERRIDE_COMB_FILTER_CONST) || defined(NON_STATIC_COMB_FILTER_CONST_C)
97
/* This version should be faster on ARM */
98
#ifdef OPUS_ARM_ASM
99
#ifndef NON_STATIC_COMB_FILTER_CONST_C
100
static
101
#endif
102
void comb_filter_const_c(opus_val32 *y, opus_val32 *x, int T, int N,
103
      celt_coef g10, celt_coef g11, celt_coef g12)
104
{
105
   opus_val32 x0, x1, x2, x3, x4;
106
   int i;
107
   x4 = SHL32(x[-T-2], 1);
108
   x3 = SHL32(x[-T-1], 1);
109
   x2 = SHL32(x[-T], 1);
110
   x1 = SHL32(x[-T+1], 1);
111
   for (i=0;i<N-4;i+=5)
112
   {
113
      opus_val32 t;
114
      x0=SHL32(x[i-T+2],1);
115
      t = MAC_COEF_32_ARM(x[i], g10, x2);
116
      t = MAC_COEF_32_ARM(t, g11, ADD32(x1,x3));
117
      t = MAC_COEF_32_ARM(t, g12, ADD32(x0,x4));
118
      t = SATURATE(t, SIG_SAT);
119
      y[i] = t;
120
      x4=SHL32(x[i-T+3],1);
121
      t = MAC_COEF_32_ARM(x[i+1], g10, x1);
122
      t = MAC_COEF_32_ARM(t, g11, ADD32(x0,x2));
123
      t = MAC_COEF_32_ARM(t, g12, ADD32(x4,x3));
124
      t = SATURATE(t, SIG_SAT);
125
      y[i+1] = t;
126
      x3=SHL32(x[i-T+4],1);
127
      t = MAC_COEF_32_ARM(x[i+2], g10, x0);
128
      t = MAC_COEF_32_ARM(t, g11, ADD32(x4,x1));
129
      t = MAC_COEF_32_ARM(t, g12, ADD32(x3,x2));
130
      t = SATURATE(t, SIG_SAT);
131
      y[i+2] = t;
132
      x2=SHL32(x[i-T+5],1);
133
      t = MAC_COEF_32_ARM(x[i+3], g10, x4);
134
      t = MAC_COEF_32_ARM(t, g11, ADD32(x3,x0));
135
      t = MAC_COEF_32_ARM(t, g12, ADD32(x2,x1));
136
      t = SATURATE(t, SIG_SAT);
137
      y[i+3] = t;
138
      x1=SHL32(x[i-T+6],1);
139
      t = MAC_COEF_32_ARM(x[i+4], g10, x3);
140
      t = MAC_COEF_32_ARM(t, g11, ADD32(x2,x4));
141
      t = MAC_COEF_32_ARM(t, g12, ADD32(x1,x0));
142
      t = SATURATE(t, SIG_SAT);
143
      y[i+4] = t;
144
   }
145
#ifdef CUSTOM_MODES
146
   for (;i<N;i++)
147
   {
148
      opus_val32 t;
149
      x0=SHL32(x[i-T+2],1);
150
      t = MAC_COEF_32_ARM(x[i], g10, x2);
151
      t = MAC_COEF_32_ARM(t, g11, ADD32(x1,x3));
152
      t = MAC_COEF_32_ARM(t, g12, ADD32(x0,x4));
153
      t = SATURATE(t, SIG_SAT);
154
      y[i] = t;
155
      x4=x3;
156
      x3=x2;
157
      x2=x1;
158
      x1=x0;
159
   }
160
#endif
161
}
162
#else
163
#ifndef NON_STATIC_COMB_FILTER_CONST_C
164
static
165
#endif
166
void comb_filter_const_c(opus_val32 *y, opus_val32 *x, int T, int N,
167
      celt_coef g10, celt_coef g11, celt_coef g12)
168
767k
{
169
767k
   opus_val32 x0, x1, x2, x3, x4;
170
767k
   int i;
171
767k
   x4 = x[-T-2];
172
767k
   x3 = x[-T-1];
173
767k
   x2 = x[-T];
174
767k
   x1 = x[-T+1];
175
438M
   for (i=0;i<N;i++)
176
438M
   {
177
438M
      x0=x[i-T+2];
178
438M
      y[i] = x[i]
179
438M
               + MULT_COEF_32(g10,x2)
180
438M
               + MULT_COEF_32(g11,ADD32(x1,x3))
181
438M
               + MULT_COEF_32(g12,ADD32(x0,x4));
182
438M
#ifdef FIXED_POINT
183
      /* A bit of bias seems to help here. */
184
438M
      y[i] = SUB32(y[i], 1);
185
438M
#endif
186
438M
      y[i] = SATURATE(y[i], SIG_SAT);
187
438M
      x4=x3;
188
438M
      x3=x2;
189
438M
      x2=x1;
190
438M
      x1=x0;
191
438M
   }
192
193
767k
}
194
#endif
195
#endif
196
197
#ifdef ENABLE_QEXT
198
void comb_filter_qext(opus_val32 *y, opus_val32 *x, int T0, int T1, int N,
199
      opus_val16 g0, opus_val16 g1, int tapset0, int tapset1,
200
      const celt_coef *window, int overlap, int arch)
201
{
202
   VARDECL(opus_val32, mem_buf);
203
   VARDECL(opus_val32, buf);
204
   celt_coef new_window[120];
205
   int s;
206
   int i;
207
   int N2;
208
   int overlap2;
209
   SAVE_STACK;
210
   /* Using ALLOC() instead of a regular stack allocation to minimize real stack use when using the pseudostack.
211
      This is useful on some embedded systems. */
212
   ALLOC(mem_buf, COMBFILTER_MAXPERIOD+960, opus_val32);
213
   ALLOC(buf, COMBFILTER_MAXPERIOD+960, opus_val32);
214
   N2 = N/2;
215
   overlap2=overlap/2;
216
   /* At 96 kHz, we double the period and the spacing between taps, which is equivalent
217
      to creating a mirror image of the filter around 24 kHz. It also means we can process
218
      the even and odd samples completely independently. */
219
   for (s=0;s<2;s++) {
220
      opus_val32 *yptr;
221
      for (i=0;i<overlap2;i++) new_window[i] = window[2*i+s];
222
      for (i=0;i<COMBFILTER_MAXPERIOD+N2;i++) mem_buf[i] = x[2*i+s-2*COMBFILTER_MAXPERIOD];
223
      if (x==y) {
224
         yptr = mem_buf+COMBFILTER_MAXPERIOD;
225
      } else {
226
         for (i=0;i<N2;i++) buf[i] = y[2*i+s];
227
         yptr = buf;
228
      }
229
      comb_filter(yptr, mem_buf+COMBFILTER_MAXPERIOD, T0, T1, N2, g0, g1, tapset0, tapset1, new_window, overlap2, arch);
230
      for (i=0;i<N2;i++) y[2*i+s] = yptr[i];
231
   }
232
   RESTORE_STACK;
233
   return;
234
}
235
#endif
236
237
#ifndef OVERRIDE_comb_filter
238
void comb_filter(opus_val32 *y, opus_val32 *x, int T0, int T1, int N,
239
      opus_val16 g0, opus_val16 g1, int tapset0, int tapset1,
240
      const celt_coef *window, int overlap, int arch)
241
66.7M
{
242
66.7M
   int i;
243
   /* printf ("%d %d %f %f\n", T0, T1, g0, g1); */
244
66.7M
   celt_coef g00, g01, g02, g10, g11, g12;
245
66.7M
   opus_val32 x0, x1, x2, x3, x4;
246
66.7M
   static const opus_val16 gains[3][3] = {
247
66.7M
         {QCONST16(0.3066406250f, 15), QCONST16(0.2170410156f, 15), QCONST16(0.1296386719f, 15)},
248
66.7M
         {QCONST16(0.4638671875f, 15), QCONST16(0.2680664062f, 15), QCONST16(0.f, 15)},
249
66.7M
         {QCONST16(0.7998046875f, 15), QCONST16(0.1000976562f, 15), QCONST16(0.f, 15)}};
250
#ifdef ENABLE_QEXT
251
   if (overlap==240) {
252
      comb_filter_qext(y, x, T0, T1, N, g0, g1, tapset0, tapset1, window, overlap, arch);
253
      return;
254
   }
255
#endif
256
66.7M
   if (g0==0 && g1==0)
257
66.0M
   {
258
      /* OPT: Happens to work without the OPUS_MOVE(), but only because the current encoder already copies x to y */
259
66.0M
      if (x!=y)
260
66.0M
         OPUS_MOVE(y, x, N);
261
66.0M
      return;
262
66.0M
   }
263
   /* When the gain is zero, T0 and/or T1 is set to zero. We need
264
      to have then be at least 2 to avoid processing garbage data. */
265
769k
   T0 = IMAX(T0, COMBFILTER_MINPERIOD);
266
769k
   T1 = IMAX(T1, COMBFILTER_MINPERIOD);
267
769k
   g00 = MULT_COEF_TAPS(g0, gains[tapset0][0]);
268
769k
   g01 = MULT_COEF_TAPS(g0, gains[tapset0][1]);
269
769k
   g02 = MULT_COEF_TAPS(g0, gains[tapset0][2]);
270
769k
   g10 = MULT_COEF_TAPS(g1, gains[tapset1][0]);
271
769k
   g11 = MULT_COEF_TAPS(g1, gains[tapset1][1]);
272
769k
   g12 = MULT_COEF_TAPS(g1, gains[tapset1][2]);
273
769k
   x1 = x[-T1+1];
274
769k
   x2 = x[-T1  ];
275
769k
   x3 = x[-T1-1];
276
769k
   x4 = x[-T1-2];
277
   /* If the filter didn't change, we don't need the overlap */
278
769k
   if (g0==g1 && T0==T1 && tapset0==tapset1)
279
215k
      overlap=0;
280
67.3M
   for (i=0;i<overlap;i++)
281
66.5M
   {
282
66.5M
      celt_coef f;
283
66.5M
      x0=x[i-T1+2];
284
66.5M
      f = MULT_COEF(window[i],window[i]);
285
66.5M
      y[i] = x[i]
286
66.5M
               + MULT_COEF_32(MULT_COEF((COEF_ONE-f),g00),x[i-T0])
287
66.5M
               + MULT_COEF_32(MULT_COEF((COEF_ONE-f),g01),ADD32(x[i-T0+1],x[i-T0-1]))
288
66.5M
               + MULT_COEF_32(MULT_COEF((COEF_ONE-f),g02),ADD32(x[i-T0+2],x[i-T0-2]))
289
66.5M
               + MULT_COEF_32(MULT_COEF(f,g10),x2)
290
66.5M
               + MULT_COEF_32(MULT_COEF(f,g11),ADD32(x1,x3))
291
66.5M
               + MULT_COEF_32(MULT_COEF(f,g12),ADD32(x0,x4));
292
66.5M
#ifdef FIXED_POINT
293
      /* A bit of bias seems to help here. */
294
66.5M
      y[i] = SUB32(y[i], 3);
295
66.5M
#endif
296
66.5M
      y[i] = SATURATE(y[i], SIG_SAT);
297
66.5M
      x4=x3;
298
66.5M
      x3=x2;
299
66.5M
      x2=x1;
300
66.5M
      x1=x0;
301
302
66.5M
   }
303
769k
   if (g1==0)
304
2.42k
   {
305
      /* OPT: Happens to work without the OPUS_MOVE(), but only because the current encoder already copies x to y */
306
2.42k
      if (x!=y)
307
2.42k
         OPUS_MOVE(y+overlap, x+overlap, N-overlap);
308
2.42k
      return;
309
2.42k
   }
310
311
   /* Compute the part with the constant filter. */
312
767k
   comb_filter_const(y+i, x+i, T1, N-i, g10, g11, g12, arch);
313
767k
}
314
#endif /* OVERRIDE_comb_filter */
315
316
/* TF change table. Positive values mean better frequency resolution (longer
317
   effective window), whereas negative values mean better time resolution
318
   (shorter effective window). The second index is computed as:
319
   4*isTransient + 2*tf_select + per_band_flag */
320
const signed char tf_select_table[4][8] = {
321
    /*isTransient=0     isTransient=1 */
322
      {0, -1, 0, -1,    0,-1, 0,-1}, /* 2.5 ms */
323
      {0, -1, 0, -2,    1, 0, 1,-1}, /* 5 ms */
324
      {0, -2, 0, -3,    2, 0, 1,-1}, /* 10 ms */
325
      {0, -2, 0, -3,    3, 0, 1,-1}, /* 20 ms */
326
};
327
328
329
void init_caps(const CELTMode *m,int *cap,int LM,int C)
330
43.2M
{
331
43.2M
   int i;
332
951M
   for (i=0;i<m->nbEBands;i++)
333
908M
   {
334
908M
      int N;
335
908M
      N=(m->eBands[i+1]-m->eBands[i])<<LM;
336
908M
      cap[i] = (m->cache.caps[m->nbEBands*(2*LM+C-1)+i]+64)*C*N>>2;
337
908M
   }
338
43.2M
}
339
340
341
342
const char *opus_strerror(int error)
343
0
{
344
0
   static const char * const error_strings[8] = {
345
0
      "success",
346
0
      "invalid argument",
347
0
      "buffer too small",
348
0
      "internal error",
349
0
      "corrupted stream",
350
0
      "request not implemented",
351
0
      "invalid state",
352
0
      "memory allocation failed"
353
0
   };
354
0
   if (error > 0 || error < -7)
355
0
      return "unknown error";
356
0
   else
357
0
      return error_strings[-error];
358
0
}
359
360
const char *opus_get_version_string(void)
361
0
{
362
0
    return "libopus " PACKAGE_VERSION
363
    /* Applications may rely on the presence of this substring in the version
364
       string to determine if they have a fixed-point or floating-point build
365
       at runtime. */
366
0
#ifdef FIXED_POINT
367
0
          "-fixed"
368
0
#endif
369
#ifdef FUZZING
370
          "-fuzzing"
371
#endif
372
0
          ;
373
0
}