/src/opus/celt/celt.c

Source
/* Copyright (c) 2007-2008 CSIRO
   Copyright (c) 2007-2010 Xiph.Org Foundation
   Copyright (c) 2008 Gregory Maxwell
   Written by Jean-Marc Valin and Gregory Maxwell */
/*
   Redistribution and use in source and binary forms, with or without
   modification, are permitted provided that the following conditions
   are met:

   - Redistributions of source code must retain the above copyright
   notice, this list of conditions and the following disclaimer.

   - Redistributions in binary form must reproduce the above copyright
   notice, this list of conditions and the following disclaimer in the
   documentation and/or other materials provided with the distribution.

   THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
   ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
   LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
   A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER
   OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
   EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
   PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
   PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
   LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
   NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
   SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
*/

#ifdef HAVE_CONFIG_H
#include "config.h"
#endif

#define CELT_C

#include "os_support.h"
#include "mdct.h"
#include <math.h>
#include "celt.h"
#include "pitch.h"
#include "bands.h"
#include "modes.h"
#include "entcode.h"
#include "quant_bands.h"
#include "rate.h"
#include "stack_alloc.h"
#include "mathops.h"
#include "float_cast.h"
#include <stdarg.h>
#include "celt_lpc.h"
#include "vq.h"

#ifndef PACKAGE_VERSION
#define PACKAGE_VERSION "unknown"
#endif

#if defined(FIXED_POINT) && defined(__mips)
#include "mips/celt_mipsr1.h"
#endif


int resampling_factor(opus_int32 rate)
{
   int ret;
   switch (rate)
   {
#ifdef ENABLE_QEXT
   case 96000:
#endif
   case 48000:
      ret = 1;
      break;
   case 24000:
      ret = 2;
      break;
   case 16000:
      ret = 3;
      break;
   case 12000:
      ret = 4;
      break;
   case 8000:
      ret = 6;
      break;
   default:
#ifndef CUSTOM_MODES
      celt_assert(0);
#endif
      ret = 0;
      break;
   }
   return ret;
}


#if !defined(OVERRIDE_COMB_FILTER_CONST) || defined(NON_STATIC_COMB_FILTER_CONST_C)
/* This version should be faster on ARM */
#ifdef OPUS_ARM_ASM
#ifndef NON_STATIC_COMB_FILTER_CONST_C
static
#endif
void comb_filter_const_c(opus_val32 *y, opus_val32 *x, int T, int N,
      celt_coef g10, celt_coef g11, celt_coef g12)
{
   opus_val32 x0, x1, x2, x3, x4;
   int i;
   x4 = SHL32(x[-T-2], 1);
   x3 = SHL32(x[-T-1], 1);
   x2 = SHL32(x[-T], 1);
   x1 = SHL32(x[-T+1], 1);
   for (i=0;i<N-4;i+=5)
   {
      opus_val32 t;
      x0=SHL32(x[i-T+2],1);
      t = MAC_COEF_32_ARM(x[i], g10, x2);
      t = MAC_COEF_32_ARM(t, g11, ADD32(x1,x3));
      t = MAC_COEF_32_ARM(t, g12, ADD32(x0,x4));
      t = SATURATE(t, SIG_SAT);
      y[i] = t;
      x4=SHL32(x[i-T+3],1);
      t = MAC_COEF_32_ARM(x[i+1], g10, x1);
      t = MAC_COEF_32_ARM(t, g11, ADD32(x0,x2));
      t = MAC_COEF_32_ARM(t, g12, ADD32(x4,x3));
      t = SATURATE(t, SIG_SAT);
      y[i+1] = t;
      x3=SHL32(x[i-T+4],1);
      t = MAC_COEF_32_ARM(x[i+2], g10, x0);
      t = MAC_COEF_32_ARM(t, g11, ADD32(x4,x1));
      t = MAC_COEF_32_ARM(t, g12, ADD32(x3,x2));
      t = SATURATE(t, SIG_SAT);
      y[i+2] = t;
      x2=SHL32(x[i-T+5],1);
      t = MAC_COEF_32_ARM(x[i+3], g10, x4);
      t = MAC_COEF_32_ARM(t, g11, ADD32(x3,x0));
      t = MAC_COEF_32_ARM(t, g12, ADD32(x2,x1));
      t = SATURATE(t, SIG_SAT);
      y[i+3] = t;
      x1=SHL32(x[i-T+6],1);
      t = MAC_COEF_32_ARM(x[i+4], g10, x3);
      t = MAC_COEF_32_ARM(t, g11, ADD32(x2,x4));
      t = MAC_COEF_32_ARM(t, g12, ADD32(x1,x0));
      t = SATURATE(t, SIG_SAT);
      y[i+4] = t;
   }
#ifdef CUSTOM_MODES
   for (;i<N;i++)
   {
      opus_val32 t;
      x0=SHL32(x[i-T+2],1);
      t = MAC_COEF_32_ARM(x[i], g10, x2);
      t = MAC_COEF_32_ARM(t, g11, ADD32(x1,x3));
      t = MAC_COEF_32_ARM(t, g12, ADD32(x0,x4));
      t = SATURATE(t, SIG_SAT);
      y[i] = t;
      x4=x3;
      x3=x2;
      x2=x1;
      x1=x0;
   }
#endif
}
#else
#ifndef NON_STATIC_COMB_FILTER_CONST_C
static
#endif
void comb_filter_const_c(opus_val32 *y, opus_val32 *x, int T, int N,
      celt_coef g10, celt_coef g11, celt_coef g12)
{
   opus_val32 x0, x1, x2, x3, x4;
   int i;
   x4 = x[-T-2];
   x3 = x[-T-1];
   x2 = x[-T];
   x1 = x[-T+1];
   for (i=0;i<N;i++)
   {
      x0=x[i-T+2];
      y[i] = x[i]
               + MULT_COEF_32(g10,x2)
               + MULT_COEF_32(g11,ADD32(x1,x3))
               + MULT_COEF_32(g12,ADD32(x0,x4));
#ifdef FIXED_POINT
      /* A bit of bias seems to help here. */
      y[i] = SUB32(y[i], 1);
#endif
      y[i] = SATURATE(y[i], SIG_SAT);
      x4=x3;
      x3=x2;
      x2=x1;
      x1=x0;
   }

}
#endif
#endif

#ifdef ENABLE_QEXT
void comb_filter_qext(opus_val32 *y, opus_val32 *x, int T0, int T1, int N,
      opus_val16 g0, opus_val16 g1, int tapset0, int tapset1,
      const celt_coef *window, int overlap, int arch)
{
   VARDECL(opus_val32, mem_buf);
   VARDECL(opus_val32, buf);
   celt_coef new_window[120];
   int s;
   int i;
   int N2;
   int overlap2;
   SAVE_STACK;
   /* Using ALLOC() instead of a regular stack allocation to minimize real stack use when using the pseudostack.
      This is useful on some embedded systems. */
   ALLOC(mem_buf, COMBFILTER_MAXPERIOD+960, opus_val32);
   ALLOC(buf, COMBFILTER_MAXPERIOD+960, opus_val32);
   N2 = N/2;
   overlap2=overlap/2;
   /* At 96 kHz, we double the period and the spacing between taps, which is equivalent
      to creating a mirror image of the filter around 24 kHz. It also means we can process
      the even and odd samples completely independently. */
   for (s=0;s<2;s++) {
      opus_val32 *yptr;
      for (i=0;i<overlap2;i++) new_window[i] = window[2*i+s];
      for (i=0;i<COMBFILTER_MAXPERIOD+N2;i++) mem_buf[i] = x[2*i+s-2*COMBFILTER_MAXPERIOD];
      if (x==y) {
         yptr = mem_buf+COMBFILTER_MAXPERIOD;
      } else {
         for (i=0;i<N2;i++) buf[i] = y[2*i+s];
         yptr = buf;
      }
      comb_filter(yptr, mem_buf+COMBFILTER_MAXPERIOD, T0, T1, N2, g0, g1, tapset0, tapset1, new_window, overlap2, arch);
      for (i=0;i<N2;i++) y[2*i+s] = yptr[i];
   }
   RESTORE_STACK;
   return;
}
#endif

#ifndef OVERRIDE_comb_filter
void comb_filter(opus_val32 *y, opus_val32 *x, int T0, int T1, int N,
      opus_val16 g0, opus_val16 g1, int tapset0, int tapset1,
      const celt_coef *window, int overlap, int arch)
{
   int i;
   /* printf ("%d %d %f %f\n", T0, T1, g0, g1); */
   celt_coef g00, g01, g02, g10, g11, g12;
   opus_val32 x0, x1, x2, x3, x4;
   static const opus_val16 gains[3][3] = {
         {QCONST16(0.3066406250f, 15), QCONST16(0.2170410156f, 15), QCONST16(0.1296386719f, 15)},
         {QCONST16(0.4638671875f, 15), QCONST16(0.2680664062f, 15), QCONST16(0.f, 15)},
         {QCONST16(0.7998046875f, 15), QCONST16(0.1000976562f, 15), QCONST16(0.f, 15)}};
#ifdef ENABLE_QEXT
   if (overlap==240) {
      comb_filter_qext(y, x, T0, T1, N, g0, g1, tapset0, tapset1, window, overlap, arch);
      return;
   }
#endif
   if (g0==0 && g1==0)
   {
      /* OPT: Happens to work without the OPUS_MOVE(), but only because the current encoder already copies x to y */
      if (x!=y)
         OPUS_MOVE(y, x, N);
      return;
   }
   /* When the gain is zero, T0 and/or T1 is set to zero. We need
      to have then be at least 2 to avoid processing garbage data. */
   T0 = IMAX(T0, COMBFILTER_MINPERIOD);
   T1 = IMAX(T1, COMBFILTER_MINPERIOD);
   g00 = MULT_COEF_TAPS(g0, gains[tapset0][0]);
   g01 = MULT_COEF_TAPS(g0, gains[tapset0][1]);
   g02 = MULT_COEF_TAPS(g0, gains[tapset0][2]);
   g10 = MULT_COEF_TAPS(g1, gains[tapset1][0]);
   g11 = MULT_COEF_TAPS(g1, gains[tapset1][1]);
   g12 = MULT_COEF_TAPS(g1, gains[tapset1][2]);
   x1 = x[-T1+1];
   x2 = x[-T1  ];
   x3 = x[-T1-1];
   x4 = x[-T1-2];
   /* If the filter didn't change, we don't need the overlap */
   if (g0==g1 && T0==T1 && tapset0==tapset1)
      overlap=0;
   for (i=0;i<overlap;i++)
   {
      celt_coef f;
      x0=x[i-T1+2];
      f = MULT_COEF(window[i],window[i]);
      y[i] = x[i]
               + MULT_COEF_32(MULT_COEF((COEF_ONE-f),g00),x[i-T0])
               + MULT_COEF_32(MULT_COEF((COEF_ONE-f),g01),ADD32(x[i-T0+1],x[i-T0-1]))
               + MULT_COEF_32(MULT_COEF((COEF_ONE-f),g02),ADD32(x[i-T0+2],x[i-T0-2]))
               + MULT_COEF_32(MULT_COEF(f,g10),x2)
               + MULT_COEF_32(MULT_COEF(f,g11),ADD32(x1,x3))
               + MULT_COEF_32(MULT_COEF(f,g12),ADD32(x0,x4));
#ifdef FIXED_POINT
      /* A bit of bias seems to help here. */
      y[i] = SUB32(y[i], 3);
#endif
      y[i] = SATURATE(y[i], SIG_SAT);
      x4=x3;
      x3=x2;
      x2=x1;
      x1=x0;

   }
   if (g1==0)
   {
      /* OPT: Happens to work without the OPUS_MOVE(), but only because the current encoder already copies x to y */
      if (x!=y)
         OPUS_MOVE(y+overlap, x+overlap, N-overlap);
      return;
   }

   /* Compute the part with the constant filter. */
   comb_filter_const(y+i, x+i, T1, N-i, g10, g11, g12, arch);
}
#endif /* OVERRIDE_comb_filter */

/* TF change table. Positive values mean better frequency resolution (longer
   effective window), whereas negative values mean better time resolution
   (shorter effective window). The second index is computed as:
   4*isTransient + 2*tf_select + per_band_flag */
const signed char tf_select_table[4][8] = {
    /*isTransient=0     isTransient=1 */
      {0, -1, 0, -1,    0,-1, 0,-1}, /* 2.5 ms */
      {0, -1, 0, -2,    1, 0, 1,-1}, /* 5 ms */
      {0, -2, 0, -3,    2, 0, 1,-1}, /* 10 ms */
      {0, -2, 0, -3,    3, 0, 1,-1}, /* 20 ms */
};


void init_caps(const CELTMode *m,int *cap,int LM,int C)
{
   int i;
   for (i=0;i<m->nbEBands;i++)
   {
      int N;
      N=(m->eBands[i+1]-m->eBands[i])<<LM;
      cap[i] = (m->cache.caps[m->nbEBands*(2*LM+C-1)+i]+64)*C*N>>2;
   }
}



const char *opus_strerror(int error)
{
   static const char * const error_strings[8] = {
      "success",
      "invalid argument",
      "buffer too small",
      "internal error",
      "corrupted stream",
      "request not implemented",
      "invalid state",
      "memory allocation failed"
   };
   if (error > 0 || error < -7)
      return "unknown error";
   else
      return error_strings[-error];
}

const char *opus_get_version_string(void)
{
    return "libopus " PACKAGE_VERSION
    /* Applications may rely on the presence of this substring in the version
       string to determine if they have a fixed-point or floating-point build
       at runtime. */
#ifdef FIXED_POINT
          "-fixed"
#endif
#ifdef FUZZING
          "-fuzzing"
#endif
          ;
}

Coverage Report

Created: 2025-12-31 07:57

Line	Count	Source
1		/* Copyright (c) 2007-2008 CSIRO
2		Copyright (c) 2007-2010 Xiph.Org Foundation
3		Copyright (c) 2008 Gregory Maxwell
4		Written by Jean-Marc Valin and Gregory Maxwell */
5		/*
6		Redistribution and use in source and binary forms, with or without
7		modification, are permitted provided that the following conditions
8		are met:
9
10		- Redistributions of source code must retain the above copyright
11		notice, this list of conditions and the following disclaimer.
12
13		- Redistributions in binary form must reproduce the above copyright
14		notice, this list of conditions and the following disclaimer in the
15		documentation and/or other materials provided with the distribution.
16
17		THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
18		``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
19		LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
20		A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER
21		OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
22		EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
23		PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
24		PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
25		LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
26		NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
27		SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
28		*/
29
30		#ifdef HAVE_CONFIG_H
31		#include "config.h"
32		#endif
33
34		#define CELT_C
35
36		#include "os_support.h"
37		#include "mdct.h"
38		#include <math.h>
39		#include "celt.h"
40		#include "pitch.h"
41		#include "bands.h"
42		#include "modes.h"
43		#include "entcode.h"
44		#include "quant_bands.h"
45		#include "rate.h"
46		#include "stack_alloc.h"
47		#include "mathops.h"
48		#include "float_cast.h"
49		#include <stdarg.h>
50		#include "celt_lpc.h"
51		#include "vq.h"
52
53		#ifndef PACKAGE_VERSION
54		#define PACKAGE_VERSION "unknown"
55		#endif
56
57		#if defined(FIXED_POINT) && defined(__mips)
58		#include "mips/celt_mipsr1.h"
59		#endif
60
61
62		int resampling_factor(opus_int32 rate)
63	60.8k	{
64	60.8k	int ret;
65	60.8k	switch (rate)
66	60.8k	{
67		#ifdef ENABLE_QEXT
68		case 96000:
69		#endif
70	60.8k	case 48000:
71	60.8k	ret = 1;
72	60.8k	break;
73	0	case 24000:
74	0	ret = 2;
75	0	break;
76	0	case 16000:
77	0	ret = 3;
78	0	break;
79	0	case 12000:
80	0	ret = 4;
81	0	break;
82	0	case 8000:
83	0	ret = 6;
84	0	break;
85	0	default:
86	0	#ifndef CUSTOM_MODES
87	0	celt_assert(0);
88	0	#endif
89	0	ret = 0;
90	0	break;
91	60.8k	}
92	60.8k	return ret;
93	60.8k	}
94
95
96		#if !defined(OVERRIDE_COMB_FILTER_CONST) \|\| defined(NON_STATIC_COMB_FILTER_CONST_C)
97		/* This version should be faster on ARM */
98		#ifdef OPUS_ARM_ASM
99		#ifndef NON_STATIC_COMB_FILTER_CONST_C
100		static
101		#endif
102		void comb_filter_const_c(opus_val32 y, opus_val32 x, int T, int N,
103		celt_coef g10, celt_coef g11, celt_coef g12)
104		{
105		opus_val32 x0, x1, x2, x3, x4;
106		int i;
107		x4 = SHL32(x[-T-2], 1);
108		x3 = SHL32(x[-T-1], 1);
109		x2 = SHL32(x[-T], 1);
110		x1 = SHL32(x[-T+1], 1);
111		for (i=0;i<N-4;i+=5)
112		{
113		opus_val32 t;
114		x0=SHL32(x[i-T+2],1);
115		t = MAC_COEF_32_ARM(x[i], g10, x2);
116		t = MAC_COEF_32_ARM(t, g11, ADD32(x1,x3));
117		t = MAC_COEF_32_ARM(t, g12, ADD32(x0,x4));
118		t = SATURATE(t, SIG_SAT);
119		y[i] = t;
120		x4=SHL32(x[i-T+3],1);
121		t = MAC_COEF_32_ARM(x[i+1], g10, x1);
122		t = MAC_COEF_32_ARM(t, g11, ADD32(x0,x2));
123		t = MAC_COEF_32_ARM(t, g12, ADD32(x4,x3));
124		t = SATURATE(t, SIG_SAT);
125		y[i+1] = t;
126		x3=SHL32(x[i-T+4],1);
127		t = MAC_COEF_32_ARM(x[i+2], g10, x0);
128		t = MAC_COEF_32_ARM(t, g11, ADD32(x4,x1));
129		t = MAC_COEF_32_ARM(t, g12, ADD32(x3,x2));
130		t = SATURATE(t, SIG_SAT);
131		y[i+2] = t;
132		x2=SHL32(x[i-T+5],1);
133		t = MAC_COEF_32_ARM(x[i+3], g10, x4);
134		t = MAC_COEF_32_ARM(t, g11, ADD32(x3,x0));
135		t = MAC_COEF_32_ARM(t, g12, ADD32(x2,x1));
136		t = SATURATE(t, SIG_SAT);
137		y[i+3] = t;
138		x1=SHL32(x[i-T+6],1);
139		t = MAC_COEF_32_ARM(x[i+4], g10, x3);
140		t = MAC_COEF_32_ARM(t, g11, ADD32(x2,x4));
141		t = MAC_COEF_32_ARM(t, g12, ADD32(x1,x0));
142		t = SATURATE(t, SIG_SAT);
143		y[i+4] = t;
144		}
145		#ifdef CUSTOM_MODES
146		for (;i<N;i++)
147		{
148		opus_val32 t;
149		x0=SHL32(x[i-T+2],1);
150		t = MAC_COEF_32_ARM(x[i], g10, x2);
151		t = MAC_COEF_32_ARM(t, g11, ADD32(x1,x3));
152		t = MAC_COEF_32_ARM(t, g12, ADD32(x0,x4));
153		t = SATURATE(t, SIG_SAT);
154		y[i] = t;
155		x4=x3;
156		x3=x2;
157		x2=x1;
158		x1=x0;
159		}
160		#endif
161		}
162		#else
163		#ifndef NON_STATIC_COMB_FILTER_CONST_C
164		static
165		#endif
166		void comb_filter_const_c(opus_val32 y, opus_val32 x, int T, int N,
167		celt_coef g10, celt_coef g11, celt_coef g12)
168		{
169		opus_val32 x0, x1, x2, x3, x4;
170		int i;
171		x4 = x[-T-2];
172		x3 = x[-T-1];
173		x2 = x[-T];
174		x1 = x[-T+1];
175		for (i=0;i<N;i++)
176		{
177		x0=x[i-T+2];
178		y[i] = x[i]
179		+ MULT_COEF_32(g10,x2)
180		+ MULT_COEF_32(g11,ADD32(x1,x3))
181		+ MULT_COEF_32(g12,ADD32(x0,x4));
182		#ifdef FIXED_POINT
183		/* A bit of bias seems to help here. */
184		y[i] = SUB32(y[i], 1);
185		#endif
186		y[i] = SATURATE(y[i], SIG_SAT);
187		x4=x3;
188		x3=x2;
189		x2=x1;
190		x1=x0;
191		}
192
193		}
194		#endif
195		#endif
196
197		#ifdef ENABLE_QEXT
198		void comb_filter_qext(opus_val32 y, opus_val32 x, int T0, int T1, int N,
199		opus_val16 g0, opus_val16 g1, int tapset0, int tapset1,
200		const celt_coef *window, int overlap, int arch)
201		{
202		VARDECL(opus_val32, mem_buf);
203		VARDECL(opus_val32, buf);
204		celt_coef new_window[120];
205		int s;
206		int i;
207		int N2;
208		int overlap2;
209		SAVE_STACK;
210		/* Using ALLOC() instead of a regular stack allocation to minimize real stack use when using the pseudostack.
211		This is useful on some embedded systems. */
212		ALLOC(mem_buf, COMBFILTER_MAXPERIOD+960, opus_val32);
213		ALLOC(buf, COMBFILTER_MAXPERIOD+960, opus_val32);
214		N2 = N/2;
215		overlap2=overlap/2;
216		/* At 96 kHz, we double the period and the spacing between taps, which is equivalent
217		to creating a mirror image of the filter around 24 kHz. It also means we can process
218		the even and odd samples completely independently. */
219		for (s=0;s<2;s++) {
220		opus_val32 *yptr;
221		for (i=0;i<overlap2;i++) new_window[i] = window[2*i+s];
222		for (i=0;i<COMBFILTER_MAXPERIOD+N2;i++) mem_buf[i] = x[2i+s-2COMBFILTER_MAXPERIOD];
223		if (x==y) {
224		yptr = mem_buf+COMBFILTER_MAXPERIOD;
225		} else {
226		for (i=0;i<N2;i++) buf[i] = y[2*i+s];
227		yptr = buf;
228		}
229		comb_filter(yptr, mem_buf+COMBFILTER_MAXPERIOD, T0, T1, N2, g0, g1, tapset0, tapset1, new_window, overlap2, arch);
230		for (i=0;i<N2;i++) y[2*i+s] = yptr[i];
231		}
232		RESTORE_STACK;
233		return;
234		}
235		#endif
236
237		#ifndef OVERRIDE_comb_filter
238		void comb_filter(opus_val32 y, opus_val32 x, int T0, int T1, int N,
239		opus_val16 g0, opus_val16 g1, int tapset0, int tapset1,
240		const celt_coef *window, int overlap, int arch)
241	689k	{
242	689k	int i;
243		/* printf ("%d %d %f %f\n", T0, T1, g0, g1); */
244	689k	celt_coef g00, g01, g02, g10, g11, g12;
245	689k	opus_val32 x0, x1, x2, x3, x4;
246	689k	static const opus_val16 gains[3][3] = {
247	689k	{QCONST16(0.3066406250f, 15), QCONST16(0.2170410156f, 15), QCONST16(0.1296386719f, 15)},
248	689k	{QCONST16(0.4638671875f, 15), QCONST16(0.2680664062f, 15), QCONST16(0.f, 15)},
249	689k	{QCONST16(0.7998046875f, 15), QCONST16(0.1000976562f, 15), QCONST16(0.f, 15)}};
250		#ifdef ENABLE_QEXT
251		if (overlap==240) {
252		comb_filter_qext(y, x, T0, T1, N, g0, g1, tapset0, tapset1, window, overlap, arch);
253		return;
254		}
255		#endif
256	689k	if (g0==0 && g1==0)
257	617k	{
258		/* OPT: Happens to work without the OPUS_MOVE(), but only because the current encoder already copies x to y */
259	617k	if (x!=y)
260	19.3k	OPUS_MOVE(y, x, N);
261	617k	return;
262	617k	}
263		/* When the gain is zero, T0 and/or T1 is set to zero. We need
264		to have then be at least 2 to avoid processing garbage data. */
265	71.9k	T0 = IMAX(T0, COMBFILTER_MINPERIOD);
266	71.9k	T1 = IMAX(T1, COMBFILTER_MINPERIOD);
267	71.9k	g00 = MULT_COEF_TAPS(g0, gains[tapset0][0]);
268	71.9k	g01 = MULT_COEF_TAPS(g0, gains[tapset0][1]);
269	71.9k	g02 = MULT_COEF_TAPS(g0, gains[tapset0][2]);
270	71.9k	g10 = MULT_COEF_TAPS(g1, gains[tapset1][0]);
271	71.9k	g11 = MULT_COEF_TAPS(g1, gains[tapset1][1]);
272	71.9k	g12 = MULT_COEF_TAPS(g1, gains[tapset1][2]);
273	71.9k	x1 = x[-T1+1];
274	71.9k	x2 = x[-T1 ];
275	71.9k	x3 = x[-T1-1];
276	71.9k	x4 = x[-T1-2];
277		/* If the filter didn't change, we don't need the overlap */
278	71.9k	if (g0==g1 && T0==T1 && tapset0==tapset1)
279	34.3k	overlap=0;
280	4.50M	for (i=0;i<overlap;i++)
281	4.43M	{
282	4.43M	celt_coef f;
283	4.43M	x0=x[i-T1+2];
284	4.43M	f = MULT_COEF(window[i],window[i]);
285	4.43M	y[i] = x[i]
286	4.43M	+ MULT_COEF_32(MULT_COEF((COEF_ONE-f),g00),x[i-T0])
287	4.43M	+ MULT_COEF_32(MULT_COEF((COEF_ONE-f),g01),ADD32(x[i-T0+1],x[i-T0-1]))
288	4.43M	+ MULT_COEF_32(MULT_COEF((COEF_ONE-f),g02),ADD32(x[i-T0+2],x[i-T0-2]))
289	4.43M	+ MULT_COEF_32(MULT_COEF(f,g10),x2)
290	4.43M	+ MULT_COEF_32(MULT_COEF(f,g11),ADD32(x1,x3))
291	4.43M	+ MULT_COEF_32(MULT_COEF(f,g12),ADD32(x0,x4));
292		#ifdef FIXED_POINT
293		/* A bit of bias seems to help here. */
294		y[i] = SUB32(y[i], 3);
295		#endif
296	4.43M	y[i] = SATURATE(y[i], SIG_SAT);
297	4.43M	x4=x3;
298	4.43M	x3=x2;
299	4.43M	x2=x1;
300	4.43M	x1=x0;
301
302	4.43M	}
303	71.9k	if (g1==0)
304	10.4k	{
305		/* OPT: Happens to work without the OPUS_MOVE(), but only because the current encoder already copies x to y */
306	10.4k	if (x!=y)
307	405	OPUS_MOVE(y+overlap, x+overlap, N-overlap);
308	10.4k	return;
309	10.4k	}
310
311		/* Compute the part with the constant filter. */
312	61.5k	comb_filter_const(y+i, x+i, T1, N-i, g10, g11, g12, arch);
313	61.5k	}
314		#endif /* OVERRIDE_comb_filter */
315
316		/* TF change table. Positive values mean better frequency resolution (longer
317		effective window), whereas negative values mean better time resolution
318		(shorter effective window). The second index is computed as:
319		4isTransient + 2tf_select + per_band_flag */
320		const signed char tf_select_table[4][8] = {
321		/isTransient=0 isTransient=1 /
322		{0, -1, 0, -1, 0,-1, 0,-1}, /* 2.5 ms */
323		{0, -1, 0, -2, 1, 0, 1,-1}, /* 5 ms */
324		{0, -2, 0, -3, 2, 0, 1,-1}, /* 10 ms */
325		{0, -2, 0, -3, 3, 0, 1,-1}, /* 20 ms */
326		};
327
328
329		void init_caps(const CELTMode m,int cap,int LM,int C)
330	107k	{
331	107k	int i;
332	2.37M	for (i=0;i<m->nbEBands;i++)
333	2.26M	{
334	2.26M	int N;
335	2.26M	N=(m->eBands[i+1]-m->eBands[i])<<LM;
336	2.26M	cap[i] = (m->cache.caps[m->nbEBands(2LM+C-1)+i]+64)CN>>2;
337	2.26M	}
338	107k	}
339
340
341
342		const char *opus_strerror(int error)
343	78.7k	{
344	78.7k	static const char * const error_strings[8] = {
345	78.7k	"success",
346	78.7k	"invalid argument",
347	78.7k	"buffer too small",
348	78.7k	"internal error",
349	78.7k	"corrupted stream",
350	78.7k	"request not implemented",
351	78.7k	"invalid state",
352	78.7k	"memory allocation failed"
353	78.7k	};
354	78.7k	if (error > 0 \|\| error < -7)
355	0	return "unknown error";
356	78.7k	else
357	78.7k	return error_strings[-error];
358	78.7k	}
359
360		const char *opus_get_version_string(void)
361	0	{
362	0	return "libopus " PACKAGE_VERSION
363		/* Applications may rely on the presence of this substring in the version
364		string to determine if they have a fixed-point or floating-point build
365		at runtime. */
366		#ifdef FIXED_POINT
367		"-fixed"
368		#endif
369		#ifdef FUZZING
370		"-fuzzing"
371		#endif
372	0	;
373	0	}