Coverage Report

Created: 2025-08-29 06:24

/src/speex/libspeex/stereo.c
Line
Count
Source (jump to first uncovered line)
1
/* Copyright (C) 2002 Jean-Marc Valin
2
   File: stereo.c
3
4
   Redistribution and use in source and binary forms, with or without
5
   modification, are permitted provided that the following conditions
6
   are met:
7
8
   - Redistributions of source code must retain the above copyright
9
   notice, this list of conditions and the following disclaimer.
10
11
   - Redistributions in binary form must reproduce the above copyright
12
   notice, this list of conditions and the following disclaimer in the
13
   documentation and/or other materials provided with the distribution.
14
15
   - Neither the name of the Xiph.org Foundation nor the names of its
16
   contributors may be used to endorse or promote products derived from
17
   this software without specific prior written permission.
18
19
   THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
20
   ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
21
   LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
22
   A PARTICULAR PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR
23
   CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
24
   EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
25
   PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
26
   PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
27
   LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
28
   NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
29
   SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
30
*/
31
32
#ifdef HAVE_CONFIG_H
33
#include "config.h"
34
#endif
35
36
#include "speex/speex_stereo.h"
37
#include "speex/speex_callbacks.h"
38
#include "math_approx.h"
39
#include "vq.h"
40
#include <math.h>
41
#include "os_support.h"
42
43
typedef struct RealSpeexStereoState {
44
   spx_word32_t balance;      /**< Left/right balance info */
45
   spx_word32_t e_ratio;      /**< Ratio of energies: E(left+right)/[E(left)+E(right)]  */
46
   spx_word32_t smooth_left;  /**< Smoothed left channel gain */
47
   spx_word32_t smooth_right; /**< Smoothed right channel gain */
48
   spx_uint32_t reserved1;     /**< Reserved for future use */
49
   spx_int32_t reserved2;     /**< Reserved for future use */
50
} RealSpeexStereoState;
51
52
53
/*float e_ratio_quant[4] = {1, 1.26, 1.587, 2};*/
54
#ifndef FIXED_POINT
55
static const float e_ratio_quant[4] = {.25f, .315f, .397f, .5f};
56
static const float e_ratio_quant_bounds[3] = {0.2825f, 0.356f, 0.4485f};
57
#else
58
static const spx_word16_t e_ratio_quant[4] = {8192, 10332, 13009, 16384};
59
static const spx_word16_t e_ratio_quant_bounds[3] = {9257, 11665, 14696};
60
static const spx_word16_t balance_bounds[31] = {18, 23, 30, 38, 49, 63,  81, 104,
61
   134, 172, 221,  284, 364, 468, 600, 771,
62
   990, 1271, 1632, 2096, 2691, 3455, 4436, 5696,
63
   7314, 9392, 12059, 15484, 19882, 25529, 32766};
64
#endif
65
66
/* This is an ugly compatibility hack that properly resets the stereo state
67
   In case it it compiled in fixed-point, but initialised with the deprecated
68
   floating point static initialiser */
69
#ifdef FIXED_POINT
70
6.61k
#define COMPATIBILITY_HACK(s) do {if ((s)->reserved1 != 0xdeadbeef) speex_stereo_state_reset((SpeexStereoState*)s); } while (0);
71
#else
72
#define COMPATIBILITY_HACK(s)
73
#endif
74
75
EXPORT SpeexStereoState *speex_stereo_state_init()
76
0
{
77
0
   SpeexStereoState *stereo = speex_alloc(sizeof(SpeexStereoState));
78
0
   speex_stereo_state_reset(stereo);
79
0
   return stereo;
80
0
}
81
82
EXPORT void speex_stereo_state_reset(SpeexStereoState *_stereo)
83
487
{
84
487
   RealSpeexStereoState *stereo = (RealSpeexStereoState*)_stereo;
85
487
#ifdef FIXED_POINT
86
487
   stereo->balance = 65536;
87
487
   stereo->e_ratio = 16384;
88
487
   stereo->smooth_left = 16384;
89
487
   stereo->smooth_right = 16384;
90
487
   stereo->reserved1 = 0xdeadbeef;
91
487
   stereo->reserved2 = 0;
92
#else
93
   stereo->balance = 1.0f;
94
   stereo->e_ratio = .5f;
95
   stereo->smooth_left = 1.f;
96
   stereo->smooth_right = 1.f;
97
   stereo->reserved1 = 0;
98
   stereo->reserved2 = 0;
99
#endif
100
487
}
101
102
EXPORT void speex_stereo_state_destroy(SpeexStereoState *stereo)
103
0
{
104
0
   speex_free(stereo);
105
0
}
106
107
#ifndef DISABLE_ENCODER
108
#ifndef DISABLE_FLOAT_API
109
EXPORT void speex_encode_stereo(float *data, int frame_size, SpeexBits *bits)
110
0
{
111
0
   int i, tmp;
112
0
   float e_left=0, e_right=0, e_tot=0;
113
0
   float balance, e_ratio;
114
0
   for (i=0;i<frame_size;i++)
115
0
   {
116
0
      e_left  += ((float)data[2*i])*data[2*i];
117
0
      e_right += ((float)data[2*i+1])*data[2*i+1];
118
0
      data[i] =  .5*(((float)data[2*i])+data[2*i+1]);
119
0
      e_tot   += ((float)data[i])*data[i];
120
0
   }
121
0
   balance=(e_left+1)/(e_right+1);
122
0
   e_ratio = e_tot/(1+e_left+e_right);
123
124
   /*Quantization*/
125
0
   speex_bits_pack(bits, 14, 5);
126
0
   speex_bits_pack(bits, SPEEX_INBAND_STEREO, 4);
127
128
0
   balance=4*log(balance);
129
130
   /*Pack sign*/
131
0
   if (balance>0)
132
0
      speex_bits_pack(bits, 0, 1);
133
0
   else
134
0
      speex_bits_pack(bits, 1, 1);
135
0
   balance=floor(.5+fabs(balance));
136
0
   if (balance>30)
137
0
      balance=31;
138
139
0
   speex_bits_pack(bits, (int)balance, 5);
140
141
   /* FIXME: this is a hack */
142
0
   tmp=scal_quant(e_ratio*Q15_ONE, e_ratio_quant_bounds, 4);
143
0
   speex_bits_pack(bits, tmp, 2);
144
0
}
145
#endif /* #ifndef DISABLE_FLOAT_API */
146
147
EXPORT void speex_encode_stereo_int(spx_int16_t *data, int frame_size, SpeexBits *bits)
148
0
{
149
0
   int i, tmp;
150
0
   spx_word32_t e_left=0, e_right=0, e_tot=0;
151
0
   spx_word32_t balance, e_ratio;
152
0
   spx_word32_t largest, smallest;
153
0
   int balance_id;
154
0
#ifdef FIXED_POINT
155
0
   int shift;
156
0
   int sqr_shift;
157
158
   /* Avoid overflows when summing squares */
159
0
   sqr_shift = frame_size >= 512 ? 9 : 8;
160
0
#endif
161
162
   /* In band marker */
163
0
   speex_bits_pack(bits, 14, 5);
164
   /* Stereo marker */
165
0
   speex_bits_pack(bits, SPEEX_INBAND_STEREO, 4);
166
167
0
   for (i=0;i<frame_size;i++)
168
0
   {
169
0
      e_left  += SHR32(MULT16_16(data[2*i],data[2*i]),sqr_shift);
170
0
      e_right += SHR32(MULT16_16(data[2*i+1],data[2*i+1]),sqr_shift);
171
0
#ifdef FIXED_POINT
172
      /* I think this is actually unbiased */
173
0
      data[i] =  SHR16(data[2*i],1)+PSHR16(data[2*i+1],1);
174
#else
175
      data[i] =  .5*(((float)data[2*i])+data[2*i+1]);
176
#endif
177
0
      e_tot   += SHR32(MULT16_16(data[i],data[i]),sqr_shift);
178
0
   }
179
0
   if (e_left > e_right)
180
0
   {
181
0
      speex_bits_pack(bits, 0, 1);
182
0
      largest = e_left;
183
0
      smallest = e_right;
184
0
   } else {
185
0
      speex_bits_pack(bits, 1, 1);
186
0
      largest = e_right;
187
0
      smallest = e_left;
188
0
   }
189
190
   /* Balance quantization */
191
0
#ifdef FIXED_POINT
192
0
   shift = spx_ilog2(largest)-15;
193
0
   largest = VSHR32(largest, shift-4);
194
0
   smallest = VSHR32(smallest, shift);
195
0
   balance = DIV32(largest, ADD32(smallest, 1));
196
0
   if (balance > 32767)
197
0
      balance = 32767;
198
0
   balance_id = scal_quant(EXTRACT16(balance), balance_bounds, 32);
199
#else
200
   balance=(largest+1.)/(smallest+1.);
201
   balance=4*log(balance);
202
   balance_id=floor(.5+fabs(balance));
203
   if (balance_id>30)
204
      balance_id=31;
205
#endif
206
207
0
   speex_bits_pack(bits, balance_id, 5);
208
209
   /* "coherence" quantisation */
210
0
#ifdef FIXED_POINT
211
0
   shift = spx_ilog2(e_tot);
212
0
   e_tot = VSHR32(e_tot, shift-25);
213
0
   e_left = VSHR32(e_left, shift-10);
214
0
   e_right = VSHR32(e_right, shift-10);
215
0
   e_ratio = DIV32(e_tot, e_left+e_right+1);
216
#else
217
   e_ratio = e_tot/(1.+e_left+e_right);
218
#endif
219
220
0
   tmp=scal_quant(EXTRACT16(e_ratio), e_ratio_quant_bounds, 4);
221
   /*fprintf (stderr, "%d %d %d %d\n", largest, smallest, balance_id, e_ratio);*/
222
0
   speex_bits_pack(bits, tmp, 2);
223
0
}
224
#else /* DISABLE_ENCODER */
225
EXPORT void speex_encode_stereo_int(spx_int16_t *data, int frame_size, SpeexBits *bits)
226
{
227
}
228
#endif /* DISABLE_ENCODER */
229
230
231
#ifndef DISABLE_FLOAT_API
232
EXPORT void speex_decode_stereo(float *data, int frame_size, SpeexStereoState *_stereo)
233
6.10k
{
234
6.10k
   int i;
235
6.10k
   spx_word32_t balance;
236
6.10k
   spx_word16_t e_left, e_right, e_ratio;
237
6.10k
   RealSpeexStereoState *stereo = (RealSpeexStereoState*)_stereo;
238
239
6.10k
   COMPATIBILITY_HACK(stereo);
240
241
6.10k
   balance=stereo->balance;
242
6.10k
   e_ratio=stereo->e_ratio;
243
244
   /* These two are Q14, with max value just below 2. */
245
6.10k
   e_right = DIV32(QCONST32(1., 22), spx_sqrt(MULT16_32_Q15(e_ratio, ADD32(QCONST32(1., 16), balance))));
246
6.10k
   e_left = SHR32(MULT16_16(spx_sqrt(balance), e_right), 8);
247
248
2.39M
   for (i=frame_size-1;i>=0;i--)
249
2.39M
   {
250
2.39M
      spx_word16_t tmp=data[i];
251
2.39M
      stereo->smooth_left = EXTRACT16(PSHR32(MAC16_16(MULT16_16(stereo->smooth_left, QCONST16(0.98, 15)), e_left, QCONST16(0.02, 15)), 15));
252
2.39M
      stereo->smooth_right = EXTRACT16(PSHR32(MAC16_16(MULT16_16(stereo->smooth_right, QCONST16(0.98, 15)), e_right, QCONST16(0.02, 15)), 15));
253
2.39M
      data[2*i] = (float)MULT16_16_P14(stereo->smooth_left, tmp);
254
2.39M
      data[2*i+1] = (float)MULT16_16_P14(stereo->smooth_right, tmp);
255
2.39M
   }
256
6.10k
}
257
#endif /* #ifndef DISABLE_FLOAT_API */
258
259
EXPORT void speex_decode_stereo_int(spx_int16_t *data, int frame_size, SpeexStereoState *_stereo)
260
0
{
261
0
   int i;
262
0
   spx_word32_t balance;
263
0
   spx_word16_t e_left, e_right, e_ratio;
264
0
   RealSpeexStereoState *stereo = (RealSpeexStereoState*)_stereo;
265
266
0
   COMPATIBILITY_HACK(stereo);
267
268
0
   balance=stereo->balance;
269
0
   e_ratio=stereo->e_ratio;
270
271
   /* These two are Q14, with max value just below 2. */
272
0
   e_right = DIV32(QCONST32(1., 22), spx_sqrt(MULT16_32_Q15(e_ratio, ADD32(QCONST32(1., 16), balance))));
273
0
   e_left = SHR32(MULT16_16(spx_sqrt(balance), e_right), 8);
274
275
0
   for (i=frame_size-1;i>=0;i--)
276
0
   {
277
0
      spx_int16_t tmp=data[i];
278
0
      stereo->smooth_left = EXTRACT16(PSHR32(MAC16_16(MULT16_16(stereo->smooth_left, QCONST16(0.98, 15)), e_left, QCONST16(0.02, 15)), 15));
279
0
      stereo->smooth_right = EXTRACT16(PSHR32(MAC16_16(MULT16_16(stereo->smooth_right, QCONST16(0.98, 15)), e_right, QCONST16(0.02, 15)), 15));
280
0
      data[2*i] = (spx_int16_t)MULT16_16_P14(stereo->smooth_left, tmp);
281
0
      data[2*i+1] = (spx_int16_t)MULT16_16_P14(stereo->smooth_right, tmp);
282
0
   }
283
0
}
284
285
EXPORT int speex_std_stereo_request_handler(SpeexBits *bits, void *state, void *data)
286
507
{
287
507
   RealSpeexStereoState *stereo;
288
507
   spx_word16_t sign=1, dexp;
289
507
   int tmp;
290
291
507
   stereo = (RealSpeexStereoState*)data;
292
293
507
   COMPATIBILITY_HACK(stereo);
294
295
507
   if (speex_bits_unpack_unsigned(bits, 1))
296
248
      sign=-1;
297
507
   dexp = speex_bits_unpack_unsigned(bits, 5);
298
#ifndef FIXED_POINT
299
   stereo->balance = exp(sign*.25*dexp);
300
#else
301
507
   stereo->balance = spx_exp(MULT16_16(sign, SHL16(dexp, 9)));
302
507
#endif
303
507
   tmp = speex_bits_unpack_unsigned(bits, 2);
304
507
   stereo->e_ratio = e_ratio_quant[tmp];
305
306
507
   return 0;
307
507
}