/src/ffmpeg/libavcodec/cook.c
Line | Count | Source |
1 | | /* |
2 | | * COOK compatible decoder |
3 | | * Copyright (c) 2003 Sascha Sommer |
4 | | * Copyright (c) 2005 Benjamin Larsson |
5 | | * |
6 | | * This file is part of FFmpeg. |
7 | | * |
8 | | * FFmpeg is free software; you can redistribute it and/or |
9 | | * modify it under the terms of the GNU Lesser General Public |
10 | | * License as published by the Free Software Foundation; either |
11 | | * version 2.1 of the License, or (at your option) any later version. |
12 | | * |
13 | | * FFmpeg is distributed in the hope that it will be useful, |
14 | | * but WITHOUT ANY WARRANTY; without even the implied warranty of |
15 | | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU |
16 | | * Lesser General Public License for more details. |
17 | | * |
18 | | * You should have received a copy of the GNU Lesser General Public |
19 | | * License along with FFmpeg; if not, write to the Free Software |
20 | | * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA |
21 | | */ |
22 | | |
23 | | /** |
24 | | * @file |
25 | | * Cook compatible decoder. Bastardization of the G.722.1 standard. |
26 | | * This decoder handles RealNetworks, RealAudio G2 data. |
27 | | * Cook is identified by the codec name cook in RM files. |
28 | | * |
29 | | * To use this decoder, a calling application must supply the extradata |
30 | | * bytes provided from the RM container; 8+ bytes for mono streams and |
31 | | * 16+ for stereo streams (maybe more). |
32 | | * |
33 | | * Codec technicalities (all this assume a buffer length of 1024): |
34 | | * Cook works with several different techniques to achieve its compression. |
35 | | * In the timedomain the buffer is divided into 8 pieces and quantized. If |
36 | | * two neighboring pieces have different quantization index a smooth |
37 | | * quantization curve is used to get a smooth overlap between the different |
38 | | * pieces. |
39 | | * To get to the transformdomain Cook uses a modulated lapped transform. |
40 | | * The transform domain has 50 subbands with 20 elements each. This |
41 | | * means only a maximum of 50*20=1000 coefficients are used out of the 1024 |
42 | | * available. |
43 | | */ |
44 | | |
45 | | #include "libavutil/channel_layout.h" |
46 | | #include "libavutil/lfg.h" |
47 | | #include "libavutil/mem.h" |
48 | | #include "libavutil/mem_internal.h" |
49 | | #include "libavutil/thread.h" |
50 | | #include "libavutil/tx.h" |
51 | | |
52 | | #include "audiodsp.h" |
53 | | #include "avcodec.h" |
54 | | #include "get_bits.h" |
55 | | #include "bytestream.h" |
56 | | #include "codec_internal.h" |
57 | | #include "decode.h" |
58 | | #include "sinewin.h" |
59 | | #include "unary.h" |
60 | | |
61 | | #include "cookdata.h" |
62 | | |
63 | | /* the different Cook versions */ |
64 | 7 | #define MONO 0x1000001 |
65 | 1.08k | #define STEREO 0x1000002 |
66 | 35 | #define JOINT_STEREO 0x1000003 |
67 | 767 | #define MC_COOK 0x2000000 |
68 | | |
69 | 136M | #define SUBBAND_SIZE 20 |
70 | | #define MAX_SUBPACKETS 5 |
71 | | |
72 | 7.13M | #define QUANT_VLC_BITS 9 |
73 | 43.8k | #define COUPLING_VLC_BITS 6 |
74 | | |
75 | | typedef struct cook_gains { |
76 | | int *now; |
77 | | int *previous; |
78 | | } cook_gains; |
79 | | |
80 | | typedef struct COOKSubpacket { |
81 | | int ch_idx; |
82 | | int size; |
83 | | int num_channels; |
84 | | int cookversion; |
85 | | int subbands; |
86 | | int js_subband_start; |
87 | | int js_vlc_bits; |
88 | | int samples_per_channel; |
89 | | int log2_numvector_size; |
90 | | unsigned int channel_mask; |
91 | | VLC channel_coupling; |
92 | | int joint_stereo; |
93 | | int bits_per_subpacket; |
94 | | int bits_per_subpdiv; |
95 | | int total_subbands; |
96 | | int numvector_size; // 1 << log2_numvector_size; |
97 | | |
98 | | float mono_previous_buffer1[1024]; |
99 | | float mono_previous_buffer2[1024]; |
100 | | |
101 | | cook_gains gains1; |
102 | | cook_gains gains2; |
103 | | int gain_1[9]; |
104 | | int gain_2[9]; |
105 | | int gain_3[9]; |
106 | | int gain_4[9]; |
107 | | } COOKSubpacket; |
108 | | |
109 | | typedef struct cook { |
110 | | /* |
111 | | * The following 5 functions provide the lowlevel arithmetic on |
112 | | * the internal audio buffers. |
113 | | */ |
114 | | void (*scalar_dequant)(struct cook *q, int index, int quant_index, |
115 | | int *subband_coef_index, int *subband_coef_sign, |
116 | | float *mlt_p); |
117 | | |
118 | | void (*decouple)(struct cook *q, |
119 | | COOKSubpacket *p, |
120 | | int subband, |
121 | | float f1, float f2, |
122 | | float *decode_buffer, |
123 | | float *mlt_buffer1, float *mlt_buffer2); |
124 | | |
125 | | void (*imlt_window)(struct cook *q, float *buffer1, |
126 | | cook_gains *gains_ptr, float *previous_buffer); |
127 | | |
128 | | void (*interpolate)(struct cook *q, float *buffer, |
129 | | int gain_index, int gain_index_next); |
130 | | |
131 | | void (*saturate_output)(struct cook *q, float *out); |
132 | | |
133 | | AVCodecContext* avctx; |
134 | | AudioDSPContext adsp; |
135 | | GetBitContext gb; |
136 | | /* stream data */ |
137 | | int num_vectors; |
138 | | int samples_per_channel; |
139 | | /* states */ |
140 | | AVLFG random_state; |
141 | | int discarded_packets; |
142 | | |
143 | | /* transform data */ |
144 | | AVTXContext *mdct_ctx; |
145 | | av_tx_fn mdct_fn; |
146 | | float* mlt_window; |
147 | | |
148 | | /* VLC data */ |
149 | | VLC envelope_quant_index[13]; |
150 | | VLC sqvh[7]; // scalar quantization |
151 | | |
152 | | /* generate tables and related variables */ |
153 | | int gain_size_factor; |
154 | | float gain_table[31]; |
155 | | |
156 | | /* data buffers */ |
157 | | |
158 | | uint8_t* decoded_bytes_buffer; |
159 | | DECLARE_ALIGNED(32, float, mono_mdct_output)[2048]; |
160 | | float decode_buffer_1[1024]; |
161 | | float decode_buffer_2[1024]; |
162 | | float decode_buffer_0[1060]; /* static allocation for joint decode */ |
163 | | |
164 | | const float *cplscales[5]; |
165 | | int num_subpackets; |
166 | | COOKSubpacket subpacket[MAX_SUBPACKETS]; |
167 | | } COOKContext; |
168 | | |
169 | | static float pow2tab[127]; |
170 | | static float rootpow2tab[127]; |
171 | | |
172 | | /*************** init functions ***************/ |
173 | | |
174 | | /* table generator */ |
175 | | static av_cold void init_pow2table(void) |
176 | 1 | { |
177 | | /* fast way of computing 2^i and 2^(0.5*i) for -63 <= i < 64 */ |
178 | 1 | int i; |
179 | 1 | static const float exp2_tab[2] = {1, M_SQRT2}; |
180 | 1 | float exp2_val = powf(2, -63); |
181 | 1 | float root_val = powf(2, -32); |
182 | 128 | for (i = -63; i < 64; i++) { |
183 | 127 | if (!(i & 1)) |
184 | 63 | root_val *= 2; |
185 | 127 | pow2tab[63 + i] = exp2_val; |
186 | 127 | rootpow2tab[63 + i] = root_val * exp2_tab[i & 1]; |
187 | 127 | exp2_val *= 2; |
188 | 127 | } |
189 | 1 | } |
190 | | |
191 | | /* table generator */ |
192 | | static av_cold void init_gain_table(COOKContext *q) |
193 | 767 | { |
194 | 767 | int i; |
195 | 767 | q->gain_size_factor = q->samples_per_channel / 8; |
196 | 24.5k | for (i = 0; i < 31; i++) |
197 | 23.7k | q->gain_table[i] = pow(pow2tab[i + 48], |
198 | 23.7k | (1.0 / (double) q->gain_size_factor)); |
199 | 767 | } |
200 | | |
201 | | static av_cold int build_vlc(VLC *vlc, int nb_bits, const uint8_t counts[16], |
202 | | const void *syms, int symbol_size, int offset, |
203 | | void *logctx) |
204 | 15.6k | { |
205 | 15.6k | uint8_t lens[MAX_COOK_VLC_ENTRIES]; |
206 | 15.6k | unsigned num = 0; |
207 | | |
208 | 265k | for (int i = 0; i < 16; i++) |
209 | 1.48M | for (unsigned count = num + counts[i]; num < count; num++) |
210 | 1.23M | lens[num] = i + 1; |
211 | | |
212 | 15.6k | return ff_vlc_init_from_lengths(vlc, nb_bits, num, lens, 1, |
213 | 15.6k | syms, symbol_size, symbol_size, |
214 | 15.6k | offset, 0, logctx); |
215 | 15.6k | } |
216 | | |
217 | | static av_cold int init_cook_vlc_tables(COOKContext *q) |
218 | 767 | { |
219 | 767 | int i, result; |
220 | | |
221 | 767 | result = 0; |
222 | 10.7k | for (i = 0; i < 13; i++) { |
223 | 9.97k | result |= build_vlc(&q->envelope_quant_index[i], QUANT_VLC_BITS, |
224 | 9.97k | envelope_quant_index_huffcounts[i], |
225 | 9.97k | envelope_quant_index_huffsyms[i], 1, -12, q->avctx); |
226 | 9.97k | } |
227 | 767 | av_log(q->avctx, AV_LOG_DEBUG, "sqvh VLC init\n"); |
228 | 6.13k | for (i = 0; i < 7; i++) { |
229 | 5.36k | int sym_size = 1 + (i == 3); |
230 | 5.36k | result |= build_vlc(&q->sqvh[i], vhvlcsize_tab[i], |
231 | 5.36k | cvh_huffcounts[i], |
232 | 5.36k | cvh_huffsyms[i], sym_size, 0, q->avctx); |
233 | 5.36k | } |
234 | | |
235 | 1.71k | for (i = 0; i < q->num_subpackets; i++) { |
236 | 947 | if (q->subpacket[i].joint_stereo == 1) { |
237 | 292 | result |= build_vlc(&q->subpacket[i].channel_coupling, COUPLING_VLC_BITS, |
238 | 292 | ccpl_huffcounts[q->subpacket[i].js_vlc_bits - 2], |
239 | 292 | ccpl_huffsyms[q->subpacket[i].js_vlc_bits - 2], 1, |
240 | 292 | 0, q->avctx); |
241 | 292 | av_log(q->avctx, AV_LOG_DEBUG, "subpacket %i Joint-stereo VLC used.\n", i); |
242 | 292 | } |
243 | 947 | } |
244 | | |
245 | 767 | av_log(q->avctx, AV_LOG_DEBUG, "VLC tables initialized.\n"); |
246 | 767 | return result; |
247 | 767 | } |
248 | | |
249 | | static av_cold int init_cook_mlt(COOKContext *q) |
250 | 767 | { |
251 | 767 | int j, ret; |
252 | 767 | int mlt_size = q->samples_per_channel; |
253 | 767 | const float scale = 1.0 / 32768.0; |
254 | | |
255 | 767 | if (!(q->mlt_window = av_malloc_array(mlt_size, sizeof(*q->mlt_window)))) |
256 | 0 | return AVERROR(ENOMEM); |
257 | | |
258 | | /* Initialize the MLT window: simple sine window. */ |
259 | 767 | ff_sine_window_init(q->mlt_window, mlt_size); |
260 | 382k | for (j = 0; j < mlt_size; j++) |
261 | 381k | q->mlt_window[j] *= sqrt(2.0 / q->samples_per_channel); |
262 | | |
263 | | /* Initialize the MDCT. */ |
264 | 767 | ret = av_tx_init(&q->mdct_ctx, &q->mdct_fn, AV_TX_FLOAT_MDCT, |
265 | 767 | 1, mlt_size, &scale, AV_TX_FULL_IMDCT); |
266 | 767 | if (ret < 0) |
267 | 0 | return ret; |
268 | | |
269 | 767 | return 0; |
270 | 767 | } |
271 | | |
272 | | static av_cold void init_cplscales_table(COOKContext *q) |
273 | 767 | { |
274 | 767 | int i; |
275 | 4.60k | for (i = 0; i < 5; i++) |
276 | 3.83k | q->cplscales[i] = cplscales[i]; |
277 | 767 | } |
278 | | |
279 | | /*************** init functions end ***********/ |
280 | | |
281 | 767 | #define DECODE_BYTES_PAD1(bytes) (3 - ((bytes) + 3) % 4) |
282 | | #define DECODE_BYTES_PAD2(bytes) ((bytes) % 4 + DECODE_BYTES_PAD1(2 * (bytes))) |
283 | | |
284 | | /** |
285 | | * Cook indata decoding, every 32 bits are XORed with 0x37c511f2. |
286 | | * Why? No idea, some checksum/error detection method maybe. |
287 | | * |
288 | | * Out buffer size: extra bytes are needed to cope with |
289 | | * padding/misalignment. |
290 | | * Subpackets passed to the decoder can contain two, consecutive |
291 | | * half-subpackets, of identical but arbitrary size. |
292 | | * 1234 1234 1234 1234 extraA extraB |
293 | | * Case 1: AAAA BBBB 0 0 |
294 | | * Case 2: AAAA ABBB BB-- 3 3 |
295 | | * Case 3: AAAA AABB BBBB 2 2 |
296 | | * Case 4: AAAA AAAB BBBB BB-- 1 5 |
297 | | * |
298 | | * Nice way to waste CPU cycles. |
299 | | * |
300 | | * @param inbuffer pointer to byte array of indata |
301 | | * @param out pointer to byte array of outdata |
302 | | * @param bytes number of bytes |
303 | | */ |
304 | | static inline int decode_bytes(const uint8_t *inbuffer, uint8_t *out, int bytes) |
305 | 250k | { |
306 | 250k | static const uint32_t tab[4] = { |
307 | 250k | AV_BE2NE32C(0x37c511f2u), AV_BE2NE32C(0xf237c511u), |
308 | 250k | AV_BE2NE32C(0x11f237c5u), AV_BE2NE32C(0xc511f237u), |
309 | 250k | }; |
310 | 250k | int i, off; |
311 | 250k | uint32_t c; |
312 | 250k | const uint32_t *buf; |
313 | 250k | uint32_t *obuf = (uint32_t *) out; |
314 | | /* FIXME: 64 bit platforms would be able to do 64 bits at a time. |
315 | | * I'm too lazy though, should be something like |
316 | | * for (i = 0; i < bitamount / 64; i++) |
317 | | * (int64_t) out[i] = 0x37c511f237c511f2 ^ av_be2ne64(int64_t) in[i]); |
318 | | * Buffer alignment needs to be checked. */ |
319 | | |
320 | 250k | off = (intptr_t) inbuffer & 3; |
321 | 250k | buf = (const uint32_t *) (inbuffer - off); |
322 | 250k | c = tab[off]; |
323 | 250k | bytes += 3 + off; |
324 | 3.66M | for (i = 0; i < bytes / 4; i++) |
325 | 3.41M | obuf[i] = c ^ buf[i]; |
326 | | |
327 | 250k | return off; |
328 | 250k | } |
329 | | |
330 | | static av_cold int cook_decode_close(AVCodecContext *avctx) |
331 | 1.15k | { |
332 | 1.15k | int i; |
333 | 1.15k | COOKContext *q = avctx->priv_data; |
334 | 1.15k | av_log(avctx, AV_LOG_DEBUG, "Deallocating memory.\n"); |
335 | | |
336 | | /* Free allocated memory buffers. */ |
337 | 1.15k | av_freep(&q->mlt_window); |
338 | 1.15k | av_freep(&q->decoded_bytes_buffer); |
339 | | |
340 | | /* Free the transform. */ |
341 | 1.15k | av_tx_uninit(&q->mdct_ctx); |
342 | | |
343 | | /* Free the VLC tables. */ |
344 | 16.1k | for (i = 0; i < 13; i++) |
345 | 14.9k | ff_vlc_free(&q->envelope_quant_index[i]); |
346 | 9.21k | for (i = 0; i < 7; i++) |
347 | 8.06k | ff_vlc_free(&q->sqvh[i]); |
348 | 2.21k | for (i = 0; i < q->num_subpackets; i++) |
349 | 1.06k | ff_vlc_free(&q->subpacket[i].channel_coupling); |
350 | | |
351 | 1.15k | av_log(avctx, AV_LOG_DEBUG, "Memory deallocated.\n"); |
352 | | |
353 | 1.15k | return 0; |
354 | 1.15k | } |
355 | | |
356 | | /** |
357 | | * Fill the gain array for the timedomain quantization. |
358 | | * |
359 | | * @param gb pointer to the GetBitContext |
360 | | * @param gaininfo array[9] of gain indexes |
361 | | */ |
362 | | static void decode_gain_info(GetBitContext *gb, int *gaininfo) |
363 | 250k | { |
364 | 250k | int i, n; |
365 | | |
366 | 250k | n = get_unary(gb, 0, get_bits_left(gb)); // amount of elements*2 to update |
367 | | |
368 | 250k | i = 0; |
369 | 375k | while (n--) { |
370 | 124k | int index = get_bits(gb, 3); |
371 | 124k | int gain = get_bits1(gb) ? get_bits(gb, 4) - 7 : -1; |
372 | | |
373 | 382k | while (i <= index) |
374 | 258k | gaininfo[i++] = gain; |
375 | 124k | } |
376 | 2.24M | while (i <= 8) |
377 | 1.99M | gaininfo[i++] = 0; |
378 | 250k | } |
379 | | |
380 | | /** |
381 | | * Create the quant index table needed for the envelope. |
382 | | * |
383 | | * @param q pointer to the COOKContext |
384 | | * @param quant_index_table pointer to the array |
385 | | */ |
386 | | static int decode_envelope(COOKContext *q, COOKSubpacket *p, |
387 | | int *quant_index_table) |
388 | 250k | { |
389 | 250k | int i, j, vlc_index; |
390 | | |
391 | 250k | quant_index_table[0] = get_bits(&q->gb, 6) - 6; // This is used later in categorize |
392 | | |
393 | 7.36M | for (i = 1; i < p->total_subbands; i++) { |
394 | 7.12M | vlc_index = i; |
395 | 7.12M | if (i >= p->js_subband_start * 2) { |
396 | 1.41M | vlc_index -= p->js_subband_start; |
397 | 5.70M | } else { |
398 | 5.70M | vlc_index /= 2; |
399 | 5.70M | if (vlc_index < 1) |
400 | 129k | vlc_index = 1; |
401 | 5.70M | } |
402 | 7.12M | if (vlc_index > 13) |
403 | 3.23M | vlc_index = 13; // the VLC tables >13 are identical to No. 13 |
404 | | |
405 | 7.12M | j = get_vlc2(&q->gb, q->envelope_quant_index[vlc_index - 1].table, |
406 | 7.12M | QUANT_VLC_BITS, 2); |
407 | 7.12M | quant_index_table[i] = quant_index_table[i - 1] + j; // differential encoding |
408 | 7.12M | if (quant_index_table[i] > 63 || quant_index_table[i] < -63) { |
409 | 4.82k | av_log(q->avctx, AV_LOG_ERROR, |
410 | 4.82k | "Invalid quantizer %d at position %d, outside [-63, 63] range\n", |
411 | 4.82k | quant_index_table[i], i); |
412 | 4.82k | return AVERROR_INVALIDDATA; |
413 | 4.82k | } |
414 | 7.12M | } |
415 | | |
416 | 245k | return 0; |
417 | 250k | } |
418 | | |
419 | | /** |
420 | | * Calculate the category and category_index vector. |
421 | | * |
422 | | * @param q pointer to the COOKContext |
423 | | * @param quant_index_table pointer to the array |
424 | | * @param category pointer to the category array |
425 | | * @param category_index pointer to the category_index array |
426 | | */ |
427 | | static void categorize(COOKContext *q, COOKSubpacket *p, const int *quant_index_table, |
428 | | int *category, int *category_index) |
429 | 245k | { |
430 | 245k | int exp_idx, bias, tmpbias1, tmpbias2, bits_left, num_bits, index, v, i, j; |
431 | 245k | int exp_index2[102] = { 0 }; |
432 | 245k | int exp_index1[102] = { 0 }; |
433 | | |
434 | 245k | int tmp_categorize_array[128 * 2] = { 0 }; |
435 | 245k | int tmp_categorize_array1_idx = p->numvector_size; |
436 | 245k | int tmp_categorize_array2_idx = p->numvector_size; |
437 | | |
438 | 245k | bits_left = p->bits_per_subpacket - get_bits_count(&q->gb); |
439 | | |
440 | 245k | if (bits_left > q->samples_per_channel) |
441 | 969 | bits_left = q->samples_per_channel + |
442 | 969 | ((bits_left - q->samples_per_channel) * 5) / 8; |
443 | | |
444 | 245k | bias = -32; |
445 | | |
446 | | /* Estimate bias. */ |
447 | 1.71M | for (i = 32; i > 0; i = i / 2) { |
448 | 1.47M | num_bits = 0; |
449 | 1.47M | index = 0; |
450 | 44.5M | for (j = p->total_subbands; j > 0; j--) { |
451 | 43.0M | exp_idx = av_clip_uintp2((i - quant_index_table[index] + bias) / 2, 3); |
452 | 43.0M | index++; |
453 | 43.0M | num_bits += expbits_tab[exp_idx]; |
454 | 43.0M | } |
455 | 1.47M | if (num_bits >= bits_left - 32) |
456 | 1.42M | bias += i; |
457 | 1.47M | } |
458 | | |
459 | | /* Calculate total number of bits. */ |
460 | 245k | num_bits = 0; |
461 | 7.42M | for (i = 0; i < p->total_subbands; i++) { |
462 | 7.18M | exp_idx = av_clip_uintp2((bias - quant_index_table[i]) / 2, 3); |
463 | 7.18M | num_bits += expbits_tab[exp_idx]; |
464 | 7.18M | exp_index1[i] = exp_idx; |
465 | 7.18M | exp_index2[i] = exp_idx; |
466 | 7.18M | } |
467 | 245k | tmpbias1 = tmpbias2 = num_bits; |
468 | | |
469 | 4.39M | for (j = 1; j < p->numvector_size; j++) { |
470 | 4.36M | if (tmpbias1 + tmpbias2 > 2 * bits_left) { /* ---> */ |
471 | 3.97M | int max = -999999; |
472 | 3.97M | index = -1; |
473 | 172M | for (i = 0; i < p->total_subbands; i++) { |
474 | 168M | if (exp_index1[i] < 7) { |
475 | 22.3M | v = (-2 * exp_index1[i]) - quant_index_table[i] + bias; |
476 | 22.3M | if (v >= max) { |
477 | 13.7M | max = v; |
478 | 13.7M | index = i; |
479 | 13.7M | } |
480 | 22.3M | } |
481 | 168M | } |
482 | 3.97M | if (index == -1) |
483 | 210k | break; |
484 | 3.76M | tmp_categorize_array[tmp_categorize_array1_idx++] = index; |
485 | 3.76M | tmpbias1 -= expbits_tab[exp_index1[index]] - |
486 | 3.76M | expbits_tab[exp_index1[index] + 1]; |
487 | 3.76M | ++exp_index1[index]; |
488 | 3.76M | } else { /* <--- */ |
489 | 388k | int min = 999999; |
490 | 388k | index = -1; |
491 | 3.29M | for (i = 0; i < p->total_subbands; i++) { |
492 | 2.90M | if (exp_index2[i] > 0) { |
493 | 2.30M | v = (-2 * exp_index2[i]) - quant_index_table[i] + bias; |
494 | 2.30M | if (v < min) { |
495 | 748k | min = v; |
496 | 748k | index = i; |
497 | 748k | } |
498 | 2.30M | } |
499 | 2.90M | } |
500 | 388k | if (index == -1) |
501 | 507 | break; |
502 | 387k | tmp_categorize_array[--tmp_categorize_array2_idx] = index; |
503 | 387k | tmpbias2 -= expbits_tab[exp_index2[index]] - |
504 | 387k | expbits_tab[exp_index2[index] - 1]; |
505 | 387k | --exp_index2[index]; |
506 | 387k | } |
507 | 4.36M | } |
508 | | |
509 | 7.42M | for (i = 0; i < p->total_subbands; i++) |
510 | 7.18M | category[i] = exp_index2[i]; |
511 | | |
512 | 10.1M | for (i = 0; i < p->numvector_size - 1; i++) |
513 | 9.90M | category_index[i] = tmp_categorize_array[tmp_categorize_array2_idx++]; |
514 | 245k | } |
515 | | |
516 | | |
517 | | /** |
518 | | * Expand the category vector. |
519 | | * |
520 | | * @param q pointer to the COOKContext |
521 | | * @param category pointer to the category array |
522 | | * @param category_index pointer to the category_index array |
523 | | */ |
524 | | static inline void expand_category(COOKContext *q, int *category, |
525 | | int *category_index) |
526 | 245k | { |
527 | 245k | int i; |
528 | 2.59M | for (i = 0; i < q->num_vectors; i++) |
529 | 2.35M | { |
530 | 2.35M | int idx = category_index[i]; |
531 | 2.35M | if (++category[idx] >= FF_ARRAY_ELEMS(dither_tab)) |
532 | 1.65M | --category[idx]; |
533 | 2.35M | } |
534 | 245k | } |
535 | | |
536 | | /** |
537 | | * The real requantization of the mltcoefs |
538 | | * |
539 | | * @param q pointer to the COOKContext |
540 | | * @param index index |
541 | | * @param quant_index quantisation index |
542 | | * @param subband_coef_index array of indexes to quant_centroid_tab |
543 | | * @param subband_coef_sign signs of coefficients |
544 | | * @param mlt_p pointer into the mlt buffer |
545 | | */ |
546 | | static void scalar_dequant_float(COOKContext *q, int index, int quant_index, |
547 | | int *subband_coef_index, int *subband_coef_sign, |
548 | | float *mlt_p) |
549 | 4.24M | { |
550 | 4.24M | int i; |
551 | 4.24M | float f1; |
552 | | |
553 | 89.1M | for (i = 0; i < SUBBAND_SIZE; i++) { |
554 | 84.8M | if (subband_coef_index[i]) { |
555 | 745k | f1 = quant_centroid_tab[index][subband_coef_index[i]]; |
556 | 745k | if (subband_coef_sign[i]) |
557 | 374k | f1 = -f1; |
558 | 84.1M | } else { |
559 | | /* noise coding if subband_coef_index[i] == 0 */ |
560 | 84.1M | f1 = dither_tab[index]; |
561 | 84.1M | if (av_lfg_get(&q->random_state) < 0x80000000) |
562 | 42.0M | f1 = -f1; |
563 | 84.1M | } |
564 | 84.8M | mlt_p[i] = f1 * rootpow2tab[quant_index + 63]; |
565 | 84.8M | } |
566 | 4.24M | } |
567 | | /** |
568 | | * Unpack the subband_coef_index and subband_coef_sign vectors. |
569 | | * |
570 | | * @param q pointer to the COOKContext |
571 | | * @param category pointer to the category array |
572 | | * @param subband_coef_index array of indexes to quant_centroid_tab |
573 | | * @param subband_coef_sign signs of coefficients |
574 | | */ |
575 | | static int unpack_SQVH(COOKContext *q, COOKSubpacket *p, int category, |
576 | | int *subband_coef_index, int *subband_coef_sign) |
577 | 223k | { |
578 | 223k | int i, j; |
579 | 223k | int vlc, vd, tmp, result; |
580 | | |
581 | 223k | vd = vd_tab[category]; |
582 | 223k | result = 0; |
583 | 2.01M | for (i = 0; i < vpr_tab[category]; i++) { |
584 | 1.79M | vlc = get_vlc2(&q->gb, q->sqvh[category].table, q->sqvh[category].bits, 3); |
585 | 1.79M | if (p->bits_per_subpacket < get_bits_count(&q->gb)) { |
586 | 834k | vlc = 0; |
587 | 834k | result = 1; |
588 | 834k | } |
589 | 6.25M | for (j = vd - 1; j >= 0; j--) { |
590 | 4.46M | tmp = (vlc * invradix_tab[category]) / 0x100000; |
591 | 4.46M | subband_coef_index[vd * i + j] = vlc - tmp * (kmax_tab[category] + 1); |
592 | 4.46M | vlc = tmp; |
593 | 4.46M | } |
594 | 6.25M | for (j = 0; j < vd; j++) { |
595 | 4.46M | if (subband_coef_index[i * vd + j]) { |
596 | 790k | if (get_bits_count(&q->gb) < p->bits_per_subpacket) { |
597 | 782k | subband_coef_sign[i * vd + j] = get_bits1(&q->gb); |
598 | 782k | } else { |
599 | 7.73k | result = 1; |
600 | 7.73k | subband_coef_sign[i * vd + j] = 0; |
601 | 7.73k | } |
602 | 3.67M | } else { |
603 | 3.67M | subband_coef_sign[i * vd + j] = 0; |
604 | 3.67M | } |
605 | 4.46M | } |
606 | 1.79M | } |
607 | 223k | return result; |
608 | 223k | } |
609 | | |
610 | | |
611 | | /** |
612 | | * Fill the mlt_buffer with mlt coefficients. |
613 | | * |
614 | | * @param q pointer to the COOKContext |
615 | | * @param category pointer to the category array |
616 | | * @param quant_index_table pointer to the array |
617 | | * @param mlt_buffer pointer to mlt coefficients |
618 | | */ |
619 | | static void decode_vectors(COOKContext *q, COOKSubpacket *p, int *category, |
620 | | int *quant_index_table, float *mlt_buffer) |
621 | 117k | { |
622 | | /* A zero in this table means that the subband coefficient is |
623 | | random noise coded. */ |
624 | 117k | int subband_coef_index[SUBBAND_SIZE]; |
625 | | /* A zero in this table means that the subband coefficient is a |
626 | | positive multiplicator. */ |
627 | 117k | int subband_coef_sign[SUBBAND_SIZE]; |
628 | 117k | int band, j; |
629 | 117k | int index = 0; |
630 | | |
631 | 4.36M | for (band = 0; band < p->total_subbands; band++) { |
632 | 4.24M | index = category[band]; |
633 | 4.24M | if (category[band] < 7) { |
634 | 223k | if (unpack_SQVH(q, p, category[band], subband_coef_index, subband_coef_sign)) { |
635 | 97.2k | index = 7; |
636 | 3.99M | for (j = 0; j < p->total_subbands; j++) |
637 | 3.89M | category[band + j] = 7; |
638 | 97.2k | } |
639 | 223k | } |
640 | 4.24M | if (index >= 7) { |
641 | 4.11M | memset(subband_coef_index, 0, sizeof(subband_coef_index)); |
642 | 4.11M | memset(subband_coef_sign, 0, sizeof(subband_coef_sign)); |
643 | 4.11M | } |
644 | 4.24M | q->scalar_dequant(q, index, quant_index_table[band], |
645 | 4.24M | subband_coef_index, subband_coef_sign, |
646 | 4.24M | &mlt_buffer[band * SUBBAND_SIZE]); |
647 | 4.24M | } |
648 | | |
649 | | /* FIXME: should this be removed, or moved into loop above? */ |
650 | 117k | if (p->total_subbands * SUBBAND_SIZE >= q->samples_per_channel) |
651 | 78.9k | return; |
652 | 117k | } |
653 | | |
654 | | |
655 | | static int mono_decode(COOKContext *q, COOKSubpacket *p, float *mlt_buffer) |
656 | 250k | { |
657 | 250k | int category_index[128] = { 0 }; |
658 | 250k | int category[128] = { 0 }; |
659 | 250k | int quant_index_table[102]; |
660 | 250k | int res, i; |
661 | | |
662 | 250k | if ((res = decode_envelope(q, p, quant_index_table)) < 0) |
663 | 4.82k | return res; |
664 | 245k | q->num_vectors = get_bits(&q->gb, p->log2_numvector_size); |
665 | 245k | categorize(q, p, quant_index_table, category, category_index); |
666 | 245k | expand_category(q, category, category_index); |
667 | 4.48M | for (i=0; i<p->total_subbands; i++) { |
668 | 4.37M | if (category[i] > 7) |
669 | 128k | return AVERROR_INVALIDDATA; |
670 | 4.37M | } |
671 | 117k | decode_vectors(q, p, category, quant_index_table, mlt_buffer); |
672 | | |
673 | 117k | return 0; |
674 | 245k | } |
675 | | |
676 | | |
677 | | /** |
678 | | * the actual requantization of the timedomain samples |
679 | | * |
680 | | * @param q pointer to the COOKContext |
681 | | * @param buffer pointer to the timedomain buffer |
682 | | * @param gain_index index for the block multiplier |
683 | | * @param gain_index_next index for the next block multiplier |
684 | | */ |
685 | | static void interpolate_float(COOKContext *q, float *buffer, |
686 | | int gain_index, int gain_index_next) |
687 | 107k | { |
688 | 107k | int i; |
689 | 107k | float fc1, fc2; |
690 | 107k | fc1 = pow2tab[gain_index + 63]; |
691 | | |
692 | 107k | if (gain_index == gain_index_next) { // static gain |
693 | 5.29M | for (i = 0; i < q->gain_size_factor; i++) |
694 | 5.21M | buffer[i] *= fc1; |
695 | 79.4k | } else { // smooth gain |
696 | 28.0k | fc2 = q->gain_table[15 + (gain_index_next - gain_index)]; |
697 | 1.92M | for (i = 0; i < q->gain_size_factor; i++) { |
698 | 1.89M | buffer[i] *= fc1; |
699 | 1.89M | fc1 *= fc2; |
700 | 1.89M | } |
701 | 28.0k | } |
702 | 107k | } |
703 | | |
704 | | /** |
705 | | * Apply transform window, overlap buffers. |
706 | | * |
707 | | * @param q pointer to the COOKContext |
708 | | * @param inbuffer pointer to the mltcoefficients |
709 | | * @param gains_ptr current and previous gains |
710 | | * @param previous_buffer pointer to the previous buffer to be used for overlapping |
711 | | */ |
712 | | static void imlt_window_float(COOKContext *q, float *inbuffer, |
713 | | cook_gains *gains_ptr, float *previous_buffer) |
714 | 190k | { |
715 | 190k | const float fc = pow2tab[gains_ptr->previous[0] + 63]; |
716 | 190k | int i; |
717 | | /* The weird thing here, is that the two halves of the time domain |
718 | | * buffer are swapped. Also, the newest data, that we save away for |
719 | | * next frame, has the wrong sign. Hence the subtraction below. |
720 | | * Almost sounds like a complex conjugate/reverse data/FFT effect. |
721 | | */ |
722 | | |
723 | | /* Apply window and overlap */ |
724 | 92.6M | for (i = 0; i < q->samples_per_channel; i++) |
725 | 92.4M | inbuffer[i] = inbuffer[i] * fc * q->mlt_window[i] - |
726 | 92.4M | previous_buffer[i] * q->mlt_window[q->samples_per_channel - 1 - i]; |
727 | 190k | } |
728 | | |
729 | | /** |
730 | | * The modulated lapped transform, this takes transform coefficients |
731 | | * and transforms them into timedomain samples. |
732 | | * Apply transform window, overlap buffers, apply gain profile |
733 | | * and buffer management. |
734 | | * |
735 | | * @param q pointer to the COOKContext |
736 | | * @param inbuffer pointer to the mltcoefficients |
737 | | * @param gains_ptr current and previous gains |
738 | | * @param previous_buffer pointer to the previous buffer to be used for overlapping |
739 | | */ |
740 | | static void imlt_gain(COOKContext *q, float *inbuffer, |
741 | | cook_gains *gains_ptr, float *previous_buffer) |
742 | 190k | { |
743 | 190k | float *buffer0 = q->mono_mdct_output; |
744 | 190k | float *buffer1 = q->mono_mdct_output + q->samples_per_channel; |
745 | 190k | int i; |
746 | | |
747 | | /* Inverse modified discrete cosine transform */ |
748 | 190k | q->mdct_fn(q->mdct_ctx, q->mono_mdct_output, inbuffer, sizeof(float)); |
749 | | |
750 | 190k | q->imlt_window(q, buffer1, gains_ptr, previous_buffer); |
751 | | |
752 | | /* Apply gain profile */ |
753 | 1.71M | for (i = 0; i < 8; i++) |
754 | 1.52M | if (gains_ptr->now[i] || gains_ptr->now[i + 1]) |
755 | 107k | q->interpolate(q, &buffer1[q->gain_size_factor * i], |
756 | 107k | gains_ptr->now[i], gains_ptr->now[i + 1]); |
757 | | |
758 | | /* Save away the current to be previous block. */ |
759 | 190k | memcpy(previous_buffer, buffer0, |
760 | 190k | q->samples_per_channel * sizeof(*previous_buffer)); |
761 | 190k | } |
762 | | |
763 | | |
764 | | /** |
765 | | * function for getting the jointstereo coupling information |
766 | | * |
767 | | * @param q pointer to the COOKContext |
768 | | * @param decouple_tab decoupling array |
769 | | */ |
770 | | static int decouple_info(COOKContext *q, COOKSubpacket *p, int *decouple_tab) |
771 | 130k | { |
772 | 130k | int i; |
773 | 130k | int vlc = get_bits1(&q->gb); |
774 | 130k | int start = cplband[p->js_subband_start]; |
775 | 130k | int end = cplband[p->subbands - 1]; |
776 | 130k | int length = end - start + 1; |
777 | | |
778 | 130k | if (start > end) |
779 | 70.9k | return 0; |
780 | | |
781 | 59.5k | if (vlc) |
782 | 52.8k | for (i = 0; i < length; i++) |
783 | 43.5k | decouple_tab[start + i] = get_vlc2(&q->gb, |
784 | 43.5k | p->channel_coupling.table, |
785 | 43.5k | COUPLING_VLC_BITS, 3); |
786 | 50.1k | else |
787 | 214k | for (i = 0; i < length; i++) { |
788 | 164k | int v = get_bits(&q->gb, p->js_vlc_bits); |
789 | 164k | if (v == (1<<p->js_vlc_bits)-1) { |
790 | 292 | av_log(q->avctx, AV_LOG_ERROR, "decouple value too large\n"); |
791 | 292 | return AVERROR_INVALIDDATA; |
792 | 292 | } |
793 | 164k | decouple_tab[start + i] = v; |
794 | 164k | } |
795 | 59.2k | return 0; |
796 | 59.5k | } |
797 | | |
798 | | /** |
799 | | * function decouples a pair of signals from a single signal via multiplication. |
800 | | * |
801 | | * @param q pointer to the COOKContext |
802 | | * @param subband index of the current subband |
803 | | * @param f1 multiplier for channel 1 extraction |
804 | | * @param f2 multiplier for channel 2 extraction |
805 | | * @param decode_buffer input buffer |
806 | | * @param mlt_buffer1 pointer to left channel mlt coefficients |
807 | | * @param mlt_buffer2 pointer to right channel mlt coefficients |
808 | | */ |
809 | | static void decouple_float(COOKContext *q, |
810 | | COOKSubpacket *p, |
811 | | int subband, |
812 | | float f1, float f2, |
813 | | float *decode_buffer, |
814 | | float *mlt_buffer1, float *mlt_buffer2) |
815 | 52.0k | { |
816 | 52.0k | int j, tmp_idx; |
817 | 1.09M | for (j = 0; j < SUBBAND_SIZE; j++) { |
818 | 1.04M | tmp_idx = ((p->js_subband_start + subband) * SUBBAND_SIZE) + j; |
819 | 1.04M | mlt_buffer1[SUBBAND_SIZE * subband + j] = f1 * decode_buffer[tmp_idx]; |
820 | 1.04M | mlt_buffer2[SUBBAND_SIZE * subband + j] = f2 * decode_buffer[tmp_idx]; |
821 | 1.04M | } |
822 | 52.0k | } |
823 | | |
824 | | /** |
825 | | * function for decoding joint stereo data |
826 | | * |
827 | | * @param q pointer to the COOKContext |
828 | | * @param mlt_buffer1 pointer to left channel mlt coefficients |
829 | | * @param mlt_buffer2 pointer to right channel mlt coefficients |
830 | | */ |
831 | | static int joint_decode(COOKContext *q, COOKSubpacket *p, |
832 | | float *mlt_buffer_left, float *mlt_buffer_right) |
833 | 130k | { |
834 | 130k | int i, j, res; |
835 | 130k | int decouple_tab[SUBBAND_SIZE] = { 0 }; |
836 | 130k | float *decode_buffer = q->decode_buffer_0; |
837 | 130k | int idx, cpl_tmp; |
838 | 130k | float f1, f2; |
839 | 130k | const float *cplscale; |
840 | | |
841 | 130k | memset(decode_buffer, 0, sizeof(q->decode_buffer_0)); |
842 | | |
843 | | /* Make sure the buffers are zeroed out. */ |
844 | 130k | memset(mlt_buffer_left, 0, 1024 * sizeof(*mlt_buffer_left)); |
845 | 130k | memset(mlt_buffer_right, 0, 1024 * sizeof(*mlt_buffer_right)); |
846 | 130k | if ((res = decouple_info(q, p, decouple_tab)) < 0) |
847 | 292 | return res; |
848 | 130k | if ((res = mono_decode(q, p, decode_buffer)) < 0) |
849 | 56.3k | return res; |
850 | | /* The two channels are stored interleaved in decode_buffer. */ |
851 | 1.93M | for (i = 0; i < p->js_subband_start; i++) { |
852 | 39.0M | for (j = 0; j < SUBBAND_SIZE; j++) { |
853 | 37.1M | mlt_buffer_left[i * 20 + j] = decode_buffer[i * 40 + j]; |
854 | 37.1M | mlt_buffer_right[i * 20 + j] = decode_buffer[i * 40 + 20 + j]; |
855 | 37.1M | } |
856 | 1.85M | } |
857 | | |
858 | | /* When we reach js_subband_start (the higher frequencies) |
859 | | the coefficients are stored in a coupling scheme. */ |
860 | 73.8k | idx = (1 << p->js_vlc_bits) - 1; |
861 | 125k | for (i = p->js_subband_start; i < p->subbands; i++) { |
862 | 52.0k | cpl_tmp = cplband[i]; |
863 | 52.0k | idx -= decouple_tab[cpl_tmp]; |
864 | 52.0k | cplscale = q->cplscales[p->js_vlc_bits - 2]; // choose decoupler table |
865 | 52.0k | f1 = cplscale[decouple_tab[cpl_tmp] + 1]; |
866 | 52.0k | f2 = cplscale[idx]; |
867 | 52.0k | q->decouple(q, p, i, f1, f2, decode_buffer, |
868 | 52.0k | mlt_buffer_left, mlt_buffer_right); |
869 | 52.0k | idx = (1 << p->js_vlc_bits) - 1; |
870 | 52.0k | } |
871 | | |
872 | 73.8k | return 0; |
873 | 130k | } |
874 | | |
875 | | /** |
876 | | * First part of subpacket decoding: |
877 | | * decode raw stream bytes and read gain info. |
878 | | * |
879 | | * @param q pointer to the COOKContext |
880 | | * @param inbuffer pointer to raw stream data |
881 | | * @param gains_ptr array of current/prev gain pointers |
882 | | */ |
883 | | static inline void decode_bytes_and_gain(COOKContext *q, COOKSubpacket *p, |
884 | | const uint8_t *inbuffer, |
885 | | cook_gains *gains_ptr) |
886 | 250k | { |
887 | 250k | int offset; |
888 | | |
889 | 250k | offset = decode_bytes(inbuffer, q->decoded_bytes_buffer, |
890 | 250k | p->bits_per_subpacket / 8); |
891 | 250k | init_get_bits(&q->gb, q->decoded_bytes_buffer + offset, |
892 | 250k | p->bits_per_subpacket); |
893 | 250k | decode_gain_info(&q->gb, gains_ptr->now); |
894 | | |
895 | | /* Swap current and previous gains */ |
896 | 250k | FFSWAP(int *, gains_ptr->now, gains_ptr->previous); |
897 | 250k | } |
898 | | |
899 | | /** |
900 | | * Saturate the output signal and interleave. |
901 | | * |
902 | | * @param q pointer to the COOKContext |
903 | | * @param out pointer to the output vector |
904 | | */ |
905 | | static void saturate_output_float(COOKContext *q, float *out) |
906 | 184k | { |
907 | 184k | q->adsp.vector_clipf(out, q->mono_mdct_output + q->samples_per_channel, |
908 | 184k | FFALIGN(q->samples_per_channel, 8), -1.0f, 1.0f); |
909 | 184k | } |
910 | | |
911 | | |
912 | | /** |
913 | | * Final part of subpacket decoding: |
914 | | * Apply modulated lapped transform, gain compensation, |
915 | | * clip and convert to integer. |
916 | | * |
917 | | * @param q pointer to the COOKContext |
918 | | * @param decode_buffer pointer to the mlt coefficients |
919 | | * @param gains_ptr array of current/prev gain pointers |
920 | | * @param previous_buffer pointer to the previous buffer to be used for overlapping |
921 | | * @param out pointer to the output buffer |
922 | | */ |
923 | | static inline void mlt_compensate_output(COOKContext *q, float *decode_buffer, |
924 | | cook_gains *gains_ptr, float *previous_buffer, |
925 | | float *out) |
926 | 190k | { |
927 | 190k | imlt_gain(q, decode_buffer, gains_ptr, previous_buffer); |
928 | 190k | if (out) |
929 | 184k | q->saturate_output(q, out); |
930 | 190k | } |
931 | | |
932 | | |
933 | | /** |
934 | | * Cook subpacket decoding. This function returns one decoded subpacket, |
935 | | * usually 1024 samples per channel. |
936 | | * |
937 | | * @param q pointer to the COOKContext |
938 | | * @param inbuffer pointer to the inbuffer |
939 | | * @param outbuffer pointer to the outbuffer |
940 | | */ |
941 | | static int decode_subpacket(COOKContext *q, COOKSubpacket *p, |
942 | | const uint8_t *inbuffer, float **outbuffer) |
943 | 234k | { |
944 | 234k | int sub_packet_size = p->size; |
945 | 234k | int res; |
946 | | |
947 | 234k | memset(q->decode_buffer_1, 0, sizeof(q->decode_buffer_1)); |
948 | 234k | decode_bytes_and_gain(q, p, inbuffer, &p->gains1); |
949 | | |
950 | 234k | if (p->joint_stereo) { |
951 | 130k | if ((res = joint_decode(q, p, q->decode_buffer_1, q->decode_buffer_2)) < 0) |
952 | 56.6k | return res; |
953 | 130k | } else { |
954 | 104k | if ((res = mono_decode(q, p, q->decode_buffer_1)) < 0) |
955 | 76.4k | return res; |
956 | | |
957 | 27.9k | if (p->num_channels == 2) { |
958 | 15.8k | decode_bytes_and_gain(q, p, inbuffer + sub_packet_size / 2, &p->gains2); |
959 | 15.8k | if ((res = mono_decode(q, p, q->decode_buffer_2)) < 0) |
960 | 327 | return res; |
961 | 15.8k | } |
962 | 27.9k | } |
963 | | |
964 | 101k | mlt_compensate_output(q, q->decode_buffer_1, &p->gains1, |
965 | 101k | p->mono_previous_buffer1, |
966 | 101k | outbuffer ? outbuffer[p->ch_idx] : NULL); |
967 | | |
968 | 101k | if (p->num_channels == 2) { |
969 | 89.3k | if (p->joint_stereo) |
970 | 73.8k | mlt_compensate_output(q, q->decode_buffer_2, &p->gains1, |
971 | 73.8k | p->mono_previous_buffer2, |
972 | 73.8k | outbuffer ? outbuffer[p->ch_idx + 1] : NULL); |
973 | 15.5k | else |
974 | 15.5k | mlt_compensate_output(q, q->decode_buffer_2, &p->gains2, |
975 | 15.5k | p->mono_previous_buffer2, |
976 | 15.5k | outbuffer ? outbuffer[p->ch_idx + 1] : NULL); |
977 | 89.3k | } |
978 | | |
979 | 101k | return 0; |
980 | 234k | } |
981 | | |
982 | | |
983 | | static int cook_decode_frame(AVCodecContext *avctx, AVFrame *frame, |
984 | | int *got_frame_ptr, AVPacket *avpkt) |
985 | 341k | { |
986 | 341k | const uint8_t *buf = avpkt->data; |
987 | 341k | int buf_size = avpkt->size; |
988 | 341k | COOKContext *q = avctx->priv_data; |
989 | 341k | float **samples = NULL; |
990 | 341k | int i, ret; |
991 | 341k | int offset = 0; |
992 | 341k | int chidx = 0; |
993 | | |
994 | 341k | if (buf_size < avctx->block_align) |
995 | 174k | return buf_size; |
996 | | |
997 | | /* get output buffer */ |
998 | 166k | if (q->discarded_packets >= 2) { |
999 | 131k | frame->nb_samples = q->samples_per_channel; |
1000 | 131k | if ((ret = ff_get_buffer(avctx, frame, 0)) < 0) |
1001 | 573 | return ret; |
1002 | 131k | samples = (float **)frame->extended_data; |
1003 | 131k | } |
1004 | | |
1005 | | /* estimate subpacket sizes */ |
1006 | 165k | q->subpacket[0].size = avctx->block_align; |
1007 | | |
1008 | 236k | for (i = 1; i < q->num_subpackets; i++) { |
1009 | 72.7k | q->subpacket[i].size = 2 * buf[avctx->block_align - q->num_subpackets + i]; |
1010 | 72.7k | q->subpacket[0].size -= q->subpacket[i].size + 1; |
1011 | 72.7k | if (q->subpacket[0].size < 0) { |
1012 | 1.62k | av_log(avctx, AV_LOG_DEBUG, |
1013 | 1.62k | "frame subpacket size total > avctx->block_align!\n"); |
1014 | 1.62k | return AVERROR_INVALIDDATA; |
1015 | 1.62k | } |
1016 | 72.7k | } |
1017 | | |
1018 | | /* decode supbackets */ |
1019 | 265k | for (i = 0; i < q->num_subpackets; i++) { |
1020 | 234k | q->subpacket[i].bits_per_subpacket = (q->subpacket[i].size * 8) >> |
1021 | 234k | q->subpacket[i].bits_per_subpdiv; |
1022 | 234k | q->subpacket[i].ch_idx = chidx; |
1023 | 234k | av_log(avctx, AV_LOG_DEBUG, |
1024 | 234k | "subpacket[%i] size %i js %i %i block_align %i\n", |
1025 | 234k | i, q->subpacket[i].size, q->subpacket[i].joint_stereo, offset, |
1026 | 234k | avctx->block_align); |
1027 | | |
1028 | 234k | if ((ret = decode_subpacket(q, &q->subpacket[i], buf + offset, samples)) < 0) |
1029 | 133k | return ret; |
1030 | 101k | offset += q->subpacket[i].size; |
1031 | 101k | chidx += q->subpacket[i].num_channels; |
1032 | 101k | av_log(avctx, AV_LOG_DEBUG, "subpacket[%i] %i %i\n", |
1033 | 101k | i, q->subpacket[i].size * 8, get_bits_count(&q->gb)); |
1034 | 101k | } |
1035 | | |
1036 | | /* Discard the first two frames: no valid audio. */ |
1037 | 30.6k | if (q->discarded_packets < 2) { |
1038 | 964 | q->discarded_packets++; |
1039 | 964 | *got_frame_ptr = 0; |
1040 | 964 | return avctx->block_align; |
1041 | 964 | } |
1042 | | |
1043 | 29.7k | *got_frame_ptr = 1; |
1044 | | |
1045 | 29.7k | return avctx->block_align; |
1046 | 30.6k | } |
1047 | | |
1048 | | static void dump_cook_context(COOKContext *q) |
1049 | 767 | { |
1050 | | //int i=0; |
1051 | 7.85k | #define PRINT(a, b) ff_dlog(q->avctx, " %s = %d\n", a, b); |
1052 | 767 | ff_dlog(q->avctx, "COOKextradata\n"); |
1053 | 767 | ff_dlog(q->avctx, "cookversion=%x\n", q->subpacket[0].cookversion); |
1054 | 767 | if (q->subpacket[0].cookversion > STEREO) { |
1055 | 476 | PRINT("js_subband_start", q->subpacket[0].js_subband_start); |
1056 | 476 | PRINT("js_vlc_bits", q->subpacket[0].js_vlc_bits); |
1057 | 476 | } |
1058 | 767 | ff_dlog(q->avctx, "COOKContext\n"); |
1059 | 767 | PRINT("nb_channels", q->avctx->ch_layout.nb_channels); |
1060 | 767 | PRINT("bit_rate", (int)q->avctx->bit_rate); |
1061 | 767 | PRINT("sample_rate", q->avctx->sample_rate); |
1062 | 767 | PRINT("samples_per_channel", q->subpacket[0].samples_per_channel); |
1063 | 767 | PRINT("subbands", q->subpacket[0].subbands); |
1064 | 767 | PRINT("js_subband_start", q->subpacket[0].js_subband_start); |
1065 | 767 | PRINT("log2_numvector_size", q->subpacket[0].log2_numvector_size); |
1066 | 767 | PRINT("numvector_size", q->subpacket[0].numvector_size); |
1067 | 767 | PRINT("total_subbands", q->subpacket[0].total_subbands); |
1068 | 767 | } |
1069 | | |
1070 | | /** |
1071 | | * Cook initialization |
1072 | | * |
1073 | | * @param avctx pointer to the AVCodecContext |
1074 | | */ |
1075 | | static av_cold int cook_decode_init(AVCodecContext *avctx) |
1076 | 1.15k | { |
1077 | 1.15k | static AVOnce init_static_once = AV_ONCE_INIT; |
1078 | 1.15k | COOKContext *q = avctx->priv_data; |
1079 | 1.15k | GetByteContext gb; |
1080 | 1.15k | int s = 0; |
1081 | 1.15k | unsigned int channel_mask = 0; |
1082 | 1.15k | int samples_per_frame = 0; |
1083 | 1.15k | int ret; |
1084 | 1.15k | int channels = avctx->ch_layout.nb_channels; |
1085 | | |
1086 | 1.15k | q->avctx = avctx; |
1087 | | |
1088 | | /* Take care of the codec specific extradata. */ |
1089 | 1.15k | if (avctx->extradata_size < 8) { |
1090 | 121 | av_log(avctx, AV_LOG_ERROR, "Necessary extradata missing!\n"); |
1091 | 121 | return AVERROR_INVALIDDATA; |
1092 | 121 | } |
1093 | 1.03k | av_log(avctx, AV_LOG_DEBUG, "codecdata_length=%d\n", avctx->extradata_size); |
1094 | | |
1095 | 1.03k | bytestream2_init(&gb, avctx->extradata, avctx->extradata_size); |
1096 | | |
1097 | | /* Take data from the AVCodecContext (RM container). */ |
1098 | 1.03k | if (!channels) { |
1099 | 0 | av_log(avctx, AV_LOG_ERROR, "Invalid number of channels\n"); |
1100 | 0 | return AVERROR_INVALIDDATA; |
1101 | 0 | } |
1102 | | |
1103 | 1.03k | if (avctx->block_align >= INT_MAX / 8) |
1104 | 8 | return AVERROR(EINVAL); |
1105 | | |
1106 | | /* Initialize RNG. */ |
1107 | 1.02k | av_lfg_init(&q->random_state, 0); |
1108 | | |
1109 | 1.02k | ff_audiodsp_init(&q->adsp); |
1110 | | |
1111 | 2.08k | while (bytestream2_get_bytes_left(&gb)) { |
1112 | 1.28k | if (s >= FFMIN(MAX_SUBPACKETS, avctx->block_align)) { |
1113 | 4 | avpriv_request_sample(avctx, "subpackets > %d", FFMIN(MAX_SUBPACKETS, avctx->block_align)); |
1114 | 4 | return AVERROR_PATCHWELCOME; |
1115 | 4 | } |
1116 | | /* 8 for mono, 16 for stereo, ? for multichannel |
1117 | | Swap to right endianness so we don't need to care later on. */ |
1118 | 1.28k | q->subpacket[s].cookversion = bytestream2_get_be32(&gb); |
1119 | 1.28k | samples_per_frame = bytestream2_get_be16(&gb); |
1120 | 1.28k | q->subpacket[s].subbands = bytestream2_get_be16(&gb); |
1121 | 1.28k | bytestream2_get_be32(&gb); // Unknown unused |
1122 | 1.28k | q->subpacket[s].js_subband_start = bytestream2_get_be16(&gb); |
1123 | 1.28k | if (q->subpacket[s].js_subband_start >= 51) { |
1124 | 32 | av_log(avctx, AV_LOG_ERROR, "js_subband_start %d is too large\n", q->subpacket[s].js_subband_start); |
1125 | 32 | return AVERROR_INVALIDDATA; |
1126 | 32 | } |
1127 | 1.24k | q->subpacket[s].js_vlc_bits = bytestream2_get_be16(&gb); |
1128 | | |
1129 | | /* Initialize extradata related variables. */ |
1130 | 1.24k | q->subpacket[s].samples_per_channel = samples_per_frame / channels; |
1131 | 1.24k | q->subpacket[s].bits_per_subpacket = avctx->block_align * 8; |
1132 | | |
1133 | | /* Initialize default data states. */ |
1134 | 1.24k | q->subpacket[s].log2_numvector_size = 5; |
1135 | 1.24k | q->subpacket[s].total_subbands = q->subpacket[s].subbands; |
1136 | 1.24k | q->subpacket[s].num_channels = 1; |
1137 | | |
1138 | | /* Initialize version-dependent variables */ |
1139 | | |
1140 | 1.24k | av_log(avctx, AV_LOG_DEBUG, "subpacket[%i].cookversion=%x\n", s, |
1141 | 1.24k | q->subpacket[s].cookversion); |
1142 | 1.24k | q->subpacket[s].joint_stereo = 0; |
1143 | 1.24k | switch (q->subpacket[s].cookversion) { |
1144 | 7 | case MONO: |
1145 | 7 | if (channels != 1) { |
1146 | 2 | avpriv_request_sample(avctx, "Container channels != 1"); |
1147 | 2 | return AVERROR_PATCHWELCOME; |
1148 | 2 | } |
1149 | 5 | av_log(avctx, AV_LOG_DEBUG, "MONO\n"); |
1150 | 5 | break; |
1151 | 316 | case STEREO: |
1152 | 316 | if (channels != 1) { |
1153 | 199 | q->subpacket[s].bits_per_subpdiv = 1; |
1154 | 199 | q->subpacket[s].num_channels = 2; |
1155 | 199 | } |
1156 | 316 | av_log(avctx, AV_LOG_DEBUG, "STEREO\n"); |
1157 | 316 | break; |
1158 | 35 | case JOINT_STEREO: |
1159 | 35 | if (channels != 2) { |
1160 | 1 | avpriv_request_sample(avctx, "Container channels != 2"); |
1161 | 1 | return AVERROR_PATCHWELCOME; |
1162 | 1 | } |
1163 | 34 | av_log(avctx, AV_LOG_DEBUG, "JOINT_STEREO\n"); |
1164 | 34 | if (avctx->extradata_size >= 16) { |
1165 | 1 | q->subpacket[s].total_subbands = q->subpacket[s].subbands + |
1166 | 1 | q->subpacket[s].js_subband_start; |
1167 | 1 | q->subpacket[s].joint_stereo = 1; |
1168 | 1 | q->subpacket[s].num_channels = 2; |
1169 | 1 | } |
1170 | 34 | if (q->subpacket[s].samples_per_channel > 256) { |
1171 | 25 | q->subpacket[s].log2_numvector_size = 6; |
1172 | 25 | } |
1173 | 34 | if (q->subpacket[s].samples_per_channel > 512) { |
1174 | 9 | q->subpacket[s].log2_numvector_size = 7; |
1175 | 9 | } |
1176 | 34 | break; |
1177 | 767 | case MC_COOK: |
1178 | 767 | av_log(avctx, AV_LOG_DEBUG, "MULTI_CHANNEL\n"); |
1179 | 767 | channel_mask |= q->subpacket[s].channel_mask = bytestream2_get_be32(&gb); |
1180 | | |
1181 | 767 | if (av_popcount64(q->subpacket[s].channel_mask) > 1) { |
1182 | 357 | q->subpacket[s].total_subbands = q->subpacket[s].subbands + |
1183 | 357 | q->subpacket[s].js_subband_start; |
1184 | 357 | q->subpacket[s].joint_stereo = 1; |
1185 | 357 | q->subpacket[s].num_channels = 2; |
1186 | 357 | q->subpacket[s].samples_per_channel = samples_per_frame >> 1; |
1187 | | |
1188 | 357 | if (q->subpacket[s].samples_per_channel > 256) { |
1189 | 208 | q->subpacket[s].log2_numvector_size = 6; |
1190 | 208 | } |
1191 | 357 | if (q->subpacket[s].samples_per_channel > 512) { |
1192 | 27 | q->subpacket[s].log2_numvector_size = 7; |
1193 | 27 | } |
1194 | 357 | } else |
1195 | 410 | q->subpacket[s].samples_per_channel = samples_per_frame; |
1196 | | |
1197 | 767 | break; |
1198 | 123 | default: |
1199 | 123 | avpriv_request_sample(avctx, "Cook version %d", |
1200 | 123 | q->subpacket[s].cookversion); |
1201 | 123 | return AVERROR_PATCHWELCOME; |
1202 | 1.24k | } |
1203 | | |
1204 | 1.12k | if (s > 1 && q->subpacket[s].samples_per_channel != q->samples_per_channel) { |
1205 | 21 | av_log(avctx, AV_LOG_ERROR, "different number of samples per channel!\n"); |
1206 | 21 | return AVERROR_INVALIDDATA; |
1207 | 21 | } else |
1208 | 1.10k | q->samples_per_channel = q->subpacket[0].samples_per_channel; |
1209 | | |
1210 | | |
1211 | | /* Initialize variable relations */ |
1212 | 1.10k | q->subpacket[s].numvector_size = (1 << q->subpacket[s].log2_numvector_size); |
1213 | | |
1214 | | /* Try to catch some obviously faulty streams, otherwise it might be exploitable */ |
1215 | 1.10k | if (q->subpacket[s].total_subbands > 53) { |
1216 | 11 | avpriv_request_sample(avctx, "total_subbands > 53"); |
1217 | 11 | return AVERROR_PATCHWELCOME; |
1218 | 11 | } |
1219 | | |
1220 | 1.09k | if ((q->subpacket[s].js_vlc_bits > 6) || |
1221 | 1.07k | (q->subpacket[s].js_vlc_bits < 2 * q->subpacket[s].joint_stereo)) { |
1222 | 15 | av_log(avctx, AV_LOG_ERROR, "js_vlc_bits = %d, only >= %d and <= 6 allowed!\n", |
1223 | 15 | q->subpacket[s].js_vlc_bits, 2 * q->subpacket[s].joint_stereo); |
1224 | 15 | return AVERROR_INVALIDDATA; |
1225 | 15 | } |
1226 | | |
1227 | 1.07k | if (q->subpacket[s].subbands > 50) { |
1228 | 1 | avpriv_request_sample(avctx, "subbands > 50"); |
1229 | 1 | return AVERROR_PATCHWELCOME; |
1230 | 1 | } |
1231 | 1.07k | if (q->subpacket[s].subbands == 0) { |
1232 | 6 | avpriv_request_sample(avctx, "subbands = 0"); |
1233 | 6 | return AVERROR_PATCHWELCOME; |
1234 | 6 | } |
1235 | 1.06k | q->subpacket[s].gains1.now = q->subpacket[s].gain_1; |
1236 | 1.06k | q->subpacket[s].gains1.previous = q->subpacket[s].gain_2; |
1237 | 1.06k | q->subpacket[s].gains2.now = q->subpacket[s].gain_3; |
1238 | 1.06k | q->subpacket[s].gains2.previous = q->subpacket[s].gain_4; |
1239 | | |
1240 | 1.06k | if (q->num_subpackets + q->subpacket[s].num_channels > channels) { |
1241 | 3 | av_log(avctx, AV_LOG_ERROR, "Too many subpackets %d for channels %d\n", q->num_subpackets, channels); |
1242 | 3 | return AVERROR_INVALIDDATA; |
1243 | 3 | } |
1244 | | |
1245 | 1.06k | q->num_subpackets++; |
1246 | 1.06k | s++; |
1247 | 1.06k | } |
1248 | | |
1249 | | /* Try to catch some obviously faulty streams, otherwise it might be exploitable */ |
1250 | 804 | if (q->samples_per_channel != 256 && q->samples_per_channel != 512 && |
1251 | 211 | q->samples_per_channel != 1024) { |
1252 | 37 | avpriv_request_sample(avctx, "samples_per_channel = %d", |
1253 | 37 | q->samples_per_channel); |
1254 | 37 | return AVERROR_PATCHWELCOME; |
1255 | 37 | } |
1256 | | |
1257 | | /* Generate tables */ |
1258 | 767 | ff_thread_once(&init_static_once, init_pow2table); |
1259 | 767 | init_gain_table(q); |
1260 | 767 | init_cplscales_table(q); |
1261 | | |
1262 | 767 | if ((ret = init_cook_vlc_tables(q))) |
1263 | 0 | return ret; |
1264 | | |
1265 | | /* Pad the databuffer with: |
1266 | | DECODE_BYTES_PAD1 or DECODE_BYTES_PAD2 for decode_bytes(), |
1267 | | AV_INPUT_BUFFER_PADDING_SIZE, for the bitstreamreader. */ |
1268 | 767 | q->decoded_bytes_buffer = |
1269 | 767 | av_mallocz(avctx->block_align |
1270 | 767 | + DECODE_BYTES_PAD1(avctx->block_align) |
1271 | 767 | + AV_INPUT_BUFFER_PADDING_SIZE); |
1272 | 767 | if (!q->decoded_bytes_buffer) |
1273 | 0 | return AVERROR(ENOMEM); |
1274 | | |
1275 | | /* Initialize transform. */ |
1276 | 767 | if ((ret = init_cook_mlt(q))) |
1277 | 0 | return ret; |
1278 | | |
1279 | | /* Initialize COOK signal arithmetic handling */ |
1280 | 767 | if (1) { |
1281 | 767 | q->scalar_dequant = scalar_dequant_float; |
1282 | 767 | q->decouple = decouple_float; |
1283 | 767 | q->imlt_window = imlt_window_float; |
1284 | 767 | q->interpolate = interpolate_float; |
1285 | 767 | q->saturate_output = saturate_output_float; |
1286 | 767 | } |
1287 | | |
1288 | 767 | avctx->sample_fmt = AV_SAMPLE_FMT_FLTP; |
1289 | 767 | av_channel_layout_uninit(&avctx->ch_layout); |
1290 | 767 | if (channel_mask) |
1291 | 297 | av_channel_layout_from_mask(&avctx->ch_layout, channel_mask); |
1292 | 470 | else |
1293 | 470 | av_channel_layout_default(&avctx->ch_layout, channels); |
1294 | | |
1295 | | |
1296 | 767 | dump_cook_context(q); |
1297 | | |
1298 | 767 | return 0; |
1299 | 767 | } |
1300 | | |
1301 | | const FFCodec ff_cook_decoder = { |
1302 | | .p.name = "cook", |
1303 | | CODEC_LONG_NAME("Cook / Cooker / Gecko (RealAudio G2)"), |
1304 | | .p.type = AVMEDIA_TYPE_AUDIO, |
1305 | | .p.id = AV_CODEC_ID_COOK, |
1306 | | .priv_data_size = sizeof(COOKContext), |
1307 | | .init = cook_decode_init, |
1308 | | .close = cook_decode_close, |
1309 | | FF_CODEC_DECODE_CB(cook_decode_frame), |
1310 | | .p.capabilities = AV_CODEC_CAP_DR1, |
1311 | | .caps_internal = FF_CODEC_CAP_INIT_CLEANUP, |
1312 | | }; |