/proc/self/cwd/libfaad/filtbank.c
Line | Count | Source (jump to first uncovered line) |
1 | | /* |
2 | | ** FAAD2 - Freeware Advanced Audio (AAC) Decoder including SBR decoding |
3 | | ** Copyright (C) 2003-2005 M. Bakker, Nero AG, http://www.nero.com |
4 | | ** |
5 | | ** This program is free software; you can redistribute it and/or modify |
6 | | ** it under the terms of the GNU General Public License as published by |
7 | | ** the Free Software Foundation; either version 2 of the License, or |
8 | | ** (at your option) any later version. |
9 | | ** |
10 | | ** This program is distributed in the hope that it will be useful, |
11 | | ** but WITHOUT ANY WARRANTY; without even the implied warranty of |
12 | | ** MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the |
13 | | ** GNU General Public License for more details. |
14 | | ** |
15 | | ** You should have received a copy of the GNU General Public License |
16 | | ** along with this program; if not, write to the Free Software |
17 | | ** Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. |
18 | | ** |
19 | | ** Any non-GPL usage of this software or parts of this software is strictly |
20 | | ** forbidden. |
21 | | ** |
22 | | ** The "appropriate copyright message" mentioned in section 2c of the GPLv2 |
23 | | ** must read: "Code from FAAD2 is copyright (c) Nero AG, www.nero.com" |
24 | | ** |
25 | | ** Commercial non-GPL licensing of this software is possible. |
26 | | ** For more info contact Nero AG through Mpeg4AAClicense@nero.com. |
27 | | ** |
28 | | ** $Id: filtbank.c,v 1.46 2009/01/26 23:51:15 menno Exp $ |
29 | | **/ |
30 | | |
31 | | #include "common.h" |
32 | | #include "structs.h" |
33 | | |
34 | | #include <stdlib.h> |
35 | | #ifdef _WIN32_WCE |
36 | | #define assert(x) |
37 | | #else |
38 | | #include <assert.h> |
39 | | #endif |
40 | | |
41 | | #include "filtbank.h" |
42 | | #include "syntax.h" |
43 | | #include "kbd_win.h" |
44 | | #include "sine_win.h" |
45 | | #include "mdct.h" |
46 | | |
47 | | |
48 | | fb_info *filter_bank_init(uint16_t frame_len) |
49 | 6.80k | { |
50 | 6.80k | uint16_t nshort = frame_len/8; |
51 | 6.80k | #ifdef LD_DEC |
52 | 6.80k | uint16_t frame_len_ld = frame_len/2; |
53 | 6.80k | #endif |
54 | | |
55 | 6.80k | fb_info *fb = (fb_info*)faad_malloc(sizeof(fb_info)); |
56 | 6.80k | memset(fb, 0, sizeof(fb_info)); |
57 | | |
58 | | /* normal */ |
59 | 6.80k | fb->mdct256 = faad_mdct_init(2*nshort); |
60 | 6.80k | fb->mdct2048 = faad_mdct_init(2*frame_len); |
61 | 6.80k | #ifdef LD_DEC |
62 | | /* LD */ |
63 | 6.80k | fb->mdct1024 = faad_mdct_init(2*frame_len_ld); |
64 | 6.80k | #endif |
65 | | |
66 | 6.80k | #ifdef ALLOW_SMALL_FRAMELENGTH |
67 | 6.80k | if (frame_len == 1024) |
68 | 5.51k | { |
69 | 5.51k | #endif |
70 | 5.51k | fb->long_window[0] = sine_long_1024; |
71 | 5.51k | fb->short_window[0] = sine_short_128; |
72 | 5.51k | fb->long_window[1] = kbd_long_1024; |
73 | 5.51k | fb->short_window[1] = kbd_short_128; |
74 | 5.51k | #ifdef LD_DEC |
75 | 5.51k | fb->ld_window[0] = sine_mid_512; |
76 | 5.51k | fb->ld_window[1] = ld_mid_512; |
77 | 5.51k | #endif |
78 | 5.51k | #ifdef ALLOW_SMALL_FRAMELENGTH |
79 | 5.51k | } else /* (frame_len == 960) */ { |
80 | 1.29k | fb->long_window[0] = sine_long_960; |
81 | 1.29k | fb->short_window[0] = sine_short_120; |
82 | 1.29k | fb->long_window[1] = kbd_long_960; |
83 | 1.29k | fb->short_window[1] = kbd_short_120; |
84 | 1.29k | #ifdef LD_DEC |
85 | 1.29k | fb->ld_window[0] = sine_mid_480; |
86 | 1.29k | fb->ld_window[1] = ld_mid_480; |
87 | 1.29k | #endif |
88 | 1.29k | } |
89 | 6.80k | #endif |
90 | | |
91 | 6.80k | return fb; |
92 | 6.80k | } |
93 | | |
94 | | void filter_bank_end(fb_info *fb) |
95 | 6.96k | { |
96 | 6.96k | if (fb != NULL) |
97 | 6.80k | { |
98 | | #ifdef PROFILE |
99 | | printf("FB: %I64d cycles\n", fb->cycles); |
100 | | #endif |
101 | | |
102 | 6.80k | faad_mdct_end(fb->mdct256); |
103 | 6.80k | faad_mdct_end(fb->mdct2048); |
104 | 6.80k | #ifdef LD_DEC |
105 | 6.80k | faad_mdct_end(fb->mdct1024); |
106 | 6.80k | #endif |
107 | | |
108 | 6.80k | faad_free(fb); |
109 | 6.80k | } |
110 | 6.96k | } |
111 | | |
112 | | static INLINE void imdct_long(fb_info *fb, real_t *in_data, real_t *out_data, uint16_t len) |
113 | 182k | { |
114 | 182k | #ifdef LD_DEC |
115 | 182k | mdct_info *mdct = NULL; |
116 | | |
117 | 182k | switch (len) |
118 | 182k | { |
119 | 157k | case 2048: |
120 | 180k | case 1920: |
121 | 180k | mdct = fb->mdct2048; |
122 | 180k | break; |
123 | 695 | case 1024: |
124 | 1.70k | case 960: |
125 | 1.70k | mdct = fb->mdct1024; |
126 | 1.70k | break; |
127 | 182k | } |
128 | | |
129 | 182k | faad_imdct(mdct, in_data, out_data); |
130 | | #else |
131 | | (void)len; |
132 | | faad_imdct(fb->mdct2048, in_data, out_data); |
133 | | #endif |
134 | 182k | } |
135 | | |
136 | | |
137 | | #ifdef LTP_DEC |
138 | | static INLINE void mdct(fb_info *fb, real_t *in_data, real_t *out_data, uint16_t len) |
139 | 5.79k | { |
140 | 5.79k | mdct_info *mdct = NULL; |
141 | | |
142 | 5.79k | switch (len) |
143 | 5.79k | { |
144 | 2.52k | case 2048: |
145 | 5.67k | case 1920: |
146 | 5.67k | mdct = fb->mdct2048; |
147 | 5.67k | break; |
148 | 0 | case 256: |
149 | 0 | case 240: |
150 | 0 | mdct = fb->mdct256; |
151 | 0 | break; |
152 | 0 | #ifdef LD_DEC |
153 | 89 | case 1024: |
154 | 117 | case 960: |
155 | 117 | mdct = fb->mdct1024; |
156 | 117 | break; |
157 | 5.79k | #endif |
158 | 5.79k | } |
159 | | |
160 | 5.79k | faad_mdct(mdct, in_data, out_data); |
161 | 5.79k | } |
162 | | #endif |
163 | | |
164 | | void ifilter_bank(fb_info *fb, uint8_t window_sequence, uint8_t window_shape, |
165 | | uint8_t window_shape_prev, real_t *freq_in, |
166 | | real_t *time_out, real_t *overlap, |
167 | | uint8_t object_type, uint16_t frame_len) |
168 | 193k | { |
169 | 193k | int16_t i; |
170 | 193k | ALIGN real_t transf_buf[2*1024] = {0}; |
171 | | |
172 | 193k | const real_t *window_long = NULL; |
173 | 193k | const real_t *window_long_prev = NULL; |
174 | 193k | const real_t *window_short = NULL; |
175 | 193k | const real_t *window_short_prev = NULL; |
176 | | |
177 | 193k | uint16_t nlong = frame_len; |
178 | 193k | uint16_t nshort = frame_len/8; |
179 | 193k | uint16_t trans = nshort/2; |
180 | | |
181 | 193k | uint16_t nflat_ls = (nlong-nshort)/2; |
182 | | |
183 | | #ifdef PROFILE |
184 | | int64_t count = faad_get_ts(); |
185 | | #endif |
186 | | |
187 | | /* select windows of current frame and previous frame (Sine or KBD) */ |
188 | 193k | #ifdef LD_DEC |
189 | 193k | if (object_type == LD) |
190 | 1.70k | { |
191 | 1.70k | window_long = fb->ld_window[window_shape]; |
192 | 1.70k | window_long_prev = fb->ld_window[window_shape_prev]; |
193 | 191k | } else { |
194 | | #else |
195 | | (void)object_type; |
196 | | #endif |
197 | 191k | window_long = fb->long_window[window_shape]; |
198 | 191k | window_long_prev = fb->long_window[window_shape_prev]; |
199 | 191k | window_short = fb->short_window[window_shape]; |
200 | 191k | window_short_prev = fb->short_window[window_shape_prev]; |
201 | 191k | #ifdef LD_DEC |
202 | 191k | } |
203 | 193k | #endif |
204 | | |
205 | | #if 0 |
206 | | for (i = 0; i < 1024; i++) |
207 | | { |
208 | | printf("%d\n", freq_in[i]); |
209 | | } |
210 | | #endif |
211 | | |
212 | | #if 0 |
213 | | printf("%d %d\n", window_sequence, window_shape); |
214 | | #endif |
215 | | |
216 | 193k | switch (window_sequence) |
217 | 193k | { |
218 | 171k | case ONLY_LONG_SEQUENCE: |
219 | | /* perform iMDCT */ |
220 | 171k | imdct_long(fb, freq_in, transf_buf, 2*nlong); |
221 | | |
222 | | /* add second half output of previous frame to windowed output of current frame */ |
223 | 43.5M | for (i = 0; i < nlong; i+=4) |
224 | 43.3M | { |
225 | 43.3M | time_out[i] = overlap[i] + MUL_F(transf_buf[i],window_long_prev[i]); |
226 | 43.3M | time_out[i+1] = overlap[i+1] + MUL_F(transf_buf[i+1],window_long_prev[i+1]); |
227 | 43.3M | time_out[i+2] = overlap[i+2] + MUL_F(transf_buf[i+2],window_long_prev[i+2]); |
228 | 43.3M | time_out[i+3] = overlap[i+3] + MUL_F(transf_buf[i+3],window_long_prev[i+3]); |
229 | 43.3M | } |
230 | | |
231 | | /* window the second half and save as overlap for next frame */ |
232 | 43.5M | for (i = 0; i < nlong; i+=4) |
233 | 43.3M | { |
234 | 43.3M | overlap[i] = MUL_F(transf_buf[nlong+i],window_long[nlong-1-i]); |
235 | 43.3M | overlap[i+1] = MUL_F(transf_buf[nlong+i+1],window_long[nlong-2-i]); |
236 | 43.3M | overlap[i+2] = MUL_F(transf_buf[nlong+i+2],window_long[nlong-3-i]); |
237 | 43.3M | overlap[i+3] = MUL_F(transf_buf[nlong+i+3],window_long[nlong-4-i]); |
238 | 43.3M | } |
239 | 171k | break; |
240 | | |
241 | 6.93k | case LONG_START_SEQUENCE: |
242 | | /* perform iMDCT */ |
243 | 6.93k | imdct_long(fb, freq_in, transf_buf, 2*nlong); |
244 | | |
245 | | /* add second half output of previous frame to windowed output of current frame */ |
246 | 1.71M | for (i = 0; i < nlong; i+=4) |
247 | 1.71M | { |
248 | 1.71M | time_out[i] = overlap[i] + MUL_F(transf_buf[i],window_long_prev[i]); |
249 | 1.71M | time_out[i+1] = overlap[i+1] + MUL_F(transf_buf[i+1],window_long_prev[i+1]); |
250 | 1.71M | time_out[i+2] = overlap[i+2] + MUL_F(transf_buf[i+2],window_long_prev[i+2]); |
251 | 1.71M | time_out[i+3] = overlap[i+3] + MUL_F(transf_buf[i+3],window_long_prev[i+3]); |
252 | 1.71M | } |
253 | | |
254 | | /* window the second half and save as overlap for next frame */ |
255 | | /* construct second half window using padding with 1's and 0's */ |
256 | 3.00M | for (i = 0; i < nflat_ls; i++) |
257 | 2.99M | overlap[i] = transf_buf[nlong+i]; |
258 | 862k | for (i = 0; i < nshort; i++) |
259 | 855k | overlap[nflat_ls+i] = MUL_F(transf_buf[nlong+nflat_ls+i],window_short[nshort-i-1]); |
260 | 3.00M | for (i = 0; i < nflat_ls; i++) |
261 | 2.99M | overlap[nflat_ls+nshort+i] = 0; |
262 | 6.93k | break; |
263 | | |
264 | 11.1k | case EIGHT_SHORT_SEQUENCE: |
265 | | /* perform iMDCT for each short block */ |
266 | 11.1k | faad_imdct(fb->mdct256, freq_in+0*nshort, transf_buf+2*nshort*0); |
267 | 11.1k | faad_imdct(fb->mdct256, freq_in+1*nshort, transf_buf+2*nshort*1); |
268 | 11.1k | faad_imdct(fb->mdct256, freq_in+2*nshort, transf_buf+2*nshort*2); |
269 | 11.1k | faad_imdct(fb->mdct256, freq_in+3*nshort, transf_buf+2*nshort*3); |
270 | 11.1k | faad_imdct(fb->mdct256, freq_in+4*nshort, transf_buf+2*nshort*4); |
271 | 11.1k | faad_imdct(fb->mdct256, freq_in+5*nshort, transf_buf+2*nshort*5); |
272 | 11.1k | faad_imdct(fb->mdct256, freq_in+6*nshort, transf_buf+2*nshort*6); |
273 | 11.1k | faad_imdct(fb->mdct256, freq_in+7*nshort, transf_buf+2*nshort*7); |
274 | | |
275 | | /* add second half output of previous frame to windowed output of current frame */ |
276 | 4.92M | for (i = 0; i < nflat_ls; i++) |
277 | 4.91M | time_out[i] = overlap[i]; |
278 | 1.41M | for(i = 0; i < nshort; i++) |
279 | 1.40M | { |
280 | 1.40M | time_out[nflat_ls+ i] = overlap[nflat_ls+ i] + MUL_F(transf_buf[nshort*0+i],window_short_prev[i]); |
281 | 1.40M | time_out[nflat_ls+1*nshort+i] = overlap[nflat_ls+nshort*1+i] + MUL_F(transf_buf[nshort*1+i],window_short[nshort-1-i]) + MUL_F(transf_buf[nshort*2+i],window_short[i]); |
282 | 1.40M | time_out[nflat_ls+2*nshort+i] = overlap[nflat_ls+nshort*2+i] + MUL_F(transf_buf[nshort*3+i],window_short[nshort-1-i]) + MUL_F(transf_buf[nshort*4+i],window_short[i]); |
283 | 1.40M | time_out[nflat_ls+3*nshort+i] = overlap[nflat_ls+nshort*3+i] + MUL_F(transf_buf[nshort*5+i],window_short[nshort-1-i]) + MUL_F(transf_buf[nshort*6+i],window_short[i]); |
284 | 1.40M | if (i < trans) |
285 | 702k | time_out[nflat_ls+4*nshort+i] = overlap[nflat_ls+nshort*4+i] + MUL_F(transf_buf[nshort*7+i],window_short[nshort-1-i]) + MUL_F(transf_buf[nshort*8+i],window_short[i]); |
286 | 1.40M | } |
287 | | |
288 | | /* window the second half and save as overlap for next frame */ |
289 | 1.41M | for(i = 0; i < nshort; i++) |
290 | 1.40M | { |
291 | 1.40M | if (i >= trans) |
292 | 702k | overlap[nflat_ls+4*nshort+i-nlong] = MUL_F(transf_buf[nshort*7+i],window_short[nshort-1-i]) + MUL_F(transf_buf[nshort*8+i],window_short[i]); |
293 | 1.40M | overlap[nflat_ls+5*nshort+i-nlong] = MUL_F(transf_buf[nshort*9+i],window_short[nshort-1-i]) + MUL_F(transf_buf[nshort*10+i],window_short[i]); |
294 | 1.40M | overlap[nflat_ls+6*nshort+i-nlong] = MUL_F(transf_buf[nshort*11+i],window_short[nshort-1-i]) + MUL_F(transf_buf[nshort*12+i],window_short[i]); |
295 | 1.40M | overlap[nflat_ls+7*nshort+i-nlong] = MUL_F(transf_buf[nshort*13+i],window_short[nshort-1-i]) + MUL_F(transf_buf[nshort*14+i],window_short[i]); |
296 | 1.40M | overlap[nflat_ls+8*nshort+i-nlong] = MUL_F(transf_buf[nshort*15+i],window_short[nshort-1-i]); |
297 | 1.40M | } |
298 | 4.92M | for (i = 0; i < nflat_ls; i++) |
299 | 4.91M | overlap[nflat_ls+nshort+i] = 0; |
300 | 11.1k | break; |
301 | | |
302 | 4.04k | case LONG_STOP_SEQUENCE: |
303 | | /* perform iMDCT */ |
304 | 4.04k | imdct_long(fb, freq_in, transf_buf, 2*nlong); |
305 | | |
306 | | /* add second half output of previous frame to windowed output of current frame */ |
307 | | /* construct first half window using padding with 1's and 0's */ |
308 | 1.79M | for (i = 0; i < nflat_ls; i++) |
309 | 1.78M | time_out[i] = overlap[i]; |
310 | 514k | for (i = 0; i < nshort; i++) |
311 | 510k | time_out[nflat_ls+i] = overlap[nflat_ls+i] + MUL_F(transf_buf[nflat_ls+i],window_short_prev[i]); |
312 | 1.79M | for (i = 0; i < nflat_ls; i++) |
313 | 1.78M | time_out[nflat_ls+nshort+i] = overlap[nflat_ls+nshort+i] + transf_buf[nflat_ls+nshort+i]; |
314 | | |
315 | | /* window the second half and save as overlap for next frame */ |
316 | 4.08M | for (i = 0; i < nlong; i++) |
317 | 4.08M | overlap[i] = MUL_F(transf_buf[nlong+i],window_long[nlong-1-i]); |
318 | 4.04k | break; |
319 | 193k | } |
320 | | |
321 | | #if 0 |
322 | | for (i = 0; i < 1024; i++) |
323 | | { |
324 | | printf("%d\n", time_out[i]); |
325 | | //printf("0x%.8X\n", time_out[i]); |
326 | | } |
327 | | #endif |
328 | | |
329 | | |
330 | | #ifdef PROFILE |
331 | | count = faad_get_ts() - count; |
332 | | fb->cycles += count; |
333 | | #endif |
334 | 193k | } |
335 | | |
336 | | |
337 | | #ifdef LTP_DEC |
338 | | /* only works for LTP -> no overlapping, no short blocks */ |
339 | | void filter_bank_ltp(fb_info *fb, uint8_t window_sequence, uint8_t window_shape, |
340 | | uint8_t window_shape_prev, real_t *in_data, real_t *out_mdct, |
341 | | uint8_t object_type, uint16_t frame_len) |
342 | 5.79k | { |
343 | 5.79k | int16_t i; |
344 | 5.79k | ALIGN real_t windowed_buf[2*1024] = {0}; |
345 | | |
346 | 5.79k | const real_t *window_long = NULL; |
347 | 5.79k | const real_t *window_long_prev = NULL; |
348 | 5.79k | const real_t *window_short = NULL; |
349 | 5.79k | const real_t *window_short_prev = NULL; |
350 | | |
351 | 5.79k | uint16_t nlong = frame_len; |
352 | 5.79k | uint16_t nshort = frame_len/8; |
353 | 5.79k | uint16_t nflat_ls = (nlong-nshort)/2; |
354 | | |
355 | 5.79k | assert(window_sequence != EIGHT_SHORT_SEQUENCE); |
356 | | |
357 | 5.79k | #ifdef LD_DEC |
358 | 5.79k | if (object_type == LD) |
359 | 117 | { |
360 | 117 | window_long = fb->ld_window[window_shape]; |
361 | 117 | window_long_prev = fb->ld_window[window_shape_prev]; |
362 | 5.67k | } else { |
363 | 5.67k | #endif |
364 | 5.67k | window_long = fb->long_window[window_shape]; |
365 | 5.67k | window_long_prev = fb->long_window[window_shape_prev]; |
366 | 5.67k | window_short = fb->short_window[window_shape]; |
367 | 5.67k | window_short_prev = fb->short_window[window_shape_prev]; |
368 | 5.67k | #ifdef LD_DEC |
369 | 5.67k | } |
370 | 5.79k | #endif |
371 | | |
372 | 5.79k | switch(window_sequence) |
373 | 5.79k | { |
374 | 988 | case ONLY_LONG_SEQUENCE: |
375 | 939k | for (i = nlong-1; i >= 0; i--) |
376 | 938k | { |
377 | 938k | windowed_buf[i] = MUL_F(in_data[i], window_long_prev[i]); |
378 | 938k | windowed_buf[i+nlong] = MUL_F(in_data[i+nlong], window_long[nlong-1-i]); |
379 | 938k | } |
380 | 988 | mdct(fb, windowed_buf, out_mdct, 2*nlong); |
381 | 988 | break; |
382 | | |
383 | 4.13k | case LONG_START_SEQUENCE: |
384 | 4.08M | for (i = 0; i < nlong; i++) |
385 | 4.07M | windowed_buf[i] = MUL_F(in_data[i], window_long_prev[i]); |
386 | 1.78M | for (i = 0; i < nflat_ls; i++) |
387 | 1.78M | windowed_buf[i+nlong] = in_data[i+nlong]; |
388 | 513k | for (i = 0; i < nshort; i++) |
389 | 509k | windowed_buf[i+nlong+nflat_ls] = MUL_F(in_data[i+nlong+nflat_ls], window_short[nshort-1-i]); |
390 | 1.78M | for (i = 0; i < nflat_ls; i++) |
391 | 1.78M | windowed_buf[i+nlong+nflat_ls+nshort] = 0; |
392 | 4.13k | mdct(fb, windowed_buf, out_mdct, 2*nlong); |
393 | 4.13k | break; |
394 | | |
395 | 670 | case LONG_STOP_SEQUENCE: |
396 | 286k | for (i = 0; i < nflat_ls; i++) |
397 | 286k | windowed_buf[i] = 0; |
398 | 82.4k | for (i = 0; i < nshort; i++) |
399 | 81.7k | windowed_buf[i+nflat_ls] = MUL_F(in_data[i+nflat_ls], window_short_prev[i]); |
400 | 286k | for (i = 0; i < nflat_ls; i++) |
401 | 286k | windowed_buf[i+nflat_ls+nshort] = in_data[i+nflat_ls+nshort]; |
402 | 654k | for (i = 0; i < nlong; i++) |
403 | 654k | windowed_buf[i+nlong] = MUL_F(in_data[i+nlong], window_long[nlong-1-i]); |
404 | 670 | mdct(fb, windowed_buf, out_mdct, 2*nlong); |
405 | 670 | break; |
406 | 5.79k | } |
407 | 5.79k | } |
408 | | #endif |