Coverage Report

Created: 2025-07-18 06:36

/proc/self/cwd/libfaad/filtbank.c
Line
Count
Source (jump to first uncovered line)
1
/*
2
** FAAD2 - Freeware Advanced Audio (AAC) Decoder including SBR decoding
3
** Copyright (C) 2003-2005 M. Bakker, Nero AG, http://www.nero.com
4
**
5
** This program is free software; you can redistribute it and/or modify
6
** it under the terms of the GNU General Public License as published by
7
** the Free Software Foundation; either version 2 of the License, or
8
** (at your option) any later version.
9
**
10
** This program is distributed in the hope that it will be useful,
11
** but WITHOUT ANY WARRANTY; without even the implied warranty of
12
** MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
13
** GNU General Public License for more details.
14
**
15
** You should have received a copy of the GNU General Public License
16
** along with this program; if not, write to the Free Software
17
** Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
18
**
19
** Any non-GPL usage of this software or parts of this software is strictly
20
** forbidden.
21
**
22
** The "appropriate copyright message" mentioned in section 2c of the GPLv2
23
** must read: "Code from FAAD2 is copyright (c) Nero AG, www.nero.com"
24
**
25
** Commercial non-GPL licensing of this software is possible.
26
** For more info contact Nero AG through Mpeg4AAClicense@nero.com.
27
**
28
** $Id: filtbank.c,v 1.46 2009/01/26 23:51:15 menno Exp $
29
**/
30
31
#include "common.h"
32
#include "structs.h"
33
34
#include <stdlib.h>
35
#ifdef _WIN32_WCE
36
#define assert(x)
37
#else
38
#include <assert.h>
39
#endif
40
41
#include "filtbank.h"
42
#include "syntax.h"
43
#include "kbd_win.h"
44
#include "sine_win.h"
45
#include "mdct.h"
46
47
48
fb_info *filter_bank_init(uint16_t frame_len)
49
28.1k
{
50
28.1k
    uint16_t nshort = frame_len/8;
51
#ifdef LD_DEC
52
    uint16_t frame_len_ld = frame_len/2;
53
#endif
54
55
28.1k
    fb_info *fb = (fb_info*)faad_malloc(sizeof(fb_info));
56
28.1k
    memset(fb, 0, sizeof(fb_info));
57
58
    /* normal */
59
28.1k
    fb->mdct256 = faad_mdct_init(2*nshort);
60
28.1k
    fb->mdct2048 = faad_mdct_init(2*frame_len);
61
#ifdef LD_DEC
62
    /* LD */
63
    fb->mdct1024 = faad_mdct_init(2*frame_len_ld);
64
#endif
65
66
28.1k
#ifdef ALLOW_SMALL_FRAMELENGTH
67
28.1k
    if (frame_len == 1024)
68
22.2k
    {
69
22.2k
#endif
70
22.2k
        fb->long_window[0]  = sine_long_1024;
71
22.2k
        fb->short_window[0] = sine_short_128;
72
22.2k
        fb->long_window[1]  = kbd_long_1024;
73
22.2k
        fb->short_window[1] = kbd_short_128;
74
#ifdef LD_DEC
75
        fb->ld_window[0] = sine_mid_512;
76
        fb->ld_window[1] = ld_mid_512;
77
#endif
78
22.2k
#ifdef ALLOW_SMALL_FRAMELENGTH
79
22.2k
    } else /* (frame_len == 960) */ {
80
5.89k
        fb->long_window[0]  = sine_long_960;
81
5.89k
        fb->short_window[0] = sine_short_120;
82
5.89k
        fb->long_window[1]  = kbd_long_960;
83
5.89k
        fb->short_window[1] = kbd_short_120;
84
#ifdef LD_DEC
85
        fb->ld_window[0] = sine_mid_480;
86
        fb->ld_window[1] = ld_mid_480;
87
#endif
88
5.89k
    }
89
28.1k
#endif
90
91
28.1k
    return fb;
92
28.1k
}
93
94
void filter_bank_end(fb_info *fb)
95
28.7k
{
96
28.7k
    if (fb != NULL)
97
28.1k
    {
98
#ifdef PROFILE
99
        printf("FB:                 %I64d cycles\n", fb->cycles);
100
#endif
101
102
28.1k
        faad_mdct_end(fb->mdct256);
103
28.1k
        faad_mdct_end(fb->mdct2048);
104
#ifdef LD_DEC
105
        faad_mdct_end(fb->mdct1024);
106
#endif
107
108
28.1k
        faad_free(fb);
109
28.1k
    }
110
28.7k
}
111
112
static INLINE void imdct_long(fb_info *fb, real_t *in_data, real_t *out_data, uint16_t len)
113
166k
{
114
#ifdef LD_DEC
115
    mdct_info *mdct = NULL;
116
117
    switch (len)
118
    {
119
    case 2048:
120
    case 1920:
121
        mdct = fb->mdct2048;
122
        break;
123
    case 1024:
124
    case 960:
125
        mdct = fb->mdct1024;
126
        break;
127
    }
128
129
    faad_imdct(mdct, in_data, out_data);
130
#else
131
166k
    (void)len;
132
166k
    faad_imdct(fb->mdct2048, in_data, out_data);
133
166k
#endif
134
166k
}
135
136
137
#ifdef LTP_DEC
138
static INLINE void mdct(fb_info *fb, real_t *in_data, real_t *out_data, uint16_t len)
139
13.8k
{
140
13.8k
    mdct_info *mdct = NULL;
141
142
13.8k
    switch (len)
143
13.8k
    {
144
5.84k
    case 2048:
145
13.4k
    case 1920:
146
13.4k
        mdct = fb->mdct2048;
147
13.4k
        break;
148
0
    case 256:
149
0
    case 240:
150
0
        mdct = fb->mdct256;
151
0
        break;
152
0
#ifdef LD_DEC
153
287
    case 1024:
154
395
    case 960:
155
395
        mdct = fb->mdct1024;
156
395
        break;
157
13.8k
#endif
158
13.8k
    }
159
160
13.8k
    faad_mdct(mdct, in_data, out_data);
161
13.8k
}
162
#endif
163
164
void ifilter_bank(fb_info *fb, uint8_t window_sequence, uint8_t window_shape,
165
                  uint8_t window_shape_prev, real_t *freq_in,
166
                  real_t *time_out, real_t *overlap,
167
                  uint8_t object_type, uint16_t frame_len)
168
1.46M
{
169
1.46M
    int16_t i;
170
1.46M
    ALIGN real_t transf_buf[2*1024] = {0};
171
172
1.46M
    const real_t *window_long = NULL;
173
1.46M
    const real_t *window_long_prev = NULL;
174
1.46M
    const real_t *window_short = NULL;
175
1.46M
    const real_t *window_short_prev = NULL;
176
177
1.46M
    uint16_t nlong = frame_len;
178
1.46M
    uint16_t nshort = frame_len/8;
179
1.46M
    uint16_t trans = nshort/2;
180
181
1.46M
    uint16_t nflat_ls = (nlong-nshort)/2;
182
183
#ifdef PROFILE
184
    int64_t count = faad_get_ts();
185
#endif
186
187
    /* select windows of current frame and previous frame (Sine or KBD) */
188
#ifdef LD_DEC
189
1.06M
    if (object_type == LD)
190
8.77k
    {
191
8.77k
        window_long       = fb->ld_window[window_shape];
192
8.77k
        window_long_prev  = fb->ld_window[window_shape_prev];
193
1.05M
    } else {
194
#else
195
        (void)object_type;
196
#endif
197
1.05M
        window_long       = fb->long_window[window_shape];
198
1.05M
        window_long_prev  = fb->long_window[window_shape_prev];
199
1.05M
        window_short      = fb->short_window[window_shape];
200
1.05M
        window_short_prev = fb->short_window[window_shape_prev];
201
#ifdef LD_DEC
202
    }
203
#endif
204
205
#if 0
206
    for (i = 0; i < 1024; i++)
207
    {
208
        printf("%d\n", freq_in[i]);
209
    }
210
#endif
211
212
#if 0
213
    printf("%d %d\n", window_sequence, window_shape);
214
#endif
215
216
1.46M
    switch (window_sequence)
217
1.46M
    {
218
1.19M
    case ONLY_LONG_SEQUENCE:
219
        /* perform iMDCT */
220
1.19M
        imdct_long(fb, freq_in, transf_buf, 2*nlong);
221
222
        /* add second half output of previous frame to windowed output of current frame */
223
303M
        for (i = 0; i < nlong; i+=4)
224
301M
        {
225
301M
            time_out[i]   = overlap[i]   + MUL_F(transf_buf[i],window_long_prev[i]);
226
301M
            time_out[i+1] = overlap[i+1] + MUL_F(transf_buf[i+1],window_long_prev[i+1]);
227
301M
            time_out[i+2] = overlap[i+2] + MUL_F(transf_buf[i+2],window_long_prev[i+2]);
228
301M
            time_out[i+3] = overlap[i+3] + MUL_F(transf_buf[i+3],window_long_prev[i+3]);
229
301M
        }
230
231
        /* window the second half and save as overlap for next frame */
232
303M
        for (i = 0; i < nlong; i+=4)
233
301M
        {
234
301M
            overlap[i]   = MUL_F(transf_buf[nlong+i],window_long[nlong-1-i]);
235
301M
            overlap[i+1] = MUL_F(transf_buf[nlong+i+1],window_long[nlong-2-i]);
236
301M
            overlap[i+2] = MUL_F(transf_buf[nlong+i+2],window_long[nlong-3-i]);
237
301M
            overlap[i+3] = MUL_F(transf_buf[nlong+i+3],window_long[nlong-4-i]);
238
301M
        }
239
1.19M
        break;
240
241
79.1k
    case LONG_START_SEQUENCE:
242
        /* perform iMDCT */
243
79.1k
        imdct_long(fb, freq_in, transf_buf, 2*nlong);
244
245
        /* add second half output of previous frame to windowed output of current frame */
246
19.8M
        for (i = 0; i < nlong; i+=4)
247
19.7M
        {
248
19.7M
            time_out[i]   = overlap[i]   + MUL_F(transf_buf[i],window_long_prev[i]);
249
19.7M
            time_out[i+1] = overlap[i+1] + MUL_F(transf_buf[i+1],window_long_prev[i+1]);
250
19.7M
            time_out[i+2] = overlap[i+2] + MUL_F(transf_buf[i+2],window_long_prev[i+2]);
251
19.7M
            time_out[i+3] = overlap[i+3] + MUL_F(transf_buf[i+3],window_long_prev[i+3]);
252
19.7M
        }
253
254
        /* window the second half and save as overlap for next frame */
255
        /* construct second half window using padding with 1's and 0's */
256
34.5M
        for (i = 0; i < nflat_ls; i++)
257
34.5M
            overlap[i] = transf_buf[nlong+i];
258
9.94M
        for (i = 0; i < nshort; i++)
259
9.86M
            overlap[nflat_ls+i] = MUL_F(transf_buf[nlong+nflat_ls+i],window_short[nshort-i-1]);
260
34.5M
        for (i = 0; i < nflat_ls; i++)
261
34.5M
            overlap[nflat_ls+nshort+i] = 0;
262
79.1k
        break;
263
264
144k
    case EIGHT_SHORT_SEQUENCE:
265
        /* perform iMDCT for each short block */
266
144k
        faad_imdct(fb->mdct256, freq_in+0*nshort, transf_buf+2*nshort*0);
267
144k
        faad_imdct(fb->mdct256, freq_in+1*nshort, transf_buf+2*nshort*1);
268
144k
        faad_imdct(fb->mdct256, freq_in+2*nshort, transf_buf+2*nshort*2);
269
144k
        faad_imdct(fb->mdct256, freq_in+3*nshort, transf_buf+2*nshort*3);
270
144k
        faad_imdct(fb->mdct256, freq_in+4*nshort, transf_buf+2*nshort*4);
271
144k
        faad_imdct(fb->mdct256, freq_in+5*nshort, transf_buf+2*nshort*5);
272
144k
        faad_imdct(fb->mdct256, freq_in+6*nshort, transf_buf+2*nshort*6);
273
144k
        faad_imdct(fb->mdct256, freq_in+7*nshort, transf_buf+2*nshort*7);
274
275
        /* add second half output of previous frame to windowed output of current frame */
276
64.2M
        for (i = 0; i < nflat_ls; i++)
277
64.0M
            time_out[i] = overlap[i];
278
18.4M
        for(i = 0; i < nshort; i++)
279
18.3M
        {
280
18.3M
            time_out[nflat_ls+         i] = overlap[nflat_ls+         i] + MUL_F(transf_buf[nshort*0+i],window_short_prev[i]);
281
18.3M
            time_out[nflat_ls+1*nshort+i] = overlap[nflat_ls+nshort*1+i] + MUL_F(transf_buf[nshort*1+i],window_short[nshort-1-i]) + MUL_F(transf_buf[nshort*2+i],window_short[i]);
282
18.3M
            time_out[nflat_ls+2*nshort+i] = overlap[nflat_ls+nshort*2+i] + MUL_F(transf_buf[nshort*3+i],window_short[nshort-1-i]) + MUL_F(transf_buf[nshort*4+i],window_short[i]);
283
18.3M
            time_out[nflat_ls+3*nshort+i] = overlap[nflat_ls+nshort*3+i] + MUL_F(transf_buf[nshort*5+i],window_short[nshort-1-i]) + MUL_F(transf_buf[nshort*6+i],window_short[i]);
284
18.3M
            if (i < trans)
285
9.15M
                time_out[nflat_ls+4*nshort+i] = overlap[nflat_ls+nshort*4+i] + MUL_F(transf_buf[nshort*7+i],window_short[nshort-1-i]) + MUL_F(transf_buf[nshort*8+i],window_short[i]);
286
18.3M
        }
287
288
        /* window the second half and save as overlap for next frame */
289
18.4M
        for(i = 0; i < nshort; i++)
290
18.3M
        {
291
18.3M
            if (i >= trans)
292
9.15M
                overlap[nflat_ls+4*nshort+i-nlong] = MUL_F(transf_buf[nshort*7+i],window_short[nshort-1-i]) + MUL_F(transf_buf[nshort*8+i],window_short[i]);
293
18.3M
            overlap[nflat_ls+5*nshort+i-nlong] = MUL_F(transf_buf[nshort*9+i],window_short[nshort-1-i]) + MUL_F(transf_buf[nshort*10+i],window_short[i]);
294
18.3M
            overlap[nflat_ls+6*nshort+i-nlong] = MUL_F(transf_buf[nshort*11+i],window_short[nshort-1-i]) + MUL_F(transf_buf[nshort*12+i],window_short[i]);
295
18.3M
            overlap[nflat_ls+7*nshort+i-nlong] = MUL_F(transf_buf[nshort*13+i],window_short[nshort-1-i]) + MUL_F(transf_buf[nshort*14+i],window_short[i]);
296
18.3M
            overlap[nflat_ls+8*nshort+i-nlong] = MUL_F(transf_buf[nshort*15+i],window_short[nshort-1-i]);
297
18.3M
        }
298
64.2M
        for (i = 0; i < nflat_ls; i++)
299
64.0M
            overlap[nflat_ls+nshort+i] = 0;
300
144k
        break;
301
302
43.2k
    case LONG_STOP_SEQUENCE:
303
        /* perform iMDCT */
304
43.2k
        imdct_long(fb, freq_in, transf_buf, 2*nlong);
305
306
        /* add second half output of previous frame to windowed output of current frame */
307
        /* construct first half window using padding with 1's and 0's */
308
19.1M
        for (i = 0; i < nflat_ls; i++)
309
19.0M
            time_out[i] = overlap[i];
310
5.49M
        for (i = 0; i < nshort; i++)
311
5.44M
            time_out[nflat_ls+i] = overlap[nflat_ls+i] + MUL_F(transf_buf[nflat_ls+i],window_short_prev[i]);
312
19.1M
        for (i = 0; i < nflat_ls; i++)
313
19.0M
            time_out[nflat_ls+nshort+i] = overlap[nflat_ls+nshort+i] + transf_buf[nflat_ls+nshort+i];
314
315
        /* window the second half and save as overlap for next frame */
316
43.6M
        for (i = 0; i < nlong; i++)
317
43.5M
            overlap[i] = MUL_F(transf_buf[nlong+i],window_long[nlong-1-i]);
318
43.2k
    break;
319
1.46M
    }
320
321
#if 0
322
    for (i = 0; i < 1024; i++)
323
    {
324
        printf("%d\n", time_out[i]);
325
        //printf("0x%.8X\n", time_out[i]);
326
    }
327
#endif
328
329
330
#ifdef PROFILE
331
    count = faad_get_ts() - count;
332
    fb->cycles += count;
333
#endif
334
1.46M
}
ifilter_bank
Line
Count
Source
168
196k
{
169
196k
    int16_t i;
170
196k
    ALIGN real_t transf_buf[2*1024] = {0};
171
172
196k
    const real_t *window_long = NULL;
173
196k
    const real_t *window_long_prev = NULL;
174
196k
    const real_t *window_short = NULL;
175
196k
    const real_t *window_short_prev = NULL;
176
177
196k
    uint16_t nlong = frame_len;
178
196k
    uint16_t nshort = frame_len/8;
179
196k
    uint16_t trans = nshort/2;
180
181
196k
    uint16_t nflat_ls = (nlong-nshort)/2;
182
183
#ifdef PROFILE
184
    int64_t count = faad_get_ts();
185
#endif
186
187
    /* select windows of current frame and previous frame (Sine or KBD) */
188
#ifdef LD_DEC
189
    if (object_type == LD)
190
    {
191
        window_long       = fb->ld_window[window_shape];
192
        window_long_prev  = fb->ld_window[window_shape_prev];
193
    } else {
194
#else
195
196k
        (void)object_type;
196
196k
#endif
197
196k
        window_long       = fb->long_window[window_shape];
198
196k
        window_long_prev  = fb->long_window[window_shape_prev];
199
196k
        window_short      = fb->short_window[window_shape];
200
196k
        window_short_prev = fb->short_window[window_shape_prev];
201
#ifdef LD_DEC
202
    }
203
#endif
204
205
#if 0
206
    for (i = 0; i < 1024; i++)
207
    {
208
        printf("%d\n", freq_in[i]);
209
    }
210
#endif
211
212
#if 0
213
    printf("%d %d\n", window_sequence, window_shape);
214
#endif
215
216
196k
    switch (window_sequence)
217
196k
    {
218
146k
    case ONLY_LONG_SEQUENCE:
219
        /* perform iMDCT */
220
146k
        imdct_long(fb, freq_in, transf_buf, 2*nlong);
221
222
        /* add second half output of previous frame to windowed output of current frame */
223
37.3M
        for (i = 0; i < nlong; i+=4)
224
37.1M
        {
225
37.1M
            time_out[i]   = overlap[i]   + MUL_F(transf_buf[i],window_long_prev[i]);
226
37.1M
            time_out[i+1] = overlap[i+1] + MUL_F(transf_buf[i+1],window_long_prev[i+1]);
227
37.1M
            time_out[i+2] = overlap[i+2] + MUL_F(transf_buf[i+2],window_long_prev[i+2]);
228
37.1M
            time_out[i+3] = overlap[i+3] + MUL_F(transf_buf[i+3],window_long_prev[i+3]);
229
37.1M
        }
230
231
        /* window the second half and save as overlap for next frame */
232
37.3M
        for (i = 0; i < nlong; i+=4)
233
37.1M
        {
234
37.1M
            overlap[i]   = MUL_F(transf_buf[nlong+i],window_long[nlong-1-i]);
235
37.1M
            overlap[i+1] = MUL_F(transf_buf[nlong+i+1],window_long[nlong-2-i]);
236
37.1M
            overlap[i+2] = MUL_F(transf_buf[nlong+i+2],window_long[nlong-3-i]);
237
37.1M
            overlap[i+3] = MUL_F(transf_buf[nlong+i+3],window_long[nlong-4-i]);
238
37.1M
        }
239
146k
        break;
240
241
10.8k
    case LONG_START_SEQUENCE:
242
        /* perform iMDCT */
243
10.8k
        imdct_long(fb, freq_in, transf_buf, 2*nlong);
244
245
        /* add second half output of previous frame to windowed output of current frame */
246
2.70M
        for (i = 0; i < nlong; i+=4)
247
2.69M
        {
248
2.69M
            time_out[i]   = overlap[i]   + MUL_F(transf_buf[i],window_long_prev[i]);
249
2.69M
            time_out[i+1] = overlap[i+1] + MUL_F(transf_buf[i+1],window_long_prev[i+1]);
250
2.69M
            time_out[i+2] = overlap[i+2] + MUL_F(transf_buf[i+2],window_long_prev[i+2]);
251
2.69M
            time_out[i+3] = overlap[i+3] + MUL_F(transf_buf[i+3],window_long_prev[i+3]);
252
2.69M
        }
253
254
        /* window the second half and save as overlap for next frame */
255
        /* construct second half window using padding with 1's and 0's */
256
4.72M
        for (i = 0; i < nflat_ls; i++)
257
4.71M
            overlap[i] = transf_buf[nlong+i];
258
1.35M
        for (i = 0; i < nshort; i++)
259
1.34M
            overlap[nflat_ls+i] = MUL_F(transf_buf[nlong+nflat_ls+i],window_short[nshort-i-1]);
260
4.72M
        for (i = 0; i < nflat_ls; i++)
261
4.71M
            overlap[nflat_ls+nshort+i] = 0;
262
10.8k
        break;
263
264
29.3k
    case EIGHT_SHORT_SEQUENCE:
265
        /* perform iMDCT for each short block */
266
29.3k
        faad_imdct(fb->mdct256, freq_in+0*nshort, transf_buf+2*nshort*0);
267
29.3k
        faad_imdct(fb->mdct256, freq_in+1*nshort, transf_buf+2*nshort*1);
268
29.3k
        faad_imdct(fb->mdct256, freq_in+2*nshort, transf_buf+2*nshort*2);
269
29.3k
        faad_imdct(fb->mdct256, freq_in+3*nshort, transf_buf+2*nshort*3);
270
29.3k
        faad_imdct(fb->mdct256, freq_in+4*nshort, transf_buf+2*nshort*4);
271
29.3k
        faad_imdct(fb->mdct256, freq_in+5*nshort, transf_buf+2*nshort*5);
272
29.3k
        faad_imdct(fb->mdct256, freq_in+6*nshort, transf_buf+2*nshort*6);
273
29.3k
        faad_imdct(fb->mdct256, freq_in+7*nshort, transf_buf+2*nshort*7);
274
275
        /* add second half output of previous frame to windowed output of current frame */
276
13.0M
        for (i = 0; i < nflat_ls; i++)
277
12.9M
            time_out[i] = overlap[i];
278
3.73M
        for(i = 0; i < nshort; i++)
279
3.70M
        {
280
3.70M
            time_out[nflat_ls+         i] = overlap[nflat_ls+         i] + MUL_F(transf_buf[nshort*0+i],window_short_prev[i]);
281
3.70M
            time_out[nflat_ls+1*nshort+i] = overlap[nflat_ls+nshort*1+i] + MUL_F(transf_buf[nshort*1+i],window_short[nshort-1-i]) + MUL_F(transf_buf[nshort*2+i],window_short[i]);
282
3.70M
            time_out[nflat_ls+2*nshort+i] = overlap[nflat_ls+nshort*2+i] + MUL_F(transf_buf[nshort*3+i],window_short[nshort-1-i]) + MUL_F(transf_buf[nshort*4+i],window_short[i]);
283
3.70M
            time_out[nflat_ls+3*nshort+i] = overlap[nflat_ls+nshort*3+i] + MUL_F(transf_buf[nshort*5+i],window_short[nshort-1-i]) + MUL_F(transf_buf[nshort*6+i],window_short[i]);
284
3.70M
            if (i < trans)
285
1.85M
                time_out[nflat_ls+4*nshort+i] = overlap[nflat_ls+nshort*4+i] + MUL_F(transf_buf[nshort*7+i],window_short[nshort-1-i]) + MUL_F(transf_buf[nshort*8+i],window_short[i]);
286
3.70M
        }
287
288
        /* window the second half and save as overlap for next frame */
289
3.73M
        for(i = 0; i < nshort; i++)
290
3.70M
        {
291
3.70M
            if (i >= trans)
292
1.85M
                overlap[nflat_ls+4*nshort+i-nlong] = MUL_F(transf_buf[nshort*7+i],window_short[nshort-1-i]) + MUL_F(transf_buf[nshort*8+i],window_short[i]);
293
3.70M
            overlap[nflat_ls+5*nshort+i-nlong] = MUL_F(transf_buf[nshort*9+i],window_short[nshort-1-i]) + MUL_F(transf_buf[nshort*10+i],window_short[i]);
294
3.70M
            overlap[nflat_ls+6*nshort+i-nlong] = MUL_F(transf_buf[nshort*11+i],window_short[nshort-1-i]) + MUL_F(transf_buf[nshort*12+i],window_short[i]);
295
3.70M
            overlap[nflat_ls+7*nshort+i-nlong] = MUL_F(transf_buf[nshort*13+i],window_short[nshort-1-i]) + MUL_F(transf_buf[nshort*14+i],window_short[i]);
296
3.70M
            overlap[nflat_ls+8*nshort+i-nlong] = MUL_F(transf_buf[nshort*15+i],window_short[nshort-1-i]);
297
3.70M
        }
298
13.0M
        for (i = 0; i < nflat_ls; i++)
299
12.9M
            overlap[nflat_ls+nshort+i] = 0;
300
29.3k
        break;
301
302
8.91k
    case LONG_STOP_SEQUENCE:
303
        /* perform iMDCT */
304
8.91k
        imdct_long(fb, freq_in, transf_buf, 2*nlong);
305
306
        /* add second half output of previous frame to windowed output of current frame */
307
        /* construct first half window using padding with 1's and 0's */
308
3.96M
        for (i = 0; i < nflat_ls; i++)
309
3.95M
            time_out[i] = overlap[i];
310
1.13M
        for (i = 0; i < nshort; i++)
311
1.13M
            time_out[nflat_ls+i] = overlap[nflat_ls+i] + MUL_F(transf_buf[nflat_ls+i],window_short_prev[i]);
312
3.96M
        for (i = 0; i < nflat_ls; i++)
313
3.95M
            time_out[nflat_ls+nshort+i] = overlap[nflat_ls+nshort+i] + transf_buf[nflat_ls+nshort+i];
314
315
        /* window the second half and save as overlap for next frame */
316
9.05M
        for (i = 0; i < nlong; i++)
317
9.04M
            overlap[i] = MUL_F(transf_buf[nlong+i],window_long[nlong-1-i]);
318
8.91k
    break;
319
196k
    }
320
321
#if 0
322
    for (i = 0; i < 1024; i++)
323
    {
324
        printf("%d\n", time_out[i]);
325
        //printf("0x%.8X\n", time_out[i]);
326
    }
327
#endif
328
329
330
#ifdef PROFILE
331
    count = faad_get_ts() - count;
332
    fb->cycles += count;
333
#endif
334
196k
}
ifilter_bank
Line
Count
Source
168
534k
{
169
534k
    int16_t i;
170
534k
    ALIGN real_t transf_buf[2*1024] = {0};
171
172
534k
    const real_t *window_long = NULL;
173
534k
    const real_t *window_long_prev = NULL;
174
534k
    const real_t *window_short = NULL;
175
534k
    const real_t *window_short_prev = NULL;
176
177
534k
    uint16_t nlong = frame_len;
178
534k
    uint16_t nshort = frame_len/8;
179
534k
    uint16_t trans = nshort/2;
180
181
534k
    uint16_t nflat_ls = (nlong-nshort)/2;
182
183
#ifdef PROFILE
184
    int64_t count = faad_get_ts();
185
#endif
186
187
    /* select windows of current frame and previous frame (Sine or KBD) */
188
534k
#ifdef LD_DEC
189
534k
    if (object_type == LD)
190
4.38k
    {
191
4.38k
        window_long       = fb->ld_window[window_shape];
192
4.38k
        window_long_prev  = fb->ld_window[window_shape_prev];
193
529k
    } else {
194
#else
195
        (void)object_type;
196
#endif
197
529k
        window_long       = fb->long_window[window_shape];
198
529k
        window_long_prev  = fb->long_window[window_shape_prev];
199
529k
        window_short      = fb->short_window[window_shape];
200
529k
        window_short_prev = fb->short_window[window_shape_prev];
201
529k
#ifdef LD_DEC
202
529k
    }
203
534k
#endif
204
205
#if 0
206
    for (i = 0; i < 1024; i++)
207
    {
208
        printf("%d\n", freq_in[i]);
209
    }
210
#endif
211
212
#if 0
213
    printf("%d %d\n", window_sequence, window_shape);
214
#endif
215
216
534k
    switch (window_sequence)
217
534k
    {
218
449k
    case ONLY_LONG_SEQUENCE:
219
        /* perform iMDCT */
220
449k
        imdct_long(fb, freq_in, transf_buf, 2*nlong);
221
222
        /* add second half output of previous frame to windowed output of current frame */
223
114M
        for (i = 0; i < nlong; i+=4)
224
113M
        {
225
113M
            time_out[i]   = overlap[i]   + MUL_F(transf_buf[i],window_long_prev[i]);
226
113M
            time_out[i+1] = overlap[i+1] + MUL_F(transf_buf[i+1],window_long_prev[i+1]);
227
113M
            time_out[i+2] = overlap[i+2] + MUL_F(transf_buf[i+2],window_long_prev[i+2]);
228
113M
            time_out[i+3] = overlap[i+3] + MUL_F(transf_buf[i+3],window_long_prev[i+3]);
229
113M
        }
230
231
        /* window the second half and save as overlap for next frame */
232
114M
        for (i = 0; i < nlong; i+=4)
233
113M
        {
234
113M
            overlap[i]   = MUL_F(transf_buf[nlong+i],window_long[nlong-1-i]);
235
113M
            overlap[i+1] = MUL_F(transf_buf[nlong+i+1],window_long[nlong-2-i]);
236
113M
            overlap[i+2] = MUL_F(transf_buf[nlong+i+2],window_long[nlong-3-i]);
237
113M
            overlap[i+3] = MUL_F(transf_buf[nlong+i+3],window_long[nlong-4-i]);
238
113M
        }
239
449k
        break;
240
241
28.7k
    case LONG_START_SEQUENCE:
242
        /* perform iMDCT */
243
28.7k
        imdct_long(fb, freq_in, transf_buf, 2*nlong);
244
245
        /* add second half output of previous frame to windowed output of current frame */
246
7.19M
        for (i = 0; i < nlong; i+=4)
247
7.17M
        {
248
7.17M
            time_out[i]   = overlap[i]   + MUL_F(transf_buf[i],window_long_prev[i]);
249
7.17M
            time_out[i+1] = overlap[i+1] + MUL_F(transf_buf[i+1],window_long_prev[i+1]);
250
7.17M
            time_out[i+2] = overlap[i+2] + MUL_F(transf_buf[i+2],window_long_prev[i+2]);
251
7.17M
            time_out[i+3] = overlap[i+3] + MUL_F(transf_buf[i+3],window_long_prev[i+3]);
252
7.17M
        }
253
254
        /* window the second half and save as overlap for next frame */
255
        /* construct second half window using padding with 1's and 0's */
256
12.5M
        for (i = 0; i < nflat_ls; i++)
257
12.5M
            overlap[i] = transf_buf[nlong+i];
258
3.61M
        for (i = 0; i < nshort; i++)
259
3.58M
            overlap[nflat_ls+i] = MUL_F(transf_buf[nlong+nflat_ls+i],window_short[nshort-i-1]);
260
12.5M
        for (i = 0; i < nflat_ls; i++)
261
12.5M
            overlap[nflat_ls+nshort+i] = 0;
262
28.7k
        break;
263
264
43.0k
    case EIGHT_SHORT_SEQUENCE:
265
        /* perform iMDCT for each short block */
266
43.0k
        faad_imdct(fb->mdct256, freq_in+0*nshort, transf_buf+2*nshort*0);
267
43.0k
        faad_imdct(fb->mdct256, freq_in+1*nshort, transf_buf+2*nshort*1);
268
43.0k
        faad_imdct(fb->mdct256, freq_in+2*nshort, transf_buf+2*nshort*2);
269
43.0k
        faad_imdct(fb->mdct256, freq_in+3*nshort, transf_buf+2*nshort*3);
270
43.0k
        faad_imdct(fb->mdct256, freq_in+4*nshort, transf_buf+2*nshort*4);
271
43.0k
        faad_imdct(fb->mdct256, freq_in+5*nshort, transf_buf+2*nshort*5);
272
43.0k
        faad_imdct(fb->mdct256, freq_in+6*nshort, transf_buf+2*nshort*6);
273
43.0k
        faad_imdct(fb->mdct256, freq_in+7*nshort, transf_buf+2*nshort*7);
274
275
        /* add second half output of previous frame to windowed output of current frame */
276
19.1M
        for (i = 0; i < nflat_ls; i++)
277
19.0M
            time_out[i] = overlap[i];
278
5.49M
        for(i = 0; i < nshort; i++)
279
5.44M
        {
280
5.44M
            time_out[nflat_ls+         i] = overlap[nflat_ls+         i] + MUL_F(transf_buf[nshort*0+i],window_short_prev[i]);
281
5.44M
            time_out[nflat_ls+1*nshort+i] = overlap[nflat_ls+nshort*1+i] + MUL_F(transf_buf[nshort*1+i],window_short[nshort-1-i]) + MUL_F(transf_buf[nshort*2+i],window_short[i]);
282
5.44M
            time_out[nflat_ls+2*nshort+i] = overlap[nflat_ls+nshort*2+i] + MUL_F(transf_buf[nshort*3+i],window_short[nshort-1-i]) + MUL_F(transf_buf[nshort*4+i],window_short[i]);
283
5.44M
            time_out[nflat_ls+3*nshort+i] = overlap[nflat_ls+nshort*3+i] + MUL_F(transf_buf[nshort*5+i],window_short[nshort-1-i]) + MUL_F(transf_buf[nshort*6+i],window_short[i]);
284
5.44M
            if (i < trans)
285
2.72M
                time_out[nflat_ls+4*nshort+i] = overlap[nflat_ls+nshort*4+i] + MUL_F(transf_buf[nshort*7+i],window_short[nshort-1-i]) + MUL_F(transf_buf[nshort*8+i],window_short[i]);
286
5.44M
        }
287
288
        /* window the second half and save as overlap for next frame */
289
5.49M
        for(i = 0; i < nshort; i++)
290
5.44M
        {
291
5.44M
            if (i >= trans)
292
2.72M
                overlap[nflat_ls+4*nshort+i-nlong] = MUL_F(transf_buf[nshort*7+i],window_short[nshort-1-i]) + MUL_F(transf_buf[nshort*8+i],window_short[i]);
293
5.44M
            overlap[nflat_ls+5*nshort+i-nlong] = MUL_F(transf_buf[nshort*9+i],window_short[nshort-1-i]) + MUL_F(transf_buf[nshort*10+i],window_short[i]);
294
5.44M
            overlap[nflat_ls+6*nshort+i-nlong] = MUL_F(transf_buf[nshort*11+i],window_short[nshort-1-i]) + MUL_F(transf_buf[nshort*12+i],window_short[i]);
295
5.44M
            overlap[nflat_ls+7*nshort+i-nlong] = MUL_F(transf_buf[nshort*13+i],window_short[nshort-1-i]) + MUL_F(transf_buf[nshort*14+i],window_short[i]);
296
5.44M
            overlap[nflat_ls+8*nshort+i-nlong] = MUL_F(transf_buf[nshort*15+i],window_short[nshort-1-i]);
297
5.44M
        }
298
19.1M
        for (i = 0; i < nflat_ls; i++)
299
19.0M
            overlap[nflat_ls+nshort+i] = 0;
300
43.0k
        break;
301
302
12.6k
    case LONG_STOP_SEQUENCE:
303
        /* perform iMDCT */
304
12.6k
        imdct_long(fb, freq_in, transf_buf, 2*nlong);
305
306
        /* add second half output of previous frame to windowed output of current frame */
307
        /* construct first half window using padding with 1's and 0's */
308
5.59M
        for (i = 0; i < nflat_ls; i++)
309
5.58M
            time_out[i] = overlap[i];
310
1.60M
        for (i = 0; i < nshort; i++)
311
1.59M
            time_out[nflat_ls+i] = overlap[nflat_ls+i] + MUL_F(transf_buf[nflat_ls+i],window_short_prev[i]);
312
5.59M
        for (i = 0; i < nflat_ls; i++)
313
5.58M
            time_out[nflat_ls+nshort+i] = overlap[nflat_ls+nshort+i] + transf_buf[nflat_ls+nshort+i];
314
315
        /* window the second half and save as overlap for next frame */
316
12.7M
        for (i = 0; i < nlong; i++)
317
12.7M
            overlap[i] = MUL_F(transf_buf[nlong+i],window_long[nlong-1-i]);
318
12.6k
    break;
319
534k
    }
320
321
#if 0
322
    for (i = 0; i < 1024; i++)
323
    {
324
        printf("%d\n", time_out[i]);
325
        //printf("0x%.8X\n", time_out[i]);
326
    }
327
#endif
328
329
330
#ifdef PROFILE
331
    count = faad_get_ts() - count;
332
    fb->cycles += count;
333
#endif
334
534k
}
ifilter_bank
Line
Count
Source
168
534k
{
169
534k
    int16_t i;
170
534k
    ALIGN real_t transf_buf[2*1024] = {0};
171
172
534k
    const real_t *window_long = NULL;
173
534k
    const real_t *window_long_prev = NULL;
174
534k
    const real_t *window_short = NULL;
175
534k
    const real_t *window_short_prev = NULL;
176
177
534k
    uint16_t nlong = frame_len;
178
534k
    uint16_t nshort = frame_len/8;
179
534k
    uint16_t trans = nshort/2;
180
181
534k
    uint16_t nflat_ls = (nlong-nshort)/2;
182
183
#ifdef PROFILE
184
    int64_t count = faad_get_ts();
185
#endif
186
187
    /* select windows of current frame and previous frame (Sine or KBD) */
188
534k
#ifdef LD_DEC
189
534k
    if (object_type == LD)
190
4.38k
    {
191
4.38k
        window_long       = fb->ld_window[window_shape];
192
4.38k
        window_long_prev  = fb->ld_window[window_shape_prev];
193
529k
    } else {
194
#else
195
        (void)object_type;
196
#endif
197
529k
        window_long       = fb->long_window[window_shape];
198
529k
        window_long_prev  = fb->long_window[window_shape_prev];
199
529k
        window_short      = fb->short_window[window_shape];
200
529k
        window_short_prev = fb->short_window[window_shape_prev];
201
529k
#ifdef LD_DEC
202
529k
    }
203
534k
#endif
204
205
#if 0
206
    for (i = 0; i < 1024; i++)
207
    {
208
        printf("%d\n", freq_in[i]);
209
    }
210
#endif
211
212
#if 0
213
    printf("%d %d\n", window_sequence, window_shape);
214
#endif
215
216
534k
    switch (window_sequence)
217
534k
    {
218
449k
    case ONLY_LONG_SEQUENCE:
219
        /* perform iMDCT */
220
449k
        imdct_long(fb, freq_in, transf_buf, 2*nlong);
221
222
        /* add second half output of previous frame to windowed output of current frame */
223
114M
        for (i = 0; i < nlong; i+=4)
224
113M
        {
225
113M
            time_out[i]   = overlap[i]   + MUL_F(transf_buf[i],window_long_prev[i]);
226
113M
            time_out[i+1] = overlap[i+1] + MUL_F(transf_buf[i+1],window_long_prev[i+1]);
227
113M
            time_out[i+2] = overlap[i+2] + MUL_F(transf_buf[i+2],window_long_prev[i+2]);
228
113M
            time_out[i+3] = overlap[i+3] + MUL_F(transf_buf[i+3],window_long_prev[i+3]);
229
113M
        }
230
231
        /* window the second half and save as overlap for next frame */
232
114M
        for (i = 0; i < nlong; i+=4)
233
113M
        {
234
113M
            overlap[i]   = MUL_F(transf_buf[nlong+i],window_long[nlong-1-i]);
235
113M
            overlap[i+1] = MUL_F(transf_buf[nlong+i+1],window_long[nlong-2-i]);
236
113M
            overlap[i+2] = MUL_F(transf_buf[nlong+i+2],window_long[nlong-3-i]);
237
113M
            overlap[i+3] = MUL_F(transf_buf[nlong+i+3],window_long[nlong-4-i]);
238
113M
        }
239
449k
        break;
240
241
28.7k
    case LONG_START_SEQUENCE:
242
        /* perform iMDCT */
243
28.7k
        imdct_long(fb, freq_in, transf_buf, 2*nlong);
244
245
        /* add second half output of previous frame to windowed output of current frame */
246
7.19M
        for (i = 0; i < nlong; i+=4)
247
7.17M
        {
248
7.17M
            time_out[i]   = overlap[i]   + MUL_F(transf_buf[i],window_long_prev[i]);
249
7.17M
            time_out[i+1] = overlap[i+1] + MUL_F(transf_buf[i+1],window_long_prev[i+1]);
250
7.17M
            time_out[i+2] = overlap[i+2] + MUL_F(transf_buf[i+2],window_long_prev[i+2]);
251
7.17M
            time_out[i+3] = overlap[i+3] + MUL_F(transf_buf[i+3],window_long_prev[i+3]);
252
7.17M
        }
253
254
        /* window the second half and save as overlap for next frame */
255
        /* construct second half window using padding with 1's and 0's */
256
12.5M
        for (i = 0; i < nflat_ls; i++)
257
12.5M
            overlap[i] = transf_buf[nlong+i];
258
3.61M
        for (i = 0; i < nshort; i++)
259
3.58M
            overlap[nflat_ls+i] = MUL_F(transf_buf[nlong+nflat_ls+i],window_short[nshort-i-1]);
260
12.5M
        for (i = 0; i < nflat_ls; i++)
261
12.5M
            overlap[nflat_ls+nshort+i] = 0;
262
28.7k
        break;
263
264
43.0k
    case EIGHT_SHORT_SEQUENCE:
265
        /* perform iMDCT for each short block */
266
43.0k
        faad_imdct(fb->mdct256, freq_in+0*nshort, transf_buf+2*nshort*0);
267
43.0k
        faad_imdct(fb->mdct256, freq_in+1*nshort, transf_buf+2*nshort*1);
268
43.0k
        faad_imdct(fb->mdct256, freq_in+2*nshort, transf_buf+2*nshort*2);
269
43.0k
        faad_imdct(fb->mdct256, freq_in+3*nshort, transf_buf+2*nshort*3);
270
43.0k
        faad_imdct(fb->mdct256, freq_in+4*nshort, transf_buf+2*nshort*4);
271
43.0k
        faad_imdct(fb->mdct256, freq_in+5*nshort, transf_buf+2*nshort*5);
272
43.0k
        faad_imdct(fb->mdct256, freq_in+6*nshort, transf_buf+2*nshort*6);
273
43.0k
        faad_imdct(fb->mdct256, freq_in+7*nshort, transf_buf+2*nshort*7);
274
275
        /* add second half output of previous frame to windowed output of current frame */
276
19.1M
        for (i = 0; i < nflat_ls; i++)
277
19.0M
            time_out[i] = overlap[i];
278
5.49M
        for(i = 0; i < nshort; i++)
279
5.44M
        {
280
5.44M
            time_out[nflat_ls+         i] = overlap[nflat_ls+         i] + MUL_F(transf_buf[nshort*0+i],window_short_prev[i]);
281
5.44M
            time_out[nflat_ls+1*nshort+i] = overlap[nflat_ls+nshort*1+i] + MUL_F(transf_buf[nshort*1+i],window_short[nshort-1-i]) + MUL_F(transf_buf[nshort*2+i],window_short[i]);
282
5.44M
            time_out[nflat_ls+2*nshort+i] = overlap[nflat_ls+nshort*2+i] + MUL_F(transf_buf[nshort*3+i],window_short[nshort-1-i]) + MUL_F(transf_buf[nshort*4+i],window_short[i]);
283
5.44M
            time_out[nflat_ls+3*nshort+i] = overlap[nflat_ls+nshort*3+i] + MUL_F(transf_buf[nshort*5+i],window_short[nshort-1-i]) + MUL_F(transf_buf[nshort*6+i],window_short[i]);
284
5.44M
            if (i < trans)
285
2.72M
                time_out[nflat_ls+4*nshort+i] = overlap[nflat_ls+nshort*4+i] + MUL_F(transf_buf[nshort*7+i],window_short[nshort-1-i]) + MUL_F(transf_buf[nshort*8+i],window_short[i]);
286
5.44M
        }
287
288
        /* window the second half and save as overlap for next frame */
289
5.49M
        for(i = 0; i < nshort; i++)
290
5.44M
        {
291
5.44M
            if (i >= trans)
292
2.72M
                overlap[nflat_ls+4*nshort+i-nlong] = MUL_F(transf_buf[nshort*7+i],window_short[nshort-1-i]) + MUL_F(transf_buf[nshort*8+i],window_short[i]);
293
5.44M
            overlap[nflat_ls+5*nshort+i-nlong] = MUL_F(transf_buf[nshort*9+i],window_short[nshort-1-i]) + MUL_F(transf_buf[nshort*10+i],window_short[i]);
294
5.44M
            overlap[nflat_ls+6*nshort+i-nlong] = MUL_F(transf_buf[nshort*11+i],window_short[nshort-1-i]) + MUL_F(transf_buf[nshort*12+i],window_short[i]);
295
5.44M
            overlap[nflat_ls+7*nshort+i-nlong] = MUL_F(transf_buf[nshort*13+i],window_short[nshort-1-i]) + MUL_F(transf_buf[nshort*14+i],window_short[i]);
296
5.44M
            overlap[nflat_ls+8*nshort+i-nlong] = MUL_F(transf_buf[nshort*15+i],window_short[nshort-1-i]);
297
5.44M
        }
298
19.1M
        for (i = 0; i < nflat_ls; i++)
299
19.0M
            overlap[nflat_ls+nshort+i] = 0;
300
43.0k
        break;
301
302
12.6k
    case LONG_STOP_SEQUENCE:
303
        /* perform iMDCT */
304
12.6k
        imdct_long(fb, freq_in, transf_buf, 2*nlong);
305
306
        /* add second half output of previous frame to windowed output of current frame */
307
        /* construct first half window using padding with 1's and 0's */
308
5.59M
        for (i = 0; i < nflat_ls; i++)
309
5.58M
            time_out[i] = overlap[i];
310
1.60M
        for (i = 0; i < nshort; i++)
311
1.59M
            time_out[nflat_ls+i] = overlap[nflat_ls+i] + MUL_F(transf_buf[nflat_ls+i],window_short_prev[i]);
312
5.59M
        for (i = 0; i < nflat_ls; i++)
313
5.58M
            time_out[nflat_ls+nshort+i] = overlap[nflat_ls+nshort+i] + transf_buf[nflat_ls+nshort+i];
314
315
        /* window the second half and save as overlap for next frame */
316
12.7M
        for (i = 0; i < nlong; i++)
317
12.7M
            overlap[i] = MUL_F(transf_buf[nlong+i],window_long[nlong-1-i]);
318
12.6k
    break;
319
534k
    }
320
321
#if 0
322
    for (i = 0; i < 1024; i++)
323
    {
324
        printf("%d\n", time_out[i]);
325
        //printf("0x%.8X\n", time_out[i]);
326
    }
327
#endif
328
329
330
#ifdef PROFILE
331
    count = faad_get_ts() - count;
332
    fb->cycles += count;
333
#endif
334
534k
}
ifilter_bank
Line
Count
Source
168
196k
{
169
196k
    int16_t i;
170
196k
    ALIGN real_t transf_buf[2*1024] = {0};
171
172
196k
    const real_t *window_long = NULL;
173
196k
    const real_t *window_long_prev = NULL;
174
196k
    const real_t *window_short = NULL;
175
196k
    const real_t *window_short_prev = NULL;
176
177
196k
    uint16_t nlong = frame_len;
178
196k
    uint16_t nshort = frame_len/8;
179
196k
    uint16_t trans = nshort/2;
180
181
196k
    uint16_t nflat_ls = (nlong-nshort)/2;
182
183
#ifdef PROFILE
184
    int64_t count = faad_get_ts();
185
#endif
186
187
    /* select windows of current frame and previous frame (Sine or KBD) */
188
#ifdef LD_DEC
189
    if (object_type == LD)
190
    {
191
        window_long       = fb->ld_window[window_shape];
192
        window_long_prev  = fb->ld_window[window_shape_prev];
193
    } else {
194
#else
195
196k
        (void)object_type;
196
196k
#endif
197
196k
        window_long       = fb->long_window[window_shape];
198
196k
        window_long_prev  = fb->long_window[window_shape_prev];
199
196k
        window_short      = fb->short_window[window_shape];
200
196k
        window_short_prev = fb->short_window[window_shape_prev];
201
#ifdef LD_DEC
202
    }
203
#endif
204
205
#if 0
206
    for (i = 0; i < 1024; i++)
207
    {
208
        printf("%d\n", freq_in[i]);
209
    }
210
#endif
211
212
#if 0
213
    printf("%d %d\n", window_sequence, window_shape);
214
#endif
215
216
196k
    switch (window_sequence)
217
196k
    {
218
146k
    case ONLY_LONG_SEQUENCE:
219
        /* perform iMDCT */
220
146k
        imdct_long(fb, freq_in, transf_buf, 2*nlong);
221
222
        /* add second half output of previous frame to windowed output of current frame */
223
37.3M
        for (i = 0; i < nlong; i+=4)
224
37.1M
        {
225
37.1M
            time_out[i]   = overlap[i]   + MUL_F(transf_buf[i],window_long_prev[i]);
226
37.1M
            time_out[i+1] = overlap[i+1] + MUL_F(transf_buf[i+1],window_long_prev[i+1]);
227
37.1M
            time_out[i+2] = overlap[i+2] + MUL_F(transf_buf[i+2],window_long_prev[i+2]);
228
37.1M
            time_out[i+3] = overlap[i+3] + MUL_F(transf_buf[i+3],window_long_prev[i+3]);
229
37.1M
        }
230
231
        /* window the second half and save as overlap for next frame */
232
37.3M
        for (i = 0; i < nlong; i+=4)
233
37.1M
        {
234
37.1M
            overlap[i]   = MUL_F(transf_buf[nlong+i],window_long[nlong-1-i]);
235
37.1M
            overlap[i+1] = MUL_F(transf_buf[nlong+i+1],window_long[nlong-2-i]);
236
37.1M
            overlap[i+2] = MUL_F(transf_buf[nlong+i+2],window_long[nlong-3-i]);
237
37.1M
            overlap[i+3] = MUL_F(transf_buf[nlong+i+3],window_long[nlong-4-i]);
238
37.1M
        }
239
146k
        break;
240
241
10.8k
    case LONG_START_SEQUENCE:
242
        /* perform iMDCT */
243
10.8k
        imdct_long(fb, freq_in, transf_buf, 2*nlong);
244
245
        /* add second half output of previous frame to windowed output of current frame */
246
2.70M
        for (i = 0; i < nlong; i+=4)
247
2.69M
        {
248
2.69M
            time_out[i]   = overlap[i]   + MUL_F(transf_buf[i],window_long_prev[i]);
249
2.69M
            time_out[i+1] = overlap[i+1] + MUL_F(transf_buf[i+1],window_long_prev[i+1]);
250
2.69M
            time_out[i+2] = overlap[i+2] + MUL_F(transf_buf[i+2],window_long_prev[i+2]);
251
2.69M
            time_out[i+3] = overlap[i+3] + MUL_F(transf_buf[i+3],window_long_prev[i+3]);
252
2.69M
        }
253
254
        /* window the second half and save as overlap for next frame */
255
        /* construct second half window using padding with 1's and 0's */
256
4.72M
        for (i = 0; i < nflat_ls; i++)
257
4.71M
            overlap[i] = transf_buf[nlong+i];
258
1.35M
        for (i = 0; i < nshort; i++)
259
1.34M
            overlap[nflat_ls+i] = MUL_F(transf_buf[nlong+nflat_ls+i],window_short[nshort-i-1]);
260
4.72M
        for (i = 0; i < nflat_ls; i++)
261
4.71M
            overlap[nflat_ls+nshort+i] = 0;
262
10.8k
        break;
263
264
29.3k
    case EIGHT_SHORT_SEQUENCE:
265
        /* perform iMDCT for each short block */
266
29.3k
        faad_imdct(fb->mdct256, freq_in+0*nshort, transf_buf+2*nshort*0);
267
29.3k
        faad_imdct(fb->mdct256, freq_in+1*nshort, transf_buf+2*nshort*1);
268
29.3k
        faad_imdct(fb->mdct256, freq_in+2*nshort, transf_buf+2*nshort*2);
269
29.3k
        faad_imdct(fb->mdct256, freq_in+3*nshort, transf_buf+2*nshort*3);
270
29.3k
        faad_imdct(fb->mdct256, freq_in+4*nshort, transf_buf+2*nshort*4);
271
29.3k
        faad_imdct(fb->mdct256, freq_in+5*nshort, transf_buf+2*nshort*5);
272
29.3k
        faad_imdct(fb->mdct256, freq_in+6*nshort, transf_buf+2*nshort*6);
273
29.3k
        faad_imdct(fb->mdct256, freq_in+7*nshort, transf_buf+2*nshort*7);
274
275
        /* add second half output of previous frame to windowed output of current frame */
276
13.0M
        for (i = 0; i < nflat_ls; i++)
277
12.9M
            time_out[i] = overlap[i];
278
3.73M
        for(i = 0; i < nshort; i++)
279
3.70M
        {
280
3.70M
            time_out[nflat_ls+         i] = overlap[nflat_ls+         i] + MUL_F(transf_buf[nshort*0+i],window_short_prev[i]);
281
3.70M
            time_out[nflat_ls+1*nshort+i] = overlap[nflat_ls+nshort*1+i] + MUL_F(transf_buf[nshort*1+i],window_short[nshort-1-i]) + MUL_F(transf_buf[nshort*2+i],window_short[i]);
282
3.70M
            time_out[nflat_ls+2*nshort+i] = overlap[nflat_ls+nshort*2+i] + MUL_F(transf_buf[nshort*3+i],window_short[nshort-1-i]) + MUL_F(transf_buf[nshort*4+i],window_short[i]);
283
3.70M
            time_out[nflat_ls+3*nshort+i] = overlap[nflat_ls+nshort*3+i] + MUL_F(transf_buf[nshort*5+i],window_short[nshort-1-i]) + MUL_F(transf_buf[nshort*6+i],window_short[i]);
284
3.70M
            if (i < trans)
285
1.85M
                time_out[nflat_ls+4*nshort+i] = overlap[nflat_ls+nshort*4+i] + MUL_F(transf_buf[nshort*7+i],window_short[nshort-1-i]) + MUL_F(transf_buf[nshort*8+i],window_short[i]);
286
3.70M
        }
287
288
        /* window the second half and save as overlap for next frame */
289
3.73M
        for(i = 0; i < nshort; i++)
290
3.70M
        {
291
3.70M
            if (i >= trans)
292
1.85M
                overlap[nflat_ls+4*nshort+i-nlong] = MUL_F(transf_buf[nshort*7+i],window_short[nshort-1-i]) + MUL_F(transf_buf[nshort*8+i],window_short[i]);
293
3.70M
            overlap[nflat_ls+5*nshort+i-nlong] = MUL_F(transf_buf[nshort*9+i],window_short[nshort-1-i]) + MUL_F(transf_buf[nshort*10+i],window_short[i]);
294
3.70M
            overlap[nflat_ls+6*nshort+i-nlong] = MUL_F(transf_buf[nshort*11+i],window_short[nshort-1-i]) + MUL_F(transf_buf[nshort*12+i],window_short[i]);
295
3.70M
            overlap[nflat_ls+7*nshort+i-nlong] = MUL_F(transf_buf[nshort*13+i],window_short[nshort-1-i]) + MUL_F(transf_buf[nshort*14+i],window_short[i]);
296
3.70M
            overlap[nflat_ls+8*nshort+i-nlong] = MUL_F(transf_buf[nshort*15+i],window_short[nshort-1-i]);
297
3.70M
        }
298
13.0M
        for (i = 0; i < nflat_ls; i++)
299
12.9M
            overlap[nflat_ls+nshort+i] = 0;
300
29.3k
        break;
301
302
8.91k
    case LONG_STOP_SEQUENCE:
303
        /* perform iMDCT */
304
8.91k
        imdct_long(fb, freq_in, transf_buf, 2*nlong);
305
306
        /* add second half output of previous frame to windowed output of current frame */
307
        /* construct first half window using padding with 1's and 0's */
308
3.96M
        for (i = 0; i < nflat_ls; i++)
309
3.95M
            time_out[i] = overlap[i];
310
1.13M
        for (i = 0; i < nshort; i++)
311
1.13M
            time_out[nflat_ls+i] = overlap[nflat_ls+i] + MUL_F(transf_buf[nflat_ls+i],window_short_prev[i]);
312
3.96M
        for (i = 0; i < nflat_ls; i++)
313
3.95M
            time_out[nflat_ls+nshort+i] = overlap[nflat_ls+nshort+i] + transf_buf[nflat_ls+nshort+i];
314
315
        /* window the second half and save as overlap for next frame */
316
9.05M
        for (i = 0; i < nlong; i++)
317
9.04M
            overlap[i] = MUL_F(transf_buf[nlong+i],window_long[nlong-1-i]);
318
8.91k
    break;
319
196k
    }
320
321
#if 0
322
    for (i = 0; i < 1024; i++)
323
    {
324
        printf("%d\n", time_out[i]);
325
        //printf("0x%.8X\n", time_out[i]);
326
    }
327
#endif
328
329
330
#ifdef PROFILE
331
    count = faad_get_ts() - count;
332
    fb->cycles += count;
333
#endif
334
196k
}
335
336
337
#ifdef LTP_DEC
338
/* only works for LTP -> no overlapping, no short blocks */
339
void filter_bank_ltp(fb_info *fb, uint8_t window_sequence, uint8_t window_shape,
340
                     uint8_t window_shape_prev, real_t *in_data, real_t *out_mdct,
341
                     uint8_t object_type, uint16_t frame_len)
342
27.6k
{
343
27.6k
    int16_t i;
344
27.6k
    ALIGN real_t windowed_buf[2*1024] = {0};
345
346
27.6k
    const real_t *window_long = NULL;
347
27.6k
    const real_t *window_long_prev = NULL;
348
27.6k
    const real_t *window_short = NULL;
349
27.6k
    const real_t *window_short_prev = NULL;
350
351
27.6k
    uint16_t nlong = frame_len;
352
27.6k
    uint16_t nshort = frame_len/8;
353
27.6k
    uint16_t nflat_ls = (nlong-nshort)/2;
354
355
27.6k
    assert(window_sequence != EIGHT_SHORT_SEQUENCE);
356
357
27.6k
#ifdef LD_DEC
358
27.6k
    if (object_type == LD)
359
790
    {
360
790
        window_long       = fb->ld_window[window_shape];
361
790
        window_long_prev  = fb->ld_window[window_shape_prev];
362
26.8k
    } else {
363
26.8k
#endif
364
26.8k
        window_long       = fb->long_window[window_shape];
365
26.8k
        window_long_prev  = fb->long_window[window_shape_prev];
366
26.8k
        window_short      = fb->short_window[window_shape];
367
26.8k
        window_short_prev = fb->short_window[window_shape_prev];
368
26.8k
#ifdef LD_DEC
369
26.8k
    }
370
27.6k
#endif
371
372
27.6k
    switch(window_sequence)
373
27.6k
    {
374
3.82k
    case ONLY_LONG_SEQUENCE:
375
3.46M
        for (i = nlong-1; i >= 0; i--)
376
3.45M
        {
377
3.45M
            windowed_buf[i] = MUL_F(in_data[i], window_long_prev[i]);
378
3.45M
            windowed_buf[i+nlong] = MUL_F(in_data[i+nlong], window_long[nlong-1-i]);
379
3.45M
        }
380
3.82k
        mdct(fb, windowed_buf, out_mdct, 2*nlong);
381
3.82k
        break;
382
383
18.0k
    case LONG_START_SEQUENCE:
384
17.7M
        for (i = 0; i < nlong; i++)
385
17.7M
            windowed_buf[i] = MUL_F(in_data[i], window_long_prev[i]);
386
7.79M
        for (i = 0; i < nflat_ls; i++)
387
7.77M
            windowed_buf[i+nlong] = in_data[i+nlong];
388
2.24M
        for (i = 0; i < nshort; i++)
389
2.22M
            windowed_buf[i+nlong+nflat_ls] = MUL_F(in_data[i+nlong+nflat_ls], window_short[nshort-1-i]);
390
7.79M
        for (i = 0; i < nflat_ls; i++)
391
7.77M
            windowed_buf[i+nlong+nflat_ls+nshort] = 0;
392
18.0k
        mdct(fb, windowed_buf, out_mdct, 2*nlong);
393
18.0k
        break;
394
395
5.83k
    case LONG_STOP_SEQUENCE:
396
2.50M
        for (i = 0; i < nflat_ls; i++)
397
2.49M
            windowed_buf[i] = 0;
398
718k
        for (i = 0; i < nshort; i++)
399
712k
            windowed_buf[i+nflat_ls] = MUL_F(in_data[i+nflat_ls], window_short_prev[i]);
400
2.50M
        for (i = 0; i < nflat_ls; i++)
401
2.49M
            windowed_buf[i+nflat_ls+nshort] = in_data[i+nflat_ls+nshort];
402
5.70M
        for (i = 0; i < nlong; i++)
403
5.70M
            windowed_buf[i+nlong] = MUL_F(in_data[i+nlong], window_long[nlong-1-i]);
404
5.83k
        mdct(fb, windowed_buf, out_mdct, 2*nlong);
405
5.83k
        break;
406
27.6k
    }
407
27.6k
}
filter_bank_ltp
Line
Count
Source
342
13.8k
{
343
13.8k
    int16_t i;
344
13.8k
    ALIGN real_t windowed_buf[2*1024] = {0};
345
346
13.8k
    const real_t *window_long = NULL;
347
13.8k
    const real_t *window_long_prev = NULL;
348
13.8k
    const real_t *window_short = NULL;
349
13.8k
    const real_t *window_short_prev = NULL;
350
351
13.8k
    uint16_t nlong = frame_len;
352
13.8k
    uint16_t nshort = frame_len/8;
353
13.8k
    uint16_t nflat_ls = (nlong-nshort)/2;
354
355
13.8k
    assert(window_sequence != EIGHT_SHORT_SEQUENCE);
356
357
13.8k
#ifdef LD_DEC
358
13.8k
    if (object_type == LD)
359
395
    {
360
395
        window_long       = fb->ld_window[window_shape];
361
395
        window_long_prev  = fb->ld_window[window_shape_prev];
362
13.4k
    } else {
363
13.4k
#endif
364
13.4k
        window_long       = fb->long_window[window_shape];
365
13.4k
        window_long_prev  = fb->long_window[window_shape_prev];
366
13.4k
        window_short      = fb->short_window[window_shape];
367
13.4k
        window_short_prev = fb->short_window[window_shape_prev];
368
13.4k
#ifdef LD_DEC
369
13.4k
    }
370
13.8k
#endif
371
372
13.8k
    switch(window_sequence)
373
13.8k
    {
374
1.91k
    case ONLY_LONG_SEQUENCE:
375
1.73M
        for (i = nlong-1; i >= 0; i--)
376
1.72M
        {
377
1.72M
            windowed_buf[i] = MUL_F(in_data[i], window_long_prev[i]);
378
1.72M
            windowed_buf[i+nlong] = MUL_F(in_data[i+nlong], window_long[nlong-1-i]);
379
1.72M
        }
380
1.91k
        mdct(fb, windowed_buf, out_mdct, 2*nlong);
381
1.91k
        break;
382
383
9.00k
    case LONG_START_SEQUENCE:
384
8.89M
        for (i = 0; i < nlong; i++)
385
8.89M
            windowed_buf[i] = MUL_F(in_data[i], window_long_prev[i]);
386
3.89M
        for (i = 0; i < nflat_ls; i++)
387
3.88M
            windowed_buf[i+nlong] = in_data[i+nlong];
388
1.12M
        for (i = 0; i < nshort; i++)
389
1.11M
            windowed_buf[i+nlong+nflat_ls] = MUL_F(in_data[i+nlong+nflat_ls], window_short[nshort-1-i]);
390
3.89M
        for (i = 0; i < nflat_ls; i++)
391
3.88M
            windowed_buf[i+nlong+nflat_ls+nshort] = 0;
392
9.00k
        mdct(fb, windowed_buf, out_mdct, 2*nlong);
393
9.00k
        break;
394
395
2.91k
    case LONG_STOP_SEQUENCE:
396
1.25M
        for (i = 0; i < nflat_ls; i++)
397
1.24M
            windowed_buf[i] = 0;
398
359k
        for (i = 0; i < nshort; i++)
399
356k
            windowed_buf[i+nflat_ls] = MUL_F(in_data[i+nflat_ls], window_short_prev[i]);
400
1.25M
        for (i = 0; i < nflat_ls; i++)
401
1.24M
            windowed_buf[i+nflat_ls+nshort] = in_data[i+nflat_ls+nshort];
402
2.85M
        for (i = 0; i < nlong; i++)
403
2.85M
            windowed_buf[i+nlong] = MUL_F(in_data[i+nlong], window_long[nlong-1-i]);
404
2.91k
        mdct(fb, windowed_buf, out_mdct, 2*nlong);
405
2.91k
        break;
406
13.8k
    }
407
13.8k
}
filter_bank_ltp
Line
Count
Source
342
13.8k
{
343
13.8k
    int16_t i;
344
13.8k
    ALIGN real_t windowed_buf[2*1024] = {0};
345
346
13.8k
    const real_t *window_long = NULL;
347
13.8k
    const real_t *window_long_prev = NULL;
348
13.8k
    const real_t *window_short = NULL;
349
13.8k
    const real_t *window_short_prev = NULL;
350
351
13.8k
    uint16_t nlong = frame_len;
352
13.8k
    uint16_t nshort = frame_len/8;
353
13.8k
    uint16_t nflat_ls = (nlong-nshort)/2;
354
355
13.8k
    assert(window_sequence != EIGHT_SHORT_SEQUENCE);
356
357
13.8k
#ifdef LD_DEC
358
13.8k
    if (object_type == LD)
359
395
    {
360
395
        window_long       = fb->ld_window[window_shape];
361
395
        window_long_prev  = fb->ld_window[window_shape_prev];
362
13.4k
    } else {
363
13.4k
#endif
364
13.4k
        window_long       = fb->long_window[window_shape];
365
13.4k
        window_long_prev  = fb->long_window[window_shape_prev];
366
13.4k
        window_short      = fb->short_window[window_shape];
367
13.4k
        window_short_prev = fb->short_window[window_shape_prev];
368
13.4k
#ifdef LD_DEC
369
13.4k
    }
370
13.8k
#endif
371
372
13.8k
    switch(window_sequence)
373
13.8k
    {
374
1.91k
    case ONLY_LONG_SEQUENCE:
375
1.73M
        for (i = nlong-1; i >= 0; i--)
376
1.72M
        {
377
1.72M
            windowed_buf[i] = MUL_F(in_data[i], window_long_prev[i]);
378
1.72M
            windowed_buf[i+nlong] = MUL_F(in_data[i+nlong], window_long[nlong-1-i]);
379
1.72M
        }
380
1.91k
        mdct(fb, windowed_buf, out_mdct, 2*nlong);
381
1.91k
        break;
382
383
9.00k
    case LONG_START_SEQUENCE:
384
8.89M
        for (i = 0; i < nlong; i++)
385
8.89M
            windowed_buf[i] = MUL_F(in_data[i], window_long_prev[i]);
386
3.89M
        for (i = 0; i < nflat_ls; i++)
387
3.88M
            windowed_buf[i+nlong] = in_data[i+nlong];
388
1.12M
        for (i = 0; i < nshort; i++)
389
1.11M
            windowed_buf[i+nlong+nflat_ls] = MUL_F(in_data[i+nlong+nflat_ls], window_short[nshort-1-i]);
390
3.89M
        for (i = 0; i < nflat_ls; i++)
391
3.88M
            windowed_buf[i+nlong+nflat_ls+nshort] = 0;
392
9.00k
        mdct(fb, windowed_buf, out_mdct, 2*nlong);
393
9.00k
        break;
394
395
2.91k
    case LONG_STOP_SEQUENCE:
396
1.25M
        for (i = 0; i < nflat_ls; i++)
397
1.24M
            windowed_buf[i] = 0;
398
359k
        for (i = 0; i < nshort; i++)
399
356k
            windowed_buf[i+nflat_ls] = MUL_F(in_data[i+nflat_ls], window_short_prev[i]);
400
1.25M
        for (i = 0; i < nflat_ls; i++)
401
1.24M
            windowed_buf[i+nflat_ls+nshort] = in_data[i+nflat_ls+nshort];
402
2.85M
        for (i = 0; i < nlong; i++)
403
2.85M
            windowed_buf[i+nlong] = MUL_F(in_data[i+nlong], window_long[nlong-1-i]);
404
2.91k
        mdct(fb, windowed_buf, out_mdct, 2*nlong);
405
2.91k
        break;
406
13.8k
    }
407
13.8k
}
408
#endif