Coverage Report

Created: 2025-10-27 06:23

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
/src/libxaac/encoder/ixheaace_mps_polyphase.c
Line
Count
Source
1
/******************************************************************************
2
 *                                                                            *
3
 * Copyright (C) 2023 The Android Open Source Project
4
 *
5
 * Licensed under the Apache License, Version 2.0 (the "License");
6
 * you may not use this file except in compliance with the License.
7
 * You may obtain a copy of the License at:
8
 *
9
 * http://www.apache.org/licenses/LICENSE-2.0
10
 *
11
 * Unless required by applicable law or agreed to in writing, software
12
 * distributed under the License is distributed on an "AS IS" BASIS,
13
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
14
 * See the License for the specific language governing permissions and
15
 * limitations under the License.
16
 *
17
 *****************************************************************************
18
 * Originally developed and contributed by Ittiam Systems Pvt. Ltd, Bangalore
19
 */
20
21
#include <string.h>
22
#include <math.h>
23
#include "ixheaac_type_def.h"
24
#include "ixheaace_mps_common_fix.h"
25
#include "ixheaace_mps_defines.h"
26
#include "ixheaace_mps_common_define.h"
27
#include "ixheaace_bitbuffer.h"
28
29
#include "ixheaace_mps_struct_def.h"
30
#include "ixheaace_mps_sac_polyphase.h"
31
#include "ixheaace_mps_sac_hybfilter.h"
32
#include "ixheaace_mps_spatial_bitstream.h"
33
#include "ixheaace_mps_bitstream.h"
34
#include "ixheaace_mps_param_extract.h"
35
#include "ixheaace_mps_tree.h"
36
#include "ixheaace_mps_rom.h"
37
38
163M
static VOID ixheaace_mps_bit_reversal(FLOAT32 *a, FLOAT32 *b) {
39
163M
  FLOAT32 temp;
40
163M
  temp = *a;
41
163M
  *a = *b;
42
163M
  *b = temp;
43
163M
}
44
45
193M
static VOID ixheaace_mps_bit_add_sub1(FLOAT32 *a, FLOAT32 *b) {
46
193M
  FLOAT32 temp;
47
193M
  temp = *a + *b;
48
193M
  *b = *b - *a;
49
193M
  *a = temp;
50
193M
}
51
52
282M
static VOID ixheaace_mps_bit_add_sub2(FLOAT32 *a, FLOAT32 *b) {
53
282M
  FLOAT32 temp;
54
282M
  temp = *a + *b;
55
282M
  *b = *a - *b;
56
282M
  *a = temp;
57
282M
}
58
59
941k
static VOID ixheaace_mps_fft32(FLOAT32 *subband) {
60
941k
  FLOAT32 val_0, val_1, val_2, val_3, val_4, val_5, val_6, val_7, val_8, val_9, val_10, val_11,
61
941k
      val_12, val_13, val_14, val_15;
62
941k
  FLOAT32 val_1_0, val_1_1, val_1_2, val_1_3, val_1_4, val_1_5, val_1_6, val_1_7, val_1_8,
63
941k
      val_1_9, val_1_10, val_1_11, val_1_12, val_1_13, val_1_14, val_1_15;
64
941k
  FLOAT32 val_2_0, val_2_1, val_2_2, val_2_3, val_2_4, val_2_5, val_2_6, val_2_7, val_2_8,
65
941k
      val_2_9, val_2_10, val_2_11, val_2_12, val_2_13, val_2_14, val_2_15;
66
941k
  FLOAT32 val_3_0, val_3_1, val_3_2, val_3_3, val_3_4, val_3_5, val_3_6, val_3_7, val_3_8,
67
941k
      val_3_9, val_3_10, val_3_11, val_3_12, val_3_13, val_3_14, val_3_15;
68
941k
  FLOAT32 val_3_16, val_3_17, val_3_18, val_3_19, val_3_20, val_3_21, val_3_22, val_3_23,
69
941k
      val_3_24, val_3_25, val_3_26, val_3_27, val_3_28, val_3_29, val_3_30, val_3_31;
70
941k
  FLOAT32 val_4_0, val_4_1, val_4_2, val_4_3, val_4_4, val_4_5, val_4_6, val_4_7, val_4_8,
71
941k
      val_4_9, val_4_10, val_4_11, val_4_12, val_4_13, val_4_14, val_4_15;
72
73
941k
  val_2_0 = subband[2] - subband[34];
74
941k
  val_2_1 = subband[3] - subband[35];
75
941k
  val_3_0 = subband[0] + subband[32];
76
941k
  val_3_1 = subband[1] + subband[33];
77
941k
  val_3_2 = subband[2] + subband[34];
78
941k
  val_3_3 = subband[3] + subband[35];
79
80
941k
  val_2_2 = subband[6] - subband[38];
81
941k
  val_2_3 = subband[7] - subband[39];
82
941k
  val_3_4 = subband[4] + subband[36];
83
941k
  val_3_5 = subband[5] + subband[37];
84
941k
  val_3_6 = subband[6] + subband[38];
85
941k
  val_3_7 = subband[7] + subband[39];
86
87
941k
  val_2_4 = subband[10] - subband[42];
88
941k
  val_2_5 = subband[11] - subband[43];
89
941k
  val_3_8 = subband[8] + subband[40];
90
941k
  val_3_9 = subband[9] + subband[41];
91
941k
  val_3_10 = subband[10] + subband[42];
92
941k
  val_3_11 = subband[11] + subband[43];
93
94
941k
  val_2_6 = subband[14] - subband[46];
95
941k
  val_2_7 = subband[15] - subband[47];
96
941k
  val_3_12 = subband[12] + subband[44];
97
941k
  val_3_13 = subband[13] + subband[45];
98
941k
  val_3_14 = subband[14] + subband[46];
99
941k
  val_3_15 = subband[15] + subband[47];
100
101
941k
  val_2_8 = subband[18] - subband[50];
102
941k
  val_2_9 = subband[19] - subband[51];
103
941k
  val_3_16 = subband[16] + subband[48];
104
941k
  val_3_17 = subband[17] + subband[49];
105
941k
  val_3_18 = subband[18] + subband[50];
106
941k
  val_3_19 = subband[19] + subband[51];
107
108
941k
  val_2_10 = subband[22] - subband[54];
109
941k
  val_2_11 = subband[23] - subband[55];
110
941k
  val_3_20 = subband[20] + subband[52];
111
941k
  val_3_21 = subband[21] + subband[53];
112
941k
  val_3_22 = subband[22] + subband[54];
113
941k
  val_3_23 = subband[23] + subband[55];
114
115
941k
  val_2_12 = subband[26] - subband[58];
116
941k
  val_2_13 = subband[27] - subband[59];
117
941k
  val_3_24 = subband[24] + subband[56];
118
941k
  val_3_25 = subband[25] + subband[57];
119
941k
  val_3_26 = subband[26] + subband[58];
120
941k
  val_3_27 = subband[27] + subband[59];
121
122
941k
  val_2_14 = subband[30] - subband[62];
123
941k
  val_2_15 = subband[31] - subband[63];
124
941k
  val_3_28 = subband[28] + subband[60];
125
941k
  val_3_29 = subband[29] + subband[61];
126
941k
  val_3_30 = subband[30] + subband[62];
127
941k
  val_3_31 = subband[31] + subband[63];
128
129
941k
  val_4_1 = -(val_2_0 + val_2_14);
130
941k
  val_4_2 = val_2_0 - val_2_14;
131
941k
  val_4_0 = val_2_1 + val_2_15;
132
941k
  val_4_3 = val_2_1 - val_2_15;
133
941k
  val_4_5 = -(val_2_2 + val_2_12);
134
941k
  val_4_6 = val_2_2 - val_2_12;
135
941k
  val_4_4 = val_2_3 + val_2_13;
136
941k
  val_4_7 = val_2_3 - val_2_13;
137
941k
  val_4_9 = -(val_2_4 + val_2_10);
138
941k
  val_4_10 = val_2_4 - val_2_10;
139
941k
  val_4_8 = val_2_5 + val_2_11;
140
941k
  val_4_11 = val_2_5 - val_2_11;
141
941k
  val_4_13 = -(val_2_6 + val_2_8);
142
941k
  val_4_14 = val_2_6 - val_2_8;
143
941k
  val_4_12 = val_2_7 + val_2_9;
144
941k
  val_4_15 = val_2_7 - val_2_9;
145
146
941k
  val_2_0 = val_4_0 * fft_c[3] + val_4_4 * fft_c[2] + val_4_8 * fft_c[1] + val_4_12 * fft_c[0];
147
148
941k
  val_2_4 = val_4_0 * fft_c[2] + val_4_4 * fft_c[0] + val_4_8 * fft_c[3] - val_4_12 * fft_c[1];
149
941k
  val_2_8 = val_4_0 * fft_c[1] + val_4_4 * fft_c[3] - val_4_8 * fft_c[0] + val_4_12 * fft_c[2];
150
151
941k
  val_2_12 = val_4_0 * fft_c[0] - val_4_4 * fft_c[1] + val_4_8 * fft_c[2] - val_4_12 * fft_c[3];
152
153
941k
  val_2_1 = val_4_1 * fft_c[3] + val_4_5 * fft_c[2] + val_4_9 * fft_c[1] + val_4_13 * fft_c[0];
154
155
941k
  val_2_5 = val_4_1 * fft_c[2] + val_4_5 * fft_c[0] + val_4_9 * fft_c[3] - val_4_13 * fft_c[1];
156
941k
  val_2_9 = val_4_1 * fft_c[1] + val_4_5 * fft_c[3] - val_4_9 * fft_c[0] + val_4_13 * fft_c[2];
157
158
941k
  val_2_13 = val_4_1 * fft_c[0] - val_4_5 * fft_c[1] + val_4_9 * fft_c[2] - val_4_13 * fft_c[3];
159
160
941k
  val_2_2 = val_4_2 * fft_c[0] + val_4_6 * fft_c[1] + val_4_10 * fft_c[2] + val_4_14 * fft_c[3];
161
162
941k
  val_2_6 = val_4_2 * fft_c[1] - val_4_6 * fft_c[3] - val_4_10 * fft_c[0] - val_4_14 * fft_c[2];
163
164
941k
  val_2_10 = val_4_2 * fft_c[2] - val_4_6 * fft_c[0] + val_4_10 * fft_c[3] + val_4_14 * fft_c[1];
165
166
941k
  val_2_14 = val_4_2 * fft_c[3] - val_4_6 * fft_c[2] + val_4_10 * fft_c[1] - val_4_14 * fft_c[0];
167
168
941k
  val_2_3 = val_4_3 * fft_c[0] + val_4_7 * fft_c[1] + val_4_11 * fft_c[2] + val_4_15 * fft_c[3];
169
170
941k
  val_2_7 = val_4_3 * fft_c[1] - val_4_7 * fft_c[3] - val_4_11 * fft_c[0] - val_4_15 * fft_c[2];
171
172
941k
  val_2_11 = val_4_3 * fft_c[2] - val_4_7 * fft_c[0] + val_4_11 * fft_c[3] + val_4_15 * fft_c[1];
173
174
941k
  val_2_15 = val_4_3 * fft_c[3] - val_4_7 * fft_c[2] + val_4_11 * fft_c[1] - val_4_15 * fft_c[0];
175
176
941k
  val_4_0 = val_2_0 + val_2_2;
177
941k
  val_4_14 = val_2_0 - val_2_2;
178
941k
  val_4_1 = val_2_1 + val_2_3;
179
941k
  val_4_15 = val_2_1 - val_2_3;
180
941k
  val_4_2 = val_2_4 + val_2_6;
181
941k
  val_4_12 = val_2_4 - val_2_6;
182
941k
  val_4_3 = val_2_5 + val_2_7;
183
941k
  val_4_13 = val_2_5 - val_2_7;
184
941k
  val_4_4 = val_2_8 + val_2_10;
185
941k
  val_4_10 = val_2_8 - val_2_10;
186
941k
  val_4_5 = val_2_9 + val_2_11;
187
941k
  val_4_11 = val_2_9 - val_2_11;
188
941k
  val_4_6 = val_2_12 + val_2_14;
189
941k
  val_4_8 = val_2_12 - val_2_14;
190
941k
  val_4_7 = val_2_13 + val_2_15;
191
941k
  val_4_9 = val_2_13 - val_2_15;
192
193
941k
  val_1_0 = val_3_0 + val_3_16;
194
941k
  val_1_1 = val_3_1 + val_3_17;
195
941k
  val_1_2 = val_3_2 + val_3_18;
196
941k
  val_1_3 = val_3_3 + val_3_19;
197
941k
  val_1_4 = val_3_4 + val_3_20;
198
941k
  val_1_5 = val_3_5 + val_3_21;
199
941k
  val_1_6 = val_3_6 + val_3_22;
200
941k
  val_1_7 = val_3_7 + val_3_23;
201
941k
  val_1_8 = val_3_8 + val_3_24;
202
941k
  val_1_9 = val_3_9 + val_3_25;
203
941k
  val_1_10 = val_3_10 + val_3_26;
204
941k
  val_1_11 = val_3_11 + val_3_27;
205
941k
  val_1_12 = val_3_12 + val_3_28;
206
941k
  val_1_13 = val_3_13 + val_3_29;
207
941k
  val_1_14 = val_3_14 + val_3_30;
208
941k
  val_1_15 = val_3_15 + val_3_31;
209
210
941k
  val_0 = val_1_0 + val_1_8;
211
941k
  val_2 = val_1_0 - val_1_8;
212
941k
  val_1 = val_1_1 + val_1_9;
213
941k
  val_3 = val_1_1 - val_1_9;
214
941k
  val_4 = val_1_2 + val_1_10;
215
941k
  val_6 = val_1_2 - val_1_10;
216
941k
  val_5 = val_1_3 + val_1_11;
217
941k
  val_7 = val_1_3 - val_1_11;
218
941k
  val_8 = val_1_4 + val_1_12;
219
941k
  val_10 = val_1_4 - val_1_12;
220
941k
  val_9 = val_1_5 + val_1_13;
221
941k
  val_11 = val_1_5 - val_1_13;
222
941k
  val_12 = val_1_6 + val_1_14;
223
941k
  val_14 = val_1_6 - val_1_14;
224
941k
  val_13 = val_1_7 + val_1_15;
225
941k
  val_15 = val_1_7 - val_1_15;
226
227
941k
  val_2_0 = val_0 + val_8;
228
941k
  val_2_4 = val_0 - val_8;
229
941k
  val_2_1 = val_1 + val_9;
230
941k
  val_2_5 = val_1 - val_9;
231
941k
  val_2_8 = val_2 - val_11;
232
941k
  val_2_10 = val_2 + val_11;
233
941k
  val_2_9 = val_3 + val_10;
234
941k
  val_2_11 = val_3 - val_10;
235
941k
  val_2_2 = val_4 + val_12;
236
941k
  val_2_7 = val_4 - val_12;
237
941k
  val_2_3 = val_5 + val_13;
238
941k
  val_2_6 = val_13 - val_5;
239
240
941k
  val_1 = val_6 + val_14;
241
941k
  val_2 = val_6 - val_14;
242
941k
  val_0 = val_7 + val_15;
243
941k
  val_3 = val_7 - val_15;
244
245
941k
  val_2_12 = (val_0 + val_2) * MPS_INV_SQRT2;
246
941k
  val_2_14 = (val_0 - val_2) * MPS_INV_SQRT2;
247
941k
  val_2_13 = (val_3 - val_1) * MPS_INV_SQRT2;
248
941k
  val_2_15 = (val_1 + val_3) * -MPS_INV_SQRT2;
249
250
941k
  val_1_0 = val_3_0 - val_3_16;
251
941k
  val_1_1 = val_3_1 - val_3_17;
252
941k
  val_1_2 = val_3_2 - val_3_18;
253
941k
  val_1_3 = val_3_3 - val_3_19;
254
941k
  val_1_4 = val_3_4 - val_3_20;
255
941k
  val_1_5 = val_3_5 - val_3_21;
256
941k
  val_1_6 = val_3_6 - val_3_22;
257
941k
  val_1_7 = val_3_7 - val_3_23;
258
941k
  val_1_8 = val_3_8 - val_3_24;
259
941k
  val_1_9 = val_3_9 - val_3_25;
260
941k
  val_1_10 = val_3_10 - val_3_26;
261
941k
  val_1_11 = val_3_11 - val_3_27;
262
941k
  val_1_12 = val_3_12 - val_3_28;
263
941k
  val_1_13 = val_3_13 - val_3_29;
264
941k
  val_1_14 = val_3_14 - val_3_30;
265
941k
  val_1_15 = val_3_15 - val_3_31;
266
267
941k
  val_3_0 = val_2_0 + val_2_2;
268
941k
  val_3_16 = val_2_0 - val_2_2;
269
941k
  val_3_1 = val_2_1 + val_2_3;
270
941k
  val_3_17 = val_2_1 - val_2_3;
271
941k
  val_3_8 = val_2_4 - val_2_6;
272
941k
  val_3_24 = val_2_4 + val_2_6;
273
941k
  val_3_9 = val_2_5 - val_2_7;
274
941k
  val_3_25 = val_2_5 + val_2_7;
275
941k
  val_3_12 = val_2_8 + val_2_14;
276
941k
  val_3_28 = val_2_8 - val_2_14;
277
941k
  val_3_13 = val_2_9 + val_2_15;
278
941k
  val_3_29 = val_2_9 - val_2_15;
279
941k
  val_3_4 = val_2_10 + val_2_12;
280
941k
  val_3_20 = val_2_10 - val_2_12;
281
941k
  val_3_5 = val_2_11 + val_2_13;
282
941k
  val_3_21 = val_2_11 - val_2_13;
283
284
941k
  val_9 = (val_1_2 + val_1_14) * -MPS_COS_3PI_DIV8;
285
941k
  val_10 = (val_1_2 - val_1_14) * MPS_COS_PI_DIV8;
286
941k
  val_8 = (val_1_3 + val_1_15) * MPS_COS_3PI_DIV8;
287
941k
  val_11 = (val_1_3 - val_1_15) * MPS_COS_PI_DIV8;
288
941k
  val_5 = (val_1_4 + val_1_12) * -MPS_INV_SQRT2;
289
941k
  val_6 = (val_1_4 - val_1_12) * MPS_INV_SQRT2;
290
941k
  val_4 = (val_1_5 + val_1_13) * MPS_INV_SQRT2;
291
941k
  val_7 = (val_1_5 - val_1_13) * MPS_INV_SQRT2;
292
941k
  val_13 = (val_1_6 + val_1_10) * -MPS_COS_PI_DIV8;
293
941k
  val_14 = (val_1_6 - val_1_10) * MPS_COS_3PI_DIV8;
294
941k
  val_12 = (val_1_7 + val_1_11) * MPS_COS_PI_DIV8;
295
941k
  val_15 = (val_1_7 - val_1_11) * MPS_COS_3PI_DIV8;
296
297
941k
  val_1_2 = val_8 * MPS_SQRT2PLUS1 - val_12 * MPS_SQRT2MINUS1;
298
941k
  val_1_3 = val_9 * MPS_SQRT2PLUS1 - val_13 * MPS_SQRT2MINUS1;
299
941k
  val_1_4 = val_10 * MPS_SQRT2MINUS1 - val_14 * MPS_SQRT2PLUS1;
300
941k
  val_1_5 = val_11 * MPS_SQRT2MINUS1 - val_15 * MPS_SQRT2PLUS1;
301
302
941k
  val_8 += val_12;
303
941k
  val_9 += val_13;
304
941k
  val_10 += val_14;
305
941k
  val_11 += val_15;
306
941k
  val_1_6 = val_1_0 + val_4;
307
941k
  val_1_10 = val_1_0 - val_4;
308
941k
  val_1_7 = val_1_1 + val_5;
309
941k
  val_1_11 = val_1_1 - val_5;
310
311
941k
  val_1_12 = val_6 - val_1_9;
312
941k
  val_1_14 = val_6 + val_1_9;
313
941k
  val_1_13 = val_1_8 + val_7;
314
941k
  val_1_15 = val_1_8 - val_7;
315
316
941k
  val_0 = val_1_6 - val_1_14;
317
941k
  val_2 = val_1_6 + val_1_14;
318
941k
  val_1 = val_1_7 + val_1_15;
319
941k
  val_3 = val_1_7 - val_1_15;
320
941k
  val_4 = val_1_10 + val_1_12;
321
941k
  val_6 = val_1_10 - val_1_12;
322
941k
  val_5 = val_1_11 + val_1_13;
323
941k
  val_7 = val_1_11 - val_1_13;
324
325
941k
  val_1_10 = val_8 + val_10;
326
941k
  val_10 = val_8 - val_10;
327
941k
  val_1_11 = val_9 + val_11;
328
941k
  val_11 = val_9 - val_11;
329
330
941k
  val_12 = val_1_2 + val_1_4;
331
941k
  val_14 = val_1_2 - val_1_4;
332
941k
  val_13 = val_1_3 + val_1_5;
333
941k
  val_15 = val_1_3 - val_1_5;
334
335
941k
  val_3_2 = val_2 + val_1_10;
336
941k
  val_3_18 = val_2 - val_1_10;
337
941k
  val_3_3 = val_3 + val_1_11;
338
941k
  val_3_19 = val_3 - val_1_11;
339
941k
  val_3_6 = val_0 + val_12;
340
941k
  val_3_22 = val_0 - val_12;
341
941k
  val_3_7 = val_1 + val_13;
342
941k
  val_3_23 = val_1 - val_13;
343
941k
  val_3_14 = val_4 + val_10;
344
941k
  val_3_30 = val_4 - val_10;
345
941k
  val_3_15 = val_5 + val_11;
346
941k
  val_3_31 = val_5 - val_11;
347
941k
  val_3_10 = val_6 + val_14;
348
941k
  val_3_26 = val_6 - val_14;
349
941k
  val_3_11 = val_7 + val_15;
350
941k
  val_3_27 = val_7 - val_15;
351
352
941k
  val_1_0 = subband[0] - subband[32];
353
941k
  val_1_1 = subband[1] - subband[33];
354
941k
  val_1_2 = subband[4] - subband[36];
355
941k
  val_1_3 = subband[5] - subband[37];
356
941k
  val_1_4 = subband[8] - subband[40];
357
941k
  val_1_5 = subband[9] - subband[41];
358
941k
  val_1_6 = subband[12] - subband[44];
359
941k
  val_1_7 = subband[13] - subband[45];
360
941k
  val_1_8 = subband[16] - subband[48];
361
941k
  val_1_9 = subband[17] - subband[49];
362
941k
  val_1_10 = subband[20] - subband[52];
363
941k
  val_1_11 = subband[21] - subband[53];
364
941k
  val_1_12 = subband[24] - subband[56];
365
941k
  val_1_13 = subband[25] - subband[57];
366
941k
  val_1_14 = subband[28] - subband[60];
367
941k
  val_1_15 = subband[29] - subband[61];
368
369
941k
  val_9 = (val_1_2 + val_1_14) * -MPS_COS_3PI_DIV8;
370
941k
  val_10 = (val_1_2 - val_1_14) * MPS_COS_PI_DIV8;
371
941k
  val_8 = (val_1_3 + val_1_15) * MPS_COS_3PI_DIV8;
372
941k
  val_11 = (val_1_3 - val_1_15) * MPS_COS_PI_DIV8;
373
941k
  val_5 = (val_1_4 + val_1_12) * -MPS_INV_SQRT2;
374
941k
  val_6 = (val_1_4 - val_1_12) * MPS_INV_SQRT2;
375
941k
  val_4 = (val_1_5 + val_1_13) * MPS_INV_SQRT2;
376
941k
  val_7 = (val_1_5 - val_1_13) * MPS_INV_SQRT2;
377
941k
  val_13 = (val_1_6 + val_1_10) * -MPS_COS_PI_DIV8;
378
941k
  val_14 = (val_1_6 - val_1_10) * MPS_COS_3PI_DIV8;
379
941k
  val_12 = (val_1_7 + val_1_11) * MPS_COS_PI_DIV8;
380
941k
  val_15 = (val_1_7 - val_1_11) * MPS_COS_3PI_DIV8;
381
382
941k
  val_1_2 = val_8 * MPS_SQRT2PLUS1 - val_12 * MPS_SQRT2MINUS1;
383
941k
  val_1_3 = val_9 * MPS_SQRT2PLUS1 - val_13 * MPS_SQRT2MINUS1;
384
941k
  val_1_4 = val_10 * MPS_SQRT2MINUS1 - val_14 * MPS_SQRT2PLUS1;
385
941k
  val_1_5 = val_11 * MPS_SQRT2MINUS1 - val_15 * MPS_SQRT2PLUS1;
386
387
941k
  val_8 += val_12;
388
941k
  val_9 += val_13;
389
941k
  val_10 += val_14;
390
941k
  val_11 += val_15;
391
941k
  val_1_6 = val_1_0 + val_4;
392
941k
  val_1_10 = val_1_0 - val_4;
393
941k
  val_1_7 = val_1_1 + val_5;
394
941k
  val_1_11 = val_1_1 - val_5;
395
396
941k
  val_1_12 = val_6 - val_1_9;
397
941k
  val_1_14 = val_6 + val_1_9;
398
941k
  val_1_13 = val_1_8 + val_7;
399
941k
  val_1_15 = val_1_8 - val_7;
400
401
941k
  val_0 = val_1_6 - val_1_14;
402
941k
  val_2 = val_1_6 + val_1_14;
403
941k
  val_1 = val_1_7 + val_1_15;
404
941k
  val_3 = val_1_7 - val_1_15;
405
941k
  val_4 = val_1_10 + val_1_12;
406
941k
  val_6 = val_1_10 - val_1_12;
407
941k
  val_5 = val_1_11 + val_1_13;
408
941k
  val_7 = val_1_11 - val_1_13;
409
410
941k
  val_1_10 = val_8 + val_10;
411
941k
  val_10 = val_8 - val_10;
412
941k
  val_1_11 = val_9 + val_11;
413
941k
  val_11 = val_9 - val_11;
414
415
941k
  val_12 = val_1_2 + val_1_4;
416
941k
  val_14 = val_1_2 - val_1_4;
417
941k
  val_13 = val_1_3 + val_1_5;
418
941k
  val_15 = val_1_3 - val_1_5;
419
420
941k
  val_1_0 = val_2 + val_1_10;
421
941k
  val_1_8 = val_2 - val_1_10;
422
941k
  val_1_1 = val_3 + val_1_11;
423
941k
  val_1_9 = val_3 - val_1_11;
424
941k
  val_1_2 = val_0 + val_12;
425
941k
  val_1_10 = val_0 - val_12;
426
941k
  val_1_3 = val_1 + val_13;
427
941k
  val_1_11 = val_1 - val_13;
428
941k
  val_1_6 = val_4 + val_10;
429
941k
  val_1_14 = val_4 - val_10;
430
941k
  val_1_7 = val_5 + val_11;
431
941k
  val_1_15 = val_5 - val_11;
432
941k
  val_1_4 = val_6 + val_14;
433
941k
  val_1_12 = val_6 - val_14;
434
941k
  val_1_5 = val_7 + val_15;
435
941k
  val_1_13 = val_7 - val_15;
436
437
941k
  *subband++ = val_3_0;
438
941k
  *subband++ = val_3_1;
439
941k
  *subband++ = val_1_0 + val_4_0;
440
941k
  *subband++ = val_1_1 + val_4_1;
441
941k
  *subband++ = val_3_2;
442
941k
  *subband++ = val_3_3;
443
941k
  *subband++ = val_1_2 + val_4_2;
444
941k
  *subband++ = val_1_3 + val_4_3;
445
941k
  *subband++ = val_3_4;
446
941k
  *subband++ = val_3_5;
447
941k
  *subband++ = val_1_4 + val_4_4;
448
941k
  *subband++ = val_1_5 + val_4_5;
449
941k
  *subband++ = val_3_6;
450
941k
  *subband++ = val_3_7;
451
941k
  *subband++ = val_1_6 + val_4_6;
452
941k
  *subband++ = val_1_7 + val_4_7;
453
941k
  *subband++ = val_3_8;
454
941k
  *subband++ = val_3_9;
455
941k
  *subband++ = val_1_8 + val_4_8;
456
941k
  *subband++ = val_1_9 + val_4_9;
457
941k
  *subband++ = val_3_10;
458
941k
  *subband++ = val_3_11;
459
941k
  *subband++ = val_1_10 + val_4_10;
460
941k
  *subband++ = val_1_11 + val_4_11;
461
941k
  *subband++ = val_3_12;
462
941k
  *subband++ = val_3_13;
463
941k
  *subband++ = val_1_12 + val_4_12;
464
941k
  *subband++ = val_1_13 + val_4_13;
465
941k
  *subband++ = val_3_14;
466
941k
  *subband++ = val_3_15;
467
941k
  *subband++ = val_1_14 + val_4_14;
468
941k
  *subband++ = val_1_15 + val_4_15;
469
941k
  *subband++ = val_3_16;
470
941k
  *subband++ = val_3_17;
471
941k
  *subband++ = val_1_0 - val_4_0;
472
941k
  *subband++ = val_1_1 - val_4_1;
473
941k
  *subband++ = val_3_18;
474
941k
  *subband++ = val_3_19;
475
941k
  *subband++ = val_1_2 - val_4_2;
476
941k
  *subband++ = val_1_3 - val_4_3;
477
941k
  *subband++ = val_3_20;
478
941k
  *subband++ = val_3_21;
479
941k
  *subband++ = val_1_4 - val_4_4;
480
941k
  *subband++ = val_1_5 - val_4_5;
481
941k
  *subband++ = val_3_22;
482
941k
  *subband++ = val_3_23;
483
941k
  *subband++ = val_1_6 - val_4_6;
484
941k
  *subband++ = val_1_7 - val_4_7;
485
941k
  *subband++ = val_3_24;
486
941k
  *subband++ = val_3_25;
487
941k
  *subband++ = val_1_8 - val_4_8;
488
941k
  *subband++ = val_1_9 - val_4_9;
489
941k
  *subband++ = val_3_26;
490
941k
  *subband++ = val_3_27;
491
941k
  *subband++ = val_1_10 - val_4_10;
492
941k
  *subband++ = val_1_11 - val_4_11;
493
941k
  *subband++ = val_3_28;
494
941k
  *subband++ = val_3_29;
495
941k
  *subband++ = val_1_12 - val_4_12;
496
941k
  *subband++ = val_1_13 - val_4_13;
497
941k
  *subband++ = val_3_30;
498
941k
  *subband++ = val_3_31;
499
941k
  *subband++ = val_1_14 - val_4_14;
500
941k
  *subband++ = val_1_15 - val_4_15;
501
941k
}
502
503
static VOID ixheaace_mps_cos_mod(
504
470k
    FLOAT32 *subband, ixheaace_mps_sac_pstr_qmf_synth_filter_bank pstr_qmf_synth_filter_bank) {
505
470k
  WORD32 idx, length;
506
470k
  FLOAT32 weight_imag, weight_real;
507
470k
  FLOAT32 real_1, real_2;
508
470k
  FLOAT32 imag_1, imag_2;
509
470k
  FLOAT32 accu1, accu2;
510
511
470k
  length = 32;
512
513
8.00M
  for (idx = 0; idx < (length / 2); idx++) {
514
7.53M
    real_1 = subband[2 * idx];
515
7.53M
    imag_2 = subband[2 * idx + 1];
516
7.53M
    real_2 = subband[2 * length - 2 - 2 * idx];
517
7.53M
    imag_1 = subband[2 * length - 1 - 2 * idx];
518
519
7.53M
    weight_imag = pstr_qmf_synth_filter_bank->sin_twiddle[idx];
520
7.53M
    weight_real = pstr_qmf_synth_filter_bank->cos_twiddle[idx];
521
522
7.53M
    accu1 = imag_1 * weight_imag + real_1 * weight_real;
523
7.53M
    accu2 = imag_1 * weight_real - real_1 * weight_imag;
524
525
7.53M
    subband[2 * idx] = accu1;
526
7.53M
    subband[2 * idx + 1] = accu2;
527
528
7.53M
    weight_imag = pstr_qmf_synth_filter_bank->sin_twiddle[length - 1 - idx];
529
7.53M
    weight_real = pstr_qmf_synth_filter_bank->cos_twiddle[length - 1 - idx];
530
531
7.53M
    accu1 = imag_2 * weight_imag + real_2 * weight_real;
532
7.53M
    accu2 = imag_2 * weight_real - real_2 * weight_imag;
533
534
7.53M
    subband[2 * length - 2 - 2 * idx] = accu1;
535
7.53M
    subband[2 * length - 1 - 2 * idx] = accu2;
536
7.53M
  }
537
538
470k
  ixheaace_mps_fft32(subband);
539
540
470k
  weight_imag = pstr_qmf_synth_filter_bank->alt_sin_twiddle[0];
541
470k
  weight_real = pstr_qmf_synth_filter_bank->alt_sin_twiddle[length];
542
543
8.00M
  for (idx = 0; idx < length / 2; idx++) {
544
7.53M
    real_1 = subband[2 * idx];
545
7.53M
    imag_1 = subband[2 * idx + 1];
546
7.53M
    real_2 = subband[2 * length - 2 - 2 * idx];
547
7.53M
    imag_2 = subband[2 * length - 1 - 2 * idx];
548
549
7.53M
    accu1 = real_1 * weight_real + imag_1 * weight_imag;
550
7.53M
    accu2 = real_1 * weight_imag - imag_1 * weight_real;
551
552
7.53M
    subband[2 * idx] = accu1;
553
7.53M
    subband[2 * length - 1 - 2 * idx] = accu2;
554
555
7.53M
    weight_imag = pstr_qmf_synth_filter_bank->alt_sin_twiddle[idx + 1];
556
7.53M
    weight_real = pstr_qmf_synth_filter_bank->alt_sin_twiddle[length - 1 - idx];
557
558
7.53M
    accu1 = real_2 * weight_imag + imag_2 * weight_real;
559
7.53M
    accu2 = real_2 * weight_real - imag_2 * weight_imag;
560
561
7.53M
    subband[2 * length - 2 - 2 * idx] = accu1;
562
7.53M
    subband[2 * idx + 1] = accu2;
563
7.53M
  }
564
470k
}
565
566
static VOID ixheaace_mps_sin_mod(
567
470k
    FLOAT32 *subband, ixheaace_mps_sac_pstr_qmf_synth_filter_bank pstr_qmf_synth_filter_bank) {
568
470k
  WORD32 idx, length;
569
470k
  FLOAT32 weight_real, weight_imag;
570
470k
  FLOAT32 real_1, imag_1, real_2, imag_2;
571
470k
  FLOAT32 accu1, accu2;
572
573
470k
  length = 32;
574
575
8.00M
  for (idx = 0; idx < length / 2; idx++) {
576
7.53M
    real_1 = subband[2 * idx];
577
7.53M
    imag_2 = subband[2 * idx + 1];
578
7.53M
    real_2 = subband[2 * length - 2 - 2 * idx];
579
7.53M
    imag_1 = subband[2 * length - 1 - 2 * idx];
580
581
7.53M
    weight_real = pstr_qmf_synth_filter_bank->sin_twiddle[idx];
582
7.53M
    weight_imag = pstr_qmf_synth_filter_bank->cos_twiddle[idx];
583
584
7.53M
    accu1 = imag_1 * weight_imag + real_1 * weight_real;
585
7.53M
    accu2 = imag_1 * weight_real - real_1 * weight_imag;
586
587
7.53M
    subband[2 * idx + 1] = accu1;
588
7.53M
    subband[2 * idx] = accu2;
589
590
7.53M
    weight_real = pstr_qmf_synth_filter_bank->sin_twiddle[length - 1 - idx];
591
7.53M
    weight_imag = pstr_qmf_synth_filter_bank->cos_twiddle[length - 1 - idx];
592
593
7.53M
    accu1 = imag_2 * weight_imag + real_2 * weight_real;
594
7.53M
    accu2 = imag_2 * weight_real - real_2 * weight_imag;
595
596
7.53M
    subband[2 * length - 1 - 2 * idx] = accu1;
597
7.53M
    subband[2 * length - 2 - 2 * idx] = accu2;
598
7.53M
  }
599
600
470k
  ixheaace_mps_fft32(subband);
601
602
470k
  weight_imag = pstr_qmf_synth_filter_bank->alt_sin_twiddle[0];
603
470k
  weight_real = pstr_qmf_synth_filter_bank->alt_sin_twiddle[length];
604
605
8.00M
  for (idx = 0; idx < length / 2; idx++) {
606
7.53M
    real_1 = subband[2 * idx];
607
7.53M
    imag_1 = subband[2 * idx + 1];
608
7.53M
    real_2 = subband[2 * length - 2 - 2 * idx];
609
7.53M
    imag_2 = subband[2 * length - 1 - 2 * idx];
610
611
7.53M
    accu1 = -(real_1 * weight_real + imag_1 * weight_imag);
612
7.53M
    accu2 = -(real_1 * weight_imag - imag_1 * weight_real);
613
614
7.53M
    subband[2 * length - 1 - 2 * idx] = accu1;
615
7.53M
    subband[2 * idx] = accu2;
616
617
7.53M
    weight_imag = pstr_qmf_synth_filter_bank->alt_sin_twiddle[idx + 1];
618
7.53M
    weight_real = pstr_qmf_synth_filter_bank->alt_sin_twiddle[length - 1 - idx];
619
620
7.53M
    accu1 = -(real_2 * weight_imag + imag_2 * weight_real);
621
7.53M
    accu2 = -(real_2 * weight_real - imag_2 * weight_imag);
622
623
7.53M
    subband[2 * idx + 1] = accu1;
624
7.53M
    subband[2 * length - 2 - 2 * idx] = accu2;
625
7.53M
  }
626
470k
}
627
628
static VOID ixheaace_mps_inverse_modulation(
629
    FLOAT32 *qmf_real, FLOAT32 *qmf_imag,
630
470k
    ixheaace_mps_sac_pstr_qmf_synth_filter_bank pstr_qmf_synth_filter_bank) {
631
470k
  WORD32 idx, no_synthesis_channels, length;
632
633
470k
  FLOAT32 r1, i1, r2, i2;
634
635
470k
  no_synthesis_channels = NUM_QMF_BANDS;
636
637
470k
  length = no_synthesis_channels / 2;
638
639
470k
  ixheaace_mps_cos_mod(qmf_real, pstr_qmf_synth_filter_bank);
640
470k
  ixheaace_mps_sin_mod(qmf_imag, pstr_qmf_synth_filter_bank);
641
642
15.5M
  for (idx = 0; idx < length; idx++) {
643
15.0M
    r1 = qmf_real[idx];
644
15.0M
    i2 = qmf_imag[no_synthesis_channels - 1 - idx];
645
15.0M
    r2 = qmf_real[no_synthesis_channels - idx - 1];
646
15.0M
    i1 = qmf_imag[idx];
647
648
15.0M
    qmf_real[idx] = (r1 - i1);
649
15.0M
    qmf_imag[no_synthesis_channels - 1 - idx] = -(r1 + i1);
650
15.0M
    qmf_real[no_synthesis_channels - idx - 1] = (r2 - i2);
651
15.0M
    qmf_imag[idx] = -(r2 + i2);
652
15.0M
  }
653
470k
}
654
655
22.3M
static VOID ixheaace_mps_fct3_4(FLOAT32 *subband) {
656
22.3M
  FLOAT32 val_00, val_01, val_10, val_11;
657
658
22.3M
  subband[1] *= MPS_INV_SQRT2;
659
660
22.3M
  val_00 = subband[0] + subband[1];
661
22.3M
  val_01 = subband[0] - subband[1];
662
663
22.3M
  val_10 = subband[2] * MPS_COS_6_PI_BY_16 + subband[3] * MPS_SIN_6_PI_BY_16;
664
22.3M
  val_11 = subband[2] * MPS_SIN_6_PI_BY_16 - subband[3] * MPS_COS_6_PI_BY_16;
665
666
22.3M
  subband[0] = val_00 + val_10;
667
22.3M
  subband[3] = val_00 - val_10;
668
22.3M
  subband[1] = val_01 + val_11;
669
22.3M
  subband[2] = val_01 - val_11;
670
22.3M
}
671
672
18.6M
static VOID ixheaace_mps_fst3_4r(FLOAT32 *subband) {
673
18.6M
  FLOAT32 val_00, val_01, val_10, val_11;
674
675
18.6M
  subband[2] *= MPS_INV_SQRT2;
676
677
18.6M
  val_00 = subband[3] + subband[2];
678
18.6M
  val_01 = subband[3] - subband[2];
679
680
18.6M
  val_10 = subband[1] * MPS_COS_6_PI_BY_16 + subband[0] * MPS_SIN_6_PI_BY_16;
681
18.6M
  val_11 = subband[0] * MPS_COS_6_PI_BY_16 - subband[1] * MPS_SIN_6_PI_BY_16;
682
683
18.6M
  subband[3] = val_00 + val_10;
684
18.6M
  subband[0] = val_10 - val_00;
685
18.6M
  subband[2] = val_11 - val_01;
686
18.6M
  subband[1] = val_11 + val_01;
687
18.6M
}
688
689
11.1M
static VOID ixheaace_mps_fct4_4r(FLOAT32 *subband) {
690
11.1M
  FLOAT32 val_00, val_01, val_10, val_11;
691
11.1M
  subband[1] *= MPS_INV_SQRT2;
692
693
11.1M
  val_00 = subband[0] + subband[1];
694
11.1M
  val_01 = subband[0] - subband[1];
695
696
11.1M
  subband[2] *= MPS_INV_SQRT2;
697
698
11.1M
  val_11 = subband[3] - subband[2];
699
11.1M
  val_10 = subband[3] + subband[2];
700
701
11.1M
  subband[3] = val_00 * MPS_COS_PI_BY_16 + val_10 * MPS_SIN_PI_BY_16;
702
11.1M
  subband[0] = val_00 * MPS_SIN_PI_BY_16 - val_10 * MPS_COS_PI_BY_16;
703
704
11.1M
  subband[2] = val_01 * MPS_COS_3_PI_BY_16 - val_11 * MPS_SIN_3_PI_BY_16;
705
11.1M
  subband[1] = val_01 * MPS_SIN_3_PI_BY_16 + val_11 * MPS_COS_3_PI_BY_16;
706
11.1M
}
707
708
7.44M
static VOID ixheaace_mps_fst4_4(FLOAT32 *subband) {
709
7.44M
  FLOAT32 val_00, val_01, val_10, val_11;
710
711
7.44M
  subband[1] *= MPS_INV_SQRT2;
712
713
7.44M
  val_10 = subband[0] + subband[1];
714
7.44M
  val_11 = subband[0] - subband[1];
715
716
7.44M
  subband[2] *= MPS_INV_SQRT2;
717
718
7.44M
  val_01 = subband[3] - subband[2];
719
7.44M
  val_00 = subband[3] + subband[2];
720
721
7.44M
  subband[0] = val_00 * MPS_COS_PI_BY_16 + val_10 * MPS_SIN_PI_BY_16;
722
7.44M
  subband[3] = val_10 * MPS_COS_PI_BY_16 - val_00 * MPS_SIN_PI_BY_16;
723
724
7.44M
  subband[1] = val_11 * MPS_SIN_3_PI_BY_16 - val_01 * MPS_COS_3_PI_BY_16;
725
7.44M
  subband[2] = val_01 * MPS_SIN_3_PI_BY_16 + val_11 * MPS_COS_3_PI_BY_16;
726
7.44M
}
727
728
3.72M
static VOID ixheaace_mps_fct3_64(FLOAT32 *subband) {
729
3.72M
  WORD32 idx;
730
3.72M
  const FLOAT32 *t_ptr;
731
3.72M
  FLOAT32 cos_val, sine_val;
732
3.72M
  FLOAT32 xp;
733
734
3.72M
  ixheaace_mps_bit_reversal(&subband[1], &subband[32]);
735
3.72M
  ixheaace_mps_bit_reversal(&subband[2], &subband[16]);
736
3.72M
  ixheaace_mps_bit_reversal(&subband[3], &subband[48]);
737
3.72M
  ixheaace_mps_bit_reversal(&subband[4], &subband[8]);
738
3.72M
  ixheaace_mps_bit_reversal(&subband[5], &subband[40]);
739
3.72M
  ixheaace_mps_bit_reversal(&subband[6], &subband[24]);
740
3.72M
  ixheaace_mps_bit_reversal(&subband[7], &subband[56]);
741
3.72M
  ixheaace_mps_bit_reversal(&subband[9], &subband[36]);
742
3.72M
  ixheaace_mps_bit_reversal(&subband[10], &subband[20]);
743
3.72M
  ixheaace_mps_bit_reversal(&subband[11], &subband[52]);
744
3.72M
  ixheaace_mps_bit_reversal(&subband[13], &subband[44]);
745
3.72M
  ixheaace_mps_bit_reversal(&subband[14], &subband[28]);
746
3.72M
  ixheaace_mps_bit_reversal(&subband[15], &subband[60]);
747
3.72M
  ixheaace_mps_bit_reversal(&subband[17], &subband[34]);
748
3.72M
  ixheaace_mps_bit_reversal(&subband[19], &subband[50]);
749
3.72M
  ixheaace_mps_bit_reversal(&subband[21], &subband[42]);
750
3.72M
  ixheaace_mps_bit_reversal(&subband[22], &subband[26]);
751
3.72M
  ixheaace_mps_bit_reversal(&subband[23], &subband[58]);
752
3.72M
  ixheaace_mps_bit_reversal(&subband[25], &subband[38]);
753
3.72M
  ixheaace_mps_bit_reversal(&subband[27], &subband[54]);
754
3.72M
  ixheaace_mps_bit_reversal(&subband[29], &subband[46]);
755
3.72M
  ixheaace_mps_bit_reversal(&subband[31], &subband[62]);
756
3.72M
  ixheaace_mps_bit_reversal(&subband[35], &subband[49]);
757
3.72M
  ixheaace_mps_bit_reversal(&subband[37], &subband[41]);
758
3.72M
  ixheaace_mps_bit_reversal(&subband[39], &subband[57]);
759
3.72M
  ixheaace_mps_bit_reversal(&subband[43], &subband[53]);
760
3.72M
  ixheaace_mps_bit_reversal(&subband[47], &subband[61]);
761
3.72M
  ixheaace_mps_bit_reversal(&subband[55], &subband[59]);
762
763
3.72M
  ixheaace_mps_bit_add_sub1(&subband[33], &subband[62]);
764
3.72M
  ixheaace_mps_bit_add_sub1(&subband[34], &subband[60]);
765
3.72M
  ixheaace_mps_bit_add_sub1(&subband[35], &subband[61]);
766
3.72M
  ixheaace_mps_bit_add_sub1(&subband[36], &subband[56]);
767
3.72M
  ixheaace_mps_bit_add_sub1(&subband[37], &subband[57]);
768
3.72M
  ixheaace_mps_bit_add_sub1(&subband[38], &subband[58]);
769
3.72M
  ixheaace_mps_bit_add_sub1(&subband[39], &subband[59]);
770
3.72M
  ixheaace_mps_bit_add_sub1(&subband[40], &subband[48]);
771
3.72M
  ixheaace_mps_bit_add_sub1(&subband[41], &subband[49]);
772
3.72M
  ixheaace_mps_bit_add_sub1(&subband[42], &subband[50]);
773
3.72M
  ixheaace_mps_bit_add_sub1(&subband[43], &subband[51]);
774
3.72M
  ixheaace_mps_bit_add_sub1(&subband[44], &subband[52]);
775
3.72M
  ixheaace_mps_bit_add_sub1(&subband[45], &subband[53]);
776
3.72M
  ixheaace_mps_bit_add_sub1(&subband[46], &subband[54]);
777
3.72M
  ixheaace_mps_bit_add_sub1(&subband[47], &subband[55]);
778
3.72M
  ixheaace_mps_bit_add_sub1(&subband[17], &subband[30]);
779
3.72M
  ixheaace_mps_bit_add_sub1(&subband[18], &subband[28]);
780
3.72M
  ixheaace_mps_bit_add_sub1(&subband[19], &subband[29]);
781
3.72M
  ixheaace_mps_bit_add_sub1(&subband[20], &subband[24]);
782
3.72M
  ixheaace_mps_bit_add_sub1(&subband[21], &subband[25]);
783
3.72M
  ixheaace_mps_bit_add_sub1(&subband[22], &subband[26]);
784
3.72M
  ixheaace_mps_bit_add_sub1(&subband[23], &subband[27]);
785
3.72M
  ixheaace_mps_bit_add_sub1(&subband[9], &subband[14]);
786
3.72M
  ixheaace_mps_bit_add_sub1(&subband[10], &subband[12]);
787
3.72M
  ixheaace_mps_bit_add_sub1(&subband[11], &subband[13]);
788
3.72M
  ixheaace_mps_bit_add_sub1(&subband[41], &subband[46]);
789
3.72M
  ixheaace_mps_bit_add_sub1(&subband[42], &subband[44]);
790
3.72M
  ixheaace_mps_bit_add_sub1(&subband[43], &subband[45]);
791
3.72M
  ixheaace_mps_bit_add_sub1(&subband[54], &subband[49]);
792
3.72M
  ixheaace_mps_bit_add_sub1(&subband[52], &subband[50]);
793
3.72M
  ixheaace_mps_bit_add_sub1(&subband[53], &subband[51]);
794
3.72M
  ixheaace_mps_bit_add_sub1(&subband[5], &subband[6]);
795
3.72M
  ixheaace_mps_bit_add_sub1(&subband[21], &subband[22]);
796
3.72M
  ixheaace_mps_bit_add_sub1(&subband[26], &subband[25]);
797
3.72M
  ixheaace_mps_bit_add_sub1(&subband[37], &subband[38]);
798
3.72M
  ixheaace_mps_bit_add_sub1(&subband[58], &subband[57]);
799
800
3.72M
  ixheaace_mps_fct3_4(subband);
801
3.72M
  ixheaace_mps_fct4_4r(subband + 4);
802
3.72M
  ixheaace_mps_fct3_4(subband + 8);
803
3.72M
  ixheaace_mps_fst3_4r(subband + 12);
804
3.72M
  ixheaace_mps_fct3_4(subband + 16);
805
3.72M
  ixheaace_mps_fct4_4r(subband + 20);
806
3.72M
  ixheaace_mps_fst4_4(subband + 24);
807
3.72M
  ixheaace_mps_fst3_4r(subband + 28);
808
3.72M
  ixheaace_mps_fct3_4(subband + 32);
809
3.72M
  ixheaace_mps_fct4_4r(subband + 36);
810
3.72M
  ixheaace_mps_fct3_4(subband + 40);
811
3.72M
  ixheaace_mps_fst3_4r(subband + 44);
812
3.72M
  ixheaace_mps_fct3_4(subband + 48);
813
3.72M
  ixheaace_mps_fst3_4r(subband + 52);
814
3.72M
  ixheaace_mps_fst4_4(subband + 56);
815
3.72M
  ixheaace_mps_fst3_4r(subband + 60);
816
817
18.6M
  for (idx = 0; idx < 4; idx++) {
818
14.8M
    ixheaace_mps_bit_add_sub2(&subband[idx], &subband[7 - idx]);
819
14.8M
    ixheaace_mps_bit_add_sub2(&subband[16 + idx], &subband[23 - idx]);
820
14.8M
    ixheaace_mps_bit_add_sub1(&subband[31 - idx], &subband[24 + idx]);
821
14.8M
    ixheaace_mps_bit_add_sub2(&subband[32 + idx], &subband[39 - idx]);
822
14.8M
    ixheaace_mps_bit_add_sub1(&subband[63 - idx], &subband[56 + idx]);
823
14.8M
  }
824
3.72M
  t_ptr = trig_data_fct4_8;
825
826
18.6M
  for (idx = 0; idx < 4; idx++) {
827
14.8M
    cos_val = *t_ptr++;
828
14.8M
    sine_val = *t_ptr++;
829
830
14.8M
    xp = subband[8 + idx] * cos_val + subband[15 - idx] * sine_val;
831
14.8M
    subband[8 + idx] = subband[8 + idx] * sine_val - subband[15 - idx] * cos_val;
832
14.8M
    subband[15 - idx] = xp;
833
14.8M
    xp = subband[40 + idx] * cos_val + subband[47 - idx] * sine_val;
834
14.8M
    subband[40 + idx] = subband[40 + idx] * sine_val - subband[47 - idx] * cos_val;
835
14.8M
    subband[47 - idx] = xp;
836
14.8M
    xp = subband[48 + idx] * sine_val + subband[55 - idx] * cos_val;
837
14.8M
    subband[55 - idx] = subband[48 + idx] * cos_val - subband[55 - idx] * sine_val;
838
14.8M
    subband[48 + idx] = xp;
839
14.8M
  }
840
841
33.4M
  for (idx = 0; idx < 8; idx++) {
842
29.7M
    ixheaace_mps_bit_add_sub2(&subband[idx], &subband[15 - idx]);
843
29.7M
    ixheaace_mps_bit_add_sub2(&subband[32 + idx], &subband[47 - idx]);
844
29.7M
    ixheaace_mps_bit_add_sub1(&subband[63 - idx], &subband[48 + idx]);
845
29.7M
  }
846
847
3.72M
  t_ptr = trig_data_fct4_16;
848
849
33.4M
  for (idx = 0; idx < 8; idx++) {
850
29.7M
    cos_val = *t_ptr++;
851
29.7M
    sine_val = *t_ptr++;
852
853
29.7M
    xp = subband[16 + idx] * cos_val + subband[31 - idx] * sine_val;
854
29.7M
    subband[16 + idx] = subband[16 + idx] * sine_val - subband[31 - idx] * cos_val;
855
29.7M
    subband[31 - idx] = xp;
856
29.7M
  }
857
858
63.2M
  for (idx = 0; idx < 16; idx++) {
859
59.5M
    ixheaace_mps_bit_add_sub2(&subband[idx], &subband[31 - idx]);
860
59.5M
  }
861
862
3.72M
  t_ptr = trig_data_fct4_32;
863
864
63.2M
  for (idx = 0; idx < 16; idx++) {
865
59.5M
    cos_val = *t_ptr++;
866
59.5M
    sine_val = *t_ptr++;
867
868
59.5M
    xp = subband[32 + idx] * cos_val + subband[63 - idx] * sine_val;
869
59.5M
    subband[32 + idx] = subband[32 + idx] * sine_val - subband[63 - idx] * cos_val;
870
59.5M
    subband[63 - idx] = xp;
871
59.5M
  }
872
873
122M
  for (idx = 0; idx < 32; idx++) {
874
119M
    ixheaace_mps_bit_add_sub2(&subband[idx], &subband[63 - idx]);
875
119M
  }
876
3.72M
}
877
878
1.86M
static VOID ixheaace_mps_fst3_64(FLOAT32 *subband) {
879
1.86M
  WORD32 k;
880
881
61.4M
  for (k = 0; k < 32; k++) {
882
59.5M
    ixheaace_mps_bit_reversal(&subband[k], &subband[63 - k]);
883
59.5M
  }
884
885
1.86M
  ixheaace_mps_fct3_64(subband);
886
887
61.4M
  for (k = 1; k < NUM_QMF_BANDS; k += 2) {
888
59.5M
    subband[k] = -subband[k];
889
59.5M
  }
890
1.86M
}
891
892
static VOID ixheaace_mps_forward_modulation(const FLOAT32 *time_in, FLOAT32 *real_subband,
893
1.86M
                                            FLOAT32 *imag_subband) {
894
1.86M
  WORD32 idx;
895
1.86M
  real_subband[0] = time_in[0];
896
897
119M
  for (idx = 1; idx < NUM_QMF_BANDS; idx++) {
898
117M
    real_subband[idx] = time_in[idx] - time_in[(NUM_QMF_BANDS * 2) - idx];
899
117M
    imag_subband[idx - 1] = time_in[idx] + time_in[(NUM_QMF_BANDS * 2) - idx];
900
117M
  }
901
902
1.86M
  imag_subband[63] = time_in[NUM_QMF_BANDS];
903
904
1.86M
  ixheaace_mps_fct3_64(real_subband);
905
906
1.86M
  ixheaace_mps_fst3_64(imag_subband);
907
1.86M
}
908
909
VOID ixheaace_mps_515_calculate_sbr_syn_filterbank(
910
    FLOAT32 *real_subband, FLOAT32 *imag_subband, FLOAT32 *time_sig, WORD32 channel,
911
    ixheaace_mps_sac_pstr_qmf_synth_filter_bank pstr_qmf_synth_filter_bank, WORD32 slots,
912
30.3k
    FLOAT32 *sbr_qmf_states_synthesis_per) {
913
30.3k
  WORD32 idx, subband, slot;
914
30.3k
  const FLOAT32 *ptr_filter;
915
30.3k
  FLOAT32 accumlate;
916
30.3k
  FLOAT32 *synth_buf;
917
918
30.3k
  synth_buf = &(sbr_qmf_states_synthesis_per[channel * QMF_FILTER_STATE_SYN_SIZE]);
919
920
501k
  for (slot = 0; slot < slots; slot++) {
921
470k
    ptr_filter = pstr_qmf_synth_filter_bank->p_filter;
922
470k
    ixheaace_mps_inverse_modulation(real_subband + NUM_QMF_BANDS * slot,
923
470k
                                    imag_subband + NUM_QMF_BANDS * slot,
924
470k
                                    pstr_qmf_synth_filter_bank);
925
926
30.5M
    for (subband = 0; subband < NUM_QMF_BANDS; subband++) {
927
30.1M
      real_subband[NUM_QMF_BANDS * slot + subband] =
928
30.1M
          real_subband[NUM_QMF_BANDS * slot + subband] * (-0.015625f);
929
30.1M
      imag_subband[NUM_QMF_BANDS * slot + subband] =
930
30.1M
          imag_subband[NUM_QMF_BANDS * slot + subband] * (-0.015625f);
931
30.1M
    }
932
933
30.5M
    for (subband = 0; subband < NUM_QMF_BANDS; subband++) {
934
30.1M
      FLOAT32 new_sample;
935
30.1M
      new_sample = imag_subband[NUM_QMF_BANDS * slot + 63 - subband];
936
937
180M
      for (idx = 0; idx < 5; idx++) {
938
150M
        accumlate = synth_buf[2 * idx * NUM_QMF_BANDS + subband] + (*ptr_filter++) * new_sample;
939
150M
        synth_buf[2 * idx * NUM_QMF_BANDS + subband] = accumlate;
940
150M
      }
941
30.1M
    }
942
943
2.82M
    for (idx = 0; idx < 5; idx++) {
944
2.35M
      accumlate = synth_buf[2 * idx * NUM_QMF_BANDS + NUM_QMF_BANDS + (NUM_QMF_BANDS - 1)] +
945
2.35M
                  (*ptr_filter++) * real_subband[NUM_QMF_BANDS * slot];
946
2.35M
      synth_buf[2 * idx * NUM_QMF_BANDS + NUM_QMF_BANDS + (NUM_QMF_BANDS - 1)] = accumlate;
947
2.35M
    }
948
470k
    time_sig[0] = accumlate;
949
950
470k
    ptr_filter -= 10;
951
952
30.1M
    for (subband = 0; subband < 63; subband++) {
953
29.6M
      FLOAT32 new_sample;
954
955
29.6M
      new_sample = real_subband[NUM_QMF_BANDS * slot + 63 - subband];
956
957
177M
      for (idx = 0; idx < 5; idx++) {
958
148M
        accumlate = synth_buf[2 * idx * NUM_QMF_BANDS + NUM_QMF_BANDS + subband] +
959
148M
                    (*--ptr_filter) * new_sample;
960
148M
        synth_buf[2 * idx * NUM_QMF_BANDS + NUM_QMF_BANDS + subband] = accumlate;
961
148M
      }
962
963
29.6M
      time_sig[NUM_QMF_BANDS - 1 - subband] = accumlate;
964
29.6M
    }
965
966
470k
    time_sig += NUM_QMF_BANDS;
967
968
470k
    memmove((synth_buf + NUM_QMF_BANDS), synth_buf, (640 - NUM_QMF_BANDS) * sizeof(FLOAT32));
969
970
470k
    memset((synth_buf), 0, NUM_QMF_BANDS * sizeof(FLOAT32));
971
470k
  }
972
30.3k
}
973
974
VOID ixheaace_mps_515_calculate_ana_filterbank(
975
    ixheaace_mps_sac_sbr_encoder_ana_filter_bank *pstr_sbr_enc_ana_filter_bank, FLOAT32 *time_sig,
976
    FLOAT32 *real_subband, FLOAT32 *imag_subband,
977
1.86M
    ixheaace_mps_sac_pstr_qmf_ana_filter_bank pstr_qmf_synth_filter_bank) {
978
1.86M
  WORD32 idx;
979
1.86M
  FLOAT32 temp_array[128];
980
1.86M
  const FLOAT32 *ptr_filter = pstr_qmf_synth_filter_bank->p_filter;
981
1.86M
  FLOAT32 accumlate;
982
983
1.07G
  for (idx = 0; idx < 576; idx++) {
984
1.07G
    pstr_sbr_enc_ana_filter_bank->x[idx] = pstr_sbr_enc_ana_filter_bank->x[idx + NUM_QMF_BANDS];
985
1.07G
  }
986
120M
  for (idx = 0; idx < NUM_QMF_BANDS; idx++) {
987
119M
    pstr_sbr_enc_ana_filter_bank->x[idx + 576] = time_sig[idx];
988
119M
  }
989
990
120M
  for (idx = 0; idx < NUM_QMF_BANDS; idx++) {
991
119M
    accumlate = 0.0f;
992
119M
    accumlate += (*ptr_filter++ * pstr_sbr_enc_ana_filter_bank->x[idx]);
993
119M
    accumlate += (*ptr_filter++ * pstr_sbr_enc_ana_filter_bank->x[idx + (NUM_QMF_BANDS * 2)]);
994
119M
    accumlate += (*ptr_filter++ * pstr_sbr_enc_ana_filter_bank->x[idx + (NUM_QMF_BANDS * 4)]);
995
119M
    accumlate += (*ptr_filter++ * pstr_sbr_enc_ana_filter_bank->x[idx + (NUM_QMF_BANDS * 6)]);
996
119M
    accumlate += (*ptr_filter++ * pstr_sbr_enc_ana_filter_bank->x[idx + (NUM_QMF_BANDS * 8)]);
997
119M
    temp_array[127 - idx] = accumlate;
998
119M
  }
999
1000
1.86M
  accumlate = 0.0f;
1001
11.1M
  for (idx = 0; idx < 5; idx++) {
1002
9.30M
    accumlate +=
1003
9.30M
        (*ptr_filter++ * pstr_sbr_enc_ana_filter_bank->x[127 + idx * (NUM_QMF_BANDS * 2)]);
1004
9.30M
  }
1005
1.86M
  temp_array[0] = accumlate;
1006
1007
1.86M
  ptr_filter -= 10;
1008
119M
  for (idx = 0; idx < 63; idx++) {
1009
117M
    accumlate = 0.0f;
1010
117M
    accumlate += (*--ptr_filter * pstr_sbr_enc_ana_filter_bank->x[NUM_QMF_BANDS + idx]);
1011
117M
    accumlate += (*--ptr_filter *
1012
117M
                  pstr_sbr_enc_ana_filter_bank->x[NUM_QMF_BANDS + idx + (NUM_QMF_BANDS * 2)]);
1013
117M
    accumlate += (*--ptr_filter *
1014
117M
                  pstr_sbr_enc_ana_filter_bank->x[NUM_QMF_BANDS + idx + (NUM_QMF_BANDS * 4)]);
1015
117M
    accumlate += (*--ptr_filter *
1016
117M
                  pstr_sbr_enc_ana_filter_bank->x[NUM_QMF_BANDS + idx + (NUM_QMF_BANDS * 6)]);
1017
117M
    accumlate += (*--ptr_filter *
1018
117M
                  pstr_sbr_enc_ana_filter_bank->x[NUM_QMF_BANDS + idx + (NUM_QMF_BANDS * 8)]);
1019
117M
    temp_array[63 - idx] = accumlate;
1020
117M
  }
1021
1022
1.86M
  ixheaace_mps_forward_modulation(temp_array, real_subband, imag_subband);
1023
1.86M
}