/src/libxaac/encoder/iusace_avq_enc.c
Line | Count | Source (jump to first uncovered line) |
1 | | /****************************************************************************** |
2 | | * * |
3 | | * Copyright (C) 2023 The Android Open Source Project |
4 | | * |
5 | | * Licensed under the Apache License, Version 2.0 (the "License"); |
6 | | * you may not use this file except in compliance with the License. |
7 | | * You may obtain a copy of the License at: |
8 | | * |
9 | | * http://www.apache.org/licenses/LICENSE-2.0 |
10 | | * |
11 | | * Unless required by applicable law or agreed to in writing, software |
12 | | * distributed under the License is distributed on an "AS IS" BASIS, |
13 | | * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
14 | | * See the License for the specific language governing permissions and |
15 | | * limitations under the License. |
16 | | * |
17 | | ***************************************************************************** |
18 | | * Originally developed and contributed by Ittiam Systems Pvt. Ltd, Bangalore |
19 | | */ |
20 | | |
21 | | #include <math.h> |
22 | | #include <stdlib.h> |
23 | | #include "ixheaac_type_def.h" |
24 | | #include "iusace_avq_enc.h" |
25 | | |
26 | 3.33M | static VOID iusace_gosset_compute_rank_and_sign(WORD32 *x, WORD32 *rank, WORD32 *sign_code) { |
27 | 3.33M | WORD32 xs[8], a[8], q, d[8], w[8], A, B, idx, tmp, abs_i, abs_j; |
28 | 3.33M | WORD32 i, j, k; |
29 | 29.9M | for (i = 0; i < 8; i++) { |
30 | 26.6M | xs[i] = x[i]; |
31 | 26.6M | } |
32 | 26.6M | for (k = 0; k < 7; k++) { |
33 | 23.3M | j = k; |
34 | 116M | for (i = k + 1; i < 8; i++) { |
35 | 93.2M | abs_j = abs(xs[j]); |
36 | 93.2M | abs_i = abs(xs[i]); |
37 | 93.2M | if (abs_i >= abs_j) { |
38 | 67.9M | if (abs_i > xs[j]) { |
39 | 25.1M | j = i; |
40 | 25.1M | } |
41 | 67.9M | } |
42 | 93.2M | } |
43 | 23.3M | if (j > k) { |
44 | 12.9M | tmp = xs[k]; |
45 | 12.9M | xs[k] = xs[j]; |
46 | 12.9M | xs[j] = tmp; |
47 | 12.9M | } |
48 | 23.3M | } |
49 | 3.33M | *sign_code = 0; |
50 | 29.9M | for (i = 0; i < 8; i++) { |
51 | 26.6M | if (xs[i] < 0) { |
52 | 8.96M | *sign_code += iusace_pow2_table[i]; |
53 | 8.96M | } |
54 | 26.6M | } |
55 | 3.33M | a[0] = xs[0]; |
56 | 3.33M | q = 1; |
57 | 26.6M | for (i = 1; i < 8; i++) { |
58 | 23.3M | if (xs[i] != xs[i - 1]) { |
59 | 5.74M | a[q] = xs[i]; |
60 | 5.74M | q++; |
61 | 5.74M | } |
62 | 23.3M | } |
63 | 29.9M | for (i = 0; i < 8; i++) { |
64 | 54.9M | for (j = 0; j < q; j++) { |
65 | 54.9M | if (x[i] == a[j]) { |
66 | 26.6M | d[i] = j; |
67 | 26.6M | break; |
68 | 26.6M | } |
69 | 54.9M | } |
70 | 26.6M | } |
71 | 3.33M | *rank = 0; |
72 | 12.4M | for (j = 0; j < q; j++) { |
73 | 9.07M | w[j] = 0; |
74 | 9.07M | } |
75 | 3.33M | B = 1; |
76 | 29.9M | for (i = 7; i >= 0; i--) { |
77 | 26.6M | idx = d[i]; |
78 | 26.6M | w[idx]++; |
79 | 26.6M | B *= w[idx]; |
80 | 26.6M | A = 0; |
81 | 54.9M | for (j = 0; j < idx; j++) { |
82 | 28.3M | A += w[j]; |
83 | 28.3M | } |
84 | 26.6M | if (A > 0) { |
85 | 9.80M | *rank += A * iusace_factorial_table[i] / B; |
86 | 9.80M | } |
87 | 26.6M | } |
88 | 3.33M | } |
89 | | |
90 | 3.33M | static VOID iusace_gosset_compute_base_idx(WORD32 *x, WORD32 ka, WORD32 *idx) { |
91 | 3.33M | WORD32 rank, offset, code, i, ks; |
92 | 3.33M | iusace_gosset_compute_rank_and_sign(x, &rank, &code); |
93 | 3.33M | ks = -1; |
94 | 13.6M | for (i = iusace_iso_code_index_table[ka]; i < LEN_SIGN_LEADER; i++) { |
95 | 13.6M | if (code == iusace_iso_code_data_table[i]) { |
96 | 3.33M | ks = i; |
97 | 3.33M | break; |
98 | 3.33M | } |
99 | 13.6M | } |
100 | 3.33M | if (ks == -1) { |
101 | 0 | ks = 0; |
102 | 0 | } |
103 | 3.33M | offset = iusace_signed_leader_is[ks]; |
104 | 3.33M | *idx = offset + rank; |
105 | 3.33M | return; |
106 | 3.33M | } |
107 | | |
108 | 8.04M | static WORD32 iusace_find_absolute_leader(WORD32 *y) { |
109 | 8.04M | WORD32 i, nb, pos, ka; |
110 | 8.04M | WORD64 s, C[8], id; |
111 | 72.3M | for (i = 0; i < 8; i++) { |
112 | 64.3M | C[i] = (WORD64)y[i] * y[i]; |
113 | 64.3M | } |
114 | 8.04M | s = 0; |
115 | 72.3M | for (i = 0; i < 8; i++) { |
116 | 64.3M | s += C[i]; |
117 | 64.3M | } |
118 | 8.04M | s >>= 3; |
119 | 8.04M | ka = LEN_ABS_LEADER + 1; |
120 | 8.04M | if (s == 0) { |
121 | 1.26M | ka = LEN_ABS_LEADER; |
122 | 6.77M | } else { |
123 | 6.77M | if (s <= NB_SPHERE) { |
124 | 6.09M | id = 0; |
125 | 54.8M | for (i = 0; i < 8; i++) { |
126 | 48.7M | id += C[i] * C[i]; |
127 | 48.7M | } |
128 | 6.09M | id = id >> 3; |
129 | 6.09M | nb = iusace_da_num_bits[s - 1]; |
130 | 6.09M | pos = iusace_da_pos[s - 1]; |
131 | 11.7M | for (i = 0; i < nb; i++) { |
132 | 9.00M | if (id == (long)iusace_da_id[pos]) { |
133 | 3.33M | ka = pos; |
134 | 3.33M | break; |
135 | 3.33M | } |
136 | 5.66M | pos++; |
137 | 5.66M | } |
138 | 6.09M | } |
139 | 6.77M | } |
140 | 8.04M | return (ka); |
141 | 8.04M | } |
142 | | |
143 | 59.4M | static VOID iusace_nearest_neighbor_2d(FLOAT32 *x, WORD32 *y) { |
144 | 59.4M | WORD32 i, j; |
145 | 59.4M | WORD64 sum; |
146 | 59.4M | FLOAT32 diff[8], em; |
147 | 59.4M | sum = 0; |
148 | 535M | for (i = 0; i < 8; i++) { |
149 | 475M | if (x[i] < 0) { |
150 | 305M | y[i] = -2 * (((WORD32)(1.0 - x[i])) >> 1); |
151 | 305M | } else { |
152 | 170M | y[i] = 2 * (((WORD32)(1.0 + x[i])) >> 1); |
153 | 170M | } |
154 | 475M | sum += y[i]; |
155 | 475M | } |
156 | 59.4M | if (sum % 4) { |
157 | 21.1M | FLOAT32 s; |
158 | 21.1M | em = 0; |
159 | 21.1M | j = 0; |
160 | 190M | for (i = 0; i < 8; i++) { |
161 | 169M | diff[i] = x[i] - y[i]; |
162 | 169M | s = (FLOAT32)fabs(diff[i]); |
163 | 169M | if (em < s) { |
164 | 50.5M | em = s; |
165 | 50.5M | j = i; |
166 | 50.5M | } |
167 | 169M | } |
168 | 21.1M | if (diff[j] < 0) { |
169 | 10.1M | y[j] -= 2; |
170 | 11.0M | } else { |
171 | 11.0M | y[j] += 2; |
172 | 11.0M | } |
173 | 21.1M | } |
174 | 59.4M | return; |
175 | 59.4M | } |
176 | | |
177 | 29.7M | VOID iusace_find_nearest_neighbor(FLOAT32 *bk, WORD32 *ck) { |
178 | 29.7M | WORD32 i, y1[8], y2[8]; |
179 | 29.7M | FLOAT32 e1k, e2k, x1[8], tmp; |
180 | | |
181 | 29.7M | iusace_nearest_neighbor_2d(bk, y1); |
182 | | |
183 | 267M | for (i = 0; i < 8; i++) { |
184 | 237M | x1[i] = bk[i] - 1.0f; |
185 | 237M | } |
186 | 29.7M | iusace_nearest_neighbor_2d(x1, y2); |
187 | 267M | for (i = 0; i < 8; i++) { |
188 | 237M | y2[i] += 1; |
189 | 237M | } |
190 | | /* Compute e1k = (Bk - y1k)^2 and e2k = (Bk – y2k)^2 */ |
191 | 29.7M | e1k = e2k = 0.0; |
192 | 267M | for (i = 0; i < 8; i++) { |
193 | 237M | tmp = bk[i] - y1[i]; |
194 | 237M | e1k += tmp * tmp; |
195 | 237M | tmp = bk[i] - y2[i]; |
196 | 237M | e2k += tmp * tmp; |
197 | 237M | } |
198 | | |
199 | | /* Select best lattice point */ |
200 | 29.7M | if (e1k < e2k) { |
201 | 193M | for (i = 0; i < 8; i++) { |
202 | 172M | ck[i] = y1[i]; |
203 | 172M | } |
204 | 21.5M | } else { |
205 | 73.9M | for (i = 0; i < 8; i++) { |
206 | 65.7M | ck[i] = y2[i]; |
207 | 65.7M | } |
208 | 8.21M | } |
209 | 29.7M | return; |
210 | 29.7M | } |
211 | | |
212 | 3.44M | static VOID iusace_vononoi_idx(WORD32 *kv, WORD32 m, WORD32 *y) { |
213 | 3.44M | WORD32 i, v[8], tmp, sum, *ptr1, *ptr2; |
214 | 3.44M | FLOAT32 z[8]; |
215 | 30.9M | for (i = 0; i < 8; i++) { |
216 | 27.5M | y[i] = kv[7]; |
217 | 27.5M | } |
218 | 3.44M | z[7] = (FLOAT32)y[7] / m; |
219 | 3.44M | sum = 0; |
220 | 24.0M | for (i = 6; i >= 1; i--) { |
221 | 20.6M | tmp = kv[i] << 1; |
222 | 20.6M | sum += tmp; |
223 | 20.6M | y[i] += tmp; |
224 | 20.6M | z[i] = (FLOAT32)y[i] / m; |
225 | 20.6M | } |
226 | 3.44M | y[0] += (4 * kv[0] + sum); |
227 | 3.44M | z[0] = (FLOAT32)(y[0] - 2) / m; |
228 | 3.44M | iusace_find_nearest_neighbor(z, v); |
229 | 3.44M | ptr1 = y; |
230 | 3.44M | ptr2 = v; |
231 | 30.9M | for (i = 0; i < 8; i++) { |
232 | 27.5M | *ptr1++ -= m * *ptr2++; |
233 | 27.5M | } |
234 | 3.44M | } |
235 | | |
236 | 1.72M | static VOID iusace_compute_coord(WORD32 *y, WORD32 *k) { |
237 | 1.72M | WORD32 i, tmp, sum; |
238 | 1.72M | k[7] = y[7]; |
239 | 1.72M | tmp = y[7]; |
240 | 1.72M | sum = 5 * y[7]; |
241 | 12.0M | for (i = 6; i >= 1; i--) { |
242 | 10.3M | k[i] = (y[i] - tmp) >> 1; |
243 | 10.3M | sum -= y[i]; |
244 | 10.3M | } |
245 | 1.72M | k[0] = (y[0] + sum) >> 2; |
246 | 1.72M | } |
247 | | |
248 | 4.59M | VOID iusace_apply_voronoi_ext(WORD32 *x, WORD32 *n, WORD32 *idx, WORD32 *k) { |
249 | 4.59M | WORD32 ka, c[8]; |
250 | 4.59M | WORD32 i, r, m, v[8], c_tmp[8], k_mod[8], k_tmp[8], iter, ka_tmp, n_tmp, mask; |
251 | 4.59M | FLOAT32 sphere; |
252 | 4.59M | ka = iusace_find_absolute_leader(x); |
253 | 4.59M | *n = iusace_da_nq[ka]; |
254 | 4.59M | if (*n <= 4) { |
255 | 25.9M | for (i = 0; i < 8; i++) { |
256 | 23.0M | c[i] = x[i]; |
257 | 23.0M | } |
258 | 2.87M | } else { |
259 | 1.72M | sphere = 0.0; |
260 | 15.4M | for (i = 0; i < 8; i++) { |
261 | 13.7M | sphere += (FLOAT32)x[i] * (FLOAT32)x[i]; |
262 | 13.7M | } |
263 | 1.72M | sphere *= 0.125; |
264 | 1.72M | r = 1; |
265 | 1.72M | sphere *= 0.25; |
266 | 2.69M | while (sphere > 11.0) { |
267 | 973k | r++; |
268 | 973k | sphere *= 0.25; |
269 | 973k | } |
270 | 1.72M | iusace_compute_coord(x, k_mod); |
271 | 1.72M | m = 1 << r; |
272 | 1.72M | mask = m - 1; |
273 | 5.16M | for (iter = 0; iter < 2; iter++) { |
274 | 30.9M | for (i = 0; i < 8; i++) { |
275 | 27.5M | k_tmp[i] = k_mod[i] & mask; |
276 | 27.5M | } |
277 | 3.44M | iusace_vononoi_idx(k_tmp, m, v); |
278 | 30.9M | for (i = 0; i < 8; i++) { |
279 | 27.5M | c_tmp[i] = (x[i] - v[i]) / m; |
280 | 27.5M | } |
281 | 3.44M | ka_tmp = iusace_find_absolute_leader(c_tmp); |
282 | 3.44M | n_tmp = iusace_da_nq[ka_tmp]; |
283 | 3.44M | if (n_tmp > 4) { |
284 | 1.71M | r++; |
285 | 1.71M | m = m << 1; |
286 | 1.71M | mask = ((mask << 1) + 1); |
287 | 1.72M | } else { |
288 | 1.72M | if (n_tmp < 3) { |
289 | 180k | n_tmp = 3; |
290 | 180k | } |
291 | 1.72M | ka = ka_tmp; |
292 | 1.72M | *n = n_tmp + 2 * r; |
293 | 15.5M | for (i = 0; i < 8; i++) { |
294 | 13.8M | k[i] = k_tmp[i]; |
295 | 13.8M | } |
296 | 15.5M | for (i = 0; i < 8; i++) { |
297 | 13.8M | c[i] = c_tmp[i]; |
298 | 13.8M | } |
299 | 1.72M | r--; |
300 | 1.72M | m = m >> 1; |
301 | 1.72M | mask = mask >> 1; |
302 | 1.72M | } |
303 | 3.44M | } |
304 | 1.72M | } |
305 | | |
306 | 4.59M | if (*n > 0) { |
307 | 3.33M | iusace_gosset_compute_base_idx(c, ka, idx); |
308 | 3.33M | } |
309 | 4.59M | return; |
310 | 4.59M | } |
311 | | |
312 | 1.13M | VOID iusace_alg_vec_quant(FLOAT32 *ptr_input, WORD32 *ptr_out, WORD32 *ptr_lpc_idx) { |
313 | 1.13M | WORD32 i, l, nq, pos, c[8], kv[8]; |
314 | 1.13M | FLOAT32 x1[8]; |
315 | 1.13M | WORD32 lpc_index; |
316 | | |
317 | 1.13M | pos = 2; |
318 | 3.40M | for (l = 0; l < 2; l++) { |
319 | 20.4M | for (i = 0; i < 8; i++) { |
320 | 18.1M | x1[i] = ptr_input[l * 8 + i]; |
321 | 18.1M | kv[i] = 0; |
322 | 18.1M | } |
323 | | |
324 | 2.27M | iusace_find_nearest_neighbor(x1, c); |
325 | | |
326 | 2.27M | iusace_apply_voronoi_ext(c, &nq, &lpc_index, kv); |
327 | | |
328 | 20.4M | for (i = 0; i < 8; i++) { |
329 | 18.1M | ptr_out[l * 8 + i] = c[i]; |
330 | 18.1M | } |
331 | | |
332 | 2.27M | ptr_lpc_idx[l] = nq; |
333 | | |
334 | 2.27M | if (nq > 0) { |
335 | 1.96M | ptr_lpc_idx[pos++] = lpc_index; |
336 | 17.7M | for (i = 0; i < 8; i++) { |
337 | 15.7M | ptr_lpc_idx[pos++] = kv[i]; |
338 | 15.7M | } |
339 | 1.96M | } |
340 | 2.27M | } |
341 | | |
342 | 1.13M | return; |
343 | 1.13M | } |