/src/ffmpeg/libavcodec/flacenc.c
Line | Count | Source |
1 | | /* |
2 | | * FLAC audio encoder |
3 | | * Copyright (c) 2006 Justin Ruggles <justin.ruggles@gmail.com> |
4 | | * |
5 | | * This file is part of FFmpeg. |
6 | | * |
7 | | * FFmpeg is free software; you can redistribute it and/or |
8 | | * modify it under the terms of the GNU Lesser General Public |
9 | | * License as published by the Free Software Foundation; either |
10 | | * version 2.1 of the License, or (at your option) any later version. |
11 | | * |
12 | | * FFmpeg is distributed in the hope that it will be useful, |
13 | | * but WITHOUT ANY WARRANTY; without even the implied warranty of |
14 | | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU |
15 | | * Lesser General Public License for more details. |
16 | | * |
17 | | * You should have received a copy of the GNU Lesser General Public |
18 | | * License along with FFmpeg; if not, write to the Free Software |
19 | | * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA |
20 | | */ |
21 | | |
22 | | #include "libavutil/avassert.h" |
23 | | #include "libavutil/channel_layout.h" |
24 | | #include "libavutil/crc.h" |
25 | | #include "libavutil/intmath.h" |
26 | | #include "libavutil/md5.h" |
27 | | #include "libavutil/mem.h" |
28 | | #include "libavutil/opt.h" |
29 | | |
30 | | #include "avcodec.h" |
31 | | #include "bswapdsp.h" |
32 | | #include "codec_internal.h" |
33 | | #include "encode.h" |
34 | | #include "put_bits.h" |
35 | | #include "lpc.h" |
36 | | #include "flac.h" |
37 | | #include "flacdata.h" |
38 | | #include "flacencdsp.h" |
39 | | |
40 | 0 | #define FLAC_SUBFRAME_CONSTANT 0 |
41 | 0 | #define FLAC_SUBFRAME_VERBATIM 1 |
42 | 0 | #define FLAC_SUBFRAME_FIXED 8 |
43 | 0 | #define FLAC_SUBFRAME_LPC 32 |
44 | | |
45 | 0 | #define MAX_FIXED_ORDER 4 |
46 | | #define MAX_PARTITION_ORDER 8 |
47 | | #define MAX_PARTITIONS (1 << MAX_PARTITION_ORDER) |
48 | | #define MAX_LPC_PRECISION 15 |
49 | 0 | #define MIN_LPC_SHIFT 0 |
50 | 0 | #define MAX_LPC_SHIFT 15 |
51 | | |
52 | | enum CodingMode { |
53 | | CODING_MODE_RICE = 4, |
54 | | CODING_MODE_RICE2 = 5, |
55 | | }; |
56 | | |
57 | | typedef struct CompressionOptions { |
58 | | int compression_level; |
59 | | int block_time_ms; |
60 | | enum FFLPCType lpc_type; |
61 | | int lpc_passes; |
62 | | int lpc_coeff_precision; |
63 | | int min_prediction_order; |
64 | | int max_prediction_order; |
65 | | int prediction_order_method; |
66 | | int min_partition_order; |
67 | | int max_partition_order; |
68 | | int ch_mode; |
69 | | int exact_rice_parameters; |
70 | | int multi_dim_quant; |
71 | | } CompressionOptions; |
72 | | |
73 | | typedef struct RiceContext { |
74 | | enum CodingMode coding_mode; |
75 | | int porder; |
76 | | int params[MAX_PARTITIONS]; |
77 | | } RiceContext; |
78 | | |
79 | | typedef struct FlacSubframe { |
80 | | int type; |
81 | | int type_code; |
82 | | int obits; |
83 | | int wasted; |
84 | | int order; |
85 | | int32_t coefs[MAX_LPC_ORDER]; |
86 | | int shift; |
87 | | |
88 | | RiceContext rc; |
89 | | uint32_t rc_udata[FLAC_MAX_BLOCKSIZE]; |
90 | | uint64_t rc_sums[32][MAX_PARTITIONS]; |
91 | | |
92 | | int32_t samples[FLAC_MAX_BLOCKSIZE]; |
93 | | int32_t residual[FLAC_MAX_BLOCKSIZE+11]; |
94 | | } FlacSubframe; |
95 | | |
96 | | typedef struct FlacFrame { |
97 | | FlacSubframe subframes[FLAC_MAX_CHANNELS]; |
98 | | int64_t samples_33bps[FLAC_MAX_BLOCKSIZE]; |
99 | | int blocksize; |
100 | | int bs_code[2]; |
101 | | uint8_t crc8; |
102 | | int ch_mode; |
103 | | int verbatim_only; |
104 | | } FlacFrame; |
105 | | |
106 | | typedef struct FlacEncodeContext { |
107 | | AVClass *class; |
108 | | PutBitContext pb; |
109 | | int channels; |
110 | | int samplerate; |
111 | | int sr_code[2]; |
112 | | int bps_code; |
113 | | int max_blocksize; |
114 | | int min_framesize; |
115 | | int max_framesize; |
116 | | int max_encoded_framesize; |
117 | | uint32_t frame_count; |
118 | | uint64_t sample_count; |
119 | | uint8_t md5sum[16]; |
120 | | FlacFrame frame; |
121 | | CompressionOptions options; |
122 | | AVCodecContext *avctx; |
123 | | LPCContext lpc_ctx; |
124 | | struct AVMD5 *md5ctx; |
125 | | uint8_t *md5_buffer; |
126 | | unsigned int md5_buffer_size; |
127 | | BswapDSPContext bdsp; |
128 | | FLACEncDSPContext flac_dsp; |
129 | | |
130 | | int flushed; |
131 | | int64_t next_pts; |
132 | | } FlacEncodeContext; |
133 | | |
134 | | |
135 | | /** |
136 | | * Write streaminfo metadata block to byte array. |
137 | | */ |
138 | | static void write_streaminfo(FlacEncodeContext *s, uint8_t *header) |
139 | 0 | { |
140 | 0 | PutBitContext pb; |
141 | |
|
142 | 0 | memset(header, 0, FLAC_STREAMINFO_SIZE); |
143 | 0 | init_put_bits(&pb, header, FLAC_STREAMINFO_SIZE); |
144 | | |
145 | | /* streaminfo metadata block */ |
146 | 0 | put_bits(&pb, 16, s->max_blocksize); |
147 | 0 | put_bits(&pb, 16, s->max_blocksize); |
148 | 0 | put_bits(&pb, 24, s->min_framesize); |
149 | 0 | put_bits(&pb, 24, s->max_framesize); |
150 | 0 | put_bits(&pb, 20, s->samplerate); |
151 | 0 | put_bits(&pb, 3, s->channels-1); |
152 | 0 | put_bits(&pb, 5, s->avctx->bits_per_raw_sample - 1); |
153 | | /* write 36-bit sample count in 2 put_bits() calls */ |
154 | 0 | put_bits(&pb, 24, (s->sample_count & 0xFFFFFF000LL) >> 12); |
155 | 0 | put_bits(&pb, 12, s->sample_count & 0x000000FFFLL); |
156 | 0 | flush_put_bits(&pb); |
157 | 0 | memcpy(&header[18], s->md5sum, 16); |
158 | 0 | } |
159 | | |
160 | | |
161 | | /** |
162 | | * Calculate an estimate for the maximum frame size based on verbatim mode. |
163 | | * @param blocksize block size, in samples |
164 | | * @param ch number of channels |
165 | | * @param bps bits-per-sample |
166 | | */ |
167 | | static int flac_get_max_frame_size(int blocksize, int ch, int bps) |
168 | 0 | { |
169 | | /* Technically, there is no limit to FLAC frame size, but an encoder |
170 | | should not write a frame that is larger than if verbatim encoding mode |
171 | | were to be used. */ |
172 | |
|
173 | 0 | int count; |
174 | |
|
175 | 0 | count = 16; /* frame header */ |
176 | 0 | count += ch * ((7+bps+7)/8); /* subframe headers */ |
177 | 0 | if (ch == 2) { |
178 | | /* for stereo, need to account for using decorrelation */ |
179 | 0 | count += (( 2*bps+1) * blocksize + 7) / 8; |
180 | 0 | } else { |
181 | 0 | count += ( ch*bps * blocksize + 7) / 8; |
182 | 0 | } |
183 | 0 | count += 2; /* frame footer */ |
184 | |
|
185 | 0 | return count; |
186 | 0 | } |
187 | | |
188 | | |
189 | | /** |
190 | | * Set blocksize based on samplerate. |
191 | | * Choose the closest predefined blocksize >= BLOCK_TIME_MS milliseconds. |
192 | | */ |
193 | | static int select_blocksize(int samplerate, int block_time_ms) |
194 | 0 | { |
195 | 0 | int i; |
196 | 0 | int target; |
197 | 0 | int blocksize; |
198 | |
|
199 | 0 | av_assert0(samplerate > 0); |
200 | 0 | blocksize = ff_flac_blocksize_table[1]; |
201 | 0 | target = (samplerate * block_time_ms) / 1000; |
202 | 0 | for (i = 0; i < 16; i++) { |
203 | 0 | if (target >= ff_flac_blocksize_table[i] && |
204 | 0 | ff_flac_blocksize_table[i] > blocksize) { |
205 | 0 | blocksize = ff_flac_blocksize_table[i]; |
206 | 0 | } |
207 | 0 | } |
208 | 0 | return blocksize; |
209 | 0 | } |
210 | | |
211 | | |
212 | | static av_cold void dprint_compression_options(FlacEncodeContext *s) |
213 | 0 | { |
214 | 0 | AVCodecContext *avctx = s->avctx; |
215 | 0 | CompressionOptions *opt = &s->options; |
216 | |
|
217 | 0 | av_log(avctx, AV_LOG_DEBUG, " compression: %d\n", opt->compression_level); |
218 | |
|
219 | 0 | switch (opt->lpc_type) { |
220 | 0 | case FF_LPC_TYPE_NONE: |
221 | 0 | av_log(avctx, AV_LOG_DEBUG, " lpc type: None\n"); |
222 | 0 | break; |
223 | 0 | case FF_LPC_TYPE_FIXED: |
224 | 0 | av_log(avctx, AV_LOG_DEBUG, " lpc type: Fixed pre-defined coefficients\n"); |
225 | 0 | break; |
226 | 0 | case FF_LPC_TYPE_LEVINSON: |
227 | 0 | av_log(avctx, AV_LOG_DEBUG, " lpc type: Levinson-Durbin recursion with Welch window\n"); |
228 | 0 | break; |
229 | 0 | case FF_LPC_TYPE_CHOLESKY: |
230 | 0 | av_log(avctx, AV_LOG_DEBUG, " lpc type: Cholesky factorization, %d pass%s\n", |
231 | 0 | opt->lpc_passes, opt->lpc_passes == 1 ? "" : "es"); |
232 | 0 | break; |
233 | 0 | } |
234 | | |
235 | 0 | av_log(avctx, AV_LOG_DEBUG, " prediction order: %d, %d\n", |
236 | 0 | opt->min_prediction_order, opt->max_prediction_order); |
237 | |
|
238 | 0 | switch (opt->prediction_order_method) { |
239 | 0 | case ORDER_METHOD_EST: |
240 | 0 | av_log(avctx, AV_LOG_DEBUG, " order method: %s\n", "estimate"); |
241 | 0 | break; |
242 | 0 | case ORDER_METHOD_2LEVEL: |
243 | 0 | av_log(avctx, AV_LOG_DEBUG, " order method: %s\n", "2-level"); |
244 | 0 | break; |
245 | 0 | case ORDER_METHOD_4LEVEL: |
246 | 0 | av_log(avctx, AV_LOG_DEBUG, " order method: %s\n", "4-level"); |
247 | 0 | break; |
248 | 0 | case ORDER_METHOD_8LEVEL: |
249 | 0 | av_log(avctx, AV_LOG_DEBUG, " order method: %s\n", "8-level"); |
250 | 0 | break; |
251 | 0 | case ORDER_METHOD_SEARCH: |
252 | 0 | av_log(avctx, AV_LOG_DEBUG, " order method: %s\n", "full search"); |
253 | 0 | break; |
254 | 0 | case ORDER_METHOD_LOG: |
255 | 0 | av_log(avctx, AV_LOG_DEBUG, " order method: %s\n", "log search"); |
256 | 0 | break; |
257 | 0 | } |
258 | | |
259 | | |
260 | 0 | av_log(avctx, AV_LOG_DEBUG, " partition order: %d, %d\n", |
261 | 0 | opt->min_partition_order, opt->max_partition_order); |
262 | |
|
263 | 0 | av_log(avctx, AV_LOG_DEBUG, " block size: %d\n", avctx->frame_size); |
264 | |
|
265 | 0 | av_log(avctx, AV_LOG_DEBUG, " lpc precision: %d\n", |
266 | 0 | opt->lpc_coeff_precision); |
267 | 0 | } |
268 | | |
269 | | |
270 | | static av_cold int flac_encode_init(AVCodecContext *avctx) |
271 | 0 | { |
272 | 0 | int freq = avctx->sample_rate; |
273 | 0 | int channels = avctx->ch_layout.nb_channels; |
274 | 0 | FlacEncodeContext *s = avctx->priv_data; |
275 | 0 | int i, level, ret; |
276 | 0 | uint8_t *streaminfo; |
277 | |
|
278 | 0 | s->avctx = avctx; |
279 | |
|
280 | 0 | switch (avctx->sample_fmt) { |
281 | 0 | case AV_SAMPLE_FMT_S16: |
282 | 0 | avctx->bits_per_raw_sample = 16; |
283 | 0 | s->bps_code = 4; |
284 | 0 | break; |
285 | 0 | case AV_SAMPLE_FMT_S32: |
286 | 0 | if (avctx->bits_per_raw_sample <= 24) { |
287 | 0 | if (avctx->bits_per_raw_sample < 24) |
288 | 0 | av_log(avctx, AV_LOG_WARNING, "encoding as 24 bits-per-sample\n"); |
289 | 0 | avctx->bits_per_raw_sample = 24; |
290 | 0 | s->bps_code = 6; |
291 | 0 | } else if (avctx->strict_std_compliance > FF_COMPLIANCE_EXPERIMENTAL) { |
292 | 0 | av_log(avctx, AV_LOG_WARNING, |
293 | 0 | "encoding as 24 bits-per-sample, more is considered " |
294 | 0 | "experimental. Add -strict experimental if you want " |
295 | 0 | "to encode more than 24 bits-per-sample\n"); |
296 | 0 | avctx->bits_per_raw_sample = 24; |
297 | 0 | s->bps_code = 6; |
298 | 0 | } else { |
299 | 0 | avctx->bits_per_raw_sample = 32; |
300 | 0 | s->bps_code = 7; |
301 | 0 | } |
302 | 0 | break; |
303 | 0 | } |
304 | | |
305 | 0 | if (channels < 1 || channels > FLAC_MAX_CHANNELS) { |
306 | 0 | av_log(avctx, AV_LOG_ERROR, "%d channels not supported (max %d)\n", |
307 | 0 | channels, FLAC_MAX_CHANNELS); |
308 | 0 | return AVERROR(EINVAL); |
309 | 0 | } |
310 | 0 | s->channels = channels; |
311 | | |
312 | | /* find samplerate in table */ |
313 | 0 | if (freq < 1) |
314 | 0 | return AVERROR(EINVAL); |
315 | 0 | for (i = 1; i < 12; i++) { |
316 | 0 | if (freq == ff_flac_sample_rate_table[i]) { |
317 | 0 | s->samplerate = ff_flac_sample_rate_table[i]; |
318 | 0 | s->sr_code[0] = i; |
319 | 0 | s->sr_code[1] = 0; |
320 | 0 | break; |
321 | 0 | } |
322 | 0 | } |
323 | | /* if not in table, samplerate is non-standard */ |
324 | 0 | if (i == 12) { |
325 | 0 | if (freq % 1000 == 0 && freq < 255000) { |
326 | 0 | s->sr_code[0] = 12; |
327 | 0 | s->sr_code[1] = freq / 1000; |
328 | 0 | } else if (freq % 10 == 0 && freq < 655350) { |
329 | 0 | s->sr_code[0] = 14; |
330 | 0 | s->sr_code[1] = freq / 10; |
331 | 0 | } else if (freq < 65535) { |
332 | 0 | s->sr_code[0] = 13; |
333 | 0 | s->sr_code[1] = freq; |
334 | 0 | } else if (freq < 1048576) { |
335 | 0 | s->sr_code[0] = 0; |
336 | 0 | s->sr_code[1] = 0; |
337 | 0 | } else { |
338 | 0 | av_log(avctx, AV_LOG_ERROR, "%d Hz not supported\n", freq); |
339 | 0 | return AVERROR(EINVAL); |
340 | 0 | } |
341 | 0 | s->samplerate = freq; |
342 | 0 | } |
343 | | |
344 | | /* set compression option defaults based on avctx->compression_level */ |
345 | 0 | if (avctx->compression_level < 0) |
346 | 0 | s->options.compression_level = 5; |
347 | 0 | else |
348 | 0 | s->options.compression_level = avctx->compression_level; |
349 | |
|
350 | 0 | level = s->options.compression_level; |
351 | 0 | if (level > 12) { |
352 | 0 | av_log(avctx, AV_LOG_ERROR, "invalid compression level: %d\n", |
353 | 0 | s->options.compression_level); |
354 | 0 | return AVERROR(EINVAL); |
355 | 0 | } |
356 | | |
357 | 0 | s->options.block_time_ms = ((int[]){ 27, 27, 27,105,105,105,105,105,105,105,105,105,105})[level]; |
358 | |
|
359 | 0 | if (s->options.lpc_type == FF_LPC_TYPE_DEFAULT) |
360 | 0 | s->options.lpc_type = ((int[]){ FF_LPC_TYPE_FIXED, FF_LPC_TYPE_FIXED, FF_LPC_TYPE_FIXED, |
361 | 0 | FF_LPC_TYPE_LEVINSON, FF_LPC_TYPE_LEVINSON, FF_LPC_TYPE_LEVINSON, |
362 | 0 | FF_LPC_TYPE_LEVINSON, FF_LPC_TYPE_LEVINSON, FF_LPC_TYPE_LEVINSON, |
363 | 0 | FF_LPC_TYPE_LEVINSON, FF_LPC_TYPE_LEVINSON, FF_LPC_TYPE_LEVINSON, |
364 | 0 | FF_LPC_TYPE_LEVINSON})[level]; |
365 | |
|
366 | 0 | if (s->options.min_prediction_order < 0) |
367 | 0 | s->options.min_prediction_order = ((int[]){ 2, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1})[level]; |
368 | 0 | if (s->options.max_prediction_order < 0) |
369 | 0 | s->options.max_prediction_order = ((int[]){ 3, 4, 4, 6, 8, 8, 8, 8, 12, 12, 12, 32, 32})[level]; |
370 | |
|
371 | 0 | if (s->options.prediction_order_method < 0) |
372 | 0 | s->options.prediction_order_method = ((int[]){ ORDER_METHOD_EST, ORDER_METHOD_EST, ORDER_METHOD_EST, |
373 | 0 | ORDER_METHOD_EST, ORDER_METHOD_EST, ORDER_METHOD_EST, |
374 | 0 | ORDER_METHOD_4LEVEL, ORDER_METHOD_LOG, ORDER_METHOD_4LEVEL, |
375 | 0 | ORDER_METHOD_LOG, ORDER_METHOD_SEARCH, ORDER_METHOD_LOG, |
376 | 0 | ORDER_METHOD_SEARCH})[level]; |
377 | |
|
378 | 0 | if (s->options.min_partition_order > s->options.max_partition_order) { |
379 | 0 | av_log(avctx, AV_LOG_ERROR, "invalid partition orders: min=%d max=%d\n", |
380 | 0 | s->options.min_partition_order, s->options.max_partition_order); |
381 | 0 | return AVERROR(EINVAL); |
382 | 0 | } |
383 | 0 | if (s->options.min_partition_order < 0) |
384 | 0 | s->options.min_partition_order = ((int[]){ 2, 2, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0})[level]; |
385 | 0 | if (s->options.max_partition_order < 0) |
386 | 0 | s->options.max_partition_order = ((int[]){ 2, 2, 3, 3, 3, 8, 8, 8, 8, 8, 8, 8, 8})[level]; |
387 | |
|
388 | 0 | if (s->options.lpc_type == FF_LPC_TYPE_NONE) { |
389 | 0 | s->options.min_prediction_order = 0; |
390 | 0 | s->options.max_prediction_order = 0; |
391 | 0 | } else if (s->options.lpc_type == FF_LPC_TYPE_FIXED) { |
392 | 0 | if (s->options.min_prediction_order > MAX_FIXED_ORDER) { |
393 | 0 | av_log(avctx, AV_LOG_WARNING, |
394 | 0 | "invalid min prediction order %d, clamped to %d\n", |
395 | 0 | s->options.min_prediction_order, MAX_FIXED_ORDER); |
396 | 0 | s->options.min_prediction_order = MAX_FIXED_ORDER; |
397 | 0 | } |
398 | 0 | if (s->options.max_prediction_order > MAX_FIXED_ORDER) { |
399 | 0 | av_log(avctx, AV_LOG_WARNING, |
400 | 0 | "invalid max prediction order %d, clamped to %d\n", |
401 | 0 | s->options.max_prediction_order, MAX_FIXED_ORDER); |
402 | 0 | s->options.max_prediction_order = MAX_FIXED_ORDER; |
403 | 0 | } |
404 | 0 | } |
405 | |
|
406 | 0 | if (s->options.max_prediction_order < s->options.min_prediction_order) { |
407 | 0 | av_log(avctx, AV_LOG_ERROR, "invalid prediction orders: min=%d max=%d\n", |
408 | 0 | s->options.min_prediction_order, s->options.max_prediction_order); |
409 | 0 | return AVERROR(EINVAL); |
410 | 0 | } |
411 | | |
412 | 0 | if (avctx->frame_size > 0) { |
413 | 0 | if (avctx->frame_size < FLAC_MIN_BLOCKSIZE || |
414 | 0 | avctx->frame_size > FLAC_MAX_BLOCKSIZE) { |
415 | 0 | av_log(avctx, AV_LOG_ERROR, "invalid block size: %d\n", |
416 | 0 | avctx->frame_size); |
417 | 0 | return AVERROR(EINVAL); |
418 | 0 | } |
419 | 0 | } else { |
420 | 0 | s->avctx->frame_size = select_blocksize(s->samplerate, s->options.block_time_ms); |
421 | 0 | } |
422 | 0 | s->max_blocksize = s->avctx->frame_size; |
423 | | |
424 | | /* set maximum encoded frame size in verbatim mode */ |
425 | 0 | s->max_framesize = flac_get_max_frame_size(s->avctx->frame_size, |
426 | 0 | s->channels, |
427 | 0 | s->avctx->bits_per_raw_sample); |
428 | | |
429 | | /* initialize MD5 context */ |
430 | 0 | s->md5ctx = av_md5_alloc(); |
431 | 0 | if (!s->md5ctx) |
432 | 0 | return AVERROR(ENOMEM); |
433 | 0 | av_md5_init(s->md5ctx); |
434 | |
|
435 | 0 | streaminfo = av_malloc(FLAC_STREAMINFO_SIZE); |
436 | 0 | if (!streaminfo) |
437 | 0 | return AVERROR(ENOMEM); |
438 | 0 | write_streaminfo(s, streaminfo); |
439 | 0 | avctx->extradata = streaminfo; |
440 | 0 | avctx->extradata_size = FLAC_STREAMINFO_SIZE; |
441 | |
|
442 | 0 | s->frame_count = 0; |
443 | 0 | s->min_framesize = s->max_framesize; |
444 | |
|
445 | 0 | if ((channels == 3 && |
446 | 0 | av_channel_layout_compare(&avctx->ch_layout, &(AVChannelLayout)AV_CHANNEL_LAYOUT_SURROUND)) || |
447 | 0 | (channels == 4 && |
448 | 0 | av_channel_layout_compare(&avctx->ch_layout, &(AVChannelLayout)AV_CHANNEL_LAYOUT_2_2) && |
449 | 0 | av_channel_layout_compare(&avctx->ch_layout, &(AVChannelLayout)AV_CHANNEL_LAYOUT_QUAD)) || |
450 | 0 | (channels == 5 && |
451 | 0 | av_channel_layout_compare(&avctx->ch_layout, &(AVChannelLayout)AV_CHANNEL_LAYOUT_5POINT0) && |
452 | 0 | av_channel_layout_compare(&avctx->ch_layout, &(AVChannelLayout)AV_CHANNEL_LAYOUT_5POINT0_BACK)) || |
453 | 0 | (channels == 6 && |
454 | 0 | av_channel_layout_compare(&avctx->ch_layout, &(AVChannelLayout)AV_CHANNEL_LAYOUT_5POINT1) && |
455 | 0 | av_channel_layout_compare(&avctx->ch_layout, &(AVChannelLayout)AV_CHANNEL_LAYOUT_5POINT1_BACK))) { |
456 | 0 | if (avctx->ch_layout.order != AV_CHANNEL_ORDER_UNSPEC) { |
457 | 0 | av_log(avctx, AV_LOG_ERROR, "Channel layout not supported by Flac, " |
458 | 0 | "output stream will have incorrect " |
459 | 0 | "channel layout.\n"); |
460 | 0 | } else { |
461 | 0 | av_log(avctx, AV_LOG_WARNING, "No channel layout specified. The encoder " |
462 | 0 | "will use Flac channel layout for " |
463 | 0 | "%d channels.\n", channels); |
464 | 0 | } |
465 | 0 | } |
466 | |
|
467 | 0 | ret = ff_lpc_init(&s->lpc_ctx, avctx->frame_size, |
468 | 0 | s->options.max_prediction_order, FF_LPC_TYPE_LEVINSON); |
469 | |
|
470 | 0 | ff_bswapdsp_init(&s->bdsp); |
471 | 0 | ff_flacencdsp_init(&s->flac_dsp); |
472 | |
|
473 | 0 | dprint_compression_options(s); |
474 | |
|
475 | 0 | return ret; |
476 | 0 | } |
477 | | |
478 | | |
479 | | static void init_frame(FlacEncodeContext *s, int nb_samples) |
480 | 0 | { |
481 | 0 | int i, ch; |
482 | 0 | FlacFrame *frame; |
483 | |
|
484 | 0 | frame = &s->frame; |
485 | |
|
486 | 0 | for (i = 0; i < 16; i++) { |
487 | 0 | if (nb_samples == ff_flac_blocksize_table[i]) { |
488 | 0 | frame->blocksize = ff_flac_blocksize_table[i]; |
489 | 0 | frame->bs_code[0] = i; |
490 | 0 | frame->bs_code[1] = 0; |
491 | 0 | break; |
492 | 0 | } |
493 | 0 | } |
494 | 0 | if (i == 16) { |
495 | 0 | frame->blocksize = nb_samples; |
496 | 0 | if (frame->blocksize <= 256) { |
497 | 0 | frame->bs_code[0] = 6; |
498 | 0 | frame->bs_code[1] = frame->blocksize-1; |
499 | 0 | } else { |
500 | 0 | frame->bs_code[0] = 7; |
501 | 0 | frame->bs_code[1] = frame->blocksize-1; |
502 | 0 | } |
503 | 0 | } |
504 | |
|
505 | 0 | for (ch = 0; ch < s->channels; ch++) { |
506 | 0 | FlacSubframe *sub = &frame->subframes[ch]; |
507 | |
|
508 | 0 | sub->wasted = 0; |
509 | 0 | sub->obits = s->avctx->bits_per_raw_sample; |
510 | |
|
511 | 0 | if (sub->obits > 16) |
512 | 0 | sub->rc.coding_mode = CODING_MODE_RICE2; |
513 | 0 | else |
514 | 0 | sub->rc.coding_mode = CODING_MODE_RICE; |
515 | 0 | } |
516 | |
|
517 | 0 | frame->verbatim_only = 0; |
518 | 0 | } |
519 | | |
520 | | |
521 | | /** |
522 | | * Copy channel-interleaved input samples into separate subframes. |
523 | | */ |
524 | | static void copy_samples(FlacEncodeContext *s, const void *samples) |
525 | 0 | { |
526 | 0 | int i, j, ch; |
527 | 0 | FlacFrame *frame; |
528 | |
|
529 | 0 | #define COPY_SAMPLES(bits, shift0) do { \ |
530 | 0 | const int ## bits ## _t *samples0 = samples; \ |
531 | 0 | const int shift = shift0; \ |
532 | 0 | frame = &s->frame; \ |
533 | 0 | for (i = 0, j = 0; i < frame->blocksize; i++) \ |
534 | 0 | for (ch = 0; ch < s->channels; ch++, j++) \ |
535 | 0 | frame->subframes[ch].samples[i] = samples0[j] >> shift; \ |
536 | 0 | } while (0) |
537 | |
|
538 | 0 | if (s->avctx->sample_fmt == AV_SAMPLE_FMT_S16) |
539 | 0 | COPY_SAMPLES(16, 0); |
540 | 0 | else |
541 | 0 | COPY_SAMPLES(32, 32 - s->avctx->bits_per_raw_sample); |
542 | 0 | } |
543 | | |
544 | | |
545 | | static uint64_t rice_count_exact(const int32_t *res, int n, int k) |
546 | 0 | { |
547 | 0 | int i; |
548 | 0 | uint64_t count = 0; |
549 | |
|
550 | 0 | for (i = 0; i < n; i++) { |
551 | 0 | unsigned v = ((unsigned)(res[i]) << 1) ^ (res[i] >> 31); |
552 | 0 | count += (v >> k) + 1 + k; |
553 | 0 | } |
554 | 0 | return count; |
555 | 0 | } |
556 | | |
557 | | |
558 | | static uint64_t subframe_count_exact(FlacEncodeContext *s, FlacSubframe *sub, |
559 | | int pred_order) |
560 | 0 | { |
561 | 0 | int p, porder, psize; |
562 | 0 | int i, part_end; |
563 | 0 | uint64_t count = 0; |
564 | | |
565 | | /* subframe header */ |
566 | 0 | count += 8; |
567 | |
|
568 | 0 | if (sub->wasted) |
569 | 0 | count += sub->wasted; |
570 | | |
571 | | /* subframe */ |
572 | 0 | if (sub->type == FLAC_SUBFRAME_CONSTANT) { |
573 | 0 | count += sub->obits; |
574 | 0 | } else if (sub->type == FLAC_SUBFRAME_VERBATIM) { |
575 | 0 | count += s->frame.blocksize * sub->obits; |
576 | 0 | } else { |
577 | | /* warm-up samples */ |
578 | 0 | count += pred_order * sub->obits; |
579 | | |
580 | | /* LPC coefficients */ |
581 | 0 | if (sub->type == FLAC_SUBFRAME_LPC) |
582 | 0 | count += 4 + 5 + pred_order * s->options.lpc_coeff_precision; |
583 | | |
584 | | /* rice-encoded block */ |
585 | 0 | count += 2; |
586 | | |
587 | | /* partition order */ |
588 | 0 | porder = sub->rc.porder; |
589 | 0 | psize = s->frame.blocksize >> porder; |
590 | 0 | count += 4; |
591 | | |
592 | | /* residual */ |
593 | 0 | i = pred_order; |
594 | 0 | part_end = psize; |
595 | 0 | for (p = 0; p < 1 << porder; p++) { |
596 | 0 | int k = sub->rc.params[p]; |
597 | 0 | count += sub->rc.coding_mode; |
598 | 0 | count += rice_count_exact(&sub->residual[i], part_end - i, k); |
599 | 0 | i = part_end; |
600 | 0 | part_end = FFMIN(s->frame.blocksize, part_end + psize); |
601 | 0 | } |
602 | 0 | } |
603 | |
|
604 | 0 | return count; |
605 | 0 | } |
606 | | |
607 | | |
608 | 0 | #define rice_encode_count(sum, n, k) (((n)*((k)+1))+((sum-(n>>1))>>(k))) |
609 | | |
610 | | /** |
611 | | * Solve for d/dk(rice_encode_count) = n-((sum-(n>>1))>>(k+1)) = 0. |
612 | | */ |
613 | | static int find_optimal_param(uint64_t sum, int n, int max_param) |
614 | 0 | { |
615 | 0 | int k; |
616 | 0 | uint64_t sum2; |
617 | |
|
618 | 0 | if (sum <= n >> 1) |
619 | 0 | return 0; |
620 | 0 | sum2 = sum - (n >> 1); |
621 | 0 | k = av_log2(av_clipl_int32(sum2 / n)); |
622 | 0 | return FFMIN(k, max_param); |
623 | 0 | } |
624 | | |
625 | | static int find_optimal_param_exact(uint64_t sums[32][MAX_PARTITIONS], int i, int max_param) |
626 | 0 | { |
627 | 0 | int bestk = 0; |
628 | 0 | int64_t bestbits = INT64_MAX; |
629 | 0 | int k; |
630 | |
|
631 | 0 | for (k = 0; k <= max_param; k++) { |
632 | 0 | int64_t bits = sums[k][i]; |
633 | 0 | if (bits < bestbits) { |
634 | 0 | bestbits = bits; |
635 | 0 | bestk = k; |
636 | 0 | } |
637 | 0 | } |
638 | |
|
639 | 0 | return bestk; |
640 | 0 | } |
641 | | |
642 | | static uint64_t calc_optimal_rice_params(RiceContext *rc, int porder, |
643 | | uint64_t sums[32][MAX_PARTITIONS], |
644 | | int n, int pred_order, int max_param, int exact) |
645 | 0 | { |
646 | 0 | int i; |
647 | 0 | int k, cnt, part; |
648 | 0 | uint64_t all_bits; |
649 | |
|
650 | 0 | part = (1 << porder); |
651 | 0 | all_bits = 4 * part; |
652 | |
|
653 | 0 | cnt = (n >> porder) - pred_order; |
654 | 0 | for (i = 0; i < part; i++) { |
655 | 0 | if (exact) { |
656 | 0 | k = find_optimal_param_exact(sums, i, max_param); |
657 | 0 | all_bits += sums[k][i]; |
658 | 0 | } else { |
659 | 0 | k = find_optimal_param(sums[0][i], cnt, max_param); |
660 | 0 | all_bits += rice_encode_count(sums[0][i], cnt, k); |
661 | 0 | } |
662 | 0 | rc->params[i] = k; |
663 | 0 | cnt = n >> porder; |
664 | 0 | } |
665 | |
|
666 | 0 | rc->porder = porder; |
667 | |
|
668 | 0 | return all_bits; |
669 | 0 | } |
670 | | |
671 | | |
672 | | static void calc_sum_top(int pmax, int kmax, const uint32_t *data, int n, int pred_order, |
673 | | uint64_t sums[32][MAX_PARTITIONS]) |
674 | 0 | { |
675 | 0 | int i, k; |
676 | 0 | int parts; |
677 | 0 | const uint32_t *res, *res_end; |
678 | | |
679 | | /* sums for highest level */ |
680 | 0 | parts = (1 << pmax); |
681 | |
|
682 | 0 | for (k = 0; k <= kmax; k++) { |
683 | 0 | res = &data[pred_order]; |
684 | 0 | res_end = &data[n >> pmax]; |
685 | 0 | for (i = 0; i < parts; i++) { |
686 | 0 | if (kmax) { |
687 | 0 | uint64_t sum = (1LL + k) * (res_end - res); |
688 | 0 | while (res < res_end) |
689 | 0 | sum += *(res++) >> k; |
690 | 0 | sums[k][i] = sum; |
691 | 0 | } else { |
692 | 0 | uint64_t sum = 0; |
693 | 0 | while (res < res_end) |
694 | 0 | sum += *(res++); |
695 | 0 | sums[k][i] = sum; |
696 | 0 | } |
697 | 0 | res_end += n >> pmax; |
698 | 0 | } |
699 | 0 | } |
700 | 0 | } |
701 | | |
702 | | static void calc_sum_next(int level, uint64_t sums[32][MAX_PARTITIONS], int kmax) |
703 | 0 | { |
704 | 0 | int i, k; |
705 | 0 | int parts = (1 << level); |
706 | 0 | for (i = 0; i < parts; i++) { |
707 | 0 | for (k=0; k<=kmax; k++) |
708 | 0 | sums[k][i] = sums[k][2*i] + sums[k][2*i+1]; |
709 | 0 | } |
710 | 0 | } |
711 | | |
712 | | static uint64_t calc_rice_params(RiceContext *rc, |
713 | | uint32_t udata[FLAC_MAX_BLOCKSIZE], |
714 | | uint64_t sums[32][MAX_PARTITIONS], |
715 | | int pmin, int pmax, |
716 | | const int32_t *data, int n, int pred_order, int exact) |
717 | 0 | { |
718 | 0 | int i; |
719 | 0 | uint64_t bits[MAX_PARTITION_ORDER+1]; |
720 | 0 | int opt_porder; |
721 | 0 | RiceContext tmp_rc; |
722 | 0 | int kmax = (1 << rc->coding_mode) - 2; |
723 | |
|
724 | 0 | av_assert1(pmin >= 0 && pmin <= MAX_PARTITION_ORDER); |
725 | 0 | av_assert1(pmax >= 0 && pmax <= MAX_PARTITION_ORDER); |
726 | 0 | av_assert1(pmin <= pmax); |
727 | |
|
728 | 0 | tmp_rc.coding_mode = rc->coding_mode; |
729 | |
|
730 | 0 | for (i = pred_order; i < n; i++) |
731 | 0 | udata[i] = ((unsigned)(data[i]) << 1) ^ (data[i] >> 31); |
732 | |
|
733 | 0 | calc_sum_top(pmax, exact ? kmax : 0, udata, n, pred_order, sums); |
734 | |
|
735 | 0 | opt_porder = pmin; |
736 | 0 | bits[pmin] = UINT32_MAX; |
737 | 0 | for (i = pmax; ; ) { |
738 | 0 | bits[i] = calc_optimal_rice_params(&tmp_rc, i, sums, n, pred_order, kmax, exact); |
739 | 0 | if (bits[i] < bits[opt_porder] || pmax == pmin) { |
740 | 0 | opt_porder = i; |
741 | 0 | *rc = tmp_rc; |
742 | 0 | } |
743 | 0 | if (i == pmin) |
744 | 0 | break; |
745 | 0 | calc_sum_next(--i, sums, exact ? kmax : 0); |
746 | 0 | } |
747 | |
|
748 | 0 | return bits[opt_porder]; |
749 | 0 | } |
750 | | |
751 | | |
752 | | static int get_max_p_order(int max_porder, int n, int order) |
753 | 0 | { |
754 | 0 | int porder = FFMIN(max_porder, av_log2(n^(n-1))); |
755 | 0 | if (order > 0) |
756 | 0 | porder = FFMIN(porder, av_log2(n/order)); |
757 | 0 | return porder; |
758 | 0 | } |
759 | | |
760 | | |
761 | | static uint64_t find_subframe_rice_params(FlacEncodeContext *s, |
762 | | FlacSubframe *sub, int pred_order) |
763 | 0 | { |
764 | 0 | int pmin = get_max_p_order(s->options.min_partition_order, |
765 | 0 | s->frame.blocksize, pred_order); |
766 | 0 | int pmax = get_max_p_order(s->options.max_partition_order, |
767 | 0 | s->frame.blocksize, pred_order); |
768 | |
|
769 | 0 | uint64_t bits = 8 + pred_order * sub->obits + 2 + sub->rc.coding_mode; |
770 | 0 | if (sub->type == FLAC_SUBFRAME_LPC) |
771 | 0 | bits += 4 + 5 + pred_order * s->options.lpc_coeff_precision; |
772 | 0 | bits += calc_rice_params(&sub->rc, sub->rc_udata, sub->rc_sums, pmin, pmax, sub->residual, |
773 | 0 | s->frame.blocksize, pred_order, s->options.exact_rice_parameters); |
774 | 0 | return bits; |
775 | 0 | } |
776 | | |
777 | | |
778 | | static void encode_residual_fixed(int32_t *res, const int32_t *smp, int n, |
779 | | int order) |
780 | 0 | { |
781 | 0 | int i; |
782 | |
|
783 | 0 | for (i = 0; i < order; i++) |
784 | 0 | res[i] = smp[i]; |
785 | |
|
786 | 0 | if (order == 0) { |
787 | 0 | for (i = order; i < n; i++) |
788 | 0 | res[i] = smp[i]; |
789 | 0 | } else if (order == 1) { |
790 | 0 | for (i = order; i < n; i++) |
791 | 0 | res[i] = smp[i] - smp[i-1]; |
792 | 0 | } else if (order == 2) { |
793 | 0 | int a = smp[order-1] - smp[order-2]; |
794 | 0 | for (i = order; i < n; i += 2) { |
795 | 0 | int b = smp[i ] - smp[i-1]; |
796 | 0 | res[i] = b - a; |
797 | 0 | a = smp[i+1] - smp[i ]; |
798 | 0 | res[i+1] = a - b; |
799 | 0 | } |
800 | 0 | } else if (order == 3) { |
801 | 0 | int a = smp[order-1] - smp[order-2]; |
802 | 0 | int c = smp[order-1] - 2*smp[order-2] + smp[order-3]; |
803 | 0 | for (i = order; i < n; i += 2) { |
804 | 0 | int b = smp[i ] - smp[i-1]; |
805 | 0 | int d = b - a; |
806 | 0 | res[i] = d - c; |
807 | 0 | a = smp[i+1] - smp[i ]; |
808 | 0 | c = a - b; |
809 | 0 | res[i+1] = c - d; |
810 | 0 | } |
811 | 0 | } else { |
812 | 0 | int a = smp[order-1] - smp[order-2]; |
813 | 0 | int c = smp[order-1] - 2*smp[order-2] + smp[order-3]; |
814 | 0 | int e = smp[order-1] - 3*smp[order-2] + 3*smp[order-3] - smp[order-4]; |
815 | 0 | for (i = order; i < n; i += 2) { |
816 | 0 | int b = smp[i ] - smp[i-1]; |
817 | 0 | int d = b - a; |
818 | 0 | int f = d - c; |
819 | 0 | res[i ] = f - e; |
820 | 0 | a = smp[i+1] - smp[i ]; |
821 | 0 | c = a - b; |
822 | 0 | e = c - d; |
823 | 0 | res[i+1] = e - f; |
824 | 0 | } |
825 | 0 | } |
826 | 0 | } |
827 | | |
828 | | |
829 | | /* These four functions check for every residual whether it can be |
830 | | * contained in <INT32_MIN,INT32_MAX]. In case it doesn't, the |
831 | | * function that called this function has to try something else. |
832 | | * Each function is duplicated, once for int32_t input, once for |
833 | | * int64_t input */ |
834 | 0 | #define ENCODE_RESIDUAL_FIXED_WITH_RESIDUAL_LIMIT() \ |
835 | 0 | { \ |
836 | 0 | for (int i = 0; i < order; i++) \ |
837 | 0 | res[i] = smp[i]; \ |
838 | 0 | if (order == 0) { \ |
839 | 0 | for (int i = order; i < n; i++) { \ |
840 | 0 | if (smp[i] == INT32_MIN) \ |
841 | 0 | return 1; \ |
842 | 0 | res[i] = smp[i]; \ |
843 | 0 | } \ |
844 | 0 | } else if (order == 1) { \ |
845 | 0 | for (int i = order; i < n; i++) { \ |
846 | 0 | int64_t res64 = (int64_t)smp[i] - smp[i-1]; \ |
847 | 0 | if (res64 <= INT32_MIN || res64 > INT32_MAX) \ |
848 | 0 | return 1; \ |
849 | 0 | res[i] = res64; \ |
850 | 0 | } \ |
851 | 0 | } else if (order == 2) { \ |
852 | 0 | for (int i = order; i < n; i++) { \ |
853 | 0 | int64_t res64 = (int64_t)smp[i] - 2*(int64_t)smp[i-1] + smp[i-2]; \ |
854 | 0 | if (res64 <= INT32_MIN || res64 > INT32_MAX) \ |
855 | 0 | return 1; \ |
856 | 0 | res[i] = res64; \ |
857 | 0 | } \ |
858 | 0 | } else if (order == 3) { \ |
859 | 0 | for (int i = order; i < n; i++) { \ |
860 | 0 | int64_t res64 = (int64_t)smp[i] - 3*(int64_t)smp[i-1] + 3*(int64_t)smp[i-2] - smp[i-3]; \ |
861 | 0 | if (res64 <= INT32_MIN || res64 > INT32_MAX) \ |
862 | 0 | return 1; \ |
863 | 0 | res[i] = res64; \ |
864 | 0 | } \ |
865 | 0 | } else { \ |
866 | 0 | for (int i = order; i < n; i++) { \ |
867 | 0 | int64_t res64 = (int64_t)smp[i] - 4*(int64_t)smp[i-1] + 6*(int64_t)smp[i-2] - 4*(int64_t)smp[i-3] + smp[i-4]; \ |
868 | 0 | if (res64 <= INT32_MIN || res64 > INT32_MAX) \ |
869 | 0 | return 1; \ |
870 | 0 | res[i] = res64; \ |
871 | 0 | } \ |
872 | 0 | } \ |
873 | 0 | return 0; \ |
874 | 0 | } |
875 | | |
876 | | static int encode_residual_fixed_with_residual_limit(int32_t *res, const int32_t *smp, |
877 | | int n, int order) |
878 | 0 | { |
879 | 0 | ENCODE_RESIDUAL_FIXED_WITH_RESIDUAL_LIMIT(); |
880 | 0 | } |
881 | | |
882 | | |
883 | | static int encode_residual_fixed_with_residual_limit_33bps(int32_t *res, const int64_t *smp, |
884 | | int n, int order) |
885 | 0 | { |
886 | 0 | ENCODE_RESIDUAL_FIXED_WITH_RESIDUAL_LIMIT(); |
887 | 0 | } |
888 | | |
889 | 0 | #define LPC_ENCODE_WITH_RESIDUAL_LIMIT() \ |
890 | 0 | { \ |
891 | 0 | for (int i = 0; i < order; i++) \ |
892 | 0 | res[i] = smp[i]; \ |
893 | 0 | for (int i = order; i < len; i++) { \ |
894 | 0 | int64_t p = 0, tmp; \ |
895 | 0 | for (int j = 0; j < order; j++) \ |
896 | 0 | p += (int64_t)coefs[j]*smp[(i-1)-j]; \ |
897 | 0 | p >>= shift; \ |
898 | 0 | tmp = smp[i] - p; \ |
899 | 0 | if (tmp <= INT32_MIN || tmp > INT32_MAX) \ |
900 | 0 | return 1; \ |
901 | 0 | res[i] = tmp; \ |
902 | 0 | } \ |
903 | 0 | return 0; \ |
904 | 0 | } |
905 | | |
906 | | static int lpc_encode_with_residual_limit(int32_t *res, const int32_t *smp, int len, |
907 | | int order, int32_t *coefs, int shift) |
908 | 0 | { |
909 | 0 | LPC_ENCODE_WITH_RESIDUAL_LIMIT(); |
910 | 0 | } |
911 | | |
912 | | static int lpc_encode_with_residual_limit_33bps(int32_t *res, const int64_t *smp, int len, |
913 | | int order, int32_t *coefs, int shift) |
914 | 0 | { |
915 | 0 | LPC_ENCODE_WITH_RESIDUAL_LIMIT(); |
916 | 0 | } |
917 | | |
918 | | static int lpc_encode_choose_datapath(FlacEncodeContext *s, int32_t bps, |
919 | | int32_t *res, const int32_t *smp, |
920 | | const int64_t *smp_33bps, int len, |
921 | | int order, int32_t *coefs, int shift) |
922 | 0 | { |
923 | 0 | uint64_t max_residual_value = 0; |
924 | 0 | int64_t max_sample_value = ((int64_t)(1) << (bps-1)); |
925 | | /* This calculates the max size of any residual with the current |
926 | | * predictor, so we know whether we need to check the residual */ |
927 | 0 | for (int i = 0; i < order; i++) |
928 | 0 | max_residual_value += FFABS(max_sample_value * coefs[i]); |
929 | 0 | max_residual_value >>= shift; |
930 | 0 | max_residual_value += max_sample_value; |
931 | 0 | if (bps > 32) { |
932 | 0 | if (lpc_encode_with_residual_limit_33bps(res, smp_33bps, len, order, coefs, shift)) |
933 | 0 | return 1; |
934 | 0 | } else if (max_residual_value > INT32_MAX) { |
935 | 0 | if (lpc_encode_with_residual_limit(res, smp, len, order, coefs, shift)) |
936 | 0 | return 1; |
937 | 0 | } else if (bps + s->options.lpc_coeff_precision + av_log2(order) <= 32) { |
938 | 0 | s->flac_dsp.lpc16_encode(res, smp, len, order, coefs, shift); |
939 | 0 | } else { |
940 | 0 | s->flac_dsp.lpc32_encode(res, smp, len, order, coefs, shift); |
941 | 0 | } |
942 | 0 | return 0; |
943 | 0 | } |
944 | | |
945 | 0 | #define DEFAULT_TO_VERBATIM() \ |
946 | 0 | { \ |
947 | 0 | sub->type = sub->type_code = FLAC_SUBFRAME_VERBATIM; \ |
948 | 0 | if (sub->obits <= 32) \ |
949 | 0 | memcpy(res, smp, n * sizeof(int32_t)); \ |
950 | 0 | return subframe_count_exact(s, sub, 0); \ |
951 | 0 | } |
952 | | |
953 | | static int encode_residual_ch(FlacEncodeContext *s, int ch) |
954 | 0 | { |
955 | 0 | int i, n; |
956 | 0 | int min_order, max_order, opt_order, omethod; |
957 | 0 | FlacFrame *frame; |
958 | 0 | FlacSubframe *sub; |
959 | 0 | int32_t coefs[MAX_LPC_ORDER][MAX_LPC_ORDER]; |
960 | 0 | int shift[MAX_LPC_ORDER]; |
961 | 0 | int32_t *res, *smp; |
962 | 0 | int64_t *smp_33bps; |
963 | |
|
964 | 0 | frame = &s->frame; |
965 | 0 | sub = &frame->subframes[ch]; |
966 | 0 | res = sub->residual; |
967 | 0 | smp = sub->samples; |
968 | 0 | smp_33bps = frame->samples_33bps; |
969 | 0 | n = frame->blocksize; |
970 | | |
971 | | /* CONSTANT */ |
972 | 0 | if (sub->obits > 32) { |
973 | 0 | for (i = 1; i < n; i++) |
974 | 0 | if(smp_33bps[i] != smp_33bps[0]) |
975 | 0 | break; |
976 | 0 | if (i == n) { |
977 | 0 | sub->type = sub->type_code = FLAC_SUBFRAME_CONSTANT; |
978 | 0 | return subframe_count_exact(s, sub, 0); |
979 | 0 | } |
980 | 0 | } else { |
981 | 0 | for (i = 1; i < n; i++) |
982 | 0 | if(smp[i] != smp[0]) |
983 | 0 | break; |
984 | 0 | if (i == n) { |
985 | 0 | sub->type = sub->type_code = FLAC_SUBFRAME_CONSTANT; |
986 | 0 | res[0] = smp[0]; |
987 | 0 | return subframe_count_exact(s, sub, 0); |
988 | 0 | } |
989 | 0 | } |
990 | | |
991 | | /* VERBATIM */ |
992 | 0 | if (frame->verbatim_only || n < 5) { |
993 | 0 | DEFAULT_TO_VERBATIM(); |
994 | 0 | } |
995 | | |
996 | 0 | min_order = s->options.min_prediction_order; |
997 | 0 | max_order = s->options.max_prediction_order; |
998 | 0 | omethod = s->options.prediction_order_method; |
999 | | |
1000 | | /* FIXED */ |
1001 | 0 | sub->type = FLAC_SUBFRAME_FIXED; |
1002 | 0 | if (s->options.lpc_type == FF_LPC_TYPE_NONE || |
1003 | 0 | s->options.lpc_type == FF_LPC_TYPE_FIXED || n <= max_order) { |
1004 | 0 | uint64_t bits[MAX_FIXED_ORDER+1]; |
1005 | 0 | if (max_order > MAX_FIXED_ORDER) |
1006 | 0 | max_order = MAX_FIXED_ORDER; |
1007 | 0 | opt_order = 0; |
1008 | 0 | bits[0] = UINT32_MAX; |
1009 | 0 | for (i = min_order; i <= max_order; i++) { |
1010 | 0 | if (sub->obits == 33) { |
1011 | 0 | if (encode_residual_fixed_with_residual_limit_33bps(res, smp_33bps, n, i)) |
1012 | 0 | continue; |
1013 | 0 | } else if (sub->obits + i >= 32) { |
1014 | 0 | if (encode_residual_fixed_with_residual_limit(res, smp, n, i)) |
1015 | 0 | continue; |
1016 | 0 | } else |
1017 | 0 | encode_residual_fixed(res, smp, n, i); |
1018 | 0 | bits[i] = find_subframe_rice_params(s, sub, i); |
1019 | 0 | if (bits[i] < bits[opt_order]) |
1020 | 0 | opt_order = i; |
1021 | 0 | } |
1022 | 0 | if (opt_order == 0 && bits[0] == UINT32_MAX) { |
1023 | | /* No predictor found with residuals within <INT32_MIN,INT32_MAX], |
1024 | | * so encode a verbatim subframe instead */ |
1025 | 0 | DEFAULT_TO_VERBATIM(); |
1026 | 0 | } |
1027 | 0 | sub->order = opt_order; |
1028 | 0 | sub->type_code = sub->type | sub->order; |
1029 | 0 | if (sub->order != max_order) { |
1030 | 0 | if (sub->obits == 33) |
1031 | 0 | encode_residual_fixed_with_residual_limit_33bps(res, smp_33bps, n, sub->order); |
1032 | 0 | else if (sub->obits + i >= 32) |
1033 | 0 | encode_residual_fixed_with_residual_limit(res, smp, n, sub->order); |
1034 | 0 | else |
1035 | 0 | encode_residual_fixed(res, smp, n, sub->order); |
1036 | 0 | find_subframe_rice_params(s, sub, sub->order); |
1037 | 0 | } |
1038 | 0 | return subframe_count_exact(s, sub, sub->order); |
1039 | 0 | } |
1040 | | |
1041 | | /* LPC */ |
1042 | 0 | sub->type = FLAC_SUBFRAME_LPC; |
1043 | 0 | if (sub->obits == 33) |
1044 | | /* As ff_lpc_calc_coefs is shared with other codecs and the LSB |
1045 | | * probably isn't predictable anyway, throw away LSB for analysis |
1046 | | * so it fits 32 bit int and existing function can be used |
1047 | | * unmodified */ |
1048 | 0 | for (i = 0; i < n; i++) |
1049 | 0 | smp[i] = smp_33bps[i] >> 1; |
1050 | |
|
1051 | 0 | opt_order = ff_lpc_calc_coefs(&s->lpc_ctx, smp, n, min_order, max_order, |
1052 | 0 | s->options.lpc_coeff_precision, coefs, shift, s->options.lpc_type, |
1053 | 0 | s->options.lpc_passes, omethod, |
1054 | 0 | MIN_LPC_SHIFT, MAX_LPC_SHIFT, 0); |
1055 | |
|
1056 | 0 | if (omethod == ORDER_METHOD_2LEVEL || |
1057 | 0 | omethod == ORDER_METHOD_4LEVEL || |
1058 | 0 | omethod == ORDER_METHOD_8LEVEL) { |
1059 | 0 | int levels = 1 << omethod; |
1060 | 0 | uint64_t bits[1 << ORDER_METHOD_8LEVEL]; |
1061 | 0 | int order = -1; |
1062 | 0 | int opt_index = levels-1; |
1063 | 0 | opt_order = max_order-1; |
1064 | 0 | bits[opt_index] = UINT32_MAX; |
1065 | 0 | for (i = levels-1; i >= 0; i--) { |
1066 | 0 | int last_order = order; |
1067 | 0 | order = min_order + (((max_order-min_order+1) * (i+1)) / levels)-1; |
1068 | 0 | order = av_clip(order, min_order - 1, max_order - 1); |
1069 | 0 | if (order == last_order) |
1070 | 0 | continue; |
1071 | 0 | if(lpc_encode_choose_datapath(s, sub->obits, res, smp, smp_33bps, n, order+1, coefs[order], shift[order])) |
1072 | 0 | continue; |
1073 | 0 | bits[i] = find_subframe_rice_params(s, sub, order+1); |
1074 | 0 | if (bits[i] < bits[opt_index]) { |
1075 | 0 | opt_index = i; |
1076 | 0 | opt_order = order; |
1077 | 0 | } |
1078 | 0 | } |
1079 | 0 | opt_order++; |
1080 | 0 | } else if (omethod == ORDER_METHOD_SEARCH) { |
1081 | | // brute-force optimal order search |
1082 | 0 | uint64_t bits[MAX_LPC_ORDER]; |
1083 | 0 | opt_order = 0; |
1084 | 0 | bits[0] = UINT32_MAX; |
1085 | 0 | for (i = min_order-1; i < max_order; i++) { |
1086 | 0 | if(lpc_encode_choose_datapath(s, sub->obits, res, smp, smp_33bps, n, i+1, coefs[i], shift[i])) |
1087 | 0 | continue; |
1088 | 0 | bits[i] = find_subframe_rice_params(s, sub, i+1); |
1089 | 0 | if (bits[i] < bits[opt_order]) |
1090 | 0 | opt_order = i; |
1091 | 0 | } |
1092 | 0 | opt_order++; |
1093 | 0 | } else if (omethod == ORDER_METHOD_LOG) { |
1094 | 0 | uint64_t bits[MAX_LPC_ORDER]; |
1095 | 0 | int step; |
1096 | |
|
1097 | 0 | opt_order = min_order - 1 + (max_order-min_order)/3; |
1098 | 0 | memset(bits, -1, sizeof(bits)); |
1099 | |
|
1100 | 0 | for (step = 16; step; step >>= 1) { |
1101 | 0 | int last = opt_order; |
1102 | 0 | for (i = last-step; i <= last+step; i += step) { |
1103 | 0 | if (i < min_order-1 || i >= max_order || bits[i] < UINT32_MAX) |
1104 | 0 | continue; |
1105 | 0 | if(lpc_encode_choose_datapath(s, sub->obits, res, smp, smp_33bps, n, i+1, coefs[i], shift[i])) |
1106 | 0 | continue; |
1107 | 0 | bits[i] = find_subframe_rice_params(s, sub, i+1); |
1108 | 0 | if (bits[i] < bits[opt_order]) |
1109 | 0 | opt_order = i; |
1110 | 0 | } |
1111 | 0 | } |
1112 | 0 | opt_order++; |
1113 | 0 | } |
1114 | |
|
1115 | 0 | if (s->options.multi_dim_quant) { |
1116 | 0 | int allsteps = 1; |
1117 | 0 | int i, step, improved; |
1118 | 0 | int64_t best_score = INT64_MAX; |
1119 | 0 | int32_t qmax; |
1120 | |
|
1121 | 0 | qmax = (1 << (s->options.lpc_coeff_precision - 1)) - 1; |
1122 | |
|
1123 | 0 | for (i=0; i<opt_order; i++) |
1124 | 0 | allsteps *= 3; |
1125 | |
|
1126 | 0 | do { |
1127 | 0 | improved = 0; |
1128 | 0 | for (step = 0; step < allsteps; step++) { |
1129 | 0 | int tmp = step; |
1130 | 0 | int32_t lpc_try[MAX_LPC_ORDER]; |
1131 | 0 | int64_t score = 0; |
1132 | 0 | int diffsum = 0; |
1133 | |
|
1134 | 0 | for (i=0; i<opt_order; i++) { |
1135 | 0 | int diff = ((tmp + 1) % 3) - 1; |
1136 | 0 | lpc_try[i] = av_clip(coefs[opt_order - 1][i] + diff, -qmax, qmax); |
1137 | 0 | tmp /= 3; |
1138 | 0 | diffsum += !!diff; |
1139 | 0 | } |
1140 | 0 | if (diffsum >8) |
1141 | 0 | continue; |
1142 | | |
1143 | 0 | if(lpc_encode_choose_datapath(s, sub->obits, res, smp, smp_33bps, n, opt_order, lpc_try, shift[opt_order-1])) |
1144 | 0 | continue; |
1145 | 0 | score = find_subframe_rice_params(s, sub, opt_order); |
1146 | 0 | if (score < best_score) { |
1147 | 0 | best_score = score; |
1148 | 0 | memcpy(coefs[opt_order-1], lpc_try, sizeof(*coefs)); |
1149 | 0 | improved=1; |
1150 | 0 | } |
1151 | 0 | } |
1152 | 0 | } while(improved); |
1153 | 0 | } |
1154 | |
|
1155 | 0 | sub->order = opt_order; |
1156 | 0 | sub->type_code = sub->type | (sub->order-1); |
1157 | 0 | sub->shift = shift[sub->order-1]; |
1158 | 0 | for (i = 0; i < sub->order; i++) |
1159 | 0 | sub->coefs[i] = coefs[sub->order-1][i]; |
1160 | |
|
1161 | 0 | if(lpc_encode_choose_datapath(s, sub->obits, res, smp, smp_33bps, n, sub->order, sub->coefs, sub->shift)) { |
1162 | | /* No predictor found with residuals within <INT32_MIN,INT32_MAX], |
1163 | | * so encode a verbatim subframe instead */ |
1164 | 0 | DEFAULT_TO_VERBATIM(); |
1165 | 0 | } |
1166 | | |
1167 | 0 | find_subframe_rice_params(s, sub, sub->order); |
1168 | |
|
1169 | 0 | return subframe_count_exact(s, sub, sub->order); |
1170 | 0 | } |
1171 | | |
1172 | | |
1173 | | static int count_frame_header(FlacEncodeContext *s) |
1174 | 0 | { |
1175 | 0 | av_unused uint8_t tmp; |
1176 | 0 | int count; |
1177 | | |
1178 | | /* |
1179 | | <14> Sync code |
1180 | | <1> Reserved |
1181 | | <1> Blocking strategy |
1182 | | <4> Block size in inter-channel samples |
1183 | | <4> Sample rate |
1184 | | <4> Channel assignment |
1185 | | <3> Sample size in bits |
1186 | | <1> Reserved |
1187 | | */ |
1188 | 0 | count = 32; |
1189 | | |
1190 | | /* coded frame number */ |
1191 | 0 | PUT_UTF8(s->frame_count, tmp, count += 8;) |
1192 | | |
1193 | | /* explicit block size */ |
1194 | 0 | if (s->frame.bs_code[0] == 6) |
1195 | 0 | count += 8; |
1196 | 0 | else if (s->frame.bs_code[0] == 7) |
1197 | 0 | count += 16; |
1198 | | |
1199 | | /* explicit sample rate */ |
1200 | 0 | count += ((s->sr_code[0] == 12) + (s->sr_code[0] > 12) * 2) * 8; |
1201 | | |
1202 | | /* frame header CRC-8 */ |
1203 | 0 | count += 8; |
1204 | |
|
1205 | 0 | return count; |
1206 | 0 | } |
1207 | | |
1208 | | |
1209 | | static int encode_frame(FlacEncodeContext *s) |
1210 | 0 | { |
1211 | 0 | int ch; |
1212 | 0 | uint64_t count; |
1213 | |
|
1214 | 0 | count = count_frame_header(s); |
1215 | |
|
1216 | 0 | for (ch = 0; ch < s->channels; ch++) |
1217 | 0 | count += encode_residual_ch(s, ch); |
1218 | |
|
1219 | 0 | count += (8 - (count & 7)) & 7; // byte alignment |
1220 | 0 | count += 16; // CRC-16 |
1221 | |
|
1222 | 0 | count >>= 3; |
1223 | 0 | if (count > INT_MAX) |
1224 | 0 | return AVERROR_BUG; |
1225 | 0 | return count; |
1226 | 0 | } |
1227 | | |
1228 | | |
1229 | | static void remove_wasted_bits(FlacEncodeContext *s) |
1230 | 0 | { |
1231 | 0 | int ch, i, wasted_bits; |
1232 | |
|
1233 | 0 | for (ch = 0; ch < s->channels; ch++) { |
1234 | 0 | FlacSubframe *sub = &s->frame.subframes[ch]; |
1235 | |
|
1236 | 0 | if (sub->obits > 32) { |
1237 | 0 | int64_t v = 0; |
1238 | 0 | for (i = 0; i < s->frame.blocksize; i++) { |
1239 | 0 | v |= s->frame.samples_33bps[i]; |
1240 | 0 | if (v & 1) |
1241 | 0 | break; |
1242 | 0 | } |
1243 | |
|
1244 | 0 | if (!v || (v & 1)) |
1245 | 0 | return; |
1246 | | |
1247 | 0 | v = ff_ctzll(v); |
1248 | | |
1249 | | /* If any wasted bits are found, samples are moved |
1250 | | * from frame.samples_33bps to frame.subframes[ch] */ |
1251 | 0 | for (i = 0; i < s->frame.blocksize; i++) |
1252 | 0 | sub->samples[i] = s->frame.samples_33bps[i] >> v; |
1253 | 0 | wasted_bits = v; |
1254 | 0 | } else { |
1255 | 0 | int32_t v = 0; |
1256 | 0 | for (i = 0; i < s->frame.blocksize; i++) { |
1257 | 0 | v |= sub->samples[i]; |
1258 | 0 | if (v & 1) |
1259 | 0 | break; |
1260 | 0 | } |
1261 | |
|
1262 | 0 | if (!v || (v & 1)) |
1263 | 0 | return; |
1264 | | |
1265 | 0 | v = ff_ctz(v); |
1266 | |
|
1267 | 0 | for (i = 0; i < s->frame.blocksize; i++) |
1268 | 0 | sub->samples[i] >>= v; |
1269 | 0 | wasted_bits = v; |
1270 | 0 | } |
1271 | | |
1272 | 0 | sub->wasted = wasted_bits; |
1273 | 0 | sub->obits -= wasted_bits; |
1274 | | |
1275 | | /* for 24-bit, check if removing wasted bits makes the range better |
1276 | | * suited for using RICE instead of RICE2 for entropy coding */ |
1277 | 0 | if (sub->obits <= 17) |
1278 | 0 | sub->rc.coding_mode = CODING_MODE_RICE; |
1279 | 0 | } |
1280 | 0 | } |
1281 | | |
1282 | | |
1283 | | static int estimate_stereo_mode(const int32_t *left_ch, const int32_t *right_ch, int n, |
1284 | | int max_rice_param, int bps) |
1285 | 0 | { |
1286 | 0 | int best; |
1287 | 0 | uint64_t sum[4]; |
1288 | 0 | uint64_t score[4]; |
1289 | 0 | int k; |
1290 | | |
1291 | | /* calculate sum of 2nd order residual for each channel */ |
1292 | 0 | sum[0] = sum[1] = sum[2] = sum[3] = 0; |
1293 | 0 | if(bps < 30) { |
1294 | 0 | int32_t lt, rt; |
1295 | 0 | for (int i = 2; i < n; i++) { |
1296 | 0 | lt = left_ch[i] - 2*left_ch[i-1] + left_ch[i-2]; |
1297 | 0 | rt = right_ch[i] - 2*right_ch[i-1] + right_ch[i-2]; |
1298 | 0 | sum[2] += FFABS((lt + rt) >> 1); |
1299 | 0 | sum[3] += FFABS(lt - rt); |
1300 | 0 | sum[0] += FFABS(lt); |
1301 | 0 | sum[1] += FFABS(rt); |
1302 | 0 | } |
1303 | 0 | } else { |
1304 | 0 | int64_t lt, rt; |
1305 | 0 | for (int i = 2; i < n; i++) { |
1306 | 0 | lt = (int64_t)left_ch[i] - 2*(int64_t)left_ch[i-1] + left_ch[i-2]; |
1307 | 0 | rt = (int64_t)right_ch[i] - 2*(int64_t)right_ch[i-1] + right_ch[i-2]; |
1308 | 0 | sum[2] += FFABS((lt + rt) >> 1); |
1309 | 0 | sum[3] += FFABS(lt - rt); |
1310 | 0 | sum[0] += FFABS(lt); |
1311 | 0 | sum[1] += FFABS(rt); |
1312 | 0 | } |
1313 | 0 | } |
1314 | | /* estimate bit counts */ |
1315 | 0 | for (int i = 0; i < 4; i++) { |
1316 | 0 | k = find_optimal_param(2 * sum[i], n, max_rice_param); |
1317 | 0 | sum[i] = rice_encode_count( 2 * sum[i], n, k); |
1318 | 0 | } |
1319 | | |
1320 | | /* calculate score for each mode */ |
1321 | 0 | score[0] = sum[0] + sum[1]; |
1322 | 0 | score[1] = sum[0] + sum[3]; |
1323 | 0 | score[2] = sum[1] + sum[3]; |
1324 | 0 | score[3] = sum[2] + sum[3]; |
1325 | | |
1326 | | /* return mode with lowest score */ |
1327 | 0 | best = 0; |
1328 | 0 | for (int i = 1; i < 4; i++) |
1329 | 0 | if (score[i] < score[best]) |
1330 | 0 | best = i; |
1331 | |
|
1332 | 0 | return best; |
1333 | 0 | } |
1334 | | |
1335 | | |
1336 | | /** |
1337 | | * Perform stereo channel decorrelation. |
1338 | | */ |
1339 | | static void channel_decorrelation(FlacEncodeContext *s) |
1340 | 0 | { |
1341 | 0 | FlacFrame *frame; |
1342 | 0 | int32_t *left, *right; |
1343 | 0 | int64_t *side_33bps; |
1344 | 0 | int n; |
1345 | |
|
1346 | 0 | frame = &s->frame; |
1347 | 0 | n = frame->blocksize; |
1348 | 0 | left = frame->subframes[0].samples; |
1349 | 0 | right = frame->subframes[1].samples; |
1350 | 0 | side_33bps = frame->samples_33bps; |
1351 | |
|
1352 | 0 | if (s->channels != 2) { |
1353 | 0 | frame->ch_mode = FLAC_CHMODE_INDEPENDENT; |
1354 | 0 | return; |
1355 | 0 | } |
1356 | | |
1357 | 0 | if (s->options.ch_mode < 0) { |
1358 | 0 | int max_rice_param = (1 << frame->subframes[0].rc.coding_mode) - 2; |
1359 | 0 | frame->ch_mode = estimate_stereo_mode(left, right, n, max_rice_param, s->avctx->bits_per_raw_sample); |
1360 | 0 | } else |
1361 | 0 | frame->ch_mode = s->options.ch_mode; |
1362 | | |
1363 | | /* perform decorrelation and adjust bits-per-sample */ |
1364 | 0 | if (frame->ch_mode == FLAC_CHMODE_INDEPENDENT) |
1365 | 0 | return; |
1366 | 0 | if(s->avctx->bits_per_raw_sample == 32) { |
1367 | 0 | if (frame->ch_mode == FLAC_CHMODE_MID_SIDE) { |
1368 | 0 | int64_t tmp; |
1369 | 0 | for (int i = 0; i < n; i++) { |
1370 | 0 | tmp = left[i]; |
1371 | 0 | left[i] = (tmp + right[i]) >> 1; |
1372 | 0 | side_33bps[i] = tmp - right[i]; |
1373 | 0 | } |
1374 | 0 | frame->subframes[1].obits++; |
1375 | 0 | } else if (frame->ch_mode == FLAC_CHMODE_LEFT_SIDE) { |
1376 | 0 | for (int i = 0; i < n; i++) |
1377 | 0 | side_33bps[i] = (int64_t)left[i] - right[i]; |
1378 | 0 | frame->subframes[1].obits++; |
1379 | 0 | } else { |
1380 | 0 | for (int i = 0; i < n; i++) |
1381 | 0 | side_33bps[i] = (int64_t)left[i] - right[i]; |
1382 | 0 | frame->subframes[0].obits++; |
1383 | 0 | } |
1384 | 0 | } else { |
1385 | 0 | if (frame->ch_mode == FLAC_CHMODE_MID_SIDE) { |
1386 | 0 | int32_t tmp; |
1387 | 0 | for (int i = 0; i < n; i++) { |
1388 | 0 | tmp = left[i]; |
1389 | 0 | left[i] = (tmp + right[i]) >> 1; |
1390 | 0 | right[i] = tmp - right[i]; |
1391 | 0 | } |
1392 | 0 | frame->subframes[1].obits++; |
1393 | 0 | } else if (frame->ch_mode == FLAC_CHMODE_LEFT_SIDE) { |
1394 | 0 | for (int i = 0; i < n; i++) |
1395 | 0 | right[i] = left[i] - right[i]; |
1396 | 0 | frame->subframes[1].obits++; |
1397 | 0 | } else { |
1398 | 0 | for (int i = 0; i < n; i++) |
1399 | 0 | left[i] -= right[i]; |
1400 | 0 | frame->subframes[0].obits++; |
1401 | 0 | } |
1402 | 0 | } |
1403 | 0 | } |
1404 | | |
1405 | | |
1406 | | static void write_utf8(PutBitContext *pb, uint32_t val) |
1407 | 0 | { |
1408 | 0 | uint8_t tmp; |
1409 | 0 | PUT_UTF8(val, tmp, put_bits(pb, 8, tmp);) |
1410 | 0 | } |
1411 | | |
1412 | | |
1413 | | static void write_frame_header(FlacEncodeContext *s) |
1414 | 0 | { |
1415 | 0 | FlacFrame *frame; |
1416 | 0 | int crc; |
1417 | |
|
1418 | 0 | frame = &s->frame; |
1419 | |
|
1420 | 0 | put_bits(&s->pb, 16, 0xFFF8); |
1421 | 0 | put_bits(&s->pb, 4, frame->bs_code[0]); |
1422 | 0 | put_bits(&s->pb, 4, s->sr_code[0]); |
1423 | |
|
1424 | 0 | if (frame->ch_mode == FLAC_CHMODE_INDEPENDENT) |
1425 | 0 | put_bits(&s->pb, 4, s->channels-1); |
1426 | 0 | else |
1427 | 0 | put_bits(&s->pb, 4, frame->ch_mode + FLAC_MAX_CHANNELS - 1); |
1428 | |
|
1429 | 0 | put_bits(&s->pb, 3, s->bps_code); |
1430 | 0 | put_bits(&s->pb, 1, 0); |
1431 | 0 | write_utf8(&s->pb, s->frame_count); |
1432 | |
|
1433 | 0 | if (frame->bs_code[0] == 6) |
1434 | 0 | put_bits(&s->pb, 8, frame->bs_code[1]); |
1435 | 0 | else if (frame->bs_code[0] == 7) |
1436 | 0 | put_bits(&s->pb, 16, frame->bs_code[1]); |
1437 | |
|
1438 | 0 | if (s->sr_code[0] == 12) |
1439 | 0 | put_bits(&s->pb, 8, s->sr_code[1]); |
1440 | 0 | else if (s->sr_code[0] > 12) |
1441 | 0 | put_bits(&s->pb, 16, s->sr_code[1]); |
1442 | |
|
1443 | 0 | flush_put_bits(&s->pb); |
1444 | 0 | crc = av_crc(av_crc_get_table(AV_CRC_8_ATM), 0, s->pb.buf, |
1445 | 0 | put_bytes_output(&s->pb)); |
1446 | 0 | put_bits(&s->pb, 8, crc); |
1447 | 0 | } |
1448 | | |
1449 | | |
1450 | | static inline void set_sr_golomb_flac(PutBitContext *pb, int i, int k) |
1451 | 0 | { |
1452 | 0 | unsigned v, e; |
1453 | |
|
1454 | 0 | v = ((unsigned)(i) << 1) ^ (i >> 31); |
1455 | |
|
1456 | 0 | e = (v >> k) + 1; |
1457 | 0 | while (e > 31) { |
1458 | 0 | put_bits(pb, 31, 0); |
1459 | 0 | e -= 31; |
1460 | 0 | } |
1461 | 0 | put_bits(pb, e, 1); |
1462 | 0 | if (k) { |
1463 | 0 | unsigned mask = UINT32_MAX >> (32-k); |
1464 | 0 | put_bits(pb, k, v & mask); |
1465 | 0 | } |
1466 | 0 | } |
1467 | | |
1468 | | |
1469 | | static void write_subframes(FlacEncodeContext *s) |
1470 | 0 | { |
1471 | 0 | int ch; |
1472 | |
|
1473 | 0 | for (ch = 0; ch < s->channels; ch++) { |
1474 | 0 | FlacSubframe *sub = &s->frame.subframes[ch]; |
1475 | 0 | int p, porder, psize; |
1476 | 0 | int32_t *part_end; |
1477 | 0 | int32_t *res = sub->residual; |
1478 | 0 | int32_t *frame_end = &sub->residual[s->frame.blocksize]; |
1479 | | |
1480 | | /* subframe header */ |
1481 | 0 | put_bits(&s->pb, 1, 0); |
1482 | 0 | put_bits(&s->pb, 6, sub->type_code); |
1483 | 0 | put_bits(&s->pb, 1, !!sub->wasted); |
1484 | 0 | if (sub->wasted) |
1485 | 0 | put_bits(&s->pb, sub->wasted, 1); |
1486 | | |
1487 | | /* subframe */ |
1488 | 0 | if (sub->type == FLAC_SUBFRAME_CONSTANT) { |
1489 | 0 | if(sub->obits == 33) |
1490 | 0 | put_sbits63(&s->pb, 33, s->frame.samples_33bps[0]); |
1491 | 0 | else if(sub->obits == 32) |
1492 | 0 | put_bits32(&s->pb, res[0]); |
1493 | 0 | else |
1494 | 0 | put_sbits(&s->pb, sub->obits, res[0]); |
1495 | 0 | } else if (sub->type == FLAC_SUBFRAME_VERBATIM) { |
1496 | 0 | if (sub->obits == 33) { |
1497 | 0 | int64_t *res64 = s->frame.samples_33bps; |
1498 | 0 | int64_t *frame_end64 = &s->frame.samples_33bps[s->frame.blocksize]; |
1499 | 0 | while (res64 < frame_end64) |
1500 | 0 | put_sbits63(&s->pb, 33, (*res64++)); |
1501 | 0 | } else if (sub->obits == 32) { |
1502 | 0 | while (res < frame_end) |
1503 | 0 | put_bits32(&s->pb, *res++); |
1504 | 0 | } else { |
1505 | 0 | while (res < frame_end) |
1506 | 0 | put_sbits(&s->pb, sub->obits, *res++); |
1507 | 0 | } |
1508 | 0 | } else { |
1509 | | /* warm-up samples */ |
1510 | 0 | if (sub->obits == 33) { |
1511 | 0 | for (int i = 0; i < sub->order; i++) |
1512 | 0 | put_sbits63(&s->pb, 33, s->frame.samples_33bps[i]); |
1513 | 0 | res += sub->order; |
1514 | 0 | } else if (sub->obits == 32) { |
1515 | 0 | for (int i = 0; i < sub->order; i++) |
1516 | 0 | put_bits32(&s->pb, *res++); |
1517 | 0 | } else { |
1518 | 0 | for (int i = 0; i < sub->order; i++) |
1519 | 0 | put_sbits(&s->pb, sub->obits, *res++); |
1520 | 0 | } |
1521 | | |
1522 | | /* LPC coefficients */ |
1523 | 0 | if (sub->type == FLAC_SUBFRAME_LPC) { |
1524 | 0 | int cbits = s->options.lpc_coeff_precision; |
1525 | 0 | put_bits( &s->pb, 4, cbits-1); |
1526 | 0 | put_sbits(&s->pb, 5, sub->shift); |
1527 | 0 | for (int i = 0; i < sub->order; i++) |
1528 | 0 | put_sbits(&s->pb, cbits, sub->coefs[i]); |
1529 | 0 | } |
1530 | | |
1531 | | /* rice-encoded block */ |
1532 | 0 | put_bits(&s->pb, 2, sub->rc.coding_mode - 4); |
1533 | | |
1534 | | /* partition order */ |
1535 | 0 | porder = sub->rc.porder; |
1536 | 0 | psize = s->frame.blocksize >> porder; |
1537 | 0 | put_bits(&s->pb, 4, porder); |
1538 | | |
1539 | | /* residual */ |
1540 | 0 | part_end = &sub->residual[psize]; |
1541 | 0 | for (p = 0; p < 1 << porder; p++) { |
1542 | 0 | int k = sub->rc.params[p]; |
1543 | 0 | put_bits(&s->pb, sub->rc.coding_mode, k); |
1544 | 0 | while (res < part_end) |
1545 | 0 | set_sr_golomb_flac(&s->pb, *res++, k); |
1546 | 0 | part_end = FFMIN(frame_end, part_end + psize); |
1547 | 0 | } |
1548 | 0 | } |
1549 | 0 | } |
1550 | 0 | } |
1551 | | |
1552 | | |
1553 | | static void write_frame_footer(FlacEncodeContext *s) |
1554 | 0 | { |
1555 | 0 | int crc; |
1556 | 0 | flush_put_bits(&s->pb); |
1557 | 0 | crc = av_bswap16(av_crc(av_crc_get_table(AV_CRC_16_ANSI), 0, s->pb.buf, |
1558 | 0 | put_bytes_output(&s->pb))); |
1559 | 0 | put_bits(&s->pb, 16, crc); |
1560 | 0 | flush_put_bits(&s->pb); |
1561 | 0 | } |
1562 | | |
1563 | | |
1564 | | static int write_frame(FlacEncodeContext *s, AVPacket *avpkt) |
1565 | 0 | { |
1566 | 0 | init_put_bits(&s->pb, avpkt->data, avpkt->size); |
1567 | 0 | write_frame_header(s); |
1568 | 0 | write_subframes(s); |
1569 | 0 | write_frame_footer(s); |
1570 | 0 | return put_bytes_output(&s->pb); |
1571 | 0 | } |
1572 | | |
1573 | | |
1574 | | static int update_md5_sum(FlacEncodeContext *s, const void *samples) |
1575 | 0 | { |
1576 | 0 | const uint8_t *buf; |
1577 | 0 | int buf_size = s->frame.blocksize * s->channels * |
1578 | 0 | ((s->avctx->bits_per_raw_sample + 7) / 8); |
1579 | |
|
1580 | 0 | if (s->avctx->bits_per_raw_sample > 16 || HAVE_BIGENDIAN) { |
1581 | 0 | av_fast_malloc(&s->md5_buffer, &s->md5_buffer_size, buf_size); |
1582 | 0 | if (!s->md5_buffer) |
1583 | 0 | return AVERROR(ENOMEM); |
1584 | 0 | } |
1585 | | |
1586 | 0 | if (s->avctx->bits_per_raw_sample <= 16) { |
1587 | 0 | buf = (const uint8_t *)samples; |
1588 | | #if HAVE_BIGENDIAN |
1589 | | s->bdsp.bswap16_buf((uint16_t *) s->md5_buffer, |
1590 | | (const uint16_t *) samples, buf_size / 2); |
1591 | | buf = s->md5_buffer; |
1592 | | #endif |
1593 | 0 | } else if (s->avctx->bits_per_raw_sample <= 24) { |
1594 | 0 | int i; |
1595 | 0 | const int32_t *samples0 = samples; |
1596 | 0 | uint8_t *tmp = s->md5_buffer; |
1597 | |
|
1598 | 0 | for (i = 0; i < s->frame.blocksize * s->channels; i++) { |
1599 | 0 | int32_t v = samples0[i] >> 8; |
1600 | 0 | AV_WL24(tmp + 3*i, v); |
1601 | 0 | } |
1602 | 0 | buf = s->md5_buffer; |
1603 | 0 | } else { |
1604 | | /* s->avctx->bits_per_raw_sample <= 32 */ |
1605 | 0 | int i; |
1606 | 0 | const int32_t *samples0 = samples; |
1607 | 0 | uint8_t *tmp = s->md5_buffer; |
1608 | |
|
1609 | 0 | for (i = 0; i < s->frame.blocksize * s->channels; i++) |
1610 | 0 | AV_WL32(tmp + 4*i, samples0[i]); |
1611 | 0 | buf = s->md5_buffer; |
1612 | 0 | } |
1613 | 0 | av_md5_update(s->md5ctx, buf, buf_size); |
1614 | |
|
1615 | 0 | return 0; |
1616 | 0 | } |
1617 | | |
1618 | | |
1619 | | static int flac_encode_frame(AVCodecContext *avctx, AVPacket *avpkt, |
1620 | | const AVFrame *frame, int *got_packet_ptr) |
1621 | 0 | { |
1622 | 0 | FlacEncodeContext *s; |
1623 | 0 | int frame_bytes, out_bytes, ret; |
1624 | |
|
1625 | 0 | s = avctx->priv_data; |
1626 | | |
1627 | | /* when the last block is reached, update the header in extradata */ |
1628 | 0 | if (!frame) { |
1629 | 0 | s->max_framesize = s->max_encoded_framesize; |
1630 | 0 | av_md5_final(s->md5ctx, s->md5sum); |
1631 | 0 | write_streaminfo(s, avctx->extradata); |
1632 | |
|
1633 | 0 | if (!s->flushed) { |
1634 | 0 | uint8_t *side_data = av_packet_new_side_data(avpkt, AV_PKT_DATA_NEW_EXTRADATA, |
1635 | 0 | avctx->extradata_size); |
1636 | 0 | if (!side_data) |
1637 | 0 | return AVERROR(ENOMEM); |
1638 | 0 | memcpy(side_data, avctx->extradata, avctx->extradata_size); |
1639 | |
|
1640 | 0 | avpkt->pts = s->next_pts; |
1641 | |
|
1642 | 0 | *got_packet_ptr = 1; |
1643 | 0 | s->flushed = 1; |
1644 | 0 | } |
1645 | | |
1646 | 0 | return 0; |
1647 | 0 | } |
1648 | | |
1649 | | /* change max_framesize for small final frame */ |
1650 | 0 | if (frame->nb_samples < s->frame.blocksize) { |
1651 | 0 | s->max_framesize = flac_get_max_frame_size(frame->nb_samples, |
1652 | 0 | s->channels, |
1653 | 0 | avctx->bits_per_raw_sample); |
1654 | 0 | } |
1655 | |
|
1656 | 0 | init_frame(s, frame->nb_samples); |
1657 | |
|
1658 | 0 | copy_samples(s, frame->data[0]); |
1659 | |
|
1660 | 0 | channel_decorrelation(s); |
1661 | |
|
1662 | 0 | remove_wasted_bits(s); |
1663 | |
|
1664 | 0 | frame_bytes = encode_frame(s); |
1665 | | |
1666 | | /* Fall back on verbatim mode if the compressed frame is larger than it |
1667 | | would be if encoded uncompressed. */ |
1668 | 0 | if (frame_bytes < 0 || frame_bytes > s->max_framesize) { |
1669 | 0 | s->frame.verbatim_only = 1; |
1670 | 0 | frame_bytes = encode_frame(s); |
1671 | 0 | if (frame_bytes < 0) { |
1672 | 0 | av_log(avctx, AV_LOG_ERROR, "Bad frame count\n"); |
1673 | 0 | return frame_bytes; |
1674 | 0 | } |
1675 | 0 | } |
1676 | | |
1677 | 0 | if ((ret = ff_get_encode_buffer(avctx, avpkt, frame_bytes, 0)) < 0) |
1678 | 0 | return ret; |
1679 | | |
1680 | 0 | out_bytes = write_frame(s, avpkt); |
1681 | |
|
1682 | 0 | s->frame_count++; |
1683 | 0 | s->sample_count += frame->nb_samples; |
1684 | 0 | if ((ret = update_md5_sum(s, frame->data[0])) < 0) { |
1685 | 0 | av_log(avctx, AV_LOG_ERROR, "Error updating MD5 checksum\n"); |
1686 | 0 | return ret; |
1687 | 0 | } |
1688 | 0 | if (out_bytes > s->max_encoded_framesize) |
1689 | 0 | s->max_encoded_framesize = out_bytes; |
1690 | 0 | if (out_bytes < s->min_framesize) |
1691 | 0 | s->min_framesize = out_bytes; |
1692 | |
|
1693 | 0 | s->next_pts = frame->pts + ff_samples_to_time_base(avctx, frame->nb_samples); |
1694 | |
|
1695 | 0 | av_shrink_packet(avpkt, out_bytes); |
1696 | |
|
1697 | 0 | *got_packet_ptr = 1; |
1698 | 0 | return 0; |
1699 | 0 | } |
1700 | | |
1701 | | |
1702 | | static av_cold int flac_encode_close(AVCodecContext *avctx) |
1703 | 0 | { |
1704 | 0 | FlacEncodeContext *s = avctx->priv_data; |
1705 | |
|
1706 | 0 | av_freep(&s->md5ctx); |
1707 | 0 | av_freep(&s->md5_buffer); |
1708 | 0 | ff_lpc_end(&s->lpc_ctx); |
1709 | 0 | return 0; |
1710 | 0 | } |
1711 | | |
1712 | | #define FLAGS AV_OPT_FLAG_ENCODING_PARAM | AV_OPT_FLAG_AUDIO_PARAM |
1713 | | static const AVOption options[] = { |
1714 | | { "lpc_coeff_precision", "LPC coefficient precision", offsetof(FlacEncodeContext, options.lpc_coeff_precision), AV_OPT_TYPE_INT, {.i64 = 15 }, 0, MAX_LPC_PRECISION, FLAGS }, |
1715 | | { "lpc_type", "LPC algorithm", offsetof(FlacEncodeContext, options.lpc_type), AV_OPT_TYPE_INT, {.i64 = FF_LPC_TYPE_DEFAULT }, FF_LPC_TYPE_DEFAULT, FF_LPC_TYPE_NB-1, FLAGS, .unit = "lpc_type" }, |
1716 | | { "none", NULL, 0, AV_OPT_TYPE_CONST, {.i64 = FF_LPC_TYPE_NONE }, INT_MIN, INT_MAX, FLAGS, .unit = "lpc_type" }, |
1717 | | { "fixed", NULL, 0, AV_OPT_TYPE_CONST, {.i64 = FF_LPC_TYPE_FIXED }, INT_MIN, INT_MAX, FLAGS, .unit = "lpc_type" }, |
1718 | | { "levinson", NULL, 0, AV_OPT_TYPE_CONST, {.i64 = FF_LPC_TYPE_LEVINSON }, INT_MIN, INT_MAX, FLAGS, .unit = "lpc_type" }, |
1719 | | { "cholesky", NULL, 0, AV_OPT_TYPE_CONST, {.i64 = FF_LPC_TYPE_CHOLESKY }, INT_MIN, INT_MAX, FLAGS, .unit = "lpc_type" }, |
1720 | | { "lpc_passes", "Number of passes to use for Cholesky factorization during LPC analysis", offsetof(FlacEncodeContext, options.lpc_passes), AV_OPT_TYPE_INT, {.i64 = 2 }, 1, INT_MAX, FLAGS }, |
1721 | | { "min_partition_order", NULL, offsetof(FlacEncodeContext, options.min_partition_order), AV_OPT_TYPE_INT, {.i64 = -1 }, -1, MAX_PARTITION_ORDER, FLAGS }, |
1722 | | { "max_partition_order", NULL, offsetof(FlacEncodeContext, options.max_partition_order), AV_OPT_TYPE_INT, {.i64 = -1 }, -1, MAX_PARTITION_ORDER, FLAGS }, |
1723 | | { "prediction_order_method", "Search method for selecting prediction order", offsetof(FlacEncodeContext, options.prediction_order_method), AV_OPT_TYPE_INT, {.i64 = -1 }, -1, ORDER_METHOD_LOG, FLAGS, .unit = "predm" }, |
1724 | | { "estimation", NULL, 0, AV_OPT_TYPE_CONST, {.i64 = ORDER_METHOD_EST }, INT_MIN, INT_MAX, FLAGS, .unit = "predm" }, |
1725 | | { "2level", NULL, 0, AV_OPT_TYPE_CONST, {.i64 = ORDER_METHOD_2LEVEL }, INT_MIN, INT_MAX, FLAGS, .unit = "predm" }, |
1726 | | { "4level", NULL, 0, AV_OPT_TYPE_CONST, {.i64 = ORDER_METHOD_4LEVEL }, INT_MIN, INT_MAX, FLAGS, .unit = "predm" }, |
1727 | | { "8level", NULL, 0, AV_OPT_TYPE_CONST, {.i64 = ORDER_METHOD_8LEVEL }, INT_MIN, INT_MAX, FLAGS, .unit = "predm" }, |
1728 | | { "search", NULL, 0, AV_OPT_TYPE_CONST, {.i64 = ORDER_METHOD_SEARCH }, INT_MIN, INT_MAX, FLAGS, .unit = "predm" }, |
1729 | | { "log", NULL, 0, AV_OPT_TYPE_CONST, {.i64 = ORDER_METHOD_LOG }, INT_MIN, INT_MAX, FLAGS, .unit = "predm" }, |
1730 | | { "ch_mode", "Stereo decorrelation mode", offsetof(FlacEncodeContext, options.ch_mode), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, FLAC_CHMODE_MID_SIDE, FLAGS, .unit = "ch_mode" }, |
1731 | | { "auto", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = -1 }, INT_MIN, INT_MAX, FLAGS, .unit = "ch_mode" }, |
1732 | | { "indep", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = FLAC_CHMODE_INDEPENDENT }, INT_MIN, INT_MAX, FLAGS, .unit = "ch_mode" }, |
1733 | | { "left_side", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = FLAC_CHMODE_LEFT_SIDE }, INT_MIN, INT_MAX, FLAGS, .unit = "ch_mode" }, |
1734 | | { "right_side", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = FLAC_CHMODE_RIGHT_SIDE }, INT_MIN, INT_MAX, FLAGS, .unit = "ch_mode" }, |
1735 | | { "mid_side", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = FLAC_CHMODE_MID_SIDE }, INT_MIN, INT_MAX, FLAGS, .unit = "ch_mode" }, |
1736 | | { "exact_rice_parameters", "Calculate rice parameters exactly", offsetof(FlacEncodeContext, options.exact_rice_parameters), AV_OPT_TYPE_BOOL, { .i64 = 0 }, 0, 1, FLAGS }, |
1737 | | { "multi_dim_quant", "Multi-dimensional quantization", offsetof(FlacEncodeContext, options.multi_dim_quant), AV_OPT_TYPE_BOOL, { .i64 = 0 }, 0, 1, FLAGS }, |
1738 | | { "min_prediction_order", NULL, offsetof(FlacEncodeContext, options.min_prediction_order), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, MAX_LPC_ORDER, FLAGS }, |
1739 | | { "max_prediction_order", NULL, offsetof(FlacEncodeContext, options.max_prediction_order), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, MAX_LPC_ORDER, FLAGS }, |
1740 | | |
1741 | | { NULL }, |
1742 | | }; |
1743 | | |
1744 | | static const AVClass flac_encoder_class = { |
1745 | | .class_name = "FLAC encoder", |
1746 | | .item_name = av_default_item_name, |
1747 | | .option = options, |
1748 | | .version = LIBAVUTIL_VERSION_INT, |
1749 | | }; |
1750 | | |
1751 | | const FFCodec ff_flac_encoder = { |
1752 | | .p.name = "flac", |
1753 | | CODEC_LONG_NAME("FLAC (Free Lossless Audio Codec)"), |
1754 | | .p.type = AVMEDIA_TYPE_AUDIO, |
1755 | | .p.id = AV_CODEC_ID_FLAC, |
1756 | | .p.capabilities = AV_CODEC_CAP_DR1 | AV_CODEC_CAP_DELAY | |
1757 | | AV_CODEC_CAP_SMALL_LAST_FRAME | |
1758 | | AV_CODEC_CAP_ENCODER_REORDERED_OPAQUE, |
1759 | | .priv_data_size = sizeof(FlacEncodeContext), |
1760 | | .init = flac_encode_init, |
1761 | | FF_CODEC_ENCODE_CB(flac_encode_frame), |
1762 | | .close = flac_encode_close, |
1763 | | CODEC_SAMPLEFMTS(AV_SAMPLE_FMT_S16, AV_SAMPLE_FMT_S32), |
1764 | | .p.priv_class = &flac_encoder_class, |
1765 | | .caps_internal = FF_CODEC_CAP_INIT_CLEANUP | FF_CODEC_CAP_EOF_FLUSH, |
1766 | | }; |