/src/ffmpeg/libavformat/iamfdec.c
Line | Count | Source (jump to first uncovered line) |
1 | | /* |
2 | | * Immersive Audio Model and Formats demuxer |
3 | | * Copyright (c) 2023 James Almer <jamrial@gmail.com> |
4 | | * |
5 | | * This file is part of FFmpeg. |
6 | | * |
7 | | * FFmpeg is free software; you can redistribute it and/or |
8 | | * modify it under the terms of the GNU Lesser General Public |
9 | | * License as published by the Free Software Foundation; either |
10 | | * version 2.1 of the License, or (at your option) any later version. |
11 | | * |
12 | | * FFmpeg is distributed in the hope that it will be useful, |
13 | | * but WITHOUT ANY WARRANTY; without even the implied warranty of |
14 | | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU |
15 | | * Lesser General Public License for more details. |
16 | | * |
17 | | * You should have received a copy of the GNU Lesser General Public |
18 | | * License along with FFmpeg; if not, write to the Free Software |
19 | | * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA |
20 | | */ |
21 | | |
22 | | #include "libavutil/avassert.h" |
23 | | #include "libavutil/intreadwrite.h" |
24 | | #include "avformat.h" |
25 | | #include "demux.h" |
26 | | #include "iamf.h" |
27 | | #include "iamf_reader.h" |
28 | | #include "iamf_parse.h" |
29 | | #include "internal.h" |
30 | | |
31 | | //return < 0 if we need more data |
32 | | static int get_score(const uint8_t *buf, int buf_size, enum IAMF_OBU_Type type, int *seq) |
33 | 205k | { |
34 | 205k | if (type == IAMF_OBU_IA_SEQUENCE_HEADER) { |
35 | 19.0k | if (buf_size < 4 || AV_RB32(buf) != MKBETAG('i','a','m','f')) |
36 | 18.8k | return 0; |
37 | 183 | *seq = 1; |
38 | 183 | return -1; |
39 | 19.0k | } |
40 | 186k | if (type >= IAMF_OBU_IA_CODEC_CONFIG && type <= IAMF_OBU_IA_TEMPORAL_DELIMITER) |
41 | 96.1k | return *seq ? -1 : 0; |
42 | 90.6k | if (type >= IAMF_OBU_IA_AUDIO_FRAME && type <= IAMF_OBU_IA_AUDIO_FRAME_ID17) |
43 | 84.8k | return *seq ? AVPROBE_SCORE_EXTENSION + 1 : 0; |
44 | 5.74k | return 0; |
45 | 90.6k | } |
46 | | |
47 | | static int iamf_probe(const AVProbeData *p) |
48 | 358k | { |
49 | 358k | unsigned obu_size; |
50 | 358k | enum IAMF_OBU_Type type; |
51 | 358k | int seq = 0, cnt = 0, start_pos; |
52 | 358k | int ret; |
53 | | |
54 | 360k | while (1) { |
55 | 360k | int size = ff_iamf_parse_obu_header(p->buf + cnt, p->buf_size - cnt, |
56 | 360k | &obu_size, &start_pos, &type, |
57 | 360k | NULL, NULL); |
58 | 360k | if (size < 0) |
59 | 154k | return 0; |
60 | | |
61 | 205k | ret = get_score(p->buf + cnt + start_pos, |
62 | 205k | p->buf_size - cnt - start_pos, |
63 | 205k | type, &seq); |
64 | 205k | if (ret >= 0) |
65 | 204k | return ret; |
66 | | |
67 | 1.76k | cnt += FFMIN(size, p->buf_size - cnt); |
68 | 1.76k | } |
69 | 0 | return 0; |
70 | 358k | } |
71 | | |
72 | | static int iamf_read_header(AVFormatContext *s) |
73 | 5.35k | { |
74 | 5.35k | IAMFDemuxContext *const c = s->priv_data; |
75 | 5.35k | IAMFContext *const iamf = &c->iamf; |
76 | 5.35k | int ret; |
77 | | |
78 | 5.35k | ret = ff_iamfdec_read_descriptors(iamf, s->pb, INT_MAX, s); |
79 | 5.35k | if (ret < 0) |
80 | 5.19k | return ret; |
81 | | |
82 | 165 | for (int i = 0; i < iamf->nb_audio_elements; i++) { |
83 | 6 | IAMFAudioElement *audio_element = iamf->audio_elements[i]; |
84 | 6 | AVStreamGroup *stg = avformat_stream_group_create(s, AV_STREAM_GROUP_PARAMS_IAMF_AUDIO_ELEMENT, NULL); |
85 | | |
86 | 6 | if (!stg) |
87 | 0 | return AVERROR(ENOMEM); |
88 | | |
89 | 6 | av_iamf_audio_element_free(&stg->params.iamf_audio_element); |
90 | 6 | stg->id = audio_element->audio_element_id; |
91 | | /* Transfer ownership */ |
92 | 6 | stg->params.iamf_audio_element = audio_element->element; |
93 | 6 | audio_element->element = NULL; |
94 | | |
95 | 30 | for (int j = 0; j < audio_element->nb_substreams; j++) { |
96 | 24 | IAMFSubStream *substream = &audio_element->substreams[j]; |
97 | 24 | AVStream *st = avformat_new_stream(s, NULL); |
98 | | |
99 | 24 | if (!st) |
100 | 0 | return AVERROR(ENOMEM); |
101 | | |
102 | 24 | ret = avformat_stream_group_add_stream(stg, st); |
103 | 24 | if (ret < 0) |
104 | 0 | return ret; |
105 | | |
106 | 24 | ret = avcodec_parameters_copy(st->codecpar, substream->codecpar); |
107 | 24 | if (ret < 0) |
108 | 0 | return ret; |
109 | | |
110 | 24 | if (!i && !j && audio_element->layers[0].substream_count == 1) |
111 | 6 | st->disposition |= AV_DISPOSITION_DEFAULT; |
112 | 18 | else |
113 | 18 | st->disposition |= AV_DISPOSITION_DEPENDENT; |
114 | 24 | st->id = substream->audio_substream_id; |
115 | 24 | avpriv_set_pts_info(st, 64, 1, st->codecpar->sample_rate); |
116 | 24 | } |
117 | 6 | } |
118 | | |
119 | 197 | for (int i = 0; i < iamf->nb_mix_presentations; i++) { |
120 | 38 | IAMFMixPresentation *mix_presentation = iamf->mix_presentations[i]; |
121 | 38 | AVStreamGroup *stg = avformat_stream_group_create(s, AV_STREAM_GROUP_PARAMS_IAMF_MIX_PRESENTATION, NULL); |
122 | 38 | const AVIAMFMixPresentation *mix = mix_presentation->cmix; |
123 | | |
124 | 38 | if (!stg) |
125 | 0 | return AVERROR(ENOMEM); |
126 | | |
127 | 38 | av_iamf_mix_presentation_free(&stg->params.iamf_mix_presentation); |
128 | 38 | stg->id = mix_presentation->mix_presentation_id; |
129 | | /* Transfer ownership */ |
130 | 38 | stg->params.iamf_mix_presentation = mix_presentation->mix; |
131 | 38 | mix_presentation->mix = NULL; |
132 | | |
133 | 59 | for (int j = 0; j < mix->nb_submixes; j++) { |
134 | 21 | const AVIAMFSubmix *sub_mix = mix->submixes[j]; |
135 | | |
136 | 27 | for (int k = 0; k < sub_mix->nb_elements; k++) { |
137 | 6 | const AVIAMFSubmixElement *submix_element = sub_mix->elements[k]; |
138 | 6 | AVStreamGroup *audio_element = NULL; |
139 | | |
140 | 6 | for (int l = 0; l < s->nb_stream_groups; l++) |
141 | 6 | if (s->stream_groups[l]->type == AV_STREAM_GROUP_PARAMS_IAMF_AUDIO_ELEMENT && |
142 | 6 | s->stream_groups[l]->id == submix_element->audio_element_id) { |
143 | 6 | audio_element = s->stream_groups[l]; |
144 | 6 | break; |
145 | 6 | } |
146 | 6 | av_assert0(audio_element); |
147 | | |
148 | 30 | for (int l = 0; l < audio_element->nb_streams; l++) { |
149 | 24 | ret = avformat_stream_group_add_stream(stg, audio_element->streams[l]); |
150 | 24 | if (ret < 0 && ret != AVERROR(EEXIST)) |
151 | 0 | return ret; |
152 | 24 | } |
153 | 6 | } |
154 | 21 | } |
155 | 38 | } |
156 | | |
157 | 159 | if (!s->nb_streams) |
158 | 153 | return AVERROR_INVALIDDATA; |
159 | | |
160 | 6 | return 0; |
161 | 159 | } |
162 | | |
163 | | static int iamf_read_packet(AVFormatContext *s, AVPacket *pkt) |
164 | 204 | { |
165 | 204 | IAMFDemuxContext *const c = s->priv_data; |
166 | 204 | int ret; |
167 | | |
168 | 204 | ret = ff_iamf_read_packet(s, c, s->pb, INT_MAX, pkt); |
169 | 204 | if (ret < 0) |
170 | 6 | return ret; |
171 | | |
172 | 198 | return 0; |
173 | 204 | } |
174 | | |
175 | | static int iamf_read_close(AVFormatContext *s) |
176 | 5.35k | { |
177 | 5.35k | IAMFDemuxContext *const c = s->priv_data; |
178 | | |
179 | 5.35k | ff_iamf_read_deinit(c); |
180 | | |
181 | 5.35k | return 0; |
182 | 5.35k | } |
183 | | |
184 | | const FFInputFormat ff_iamf_demuxer = { |
185 | | .p.name = "iamf", |
186 | | .p.long_name = NULL_IF_CONFIG_SMALL("Raw Immersive Audio Model and Formats"), |
187 | | .p.extensions = "iamf", |
188 | | .p.flags = AVFMT_GENERIC_INDEX | AVFMT_NO_BYTE_SEEK | AVFMT_NOTIMESTAMPS | AVFMT_SHOW_IDS, |
189 | | .priv_data_size = sizeof(IAMFDemuxContext), |
190 | | .flags_internal = FF_INFMT_FLAG_INIT_CLEANUP, |
191 | | .read_probe = iamf_probe, |
192 | | .read_header = iamf_read_header, |
193 | | .read_packet = iamf_read_packet, |
194 | | .read_close = iamf_read_close, |
195 | | }; |