FFmpeg
iamf_parse.c
Go to the documentation of this file.
1 /*
2  * Immersive Audio Model and Formats parsing
3  * Copyright (c) 2023 James Almer <jamrial@gmail.com>
4  *
5  * This file is part of FFmpeg.
6  *
7  * FFmpeg is free software; you can redistribute it and/or
8  * modify it under the terms of the GNU Lesser General Public
9  * License as published by the Free Software Foundation; either
10  * version 2.1 of the License, or (at your option) any later version.
11  *
12  * FFmpeg is distributed in the hope that it will be useful,
13  * but WITHOUT ANY WARRANTY; without even the implied warranty of
14  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
15  * Lesser General Public License for more details.
16  *
17  * You should have received a copy of the GNU Lesser General Public
18  * License along with FFmpeg; if not, write to the Free Software
19  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
20  */
21 
22 #include "libavutil/avassert.h"
23 #include "libavutil/common.h"
24 #include "libavutil/iamf.h"
25 #include "libavutil/intreadwrite.h"
26 #include "libavutil/log.h"
27 #include "libavcodec/get_bits.h"
28 #include "libavcodec/flac.h"
29 #include "libavcodec/leb.h"
30 #include "libavcodec/mpeg4audio.h"
31 #include "libavcodec/put_bits.h"
32 #include "avio_internal.h"
33 #include "iamf_parse.h"
34 #include "isom.h"
35 
36 static int opus_decoder_config(IAMFCodecConfig *codec_config,
37  AVIOContext *pb, int len)
38 {
39  int left = len - avio_tell(pb);
40 
41  if (left < 11 || codec_config->audio_roll_distance >= 0)
42  return AVERROR_INVALIDDATA;
43 
44  codec_config->extradata = av_malloc(left + 8);
45  if (!codec_config->extradata)
46  return AVERROR(ENOMEM);
47 
48  AV_WB32(codec_config->extradata, MKBETAG('O','p','u','s'));
49  AV_WB32(codec_config->extradata + 4, MKBETAG('H','e','a','d'));
50  codec_config->extradata_size = avio_read(pb, codec_config->extradata + 8, left);
51  if (codec_config->extradata_size < left)
52  return AVERROR_INVALIDDATA;
53 
54  codec_config->extradata_size += 8;
55  codec_config->sample_rate = 48000;
56 
57  return 0;
58 }
59 
60 static int aac_decoder_config(IAMFCodecConfig *codec_config,
61  AVIOContext *pb, int len, void *logctx)
62 {
63  MPEG4AudioConfig cfg = { 0 };
64  int object_type_id, codec_id, stream_type;
65  int ret, tag, left;
66 
67  if (codec_config->audio_roll_distance >= 0)
68  return AVERROR_INVALIDDATA;
69 
70  ff_mp4_read_descr(logctx, pb, &tag);
72  return AVERROR_INVALIDDATA;
73 
74  object_type_id = avio_r8(pb);
75  if (object_type_id != 0x40)
76  return AVERROR_INVALIDDATA;
77 
78  stream_type = avio_r8(pb);
79  if (((stream_type >> 2) != 5) || ((stream_type >> 1) & 1))
80  return AVERROR_INVALIDDATA;
81 
82  avio_skip(pb, 3); // buffer size db
83  avio_skip(pb, 4); // rc_max_rate
84  avio_skip(pb, 4); // avg bitrate
85 
86  codec_id = ff_codec_get_id(ff_mp4_obj_type, object_type_id);
87  if (codec_id && codec_id != codec_config->codec_id)
88  return AVERROR_INVALIDDATA;
89 
90  left = ff_mp4_read_descr(logctx, pb, &tag);
91  if (tag != MP4DecSpecificDescrTag ||
92  !left || left > (len - avio_tell(pb)))
93  return AVERROR_INVALIDDATA;
94 
95  // We pad extradata here because avpriv_mpeg4audio_get_config2() needs it.
96  codec_config->extradata = av_malloc((size_t)left + AV_INPUT_BUFFER_PADDING_SIZE);
97  if (!codec_config->extradata)
98  return AVERROR(ENOMEM);
99 
100  ret = ffio_read_size(pb, codec_config->extradata, left);
101  if (ret < 0)
102  return ret;
103  codec_config->extradata_size = left;
104  memset(codec_config->extradata + codec_config->extradata_size, 0,
106 
107  ret = avpriv_mpeg4audio_get_config2(&cfg, codec_config->extradata,
108  codec_config->extradata_size, 1, logctx);
109  if (ret < 0)
110  return ret;
111 
112  codec_config->sample_rate = cfg.sample_rate;
113 
114  return 0;
115 }
116 
117 static int flac_decoder_config(IAMFCodecConfig *codec_config,
118  AVIOContext *pb, int len)
119 {
120  int left;
121 
122  if (codec_config->audio_roll_distance)
123  return AVERROR_INVALIDDATA;
124 
125  avio_skip(pb, 4); // METADATA_BLOCK_HEADER
126 
127  left = len - avio_tell(pb);
129  return AVERROR_INVALIDDATA;
130 
131  codec_config->extradata = av_malloc(left);
132  if (!codec_config->extradata)
133  return AVERROR(ENOMEM);
134 
135  codec_config->extradata_size = avio_read(pb, codec_config->extradata, left);
136  if (codec_config->extradata_size < left)
137  return AVERROR_INVALIDDATA;
138 
139  codec_config->sample_rate = AV_RB24(codec_config->extradata + 10) >> 4;
140 
141  return 0;
142 }
143 
144 static int ipcm_decoder_config(IAMFCodecConfig *codec_config,
145  AVIOContext *pb, int len)
146 {
147  static const enum AVCodecID sample_fmt[2][3] = {
150  };
151  int sample_format = avio_r8(pb); // 0 = BE, 1 = LE
152  int sample_size = (avio_r8(pb) / 8 - 2); // 16, 24, 32
153  if (sample_format > 1 || sample_size > 2U || codec_config->audio_roll_distance)
154  return AVERROR_INVALIDDATA;
155 
156  codec_config->codec_id = sample_fmt[sample_format][sample_size];
157  codec_config->sample_rate = avio_rb32(pb);
158 
159  if (len - avio_tell(pb))
160  return AVERROR_INVALIDDATA;
161 
162  return 0;
163 }
164 
165 static int codec_config_obu(void *s, IAMFContext *c, AVIOContext *pb, int len)
166 {
167  IAMFCodecConfig **tmp, *codec_config = NULL;
168  FFIOContext b;
169  AVIOContext *pbc;
170  uint8_t *buf;
171  enum AVCodecID avcodec_id;
172  unsigned codec_config_id, nb_samples, codec_id;
173  int16_t audio_roll_distance;
174  int ret;
175 
176  buf = av_malloc(len);
177  if (!buf)
178  return AVERROR(ENOMEM);
179 
180  ret = avio_read(pb, buf, len);
181  if (ret != len) {
182  if (ret >= 0)
184  goto fail;
185  }
186 
187  ffio_init_context(&b, buf, len, 0, NULL, NULL, NULL, NULL);
188  pbc = &b.pub;
189 
190  codec_config_id = ffio_read_leb(pbc);
191  codec_id = avio_rb32(pbc);
192  nb_samples = ffio_read_leb(pbc);
193  audio_roll_distance = avio_rb16(pbc);
194 
195  switch(codec_id) {
196  case MKBETAG('O','p','u','s'):
197  avcodec_id = AV_CODEC_ID_OPUS;
198  break;
199  case MKBETAG('m','p','4','a'):
200  avcodec_id = AV_CODEC_ID_AAC;
201  break;
202  case MKBETAG('f','L','a','C'):
203  avcodec_id = AV_CODEC_ID_FLAC;
204  break;
205  default:
206  avcodec_id = AV_CODEC_ID_NONE;
207  break;
208  }
209 
210  for (int i = 0; i < c->nb_codec_configs; i++)
211  if (c->codec_configs[i]->codec_config_id == codec_config_id) {
213  goto fail;
214  }
215 
216  tmp = av_realloc_array(c->codec_configs, c->nb_codec_configs + 1, sizeof(*c->codec_configs));
217  if (!tmp) {
218  ret = AVERROR(ENOMEM);
219  goto fail;
220  }
221  c->codec_configs = tmp;
222 
223  codec_config = av_mallocz(sizeof(*codec_config));
224  if (!codec_config) {
225  ret = AVERROR(ENOMEM);
226  goto fail;
227  }
228 
229  codec_config->codec_config_id = codec_config_id;
230  codec_config->codec_id = avcodec_id;
231  codec_config->nb_samples = nb_samples;
232  codec_config->audio_roll_distance = audio_roll_distance;
233 
234  switch(codec_id) {
235  case MKBETAG('O','p','u','s'):
236  ret = opus_decoder_config(codec_config, pbc, len);
237  break;
238  case MKBETAG('m','p','4','a'):
239  ret = aac_decoder_config(codec_config, pbc, len, s);
240  break;
241  case MKBETAG('f','L','a','C'):
242  ret = flac_decoder_config(codec_config, pbc, len);
243  break;
244  case MKBETAG('i','p','c','m'):
245  ret = ipcm_decoder_config(codec_config, pbc, len);
246  break;
247  default:
248  break;
249  }
250  if (ret < 0)
251  goto fail;
252 
253  if ((codec_config->nb_samples > INT_MAX) || codec_config->nb_samples <= 0 ||
254  (-codec_config->audio_roll_distance > INT_MAX / codec_config->nb_samples)) {
256  goto fail;
257  }
258 
259  c->codec_configs[c->nb_codec_configs++] = codec_config;
260 
261  len -= avio_tell(pbc);
262  if (len)
263  av_log(s, AV_LOG_WARNING, "Underread in codec_config_obu. %d bytes left at the end\n", len);
264 
265  ret = 0;
266 fail:
267  av_free(buf);
268  if (ret < 0) {
269  if (codec_config)
270  av_free(codec_config->extradata);
271  av_free(codec_config);
272  }
273  return ret;
274 }
275 
276 static int update_extradata(AVCodecParameters *codecpar)
277 {
278  GetBitContext gb;
279  PutBitContext pb;
280  int ret;
281 
282  switch(codecpar->codec_id) {
283  case AV_CODEC_ID_OPUS:
284  AV_WB8(codecpar->extradata + 9, codecpar->ch_layout.nb_channels);
285  AV_WL16(codecpar->extradata + 10, AV_RB16(codecpar->extradata + 10)); // Byte swap pre-skip
286  AV_WL32(codecpar->extradata + 12, AV_RB32(codecpar->extradata + 12)); // Byte swap sample rate
287  AV_WL16(codecpar->extradata + 16, AV_RB16(codecpar->extradata + 16)); // Byte swap Output Gain
288  break;
289  case AV_CODEC_ID_AAC: {
290  uint8_t buf[5];
291 
292  init_put_bits(&pb, buf, sizeof(buf));
293  ret = init_get_bits8(&gb, codecpar->extradata, codecpar->extradata_size);
294  if (ret < 0)
295  return ret;
296 
297  ret = get_bits(&gb, 5);
298  put_bits(&pb, 5, ret);
299  if (ret == AOT_ESCAPE) // violates section 3.11.2, but better check for it
300  put_bits(&pb, 6, get_bits(&gb, 6));
301  ret = get_bits(&gb, 4);
302  put_bits(&pb, 4, ret);
303  if (ret == 0x0f)
304  put_bits(&pb, 24, get_bits(&gb, 24));
305 
306  skip_bits(&gb, 4);
307  put_bits(&pb, 4, codecpar->ch_layout.nb_channels); // set channel config
308  ret = put_bits_left(&pb);
309  put_bits(&pb, ret, get_bits_long(&gb, ret));
310  flush_put_bits(&pb);
311 
312  memcpy(codecpar->extradata, buf, put_bytes_output(&pb));
313  break;
314  }
315  case AV_CODEC_ID_FLAC: {
316  uint8_t buf[13];
317 
318  init_put_bits(&pb, buf, sizeof(buf));
319  ret = init_get_bits8(&gb, codecpar->extradata, codecpar->extradata_size);
320  if (ret < 0)
321  return ret;
322 
323  put_bits32(&pb, get_bits_long(&gb, 32)); // min/max blocksize
324  put_bits64(&pb, 48, get_bits64(&gb, 48)); // min/max framesize
325  put_bits(&pb, 20, get_bits(&gb, 20)); // samplerate
326  skip_bits(&gb, 3);
327  put_bits(&pb, 3, codecpar->ch_layout.nb_channels - 1);
328  ret = put_bits_left(&pb);
329  put_bits(&pb, ret, get_bits(&gb, ret));
330  flush_put_bits(&pb);
331 
332  memcpy(codecpar->extradata, buf, sizeof(buf));
333  break;
334  }
335  }
336 
337  return 0;
338 }
339 
341  IAMFAudioElement *audio_element,
342  const IAMFCodecConfig *codec_config)
343 {
344  int nb_layers, k = 0;
345 
346  nb_layers = avio_r8(pb) >> 5; // get_bits(&gb, 3);
347  // skip_bits(&gb, 5); //reserved
348 
349  if (nb_layers > 6 || nb_layers == 0)
350  return AVERROR_INVALIDDATA;
351 
352  audio_element->layers = av_calloc(nb_layers, sizeof(*audio_element->layers));
353  if (!audio_element->layers)
354  return AVERROR(ENOMEM);
355 
356  audio_element->nb_layers = nb_layers;
357  for (int i = 0; i < nb_layers; i++) {
358  AVIAMFLayer *layer;
359  int loudspeaker_layout, output_gain_is_present_flag;
360  int substream_count, coupled_substream_count;
361  int ret, byte = avio_r8(pb);
362 
363  layer = av_iamf_audio_element_add_layer(audio_element->element);
364  if (!layer)
365  return AVERROR(ENOMEM);
366 
367  loudspeaker_layout = byte >> 4; // get_bits(&gb, 4);
368  output_gain_is_present_flag = (byte >> 3) & 1; //get_bits1(&gb);
369  if ((byte >> 2) & 1)
370  layer->flags |= AV_IAMF_LAYER_FLAG_RECON_GAIN;
371  substream_count = avio_r8(pb);
372  coupled_substream_count = avio_r8(pb);
373 
374  if (substream_count + k > audio_element->nb_substreams)
375  return AVERROR_INVALIDDATA;
376 
377  audio_element->layers[i].substream_count = substream_count;
378  audio_element->layers[i].coupled_substream_count = coupled_substream_count;
379  if (output_gain_is_present_flag) {
380  layer->output_gain_flags = avio_r8(pb) >> 2; // get_bits(&gb, 6);
381  layer->output_gain = av_make_q(sign_extend(avio_rb16(pb), 16), 1 << 8);
382  }
383 
384  if (loudspeaker_layout < 10)
385  av_channel_layout_copy(&layer->ch_layout, &ff_iamf_scalable_ch_layouts[loudspeaker_layout]);
386  else
388  .nb_channels = substream_count +
389  coupled_substream_count };
390 
391  for (int j = 0; j < substream_count; j++) {
392  IAMFSubStream *substream = &audio_element->substreams[k++];
393 
394  substream->codecpar->ch_layout = coupled_substream_count-- > 0 ? (AVChannelLayout)AV_CHANNEL_LAYOUT_STEREO :
396 
397  ret = update_extradata(substream->codecpar);
398  if (ret < 0)
399  return ret;
400  }
401 
402  }
403 
404  return 0;
405 }
406 
407 static int ambisonics_config(void *s, AVIOContext *pb,
408  IAMFAudioElement *audio_element,
409  const IAMFCodecConfig *codec_config)
410 {
411  AVIAMFLayer *layer;
412  unsigned ambisonics_mode;
413  int output_channel_count, substream_count, order;
414  int ret;
415 
416  ambisonics_mode = ffio_read_leb(pb);
417  if (ambisonics_mode > 1)
418  return 0;
419 
420  output_channel_count = avio_r8(pb); // C
421  substream_count = avio_r8(pb); // N
422  if (audio_element->nb_substreams != substream_count)
423  return AVERROR_INVALIDDATA;
424 
425  order = floor(sqrt(output_channel_count - 1));
426  /* incomplete order - some harmonics are missing */
427  if ((order + 1) * (order + 1) != output_channel_count)
428  return AVERROR_INVALIDDATA;
429 
430  audio_element->layers = av_mallocz(sizeof(*audio_element->layers));
431  if (!audio_element->layers)
432  return AVERROR(ENOMEM);
433 
434  audio_element->nb_layers = 1;
435  audio_element->layers->substream_count = substream_count;
436 
437  layer = av_iamf_audio_element_add_layer(audio_element->element);
438  if (!layer)
439  return AVERROR(ENOMEM);
440 
441  layer->ambisonics_mode = ambisonics_mode;
442  if (ambisonics_mode == 0) {
443  for (int i = 0; i < substream_count; i++) {
444  IAMFSubStream *substream = &audio_element->substreams[i];
445 
447 
448  ret = update_extradata(substream->codecpar);
449  if (ret < 0)
450  return ret;
451  }
452 
454  layer->ch_layout.nb_channels = output_channel_count;
455  layer->ch_layout.u.map = av_calloc(output_channel_count, sizeof(*layer->ch_layout.u.map));
456  if (!layer->ch_layout.u.map)
457  return AVERROR(ENOMEM);
458 
459  for (int i = 0; i < output_channel_count; i++)
460  layer->ch_layout.u.map[i].id = avio_r8(pb) + AV_CHAN_AMBISONIC_BASE;
461  } else {
462  int coupled_substream_count = avio_r8(pb); // M
463  int nb_demixing_matrix = substream_count + coupled_substream_count;
464  int demixing_matrix_size = nb_demixing_matrix * output_channel_count;
465 
466  audio_element->layers->coupled_substream_count = coupled_substream_count;
467 
468  layer->ch_layout = (AVChannelLayout){ .order = AV_CHANNEL_ORDER_AMBISONIC, .nb_channels = output_channel_count };
469  layer->demixing_matrix = av_malloc_array(demixing_matrix_size, sizeof(*layer->demixing_matrix));
470  if (!layer->demixing_matrix)
471  return AVERROR(ENOMEM);
472 
473  for (int i = 0; i < demixing_matrix_size; i++)
474  layer->demixing_matrix[i] = av_make_q(sign_extend(avio_rb16(pb), 16), 1 << 8);
475 
476  for (int i = 0; i < substream_count; i++) {
477  IAMFSubStream *substream = &audio_element->substreams[i];
478 
479  substream->codecpar->ch_layout = coupled_substream_count-- > 0 ? (AVChannelLayout)AV_CHANNEL_LAYOUT_STEREO :
481 
482 
483  ret = update_extradata(substream->codecpar);
484  if (ret < 0)
485  return ret;
486  }
487  }
488 
489  return 0;
490 }
491 
492 static int param_parse(void *s, IAMFContext *c, AVIOContext *pb,
493  unsigned int type,
494  const IAMFAudioElement *audio_element,
495  AVIAMFParamDefinition **out_param_definition)
496 {
498  AVIAMFParamDefinition *param;
499  unsigned int parameter_id, parameter_rate, mode;
500  unsigned int duration = 0, constant_subblock_duration = 0, nb_subblocks = 0;
501  size_t param_size;
502 
503  parameter_id = ffio_read_leb(pb);
504 
505  for (int i = 0; i < c->nb_param_definitions; i++)
506  if (c->param_definitions[i]->param->parameter_id == parameter_id) {
507  param_definition = c->param_definitions[i];
508  break;
509  }
510 
511  parameter_rate = ffio_read_leb(pb);
512  mode = avio_r8(pb) >> 7;
513 
514  if (mode == 0) {
515  duration = ffio_read_leb(pb);
516  if (!duration)
517  return AVERROR_INVALIDDATA;
518  constant_subblock_duration = ffio_read_leb(pb);
519  if (constant_subblock_duration == 0)
520  nb_subblocks = ffio_read_leb(pb);
521  else
522  nb_subblocks = duration / constant_subblock_duration;
523  }
524 
525  param = av_iamf_param_definition_alloc(type, nb_subblocks, &param_size);
526  if (!param)
527  return AVERROR(ENOMEM);
528 
529  for (int i = 0; i < nb_subblocks; i++) {
530  void *subblock = av_iamf_param_definition_get_subblock(param, i);
531  unsigned int subblock_duration = constant_subblock_duration;
532 
533  if (constant_subblock_duration == 0)
534  subblock_duration = ffio_read_leb(pb);
535 
536  switch (type) {
538  AVIAMFMixGain *mix = subblock;
539  mix->subblock_duration = subblock_duration;
540  break;
541  }
543  AVIAMFDemixingInfo *demix = subblock;
544  demix->subblock_duration = subblock_duration;
545  // DefaultDemixingInfoParameterData
546  av_assert0(audio_element);
547  demix->dmixp_mode = avio_r8(pb) >> 5;
548  audio_element->element->default_w = avio_r8(pb) >> 4;
549  break;
550  }
552  AVIAMFReconGain *recon = subblock;
553  recon->subblock_duration = subblock_duration;
554  break;
555  }
556  default:
557  av_free(param);
558  return AVERROR_INVALIDDATA;
559  }
560  }
561 
562  param->parameter_id = parameter_id;
563  param->parameter_rate = parameter_rate;
564  param->duration = duration;
565  param->constant_subblock_duration = constant_subblock_duration;
566  param->nb_subblocks = nb_subblocks;
567 
568  if (param_definition) {
569  if (param_definition->param_size != param_size || memcmp(param_definition->param, param, param_size)) {
570  av_log(s, AV_LOG_ERROR, "Incosistent parameters for parameter_id %u\n", parameter_id);
571  av_free(param);
572  return AVERROR_INVALIDDATA;
573  }
574  } else {
575  IAMFParamDefinition **tmp = av_realloc_array(c->param_definitions, c->nb_param_definitions + 1,
576  sizeof(*c->param_definitions));
577  if (!tmp) {
578  av_free(param);
579  return AVERROR(ENOMEM);
580  }
581  c->param_definitions = tmp;
582 
584  if (!param_definition) {
585  av_free(param);
586  return AVERROR(ENOMEM);
587  }
588  param_definition->param = param;
589  param_definition->mode = !mode;
590  param_definition->param_size = param_size;
591  param_definition->audio_element = audio_element;
592 
593  c->param_definitions[c->nb_param_definitions++] = param_definition;
594  }
595 
596  av_assert0(out_param_definition);
597  *out_param_definition = param;
598 
599  return 0;
600 }
601 
602 static int audio_element_obu(void *s, IAMFContext *c, AVIOContext *pb, int len)
603 {
604  const IAMFCodecConfig *codec_config;
605  AVIAMFAudioElement *element;
606  IAMFAudioElement **tmp, *audio_element = NULL;
607  FFIOContext b;
608  AVIOContext *pbc;
609  uint8_t *buf;
610  unsigned audio_element_id, nb_substreams, codec_config_id, num_parameters;
611  int audio_element_type, ret;
612 
613  buf = av_malloc(len);
614  if (!buf)
615  return AVERROR(ENOMEM);
616 
617  ret = avio_read(pb, buf, len);
618  if (ret != len) {
619  if (ret >= 0)
621  goto fail;
622  }
623 
624  ffio_init_context(&b, buf, len, 0, NULL, NULL, NULL, NULL);
625  pbc = &b.pub;
626 
627  audio_element_id = ffio_read_leb(pbc);
628 
629  for (int i = 0; i < c->nb_audio_elements; i++)
630  if (c->audio_elements[i]->audio_element_id == audio_element_id) {
631  av_log(s, AV_LOG_ERROR, "Duplicate audio_element_id %d\n", audio_element_id);
633  goto fail;
634  }
635 
636  audio_element_type = avio_r8(pbc) >> 5;
637  if (audio_element_type > AV_IAMF_AUDIO_ELEMENT_TYPE_SCENE) {
638  av_log(s, AV_LOG_DEBUG, "Unknown audio_element_type referenced in an audio element. Ignoring\n");
639  ret = 0;
640  goto fail;
641  }
642 
643  codec_config_id = ffio_read_leb(pbc);
644 
645  codec_config = ff_iamf_get_codec_config(c, codec_config_id);
646  if (!codec_config) {
647  av_log(s, AV_LOG_ERROR, "Non existant codec config id %d referenced in an audio element\n", codec_config_id);
649  goto fail;
650  }
651 
652  if (codec_config->codec_id == AV_CODEC_ID_NONE) {
653  av_log(s, AV_LOG_DEBUG, "Unknown codec id referenced in an audio element. Ignoring\n");
654  ret = 0;
655  goto fail;
656  }
657 
658  tmp = av_realloc_array(c->audio_elements, c->nb_audio_elements + 1, sizeof(*c->audio_elements));
659  if (!tmp) {
660  ret = AVERROR(ENOMEM);
661  goto fail;
662  }
663  c->audio_elements = tmp;
664 
665  audio_element = av_mallocz(sizeof(*audio_element));
666  if (!audio_element) {
667  ret = AVERROR(ENOMEM);
668  goto fail;
669  }
670 
671  nb_substreams = ffio_read_leb(pbc);
672  audio_element->codec_config_id = codec_config_id;
673  audio_element->audio_element_id = audio_element_id;
674  audio_element->substreams = av_calloc(nb_substreams, sizeof(*audio_element->substreams));
675  if (!audio_element->substreams) {
676  ret = AVERROR(ENOMEM);
677  goto fail;
678  }
679  audio_element->nb_substreams = nb_substreams;
680 
681  element = audio_element->element = av_iamf_audio_element_alloc();
682  if (!element) {
683  ret = AVERROR(ENOMEM);
684  goto fail;
685  }
686  audio_element->celement = element;
687 
688  element->audio_element_type = audio_element_type;
689 
690  for (int i = 0; i < audio_element->nb_substreams; i++) {
691  IAMFSubStream *substream = &audio_element->substreams[i];
692 
693  substream->codecpar = avcodec_parameters_alloc();
694  if (!substream->codecpar) {
695  ret = AVERROR(ENOMEM);
696  goto fail;
697  }
698 
699  substream->audio_substream_id = ffio_read_leb(pbc);
700 
701  substream->codecpar->codec_type = AVMEDIA_TYPE_AUDIO;
702  substream->codecpar->codec_id = codec_config->codec_id;
703  substream->codecpar->frame_size = codec_config->nb_samples;
704  substream->codecpar->sample_rate = codec_config->sample_rate;
705  substream->codecpar->seek_preroll = -codec_config->audio_roll_distance * codec_config->nb_samples;
706 
707  switch(substream->codecpar->codec_id) {
708  case AV_CODEC_ID_AAC:
709  case AV_CODEC_ID_FLAC:
710  case AV_CODEC_ID_OPUS:
712  if (!substream->codecpar->extradata) {
713  ret = AVERROR(ENOMEM);
714  goto fail;
715  }
716  memcpy(substream->codecpar->extradata, codec_config->extradata, codec_config->extradata_size);
717  memset(substream->codecpar->extradata + codec_config->extradata_size, 0, AV_INPUT_BUFFER_PADDING_SIZE);
718  substream->codecpar->extradata_size = codec_config->extradata_size;
719  break;
720  }
721  }
722 
723  num_parameters = ffio_read_leb(pbc);
724  if (num_parameters && audio_element_type != 0) {
725  av_log(s, AV_LOG_ERROR, "Audio Element parameter count %u is invalid"
726  " for Scene representations\n", num_parameters);
728  goto fail;
729  }
730 
731  for (int i = 0; i < num_parameters; i++) {
732  unsigned type;
733 
734  type = ffio_read_leb(pbc);
738  ret = param_parse(s, c, pbc, type, audio_element, &element->demixing_info);
740  ret = param_parse(s, c, pbc, type, audio_element, &element->recon_gain_info);
741  else {
742  unsigned param_definition_size = ffio_read_leb(pbc);
743  avio_skip(pbc, param_definition_size);
744  }
745  if (ret < 0)
746  goto fail;
747  }
748 
749  if (audio_element_type == AV_IAMF_AUDIO_ELEMENT_TYPE_CHANNEL) {
750  ret = scalable_channel_layout_config(s, pbc, audio_element, codec_config);
751  if (ret < 0)
752  goto fail;
753  } else if (audio_element_type == AV_IAMF_AUDIO_ELEMENT_TYPE_SCENE) {
754  ret = ambisonics_config(s, pbc, audio_element, codec_config);
755  if (ret < 0)
756  goto fail;
757  } else {
758  av_assert0(0);
759  }
760 
761  c->audio_elements[c->nb_audio_elements++] = audio_element;
762 
763  len -= avio_tell(pbc);
764  if (len)
765  av_log(s, AV_LOG_WARNING, "Underread in audio_element_obu. %d bytes left at the end\n", len);
766 
767  ret = 0;
768 fail:
769  av_free(buf);
770  if (ret < 0)
771  ff_iamf_free_audio_element(&audio_element);
772  return ret;
773 }
774 
775 static int label_string(AVIOContext *pb, char **label)
776 {
777  uint8_t buf[128];
778 
779  avio_get_str(pb, sizeof(buf), buf, sizeof(buf));
780 
781  if (pb->error)
782  return pb->error;
783  if (pb->eof_reached)
784  return AVERROR_INVALIDDATA;
785  *label = av_strdup(buf);
786  if (!*label)
787  return AVERROR(ENOMEM);
788 
789  return 0;
790 }
791 
792 static int mix_presentation_obu(void *s, IAMFContext *c, AVIOContext *pb, int len)
793 {
795  IAMFMixPresentation **tmp, *mix_presentation = NULL;
796  FFIOContext b;
797  AVIOContext *pbc;
798  uint8_t *buf;
799  unsigned nb_submixes, mix_presentation_id;
800  int ret;
801 
802  buf = av_malloc(len);
803  if (!buf)
804  return AVERROR(ENOMEM);
805 
806  ret = avio_read(pb, buf, len);
807  if (ret != len) {
808  if (ret >= 0)
810  goto fail;
811  }
812 
813  ffio_init_context(&b, buf, len, 0, NULL, NULL, NULL, NULL);
814  pbc = &b.pub;
815 
816  mix_presentation_id = ffio_read_leb(pbc);
817 
818  for (int i = 0; i < c->nb_mix_presentations; i++)
819  if (c->mix_presentations[i]->mix_presentation_id == mix_presentation_id) {
820  av_log(s, AV_LOG_ERROR, "Duplicate mix_presentation_id %d\n", mix_presentation_id);
822  goto fail;
823  }
824 
825  tmp = av_realloc_array(c->mix_presentations, c->nb_mix_presentations + 1, sizeof(*c->mix_presentations));
826  if (!tmp) {
827  ret = AVERROR(ENOMEM);
828  goto fail;
829  }
830  c->mix_presentations = tmp;
831 
832  mix_presentation = av_mallocz(sizeof(*mix_presentation));
833  if (!mix_presentation) {
834  ret = AVERROR(ENOMEM);
835  goto fail;
836  }
837 
838  mix_presentation->mix_presentation_id = mix_presentation_id;
839  mix = mix_presentation->mix = av_iamf_mix_presentation_alloc();
840  if (!mix) {
841  ret = AVERROR(ENOMEM);
842  goto fail;
843  }
844  mix_presentation->cmix = mix;
845 
846  mix_presentation->count_label = ffio_read_leb(pbc);
847  mix_presentation->language_label = av_calloc(mix_presentation->count_label,
848  sizeof(*mix_presentation->language_label));
849  if (!mix_presentation->language_label) {
850  ret = AVERROR(ENOMEM);
851  goto fail;
852  }
853 
854  for (int i = 0; i < mix_presentation->count_label; i++) {
855  ret = label_string(pbc, &mix_presentation->language_label[i]);
856  if (ret < 0)
857  goto fail;
858  }
859 
860  for (int i = 0; i < mix_presentation->count_label; i++) {
861  char *annotation = NULL;
862  ret = label_string(pbc, &annotation);
863  if (ret < 0)
864  goto fail;
865  ret = av_dict_set(&mix->annotations, mix_presentation->language_label[i], annotation,
867  if (ret < 0)
868  goto fail;
869  }
870 
871  nb_submixes = ffio_read_leb(pbc);
872  for (int i = 0; i < nb_submixes; i++) {
873  AVIAMFSubmix *sub_mix;
874  unsigned nb_elements, nb_layouts;
875 
877  if (!sub_mix) {
878  ret = AVERROR(ENOMEM);
879  goto fail;
880  }
881 
882  nb_elements = ffio_read_leb(pbc);
883  for (int j = 0; j < nb_elements; j++) {
884  AVIAMFSubmixElement *submix_element;
885  IAMFAudioElement *audio_element = NULL;
886  unsigned int rendering_config_extension_size;
887 
888  submix_element = av_iamf_submix_add_element(sub_mix);
889  if (!submix_element) {
890  ret = AVERROR(ENOMEM);
891  goto fail;
892  }
893 
894  submix_element->audio_element_id = ffio_read_leb(pbc);
895 
896  for (int k = 0; k < c->nb_audio_elements; k++)
897  if (c->audio_elements[k]->audio_element_id == submix_element->audio_element_id) {
898  audio_element = c->audio_elements[k];
899  break;
900  }
901 
902  if (!audio_element) {
903  av_log(s, AV_LOG_ERROR, "Invalid Audio Element with id %u referenced by Mix Parameters %u\n",
904  submix_element->audio_element_id, mix_presentation_id);
906  goto fail;
907  }
908 
909  for (int k = 0; k < mix_presentation->count_label; k++) {
910  char *annotation = NULL;
911  ret = label_string(pbc, &annotation);
912  if (ret < 0)
913  goto fail;
914  ret = av_dict_set(&submix_element->annotations, mix_presentation->language_label[k], annotation,
916  if (ret < 0)
917  goto fail;
918  }
919 
920  submix_element->headphones_rendering_mode = avio_r8(pbc) >> 6;
921 
922  rendering_config_extension_size = ffio_read_leb(pbc);
923  avio_skip(pbc, rendering_config_extension_size);
924 
926  NULL,
927  &submix_element->element_mix_config);
928  if (ret < 0)
929  goto fail;
930  submix_element->default_mix_gain = av_make_q(sign_extend(avio_rb16(pbc), 16), 1 << 8);
931  }
932 
934  if (ret < 0)
935  goto fail;
936  sub_mix->default_mix_gain = av_make_q(sign_extend(avio_rb16(pbc), 16), 1 << 8);
937 
938  nb_layouts = ffio_read_leb(pbc);
939  for (int j = 0; j < nb_layouts; j++) {
940  AVIAMFSubmixLayout *submix_layout;
941  int info_type;
942  int byte = avio_r8(pbc);
943 
944  submix_layout = av_iamf_submix_add_layout(sub_mix);
945  if (!submix_layout) {
946  ret = AVERROR(ENOMEM);
947  goto fail;
948  }
949 
950  submix_layout->layout_type = byte >> 6;
953  av_log(s, AV_LOG_ERROR, "Invalid Layout type %u in a submix from Mix Presentation %u\n",
954  submix_layout->layout_type, mix_presentation_id);
956  goto fail;
957  }
958  if (submix_layout->layout_type == 2) {
959  int sound_system;
960  sound_system = (byte >> 2) & 0xF;
961  if (sound_system >= FF_ARRAY_ELEMS(ff_iamf_sound_system_map)) {
963  goto fail;
964  }
965  av_channel_layout_copy(&submix_layout->sound_system, &ff_iamf_sound_system_map[sound_system].layout);
966  }
967 
968  info_type = avio_r8(pbc);
969  submix_layout->integrated_loudness = av_make_q(sign_extend(avio_rb16(pbc), 16), 1 << 8);
970  submix_layout->digital_peak = av_make_q(sign_extend(avio_rb16(pbc), 16), 1 << 8);
971 
972  if (info_type & 1)
973  submix_layout->true_peak = av_make_q(sign_extend(avio_rb16(pbc), 16), 1 << 8);
974  if (info_type & 2) {
975  unsigned int num_anchored_loudness = avio_r8(pbc);
976 
977  for (int k = 0; k < num_anchored_loudness; k++) {
978  unsigned int anchor_element = avio_r8(pbc);
979  AVRational anchored_loudness = av_make_q(sign_extend(avio_rb16(pbc), 16), 1 << 8);
980  if (anchor_element == IAMF_ANCHOR_ELEMENT_DIALOGUE)
981  submix_layout->dialogue_anchored_loudness = anchored_loudness;
982  else if (anchor_element <= IAMF_ANCHOR_ELEMENT_ALBUM)
983  submix_layout->album_anchored_loudness = anchored_loudness;
984  else
985  av_log(s, AV_LOG_DEBUG, "Unknown anchor_element. Ignoring\n");
986  }
987  }
988 
989  if (info_type & 0xFC) {
990  unsigned int info_type_size = ffio_read_leb(pbc);
991  avio_skip(pbc, info_type_size);
992  }
993  }
994  }
995 
996  c->mix_presentations[c->nb_mix_presentations++] = mix_presentation;
997 
998  len -= avio_tell(pbc);
999  if (len)
1000  av_log(s, AV_LOG_WARNING, "Underread in mix_presentation_obu. %d bytes left at the end\n", len);
1001 
1002  ret = 0;
1003 fail:
1004  av_free(buf);
1005  if (ret < 0)
1006  ff_iamf_free_mix_presentation(&mix_presentation);
1007  return ret;
1008 }
1009 
1010 int ff_iamf_parse_obu_header(const uint8_t *buf, int buf_size,
1011  unsigned *obu_size, int *start_pos, enum IAMF_OBU_Type *type,
1012  unsigned *skip_samples, unsigned *discard_padding)
1013 {
1014  GetBitContext gb;
1015  int ret, extension_flag, trimming, start;
1016  unsigned skip = 0, discard = 0;
1017  unsigned size;
1018 
1019  ret = init_get_bits8(&gb, buf, FFMIN(buf_size, MAX_IAMF_OBU_HEADER_SIZE));
1020  if (ret < 0)
1021  return ret;
1022 
1023  *type = get_bits(&gb, 5);
1024  /*redundant =*/ get_bits1(&gb);
1025  trimming = get_bits1(&gb);
1026  extension_flag = get_bits1(&gb);
1027 
1028  *obu_size = get_leb(&gb);
1029  if (*obu_size > INT_MAX)
1030  return AVERROR_INVALIDDATA;
1031 
1032  start = get_bits_count(&gb) / 8;
1033 
1034  if (trimming) {
1035  discard = get_leb(&gb); // num_samples_to_trim_at_end
1036  skip = get_leb(&gb); // num_samples_to_trim_at_start
1037  }
1038 
1039  if (skip_samples)
1040  *skip_samples = skip;
1041  if (discard_padding)
1042  *discard_padding = discard;
1043 
1044  if (extension_flag) {
1045  unsigned int extension_bytes;
1046  extension_bytes = get_leb(&gb);
1047  if (extension_bytes > INT_MAX / 8)
1048  return AVERROR_INVALIDDATA;
1049  skip_bits_long(&gb, extension_bytes * 8);
1050  }
1051 
1052  if (get_bits_left(&gb) < 0)
1053  return AVERROR_INVALIDDATA;
1054 
1055  size = *obu_size + start;
1056  if (size > INT_MAX)
1057  return AVERROR_INVALIDDATA;
1058 
1059  *obu_size -= get_bits_count(&gb) / 8 - start;
1060  *start_pos = size - *obu_size;
1061 
1062  return size;
1063 }
1064 
1066  int max_size, void *log_ctx)
1067 {
1069  int ret;
1070 
1071  while (1) {
1072  unsigned obu_size;
1073  enum IAMF_OBU_Type type;
1074  int start_pos, len, size;
1075 
1076  if ((ret = ffio_ensure_seekback(pb, FFMIN(MAX_IAMF_OBU_HEADER_SIZE, max_size))) < 0)
1077  return ret;
1078  size = avio_read(pb, header, FFMIN(MAX_IAMF_OBU_HEADER_SIZE, max_size));
1079  if (size < 0)
1080  return size;
1082 
1083  len = ff_iamf_parse_obu_header(header, size, &obu_size, &start_pos, &type, NULL, NULL);
1084  if (len < 0 || obu_size > max_size) {
1085  av_log(log_ctx, AV_LOG_ERROR, "Failed to read obu header\n");
1086  avio_seek(pb, -size, SEEK_CUR);
1087  return len;
1088  }
1089 
1091  avio_seek(pb, -size, SEEK_CUR);
1092  break;
1093  }
1094 
1095  avio_seek(pb, -(size - start_pos), SEEK_CUR);
1096  switch (type) {
1098  ret = codec_config_obu(log_ctx, c, pb, obu_size);
1099  break;
1101  ret = audio_element_obu(log_ctx, c, pb, obu_size);
1102  break;
1104  ret = mix_presentation_obu(log_ctx, c, pb, obu_size);
1105  break;
1106  default: {
1107  int64_t offset = avio_skip(pb, obu_size);
1108  if (offset < 0)
1109  ret = offset;
1110  break;
1111  }
1112  }
1113  if (ret < 0) {
1114  av_log(log_ctx, AV_LOG_ERROR, "Failed to read obu type %d\n", type);
1115  return ret;
1116  }
1117  max_size -= obu_size + start_pos;
1118  if (max_size < 0)
1119  return AVERROR_INVALIDDATA;
1120  if (!max_size)
1121  break;
1122  }
1123 
1124  return 0;
1125 }
update_extradata
static int update_extradata(AVCodecParameters *codecpar)
Definition: iamf_parse.c:276
AV_CODEC_ID_PCM_S16LE
@ AV_CODEC_ID_PCM_S16LE
Definition: codec_id.h:328
iamf.h
ff_iamf_free_mix_presentation
void ff_iamf_free_mix_presentation(IAMFMixPresentation **pmix_presentation)
Definition: iamf.c:85
skip_bits_long
static void skip_bits_long(GetBitContext *s, int n)
Skips the specified number of bits.
Definition: get_bits.h:278
AV_IAMF_SUBMIX_LAYOUT_TYPE_LOUDSPEAKERS
@ AV_IAMF_SUBMIX_LAYOUT_TYPE_LOUDSPEAKERS
The layout follows the loudspeaker sound system convention of ITU-2051-3.
Definition: iamf.h:497
AV_LOG_WARNING
#define AV_LOG_WARNING
Something somehow does not look correct.
Definition: log.h:186
AVCodecParameters::extradata
uint8_t * extradata
Extra binary data needed for initializing the decoder, codec-dependent.
Definition: codec_par.h:69
MP4DecConfigDescrTag
#define MP4DecConfigDescrTag
Definition: isom.h:369
ffio_init_context
void ffio_init_context(FFIOContext *s, unsigned char *buffer, int buffer_size, int write_flag, void *opaque, int(*read_packet)(void *opaque, uint8_t *buf, int buf_size), int(*write_packet)(void *opaque, const uint8_t *buf, int buf_size), int64_t(*seek)(void *opaque, int64_t offset, int whence))
Definition: aviobuf.c:49
mix
static int mix(int c0, int c1)
Definition: 4xm.c:715
get_bits_left
static int get_bits_left(GetBitContext *gb)
Definition: get_bits.h:695
AVERROR
Filter the word “frame” indicates either a video frame or a group of audio as stored in an AVFrame structure Format for each input and each output the list of supported formats For video that means pixel format For audio that means channel sample they are references to shared objects When the negotiation mechanism computes the intersection of the formats supported at each end of a all references to both lists are replaced with a reference to the intersection And when a single format is eventually chosen for a link amongst the remaining all references to the list are updated That means that if a filter requires that its input and output have the same format amongst a supported all it has to do is use a reference to the same list of formats query_formats can leave some formats unset and return AVERROR(EAGAIN) to cause the negotiation mechanism toagain later. That can be used by filters with complex requirements to use the format negotiated on one link to set the formats supported on another. Frame references ownership and permissions
put_bits32
static void av_unused put_bits32(PutBitContext *s, uint32_t value)
Write exactly 32 bits into a bitstream.
Definition: put_bits.h:291
AVCodecParameters::codec_type
enum AVMediaType codec_type
General type of the encoded data.
Definition: codec_par.h:51
AVChannelLayout::u
union AVChannelLayout::@352 u
Details about which channels are present in this layout.
AV_WL32
#define AV_WL32(p, v)
Definition: intreadwrite.h:424
AV_CHANNEL_LAYOUT_STEREO
#define AV_CHANNEL_LAYOUT_STEREO
Definition: channel_layout.h:379
put_bytes_output
static int put_bytes_output(const PutBitContext *s)
Definition: put_bits.h:89
IAMF_OBU_IA_SEQUENCE_HEADER
@ IAMF_OBU_IA_SEQUENCE_HEADER
Definition: iamf.h:63
ff_mp4_obj_type
const AVCodecTag ff_mp4_obj_type[]
Definition: isom.c:34
AVCodecParameters
This struct describes the properties of an encoded stream.
Definition: codec_par.h:47
AVIAMFAudioElement::default_w
unsigned int default_w
Default weight value as defined in section 3.6 of IAMF.
Definition: iamf.h:393
IAMFAudioElement::nb_substreams
unsigned int nb_substreams
Definition: iamf.h:99
av_iamf_param_definition_alloc
AVIAMFParamDefinition * av_iamf_param_definition_alloc(enum AVIAMFParamDefinitionType type, unsigned int nb_subblocks, size_t *out_size)
Allocates memory for AVIAMFParamDefinition, plus an array of nb_subblocks subblocks of the given type.
Definition: iamf.c:159
get_bits_long
static unsigned int get_bits_long(GetBitContext *s, int n)
Read 0-32 bits.
Definition: get_bits.h:421
int64_t
long long int64_t
Definition: coverity.c:34
init_put_bits
static void init_put_bits(PutBitContext *s, uint8_t *buffer, int buffer_size)
Initialize the PutBitContext s.
Definition: put_bits.h:62
get_bits_count
static int get_bits_count(const GetBitContext *s)
Definition: get_bits.h:266
AVChannelLayout::map
AVChannelCustom * map
This member must be used when the channel order is AV_CHANNEL_ORDER_CUSTOM.
Definition: channel_layout.h:354
put_bits
static void put_bits(Jpeg2000EncoderContext *s, int val, int n)
Put the bit val n times.
Definition: j2kenc.c:222
tmp
static uint8_t tmp[11]
Definition: aes_ctr.c:28
ff_iamf_sound_system_map
const struct IAMFSoundSystemMap ff_iamf_sound_system_map[13]
Definition: iamf.c:48
put_bits64
static void put_bits64(PutBitContext *s, int n, uint64_t value)
Write up to 64 bits into a bitstream.
Definition: put_bits.h:334
AVCodecParameters::seek_preroll
int seek_preroll
Audio only.
Definition: codec_par.h:214
b
#define b
Definition: input.c:41
AVIOContext::error
int error
contains the error code or 0 if no error happened
Definition: avio.h:239
AVIAMFSubmixLayout::layout_type
enum AVIAMFSubmixLayoutType layout_type
Definition: iamf.h:513
AVIAMFParamDefinition
Parameters as defined in section 3.6.1 of IAMF.
Definition: iamf.h:193
AVIAMFSubmixElement::default_mix_gain
AVRational default_mix_gain
Default mix gain value to apply when there are no AVIAMFParamDefinition with element_mix_config's par...
Definition: iamf.h:469
AV_CODEC_ID_FLAC
@ AV_CODEC_ID_FLAC
Definition: codec_id.h:452
AVChannelLayout::order
enum AVChannelOrder order
Channel order used in this layout.
Definition: channel_layout.h:308
iamf_parse.h
ambisonics_config
static int ambisonics_config(void *s, AVIOContext *pb, IAMFAudioElement *audio_element, const IAMFCodecConfig *codec_config)
Definition: iamf_parse.c:407
AVChannelLayout::nb_channels
int nb_channels
Number of channels in this layout.
Definition: channel_layout.h:313
FFIOContext
Definition: avio_internal.h:28
flac_decoder_config
static int flac_decoder_config(IAMFCodecConfig *codec_config, AVIOContext *pb, int len)
Definition: iamf_parse.c:117
av_malloc
#define av_malloc(s)
Definition: tableprint_vlc.h:30
IAMFMixPresentation::cmix
const AVIAMFMixPresentation * cmix
Definition: iamf.h:108
MPEG4AudioConfig
Definition: mpeg4audio.h:29
AVIAMFSubmixLayout::digital_peak
AVRational digital_peak
The digital (sampled) peak value of the audio signal, as defined in ITU-1770-4.
Definition: iamf.h:531
skip_bits
static void skip_bits(GetBitContext *s, int n)
Definition: get_bits.h:381
get_bits
static unsigned int get_bits(GetBitContext *s, int n)
Read 1-25 bits.
Definition: get_bits.h:335
mpeg4audio.h
AVIAMFSubmixLayout::integrated_loudness
AVRational integrated_loudness
The program integrated loudness information, as defined in ITU-1770-4.
Definition: iamf.h:526
av_iamf_mix_presentation_add_submix
AVIAMFSubmix * av_iamf_mix_presentation_add_submix(AVIAMFMixPresentation *mix_presentation)
Allocate a submix and add it to a given AVIAMFMixPresentation.
IAMFCodecConfig::extradata
uint8_t * extradata
Definition: iamf.h:74
MP4DecSpecificDescrTag
#define MP4DecSpecificDescrTag
Definition: isom.h:370
AOT_ESCAPE
@ AOT_ESCAPE
Y Escape Value.
Definition: mpeg4audio.h:100
AV_CODEC_ID_PCM_S16BE
@ AV_CODEC_ID_PCM_S16BE
Definition: codec_id.h:329
IAMFParamDefinition
Definition: iamf.h:121
fail
#define fail()
Definition: checkasm.h:179
GetBitContext
Definition: get_bits.h:108
AVIAMFSubmixLayout
Submix layout as defined in section 3.7.6 of IAMF.
Definition: iamf.h:510
IAMF_ANCHOR_ELEMENT_ALBUM
@ IAMF_ANCHOR_ELEMENT_ALBUM
Definition: iamf.h:142
put_bits_left
static int put_bits_left(PutBitContext *s)
Definition: put_bits.h:125
avio_tell
static av_always_inline int64_t avio_tell(AVIOContext *s)
ftell() equivalent for AVIOContext.
Definition: avio.h:494
av_iamf_audio_element_alloc
AVIAMFAudioElement * av_iamf_audio_element_alloc(void)
Allocates an AVIAMFAudioElement, and initializes its fields with default values.
Definition: iamf.c:322
type
it s the only field you need to keep assuming you have a context There is some magic you don t need to care about around this just let it vf type
Definition: writing_filters.txt:86
IAMF_OBU_IA_PARAMETER_BLOCK
@ IAMF_OBU_IA_PARAMETER_BLOCK
Definition: iamf.h:41
AVIAMFAudioElement::audio_element_type
enum AVIAMFAudioElementType audio_element_type
Audio element type as defined in section 3.6 of IAMF.
Definition: iamf.h:388
opus_decoder_config
static int opus_decoder_config(IAMFCodecConfig *codec_config, AVIOContext *pb, int len)
Definition: iamf_parse.c:36
AVIAMFReconGain
Recon Gain Info Parameter Data as defined in section 3.8.3 of IAMF.
Definition: iamf.h:148
param_parse
static int param_parse(void *s, IAMFContext *c, AVIOContext *pb, unsigned int type, const IAMFAudioElement *audio_element, AVIAMFParamDefinition **out_param_definition)
Definition: iamf_parse.c:492
codec_config_obu
static int codec_config_obu(void *s, IAMFContext *c, AVIOContext *pb, int len)
Definition: iamf_parse.c:165
AV_DICT_DONT_STRDUP_VAL
#define AV_DICT_DONT_STRDUP_VAL
Take ownership of a value that's been allocated with av_malloc() or another memory allocation functio...
Definition: dict.h:79
IAMFAudioElement::element
AVIAMFAudioElement * element
element backs celement iff the AVIAMFAudioElement is owned by this structure.
Definition: iamf.h:95
AV_IAMF_PARAMETER_DEFINITION_RECON_GAIN
@ AV_IAMF_PARAMETER_DEFINITION_RECON_GAIN
Subblocks are of struct type AVIAMFReconGain.
Definition: iamf.h:181
AVIAMFSubmixElement::annotations
AVDictionary * annotations
A dictionary of strings describing the submix in different languages.
Definition: iamf.h:490
avassert.h
avio_rb32
unsigned int avio_rb32(AVIOContext *s)
Definition: aviobuf.c:760
AV_LOG_ERROR
#define AV_LOG_ERROR
Something went wrong and cannot losslessly be recovered.
Definition: log.h:180
FF_ARRAY_ELEMS
#define FF_ARRAY_ELEMS(a)
Definition: sinewin_tablegen.c:29
init_get_bits8
static int init_get_bits8(GetBitContext *s, const uint8_t *buffer, int byte_size)
Initialize GetBitContext.
Definition: get_bits.h:545
IAMFCodecConfig::sample_rate
int sample_rate
Definition: iamf.h:72
IAMF_OBU_IA_MIX_PRESENTATION
@ IAMF_OBU_IA_MIX_PRESENTATION
Definition: iamf.h:40
duration
int64_t duration
Definition: movenc.c:64
AVCodecParameters::frame_size
int frame_size
Audio only.
Definition: codec_par.h:195
av_iamf_submix_add_layout
AVIAMFSubmixLayout * av_iamf_submix_add_layout(AVIAMFSubmix *submix)
Allocate a submix layout and add it to a given AVIAMFSubmix.
avpriv_mpeg4audio_get_config2
int avpriv_mpeg4audio_get_config2(MPEG4AudioConfig *c, const uint8_t *buf, int size, int sync_extension, void *logctx)
Parse MPEG-4 systems extradata from a raw buffer to retrieve audio configuration.
Definition: mpeg4audio.c:165
intreadwrite.h
s
#define s(width, name)
Definition: cbs_vp9.c:198
IAMFSubStream::audio_substream_id
unsigned int audio_substream_id
Definition: iamf.h:83
IAMFLayer::substream_count
unsigned int substream_count
Definition: iamf.h:78
AVIAMFSubmixLayout::dialogue_anchored_loudness
AVRational dialogue_anchored_loudness
The Dialogue loudness information, as defined in ITU-1770-4.
Definition: iamf.h:539
av_realloc_array
void * av_realloc_array(void *ptr, size_t nmemb, size_t size)
Definition: mem.c:215
floor
static __device__ float floor(float a)
Definition: cuda_runtime.h:173
AVMEDIA_TYPE_AUDIO
@ AVMEDIA_TYPE_AUDIO
Definition: avutil.h:202
av_iamf_param_definition_get_subblock
static av_always_inline void * av_iamf_param_definition_get_subblock(const AVIAMFParamDefinition *par, unsigned int idx)
Get the subblock at the specified index.
Definition: iamf.h:260
AV_CHANNEL_ORDER_UNSPEC
@ AV_CHANNEL_ORDER_UNSPEC
Only the channel count is specified, without any further information about the channel order.
Definition: channel_layout.h:112
av_assert0
#define av_assert0(cond)
assert() equivalent, that is always enabled.
Definition: avassert.h:40
AVIAMFSubmixElement::headphones_rendering_mode
enum AVIAMFHeadphonesMode headphones_rendering_mode
A value that indicates whether the referenced channel-based Audio Element shall be rendered to stereo...
Definition: iamf.h:478
ffio_read_leb
unsigned int ffio_read_leb(AVIOContext *s)
Read an unsigned integer coded as a variable number of up to eight little-endian bytes,...
Definition: aviobuf.c:926
AV_LOG_DEBUG
#define AV_LOG_DEBUG
Stuff which is only useful for libav* developers.
Definition: log.h:201
get_bits.h
AVIAMFLayer::ch_layout
AVChannelLayout ch_layout
Definition: iamf.h:297
IAMFAudioElement::nb_layers
unsigned int nb_layers
Definition: iamf.h:104
ff_iamfdec_read_descriptors
int ff_iamfdec_read_descriptors(IAMFContext *c, AVIOContext *pb, int max_size, void *log_ctx)
Definition: iamf_parse.c:1065
codec_id
enum AVCodecID codec_id
Definition: vaapi_decode.c:387
PutBitContext
Definition: put_bits.h:50
IAMFAudioElement::audio_element_id
unsigned int audio_element_id
Definition: iamf.h:96
AVIAMFDemixingInfo
Demixing Info Parameter Data as defined in section 3.8.2 of IAMF.
Definition: iamf.h:128
IAMFSoundSystemMap::layout
AVChannelLayout layout
Definition: iamf.h:163
AV_CHANNEL_ORDER_AMBISONIC
@ AV_CHANNEL_ORDER_AMBISONIC
The audio is represented as the decomposition of the sound field into spherical harmonics.
Definition: channel_layout.h:148
NULL
#define NULL
Definition: coverity.c:32
get_leb
static unsigned get_leb(GetBitContext *s)
Read an unsigned integer coded as a variable number of up to eight little-endian bytes,...
Definition: leb.h:35
isom.h
IAMF_OBU_IA_AUDIO_ELEMENT
@ IAMF_OBU_IA_AUDIO_ELEMENT
Definition: iamf.h:39
AVRational
Rational number (pair of numerator and denominator).
Definition: rational.h:58
AVIAMFParamDefinition::duration
unsigned int duration
The accumulated duration of all blocks in this parameter definition, in units of 1 / parameter_rate.
Definition: iamf.h:231
ff_iamf_get_codec_config
static IAMFCodecConfig * ff_iamf_get_codec_config(const IAMFContext *c, unsigned int codec_config_id)
Definition: iamf.h:170
get_bits1
static unsigned int get_bits1(GetBitContext *s)
Definition: get_bits.h:388
audio_element_obu
static int audio_element_obu(void *s, IAMFContext *c, AVIOContext *pb, int len)
Definition: iamf_parse.c:602
AVIAMFLayer
A layer defining a Channel Layout in the Audio Element.
Definition: iamf.h:294
IAMF_OBU_IA_CODEC_CONFIG
@ IAMF_OBU_IA_CODEC_CONFIG
Definition: iamf.h:38
IAMFSubStream
Definition: iamf.h:82
IAMFAudioElement::layers
IAMFLayer * layers
Definition: iamf.h:103
FLAC_STREAMINFO_SIZE
#define FLAC_STREAMINFO_SIZE
Definition: flac.h:32
AV_DICT_DONT_OVERWRITE
#define AV_DICT_DONT_OVERWRITE
Don't overwrite existing entries.
Definition: dict.h:81
AVCodecParameters::ch_layout
AVChannelLayout ch_layout
Audio only.
Definition: codec_par.h:180
IAMFAudioElement::celement
const AVIAMFAudioElement * celement
Definition: iamf.h:90
c
Undefined Behavior In the C some operations are like signed integer dereferencing freed accessing outside allocated Undefined Behavior must not occur in a C it is not safe even if the output of undefined operations is unused The unsafety may seem nit picking but Optimizing compilers have in fact optimized code on the assumption that no undefined Behavior occurs Optimizing code based on wrong assumptions can and has in some cases lead to effects beyond the output of computations The signed integer overflow problem in speed critical code Code which is highly optimized and works with signed integers sometimes has the problem that often the output of the computation does not c
Definition: undefined.txt:32
ff_mp4_read_descr
int ff_mp4_read_descr(void *logctx, AVIOContext *pb, int *tag)
Definition: isom.c:295
AVCodecParameters::sample_rate
int sample_rate
Audio only.
Definition: codec_par.h:184
ff_iamf_parse_obu_header
int ff_iamf_parse_obu_header(const uint8_t *buf, int buf_size, unsigned *obu_size, int *start_pos, enum IAMF_OBU_Type *type, unsigned *skip_samples, unsigned *discard_padding)
Definition: iamf_parse.c:1010
AVIAMFLayer::output_gain_flags
unsigned int output_gain_flags
Output gain channel flags as defined in section 3.6.2 of IAMF.
Definition: iamf.h:310
AVCodecID
AVCodecID
Identify the syntax and semantics of the bitstream.
Definition: codec_id.h:49
AVIAMFSubmixElement::audio_element_id
unsigned int audio_element_id
The id of the Audio Element this submix element references.
Definition: iamf.h:452
AVCodecParameters::extradata_size
int extradata_size
Size of the extradata content in bytes.
Definition: codec_par.h:73
AVIAMFSubmix
Submix layout as defined in section 3.7 of IAMF.
Definition: iamf.h:552
AV_WB32
#define AV_WB32(p, v)
Definition: intreadwrite.h:417
AV_CODEC_ID_AAC
@ AV_CODEC_ID_AAC
Definition: codec_id.h:442
IAMFAudioElement
Definition: iamf.h:89
AVIAMFReconGain::subblock_duration
unsigned int subblock_duration
Duration for the given subblock, in units of 1 / parameter_rate.
Definition: iamf.h:156
AVIOContext
Bytestream IO Context.
Definition: avio.h:160
IAMFCodecConfig::nb_samples
unsigned nb_samples
Definition: iamf.h:70
AV_CODEC_ID_PCM_S24LE
@ AV_CODEC_ID_PCM_S24LE
Definition: codec_id.h:340
AVIAMFDemixingInfo::subblock_duration
unsigned int subblock_duration
Duration for the given subblock, in units of 1 / parameter_rate.
Definition: iamf.h:136
ff_codec_get_id
enum AVCodecID ff_codec_get_id(const AVCodecTag *tags, unsigned int tag)
Definition: utils.c:145
IAMFCodecConfig
Definition: iamf.h:66
AVChannelLayout
An AVChannelLayout holds information about the channel layout of audio data.
Definition: channel_layout.h:303
IAMFCodecConfig::extradata_size
int extradata_size
Definition: iamf.h:73
avio_get_str
int avio_get_str(AVIOContext *pb, int maxlen, char *buf, int buflen)
Read a string from pb into buf.
Definition: aviobuf.c:865
size
int size
Definition: twinvq_data.h:10344
av_make_q
static AVRational av_make_q(int num, int den)
Create an AVRational.
Definition: rational.h:71
IAMFLayer::coupled_substream_count
unsigned int coupled_substream_count
Definition: iamf.h:79
MKBETAG
#define MKBETAG(a, b, c, d)
Definition: macros.h:56
AV_RB32
uint64_t_TMPL AV_WL64 unsigned int_TMPL AV_WL32 unsigned int_TMPL AV_WL24 unsigned int_TMPL AV_WL16 uint64_t_TMPL AV_WB64 unsigned int_TMPL AV_RB32
Definition: bytestream.h:96
AV_CODEC_ID_OPUS
@ AV_CODEC_ID_OPUS
Definition: codec_id.h:500
av_iamf_mix_presentation_alloc
AVIAMFMixPresentation * av_iamf_mix_presentation_alloc(void)
Allocates an AVIAMFMixPresentation, and initializes its fields with default values.
Definition: iamf.c:520
IAMFContext
Definition: iamf.h:128
header
static const uint8_t header[24]
Definition: sdr2.c:68
AV_WL16
#define AV_WL16(p, v)
Definition: intreadwrite.h:410
avio_r8
int avio_r8(AVIOContext *s)
Definition: aviobuf.c:602
IAMFAudioElement::substreams
IAMFSubStream * substreams
Definition: iamf.h:98
AVIAMFParamDefinition::constant_subblock_duration
unsigned int constant_subblock_duration
The duration of every subblock in the case where all subblocks, with the optional exception of the la...
Definition: iamf.h:238
av_iamf_submix_add_element
AVIAMFSubmixElement * av_iamf_submix_add_element(AVIAMFSubmix *submix)
Allocate a submix element and add it to a given AVIAMFSubmix.
AVIAMFAudioElement
Information on how to combine one or more audio streams, as defined in section 3.6 of IAMF.
Definition: iamf.h:356
ipcm_decoder_config
static int ipcm_decoder_config(IAMFCodecConfig *codec_config, AVIOContext *pb, int len)
Definition: iamf_parse.c:144
ffio_ensure_seekback
int ffio_ensure_seekback(AVIOContext *s, int64_t buf_size)
Ensures that the requested seekback buffer size will be available.
Definition: aviobuf.c:1022
offset
it s the only field you need to keep assuming you have a context There is some magic you don t need to care about around this just let it vf offset
Definition: writing_filters.txt:86
AVIAMFMixGain
Mix Gain Parameter Data as defined in section 3.8.1 of IAMF.
Definition: iamf.h:77
leb.h
avcodec_parameters_alloc
AVCodecParameters * avcodec_parameters_alloc(void)
Allocate a new AVCodecParameters and set its fields to default values (unknown/invalid/0).
Definition: codec_par.c:56
get_bits64
static uint64_t get_bits64(GetBitContext *s, int n)
Read 0-64 bits.
Definition: get_bits.h:453
log.h
AV_CODEC_ID_NONE
@ AV_CODEC_ID_NONE
Definition: codec_id.h:50
i
#define i(width, name, range_min, range_max)
Definition: cbs_h2645.c:255
AVIAMFParamDefinition::parameter_id
unsigned int parameter_id
Identifier for the parameter substream.
Definition: iamf.h:218
avio_internal.h
AVIAMFLayer::demixing_matrix
AVRational * demixing_matrix
Demixing matrix as defined in section 3.6.3 of IAMF.
Definition: iamf.h:340
av_malloc_array
#define av_malloc_array(a, b)
Definition: tableprint_vlc.h:31
AVIAMFMixPresentation
Information on how to render and mix one or more AVIAMFAudioElement to generate the final audio outpu...
Definition: iamf.h:609
common.h
aac_decoder_config
static int aac_decoder_config(IAMFCodecConfig *codec_config, AVIOContext *pb, int len, void *logctx)
Definition: iamf_parse.c:60
FFMIN
#define FFMIN(a, b)
Definition: macros.h:49
param_definition
static int param_definition(const IAMFContext *iamf, const IAMFParamDefinition *param_def, AVIOContext *dyn_bc, void *log_ctx)
Definition: iamf_writer.c:586
AV_CODEC_ID_PCM_S32BE
@ AV_CODEC_ID_PCM_S32BE
Definition: codec_id.h:337
av_mallocz
void * av_mallocz(size_t size)
Allocate a memory block with alignment suitable for all memory accesses (including vectors if availab...
Definition: mem.c:254
len
int len
Definition: vorbis_enc_data.h:426
IAMFMixPresentation::count_label
unsigned int count_label
Definition: iamf.h:117
av_calloc
void * av_calloc(size_t nmemb, size_t size)
Definition: mem.c:262
AVIAMFParamDefinition::nb_subblocks
unsigned int nb_subblocks
Number of subblocks in the array.
Definition: iamf.h:208
AV_IAMF_AUDIO_ELEMENT_TYPE_SCENE
@ AV_IAMF_AUDIO_ELEMENT_TYPE_SCENE
Definition: iamf.h:346
AV_WB8
#define AV_WB8(p, d)
Definition: intreadwrite.h:394
tag
uint32_t tag
Definition: movenc.c:1791
ret
ret
Definition: filter_design.txt:187
avio_seek
int64_t avio_seek(AVIOContext *s, int64_t offset, int whence)
fseek() equivalent for AVIOContext.
Definition: aviobuf.c:230
ff_iamf_free_audio_element
void ff_iamf_free_audio_element(IAMFAudioElement **paudio_element)
Definition: iamf.c:70
avio_rb16
unsigned int avio_rb16(AVIOContext *s)
Definition: aviobuf.c:745
AV_INPUT_BUFFER_PADDING_SIZE
#define AV_INPUT_BUFFER_PADDING_SIZE
Definition: defs.h:40
left
Tag MUST be and< 10hcoeff half pel interpolation filter coefficients, hcoeff[0] are the 2 middle coefficients[1] are the next outer ones and so on, resulting in a filter like:...eff[2], hcoeff[1], hcoeff[0], hcoeff[0], hcoeff[1], hcoeff[2] ... the sign of the coefficients is not explicitly stored but alternates after each coeff and coeff[0] is positive, so ...,+,-,+,-,+,+,-,+,-,+,... hcoeff[0] is not explicitly stored but found by subtracting the sum of all stored coefficients with signs from 32 hcoeff[0]=32 - hcoeff[1] - hcoeff[2] - ... a good choice for hcoeff and htaps is htaps=6 hcoeff={40,-10, 2} an alternative which requires more computations at both encoder and decoder side and may or may not be better is htaps=8 hcoeff={42,-14, 6,-2}ref_frames minimum of the number of available reference frames and max_ref_frames for example the first frame after a key frame always has ref_frames=1spatial_decomposition_type wavelet type 0 is a 9/7 symmetric compact integer wavelet 1 is a 5/3 symmetric compact integer wavelet others are reserved stored as delta from last, last is reset to 0 if always_reset||keyframeqlog quality(logarithmic quantizer scale) stored as delta from last, last is reset to 0 if always_reset||keyframemv_scale stored as delta from last, last is reset to 0 if always_reset||keyframe FIXME check that everything works fine if this changes between framesqbias dequantization bias stored as delta from last, last is reset to 0 if always_reset||keyframeblock_max_depth maximum depth of the block tree stored as delta from last, last is reset to 0 if always_reset||keyframequant_table quantization tableHighlevel bitstream structure:==============================--------------------------------------------|Header|--------------------------------------------|------------------------------------|||Block0||||split?||||yes no||||......... intra?||||:Block01 :yes no||||:Block02 :....... 
..........||||:Block03 ::y DC ::ref index:||||:Block04 ::cb DC ::motion x :||||......... :cr DC ::motion y :||||....... ..........|||------------------------------------||------------------------------------|||Block1|||...|--------------------------------------------|------------ ------------ ------------|||Y subbands||Cb subbands||Cr subbands||||--- ---||--- ---||--- ---|||||LL0||HL0||||LL0||HL0||||LL0||HL0|||||--- ---||--- ---||--- ---||||--- ---||--- ---||--- ---|||||LH0||HH0||||LH0||HH0||||LH0||HH0|||||--- ---||--- ---||--- ---||||--- ---||--- ---||--- ---|||||HL1||LH1||||HL1||LH1||||HL1||LH1|||||--- ---||--- ---||--- ---||||--- ---||--- ---||--- ---|||||HH1||HL2||||HH1||HL2||||HH1||HL2|||||...||...||...|||------------ ------------ ------------|--------------------------------------------Decoding process:=================------------|||Subbands|------------||||------------|Intra DC||||LL0 subband prediction ------------|\ Dequantization ------------------- \||Reference frames|\ IDWT|------- -------|Motion \|||Frame 0||Frame 1||Compensation . OBMC v -------|------- -------|--------------. \------> Frame n output Frame Frame<----------------------------------/|...|------------------- Range Coder:============Binary Range Coder:------------------- The implemented range coder is an adapted version based upon "Range encoding: an algorithm for removing redundancy from a digitised message." by G. N. N. Martin. The symbols encoded by the Snow range coder are bits(0|1). The associated probabilities are not fix but change depending on the symbol mix seen so far. 
bit seen|new state ---------+----------------------------------------------- 0|256 - state_transition_table[256 - old_state];1|state_transition_table[old_state];state_transition_table={ 0, 0, 0, 0, 0, 0, 0, 0, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 126, 127, 128, 129, 130, 131, 132, 133, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 149, 150, 151, 152, 152, 153, 154, 155, 156, 157, 158, 159, 160, 161, 162, 163, 164, 165, 166, 167, 168, 169, 170, 171, 171, 172, 173, 174, 175, 176, 177, 178, 179, 180, 181, 182, 183, 184, 185, 186, 187, 188, 189, 190, 190, 191, 192, 194, 194, 195, 196, 197, 198, 199, 200, 201, 202, 202, 204, 205, 206, 207, 208, 209, 209, 210, 211, 212, 213, 215, 215, 216, 217, 218, 219, 220, 220, 222, 223, 224, 225, 226, 227, 227, 229, 229, 230, 231, 232, 234, 234, 235, 236, 237, 238, 239, 240, 241, 242, 243, 244, 245, 246, 247, 248, 248, 0, 0, 0, 0, 0, 0, 0};FIXME Range Coding of integers:------------------------- FIXME Neighboring Blocks:===================left and top are set to the respective blocks unless they are outside of the image in which case they are set to the Null block top-left is set to the top left block unless it is outside of the image in which case it is set to the left block if this block has no larger parent block or it is at the left side of its parent block and the top right block is not outside of the image then the top right block is used for top-right else the top-left block is used Null block y, cb, cr are 128 level, ref, mx and my are 0 Motion Vector 
Prediction:=========================1. the motion vectors of all the neighboring blocks are scaled to compensate for the difference of reference frames scaled_mv=(mv *(256 *(current_reference+1)/(mv.reference+1))+128)> the median of the scaled left
Definition: snow.txt:386
U
#define U(x)
Definition: vpx_arith.h:37
IAMF_OBU_Type
IAMF_OBU_Type
Definition: iamf.h:37
label_string
static int label_string(AVIOContext *pb, char **label)
Definition: iamf_parse.c:775
IAMFMixPresentation
Definition: iamf.h:107
AV_CHANNEL_ORDER_CUSTOM
@ AV_CHANNEL_ORDER_CUSTOM
The channel order does not correspond to any other predefined order and is stored as an explicit map.
Definition: channel_layout.h:125
IAMFMixPresentation::language_label
char ** language_label
Definition: iamf.h:118
AVIAMFSubmix::default_mix_gain
AVRational default_mix_gain
Default mix gain value to apply when there are no AVIAMFParamDefinition with output_mix_config's para...
Definition: iamf.h:599
AVIAMFSubmixLayout::album_anchored_loudness
AVRational album_anchored_loudness
The Album loudness information, as defined in ITU-1770-4.
Definition: iamf.h:543
AVIAMFSubmixLayout::true_peak
AVRational true_peak
The true peak of the audio signal, as defined in ITU-1770-4.
Definition: iamf.h:535
mode
mode
Definition: ebur128.h:83
AVIAMFSubmixLayout::sound_system
AVChannelLayout sound_system
Channel layout matching one of Sound Systems A to J of ITU-2051-3, plus 7.1.2ch and 3....
Definition: iamf.h:521
IAMFCodecConfig::codec_id
enum AVCodecID codec_id
Definition: iamf.h:68
IAMFCodecConfig::codec_config_id
unsigned codec_config_id
Definition: iamf.h:67
avio_read
int avio_read(AVIOContext *s, unsigned char *buf, int size)
Read size bytes from AVIOContext into buf.
Definition: aviobuf.c:611
sign_extend
static av_const int sign_extend(int val, unsigned bits)
Definition: mathops.h:133
AVIOContext::eof_reached
int eof_reached
true if was unable to read due to error or eof
Definition: avio.h:238
IAMF_ANCHOR_ELEMENT_DIALOGUE
@ IAMF_ANCHOR_ELEMENT_DIALOGUE
Definition: iamf.h:141
AV_IAMF_PARAMETER_DEFINITION_MIX_GAIN
@ AV_IAMF_PARAMETER_DEFINITION_MIX_GAIN
Subblocks are of struct type AVIAMFMixGain.
Definition: iamf.h:173
MAX_IAMF_OBU_HEADER_SIZE
#define MAX_IAMF_OBU_HEADER_SIZE
Definition: iamf.h:34
avio_skip
int64_t avio_skip(AVIOContext *s, int64_t offset)
Skip given number of bytes forward.
Definition: aviobuf.c:317
mix_presentation_obu
static int mix_presentation_obu(void *s, IAMFContext *c, AVIOContext *pb, int len)
Definition: iamf_parse.c:792
av_iamf_audio_element_add_layer
AVIAMFLayer * av_iamf_audio_element_add_layer(AVIAMFAudioElement *audio_element)
Allocate a layer and add it to a given AVIAMFAudioElement.
av_channel_layout_copy
int av_channel_layout_copy(AVChannelLayout *dst, const AVChannelLayout *src)
Make a copy of a channel layout.
Definition: channel_layout.c:439
av_strdup
char * av_strdup(const char *s)
Duplicate a string.
Definition: mem.c:270
AV_CODEC_ID_PCM_S32LE
@ AV_CODEC_ID_PCM_S32LE
Definition: codec_id.h:336
AVIAMFAudioElement::demixing_info
AVIAMFParamDefinition * demixing_info
Demixing information used to reconstruct a scalable channel audio representation.
Definition: iamf.h:376
AVIAMFDemixingInfo::dmixp_mode
unsigned int dmixp_mode
Pre-defined combination of demixing parameters.
Definition: iamf.h:140
AVIAMFSubmix::output_mix_config
AVIAMFParamDefinition * output_mix_config
Information required for post-processing the mixed audio signal to generate the audio signal for play...
Definition: iamf.h:591
AVIAMFLayer::ambisonics_mode
enum AVIAMFAmbisonicsMode ambisonics_mode
Ambisonics mode as defined in section 3.6.3 of IAMF.
Definition: iamf.h:328
flush_put_bits
static void flush_put_bits(PutBitContext *s)
Pad the end of the output stream with zeros.
Definition: put_bits.h:143
AV_CHANNEL_LAYOUT_MONO
#define AV_CHANNEL_LAYOUT_MONO
Definition: channel_layout.h:378
AV_IAMF_SUBMIX_LAYOUT_TYPE_BINAURAL
@ AV_IAMF_SUBMIX_LAYOUT_TYPE_BINAURAL
The layout is binaural.
Definition: iamf.h:501
AVIAMFLayer::flags
unsigned int flags
A bitmask which may contain a combination of AV_IAMF_LAYER_FLAG_* flags.
Definition: iamf.h:302
av_free
#define av_free(p)
Definition: tableprint_vlc.h:33
AVIAMFLayer::output_gain
AVRational output_gain
Output gain as defined in section 3.6.2 of IAMF.
Definition: iamf.h:316
AVCodecParameters::codec_id
enum AVCodecID codec_id
Specific type of the encoded data (the codec used).
Definition: codec_par.h:55
av_dict_set
int av_dict_set(AVDictionary **pm, const char *key, const char *value, int flags)
Set the given entry in *pm, overwriting an existing entry.
Definition: dict.c:88
AVIAMFSubmixElement::element_mix_config
AVIAMFParamDefinition * element_mix_config
Information required for applying any processing to the referenced and rendered Audio Elemen...
Definition: iamf.h:461
AV_CHAN_AMBISONIC_BASE
@ AV_CHAN_AMBISONIC_BASE
Range of channels between AV_CHAN_AMBISONIC_BASE and AV_CHAN_AMBISONIC_END represent Ambisonic compon...
Definition: channel_layout.h:101
AVIAMFParamDefinition::parameter_rate
unsigned int parameter_rate
Sample rate for the parameter substream.
Definition: iamf.h:222
ff_iamf_scalable_ch_layouts
const AVChannelLayout ff_iamf_scalable_ch_layouts[10]
Definition: iamf.c:27
AVIAMFSubmixElement
Submix element as defined in section 3.7 of IAMF.
Definition: iamf.h:446
AV_IAMF_AUDIO_ELEMENT_TYPE_CHANNEL
@ AV_IAMF_AUDIO_ELEMENT_TYPE_CHANNEL
Definition: iamf.h:345
IAMFAudioElement::codec_config_id
unsigned int codec_config_id
Definition: iamf.h:101
av_log
#define av_log(a,...)
Definition: tableprint_vlc.h:27
AVERROR_INVALIDDATA
#define AVERROR_INVALIDDATA
Invalid data found when processing input.
Definition: error.h:61
ffio_read_size
int ffio_read_size(AVIOContext *s, unsigned char *buf, int size)
Read size bytes from AVIOContext into buf.
Definition: aviobuf.c:661
AVIAMFAudioElement::recon_gain_info
AVIAMFParamDefinition * recon_gain_info
Recon gain information used to reconstruct a scalable channel audio representation.
Definition: iamf.h:383
IAMFMixPresentation::mix
AVIAMFMixPresentation * mix
mix backs cmix iff the AVIAMFMixPresentation is owned by this structure.
Definition: iamf.h:113
scalable_channel_layout_config
static int scalable_channel_layout_config(void *s, AVIOContext *pb, IAMFAudioElement *audio_element, const IAMFCodecConfig *codec_config)
Definition: iamf_parse.c:340
flac.h
AV_RB24
uint64_t_TMPL AV_WL64 unsigned int_TMPL AV_WL32 unsigned int_TMPL AV_WL24 unsigned int_TMPL AV_WL16 uint64_t_TMPL AV_WB64 unsigned int_TMPL AV_WB32 unsigned int_TMPL AV_RB24
Definition: bytestream.h:97
IAMFSubStream::codecpar
AVCodecParameters * codecpar
Definition: iamf.h:86
put_bits.h
IAMFCodecConfig::audio_roll_distance
int audio_roll_distance
Definition: iamf.h:71
IAMFMixPresentation::mix_presentation_id
unsigned int mix_presentation_id
Definition: iamf.h:114
AV_CODEC_ID_PCM_S24BE
@ AV_CODEC_ID_PCM_S24BE
Definition: codec_id.h:341
AVChannelCustom::id
enum AVChannel id
Definition: channel_layout.h:268
skip
static void BS_FUNC() skip(BSCTX *bc, unsigned int n)
Skip n bits in the buffer.
Definition: bitstream_template.h:375
AV_IAMF_PARAMETER_DEFINITION_DEMIXING
@ AV_IAMF_PARAMETER_DEFINITION_DEMIXING
Subblocks are of struct type AVIAMFDemixingInfo.
Definition: iamf.h:177
AV_RB16
uint64_t_TMPL AV_WL64 unsigned int_TMPL AV_WL32 unsigned int_TMPL AV_WL24 unsigned int_TMPL AV_WL16 uint64_t_TMPL AV_WB64 unsigned int_TMPL AV_WB32 unsigned int_TMPL AV_WB24 unsigned int_TMPL AV_RB16
Definition: bytestream.h:98
MPEG4AudioConfig::sample_rate
int sample_rate
Definition: mpeg4audio.h:32