mpeg4audio.h 8.7 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177
  1. /*
  2. * MPEG-4 Audio common header
  3. * Copyright (c) 2008 Baptiste Coudurier <baptiste.coudurier@free.fr>
  4. *
  5. * This file is part of FFmpeg.
  6. *
  7. * FFmpeg is free software; you can redistribute it and/or
  8. * modify it under the terms of the GNU Lesser General Public
  9. * License as published by the Free Software Foundation; either
  10. * version 2.1 of the License, or (at your option) any later version.
  11. *
  12. * FFmpeg is distributed in the hope that it will be useful,
  13. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  15. * Lesser General Public License for more details.
  16. *
  17. * You should have received a copy of the GNU Lesser General Public
  18. * License along with FFmpeg; if not, write to the Free Software
  19. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  20. */
  21. #ifndef AVCODEC_MPEG4AUDIO_H
  22. #define AVCODEC_MPEG4AUDIO_H
  23. #include <stdint.h>
  24. #include "libavutil/attributes.h"
  25. #include "get_bits.h"
  26. #include "internal.h"
  27. #include "put_bits.h"
  /**
   * Audio configuration filled in by the ff_mpeg4audio_get_config_gb() and
   * avpriv_mpeg4audio_get_config*() parsers declared in this header.
   *
   * Field order is part of the layout and must not change.
   * NOTE(review): the meaning of the undocumented fields is inferred from
   * their names only; confirm against the parser implementation.
   */
  typedef struct MPEG4AudioConfig {
      /* Core configuration. */
      int object_type;        ///< presumably an enum AudioObjectType value -- TODO confirm
      int sampling_index;     ///< presumably an index into avpriv_mpeg4audio_sample_rates -- TODO confirm
      int sample_rate;
      int chan_config;
      int sbr;                ///< -1 implicit, 1 presence

      /* Extension counterparts of the core fields. */
      int ext_object_type;
      int ext_sampling_index;
      int ext_sample_rate;
      int ext_chan_config;

      int channels;
      int ps;                 ///< -1 implicit, 1 presence
      int frame_length_short;
  } MPEG4AudioConfig;
  /**
   * Table of 16 sample-rate entries, defined in another translation unit.
   * NOTE(review): presumably indexed by the sampling index stored in
   * MPEG4AudioConfig -- confirm against the definition.
   */
  extern av_export_avcodec const int avpriv_mpeg4audio_sample_rates[16];
  /**
   * Table of 14 channel-count entries, defined in another translation unit.
   * NOTE(review): presumably indexed by the channel configuration stored in
   * MPEG4AudioConfig -- confirm against the definition.
   */
  extern const uint8_t ff_mpeg4audio_channels[14];
  44. /**
  45. * Parse MPEG-4 systems extradata from a potentially unaligned GetBitContext to retrieve audio configuration.
  46. * @param[in] c MPEG4AudioConfig structure to fill.
  47. * @param[in] gb Extradata from container.
  48. * @param[in] sync_extension look for a sync extension after config if true.
  49. * @param[in] logctx opaque struct starting with an AVClass element, used for logging.
  50. * @return negative AVERROR code on error, on success AudioSpecificConfig bit index in extradata.
  51. */
  52. int ff_mpeg4audio_get_config_gb(MPEG4AudioConfig *c, GetBitContext *gb,
  53. int sync_extension, void *logctx);
  54. #if LIBAVCODEC_VERSION_MAJOR < 59
  55. /**
  56. * Parse MPEG-4 systems extradata from a raw buffer to retrieve audio configuration.
  57. * @param[in] c MPEG4AudioConfig structure to fill.
  58. * @param[in] buf Extradata from container.
  59. * @param[in] bit_size Extradata size in bits.
  60. * @param[in] sync_extension look for a sync extension after config if true.
  61. * @return negative AVERROR code on error, on success AudioSpecificConfig bit index in extradata.
  62. */
  63. int avpriv_mpeg4audio_get_config(MPEG4AudioConfig *c, const uint8_t *buf,
  64. int bit_size, int sync_extension);
  65. #endif
  66. /**
  67. * Parse MPEG-4 systems extradata from a raw buffer to retrieve audio configuration.
  68. * @param[in] c MPEG4AudioConfig structure to fill.
  69. * @param[in] buf Extradata from container.
  70. * @param[in] size Extradata size in bytes.
  71. * @param[in] sync_extension look for a sync extension after config if true.
  72. * @param[in] logctx opaque struct starting with an AVClass element, used for logging.
  73. * @return negative AVERROR code on error, AudioSpecificConfig bit index in extradata on success.
  74. */
  75. int avpriv_mpeg4audio_get_config2(MPEG4AudioConfig *c, const uint8_t *buf,
  76. int size, int sync_extension, void *logctx);
  /**
   * Audio object type identifiers.
   *
   * Each enumerator is written with its numeric value spelled out. The values
   * 10, 11 and 18 have no name in this list. The Y/N column in the per-entry
   * comments is the "Support?" flag, followed by the long name.
   */
  enum AudioObjectType {
      AOT_NULL            =  0,
                                 // Support?                Name
      AOT_AAC_MAIN        =  1,  ///< Y                       Main
      AOT_AAC_LC          =  2,  ///< Y                       Low Complexity
      AOT_AAC_SSR         =  3,  ///< N (code in SoC repo)    Scalable Sample Rate
      AOT_AAC_LTP         =  4,  ///< Y                       Long Term Prediction
      AOT_SBR             =  5,  ///< Y                       Spectral Band Replication
      AOT_AAC_SCALABLE    =  6,  ///< N                       Scalable
      AOT_TWINVQ          =  7,  ///< N                       Twin Vector Quantizer
      AOT_CELP            =  8,  ///< N                       Code Excited Linear Prediction
      AOT_HVXC            =  9,  ///< N                       Harmonic Vector eXcitation Coding
      AOT_TTSI            = 12,  ///< N                       Text-To-Speech Interface
      AOT_MAINSYNTH       = 13,  ///< N                       Main Synthesis
      AOT_WAVESYNTH       = 14,  ///< N                       Wavetable Synthesis
      AOT_MIDI            = 15,  ///< N                       General MIDI
      AOT_SAFX            = 16,  ///< N                       Algorithmic Synthesis and Audio Effects
      AOT_ER_AAC_LC       = 17,  ///< N                       Error Resilient Low Complexity
      AOT_ER_AAC_LTP      = 19,  ///< N                       Error Resilient Long Term Prediction
      AOT_ER_AAC_SCALABLE = 20,  ///< N                       Error Resilient Scalable
      AOT_ER_TWINVQ       = 21,  ///< N                       Error Resilient Twin Vector Quantizer
      AOT_ER_BSAC         = 22,  ///< N                       Error Resilient Bit-Sliced Arithmetic Coding
      AOT_ER_AAC_LD       = 23,  ///< N                       Error Resilient Low Delay
      AOT_ER_CELP         = 24,  ///< N                       Error Resilient Code Excited Linear Prediction
      AOT_ER_HVXC         = 25,  ///< N                       Error Resilient Harmonic Vector eXcitation Coding
      AOT_ER_HILN         = 26,  ///< N                       Error Resilient Harmonic and Individual Lines plus Noise
      AOT_ER_PARAM        = 27,  ///< N                       Error Resilient Parametric
      AOT_SSC             = 28,  ///< N                       SinuSoidal Coding
      AOT_PS              = 29,  ///< N                       Parametric Stereo
      AOT_SURROUND        = 30,  ///< N                       MPEG Surround
      AOT_ESCAPE          = 31,  ///< Y                       Escape Value
      AOT_L1              = 32,  ///< Y                       Layer 1
      AOT_L2              = 33,  ///< Y                       Layer 2
      AOT_L3              = 34,  ///< Y                       Layer 3
      AOT_DST             = 35,  ///< N                       Direct Stream Transfer
      AOT_ALS             = 36,  ///< Y                       Audio LosslesS
      AOT_SLS             = 37,  ///< N                       Scalable LosslesS
      AOT_SLS_NON_CORE    = 38,  ///< N                       Scalable LosslesS (non core)
      AOT_ER_AAC_ELD      = 39,  ///< N                       Error Resilient Enhanced Low Delay
      AOT_SMR_SIMPLE      = 40,  ///< N                       Symbolic Music Representation Simple
      AOT_SMR_MAIN        = 41,  ///< N                       Symbolic Music Representation Main
      AOT_USAC_NOSBR      = 42,  ///< N                       Unified Speech and Audio Coding (no SBR)
      AOT_SAOC            = 43,  ///< N                       Spatial Audio Object Coding
      AOT_LD_SURROUND     = 44,  ///< N                       Low Delay MPEG Surround
      AOT_USAC            = 45,  ///< N                       Unified Speech and Audio Coding
  };
  /**
   * Maximum size of a PCE including the 3-bit ID_PCE marker and the comment.
   * NOTE(review): the unit is not stated here (presumably bytes) -- confirm
   * against the buffers sized with this macro.
   */
  #define MAX_PCE_SIZE 320
  125. static av_always_inline unsigned int ff_pce_copy_bits(PutBitContext *pb,
  126. GetBitContext *gb,
  127. int bits)
  128. {
  129. unsigned int el = get_bits(gb, bits);
  130. put_bits(pb, bits, el);
  131. return el;
  132. }
  133. static inline int ff_copy_pce_data(PutBitContext *pb, GetBitContext *gb)
  134. {
  135. int five_bit_ch, four_bit_ch, comment_size, bits;
  136. int offset = put_bits_count(pb);
  137. ff_pce_copy_bits(pb, gb, 10); // Tag, Object Type, Frequency
  138. five_bit_ch = ff_pce_copy_bits(pb, gb, 4); // Front
  139. five_bit_ch += ff_pce_copy_bits(pb, gb, 4); // Side
  140. five_bit_ch += ff_pce_copy_bits(pb, gb, 4); // Back
  141. four_bit_ch = ff_pce_copy_bits(pb, gb, 2); // LFE
  142. four_bit_ch += ff_pce_copy_bits(pb, gb, 3); // Data
  143. five_bit_ch += ff_pce_copy_bits(pb, gb, 4); // Coupling
  144. if (ff_pce_copy_bits(pb, gb, 1)) // Mono Mixdown
  145. ff_pce_copy_bits(pb, gb, 4);
  146. if (ff_pce_copy_bits(pb, gb, 1)) // Stereo Mixdown
  147. ff_pce_copy_bits(pb, gb, 4);
  148. if (ff_pce_copy_bits(pb, gb, 1)) // Matrix Mixdown
  149. ff_pce_copy_bits(pb, gb, 3);
  150. for (bits = five_bit_ch*5+four_bit_ch*4; bits > 16; bits -= 16)
  151. ff_pce_copy_bits(pb, gb, 16);
  152. if (bits)
  153. ff_pce_copy_bits(pb, gb, bits);
  154. avpriv_align_put_bits(pb);
  155. align_get_bits(gb);
  156. comment_size = ff_pce_copy_bits(pb, gb, 8);
  157. for (; comment_size > 0; comment_size--)
  158. ff_pce_copy_bits(pb, gb, 8);
  159. return put_bits_count(pb) - offset;
  160. }
  161. #endif /* AVCODEC_MPEG4AUDIO_H */