You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

1947 lines
71KB

  1. /*
  2. * DCA compatible decoder
  3. * Copyright (C) 2004 Gildas Bazin
  4. * Copyright (C) 2004 Benjamin Zores
  5. * Copyright (C) 2006 Benjamin Larsson
  6. * Copyright (C) 2007 Konstantin Shishkov
  7. *
  8. * This file is part of FFmpeg.
  9. *
  10. * FFmpeg is free software; you can redistribute it and/or
  11. * modify it under the terms of the GNU Lesser General Public
  12. * License as published by the Free Software Foundation; either
  13. * version 2.1 of the License, or (at your option) any later version.
  14. *
  15. * FFmpeg is distributed in the hope that it will be useful,
  16. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  17. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  18. * Lesser General Public License for more details.
  19. *
  20. * You should have received a copy of the GNU Lesser General Public
  21. * License along with FFmpeg; if not, write to the Free Software
  22. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  23. */
  24. #include <math.h>
  25. #include <stddef.h>
  26. #include <stdio.h>
  27. #include "libavutil/common.h"
  28. #include "libavutil/intmath.h"
  29. #include "libavutil/intreadwrite.h"
  30. #include "libavutil/audioconvert.h"
  31. #include "avcodec.h"
  32. #include "dsputil.h"
  33. #include "fft.h"
  34. #include "get_bits.h"
  35. #include "put_bits.h"
  36. #include "dcadata.h"
  37. #include "dcahuff.h"
  38. #include "dca.h"
  39. #include "synth_filter.h"
  40. #include "dcadsp.h"
  41. #include "fmtconvert.h"
  42. #if ARCH_ARM
  43. # include "arm/dca.h"
  44. #endif
  45. //#define TRACE
  46. #define DCA_PRIM_CHANNELS_MAX (7)
  47. #define DCA_SUBBANDS (32)
  48. #define DCA_ABITS_MAX (32) /* Should be 28 */
  49. #define DCA_SUBSUBFRAMES_MAX (4)
  50. #define DCA_SUBFRAMES_MAX (16)
  51. #define DCA_BLOCKS_MAX (16)
  52. #define DCA_LFE_MAX (3)
  53. enum DCAMode {
  54. DCA_MONO = 0,
  55. DCA_CHANNEL,
  56. DCA_STEREO,
  57. DCA_STEREO_SUMDIFF,
  58. DCA_STEREO_TOTAL,
  59. DCA_3F,
  60. DCA_2F1R,
  61. DCA_3F1R,
  62. DCA_2F2R,
  63. DCA_3F2R,
  64. DCA_4F2R
  65. };
  66. /* these are unconfirmed but should be mostly correct */
  67. enum DCAExSSSpeakerMask {
  68. DCA_EXSS_FRONT_CENTER = 0x0001,
  69. DCA_EXSS_FRONT_LEFT_RIGHT = 0x0002,
  70. DCA_EXSS_SIDE_REAR_LEFT_RIGHT = 0x0004,
  71. DCA_EXSS_LFE = 0x0008,
  72. DCA_EXSS_REAR_CENTER = 0x0010,
  73. DCA_EXSS_FRONT_HIGH_LEFT_RIGHT = 0x0020,
  74. DCA_EXSS_REAR_LEFT_RIGHT = 0x0040,
  75. DCA_EXSS_FRONT_HIGH_CENTER = 0x0080,
  76. DCA_EXSS_OVERHEAD = 0x0100,
  77. DCA_EXSS_CENTER_LEFT_RIGHT = 0x0200,
  78. DCA_EXSS_WIDE_LEFT_RIGHT = 0x0400,
  79. DCA_EXSS_SIDE_LEFT_RIGHT = 0x0800,
  80. DCA_EXSS_LFE2 = 0x1000,
  81. DCA_EXSS_SIDE_HIGH_LEFT_RIGHT = 0x2000,
  82. DCA_EXSS_REAR_HIGH_CENTER = 0x4000,
  83. DCA_EXSS_REAR_HIGH_LEFT_RIGHT = 0x8000,
  84. };
  85. enum DCAExtensionMask {
  86. DCA_EXT_CORE = 0x001, ///< core in core substream
  87. DCA_EXT_XXCH = 0x002, ///< XXCh channels extension in core substream
  88. DCA_EXT_X96 = 0x004, ///< 96/24 extension in core substream
  89. DCA_EXT_XCH = 0x008, ///< XCh channel extension in core substream
  90. DCA_EXT_EXSS_CORE = 0x010, ///< core in ExSS (extension substream)
  91. DCA_EXT_EXSS_XBR = 0x020, ///< extended bitrate extension in ExSS
  92. DCA_EXT_EXSS_XXCH = 0x040, ///< XXCh channels extension in ExSS
  93. DCA_EXT_EXSS_X96 = 0x080, ///< 96/24 extension in ExSS
  94. DCA_EXT_EXSS_LBR = 0x100, ///< low bitrate component in ExSS
  95. DCA_EXT_EXSS_XLL = 0x200, ///< lossless extension in ExSS
  96. };
  97. /* -1 are reserved or unknown */
  98. static const int dca_ext_audio_descr_mask[] = {
  99. DCA_EXT_XCH,
  100. -1,
  101. DCA_EXT_X96,
  102. DCA_EXT_XCH | DCA_EXT_X96,
  103. -1,
  104. -1,
  105. DCA_EXT_XXCH,
  106. -1,
  107. };
  108. /* extensions that reside in core substream */
  109. #define DCA_CORE_EXTS (DCA_EXT_XCH | DCA_EXT_XXCH | DCA_EXT_X96)
  110. /* Tables for mapping dts channel configurations to libavcodec multichannel api.
  111. * Some compromises have been made for special configurations. Most configurations
  112. * are never used so complete accuracy is not needed.
  113. *
  114. * L = left, R = right, C = center, S = surround, F = front, R = rear, T = total, OV = overhead.
  115. * S -> side, when both rear and back are configured move one of them to the side channel
  116. * OV -> center back
  117. * All 2 channel configurations -> AV_CH_LAYOUT_STEREO
  118. */
  119. static const int64_t dca_core_channel_layout[] = {
  120. AV_CH_FRONT_CENTER, ///< 1, A
  121. AV_CH_LAYOUT_STEREO, ///< 2, A + B (dual mono)
  122. AV_CH_LAYOUT_STEREO, ///< 2, L + R (stereo)
  123. AV_CH_LAYOUT_STEREO, ///< 2, (L+R) + (L-R) (sum-difference)
  124. AV_CH_LAYOUT_STEREO, ///< 2, LT +RT (left and right total)
  125. AV_CH_LAYOUT_STEREO|AV_CH_FRONT_CENTER, ///< 3, C+L+R
  126. AV_CH_LAYOUT_STEREO|AV_CH_BACK_CENTER, ///< 3, L+R+S
  127. AV_CH_LAYOUT_STEREO|AV_CH_FRONT_CENTER|AV_CH_BACK_CENTER, ///< 4, C + L + R+ S
  128. AV_CH_LAYOUT_STEREO|AV_CH_SIDE_LEFT|AV_CH_SIDE_RIGHT, ///< 4, L + R +SL+ SR
  129. AV_CH_LAYOUT_STEREO|AV_CH_FRONT_CENTER|AV_CH_SIDE_LEFT|AV_CH_SIDE_RIGHT, ///< 5, C + L + R+ SL+SR
  130. AV_CH_LAYOUT_STEREO|AV_CH_SIDE_LEFT|AV_CH_SIDE_RIGHT|AV_CH_FRONT_LEFT_OF_CENTER|AV_CH_FRONT_RIGHT_OF_CENTER, ///< 6, CL + CR + L + R + SL + SR
  131. AV_CH_LAYOUT_STEREO|AV_CH_BACK_LEFT|AV_CH_BACK_RIGHT|AV_CH_FRONT_CENTER|AV_CH_BACK_CENTER, ///< 6, C + L + R+ LR + RR + OV
  132. AV_CH_FRONT_CENTER|AV_CH_FRONT_RIGHT_OF_CENTER|AV_CH_FRONT_LEFT_OF_CENTER|AV_CH_BACK_CENTER|AV_CH_BACK_LEFT|AV_CH_BACK_RIGHT, ///< 6, CF+ CR+LF+ RF+LR + RR
  133. AV_CH_FRONT_LEFT_OF_CENTER|AV_CH_FRONT_CENTER|AV_CH_FRONT_RIGHT_OF_CENTER|AV_CH_LAYOUT_STEREO|AV_CH_SIDE_LEFT|AV_CH_SIDE_RIGHT, ///< 7, CL + C + CR + L + R + SL + SR
  134. AV_CH_FRONT_LEFT_OF_CENTER|AV_CH_FRONT_RIGHT_OF_CENTER|AV_CH_LAYOUT_STEREO|AV_CH_SIDE_LEFT|AV_CH_SIDE_RIGHT|AV_CH_BACK_LEFT|AV_CH_BACK_RIGHT, ///< 8, CL + CR + L + R + SL1 + SL2+ SR1 + SR2
  135. AV_CH_FRONT_LEFT_OF_CENTER|AV_CH_FRONT_CENTER|AV_CH_FRONT_RIGHT_OF_CENTER|AV_CH_LAYOUT_STEREO|AV_CH_SIDE_LEFT|AV_CH_BACK_CENTER|AV_CH_SIDE_RIGHT, ///< 8, CL + C+ CR + L + R + SL + S+ SR
  136. };
  137. static const int8_t dca_lfe_index[] = {
  138. 1,2,2,2,2,3,2,3,2,3,2,3,1,3,2,3
  139. };
  140. static const int8_t dca_channel_reorder_lfe[][9] = {
  141. { 0, -1, -1, -1, -1, -1, -1, -1, -1},
  142. { 0, 1, -1, -1, -1, -1, -1, -1, -1},
  143. { 0, 1, -1, -1, -1, -1, -1, -1, -1},
  144. { 0, 1, -1, -1, -1, -1, -1, -1, -1},
  145. { 0, 1, -1, -1, -1, -1, -1, -1, -1},
  146. { 2, 0, 1, -1, -1, -1, -1, -1, -1},
  147. { 0, 1, 3, -1, -1, -1, -1, -1, -1},
  148. { 2, 0, 1, 4, -1, -1, -1, -1, -1},
  149. { 0, 1, 3, 4, -1, -1, -1, -1, -1},
  150. { 2, 0, 1, 4, 5, -1, -1, -1, -1},
  151. { 3, 4, 0, 1, 5, 6, -1, -1, -1},
  152. { 2, 0, 1, 4, 5, 6, -1, -1, -1},
  153. { 0, 6, 4, 5, 2, 3, -1, -1, -1},
  154. { 4, 2, 5, 0, 1, 6, 7, -1, -1},
  155. { 5, 6, 0, 1, 7, 3, 8, 4, -1},
  156. { 4, 2, 5, 0, 1, 6, 8, 7, -1},
  157. };
  158. static const int8_t dca_channel_reorder_lfe_xch[][9] = {
  159. { 0, 2, -1, -1, -1, -1, -1, -1, -1},
  160. { 0, 1, 3, -1, -1, -1, -1, -1, -1},
  161. { 0, 1, 3, -1, -1, -1, -1, -1, -1},
  162. { 0, 1, 3, -1, -1, -1, -1, -1, -1},
  163. { 0, 1, 3, -1, -1, -1, -1, -1, -1},
  164. { 2, 0, 1, 4, -1, -1, -1, -1, -1},
  165. { 0, 1, 3, 4, -1, -1, -1, -1, -1},
  166. { 2, 0, 1, 4, 5, -1, -1, -1, -1},
  167. { 0, 1, 4, 5, 3, -1, -1, -1, -1},
  168. { 2, 0, 1, 5, 6, 4, -1, -1, -1},
  169. { 3, 4, 0, 1, 6, 7, 5, -1, -1},
  170. { 2, 0, 1, 4, 5, 6, 7, -1, -1},
  171. { 0, 6, 4, 5, 2, 3, 7, -1, -1},
  172. { 4, 2, 5, 0, 1, 7, 8, 6, -1},
  173. { 5, 6, 0, 1, 8, 3, 9, 4, 7},
  174. { 4, 2, 5, 0, 1, 6, 9, 8, 7},
  175. };
  176. static const int8_t dca_channel_reorder_nolfe[][9] = {
  177. { 0, -1, -1, -1, -1, -1, -1, -1, -1},
  178. { 0, 1, -1, -1, -1, -1, -1, -1, -1},
  179. { 0, 1, -1, -1, -1, -1, -1, -1, -1},
  180. { 0, 1, -1, -1, -1, -1, -1, -1, -1},
  181. { 0, 1, -1, -1, -1, -1, -1, -1, -1},
  182. { 2, 0, 1, -1, -1, -1, -1, -1, -1},
  183. { 0, 1, 2, -1, -1, -1, -1, -1, -1},
  184. { 2, 0, 1, 3, -1, -1, -1, -1, -1},
  185. { 0, 1, 2, 3, -1, -1, -1, -1, -1},
  186. { 2, 0, 1, 3, 4, -1, -1, -1, -1},
  187. { 2, 3, 0, 1, 4, 5, -1, -1, -1},
  188. { 2, 0, 1, 3, 4, 5, -1, -1, -1},
  189. { 0, 5, 3, 4, 1, 2, -1, -1, -1},
  190. { 3, 2, 4, 0, 1, 5, 6, -1, -1},
  191. { 4, 5, 0, 1, 6, 2, 7, 3, -1},
  192. { 3, 2, 4, 0, 1, 5, 7, 6, -1},
  193. };
  194. static const int8_t dca_channel_reorder_nolfe_xch[][9] = {
  195. { 0, 1, -1, -1, -1, -1, -1, -1, -1},
  196. { 0, 1, 2, -1, -1, -1, -1, -1, -1},
  197. { 0, 1, 2, -1, -1, -1, -1, -1, -1},
  198. { 0, 1, 2, -1, -1, -1, -1, -1, -1},
  199. { 0, 1, 2, -1, -1, -1, -1, -1, -1},
  200. { 2, 0, 1, 3, -1, -1, -1, -1, -1},
  201. { 0, 1, 2, 3, -1, -1, -1, -1, -1},
  202. { 2, 0, 1, 3, 4, -1, -1, -1, -1},
  203. { 0, 1, 3, 4, 2, -1, -1, -1, -1},
  204. { 2, 0, 1, 4, 5, 3, -1, -1, -1},
  205. { 2, 3, 0, 1, 5, 6, 4, -1, -1},
  206. { 2, 0, 1, 3, 4, 5, 6, -1, -1},
  207. { 0, 5, 3, 4, 1, 2, 6, -1, -1},
  208. { 3, 2, 4, 0, 1, 6, 7, 5, -1},
  209. { 4, 5, 0, 1, 7, 2, 8, 3, 6},
  210. { 3, 2, 4, 0, 1, 5, 8, 7, 6},
  211. };
  212. #define DCA_DOLBY 101 /* FIXME */
  213. #define DCA_CHANNEL_BITS 6
  214. #define DCA_CHANNEL_MASK 0x3F
  215. #define DCA_LFE 0x80
  216. #define HEADER_SIZE 14
  217. #define DCA_MAX_FRAME_SIZE 16384
  218. #define DCA_MAX_EXSS_HEADER_SIZE 4096
  219. #define DCA_BUFFER_PADDING_SIZE 1024
  220. /** Bit allocation */
  221. typedef struct {
  222. int offset; ///< code values offset
  223. int maxbits[8]; ///< max bits in VLC
  224. int wrap; ///< wrap for get_vlc2()
  225. VLC vlc[8]; ///< actual codes
  226. } BitAlloc;
  227. static BitAlloc dca_bitalloc_index; ///< indexes for samples VLC select
  228. static BitAlloc dca_tmode; ///< transition mode VLCs
  229. static BitAlloc dca_scalefactor; ///< scalefactor VLCs
  230. static BitAlloc dca_smpl_bitalloc[11]; ///< samples VLCs
  231. static av_always_inline int get_bitalloc(GetBitContext *gb, BitAlloc *ba, int idx)
  232. {
  233. return get_vlc2(gb, ba->vlc[idx].table, ba->vlc[idx].bits, ba->wrap) + ba->offset;
  234. }
  235. typedef struct {
  236. AVCodecContext *avctx;
  237. /* Frame header */
  238. int frame_type; ///< type of the current frame
  239. int samples_deficit; ///< deficit sample count
  240. int crc_present; ///< crc is present in the bitstream
  241. int sample_blocks; ///< number of PCM sample blocks
  242. int frame_size; ///< primary frame byte size
  243. int amode; ///< audio channels arrangement
  244. int sample_rate; ///< audio sampling rate
  245. int bit_rate; ///< transmission bit rate
  246. int bit_rate_index; ///< transmission bit rate index
  247. int downmix; ///< embedded downmix enabled
  248. int dynrange; ///< embedded dynamic range flag
  249. int timestamp; ///< embedded time stamp flag
  250. int aux_data; ///< auxiliary data flag
  251. int hdcd; ///< source material is mastered in HDCD
  252. int ext_descr; ///< extension audio descriptor flag
  253. int ext_coding; ///< extended coding flag
  254. int aspf; ///< audio sync word insertion flag
  255. int lfe; ///< low frequency effects flag
  256. int predictor_history; ///< predictor history flag
  257. int header_crc; ///< header crc check bytes
  258. int multirate_inter; ///< multirate interpolator switch
  259. int version; ///< encoder software revision
  260. int copy_history; ///< copy history
  261. int source_pcm_res; ///< source pcm resolution
  262. int front_sum; ///< front sum/difference flag
  263. int surround_sum; ///< surround sum/difference flag
  264. int dialog_norm; ///< dialog normalisation parameter
  265. /* Primary audio coding header */
  266. int subframes; ///< number of subframes
  267. int is_channels_set; ///< check for if the channel number is already set
  268. int total_channels; ///< number of channels including extensions
  269. int prim_channels; ///< number of primary audio channels
  270. int subband_activity[DCA_PRIM_CHANNELS_MAX]; ///< subband activity count
  271. int vq_start_subband[DCA_PRIM_CHANNELS_MAX]; ///< high frequency vq start subband
  272. int joint_intensity[DCA_PRIM_CHANNELS_MAX]; ///< joint intensity coding index
  273. int transient_huffman[DCA_PRIM_CHANNELS_MAX]; ///< transient mode code book
  274. int scalefactor_huffman[DCA_PRIM_CHANNELS_MAX]; ///< scale factor code book
  275. int bitalloc_huffman[DCA_PRIM_CHANNELS_MAX]; ///< bit allocation quantizer select
  276. int quant_index_huffman[DCA_PRIM_CHANNELS_MAX][DCA_ABITS_MAX]; ///< quantization index codebook select
  277. float scalefactor_adj[DCA_PRIM_CHANNELS_MAX][DCA_ABITS_MAX]; ///< scale factor adjustment
  278. /* Primary audio coding side information */
  279. int subsubframes[DCA_SUBFRAMES_MAX]; ///< number of subsubframes
  280. int partial_samples[DCA_SUBFRAMES_MAX]; ///< partial subsubframe samples count
  281. int prediction_mode[DCA_PRIM_CHANNELS_MAX][DCA_SUBBANDS]; ///< prediction mode (ADPCM used or not)
  282. int prediction_vq[DCA_PRIM_CHANNELS_MAX][DCA_SUBBANDS]; ///< prediction VQ coefs
  283. int bitalloc[DCA_PRIM_CHANNELS_MAX][DCA_SUBBANDS]; ///< bit allocation index
  284. int transition_mode[DCA_PRIM_CHANNELS_MAX][DCA_SUBBANDS]; ///< transition mode (transients)
  285. int scale_factor[DCA_PRIM_CHANNELS_MAX][DCA_SUBBANDS][2]; ///< scale factors (2 if transient)
  286. int joint_huff[DCA_PRIM_CHANNELS_MAX]; ///< joint subband scale factors codebook
  287. int joint_scale_factor[DCA_PRIM_CHANNELS_MAX][DCA_SUBBANDS]; ///< joint subband scale factors
  288. int downmix_coef[DCA_PRIM_CHANNELS_MAX][2]; ///< stereo downmix coefficients
  289. int dynrange_coef; ///< dynamic range coefficient
  290. int high_freq_vq[DCA_PRIM_CHANNELS_MAX][DCA_SUBBANDS]; ///< VQ encoded high frequency subbands
  291. float lfe_data[2 * DCA_LFE_MAX * (DCA_BLOCKS_MAX + 4)]; ///< Low frequency effect data
  292. int lfe_scale_factor;
  293. /* Subband samples history (for ADPCM) */
  294. DECLARE_ALIGNED(16, float, subband_samples_hist)[DCA_PRIM_CHANNELS_MAX][DCA_SUBBANDS][4];
  295. DECLARE_ALIGNED(32, float, subband_fir_hist)[DCA_PRIM_CHANNELS_MAX][512];
  296. DECLARE_ALIGNED(32, float, subband_fir_noidea)[DCA_PRIM_CHANNELS_MAX][32];
  297. int hist_index[DCA_PRIM_CHANNELS_MAX];
  298. DECLARE_ALIGNED(32, float, raXin)[32];
  299. int output; ///< type of output
  300. float scale_bias; ///< output scale
  301. DECLARE_ALIGNED(32, float, subband_samples)[DCA_BLOCKS_MAX][DCA_PRIM_CHANNELS_MAX][DCA_SUBBANDS][8];
  302. DECLARE_ALIGNED(32, float, samples)[(DCA_PRIM_CHANNELS_MAX+1)*256];
  303. const float *samples_chanptr[DCA_PRIM_CHANNELS_MAX+1];
  304. uint8_t dca_buffer[DCA_MAX_FRAME_SIZE + DCA_MAX_EXSS_HEADER_SIZE + DCA_BUFFER_PADDING_SIZE];
  305. int dca_buffer_size; ///< how much data is in the dca_buffer
  306. const int8_t* channel_order_tab; ///< channel reordering table, lfe and non lfe
  307. GetBitContext gb;
  308. /* Current position in DCA frame */
  309. int current_subframe;
  310. int current_subsubframe;
  311. int core_ext_mask; ///< present extensions in the core substream
  312. /* XCh extension information */
  313. int xch_present; ///< XCh extension present and valid
  314. int xch_base_channel; ///< index of first (only) channel containing XCH data
  315. /* ExSS header parser */
  316. int static_fields; ///< static fields present
  317. int mix_metadata; ///< mixing metadata present
  318. int num_mix_configs; ///< number of mix out configurations
  319. int mix_config_num_ch[4]; ///< number of channels in each mix out configuration
  320. int profile;
  321. int debug_flag; ///< used for suppressing repeated error messages output
  322. DSPContext dsp;
  323. FFTContext imdct;
  324. SynthFilterContext synth;
  325. DCADSPContext dcadsp;
  326. FmtConvertContext fmt_conv;
  327. } DCAContext;
  328. static const uint16_t dca_vlc_offs[] = {
  329. 0, 512, 640, 768, 1282, 1794, 2436, 3080, 3770, 4454, 5364,
  330. 5372, 5380, 5388, 5392, 5396, 5412, 5420, 5428, 5460, 5492, 5508,
  331. 5572, 5604, 5668, 5796, 5860, 5892, 6412, 6668, 6796, 7308, 7564,
  332. 7820, 8076, 8620, 9132, 9388, 9910, 10166, 10680, 11196, 11726, 12240,
  333. 12752, 13298, 13810, 14326, 14840, 15500, 16022, 16540, 17158, 17678, 18264,
  334. 18796, 19352, 19926, 20468, 21472, 22398, 23014, 23622,
  335. };
  336. static av_cold void dca_init_vlcs(void)
  337. {
  338. static int vlcs_initialized = 0;
  339. int i, j, c = 14;
  340. static VLC_TYPE dca_table[23622][2];
  341. if (vlcs_initialized)
  342. return;
  343. dca_bitalloc_index.offset = 1;
  344. dca_bitalloc_index.wrap = 2;
  345. for (i = 0; i < 5; i++) {
  346. dca_bitalloc_index.vlc[i].table = &dca_table[dca_vlc_offs[i]];
  347. dca_bitalloc_index.vlc[i].table_allocated = dca_vlc_offs[i + 1] - dca_vlc_offs[i];
  348. init_vlc(&dca_bitalloc_index.vlc[i], bitalloc_12_vlc_bits[i], 12,
  349. bitalloc_12_bits[i], 1, 1,
  350. bitalloc_12_codes[i], 2, 2, INIT_VLC_USE_NEW_STATIC);
  351. }
  352. dca_scalefactor.offset = -64;
  353. dca_scalefactor.wrap = 2;
  354. for (i = 0; i < 5; i++) {
  355. dca_scalefactor.vlc[i].table = &dca_table[dca_vlc_offs[i + 5]];
  356. dca_scalefactor.vlc[i].table_allocated = dca_vlc_offs[i + 6] - dca_vlc_offs[i + 5];
  357. init_vlc(&dca_scalefactor.vlc[i], SCALES_VLC_BITS, 129,
  358. scales_bits[i], 1, 1,
  359. scales_codes[i], 2, 2, INIT_VLC_USE_NEW_STATIC);
  360. }
  361. dca_tmode.offset = 0;
  362. dca_tmode.wrap = 1;
  363. for (i = 0; i < 4; i++) {
  364. dca_tmode.vlc[i].table = &dca_table[dca_vlc_offs[i + 10]];
  365. dca_tmode.vlc[i].table_allocated = dca_vlc_offs[i + 11] - dca_vlc_offs[i + 10];
  366. init_vlc(&dca_tmode.vlc[i], tmode_vlc_bits[i], 4,
  367. tmode_bits[i], 1, 1,
  368. tmode_codes[i], 2, 2, INIT_VLC_USE_NEW_STATIC);
  369. }
  370. for (i = 0; i < 10; i++)
  371. for (j = 0; j < 7; j++){
  372. if (!bitalloc_codes[i][j]) break;
  373. dca_smpl_bitalloc[i+1].offset = bitalloc_offsets[i];
  374. dca_smpl_bitalloc[i+1].wrap = 1 + (j > 4);
  375. dca_smpl_bitalloc[i+1].vlc[j].table = &dca_table[dca_vlc_offs[c]];
  376. dca_smpl_bitalloc[i+1].vlc[j].table_allocated = dca_vlc_offs[c + 1] - dca_vlc_offs[c];
  377. init_vlc(&dca_smpl_bitalloc[i+1].vlc[j], bitalloc_maxbits[i][j],
  378. bitalloc_sizes[i],
  379. bitalloc_bits[i][j], 1, 1,
  380. bitalloc_codes[i][j], 2, 2, INIT_VLC_USE_NEW_STATIC);
  381. c++;
  382. }
  383. vlcs_initialized = 1;
  384. }
  385. static inline void get_array(GetBitContext *gb, int *dst, int len, int bits)
  386. {
  387. while(len--)
  388. *dst++ = get_bits(gb, bits);
  389. }
  390. static int dca_parse_audio_coding_header(DCAContext * s, int base_channel)
  391. {
  392. int i, j;
  393. static const float adj_table[4] = { 1.0, 1.1250, 1.2500, 1.4375 };
  394. static const int bitlen[11] = { 0, 1, 2, 2, 2, 2, 3, 3, 3, 3, 3 };
  395. static const int thr[11] = { 0, 1, 3, 3, 3, 3, 7, 7, 7, 7, 7 };
  396. s->total_channels = get_bits(&s->gb, 3) + 1 + base_channel;
  397. s->prim_channels = s->total_channels;
  398. if (s->prim_channels > DCA_PRIM_CHANNELS_MAX)
  399. s->prim_channels = DCA_PRIM_CHANNELS_MAX;
  400. for (i = base_channel; i < s->prim_channels; i++) {
  401. s->subband_activity[i] = get_bits(&s->gb, 5) + 2;
  402. if (s->subband_activity[i] > DCA_SUBBANDS)
  403. s->subband_activity[i] = DCA_SUBBANDS;
  404. }
  405. for (i = base_channel; i < s->prim_channels; i++) {
  406. s->vq_start_subband[i] = get_bits(&s->gb, 5) + 1;
  407. if (s->vq_start_subband[i] > DCA_SUBBANDS)
  408. s->vq_start_subband[i] = DCA_SUBBANDS;
  409. }
  410. get_array(&s->gb, s->joint_intensity + base_channel, s->prim_channels - base_channel, 3);
  411. get_array(&s->gb, s->transient_huffman + base_channel, s->prim_channels - base_channel, 2);
  412. get_array(&s->gb, s->scalefactor_huffman + base_channel, s->prim_channels - base_channel, 3);
  413. get_array(&s->gb, s->bitalloc_huffman + base_channel, s->prim_channels - base_channel, 3);
  414. /* Get codebooks quantization indexes */
  415. if (!base_channel)
  416. memset(s->quant_index_huffman, 0, sizeof(s->quant_index_huffman));
  417. for (j = 1; j < 11; j++)
  418. for (i = base_channel; i < s->prim_channels; i++)
  419. s->quant_index_huffman[i][j] = get_bits(&s->gb, bitlen[j]);
  420. /* Get scale factor adjustment */
  421. for (j = 0; j < 11; j++)
  422. for (i = base_channel; i < s->prim_channels; i++)
  423. s->scalefactor_adj[i][j] = 1;
  424. for (j = 1; j < 11; j++)
  425. for (i = base_channel; i < s->prim_channels; i++)
  426. if (s->quant_index_huffman[i][j] < thr[j])
  427. s->scalefactor_adj[i][j] = adj_table[get_bits(&s->gb, 2)];
  428. if (s->crc_present) {
  429. /* Audio header CRC check */
  430. get_bits(&s->gb, 16);
  431. }
  432. s->current_subframe = 0;
  433. s->current_subsubframe = 0;
  434. #ifdef TRACE
  435. av_log(s->avctx, AV_LOG_DEBUG, "subframes: %i\n", s->subframes);
  436. av_log(s->avctx, AV_LOG_DEBUG, "prim channels: %i\n", s->prim_channels);
  437. for (i = base_channel; i < s->prim_channels; i++){
  438. av_log(s->avctx, AV_LOG_DEBUG, "subband activity: %i\n", s->subband_activity[i]);
  439. av_log(s->avctx, AV_LOG_DEBUG, "vq start subband: %i\n", s->vq_start_subband[i]);
  440. av_log(s->avctx, AV_LOG_DEBUG, "joint intensity: %i\n", s->joint_intensity[i]);
  441. av_log(s->avctx, AV_LOG_DEBUG, "transient mode codebook: %i\n", s->transient_huffman[i]);
  442. av_log(s->avctx, AV_LOG_DEBUG, "scale factor codebook: %i\n", s->scalefactor_huffman[i]);
  443. av_log(s->avctx, AV_LOG_DEBUG, "bit allocation quantizer: %i\n", s->bitalloc_huffman[i]);
  444. av_log(s->avctx, AV_LOG_DEBUG, "quant index huff:");
  445. for (j = 0; j < 11; j++)
  446. av_log(s->avctx, AV_LOG_DEBUG, " %i",
  447. s->quant_index_huffman[i][j]);
  448. av_log(s->avctx, AV_LOG_DEBUG, "\n");
  449. av_log(s->avctx, AV_LOG_DEBUG, "scalefac adj:");
  450. for (j = 0; j < 11; j++)
  451. av_log(s->avctx, AV_LOG_DEBUG, " %1.3f", s->scalefactor_adj[i][j]);
  452. av_log(s->avctx, AV_LOG_DEBUG, "\n");
  453. }
  454. #endif
  455. return 0;
  456. }
  457. static int dca_parse_frame_header(DCAContext * s)
  458. {
  459. init_get_bits(&s->gb, s->dca_buffer, s->dca_buffer_size * 8);
  460. /* Sync code */
  461. get_bits(&s->gb, 32);
  462. /* Frame header */
  463. s->frame_type = get_bits(&s->gb, 1);
  464. s->samples_deficit = get_bits(&s->gb, 5) + 1;
  465. s->crc_present = get_bits(&s->gb, 1);
  466. s->sample_blocks = get_bits(&s->gb, 7) + 1;
  467. s->frame_size = get_bits(&s->gb, 14) + 1;
  468. if (s->frame_size < 95)
  469. return -1;
  470. s->amode = get_bits(&s->gb, 6);
  471. s->sample_rate = dca_sample_rates[get_bits(&s->gb, 4)];
  472. if (!s->sample_rate)
  473. return -1;
  474. s->bit_rate_index = get_bits(&s->gb, 5);
  475. s->bit_rate = dca_bit_rates[s->bit_rate_index];
  476. if (!s->bit_rate)
  477. return -1;
  478. s->downmix = get_bits(&s->gb, 1);
  479. s->dynrange = get_bits(&s->gb, 1);
  480. s->timestamp = get_bits(&s->gb, 1);
  481. s->aux_data = get_bits(&s->gb, 1);
  482. s->hdcd = get_bits(&s->gb, 1);
  483. s->ext_descr = get_bits(&s->gb, 3);
  484. s->ext_coding = get_bits(&s->gb, 1);
  485. s->aspf = get_bits(&s->gb, 1);
  486. s->lfe = get_bits(&s->gb, 2);
  487. s->predictor_history = get_bits(&s->gb, 1);
  488. /* TODO: check CRC */
  489. if (s->crc_present)
  490. s->header_crc = get_bits(&s->gb, 16);
  491. s->multirate_inter = get_bits(&s->gb, 1);
  492. s->version = get_bits(&s->gb, 4);
  493. s->copy_history = get_bits(&s->gb, 2);
  494. s->source_pcm_res = get_bits(&s->gb, 3);
  495. s->front_sum = get_bits(&s->gb, 1);
  496. s->surround_sum = get_bits(&s->gb, 1);
  497. s->dialog_norm = get_bits(&s->gb, 4);
  498. /* FIXME: channels mixing levels */
  499. s->output = s->amode;
  500. if (s->lfe) s->output |= DCA_LFE;
  501. #ifdef TRACE
  502. av_log(s->avctx, AV_LOG_DEBUG, "frame type: %i\n", s->frame_type);
  503. av_log(s->avctx, AV_LOG_DEBUG, "samples deficit: %i\n", s->samples_deficit);
  504. av_log(s->avctx, AV_LOG_DEBUG, "crc present: %i\n", s->crc_present);
  505. av_log(s->avctx, AV_LOG_DEBUG, "sample blocks: %i (%i samples)\n",
  506. s->sample_blocks, s->sample_blocks * 32);
  507. av_log(s->avctx, AV_LOG_DEBUG, "frame size: %i bytes\n", s->frame_size);
  508. av_log(s->avctx, AV_LOG_DEBUG, "amode: %i (%i channels)\n",
  509. s->amode, dca_channels[s->amode]);
  510. av_log(s->avctx, AV_LOG_DEBUG, "sample rate: %i Hz\n",
  511. s->sample_rate);
  512. av_log(s->avctx, AV_LOG_DEBUG, "bit rate: %i bits/s\n",
  513. s->bit_rate);
  514. av_log(s->avctx, AV_LOG_DEBUG, "downmix: %i\n", s->downmix);
  515. av_log(s->avctx, AV_LOG_DEBUG, "dynrange: %i\n", s->dynrange);
  516. av_log(s->avctx, AV_LOG_DEBUG, "timestamp: %i\n", s->timestamp);
  517. av_log(s->avctx, AV_LOG_DEBUG, "aux_data: %i\n", s->aux_data);
  518. av_log(s->avctx, AV_LOG_DEBUG, "hdcd: %i\n", s->hdcd);
  519. av_log(s->avctx, AV_LOG_DEBUG, "ext descr: %i\n", s->ext_descr);
  520. av_log(s->avctx, AV_LOG_DEBUG, "ext coding: %i\n", s->ext_coding);
  521. av_log(s->avctx, AV_LOG_DEBUG, "aspf: %i\n", s->aspf);
  522. av_log(s->avctx, AV_LOG_DEBUG, "lfe: %i\n", s->lfe);
  523. av_log(s->avctx, AV_LOG_DEBUG, "predictor history: %i\n",
  524. s->predictor_history);
  525. av_log(s->avctx, AV_LOG_DEBUG, "header crc: %i\n", s->header_crc);
  526. av_log(s->avctx, AV_LOG_DEBUG, "multirate inter: %i\n",
  527. s->multirate_inter);
  528. av_log(s->avctx, AV_LOG_DEBUG, "version number: %i\n", s->version);
  529. av_log(s->avctx, AV_LOG_DEBUG, "copy history: %i\n", s->copy_history);
  530. av_log(s->avctx, AV_LOG_DEBUG,
  531. "source pcm resolution: %i (%i bits/sample)\n",
  532. s->source_pcm_res, dca_bits_per_sample[s->source_pcm_res]);
  533. av_log(s->avctx, AV_LOG_DEBUG, "front sum: %i\n", s->front_sum);
  534. av_log(s->avctx, AV_LOG_DEBUG, "surround sum: %i\n", s->surround_sum);
  535. av_log(s->avctx, AV_LOG_DEBUG, "dialog norm: %i\n", s->dialog_norm);
  536. av_log(s->avctx, AV_LOG_DEBUG, "\n");
  537. #endif
  538. /* Primary audio coding header */
  539. s->subframes = get_bits(&s->gb, 4) + 1;
  540. return dca_parse_audio_coding_header(s, 0);
  541. }
  542. static inline int get_scale(GetBitContext *gb, int level, int value)
  543. {
  544. if (level < 5) {
  545. /* huffman encoded */
  546. value += get_bitalloc(gb, &dca_scalefactor, level);
  547. } else if (level < 8)
  548. value = get_bits(gb, level + 1);
  549. return value;
  550. }
  551. static int dca_subframe_header(DCAContext * s, int base_channel, int block_index)
  552. {
  553. /* Primary audio coding side information */
  554. int j, k;
  555. if (get_bits_left(&s->gb) < 0)
  556. return -1;
  557. if (!base_channel) {
  558. s->subsubframes[s->current_subframe] = get_bits(&s->gb, 2) + 1;
  559. s->partial_samples[s->current_subframe] = get_bits(&s->gb, 3);
  560. }
  561. for (j = base_channel; j < s->prim_channels; j++) {
  562. for (k = 0; k < s->subband_activity[j]; k++)
  563. s->prediction_mode[j][k] = get_bits(&s->gb, 1);
  564. }
  565. /* Get prediction codebook */
  566. for (j = base_channel; j < s->prim_channels; j++) {
  567. for (k = 0; k < s->subband_activity[j]; k++) {
  568. if (s->prediction_mode[j][k] > 0) {
  569. /* (Prediction coefficient VQ address) */
  570. s->prediction_vq[j][k] = get_bits(&s->gb, 12);
  571. }
  572. }
  573. }
  574. /* Bit allocation index */
  575. for (j = base_channel; j < s->prim_channels; j++) {
  576. for (k = 0; k < s->vq_start_subband[j]; k++) {
  577. if (s->bitalloc_huffman[j] == 6)
  578. s->bitalloc[j][k] = get_bits(&s->gb, 5);
  579. else if (s->bitalloc_huffman[j] == 5)
  580. s->bitalloc[j][k] = get_bits(&s->gb, 4);
  581. else if (s->bitalloc_huffman[j] == 7) {
  582. av_log(s->avctx, AV_LOG_ERROR,
  583. "Invalid bit allocation index\n");
  584. return -1;
  585. } else {
  586. s->bitalloc[j][k] =
  587. get_bitalloc(&s->gb, &dca_bitalloc_index, s->bitalloc_huffman[j]);
  588. }
  589. if (s->bitalloc[j][k] > 26) {
  590. // av_log(s->avctx,AV_LOG_DEBUG,"bitalloc index [%i][%i] too big (%i)\n",
  591. // j, k, s->bitalloc[j][k]);
  592. return -1;
  593. }
  594. }
  595. }
  596. /* Transition mode */
  597. for (j = base_channel; j < s->prim_channels; j++) {
  598. for (k = 0; k < s->subband_activity[j]; k++) {
  599. s->transition_mode[j][k] = 0;
  600. if (s->subsubframes[s->current_subframe] > 1 &&
  601. k < s->vq_start_subband[j] && s->bitalloc[j][k] > 0) {
  602. s->transition_mode[j][k] =
  603. get_bitalloc(&s->gb, &dca_tmode, s->transient_huffman[j]);
  604. }
  605. }
  606. }
  607. if (get_bits_left(&s->gb) < 0)
  608. return -1;
  609. for (j = base_channel; j < s->prim_channels; j++) {
  610. const uint32_t *scale_table;
  611. int scale_sum;
  612. memset(s->scale_factor[j], 0, s->subband_activity[j] * sizeof(s->scale_factor[0][0][0]) * 2);
  613. if (s->scalefactor_huffman[j] == 6)
  614. scale_table = scale_factor_quant7;
  615. else
  616. scale_table = scale_factor_quant6;
  617. /* When huffman coded, only the difference is encoded */
  618. scale_sum = 0;
  619. for (k = 0; k < s->subband_activity[j]; k++) {
  620. if (k >= s->vq_start_subband[j] || s->bitalloc[j][k] > 0) {
  621. scale_sum = get_scale(&s->gb, s->scalefactor_huffman[j], scale_sum);
  622. s->scale_factor[j][k][0] = scale_table[scale_sum];
  623. }
  624. if (k < s->vq_start_subband[j] && s->transition_mode[j][k]) {
  625. /* Get second scale factor */
  626. scale_sum = get_scale(&s->gb, s->scalefactor_huffman[j], scale_sum);
  627. s->scale_factor[j][k][1] = scale_table[scale_sum];
  628. }
  629. }
  630. }
  631. /* Joint subband scale factor codebook select */
  632. for (j = base_channel; j < s->prim_channels; j++) {
  633. /* Transmitted only if joint subband coding enabled */
  634. if (s->joint_intensity[j] > 0)
  635. s->joint_huff[j] = get_bits(&s->gb, 3);
  636. }
  637. if (get_bits_left(&s->gb) < 0)
  638. return -1;
  639. /* Scale factors for joint subband coding */
  640. for (j = base_channel; j < s->prim_channels; j++) {
  641. int source_channel;
  642. /* Transmitted only if joint subband coding enabled */
  643. if (s->joint_intensity[j] > 0) {
  644. int scale = 0;
  645. source_channel = s->joint_intensity[j] - 1;
  646. /* When huffman coded, only the difference is encoded
  647. * (is this valid as well for joint scales ???) */
  648. for (k = s->subband_activity[j]; k < s->subband_activity[source_channel]; k++) {
  649. scale = get_scale(&s->gb, s->joint_huff[j], 0);
  650. scale += 64; /* bias */
  651. s->joint_scale_factor[j][k] = scale; /*joint_scale_table[scale]; */
  652. }
  653. if (!(s->debug_flag & 0x02)) {
  654. av_log(s->avctx, AV_LOG_DEBUG,
  655. "Joint stereo coding not supported\n");
  656. s->debug_flag |= 0x02;
  657. }
  658. }
  659. }
  660. /* Stereo downmix coefficients */
  661. if (!base_channel && s->prim_channels > 2) {
  662. if (s->downmix) {
  663. for (j = base_channel; j < s->prim_channels; j++) {
  664. s->downmix_coef[j][0] = get_bits(&s->gb, 7);
  665. s->downmix_coef[j][1] = get_bits(&s->gb, 7);
  666. }
  667. } else {
  668. int am = s->amode & DCA_CHANNEL_MASK;
  669. for (j = base_channel; j < s->prim_channels; j++) {
  670. s->downmix_coef[j][0] = dca_default_coeffs[am][j][0];
  671. s->downmix_coef[j][1] = dca_default_coeffs[am][j][1];
  672. }
  673. }
  674. }
  675. /* Dynamic range coefficient */
  676. if (!base_channel && s->dynrange)
  677. s->dynrange_coef = get_bits(&s->gb, 8);
  678. /* Side information CRC check word */
  679. if (s->crc_present) {
  680. get_bits(&s->gb, 16);
  681. }
  682. /*
  683. * Primary audio data arrays
  684. */
  685. /* VQ encoded high frequency subbands */
  686. for (j = base_channel; j < s->prim_channels; j++)
  687. for (k = s->vq_start_subband[j]; k < s->subband_activity[j]; k++)
  688. /* 1 vector -> 32 samples */
  689. s->high_freq_vq[j][k] = get_bits(&s->gb, 10);
  690. /* Low frequency effect data */
  691. if (!base_channel && s->lfe) {
  692. /* LFE samples */
  693. int lfe_samples = 2 * s->lfe * (4 + block_index);
  694. int lfe_end_sample = 2 * s->lfe * (4 + block_index + s->subsubframes[s->current_subframe]);
  695. float lfe_scale;
  696. for (j = lfe_samples; j < lfe_end_sample; j++) {
  697. /* Signed 8 bits int */
  698. s->lfe_data[j] = get_sbits(&s->gb, 8);
  699. }
  700. /* Scale factor index */
  701. s->lfe_scale_factor = scale_factor_quant7[get_bits(&s->gb, 8)];
  702. /* Quantization step size * scale factor */
  703. lfe_scale = 0.035 * s->lfe_scale_factor;
  704. for (j = lfe_samples; j < lfe_end_sample; j++)
  705. s->lfe_data[j] *= lfe_scale;
  706. }
  707. #ifdef TRACE
  708. av_log(s->avctx, AV_LOG_DEBUG, "subsubframes: %i\n", s->subsubframes[s->current_subframe]);
  709. av_log(s->avctx, AV_LOG_DEBUG, "partial samples: %i\n",
  710. s->partial_samples[s->current_subframe]);
  711. for (j = base_channel; j < s->prim_channels; j++) {
  712. av_log(s->avctx, AV_LOG_DEBUG, "prediction mode:");
  713. for (k = 0; k < s->subband_activity[j]; k++)
  714. av_log(s->avctx, AV_LOG_DEBUG, " %i", s->prediction_mode[j][k]);
  715. av_log(s->avctx, AV_LOG_DEBUG, "\n");
  716. }
  717. for (j = base_channel; j < s->prim_channels; j++) {
  718. for (k = 0; k < s->subband_activity[j]; k++)
  719. av_log(s->avctx, AV_LOG_DEBUG,
  720. "prediction coefs: %f, %f, %f, %f\n",
  721. (float) adpcm_vb[s->prediction_vq[j][k]][0] / 8192,
  722. (float) adpcm_vb[s->prediction_vq[j][k]][1] / 8192,
  723. (float) adpcm_vb[s->prediction_vq[j][k]][2] / 8192,
  724. (float) adpcm_vb[s->prediction_vq[j][k]][3] / 8192);
  725. }
  726. for (j = base_channel; j < s->prim_channels; j++) {
  727. av_log(s->avctx, AV_LOG_DEBUG, "bitalloc index: ");
  728. for (k = 0; k < s->vq_start_subband[j]; k++)
  729. av_log(s->avctx, AV_LOG_DEBUG, "%2.2i ", s->bitalloc[j][k]);
  730. av_log(s->avctx, AV_LOG_DEBUG, "\n");
  731. }
  732. for (j = base_channel; j < s->prim_channels; j++) {
  733. av_log(s->avctx, AV_LOG_DEBUG, "Transition mode:");
  734. for (k = 0; k < s->subband_activity[j]; k++)
  735. av_log(s->avctx, AV_LOG_DEBUG, " %i", s->transition_mode[j][k]);
  736. av_log(s->avctx, AV_LOG_DEBUG, "\n");
  737. }
  738. for (j = base_channel; j < s->prim_channels; j++) {
  739. av_log(s->avctx, AV_LOG_DEBUG, "Scale factor:");
  740. for (k = 0; k < s->subband_activity[j]; k++) {
  741. if (k >= s->vq_start_subband[j] || s->bitalloc[j][k] > 0)
  742. av_log(s->avctx, AV_LOG_DEBUG, " %i", s->scale_factor[j][k][0]);
  743. if (k < s->vq_start_subband[j] && s->transition_mode[j][k])
  744. av_log(s->avctx, AV_LOG_DEBUG, " %i(t)", s->scale_factor[j][k][1]);
  745. }
  746. av_log(s->avctx, AV_LOG_DEBUG, "\n");
  747. }
  748. for (j = base_channel; j < s->prim_channels; j++) {
  749. if (s->joint_intensity[j] > 0) {
  750. int source_channel = s->joint_intensity[j] - 1;
  751. av_log(s->avctx, AV_LOG_DEBUG, "Joint scale factor index:\n");
  752. for (k = s->subband_activity[j]; k < s->subband_activity[source_channel]; k++)
  753. av_log(s->avctx, AV_LOG_DEBUG, " %i", s->joint_scale_factor[j][k]);
  754. av_log(s->avctx, AV_LOG_DEBUG, "\n");
  755. }
  756. }
  757. if (!base_channel && s->prim_channels > 2 && s->downmix) {
  758. av_log(s->avctx, AV_LOG_DEBUG, "Downmix coeffs:\n");
  759. for (j = 0; j < s->prim_channels; j++) {
  760. av_log(s->avctx, AV_LOG_DEBUG, "Channel 0,%d = %f\n", j, dca_downmix_coeffs[s->downmix_coef[j][0]]);
  761. av_log(s->avctx, AV_LOG_DEBUG, "Channel 1,%d = %f\n", j, dca_downmix_coeffs[s->downmix_coef[j][1]]);
  762. }
  763. av_log(s->avctx, AV_LOG_DEBUG, "\n");
  764. }
  765. for (j = base_channel; j < s->prim_channels; j++)
  766. for (k = s->vq_start_subband[j]; k < s->subband_activity[j]; k++)
  767. av_log(s->avctx, AV_LOG_DEBUG, "VQ index: %i\n", s->high_freq_vq[j][k]);
  768. if (!base_channel && s->lfe) {
  769. int lfe_samples = 2 * s->lfe * (4 + block_index);
  770. int lfe_end_sample = 2 * s->lfe * (4 + block_index + s->subsubframes[s->current_subframe]);
  771. av_log(s->avctx, AV_LOG_DEBUG, "LFE samples:\n");
  772. for (j = lfe_samples; j < lfe_end_sample; j++)
  773. av_log(s->avctx, AV_LOG_DEBUG, " %f", s->lfe_data[j]);
  774. av_log(s->avctx, AV_LOG_DEBUG, "\n");
  775. }
  776. #endif
  777. return 0;
  778. }
  779. static void qmf_32_subbands(DCAContext * s, int chans,
  780. float samples_in[32][8], float *samples_out,
  781. float scale)
  782. {
  783. const float *prCoeff;
  784. int i;
  785. int sb_act = s->subband_activity[chans];
  786. int subindex;
  787. scale *= sqrt(1/8.0);
  788. /* Select filter */
  789. if (!s->multirate_inter) /* Non-perfect reconstruction */
  790. prCoeff = fir_32bands_nonperfect;
  791. else /* Perfect reconstruction */
  792. prCoeff = fir_32bands_perfect;
  793. for (i = sb_act; i < 32; i++)
  794. s->raXin[i] = 0.0;
  795. /* Reconstructed channel sample index */
  796. for (subindex = 0; subindex < 8; subindex++) {
  797. /* Load in one sample from each subband and clear inactive subbands */
  798. for (i = 0; i < sb_act; i++){
  799. unsigned sign = (i - 1) & 2;
  800. uint32_t v = AV_RN32A(&samples_in[i][subindex]) ^ sign << 30;
  801. AV_WN32A(&s->raXin[i], v);
  802. }
  803. s->synth.synth_filter_float(&s->imdct,
  804. s->subband_fir_hist[chans], &s->hist_index[chans],
  805. s->subband_fir_noidea[chans], prCoeff,
  806. samples_out, s->raXin, scale);
  807. samples_out+= 32;
  808. }
  809. }
  810. static void lfe_interpolation_fir(DCAContext *s, int decimation_select,
  811. int num_deci_sample, float *samples_in,
  812. float *samples_out, float scale)
  813. {
  814. /* samples_in: An array holding decimated samples.
  815. * Samples in current subframe starts from samples_in[0],
  816. * while samples_in[-1], samples_in[-2], ..., stores samples
  817. * from last subframe as history.
  818. *
  819. * samples_out: An array holding interpolated samples
  820. */
  821. int decifactor;
  822. const float *prCoeff;
  823. int deciindex;
  824. /* Select decimation filter */
  825. if (decimation_select == 1) {
  826. decifactor = 64;
  827. prCoeff = lfe_fir_128;
  828. } else {
  829. decifactor = 32;
  830. prCoeff = lfe_fir_64;
  831. }
  832. /* Interpolation */
  833. for (deciindex = 0; deciindex < num_deci_sample; deciindex++) {
  834. s->dcadsp.lfe_fir(samples_out, samples_in, prCoeff, decifactor,
  835. scale);
  836. samples_in++;
  837. samples_out += 2 * decifactor;
  838. }
  839. }
  840. /* downmixing routines */
  841. #define MIX_REAR1(samples, si1, rs, coef) \
  842. samples[i] += samples[si1] * coef[rs][0]; \
  843. samples[i+256] += samples[si1] * coef[rs][1];
  844. #define MIX_REAR2(samples, si1, si2, rs, coef) \
  845. samples[i] += samples[si1] * coef[rs][0] + samples[si2] * coef[rs+1][0]; \
  846. samples[i+256] += samples[si1] * coef[rs][1] + samples[si2] * coef[rs+1][1];
  847. #define MIX_FRONT3(samples, coef) \
  848. t = samples[i+c]; \
  849. u = samples[i+l]; \
  850. v = samples[i+r]; \
  851. samples[i] = t * coef[0][0] + u * coef[1][0] + v * coef[2][0]; \
  852. samples[i+256] = t * coef[0][1] + u * coef[1][1] + v * coef[2][1];
  853. #define DOWNMIX_TO_STEREO(op1, op2) \
  854. for (i = 0; i < 256; i++){ \
  855. op1 \
  856. op2 \
  857. }
  858. static void dca_downmix(float *samples, int srcfmt,
  859. int downmix_coef[DCA_PRIM_CHANNELS_MAX][2],
  860. const int8_t *channel_mapping)
  861. {
  862. int c,l,r,sl,sr,s;
  863. int i;
  864. float t, u, v;
  865. float coef[DCA_PRIM_CHANNELS_MAX][2];
  866. for (i=0; i<DCA_PRIM_CHANNELS_MAX; i++) {
  867. coef[i][0] = dca_downmix_coeffs[downmix_coef[i][0]];
  868. coef[i][1] = dca_downmix_coeffs[downmix_coef[i][1]];
  869. }
  870. switch (srcfmt) {
  871. case DCA_MONO:
  872. case DCA_CHANNEL:
  873. case DCA_STEREO_TOTAL:
  874. case DCA_STEREO_SUMDIFF:
  875. case DCA_4F2R:
  876. av_log(NULL, 0, "Not implemented!\n");
  877. break;
  878. case DCA_STEREO:
  879. break;
  880. case DCA_3F:
  881. c = channel_mapping[0] * 256;
  882. l = channel_mapping[1] * 256;
  883. r = channel_mapping[2] * 256;
  884. DOWNMIX_TO_STEREO(MIX_FRONT3(samples, coef),);
  885. break;
  886. case DCA_2F1R:
  887. s = channel_mapping[2] * 256;
  888. DOWNMIX_TO_STEREO(MIX_REAR1(samples, i + s, 2, coef),);
  889. break;
  890. case DCA_3F1R:
  891. c = channel_mapping[0] * 256;
  892. l = channel_mapping[1] * 256;
  893. r = channel_mapping[2] * 256;
  894. s = channel_mapping[3] * 256;
  895. DOWNMIX_TO_STEREO(MIX_FRONT3(samples, coef),
  896. MIX_REAR1(samples, i + s, 3, coef));
  897. break;
  898. case DCA_2F2R:
  899. sl = channel_mapping[2] * 256;
  900. sr = channel_mapping[3] * 256;
  901. DOWNMIX_TO_STEREO(MIX_REAR2(samples, i + sl, i + sr, 2, coef),);
  902. break;
  903. case DCA_3F2R:
  904. c = channel_mapping[0] * 256;
  905. l = channel_mapping[1] * 256;
  906. r = channel_mapping[2] * 256;
  907. sl = channel_mapping[3] * 256;
  908. sr = channel_mapping[4] * 256;
  909. DOWNMIX_TO_STEREO(MIX_FRONT3(samples, coef),
  910. MIX_REAR2(samples, i + sl, i + sr, 3, coef));
  911. break;
  912. }
  913. }
  914. /* Very compact version of the block code decoder that does not use table
  915. * look-up but is slightly slower */
  916. static int decode_blockcode(int code, int levels, int *values)
  917. {
  918. int i;
  919. int offset = (levels - 1) >> 1;
  920. for (i = 0; i < 4; i++) {
  921. int div = FASTDIV(code, levels);
  922. values[i] = code - offset - div*levels;
  923. code = div;
  924. }
  925. if (code == 0)
  926. return 0;
  927. else {
  928. av_log(NULL, AV_LOG_ERROR, "ERROR: block code look-up failed\n");
  929. return -1;
  930. }
  931. }
  932. static const uint8_t abits_sizes[7] = { 7, 10, 12, 13, 15, 17, 19 };
  933. static const uint8_t abits_levels[7] = { 3, 5, 7, 9, 13, 17, 25 };
  934. #ifndef int8x8_fmul_int32
  935. static inline void int8x8_fmul_int32(float *dst, const int8_t *src, int scale)
  936. {
  937. float fscale = scale / 16.0;
  938. int i;
  939. for (i = 0; i < 8; i++)
  940. dst[i] = src[i] * fscale;
  941. }
  942. #endif
  943. static int dca_subsubframe(DCAContext * s, int base_channel, int block_index)
  944. {
  945. int k, l;
  946. int subsubframe = s->current_subsubframe;
  947. const float *quant_step_table;
  948. /* FIXME */
  949. float (*subband_samples)[DCA_SUBBANDS][8] = s->subband_samples[block_index];
  950. LOCAL_ALIGNED_16(int, block, [8]);
  951. /*
  952. * Audio data
  953. */
  954. /* Select quantization step size table */
  955. if (s->bit_rate_index == 0x1f)
  956. quant_step_table = lossless_quant_d;
  957. else
  958. quant_step_table = lossy_quant_d;
  959. for (k = base_channel; k < s->prim_channels; k++) {
  960. if (get_bits_left(&s->gb) < 0)
  961. return -1;
  962. for (l = 0; l < s->vq_start_subband[k]; l++) {
  963. int m;
  964. /* Select the mid-tread linear quantizer */
  965. int abits = s->bitalloc[k][l];
  966. float quant_step_size = quant_step_table[abits];
  967. /*
  968. * Determine quantization index code book and its type
  969. */
  970. /* Select quantization index code book */
  971. int sel = s->quant_index_huffman[k][abits];
  972. /*
  973. * Extract bits from the bit stream
  974. */
  975. if (!abits){
  976. memset(subband_samples[k][l], 0, 8 * sizeof(subband_samples[0][0][0]));
  977. } else {
  978. /* Deal with transients */
  979. int sfi = s->transition_mode[k][l] && subsubframe >= s->transition_mode[k][l];
  980. float rscale = quant_step_size * s->scale_factor[k][l][sfi] * s->scalefactor_adj[k][sel];
  981. if (abits >= 11 || !dca_smpl_bitalloc[abits].vlc[sel].table){
  982. if (abits <= 7){
  983. /* Block code */
  984. int block_code1, block_code2, size, levels;
  985. size = abits_sizes[abits-1];
  986. levels = abits_levels[abits-1];
  987. block_code1 = get_bits(&s->gb, size);
  988. /* FIXME Should test return value */
  989. decode_blockcode(block_code1, levels, block);
  990. block_code2 = get_bits(&s->gb, size);
  991. decode_blockcode(block_code2, levels, &block[4]);
  992. }else{
  993. /* no coding */
  994. for (m = 0; m < 8; m++)
  995. block[m] = get_sbits(&s->gb, abits - 3);
  996. }
  997. }else{
  998. /* Huffman coded */
  999. for (m = 0; m < 8; m++)
  1000. block[m] = get_bitalloc(&s->gb, &dca_smpl_bitalloc[abits], sel);
  1001. }
  1002. s->fmt_conv.int32_to_float_fmul_scalar(subband_samples[k][l],
  1003. block, rscale, 8);
  1004. }
  1005. /*
  1006. * Inverse ADPCM if in prediction mode
  1007. */
  1008. if (s->prediction_mode[k][l]) {
  1009. int n;
  1010. for (m = 0; m < 8; m++) {
  1011. for (n = 1; n <= 4; n++)
  1012. if (m >= n)
  1013. subband_samples[k][l][m] +=
  1014. (adpcm_vb[s->prediction_vq[k][l]][n - 1] *
  1015. subband_samples[k][l][m - n] / 8192);
  1016. else if (s->predictor_history)
  1017. subband_samples[k][l][m] +=
  1018. (adpcm_vb[s->prediction_vq[k][l]][n - 1] *
  1019. s->subband_samples_hist[k][l][m - n +
  1020. 4] / 8192);
  1021. }
  1022. }
  1023. }
  1024. /*
  1025. * Decode VQ encoded high frequencies
  1026. */
  1027. for (l = s->vq_start_subband[k]; l < s->subband_activity[k]; l++) {
  1028. /* 1 vector -> 32 samples but we only need the 8 samples
  1029. * for this subsubframe. */
  1030. int hfvq = s->high_freq_vq[k][l];
  1031. if (!s->debug_flag & 0x01) {
  1032. av_log(s->avctx, AV_LOG_DEBUG, "Stream with high frequencies VQ coding\n");
  1033. s->debug_flag |= 0x01;
  1034. }
  1035. int8x8_fmul_int32(subband_samples[k][l],
  1036. &high_freq_vq[hfvq][subsubframe * 8],
  1037. s->scale_factor[k][l][0]);
  1038. }
  1039. }
  1040. /* Check for DSYNC after subsubframe */
  1041. if (s->aspf || subsubframe == s->subsubframes[s->current_subframe] - 1) {
  1042. if (0xFFFF == get_bits(&s->gb, 16)) { /* 0xFFFF */
  1043. #ifdef TRACE
  1044. av_log(s->avctx, AV_LOG_DEBUG, "Got subframe DSYNC\n");
  1045. #endif
  1046. } else {
  1047. av_log(s->avctx, AV_LOG_ERROR, "Didn't get subframe DSYNC\n");
  1048. }
  1049. }
  1050. /* Backup predictor history for adpcm */
  1051. for (k = base_channel; k < s->prim_channels; k++)
  1052. for (l = 0; l < s->vq_start_subband[k]; l++)
  1053. memcpy(s->subband_samples_hist[k][l], &subband_samples[k][l][4],
  1054. 4 * sizeof(subband_samples[0][0][0]));
  1055. return 0;
  1056. }
  1057. static int dca_filter_channels(DCAContext * s, int block_index)
  1058. {
  1059. float (*subband_samples)[DCA_SUBBANDS][8] = s->subband_samples[block_index];
  1060. int k;
  1061. /* 32 subbands QMF */
  1062. for (k = 0; k < s->prim_channels; k++) {
  1063. /* static float pcm_to_double[8] =
  1064. {32768.0, 32768.0, 524288.0, 524288.0, 0, 8388608.0, 8388608.0};*/
  1065. qmf_32_subbands(s, k, subband_samples[k], &s->samples[256 * s->channel_order_tab[k]],
  1066. M_SQRT1_2*s->scale_bias /*pcm_to_double[s->source_pcm_res] */ );
  1067. }
  1068. /* Down mixing */
  1069. if (s->avctx->request_channels == 2 && s->prim_channels > 2) {
  1070. dca_downmix(s->samples, s->amode, s->downmix_coef, s->channel_order_tab);
  1071. }
  1072. /* Generate LFE samples for this subsubframe FIXME!!! */
  1073. if (s->output & DCA_LFE) {
  1074. lfe_interpolation_fir(s, s->lfe, 2 * s->lfe,
  1075. s->lfe_data + 2 * s->lfe * (block_index + 4),
  1076. &s->samples[256 * dca_lfe_index[s->amode]],
  1077. (1.0/256.0)*s->scale_bias);
  1078. /* Outputs 20bits pcm samples */
  1079. }
  1080. return 0;
  1081. }
  1082. static int dca_subframe_footer(DCAContext * s, int base_channel)
  1083. {
  1084. int aux_data_count = 0, i;
  1085. /*
  1086. * Unpack optional information
  1087. */
  1088. /* presumably optional information only appears in the core? */
  1089. if (!base_channel) {
  1090. if (s->timestamp)
  1091. get_bits(&s->gb, 32);
  1092. if (s->aux_data)
  1093. aux_data_count = get_bits(&s->gb, 6);
  1094. for (i = 0; i < aux_data_count; i++)
  1095. get_bits(&s->gb, 8);
  1096. if (s->crc_present && (s->downmix || s->dynrange))
  1097. get_bits(&s->gb, 16);
  1098. }
  1099. return 0;
  1100. }
  1101. /**
  1102. * Decode a dca frame block
  1103. *
  1104. * @param s pointer to the DCAContext
  1105. */
  1106. static int dca_decode_block(DCAContext * s, int base_channel, int block_index)
  1107. {
  1108. /* Sanity check */
  1109. if (s->current_subframe >= s->subframes) {
  1110. av_log(s->avctx, AV_LOG_DEBUG, "check failed: %i>%i",
  1111. s->current_subframe, s->subframes);
  1112. return -1;
  1113. }
  1114. if (!s->current_subsubframe) {
  1115. #ifdef TRACE
  1116. av_log(s->avctx, AV_LOG_DEBUG, "DSYNC dca_subframe_header\n");
  1117. #endif
  1118. /* Read subframe header */
  1119. if (dca_subframe_header(s, base_channel, block_index))
  1120. return -1;
  1121. }
  1122. /* Read subsubframe */
  1123. #ifdef TRACE
  1124. av_log(s->avctx, AV_LOG_DEBUG, "DSYNC dca_subsubframe\n");
  1125. #endif
  1126. if (dca_subsubframe(s, base_channel, block_index))
  1127. return -1;
  1128. /* Update state */
  1129. s->current_subsubframe++;
  1130. if (s->current_subsubframe >= s->subsubframes[s->current_subframe]) {
  1131. s->current_subsubframe = 0;
  1132. s->current_subframe++;
  1133. }
  1134. if (s->current_subframe >= s->subframes) {
  1135. #ifdef TRACE
  1136. av_log(s->avctx, AV_LOG_DEBUG, "DSYNC dca_subframe_footer\n");
  1137. #endif
  1138. /* Read subframe footer */
  1139. if (dca_subframe_footer(s, base_channel))
  1140. return -1;
  1141. }
  1142. return 0;
  1143. }
  1144. /**
  1145. * Convert bitstream to one representation based on sync marker
  1146. */
  1147. static int dca_convert_bitstream(const uint8_t * src, int src_size, uint8_t * dst,
  1148. int max_size)
  1149. {
  1150. uint32_t mrk;
  1151. int i, tmp;
  1152. const uint16_t *ssrc = (const uint16_t *) src;
  1153. uint16_t *sdst = (uint16_t *) dst;
  1154. PutBitContext pb;
  1155. if ((unsigned)src_size > (unsigned)max_size) {
  1156. // av_log(NULL, AV_LOG_ERROR, "Input frame size larger than DCA_MAX_FRAME_SIZE!\n");
  1157. // return -1;
  1158. src_size = max_size;
  1159. }
  1160. mrk = AV_RB32(src);
  1161. switch (mrk) {
  1162. case DCA_MARKER_RAW_BE:
  1163. memcpy(dst, src, src_size);
  1164. return src_size;
  1165. case DCA_MARKER_RAW_LE:
  1166. for (i = 0; i < (src_size + 1) >> 1; i++)
  1167. *sdst++ = av_bswap16(*ssrc++);
  1168. return src_size;
  1169. case DCA_MARKER_14B_BE:
  1170. case DCA_MARKER_14B_LE:
  1171. init_put_bits(&pb, dst, max_size);
  1172. for (i = 0; i < (src_size + 1) >> 1; i++, src += 2) {
  1173. tmp = ((mrk == DCA_MARKER_14B_BE) ? AV_RB16(src) : AV_RL16(src)) & 0x3FFF;
  1174. put_bits(&pb, 14, tmp);
  1175. }
  1176. flush_put_bits(&pb);
  1177. return (put_bits_count(&pb) + 7) >> 3;
  1178. default:
  1179. return -1;
  1180. }
  1181. }
  1182. /**
  1183. * Return the number of channels in an ExSS speaker mask (HD)
  1184. */
  1185. static int dca_exss_mask2count(int mask)
  1186. {
  1187. /* count bits that mean speaker pairs twice */
  1188. return av_popcount(mask)
  1189. + av_popcount(mask & (
  1190. DCA_EXSS_CENTER_LEFT_RIGHT
  1191. | DCA_EXSS_FRONT_LEFT_RIGHT
  1192. | DCA_EXSS_FRONT_HIGH_LEFT_RIGHT
  1193. | DCA_EXSS_WIDE_LEFT_RIGHT
  1194. | DCA_EXSS_SIDE_LEFT_RIGHT
  1195. | DCA_EXSS_SIDE_HIGH_LEFT_RIGHT
  1196. | DCA_EXSS_SIDE_REAR_LEFT_RIGHT
  1197. | DCA_EXSS_REAR_LEFT_RIGHT
  1198. | DCA_EXSS_REAR_HIGH_LEFT_RIGHT
  1199. ));
  1200. }
  1201. /**
  1202. * Skip mixing coefficients of a single mix out configuration (HD)
  1203. */
  1204. static void dca_exss_skip_mix_coeffs(GetBitContext *gb, int channels, int out_ch)
  1205. {
  1206. int i;
  1207. for (i = 0; i < channels; i++) {
  1208. int mix_map_mask = get_bits(gb, out_ch);
  1209. int num_coeffs = av_popcount(mix_map_mask);
  1210. skip_bits_long(gb, num_coeffs * 6);
  1211. }
  1212. }
  1213. /**
  1214. * Parse extension substream asset header (HD)
  1215. */
  1216. static int dca_exss_parse_asset_header(DCAContext *s)
  1217. {
  1218. int header_pos = get_bits_count(&s->gb);
  1219. int header_size;
  1220. int channels;
  1221. int embedded_stereo = 0;
  1222. int embedded_6ch = 0;
  1223. int drc_code_present;
  1224. int extensions_mask;
  1225. int i, j;
  1226. if (get_bits_left(&s->gb) < 16)
  1227. return -1;
  1228. /* We will parse just enough to get to the extensions bitmask with which
  1229. * we can set the profile value. */
  1230. header_size = get_bits(&s->gb, 9) + 1;
  1231. skip_bits(&s->gb, 3); // asset index
  1232. if (s->static_fields) {
  1233. if (get_bits1(&s->gb))
  1234. skip_bits(&s->gb, 4); // asset type descriptor
  1235. if (get_bits1(&s->gb))
  1236. skip_bits_long(&s->gb, 24); // language descriptor
  1237. if (get_bits1(&s->gb)) {
  1238. /* How can one fit 1024 bytes of text here if the maximum value
  1239. * for the asset header size field above was 512 bytes? */
  1240. int text_length = get_bits(&s->gb, 10) + 1;
  1241. if (get_bits_left(&s->gb) < text_length * 8)
  1242. return -1;
  1243. skip_bits_long(&s->gb, text_length * 8); // info text
  1244. }
  1245. skip_bits(&s->gb, 5); // bit resolution - 1
  1246. skip_bits(&s->gb, 4); // max sample rate code
  1247. channels = get_bits(&s->gb, 8) + 1;
  1248. if (get_bits1(&s->gb)) { // 1-to-1 channels to speakers
  1249. int spkr_remap_sets;
  1250. int spkr_mask_size = 16;
  1251. int num_spkrs[7];
  1252. if (channels > 2)
  1253. embedded_stereo = get_bits1(&s->gb);
  1254. if (channels > 6)
  1255. embedded_6ch = get_bits1(&s->gb);
  1256. if (get_bits1(&s->gb)) {
  1257. spkr_mask_size = (get_bits(&s->gb, 2) + 1) << 2;
  1258. skip_bits(&s->gb, spkr_mask_size); // spkr activity mask
  1259. }
  1260. spkr_remap_sets = get_bits(&s->gb, 3);
  1261. for (i = 0; i < spkr_remap_sets; i++) {
  1262. /* std layout mask for each remap set */
  1263. num_spkrs[i] = dca_exss_mask2count(get_bits(&s->gb, spkr_mask_size));
  1264. }
  1265. for (i = 0; i < spkr_remap_sets; i++) {
  1266. int num_dec_ch_remaps = get_bits(&s->gb, 5) + 1;
  1267. if (get_bits_left(&s->gb) < 0)
  1268. return -1;
  1269. for (j = 0; j < num_spkrs[i]; j++) {
  1270. int remap_dec_ch_mask = get_bits_long(&s->gb, num_dec_ch_remaps);
  1271. int num_dec_ch = av_popcount(remap_dec_ch_mask);
  1272. skip_bits_long(&s->gb, num_dec_ch * 5); // remap codes
  1273. }
  1274. }
  1275. } else {
  1276. skip_bits(&s->gb, 3); // representation type
  1277. }
  1278. }
  1279. drc_code_present = get_bits1(&s->gb);
  1280. if (drc_code_present)
  1281. get_bits(&s->gb, 8); // drc code
  1282. if (get_bits1(&s->gb))
  1283. skip_bits(&s->gb, 5); // dialog normalization code
  1284. if (drc_code_present && embedded_stereo)
  1285. get_bits(&s->gb, 8); // drc stereo code
  1286. if (s->mix_metadata && get_bits1(&s->gb)) {
  1287. skip_bits(&s->gb, 1); // external mix
  1288. skip_bits(&s->gb, 6); // post mix gain code
  1289. if (get_bits(&s->gb, 2) != 3) // mixer drc code
  1290. skip_bits(&s->gb, 3); // drc limit
  1291. else
  1292. skip_bits(&s->gb, 8); // custom drc code
  1293. if (get_bits1(&s->gb)) // channel specific scaling
  1294. for (i = 0; i < s->num_mix_configs; i++)
  1295. skip_bits_long(&s->gb, s->mix_config_num_ch[i] * 6); // scale codes
  1296. else
  1297. skip_bits_long(&s->gb, s->num_mix_configs * 6); // scale codes
  1298. for (i = 0; i < s->num_mix_configs; i++) {
  1299. if (get_bits_left(&s->gb) < 0)
  1300. return -1;
  1301. dca_exss_skip_mix_coeffs(&s->gb, channels, s->mix_config_num_ch[i]);
  1302. if (embedded_6ch)
  1303. dca_exss_skip_mix_coeffs(&s->gb, 6, s->mix_config_num_ch[i]);
  1304. if (embedded_stereo)
  1305. dca_exss_skip_mix_coeffs(&s->gb, 2, s->mix_config_num_ch[i]);
  1306. }
  1307. }
  1308. switch (get_bits(&s->gb, 2)) {
  1309. case 0: extensions_mask = get_bits(&s->gb, 12); break;
  1310. case 1: extensions_mask = DCA_EXT_EXSS_XLL; break;
  1311. case 2: extensions_mask = DCA_EXT_EXSS_LBR; break;
  1312. case 3: extensions_mask = 0; /* aux coding */ break;
  1313. }
  1314. /* not parsed further, we were only interested in the extensions mask */
  1315. if (get_bits_left(&s->gb) < 0)
  1316. return -1;
  1317. if (get_bits_count(&s->gb) - header_pos > header_size * 8) {
  1318. av_log(s->avctx, AV_LOG_WARNING, "Asset header size mismatch.\n");
  1319. return -1;
  1320. }
  1321. skip_bits_long(&s->gb, header_pos + header_size * 8 - get_bits_count(&s->gb));
  1322. if (extensions_mask & DCA_EXT_EXSS_XLL)
  1323. s->profile = FF_PROFILE_DTS_HD_MA;
  1324. else if (extensions_mask & (DCA_EXT_EXSS_XBR | DCA_EXT_EXSS_X96 |
  1325. DCA_EXT_EXSS_XXCH))
  1326. s->profile = FF_PROFILE_DTS_HD_HRA;
  1327. if (!(extensions_mask & DCA_EXT_CORE))
  1328. av_log(s->avctx, AV_LOG_WARNING, "DTS core detection mismatch.\n");
  1329. if ((extensions_mask & DCA_CORE_EXTS) != s->core_ext_mask)
  1330. av_log(s->avctx, AV_LOG_WARNING, "DTS extensions detection mismatch (%d, %d)\n",
  1331. extensions_mask & DCA_CORE_EXTS, s->core_ext_mask);
  1332. return 0;
  1333. }
  1334. /**
  1335. * Parse extension substream header (HD)
  1336. */
  1337. static void dca_exss_parse_header(DCAContext *s)
  1338. {
  1339. int ss_index;
  1340. int blownup;
  1341. int num_audiop = 1;
  1342. int num_assets = 1;
  1343. int active_ss_mask[8];
  1344. int i, j;
  1345. if (get_bits_left(&s->gb) < 52)
  1346. return;
  1347. skip_bits(&s->gb, 8); // user data
  1348. ss_index = get_bits(&s->gb, 2);
  1349. blownup = get_bits1(&s->gb);
  1350. skip_bits(&s->gb, 8 + 4 * blownup); // header_size
  1351. skip_bits(&s->gb, 16 + 4 * blownup); // hd_size
  1352. s->static_fields = get_bits1(&s->gb);
  1353. if (s->static_fields) {
  1354. skip_bits(&s->gb, 2); // reference clock code
  1355. skip_bits(&s->gb, 3); // frame duration code
  1356. if (get_bits1(&s->gb))
  1357. skip_bits_long(&s->gb, 36); // timestamp
  1358. /* a single stream can contain multiple audio assets that can be
  1359. * combined to form multiple audio presentations */
  1360. num_audiop = get_bits(&s->gb, 3) + 1;
  1361. if (num_audiop > 1) {
  1362. av_log_ask_for_sample(s->avctx, "Multiple DTS-HD audio presentations.");
  1363. /* ignore such streams for now */
  1364. return;
  1365. }
  1366. num_assets = get_bits(&s->gb, 3) + 1;
  1367. if (num_assets > 1) {
  1368. av_log_ask_for_sample(s->avctx, "Multiple DTS-HD audio assets.");
  1369. /* ignore such streams for now */
  1370. return;
  1371. }
  1372. for (i = 0; i < num_audiop; i++)
  1373. active_ss_mask[i] = get_bits(&s->gb, ss_index + 1);
  1374. for (i = 0; i < num_audiop; i++)
  1375. for (j = 0; j <= ss_index; j++)
  1376. if (active_ss_mask[i] & (1 << j))
  1377. skip_bits(&s->gb, 8); // active asset mask
  1378. s->mix_metadata = get_bits1(&s->gb);
  1379. if (s->mix_metadata) {
  1380. int mix_out_mask_size;
  1381. skip_bits(&s->gb, 2); // adjustment level
  1382. mix_out_mask_size = (get_bits(&s->gb, 2) + 1) << 2;
  1383. s->num_mix_configs = get_bits(&s->gb, 2) + 1;
  1384. for (i = 0; i < s->num_mix_configs; i++) {
  1385. int mix_out_mask = get_bits(&s->gb, mix_out_mask_size);
  1386. s->mix_config_num_ch[i] = dca_exss_mask2count(mix_out_mask);
  1387. }
  1388. }
  1389. }
  1390. for (i = 0; i < num_assets; i++)
  1391. skip_bits_long(&s->gb, 16 + 4 * blownup); // asset size
  1392. for (i = 0; i < num_assets; i++) {
  1393. if (dca_exss_parse_asset_header(s))
  1394. return;
  1395. }
  1396. /* not parsed further, we were only interested in the extensions mask
  1397. * from the asset header */
  1398. }
  1399. /**
  1400. * Main frame decoding function
  1401. * FIXME add arguments
  1402. */
  1403. static int dca_decode_frame(AVCodecContext * avctx,
  1404. void *data, int *data_size,
  1405. AVPacket *avpkt)
  1406. {
  1407. const uint8_t *buf = avpkt->data;
  1408. int buf_size = avpkt->size;
  1409. int lfe_samples;
  1410. int num_core_channels = 0;
  1411. int i;
  1412. float *samples_flt = data;
  1413. int16_t *samples_s16 = data;
  1414. int out_size;
  1415. DCAContext *s = avctx->priv_data;
  1416. int channels;
  1417. int core_ss_end;
  1418. s->xch_present = 0;
  1419. s->dca_buffer_size = dca_convert_bitstream(buf, buf_size, s->dca_buffer,
  1420. DCA_MAX_FRAME_SIZE + DCA_MAX_EXSS_HEADER_SIZE);
  1421. if (s->dca_buffer_size == -1) {
  1422. av_log(avctx, AV_LOG_ERROR, "Not a valid DCA frame\n");
  1423. return -1;
  1424. }
  1425. init_get_bits(&s->gb, s->dca_buffer, s->dca_buffer_size * 8);
  1426. if (dca_parse_frame_header(s) < 0) {
  1427. //seems like the frame is corrupt, try with the next one
  1428. *data_size=0;
  1429. return buf_size;
  1430. }
  1431. //set AVCodec values with parsed data
  1432. avctx->sample_rate = s->sample_rate;
  1433. avctx->bit_rate = s->bit_rate;
  1434. avctx->frame_size = s->sample_blocks * 32;
  1435. s->profile = FF_PROFILE_DTS;
  1436. for (i = 0; i < (s->sample_blocks / 8); i++) {
  1437. dca_decode_block(s, 0, i);
  1438. }
  1439. /* record number of core channels incase less than max channels are requested */
  1440. num_core_channels = s->prim_channels;
  1441. if (s->ext_coding)
  1442. s->core_ext_mask = dca_ext_audio_descr_mask[s->ext_descr];
  1443. else
  1444. s->core_ext_mask = 0;
  1445. core_ss_end = FFMIN(s->frame_size, s->dca_buffer_size) * 8;
  1446. /* only scan for extensions if ext_descr was unknown or indicated a
  1447. * supported XCh extension */
  1448. if (s->core_ext_mask < 0 || s->core_ext_mask & DCA_EXT_XCH) {
  1449. /* if ext_descr was unknown, clear s->core_ext_mask so that the
  1450. * extensions scan can fill it up */
  1451. s->core_ext_mask = FFMAX(s->core_ext_mask, 0);
  1452. /* extensions start at 32-bit boundaries into bitstream */
  1453. skip_bits_long(&s->gb, (-get_bits_count(&s->gb)) & 31);
  1454. while(core_ss_end - get_bits_count(&s->gb) >= 32) {
  1455. uint32_t bits = get_bits_long(&s->gb, 32);
  1456. switch(bits) {
  1457. case 0x5a5a5a5a: {
  1458. int ext_amode, xch_fsize;
  1459. s->xch_base_channel = s->prim_channels;
  1460. /* validate sync word using XCHFSIZE field */
  1461. xch_fsize = show_bits(&s->gb, 10);
  1462. if((s->frame_size != (get_bits_count(&s->gb) >> 3) - 4 + xch_fsize) &&
  1463. (s->frame_size != (get_bits_count(&s->gb) >> 3) - 4 + xch_fsize + 1))
  1464. continue;
  1465. /* skip length-to-end-of-frame field for the moment */
  1466. skip_bits(&s->gb, 10);
  1467. s->core_ext_mask |= DCA_EXT_XCH;
  1468. /* extension amode should == 1, number of channels in extension */
  1469. /* AFAIK XCh is not used for more channels */
  1470. if ((ext_amode = get_bits(&s->gb, 4)) != 1) {
  1471. av_log(avctx, AV_LOG_ERROR, "XCh extension amode %d not"
  1472. " supported!\n",ext_amode);
  1473. continue;
  1474. }
  1475. /* much like core primary audio coding header */
  1476. dca_parse_audio_coding_header(s, s->xch_base_channel);
  1477. for (i = 0; i < (s->sample_blocks / 8); i++) {
  1478. dca_decode_block(s, s->xch_base_channel, i);
  1479. }
  1480. s->xch_present = 1;
  1481. break;
  1482. }
  1483. case 0x47004a03:
  1484. /* XXCh: extended channels */
  1485. /* usually found either in core or HD part in DTS-HD HRA streams,
  1486. * but not in DTS-ES which contains XCh extensions instead */
  1487. s->core_ext_mask |= DCA_EXT_XXCH;
  1488. break;
  1489. case 0x1d95f262: {
  1490. int fsize96 = show_bits(&s->gb, 12) + 1;
  1491. if (s->frame_size != (get_bits_count(&s->gb) >> 3) - 4 + fsize96)
  1492. continue;
  1493. av_log(avctx, AV_LOG_DEBUG, "X96 extension found at %d bits\n", get_bits_count(&s->gb));
  1494. skip_bits(&s->gb, 12);
  1495. av_log(avctx, AV_LOG_DEBUG, "FSIZE96 = %d bytes\n", fsize96);
  1496. av_log(avctx, AV_LOG_DEBUG, "REVNO = %d\n", get_bits(&s->gb, 4));
  1497. s->core_ext_mask |= DCA_EXT_X96;
  1498. break;
  1499. }
  1500. }
  1501. skip_bits_long(&s->gb, (-get_bits_count(&s->gb)) & 31);
  1502. }
  1503. } else {
  1504. /* no supported extensions, skip the rest of the core substream */
  1505. skip_bits_long(&s->gb, core_ss_end - get_bits_count(&s->gb));
  1506. }
  1507. if (s->core_ext_mask & DCA_EXT_X96)
  1508. s->profile = FF_PROFILE_DTS_96_24;
  1509. else if (s->core_ext_mask & (DCA_EXT_XCH | DCA_EXT_XXCH))
  1510. s->profile = FF_PROFILE_DTS_ES;
  1511. /* check for ExSS (HD part) */
  1512. if (s->dca_buffer_size - s->frame_size > 32
  1513. && get_bits_long(&s->gb, 32) == DCA_HD_MARKER)
  1514. dca_exss_parse_header(s);
  1515. avctx->profile = s->profile;
  1516. channels = s->prim_channels + !!s->lfe;
  1517. if (s->amode<16) {
  1518. avctx->channel_layout = dca_core_channel_layout[s->amode];
  1519. if (s->xch_present && (!avctx->request_channels ||
  1520. avctx->request_channels > num_core_channels + !!s->lfe)) {
  1521. avctx->channel_layout |= AV_CH_BACK_CENTER;
  1522. if (s->lfe) {
  1523. avctx->channel_layout |= AV_CH_LOW_FREQUENCY;
  1524. s->channel_order_tab = dca_channel_reorder_lfe_xch[s->amode];
  1525. } else {
  1526. s->channel_order_tab = dca_channel_reorder_nolfe_xch[s->amode];
  1527. }
  1528. } else {
  1529. channels = num_core_channels + !!s->lfe;
  1530. s->xch_present = 0; /* disable further xch processing */
  1531. if (s->lfe) {
  1532. avctx->channel_layout |= AV_CH_LOW_FREQUENCY;
  1533. s->channel_order_tab = dca_channel_reorder_lfe[s->amode];
  1534. } else
  1535. s->channel_order_tab = dca_channel_reorder_nolfe[s->amode];
  1536. }
  1537. if (channels > !!s->lfe &&
  1538. s->channel_order_tab[channels - 1 - !!s->lfe] < 0)
  1539. return -1;
  1540. if (avctx->request_channels == 2 && s->prim_channels > 2) {
  1541. channels = 2;
  1542. s->output = DCA_STEREO;
  1543. avctx->channel_layout = AV_CH_LAYOUT_STEREO;
  1544. }
  1545. else if (avctx->request_channel_layout & AV_CH_LAYOUT_NATIVE) {
  1546. static const int8_t dca_channel_order_native[9] = { 0, 1, 2, 3, 4, 5, 6, 7, 8 };
  1547. s->channel_order_tab = dca_channel_order_native;
  1548. }
  1549. } else {
  1550. av_log(avctx, AV_LOG_ERROR, "Non standard configuration %d !\n",s->amode);
  1551. return -1;
  1552. }
  1553. /* There is nothing that prevents a dts frame to change channel configuration
  1554. but FFmpeg doesn't support that so only set the channels if it is previously
  1555. unset. Ideally during the first probe for channels the crc should be checked
  1556. and only set avctx->channels when the crc is ok. Right now the decoder could
  1557. set the channels based on a broken first frame.*/
  1558. if (s->is_channels_set == 0) {
  1559. s->is_channels_set = 1;
  1560. avctx->channels = channels;
  1561. }
  1562. if (avctx->channels != channels) {
  1563. av_log(avctx, AV_LOG_ERROR, "DCA decoder does not support number of "
  1564. "channels changing in stream. Skipping frame.\n");
  1565. return -1;
  1566. }
  1567. out_size = 256 / 8 * s->sample_blocks * channels *
  1568. av_get_bytes_per_sample(avctx->sample_fmt);
  1569. if (*data_size < out_size)
  1570. return -1;
  1571. *data_size = out_size;
  1572. /* filter to get final output */
  1573. for (i = 0; i < (s->sample_blocks / 8); i++) {
  1574. dca_filter_channels(s, i);
  1575. /* If this was marked as a DTS-ES stream we need to subtract back- */
  1576. /* channel from SL & SR to remove matrixed back-channel signal */
  1577. if((s->source_pcm_res & 1) && s->xch_present) {
  1578. float* back_chan = s->samples + s->channel_order_tab[s->xch_base_channel] * 256;
  1579. float* lt_chan = s->samples + s->channel_order_tab[s->xch_base_channel - 2] * 256;
  1580. float* rt_chan = s->samples + s->channel_order_tab[s->xch_base_channel - 1] * 256;
  1581. s->dsp.vector_fmac_scalar(lt_chan, back_chan, -M_SQRT1_2, 256);
  1582. s->dsp.vector_fmac_scalar(rt_chan, back_chan, -M_SQRT1_2, 256);
  1583. }
  1584. if (avctx->sample_fmt == AV_SAMPLE_FMT_FLT) {
  1585. s->fmt_conv.float_interleave(samples_flt, s->samples_chanptr, 256,
  1586. channels);
  1587. samples_flt += 256 * channels;
  1588. } else {
  1589. s->fmt_conv.float_to_int16_interleave(samples_s16,
  1590. s->samples_chanptr, 256,
  1591. channels);
  1592. samples_s16 += 256 * channels;
  1593. }
  1594. }
  1595. /* update lfe history */
  1596. lfe_samples = 2 * s->lfe * (s->sample_blocks / 8);
  1597. for (i = 0; i < 2 * s->lfe * 4; i++) {
  1598. s->lfe_data[i] = s->lfe_data[i + lfe_samples];
  1599. }
  1600. return buf_size;
  1601. }
  1602. /**
  1603. * DCA initialization
  1604. *
  1605. * @param avctx pointer to the AVCodecContext
  1606. */
  1607. static av_cold int dca_decode_init(AVCodecContext * avctx)
  1608. {
  1609. DCAContext *s = avctx->priv_data;
  1610. int i;
  1611. s->avctx = avctx;
  1612. dca_init_vlcs();
  1613. dsputil_init(&s->dsp, avctx);
  1614. ff_mdct_init(&s->imdct, 6, 1, 1.0);
  1615. ff_synth_filter_init(&s->synth);
  1616. ff_dcadsp_init(&s->dcadsp);
  1617. ff_fmt_convert_init(&s->fmt_conv, avctx);
  1618. for (i = 0; i < DCA_PRIM_CHANNELS_MAX+1; i++)
  1619. s->samples_chanptr[i] = s->samples + i * 256;
  1620. if (avctx->request_sample_fmt == AV_SAMPLE_FMT_FLT) {
  1621. avctx->sample_fmt = AV_SAMPLE_FMT_FLT;
  1622. s->scale_bias = 1.0 / 32768.0;
  1623. } else {
  1624. avctx->sample_fmt = AV_SAMPLE_FMT_S16;
  1625. s->scale_bias = 1.0;
  1626. }
  1627. /* allow downmixing to stereo */
  1628. if (avctx->channels > 0 && avctx->request_channels < avctx->channels &&
  1629. avctx->request_channels == 2) {
  1630. avctx->channels = avctx->request_channels;
  1631. }
  1632. return 0;
  1633. }
  1634. static av_cold int dca_decode_end(AVCodecContext * avctx)
  1635. {
  1636. DCAContext *s = avctx->priv_data;
  1637. ff_mdct_end(&s->imdct);
  1638. return 0;
  1639. }
  1640. static const AVProfile profiles[] = {
  1641. { FF_PROFILE_DTS, "DTS" },
  1642. { FF_PROFILE_DTS_ES, "DTS-ES" },
  1643. { FF_PROFILE_DTS_96_24, "DTS 96/24" },
  1644. { FF_PROFILE_DTS_HD_HRA, "DTS-HD HRA" },
  1645. { FF_PROFILE_DTS_HD_MA, "DTS-HD MA" },
  1646. { FF_PROFILE_UNKNOWN },
  1647. };
  1648. AVCodec ff_dca_decoder = {
  1649. .name = "dca",
  1650. .type = AVMEDIA_TYPE_AUDIO,
  1651. .id = CODEC_ID_DTS,
  1652. .priv_data_size = sizeof(DCAContext),
  1653. .init = dca_decode_init,
  1654. .decode = dca_decode_frame,
  1655. .close = dca_decode_end,
  1656. .long_name = NULL_IF_CONFIG_SMALL("DCA (DTS Coherent Acoustics)"),
  1657. .capabilities = CODEC_CAP_CHANNEL_CONF,
  1658. .sample_fmts = (const enum AVSampleFormat[]) {
  1659. AV_SAMPLE_FMT_FLT, AV_SAMPLE_FMT_S16, AV_SAMPLE_FMT_NONE
  1660. },
  1661. .profiles = NULL_IF_CONFIG_SMALL(profiles),
  1662. };