You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

1688 lines
62KB

  1. /*
  2. * This file is part of Libav.
  3. *
  4. * Libav is free software; you can redistribute it and/or
  5. * modify it under the terms of the GNU Lesser General Public
  6. * License as published by the Free Software Foundation; either
  7. * version 2.1 of the License, or (at your option) any later version.
  8. *
  9. * Libav is distributed in the hope that it will be useful,
  10. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  11. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  12. * Lesser General Public License for more details.
  13. *
  14. * You should have received a copy of the GNU Lesser General Public
  15. * License along with Libav; if not, write to the Free Software
  16. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  17. */
  18. /**
  19. * @file
  20. * Vorbis I decoder
  21. * @author Denes Balatoni ( dbalatoni programozo hu )
  22. */
  23. #include <inttypes.h>
  24. #include <math.h>
  25. #define ALT_BITSTREAM_READER_LE
  26. #include "avcodec.h"
  27. #include "get_bits.h"
  28. #include "dsputil.h"
  29. #include "fft.h"
  30. #include "fmtconvert.h"
  31. #include "vorbis.h"
  32. #include "xiph.h"
  33. #define V_NB_BITS 8
  34. #define V_NB_BITS2 11
  35. #define V_MAX_VLCS (1 << 16)
  36. #define V_MAX_PARTITIONS (1 << 20)
  37. #undef NDEBUG
  38. #include <assert.h>
  39. typedef struct {
  40. uint8_t dimensions;
  41. uint8_t lookup_type;
  42. uint8_t maxdepth;
  43. VLC vlc;
  44. float *codevectors;
  45. unsigned int nb_bits;
  46. } vorbis_codebook;
  47. typedef union vorbis_floor_u vorbis_floor_data;
  48. typedef struct vorbis_floor0_s vorbis_floor0;
  49. typedef struct vorbis_floor1_s vorbis_floor1;
  50. struct vorbis_context_s;
  51. typedef
  52. int (* vorbis_floor_decode_func)
  53. (struct vorbis_context_s *, vorbis_floor_data *, float *);
  54. typedef struct {
  55. uint8_t floor_type;
  56. vorbis_floor_decode_func decode;
  57. union vorbis_floor_u {
  58. struct vorbis_floor0_s {
  59. uint8_t order;
  60. uint16_t rate;
  61. uint16_t bark_map_size;
  62. int32_t *map[2];
  63. uint32_t map_size[2];
  64. uint8_t amplitude_bits;
  65. uint8_t amplitude_offset;
  66. uint8_t num_books;
  67. uint8_t *book_list;
  68. float *lsp;
  69. } t0;
  70. struct vorbis_floor1_s {
  71. uint8_t partitions;
  72. uint8_t partition_class[32];
  73. uint8_t class_dimensions[16];
  74. uint8_t class_subclasses[16];
  75. uint8_t class_masterbook[16];
  76. int16_t subclass_books[16][8];
  77. uint8_t multiplier;
  78. uint16_t x_list_dim;
  79. vorbis_floor1_entry *list;
  80. } t1;
  81. } data;
  82. } vorbis_floor;
  83. typedef struct {
  84. uint16_t type;
  85. uint32_t begin;
  86. uint32_t end;
  87. unsigned partition_size;
  88. uint8_t classifications;
  89. uint8_t classbook;
  90. int16_t books[64][8];
  91. uint8_t maxpass;
  92. uint16_t ptns_to_read;
  93. uint8_t *classifs;
  94. } vorbis_residue;
  95. typedef struct {
  96. uint8_t submaps;
  97. uint16_t coupling_steps;
  98. uint8_t *magnitude;
  99. uint8_t *angle;
  100. uint8_t *mux;
  101. uint8_t submap_floor[16];
  102. uint8_t submap_residue[16];
  103. } vorbis_mapping;
  104. typedef struct {
  105. uint8_t blockflag;
  106. uint16_t windowtype;
  107. uint16_t transformtype;
  108. uint8_t mapping;
  109. } vorbis_mode;
  110. typedef struct vorbis_context_s {
  111. AVCodecContext *avccontext;
  112. GetBitContext gb;
  113. DSPContext dsp;
  114. FmtConvertContext fmt_conv;
  115. FFTContext mdct[2];
  116. uint8_t first_frame;
  117. uint32_t version;
  118. uint8_t audio_channels;
  119. uint32_t audio_samplerate;
  120. uint32_t bitrate_maximum;
  121. uint32_t bitrate_nominal;
  122. uint32_t bitrate_minimum;
  123. uint32_t blocksize[2];
  124. const float *win[2];
  125. uint16_t codebook_count;
  126. vorbis_codebook *codebooks;
  127. uint8_t floor_count;
  128. vorbis_floor *floors;
  129. uint8_t residue_count;
  130. vorbis_residue *residues;
  131. uint8_t mapping_count;
  132. vorbis_mapping *mappings;
  133. uint8_t mode_count;
  134. vorbis_mode *modes;
  135. uint8_t mode_number; // mode number for the current packet
  136. uint8_t previous_window;
  137. float *channel_residues;
  138. float *channel_floors;
  139. float *saved;
  140. float scale_bias; // for float->int conversion
  141. } vorbis_context;
  142. /* Helper functions */
  143. #define BARK(x) \
  144. (13.1f * atan(0.00074f * (x)) + 2.24f * atan(1.85e-8f * (x) * (x)) + 1e-4f * (x))
  145. static const char idx_err_str[] = "Index value %d out of range (0 - %d) for %s at %s:%i\n";
  146. #define VALIDATE_INDEX(idx, limit) \
  147. if (idx >= limit) {\
  148. av_log(vc->avccontext, AV_LOG_ERROR,\
  149. idx_err_str,\
  150. (int)(idx), (int)(limit - 1), #idx, __FILE__, __LINE__);\
  151. return AVERROR_INVALIDDATA;\
  152. }
  153. #define GET_VALIDATED_INDEX(idx, bits, limit) \
  154. {\
  155. idx = get_bits(gb, bits);\
  156. VALIDATE_INDEX(idx, limit)\
  157. }
  158. static float vorbisfloat2float(unsigned val)
  159. {
  160. double mant = val & 0x1fffff;
  161. long exp = (val & 0x7fe00000L) >> 21;
  162. if (val & 0x80000000)
  163. mant = -mant;
  164. return ldexp(mant, exp - 20 - 768);
  165. }
  166. // Free all allocated memory -----------------------------------------
  167. static void vorbis_free(vorbis_context *vc)
  168. {
  169. int i;
  170. av_freep(&vc->channel_residues);
  171. av_freep(&vc->channel_floors);
  172. av_freep(&vc->saved);
  173. for (i = 0; i < vc->residue_count; i++)
  174. av_free(vc->residues[i].classifs);
  175. av_freep(&vc->residues);
  176. av_freep(&vc->modes);
  177. ff_mdct_end(&vc->mdct[0]);
  178. ff_mdct_end(&vc->mdct[1]);
  179. for (i = 0; i < vc->codebook_count; ++i) {
  180. av_free(vc->codebooks[i].codevectors);
  181. free_vlc(&vc->codebooks[i].vlc);
  182. }
  183. av_freep(&vc->codebooks);
  184. for (i = 0; i < vc->floor_count; ++i) {
  185. if (vc->floors[i].floor_type == 0) {
  186. av_free(vc->floors[i].data.t0.map[0]);
  187. av_free(vc->floors[i].data.t0.map[1]);
  188. av_free(vc->floors[i].data.t0.book_list);
  189. av_free(vc->floors[i].data.t0.lsp);
  190. } else {
  191. av_free(vc->floors[i].data.t1.list);
  192. }
  193. }
  194. av_freep(&vc->floors);
  195. for (i = 0; i < vc->mapping_count; ++i) {
  196. av_free(vc->mappings[i].magnitude);
  197. av_free(vc->mappings[i].angle);
  198. av_free(vc->mappings[i].mux);
  199. }
  200. av_freep(&vc->mappings);
  201. }
  202. // Parse setup header -------------------------------------------------
  203. // Process codebooks part
  204. static int vorbis_parse_setup_hdr_codebooks(vorbis_context *vc)
  205. {
  206. unsigned cb;
  207. uint8_t *tmp_vlc_bits;
  208. uint32_t *tmp_vlc_codes;
  209. GetBitContext *gb = &vc->gb;
  210. uint16_t *codebook_multiplicands;
  211. int ret = 0;
  212. vc->codebook_count = get_bits(gb, 8) + 1;
  213. av_dlog(NULL, " Codebooks: %d \n", vc->codebook_count);
  214. vc->codebooks = av_mallocz(vc->codebook_count * sizeof(*vc->codebooks));
  215. tmp_vlc_bits = av_mallocz(V_MAX_VLCS * sizeof(*tmp_vlc_bits));
  216. tmp_vlc_codes = av_mallocz(V_MAX_VLCS * sizeof(*tmp_vlc_codes));
  217. codebook_multiplicands = av_malloc(V_MAX_VLCS * sizeof(*codebook_multiplicands));
  218. for (cb = 0; cb < vc->codebook_count; ++cb) {
  219. vorbis_codebook *codebook_setup = &vc->codebooks[cb];
  220. unsigned ordered, t, entries, used_entries = 0;
  221. av_dlog(NULL, " %u. Codebook\n", cb);
  222. if (get_bits(gb, 24) != 0x564342) {
  223. av_log(vc->avccontext, AV_LOG_ERROR,
  224. " %u. Codebook setup data corrupt.\n", cb);
  225. ret = AVERROR_INVALIDDATA;
  226. goto error;
  227. }
  228. codebook_setup->dimensions=get_bits(gb, 16);
  229. if (codebook_setup->dimensions > 16 || codebook_setup->dimensions == 0) {
  230. av_log(vc->avccontext, AV_LOG_ERROR,
  231. " %u. Codebook's dimension is invalid (%d).\n",
  232. cb, codebook_setup->dimensions);
  233. ret = AVERROR_INVALIDDATA;
  234. goto error;
  235. }
  236. entries = get_bits(gb, 24);
  237. if (entries > V_MAX_VLCS) {
  238. av_log(vc->avccontext, AV_LOG_ERROR,
  239. " %u. Codebook has too many entries (%u).\n",
  240. cb, entries);
  241. ret = AVERROR_INVALIDDATA;
  242. goto error;
  243. }
  244. ordered = get_bits1(gb);
  245. av_dlog(NULL, " codebook_dimensions %d, codebook_entries %u\n",
  246. codebook_setup->dimensions, entries);
  247. if (!ordered) {
  248. unsigned ce, flag;
  249. unsigned sparse = get_bits1(gb);
  250. av_dlog(NULL, " not ordered \n");
  251. if (sparse) {
  252. av_dlog(NULL, " sparse \n");
  253. used_entries = 0;
  254. for (ce = 0; ce < entries; ++ce) {
  255. flag = get_bits1(gb);
  256. if (flag) {
  257. tmp_vlc_bits[ce] = get_bits(gb, 5) + 1;
  258. ++used_entries;
  259. } else
  260. tmp_vlc_bits[ce] = 0;
  261. }
  262. } else {
  263. av_dlog(NULL, " not sparse \n");
  264. used_entries = entries;
  265. for (ce = 0; ce < entries; ++ce)
  266. tmp_vlc_bits[ce] = get_bits(gb, 5) + 1;
  267. }
  268. } else {
  269. unsigned current_entry = 0;
  270. unsigned current_length = get_bits(gb, 5) + 1;
  271. av_dlog(NULL, " ordered, current length: %u\n", current_length); //FIXME
  272. used_entries = entries;
  273. for (; current_entry < used_entries && current_length <= 32; ++current_length) {
  274. unsigned i, number;
  275. av_dlog(NULL, " number bits: %u ", ilog(entries - current_entry));
  276. number = get_bits(gb, ilog(entries - current_entry));
  277. av_dlog(NULL, " number: %u\n", number);
  278. for (i = current_entry; i < number+current_entry; ++i)
  279. if (i < used_entries)
  280. tmp_vlc_bits[i] = current_length;
  281. current_entry+=number;
  282. }
  283. if (current_entry>used_entries) {
  284. av_log(vc->avccontext, AV_LOG_ERROR, " More codelengths than codes in codebook. \n");
  285. ret = AVERROR_INVALIDDATA;
  286. goto error;
  287. }
  288. }
  289. codebook_setup->lookup_type = get_bits(gb, 4);
  290. av_dlog(NULL, " lookup type: %d : %s \n", codebook_setup->lookup_type,
  291. codebook_setup->lookup_type ? "vq" : "no lookup");
  292. // If the codebook is used for (inverse) VQ, calculate codevectors.
  293. if (codebook_setup->lookup_type == 1) {
  294. unsigned i, j, k;
  295. unsigned codebook_lookup_values = ff_vorbis_nth_root(entries, codebook_setup->dimensions);
  296. float codebook_minimum_value = vorbisfloat2float(get_bits_long(gb, 32));
  297. float codebook_delta_value = vorbisfloat2float(get_bits_long(gb, 32));
  298. unsigned codebook_value_bits = get_bits(gb, 4) + 1;
  299. unsigned codebook_sequence_p = get_bits1(gb);
  300. av_dlog(NULL, " We expect %d numbers for building the codevectors. \n",
  301. codebook_lookup_values);
  302. av_dlog(NULL, " delta %f minmum %f \n",
  303. codebook_delta_value, codebook_minimum_value);
  304. for (i = 0; i < codebook_lookup_values; ++i) {
  305. codebook_multiplicands[i] = get_bits(gb, codebook_value_bits);
  306. av_dlog(NULL, " multiplicands*delta+minmum : %e \n",
  307. (float)codebook_multiplicands[i] * codebook_delta_value + codebook_minimum_value);
  308. av_dlog(NULL, " multiplicand %u\n", codebook_multiplicands[i]);
  309. }
  310. // Weed out unused vlcs and build codevector vector
  311. codebook_setup->codevectors = used_entries ? av_mallocz(used_entries *
  312. codebook_setup->dimensions *
  313. sizeof(*codebook_setup->codevectors))
  314. : NULL;
  315. for (j = 0, i = 0; i < entries; ++i) {
  316. unsigned dim = codebook_setup->dimensions;
  317. if (tmp_vlc_bits[i]) {
  318. float last = 0.0;
  319. unsigned lookup_offset = i;
  320. av_dlog(vc->avccontext, "Lookup offset %u ,", i);
  321. for (k = 0; k < dim; ++k) {
  322. unsigned multiplicand_offset = lookup_offset % codebook_lookup_values;
  323. codebook_setup->codevectors[j * dim + k] = codebook_multiplicands[multiplicand_offset] * codebook_delta_value + codebook_minimum_value + last;
  324. if (codebook_sequence_p)
  325. last = codebook_setup->codevectors[j * dim + k];
  326. lookup_offset/=codebook_lookup_values;
  327. }
  328. tmp_vlc_bits[j] = tmp_vlc_bits[i];
  329. av_dlog(vc->avccontext, "real lookup offset %u, vector: ", j);
  330. for (k = 0; k < dim; ++k)
  331. av_dlog(vc->avccontext, " %f ",
  332. codebook_setup->codevectors[j * dim + k]);
  333. av_dlog(vc->avccontext, "\n");
  334. ++j;
  335. }
  336. }
  337. if (j != used_entries) {
  338. av_log(vc->avccontext, AV_LOG_ERROR, "Bug in codevector vector building code. \n");
  339. ret = AVERROR_INVALIDDATA;
  340. goto error;
  341. }
  342. entries = used_entries;
  343. } else if (codebook_setup->lookup_type >= 2) {
  344. av_log(vc->avccontext, AV_LOG_ERROR, "Codebook lookup type not supported. \n");
  345. ret = AVERROR_INVALIDDATA;
  346. goto error;
  347. }
  348. // Initialize VLC table
  349. if (ff_vorbis_len2vlc(tmp_vlc_bits, tmp_vlc_codes, entries)) {
  350. av_log(vc->avccontext, AV_LOG_ERROR, " Invalid code lengths while generating vlcs. \n");
  351. ret = AVERROR_INVALIDDATA;
  352. goto error;
  353. }
  354. codebook_setup->maxdepth = 0;
  355. for (t = 0; t < entries; ++t)
  356. if (tmp_vlc_bits[t] >= codebook_setup->maxdepth)
  357. codebook_setup->maxdepth = tmp_vlc_bits[t];
  358. if (codebook_setup->maxdepth > 3 * V_NB_BITS)
  359. codebook_setup->nb_bits = V_NB_BITS2;
  360. else
  361. codebook_setup->nb_bits = V_NB_BITS;
  362. codebook_setup->maxdepth = (codebook_setup->maxdepth+codebook_setup->nb_bits - 1) / codebook_setup->nb_bits;
  363. if ((ret = init_vlc(&codebook_setup->vlc, codebook_setup->nb_bits,
  364. entries, tmp_vlc_bits, sizeof(*tmp_vlc_bits),
  365. sizeof(*tmp_vlc_bits), tmp_vlc_codes,
  366. sizeof(*tmp_vlc_codes), sizeof(*tmp_vlc_codes),
  367. INIT_VLC_LE))) {
  368. av_log(vc->avccontext, AV_LOG_ERROR, " Error generating vlc tables. \n");
  369. goto error;
  370. }
  371. }
  372. av_free(tmp_vlc_bits);
  373. av_free(tmp_vlc_codes);
  374. av_free(codebook_multiplicands);
  375. return 0;
  376. // Error:
  377. error:
  378. av_free(tmp_vlc_bits);
  379. av_free(tmp_vlc_codes);
  380. av_free(codebook_multiplicands);
  381. return ret;
  382. }
  383. // Process time domain transforms part (unused in Vorbis I)
  384. static int vorbis_parse_setup_hdr_tdtransforms(vorbis_context *vc)
  385. {
  386. GetBitContext *gb = &vc->gb;
  387. unsigned i, vorbis_time_count = get_bits(gb, 6) + 1;
  388. for (i = 0; i < vorbis_time_count; ++i) {
  389. unsigned vorbis_tdtransform = get_bits(gb, 16);
  390. av_dlog(NULL, " Vorbis time domain transform %u: %u\n",
  391. vorbis_time_count, vorbis_tdtransform);
  392. if (vorbis_tdtransform) {
  393. av_log(vc->avccontext, AV_LOG_ERROR, "Vorbis time domain transform data nonzero. \n");
  394. return AVERROR_INVALIDDATA;
  395. }
  396. }
  397. return 0;
  398. }
  399. // Process floors part
  400. static int vorbis_floor0_decode(vorbis_context *vc,
  401. vorbis_floor_data *vfu, float *vec);
  402. static void create_map(vorbis_context *vc, unsigned floor_number);
  403. static int vorbis_floor1_decode(vorbis_context *vc,
  404. vorbis_floor_data *vfu, float *vec);
  405. static int vorbis_parse_setup_hdr_floors(vorbis_context *vc)
  406. {
  407. GetBitContext *gb = &vc->gb;
  408. int i,j,k;
  409. vc->floor_count = get_bits(gb, 6) + 1;
  410. vc->floors = av_mallocz(vc->floor_count * sizeof(*vc->floors));
  411. for (i = 0; i < vc->floor_count; ++i) {
  412. vorbis_floor *floor_setup = &vc->floors[i];
  413. floor_setup->floor_type = get_bits(gb, 16);
  414. av_dlog(NULL, " %d. floor type %d \n", i, floor_setup->floor_type);
  415. if (floor_setup->floor_type == 1) {
  416. int maximum_class = -1;
  417. unsigned rangebits, rangemax, floor1_values = 2;
  418. floor_setup->decode = vorbis_floor1_decode;
  419. floor_setup->data.t1.partitions = get_bits(gb, 5);
  420. av_dlog(NULL, " %d.floor: %d partitions \n",
  421. i, floor_setup->data.t1.partitions);
  422. for (j = 0; j < floor_setup->data.t1.partitions; ++j) {
  423. floor_setup->data.t1.partition_class[j] = get_bits(gb, 4);
  424. if (floor_setup->data.t1.partition_class[j] > maximum_class)
  425. maximum_class = floor_setup->data.t1.partition_class[j];
  426. av_dlog(NULL, " %d. floor %d partition class %d \n",
  427. i, j, floor_setup->data.t1.partition_class[j]);
  428. }
  429. av_dlog(NULL, " maximum class %d \n", maximum_class);
  430. for (j = 0; j <= maximum_class; ++j) {
  431. floor_setup->data.t1.class_dimensions[j] = get_bits(gb, 3) + 1;
  432. floor_setup->data.t1.class_subclasses[j] = get_bits(gb, 2);
  433. av_dlog(NULL, " %d floor %d class dim: %d subclasses %d \n", i, j,
  434. floor_setup->data.t1.class_dimensions[j],
  435. floor_setup->data.t1.class_subclasses[j]);
  436. if (floor_setup->data.t1.class_subclasses[j]) {
  437. GET_VALIDATED_INDEX(floor_setup->data.t1.class_masterbook[j], 8, vc->codebook_count)
  438. av_dlog(NULL, " masterbook: %d \n", floor_setup->data.t1.class_masterbook[j]);
  439. }
  440. for (k = 0; k < (1 << floor_setup->data.t1.class_subclasses[j]); ++k) {
  441. int16_t bits = get_bits(gb, 8) - 1;
  442. if (bits != -1)
  443. VALIDATE_INDEX(bits, vc->codebook_count)
  444. floor_setup->data.t1.subclass_books[j][k] = bits;
  445. av_dlog(NULL, " book %d. : %d \n", k, floor_setup->data.t1.subclass_books[j][k]);
  446. }
  447. }
  448. floor_setup->data.t1.multiplier = get_bits(gb, 2) + 1;
  449. floor_setup->data.t1.x_list_dim = 2;
  450. for (j = 0; j < floor_setup->data.t1.partitions; ++j)
  451. floor_setup->data.t1.x_list_dim+=floor_setup->data.t1.class_dimensions[floor_setup->data.t1.partition_class[j]];
  452. floor_setup->data.t1.list = av_mallocz(floor_setup->data.t1.x_list_dim *
  453. sizeof(*floor_setup->data.t1.list));
  454. rangebits = get_bits(gb, 4);
  455. rangemax = (1 << rangebits);
  456. if (rangemax > vc->blocksize[1] / 2) {
  457. av_log(vc->avccontext, AV_LOG_ERROR,
  458. "Floor value is too large for blocksize: %u (%"PRIu32")\n",
  459. rangemax, vc->blocksize[1] / 2);
  460. return AVERROR_INVALIDDATA;
  461. }
  462. floor_setup->data.t1.list[0].x = 0;
  463. floor_setup->data.t1.list[1].x = rangemax;
  464. for (j = 0; j < floor_setup->data.t1.partitions; ++j) {
  465. for (k = 0; k < floor_setup->data.t1.class_dimensions[floor_setup->data.t1.partition_class[j]]; ++k, ++floor1_values) {
  466. floor_setup->data.t1.list[floor1_values].x = get_bits(gb, rangebits);
  467. av_dlog(NULL, " %u. floor1 Y coord. %d\n", floor1_values,
  468. floor_setup->data.t1.list[floor1_values].x);
  469. }
  470. }
  471. // Precalculate order of x coordinates - needed for decode
  472. ff_vorbis_ready_floor1_list(floor_setup->data.t1.list, floor_setup->data.t1.x_list_dim);
  473. } else if (floor_setup->floor_type == 0) {
  474. unsigned max_codebook_dim = 0;
  475. floor_setup->decode = vorbis_floor0_decode;
  476. floor_setup->data.t0.order = get_bits(gb, 8);
  477. floor_setup->data.t0.rate = get_bits(gb, 16);
  478. floor_setup->data.t0.bark_map_size = get_bits(gb, 16);
  479. floor_setup->data.t0.amplitude_bits = get_bits(gb, 6);
  480. /* zero would result in a div by zero later *
  481. * 2^0 - 1 == 0 */
  482. if (floor_setup->data.t0.amplitude_bits == 0) {
  483. av_log(vc->avccontext, AV_LOG_ERROR,
  484. "Floor 0 amplitude bits is 0.\n");
  485. return AVERROR_INVALIDDATA;
  486. }
  487. floor_setup->data.t0.amplitude_offset = get_bits(gb, 8);
  488. floor_setup->data.t0.num_books = get_bits(gb, 4) + 1;
  489. /* allocate mem for booklist */
  490. floor_setup->data.t0.book_list =
  491. av_malloc(floor_setup->data.t0.num_books);
  492. if (!floor_setup->data.t0.book_list)
  493. return AVERROR(ENOMEM);
  494. /* read book indexes */
  495. {
  496. int idx;
  497. unsigned book_idx;
  498. for (idx = 0; idx < floor_setup->data.t0.num_books; ++idx) {
  499. GET_VALIDATED_INDEX(book_idx, 8, vc->codebook_count)
  500. floor_setup->data.t0.book_list[idx] = book_idx;
  501. if (vc->codebooks[book_idx].dimensions > max_codebook_dim)
  502. max_codebook_dim = vc->codebooks[book_idx].dimensions;
  503. }
  504. }
  505. create_map(vc, i);
  506. /* codebook dim is for padding if codebook dim doesn't *
  507. * divide order+1 then we need to read more data */
  508. floor_setup->data.t0.lsp =
  509. av_malloc((floor_setup->data.t0.order + 1 + max_codebook_dim)
  510. * sizeof(*floor_setup->data.t0.lsp));
  511. if (!floor_setup->data.t0.lsp)
  512. return AVERROR(ENOMEM);
  513. /* debug output parsed headers */
  514. av_dlog(NULL, "floor0 order: %u\n", floor_setup->data.t0.order);
  515. av_dlog(NULL, "floor0 rate: %u\n", floor_setup->data.t0.rate);
  516. av_dlog(NULL, "floor0 bark map size: %u\n",
  517. floor_setup->data.t0.bark_map_size);
  518. av_dlog(NULL, "floor0 amplitude bits: %u\n",
  519. floor_setup->data.t0.amplitude_bits);
  520. av_dlog(NULL, "floor0 amplitude offset: %u\n",
  521. floor_setup->data.t0.amplitude_offset);
  522. av_dlog(NULL, "floor0 number of books: %u\n",
  523. floor_setup->data.t0.num_books);
  524. av_dlog(NULL, "floor0 book list pointer: %p\n",
  525. floor_setup->data.t0.book_list);
  526. {
  527. int idx;
  528. for (idx = 0; idx < floor_setup->data.t0.num_books; ++idx) {
  529. av_dlog(NULL, " Book %d: %u\n", idx + 1,
  530. floor_setup->data.t0.book_list[idx]);
  531. }
  532. }
  533. } else {
  534. av_log(vc->avccontext, AV_LOG_ERROR, "Invalid floor type!\n");
  535. return AVERROR_INVALIDDATA;
  536. }
  537. }
  538. return 0;
  539. }
  540. // Process residues part
  541. static int vorbis_parse_setup_hdr_residues(vorbis_context *vc)
  542. {
  543. GetBitContext *gb = &vc->gb;
  544. unsigned i, j, k;
  545. vc->residue_count = get_bits(gb, 6)+1;
  546. vc->residues = av_mallocz(vc->residue_count * sizeof(*vc->residues));
  547. av_dlog(NULL, " There are %d residues. \n", vc->residue_count);
  548. for (i = 0; i < vc->residue_count; ++i) {
  549. vorbis_residue *res_setup = &vc->residues[i];
  550. uint8_t cascade[64];
  551. unsigned high_bits, low_bits;
  552. res_setup->type = get_bits(gb, 16);
  553. av_dlog(NULL, " %u. residue type %d\n", i, res_setup->type);
  554. res_setup->begin = get_bits(gb, 24);
  555. res_setup->end = get_bits(gb, 24);
  556. res_setup->partition_size = get_bits(gb, 24) + 1;
  557. /* Validations to prevent a buffer overflow later. */
  558. if (res_setup->begin>res_setup->end ||
  559. res_setup->end > vc->avccontext->channels * vc->blocksize[1] / 2 ||
  560. (res_setup->end-res_setup->begin) / res_setup->partition_size > V_MAX_PARTITIONS) {
  561. av_log(vc->avccontext, AV_LOG_ERROR,
  562. "partition out of bounds: type, begin, end, size, blocksize: %"PRIu16", %"PRIu32", %"PRIu32", %u, %"PRIu32"\n",
  563. res_setup->type, res_setup->begin, res_setup->end,
  564. res_setup->partition_size, vc->blocksize[1] / 2);
  565. return AVERROR_INVALIDDATA;
  566. }
  567. res_setup->classifications = get_bits(gb, 6) + 1;
  568. GET_VALIDATED_INDEX(res_setup->classbook, 8, vc->codebook_count)
  569. res_setup->ptns_to_read =
  570. (res_setup->end - res_setup->begin) / res_setup->partition_size;
  571. res_setup->classifs = av_malloc(res_setup->ptns_to_read *
  572. vc->audio_channels *
  573. sizeof(*res_setup->classifs));
  574. if (!res_setup->classifs)
  575. return AVERROR(ENOMEM);
  576. av_dlog(NULL, " begin %d end %d part.size %d classif.s %d classbook %d \n",
  577. res_setup->begin, res_setup->end, res_setup->partition_size,
  578. res_setup->classifications, res_setup->classbook);
  579. for (j = 0; j < res_setup->classifications; ++j) {
  580. high_bits = 0;
  581. low_bits = get_bits(gb, 3);
  582. if (get_bits1(gb))
  583. high_bits = get_bits(gb, 5);
  584. cascade[j] = (high_bits << 3) + low_bits;
  585. av_dlog(NULL, " %u class cascade depth: %d\n", j, ilog(cascade[j]));
  586. }
  587. res_setup->maxpass = 0;
  588. for (j = 0; j < res_setup->classifications; ++j) {
  589. for (k = 0; k < 8; ++k) {
  590. if (cascade[j]&(1 << k)) {
  591. GET_VALIDATED_INDEX(res_setup->books[j][k], 8, vc->codebook_count)
  592. av_dlog(NULL, " %u class cascade depth %u book: %d\n",
  593. j, k, res_setup->books[j][k]);
  594. if (k>res_setup->maxpass)
  595. res_setup->maxpass = k;
  596. } else {
  597. res_setup->books[j][k] = -1;
  598. }
  599. }
  600. }
  601. }
  602. return 0;
  603. }
  604. // Process mappings part
  605. static int vorbis_parse_setup_hdr_mappings(vorbis_context *vc)
  606. {
  607. GetBitContext *gb = &vc->gb;
  608. unsigned i, j;
  609. vc->mapping_count = get_bits(gb, 6)+1;
  610. vc->mappings = av_mallocz(vc->mapping_count * sizeof(*vc->mappings));
  611. av_dlog(NULL, " There are %d mappings. \n", vc->mapping_count);
  612. for (i = 0; i < vc->mapping_count; ++i) {
  613. vorbis_mapping *mapping_setup = &vc->mappings[i];
  614. if (get_bits(gb, 16)) {
  615. av_log(vc->avccontext, AV_LOG_ERROR, "Other mappings than type 0 are not compliant with the Vorbis I specification. \n");
  616. return AVERROR_INVALIDDATA;
  617. }
  618. if (get_bits1(gb)) {
  619. mapping_setup->submaps = get_bits(gb, 4) + 1;
  620. } else {
  621. mapping_setup->submaps = 1;
  622. }
  623. if (get_bits1(gb)) {
  624. mapping_setup->coupling_steps = get_bits(gb, 8) + 1;
  625. mapping_setup->magnitude = av_mallocz(mapping_setup->coupling_steps *
  626. sizeof(*mapping_setup->magnitude));
  627. mapping_setup->angle = av_mallocz(mapping_setup->coupling_steps *
  628. sizeof(*mapping_setup->angle));
  629. for (j = 0; j < mapping_setup->coupling_steps; ++j) {
  630. GET_VALIDATED_INDEX(mapping_setup->magnitude[j], ilog(vc->audio_channels - 1), vc->audio_channels)
  631. GET_VALIDATED_INDEX(mapping_setup->angle[j], ilog(vc->audio_channels - 1), vc->audio_channels)
  632. }
  633. } else {
  634. mapping_setup->coupling_steps = 0;
  635. }
  636. av_dlog(NULL, " %u mapping coupling steps: %d\n",
  637. i, mapping_setup->coupling_steps);
  638. if (get_bits(gb, 2)) {
  639. av_log(vc->avccontext, AV_LOG_ERROR, "%u. mapping setup data invalid.\n", i);
  640. return AVERROR_INVALIDDATA; // following spec.
  641. }
  642. if (mapping_setup->submaps>1) {
  643. mapping_setup->mux = av_mallocz(vc->audio_channels *
  644. sizeof(*mapping_setup->mux));
  645. for (j = 0; j < vc->audio_channels; ++j)
  646. mapping_setup->mux[j] = get_bits(gb, 4);
  647. }
  648. for (j = 0; j < mapping_setup->submaps; ++j) {
  649. skip_bits(gb, 8); // FIXME check?
  650. GET_VALIDATED_INDEX(mapping_setup->submap_floor[j], 8, vc->floor_count)
  651. GET_VALIDATED_INDEX(mapping_setup->submap_residue[j], 8, vc->residue_count)
  652. av_dlog(NULL, " %u mapping %u submap : floor %d, residue %d\n", i, j,
  653. mapping_setup->submap_floor[j],
  654. mapping_setup->submap_residue[j]);
  655. }
  656. }
  657. return 0;
  658. }
  659. // Process modes part
  660. static void create_map(vorbis_context *vc, unsigned floor_number)
  661. {
  662. vorbis_floor *floors = vc->floors;
  663. vorbis_floor0 *vf;
  664. int idx;
  665. int blockflag, n;
  666. int32_t *map;
  667. for (blockflag = 0; blockflag < 2; ++blockflag) {
  668. n = vc->blocksize[blockflag] / 2;
  669. floors[floor_number].data.t0.map[blockflag] =
  670. av_malloc((n + 1) * sizeof(int32_t)); // n + sentinel
  671. map = floors[floor_number].data.t0.map[blockflag];
  672. vf = &floors[floor_number].data.t0;
  673. for (idx = 0; idx < n; ++idx) {
  674. map[idx] = floor(BARK((vf->rate * idx) / (2.0f * n)) *
  675. ((vf->bark_map_size) /
  676. BARK(vf->rate / 2.0f)));
  677. if (vf->bark_map_size-1 < map[idx])
  678. map[idx] = vf->bark_map_size - 1;
  679. }
  680. map[n] = -1;
  681. vf->map_size[blockflag] = n;
  682. }
  683. for (idx = 0; idx <= n; ++idx) {
  684. av_dlog(NULL, "floor0 map: map at pos %d is %d\n", idx, map[idx]);
  685. }
  686. }
  687. static int vorbis_parse_setup_hdr_modes(vorbis_context *vc)
  688. {
  689. GetBitContext *gb = &vc->gb;
  690. unsigned i;
  691. vc->mode_count = get_bits(gb, 6) + 1;
  692. vc->modes = av_mallocz(vc->mode_count * sizeof(*vc->modes));
  693. av_dlog(NULL, " There are %d modes.\n", vc->mode_count);
  694. for (i = 0; i < vc->mode_count; ++i) {
  695. vorbis_mode *mode_setup = &vc->modes[i];
  696. mode_setup->blockflag = get_bits1(gb);
  697. mode_setup->windowtype = get_bits(gb, 16); //FIXME check
  698. mode_setup->transformtype = get_bits(gb, 16); //FIXME check
  699. GET_VALIDATED_INDEX(mode_setup->mapping, 8, vc->mapping_count);
  700. av_dlog(NULL, " %u mode: blockflag %d, windowtype %d, transformtype %d, mapping %d\n",
  701. i, mode_setup->blockflag, mode_setup->windowtype,
  702. mode_setup->transformtype, mode_setup->mapping);
  703. }
  704. return 0;
  705. }
  706. // Process the whole setup header using the functions above
  707. static int vorbis_parse_setup_hdr(vorbis_context *vc)
  708. {
  709. GetBitContext *gb = &vc->gb;
  710. int ret;
  711. if ((get_bits(gb, 8) != 'v') || (get_bits(gb, 8) != 'o') ||
  712. (get_bits(gb, 8) != 'r') || (get_bits(gb, 8) != 'b') ||
  713. (get_bits(gb, 8) != 'i') || (get_bits(gb, 8) != 's')) {
  714. av_log(vc->avccontext, AV_LOG_ERROR, " Vorbis setup header packet corrupt (no vorbis signature). \n");
  715. return AVERROR_INVALIDDATA;
  716. }
  717. if ((ret = vorbis_parse_setup_hdr_codebooks(vc))) {
  718. av_log(vc->avccontext, AV_LOG_ERROR, " Vorbis setup header packet corrupt (codebooks). \n");
  719. return ret;
  720. }
  721. if ((ret = vorbis_parse_setup_hdr_tdtransforms(vc))) {
  722. av_log(vc->avccontext, AV_LOG_ERROR, " Vorbis setup header packet corrupt (time domain transforms). \n");
  723. return ret;
  724. }
  725. if ((ret = vorbis_parse_setup_hdr_floors(vc))) {
  726. av_log(vc->avccontext, AV_LOG_ERROR, " Vorbis setup header packet corrupt (floors). \n");
  727. return ret;
  728. }
  729. if ((ret = vorbis_parse_setup_hdr_residues(vc))) {
  730. av_log(vc->avccontext, AV_LOG_ERROR, " Vorbis setup header packet corrupt (residues). \n");
  731. return ret;
  732. }
  733. if ((ret = vorbis_parse_setup_hdr_mappings(vc))) {
  734. av_log(vc->avccontext, AV_LOG_ERROR, " Vorbis setup header packet corrupt (mappings). \n");
  735. return ret;
  736. }
  737. if ((ret = vorbis_parse_setup_hdr_modes(vc))) {
  738. av_log(vc->avccontext, AV_LOG_ERROR, " Vorbis setup header packet corrupt (modes). \n");
  739. return ret;
  740. }
  741. if (!get_bits1(gb)) {
  742. av_log(vc->avccontext, AV_LOG_ERROR, " Vorbis setup header packet corrupt (framing flag). \n");
  743. return AVERROR_INVALIDDATA; // framing flag bit unset error
  744. }
  745. return 0;
  746. }
  747. // Process the identification header
  748. static int vorbis_parse_id_hdr(vorbis_context *vc)
  749. {
  750. GetBitContext *gb = &vc->gb;
  751. unsigned bl0, bl1;
  752. if ((get_bits(gb, 8) != 'v') || (get_bits(gb, 8) != 'o') ||
  753. (get_bits(gb, 8) != 'r') || (get_bits(gb, 8) != 'b') ||
  754. (get_bits(gb, 8) != 'i') || (get_bits(gb, 8) != 's')) {
  755. av_log(vc->avccontext, AV_LOG_ERROR, " Vorbis id header packet corrupt (no vorbis signature). \n");
  756. return AVERROR_INVALIDDATA;
  757. }
  758. vc->version = get_bits_long(gb, 32); //FIXME check 0
  759. vc->audio_channels = get_bits(gb, 8);
  760. if (vc->audio_channels <= 0) {
  761. av_log(vc->avccontext, AV_LOG_ERROR, "Invalid number of channels\n");
  762. return AVERROR_INVALIDDATA;
  763. }
  764. vc->audio_samplerate = get_bits_long(gb, 32);
  765. if (vc->audio_samplerate <= 0) {
  766. av_log(vc->avccontext, AV_LOG_ERROR, "Invalid samplerate\n");
  767. return AVERROR_INVALIDDATA;
  768. }
  769. vc->bitrate_maximum = get_bits_long(gb, 32);
  770. vc->bitrate_nominal = get_bits_long(gb, 32);
  771. vc->bitrate_minimum = get_bits_long(gb, 32);
  772. bl0 = get_bits(gb, 4);
  773. bl1 = get_bits(gb, 4);
  774. vc->blocksize[0] = (1 << bl0);
  775. vc->blocksize[1] = (1 << bl1);
  776. if (bl0 > 13 || bl0 < 6 || bl1 > 13 || bl1 < 6 || bl1 < bl0) {
  777. av_log(vc->avccontext, AV_LOG_ERROR, " Vorbis id header packet corrupt (illegal blocksize). \n");
  778. return AVERROR_INVALIDDATA;
  779. }
  780. vc->win[0] = ff_vorbis_vwin[bl0 - 6];
  781. vc->win[1] = ff_vorbis_vwin[bl1 - 6];
  782. if ((get_bits1(gb)) == 0) {
  783. av_log(vc->avccontext, AV_LOG_ERROR, " Vorbis id header packet corrupt (framing flag not set). \n");
  784. return AVERROR_INVALIDDATA;
  785. }
  786. vc->channel_residues = av_malloc((vc->blocksize[1] / 2) * vc->audio_channels * sizeof(*vc->channel_residues));
  787. vc->channel_floors = av_malloc((vc->blocksize[1] / 2) * vc->audio_channels * sizeof(*vc->channel_floors));
  788. vc->saved = av_mallocz((vc->blocksize[1] / 4) * vc->audio_channels * sizeof(*vc->saved));
  789. vc->previous_window = 0;
  790. ff_mdct_init(&vc->mdct[0], bl0, 1, -vc->scale_bias);
  791. ff_mdct_init(&vc->mdct[1], bl1, 1, -vc->scale_bias);
  792. av_dlog(NULL, " vorbis version %d \n audio_channels %d \n audio_samplerate %d \n bitrate_max %d \n bitrate_nom %d \n bitrate_min %d \n blk_0 %d blk_1 %d \n ",
  793. vc->version, vc->audio_channels, vc->audio_samplerate, vc->bitrate_maximum, vc->bitrate_nominal, vc->bitrate_minimum, vc->blocksize[0], vc->blocksize[1]);
  794. /*
  795. BLK = vc->blocksize[0];
  796. for (i = 0; i < BLK / 2; ++i) {
  797. vc->win[0][i] = sin(0.5*3.14159265358*(sin(((float)i + 0.5) / (float)BLK*3.14159265358))*(sin(((float)i + 0.5) / (float)BLK*3.14159265358)));
  798. }
  799. */
  800. return 0;
  801. }
  802. // Process the extradata using the functions above (identification header, setup header)
  803. static av_cold int vorbis_decode_init(AVCodecContext *avccontext)
  804. {
  805. vorbis_context *vc = avccontext->priv_data;
  806. uint8_t *headers = avccontext->extradata;
  807. int headers_len = avccontext->extradata_size;
  808. uint8_t *header_start[3];
  809. int header_len[3];
  810. GetBitContext *gb = &(vc->gb);
  811. int hdr_type, ret;
  812. vc->avccontext = avccontext;
  813. dsputil_init(&vc->dsp, avccontext);
  814. ff_fmt_convert_init(&vc->fmt_conv, avccontext);
  815. if (avccontext->request_sample_fmt == AV_SAMPLE_FMT_FLT) {
  816. avccontext->sample_fmt = AV_SAMPLE_FMT_FLT;
  817. vc->scale_bias = 1.0f;
  818. } else {
  819. avccontext->sample_fmt = AV_SAMPLE_FMT_S16;
  820. vc->scale_bias = 32768.0f;
  821. }
  822. if (!headers_len) {
  823. av_log(avccontext, AV_LOG_ERROR, "Extradata missing.\n");
  824. return AVERROR_INVALIDDATA;
  825. }
  826. if ((ret = avpriv_split_xiph_headers(headers, headers_len, 30, header_start, header_len)) < 0) {
  827. av_log(avccontext, AV_LOG_ERROR, "Extradata corrupt.\n");
  828. return ret;
  829. }
  830. init_get_bits(gb, header_start[0], header_len[0]*8);
  831. hdr_type = get_bits(gb, 8);
  832. if (hdr_type != 1) {
  833. av_log(avccontext, AV_LOG_ERROR, "First header is not the id header.\n");
  834. return AVERROR_INVALIDDATA;
  835. }
  836. if ((ret = vorbis_parse_id_hdr(vc))) {
  837. av_log(avccontext, AV_LOG_ERROR, "Id header corrupt.\n");
  838. vorbis_free(vc);
  839. return ret;
  840. }
  841. init_get_bits(gb, header_start[2], header_len[2]*8);
  842. hdr_type = get_bits(gb, 8);
  843. if (hdr_type != 5) {
  844. av_log(avccontext, AV_LOG_ERROR, "Third header is not the setup header.\n");
  845. vorbis_free(vc);
  846. return AVERROR_INVALIDDATA;
  847. }
  848. if ((ret = vorbis_parse_setup_hdr(vc))) {
  849. av_log(avccontext, AV_LOG_ERROR, "Setup header corrupt.\n");
  850. vorbis_free(vc);
  851. return ret;
  852. }
  853. if (vc->audio_channels > 8)
  854. avccontext->channel_layout = 0;
  855. else
  856. avccontext->channel_layout = ff_vorbis_channel_layouts[vc->audio_channels - 1];
  857. avccontext->channels = vc->audio_channels;
  858. avccontext->sample_rate = vc->audio_samplerate;
  859. avccontext->frame_size = FFMIN(vc->blocksize[0], vc->blocksize[1]) >> 2;
  860. return 0;
  861. }
  862. // Decode audiopackets -------------------------------------------------
  863. // Read and decode floor
  864. static int vorbis_floor0_decode(vorbis_context *vc,
  865. vorbis_floor_data *vfu, float *vec)
  866. {
  867. vorbis_floor0 *vf = &vfu->t0;
  868. float *lsp = vf->lsp;
  869. unsigned amplitude, book_idx;
  870. unsigned blockflag = vc->modes[vc->mode_number].blockflag;
  871. amplitude = get_bits(&vc->gb, vf->amplitude_bits);
  872. if (amplitude > 0) {
  873. float last = 0;
  874. unsigned idx, lsp_len = 0;
  875. vorbis_codebook codebook;
  876. book_idx = get_bits(&vc->gb, ilog(vf->num_books));
  877. if (book_idx >= vf->num_books) {
  878. av_log(vc->avccontext, AV_LOG_ERROR,
  879. "floor0 dec: booknumber too high!\n");
  880. book_idx = 0;
  881. }
  882. av_dlog(NULL, "floor0 dec: booknumber: %u\n", book_idx);
  883. codebook = vc->codebooks[vf->book_list[book_idx]];
  884. /* Invalid codebook! */
  885. if (!codebook.codevectors)
  886. return AVERROR_INVALIDDATA;
  887. while (lsp_len<vf->order) {
  888. int vec_off;
  889. av_dlog(NULL, "floor0 dec: book dimension: %d\n", codebook.dimensions);
  890. av_dlog(NULL, "floor0 dec: maximum depth: %d\n", codebook.maxdepth);
  891. /* read temp vector */
  892. vec_off = get_vlc2(&vc->gb, codebook.vlc.table,
  893. codebook.nb_bits, codebook.maxdepth)
  894. * codebook.dimensions;
  895. av_dlog(NULL, "floor0 dec: vector offset: %d\n", vec_off);
  896. /* copy each vector component and add last to it */
  897. for (idx = 0; idx < codebook.dimensions; ++idx)
  898. lsp[lsp_len+idx] = codebook.codevectors[vec_off+idx] + last;
  899. last = lsp[lsp_len+idx-1]; /* set last to last vector component */
  900. lsp_len += codebook.dimensions;
  901. }
  902. /* DEBUG: output lsp coeffs */
  903. {
  904. int idx;
  905. for (idx = 0; idx < lsp_len; ++idx)
  906. av_dlog(NULL, "floor0 dec: coeff at %d is %f\n", idx, lsp[idx]);
  907. }
  908. /* synthesize floor output vector */
  909. {
  910. int i;
  911. int order = vf->order;
  912. float wstep = M_PI / vf->bark_map_size;
  913. for (i = 0; i < order; i++)
  914. lsp[i] = 2.0f * cos(lsp[i]);
  915. av_dlog(NULL, "floor0 synth: map_size = %"PRIu32"; m = %d; wstep = %f\n",
  916. vf->map_size[blockflag], order, wstep);
  917. i = 0;
  918. while (i < vf->map_size[blockflag]) {
  919. int j, iter_cond = vf->map[blockflag][i];
  920. float p = 0.5f;
  921. float q = 0.5f;
  922. float two_cos_w = 2.0f * cos(wstep * iter_cond); // needed all times
  923. /* similar part for the q and p products */
  924. for (j = 0; j + 1 < order; j += 2) {
  925. q *= lsp[j] - two_cos_w;
  926. p *= lsp[j + 1] - two_cos_w;
  927. }
  928. if (j == order) { // even order
  929. p *= p * (2.0f - two_cos_w);
  930. q *= q * (2.0f + two_cos_w);
  931. } else { // odd order
  932. q *= two_cos_w-lsp[j]; // one more time for q
  933. /* final step and square */
  934. p *= p * (4.f - two_cos_w * two_cos_w);
  935. q *= q;
  936. }
  937. /* calculate linear floor value */
  938. q = exp((((amplitude*vf->amplitude_offset) /
  939. (((1 << vf->amplitude_bits) - 1) * sqrt(p + q)))
  940. - vf->amplitude_offset) * .11512925f);
  941. /* fill vector */
  942. do {
  943. vec[i] = q; ++i;
  944. } while (vf->map[blockflag][i] == iter_cond);
  945. }
  946. }
  947. } else {
  948. /* this channel is unused */
  949. return 1;
  950. }
  951. av_dlog(NULL, " Floor0 decoded\n");
  952. return 0;
  953. }
  954. static int vorbis_floor1_decode(vorbis_context *vc,
  955. vorbis_floor_data *vfu, float *vec)
  956. {
  957. vorbis_floor1 *vf = &vfu->t1;
  958. GetBitContext *gb = &vc->gb;
  959. uint16_t range_v[4] = { 256, 128, 86, 64 };
  960. unsigned range = range_v[vf->multiplier - 1];
  961. uint16_t floor1_Y[258];
  962. uint16_t floor1_Y_final[258];
  963. int floor1_flag[258];
  964. unsigned class, cdim, cbits, csub, cval, offset, i, j;
  965. int book, adx, ady, dy, off, predicted, err;
  966. if (!get_bits1(gb)) // silence
  967. return 1;
  968. // Read values (or differences) for the floor's points
  969. floor1_Y[0] = get_bits(gb, ilog(range - 1));
  970. floor1_Y[1] = get_bits(gb, ilog(range - 1));
  971. av_dlog(NULL, "floor 0 Y %d floor 1 Y %d \n", floor1_Y[0], floor1_Y[1]);
  972. offset = 2;
  973. for (i = 0; i < vf->partitions; ++i) {
  974. class = vf->partition_class[i];
  975. cdim = vf->class_dimensions[class];
  976. cbits = vf->class_subclasses[class];
  977. csub = (1 << cbits) - 1;
  978. cval = 0;
  979. av_dlog(NULL, "Cbits %u\n", cbits);
  980. if (cbits) // this reads all subclasses for this partition's class
  981. cval = get_vlc2(gb, vc->codebooks[vf->class_masterbook[class]].vlc.table,
  982. vc->codebooks[vf->class_masterbook[class]].nb_bits, 3);
  983. for (j = 0; j < cdim; ++j) {
  984. book = vf->subclass_books[class][cval & csub];
  985. av_dlog(NULL, "book %d Cbits %u cval %u bits:%d\n",
  986. book, cbits, cval, get_bits_count(gb));
  987. cval = cval >> cbits;
  988. if (book > -1) {
  989. floor1_Y[offset+j] = get_vlc2(gb, vc->codebooks[book].vlc.table,
  990. vc->codebooks[book].nb_bits, 3);
  991. } else {
  992. floor1_Y[offset+j] = 0;
  993. }
  994. av_dlog(NULL, " floor(%d) = %d \n",
  995. vf->list[offset+j].x, floor1_Y[offset+j]);
  996. }
  997. offset+=cdim;
  998. }
  999. // Amplitude calculation from the differences
  1000. floor1_flag[0] = 1;
  1001. floor1_flag[1] = 1;
  1002. floor1_Y_final[0] = floor1_Y[0];
  1003. floor1_Y_final[1] = floor1_Y[1];
  1004. for (i = 2; i < vf->x_list_dim; ++i) {
  1005. unsigned val, highroom, lowroom, room, high_neigh_offs, low_neigh_offs;
  1006. low_neigh_offs = vf->list[i].low;
  1007. high_neigh_offs = vf->list[i].high;
  1008. dy = floor1_Y_final[high_neigh_offs] - floor1_Y_final[low_neigh_offs]; // render_point begin
  1009. adx = vf->list[high_neigh_offs].x - vf->list[low_neigh_offs].x;
  1010. ady = FFABS(dy);
  1011. err = ady * (vf->list[i].x - vf->list[low_neigh_offs].x);
  1012. off = err / adx;
  1013. if (dy < 0) {
  1014. predicted = floor1_Y_final[low_neigh_offs] - off;
  1015. } else {
  1016. predicted = floor1_Y_final[low_neigh_offs] + off;
  1017. } // render_point end
  1018. val = floor1_Y[i];
  1019. highroom = range-predicted;
  1020. lowroom = predicted;
  1021. if (highroom < lowroom) {
  1022. room = highroom * 2;
  1023. } else {
  1024. room = lowroom * 2; // SPEC mispelling
  1025. }
  1026. if (val) {
  1027. floor1_flag[low_neigh_offs] = 1;
  1028. floor1_flag[high_neigh_offs] = 1;
  1029. floor1_flag[i] = 1;
  1030. if (val >= room) {
  1031. if (highroom > lowroom) {
  1032. floor1_Y_final[i] = val - lowroom + predicted;
  1033. } else {
  1034. floor1_Y_final[i] = predicted - val + highroom - 1;
  1035. }
  1036. } else {
  1037. if (val & 1) {
  1038. floor1_Y_final[i] = predicted - (val + 1) / 2;
  1039. } else {
  1040. floor1_Y_final[i] = predicted + val / 2;
  1041. }
  1042. }
  1043. } else {
  1044. floor1_flag[i] = 0;
  1045. floor1_Y_final[i] = predicted;
  1046. }
  1047. av_dlog(NULL, " Decoded floor(%d) = %u / val %u\n",
  1048. vf->list[i].x, floor1_Y_final[i], val);
  1049. }
  1050. // Curve synth - connect the calculated dots and convert from dB scale FIXME optimize ?
  1051. ff_vorbis_floor1_render_list(vf->list, vf->x_list_dim, floor1_Y_final, floor1_flag, vf->multiplier, vec, vf->list[1].x);
  1052. av_dlog(NULL, " Floor decoded\n");
  1053. return 0;
  1054. }
  1055. // Read and decode residue
  1056. static av_always_inline int vorbis_residue_decode_internal(vorbis_context *vc,
  1057. vorbis_residue *vr,
  1058. unsigned ch,
  1059. uint8_t *do_not_decode,
  1060. float *vec,
  1061. unsigned vlen,
  1062. int vr_type)
  1063. {
  1064. GetBitContext *gb = &vc->gb;
  1065. unsigned c_p_c = vc->codebooks[vr->classbook].dimensions;
  1066. unsigned ptns_to_read = vr->ptns_to_read;
  1067. uint8_t *classifs = vr->classifs;
  1068. unsigned pass, ch_used, i, j, k, l;
  1069. if (vr_type == 2) {
  1070. for (j = 1; j < ch; ++j)
  1071. do_not_decode[0] &= do_not_decode[j]; // FIXME - clobbering input
  1072. if (do_not_decode[0])
  1073. return 0;
  1074. ch_used = 1;
  1075. } else {
  1076. ch_used = ch;
  1077. }
  1078. av_dlog(NULL, " residue type 0/1/2 decode begin, ch: %d cpc %d \n", ch, c_p_c);
  1079. for (pass = 0; pass <= vr->maxpass; ++pass) { // FIXME OPTIMIZE?
  1080. uint16_t voffset, partition_count, j_times_ptns_to_read;
  1081. voffset = vr->begin;
  1082. for (partition_count = 0; partition_count < ptns_to_read;) { // SPEC error
  1083. if (!pass) {
  1084. unsigned inverse_class = ff_inverse[vr->classifications];
  1085. for (j_times_ptns_to_read = 0, j = 0; j < ch_used; ++j) {
  1086. if (!do_not_decode[j]) {
  1087. unsigned temp = get_vlc2(gb, vc->codebooks[vr->classbook].vlc.table,
  1088. vc->codebooks[vr->classbook].nb_bits, 3);
  1089. av_dlog(NULL, "Classword: %u\n", temp);
  1090. assert(vr->classifications > 1 && temp <= 65536); //needed for inverse[]
  1091. for (i = 0; i < c_p_c; ++i) {
  1092. unsigned temp2;
  1093. temp2 = (((uint64_t)temp) * inverse_class) >> 32;
  1094. if (partition_count + c_p_c - 1 - i < ptns_to_read)
  1095. classifs[j_times_ptns_to_read + partition_count + c_p_c - 1 - i] = temp - temp2 * vr->classifications;
  1096. temp = temp2;
  1097. }
  1098. }
  1099. j_times_ptns_to_read += ptns_to_read;
  1100. }
  1101. }
  1102. for (i = 0; (i < c_p_c) && (partition_count < ptns_to_read); ++i) {
  1103. for (j_times_ptns_to_read = 0, j = 0; j < ch_used; ++j) {
  1104. unsigned voffs;
  1105. if (!do_not_decode[j]) {
  1106. unsigned vqclass = classifs[j_times_ptns_to_read + partition_count];
  1107. int vqbook = vr->books[vqclass][pass];
  1108. if (vqbook >= 0 && vc->codebooks[vqbook].codevectors) {
  1109. unsigned coffs;
  1110. unsigned dim = vc->codebooks[vqbook].dimensions;
  1111. unsigned step = dim == 1 ? vr->partition_size
  1112. : FASTDIV(vr->partition_size, dim);
  1113. vorbis_codebook codebook = vc->codebooks[vqbook];
  1114. if (vr_type == 0) {
  1115. voffs = voffset+j*vlen;
  1116. for (k = 0; k < step; ++k) {
  1117. coffs = get_vlc2(gb, codebook.vlc.table, codebook.nb_bits, 3) * dim;
  1118. for (l = 0; l < dim; ++l)
  1119. vec[voffs + k + l * step] += codebook.codevectors[coffs + l]; // FPMATH
  1120. }
  1121. } else if (vr_type == 1) {
  1122. voffs = voffset + j * vlen;
  1123. for (k = 0; k < step; ++k) {
  1124. coffs = get_vlc2(gb, codebook.vlc.table, codebook.nb_bits, 3) * dim;
  1125. for (l = 0; l < dim; ++l, ++voffs) {
  1126. vec[voffs]+=codebook.codevectors[coffs+l]; // FPMATH
  1127. av_dlog(NULL, " pass %d offs: %d curr: %f change: %f cv offs.: %d \n",
  1128. pass, voffs, vec[voffs], codebook.codevectors[coffs+l], coffs);
  1129. }
  1130. }
  1131. } else if (vr_type == 2 && ch == 2 && (voffset & 1) == 0 && (dim & 1) == 0) { // most frequent case optimized
  1132. voffs = voffset >> 1;
  1133. if (dim == 2) {
  1134. for (k = 0; k < step; ++k) {
  1135. coffs = get_vlc2(gb, codebook.vlc.table, codebook.nb_bits, 3) * 2;
  1136. vec[voffs + k ] += codebook.codevectors[coffs ]; // FPMATH
  1137. vec[voffs + k + vlen] += codebook.codevectors[coffs + 1]; // FPMATH
  1138. }
  1139. } else if (dim == 4) {
  1140. for (k = 0; k < step; ++k, voffs += 2) {
  1141. coffs = get_vlc2(gb, codebook.vlc.table, codebook.nb_bits, 3) * 4;
  1142. vec[voffs ] += codebook.codevectors[coffs ]; // FPMATH
  1143. vec[voffs + 1 ] += codebook.codevectors[coffs + 2]; // FPMATH
  1144. vec[voffs + vlen ] += codebook.codevectors[coffs + 1]; // FPMATH
  1145. vec[voffs + vlen + 1] += codebook.codevectors[coffs + 3]; // FPMATH
  1146. }
  1147. } else
  1148. for (k = 0; k < step; ++k) {
  1149. coffs = get_vlc2(gb, codebook.vlc.table, codebook.nb_bits, 3) * dim;
  1150. for (l = 0; l < dim; l += 2, voffs++) {
  1151. vec[voffs ] += codebook.codevectors[coffs + l ]; // FPMATH
  1152. vec[voffs + vlen] += codebook.codevectors[coffs + l + 1]; // FPMATH
  1153. av_dlog(NULL, " pass %d offs: %d curr: %f change: %f cv offs.: %d+%d \n",
  1154. pass, voffset / ch + (voffs % ch) * vlen,
  1155. vec[voffset / ch + (voffs % ch) * vlen],
  1156. codebook.codevectors[coffs + l], coffs, l);
  1157. }
  1158. }
  1159. } else if (vr_type == 2) {
  1160. voffs = voffset;
  1161. for (k = 0; k < step; ++k) {
  1162. coffs = get_vlc2(gb, codebook.vlc.table, codebook.nb_bits, 3) * dim;
  1163. for (l = 0; l < dim; ++l, ++voffs) {
  1164. vec[voffs / ch + (voffs % ch) * vlen] += codebook.codevectors[coffs + l]; // FPMATH FIXME use if and counter instead of / and %
  1165. av_dlog(NULL, " pass %d offs: %d curr: %f change: %f cv offs.: %d+%d \n",
  1166. pass, voffset / ch + (voffs % ch) * vlen,
  1167. vec[voffset / ch + (voffs % ch) * vlen],
  1168. codebook.codevectors[coffs + l], coffs, l);
  1169. }
  1170. }
  1171. }
  1172. }
  1173. }
  1174. j_times_ptns_to_read += ptns_to_read;
  1175. }
  1176. ++partition_count;
  1177. voffset += vr->partition_size;
  1178. }
  1179. }
  1180. }
  1181. return 0;
  1182. }
  1183. static inline int vorbis_residue_decode(vorbis_context *vc, vorbis_residue *vr,
  1184. unsigned ch,
  1185. uint8_t *do_not_decode,
  1186. float *vec, unsigned vlen)
  1187. {
  1188. if (vr->type == 2)
  1189. return vorbis_residue_decode_internal(vc, vr, ch, do_not_decode, vec, vlen, 2);
  1190. else if (vr->type == 1)
  1191. return vorbis_residue_decode_internal(vc, vr, ch, do_not_decode, vec, vlen, 1);
  1192. else if (vr->type == 0)
  1193. return vorbis_residue_decode_internal(vc, vr, ch, do_not_decode, vec, vlen, 0);
  1194. else {
  1195. av_log(vc->avccontext, AV_LOG_ERROR, " Invalid residue type while residue decode?! \n");
  1196. return AVERROR_INVALIDDATA;
  1197. }
  1198. }
  /**
   * Undo channel coupling in place on a magnitude/angle vector pair.
   *
   * For every index the pair (mag, ang) is replaced according to the signs
   * of both inputs:
   *   mag >  0, ang >  0:  ang = mag - ang
   *   mag >  0, ang <= 0:  ang = mag,  mag = mag + ang
   *   mag <= 0, ang >  0:  ang = ang + mag
   *   mag <= 0, ang <= 0:  ang = mag,  mag = mag - ang
   * (right-hand sides use the values read before the update).
   *
   * @param mag       magnitude vector, updated in place
   * @param ang       angle vector, updated in place
   * @param blocksize number of elements to process in each vector
   */
  void vorbis_inverse_coupling(float *mag, float *ang, int blocksize)
  {
      int n;

      for (n = 0; n < blocksize; n++) {
          const float m = mag[n];
          const float a = ang[n];

          if (m > 0.0) {
              if (a > 0.0) {
                  ang[n] = m - a;
              } else {
                  ang[n] = m;
                  mag[n] = m + a;
              }
          } else if (a > 0.0) {
              ang[n] = a + m;
          } else {
              ang[n] = m;
              mag[n] = m - a;
          }
      }
  }
  1222. // Decode the audio packet using the functions above
  1223. static int vorbis_parse_audio_packet(vorbis_context *vc)
  1224. {
  1225. GetBitContext *gb = &vc->gb;
  1226. FFTContext *mdct;
  1227. unsigned previous_window = vc->previous_window;
  1228. unsigned mode_number, blockflag, blocksize;
  1229. int i, j;
  1230. uint8_t no_residue[255];
  1231. uint8_t do_not_decode[255];
  1232. vorbis_mapping *mapping;
  1233. float *ch_res_ptr = vc->channel_residues;
  1234. float *ch_floor_ptr = vc->channel_floors;
  1235. uint8_t res_chan[255];
  1236. unsigned res_num = 0;
  1237. int retlen = 0;
  1238. if (get_bits1(gb)) {
  1239. av_log(vc->avccontext, AV_LOG_ERROR, "Not a Vorbis I audio packet.\n");
  1240. return AVERROR_INVALIDDATA; // packet type not audio
  1241. }
  1242. if (vc->mode_count == 1) {
  1243. mode_number = 0;
  1244. } else {
  1245. GET_VALIDATED_INDEX(mode_number, ilog(vc->mode_count-1), vc->mode_count)
  1246. }
  1247. vc->mode_number = mode_number;
  1248. mapping = &vc->mappings[vc->modes[mode_number].mapping];
  1249. av_dlog(NULL, " Mode number: %u , mapping: %d , blocktype %d\n", mode_number,
  1250. vc->modes[mode_number].mapping, vc->modes[mode_number].blockflag);
  1251. blockflag = vc->modes[mode_number].blockflag;
  1252. blocksize = vc->blocksize[blockflag];
  1253. if (blockflag)
  1254. skip_bits(gb, 2); // previous_window, next_window
  1255. memset(ch_res_ptr, 0, sizeof(float) * vc->audio_channels * blocksize / 2); //FIXME can this be removed ?
  1256. memset(ch_floor_ptr, 0, sizeof(float) * vc->audio_channels * blocksize / 2); //FIXME can this be removed ?
  1257. // Decode floor
  1258. for (i = 0; i < vc->audio_channels; ++i) {
  1259. vorbis_floor *floor;
  1260. int ret;
  1261. if (mapping->submaps > 1) {
  1262. floor = &vc->floors[mapping->submap_floor[mapping->mux[i]]];
  1263. } else {
  1264. floor = &vc->floors[mapping->submap_floor[0]];
  1265. }
  1266. ret = floor->decode(vc, &floor->data, ch_floor_ptr);
  1267. if (ret < 0) {
  1268. av_log(vc->avccontext, AV_LOG_ERROR, "Invalid codebook in vorbis_floor_decode.\n");
  1269. return AVERROR_INVALIDDATA;
  1270. }
  1271. no_residue[i] = ret;
  1272. ch_floor_ptr += blocksize / 2;
  1273. }
  1274. // Nonzero vector propagate
  1275. for (i = mapping->coupling_steps - 1; i >= 0; --i) {
  1276. if (!(no_residue[mapping->magnitude[i]] & no_residue[mapping->angle[i]])) {
  1277. no_residue[mapping->magnitude[i]] = 0;
  1278. no_residue[mapping->angle[i]] = 0;
  1279. }
  1280. }
  1281. // Decode residue
  1282. for (i = 0; i < mapping->submaps; ++i) {
  1283. vorbis_residue *residue;
  1284. unsigned ch = 0;
  1285. for (j = 0; j < vc->audio_channels; ++j) {
  1286. if ((mapping->submaps == 1) || (i == mapping->mux[j])) {
  1287. res_chan[j] = res_num;
  1288. if (no_residue[j]) {
  1289. do_not_decode[ch] = 1;
  1290. } else {
  1291. do_not_decode[ch] = 0;
  1292. }
  1293. ++ch;
  1294. ++res_num;
  1295. }
  1296. }
  1297. residue = &vc->residues[mapping->submap_residue[i]];
  1298. vorbis_residue_decode(vc, residue, ch, do_not_decode, ch_res_ptr, blocksize/2);
  1299. ch_res_ptr += ch * blocksize / 2;
  1300. }
  1301. // Inverse coupling
  1302. for (i = mapping->coupling_steps - 1; i >= 0; --i) { //warning: i has to be signed
  1303. float *mag, *ang;
  1304. mag = vc->channel_residues+res_chan[mapping->magnitude[i]] * blocksize / 2;
  1305. ang = vc->channel_residues+res_chan[mapping->angle[i]] * blocksize / 2;
  1306. vc->dsp.vorbis_inverse_coupling(mag, ang, blocksize / 2);
  1307. }
  1308. // Dotproduct, MDCT
  1309. mdct = &vc->mdct[blockflag];
  1310. for (j = vc->audio_channels-1;j >= 0; j--) {
  1311. ch_floor_ptr = vc->channel_floors + j * blocksize / 2;
  1312. ch_res_ptr = vc->channel_residues + res_chan[j] * blocksize / 2;
  1313. vc->dsp.vector_fmul(ch_floor_ptr, ch_floor_ptr, ch_res_ptr, blocksize / 2);
  1314. mdct->imdct_half(mdct, ch_res_ptr, ch_floor_ptr);
  1315. }
  1316. // Overlap/add, save data for next overlapping FPMATH
  1317. retlen = (blocksize + vc->blocksize[previous_window]) / 4;
  1318. for (j = 0; j < vc->audio_channels; j++) {
  1319. unsigned bs0 = vc->blocksize[0];
  1320. unsigned bs1 = vc->blocksize[1];
  1321. float *residue = vc->channel_residues + res_chan[j] * blocksize / 2;
  1322. float *saved = vc->saved + j * bs1 / 4;
  1323. float *ret = vc->channel_floors + j * retlen;
  1324. float *buf = residue;
  1325. const float *win = vc->win[blockflag & previous_window];
  1326. if (blockflag == previous_window) {
  1327. vc->dsp.vector_fmul_window(ret, saved, buf, win, blocksize / 4);
  1328. } else if (blockflag > previous_window) {
  1329. vc->dsp.vector_fmul_window(ret, saved, buf, win, bs0 / 4);
  1330. memcpy(ret+bs0/2, buf+bs0/4, ((bs1-bs0)/4) * sizeof(float));
  1331. } else {
  1332. memcpy(ret, saved, ((bs1 - bs0) / 4) * sizeof(float));
  1333. vc->dsp.vector_fmul_window(ret + (bs1 - bs0) / 4, saved + (bs1 - bs0) / 4, buf, win, bs0 / 4);
  1334. }
  1335. memcpy(saved, buf + blocksize / 4, blocksize / 4 * sizeof(float));
  1336. }
  1337. vc->previous_window = blockflag;
  1338. return retlen;
  1339. }
  1340. // Return the decoded audio packet through the standard api
  1341. static int vorbis_decode_frame(AVCodecContext *avccontext,
  1342. void *data, int *data_size,
  1343. AVPacket *avpkt)
  1344. {
  1345. const uint8_t *buf = avpkt->data;
  1346. int buf_size = avpkt->size;
  1347. vorbis_context *vc = avccontext->priv_data;
  1348. GetBitContext *gb = &(vc->gb);
  1349. const float *channel_ptrs[255];
  1350. int i, len, out_size;
  1351. av_dlog(NULL, "packet length %d \n", buf_size);
  1352. init_get_bits(gb, buf, buf_size*8);
  1353. if ((len = vorbis_parse_audio_packet(vc)) <= 0)
  1354. return len;
  1355. if (!vc->first_frame) {
  1356. vc->first_frame = 1;
  1357. *data_size = 0;
  1358. return buf_size;
  1359. }
  1360. av_dlog(NULL, "parsed %d bytes %d bits, returned %d samples (*ch*bits) \n",
  1361. get_bits_count(gb) / 8, get_bits_count(gb) % 8, len);
  1362. out_size = len * vc->audio_channels *
  1363. av_get_bytes_per_sample(avccontext->sample_fmt);
  1364. if (*data_size < out_size) {
  1365. av_log(avccontext, AV_LOG_ERROR, "output buffer is too small\n");
  1366. return AVERROR(EINVAL);
  1367. }
  1368. if (vc->audio_channels > 8) {
  1369. for (i = 0; i < vc->audio_channels; i++)
  1370. channel_ptrs[i] = vc->channel_floors + i * len;
  1371. } else {
  1372. for (i = 0; i < vc->audio_channels; i++)
  1373. channel_ptrs[i] = vc->channel_floors +
  1374. len * ff_vorbis_channel_layout_offsets[vc->audio_channels - 1][i];
  1375. }
  1376. if (avccontext->sample_fmt == AV_SAMPLE_FMT_FLT)
  1377. vc->fmt_conv.float_interleave(data, channel_ptrs, len, vc->audio_channels);
  1378. else
  1379. vc->fmt_conv.float_to_int16_interleave(data, channel_ptrs, len,
  1380. vc->audio_channels);
  1381. *data_size = out_size;
  1382. return buf_size;
  1383. }
  1384. // Close decoder
  1385. static av_cold int vorbis_decode_close(AVCodecContext *avccontext)
  1386. {
  1387. vorbis_context *vc = avccontext->priv_data;
  1388. vorbis_free(vc);
  1389. return 0;
  1390. }
  1391. AVCodec ff_vorbis_decoder = {
  1392. .name = "vorbis",
  1393. .type = AVMEDIA_TYPE_AUDIO,
  1394. .id = CODEC_ID_VORBIS,
  1395. .priv_data_size = sizeof(vorbis_context),
  1396. .init = vorbis_decode_init,
  1397. .close = vorbis_decode_close,
  1398. .decode = vorbis_decode_frame,
  1399. .long_name = NULL_IF_CONFIG_SMALL("Vorbis"),
  1400. .channel_layouts = ff_vorbis_channel_layouts,
  1401. .sample_fmts = (const enum AVSampleFormat[]) {
  1402. AV_SAMPLE_FMT_FLT, AV_SAMPLE_FMT_S16, AV_SAMPLE_FMT_NONE
  1403. },
  1404. };