You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

1697 lines
63KB

  1. /*
  2. * This file is part of Libav.
  3. *
  4. * Libav is free software; you can redistribute it and/or
  5. * modify it under the terms of the GNU Lesser General Public
  6. * License as published by the Free Software Foundation; either
  7. * version 2.1 of the License, or (at your option) any later version.
  8. *
  9. * Libav is distributed in the hope that it will be useful,
  10. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  11. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  12. * Lesser General Public License for more details.
  13. *
  14. * You should have received a copy of the GNU Lesser General Public
  15. * License along with Libav; if not, write to the Free Software
  16. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  17. */
  18. /**
  19. * @file
  20. * Vorbis I decoder
  21. * @author Denes Balatoni ( dbalatoni programozo hu )
  22. */
  23. #include <inttypes.h>
  24. #include <math.h>
  25. #define ALT_BITSTREAM_READER_LE
  26. #include "avcodec.h"
  27. #include "get_bits.h"
  28. #include "dsputil.h"
  29. #include "fft.h"
  30. #include "fmtconvert.h"
  31. #include "vorbis.h"
  32. #include "xiph.h"
  33. #define V_NB_BITS 8
  34. #define V_NB_BITS2 11
  35. #define V_MAX_VLCS (1 << 16)
  36. #define V_MAX_PARTITIONS (1 << 20)
  37. #undef NDEBUG
  38. #include <assert.h>
  39. typedef struct {
  40. uint8_t dimensions;
  41. uint8_t lookup_type;
  42. uint8_t maxdepth;
  43. VLC vlc;
  44. float *codevectors;
  45. unsigned int nb_bits;
  46. } vorbis_codebook;
  47. typedef union vorbis_floor_u vorbis_floor_data;
  48. typedef struct vorbis_floor0_s vorbis_floor0;
  49. typedef struct vorbis_floor1_s vorbis_floor1;
  50. struct vorbis_context_s;
  51. typedef
  52. int (* vorbis_floor_decode_func)
  53. (struct vorbis_context_s *, vorbis_floor_data *, float *);
  54. typedef struct {
  55. uint8_t floor_type;
  56. vorbis_floor_decode_func decode;
  57. union vorbis_floor_u {
  58. struct vorbis_floor0_s {
  59. uint8_t order;
  60. uint16_t rate;
  61. uint16_t bark_map_size;
  62. int32_t *map[2];
  63. uint32_t map_size[2];
  64. uint8_t amplitude_bits;
  65. uint8_t amplitude_offset;
  66. uint8_t num_books;
  67. uint8_t *book_list;
  68. float *lsp;
  69. } t0;
  70. struct vorbis_floor1_s {
  71. uint8_t partitions;
  72. uint8_t partition_class[32];
  73. uint8_t class_dimensions[16];
  74. uint8_t class_subclasses[16];
  75. uint8_t class_masterbook[16];
  76. int16_t subclass_books[16][8];
  77. uint8_t multiplier;
  78. uint16_t x_list_dim;
  79. vorbis_floor1_entry *list;
  80. } t1;
  81. } data;
  82. } vorbis_floor;
  83. typedef struct {
  84. uint16_t type;
  85. uint32_t begin;
  86. uint32_t end;
  87. unsigned partition_size;
  88. uint8_t classifications;
  89. uint8_t classbook;
  90. int16_t books[64][8];
  91. uint8_t maxpass;
  92. uint16_t ptns_to_read;
  93. uint8_t *classifs;
  94. } vorbis_residue;
  95. typedef struct {
  96. uint8_t submaps;
  97. uint16_t coupling_steps;
  98. uint8_t *magnitude;
  99. uint8_t *angle;
  100. uint8_t *mux;
  101. uint8_t submap_floor[16];
  102. uint8_t submap_residue[16];
  103. } vorbis_mapping;
  104. typedef struct {
  105. uint8_t blockflag;
  106. uint16_t windowtype;
  107. uint16_t transformtype;
  108. uint8_t mapping;
  109. } vorbis_mode;
  110. typedef struct vorbis_context_s {
  111. AVCodecContext *avccontext;
  112. GetBitContext gb;
  113. DSPContext dsp;
  114. FmtConvertContext fmt_conv;
  115. FFTContext mdct[2];
  116. uint8_t first_frame;
  117. uint32_t version;
  118. uint8_t audio_channels;
  119. uint32_t audio_samplerate;
  120. uint32_t bitrate_maximum;
  121. uint32_t bitrate_nominal;
  122. uint32_t bitrate_minimum;
  123. uint32_t blocksize[2];
  124. const float *win[2];
  125. uint16_t codebook_count;
  126. vorbis_codebook *codebooks;
  127. uint8_t floor_count;
  128. vorbis_floor *floors;
  129. uint8_t residue_count;
  130. vorbis_residue *residues;
  131. uint8_t mapping_count;
  132. vorbis_mapping *mappings;
  133. uint8_t mode_count;
  134. vorbis_mode *modes;
  135. uint8_t mode_number; // mode number for the current packet
  136. uint8_t previous_window;
  137. float *channel_residues;
  138. float *channel_floors;
  139. float *saved;
  140. float scale_bias; // for float->int conversion
  141. } vorbis_context;
  142. /* Helper functions */
  143. #define BARK(x) \
  144. (13.1f * atan(0.00074f * (x)) + 2.24f * atan(1.85e-8f * (x) * (x)) + 1e-4f * (x))
  145. static const char idx_err_str[] = "Index value %d out of range (0 - %d) for %s at %s:%i\n";
  146. #define VALIDATE_INDEX(idx, limit) \
  147. if (idx >= limit) {\
  148. av_log(vc->avccontext, AV_LOG_ERROR,\
  149. idx_err_str,\
  150. (int)(idx), (int)(limit - 1), #idx, __FILE__, __LINE__);\
  151. return AVERROR_INVALIDDATA;\
  152. }
  153. #define GET_VALIDATED_INDEX(idx, bits, limit) \
  154. {\
  155. idx = get_bits(gb, bits);\
  156. VALIDATE_INDEX(idx, limit)\
  157. }
  158. static float vorbisfloat2float(unsigned val)
  159. {
  160. double mant = val & 0x1fffff;
  161. long exp = (val & 0x7fe00000L) >> 21;
  162. if (val & 0x80000000)
  163. mant = -mant;
  164. return ldexp(mant, exp - 20 - 768);
  165. }
  166. // Free all allocated memory -----------------------------------------
  167. static void vorbis_free(vorbis_context *vc)
  168. {
  169. int i;
  170. av_freep(&vc->channel_residues);
  171. av_freep(&vc->channel_floors);
  172. av_freep(&vc->saved);
  173. for (i = 0; i < vc->residue_count; i++)
  174. av_free(vc->residues[i].classifs);
  175. av_freep(&vc->residues);
  176. av_freep(&vc->modes);
  177. ff_mdct_end(&vc->mdct[0]);
  178. ff_mdct_end(&vc->mdct[1]);
  179. for (i = 0; i < vc->codebook_count; ++i) {
  180. av_free(vc->codebooks[i].codevectors);
  181. free_vlc(&vc->codebooks[i].vlc);
  182. }
  183. av_freep(&vc->codebooks);
  184. for (i = 0; i < vc->floor_count; ++i) {
  185. if (vc->floors[i].floor_type == 0) {
  186. av_free(vc->floors[i].data.t0.map[0]);
  187. av_free(vc->floors[i].data.t0.map[1]);
  188. av_free(vc->floors[i].data.t0.book_list);
  189. av_free(vc->floors[i].data.t0.lsp);
  190. } else {
  191. av_free(vc->floors[i].data.t1.list);
  192. }
  193. }
  194. av_freep(&vc->floors);
  195. for (i = 0; i < vc->mapping_count; ++i) {
  196. av_free(vc->mappings[i].magnitude);
  197. av_free(vc->mappings[i].angle);
  198. av_free(vc->mappings[i].mux);
  199. }
  200. av_freep(&vc->mappings);
  201. }
  202. // Parse setup header -------------------------------------------------
  203. // Process codebooks part
  204. static int vorbis_parse_setup_hdr_codebooks(vorbis_context *vc)
  205. {
  206. unsigned cb;
  207. uint8_t *tmp_vlc_bits;
  208. uint32_t *tmp_vlc_codes;
  209. GetBitContext *gb = &vc->gb;
  210. uint16_t *codebook_multiplicands;
  211. int ret = 0;
  212. vc->codebook_count = get_bits(gb, 8) + 1;
  213. av_dlog(NULL, " Codebooks: %d \n", vc->codebook_count);
  214. vc->codebooks = av_mallocz(vc->codebook_count * sizeof(*vc->codebooks));
  215. tmp_vlc_bits = av_mallocz(V_MAX_VLCS * sizeof(*tmp_vlc_bits));
  216. tmp_vlc_codes = av_mallocz(V_MAX_VLCS * sizeof(*tmp_vlc_codes));
  217. codebook_multiplicands = av_malloc(V_MAX_VLCS * sizeof(*codebook_multiplicands));
  218. for (cb = 0; cb < vc->codebook_count; ++cb) {
  219. vorbis_codebook *codebook_setup = &vc->codebooks[cb];
  220. unsigned ordered, t, entries, used_entries = 0;
  221. av_dlog(NULL, " %u. Codebook\n", cb);
  222. if (get_bits(gb, 24) != 0x564342) {
  223. av_log(vc->avccontext, AV_LOG_ERROR,
  224. " %u. Codebook setup data corrupt.\n", cb);
  225. ret = AVERROR_INVALIDDATA;
  226. goto error;
  227. }
  228. codebook_setup->dimensions=get_bits(gb, 16);
  229. if (codebook_setup->dimensions > 16 || codebook_setup->dimensions == 0) {
  230. av_log(vc->avccontext, AV_LOG_ERROR,
  231. " %u. Codebook's dimension is invalid (%d).\n",
  232. cb, codebook_setup->dimensions);
  233. ret = AVERROR_INVALIDDATA;
  234. goto error;
  235. }
  236. entries = get_bits(gb, 24);
  237. if (entries > V_MAX_VLCS) {
  238. av_log(vc->avccontext, AV_LOG_ERROR,
  239. " %u. Codebook has too many entries (%u).\n",
  240. cb, entries);
  241. ret = AVERROR_INVALIDDATA;
  242. goto error;
  243. }
  244. ordered = get_bits1(gb);
  245. av_dlog(NULL, " codebook_dimensions %d, codebook_entries %u\n",
  246. codebook_setup->dimensions, entries);
  247. if (!ordered) {
  248. unsigned ce, flag;
  249. unsigned sparse = get_bits1(gb);
  250. av_dlog(NULL, " not ordered \n");
  251. if (sparse) {
  252. av_dlog(NULL, " sparse \n");
  253. used_entries = 0;
  254. for (ce = 0; ce < entries; ++ce) {
  255. flag = get_bits1(gb);
  256. if (flag) {
  257. tmp_vlc_bits[ce] = get_bits(gb, 5) + 1;
  258. ++used_entries;
  259. } else
  260. tmp_vlc_bits[ce] = 0;
  261. }
  262. } else {
  263. av_dlog(NULL, " not sparse \n");
  264. used_entries = entries;
  265. for (ce = 0; ce < entries; ++ce)
  266. tmp_vlc_bits[ce] = get_bits(gb, 5) + 1;
  267. }
  268. } else {
  269. unsigned current_entry = 0;
  270. unsigned current_length = get_bits(gb, 5) + 1;
  271. av_dlog(NULL, " ordered, current length: %u\n", current_length); //FIXME
  272. used_entries = entries;
  273. for (; current_entry < used_entries && current_length <= 32; ++current_length) {
  274. unsigned i, number;
  275. av_dlog(NULL, " number bits: %u ", ilog(entries - current_entry));
  276. number = get_bits(gb, ilog(entries - current_entry));
  277. av_dlog(NULL, " number: %u\n", number);
  278. for (i = current_entry; i < number+current_entry; ++i)
  279. if (i < used_entries)
  280. tmp_vlc_bits[i] = current_length;
  281. current_entry+=number;
  282. }
  283. if (current_entry>used_entries) {
  284. av_log(vc->avccontext, AV_LOG_ERROR, " More codelengths than codes in codebook. \n");
  285. ret = AVERROR_INVALIDDATA;
  286. goto error;
  287. }
  288. }
  289. codebook_setup->lookup_type = get_bits(gb, 4);
  290. av_dlog(NULL, " lookup type: %d : %s \n", codebook_setup->lookup_type,
  291. codebook_setup->lookup_type ? "vq" : "no lookup");
  292. // If the codebook is used for (inverse) VQ, calculate codevectors.
  293. if (codebook_setup->lookup_type == 1) {
  294. unsigned i, j, k;
  295. unsigned codebook_lookup_values = ff_vorbis_nth_root(entries, codebook_setup->dimensions);
  296. float codebook_minimum_value = vorbisfloat2float(get_bits_long(gb, 32));
  297. float codebook_delta_value = vorbisfloat2float(get_bits_long(gb, 32));
  298. unsigned codebook_value_bits = get_bits(gb, 4) + 1;
  299. unsigned codebook_sequence_p = get_bits1(gb);
  300. av_dlog(NULL, " We expect %d numbers for building the codevectors. \n",
  301. codebook_lookup_values);
  302. av_dlog(NULL, " delta %f minmum %f \n",
  303. codebook_delta_value, codebook_minimum_value);
  304. for (i = 0; i < codebook_lookup_values; ++i) {
  305. codebook_multiplicands[i] = get_bits(gb, codebook_value_bits);
  306. av_dlog(NULL, " multiplicands*delta+minmum : %e \n",
  307. (float)codebook_multiplicands[i] * codebook_delta_value + codebook_minimum_value);
  308. av_dlog(NULL, " multiplicand %u\n", codebook_multiplicands[i]);
  309. }
  310. // Weed out unused vlcs and build codevector vector
  311. codebook_setup->codevectors = used_entries ? av_mallocz(used_entries *
  312. codebook_setup->dimensions *
  313. sizeof(*codebook_setup->codevectors))
  314. : NULL;
  315. for (j = 0, i = 0; i < entries; ++i) {
  316. unsigned dim = codebook_setup->dimensions;
  317. if (tmp_vlc_bits[i]) {
  318. float last = 0.0;
  319. unsigned lookup_offset = i;
  320. av_dlog(vc->avccontext, "Lookup offset %u ,", i);
  321. for (k = 0; k < dim; ++k) {
  322. unsigned multiplicand_offset = lookup_offset % codebook_lookup_values;
  323. codebook_setup->codevectors[j * dim + k] = codebook_multiplicands[multiplicand_offset] * codebook_delta_value + codebook_minimum_value + last;
  324. if (codebook_sequence_p)
  325. last = codebook_setup->codevectors[j * dim + k];
  326. lookup_offset/=codebook_lookup_values;
  327. }
  328. tmp_vlc_bits[j] = tmp_vlc_bits[i];
  329. av_dlog(vc->avccontext, "real lookup offset %u, vector: ", j);
  330. for (k = 0; k < dim; ++k)
  331. av_dlog(vc->avccontext, " %f ",
  332. codebook_setup->codevectors[j * dim + k]);
  333. av_dlog(vc->avccontext, "\n");
  334. ++j;
  335. }
  336. }
  337. if (j != used_entries) {
  338. av_log(vc->avccontext, AV_LOG_ERROR, "Bug in codevector vector building code. \n");
  339. ret = AVERROR_INVALIDDATA;
  340. goto error;
  341. }
  342. entries = used_entries;
  343. } else if (codebook_setup->lookup_type >= 2) {
  344. av_log(vc->avccontext, AV_LOG_ERROR, "Codebook lookup type not supported. \n");
  345. ret = AVERROR_INVALIDDATA;
  346. goto error;
  347. }
  348. // Initialize VLC table
  349. if (ff_vorbis_len2vlc(tmp_vlc_bits, tmp_vlc_codes, entries)) {
  350. av_log(vc->avccontext, AV_LOG_ERROR, " Invalid code lengths while generating vlcs. \n");
  351. ret = AVERROR_INVALIDDATA;
  352. goto error;
  353. }
  354. codebook_setup->maxdepth = 0;
  355. for (t = 0; t < entries; ++t)
  356. if (tmp_vlc_bits[t] >= codebook_setup->maxdepth)
  357. codebook_setup->maxdepth = tmp_vlc_bits[t];
  358. if (codebook_setup->maxdepth > 3 * V_NB_BITS)
  359. codebook_setup->nb_bits = V_NB_BITS2;
  360. else
  361. codebook_setup->nb_bits = V_NB_BITS;
  362. codebook_setup->maxdepth = (codebook_setup->maxdepth+codebook_setup->nb_bits - 1) / codebook_setup->nb_bits;
  363. if ((ret = init_vlc(&codebook_setup->vlc, codebook_setup->nb_bits,
  364. entries, tmp_vlc_bits, sizeof(*tmp_vlc_bits),
  365. sizeof(*tmp_vlc_bits), tmp_vlc_codes,
  366. sizeof(*tmp_vlc_codes), sizeof(*tmp_vlc_codes),
  367. INIT_VLC_LE))) {
  368. av_log(vc->avccontext, AV_LOG_ERROR, " Error generating vlc tables. \n");
  369. goto error;
  370. }
  371. }
  372. av_free(tmp_vlc_bits);
  373. av_free(tmp_vlc_codes);
  374. av_free(codebook_multiplicands);
  375. return 0;
  376. // Error:
  377. error:
  378. av_free(tmp_vlc_bits);
  379. av_free(tmp_vlc_codes);
  380. av_free(codebook_multiplicands);
  381. return ret;
  382. }
  383. // Process time domain transforms part (unused in Vorbis I)
  384. static int vorbis_parse_setup_hdr_tdtransforms(vorbis_context *vc)
  385. {
  386. GetBitContext *gb = &vc->gb;
  387. unsigned i, vorbis_time_count = get_bits(gb, 6) + 1;
  388. for (i = 0; i < vorbis_time_count; ++i) {
  389. unsigned vorbis_tdtransform = get_bits(gb, 16);
  390. av_dlog(NULL, " Vorbis time domain transform %u: %u\n",
  391. vorbis_time_count, vorbis_tdtransform);
  392. if (vorbis_tdtransform) {
  393. av_log(vc->avccontext, AV_LOG_ERROR, "Vorbis time domain transform data nonzero. \n");
  394. return AVERROR_INVALIDDATA;
  395. }
  396. }
  397. return 0;
  398. }
  399. // Process floors part
  400. static int vorbis_floor0_decode(vorbis_context *vc,
  401. vorbis_floor_data *vfu, float *vec);
  402. static void create_map(vorbis_context *vc, unsigned floor_number);
  403. static int vorbis_floor1_decode(vorbis_context *vc,
  404. vorbis_floor_data *vfu, float *vec);
  405. static int vorbis_parse_setup_hdr_floors(vorbis_context *vc)
  406. {
  407. GetBitContext *gb = &vc->gb;
  408. int i,j,k;
  409. vc->floor_count = get_bits(gb, 6) + 1;
  410. vc->floors = av_mallocz(vc->floor_count * sizeof(*vc->floors));
  411. for (i = 0; i < vc->floor_count; ++i) {
  412. vorbis_floor *floor_setup = &vc->floors[i];
  413. floor_setup->floor_type = get_bits(gb, 16);
  414. av_dlog(NULL, " %d. floor type %d \n", i, floor_setup->floor_type);
  415. if (floor_setup->floor_type == 1) {
  416. int maximum_class = -1;
  417. unsigned rangebits, rangemax, floor1_values = 2;
  418. floor_setup->decode = vorbis_floor1_decode;
  419. floor_setup->data.t1.partitions = get_bits(gb, 5);
  420. av_dlog(NULL, " %d.floor: %d partitions \n",
  421. i, floor_setup->data.t1.partitions);
  422. for (j = 0; j < floor_setup->data.t1.partitions; ++j) {
  423. floor_setup->data.t1.partition_class[j] = get_bits(gb, 4);
  424. if (floor_setup->data.t1.partition_class[j] > maximum_class)
  425. maximum_class = floor_setup->data.t1.partition_class[j];
  426. av_dlog(NULL, " %d. floor %d partition class %d \n",
  427. i, j, floor_setup->data.t1.partition_class[j]);
  428. }
  429. av_dlog(NULL, " maximum class %d \n", maximum_class);
  430. for (j = 0; j <= maximum_class; ++j) {
  431. floor_setup->data.t1.class_dimensions[j] = get_bits(gb, 3) + 1;
  432. floor_setup->data.t1.class_subclasses[j] = get_bits(gb, 2);
  433. av_dlog(NULL, " %d floor %d class dim: %d subclasses %d \n", i, j,
  434. floor_setup->data.t1.class_dimensions[j],
  435. floor_setup->data.t1.class_subclasses[j]);
  436. if (floor_setup->data.t1.class_subclasses[j]) {
  437. GET_VALIDATED_INDEX(floor_setup->data.t1.class_masterbook[j], 8, vc->codebook_count)
  438. av_dlog(NULL, " masterbook: %d \n", floor_setup->data.t1.class_masterbook[j]);
  439. }
  440. for (k = 0; k < (1 << floor_setup->data.t1.class_subclasses[j]); ++k) {
  441. int16_t bits = get_bits(gb, 8) - 1;
  442. if (bits != -1)
  443. VALIDATE_INDEX(bits, vc->codebook_count)
  444. floor_setup->data.t1.subclass_books[j][k] = bits;
  445. av_dlog(NULL, " book %d. : %d \n", k, floor_setup->data.t1.subclass_books[j][k]);
  446. }
  447. }
  448. floor_setup->data.t1.multiplier = get_bits(gb, 2) + 1;
  449. floor_setup->data.t1.x_list_dim = 2;
  450. for (j = 0; j < floor_setup->data.t1.partitions; ++j)
  451. floor_setup->data.t1.x_list_dim+=floor_setup->data.t1.class_dimensions[floor_setup->data.t1.partition_class[j]];
  452. floor_setup->data.t1.list = av_mallocz(floor_setup->data.t1.x_list_dim *
  453. sizeof(*floor_setup->data.t1.list));
  454. rangebits = get_bits(gb, 4);
  455. rangemax = (1 << rangebits);
  456. if (rangemax > vc->blocksize[1] / 2) {
  457. av_log(vc->avccontext, AV_LOG_ERROR,
  458. "Floor value is too large for blocksize: %u (%"PRIu32")\n",
  459. rangemax, vc->blocksize[1] / 2);
  460. return AVERROR_INVALIDDATA;
  461. }
  462. floor_setup->data.t1.list[0].x = 0;
  463. floor_setup->data.t1.list[1].x = rangemax;
  464. for (j = 0; j < floor_setup->data.t1.partitions; ++j) {
  465. for (k = 0; k < floor_setup->data.t1.class_dimensions[floor_setup->data.t1.partition_class[j]]; ++k, ++floor1_values) {
  466. floor_setup->data.t1.list[floor1_values].x = get_bits(gb, rangebits);
  467. av_dlog(NULL, " %u. floor1 Y coord. %d\n", floor1_values,
  468. floor_setup->data.t1.list[floor1_values].x);
  469. }
  470. }
  471. // Precalculate order of x coordinates - needed for decode
  472. ff_vorbis_ready_floor1_list(floor_setup->data.t1.list, floor_setup->data.t1.x_list_dim);
  473. } else if (floor_setup->floor_type == 0) {
  474. unsigned max_codebook_dim = 0;
  475. floor_setup->decode = vorbis_floor0_decode;
  476. floor_setup->data.t0.order = get_bits(gb, 8);
  477. floor_setup->data.t0.rate = get_bits(gb, 16);
  478. floor_setup->data.t0.bark_map_size = get_bits(gb, 16);
  479. floor_setup->data.t0.amplitude_bits = get_bits(gb, 6);
  480. /* zero would result in a div by zero later *
  481. * 2^0 - 1 == 0 */
  482. if (floor_setup->data.t0.amplitude_bits == 0) {
  483. av_log(vc->avccontext, AV_LOG_ERROR,
  484. "Floor 0 amplitude bits is 0.\n");
  485. return AVERROR_INVALIDDATA;
  486. }
  487. floor_setup->data.t0.amplitude_offset = get_bits(gb, 8);
  488. floor_setup->data.t0.num_books = get_bits(gb, 4) + 1;
  489. /* allocate mem for booklist */
  490. floor_setup->data.t0.book_list =
  491. av_malloc(floor_setup->data.t0.num_books);
  492. if (!floor_setup->data.t0.book_list)
  493. return AVERROR(ENOMEM);
  494. /* read book indexes */
  495. {
  496. int idx;
  497. unsigned book_idx;
  498. for (idx = 0; idx < floor_setup->data.t0.num_books; ++idx) {
  499. GET_VALIDATED_INDEX(book_idx, 8, vc->codebook_count)
  500. floor_setup->data.t0.book_list[idx] = book_idx;
  501. if (vc->codebooks[book_idx].dimensions > max_codebook_dim)
  502. max_codebook_dim = vc->codebooks[book_idx].dimensions;
  503. }
  504. }
  505. create_map(vc, i);
  506. /* codebook dim is for padding if codebook dim doesn't *
  507. * divide order+1 then we need to read more data */
  508. floor_setup->data.t0.lsp =
  509. av_malloc((floor_setup->data.t0.order + 1 + max_codebook_dim)
  510. * sizeof(*floor_setup->data.t0.lsp));
  511. if (!floor_setup->data.t0.lsp)
  512. return AVERROR(ENOMEM);
  513. /* debug output parsed headers */
  514. av_dlog(NULL, "floor0 order: %u\n", floor_setup->data.t0.order);
  515. av_dlog(NULL, "floor0 rate: %u\n", floor_setup->data.t0.rate);
  516. av_dlog(NULL, "floor0 bark map size: %u\n",
  517. floor_setup->data.t0.bark_map_size);
  518. av_dlog(NULL, "floor0 amplitude bits: %u\n",
  519. floor_setup->data.t0.amplitude_bits);
  520. av_dlog(NULL, "floor0 amplitude offset: %u\n",
  521. floor_setup->data.t0.amplitude_offset);
  522. av_dlog(NULL, "floor0 number of books: %u\n",
  523. floor_setup->data.t0.num_books);
  524. av_dlog(NULL, "floor0 book list pointer: %p\n",
  525. floor_setup->data.t0.book_list);
  526. {
  527. int idx;
  528. for (idx = 0; idx < floor_setup->data.t0.num_books; ++idx) {
  529. av_dlog(NULL, " Book %d: %u\n", idx + 1,
  530. floor_setup->data.t0.book_list[idx]);
  531. }
  532. }
  533. } else {
  534. av_log(vc->avccontext, AV_LOG_ERROR, "Invalid floor type!\n");
  535. return AVERROR_INVALIDDATA;
  536. }
  537. }
  538. return 0;
  539. }
  540. // Process residues part
  541. static int vorbis_parse_setup_hdr_residues(vorbis_context *vc)
  542. {
  543. GetBitContext *gb = &vc->gb;
  544. unsigned i, j, k;
  545. vc->residue_count = get_bits(gb, 6)+1;
  546. vc->residues = av_mallocz(vc->residue_count * sizeof(*vc->residues));
  547. av_dlog(NULL, " There are %d residues. \n", vc->residue_count);
  548. for (i = 0; i < vc->residue_count; ++i) {
  549. vorbis_residue *res_setup = &vc->residues[i];
  550. uint8_t cascade[64];
  551. unsigned high_bits, low_bits;
  552. res_setup->type = get_bits(gb, 16);
  553. av_dlog(NULL, " %u. residue type %d\n", i, res_setup->type);
  554. res_setup->begin = get_bits(gb, 24);
  555. res_setup->end = get_bits(gb, 24);
  556. res_setup->partition_size = get_bits(gb, 24) + 1;
  557. /* Validations to prevent a buffer overflow later. */
  558. if (res_setup->begin>res_setup->end ||
  559. res_setup->end > vc->avccontext->channels * vc->blocksize[1] / 2 ||
  560. (res_setup->end-res_setup->begin) / res_setup->partition_size > V_MAX_PARTITIONS) {
  561. av_log(vc->avccontext, AV_LOG_ERROR,
  562. "partition out of bounds: type, begin, end, size, blocksize: %"PRIu16", %"PRIu32", %"PRIu32", %u, %"PRIu32"\n",
  563. res_setup->type, res_setup->begin, res_setup->end,
  564. res_setup->partition_size, vc->blocksize[1] / 2);
  565. return AVERROR_INVALIDDATA;
  566. }
  567. res_setup->classifications = get_bits(gb, 6) + 1;
  568. GET_VALIDATED_INDEX(res_setup->classbook, 8, vc->codebook_count)
  569. res_setup->ptns_to_read =
  570. (res_setup->end - res_setup->begin) / res_setup->partition_size;
  571. res_setup->classifs = av_malloc(res_setup->ptns_to_read *
  572. vc->audio_channels *
  573. sizeof(*res_setup->classifs));
  574. if (!res_setup->classifs)
  575. return AVERROR(ENOMEM);
  576. av_dlog(NULL, " begin %d end %d part.size %d classif.s %d classbook %d \n",
  577. res_setup->begin, res_setup->end, res_setup->partition_size,
  578. res_setup->classifications, res_setup->classbook);
  579. for (j = 0; j < res_setup->classifications; ++j) {
  580. high_bits = 0;
  581. low_bits = get_bits(gb, 3);
  582. if (get_bits1(gb))
  583. high_bits = get_bits(gb, 5);
  584. cascade[j] = (high_bits << 3) + low_bits;
  585. av_dlog(NULL, " %u class cascade depth: %d\n", j, ilog(cascade[j]));
  586. }
  587. res_setup->maxpass = 0;
  588. for (j = 0; j < res_setup->classifications; ++j) {
  589. for (k = 0; k < 8; ++k) {
  590. if (cascade[j]&(1 << k)) {
  591. GET_VALIDATED_INDEX(res_setup->books[j][k], 8, vc->codebook_count)
  592. av_dlog(NULL, " %u class cascade depth %u book: %d\n",
  593. j, k, res_setup->books[j][k]);
  594. if (k>res_setup->maxpass)
  595. res_setup->maxpass = k;
  596. } else {
  597. res_setup->books[j][k] = -1;
  598. }
  599. }
  600. }
  601. }
  602. return 0;
  603. }
  604. // Process mappings part
  605. static int vorbis_parse_setup_hdr_mappings(vorbis_context *vc)
  606. {
  607. GetBitContext *gb = &vc->gb;
  608. unsigned i, j;
  609. vc->mapping_count = get_bits(gb, 6)+1;
  610. vc->mappings = av_mallocz(vc->mapping_count * sizeof(*vc->mappings));
  611. av_dlog(NULL, " There are %d mappings. \n", vc->mapping_count);
  612. for (i = 0; i < vc->mapping_count; ++i) {
  613. vorbis_mapping *mapping_setup = &vc->mappings[i];
  614. if (get_bits(gb, 16)) {
  615. av_log(vc->avccontext, AV_LOG_ERROR, "Other mappings than type 0 are not compliant with the Vorbis I specification. \n");
  616. return AVERROR_INVALIDDATA;
  617. }
  618. if (get_bits1(gb)) {
  619. mapping_setup->submaps = get_bits(gb, 4) + 1;
  620. } else {
  621. mapping_setup->submaps = 1;
  622. }
  623. if (get_bits1(gb)) {
  624. mapping_setup->coupling_steps = get_bits(gb, 8) + 1;
  625. mapping_setup->magnitude = av_mallocz(mapping_setup->coupling_steps *
  626. sizeof(*mapping_setup->magnitude));
  627. mapping_setup->angle = av_mallocz(mapping_setup->coupling_steps *
  628. sizeof(*mapping_setup->angle));
  629. for (j = 0; j < mapping_setup->coupling_steps; ++j) {
  630. GET_VALIDATED_INDEX(mapping_setup->magnitude[j], ilog(vc->audio_channels - 1), vc->audio_channels)
  631. GET_VALIDATED_INDEX(mapping_setup->angle[j], ilog(vc->audio_channels - 1), vc->audio_channels)
  632. }
  633. } else {
  634. mapping_setup->coupling_steps = 0;
  635. }
  636. av_dlog(NULL, " %u mapping coupling steps: %d\n",
  637. i, mapping_setup->coupling_steps);
  638. if (get_bits(gb, 2)) {
  639. av_log(vc->avccontext, AV_LOG_ERROR, "%u. mapping setup data invalid.\n", i);
  640. return AVERROR_INVALIDDATA; // following spec.
  641. }
  642. if (mapping_setup->submaps>1) {
  643. mapping_setup->mux = av_mallocz(vc->audio_channels *
  644. sizeof(*mapping_setup->mux));
  645. for (j = 0; j < vc->audio_channels; ++j)
  646. mapping_setup->mux[j] = get_bits(gb, 4);
  647. }
  648. for (j = 0; j < mapping_setup->submaps; ++j) {
  649. skip_bits(gb, 8); // FIXME check?
  650. GET_VALIDATED_INDEX(mapping_setup->submap_floor[j], 8, vc->floor_count)
  651. GET_VALIDATED_INDEX(mapping_setup->submap_residue[j], 8, vc->residue_count)
  652. av_dlog(NULL, " %u mapping %u submap : floor %d, residue %d\n", i, j,
  653. mapping_setup->submap_floor[j],
  654. mapping_setup->submap_residue[j]);
  655. }
  656. }
  657. return 0;
  658. }
  659. // Process modes part
  660. static void create_map(vorbis_context *vc, unsigned floor_number)
  661. {
  662. vorbis_floor *floors = vc->floors;
  663. vorbis_floor0 *vf;
  664. int idx;
  665. int blockflag, n;
  666. int32_t *map;
  667. for (blockflag = 0; blockflag < 2; ++blockflag) {
  668. n = vc->blocksize[blockflag] / 2;
  669. floors[floor_number].data.t0.map[blockflag] =
  670. av_malloc((n + 1) * sizeof(int32_t)); // n + sentinel
  671. map = floors[floor_number].data.t0.map[blockflag];
  672. vf = &floors[floor_number].data.t0;
  673. for (idx = 0; idx < n; ++idx) {
  674. map[idx] = floor(BARK((vf->rate * idx) / (2.0f * n)) *
  675. ((vf->bark_map_size) /
  676. BARK(vf->rate / 2.0f)));
  677. if (vf->bark_map_size-1 < map[idx])
  678. map[idx] = vf->bark_map_size - 1;
  679. }
  680. map[n] = -1;
  681. vf->map_size[blockflag] = n;
  682. }
  683. for (idx = 0; idx <= n; ++idx) {
  684. av_dlog(NULL, "floor0 map: map at pos %d is %d\n", idx, map[idx]);
  685. }
  686. }
  687. static int vorbis_parse_setup_hdr_modes(vorbis_context *vc)
  688. {
  689. GetBitContext *gb = &vc->gb;
  690. unsigned i;
  691. vc->mode_count = get_bits(gb, 6) + 1;
  692. vc->modes = av_mallocz(vc->mode_count * sizeof(*vc->modes));
  693. av_dlog(NULL, " There are %d modes.\n", vc->mode_count);
  694. for (i = 0; i < vc->mode_count; ++i) {
  695. vorbis_mode *mode_setup = &vc->modes[i];
  696. mode_setup->blockflag = get_bits1(gb);
  697. mode_setup->windowtype = get_bits(gb, 16); //FIXME check
  698. mode_setup->transformtype = get_bits(gb, 16); //FIXME check
  699. GET_VALIDATED_INDEX(mode_setup->mapping, 8, vc->mapping_count);
  700. av_dlog(NULL, " %u mode: blockflag %d, windowtype %d, transformtype %d, mapping %d\n",
  701. i, mode_setup->blockflag, mode_setup->windowtype,
  702. mode_setup->transformtype, mode_setup->mapping);
  703. }
  704. return 0;
  705. }
  706. // Process the whole setup header using the functions above
  707. static int vorbis_parse_setup_hdr(vorbis_context *vc)
  708. {
  709. GetBitContext *gb = &vc->gb;
  710. int ret;
  711. if ((get_bits(gb, 8) != 'v') || (get_bits(gb, 8) != 'o') ||
  712. (get_bits(gb, 8) != 'r') || (get_bits(gb, 8) != 'b') ||
  713. (get_bits(gb, 8) != 'i') || (get_bits(gb, 8) != 's')) {
  714. av_log(vc->avccontext, AV_LOG_ERROR, " Vorbis setup header packet corrupt (no vorbis signature). \n");
  715. return AVERROR_INVALIDDATA;
  716. }
  717. if ((ret = vorbis_parse_setup_hdr_codebooks(vc))) {
  718. av_log(vc->avccontext, AV_LOG_ERROR, " Vorbis setup header packet corrupt (codebooks). \n");
  719. return ret;
  720. }
  721. if ((ret = vorbis_parse_setup_hdr_tdtransforms(vc))) {
  722. av_log(vc->avccontext, AV_LOG_ERROR, " Vorbis setup header packet corrupt (time domain transforms). \n");
  723. return ret;
  724. }
  725. if ((ret = vorbis_parse_setup_hdr_floors(vc))) {
  726. av_log(vc->avccontext, AV_LOG_ERROR, " Vorbis setup header packet corrupt (floors). \n");
  727. return ret;
  728. }
  729. if ((ret = vorbis_parse_setup_hdr_residues(vc))) {
  730. av_log(vc->avccontext, AV_LOG_ERROR, " Vorbis setup header packet corrupt (residues). \n");
  731. return ret;
  732. }
  733. if ((ret = vorbis_parse_setup_hdr_mappings(vc))) {
  734. av_log(vc->avccontext, AV_LOG_ERROR, " Vorbis setup header packet corrupt (mappings). \n");
  735. return ret;
  736. }
  737. if ((ret = vorbis_parse_setup_hdr_modes(vc))) {
  738. av_log(vc->avccontext, AV_LOG_ERROR, " Vorbis setup header packet corrupt (modes). \n");
  739. return ret;
  740. }
  741. if (!get_bits1(gb)) {
  742. av_log(vc->avccontext, AV_LOG_ERROR, " Vorbis setup header packet corrupt (framing flag). \n");
  743. return AVERROR_INVALIDDATA; // framing flag bit unset error
  744. }
  745. return 0;
  746. }
  747. // Process the identification header
  748. static int vorbis_parse_id_hdr(vorbis_context *vc)
  749. {
  750. GetBitContext *gb = &vc->gb;
  751. unsigned bl0, bl1;
  752. if ((get_bits(gb, 8) != 'v') || (get_bits(gb, 8) != 'o') ||
  753. (get_bits(gb, 8) != 'r') || (get_bits(gb, 8) != 'b') ||
  754. (get_bits(gb, 8) != 'i') || (get_bits(gb, 8) != 's')) {
  755. av_log(vc->avccontext, AV_LOG_ERROR, " Vorbis id header packet corrupt (no vorbis signature). \n");
  756. return AVERROR_INVALIDDATA;
  757. }
  758. vc->version = get_bits_long(gb, 32); //FIXME check 0
  759. vc->audio_channels = get_bits(gb, 8);
  760. if (vc->audio_channels <= 0) {
  761. av_log(vc->avccontext, AV_LOG_ERROR, "Invalid number of channels\n");
  762. return AVERROR_INVALIDDATA;
  763. }
  764. vc->audio_samplerate = get_bits_long(gb, 32);
  765. if (vc->audio_samplerate <= 0) {
  766. av_log(vc->avccontext, AV_LOG_ERROR, "Invalid samplerate\n");
  767. return AVERROR_INVALIDDATA;
  768. }
  769. vc->bitrate_maximum = get_bits_long(gb, 32);
  770. vc->bitrate_nominal = get_bits_long(gb, 32);
  771. vc->bitrate_minimum = get_bits_long(gb, 32);
  772. bl0 = get_bits(gb, 4);
  773. bl1 = get_bits(gb, 4);
  774. vc->blocksize[0] = (1 << bl0);
  775. vc->blocksize[1] = (1 << bl1);
  776. if (bl0 > 13 || bl0 < 6 || bl1 > 13 || bl1 < 6 || bl1 < bl0) {
  777. av_log(vc->avccontext, AV_LOG_ERROR, " Vorbis id header packet corrupt (illegal blocksize). \n");
  778. return AVERROR_INVALIDDATA;
  779. }
  780. // output format int16
  781. if (vc->blocksize[1] / 2 * vc->audio_channels * 2 > AVCODEC_MAX_AUDIO_FRAME_SIZE) {
  782. av_log(vc->avccontext, AV_LOG_ERROR, "Vorbis channel count makes "
  783. "output packets too large.\n");
  784. return AVERROR_PATCHWELCOME;
  785. }
  786. vc->win[0] = ff_vorbis_vwin[bl0 - 6];
  787. vc->win[1] = ff_vorbis_vwin[bl1 - 6];
  788. if ((get_bits1(gb)) == 0) {
  789. av_log(vc->avccontext, AV_LOG_ERROR, " Vorbis id header packet corrupt (framing flag not set). \n");
  790. return AVERROR_INVALIDDATA;
  791. }
  792. vc->channel_residues = av_malloc((vc->blocksize[1] / 2) * vc->audio_channels * sizeof(*vc->channel_residues));
  793. vc->channel_floors = av_malloc((vc->blocksize[1] / 2) * vc->audio_channels * sizeof(*vc->channel_floors));
  794. vc->saved = av_mallocz((vc->blocksize[1] / 4) * vc->audio_channels * sizeof(*vc->saved));
  795. vc->previous_window = 0;
  796. ff_mdct_init(&vc->mdct[0], bl0, 1, -vc->scale_bias);
  797. ff_mdct_init(&vc->mdct[1], bl1, 1, -vc->scale_bias);
  798. av_dlog(NULL, " vorbis version %d \n audio_channels %d \n audio_samplerate %d \n bitrate_max %d \n bitrate_nom %d \n bitrate_min %d \n blk_0 %d blk_1 %d \n ",
  799. vc->version, vc->audio_channels, vc->audio_samplerate, vc->bitrate_maximum, vc->bitrate_nominal, vc->bitrate_minimum, vc->blocksize[0], vc->blocksize[1]);
  800. /*
  801. BLK = vc->blocksize[0];
  802. for (i = 0; i < BLK / 2; ++i) {
  803. vc->win[0][i] = sin(0.5*3.14159265358*(sin(((float)i + 0.5) / (float)BLK*3.14159265358))*(sin(((float)i + 0.5) / (float)BLK*3.14159265358)));
  804. }
  805. */
  806. return 0;
  807. }
  808. // Process the extradata using the functions above (identification header, setup header)
  809. static av_cold int vorbis_decode_init(AVCodecContext *avccontext)
  810. {
  811. vorbis_context *vc = avccontext->priv_data;
  812. uint8_t *headers = avccontext->extradata;
  813. int headers_len = avccontext->extradata_size;
  814. uint8_t *header_start[3];
  815. int header_len[3];
  816. GetBitContext *gb = &(vc->gb);
  817. int hdr_type, ret;
  818. vc->avccontext = avccontext;
  819. dsputil_init(&vc->dsp, avccontext);
  820. ff_fmt_convert_init(&vc->fmt_conv, avccontext);
  821. if (avccontext->request_sample_fmt == AV_SAMPLE_FMT_FLT) {
  822. avccontext->sample_fmt = AV_SAMPLE_FMT_FLT;
  823. vc->scale_bias = 1.0f;
  824. } else {
  825. avccontext->sample_fmt = AV_SAMPLE_FMT_S16;
  826. vc->scale_bias = 32768.0f;
  827. }
  828. if (!headers_len) {
  829. av_log(avccontext, AV_LOG_ERROR, "Extradata missing.\n");
  830. return AVERROR_INVALIDDATA;
  831. }
  832. if ((ret = avpriv_split_xiph_headers(headers, headers_len, 30, header_start, header_len)) < 0) {
  833. av_log(avccontext, AV_LOG_ERROR, "Extradata corrupt.\n");
  834. return ret;
  835. }
  836. init_get_bits(gb, header_start[0], header_len[0]*8);
  837. hdr_type = get_bits(gb, 8);
  838. if (hdr_type != 1) {
  839. av_log(avccontext, AV_LOG_ERROR, "First header is not the id header.\n");
  840. return AVERROR_INVALIDDATA;
  841. }
  842. if ((ret = vorbis_parse_id_hdr(vc))) {
  843. av_log(avccontext, AV_LOG_ERROR, "Id header corrupt.\n");
  844. vorbis_free(vc);
  845. return ret;
  846. }
  847. init_get_bits(gb, header_start[2], header_len[2]*8);
  848. hdr_type = get_bits(gb, 8);
  849. if (hdr_type != 5) {
  850. av_log(avccontext, AV_LOG_ERROR, "Third header is not the setup header.\n");
  851. vorbis_free(vc);
  852. return AVERROR_INVALIDDATA;
  853. }
  854. if ((ret = vorbis_parse_setup_hdr(vc))) {
  855. av_log(avccontext, AV_LOG_ERROR, "Setup header corrupt.\n");
  856. vorbis_free(vc);
  857. return ret;
  858. }
  859. if (vc->audio_channels > 8)
  860. avccontext->channel_layout = 0;
  861. else
  862. avccontext->channel_layout = ff_vorbis_channel_layouts[vc->audio_channels - 1];
  863. avccontext->channels = vc->audio_channels;
  864. avccontext->sample_rate = vc->audio_samplerate;
  865. avccontext->frame_size = FFMIN(vc->blocksize[0], vc->blocksize[1]) >> 2;
  866. return 0;
  867. }
  868. // Decode audiopackets -------------------------------------------------
  869. // Read and decode floor
  870. static int vorbis_floor0_decode(vorbis_context *vc,
  871. vorbis_floor_data *vfu, float *vec)
  872. {
  873. vorbis_floor0 *vf = &vfu->t0;
  874. float *lsp = vf->lsp;
  875. unsigned amplitude, book_idx;
  876. unsigned blockflag = vc->modes[vc->mode_number].blockflag;
  877. amplitude = get_bits(&vc->gb, vf->amplitude_bits);
  878. if (amplitude > 0) {
  879. float last = 0;
  880. unsigned idx, lsp_len = 0;
  881. vorbis_codebook codebook;
  882. book_idx = get_bits(&vc->gb, ilog(vf->num_books));
  883. if (book_idx >= vf->num_books) {
  884. av_log(vc->avccontext, AV_LOG_ERROR,
  885. "floor0 dec: booknumber too high!\n");
  886. book_idx = 0;
  887. }
  888. av_dlog(NULL, "floor0 dec: booknumber: %u\n", book_idx);
  889. codebook = vc->codebooks[vf->book_list[book_idx]];
  890. /* Invalid codebook! */
  891. if (!codebook.codevectors)
  892. return AVERROR_INVALIDDATA;
  893. while (lsp_len<vf->order) {
  894. int vec_off;
  895. av_dlog(NULL, "floor0 dec: book dimension: %d\n", codebook.dimensions);
  896. av_dlog(NULL, "floor0 dec: maximum depth: %d\n", codebook.maxdepth);
  897. /* read temp vector */
  898. vec_off = get_vlc2(&vc->gb, codebook.vlc.table,
  899. codebook.nb_bits, codebook.maxdepth)
  900. * codebook.dimensions;
  901. av_dlog(NULL, "floor0 dec: vector offset: %d\n", vec_off);
  902. /* copy each vector component and add last to it */
  903. for (idx = 0; idx < codebook.dimensions; ++idx)
  904. lsp[lsp_len+idx] = codebook.codevectors[vec_off+idx] + last;
  905. last = lsp[lsp_len+idx-1]; /* set last to last vector component */
  906. lsp_len += codebook.dimensions;
  907. }
  908. /* DEBUG: output lsp coeffs */
  909. {
  910. int idx;
  911. for (idx = 0; idx < lsp_len; ++idx)
  912. av_dlog(NULL, "floor0 dec: coeff at %d is %f\n", idx, lsp[idx]);
  913. }
  914. /* synthesize floor output vector */
  915. {
  916. int i;
  917. int order = vf->order;
  918. float wstep = M_PI / vf->bark_map_size;
  919. for (i = 0; i < order; i++)
  920. lsp[i] = 2.0f * cos(lsp[i]);
  921. av_dlog(NULL, "floor0 synth: map_size = %"PRIu32"; m = %d; wstep = %f\n",
  922. vf->map_size[blockflag], order, wstep);
  923. i = 0;
  924. while (i < vf->map_size[blockflag]) {
  925. int j, iter_cond = vf->map[blockflag][i];
  926. float p = 0.5f;
  927. float q = 0.5f;
  928. float two_cos_w = 2.0f * cos(wstep * iter_cond); // needed all times
  929. /* similar part for the q and p products */
  930. for (j = 0; j + 1 < order; j += 2) {
  931. q *= lsp[j] - two_cos_w;
  932. p *= lsp[j + 1] - two_cos_w;
  933. }
  934. if (j == order) { // even order
  935. p *= p * (2.0f - two_cos_w);
  936. q *= q * (2.0f + two_cos_w);
  937. } else { // odd order
  938. q *= two_cos_w-lsp[j]; // one more time for q
  939. /* final step and square */
  940. p *= p * (4.f - two_cos_w * two_cos_w);
  941. q *= q;
  942. }
  943. /* calculate linear floor value */
  944. q = exp((((amplitude*vf->amplitude_offset) /
  945. (((1 << vf->amplitude_bits) - 1) * sqrt(p + q)))
  946. - vf->amplitude_offset) * .11512925f);
  947. /* fill vector */
  948. do {
  949. vec[i] = q; ++i;
  950. } while (vf->map[blockflag][i] == iter_cond);
  951. }
  952. }
  953. } else {
  954. /* this channel is unused */
  955. return 1;
  956. }
  957. av_dlog(NULL, " Floor0 decoded\n");
  958. return 0;
  959. }
  960. static int vorbis_floor1_decode(vorbis_context *vc,
  961. vorbis_floor_data *vfu, float *vec)
  962. {
  963. vorbis_floor1 *vf = &vfu->t1;
  964. GetBitContext *gb = &vc->gb;
  965. uint16_t range_v[4] = { 256, 128, 86, 64 };
  966. unsigned range = range_v[vf->multiplier - 1];
  967. uint16_t floor1_Y[258];
  968. uint16_t floor1_Y_final[258];
  969. int floor1_flag[258];
  970. unsigned class, cdim, cbits, csub, cval, offset, i, j;
  971. int book, adx, ady, dy, off, predicted, err;
  972. if (!get_bits1(gb)) // silence
  973. return 1;
  974. // Read values (or differences) for the floor's points
  975. floor1_Y[0] = get_bits(gb, ilog(range - 1));
  976. floor1_Y[1] = get_bits(gb, ilog(range - 1));
  977. av_dlog(NULL, "floor 0 Y %d floor 1 Y %d \n", floor1_Y[0], floor1_Y[1]);
  978. offset = 2;
  979. for (i = 0; i < vf->partitions; ++i) {
  980. class = vf->partition_class[i];
  981. cdim = vf->class_dimensions[class];
  982. cbits = vf->class_subclasses[class];
  983. csub = (1 << cbits) - 1;
  984. cval = 0;
  985. av_dlog(NULL, "Cbits %u\n", cbits);
  986. if (cbits) // this reads all subclasses for this partition's class
  987. cval = get_vlc2(gb, vc->codebooks[vf->class_masterbook[class]].vlc.table,
  988. vc->codebooks[vf->class_masterbook[class]].nb_bits, 3);
  989. for (j = 0; j < cdim; ++j) {
  990. book = vf->subclass_books[class][cval & csub];
  991. av_dlog(NULL, "book %d Cbits %u cval %u bits:%d\n",
  992. book, cbits, cval, get_bits_count(gb));
  993. cval = cval >> cbits;
  994. if (book > -1) {
  995. floor1_Y[offset+j] = get_vlc2(gb, vc->codebooks[book].vlc.table,
  996. vc->codebooks[book].nb_bits, 3);
  997. } else {
  998. floor1_Y[offset+j] = 0;
  999. }
  1000. av_dlog(NULL, " floor(%d) = %d \n",
  1001. vf->list[offset+j].x, floor1_Y[offset+j]);
  1002. }
  1003. offset+=cdim;
  1004. }
  1005. // Amplitude calculation from the differences
  1006. floor1_flag[0] = 1;
  1007. floor1_flag[1] = 1;
  1008. floor1_Y_final[0] = floor1_Y[0];
  1009. floor1_Y_final[1] = floor1_Y[1];
  1010. for (i = 2; i < vf->x_list_dim; ++i) {
  1011. unsigned val, highroom, lowroom, room, high_neigh_offs, low_neigh_offs;
  1012. low_neigh_offs = vf->list[i].low;
  1013. high_neigh_offs = vf->list[i].high;
  1014. dy = floor1_Y_final[high_neigh_offs] - floor1_Y_final[low_neigh_offs]; // render_point begin
  1015. adx = vf->list[high_neigh_offs].x - vf->list[low_neigh_offs].x;
  1016. ady = FFABS(dy);
  1017. err = ady * (vf->list[i].x - vf->list[low_neigh_offs].x);
  1018. off = err / adx;
  1019. if (dy < 0) {
  1020. predicted = floor1_Y_final[low_neigh_offs] - off;
  1021. } else {
  1022. predicted = floor1_Y_final[low_neigh_offs] + off;
  1023. } // render_point end
  1024. val = floor1_Y[i];
  1025. highroom = range-predicted;
  1026. lowroom = predicted;
  1027. if (highroom < lowroom) {
  1028. room = highroom * 2;
  1029. } else {
  1030. room = lowroom * 2; // SPEC mispelling
  1031. }
  1032. if (val) {
  1033. floor1_flag[low_neigh_offs] = 1;
  1034. floor1_flag[high_neigh_offs] = 1;
  1035. floor1_flag[i] = 1;
  1036. if (val >= room) {
  1037. if (highroom > lowroom) {
  1038. floor1_Y_final[i] = val - lowroom + predicted;
  1039. } else {
  1040. floor1_Y_final[i] = predicted - val + highroom - 1;
  1041. }
  1042. } else {
  1043. if (val & 1) {
  1044. floor1_Y_final[i] = predicted - (val + 1) / 2;
  1045. } else {
  1046. floor1_Y_final[i] = predicted + val / 2;
  1047. }
  1048. }
  1049. } else {
  1050. floor1_flag[i] = 0;
  1051. floor1_Y_final[i] = predicted;
  1052. }
  1053. av_dlog(NULL, " Decoded floor(%d) = %u / val %u\n",
  1054. vf->list[i].x, floor1_Y_final[i], val);
  1055. }
  1056. // Curve synth - connect the calculated dots and convert from dB scale FIXME optimize ?
  1057. ff_vorbis_floor1_render_list(vf->list, vf->x_list_dim, floor1_Y_final, floor1_flag, vf->multiplier, vec, vf->list[1].x);
  1058. av_dlog(NULL, " Floor decoded\n");
  1059. return 0;
  1060. }
  1061. // Read and decode residue
  1062. static av_always_inline int vorbis_residue_decode_internal(vorbis_context *vc,
  1063. vorbis_residue *vr,
  1064. unsigned ch,
  1065. uint8_t *do_not_decode,
  1066. float *vec,
  1067. unsigned vlen,
  1068. int vr_type)
  1069. {
  1070. GetBitContext *gb = &vc->gb;
  1071. unsigned c_p_c = vc->codebooks[vr->classbook].dimensions;
  1072. unsigned ptns_to_read = vr->ptns_to_read;
  1073. uint8_t *classifs = vr->classifs;
  1074. unsigned pass, ch_used, i, j, k, l;
  1075. if (vr_type == 2) {
  1076. for (j = 1; j < ch; ++j)
  1077. do_not_decode[0] &= do_not_decode[j]; // FIXME - clobbering input
  1078. if (do_not_decode[0])
  1079. return 0;
  1080. ch_used = 1;
  1081. } else {
  1082. ch_used = ch;
  1083. }
  1084. av_dlog(NULL, " residue type 0/1/2 decode begin, ch: %d cpc %d \n", ch, c_p_c);
  1085. for (pass = 0; pass <= vr->maxpass; ++pass) { // FIXME OPTIMIZE?
  1086. uint16_t voffset, partition_count, j_times_ptns_to_read;
  1087. voffset = vr->begin;
  1088. for (partition_count = 0; partition_count < ptns_to_read;) { // SPEC error
  1089. if (!pass) {
  1090. unsigned inverse_class = ff_inverse[vr->classifications];
  1091. for (j_times_ptns_to_read = 0, j = 0; j < ch_used; ++j) {
  1092. if (!do_not_decode[j]) {
  1093. unsigned temp = get_vlc2(gb, vc->codebooks[vr->classbook].vlc.table,
  1094. vc->codebooks[vr->classbook].nb_bits, 3);
  1095. av_dlog(NULL, "Classword: %u\n", temp);
  1096. assert(vr->classifications > 1 && temp <= 65536); //needed for inverse[]
  1097. for (i = 0; i < c_p_c; ++i) {
  1098. unsigned temp2;
  1099. temp2 = (((uint64_t)temp) * inverse_class) >> 32;
  1100. if (partition_count + c_p_c - 1 - i < ptns_to_read)
  1101. classifs[j_times_ptns_to_read + partition_count + c_p_c - 1 - i] = temp - temp2 * vr->classifications;
  1102. temp = temp2;
  1103. }
  1104. }
  1105. j_times_ptns_to_read += ptns_to_read;
  1106. }
  1107. }
  1108. for (i = 0; (i < c_p_c) && (partition_count < ptns_to_read); ++i) {
  1109. for (j_times_ptns_to_read = 0, j = 0; j < ch_used; ++j) {
  1110. unsigned voffs;
  1111. if (!do_not_decode[j]) {
  1112. unsigned vqclass = classifs[j_times_ptns_to_read + partition_count];
  1113. int vqbook = vr->books[vqclass][pass];
  1114. if (vqbook >= 0 && vc->codebooks[vqbook].codevectors) {
  1115. unsigned coffs;
  1116. unsigned dim = vc->codebooks[vqbook].dimensions;
  1117. unsigned step = dim == 1 ? vr->partition_size
  1118. : FASTDIV(vr->partition_size, dim);
  1119. vorbis_codebook codebook = vc->codebooks[vqbook];
  1120. if (vr_type == 0) {
  1121. voffs = voffset+j*vlen;
  1122. for (k = 0; k < step; ++k) {
  1123. coffs = get_vlc2(gb, codebook.vlc.table, codebook.nb_bits, 3) * dim;
  1124. for (l = 0; l < dim; ++l)
  1125. vec[voffs + k + l * step] += codebook.codevectors[coffs + l]; // FPMATH
  1126. }
  1127. } else if (vr_type == 1) {
  1128. voffs = voffset + j * vlen;
  1129. for (k = 0; k < step; ++k) {
  1130. coffs = get_vlc2(gb, codebook.vlc.table, codebook.nb_bits, 3) * dim;
  1131. for (l = 0; l < dim; ++l, ++voffs) {
  1132. vec[voffs]+=codebook.codevectors[coffs+l]; // FPMATH
  1133. av_dlog(NULL, " pass %d offs: %d curr: %f change: %f cv offs.: %d \n",
  1134. pass, voffs, vec[voffs], codebook.codevectors[coffs+l], coffs);
  1135. }
  1136. }
  1137. } else if (vr_type == 2 && ch == 2 && (voffset & 1) == 0 && (dim & 1) == 0) { // most frequent case optimized
  1138. voffs = voffset >> 1;
  1139. if (dim == 2) {
  1140. for (k = 0; k < step; ++k) {
  1141. coffs = get_vlc2(gb, codebook.vlc.table, codebook.nb_bits, 3) * 2;
  1142. vec[voffs + k ] += codebook.codevectors[coffs ]; // FPMATH
  1143. vec[voffs + k + vlen] += codebook.codevectors[coffs + 1]; // FPMATH
  1144. }
  1145. } else if (dim == 4) {
  1146. for (k = 0; k < step; ++k, voffs += 2) {
  1147. coffs = get_vlc2(gb, codebook.vlc.table, codebook.nb_bits, 3) * 4;
  1148. vec[voffs ] += codebook.codevectors[coffs ]; // FPMATH
  1149. vec[voffs + 1 ] += codebook.codevectors[coffs + 2]; // FPMATH
  1150. vec[voffs + vlen ] += codebook.codevectors[coffs + 1]; // FPMATH
  1151. vec[voffs + vlen + 1] += codebook.codevectors[coffs + 3]; // FPMATH
  1152. }
  1153. } else
  1154. for (k = 0; k < step; ++k) {
  1155. coffs = get_vlc2(gb, codebook.vlc.table, codebook.nb_bits, 3) * dim;
  1156. for (l = 0; l < dim; l += 2, voffs++) {
  1157. vec[voffs ] += codebook.codevectors[coffs + l ]; // FPMATH
  1158. vec[voffs + vlen] += codebook.codevectors[coffs + l + 1]; // FPMATH
  1159. av_dlog(NULL, " pass %d offs: %d curr: %f change: %f cv offs.: %d+%d \n",
  1160. pass, voffset / ch + (voffs % ch) * vlen,
  1161. vec[voffset / ch + (voffs % ch) * vlen],
  1162. codebook.codevectors[coffs + l], coffs, l);
  1163. }
  1164. }
  1165. } else if (vr_type == 2) {
  1166. voffs = voffset;
  1167. for (k = 0; k < step; ++k) {
  1168. coffs = get_vlc2(gb, codebook.vlc.table, codebook.nb_bits, 3) * dim;
  1169. for (l = 0; l < dim; ++l, ++voffs) {
  1170. vec[voffs / ch + (voffs % ch) * vlen] += codebook.codevectors[coffs + l]; // FPMATH FIXME use if and counter instead of / and %
  1171. av_dlog(NULL, " pass %d offs: %d curr: %f change: %f cv offs.: %d+%d \n",
  1172. pass, voffset / ch + (voffs % ch) * vlen,
  1173. vec[voffset / ch + (voffs % ch) * vlen],
  1174. codebook.codevectors[coffs + l], coffs, l);
  1175. }
  1176. }
  1177. }
  1178. }
  1179. }
  1180. j_times_ptns_to_read += ptns_to_read;
  1181. }
  1182. ++partition_count;
  1183. voffset += vr->partition_size;
  1184. }
  1185. }
  1186. }
  1187. return 0;
  1188. }
  1189. static inline int vorbis_residue_decode(vorbis_context *vc, vorbis_residue *vr,
  1190. unsigned ch,
  1191. uint8_t *do_not_decode,
  1192. float *vec, unsigned vlen)
  1193. {
  1194. if (vr->type == 2)
  1195. return vorbis_residue_decode_internal(vc, vr, ch, do_not_decode, vec, vlen, 2);
  1196. else if (vr->type == 1)
  1197. return vorbis_residue_decode_internal(vc, vr, ch, do_not_decode, vec, vlen, 1);
  1198. else if (vr->type == 0)
  1199. return vorbis_residue_decode_internal(vc, vr, ch, do_not_decode, vec, vlen, 0);
  1200. else {
  1201. av_log(vc->avccontext, AV_LOG_ERROR, " Invalid residue type while residue decode?! \n");
  1202. return AVERROR_INVALIDDATA;
  1203. }
  1204. }
  1205. void vorbis_inverse_coupling(float *mag, float *ang, int blocksize)
  1206. {
  1207. int i;
  1208. for (i = 0; i < blocksize; i++) {
  1209. if (mag[i] > 0.0) {
  1210. if (ang[i] > 0.0) {
  1211. ang[i] = mag[i] - ang[i];
  1212. } else {
  1213. float temp = ang[i];
  1214. ang[i] = mag[i];
  1215. mag[i] += temp;
  1216. }
  1217. } else {
  1218. if (ang[i] > 0.0) {
  1219. ang[i] += mag[i];
  1220. } else {
  1221. float temp = ang[i];
  1222. ang[i] = mag[i];
  1223. mag[i] -= temp;
  1224. }
  1225. }
  1226. }
  1227. }
  1228. // Decode the audio packet using the functions above
  1229. static int vorbis_parse_audio_packet(vorbis_context *vc)
  1230. {
  1231. GetBitContext *gb = &vc->gb;
  1232. FFTContext *mdct;
  1233. unsigned previous_window = vc->previous_window;
  1234. unsigned mode_number, blockflag, blocksize;
  1235. int i, j;
  1236. uint8_t no_residue[255];
  1237. uint8_t do_not_decode[255];
  1238. vorbis_mapping *mapping;
  1239. float *ch_res_ptr = vc->channel_residues;
  1240. float *ch_floor_ptr = vc->channel_floors;
  1241. uint8_t res_chan[255];
  1242. unsigned res_num = 0;
  1243. int retlen = 0;
  1244. if (get_bits1(gb)) {
  1245. av_log(vc->avccontext, AV_LOG_ERROR, "Not a Vorbis I audio packet.\n");
  1246. return AVERROR_INVALIDDATA; // packet type not audio
  1247. }
  1248. if (vc->mode_count == 1) {
  1249. mode_number = 0;
  1250. } else {
  1251. GET_VALIDATED_INDEX(mode_number, ilog(vc->mode_count-1), vc->mode_count)
  1252. }
  1253. vc->mode_number = mode_number;
  1254. mapping = &vc->mappings[vc->modes[mode_number].mapping];
  1255. av_dlog(NULL, " Mode number: %u , mapping: %d , blocktype %d\n", mode_number,
  1256. vc->modes[mode_number].mapping, vc->modes[mode_number].blockflag);
  1257. blockflag = vc->modes[mode_number].blockflag;
  1258. blocksize = vc->blocksize[blockflag];
  1259. if (blockflag)
  1260. skip_bits(gb, 2); // previous_window, next_window
  1261. memset(ch_res_ptr, 0, sizeof(float) * vc->audio_channels * blocksize / 2); //FIXME can this be removed ?
  1262. memset(ch_floor_ptr, 0, sizeof(float) * vc->audio_channels * blocksize / 2); //FIXME can this be removed ?
  1263. // Decode floor
  1264. for (i = 0; i < vc->audio_channels; ++i) {
  1265. vorbis_floor *floor;
  1266. int ret;
  1267. if (mapping->submaps > 1) {
  1268. floor = &vc->floors[mapping->submap_floor[mapping->mux[i]]];
  1269. } else {
  1270. floor = &vc->floors[mapping->submap_floor[0]];
  1271. }
  1272. ret = floor->decode(vc, &floor->data, ch_floor_ptr);
  1273. if (ret < 0) {
  1274. av_log(vc->avccontext, AV_LOG_ERROR, "Invalid codebook in vorbis_floor_decode.\n");
  1275. return AVERROR_INVALIDDATA;
  1276. }
  1277. no_residue[i] = ret;
  1278. ch_floor_ptr += blocksize / 2;
  1279. }
  1280. // Nonzero vector propagate
  1281. for (i = mapping->coupling_steps - 1; i >= 0; --i) {
  1282. if (!(no_residue[mapping->magnitude[i]] & no_residue[mapping->angle[i]])) {
  1283. no_residue[mapping->magnitude[i]] = 0;
  1284. no_residue[mapping->angle[i]] = 0;
  1285. }
  1286. }
  1287. // Decode residue
  1288. for (i = 0; i < mapping->submaps; ++i) {
  1289. vorbis_residue *residue;
  1290. unsigned ch = 0;
  1291. for (j = 0; j < vc->audio_channels; ++j) {
  1292. if ((mapping->submaps == 1) || (i == mapping->mux[j])) {
  1293. res_chan[j] = res_num;
  1294. if (no_residue[j]) {
  1295. do_not_decode[ch] = 1;
  1296. } else {
  1297. do_not_decode[ch] = 0;
  1298. }
  1299. ++ch;
  1300. ++res_num;
  1301. }
  1302. }
  1303. residue = &vc->residues[mapping->submap_residue[i]];
  1304. vorbis_residue_decode(vc, residue, ch, do_not_decode, ch_res_ptr, blocksize/2);
  1305. ch_res_ptr += ch * blocksize / 2;
  1306. }
  1307. // Inverse coupling
  1308. for (i = mapping->coupling_steps - 1; i >= 0; --i) { //warning: i has to be signed
  1309. float *mag, *ang;
  1310. mag = vc->channel_residues+res_chan[mapping->magnitude[i]] * blocksize / 2;
  1311. ang = vc->channel_residues+res_chan[mapping->angle[i]] * blocksize / 2;
  1312. vc->dsp.vorbis_inverse_coupling(mag, ang, blocksize / 2);
  1313. }
  1314. // Dotproduct, MDCT
  1315. mdct = &vc->mdct[blockflag];
  1316. for (j = vc->audio_channels-1;j >= 0; j--) {
  1317. ch_floor_ptr = vc->channel_floors + j * blocksize / 2;
  1318. ch_res_ptr = vc->channel_residues + res_chan[j] * blocksize / 2;
  1319. vc->dsp.vector_fmul(ch_floor_ptr, ch_floor_ptr, ch_res_ptr, blocksize / 2);
  1320. mdct->imdct_half(mdct, ch_res_ptr, ch_floor_ptr);
  1321. }
  1322. // Overlap/add, save data for next overlapping FPMATH
  1323. retlen = (blocksize + vc->blocksize[previous_window]) / 4;
  1324. for (j = 0; j < vc->audio_channels; j++) {
  1325. unsigned bs0 = vc->blocksize[0];
  1326. unsigned bs1 = vc->blocksize[1];
  1327. float *residue = vc->channel_residues + res_chan[j] * blocksize / 2;
  1328. float *saved = vc->saved + j * bs1 / 4;
  1329. float *ret = vc->channel_floors + j * retlen;
  1330. float *buf = residue;
  1331. const float *win = vc->win[blockflag & previous_window];
  1332. if (blockflag == previous_window) {
  1333. vc->dsp.vector_fmul_window(ret, saved, buf, win, blocksize / 4);
  1334. } else if (blockflag > previous_window) {
  1335. vc->dsp.vector_fmul_window(ret, saved, buf, win, bs0 / 4);
  1336. memcpy(ret+bs0/2, buf+bs0/4, ((bs1-bs0)/4) * sizeof(float));
  1337. } else {
  1338. memcpy(ret, saved, ((bs1 - bs0) / 4) * sizeof(float));
  1339. vc->dsp.vector_fmul_window(ret + (bs1 - bs0) / 4, saved + (bs1 - bs0) / 4, buf, win, bs0 / 4);
  1340. }
  1341. memcpy(saved, buf + blocksize / 4, blocksize / 4 * sizeof(float));
  1342. }
  1343. vc->previous_window = blockflag;
  1344. return retlen;
  1345. }
  1346. // Return the decoded audio packet through the standard api
  1347. static int vorbis_decode_frame(AVCodecContext *avccontext,
  1348. void *data, int *data_size,
  1349. AVPacket *avpkt)
  1350. {
  1351. const uint8_t *buf = avpkt->data;
  1352. int buf_size = avpkt->size;
  1353. vorbis_context *vc = avccontext->priv_data;
  1354. GetBitContext *gb = &(vc->gb);
  1355. const float *channel_ptrs[255];
  1356. int i, len, out_size;
  1357. if (!buf_size)
  1358. return 0;
  1359. av_dlog(NULL, "packet length %d \n", buf_size);
  1360. init_get_bits(gb, buf, buf_size*8);
  1361. if ((len = vorbis_parse_audio_packet(vc)) <= 0)
  1362. return len;
  1363. if (!vc->first_frame) {
  1364. vc->first_frame = 1;
  1365. *data_size = 0;
  1366. return buf_size;
  1367. }
  1368. av_dlog(NULL, "parsed %d bytes %d bits, returned %d samples (*ch*bits) \n",
  1369. get_bits_count(gb) / 8, get_bits_count(gb) % 8, len);
  1370. out_size = len * vc->audio_channels *
  1371. av_get_bytes_per_sample(avccontext->sample_fmt);
  1372. if (*data_size < out_size) {
  1373. av_log(avccontext, AV_LOG_ERROR, "output buffer is too small\n");
  1374. return AVERROR(EINVAL);
  1375. }
  1376. if (vc->audio_channels > 8) {
  1377. for (i = 0; i < vc->audio_channels; i++)
  1378. channel_ptrs[i] = vc->channel_floors + i * len;
  1379. } else {
  1380. for (i = 0; i < vc->audio_channels; i++)
  1381. channel_ptrs[i] = vc->channel_floors +
  1382. len * ff_vorbis_channel_layout_offsets[vc->audio_channels - 1][i];
  1383. }
  1384. if (avccontext->sample_fmt == AV_SAMPLE_FMT_FLT)
  1385. vc->fmt_conv.float_interleave(data, channel_ptrs, len, vc->audio_channels);
  1386. else
  1387. vc->fmt_conv.float_to_int16_interleave(data, channel_ptrs, len,
  1388. vc->audio_channels);
  1389. *data_size = out_size;
  1390. return buf_size;
  1391. }
  1392. // Close decoder
  1393. static av_cold int vorbis_decode_close(AVCodecContext *avccontext)
  1394. {
  1395. vorbis_context *vc = avccontext->priv_data;
  1396. vorbis_free(vc);
  1397. return 0;
  1398. }
  1399. AVCodec ff_vorbis_decoder = {
  1400. .name = "vorbis",
  1401. .type = AVMEDIA_TYPE_AUDIO,
  1402. .id = CODEC_ID_VORBIS,
  1403. .priv_data_size = sizeof(vorbis_context),
  1404. .init = vorbis_decode_init,
  1405. .close = vorbis_decode_close,
  1406. .decode = vorbis_decode_frame,
  1407. .long_name = NULL_IF_CONFIG_SMALL("Vorbis"),
  1408. .channel_layouts = ff_vorbis_channel_layouts,
  1409. .sample_fmts = (const enum AVSampleFormat[]) {
  1410. AV_SAMPLE_FMT_FLT, AV_SAMPLE_FMT_S16, AV_SAMPLE_FMT_NONE
  1411. },
  1412. };