You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

557 lines
18KB

  1. /*
  2. * WavPack lossless audio decoder
  3. * Copyright (c) 2006 Konstantin Shishkov
  4. *
  5. * This file is part of FFmpeg.
  6. *
  7. * FFmpeg is free software; you can redistribute it and/or
  8. * modify it under the terms of the GNU Lesser General Public
  9. * License as published by the Free Software Foundation; either
  10. * version 2.1 of the License, or (at your option) any later version.
  11. *
  12. * FFmpeg is distributed in the hope that it will be useful,
  13. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  15. * Lesser General Public License for more details.
  16. *
  17. * You should have received a copy of the GNU Lesser General Public
  18. * License along with FFmpeg; if not, write to the Free Software
  19. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  20. */
  21. #define ALT_BITSTREAM_READER_LE
  22. #include "avcodec.h"
  23. #include "bitstream.h"
  24. /**
  25. * @file wavpack.c
  26. * WavPack lossless audio decoder
  27. */
  28. #define WV_JOINT 0x0010
  29. enum WP_ID_Flags{
  30. WP_IDF_MASK = 0x1F,
  31. WP_IDF_IGNORE = 0x20,
  32. WP_IDF_ODD = 0x40,
  33. WP_IDF_LONG = 0x80
  34. };
  35. enum WP_ID{
  36. WP_ID_DUMMY = 0,
  37. WP_ID_ENCINFO,
  38. WP_ID_DECTERMS,
  39. WP_ID_DECWEIGHTS,
  40. WP_ID_DECSAMPLES,
  41. WP_ID_ENTROPY,
  42. WP_ID_HYBRID,
  43. WP_ID_SHAPING,
  44. WP_ID_FLOATINFO,
  45. WP_ID_INT32INFO,
  46. WP_ID_DATA,
  47. WP_ID_CORR,
  48. WP_ID_FLT,
  49. WP_ID_CHANINFO
  50. };
  51. #define MAX_TERMS 16
  52. typedef struct Decorr {
  53. int delta;
  54. int value;
  55. int weightA;
  56. int weightB;
  57. int samplesA[8];
  58. int samplesB[8];
  59. } Decorr;
  60. typedef struct WavpackContext {
  61. AVCodecContext *avctx;
  62. int stereo;
  63. int joint;
  64. uint32_t CRC;
  65. GetBitContext gb;
  66. int data_size; // in bits
  67. int samples;
  68. int median[6];
  69. int terms;
  70. Decorr decorr[MAX_TERMS];
  71. int zero, one, zeroes;
  72. } WavpackContext;
  73. // exponent table copied from WavPack source
  74. static const uint8_t wp_exp2_table [256] = {
  75. 0x00, 0x01, 0x01, 0x02, 0x03, 0x03, 0x04, 0x05, 0x06, 0x06, 0x07, 0x08, 0x08, 0x09, 0x0a, 0x0b,
  76. 0x0b, 0x0c, 0x0d, 0x0e, 0x0e, 0x0f, 0x10, 0x10, 0x11, 0x12, 0x13, 0x13, 0x14, 0x15, 0x16, 0x16,
  77. 0x17, 0x18, 0x19, 0x19, 0x1a, 0x1b, 0x1c, 0x1d, 0x1d, 0x1e, 0x1f, 0x20, 0x20, 0x21, 0x22, 0x23,
  78. 0x24, 0x24, 0x25, 0x26, 0x27, 0x28, 0x28, 0x29, 0x2a, 0x2b, 0x2c, 0x2c, 0x2d, 0x2e, 0x2f, 0x30,
  79. 0x30, 0x31, 0x32, 0x33, 0x34, 0x35, 0x35, 0x36, 0x37, 0x38, 0x39, 0x3a, 0x3a, 0x3b, 0x3c, 0x3d,
  80. 0x3e, 0x3f, 0x40, 0x41, 0x41, 0x42, 0x43, 0x44, 0x45, 0x46, 0x47, 0x48, 0x48, 0x49, 0x4a, 0x4b,
  81. 0x4c, 0x4d, 0x4e, 0x4f, 0x50, 0x51, 0x51, 0x52, 0x53, 0x54, 0x55, 0x56, 0x57, 0x58, 0x59, 0x5a,
  82. 0x5b, 0x5c, 0x5d, 0x5e, 0x5e, 0x5f, 0x60, 0x61, 0x62, 0x63, 0x64, 0x65, 0x66, 0x67, 0x68, 0x69,
  83. 0x6a, 0x6b, 0x6c, 0x6d, 0x6e, 0x6f, 0x70, 0x71, 0x72, 0x73, 0x74, 0x75, 0x76, 0x77, 0x78, 0x79,
  84. 0x7a, 0x7b, 0x7c, 0x7d, 0x7e, 0x7f, 0x80, 0x81, 0x82, 0x83, 0x84, 0x85, 0x87, 0x88, 0x89, 0x8a,
  85. 0x8b, 0x8c, 0x8d, 0x8e, 0x8f, 0x90, 0x91, 0x92, 0x93, 0x95, 0x96, 0x97, 0x98, 0x99, 0x9a, 0x9b,
  86. 0x9c, 0x9d, 0x9f, 0xa0, 0xa1, 0xa2, 0xa3, 0xa4, 0xa5, 0xa6, 0xa8, 0xa9, 0xaa, 0xab, 0xac, 0xad,
  87. 0xaf, 0xb0, 0xb1, 0xb2, 0xb3, 0xb4, 0xb6, 0xb7, 0xb8, 0xb9, 0xba, 0xbc, 0xbd, 0xbe, 0xbf, 0xc0,
  88. 0xc2, 0xc3, 0xc4, 0xc5, 0xc6, 0xc8, 0xc9, 0xca, 0xcb, 0xcd, 0xce, 0xcf, 0xd0, 0xd2, 0xd3, 0xd4,
  89. 0xd6, 0xd7, 0xd8, 0xd9, 0xdb, 0xdc, 0xdd, 0xde, 0xe0, 0xe1, 0xe2, 0xe4, 0xe5, 0xe6, 0xe8, 0xe9,
  90. 0xea, 0xec, 0xed, 0xee, 0xf0, 0xf1, 0xf2, 0xf4, 0xf5, 0xf6, 0xf8, 0xf9, 0xfa, 0xfc, 0xfd, 0xff
  91. };
  92. static av_always_inline int wp_exp2(int16_t val)
  93. {
  94. int res, neg = 0;
  95. if(val < 0){
  96. val = -val;
  97. neg = 1;
  98. }
  99. res = wp_exp2_table[val & 0xFF] | 0x100;
  100. val >>= 8;
  101. res = (val > 9) ? (res << (val - 9)) : (res >> (9 - val));
  102. return neg ? -res : res;
  103. }
  104. static inline int get_unary(GetBitContext *gb){
  105. int r=0;
  106. while(get_bits1(gb) && r<33)r++;
  107. return r;
  108. }
  109. // macros for manipulating median values
  110. #define GET_MED(n) ((median[n] >> 4) + 1)
  111. #define DEC_MED(n) median[n] -= ((median[n] + (128>>n) - 2) / (128>>n)) * 2
  112. #define INC_MED(n) median[n] += ((median[n] + (128>>n)) / (128>>n)) * 5
  113. // macros for applying weight
  114. #define UPDATE_WEIGHT_CLIP(weight, delta, samples, in) \
  115. if(samples && in){ \
  116. if((samples ^ in) < 0){ \
  117. weight -= delta; \
  118. if(weight < -1024) weight = -1024; \
  119. }else{ \
  120. weight += delta; \
  121. if(weight > 1024) weight = 1024; \
  122. } \
  123. }
  124. static av_always_inline int get_tail(GetBitContext *gb, int k)
  125. {
  126. int p, e, res;
  127. if(k<1)return 0;
  128. p = av_log2(k);
  129. e = (1 << (p + 1)) - k - 1;
  130. res = p ? get_bits(gb, p) : 0;
  131. if(res >= e){
  132. res = (res<<1) - e + get_bits1(gb);
  133. }
  134. return res;
  135. }
  136. static int wv_get_value(WavpackContext *ctx, GetBitContext *gb, int *median, int *last)
  137. {
  138. int t, t2;
  139. int sign, base, add, ret;
  140. *last = 0;
  141. if((ctx->median[0] < 2U) && (ctx->median[3] < 2U) && !ctx->zero && !ctx->one){
  142. if(ctx->zeroes){
  143. ctx->zeroes--;
  144. if(ctx->zeroes)
  145. return 0;
  146. }else{
  147. t = get_unary(gb);
  148. if(t >= 2) t = get_bits(gb, t - 1) | (1 << (t-1));
  149. ctx->zeroes = t;
  150. if(ctx->zeroes){
  151. memset(ctx->median, 0, sizeof(ctx->median));
  152. return 0;
  153. }
  154. }
  155. }
  156. if(get_bits_count(gb) >= ctx->data_size){
  157. *last = 1;
  158. return 0;
  159. }
  160. if(ctx->zero){
  161. t = 0;
  162. ctx->zero = 0;
  163. }else{
  164. t = get_unary(gb);
  165. if(get_bits_count(gb) >= ctx->data_size){
  166. *last = 1;
  167. return 0;
  168. }
  169. if(t == 16) {
  170. t2 = get_unary(gb);
  171. if(t2 < 2) t += t2;
  172. else t += get_bits(gb, t2 - 1) | (1 << (t2 - 1));
  173. }
  174. if(ctx->one){
  175. ctx->one = t&1;
  176. t = (t>>1) + 1;
  177. }else{
  178. ctx->one = t&1;
  179. t >>= 1;
  180. }
  181. ctx->zero = !ctx->one;
  182. }
  183. if(!t){
  184. base = 0;
  185. add = GET_MED(0) - 1;
  186. DEC_MED(0);
  187. }else if(t == 1){
  188. base = GET_MED(0);
  189. add = GET_MED(1) - 1;
  190. INC_MED(0);
  191. DEC_MED(1);
  192. }else if(t == 2){
  193. base = GET_MED(0) + GET_MED(1);
  194. add = GET_MED(2) - 1;
  195. INC_MED(0);
  196. INC_MED(1);
  197. DEC_MED(2);
  198. }else{
  199. base = GET_MED(0) + GET_MED(1) + GET_MED(2) * (t - 2);
  200. add = GET_MED(2) - 1;
  201. INC_MED(0);
  202. INC_MED(1);
  203. INC_MED(2);
  204. }
  205. ret = base + get_tail(gb, add);
  206. sign = get_bits1(gb);
  207. return sign ? ~ret : ret;
  208. }
  209. static int wv_unpack_stereo(WavpackContext *s, GetBitContext *gb, int16_t *dst)
  210. {
  211. int i, j, count = 0;
  212. int last, t;
  213. int A, B, L, L2, R, R2;
  214. int pos = 0;
  215. uint32_t crc = 0xFFFFFFFF;
  216. s->one = s->zero = s->zeroes = 0;
  217. do{
  218. L = wv_get_value(s, gb, s->median, &last);
  219. if(last) break;
  220. R = wv_get_value(s, gb, s->median + 3, &last);
  221. if(last) break;
  222. for(i = 0; i < s->terms; i++){
  223. t = s->decorr[i].value;
  224. j = 0;
  225. if(t > 0){
  226. if(t > 8){
  227. if(t & 1){
  228. A = 2 * s->decorr[i].samplesA[0] - s->decorr[i].samplesA[1];
  229. B = 2 * s->decorr[i].samplesB[0] - s->decorr[i].samplesB[1];
  230. }else{
  231. A = (3 * s->decorr[i].samplesA[0] - s->decorr[i].samplesA[1]) >> 1;
  232. B = (3 * s->decorr[i].samplesB[0] - s->decorr[i].samplesB[1]) >> 1;
  233. }
  234. s->decorr[i].samplesA[1] = s->decorr[i].samplesA[0];
  235. s->decorr[i].samplesB[1] = s->decorr[i].samplesB[0];
  236. j = 0;
  237. }else{
  238. A = s->decorr[i].samplesA[pos];
  239. B = s->decorr[i].samplesB[pos];
  240. j = (pos + t) & 7;
  241. }
  242. L2 = L + ((s->decorr[i].weightA * A + 512) >> 10);
  243. R2 = R + ((s->decorr[i].weightB * B + 512) >> 10);
  244. if(A && L) s->decorr[i].weightA -= ((((L ^ A) >> 30) & 2) - 1) * s->decorr[i].delta;
  245. if(B && R) s->decorr[i].weightB -= ((((R ^ B) >> 30) & 2) - 1) * s->decorr[i].delta;
  246. s->decorr[i].samplesA[j] = L = L2;
  247. s->decorr[i].samplesB[j] = R = R2;
  248. }else if(t == -1){
  249. L2 = L + ((s->decorr[i].weightA * s->decorr[i].samplesA[0] + 512) >> 10);
  250. UPDATE_WEIGHT_CLIP(s->decorr[i].weightA, s->decorr[i].delta, s->decorr[i].samplesA[0], L);
  251. L = L2;
  252. R2 = R + ((s->decorr[i].weightB * L2 + 512) >> 10);
  253. UPDATE_WEIGHT_CLIP(s->decorr[i].weightB, s->decorr[i].delta, L2, R);
  254. R = R2;
  255. s->decorr[i].samplesA[0] = R;
  256. }else{
  257. R2 = R + ((s->decorr[i].weightB * s->decorr[i].samplesB[0] + 512) >> 10);
  258. UPDATE_WEIGHT_CLIP(s->decorr[i].weightB, s->decorr[i].delta, s->decorr[i].samplesB[0], R);
  259. R = R2;
  260. if(t == -3){
  261. R2 = s->decorr[i].samplesA[0];
  262. s->decorr[i].samplesA[0] = R;
  263. }
  264. L2 = L + ((s->decorr[i].weightA * R2 + 512) >> 10);
  265. UPDATE_WEIGHT_CLIP(s->decorr[i].weightA, s->decorr[i].delta, R2, L);
  266. L = L2;
  267. s->decorr[i].samplesB[0] = L;
  268. }
  269. }
  270. pos = (pos + 1) & 7;
  271. if(s->joint)
  272. L += (R -= (L >> 1));
  273. crc = (crc * 3 + L) * 3 + R;
  274. *dst++ = L;
  275. *dst++ = R;
  276. count++;
  277. }while(!last && count < s->samples);
  278. if(crc != s->CRC){
  279. av_log(s->avctx, AV_LOG_ERROR, "CRC error\n");
  280. return -1;
  281. }
  282. return count * 2;
  283. }
  284. static int wv_unpack_mono(WavpackContext *s, GetBitContext *gb, int16_t *dst)
  285. {
  286. int i, j, count = 0;
  287. int last, t;
  288. int A, S, T;
  289. int pos = 0;
  290. uint32_t crc = 0xFFFFFFFF;
  291. s->one = s->zero = s->zeroes = 0;
  292. do{
  293. T = wv_get_value(s, gb, s->median, &last);
  294. S = 0;
  295. if(last) break;
  296. for(i = 0; i < s->terms; i++){
  297. t = s->decorr[i].value;
  298. if(t > 8){
  299. if(t & 1)
  300. A = 2 * s->decorr[i].samplesA[0] - s->decorr[i].samplesA[1];
  301. else
  302. A = (3 * s->decorr[i].samplesA[0] - s->decorr[i].samplesA[1]) >> 1;
  303. s->decorr[i].samplesA[1] = s->decorr[i].samplesA[0];
  304. j = 0;
  305. }else{
  306. A = s->decorr[i].samplesA[pos];
  307. j = (pos + t) & 7;
  308. }
  309. S = T + ((s->decorr[i].weightA * A + 512) >> 10);
  310. if(A && T) s->decorr[i].weightA -= ((((T ^ A) >> 30) & 2) - 1) * s->decorr[i].delta;
  311. s->decorr[i].samplesA[j] = T = S;
  312. }
  313. pos = (pos + 1) & 7;
  314. crc = crc * 3 + S;
  315. *dst++ = S;
  316. count++;
  317. }while(!last && count < s->samples);
  318. if(crc != s->CRC){
  319. av_log(s->avctx, AV_LOG_ERROR, "CRC error\n");
  320. return -1;
  321. }
  322. return count;
  323. }
  324. static int wavpack_decode_init(AVCodecContext *avctx)
  325. {
  326. WavpackContext *s = avctx->priv_data;
  327. s->avctx = avctx;
  328. s->stereo = (avctx->channels == 2);
  329. return 0;
  330. }
  331. static int wavpack_decode_close(AVCodecContext *avctx)
  332. {
  333. // WavpackContext *s = avctx->priv_data;
  334. return 0;
  335. }
  336. static int wavpack_decode_frame(AVCodecContext *avctx,
  337. void *data, int *data_size,
  338. uint8_t *buf, int buf_size)
  339. {
  340. WavpackContext *s = avctx->priv_data;
  341. int16_t *samples = data;
  342. int samplecount;
  343. int got_terms = 0, got_weights = 0, got_samples = 0, got_entropy = 0, got_bs = 0;
  344. uint8_t* buf_end = buf + buf_size;
  345. int i, j, id, size, ssize, weights, t;
  346. if (buf_size == 0) return 0;
  347. memset(s->decorr, 0, MAX_TERMS * sizeof(Decorr));
  348. s->samples = AV_RL32(buf); buf += 4;
  349. if(!s->samples) return buf_size;
  350. /* should not happen but who knows */
  351. if(s->samples * 2 * avctx->channels > AVCODEC_MAX_AUDIO_FRAME_SIZE){
  352. av_log(avctx, AV_LOG_ERROR, "Packet size is too big to be handled in lavc!\n");
  353. return -1;
  354. }
  355. s->joint = AV_RL32(buf) & WV_JOINT; buf += 4;
  356. s->CRC = AV_RL32(buf); buf += 4;
  357. // parse metadata blocks
  358. while(buf < buf_end){
  359. id = *buf++;
  360. size = *buf++;
  361. if(id & WP_IDF_LONG) {
  362. size |= (*buf++) << 8;
  363. size |= (*buf++) << 16;
  364. }
  365. size <<= 1; // size is specified in words
  366. ssize = size;
  367. if(id & WP_IDF_ODD) size--;
  368. if(size < 0){
  369. av_log(avctx, AV_LOG_ERROR, "Got incorrect block %02X with size %i\n", id, size);
  370. break;
  371. }
  372. if(buf + ssize > buf_end){
  373. av_log(avctx, AV_LOG_ERROR, "Block size %i is out of bounds\n", size);
  374. break;
  375. }
  376. if(id & WP_IDF_IGNORE){
  377. buf += ssize;
  378. continue;
  379. }
  380. switch(id & WP_IDF_MASK){
  381. case WP_ID_DECTERMS:
  382. s->terms = size;
  383. if(s->terms > MAX_TERMS){
  384. av_log(avctx, AV_LOG_ERROR, "Too many decorrelation terms\n");
  385. buf += ssize;
  386. continue;
  387. }
  388. for(i = 0; i < s->terms; i++) {
  389. s->decorr[s->terms - i - 1].value = (*buf & 0x1F) - 5;
  390. s->decorr[s->terms - i - 1].delta = *buf >> 5;
  391. buf++;
  392. }
  393. got_terms = 1;
  394. break;
  395. case WP_ID_DECWEIGHTS:
  396. if(!got_terms){
  397. av_log(avctx, AV_LOG_ERROR, "No decorrelation terms met\n");
  398. continue;
  399. }
  400. weights = size >> s->stereo;
  401. if(weights > MAX_TERMS || weights > s->terms){
  402. av_log(avctx, AV_LOG_ERROR, "Too many decorrelation weights\n");
  403. buf += ssize;
  404. continue;
  405. }
  406. for(i = 0; i < weights; i++) {
  407. t = (int8_t)(*buf++);
  408. s->decorr[s->terms - i - 1].weightA = t << 3;
  409. if(s->decorr[s->terms - i - 1].weightA > 0)
  410. s->decorr[s->terms - i - 1].weightA += (s->decorr[s->terms - i - 1].weightA + 64) >> 7;
  411. if(s->stereo){
  412. t = (int8_t)(*buf++);
  413. s->decorr[s->terms - i - 1].weightB = t << 3;
  414. if(s->decorr[s->terms - i - 1].weightB > 0)
  415. s->decorr[s->terms - i - 1].weightB += (s->decorr[s->terms - i - 1].weightB + 64) >> 7;
  416. }
  417. }
  418. got_weights = 1;
  419. break;
  420. case WP_ID_DECSAMPLES:
  421. if(!got_terms){
  422. av_log(avctx, AV_LOG_ERROR, "No decorrelation terms met\n");
  423. continue;
  424. }
  425. t = 0;
  426. for(i = s->terms - 1; (i >= 0) && (t < size); i--) {
  427. if(s->decorr[i].value > 8){
  428. s->decorr[i].samplesA[0] = wp_exp2(AV_RL16(buf)); buf += 2;
  429. s->decorr[i].samplesA[1] = wp_exp2(AV_RL16(buf)); buf += 2;
  430. if(s->stereo){
  431. s->decorr[i].samplesB[0] = wp_exp2(AV_RL16(buf)); buf += 2;
  432. s->decorr[i].samplesB[1] = wp_exp2(AV_RL16(buf)); buf += 2;
  433. t += 4;
  434. }
  435. t += 4;
  436. }else if(s->decorr[i].value < 0){
  437. s->decorr[i].samplesA[0] = wp_exp2(AV_RL16(buf)); buf += 2;
  438. s->decorr[i].samplesB[0] = wp_exp2(AV_RL16(buf)); buf += 2;
  439. t += 4;
  440. }else{
  441. for(j = 0; j < s->decorr[i].value; j++){
  442. s->decorr[i].samplesA[j] = wp_exp2(AV_RL16(buf)); buf += 2;
  443. if(s->stereo){
  444. s->decorr[i].samplesB[j] = wp_exp2(AV_RL16(buf)); buf += 2;
  445. }
  446. }
  447. t += s->decorr[i].value * 2 * avctx->channels;
  448. }
  449. }
  450. got_samples = 1;
  451. break;
  452. case WP_ID_ENTROPY:
  453. if(size != 6 * avctx->channels){
  454. av_log(avctx, AV_LOG_ERROR, "Entropy vars size should be %i, got %i", 6 * avctx->channels, size);
  455. buf += ssize;
  456. continue;
  457. }
  458. for(i = 0; i < 3 * avctx->channels; i++){
  459. s->median[i] = wp_exp2(AV_RL16(buf));
  460. buf += 2;
  461. }
  462. got_entropy = 1;
  463. break;
  464. case WP_ID_DATA:
  465. init_get_bits(&s->gb, buf, size * 8);
  466. s->data_size = size * 8;
  467. buf += size;
  468. got_bs = 1;
  469. break;
  470. default:
  471. buf += size;
  472. }
  473. if(id & WP_IDF_ODD) buf++;
  474. }
  475. if(!got_terms){
  476. av_log(avctx, AV_LOG_ERROR, "No block with decorrelation terms\n");
  477. return -1;
  478. }
  479. if(!got_weights){
  480. av_log(avctx, AV_LOG_ERROR, "No block with decorrelation weights\n");
  481. return -1;
  482. }
  483. if(!got_samples){
  484. av_log(avctx, AV_LOG_ERROR, "No block with decorrelation samples\n");
  485. return -1;
  486. }
  487. if(!got_entropy){
  488. av_log(avctx, AV_LOG_ERROR, "No block with entropy info\n");
  489. return -1;
  490. }
  491. if(!got_bs){
  492. av_log(avctx, AV_LOG_ERROR, "Packed samples not found\n");
  493. return -1;
  494. }
  495. if(s->stereo)
  496. samplecount = wv_unpack_stereo(s, &s->gb, samples);
  497. else
  498. samplecount = wv_unpack_mono(s, &s->gb, samples);
  499. *data_size = samplecount * 2;
  500. return buf_size;
  501. }
  502. AVCodec wavpack_decoder = {
  503. "wavpack",
  504. CODEC_TYPE_AUDIO,
  505. CODEC_ID_WAVPACK,
  506. sizeof(WavpackContext),
  507. wavpack_decode_init,
  508. NULL,
  509. wavpack_decode_close,
  510. wavpack_decode_frame,
  511. };