You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

549 lines
17KB

  1. /*
  2. * WavPack lossless audio decoder
  3. * Copyright (c) 2006 Konstantin Shishkov
  4. *
  5. * This library is free software; you can redistribute it and/or
  6. * modify it under the terms of the GNU Lesser General Public
  7. * License as published by the Free Software Foundation; either
  8. * version 2 of the License, or (at your option) any later version.
  9. *
  10. * This library is distributed in the hope that it will be useful,
  11. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  12. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  13. * Lesser General Public License for more details.
  14. *
  15. * You should have received a copy of the GNU Lesser General Public
  16. * License along with this library; if not, write to the Free Software
  17. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  18. */
  19. #define ALT_BITSTREAM_READER_LE
  20. #include "avcodec.h"
  21. #include "bitstream.h"
  22. /**
  23. * @file wavpack.c
  24. * WavPack lossless audio decoder
  25. */
  26. #define WV_JOINT 0x0010
  27. enum WP_ID_Flags{
  28. WP_IDF_MASK = 0x1F,
  29. WP_IDF_IGNORE = 0x20,
  30. WP_IDF_ODD = 0x40,
  31. WP_IDF_LONG = 0x80
  32. };
  33. enum WP_ID{
  34. WP_ID_DUMMY = 0,
  35. WP_ID_ENCINFO,
  36. WP_ID_DECTERMS,
  37. WP_ID_DECWEIGHTS,
  38. WP_ID_DECSAMPLES,
  39. WP_ID_ENTROPY,
  40. WP_ID_HYBRID,
  41. WP_ID_SHAPING,
  42. WP_ID_FLOATINFO,
  43. WP_ID_INT32INFO,
  44. WP_ID_DATA,
  45. WP_ID_CORR,
  46. WP_ID_FLT,
  47. WP_ID_CHANINFO
  48. };
  49. #define MAX_TERMS 16
  50. typedef struct Decorr {
  51. int delta;
  52. int value;
  53. int weightA;
  54. int weightB;
  55. int samplesA[8];
  56. int samplesB[8];
  57. } Decorr;
  58. typedef struct WavpackContext {
  59. AVCodecContext *avctx;
  60. int stereo;
  61. int joint;
  62. uint32_t CRC;
  63. GetBitContext gb;
  64. int data_size; // in bits
  65. int samples;
  66. int median[6];
  67. int terms;
  68. Decorr decorr[MAX_TERMS];
  69. int zero, one, zeroes;
  70. } WavpackContext;
  71. // exponent table copied from WavPack source
  72. static const uint8_t wp_exp2_table [256] = {
  73. 0x00, 0x01, 0x01, 0x02, 0x03, 0x03, 0x04, 0x05, 0x06, 0x06, 0x07, 0x08, 0x08, 0x09, 0x0a, 0x0b,
  74. 0x0b, 0x0c, 0x0d, 0x0e, 0x0e, 0x0f, 0x10, 0x10, 0x11, 0x12, 0x13, 0x13, 0x14, 0x15, 0x16, 0x16,
  75. 0x17, 0x18, 0x19, 0x19, 0x1a, 0x1b, 0x1c, 0x1d, 0x1d, 0x1e, 0x1f, 0x20, 0x20, 0x21, 0x22, 0x23,
  76. 0x24, 0x24, 0x25, 0x26, 0x27, 0x28, 0x28, 0x29, 0x2a, 0x2b, 0x2c, 0x2c, 0x2d, 0x2e, 0x2f, 0x30,
  77. 0x30, 0x31, 0x32, 0x33, 0x34, 0x35, 0x35, 0x36, 0x37, 0x38, 0x39, 0x3a, 0x3a, 0x3b, 0x3c, 0x3d,
  78. 0x3e, 0x3f, 0x40, 0x41, 0x41, 0x42, 0x43, 0x44, 0x45, 0x46, 0x47, 0x48, 0x48, 0x49, 0x4a, 0x4b,
  79. 0x4c, 0x4d, 0x4e, 0x4f, 0x50, 0x51, 0x51, 0x52, 0x53, 0x54, 0x55, 0x56, 0x57, 0x58, 0x59, 0x5a,
  80. 0x5b, 0x5c, 0x5d, 0x5e, 0x5e, 0x5f, 0x60, 0x61, 0x62, 0x63, 0x64, 0x65, 0x66, 0x67, 0x68, 0x69,
  81. 0x6a, 0x6b, 0x6c, 0x6d, 0x6e, 0x6f, 0x70, 0x71, 0x72, 0x73, 0x74, 0x75, 0x76, 0x77, 0x78, 0x79,
  82. 0x7a, 0x7b, 0x7c, 0x7d, 0x7e, 0x7f, 0x80, 0x81, 0x82, 0x83, 0x84, 0x85, 0x87, 0x88, 0x89, 0x8a,
  83. 0x8b, 0x8c, 0x8d, 0x8e, 0x8f, 0x90, 0x91, 0x92, 0x93, 0x95, 0x96, 0x97, 0x98, 0x99, 0x9a, 0x9b,
  84. 0x9c, 0x9d, 0x9f, 0xa0, 0xa1, 0xa2, 0xa3, 0xa4, 0xa5, 0xa6, 0xa8, 0xa9, 0xaa, 0xab, 0xac, 0xad,
  85. 0xaf, 0xb0, 0xb1, 0xb2, 0xb3, 0xb4, 0xb6, 0xb7, 0xb8, 0xb9, 0xba, 0xbc, 0xbd, 0xbe, 0xbf, 0xc0,
  86. 0xc2, 0xc3, 0xc4, 0xc5, 0xc6, 0xc8, 0xc9, 0xca, 0xcb, 0xcd, 0xce, 0xcf, 0xd0, 0xd2, 0xd3, 0xd4,
  87. 0xd6, 0xd7, 0xd8, 0xd9, 0xdb, 0xdc, 0xdd, 0xde, 0xe0, 0xe1, 0xe2, 0xe4, 0xe5, 0xe6, 0xe8, 0xe9,
  88. 0xea, 0xec, 0xed, 0xee, 0xf0, 0xf1, 0xf2, 0xf4, 0xf5, 0xf6, 0xf8, 0xf9, 0xfa, 0xfc, 0xfd, 0xff
  89. };
  90. static always_inline int wp_exp2(int16_t val)
  91. {
  92. int res, neg = 0;
  93. if(val < 0){
  94. val = -val;
  95. neg = 1;
  96. }
  97. res = wp_exp2_table[val & 0xFF] | 0x100;
  98. val >>= 8;
  99. res = (val > 9) ? (res << (val - 9)) : (res >> (9 - val));
  100. return neg ? -res : res;
  101. }
  102. static inline int get_unary(GetBitContext *gb){
  103. int r=0;
  104. while(get_bits1(gb) && r<33)r++;
  105. return r;
  106. }
  107. // macros for manipulating median values
  108. #define GET_MED(n) ((median[n] >> 4) + 1)
  109. #define DEC_MED(n) median[n] -= ((median[n] + (128>>n) - 2) / (128>>n)) * 2
  110. #define INC_MED(n) median[n] += ((median[n] + (128>>n)) / (128>>n)) * 5
  111. // macros for applying weight
  112. #define UPDATE_WEIGHT_CLIP(weight, delta, samples, in) \
  113. if(samples && in){ \
  114. if((samples ^ in) < 0){ \
  115. weight -= delta; \
  116. if(weight < -1024) weight = -1024; \
  117. }else{ \
  118. weight += delta; \
  119. if(weight > 1024) weight = 1024; \
  120. } \
  121. }
  122. static always_inline int get_tail(GetBitContext *gb, int k)
  123. {
  124. int p, e, res;
  125. if(k<1 || k>65535)return 0;
  126. p = av_log2_16bit(k);
  127. e = (1 << (p + 1)) - k - 1;
  128. res = p ? get_bits(gb, p) : 0;
  129. if(res >= e){
  130. res = (res<<1) - e + get_bits1(gb);
  131. }
  132. return res;
  133. }
  134. static int wv_get_value(WavpackContext *ctx, GetBitContext *gb, int *median, int *last)
  135. {
  136. int t, t2;
  137. int sign, base, add, ret;
  138. *last = 0;
  139. if((ctx->median[0] < 2U) && (ctx->median[3] < 2U) && !ctx->zero && !ctx->one){
  140. if(ctx->zeroes){
  141. ctx->zeroes--;
  142. if(ctx->zeroes)
  143. return 0;
  144. }else{
  145. t = get_unary(gb);
  146. if(t >= 2) t = get_bits(gb, t - 1) | (1 << (t-1));
  147. ctx->zeroes = t;
  148. if(ctx->zeroes){
  149. memset(ctx->median, 0, sizeof(ctx->median));
  150. return 0;
  151. }
  152. }
  153. }
  154. if(get_bits_count(gb) >= ctx->data_size){
  155. *last = 1;
  156. return 0;
  157. }
  158. if(ctx->zero){
  159. t = 0;
  160. ctx->zero = 0;
  161. }else{
  162. t = get_unary(gb);
  163. if(get_bits_count(gb) >= ctx->data_size){
  164. *last = 1;
  165. return 0;
  166. }
  167. if(t == 16) {
  168. t2 = get_unary(gb);
  169. if(t2 < 2) t += t2;
  170. else t += get_bits(gb, t2 - 1) | (1 << (t2 - 1));
  171. }
  172. if(ctx->one){
  173. ctx->one = t&1;
  174. t = (t>>1) + 1;
  175. }else{
  176. ctx->one = t&1;
  177. t >>= 1;
  178. }
  179. ctx->zero = !ctx->one;
  180. }
  181. if(!t){
  182. base = 0;
  183. add = GET_MED(0) - 1;
  184. DEC_MED(0);
  185. }else if(t == 1){
  186. base = GET_MED(0);
  187. add = GET_MED(1) - 1;
  188. INC_MED(0);
  189. DEC_MED(1);
  190. }else if(t == 2){
  191. base = GET_MED(0) + GET_MED(1);
  192. add = GET_MED(2) - 1;
  193. INC_MED(0);
  194. INC_MED(1);
  195. DEC_MED(2);
  196. }else{
  197. base = GET_MED(0) + GET_MED(1) + GET_MED(2) * (t - 2);
  198. add = GET_MED(2) - 1;
  199. INC_MED(0);
  200. INC_MED(1);
  201. INC_MED(2);
  202. }
  203. ret = base + get_tail(gb, add);
  204. sign = get_bits1(gb);
  205. return sign ? ~ret : ret;
  206. }
  207. static int wv_unpack_stereo(WavpackContext *s, GetBitContext *gb, int16_t *dst)
  208. {
  209. int i, j, count = 0;
  210. int last, t;
  211. int A, B, L, L2, R, R2;
  212. int pos = 0;
  213. uint32_t crc = 0xFFFFFFFF;
  214. s->one = s->zero = s->zeroes = 0;
  215. do{
  216. L = wv_get_value(s, gb, s->median, &last);
  217. if(last) break;
  218. R = wv_get_value(s, gb, s->median + 3, &last);
  219. if(last) break;
  220. for(i = 0; i < s->terms; i++){
  221. t = s->decorr[i].value;
  222. j = 0;
  223. if(t > 0){
  224. if(t > 8){
  225. if(t & 1){
  226. A = 2 * s->decorr[i].samplesA[0] - s->decorr[i].samplesA[1];
  227. B = 2 * s->decorr[i].samplesB[0] - s->decorr[i].samplesB[1];
  228. }else{
  229. A = (3 * s->decorr[i].samplesA[0] - s->decorr[i].samplesA[1]) >> 1;
  230. B = (3 * s->decorr[i].samplesB[0] - s->decorr[i].samplesB[1]) >> 1;
  231. }
  232. s->decorr[i].samplesA[1] = s->decorr[i].samplesA[0];
  233. s->decorr[i].samplesB[1] = s->decorr[i].samplesB[0];
  234. j = 0;
  235. }else{
  236. A = s->decorr[i].samplesA[pos];
  237. B = s->decorr[i].samplesB[pos];
  238. j = (pos + t) & 7;
  239. }
  240. L2 = L + ((s->decorr[i].weightA * A + 512) >> 10);
  241. R2 = R + ((s->decorr[i].weightB * B + 512) >> 10);
  242. if(A && L) s->decorr[i].weightA -= ((((L ^ A) >> 30) & 2) - 1) * s->decorr[i].delta;
  243. if(B && R) s->decorr[i].weightB -= ((((R ^ B) >> 30) & 2) - 1) * s->decorr[i].delta;
  244. s->decorr[i].samplesA[j] = L = L2;
  245. s->decorr[i].samplesB[j] = R = R2;
  246. }else if(t == -1){
  247. L2 = L + ((s->decorr[i].weightA * s->decorr[i].samplesA[0] + 512) >> 10);
  248. UPDATE_WEIGHT_CLIP(s->decorr[i].weightA, s->decorr[i].delta, s->decorr[i].samplesA[0], L);
  249. L = L2;
  250. R2 = R + ((s->decorr[i].weightB * L2 + 512) >> 10);
  251. UPDATE_WEIGHT_CLIP(s->decorr[i].weightB, s->decorr[i].delta, L2, R);
  252. R = R2;
  253. s->decorr[i].samplesA[0] = R;
  254. }else{
  255. R2 = R + ((s->decorr[i].weightB * s->decorr[i].samplesB[0] + 512) >> 10);
  256. UPDATE_WEIGHT_CLIP(s->decorr[i].weightB, s->decorr[i].delta, s->decorr[i].samplesB[0], R);
  257. R = R2;
  258. if(t == -3){
  259. R2 = s->decorr[i].samplesA[0];
  260. s->decorr[i].samplesA[0] = R;
  261. }
  262. L2 = L + ((s->decorr[i].weightA * R2 + 512) >> 10);
  263. UPDATE_WEIGHT_CLIP(s->decorr[i].weightA, s->decorr[i].delta, R2, L);
  264. L = L2;
  265. s->decorr[i].samplesB[0] = L;
  266. }
  267. }
  268. pos = (pos + 1) & 7;
  269. if(s->joint)
  270. L += (R -= (L >> 1));
  271. crc = (crc * 3 + L) * 3 + R;
  272. *dst++ = L;
  273. *dst++ = R;
  274. count++;
  275. }while(!last && count < s->samples);
  276. if(crc != s->CRC){
  277. av_log(s->avctx, AV_LOG_ERROR, "CRC error\n");
  278. return -1;
  279. }
  280. return count * 2;
  281. }
  282. static int wv_unpack_mono(WavpackContext *s, GetBitContext *gb, int16_t *dst)
  283. {
  284. int i, j, count = 0;
  285. int last, t;
  286. int A, S, T;
  287. int pos = 0;
  288. uint32_t crc = 0xFFFFFFFF;
  289. s->one = s->zero = s->zeroes = 0;
  290. do{
  291. T = wv_get_value(s, gb, s->median, &last);
  292. S = 0;
  293. if(last) break;
  294. for(i = 0; i < s->terms; i++){
  295. t = s->decorr[i].value;
  296. if(t > 8){
  297. if(t & 1)
  298. A = 2 * s->decorr[i].samplesA[0] - s->decorr[i].samplesA[1];
  299. else
  300. A = (3 * s->decorr[i].samplesA[0] - s->decorr[i].samplesA[1]) >> 1;
  301. s->decorr[i].samplesA[1] = s->decorr[i].samplesA[0];
  302. j = 0;
  303. }else{
  304. A = s->decorr[i].samplesA[pos];
  305. j = (pos + t) & 7;
  306. }
  307. S = T + ((s->decorr[i].weightA * A + 512) >> 10);
  308. if(A && T) s->decorr[i].weightA -= ((((T ^ A) >> 30) & 2) - 1) * s->decorr[i].delta;
  309. s->decorr[i].samplesA[j] = T = S;
  310. }
  311. pos = (pos + 1) & 7;
  312. crc = crc * 3 + S;
  313. *dst++ = S;
  314. count++;
  315. }while(!last && count < s->samples);
  316. if(crc != s->CRC){
  317. av_log(s->avctx, AV_LOG_ERROR, "CRC error\n");
  318. return -1;
  319. }
  320. return count;
  321. }
  322. static int wavpack_decode_init(AVCodecContext *avctx)
  323. {
  324. WavpackContext *s = avctx->priv_data;
  325. s->avctx = avctx;
  326. s->stereo = (avctx->channels == 2);
  327. return 0;
  328. }
  329. static int wavpack_decode_close(AVCodecContext *avctx)
  330. {
  331. // WavpackContext *s = avctx->priv_data;
  332. return 0;
  333. }
  334. static int wavpack_decode_frame(AVCodecContext *avctx,
  335. void *data, int *data_size,
  336. uint8_t *buf, int buf_size)
  337. {
  338. WavpackContext *s = avctx->priv_data;
  339. int16_t *samples = data;
  340. int samplecount;
  341. int got_terms = 0, got_weights = 0, got_samples = 0, got_entropy = 0, got_bs = 0;
  342. uint8_t* buf_end = buf + buf_size;
  343. int i, j, id, size, ssize, weights, t;
  344. if (buf_size == 0) return 0;
  345. memset(s->decorr, 0, MAX_TERMS * sizeof(Decorr));
  346. s->samples = LE_32(buf); buf += 4;
  347. s->joint = LE_32(buf) & WV_JOINT; buf += 4;
  348. s->CRC = LE_32(buf); buf += 4;
  349. // parse metadata blocks
  350. while(buf < buf_end){
  351. id = *buf++;
  352. size = *buf++;
  353. if(id & WP_IDF_LONG) {
  354. size |= (*buf++) << 8;
  355. size |= (*buf++) << 16;
  356. }
  357. size <<= 1; // size is specified in words
  358. ssize = size;
  359. if(id & WP_IDF_ODD) size--;
  360. if(size < 0){
  361. av_log(avctx, AV_LOG_ERROR, "Got incorrect block %02X with size %i\n", id, size);
  362. break;
  363. }
  364. if(buf + ssize > buf_end){
  365. av_log(avctx, AV_LOG_ERROR, "Block size %i is out of bounds\n", size);
  366. break;
  367. }
  368. if(id & WP_IDF_IGNORE){
  369. buf += ssize;
  370. continue;
  371. }
  372. switch(id & WP_IDF_MASK){
  373. case WP_ID_DECTERMS:
  374. s->terms = size;
  375. if(s->terms > MAX_TERMS){
  376. av_log(avctx, AV_LOG_ERROR, "Too many decorrelation terms\n");
  377. buf += ssize;
  378. continue;
  379. }
  380. for(i = 0; i < s->terms; i++) {
  381. s->decorr[s->terms - i - 1].value = (*buf & 0x1F) - 5;
  382. s->decorr[s->terms - i - 1].delta = *buf >> 5;
  383. buf++;
  384. }
  385. got_terms = 1;
  386. break;
  387. case WP_ID_DECWEIGHTS:
  388. if(!got_terms){
  389. av_log(avctx, AV_LOG_ERROR, "No decorrelation terms met\n");
  390. continue;
  391. }
  392. weights = size >> s->stereo;
  393. if(weights > MAX_TERMS || weights > s->terms){
  394. av_log(avctx, AV_LOG_ERROR, "Too many decorrelation weights\n");
  395. buf += ssize;
  396. continue;
  397. }
  398. for(i = 0; i < weights; i++) {
  399. t = (int8_t)(*buf++);
  400. s->decorr[s->terms - i - 1].weightA = t << 3;
  401. if(s->decorr[s->terms - i - 1].weightA > 0)
  402. s->decorr[s->terms - i - 1].weightA += (s->decorr[s->terms - i - 1].weightA + 64) >> 7;
  403. if(s->stereo){
  404. t = (int8_t)(*buf++);
  405. s->decorr[s->terms - i - 1].weightB = t << 3;
  406. if(s->decorr[s->terms - i - 1].weightB > 0)
  407. s->decorr[s->terms - i - 1].weightB += (s->decorr[s->terms - i - 1].weightB + 64) >> 7;
  408. }
  409. }
  410. got_weights = 1;
  411. break;
  412. case WP_ID_DECSAMPLES:
  413. if(!got_terms){
  414. av_log(avctx, AV_LOG_ERROR, "No decorrelation terms met\n");
  415. continue;
  416. }
  417. t = 0;
  418. for(i = s->terms - 1; (i >= 0) && (t < size); i--) {
  419. if(s->decorr[i].value > 8){
  420. s->decorr[i].samplesA[0] = wp_exp2(LE_16(buf)); buf += 2;
  421. s->decorr[i].samplesA[1] = wp_exp2(LE_16(buf)); buf += 2;
  422. if(s->stereo){
  423. s->decorr[i].samplesB[0] = wp_exp2(LE_16(buf)); buf += 2;
  424. s->decorr[i].samplesB[1] = wp_exp2(LE_16(buf)); buf += 2;
  425. t += 4;
  426. }
  427. t += 4;
  428. }else if(s->decorr[i].value < 0){
  429. s->decorr[i].samplesA[0] = wp_exp2(LE_16(buf)); buf += 2;
  430. s->decorr[i].samplesB[0] = wp_exp2(LE_16(buf)); buf += 2;
  431. t += 4;
  432. }else{
  433. for(j = 0; j < s->decorr[i].value; j++){
  434. s->decorr[i].samplesA[j] = wp_exp2(LE_16(buf)); buf += 2;
  435. if(s->stereo){
  436. s->decorr[i].samplesB[j] = wp_exp2(LE_16(buf)); buf += 2;
  437. }
  438. }
  439. t += s->decorr[i].value * 2 * avctx->channels;
  440. }
  441. }
  442. got_samples = 1;
  443. break;
  444. case WP_ID_ENTROPY:
  445. if(size != 6 * avctx->channels){
  446. av_log(avctx, AV_LOG_ERROR, "Entropy vars size should be %i, got %i", 6 * avctx->channels, size);
  447. buf += ssize;
  448. continue;
  449. }
  450. for(i = 0; i < 3 * avctx->channels; i++){
  451. s->median[i] = wp_exp2(LE_16(buf));
  452. buf += 2;
  453. }
  454. got_entropy = 1;
  455. break;
  456. case WP_ID_DATA:
  457. init_get_bits(&s->gb, buf, size * 8);
  458. s->data_size = size * 8;
  459. buf += size;
  460. got_bs = 1;
  461. break;
  462. default:
  463. buf += size;
  464. }
  465. if(id & WP_IDF_ODD) buf++;
  466. }
  467. if(!got_terms){
  468. av_log(avctx, AV_LOG_ERROR, "No block with decorrelation terms\n");
  469. return -1;
  470. }
  471. if(!got_weights){
  472. av_log(avctx, AV_LOG_ERROR, "No block with decorrelation weights\n");
  473. return -1;
  474. }
  475. if(!got_samples){
  476. av_log(avctx, AV_LOG_ERROR, "No block with decorrelation samples\n");
  477. return -1;
  478. }
  479. if(!got_entropy){
  480. av_log(avctx, AV_LOG_ERROR, "No block with entropy info\n");
  481. return -1;
  482. }
  483. if(!got_bs){
  484. av_log(avctx, AV_LOG_ERROR, "Packed samples not found\n");
  485. return -1;
  486. }
  487. if(s->stereo)
  488. samplecount = wv_unpack_stereo(s, &s->gb, samples);
  489. else
  490. samplecount = wv_unpack_mono(s, &s->gb, samples);
  491. *data_size = samplecount * 2;
  492. return buf_size;
  493. }
  494. AVCodec wavpack_decoder = {
  495. "wavpack",
  496. CODEC_TYPE_AUDIO,
  497. CODEC_ID_WAVPACK,
  498. sizeof(WavpackContext),
  499. wavpack_decode_init,
  500. NULL,
  501. wavpack_decode_close,
  502. wavpack_decode_frame,
  503. };