You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

432 lines
15KB

  1. /*
  2. * Assorted DPCM codecs
  3. * Copyright (c) 2003 The FFmpeg project
  4. *
  5. * This file is part of FFmpeg.
  6. *
  7. * FFmpeg is free software; you can redistribute it and/or
  8. * modify it under the terms of the GNU Lesser General Public
  9. * License as published by the Free Software Foundation; either
  10. * version 2.1 of the License, or (at your option) any later version.
  11. *
  12. * FFmpeg is distributed in the hope that it will be useful,
  13. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  15. * Lesser General Public License for more details.
  16. *
  17. * You should have received a copy of the GNU Lesser General Public
  18. * License along with FFmpeg; if not, write to the Free Software
  19. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  20. */
  21. /**
  22. * @file
  23. * Assorted DPCM (differential pulse code modulation) audio codecs
  24. * by Mike Melanson (melanson@pcisys.net)
  25. * Xan DPCM decoder by Mario Brito (mbrito@student.dei.uc.pt)
  26. * for more information on the specific data formats, visit:
  27. * http://www.pcisys.net/~melanson/codecs/simpleaudio.html
  28. * SOL DPCMs implemented by Konstantin Shishkov
  29. *
  30. * Note about using the Xan DPCM decoder: Xan DPCM is used in AVI files
  31. * found in the Wing Commander IV computer game. These AVI files contain
  32. * WAVEFORMAT headers which report the audio format as 0x01: raw PCM.
  33. * Clearly incorrect. To detect Xan DPCM, you will probably have to
  34. * special-case your AVI demuxer to use Xan DPCM if the file uses 'Xxan'
  35. * (Xan video) for its video codec. Alternately, such AVI files also contain
  36. * the fourcc 'Axan' in the 'auds' chunk of the AVI header.
  37. */
  38. #include "libavutil/intreadwrite.h"
  39. #include "avcodec.h"
  40. #include "bytestream.h"
  41. #include "internal.h"
  42. #include "mathops.h"
  43. typedef struct DPCMContext {
  44. int16_t array[256];
  45. int sample[2]; ///< previous sample (for SOL_DPCM)
  46. const int8_t *sol_table; ///< delta table for SOL_DPCM
  47. } DPCMContext;
  48. static const int32_t derf_steps[96] = {
  49. 0, 1, 2, 3, 4, 5, 6, 7,
  50. 8, 9, 10, 11, 12, 13, 14, 16,
  51. 17, 19, 21, 23, 25, 28, 31, 34,
  52. 37, 41, 45, 50, 55, 60, 66, 73,
  53. 80, 88, 97, 107, 118, 130, 143, 157,
  54. 173, 190, 209, 230, 253, 279, 307, 337,
  55. 371, 408, 449, 494, 544, 598, 658, 724,
  56. 796, 876, 963, 1060, 1166, 1282, 1411, 1552,
  57. 1707, 1878, 2066, 2272, 2499, 2749, 3024, 3327,
  58. 3660, 4026, 4428, 4871, 5358, 5894, 6484, 7132,
  59. 7845, 8630, 9493, 10442, 11487, 12635, 13899, 15289,
  60. 16818, 18500, 20350, 22385, 24623, 27086, 29794, 32767,
  61. };
  62. static const int16_t interplay_delta_table[] = {
  63. 0, 1, 2, 3, 4, 5, 6, 7,
  64. 8, 9, 10, 11, 12, 13, 14, 15,
  65. 16, 17, 18, 19, 20, 21, 22, 23,
  66. 24, 25, 26, 27, 28, 29, 30, 31,
  67. 32, 33, 34, 35, 36, 37, 38, 39,
  68. 40, 41, 42, 43, 47, 51, 56, 61,
  69. 66, 72, 79, 86, 94, 102, 112, 122,
  70. 133, 145, 158, 173, 189, 206, 225, 245,
  71. 267, 292, 318, 348, 379, 414, 452, 493,
  72. 538, 587, 640, 699, 763, 832, 908, 991,
  73. 1081, 1180, 1288, 1405, 1534, 1673, 1826, 1993,
  74. 2175, 2373, 2590, 2826, 3084, 3365, 3672, 4008,
  75. 4373, 4772, 5208, 5683, 6202, 6767, 7385, 8059,
  76. 8794, 9597, 10472, 11428, 12471, 13609, 14851, 16206,
  77. 17685, 19298, 21060, 22981, 25078, 27367, 29864, 32589,
  78. -29973, -26728, -23186, -19322, -15105, -10503, -5481, -1,
  79. 1, 1, 5481, 10503, 15105, 19322, 23186, 26728,
  80. 29973, -32589, -29864, -27367, -25078, -22981, -21060, -19298,
  81. -17685, -16206, -14851, -13609, -12471, -11428, -10472, -9597,
  82. -8794, -8059, -7385, -6767, -6202, -5683, -5208, -4772,
  83. -4373, -4008, -3672, -3365, -3084, -2826, -2590, -2373,
  84. -2175, -1993, -1826, -1673, -1534, -1405, -1288, -1180,
  85. -1081, -991, -908, -832, -763, -699, -640, -587,
  86. -538, -493, -452, -414, -379, -348, -318, -292,
  87. -267, -245, -225, -206, -189, -173, -158, -145,
  88. -133, -122, -112, -102, -94, -86, -79, -72,
  89. -66, -61, -56, -51, -47, -43, -42, -41,
  90. -40, -39, -38, -37, -36, -35, -34, -33,
  91. -32, -31, -30, -29, -28, -27, -26, -25,
  92. -24, -23, -22, -21, -20, -19, -18, -17,
  93. -16, -15, -14, -13, -12, -11, -10, -9,
  94. -8, -7, -6, -5, -4, -3, -2, -1
  95. };
  96. static const int8_t sol_table_old[16] = {
  97. 0x0, 0x1, 0x2, 0x3, 0x6, 0xA, 0xF, 0x15,
  98. -0x15, -0xF, -0xA, -0x6, -0x3, -0x2, -0x1, 0x0
  99. };
  100. static const int8_t sol_table_new[16] = {
  101. 0x0, 0x1, 0x2, 0x3, 0x6, 0xA, 0xF, 0x15,
  102. 0x0, -0x1, -0x2, -0x3, -0x6, -0xA, -0xF, -0x15
  103. };
  104. static const int16_t sol_table_16[128] = {
  105. 0x000, 0x008, 0x010, 0x020, 0x030, 0x040, 0x050, 0x060, 0x070, 0x080,
  106. 0x090, 0x0A0, 0x0B0, 0x0C0, 0x0D0, 0x0E0, 0x0F0, 0x100, 0x110, 0x120,
  107. 0x130, 0x140, 0x150, 0x160, 0x170, 0x180, 0x190, 0x1A0, 0x1B0, 0x1C0,
  108. 0x1D0, 0x1E0, 0x1F0, 0x200, 0x208, 0x210, 0x218, 0x220, 0x228, 0x230,
  109. 0x238, 0x240, 0x248, 0x250, 0x258, 0x260, 0x268, 0x270, 0x278, 0x280,
  110. 0x288, 0x290, 0x298, 0x2A0, 0x2A8, 0x2B0, 0x2B8, 0x2C0, 0x2C8, 0x2D0,
  111. 0x2D8, 0x2E0, 0x2E8, 0x2F0, 0x2F8, 0x300, 0x308, 0x310, 0x318, 0x320,
  112. 0x328, 0x330, 0x338, 0x340, 0x348, 0x350, 0x358, 0x360, 0x368, 0x370,
  113. 0x378, 0x380, 0x388, 0x390, 0x398, 0x3A0, 0x3A8, 0x3B0, 0x3B8, 0x3C0,
  114. 0x3C8, 0x3D0, 0x3D8, 0x3E0, 0x3E8, 0x3F0, 0x3F8, 0x400, 0x440, 0x480,
  115. 0x4C0, 0x500, 0x540, 0x580, 0x5C0, 0x600, 0x640, 0x680, 0x6C0, 0x700,
  116. 0x740, 0x780, 0x7C0, 0x800, 0x900, 0xA00, 0xB00, 0xC00, 0xD00, 0xE00,
  117. 0xF00, 0x1000, 0x1400, 0x1800, 0x1C00, 0x2000, 0x3000, 0x4000
  118. };
  119. static av_cold int dpcm_decode_init(AVCodecContext *avctx)
  120. {
  121. DPCMContext *s = avctx->priv_data;
  122. int i;
  123. if (avctx->channels < 1 || avctx->channels > 2) {
  124. av_log(avctx, AV_LOG_ERROR, "invalid number of channels\n");
  125. return AVERROR(EINVAL);
  126. }
  127. s->sample[0] = s->sample[1] = 0;
  128. switch(avctx->codec->id) {
  129. case AV_CODEC_ID_ROQ_DPCM:
  130. /* initialize square table */
  131. for (i = 0; i < 128; i++) {
  132. int16_t square = i * i;
  133. s->array[i ] = square;
  134. s->array[i + 128] = -square;
  135. }
  136. break;
  137. case AV_CODEC_ID_SOL_DPCM:
  138. switch(avctx->codec_tag){
  139. case 1:
  140. s->sol_table = sol_table_old;
  141. s->sample[0] = s->sample[1] = 0x80;
  142. break;
  143. case 2:
  144. s->sol_table = sol_table_new;
  145. s->sample[0] = s->sample[1] = 0x80;
  146. break;
  147. case 3:
  148. break;
  149. default:
  150. av_log(avctx, AV_LOG_ERROR, "Unknown SOL subcodec\n");
  151. return -1;
  152. }
  153. break;
  154. case AV_CODEC_ID_SDX2_DPCM:
  155. for (i = -128; i < 128; i++) {
  156. int16_t square = i * i * 2;
  157. s->array[i+128] = i < 0 ? -square: square;
  158. }
  159. break;
  160. case AV_CODEC_ID_GREMLIN_DPCM: {
  161. int delta = 0;
  162. int code = 64;
  163. int step = 45;
  164. s->array[0] = 0;
  165. for (i = 0; i < 127; i++) {
  166. delta += (code >> 5);
  167. code += step;
  168. step += 2;
  169. s->array[i*2 + 1] = delta;
  170. s->array[i*2 + 2] = -delta;
  171. }
  172. s->array[255] = delta + (code >> 5);
  173. }
  174. break;
  175. default:
  176. break;
  177. }
  178. if (avctx->codec->id == AV_CODEC_ID_SOL_DPCM && avctx->codec_tag != 3)
  179. avctx->sample_fmt = AV_SAMPLE_FMT_U8;
  180. else
  181. avctx->sample_fmt = AV_SAMPLE_FMT_S16;
  182. return 0;
  183. }
  184. static int dpcm_decode_frame(AVCodecContext *avctx, void *data,
  185. int *got_frame_ptr, AVPacket *avpkt)
  186. {
  187. int buf_size = avpkt->size;
  188. DPCMContext *s = avctx->priv_data;
  189. AVFrame *frame = data;
  190. int out = 0, ret;
  191. int predictor[2];
  192. int ch = 0;
  193. int stereo = avctx->channels - 1;
  194. int16_t *output_samples, *samples_end;
  195. GetByteContext gb;
  196. if (stereo && (buf_size & 1))
  197. buf_size--;
  198. bytestream2_init(&gb, avpkt->data, buf_size);
  199. /* calculate output size */
  200. switch(avctx->codec->id) {
  201. case AV_CODEC_ID_ROQ_DPCM:
  202. out = buf_size - 8;
  203. break;
  204. case AV_CODEC_ID_INTERPLAY_DPCM:
  205. out = buf_size - 6 - avctx->channels;
  206. break;
  207. case AV_CODEC_ID_XAN_DPCM:
  208. out = buf_size - 2 * avctx->channels;
  209. break;
  210. case AV_CODEC_ID_SOL_DPCM:
  211. if (avctx->codec_tag != 3)
  212. out = buf_size * 2;
  213. else
  214. out = buf_size;
  215. break;
  216. case AV_CODEC_ID_DERF_DPCM:
  217. case AV_CODEC_ID_GREMLIN_DPCM:
  218. case AV_CODEC_ID_SDX2_DPCM:
  219. out = buf_size;
  220. break;
  221. }
  222. if (out <= 0) {
  223. av_log(avctx, AV_LOG_ERROR, "packet is too small\n");
  224. return AVERROR(EINVAL);
  225. }
  226. if (out % avctx->channels) {
  227. av_log(avctx, AV_LOG_WARNING, "channels have differing number of samples\n");
  228. }
  229. /* get output buffer */
  230. frame->nb_samples = (out + avctx->channels - 1) / avctx->channels;
  231. if ((ret = ff_get_buffer(avctx, frame, 0)) < 0)
  232. return ret;
  233. output_samples = (int16_t *)frame->data[0];
  234. samples_end = output_samples + out;
  235. switch(avctx->codec->id) {
  236. case AV_CODEC_ID_ROQ_DPCM:
  237. bytestream2_skipu(&gb, 6);
  238. if (stereo) {
  239. predictor[1] = sign_extend(bytestream2_get_byteu(&gb) << 8, 16);
  240. predictor[0] = sign_extend(bytestream2_get_byteu(&gb) << 8, 16);
  241. } else {
  242. predictor[0] = sign_extend(bytestream2_get_le16u(&gb), 16);
  243. }
  244. /* decode the samples */
  245. while (output_samples < samples_end) {
  246. predictor[ch] += s->array[bytestream2_get_byteu(&gb)];
  247. predictor[ch] = av_clip_int16(predictor[ch]);
  248. *output_samples++ = predictor[ch];
  249. /* toggle channel */
  250. ch ^= stereo;
  251. }
  252. break;
  253. case AV_CODEC_ID_INTERPLAY_DPCM:
  254. bytestream2_skipu(&gb, 6); /* skip over the stream mask and stream length */
  255. for (ch = 0; ch < avctx->channels; ch++) {
  256. predictor[ch] = sign_extend(bytestream2_get_le16u(&gb), 16);
  257. *output_samples++ = predictor[ch];
  258. }
  259. ch = 0;
  260. while (output_samples < samples_end) {
  261. predictor[ch] += interplay_delta_table[bytestream2_get_byteu(&gb)];
  262. predictor[ch] = av_clip_int16(predictor[ch]);
  263. *output_samples++ = predictor[ch];
  264. /* toggle channel */
  265. ch ^= stereo;
  266. }
  267. break;
  268. case AV_CODEC_ID_XAN_DPCM:
  269. {
  270. int shift[2] = { 4, 4 };
  271. for (ch = 0; ch < avctx->channels; ch++)
  272. predictor[ch] = sign_extend(bytestream2_get_le16u(&gb), 16);
  273. ch = 0;
  274. while (output_samples < samples_end) {
  275. int diff = bytestream2_get_byteu(&gb);
  276. int n = diff & 3;
  277. if (n == 3)
  278. shift[ch]++;
  279. else
  280. shift[ch] -= (2 * n);
  281. diff = sign_extend((diff &~ 3) << 8, 16);
  282. /* saturate the shifter to a lower limit of 0 */
  283. if (shift[ch] < 0)
  284. shift[ch] = 0;
  285. diff >>= shift[ch];
  286. predictor[ch] += diff;
  287. predictor[ch] = av_clip_int16(predictor[ch]);
  288. *output_samples++ = predictor[ch];
  289. /* toggle channel */
  290. ch ^= stereo;
  291. }
  292. break;
  293. }
  294. case AV_CODEC_ID_SOL_DPCM:
  295. if (avctx->codec_tag != 3) {
  296. uint8_t *output_samples_u8 = frame->data[0],
  297. *samples_end_u8 = output_samples_u8 + out;
  298. while (output_samples_u8 < samples_end_u8) {
  299. int n = bytestream2_get_byteu(&gb);
  300. s->sample[0] += s->sol_table[n >> 4];
  301. s->sample[0] = av_clip_uint8(s->sample[0]);
  302. *output_samples_u8++ = s->sample[0];
  303. s->sample[stereo] += s->sol_table[n & 0x0F];
  304. s->sample[stereo] = av_clip_uint8(s->sample[stereo]);
  305. *output_samples_u8++ = s->sample[stereo];
  306. }
  307. } else {
  308. while (output_samples < samples_end) {
  309. int n = bytestream2_get_byteu(&gb);
  310. if (n & 0x80) s->sample[ch] -= sol_table_16[n & 0x7F];
  311. else s->sample[ch] += sol_table_16[n & 0x7F];
  312. s->sample[ch] = av_clip_int16(s->sample[ch]);
  313. *output_samples++ = s->sample[ch];
  314. /* toggle channel */
  315. ch ^= stereo;
  316. }
  317. }
  318. break;
  319. case AV_CODEC_ID_SDX2_DPCM:
  320. while (output_samples < samples_end) {
  321. int8_t n = bytestream2_get_byteu(&gb);
  322. if (!(n & 1))
  323. s->sample[ch] = 0;
  324. s->sample[ch] += s->array[n + 128];
  325. s->sample[ch] = av_clip_int16(s->sample[ch]);
  326. *output_samples++ = s->sample[ch];
  327. ch ^= stereo;
  328. }
  329. break;
  330. case AV_CODEC_ID_GREMLIN_DPCM: {
  331. int idx = 0;
  332. while (output_samples < samples_end) {
  333. uint8_t n = bytestream2_get_byteu(&gb);
  334. *output_samples++ = s->sample[idx] += (unsigned)s->array[n];
  335. idx ^= 1;
  336. }
  337. }
  338. break;
  339. case AV_CODEC_ID_DERF_DPCM: {
  340. int idx = 0;
  341. while (output_samples < samples_end) {
  342. uint8_t n = bytestream2_get_byteu(&gb);
  343. int index = FFMIN(n & 0x7f, 95);
  344. s->sample[idx] += (n & 0x80 ? -1: 1) * derf_steps[index];
  345. s->sample[idx] = av_clip_int16(s->sample[idx]);
  346. *output_samples++ = s->sample[idx];
  347. idx ^= stereo;
  348. }
  349. }
  350. break;
  351. }
  352. *got_frame_ptr = 1;
  353. return avpkt->size;
  354. }
  355. #define DPCM_DECODER(id_, name_, long_name_) \
  356. AVCodec ff_ ## name_ ## _decoder = { \
  357. .name = #name_, \
  358. .long_name = NULL_IF_CONFIG_SMALL(long_name_), \
  359. .type = AVMEDIA_TYPE_AUDIO, \
  360. .id = id_, \
  361. .priv_data_size = sizeof(DPCMContext), \
  362. .init = dpcm_decode_init, \
  363. .decode = dpcm_decode_frame, \
  364. .capabilities = AV_CODEC_CAP_DR1, \
  365. }
  366. DPCM_DECODER(AV_CODEC_ID_DERF_DPCM, derf_dpcm, "DPCM Xilam DERF");
  367. DPCM_DECODER(AV_CODEC_ID_GREMLIN_DPCM, gremlin_dpcm, "DPCM Gremlin");
  368. DPCM_DECODER(AV_CODEC_ID_INTERPLAY_DPCM, interplay_dpcm, "DPCM Interplay");
  369. DPCM_DECODER(AV_CODEC_ID_ROQ_DPCM, roq_dpcm, "DPCM id RoQ");
  370. DPCM_DECODER(AV_CODEC_ID_SDX2_DPCM, sdx2_dpcm, "DPCM Squareroot-Delta-Exact");
  371. DPCM_DECODER(AV_CODEC_ID_SOL_DPCM, sol_dpcm, "DPCM Sol");
  372. DPCM_DECODER(AV_CODEC_ID_XAN_DPCM, xan_dpcm, "DPCM Xan");