You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

626 lines
19KB

  1. /*
  2. * Wing Commander/Xan Video Decoder
  3. * Copyright (C) 2003 The FFmpeg project
  4. *
  5. * This file is part of Libav.
  6. *
  7. * Libav is free software; you can redistribute it and/or
  8. * modify it under the terms of the GNU Lesser General Public
  9. * License as published by the Free Software Foundation; either
  10. * version 2.1 of the License, or (at your option) any later version.
  11. *
  12. * Libav is distributed in the hope that it will be useful,
  13. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  15. * Lesser General Public License for more details.
  16. *
  17. * You should have received a copy of the GNU Lesser General Public
  18. * License along with Libav; if not, write to the Free Software
  19. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  20. */
  21. /**
  22. * @file
  23. * Xan video decoder for Wing Commander III computer game
  24. * by Mario Brito (mbrito@student.dei.uc.pt)
  25. * and Mike Melanson (melanson@pcisys.net)
  26. *
  27. * The xan_wc3 decoder outputs PAL8 data.
  28. */
  29. #include <stdio.h>
  30. #include <stdlib.h>
  31. #include <string.h>
  32. #include "libavutil/intreadwrite.h"
  33. #include "libavutil/mem.h"
  34. #define BITSTREAM_READER_LE
  35. #include "avcodec.h"
  36. #include "bitstream.h"
  37. #include "bytestream.h"
  38. #include "internal.h"
  39. #define RUNTIME_GAMMA 0
  40. #define VGA__TAG MKTAG('V', 'G', 'A', ' ')
  41. #define PALT_TAG MKTAG('P', 'A', 'L', 'T')
  42. #define SHOT_TAG MKTAG('S', 'H', 'O', 'T')
  43. #define PALETTE_COUNT 256
  44. #define PALETTE_SIZE (PALETTE_COUNT * 3)
  45. #define PALETTES_MAX 256
  46. typedef struct XanContext {
  47. AVCodecContext *avctx;
  48. AVFrame *last_frame;
  49. const unsigned char *buf;
  50. int size;
  51. /* scratch space */
  52. unsigned char *buffer1;
  53. int buffer1_size;
  54. unsigned char *buffer2;
  55. int buffer2_size;
  56. unsigned *palettes;
  57. int palettes_count;
  58. int cur_palette;
  59. int frame_size;
  60. } XanContext;
  61. static av_cold int xan_decode_end(AVCodecContext *avctx)
  62. {
  63. XanContext *s = avctx->priv_data;
  64. av_frame_free(&s->last_frame);
  65. av_freep(&s->buffer1);
  66. av_freep(&s->buffer2);
  67. av_freep(&s->palettes);
  68. return 0;
  69. }
  70. static av_cold int xan_decode_init(AVCodecContext *avctx)
  71. {
  72. XanContext *s = avctx->priv_data;
  73. s->avctx = avctx;
  74. s->frame_size = 0;
  75. avctx->pix_fmt = AV_PIX_FMT_PAL8;
  76. s->buffer1_size = avctx->width * avctx->height;
  77. s->buffer1 = av_malloc(s->buffer1_size);
  78. if (!s->buffer1)
  79. return AVERROR(ENOMEM);
  80. s->buffer2_size = avctx->width * avctx->height;
  81. s->buffer2 = av_malloc(s->buffer2_size + 130);
  82. if (!s->buffer2) {
  83. av_freep(&s->buffer1);
  84. return AVERROR(ENOMEM);
  85. }
  86. s->last_frame = av_frame_alloc();
  87. if (!s->last_frame) {
  88. xan_decode_end(avctx);
  89. return AVERROR(ENOMEM);
  90. }
  91. return 0;
  92. }
  93. static int xan_huffman_decode(unsigned char *dest, int dest_len,
  94. const unsigned char *src, int src_len)
  95. {
  96. unsigned char byte = *src++;
  97. unsigned char ival = byte + 0x16;
  98. const unsigned char * ptr = src + byte*2;
  99. int ptr_len = src_len - 1 - byte*2;
  100. unsigned char val = ival;
  101. unsigned char *dest_end = dest + dest_len;
  102. unsigned char *dest_start = dest;
  103. BitstreamContext bc;
  104. if (ptr_len < 0)
  105. return AVERROR_INVALIDDATA;
  106. bitstream_init8(&bc, ptr, ptr_len);
  107. while (val != 0x16) {
  108. unsigned idx = val - 0x17 + bitstream_read_bit(&bc) * byte;
  109. if (idx >= 2 * byte)
  110. return AVERROR_INVALIDDATA;
  111. val = src[idx];
  112. if (val < 0x16) {
  113. if (dest >= dest_end)
  114. return dest_len;
  115. *dest++ = val;
  116. val = ival;
  117. }
  118. }
  119. return dest - dest_start;
  120. }
  121. /**
  122. * unpack simple compression
  123. *
  124. * @param dest destination buffer of dest_len, must be padded with at least 130 bytes
  125. */
  126. static void xan_unpack(unsigned char *dest, int dest_len,
  127. const unsigned char *src, int src_len)
  128. {
  129. unsigned char opcode;
  130. int size;
  131. unsigned char *dest_org = dest;
  132. unsigned char *dest_end = dest + dest_len;
  133. GetByteContext ctx;
  134. bytestream2_init(&ctx, src, src_len);
  135. while (dest < dest_end && bytestream2_get_bytes_left(&ctx)) {
  136. opcode = bytestream2_get_byte(&ctx);
  137. if (opcode < 0xe0) {
  138. int size2, back;
  139. if ((opcode & 0x80) == 0) {
  140. size = opcode & 3;
  141. back = ((opcode & 0x60) << 3) + bytestream2_get_byte(&ctx) + 1;
  142. size2 = ((opcode & 0x1c) >> 2) + 3;
  143. } else if ((opcode & 0x40) == 0) {
  144. size = bytestream2_peek_byte(&ctx) >> 6;
  145. back = (bytestream2_get_be16(&ctx) & 0x3fff) + 1;
  146. size2 = (opcode & 0x3f) + 4;
  147. } else {
  148. size = opcode & 3;
  149. back = ((opcode & 0x10) << 12) + bytestream2_get_be16(&ctx) + 1;
  150. size2 = ((opcode & 0x0c) << 6) + bytestream2_get_byte(&ctx) + 5;
  151. }
  152. if (dest_end - dest < size + size2 ||
  153. dest + size - dest_org < back ||
  154. bytestream2_get_bytes_left(&ctx) < size)
  155. return;
  156. bytestream2_get_buffer(&ctx, dest, size);
  157. dest += size;
  158. av_memcpy_backptr(dest, back, size2);
  159. dest += size2;
  160. } else {
  161. int finish = opcode >= 0xfc;
  162. size = finish ? opcode & 3 : ((opcode & 0x1f) << 2) + 4;
  163. if (dest_end - dest < size || bytestream2_get_bytes_left(&ctx) < size)
  164. return;
  165. bytestream2_get_buffer(&ctx, dest, size);
  166. dest += size;
  167. if (finish)
  168. return;
  169. }
  170. }
  171. }
  172. static inline void xan_wc3_output_pixel_run(XanContext *s, AVFrame *frame,
  173. const unsigned char *pixel_buffer, int x, int y, int pixel_count)
  174. {
  175. int stride;
  176. int line_inc;
  177. int index;
  178. int current_x;
  179. int width = s->avctx->width;
  180. unsigned char *palette_plane;
  181. palette_plane = frame->data[0];
  182. stride = frame->linesize[0];
  183. line_inc = stride - width;
  184. index = y * stride + x;
  185. current_x = x;
  186. while (pixel_count && index < s->frame_size) {
  187. int count = FFMIN(pixel_count, width - current_x);
  188. memcpy(palette_plane + index, pixel_buffer, count);
  189. pixel_count -= count;
  190. index += count;
  191. pixel_buffer += count;
  192. current_x += count;
  193. if (current_x >= width) {
  194. index += line_inc;
  195. current_x = 0;
  196. }
  197. }
  198. }
  199. static inline void xan_wc3_copy_pixel_run(XanContext *s, AVFrame *frame,
  200. int x, int y,
  201. int pixel_count, int motion_x,
  202. int motion_y)
  203. {
  204. int stride;
  205. int line_inc;
  206. int curframe_index, prevframe_index;
  207. int curframe_x, prevframe_x;
  208. int width = s->avctx->width;
  209. unsigned char *palette_plane, *prev_palette_plane;
  210. if (y + motion_y < 0 || y + motion_y >= s->avctx->height ||
  211. x + motion_x < 0 || x + motion_x >= s->avctx->width)
  212. return;
  213. palette_plane = frame->data[0];
  214. prev_palette_plane = s->last_frame->data[0];
  215. if (!prev_palette_plane)
  216. prev_palette_plane = palette_plane;
  217. stride = frame->linesize[0];
  218. line_inc = stride - width;
  219. curframe_index = y * stride + x;
  220. curframe_x = x;
  221. prevframe_index = (y + motion_y) * stride + x + motion_x;
  222. prevframe_x = x + motion_x;
  223. while (pixel_count &&
  224. curframe_index < s->frame_size &&
  225. prevframe_index < s->frame_size) {
  226. int count = FFMIN3(pixel_count, width - curframe_x,
  227. width - prevframe_x);
  228. memcpy(palette_plane + curframe_index,
  229. prev_palette_plane + prevframe_index, count);
  230. pixel_count -= count;
  231. curframe_index += count;
  232. prevframe_index += count;
  233. curframe_x += count;
  234. prevframe_x += count;
  235. if (curframe_x >= width) {
  236. curframe_index += line_inc;
  237. curframe_x = 0;
  238. }
  239. if (prevframe_x >= width) {
  240. prevframe_index += line_inc;
  241. prevframe_x = 0;
  242. }
  243. }
  244. }
  245. static int xan_wc3_decode_frame(XanContext *s, AVFrame *frame)
  246. {
  247. int width = s->avctx->width;
  248. int height = s->avctx->height;
  249. int total_pixels = width * height;
  250. unsigned char opcode;
  251. unsigned char flag = 0;
  252. int size = 0;
  253. int motion_x, motion_y;
  254. int x, y, ret;
  255. unsigned char *opcode_buffer = s->buffer1;
  256. unsigned char *opcode_buffer_end = s->buffer1 + s->buffer1_size;
  257. int opcode_buffer_size = s->buffer1_size;
  258. const unsigned char *imagedata_buffer = s->buffer2;
  259. /* pointers to segments inside the compressed chunk */
  260. const unsigned char *huffman_segment;
  261. GetByteContext size_segment;
  262. GetByteContext vector_segment;
  263. const unsigned char *imagedata_segment;
  264. int huffman_offset, size_offset, vector_offset, imagedata_offset,
  265. imagedata_size;
  266. if (s->size < 8)
  267. return AVERROR_INVALIDDATA;
  268. huffman_offset = AV_RL16(&s->buf[0]);
  269. size_offset = AV_RL16(&s->buf[2]);
  270. vector_offset = AV_RL16(&s->buf[4]);
  271. imagedata_offset = AV_RL16(&s->buf[6]);
  272. if (huffman_offset >= s->size ||
  273. size_offset >= s->size ||
  274. vector_offset >= s->size ||
  275. imagedata_offset >= s->size)
  276. return AVERROR_INVALIDDATA;
  277. huffman_segment = s->buf + huffman_offset;
  278. bytestream2_init(&size_segment, s->buf + size_offset, s->size - size_offset);
  279. bytestream2_init(&vector_segment, s->buf + vector_offset, s->size - vector_offset);
  280. imagedata_segment = s->buf + imagedata_offset;
  281. if ((ret = xan_huffman_decode(opcode_buffer, opcode_buffer_size,
  282. huffman_segment, s->size - huffman_offset)) < 0)
  283. return AVERROR_INVALIDDATA;
  284. opcode_buffer_end = opcode_buffer + ret;
  285. if (imagedata_segment[0] == 2) {
  286. xan_unpack(s->buffer2, s->buffer2_size,
  287. &imagedata_segment[1], s->size - imagedata_offset - 1);
  288. imagedata_size = s->buffer2_size;
  289. } else {
  290. imagedata_size = s->size - imagedata_offset - 1;
  291. imagedata_buffer = &imagedata_segment[1];
  292. }
  293. /* use the decoded data segments to build the frame */
  294. x = y = 0;
  295. while (total_pixels && opcode_buffer < opcode_buffer_end) {
  296. opcode = *opcode_buffer++;
  297. size = 0;
  298. switch (opcode) {
  299. case 0:
  300. flag ^= 1;
  301. continue;
  302. case 1:
  303. case 2:
  304. case 3:
  305. case 4:
  306. case 5:
  307. case 6:
  308. case 7:
  309. case 8:
  310. size = opcode;
  311. break;
  312. case 12:
  313. case 13:
  314. case 14:
  315. case 15:
  316. case 16:
  317. case 17:
  318. case 18:
  319. size += (opcode - 10);
  320. break;
  321. case 9:
  322. case 19:
  323. size = bytestream2_get_byte(&size_segment);
  324. break;
  325. case 10:
  326. case 20:
  327. size = bytestream2_get_be16(&size_segment);
  328. break;
  329. case 11:
  330. case 21:
  331. size = bytestream2_get_be24(&size_segment);
  332. break;
  333. }
  334. if (size > total_pixels)
  335. break;
  336. if (opcode < 12) {
  337. flag ^= 1;
  338. if (flag) {
  339. /* run of (size) pixels is unchanged from last frame */
  340. xan_wc3_copy_pixel_run(s, frame, x, y, size, 0, 0);
  341. } else {
  342. /* output a run of pixels from imagedata_buffer */
  343. if (imagedata_size < size)
  344. break;
  345. xan_wc3_output_pixel_run(s, frame, imagedata_buffer, x, y, size);
  346. imagedata_buffer += size;
  347. imagedata_size -= size;
  348. }
  349. } else {
  350. /* run-based motion compensation from last frame */
  351. uint8_t vector = bytestream2_get_byte(&vector_segment);
  352. motion_x = sign_extend(vector >> 4, 4);
  353. motion_y = sign_extend(vector & 0xF, 4);
  354. /* copy a run of pixels from the previous frame */
  355. xan_wc3_copy_pixel_run(s, frame, x, y, size, motion_x, motion_y);
  356. flag = 0;
  357. }
  358. /* coordinate accounting */
  359. total_pixels -= size;
  360. y += (x + size) / width;
  361. x = (x + size) % width;
  362. }
  363. return 0;
  364. }
  365. #if RUNTIME_GAMMA
  366. static inline unsigned mul(unsigned a, unsigned b)
  367. {
  368. return (a * b) >> 16;
  369. }
  370. static inline unsigned pow4(unsigned a)
  371. {
  372. unsigned square = mul(a, a);
  373. return mul(square, square);
  374. }
  375. static inline unsigned pow5(unsigned a)
  376. {
  377. return mul(pow4(a), a);
  378. }
  379. static uint8_t gamma_corr(uint8_t in) {
  380. unsigned lo, hi = 0xff40, target;
  381. int i = 15;
  382. in = (in << 2) | (in >> 6);
  383. /* equivalent float code:
  384. if (in >= 252)
  385. return 253;
  386. return round(pow(in / 256.0, 0.8) * 256);
  387. */
  388. lo = target = in << 8;
  389. do {
  390. unsigned mid = (lo + hi) >> 1;
  391. unsigned pow = pow5(mid);
  392. if (pow > target) hi = mid;
  393. else lo = mid;
  394. } while (--i);
  395. return (pow4((lo + hi) >> 1) + 0x80) >> 8;
  396. }
  397. #else
  398. /**
  399. * This is a gamma correction that xan3 applies to all palette entries.
  400. *
  401. * There is a peculiarity, namely that the values are clamped to 253 -
  402. * it seems likely that this table was calculated by a buggy fixed-point
  403. * implementation, the one above under RUNTIME_GAMMA behaves like this for
  404. * example.
  405. * The exponent value of 0.8 can be explained by this as well, since 0.8 = 4/5
  406. * and thus pow(x, 0.8) is still easy to calculate.
  407. * Also, the input values are first rotated to the left by 2.
  408. */
  409. static const uint8_t gamma_lookup[256] = {
  410. 0x00, 0x09, 0x10, 0x16, 0x1C, 0x21, 0x27, 0x2C,
  411. 0x31, 0x35, 0x3A, 0x3F, 0x43, 0x48, 0x4C, 0x50,
  412. 0x54, 0x59, 0x5D, 0x61, 0x65, 0x69, 0x6D, 0x71,
  413. 0x75, 0x79, 0x7D, 0x80, 0x84, 0x88, 0x8C, 0x8F,
  414. 0x93, 0x97, 0x9A, 0x9E, 0xA2, 0xA5, 0xA9, 0xAC,
  415. 0xB0, 0xB3, 0xB7, 0xBA, 0xBE, 0xC1, 0xC5, 0xC8,
  416. 0xCB, 0xCF, 0xD2, 0xD5, 0xD9, 0xDC, 0xDF, 0xE3,
  417. 0xE6, 0xE9, 0xED, 0xF0, 0xF3, 0xF6, 0xFA, 0xFD,
  418. 0x03, 0x0B, 0x12, 0x18, 0x1D, 0x23, 0x28, 0x2D,
  419. 0x32, 0x36, 0x3B, 0x40, 0x44, 0x49, 0x4D, 0x51,
  420. 0x56, 0x5A, 0x5E, 0x62, 0x66, 0x6A, 0x6E, 0x72,
  421. 0x76, 0x7A, 0x7D, 0x81, 0x85, 0x89, 0x8D, 0x90,
  422. 0x94, 0x98, 0x9B, 0x9F, 0xA2, 0xA6, 0xAA, 0xAD,
  423. 0xB1, 0xB4, 0xB8, 0xBB, 0xBF, 0xC2, 0xC5, 0xC9,
  424. 0xCC, 0xD0, 0xD3, 0xD6, 0xDA, 0xDD, 0xE0, 0xE4,
  425. 0xE7, 0xEA, 0xED, 0xF1, 0xF4, 0xF7, 0xFA, 0xFD,
  426. 0x05, 0x0D, 0x13, 0x19, 0x1F, 0x24, 0x29, 0x2E,
  427. 0x33, 0x38, 0x3C, 0x41, 0x45, 0x4A, 0x4E, 0x52,
  428. 0x57, 0x5B, 0x5F, 0x63, 0x67, 0x6B, 0x6F, 0x73,
  429. 0x77, 0x7B, 0x7E, 0x82, 0x86, 0x8A, 0x8D, 0x91,
  430. 0x95, 0x99, 0x9C, 0xA0, 0xA3, 0xA7, 0xAA, 0xAE,
  431. 0xB2, 0xB5, 0xB9, 0xBC, 0xBF, 0xC3, 0xC6, 0xCA,
  432. 0xCD, 0xD0, 0xD4, 0xD7, 0xDA, 0xDE, 0xE1, 0xE4,
  433. 0xE8, 0xEB, 0xEE, 0xF1, 0xF5, 0xF8, 0xFB, 0xFD,
  434. 0x07, 0x0E, 0x15, 0x1A, 0x20, 0x25, 0x2A, 0x2F,
  435. 0x34, 0x39, 0x3D, 0x42, 0x46, 0x4B, 0x4F, 0x53,
  436. 0x58, 0x5C, 0x60, 0x64, 0x68, 0x6C, 0x70, 0x74,
  437. 0x78, 0x7C, 0x7F, 0x83, 0x87, 0x8B, 0x8E, 0x92,
  438. 0x96, 0x99, 0x9D, 0xA1, 0xA4, 0xA8, 0xAB, 0xAF,
  439. 0xB2, 0xB6, 0xB9, 0xBD, 0xC0, 0xC4, 0xC7, 0xCB,
  440. 0xCE, 0xD1, 0xD5, 0xD8, 0xDB, 0xDF, 0xE2, 0xE5,
  441. 0xE9, 0xEC, 0xEF, 0xF2, 0xF6, 0xF9, 0xFC, 0xFD
  442. };
  443. #endif
  444. static int xan_decode_frame(AVCodecContext *avctx,
  445. void *data, int *got_frame,
  446. AVPacket *avpkt)
  447. {
  448. AVFrame *frame = data;
  449. const uint8_t *buf = avpkt->data;
  450. int ret, buf_size = avpkt->size;
  451. XanContext *s = avctx->priv_data;
  452. GetByteContext ctx;
  453. int tag = 0;
  454. bytestream2_init(&ctx, buf, buf_size);
  455. while (bytestream2_get_bytes_left(&ctx) > 8 && tag != VGA__TAG) {
  456. unsigned *tmpptr;
  457. uint32_t new_pal;
  458. int size;
  459. int i;
  460. tag = bytestream2_get_le32(&ctx);
  461. size = bytestream2_get_be32(&ctx);
  462. size = FFMIN(size, bytestream2_get_bytes_left(&ctx));
  463. switch (tag) {
  464. case PALT_TAG:
  465. if (size < PALETTE_SIZE)
  466. return AVERROR_INVALIDDATA;
  467. if (s->palettes_count >= PALETTES_MAX)
  468. return AVERROR_INVALIDDATA;
  469. tmpptr = av_realloc(s->palettes,
  470. (s->palettes_count + 1) * AVPALETTE_SIZE);
  471. if (!tmpptr)
  472. return AVERROR(ENOMEM);
  473. s->palettes = tmpptr;
  474. tmpptr += s->palettes_count * AVPALETTE_COUNT;
  475. for (i = 0; i < PALETTE_COUNT; i++) {
  476. #if RUNTIME_GAMMA
  477. int r = gamma_corr(bytestream2_get_byteu(&ctx));
  478. int g = gamma_corr(bytestream2_get_byteu(&ctx));
  479. int b = gamma_corr(bytestream2_get_byteu(&ctx));
  480. #else
  481. int r = gamma_lookup[bytestream2_get_byteu(&ctx)];
  482. int g = gamma_lookup[bytestream2_get_byteu(&ctx)];
  483. int b = gamma_lookup[bytestream2_get_byteu(&ctx)];
  484. #endif
  485. *tmpptr++ = (r << 16) | (g << 8) | b;
  486. }
  487. s->palettes_count++;
  488. break;
  489. case SHOT_TAG:
  490. if (size < 4)
  491. return AVERROR_INVALIDDATA;
  492. new_pal = bytestream2_get_le32(&ctx);
  493. if (new_pal < s->palettes_count) {
  494. s->cur_palette = new_pal;
  495. } else
  496. av_log(avctx, AV_LOG_ERROR, "Invalid palette selected\n");
  497. break;
  498. case VGA__TAG:
  499. break;
  500. default:
  501. bytestream2_skip(&ctx, size);
  502. break;
  503. }
  504. }
  505. buf_size = bytestream2_get_bytes_left(&ctx);
  506. if (s->palettes_count <= 0) {
  507. av_log(s->avctx, AV_LOG_ERROR, "No palette found\n");
  508. return AVERROR_INVALIDDATA;
  509. }
  510. if ((ret = ff_get_buffer(avctx, frame, AV_GET_BUFFER_FLAG_REF))) {
  511. av_log(s->avctx, AV_LOG_ERROR, "get_buffer() failed\n");
  512. return ret;
  513. }
  514. if (!s->frame_size)
  515. s->frame_size = frame->linesize[0] * s->avctx->height;
  516. memcpy(frame->data[1],
  517. s->palettes + s->cur_palette * AVPALETTE_COUNT, AVPALETTE_SIZE);
  518. s->buf = ctx.buffer;
  519. s->size = buf_size;
  520. if (xan_wc3_decode_frame(s, frame) < 0)
  521. return AVERROR_INVALIDDATA;
  522. av_frame_unref(s->last_frame);
  523. if ((ret = av_frame_ref(s->last_frame, frame)) < 0)
  524. return ret;
  525. *got_frame = 1;
  526. /* always report that the buffer was completely consumed */
  527. return buf_size;
  528. }
  529. AVCodec ff_xan_wc3_decoder = {
  530. .name = "xan_wc3",
  531. .long_name = NULL_IF_CONFIG_SMALL("Wing Commander III / Xan"),
  532. .type = AVMEDIA_TYPE_VIDEO,
  533. .id = AV_CODEC_ID_XAN_WC3,
  534. .priv_data_size = sizeof(XanContext),
  535. .init = xan_decode_init,
  536. .close = xan_decode_end,
  537. .decode = xan_decode_frame,
  538. .capabilities = AV_CODEC_CAP_DR1,
  539. };