You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

613 lines
20KB

  1. /*
  2. * Westwood Studios VQA Video Decoder
  3. * Copyright (C) 2003 the ffmpeg project
  4. *
  5. * This file is part of Libav.
  6. *
  7. * Libav is free software; you can redistribute it and/or
  8. * modify it under the terms of the GNU Lesser General Public
  9. * License as published by the Free Software Foundation; either
  10. * version 2.1 of the License, or (at your option) any later version.
  11. *
  12. * Libav is distributed in the hope that it will be useful,
  13. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  15. * Lesser General Public License for more details.
  16. *
  17. * You should have received a copy of the GNU Lesser General Public
  18. * License along with Libav; if not, write to the Free Software
  19. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  20. */
  21. /**
  22. * @file
  23. * VQA Video Decoder
  24. * @author Mike Melanson (melanson@pcisys.net)
  25. * @see http://wiki.multimedia.cx/index.php?title=VQA
  26. *
  27. * The VQA video decoder outputs PAL8 or RGB555 colorspace data, depending
  28. * on the type of data in the file.
  29. *
  30. * This decoder needs the 42-byte VQHD header from the beginning
  31. * of the VQA file passed through the extradata field. The VQHD header
  32. * is laid out as:
  33. *
  34. * bytes 0-3 chunk fourcc: 'VQHD'
  35. * bytes 4-7 chunk size in big-endian format, should be 0x0000002A
  36. * bytes 8-49 VQHD chunk data
  37. *
  38. * Bytes 8-49 are what this decoder expects to see.
  39. *
  40. * Briefly, VQA is a vector quantized animation format that operates in a
  41. * VGA palettized colorspace. It operates on pixel vectors (blocks)
  42. * of either 4x2 or 4x4 in size. Compressed VQA chunks can contain vector
  43. * codebooks, palette information, and code maps for rendering vectors onto
  44. * frames. Any of these components can also be compressed with a run-length
  45. * encoding (RLE) algorithm commonly referred to as "format80".
  46. *
  47. * VQA takes a novel approach to rate control. Each group of n frames
  48. * (usually, n = 8) relies on a different vector codebook. Rather than
  49. * transporting an entire codebook every 8th frame, the new codebook is
  50. * broken up into 8 pieces and sent along with the compressed video chunks
  51. * for each of the 8 frames preceding the 8 frames which require the
  52. * codebook. A full codebook is also sent on the very first frame of a
  53. * file. This is an interesting technique, although it makes random file
  54. * seeking difficult despite the fact that the frames are all intracoded.
  55. *
  56. * V1,2 VQA uses 12-bit codebook indexes. If the 12-bit indexes were
  57. * packed into bytes and then RLE compressed, bytewise, the results would
  58. * be poor. That is why the coding method divides each index into 2 parts,
  59. * the top 4 bits and the bottom 8 bits, then RL encodes the 4-bit pieces
  60. * together and the 8-bit pieces together. If most of the vectors are
  61. * clustered into one group of 256 vectors, most of the 4-bit index pieces
  62. * should be the same.
  63. */
  64. #include <stdio.h>
  65. #include <stdlib.h>
  66. #include <string.h>
  67. #include "libavutil/intreadwrite.h"
  68. #include "libavutil/imgutils.h"
  69. #include "avcodec.h"
  70. #define PALETTE_COUNT 256
  71. #define VQA_HEADER_SIZE 0x2A
  72. #define CHUNK_PREAMBLE_SIZE 8
  73. /* allocate the maximum vector space, regardless of the file version:
  74. * (0xFF00 codebook vectors + 0x100 solid pixel vectors) * (4x4 pixels/block) */
  75. #define MAX_CODEBOOK_VECTORS 0xFF00
  76. #define SOLID_PIXEL_VECTORS 0x100
  77. #define MAX_VECTORS (MAX_CODEBOOK_VECTORS + SOLID_PIXEL_VECTORS)
  78. #define MAX_CODEBOOK_SIZE (MAX_VECTORS * 4 * 4)
  79. #define CBF0_TAG MKBETAG('C', 'B', 'F', '0')
  80. #define CBFZ_TAG MKBETAG('C', 'B', 'F', 'Z')
  81. #define CBP0_TAG MKBETAG('C', 'B', 'P', '0')
  82. #define CBPZ_TAG MKBETAG('C', 'B', 'P', 'Z')
  83. #define CPL0_TAG MKBETAG('C', 'P', 'L', '0')
  84. #define CPLZ_TAG MKBETAG('C', 'P', 'L', 'Z')
  85. #define VPTZ_TAG MKBETAG('V', 'P', 'T', 'Z')
  86. typedef struct VqaContext {
  87. AVCodecContext *avctx;
  88. AVFrame frame;
  89. const unsigned char *buf;
  90. int size;
  91. uint32_t palette[PALETTE_COUNT];
  92. int width; /* width of a frame */
  93. int height; /* height of a frame */
  94. int vector_width; /* width of individual vector */
  95. int vector_height; /* height of individual vector */
  96. int vqa_version; /* this should be either 1, 2 or 3 */
  97. unsigned char *codebook; /* the current codebook */
  98. int codebook_size;
  99. unsigned char *next_codebook_buffer; /* accumulator for next codebook */
  100. int next_codebook_buffer_index;
  101. unsigned char *decode_buffer;
  102. int decode_buffer_size;
  103. /* number of frames to go before replacing codebook */
  104. int partial_countdown;
  105. int partial_count;
  106. } VqaContext;
  107. static av_cold int vqa_decode_init(AVCodecContext *avctx)
  108. {
  109. VqaContext *s = avctx->priv_data;
  110. unsigned char *vqa_header;
  111. int i, j, codebook_index;
  112. s->avctx = avctx;
  113. avctx->pix_fmt = PIX_FMT_PAL8;
  114. /* make sure the extradata made it */
  115. if (s->avctx->extradata_size != VQA_HEADER_SIZE) {
  116. av_log(s->avctx, AV_LOG_ERROR, " VQA video: expected extradata size of %d\n", VQA_HEADER_SIZE);
  117. return -1;
  118. }
  119. /* load up the VQA parameters from the header */
  120. vqa_header = (unsigned char *)s->avctx->extradata;
  121. s->vqa_version = vqa_header[0];
  122. s->width = AV_RL16(&vqa_header[6]);
  123. s->height = AV_RL16(&vqa_header[8]);
  124. if(av_image_check_size(s->width, s->height, 0, avctx)){
  125. s->width= s->height= 0;
  126. return -1;
  127. }
  128. s->vector_width = vqa_header[10];
  129. s->vector_height = vqa_header[11];
  130. s->partial_count = s->partial_countdown = vqa_header[13];
  131. /* the vector dimensions have to meet very stringent requirements */
  132. if ((s->vector_width != 4) ||
  133. ((s->vector_height != 2) && (s->vector_height != 4))) {
  134. /* return without further initialization */
  135. return -1;
  136. }
  137. /* allocate codebooks */
  138. s->codebook_size = MAX_CODEBOOK_SIZE;
  139. s->codebook = av_malloc(s->codebook_size);
  140. s->next_codebook_buffer = av_malloc(s->codebook_size);
  141. /* initialize the solid-color vectors */
  142. if (s->vector_height == 4) {
  143. codebook_index = 0xFF00 * 16;
  144. for (i = 0; i < 256; i++)
  145. for (j = 0; j < 16; j++)
  146. s->codebook[codebook_index++] = i;
  147. } else {
  148. codebook_index = 0xF00 * 8;
  149. for (i = 0; i < 256; i++)
  150. for (j = 0; j < 8; j++)
  151. s->codebook[codebook_index++] = i;
  152. }
  153. s->next_codebook_buffer_index = 0;
  154. /* allocate decode buffer */
  155. s->decode_buffer_size = (s->width / s->vector_width) *
  156. (s->height / s->vector_height) * 2;
  157. s->decode_buffer = av_malloc(s->decode_buffer_size);
  158. s->frame.data[0] = NULL;
  159. return 0;
  160. }
  161. #define CHECK_COUNT() \
  162. if (dest_index + count > dest_size) { \
  163. av_log(NULL, AV_LOG_ERROR, " VQA video: decode_format80 problem: next op would overflow dest_index\n"); \
  164. av_log(NULL, AV_LOG_ERROR, " VQA video: current dest_index = %d, count = %d, dest_size = %d\n", \
  165. dest_index, count, dest_size); \
  166. return; \
  167. }
  168. static void decode_format80(const unsigned char *src, int src_size,
  169. unsigned char *dest, int dest_size, int check_size) {
  170. int src_index = 0;
  171. int dest_index = 0;
  172. int count;
  173. int src_pos;
  174. unsigned char color;
  175. int i;
  176. while (src_index < src_size) {
  177. av_dlog(NULL, " opcode %02X: ", src[src_index]);
  178. /* 0x80 means that frame is finished */
  179. if (src[src_index] == 0x80)
  180. return;
  181. if (dest_index >= dest_size) {
  182. av_log(NULL, AV_LOG_ERROR, " VQA video: decode_format80 problem: dest_index (%d) exceeded dest_size (%d)\n",
  183. dest_index, dest_size);
  184. return;
  185. }
  186. if (src[src_index] == 0xFF) {
  187. src_index++;
  188. count = AV_RL16(&src[src_index]);
  189. src_index += 2;
  190. src_pos = AV_RL16(&src[src_index]);
  191. src_index += 2;
  192. av_dlog(NULL, "(1) copy %X bytes from absolute pos %X\n", count, src_pos);
  193. CHECK_COUNT();
  194. for (i = 0; i < count; i++)
  195. dest[dest_index + i] = dest[src_pos + i];
  196. dest_index += count;
  197. } else if (src[src_index] == 0xFE) {
  198. src_index++;
  199. count = AV_RL16(&src[src_index]);
  200. src_index += 2;
  201. color = src[src_index++];
  202. av_dlog(NULL, "(2) set %X bytes to %02X\n", count, color);
  203. CHECK_COUNT();
  204. memset(&dest[dest_index], color, count);
  205. dest_index += count;
  206. } else if ((src[src_index] & 0xC0) == 0xC0) {
  207. count = (src[src_index++] & 0x3F) + 3;
  208. src_pos = AV_RL16(&src[src_index]);
  209. src_index += 2;
  210. av_dlog(NULL, "(3) copy %X bytes from absolute pos %X\n", count, src_pos);
  211. CHECK_COUNT();
  212. for (i = 0; i < count; i++)
  213. dest[dest_index + i] = dest[src_pos + i];
  214. dest_index += count;
  215. } else if (src[src_index] > 0x80) {
  216. count = src[src_index++] & 0x3F;
  217. av_dlog(NULL, "(4) copy %X bytes from source to dest\n", count);
  218. CHECK_COUNT();
  219. memcpy(&dest[dest_index], &src[src_index], count);
  220. src_index += count;
  221. dest_index += count;
  222. } else {
  223. count = ((src[src_index] & 0x70) >> 4) + 3;
  224. src_pos = AV_RB16(&src[src_index]) & 0x0FFF;
  225. src_index += 2;
  226. av_dlog(NULL, "(5) copy %X bytes from relpos %X\n", count, src_pos);
  227. CHECK_COUNT();
  228. for (i = 0; i < count; i++)
  229. dest[dest_index + i] = dest[dest_index - src_pos + i];
  230. dest_index += count;
  231. }
  232. }
  233. /* validate that the entire destination buffer was filled; this is
  234. * important for decoding frame maps since each vector needs to have a
  235. * codebook entry; it is not important for compressed codebooks because
  236. * not every entry needs to be filled */
  237. if (check_size)
  238. if (dest_index < dest_size)
  239. av_log(NULL, AV_LOG_ERROR, " VQA video: decode_format80 problem: decode finished with dest_index (%d) < dest_size (%d)\n",
  240. dest_index, dest_size);
  241. }
  242. static void vqa_decode_chunk(VqaContext *s)
  243. {
  244. unsigned int chunk_type;
  245. unsigned int chunk_size;
  246. int byte_skip;
  247. unsigned int index = 0;
  248. int i;
  249. unsigned char r, g, b;
  250. int index_shift;
  251. int cbf0_chunk = -1;
  252. int cbfz_chunk = -1;
  253. int cbp0_chunk = -1;
  254. int cbpz_chunk = -1;
  255. int cpl0_chunk = -1;
  256. int cplz_chunk = -1;
  257. int vptz_chunk = -1;
  258. int x, y;
  259. int lines = 0;
  260. int pixel_ptr;
  261. int vector_index = 0;
  262. int lobyte = 0;
  263. int hibyte = 0;
  264. int lobytes = 0;
  265. int hibytes = s->decode_buffer_size / 2;
  266. /* first, traverse through the frame and find the subchunks */
  267. while (index < s->size) {
  268. chunk_type = AV_RB32(&s->buf[index]);
  269. chunk_size = AV_RB32(&s->buf[index + 4]);
  270. switch (chunk_type) {
  271. case CBF0_TAG:
  272. cbf0_chunk = index;
  273. break;
  274. case CBFZ_TAG:
  275. cbfz_chunk = index;
  276. break;
  277. case CBP0_TAG:
  278. cbp0_chunk = index;
  279. break;
  280. case CBPZ_TAG:
  281. cbpz_chunk = index;
  282. break;
  283. case CPL0_TAG:
  284. cpl0_chunk = index;
  285. break;
  286. case CPLZ_TAG:
  287. cplz_chunk = index;
  288. break;
  289. case VPTZ_TAG:
  290. vptz_chunk = index;
  291. break;
  292. default:
  293. av_log(s->avctx, AV_LOG_ERROR, " VQA video: Found unknown chunk type: %c%c%c%c (%08X)\n",
  294. (chunk_type >> 24) & 0xFF,
  295. (chunk_type >> 16) & 0xFF,
  296. (chunk_type >> 8) & 0xFF,
  297. (chunk_type >> 0) & 0xFF,
  298. chunk_type);
  299. break;
  300. }
  301. byte_skip = chunk_size & 0x01;
  302. index += (CHUNK_PREAMBLE_SIZE + chunk_size + byte_skip);
  303. }
  304. /* next, deal with the palette */
  305. if ((cpl0_chunk != -1) && (cplz_chunk != -1)) {
  306. /* a chunk should not have both chunk types */
  307. av_log(s->avctx, AV_LOG_ERROR, " VQA video: problem: found both CPL0 and CPLZ chunks\n");
  308. return;
  309. }
  310. /* decompress the palette chunk */
  311. if (cplz_chunk != -1) {
  312. /* yet to be handled */
  313. }
  314. /* convert the RGB palette into the machine's endian format */
  315. if (cpl0_chunk != -1) {
  316. chunk_size = AV_RB32(&s->buf[cpl0_chunk + 4]);
  317. /* sanity check the palette size */
  318. if (chunk_size / 3 > 256) {
  319. av_log(s->avctx, AV_LOG_ERROR, " VQA video: problem: found a palette chunk with %d colors\n",
  320. chunk_size / 3);
  321. return;
  322. }
  323. cpl0_chunk += CHUNK_PREAMBLE_SIZE;
  324. for (i = 0; i < chunk_size / 3; i++) {
  325. /* scale by 4 to transform 6-bit palette -> 8-bit */
  326. r = s->buf[cpl0_chunk++] * 4;
  327. g = s->buf[cpl0_chunk++] * 4;
  328. b = s->buf[cpl0_chunk++] * 4;
  329. s->palette[i] = (r << 16) | (g << 8) | (b);
  330. }
  331. }
  332. /* next, look for a full codebook */
  333. if ((cbf0_chunk != -1) && (cbfz_chunk != -1)) {
  334. /* a chunk should not have both chunk types */
  335. av_log(s->avctx, AV_LOG_ERROR, " VQA video: problem: found both CBF0 and CBFZ chunks\n");
  336. return;
  337. }
  338. /* decompress the full codebook chunk */
  339. if (cbfz_chunk != -1) {
  340. chunk_size = AV_RB32(&s->buf[cbfz_chunk + 4]);
  341. cbfz_chunk += CHUNK_PREAMBLE_SIZE;
  342. decode_format80(&s->buf[cbfz_chunk], chunk_size,
  343. s->codebook, s->codebook_size, 0);
  344. }
  345. /* copy a full codebook */
  346. if (cbf0_chunk != -1) {
  347. chunk_size = AV_RB32(&s->buf[cbf0_chunk + 4]);
  348. /* sanity check the full codebook size */
  349. if (chunk_size > MAX_CODEBOOK_SIZE) {
  350. av_log(s->avctx, AV_LOG_ERROR, " VQA video: problem: CBF0 chunk too large (0x%X bytes)\n",
  351. chunk_size);
  352. return;
  353. }
  354. cbf0_chunk += CHUNK_PREAMBLE_SIZE;
  355. memcpy(s->codebook, &s->buf[cbf0_chunk], chunk_size);
  356. }
  357. /* decode the frame */
  358. if (vptz_chunk == -1) {
  359. /* something is wrong if there is no VPTZ chunk */
  360. av_log(s->avctx, AV_LOG_ERROR, " VQA video: problem: no VPTZ chunk found\n");
  361. return;
  362. }
  363. chunk_size = AV_RB32(&s->buf[vptz_chunk + 4]);
  364. vptz_chunk += CHUNK_PREAMBLE_SIZE;
  365. decode_format80(&s->buf[vptz_chunk], chunk_size,
  366. s->decode_buffer, s->decode_buffer_size, 1);
  367. /* render the final PAL8 frame */
  368. if (s->vector_height == 4)
  369. index_shift = 4;
  370. else
  371. index_shift = 3;
  372. for (y = 0; y < s->frame.linesize[0] * s->height;
  373. y += s->frame.linesize[0] * s->vector_height) {
  374. for (x = y; x < y + s->width; x += 4, lobytes++, hibytes++) {
  375. pixel_ptr = x;
  376. /* get the vector index, the method for which varies according to
  377. * VQA file version */
  378. switch (s->vqa_version) {
  379. case 1:
  380. lobyte = s->decode_buffer[lobytes * 2];
  381. hibyte = s->decode_buffer[(lobytes * 2) + 1];
  382. vector_index = ((hibyte << 8) | lobyte) >> 3;
  383. vector_index <<= index_shift;
  384. lines = s->vector_height;
  385. /* uniform color fill - a quick hack */
  386. if (hibyte == 0xFF) {
  387. while (lines--) {
  388. s->frame.data[0][pixel_ptr + 0] = 255 - lobyte;
  389. s->frame.data[0][pixel_ptr + 1] = 255 - lobyte;
  390. s->frame.data[0][pixel_ptr + 2] = 255 - lobyte;
  391. s->frame.data[0][pixel_ptr + 3] = 255 - lobyte;
  392. pixel_ptr += s->frame.linesize[0];
  393. }
  394. lines=0;
  395. }
  396. break;
  397. case 2:
  398. lobyte = s->decode_buffer[lobytes];
  399. hibyte = s->decode_buffer[hibytes];
  400. vector_index = (hibyte << 8) | lobyte;
  401. vector_index <<= index_shift;
  402. lines = s->vector_height;
  403. break;
  404. case 3:
  405. /* not implemented yet */
  406. lines = 0;
  407. break;
  408. }
  409. while (lines--) {
  410. s->frame.data[0][pixel_ptr + 0] = s->codebook[vector_index++];
  411. s->frame.data[0][pixel_ptr + 1] = s->codebook[vector_index++];
  412. s->frame.data[0][pixel_ptr + 2] = s->codebook[vector_index++];
  413. s->frame.data[0][pixel_ptr + 3] = s->codebook[vector_index++];
  414. pixel_ptr += s->frame.linesize[0];
  415. }
  416. }
  417. }
  418. /* handle partial codebook */
  419. if ((cbp0_chunk != -1) && (cbpz_chunk != -1)) {
  420. /* a chunk should not have both chunk types */
  421. av_log(s->avctx, AV_LOG_ERROR, " VQA video: problem: found both CBP0 and CBPZ chunks\n");
  422. return;
  423. }
  424. if (cbp0_chunk != -1) {
  425. chunk_size = AV_RB32(&s->buf[cbp0_chunk + 4]);
  426. cbp0_chunk += CHUNK_PREAMBLE_SIZE;
  427. /* accumulate partial codebook */
  428. memcpy(&s->next_codebook_buffer[s->next_codebook_buffer_index],
  429. &s->buf[cbp0_chunk], chunk_size);
  430. s->next_codebook_buffer_index += chunk_size;
  431. s->partial_countdown--;
  432. if (s->partial_countdown == 0) {
  433. /* time to replace codebook */
  434. memcpy(s->codebook, s->next_codebook_buffer,
  435. s->next_codebook_buffer_index);
  436. /* reset accounting */
  437. s->next_codebook_buffer_index = 0;
  438. s->partial_countdown = s->partial_count;
  439. }
  440. }
  441. if (cbpz_chunk != -1) {
  442. chunk_size = AV_RB32(&s->buf[cbpz_chunk + 4]);
  443. cbpz_chunk += CHUNK_PREAMBLE_SIZE;
  444. /* accumulate partial codebook */
  445. memcpy(&s->next_codebook_buffer[s->next_codebook_buffer_index],
  446. &s->buf[cbpz_chunk], chunk_size);
  447. s->next_codebook_buffer_index += chunk_size;
  448. s->partial_countdown--;
  449. if (s->partial_countdown == 0) {
  450. /* decompress codebook */
  451. decode_format80(s->next_codebook_buffer,
  452. s->next_codebook_buffer_index,
  453. s->codebook, s->codebook_size, 0);
  454. /* reset accounting */
  455. s->next_codebook_buffer_index = 0;
  456. s->partial_countdown = s->partial_count;
  457. }
  458. }
  459. }
  460. static int vqa_decode_frame(AVCodecContext *avctx,
  461. void *data, int *data_size,
  462. AVPacket *avpkt)
  463. {
  464. const uint8_t *buf = avpkt->data;
  465. int buf_size = avpkt->size;
  466. VqaContext *s = avctx->priv_data;
  467. s->buf = buf;
  468. s->size = buf_size;
  469. if (s->frame.data[0])
  470. avctx->release_buffer(avctx, &s->frame);
  471. if (avctx->get_buffer(avctx, &s->frame)) {
  472. av_log(s->avctx, AV_LOG_ERROR, " VQA Video: get_buffer() failed\n");
  473. return -1;
  474. }
  475. vqa_decode_chunk(s);
  476. /* make the palette available on the way out */
  477. memcpy(s->frame.data[1], s->palette, PALETTE_COUNT * 4);
  478. s->frame.palette_has_changed = 1;
  479. *data_size = sizeof(AVFrame);
  480. *(AVFrame*)data = s->frame;
  481. /* report that the buffer was completely consumed */
  482. return buf_size;
  483. }
  484. static av_cold int vqa_decode_end(AVCodecContext *avctx)
  485. {
  486. VqaContext *s = avctx->priv_data;
  487. av_free(s->codebook);
  488. av_free(s->next_codebook_buffer);
  489. av_free(s->decode_buffer);
  490. if (s->frame.data[0])
  491. avctx->release_buffer(avctx, &s->frame);
  492. return 0;
  493. }
  494. AVCodec ff_vqa_decoder = {
  495. .name = "vqavideo",
  496. .type = AVMEDIA_TYPE_VIDEO,
  497. .id = CODEC_ID_WS_VQA,
  498. .priv_data_size = sizeof(VqaContext),
  499. .init = vqa_decode_init,
  500. .close = vqa_decode_end,
  501. .decode = vqa_decode_frame,
  502. .capabilities = CODEC_CAP_DR1,
  503. .long_name = NULL_IF_CONFIG_SMALL("Westwood Studios VQA (Vector Quantized Animation) video"),
  504. };