You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

625 lines
20KB

  1. /*
  2. * Westwood Studios VQA Video Decoder
  3. * Copyright (C) 2003 the ffmpeg project
  4. *
  5. * This file is part of FFmpeg.
  6. *
  7. * FFmpeg is free software; you can redistribute it and/or
  8. * modify it under the terms of the GNU Lesser General Public
  9. * License as published by the Free Software Foundation; either
  10. * version 2.1 of the License, or (at your option) any later version.
  11. *
  12. * FFmpeg is distributed in the hope that it will be useful,
  13. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  15. * Lesser General Public License for more details.
  16. *
  17. * You should have received a copy of the GNU Lesser General Public
  18. * License along with FFmpeg; if not, write to the Free Software
  19. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  20. */
  21. /**
  22. * @file
  23. * VQA Video Decoder
  24. * @author Mike Melanson (melanson@pcisys.net)
  25. * @see http://wiki.multimedia.cx/index.php?title=VQA
  26. *
  27. * The VQA video decoder outputs PAL8 or RGB555 colorspace data, depending
  28. * on the type of data in the file.
  29. *
  30. * This decoder needs the 42-byte VQHD header from the beginning
  31. * of the VQA file passed through the extradata field. The VQHD header
  32. * is laid out as:
  33. *
  34. * bytes 0-3 chunk fourcc: 'VQHD'
  35. * bytes 4-7 chunk size in big-endian format, should be 0x0000002A
  36. * bytes 8-49 VQHD chunk data
  37. *
  38. * Bytes 8-49 are what this decoder expects to see.
  39. *
  40. * Briefly, VQA is a vector quantized animation format that operates in a
  41. * VGA palettized colorspace. It operates on pixel vectors (blocks)
  42. * of either 4x2 or 4x4 in size. Compressed VQA chunks can contain vector
  43. * codebooks, palette information, and code maps for rendering vectors onto
  44. * frames. Any of these components can also be compressed with a run-length
  45. * encoding (RLE) algorithm commonly referred to as "format80".
  46. *
  47. * VQA takes a novel approach to rate control. Each group of n frames
  48. * (usually, n = 8) relies on a different vector codebook. Rather than
  49. * transporting an entire codebook every 8th frame, the new codebook is
  50. * broken up into 8 pieces and sent along with the compressed video chunks
  51. * for each of the 8 frames preceding the 8 frames which require the
  52. * codebook. A full codebook is also sent on the very first frame of a
  53. * file. This is an interesting technique, although it makes random file
  54. * seeking difficult despite the fact that the frames are all intracoded.
  55. *
  56. * V1,2 VQA uses 12-bit codebook indexes. If the 12-bit indexes were
  57. * packed into bytes and then RLE compressed, bytewise, the results would
  58. * be poor. That is why the coding method divides each index into 2 parts,
  59. * the top 4 bits and the bottom 8 bits, then RL encodes the 4-bit pieces
  60. * together and the 8-bit pieces together. If most of the vectors are
  61. * clustered into one group of 256 vectors, most of the 4-bit index pieces
  62. * should be the same.
  63. */
  64. #include <stdio.h>
  65. #include <stdlib.h>
  66. #include <string.h>
  67. #include "libavutil/intreadwrite.h"
  68. #include "libavutil/imgutils.h"
  69. #include "avcodec.h"
  70. #define PALETTE_COUNT 256
  71. #define VQA_HEADER_SIZE 0x2A
  72. #define CHUNK_PREAMBLE_SIZE 8
  73. /* allocate the maximum vector space, regardless of the file version:
  74. * (0xFF00 codebook vectors + 0x100 solid pixel vectors) * (4x4 pixels/block) */
  75. #define MAX_CODEBOOK_VECTORS 0xFF00
  76. #define SOLID_PIXEL_VECTORS 0x100
  77. #define MAX_VECTORS (MAX_CODEBOOK_VECTORS + SOLID_PIXEL_VECTORS)
  78. #define MAX_CODEBOOK_SIZE (MAX_VECTORS * 4 * 4)
  79. #define CBF0_TAG MKBETAG('C', 'B', 'F', '0')
  80. #define CBFZ_TAG MKBETAG('C', 'B', 'F', 'Z')
  81. #define CBP0_TAG MKBETAG('C', 'B', 'P', '0')
  82. #define CBPZ_TAG MKBETAG('C', 'B', 'P', 'Z')
  83. #define CPL0_TAG MKBETAG('C', 'P', 'L', '0')
  84. #define CPLZ_TAG MKBETAG('C', 'P', 'L', 'Z')
  85. #define VPTZ_TAG MKBETAG('V', 'P', 'T', 'Z')
  86. typedef struct VqaContext {
  87. AVCodecContext *avctx;
  88. AVFrame frame;
  89. const unsigned char *buf;
  90. int size;
  91. uint32_t palette[PALETTE_COUNT];
  92. int width; /* width of a frame */
  93. int height; /* height of a frame */
  94. int vector_width; /* width of individual vector */
  95. int vector_height; /* height of individual vector */
  96. int vqa_version; /* this should be either 1, 2 or 3 */
  97. unsigned char *codebook; /* the current codebook */
  98. int codebook_size;
  99. unsigned char *next_codebook_buffer; /* accumulator for next codebook */
  100. int next_codebook_buffer_index;
  101. unsigned char *decode_buffer;
  102. int decode_buffer_size;
  103. /* number of frames to go before replacing codebook */
  104. int partial_countdown;
  105. int partial_count;
  106. } VqaContext;
  107. static av_cold int vqa_decode_init(AVCodecContext *avctx)
  108. {
  109. VqaContext *s = avctx->priv_data;
  110. unsigned char *vqa_header;
  111. int i, j, codebook_index;
  112. s->avctx = avctx;
  113. avctx->pix_fmt = PIX_FMT_PAL8;
  114. /* make sure the extradata made it */
  115. if (s->avctx->extradata_size != VQA_HEADER_SIZE) {
  116. av_log(s->avctx, AV_LOG_ERROR, " VQA video: expected extradata size of %d\n", VQA_HEADER_SIZE);
  117. return -1;
  118. }
  119. /* load up the VQA parameters from the header */
  120. vqa_header = (unsigned char *)s->avctx->extradata;
  121. s->vqa_version = vqa_header[0];
  122. if (s->vqa_version < 1 || s->vqa_version > 3) {
  123. av_log(s->avctx, AV_LOG_ERROR, " VQA video: unsupported version %d\n", s->vqa_version);
  124. return -1;
  125. }
  126. s->width = AV_RL16(&vqa_header[6]);
  127. s->height = AV_RL16(&vqa_header[8]);
  128. if(av_image_check_size(s->width, s->height, 0, avctx)){
  129. s->width= s->height= 0;
  130. return -1;
  131. }
  132. s->vector_width = vqa_header[10];
  133. s->vector_height = vqa_header[11];
  134. s->partial_count = s->partial_countdown = vqa_header[13];
  135. /* the vector dimensions have to meet very stringent requirements */
  136. if ((s->vector_width != 4) ||
  137. ((s->vector_height != 2) && (s->vector_height != 4))) {
  138. /* return without further initialization */
  139. return -1;
  140. }
  141. /* allocate codebooks */
  142. s->codebook_size = MAX_CODEBOOK_SIZE;
  143. s->codebook = av_malloc(s->codebook_size);
  144. s->next_codebook_buffer = av_malloc(s->codebook_size);
  145. /* initialize the solid-color vectors */
  146. if (s->vector_height == 4) {
  147. codebook_index = 0xFF00 * 16;
  148. for (i = 0; i < 256; i++)
  149. for (j = 0; j < 16; j++)
  150. s->codebook[codebook_index++] = i;
  151. } else {
  152. codebook_index = 0xF00 * 8;
  153. for (i = 0; i < 256; i++)
  154. for (j = 0; j < 8; j++)
  155. s->codebook[codebook_index++] = i;
  156. }
  157. s->next_codebook_buffer_index = 0;
  158. /* allocate decode buffer */
  159. s->decode_buffer_size = (s->width / s->vector_width) *
  160. (s->height / s->vector_height) * 2;
  161. s->decode_buffer = av_malloc(s->decode_buffer_size);
  162. avcodec_get_frame_defaults(&s->frame);
  163. s->frame.data[0] = NULL;
  164. return 0;
  165. }
  166. #define CHECK_COUNT() \
  167. if (dest_index + count > dest_size) { \
  168. av_log(NULL, AV_LOG_ERROR, " VQA video: decode_format80 problem: next op would overflow dest_index\n"); \
  169. av_log(NULL, AV_LOG_ERROR, " VQA video: current dest_index = %d, count = %d, dest_size = %d\n", \
  170. dest_index, count, dest_size); \
  171. return; \
  172. }
  173. static void decode_format80(const unsigned char *src, int src_size,
  174. unsigned char *dest, int dest_size, int check_size) {
  175. int src_index = 0;
  176. int dest_index = 0;
  177. int count;
  178. int src_pos;
  179. unsigned char color;
  180. int i;
  181. while (src_index < src_size) {
  182. av_dlog(NULL, " opcode %02X: ", src[src_index]);
  183. /* 0x80 means that frame is finished */
  184. if (src[src_index] == 0x80)
  185. return;
  186. if (dest_index >= dest_size) {
  187. av_log(NULL, AV_LOG_ERROR, " VQA video: decode_format80 problem: dest_index (%d) exceeded dest_size (%d)\n",
  188. dest_index, dest_size);
  189. return;
  190. }
  191. if (src[src_index] == 0xFF) {
  192. src_index++;
  193. count = AV_RL16(&src[src_index]);
  194. src_index += 2;
  195. src_pos = AV_RL16(&src[src_index]);
  196. src_index += 2;
  197. av_dlog(NULL, "(1) copy %X bytes from absolute pos %X\n", count, src_pos);
  198. CHECK_COUNT();
  199. if (src_pos + count > dest_size)
  200. return;
  201. for (i = 0; i < count; i++)
  202. dest[dest_index + i] = dest[src_pos + i];
  203. dest_index += count;
  204. } else if (src[src_index] == 0xFE) {
  205. src_index++;
  206. count = AV_RL16(&src[src_index]);
  207. src_index += 2;
  208. color = src[src_index++];
  209. av_dlog(NULL, "(2) set %X bytes to %02X\n", count, color);
  210. CHECK_COUNT();
  211. memset(&dest[dest_index], color, count);
  212. dest_index += count;
  213. } else if ((src[src_index] & 0xC0) == 0xC0) {
  214. count = (src[src_index++] & 0x3F) + 3;
  215. src_pos = AV_RL16(&src[src_index]);
  216. src_index += 2;
  217. av_dlog(NULL, "(3) copy %X bytes from absolute pos %X\n", count, src_pos);
  218. CHECK_COUNT();
  219. if (src_pos + count > dest_size)
  220. return;
  221. for (i = 0; i < count; i++)
  222. dest[dest_index + i] = dest[src_pos + i];
  223. dest_index += count;
  224. } else if (src[src_index] > 0x80) {
  225. count = src[src_index++] & 0x3F;
  226. av_dlog(NULL, "(4) copy %X bytes from source to dest\n", count);
  227. CHECK_COUNT();
  228. memcpy(&dest[dest_index], &src[src_index], count);
  229. src_index += count;
  230. dest_index += count;
  231. } else {
  232. count = ((src[src_index] & 0x70) >> 4) + 3;
  233. src_pos = AV_RB16(&src[src_index]) & 0x0FFF;
  234. src_index += 2;
  235. av_dlog(NULL, "(5) copy %X bytes from relpos %X\n", count, src_pos);
  236. CHECK_COUNT();
  237. if (dest_index < src_pos)
  238. return;
  239. for (i = 0; i < count; i++)
  240. dest[dest_index + i] = dest[dest_index - src_pos + i];
  241. dest_index += count;
  242. }
  243. }
  244. /* validate that the entire destination buffer was filled; this is
  245. * important for decoding frame maps since each vector needs to have a
  246. * codebook entry; it is not important for compressed codebooks because
  247. * not every entry needs to be filled */
  248. if (check_size)
  249. if (dest_index < dest_size)
  250. av_log(NULL, AV_LOG_ERROR, " VQA video: decode_format80 problem: decode finished with dest_index (%d) < dest_size (%d)\n",
  251. dest_index, dest_size);
  252. }
  253. static void vqa_decode_chunk(VqaContext *s)
  254. {
  255. unsigned int chunk_type;
  256. unsigned int chunk_size;
  257. int byte_skip;
  258. unsigned int index = 0;
  259. int i;
  260. unsigned char r, g, b;
  261. int index_shift;
  262. int cbf0_chunk = -1;
  263. int cbfz_chunk = -1;
  264. int cbp0_chunk = -1;
  265. int cbpz_chunk = -1;
  266. int cpl0_chunk = -1;
  267. int cplz_chunk = -1;
  268. int vptz_chunk = -1;
  269. int x, y;
  270. int lines = 0;
  271. int pixel_ptr;
  272. int vector_index = 0;
  273. int lobyte = 0;
  274. int hibyte = 0;
  275. int lobytes = 0;
  276. int hibytes = s->decode_buffer_size / 2;
  277. /* first, traverse through the frame and find the subchunks */
  278. while (index < s->size) {
  279. chunk_type = AV_RB32(&s->buf[index]);
  280. chunk_size = AV_RB32(&s->buf[index + 4]);
  281. switch (chunk_type) {
  282. case CBF0_TAG:
  283. cbf0_chunk = index;
  284. break;
  285. case CBFZ_TAG:
  286. cbfz_chunk = index;
  287. break;
  288. case CBP0_TAG:
  289. cbp0_chunk = index;
  290. break;
  291. case CBPZ_TAG:
  292. cbpz_chunk = index;
  293. break;
  294. case CPL0_TAG:
  295. cpl0_chunk = index;
  296. break;
  297. case CPLZ_TAG:
  298. cplz_chunk = index;
  299. break;
  300. case VPTZ_TAG:
  301. vptz_chunk = index;
  302. break;
  303. default:
  304. av_log(s->avctx, AV_LOG_ERROR, " VQA video: Found unknown chunk type: %c%c%c%c (%08X)\n",
  305. (chunk_type >> 24) & 0xFF,
  306. (chunk_type >> 16) & 0xFF,
  307. (chunk_type >> 8) & 0xFF,
  308. (chunk_type >> 0) & 0xFF,
  309. chunk_type);
  310. break;
  311. }
  312. byte_skip = chunk_size & 0x01;
  313. index += (CHUNK_PREAMBLE_SIZE + chunk_size + byte_skip);
  314. }
  315. /* next, deal with the palette */
  316. if ((cpl0_chunk != -1) && (cplz_chunk != -1)) {
  317. /* a chunk should not have both chunk types */
  318. av_log(s->avctx, AV_LOG_ERROR, " VQA video: problem: found both CPL0 and CPLZ chunks\n");
  319. return;
  320. }
  321. /* decompress the palette chunk */
  322. if (cplz_chunk != -1) {
  323. /* yet to be handled */
  324. }
  325. /* convert the RGB palette into the machine's endian format */
  326. if (cpl0_chunk != -1) {
  327. chunk_size = AV_RB32(&s->buf[cpl0_chunk + 4]);
  328. /* sanity check the palette size */
  329. if (chunk_size / 3 > 256) {
  330. av_log(s->avctx, AV_LOG_ERROR, " VQA video: problem: found a palette chunk with %d colors\n",
  331. chunk_size / 3);
  332. return;
  333. }
  334. cpl0_chunk += CHUNK_PREAMBLE_SIZE;
  335. for (i = 0; i < chunk_size / 3; i++) {
  336. /* scale by 4 to transform 6-bit palette -> 8-bit */
  337. r = s->buf[cpl0_chunk++] * 4;
  338. g = s->buf[cpl0_chunk++] * 4;
  339. b = s->buf[cpl0_chunk++] * 4;
  340. s->palette[i] = 0xFF << 24 | r << 16 | g << 8 | b;
  341. s->palette[i] |= s->palette[i] >> 6 & 0x30303;
  342. }
  343. }
  344. /* next, look for a full codebook */
  345. if ((cbf0_chunk != -1) && (cbfz_chunk != -1)) {
  346. /* a chunk should not have both chunk types */
  347. av_log(s->avctx, AV_LOG_ERROR, " VQA video: problem: found both CBF0 and CBFZ chunks\n");
  348. return;
  349. }
  350. /* decompress the full codebook chunk */
  351. if (cbfz_chunk != -1) {
  352. chunk_size = AV_RB32(&s->buf[cbfz_chunk + 4]);
  353. cbfz_chunk += CHUNK_PREAMBLE_SIZE;
  354. decode_format80(&s->buf[cbfz_chunk], chunk_size,
  355. s->codebook, s->codebook_size, 0);
  356. }
  357. /* copy a full codebook */
  358. if (cbf0_chunk != -1) {
  359. chunk_size = AV_RB32(&s->buf[cbf0_chunk + 4]);
  360. /* sanity check the full codebook size */
  361. if (chunk_size > MAX_CODEBOOK_SIZE) {
  362. av_log(s->avctx, AV_LOG_ERROR, " VQA video: problem: CBF0 chunk too large (0x%X bytes)\n",
  363. chunk_size);
  364. return;
  365. }
  366. cbf0_chunk += CHUNK_PREAMBLE_SIZE;
  367. memcpy(s->codebook, &s->buf[cbf0_chunk], chunk_size);
  368. }
  369. /* decode the frame */
  370. if (vptz_chunk == -1) {
  371. /* something is wrong if there is no VPTZ chunk */
  372. av_log(s->avctx, AV_LOG_ERROR, " VQA video: problem: no VPTZ chunk found\n");
  373. return;
  374. }
  375. chunk_size = AV_RB32(&s->buf[vptz_chunk + 4]);
  376. vptz_chunk += CHUNK_PREAMBLE_SIZE;
  377. decode_format80(&s->buf[vptz_chunk], chunk_size,
  378. s->decode_buffer, s->decode_buffer_size, 1);
  379. /* render the final PAL8 frame */
  380. if (s->vector_height == 4)
  381. index_shift = 4;
  382. else
  383. index_shift = 3;
  384. for (y = 0; y < s->frame.linesize[0] * s->height;
  385. y += s->frame.linesize[0] * s->vector_height) {
  386. for (x = y; x < y + s->width; x += 4, lobytes++, hibytes++) {
  387. pixel_ptr = x;
  388. /* get the vector index, the method for which varies according to
  389. * VQA file version */
  390. switch (s->vqa_version) {
  391. case 1:
  392. lobyte = s->decode_buffer[lobytes * 2];
  393. hibyte = s->decode_buffer[(lobytes * 2) + 1];
  394. vector_index = ((hibyte << 8) | lobyte) >> 3;
  395. vector_index <<= index_shift;
  396. lines = s->vector_height;
  397. /* uniform color fill - a quick hack */
  398. if (hibyte == 0xFF) {
  399. while (lines--) {
  400. s->frame.data[0][pixel_ptr + 0] = 255 - lobyte;
  401. s->frame.data[0][pixel_ptr + 1] = 255 - lobyte;
  402. s->frame.data[0][pixel_ptr + 2] = 255 - lobyte;
  403. s->frame.data[0][pixel_ptr + 3] = 255 - lobyte;
  404. pixel_ptr += s->frame.linesize[0];
  405. }
  406. lines=0;
  407. }
  408. break;
  409. case 2:
  410. lobyte = s->decode_buffer[lobytes];
  411. hibyte = s->decode_buffer[hibytes];
  412. vector_index = (hibyte << 8) | lobyte;
  413. vector_index <<= index_shift;
  414. lines = s->vector_height;
  415. break;
  416. case 3:
  417. /* not implemented yet */
  418. lines = 0;
  419. break;
  420. }
  421. while (lines--) {
  422. s->frame.data[0][pixel_ptr + 0] = s->codebook[vector_index++];
  423. s->frame.data[0][pixel_ptr + 1] = s->codebook[vector_index++];
  424. s->frame.data[0][pixel_ptr + 2] = s->codebook[vector_index++];
  425. s->frame.data[0][pixel_ptr + 3] = s->codebook[vector_index++];
  426. pixel_ptr += s->frame.linesize[0];
  427. }
  428. }
  429. }
  430. /* handle partial codebook */
  431. if ((cbp0_chunk != -1) && (cbpz_chunk != -1)) {
  432. /* a chunk should not have both chunk types */
  433. av_log(s->avctx, AV_LOG_ERROR, " VQA video: problem: found both CBP0 and CBPZ chunks\n");
  434. return;
  435. }
  436. if (cbp0_chunk != -1) {
  437. chunk_size = AV_RB32(&s->buf[cbp0_chunk + 4]);
  438. cbp0_chunk += CHUNK_PREAMBLE_SIZE;
  439. /* accumulate partial codebook */
  440. memcpy(&s->next_codebook_buffer[s->next_codebook_buffer_index],
  441. &s->buf[cbp0_chunk], chunk_size);
  442. s->next_codebook_buffer_index += chunk_size;
  443. s->partial_countdown--;
  444. if (s->partial_countdown == 0) {
  445. /* time to replace codebook */
  446. memcpy(s->codebook, s->next_codebook_buffer,
  447. s->next_codebook_buffer_index);
  448. /* reset accounting */
  449. s->next_codebook_buffer_index = 0;
  450. s->partial_countdown = s->partial_count;
  451. }
  452. }
  453. if (cbpz_chunk != -1) {
  454. chunk_size = AV_RB32(&s->buf[cbpz_chunk + 4]);
  455. cbpz_chunk += CHUNK_PREAMBLE_SIZE;
  456. /* accumulate partial codebook */
  457. memcpy(&s->next_codebook_buffer[s->next_codebook_buffer_index],
  458. &s->buf[cbpz_chunk], chunk_size);
  459. s->next_codebook_buffer_index += chunk_size;
  460. s->partial_countdown--;
  461. if (s->partial_countdown == 0) {
  462. /* decompress codebook */
  463. decode_format80(s->next_codebook_buffer,
  464. s->next_codebook_buffer_index,
  465. s->codebook, s->codebook_size, 0);
  466. /* reset accounting */
  467. s->next_codebook_buffer_index = 0;
  468. s->partial_countdown = s->partial_count;
  469. }
  470. }
  471. }
  472. static int vqa_decode_frame(AVCodecContext *avctx,
  473. void *data, int *data_size,
  474. AVPacket *avpkt)
  475. {
  476. const uint8_t *buf = avpkt->data;
  477. int buf_size = avpkt->size;
  478. VqaContext *s = avctx->priv_data;
  479. s->buf = buf;
  480. s->size = buf_size;
  481. if (s->frame.data[0])
  482. avctx->release_buffer(avctx, &s->frame);
  483. if (avctx->get_buffer(avctx, &s->frame)) {
  484. av_log(s->avctx, AV_LOG_ERROR, " VQA Video: get_buffer() failed\n");
  485. return -1;
  486. }
  487. vqa_decode_chunk(s);
  488. /* make the palette available on the way out */
  489. memcpy(s->frame.data[1], s->palette, PALETTE_COUNT * 4);
  490. s->frame.palette_has_changed = 1;
  491. *data_size = sizeof(AVFrame);
  492. *(AVFrame*)data = s->frame;
  493. /* report that the buffer was completely consumed */
  494. return buf_size;
  495. }
  496. static av_cold int vqa_decode_end(AVCodecContext *avctx)
  497. {
  498. VqaContext *s = avctx->priv_data;
  499. av_free(s->codebook);
  500. av_free(s->next_codebook_buffer);
  501. av_free(s->decode_buffer);
  502. if (s->frame.data[0])
  503. avctx->release_buffer(avctx, &s->frame);
  504. return 0;
  505. }
  506. AVCodec ff_vqa_decoder = {
  507. .name = "vqavideo",
  508. .type = AVMEDIA_TYPE_VIDEO,
  509. .id = CODEC_ID_WS_VQA,
  510. .priv_data_size = sizeof(VqaContext),
  511. .init = vqa_decode_init,
  512. .close = vqa_decode_end,
  513. .decode = vqa_decode_frame,
  514. .capabilities = CODEC_CAP_DR1,
  515. .long_name = NULL_IF_CONFIG_SMALL("Westwood Studios VQA (Vector Quantized Animation) video"),
  516. };