You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

267 lines
8.7KB

  1. /*
  2. * Westwood Studios VQA Format Demuxer
  3. * Copyright (c) 2003 The ffmpeg Project
  4. *
  5. * This file is part of FFmpeg.
  6. *
  7. * FFmpeg is free software; you can redistribute it and/or
  8. * modify it under the terms of the GNU Lesser General Public
  9. * License as published by the Free Software Foundation; either
  10. * version 2.1 of the License, or (at your option) any later version.
  11. *
  12. * FFmpeg is distributed in the hope that it will be useful,
  13. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  15. * Lesser General Public License for more details.
  16. *
  17. * You should have received a copy of the GNU Lesser General Public
  18. * License along with FFmpeg; if not, write to the Free Software
  19. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  20. */
  21. /**
  22. * @file
  23. * Westwood Studios VQA file demuxer
  24. * by Mike Melanson (melanson@pcisys.net)
  25. * for more information on the Westwood file formats, visit:
  26. * http://www.pcisys.net/~melanson/codecs/
  27. * http://www.geocities.com/SiliconValley/8682/aud3.txt
  28. */
  29. #include "libavutil/intreadwrite.h"
  30. #include "avformat.h"
  31. #include "internal.h"
  /* file signature: wsvqa_probe() expects FORM at offset 0 and WVQA at offset 8 */
  #define FORM_TAG MKBETAG('F', 'O', 'R', 'M')
  #define WVQA_TAG MKBETAG('W', 'V', 'Q', 'A')

  /* header-related chunk tags; FINF is the chunk that ends header parsing */
  #define VQHD_TAG MKBETAG('V', 'Q', 'H', 'D')
  #define FINF_TAG MKBETAG('F', 'I', 'N', 'F')

  /* payload chunk tags seen while demuxing: three audio flavours and video */
  #define SND0_TAG MKBETAG('S', 'N', 'D', '0')
  #define SND1_TAG MKBETAG('S', 'N', 'D', '1')
  #define SND2_TAG MKBETAG('S', 'N', 'D', '2')
  #define VQFR_TAG MKBETAG('V', 'Q', 'F', 'R')

  /* tags of unknown purpose; listed only so they are not reported as unknown */
  #define CINF_TAG MKBETAG('C', 'I', 'N', 'F')
  #define CINH_TAG MKBETAG('C', 'I', 'N', 'H')
  #define CIND_TAG MKBETAG('C', 'I', 'N', 'D')
  #define PINF_TAG MKBETAG('P', 'I', 'N', 'F')
  #define PINH_TAG MKBETAG('P', 'I', 'N', 'H')
  #define PIND_TAG MKBETAG('P', 'I', 'N', 'D')
  #define CMDS_TAG MKBETAG('C', 'M', 'D', 'S')

  /* number of VQA header bytes copied into the codec extradata */
  #define VQA_HEADER_SIZE 0x2A
  /* every chunk starts with a 4-byte tag followed by a 4-byte big-endian size */
  #define VQA_PREAMBLE_SIZE 8
  /**
   * Private demuxer state: written by wsvqa_read_header() and consulted by
   * wsvqa_read_packet() to route chunks to the right stream.
   */
  typedef struct WsVqaDemuxContext {
      /* channel count of the audio stream; wsvqa_read_packet() treats 0 as
       * "no audio header information was found" */
      int audio_channels;
      /* index of the audio stream that SND1/SND2 packets are assigned to */
      int audio_stream_index;
      /* index of the video stream that VQFR packets are assigned to */
      int video_stream_index;
  } WsVqaDemuxContext;
  55. static int wsvqa_probe(AVProbeData *p)
  56. {
  57. /* need 12 bytes to qualify */
  58. if (p->buf_size < 12)
  59. return 0;
  60. /* check for the VQA signatures */
  61. if ((AV_RB32(&p->buf[0]) != FORM_TAG) ||
  62. (AV_RB32(&p->buf[8]) != WVQA_TAG))
  63. return 0;
  64. return AVPROBE_SCORE_MAX;
  65. }
  66. static int wsvqa_read_header(AVFormatContext *s)
  67. {
  68. WsVqaDemuxContext *wsvqa = s->priv_data;
  69. AVIOContext *pb = s->pb;
  70. AVStream *st;
  71. unsigned char *header;
  72. unsigned char scratch[VQA_PREAMBLE_SIZE];
  73. unsigned int chunk_tag;
  74. unsigned int chunk_size;
  75. int fps, version, flags, sample_rate, channels;
  76. /* initialize the video decoder stream */
  77. st = avformat_new_stream(s, NULL);
  78. if (!st)
  79. return AVERROR(ENOMEM);
  80. st->start_time = 0;
  81. wsvqa->video_stream_index = st->index;
  82. st->codec->codec_type = AVMEDIA_TYPE_VIDEO;
  83. st->codec->codec_id = CODEC_ID_WS_VQA;
  84. st->codec->codec_tag = 0; /* no fourcc */
  85. /* skip to the start of the VQA header */
  86. avio_seek(pb, 20, SEEK_SET);
  87. /* the VQA header needs to go to the decoder */
  88. st->codec->extradata_size = VQA_HEADER_SIZE;
  89. st->codec->extradata = av_mallocz(VQA_HEADER_SIZE + FF_INPUT_BUFFER_PADDING_SIZE);
  90. header = (unsigned char *)st->codec->extradata;
  91. if (avio_read(pb, st->codec->extradata, VQA_HEADER_SIZE) !=
  92. VQA_HEADER_SIZE) {
  93. av_free(st->codec->extradata);
  94. return AVERROR(EIO);
  95. }
  96. st->codec->width = AV_RL16(&header[6]);
  97. st->codec->height = AV_RL16(&header[8]);
  98. fps = header[12];
  99. if (fps < 1 || fps > 30) {
  100. av_log(s, AV_LOG_ERROR, "invalid fps: %d\n", fps);
  101. return AVERROR_INVALIDDATA;
  102. }
  103. avpriv_set_pts_info(st, 64, 1, fps);
  104. /* initialize the audio decoder stream for VQA v1 or nonzero samplerate */
  105. version = AV_RL16(&header[ 0]);
  106. flags = AV_RL16(&header[ 2]);
  107. sample_rate = AV_RL16(&header[24]);
  108. channels = header[26];
  109. if (sample_rate || (version == 1 && flags == 1)) {
  110. st = avformat_new_stream(s, NULL);
  111. if (!st)
  112. return AVERROR(ENOMEM);
  113. st->start_time = 0;
  114. st->codec->codec_type = AVMEDIA_TYPE_AUDIO;
  115. st->codec->extradata_size = VQA_HEADER_SIZE;
  116. st->codec->extradata = av_mallocz(VQA_HEADER_SIZE + FF_INPUT_BUFFER_PADDING_SIZE);
  117. if (!st->codec->extradata)
  118. return AVERROR(ENOMEM);
  119. memcpy(st->codec->extradata, header, VQA_HEADER_SIZE);
  120. if (!sample_rate)
  121. sample_rate = 22050;
  122. st->codec->sample_rate = sample_rate;
  123. avpriv_set_pts_info(st, 64, 1, st->codec->sample_rate);
  124. if (!channels)
  125. channels = 1;
  126. st->codec->channels = channels;
  127. switch (version) {
  128. case 1:
  129. st->codec->codec_id = CODEC_ID_WESTWOOD_SND1;
  130. break;
  131. case 2:
  132. case 3:
  133. st->codec->codec_id = CODEC_ID_ADPCM_IMA_WS;
  134. st->codec->bits_per_coded_sample = 4;
  135. st->codec->bit_rate = channels * sample_rate * 4;
  136. break;
  137. default:
  138. /* NOTE: version 0 is supposedly raw pcm_u8 or pcm_s16le, but we do
  139. not have any samples to validate this */
  140. av_log_ask_for_sample(s, "VQA version %d audio\n", version);
  141. return AVERROR_PATCHWELCOME;
  142. }
  143. wsvqa->audio_stream_index = st->index;
  144. wsvqa->audio_channels = st->codec->channels;
  145. }
  146. /* there are 0 or more chunks before the FINF chunk; iterate until
  147. * FINF has been skipped and the file will be ready to be demuxed */
  148. do {
  149. if (avio_read(pb, scratch, VQA_PREAMBLE_SIZE) != VQA_PREAMBLE_SIZE)
  150. return AVERROR(EIO);
  151. chunk_tag = AV_RB32(&scratch[0]);
  152. chunk_size = AV_RB32(&scratch[4]);
  153. /* catch any unknown header tags, for curiousity */
  154. switch (chunk_tag) {
  155. case CINF_TAG:
  156. case CINH_TAG:
  157. case CIND_TAG:
  158. case PINF_TAG:
  159. case PINH_TAG:
  160. case PIND_TAG:
  161. case FINF_TAG:
  162. case CMDS_TAG:
  163. break;
  164. default:
  165. av_log (s, AV_LOG_ERROR, " note: unknown chunk seen (%c%c%c%c)\n",
  166. scratch[0], scratch[1],
  167. scratch[2], scratch[3]);
  168. break;
  169. }
  170. avio_skip(pb, chunk_size);
  171. } while (chunk_tag != FINF_TAG);
  172. return 0;
  173. }
  174. static int wsvqa_read_packet(AVFormatContext *s,
  175. AVPacket *pkt)
  176. {
  177. WsVqaDemuxContext *wsvqa = s->priv_data;
  178. AVIOContext *pb = s->pb;
  179. int ret = -1;
  180. unsigned char preamble[VQA_PREAMBLE_SIZE];
  181. unsigned int chunk_type;
  182. unsigned int chunk_size;
  183. int skip_byte;
  184. while (avio_read(pb, preamble, VQA_PREAMBLE_SIZE) == VQA_PREAMBLE_SIZE) {
  185. chunk_type = AV_RB32(&preamble[0]);
  186. chunk_size = AV_RB32(&preamble[4]);
  187. skip_byte = chunk_size & 0x01;
  188. if ((chunk_type == SND2_TAG || chunk_type == SND1_TAG) && wsvqa->audio_channels == 0) {
  189. av_log(s, AV_LOG_ERROR, "audio chunk without any audio header information found\n");
  190. return AVERROR_INVALIDDATA;
  191. }
  192. if ((chunk_type == SND1_TAG) || (chunk_type == SND2_TAG) || (chunk_type == VQFR_TAG)) {
  193. ret= av_get_packet(pb, pkt, chunk_size);
  194. if (ret<0)
  195. return AVERROR(EIO);
  196. if (chunk_type == SND2_TAG) {
  197. pkt->stream_index = wsvqa->audio_stream_index;
  198. /* 2 samples/byte, 1 or 2 samples per frame depending on stereo */
  199. pkt->duration = (chunk_size * 2) / wsvqa->audio_channels;
  200. } else if(chunk_type == SND1_TAG) {
  201. pkt->stream_index = wsvqa->audio_stream_index;
  202. /* unpacked size is stored in header */
  203. pkt->duration = AV_RL16(pkt->data) / wsvqa->audio_channels;
  204. } else {
  205. pkt->stream_index = wsvqa->video_stream_index;
  206. pkt->duration = 1;
  207. }
  208. /* stay on 16-bit alignment */
  209. if (skip_byte)
  210. avio_skip(pb, 1);
  211. return ret;
  212. } else {
  213. switch(chunk_type){
  214. case CMDS_TAG:
  215. case SND0_TAG:
  216. break;
  217. default:
  218. av_log(s, AV_LOG_INFO, "Skipping unknown chunk 0x%08X\n", chunk_type);
  219. }
  220. avio_skip(pb, chunk_size + skip_byte);
  221. }
  222. }
  223. return ret;
  224. }
  225. AVInputFormat ff_wsvqa_demuxer = {
  226. .name = "wsvqa",
  227. .long_name = NULL_IF_CONFIG_SMALL("Westwood Studios VQA format"),
  228. .priv_data_size = sizeof(WsVqaDemuxContext),
  229. .read_probe = wsvqa_probe,
  230. .read_header = wsvqa_read_header,
  231. .read_packet = wsvqa_read_packet,
  232. };