You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

390 lines
13KB

  1. /*
  2. * id Quake II CIN File Demuxer
  3. * Copyright (c) 2003 The ffmpeg Project
  4. *
  5. * This file is part of FFmpeg.
  6. *
  7. * FFmpeg is free software; you can redistribute it and/or
  8. * modify it under the terms of the GNU Lesser General Public
  9. * License as published by the Free Software Foundation; either
  10. * version 2.1 of the License, or (at your option) any later version.
  11. *
  12. * FFmpeg is distributed in the hope that it will be useful,
  13. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  15. * Lesser General Public License for more details.
  16. *
  17. * You should have received a copy of the GNU Lesser General Public
  18. * License along with FFmpeg; if not, write to the Free Software
  19. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  20. */
  21. /**
  22. * @file
  23. * id Quake II CIN file demuxer by Mike Melanson (melanson@pcisys.net)
  24. * For more information about the id CIN format, visit:
  25. * http://www.csse.monash.edu.au/~timf/
  26. *
  27. * CIN is a somewhat quirky and ill-defined format. Here are some notes
  28. * for anyone trying to understand the technical details of this format:
  29. *
  30. * The format has no definite file signature. This is problematic for a
  31. * general-purpose media player that wants to automatically detect file
  32. * types. However, a CIN file does start with 5 32-bit numbers that
  33. * specify audio and video parameters. This demuxer gets around the lack
  34. * of file signature by performing sanity checks on those parameters.
  35. * Probabilistically, this is a reasonable solution since the number of
  36. * valid combinations of the 5 parameters is a very small subset of the
  37. * total 160-bit number space.
  38. *
  39. * Refer to the function idcin_probe() for the precise A/V parameters
  40. * that this demuxer allows.
  41. *
  42. * Next, each audio and video frame has a duration of 1/14 sec. If the
  43. * audio sample rate is a multiple of the common frequency 22050 Hz it will
  44. * divide evenly by 14. However, if the sample rate is 11025 Hz:
  45. * 11025 (samples/sec) / 14 (frames/sec) = 787.5 (samples/frame)
  46. * The way the CIN stores audio in this case is by storing 787 sample
  47. * frames in the first audio frame and 788 sample frames in the second
  48. * audio frame. Therefore, the total number of bytes in an audio frame
  49. * is given as:
  50. * audio frame #0: 787 * (bytes/sample) * (# channels) bytes in frame
  51. * audio frame #1: 788 * (bytes/sample) * (# channels) bytes in frame
  52. * audio frame #2: 787 * (bytes/sample) * (# channels) bytes in frame
  53. * audio frame #3: 788 * (bytes/sample) * (# channels) bytes in frame
  54. *
  55. * Finally, not all id CIN creation tools agree on the resolution of the
  56. * color palette, apparently. Some creation tools specify red, green, and
  57. * blue palette components in terms of 6-bit VGA color DAC values which
  58. * range from 0..63. Other tools specify the RGB components as full 8-bit
  59. * values that range from 0..255. Since there are no markers in the file to
  60. * differentiate between the two variants, this demuxer uses the following
  61. * heuristic:
  62. * - load the 768 palette bytes from disk
  63. * - assume that they will need to be shifted left by 2 bits to
  64. * transform them from 6-bit values to 8-bit values
  65. * - scan through all 768 palette bytes
  66. * - if any bytes exceed 63, do not shift the bytes at all before
  67. * transmitting them to the video decoder
  68. */
  69. #include "libavutil/channel_layout.h"
  70. #include "libavutil/imgutils.h"
  71. #include "libavutil/intreadwrite.h"
  72. #include "avformat.h"
  73. #include "internal.h"
  74. #define HUFFMAN_TABLE_SIZE (64 * 1024)
  75. #define IDCIN_FPS 14
  76. typedef struct IdcinDemuxContext {
  77. int video_stream_index;
  78. int audio_stream_index;
  79. int audio_chunk_size1;
  80. int audio_chunk_size2;
  81. int block_align;
  82. /* demux state variables */
  83. int current_audio_chunk;
  84. int next_chunk_is_video;
  85. int audio_present;
  86. int64_t first_pkt_pos;
  87. } IdcinDemuxContext;
  88. static int idcin_probe(AVProbeData *p)
  89. {
  90. unsigned int number, sample_rate;
  91. unsigned int w, h;
  92. int i;
  93. /*
  94. * This is what you could call a "probabilistic" file check: id CIN
  95. * files don't have a definite file signature. In lieu of such a marker,
  96. * perform sanity checks on the 5 32-bit header fields:
  97. * width, height: greater than 0, less than or equal to 1024
  98. * audio sample rate: greater than or equal to 8000, less than or
  99. * equal to 48000, or 0 for no audio
  100. * audio sample width (bytes/sample): 0 for no audio, or 1 or 2
  101. * audio channels: 0 for no audio, or 1 or 2
  102. */
  103. /* check we have enough data to do all checks, otherwise the
  104. 0-padding may cause a wrong recognition */
  105. if (p->buf_size < 20 + HUFFMAN_TABLE_SIZE + 12)
  106. return 0;
  107. /* check the video width */
  108. w = AV_RL32(&p->buf[0]);
  109. if ((w == 0) || (w > 1024))
  110. return 0;
  111. /* check the video height */
  112. h = AV_RL32(&p->buf[4]);
  113. if ((h == 0) || (h > 1024))
  114. return 0;
  115. /* check the audio sample rate */
  116. sample_rate = AV_RL32(&p->buf[8]);
  117. if (sample_rate && (sample_rate < 8000 || sample_rate > 48000))
  118. return 0;
  119. /* check the audio bytes/sample */
  120. number = AV_RL32(&p->buf[12]);
  121. if (number > 2 || sample_rate && !number)
  122. return 0;
  123. /* check the audio channels */
  124. number = AV_RL32(&p->buf[16]);
  125. if (number > 2 || sample_rate && !number)
  126. return 0;
  127. i = 20 + HUFFMAN_TABLE_SIZE;
  128. if (AV_RL32(&p->buf[i]) == 1)
  129. i += 768;
  130. if (i+12 > p->buf_size || AV_RL32(&p->buf[i+8]) != w*h)
  131. return 1;
  132. /* return half certainty since this check is a bit sketchy */
  133. return AVPROBE_SCORE_EXTENSION;
  134. }
  135. static int idcin_read_header(AVFormatContext *s)
  136. {
  137. AVIOContext *pb = s->pb;
  138. IdcinDemuxContext *idcin = s->priv_data;
  139. AVStream *st;
  140. unsigned int width, height;
  141. unsigned int sample_rate, bytes_per_sample, channels;
  142. int ret;
  143. /* get the 5 header parameters */
  144. width = avio_rl32(pb);
  145. height = avio_rl32(pb);
  146. sample_rate = avio_rl32(pb);
  147. bytes_per_sample = avio_rl32(pb);
  148. channels = avio_rl32(pb);
  149. if (s->pb->eof_reached) {
  150. av_log(s, AV_LOG_ERROR, "incomplete header\n");
  151. return s->pb->error ? s->pb->error : AVERROR_EOF;
  152. }
  153. if (av_image_check_size(width, height, 0, s) < 0)
  154. return AVERROR_INVALIDDATA;
  155. if (sample_rate > 0) {
  156. if (sample_rate < 14 || sample_rate > INT_MAX) {
  157. av_log(s, AV_LOG_ERROR, "invalid sample rate: %u\n", sample_rate);
  158. return AVERROR_INVALIDDATA;
  159. }
  160. if (bytes_per_sample < 1 || bytes_per_sample > 2) {
  161. av_log(s, AV_LOG_ERROR, "invalid bytes per sample: %u\n",
  162. bytes_per_sample);
  163. return AVERROR_INVALIDDATA;
  164. }
  165. if (channels < 1 || channels > 2) {
  166. av_log(s, AV_LOG_ERROR, "invalid channels: %u\n", channels);
  167. return AVERROR_INVALIDDATA;
  168. }
  169. idcin->audio_present = 1;
  170. } else {
  171. /* if sample rate is 0, assume no audio */
  172. idcin->audio_present = 0;
  173. }
  174. st = avformat_new_stream(s, NULL);
  175. if (!st)
  176. return AVERROR(ENOMEM);
  177. avpriv_set_pts_info(st, 33, 1, IDCIN_FPS);
  178. st->start_time = 0;
  179. idcin->video_stream_index = st->index;
  180. st->codec->codec_type = AVMEDIA_TYPE_VIDEO;
  181. st->codec->codec_id = AV_CODEC_ID_IDCIN;
  182. st->codec->codec_tag = 0; /* no fourcc */
  183. st->codec->width = width;
  184. st->codec->height = height;
  185. /* load up the Huffman tables into extradata */
  186. if (ff_alloc_extradata(st->codec, HUFFMAN_TABLE_SIZE))
  187. return AVERROR(ENOMEM);
  188. ret = avio_read(pb, st->codec->extradata, HUFFMAN_TABLE_SIZE);
  189. if (ret < 0) {
  190. return ret;
  191. } else if (ret != HUFFMAN_TABLE_SIZE) {
  192. av_log(s, AV_LOG_ERROR, "incomplete header\n");
  193. return AVERROR(EIO);
  194. }
  195. if (idcin->audio_present) {
  196. idcin->audio_present = 1;
  197. st = avformat_new_stream(s, NULL);
  198. if (!st)
  199. return AVERROR(ENOMEM);
  200. avpriv_set_pts_info(st, 63, 1, sample_rate);
  201. st->start_time = 0;
  202. idcin->audio_stream_index = st->index;
  203. st->codec->codec_type = AVMEDIA_TYPE_AUDIO;
  204. st->codec->codec_tag = 1;
  205. st->codec->channels = channels;
  206. st->codec->channel_layout = channels > 1 ? AV_CH_LAYOUT_STEREO :
  207. AV_CH_LAYOUT_MONO;
  208. st->codec->sample_rate = sample_rate;
  209. st->codec->bits_per_coded_sample = bytes_per_sample * 8;
  210. st->codec->bit_rate = sample_rate * bytes_per_sample * 8 * channels;
  211. st->codec->block_align = idcin->block_align = bytes_per_sample * channels;
  212. if (bytes_per_sample == 1)
  213. st->codec->codec_id = AV_CODEC_ID_PCM_U8;
  214. else
  215. st->codec->codec_id = AV_CODEC_ID_PCM_S16LE;
  216. if (sample_rate % 14 != 0) {
  217. idcin->audio_chunk_size1 = (sample_rate / 14) *
  218. bytes_per_sample * channels;
  219. idcin->audio_chunk_size2 = (sample_rate / 14 + 1) *
  220. bytes_per_sample * channels;
  221. } else {
  222. idcin->audio_chunk_size1 = idcin->audio_chunk_size2 =
  223. (sample_rate / 14) * bytes_per_sample * channels;
  224. }
  225. idcin->current_audio_chunk = 0;
  226. }
  227. idcin->next_chunk_is_video = 1;
  228. idcin->first_pkt_pos = avio_tell(s->pb);
  229. return 0;
  230. }
  231. static int idcin_read_packet(AVFormatContext *s,
  232. AVPacket *pkt)
  233. {
  234. int ret;
  235. unsigned int command;
  236. unsigned int chunk_size;
  237. IdcinDemuxContext *idcin = s->priv_data;
  238. AVIOContext *pb = s->pb;
  239. int i;
  240. int palette_scale;
  241. unsigned char r, g, b;
  242. unsigned char palette_buffer[768];
  243. uint32_t palette[256];
  244. if (url_feof(s->pb))
  245. return s->pb->error ? s->pb->error : AVERROR_EOF;
  246. if (idcin->next_chunk_is_video) {
  247. command = avio_rl32(pb);
  248. if (command == 2) {
  249. return AVERROR(EIO);
  250. } else if (command == 1) {
  251. /* trigger a palette change */
  252. ret = avio_read(pb, palette_buffer, 768);
  253. if (ret < 0) {
  254. return ret;
  255. } else if (ret != 768) {
  256. av_log(s, AV_LOG_ERROR, "incomplete packet\n");
  257. return AVERROR(EIO);
  258. }
  259. /* scale the palette as necessary */
  260. palette_scale = 2;
  261. for (i = 0; i < 768; i++)
  262. if (palette_buffer[i] > 63) {
  263. palette_scale = 0;
  264. break;
  265. }
  266. for (i = 0; i < 256; i++) {
  267. r = palette_buffer[i * 3 ] << palette_scale;
  268. g = palette_buffer[i * 3 + 1] << palette_scale;
  269. b = palette_buffer[i * 3 + 2] << palette_scale;
  270. palette[i] = (0xFFU << 24) | (r << 16) | (g << 8) | (b);
  271. if (palette_scale == 2)
  272. palette[i] |= palette[i] >> 6 & 0x30303;
  273. }
  274. }
  275. if (s->pb->eof_reached) {
  276. av_log(s, AV_LOG_ERROR, "incomplete packet\n");
  277. return s->pb->error ? s->pb->error : AVERROR_EOF;
  278. }
  279. chunk_size = avio_rl32(pb);
  280. if (chunk_size < 4 || chunk_size > INT_MAX - 4) {
  281. av_log(s, AV_LOG_ERROR, "invalid chunk size: %u\n", chunk_size);
  282. return AVERROR_INVALIDDATA;
  283. }
  284. /* skip the number of decoded bytes (always equal to width * height) */
  285. avio_skip(pb, 4);
  286. if (chunk_size < 4)
  287. return AVERROR_INVALIDDATA;
  288. chunk_size -= 4;
  289. ret= av_get_packet(pb, pkt, chunk_size);
  290. if (ret < 0)
  291. return ret;
  292. else if (ret != chunk_size) {
  293. av_log(s, AV_LOG_ERROR, "incomplete packet\n");
  294. av_free_packet(pkt);
  295. return AVERROR(EIO);
  296. }
  297. if (command == 1) {
  298. uint8_t *pal;
  299. pal = av_packet_new_side_data(pkt, AV_PKT_DATA_PALETTE,
  300. AVPALETTE_SIZE);
  301. if (!pal) {
  302. av_free_packet(pkt);
  303. return AVERROR(ENOMEM);
  304. }
  305. memcpy(pal, palette, AVPALETTE_SIZE);
  306. pkt->flags |= AV_PKT_FLAG_KEY;
  307. }
  308. pkt->stream_index = idcin->video_stream_index;
  309. pkt->duration = 1;
  310. } else {
  311. /* send out the audio chunk */
  312. if (idcin->current_audio_chunk)
  313. chunk_size = idcin->audio_chunk_size2;
  314. else
  315. chunk_size = idcin->audio_chunk_size1;
  316. ret= av_get_packet(pb, pkt, chunk_size);
  317. if (ret < 0)
  318. return ret;
  319. pkt->stream_index = idcin->audio_stream_index;
  320. pkt->duration = chunk_size / idcin->block_align;
  321. idcin->current_audio_chunk ^= 1;
  322. }
  323. if (idcin->audio_present)
  324. idcin->next_chunk_is_video ^= 1;
  325. return 0;
  326. }
  327. static int idcin_read_seek(AVFormatContext *s, int stream_index,
  328. int64_t timestamp, int flags)
  329. {
  330. IdcinDemuxContext *idcin = s->priv_data;
  331. if (idcin->first_pkt_pos > 0) {
  332. int ret = avio_seek(s->pb, idcin->first_pkt_pos, SEEK_SET);
  333. if (ret < 0)
  334. return ret;
  335. ff_update_cur_dts(s, s->streams[idcin->video_stream_index], 0);
  336. idcin->next_chunk_is_video = 1;
  337. idcin->current_audio_chunk = 0;
  338. return 0;
  339. }
  340. return -1;
  341. }
  342. AVInputFormat ff_idcin_demuxer = {
  343. .name = "idcin",
  344. .long_name = NULL_IF_CONFIG_SMALL("id Cinematic"),
  345. .priv_data_size = sizeof(IdcinDemuxContext),
  346. .read_probe = idcin_probe,
  347. .read_header = idcin_read_header,
  348. .read_packet = idcin_read_packet,
  349. .read_seek = idcin_read_seek,
  350. .flags = AVFMT_NO_BYTE_SEEK,
  351. };