You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

361 lines
12KB

  1. /*
  2. * 4X Technologies .4xm File Demuxer (no muxer)
  3. * Copyright (c) 2003 The ffmpeg Project
  4. *
  5. * This file is part of FFmpeg.
  6. *
  7. * FFmpeg is free software; you can redistribute it and/or
  8. * modify it under the terms of the GNU Lesser General Public
  9. * License as published by the Free Software Foundation; either
  10. * version 2.1 of the License, or (at your option) any later version.
  11. *
  12. * FFmpeg is distributed in the hope that it will be useful,
  13. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  15. * Lesser General Public License for more details.
  16. *
  17. * You should have received a copy of the GNU Lesser General Public
  18. * License along with FFmpeg; if not, write to the Free Software
  19. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  20. */
  21. /**
  22. * @file
  23. * 4X Technologies file demuxer
  24. * by Mike Melanson (melanson@pcisys.net)
  25. * for more information on the .4xm file format, visit:
  26. * http://www.pcisys.net/~melanson/codecs/
  27. */
  28. #include "libavutil/intreadwrite.h"
  29. #include "libavutil/intfloat_readwrite.h"
  30. #include "avformat.h"
  31. #include "internal.h"
  32. #define RIFF_TAG MKTAG('R', 'I', 'F', 'F')
  33. #define FOURXMV_TAG MKTAG('4', 'X', 'M', 'V')
  34. #define LIST_TAG MKTAG('L', 'I', 'S', 'T')
  35. #define HEAD_TAG MKTAG('H', 'E', 'A', 'D')
  36. #define TRK__TAG MKTAG('T', 'R', 'K', '_')
  37. #define MOVI_TAG MKTAG('M', 'O', 'V', 'I')
  38. #define VTRK_TAG MKTAG('V', 'T', 'R', 'K')
  39. #define STRK_TAG MKTAG('S', 'T', 'R', 'K')
  40. #define std__TAG MKTAG('s', 't', 'd', '_')
  41. #define name_TAG MKTAG('n', 'a', 'm', 'e')
  42. #define vtrk_TAG MKTAG('v', 't', 'r', 'k')
  43. #define strk_TAG MKTAG('s', 't', 'r', 'k')
  44. #define ifrm_TAG MKTAG('i', 'f', 'r', 'm')
  45. #define pfrm_TAG MKTAG('p', 'f', 'r', 'm')
  46. #define cfrm_TAG MKTAG('c', 'f', 'r', 'm')
  47. #define ifr2_TAG MKTAG('i', 'f', 'r', '2')
  48. #define pfr2_TAG MKTAG('p', 'f', 'r', '2')
  49. #define cfr2_TAG MKTAG('c', 'f', 'r', '2')
  50. #define snd__TAG MKTAG('s', 'n', 'd', '_')
  51. #define vtrk_SIZE 0x44
  52. #define strk_SIZE 0x28
  53. #define GET_LIST_HEADER() \
  54. fourcc_tag = avio_rl32(pb); \
  55. size = avio_rl32(pb); \
  56. if (fourcc_tag != LIST_TAG) \
  57. return AVERROR_INVALIDDATA; \
  58. fourcc_tag = avio_rl32(pb);
  59. typedef struct AudioTrack {
  60. int sample_rate;
  61. int bits;
  62. int channels;
  63. int stream_index;
  64. int adpcm;
  65. int64_t audio_pts;
  66. } AudioTrack;
  67. typedef struct FourxmDemuxContext {
  68. int width;
  69. int height;
  70. int video_stream_index;
  71. int track_count;
  72. AudioTrack *tracks;
  73. int64_t video_pts;
  74. float fps;
  75. } FourxmDemuxContext;
  76. static int fourxm_probe(AVProbeData *p)
  77. {
  78. if ((AV_RL32(&p->buf[0]) != RIFF_TAG) ||
  79. (AV_RL32(&p->buf[8]) != FOURXMV_TAG))
  80. return 0;
  81. return AVPROBE_SCORE_MAX;
  82. }
  83. static int fourxm_read_header(AVFormatContext *s,
  84. AVFormatParameters *ap)
  85. {
  86. AVIOContext *pb = s->pb;
  87. unsigned int fourcc_tag;
  88. unsigned int size;
  89. int header_size;
  90. FourxmDemuxContext *fourxm = s->priv_data;
  91. unsigned char *header;
  92. int i, ret;
  93. AVStream *st;
  94. fourxm->track_count = 0;
  95. fourxm->tracks = NULL;
  96. fourxm->fps = 1.0;
  97. /* skip the first 3 32-bit numbers */
  98. avio_skip(pb, 12);
  99. /* check for LIST-HEAD */
  100. GET_LIST_HEADER();
  101. header_size = size - 4;
  102. if (fourcc_tag != HEAD_TAG || header_size < 0)
  103. return AVERROR_INVALIDDATA;
  104. /* allocate space for the header and load the whole thing */
  105. header = av_malloc(header_size);
  106. if (!header)
  107. return AVERROR(ENOMEM);
  108. if (avio_read(pb, header, header_size) != header_size){
  109. av_free(header);
  110. return AVERROR(EIO);
  111. }
  112. /* take the lazy approach and search for any and all vtrk and strk chunks */
  113. for (i = 0; i < header_size - 8; i++) {
  114. fourcc_tag = AV_RL32(&header[i]);
  115. size = AV_RL32(&header[i + 4]);
  116. if (fourcc_tag == std__TAG) {
  117. fourxm->fps = av_int2flt(AV_RL32(&header[i + 12]));
  118. } else if (fourcc_tag == vtrk_TAG) {
  119. /* check that there is enough data */
  120. if (size != vtrk_SIZE) {
  121. ret= AVERROR_INVALIDDATA;
  122. goto fail;
  123. }
  124. fourxm->width = AV_RL32(&header[i + 36]);
  125. fourxm->height = AV_RL32(&header[i + 40]);
  126. /* allocate a new AVStream */
  127. st = avformat_new_stream(s, NULL);
  128. if (!st){
  129. ret= AVERROR(ENOMEM);
  130. goto fail;
  131. }
  132. avpriv_set_pts_info(st, 60, 1, fourxm->fps);
  133. fourxm->video_stream_index = st->index;
  134. st->codec->codec_type = AVMEDIA_TYPE_VIDEO;
  135. st->codec->codec_id = CODEC_ID_4XM;
  136. st->codec->extradata_size = 4;
  137. st->codec->extradata = av_malloc(4);
  138. AV_WL32(st->codec->extradata, AV_RL32(&header[i + 16]));
  139. st->codec->width = fourxm->width;
  140. st->codec->height = fourxm->height;
  141. i += 8 + size;
  142. } else if (fourcc_tag == strk_TAG) {
  143. int current_track;
  144. /* check that there is enough data */
  145. if (size != strk_SIZE) {
  146. ret= AVERROR_INVALIDDATA;
  147. goto fail;
  148. }
  149. current_track = AV_RL32(&header[i + 8]);
  150. if((unsigned)current_track >= UINT_MAX / sizeof(AudioTrack) - 1){
  151. av_log(s, AV_LOG_ERROR, "current_track too large\n");
  152. ret= -1;
  153. goto fail;
  154. }
  155. if (current_track + 1 > fourxm->track_count) {
  156. fourxm->tracks = av_realloc_f(fourxm->tracks,
  157. sizeof(AudioTrack),
  158. current_track + 1);
  159. if (!fourxm->tracks) {
  160. ret = AVERROR(ENOMEM);
  161. goto fail;
  162. }
  163. memset(&fourxm->tracks[fourxm->track_count], 0,
  164. sizeof(AudioTrack) * (current_track + 1 - fourxm->track_count));
  165. fourxm->track_count = current_track + 1;
  166. }
  167. fourxm->tracks[current_track].adpcm = AV_RL32(&header[i + 12]);
  168. fourxm->tracks[current_track].channels = AV_RL32(&header[i + 36]);
  169. fourxm->tracks[current_track].sample_rate = AV_RL32(&header[i + 40]);
  170. fourxm->tracks[current_track].bits = AV_RL32(&header[i + 44]);
  171. fourxm->tracks[current_track].audio_pts = 0;
  172. if( fourxm->tracks[current_track].channels <= 0
  173. || fourxm->tracks[current_track].sample_rate <= 0
  174. || fourxm->tracks[current_track].bits < 0){
  175. av_log(s, AV_LOG_ERROR, "audio header invalid\n");
  176. ret= -1;
  177. goto fail;
  178. }
  179. i += 8 + size;
  180. /* allocate a new AVStream */
  181. st = avformat_new_stream(s, NULL);
  182. if (!st){
  183. ret= AVERROR(ENOMEM);
  184. goto fail;
  185. }
  186. st->id = current_track;
  187. avpriv_set_pts_info(st, 60, 1, fourxm->tracks[current_track].sample_rate);
  188. fourxm->tracks[current_track].stream_index = st->index;
  189. st->codec->codec_type = AVMEDIA_TYPE_AUDIO;
  190. st->codec->codec_tag = 0;
  191. st->codec->channels = fourxm->tracks[current_track].channels;
  192. st->codec->sample_rate = fourxm->tracks[current_track].sample_rate;
  193. st->codec->bits_per_coded_sample = fourxm->tracks[current_track].bits;
  194. st->codec->bit_rate = st->codec->channels * st->codec->sample_rate *
  195. st->codec->bits_per_coded_sample;
  196. st->codec->block_align = st->codec->channels * st->codec->bits_per_coded_sample;
  197. if (fourxm->tracks[current_track].adpcm){
  198. st->codec->codec_id = CODEC_ID_ADPCM_4XM;
  199. }else if (st->codec->bits_per_coded_sample == 8){
  200. st->codec->codec_id = CODEC_ID_PCM_U8;
  201. }else
  202. st->codec->codec_id = CODEC_ID_PCM_S16LE;
  203. }
  204. }
  205. /* skip over the LIST-MOVI chunk (which is where the stream should be */
  206. GET_LIST_HEADER();
  207. if (fourcc_tag != MOVI_TAG){
  208. ret= AVERROR_INVALIDDATA;
  209. goto fail;
  210. }
  211. av_free(header);
  212. /* initialize context members */
  213. fourxm->video_pts = -1; /* first frame will push to 0 */
  214. return 0;
  215. fail:
  216. av_freep(&fourxm->tracks);
  217. av_free(header);
  218. return ret;
  219. }
  220. static int fourxm_read_packet(AVFormatContext *s,
  221. AVPacket *pkt)
  222. {
  223. FourxmDemuxContext *fourxm = s->priv_data;
  224. AVIOContext *pb = s->pb;
  225. unsigned int fourcc_tag;
  226. unsigned int size;
  227. int ret = 0;
  228. unsigned int track_number;
  229. int packet_read = 0;
  230. unsigned char header[8];
  231. int audio_frame_count;
  232. while (!packet_read) {
  233. if ((ret = avio_read(s->pb, header, 8)) < 0)
  234. return ret;
  235. fourcc_tag = AV_RL32(&header[0]);
  236. size = AV_RL32(&header[4]);
  237. if (url_feof(pb))
  238. return AVERROR(EIO);
  239. switch (fourcc_tag) {
  240. case LIST_TAG:
  241. /* this is a good time to bump the video pts */
  242. fourxm->video_pts ++;
  243. /* skip the LIST-* tag and move on to the next fourcc */
  244. avio_rl32(pb);
  245. break;
  246. case ifrm_TAG:
  247. case pfrm_TAG:
  248. case cfrm_TAG:
  249. case ifr2_TAG:
  250. case pfr2_TAG:
  251. case cfr2_TAG:
  252. /* allocate 8 more bytes than 'size' to account for fourcc
  253. * and size */
  254. if (size + 8 < size || av_new_packet(pkt, size + 8))
  255. return AVERROR(EIO);
  256. pkt->stream_index = fourxm->video_stream_index;
  257. pkt->pts = fourxm->video_pts;
  258. pkt->pos = avio_tell(s->pb);
  259. memcpy(pkt->data, header, 8);
  260. ret = avio_read(s->pb, &pkt->data[8], size);
  261. if (ret < 0){
  262. av_free_packet(pkt);
  263. }else
  264. packet_read = 1;
  265. break;
  266. case snd__TAG:
  267. track_number = avio_rl32(pb);
  268. avio_skip(pb, 4);
  269. size-=8;
  270. if (track_number < fourxm->track_count && fourxm->tracks[track_number].channels>0) {
  271. ret= av_get_packet(s->pb, pkt, size);
  272. if(ret<0)
  273. return AVERROR(EIO);
  274. pkt->stream_index =
  275. fourxm->tracks[track_number].stream_index;
  276. pkt->pts = fourxm->tracks[track_number].audio_pts;
  277. packet_read = 1;
  278. /* pts accounting */
  279. audio_frame_count = size;
  280. if (fourxm->tracks[track_number].adpcm)
  281. audio_frame_count -=
  282. 2 * (fourxm->tracks[track_number].channels);
  283. audio_frame_count /=
  284. fourxm->tracks[track_number].channels;
  285. if (fourxm->tracks[track_number].adpcm){
  286. audio_frame_count *= 2;
  287. }else
  288. audio_frame_count /=
  289. (fourxm->tracks[track_number].bits / 8);
  290. fourxm->tracks[track_number].audio_pts += audio_frame_count;
  291. } else {
  292. avio_skip(pb, size);
  293. }
  294. break;
  295. default:
  296. avio_skip(pb, size);
  297. break;
  298. }
  299. }
  300. return ret;
  301. }
  302. static int fourxm_read_close(AVFormatContext *s)
  303. {
  304. FourxmDemuxContext *fourxm = s->priv_data;
  305. av_freep(&fourxm->tracks);
  306. return 0;
  307. }
  308. AVInputFormat ff_fourxm_demuxer = {
  309. .name = "4xm",
  310. .long_name = NULL_IF_CONFIG_SMALL("4X Technologies format"),
  311. .priv_data_size = sizeof(FourxmDemuxContext),
  312. .read_probe = fourxm_probe,
  313. .read_header = fourxm_read_header,
  314. .read_packet = fourxm_read_packet,
  315. .read_close = fourxm_read_close,
  316. };