You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

1002 lines
33KB

  1. /*
  2. * "Real" compatible demuxer.
  3. * Copyright (c) 2000, 2001 Fabrice Bellard
  4. *
  5. * This file is part of FFmpeg.
  6. *
  7. * FFmpeg is free software; you can redistribute it and/or
  8. * modify it under the terms of the GNU Lesser General Public
  9. * License as published by the Free Software Foundation; either
  10. * version 2.1 of the License, or (at your option) any later version.
  11. *
  12. * FFmpeg is distributed in the hope that it will be useful,
  13. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  15. * Lesser General Public License for more details.
  16. *
  17. * You should have received a copy of the GNU Lesser General Public
  18. * License along with FFmpeg; if not, write to the Free Software
  19. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  20. */
  21. #include "libavutil/avassert.h"
  22. #include "libavutil/avstring.h"
  23. #include "libavutil/channel_layout.h"
  24. #include "libavutil/intreadwrite.h"
  25. #include "libavutil/dict.h"
  26. #include "avformat.h"
  27. #include "internal.h"
  28. #include "riff.h"
  29. #include "rmsipr.h"
  30. #include "rm.h"
  /* Audio deinterleaver identifiers (fourcc tags) kept in RMStream.deint_id. */
  #define DEINT_ID_GENR  MKTAG('g', 'e', 'n', 'r')  ///< interleaving for Cooker/Atrac
  #define DEINT_ID_INT0  MKTAG('I', 'n', 't', '0')  ///< no interleaving needed
  #define DEINT_ID_INT4  MKTAG('I', 'n', 't', '4')  ///< interleaving for 28.8
  #define DEINT_ID_SIPR  MKTAG('s', 'i', 'p', 'r')  ///< interleaving for Sipro
  #define DEINT_ID_VBRF  MKTAG('v', 'b', 'r', 'f')  ///< VBR case for AAC
  #define DEINT_ID_VBRS  MKTAG('v', 'b', 'r', 's')  ///< VBR case for AAC
  37. struct RMStream {
  38. AVPacket pkt; ///< place to store merged video frame / reordered audio data
  39. int videobufsize; ///< current assembled frame size
  40. int videobufpos; ///< position for the next slice in the video buffer
  41. int curpic_num; ///< picture number of current frame
  42. int cur_slice, slices;
  43. int64_t pktpos; ///< first slice position in file
  44. /// Audio descrambling matrix parameters
  45. int64_t audiotimestamp; ///< Audio packet timestamp
  46. int sub_packet_cnt; // Subpacket counter, used while reading
  47. int sub_packet_size, sub_packet_h, coded_framesize; ///< Descrambling parameters from container
  48. int audio_framesize; /// Audio frame size from container
  49. int sub_packet_lengths[16]; /// Length of each subpacket
  50. int32_t deint_id; ///< deinterleaver used in audio stream
  51. };
  /** Demuxer-wide state shared by all streams of one RealMedia file. */
  typedef struct {
      int nb_packets;         ///< packet count read from the DATA chunk header
      int old_format;         ///< set to 1 for the very old ".ra" file layout
      int current_stream;     ///< stream id that the bytes in remaining_len belong to
      int remaining_len;      ///< bytes of the current container packet not yet consumed
      int audio_stream_num;   ///< Stream number for audio packets
      int audio_pkt_cnt;      ///< Output packet counter
  } RMDemuxContext;
  60. static inline void get_strl(AVIOContext *pb, char *buf, int buf_size, int len)
  61. {
  62. int i;
  63. char *q, r;
  64. q = buf;
  65. for(i=0;i<len;i++) {
  66. r = avio_r8(pb);
  67. if (i < buf_size - 1)
  68. *q++ = r;
  69. }
  70. if (buf_size > 0) *q = '\0';
  71. }
  72. static void get_str8(AVIOContext *pb, char *buf, int buf_size)
  73. {
  74. get_strl(pb, buf, buf_size, avio_r8(pb));
  75. }
  76. static int rm_read_extradata(AVIOContext *pb, AVCodecContext *avctx, unsigned size)
  77. {
  78. if (size >= 1<<24)
  79. return -1;
  80. avctx->extradata = av_malloc(size + FF_INPUT_BUFFER_PADDING_SIZE);
  81. if (!avctx->extradata)
  82. return AVERROR(ENOMEM);
  83. avctx->extradata_size = avio_read(pb, avctx->extradata, size);
  84. memset(avctx->extradata + avctx->extradata_size, 0, FF_INPUT_BUFFER_PADDING_SIZE);
  85. if (avctx->extradata_size != size)
  86. return AVERROR(EIO);
  87. return 0;
  88. }
  89. static void rm_read_metadata(AVFormatContext *s, int wide)
  90. {
  91. char buf[1024];
  92. int i;
  93. for (i=0; i<FF_ARRAY_ELEMS(ff_rm_metadata); i++) {
  94. int len = wide ? avio_rb16(s->pb) : avio_r8(s->pb);
  95. get_strl(s->pb, buf, sizeof(buf), len);
  96. av_dict_set(&s->metadata, ff_rm_metadata[i], buf, 0);
  97. }
  98. }
  99. RMStream *ff_rm_alloc_rmstream (void)
  100. {
  101. RMStream *rms = av_mallocz(sizeof(RMStream));
  102. rms->curpic_num = -1;
  103. return rms;
  104. }
  105. void ff_rm_free_rmstream (RMStream *rms)
  106. {
  107. av_free_packet(&rms->pkt);
  108. }
  109. static int rm_read_audio_stream_info(AVFormatContext *s, AVIOContext *pb,
  110. AVStream *st, RMStream *ast, int read_all)
  111. {
  112. char buf[256];
  113. uint32_t version;
  114. int ret;
  115. /* ra type header */
  116. version = avio_rb16(pb); /* version */
  117. if (version == 3) {
  118. int header_size = avio_rb16(pb);
  119. int64_t startpos = avio_tell(pb);
  120. avio_skip(pb, 14);
  121. rm_read_metadata(s, 0);
  122. if ((startpos + header_size) >= avio_tell(pb) + 2) {
  123. // fourcc (should always be "lpcJ")
  124. avio_r8(pb);
  125. get_str8(pb, buf, sizeof(buf));
  126. }
  127. // Skip extra header crap (this should never happen)
  128. if ((startpos + header_size) > avio_tell(pb))
  129. avio_skip(pb, header_size + startpos - avio_tell(pb));
  130. st->codec->sample_rate = 8000;
  131. st->codec->channels = 1;
  132. st->codec->channel_layout = AV_CH_LAYOUT_MONO;
  133. st->codec->codec_type = AVMEDIA_TYPE_AUDIO;
  134. st->codec->codec_id = AV_CODEC_ID_RA_144;
  135. ast->deint_id = DEINT_ID_INT0;
  136. } else {
  137. int flavor, sub_packet_h, coded_framesize, sub_packet_size;
  138. int codecdata_length;
  139. /* old version (4) */
  140. avio_skip(pb, 2); /* unused */
  141. avio_rb32(pb); /* .ra4 */
  142. avio_rb32(pb); /* data size */
  143. avio_rb16(pb); /* version2 */
  144. avio_rb32(pb); /* header size */
  145. flavor= avio_rb16(pb); /* add codec info / flavor */
  146. ast->coded_framesize = coded_framesize = avio_rb32(pb); /* coded frame size */
  147. avio_rb32(pb); /* ??? */
  148. avio_rb32(pb); /* ??? */
  149. avio_rb32(pb); /* ??? */
  150. ast->sub_packet_h = sub_packet_h = avio_rb16(pb); /* 1 */
  151. st->codec->block_align= avio_rb16(pb); /* frame size */
  152. ast->sub_packet_size = sub_packet_size = avio_rb16(pb); /* sub packet size */
  153. avio_rb16(pb); /* ??? */
  154. if (version == 5) {
  155. avio_rb16(pb); avio_rb16(pb); avio_rb16(pb);
  156. }
  157. st->codec->sample_rate = avio_rb16(pb);
  158. avio_rb32(pb);
  159. st->codec->channels = avio_rb16(pb);
  160. if (version == 5) {
  161. ast->deint_id = avio_rl32(pb);
  162. avio_read(pb, buf, 4);
  163. buf[4] = 0;
  164. } else {
  165. get_str8(pb, buf, sizeof(buf)); /* desc */
  166. ast->deint_id = AV_RL32(buf);
  167. get_str8(pb, buf, sizeof(buf)); /* desc */
  168. }
  169. st->codec->codec_type = AVMEDIA_TYPE_AUDIO;
  170. st->codec->codec_tag = AV_RL32(buf);
  171. st->codec->codec_id = ff_codec_get_id(ff_rm_codec_tags,
  172. st->codec->codec_tag);
  173. switch (st->codec->codec_id) {
  174. case AV_CODEC_ID_AC3:
  175. st->need_parsing = AVSTREAM_PARSE_FULL;
  176. break;
  177. case AV_CODEC_ID_RA_288:
  178. st->codec->extradata_size= 0;
  179. ast->audio_framesize = st->codec->block_align;
  180. st->codec->block_align = coded_framesize;
  181. break;
  182. case AV_CODEC_ID_COOK:
  183. st->need_parsing = AVSTREAM_PARSE_HEADERS;
  184. case AV_CODEC_ID_ATRAC3:
  185. case AV_CODEC_ID_SIPR:
  186. avio_rb16(pb); avio_r8(pb);
  187. if (version == 5)
  188. avio_r8(pb);
  189. codecdata_length = avio_rb32(pb);
  190. if(codecdata_length + FF_INPUT_BUFFER_PADDING_SIZE <= (unsigned)codecdata_length){
  191. av_log(s, AV_LOG_ERROR, "codecdata_length too large\n");
  192. return -1;
  193. }
  194. ast->audio_framesize = st->codec->block_align;
  195. if (st->codec->codec_id == AV_CODEC_ID_SIPR) {
  196. if (flavor > 3) {
  197. av_log(s, AV_LOG_ERROR, "bad SIPR file flavor %d\n",
  198. flavor);
  199. return -1;
  200. }
  201. st->codec->block_align = ff_sipr_subpk_size[flavor];
  202. } else {
  203. if(sub_packet_size <= 0){
  204. av_log(s, AV_LOG_ERROR, "sub_packet_size is invalid\n");
  205. return -1;
  206. }
  207. st->codec->block_align = ast->sub_packet_size;
  208. }
  209. if ((ret = rm_read_extradata(pb, st->codec, codecdata_length)) < 0)
  210. return ret;
  211. break;
  212. case AV_CODEC_ID_AAC:
  213. avio_rb16(pb); avio_r8(pb);
  214. if (version == 5)
  215. avio_r8(pb);
  216. codecdata_length = avio_rb32(pb);
  217. if(codecdata_length + FF_INPUT_BUFFER_PADDING_SIZE <= (unsigned)codecdata_length){
  218. av_log(s, AV_LOG_ERROR, "codecdata_length too large\n");
  219. return -1;
  220. }
  221. if (codecdata_length >= 1) {
  222. avio_r8(pb);
  223. if ((ret = rm_read_extradata(pb, st->codec, codecdata_length - 1)) < 0)
  224. return ret;
  225. }
  226. break;
  227. default:
  228. av_strlcpy(st->codec->codec_name, buf, sizeof(st->codec->codec_name));
  229. }
  230. if (ast->deint_id == DEINT_ID_INT4 ||
  231. ast->deint_id == DEINT_ID_GENR ||
  232. ast->deint_id == DEINT_ID_SIPR) {
  233. if (st->codec->block_align <= 0 ||
  234. ast->audio_framesize * sub_packet_h > (unsigned)INT_MAX ||
  235. ast->audio_framesize * sub_packet_h < st->codec->block_align)
  236. return AVERROR_INVALIDDATA;
  237. if (av_new_packet(&ast->pkt, ast->audio_framesize * sub_packet_h) < 0)
  238. return AVERROR(ENOMEM);
  239. }
  240. switch (ast->deint_id) {
  241. case DEINT_ID_INT4:
  242. if (ast->coded_framesize > ast->audio_framesize ||
  243. sub_packet_h <= 1 ||
  244. ast->coded_framesize * sub_packet_h > (2 + (sub_packet_h & 1)) * ast->audio_framesize)
  245. return AVERROR_INVALIDDATA;
  246. break;
  247. case DEINT_ID_GENR:
  248. if (ast->sub_packet_size <= 0 ||
  249. ast->sub_packet_size > ast->audio_framesize)
  250. return AVERROR_INVALIDDATA;
  251. break;
  252. case DEINT_ID_SIPR:
  253. case DEINT_ID_INT0:
  254. case DEINT_ID_VBRS:
  255. case DEINT_ID_VBRF:
  256. break;
  257. default:
  258. av_log(s, AV_LOG_ERROR, "Unknown interleaver %X\n", ast->deint_id);
  259. return AVERROR_INVALIDDATA;
  260. }
  261. if (read_all) {
  262. avio_r8(pb);
  263. avio_r8(pb);
  264. avio_r8(pb);
  265. rm_read_metadata(s, 0);
  266. }
  267. }
  268. return 0;
  269. }
  270. int
  271. ff_rm_read_mdpr_codecdata (AVFormatContext *s, AVIOContext *pb,
  272. AVStream *st, RMStream *rst, int codec_data_size, const uint8_t *mime)
  273. {
  274. unsigned int v;
  275. int size;
  276. int64_t codec_pos;
  277. int ret;
  278. avpriv_set_pts_info(st, 64, 1, 1000);
  279. codec_pos = avio_tell(pb);
  280. v = avio_rb32(pb);
  281. if (v == MKTAG(0xfd, 'a', 'r', '.')) {
  282. /* ra type header */
  283. if (rm_read_audio_stream_info(s, pb, st, rst, 0))
  284. return -1;
  285. } else if (v == MKBETAG('L', 'S', 'D', ':')) {
  286. avio_seek(pb, -4, SEEK_CUR);
  287. if ((ret = rm_read_extradata(pb, st->codec, codec_data_size)) < 0)
  288. return ret;
  289. st->codec->codec_type = AVMEDIA_TYPE_AUDIO;
  290. st->codec->codec_tag = AV_RL32(st->codec->extradata);
  291. st->codec->codec_id = ff_codec_get_id(ff_rm_codec_tags,
  292. st->codec->codec_tag);
  293. } else if(mime && !strcmp(mime, "logical-fileinfo")){
  294. int stream_count, rule_count, property_count, i;
  295. ff_free_stream(s, st);
  296. if (avio_rb16(pb) != 0) {
  297. av_log(s, AV_LOG_WARNING, "Unsupported version\n");
  298. goto skip;
  299. }
  300. stream_count = avio_rb16(pb);
  301. avio_skip(pb, 6*stream_count);
  302. rule_count = avio_rb16(pb);
  303. avio_skip(pb, 2*rule_count);
  304. property_count = avio_rb16(pb);
  305. for(i=0; i<property_count; i++){
  306. uint8_t name[128], val[128];
  307. avio_rb32(pb);
  308. if (avio_rb16(pb) != 0) {
  309. av_log(s, AV_LOG_WARNING, "Unsupported Name value property version\n");
  310. goto skip; //FIXME skip just this one
  311. }
  312. get_str8(pb, name, sizeof(name));
  313. switch(avio_rb32(pb)) {
  314. case 2: get_strl(pb, val, sizeof(val), avio_rb16(pb));
  315. av_dict_set(&s->metadata, name, val, 0);
  316. break;
  317. default: avio_skip(pb, avio_rb16(pb));
  318. }
  319. }
  320. } else {
  321. int fps;
  322. if (avio_rl32(pb) != MKTAG('V', 'I', 'D', 'O')) {
  323. fail1:
  324. av_log(s, AV_LOG_WARNING, "Unsupported stream type %08x\n", v);
  325. goto skip;
  326. }
  327. st->codec->codec_tag = avio_rl32(pb);
  328. st->codec->codec_id = ff_codec_get_id(ff_rm_codec_tags,
  329. st->codec->codec_tag);
  330. av_dlog(s, "%X %X\n", st->codec->codec_tag, MKTAG('R', 'V', '2', '0'));
  331. if (st->codec->codec_id == AV_CODEC_ID_NONE)
  332. goto fail1;
  333. st->codec->width = avio_rb16(pb);
  334. st->codec->height = avio_rb16(pb);
  335. avio_skip(pb, 2); // looks like bits per sample
  336. avio_skip(pb, 4); // always zero?
  337. st->codec->codec_type = AVMEDIA_TYPE_VIDEO;
  338. st->need_parsing = AVSTREAM_PARSE_TIMESTAMPS;
  339. fps = avio_rb32(pb);
  340. if ((ret = rm_read_extradata(pb, st->codec, codec_data_size - (avio_tell(pb) - codec_pos))) < 0)
  341. return ret;
  342. av_reduce(&st->avg_frame_rate.den, &st->avg_frame_rate.num,
  343. 0x10000, fps, (1 << 30) - 1);
  344. #if FF_API_R_FRAME_RATE
  345. st->r_frame_rate = st->avg_frame_rate;
  346. #endif
  347. }
  348. skip:
  349. /* skip codec info */
  350. size = avio_tell(pb) - codec_pos;
  351. avio_skip(pb, codec_data_size - size);
  352. return 0;
  353. }
  354. /** this function assumes that the demuxer has already seeked to the start
  355. * of the INDX chunk, and will bail out if not. */
  356. static int rm_read_index(AVFormatContext *s)
  357. {
  358. AVIOContext *pb = s->pb;
  359. unsigned int size, n_pkts, str_id, next_off, n, pos, pts;
  360. AVStream *st;
  361. do {
  362. if (avio_rl32(pb) != MKTAG('I','N','D','X'))
  363. return -1;
  364. size = avio_rb32(pb);
  365. if (size < 20)
  366. return -1;
  367. avio_skip(pb, 2);
  368. n_pkts = avio_rb32(pb);
  369. str_id = avio_rb16(pb);
  370. next_off = avio_rb32(pb);
  371. for (n = 0; n < s->nb_streams; n++)
  372. if (s->streams[n]->id == str_id) {
  373. st = s->streams[n];
  374. break;
  375. }
  376. if (n == s->nb_streams) {
  377. av_log(s, AV_LOG_ERROR,
  378. "Invalid stream index %d for index at pos %"PRId64"\n",
  379. str_id, avio_tell(pb));
  380. goto skip;
  381. } else if ((avio_size(pb) - avio_tell(pb)) / 14 < n_pkts) {
  382. av_log(s, AV_LOG_ERROR,
  383. "Nr. of packets in packet index for stream index %d "
  384. "exceeds filesize (%"PRId64" at %"PRId64" = %"PRId64")\n",
  385. str_id, avio_size(pb), avio_tell(pb),
  386. (avio_size(pb) - avio_tell(pb)) / 14);
  387. goto skip;
  388. }
  389. for (n = 0; n < n_pkts; n++) {
  390. avio_skip(pb, 2);
  391. pts = avio_rb32(pb);
  392. pos = avio_rb32(pb);
  393. avio_skip(pb, 4); /* packet no. */
  394. av_add_index_entry(st, pos, pts, 0, 0, AVINDEX_KEYFRAME);
  395. }
  396. skip:
  397. if (next_off && avio_tell(pb) < next_off &&
  398. avio_seek(pb, next_off, SEEK_SET) < 0) {
  399. av_log(s, AV_LOG_ERROR,
  400. "Non-linear index detected, not supported\n");
  401. return -1;
  402. }
  403. } while (next_off);
  404. return 0;
  405. }
  406. static int rm_read_header_old(AVFormatContext *s)
  407. {
  408. RMDemuxContext *rm = s->priv_data;
  409. AVStream *st;
  410. rm->old_format = 1;
  411. st = avformat_new_stream(s, NULL);
  412. if (!st)
  413. return -1;
  414. st->priv_data = ff_rm_alloc_rmstream();
  415. return rm_read_audio_stream_info(s, s->pb, st, st->priv_data, 1);
  416. }
  417. static int rm_read_header(AVFormatContext *s)
  418. {
  419. RMDemuxContext *rm = s->priv_data;
  420. AVStream *st;
  421. AVIOContext *pb = s->pb;
  422. unsigned int tag;
  423. int tag_size;
  424. unsigned int start_time, duration;
  425. unsigned int data_off = 0, indx_off = 0;
  426. char buf[128], mime[128];
  427. int flags = 0;
  428. tag = avio_rl32(pb);
  429. if (tag == MKTAG('.', 'r', 'a', 0xfd)) {
  430. /* very old .ra format */
  431. return rm_read_header_old(s);
  432. } else if (tag != MKTAG('.', 'R', 'M', 'F')) {
  433. return AVERROR(EIO);
  434. }
  435. tag_size = avio_rb32(pb);
  436. avio_skip(pb, tag_size - 8);
  437. for(;;) {
  438. if (url_feof(pb))
  439. return -1;
  440. tag = avio_rl32(pb);
  441. tag_size = avio_rb32(pb);
  442. avio_rb16(pb);
  443. av_dlog(s, "tag=%c%c%c%c (%08x) size=%d\n",
  444. (tag ) & 0xff,
  445. (tag >> 8) & 0xff,
  446. (tag >> 16) & 0xff,
  447. (tag >> 24) & 0xff,
  448. tag,
  449. tag_size);
  450. if (tag_size < 10 && tag != MKTAG('D', 'A', 'T', 'A'))
  451. return -1;
  452. switch(tag) {
  453. case MKTAG('P', 'R', 'O', 'P'):
  454. /* file header */
  455. avio_rb32(pb); /* max bit rate */
  456. avio_rb32(pb); /* avg bit rate */
  457. avio_rb32(pb); /* max packet size */
  458. avio_rb32(pb); /* avg packet size */
  459. avio_rb32(pb); /* nb packets */
  460. duration = avio_rb32(pb); /* duration */
  461. s->duration = av_rescale(duration, AV_TIME_BASE, 1000);
  462. avio_rb32(pb); /* preroll */
  463. indx_off = avio_rb32(pb); /* index offset */
  464. data_off = avio_rb32(pb); /* data offset */
  465. avio_rb16(pb); /* nb streams */
  466. flags = avio_rb16(pb); /* flags */
  467. break;
  468. case MKTAG('C', 'O', 'N', 'T'):
  469. rm_read_metadata(s, 1);
  470. break;
  471. case MKTAG('M', 'D', 'P', 'R'):
  472. st = avformat_new_stream(s, NULL);
  473. if (!st)
  474. return AVERROR(ENOMEM);
  475. st->id = avio_rb16(pb);
  476. avio_rb32(pb); /* max bit rate */
  477. st->codec->bit_rate = avio_rb32(pb); /* bit rate */
  478. avio_rb32(pb); /* max packet size */
  479. avio_rb32(pb); /* avg packet size */
  480. start_time = avio_rb32(pb); /* start time */
  481. avio_rb32(pb); /* preroll */
  482. duration = avio_rb32(pb); /* duration */
  483. st->start_time = start_time;
  484. st->duration = duration;
  485. if(duration>0)
  486. s->duration = AV_NOPTS_VALUE;
  487. get_str8(pb, buf, sizeof(buf)); /* desc */
  488. get_str8(pb, mime, sizeof(mime)); /* mimetype */
  489. st->codec->codec_type = AVMEDIA_TYPE_DATA;
  490. st->priv_data = ff_rm_alloc_rmstream();
  491. if (ff_rm_read_mdpr_codecdata(s, s->pb, st, st->priv_data,
  492. avio_rb32(pb), mime) < 0)
  493. return -1;
  494. break;
  495. case MKTAG('D', 'A', 'T', 'A'):
  496. goto header_end;
  497. default:
  498. /* unknown tag: skip it */
  499. avio_skip(pb, tag_size - 10);
  500. break;
  501. }
  502. }
  503. header_end:
  504. rm->nb_packets = avio_rb32(pb); /* number of packets */
  505. if (!rm->nb_packets && (flags & 4))
  506. rm->nb_packets = 3600 * 25;
  507. avio_rb32(pb); /* next data header */
  508. if (!data_off)
  509. data_off = avio_tell(pb) - 18;
  510. if (indx_off && pb->seekable && !(s->flags & AVFMT_FLAG_IGNIDX) &&
  511. avio_seek(pb, indx_off, SEEK_SET) >= 0) {
  512. rm_read_index(s);
  513. avio_seek(pb, data_off + 18, SEEK_SET);
  514. }
  515. return 0;
  516. }
  517. static int get_num(AVIOContext *pb, int *len)
  518. {
  519. int n, n1;
  520. n = avio_rb16(pb);
  521. (*len)-=2;
  522. n &= 0x7FFF;
  523. if (n >= 0x4000) {
  524. return n - 0x4000;
  525. } else {
  526. n1 = avio_rb16(pb);
  527. (*len)-=2;
  528. return (n << 16) | n1;
  529. }
  530. }
  /* Packet size read for old-format streams that carry no audio frame size;
   * a multiple of 20 bytes for ra144 (ugly). */
  #define RAW_PACKET_SIZE 1000
  533. static int sync(AVFormatContext *s, int64_t *timestamp, int *flags, int *stream_index, int64_t *pos){
  534. RMDemuxContext *rm = s->priv_data;
  535. AVIOContext *pb = s->pb;
  536. AVStream *st;
  537. uint32_t state=0xFFFFFFFF;
  538. while(!url_feof(pb)){
  539. int len, num, i;
  540. *pos= avio_tell(pb) - 3;
  541. if(rm->remaining_len > 0){
  542. num= rm->current_stream;
  543. len= rm->remaining_len;
  544. *timestamp = AV_NOPTS_VALUE;
  545. *flags= 0;
  546. }else{
  547. state= (state<<8) + avio_r8(pb);
  548. if(state == MKBETAG('I', 'N', 'D', 'X')){
  549. int n_pkts, expected_len;
  550. len = avio_rb32(pb);
  551. avio_skip(pb, 2);
  552. n_pkts = avio_rb32(pb);
  553. expected_len = 20 + n_pkts * 14;
  554. if (len == 20)
  555. /* some files don't add index entries to chunk size... */
  556. len = expected_len;
  557. else if (len != expected_len)
  558. av_log(s, AV_LOG_WARNING,
  559. "Index size %d (%d pkts) is wrong, should be %d.\n",
  560. len, n_pkts, expected_len);
  561. len -= 14; // we already read part of the index header
  562. if(len<0)
  563. continue;
  564. goto skip;
  565. } else if (state == MKBETAG('D','A','T','A')) {
  566. av_log(s, AV_LOG_WARNING,
  567. "DATA tag in middle of chunk, file may be broken.\n");
  568. }
  569. if(state > (unsigned)0xFFFF || state <= 12)
  570. continue;
  571. len=state - 12;
  572. state= 0xFFFFFFFF;
  573. num = avio_rb16(pb);
  574. *timestamp = avio_rb32(pb);
  575. avio_r8(pb); /* reserved */
  576. *flags = avio_r8(pb); /* flags */
  577. }
  578. for(i=0;i<s->nb_streams;i++) {
  579. st = s->streams[i];
  580. if (num == st->id)
  581. break;
  582. }
  583. if (i == s->nb_streams) {
  584. skip:
  585. /* skip packet if unknown number */
  586. avio_skip(pb, len);
  587. rm->remaining_len = 0;
  588. continue;
  589. }
  590. *stream_index= i;
  591. return len;
  592. }
  593. return -1;
  594. }
  595. static int rm_assemble_video_frame(AVFormatContext *s, AVIOContext *pb,
  596. RMDemuxContext *rm, RMStream *vst,
  597. AVPacket *pkt, int len, int *pseq,
  598. int64_t *timestamp)
  599. {
  600. int hdr, seq, pic_num, len2, pos;
  601. int type;
  602. hdr = avio_r8(pb); len--;
  603. type = hdr >> 6;
  604. if(type != 3){ // not frame as a part of packet
  605. seq = avio_r8(pb); len--;
  606. }
  607. if(type != 1){ // not whole frame
  608. len2 = get_num(pb, &len);
  609. pos = get_num(pb, &len);
  610. pic_num = avio_r8(pb); len--;
  611. }
  612. if(len<0)
  613. return -1;
  614. rm->remaining_len = len;
  615. if(type&1){ // frame, not slice
  616. if(type == 3){ // frame as a part of packet
  617. len= len2;
  618. *timestamp = pos;
  619. }
  620. if(rm->remaining_len < len)
  621. return -1;
  622. rm->remaining_len -= len;
  623. if(av_new_packet(pkt, len + 9) < 0)
  624. return AVERROR(EIO);
  625. pkt->data[0] = 0;
  626. AV_WL32(pkt->data + 1, 1);
  627. AV_WL32(pkt->data + 5, 0);
  628. avio_read(pb, pkt->data + 9, len);
  629. return 0;
  630. }
  631. //now we have to deal with single slice
  632. *pseq = seq;
  633. if((seq & 0x7F) == 1 || vst->curpic_num != pic_num){
  634. vst->slices = ((hdr & 0x3F) << 1) + 1;
  635. vst->videobufsize = len2 + 8*vst->slices + 1;
  636. av_free_packet(&vst->pkt); //FIXME this should be output.
  637. if(av_new_packet(&vst->pkt, vst->videobufsize) < 0)
  638. return AVERROR(ENOMEM);
  639. vst->videobufpos = 8*vst->slices + 1;
  640. vst->cur_slice = 0;
  641. vst->curpic_num = pic_num;
  642. vst->pktpos = avio_tell(pb);
  643. }
  644. if(type == 2)
  645. len = FFMIN(len, pos);
  646. if(++vst->cur_slice > vst->slices)
  647. return 1;
  648. AV_WL32(vst->pkt.data - 7 + 8*vst->cur_slice, 1);
  649. AV_WL32(vst->pkt.data - 3 + 8*vst->cur_slice, vst->videobufpos - 8*vst->slices - 1);
  650. if(vst->videobufpos + len > vst->videobufsize)
  651. return 1;
  652. if (avio_read(pb, vst->pkt.data + vst->videobufpos, len) != len)
  653. return AVERROR(EIO);
  654. vst->videobufpos += len;
  655. rm->remaining_len-= len;
  656. if (type == 2 || vst->videobufpos == vst->videobufsize) {
  657. vst->pkt.data[0] = vst->cur_slice-1;
  658. *pkt= vst->pkt;
  659. vst->pkt.data= NULL;
  660. vst->pkt.size= 0;
  661. if(vst->slices != vst->cur_slice) //FIXME find out how to set slices correct from the begin
  662. memmove(pkt->data + 1 + 8*vst->cur_slice, pkt->data + 1 + 8*vst->slices,
  663. vst->videobufpos - 1 - 8*vst->slices);
  664. pkt->size = vst->videobufpos + 8*(vst->cur_slice - vst->slices);
  665. pkt->pts = AV_NOPTS_VALUE;
  666. pkt->pos = vst->pktpos;
  667. vst->slices = 0;
  668. return 0;
  669. }
  670. return 1;
  671. }
  672. static inline void
  673. rm_ac3_swap_bytes (AVStream *st, AVPacket *pkt)
  674. {
  675. uint8_t *ptr;
  676. int j;
  677. if (st->codec->codec_id == AV_CODEC_ID_AC3) {
  678. ptr = pkt->data;
  679. for (j=0;j<pkt->size;j+=2) {
  680. FFSWAP(int, ptr[0], ptr[1]);
  681. ptr += 2;
  682. }
  683. }
  684. }
  685. int
  686. ff_rm_parse_packet (AVFormatContext *s, AVIOContext *pb,
  687. AVStream *st, RMStream *ast, int len, AVPacket *pkt,
  688. int *seq, int flags, int64_t timestamp)
  689. {
  690. RMDemuxContext *rm = s->priv_data;
  691. if (st->codec->codec_type == AVMEDIA_TYPE_VIDEO) {
  692. rm->current_stream= st->id;
  693. if(rm_assemble_video_frame(s, pb, rm, ast, pkt, len, seq, &timestamp))
  694. return -1; //got partial frame
  695. } else if (st->codec->codec_type == AVMEDIA_TYPE_AUDIO) {
  696. if ((ast->deint_id == DEINT_ID_GENR) ||
  697. (ast->deint_id == DEINT_ID_INT4) ||
  698. (ast->deint_id == DEINT_ID_SIPR)) {
  699. int x;
  700. int sps = ast->sub_packet_size;
  701. int cfs = ast->coded_framesize;
  702. int h = ast->sub_packet_h;
  703. int y = ast->sub_packet_cnt;
  704. int w = ast->audio_framesize;
  705. if (flags & 2)
  706. y = ast->sub_packet_cnt = 0;
  707. if (!y)
  708. ast->audiotimestamp = timestamp;
  709. switch (ast->deint_id) {
  710. case DEINT_ID_INT4:
  711. for (x = 0; x < h/2; x++)
  712. avio_read(pb, ast->pkt.data+x*2*w+y*cfs, cfs);
  713. break;
  714. case DEINT_ID_GENR:
  715. for (x = 0; x < w/sps; x++)
  716. avio_read(pb, ast->pkt.data+sps*(h*x+((h+1)/2)*(y&1)+(y>>1)), sps);
  717. break;
  718. case DEINT_ID_SIPR:
  719. avio_read(pb, ast->pkt.data + y * w, w);
  720. break;
  721. }
  722. if (++(ast->sub_packet_cnt) < h)
  723. return -1;
  724. if (ast->deint_id == DEINT_ID_SIPR)
  725. ff_rm_reorder_sipr_data(ast->pkt.data, h, w);
  726. ast->sub_packet_cnt = 0;
  727. rm->audio_stream_num = st->index;
  728. rm->audio_pkt_cnt = h * w / st->codec->block_align;
  729. } else if ((ast->deint_id == DEINT_ID_VBRF) ||
  730. (ast->deint_id == DEINT_ID_VBRS)) {
  731. int x;
  732. rm->audio_stream_num = st->index;
  733. ast->sub_packet_cnt = (avio_rb16(pb) & 0xf0) >> 4;
  734. if (ast->sub_packet_cnt) {
  735. for (x = 0; x < ast->sub_packet_cnt; x++)
  736. ast->sub_packet_lengths[x] = avio_rb16(pb);
  737. rm->audio_pkt_cnt = ast->sub_packet_cnt;
  738. ast->audiotimestamp = timestamp;
  739. } else
  740. return -1;
  741. } else {
  742. av_get_packet(pb, pkt, len);
  743. rm_ac3_swap_bytes(st, pkt);
  744. }
  745. } else
  746. av_get_packet(pb, pkt, len);
  747. pkt->stream_index = st->index;
  748. #if 0
  749. if (st->codec->codec_type == AVMEDIA_TYPE_VIDEO) {
  750. if(st->codec->codec_id == AV_CODEC_ID_RV20){
  751. int seq= 128*(pkt->data[2]&0x7F) + (pkt->data[3]>>1);
  752. av_log(s, AV_LOG_DEBUG, "%d %"PRId64" %d\n", *timestamp, *timestamp*512LL/25, seq);
  753. seq |= (timestamp&~0x3FFF);
  754. if(seq - timestamp > 0x2000) seq -= 0x4000;
  755. if(seq - timestamp < -0x2000) seq += 0x4000;
  756. }
  757. }
  758. #endif
  759. pkt->pts = timestamp;
  760. if (flags & 2)
  761. pkt->flags |= AV_PKT_FLAG_KEY;
  762. return st->codec->codec_type == AVMEDIA_TYPE_AUDIO ? rm->audio_pkt_cnt : 0;
  763. }
  764. int
  765. ff_rm_retrieve_cache (AVFormatContext *s, AVIOContext *pb,
  766. AVStream *st, RMStream *ast, AVPacket *pkt)
  767. {
  768. RMDemuxContext *rm = s->priv_data;
  769. av_assert0 (rm->audio_pkt_cnt > 0);
  770. if (ast->deint_id == DEINT_ID_VBRF ||
  771. ast->deint_id == DEINT_ID_VBRS)
  772. av_get_packet(pb, pkt, ast->sub_packet_lengths[ast->sub_packet_cnt - rm->audio_pkt_cnt]);
  773. else {
  774. if(av_new_packet(pkt, st->codec->block_align) < 0)
  775. return AVERROR(ENOMEM);
  776. memcpy(pkt->data, ast->pkt.data + st->codec->block_align * //FIXME avoid this
  777. (ast->sub_packet_h * ast->audio_framesize / st->codec->block_align - rm->audio_pkt_cnt),
  778. st->codec->block_align);
  779. }
  780. rm->audio_pkt_cnt--;
  781. if ((pkt->pts = ast->audiotimestamp) != AV_NOPTS_VALUE) {
  782. ast->audiotimestamp = AV_NOPTS_VALUE;
  783. pkt->flags = AV_PKT_FLAG_KEY;
  784. } else
  785. pkt->flags = 0;
  786. pkt->stream_index = st->index;
  787. return rm->audio_pkt_cnt;
  788. }
  789. static int rm_read_packet(AVFormatContext *s, AVPacket *pkt)
  790. {
  791. RMDemuxContext *rm = s->priv_data;
  792. AVStream *st;
  793. int i, len, res, seq = 1;
  794. int64_t timestamp, pos;
  795. int flags;
  796. for (;;) {
  797. if (rm->audio_pkt_cnt) {
  798. // If there are queued audio packet return them first
  799. st = s->streams[rm->audio_stream_num];
  800. res = ff_rm_retrieve_cache(s, s->pb, st, st->priv_data, pkt);
  801. if(res < 0)
  802. return res;
  803. flags = 0;
  804. } else {
  805. if (rm->old_format) {
  806. RMStream *ast;
  807. st = s->streams[0];
  808. ast = st->priv_data;
  809. timestamp = AV_NOPTS_VALUE;
  810. len = !ast->audio_framesize ? RAW_PACKET_SIZE :
  811. ast->coded_framesize * ast->sub_packet_h / 2;
  812. flags = (seq++ == 1) ? 2 : 0;
  813. pos = avio_tell(s->pb);
  814. } else {
  815. len=sync(s, &timestamp, &flags, &i, &pos);
  816. if (len > 0)
  817. st = s->streams[i];
  818. }
  819. if(len<0 || url_feof(s->pb))
  820. return AVERROR(EIO);
  821. res = ff_rm_parse_packet (s, s->pb, st, st->priv_data, len, pkt,
  822. &seq, flags, timestamp);
  823. if((flags&2) && (seq&0x7F) == 1)
  824. av_add_index_entry(st, pos, timestamp, 0, 0, AVINDEX_KEYFRAME);
  825. if (res)
  826. continue;
  827. }
  828. if( (st->discard >= AVDISCARD_NONKEY && !(flags&2))
  829. || st->discard >= AVDISCARD_ALL){
  830. av_free_packet(pkt);
  831. } else
  832. break;
  833. }
  834. return 0;
  835. }
  836. static int rm_read_close(AVFormatContext *s)
  837. {
  838. int i;
  839. for (i=0;i<s->nb_streams;i++)
  840. ff_rm_free_rmstream(s->streams[i]->priv_data);
  841. return 0;
  842. }
  843. static int rm_probe(AVProbeData *p)
  844. {
  845. /* check file header */
  846. if ((p->buf[0] == '.' && p->buf[1] == 'R' &&
  847. p->buf[2] == 'M' && p->buf[3] == 'F' &&
  848. p->buf[4] == 0 && p->buf[5] == 0) ||
  849. (p->buf[0] == '.' && p->buf[1] == 'r' &&
  850. p->buf[2] == 'a' && p->buf[3] == 0xfd))
  851. return AVPROBE_SCORE_MAX;
  852. else
  853. return 0;
  854. }
  855. static int64_t rm_read_dts(AVFormatContext *s, int stream_index,
  856. int64_t *ppos, int64_t pos_limit)
  857. {
  858. RMDemuxContext *rm = s->priv_data;
  859. int64_t pos, dts;
  860. int stream_index2, flags, len, h;
  861. pos = *ppos;
  862. if(rm->old_format)
  863. return AV_NOPTS_VALUE;
  864. if (avio_seek(s->pb, pos, SEEK_SET) < 0)
  865. return AV_NOPTS_VALUE;
  866. rm->remaining_len=0;
  867. for(;;){
  868. int seq=1;
  869. AVStream *st;
  870. len=sync(s, &dts, &flags, &stream_index2, &pos);
  871. if(len<0)
  872. return AV_NOPTS_VALUE;
  873. st = s->streams[stream_index2];
  874. if (st->codec->codec_type == AVMEDIA_TYPE_VIDEO) {
  875. h= avio_r8(s->pb); len--;
  876. if(!(h & 0x40)){
  877. seq = avio_r8(s->pb); len--;
  878. }
  879. }
  880. if((flags&2) && (seq&0x7F) == 1){
  881. av_dlog(s, "%d %d-%d %"PRId64" %d\n",
  882. flags, stream_index2, stream_index, dts, seq);
  883. av_add_index_entry(st, pos, dts, 0, 0, AVINDEX_KEYFRAME);
  884. if(stream_index2 == stream_index)
  885. break;
  886. }
  887. avio_skip(s->pb, len);
  888. }
  889. *ppos = pos;
  890. return dts;
  891. }
  892. AVInputFormat ff_rm_demuxer = {
  893. .name = "rm",
  894. .long_name = NULL_IF_CONFIG_SMALL("RealMedia"),
  895. .priv_data_size = sizeof(RMDemuxContext),
  896. .read_probe = rm_probe,
  897. .read_header = rm_read_header,
  898. .read_packet = rm_read_packet,
  899. .read_close = rm_read_close,
  900. .read_timestamp = rm_read_dts,
  901. };
  902. AVInputFormat ff_rdt_demuxer = {
  903. .name = "rdt",
  904. .long_name = NULL_IF_CONFIG_SMALL("RDT demuxer"),
  905. .priv_data_size = sizeof(RMDemuxContext),
  906. .read_close = rm_read_close,
  907. .flags = AVFMT_NOFILE,
  908. };