You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

1005 lines
33KB

  1. /*
  2. * "Real" compatible demuxer.
  3. * Copyright (c) 2000, 2001 Fabrice Bellard
  4. *
  5. * This file is part of FFmpeg.
  6. *
  7. * FFmpeg is free software; you can redistribute it and/or
  8. * modify it under the terms of the GNU Lesser General Public
  9. * License as published by the Free Software Foundation; either
  10. * version 2.1 of the License, or (at your option) any later version.
  11. *
  12. * FFmpeg is distributed in the hope that it will be useful,
  13. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  15. * Lesser General Public License for more details.
  16. *
  17. * You should have received a copy of the GNU Lesser General Public
  18. * License along with FFmpeg; if not, write to the Free Software
  19. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  20. */
  21. #include "libavutil/avassert.h"
  22. #include "libavutil/avstring.h"
  23. #include "libavutil/channel_layout.h"
  24. #include "libavutil/intreadwrite.h"
  25. #include "libavutil/dict.h"
  26. #include "avformat.h"
  27. #include "internal.h"
  28. #include "rmsipr.h"
  29. #include "rm.h"
  30. #define DEINT_ID_GENR MKTAG('g', 'e', 'n', 'r') ///< interleaving for Cooker/Atrac
  31. #define DEINT_ID_INT0 MKTAG('I', 'n', 't', '0') ///< no interleaving needed
  32. #define DEINT_ID_INT4 MKTAG('I', 'n', 't', '4') ///< interleaving for 28.8
  33. #define DEINT_ID_SIPR MKTAG('s', 'i', 'p', 'r') ///< interleaving for Sipro
  34. #define DEINT_ID_VBRF MKTAG('v', 'b', 'r', 'f') ///< VBR case for AAC
  35. #define DEINT_ID_VBRS MKTAG('v', 'b', 'r', 's') ///< VBR case for AAC
  36. struct RMStream {
  37. AVPacket pkt; ///< place to store merged video frame / reordered audio data
  38. int videobufsize; ///< current assembled frame size
  39. int videobufpos; ///< position for the next slice in the video buffer
  40. int curpic_num; ///< picture number of current frame
  41. int cur_slice, slices;
  42. int64_t pktpos; ///< first slice position in file
  43. /// Audio descrambling matrix parameters
  44. int64_t audiotimestamp; ///< Audio packet timestamp
  45. int sub_packet_cnt; // Subpacket counter, used while reading
  46. int sub_packet_size, sub_packet_h, coded_framesize; ///< Descrambling parameters from container
  47. int audio_framesize; /// Audio frame size from container
  48. int sub_packet_lengths[16]; /// Length of each subpacket
  49. int32_t deint_id; ///< deinterleaver used in audio stream
  50. };
  /** Demuxer-wide state shared by all streams of one RealMedia input. */
  typedef struct {
      /** packet count taken from the DATA chunk header */
      int nb_packets;
      /** non-zero when the input is the very old ".ra" format */
      int old_format;
      /** id of the stream whose packet is only partially consumed */
      int current_stream;
      /** bytes left in the partially consumed packet */
      int remaining_len;
      /** Stream number for audio packets */
      int audio_stream_num;
      /** Output packet counter */
      int audio_pkt_cnt;
  } RMDemuxContext;
  59. static inline void get_strl(AVIOContext *pb, char *buf, int buf_size, int len)
  60. {
  61. int i;
  62. char *q, r;
  63. q = buf;
  64. for(i=0;i<len;i++) {
  65. r = avio_r8(pb);
  66. if (i < buf_size - 1)
  67. *q++ = r;
  68. }
  69. if (buf_size > 0) *q = '\0';
  70. }
  71. static void get_str8(AVIOContext *pb, char *buf, int buf_size)
  72. {
  73. get_strl(pb, buf, buf_size, avio_r8(pb));
  74. }
  75. static int rm_read_extradata(AVIOContext *pb, AVCodecContext *avctx, unsigned size)
  76. {
  77. if (size >= 1<<24)
  78. return -1;
  79. avctx->extradata = av_malloc(size + FF_INPUT_BUFFER_PADDING_SIZE);
  80. if (!avctx->extradata)
  81. return AVERROR(ENOMEM);
  82. avctx->extradata_size = avio_read(pb, avctx->extradata, size);
  83. memset(avctx->extradata + avctx->extradata_size, 0, FF_INPUT_BUFFER_PADDING_SIZE);
  84. if (avctx->extradata_size != size)
  85. return AVERROR(EIO);
  86. return 0;
  87. }
  88. static void rm_read_metadata(AVFormatContext *s, int wide)
  89. {
  90. char buf[1024];
  91. int i;
  92. for (i=0; i<FF_ARRAY_ELEMS(ff_rm_metadata); i++) {
  93. int len = wide ? avio_rb16(s->pb) : avio_r8(s->pb);
  94. get_strl(s->pb, buf, sizeof(buf), len);
  95. av_dict_set(&s->metadata, ff_rm_metadata[i], buf, 0);
  96. }
  97. }
  98. RMStream *ff_rm_alloc_rmstream (void)
  99. {
  100. RMStream *rms = av_mallocz(sizeof(RMStream));
  101. rms->curpic_num = -1;
  102. return rms;
  103. }
  104. void ff_rm_free_rmstream (RMStream *rms)
  105. {
  106. av_free_packet(&rms->pkt);
  107. }
  108. static int rm_read_audio_stream_info(AVFormatContext *s, AVIOContext *pb,
  109. AVStream *st, RMStream *ast, int read_all)
  110. {
  111. char buf[256];
  112. uint32_t version;
  113. int ret;
  114. /* ra type header */
  115. version = avio_rb16(pb); /* version */
  116. if (version == 3) {
  117. int header_size = avio_rb16(pb);
  118. int64_t startpos = avio_tell(pb);
  119. avio_skip(pb, 14);
  120. rm_read_metadata(s, 0);
  121. if ((startpos + header_size) >= avio_tell(pb) + 2) {
  122. // fourcc (should always be "lpcJ")
  123. avio_r8(pb);
  124. get_str8(pb, buf, sizeof(buf));
  125. }
  126. // Skip extra header crap (this should never happen)
  127. if ((startpos + header_size) > avio_tell(pb))
  128. avio_skip(pb, header_size + startpos - avio_tell(pb));
  129. st->codec->sample_rate = 8000;
  130. st->codec->channels = 1;
  131. st->codec->channel_layout = AV_CH_LAYOUT_MONO;
  132. st->codec->codec_type = AVMEDIA_TYPE_AUDIO;
  133. st->codec->codec_id = AV_CODEC_ID_RA_144;
  134. ast->deint_id = DEINT_ID_INT0;
  135. } else {
  136. int flavor, sub_packet_h, coded_framesize, sub_packet_size;
  137. int codecdata_length;
  138. /* old version (4) */
  139. avio_skip(pb, 2); /* unused */
  140. avio_rb32(pb); /* .ra4 */
  141. avio_rb32(pb); /* data size */
  142. avio_rb16(pb); /* version2 */
  143. avio_rb32(pb); /* header size */
  144. flavor= avio_rb16(pb); /* add codec info / flavor */
  145. ast->coded_framesize = coded_framesize = avio_rb32(pb); /* coded frame size */
  146. avio_rb32(pb); /* ??? */
  147. avio_rb32(pb); /* ??? */
  148. avio_rb32(pb); /* ??? */
  149. ast->sub_packet_h = sub_packet_h = avio_rb16(pb); /* 1 */
  150. st->codec->block_align= avio_rb16(pb); /* frame size */
  151. ast->sub_packet_size = sub_packet_size = avio_rb16(pb); /* sub packet size */
  152. avio_rb16(pb); /* ??? */
  153. if (version == 5) {
  154. avio_rb16(pb); avio_rb16(pb); avio_rb16(pb);
  155. }
  156. st->codec->sample_rate = avio_rb16(pb);
  157. avio_rb32(pb);
  158. st->codec->channels = avio_rb16(pb);
  159. if (version == 5) {
  160. ast->deint_id = avio_rl32(pb);
  161. avio_read(pb, buf, 4);
  162. buf[4] = 0;
  163. } else {
  164. get_str8(pb, buf, sizeof(buf)); /* desc */
  165. ast->deint_id = AV_RL32(buf);
  166. get_str8(pb, buf, sizeof(buf)); /* desc */
  167. }
  168. st->codec->codec_type = AVMEDIA_TYPE_AUDIO;
  169. st->codec->codec_tag = AV_RL32(buf);
  170. st->codec->codec_id = ff_codec_get_id(ff_rm_codec_tags,
  171. st->codec->codec_tag);
  172. switch (st->codec->codec_id) {
  173. case AV_CODEC_ID_AC3:
  174. st->need_parsing = AVSTREAM_PARSE_FULL;
  175. break;
  176. case AV_CODEC_ID_RA_288:
  177. st->codec->extradata_size= 0;
  178. ast->audio_framesize = st->codec->block_align;
  179. st->codec->block_align = coded_framesize;
  180. break;
  181. case AV_CODEC_ID_COOK:
  182. st->need_parsing = AVSTREAM_PARSE_HEADERS;
  183. case AV_CODEC_ID_ATRAC3:
  184. case AV_CODEC_ID_SIPR:
  185. if (read_all) {
  186. codecdata_length = 0;
  187. } else {
  188. avio_rb16(pb); avio_r8(pb);
  189. if (version == 5)
  190. avio_r8(pb);
  191. codecdata_length = avio_rb32(pb);
  192. if(codecdata_length + FF_INPUT_BUFFER_PADDING_SIZE <= (unsigned)codecdata_length){
  193. av_log(s, AV_LOG_ERROR, "codecdata_length too large\n");
  194. return -1;
  195. }
  196. }
  197. ast->audio_framesize = st->codec->block_align;
  198. if (st->codec->codec_id == AV_CODEC_ID_SIPR) {
  199. if (flavor > 3) {
  200. av_log(s, AV_LOG_ERROR, "bad SIPR file flavor %d\n",
  201. flavor);
  202. return -1;
  203. }
  204. st->codec->block_align = ff_sipr_subpk_size[flavor];
  205. } else {
  206. if(sub_packet_size <= 0){
  207. av_log(s, AV_LOG_ERROR, "sub_packet_size is invalid\n");
  208. return -1;
  209. }
  210. st->codec->block_align = ast->sub_packet_size;
  211. }
  212. if ((ret = rm_read_extradata(pb, st->codec, codecdata_length)) < 0)
  213. return ret;
  214. break;
  215. case AV_CODEC_ID_AAC:
  216. avio_rb16(pb); avio_r8(pb);
  217. if (version == 5)
  218. avio_r8(pb);
  219. codecdata_length = avio_rb32(pb);
  220. if(codecdata_length + FF_INPUT_BUFFER_PADDING_SIZE <= (unsigned)codecdata_length){
  221. av_log(s, AV_LOG_ERROR, "codecdata_length too large\n");
  222. return -1;
  223. }
  224. if (codecdata_length >= 1) {
  225. avio_r8(pb);
  226. if ((ret = rm_read_extradata(pb, st->codec, codecdata_length - 1)) < 0)
  227. return ret;
  228. }
  229. break;
  230. default:
  231. av_strlcpy(st->codec->codec_name, buf, sizeof(st->codec->codec_name));
  232. }
  233. if (ast->deint_id == DEINT_ID_INT4 ||
  234. ast->deint_id == DEINT_ID_GENR ||
  235. ast->deint_id == DEINT_ID_SIPR) {
  236. if (st->codec->block_align <= 0 ||
  237. ast->audio_framesize * sub_packet_h > (unsigned)INT_MAX ||
  238. ast->audio_framesize * sub_packet_h < st->codec->block_align)
  239. return AVERROR_INVALIDDATA;
  240. if (av_new_packet(&ast->pkt, ast->audio_framesize * sub_packet_h) < 0)
  241. return AVERROR(ENOMEM);
  242. }
  243. switch (ast->deint_id) {
  244. case DEINT_ID_INT4:
  245. if (ast->coded_framesize > ast->audio_framesize ||
  246. sub_packet_h <= 1 ||
  247. ast->coded_framesize * sub_packet_h > (2 + (sub_packet_h & 1)) * ast->audio_framesize)
  248. return AVERROR_INVALIDDATA;
  249. break;
  250. case DEINT_ID_GENR:
  251. if (ast->sub_packet_size <= 0 ||
  252. ast->sub_packet_size > ast->audio_framesize)
  253. return AVERROR_INVALIDDATA;
  254. break;
  255. case DEINT_ID_SIPR:
  256. case DEINT_ID_INT0:
  257. case DEINT_ID_VBRS:
  258. case DEINT_ID_VBRF:
  259. break;
  260. default:
  261. av_log(s, AV_LOG_ERROR, "Unknown interleaver %X\n", ast->deint_id);
  262. return AVERROR_INVALIDDATA;
  263. }
  264. if (read_all) {
  265. avio_r8(pb);
  266. avio_r8(pb);
  267. avio_r8(pb);
  268. rm_read_metadata(s, 0);
  269. }
  270. }
  271. return 0;
  272. }
  273. int
  274. ff_rm_read_mdpr_codecdata (AVFormatContext *s, AVIOContext *pb,
  275. AVStream *st, RMStream *rst, int codec_data_size, const uint8_t *mime)
  276. {
  277. unsigned int v;
  278. int size;
  279. int64_t codec_pos;
  280. int ret;
  281. avpriv_set_pts_info(st, 64, 1, 1000);
  282. codec_pos = avio_tell(pb);
  283. v = avio_rb32(pb);
  284. if (v == MKTAG(0xfd, 'a', 'r', '.')) {
  285. /* ra type header */
  286. if (rm_read_audio_stream_info(s, pb, st, rst, 0))
  287. return -1;
  288. } else if (v == MKBETAG('L', 'S', 'D', ':')) {
  289. avio_seek(pb, -4, SEEK_CUR);
  290. if ((ret = rm_read_extradata(pb, st->codec, codec_data_size)) < 0)
  291. return ret;
  292. st->codec->codec_type = AVMEDIA_TYPE_AUDIO;
  293. st->codec->codec_tag = AV_RL32(st->codec->extradata);
  294. st->codec->codec_id = ff_codec_get_id(ff_rm_codec_tags,
  295. st->codec->codec_tag);
  296. } else if(mime && !strcmp(mime, "logical-fileinfo")){
  297. int stream_count, rule_count, property_count, i;
  298. ff_free_stream(s, st);
  299. if (avio_rb16(pb) != 0) {
  300. av_log(s, AV_LOG_WARNING, "Unsupported version\n");
  301. goto skip;
  302. }
  303. stream_count = avio_rb16(pb);
  304. avio_skip(pb, 6*stream_count);
  305. rule_count = avio_rb16(pb);
  306. avio_skip(pb, 2*rule_count);
  307. property_count = avio_rb16(pb);
  308. for(i=0; i<property_count; i++){
  309. uint8_t name[128], val[128];
  310. avio_rb32(pb);
  311. if (avio_rb16(pb) != 0) {
  312. av_log(s, AV_LOG_WARNING, "Unsupported Name value property version\n");
  313. goto skip; //FIXME skip just this one
  314. }
  315. get_str8(pb, name, sizeof(name));
  316. switch(avio_rb32(pb)) {
  317. case 2: get_strl(pb, val, sizeof(val), avio_rb16(pb));
  318. av_dict_set(&s->metadata, name, val, 0);
  319. break;
  320. default: avio_skip(pb, avio_rb16(pb));
  321. }
  322. }
  323. } else {
  324. int fps;
  325. if (avio_rl32(pb) != MKTAG('V', 'I', 'D', 'O')) {
  326. fail1:
  327. av_log(s, AV_LOG_WARNING, "Unsupported stream type %08x\n", v);
  328. goto skip;
  329. }
  330. st->codec->codec_tag = avio_rl32(pb);
  331. st->codec->codec_id = ff_codec_get_id(ff_rm_codec_tags,
  332. st->codec->codec_tag);
  333. av_dlog(s, "%X %X\n", st->codec->codec_tag, MKTAG('R', 'V', '2', '0'));
  334. if (st->codec->codec_id == AV_CODEC_ID_NONE)
  335. goto fail1;
  336. st->codec->width = avio_rb16(pb);
  337. st->codec->height = avio_rb16(pb);
  338. avio_skip(pb, 2); // looks like bits per sample
  339. avio_skip(pb, 4); // always zero?
  340. st->codec->codec_type = AVMEDIA_TYPE_VIDEO;
  341. st->need_parsing = AVSTREAM_PARSE_TIMESTAMPS;
  342. fps = avio_rb32(pb);
  343. if ((ret = rm_read_extradata(pb, st->codec, codec_data_size - (avio_tell(pb) - codec_pos))) < 0)
  344. return ret;
  345. av_reduce(&st->avg_frame_rate.den, &st->avg_frame_rate.num,
  346. 0x10000, fps, (1 << 30) - 1);
  347. #if FF_API_R_FRAME_RATE
  348. st->r_frame_rate = st->avg_frame_rate;
  349. #endif
  350. }
  351. skip:
  352. /* skip codec info */
  353. size = avio_tell(pb) - codec_pos;
  354. avio_skip(pb, codec_data_size - size);
  355. return 0;
  356. }
  357. /** this function assumes that the demuxer has already seeked to the start
  358. * of the INDX chunk, and will bail out if not. */
  359. static int rm_read_index(AVFormatContext *s)
  360. {
  361. AVIOContext *pb = s->pb;
  362. unsigned int size, n_pkts, str_id, next_off, n, pos, pts;
  363. AVStream *st;
  364. do {
  365. if (avio_rl32(pb) != MKTAG('I','N','D','X'))
  366. return -1;
  367. size = avio_rb32(pb);
  368. if (size < 20)
  369. return -1;
  370. avio_skip(pb, 2);
  371. n_pkts = avio_rb32(pb);
  372. str_id = avio_rb16(pb);
  373. next_off = avio_rb32(pb);
  374. for (n = 0; n < s->nb_streams; n++)
  375. if (s->streams[n]->id == str_id) {
  376. st = s->streams[n];
  377. break;
  378. }
  379. if (n == s->nb_streams) {
  380. av_log(s, AV_LOG_ERROR,
  381. "Invalid stream index %d for index at pos %"PRId64"\n",
  382. str_id, avio_tell(pb));
  383. goto skip;
  384. } else if ((avio_size(pb) - avio_tell(pb)) / 14 < n_pkts) {
  385. av_log(s, AV_LOG_ERROR,
  386. "Nr. of packets in packet index for stream index %d "
  387. "exceeds filesize (%"PRId64" at %"PRId64" = %"PRId64")\n",
  388. str_id, avio_size(pb), avio_tell(pb),
  389. (avio_size(pb) - avio_tell(pb)) / 14);
  390. goto skip;
  391. }
  392. for (n = 0; n < n_pkts; n++) {
  393. avio_skip(pb, 2);
  394. pts = avio_rb32(pb);
  395. pos = avio_rb32(pb);
  396. avio_skip(pb, 4); /* packet no. */
  397. av_add_index_entry(st, pos, pts, 0, 0, AVINDEX_KEYFRAME);
  398. }
  399. skip:
  400. if (next_off && avio_tell(pb) < next_off &&
  401. avio_seek(pb, next_off, SEEK_SET) < 0) {
  402. av_log(s, AV_LOG_ERROR,
  403. "Non-linear index detected, not supported\n");
  404. return -1;
  405. }
  406. } while (next_off);
  407. return 0;
  408. }
  409. static int rm_read_header_old(AVFormatContext *s)
  410. {
  411. RMDemuxContext *rm = s->priv_data;
  412. AVStream *st;
  413. rm->old_format = 1;
  414. st = avformat_new_stream(s, NULL);
  415. if (!st)
  416. return -1;
  417. st->priv_data = ff_rm_alloc_rmstream();
  418. return rm_read_audio_stream_info(s, s->pb, st, st->priv_data, 1);
  419. }
  420. static int rm_read_header(AVFormatContext *s)
  421. {
  422. RMDemuxContext *rm = s->priv_data;
  423. AVStream *st;
  424. AVIOContext *pb = s->pb;
  425. unsigned int tag;
  426. int tag_size;
  427. unsigned int start_time, duration;
  428. unsigned int data_off = 0, indx_off = 0;
  429. char buf[128], mime[128];
  430. int flags = 0;
  431. tag = avio_rl32(pb);
  432. if (tag == MKTAG('.', 'r', 'a', 0xfd)) {
  433. /* very old .ra format */
  434. return rm_read_header_old(s);
  435. } else if (tag != MKTAG('.', 'R', 'M', 'F')) {
  436. return AVERROR(EIO);
  437. }
  438. tag_size = avio_rb32(pb);
  439. avio_skip(pb, tag_size - 8);
  440. for(;;) {
  441. if (url_feof(pb))
  442. return -1;
  443. tag = avio_rl32(pb);
  444. tag_size = avio_rb32(pb);
  445. avio_rb16(pb);
  446. av_dlog(s, "tag=%c%c%c%c (%08x) size=%d\n",
  447. (tag ) & 0xff,
  448. (tag >> 8) & 0xff,
  449. (tag >> 16) & 0xff,
  450. (tag >> 24) & 0xff,
  451. tag,
  452. tag_size);
  453. if (tag_size < 10 && tag != MKTAG('D', 'A', 'T', 'A'))
  454. return -1;
  455. switch(tag) {
  456. case MKTAG('P', 'R', 'O', 'P'):
  457. /* file header */
  458. avio_rb32(pb); /* max bit rate */
  459. avio_rb32(pb); /* avg bit rate */
  460. avio_rb32(pb); /* max packet size */
  461. avio_rb32(pb); /* avg packet size */
  462. avio_rb32(pb); /* nb packets */
  463. duration = avio_rb32(pb); /* duration */
  464. s->duration = av_rescale(duration, AV_TIME_BASE, 1000);
  465. avio_rb32(pb); /* preroll */
  466. indx_off = avio_rb32(pb); /* index offset */
  467. data_off = avio_rb32(pb); /* data offset */
  468. avio_rb16(pb); /* nb streams */
  469. flags = avio_rb16(pb); /* flags */
  470. break;
  471. case MKTAG('C', 'O', 'N', 'T'):
  472. rm_read_metadata(s, 1);
  473. break;
  474. case MKTAG('M', 'D', 'P', 'R'):
  475. st = avformat_new_stream(s, NULL);
  476. if (!st)
  477. return AVERROR(ENOMEM);
  478. st->id = avio_rb16(pb);
  479. avio_rb32(pb); /* max bit rate */
  480. st->codec->bit_rate = avio_rb32(pb); /* bit rate */
  481. avio_rb32(pb); /* max packet size */
  482. avio_rb32(pb); /* avg packet size */
  483. start_time = avio_rb32(pb); /* start time */
  484. avio_rb32(pb); /* preroll */
  485. duration = avio_rb32(pb); /* duration */
  486. st->start_time = start_time;
  487. st->duration = duration;
  488. if(duration>0)
  489. s->duration = AV_NOPTS_VALUE;
  490. get_str8(pb, buf, sizeof(buf)); /* desc */
  491. get_str8(pb, mime, sizeof(mime)); /* mimetype */
  492. st->codec->codec_type = AVMEDIA_TYPE_DATA;
  493. st->priv_data = ff_rm_alloc_rmstream();
  494. if (ff_rm_read_mdpr_codecdata(s, s->pb, st, st->priv_data,
  495. avio_rb32(pb), mime) < 0)
  496. return -1;
  497. break;
  498. case MKTAG('D', 'A', 'T', 'A'):
  499. goto header_end;
  500. default:
  501. /* unknown tag: skip it */
  502. avio_skip(pb, tag_size - 10);
  503. break;
  504. }
  505. }
  506. header_end:
  507. rm->nb_packets = avio_rb32(pb); /* number of packets */
  508. if (!rm->nb_packets && (flags & 4))
  509. rm->nb_packets = 3600 * 25;
  510. avio_rb32(pb); /* next data header */
  511. if (!data_off)
  512. data_off = avio_tell(pb) - 18;
  513. if (indx_off && pb->seekable && !(s->flags & AVFMT_FLAG_IGNIDX) &&
  514. avio_seek(pb, indx_off, SEEK_SET) >= 0) {
  515. rm_read_index(s);
  516. avio_seek(pb, data_off + 18, SEEK_SET);
  517. }
  518. return 0;
  519. }
  520. static int get_num(AVIOContext *pb, int *len)
  521. {
  522. int n, n1;
  523. n = avio_rb16(pb);
  524. (*len)-=2;
  525. n &= 0x7FFF;
  526. if (n >= 0x4000) {
  527. return n - 0x4000;
  528. } else {
  529. n1 = avio_rb16(pb);
  530. (*len)-=2;
  531. return (n << 16) | n1;
  532. }
  533. }
  534. /* multiple of 20 bytes for ra144 (ugly) */
  535. #define RAW_PACKET_SIZE 1000
  536. static int sync(AVFormatContext *s, int64_t *timestamp, int *flags, int *stream_index, int64_t *pos){
  537. RMDemuxContext *rm = s->priv_data;
  538. AVIOContext *pb = s->pb;
  539. AVStream *st;
  540. uint32_t state=0xFFFFFFFF;
  541. while(!url_feof(pb)){
  542. int len, num, i;
  543. *pos= avio_tell(pb) - 3;
  544. if(rm->remaining_len > 0){
  545. num= rm->current_stream;
  546. len= rm->remaining_len;
  547. *timestamp = AV_NOPTS_VALUE;
  548. *flags= 0;
  549. }else{
  550. state= (state<<8) + avio_r8(pb);
  551. if(state == MKBETAG('I', 'N', 'D', 'X')){
  552. int n_pkts, expected_len;
  553. len = avio_rb32(pb);
  554. avio_skip(pb, 2);
  555. n_pkts = avio_rb32(pb);
  556. expected_len = 20 + n_pkts * 14;
  557. if (len == 20)
  558. /* some files don't add index entries to chunk size... */
  559. len = expected_len;
  560. else if (len != expected_len)
  561. av_log(s, AV_LOG_WARNING,
  562. "Index size %d (%d pkts) is wrong, should be %d.\n",
  563. len, n_pkts, expected_len);
  564. len -= 14; // we already read part of the index header
  565. if(len<0)
  566. continue;
  567. goto skip;
  568. } else if (state == MKBETAG('D','A','T','A')) {
  569. av_log(s, AV_LOG_WARNING,
  570. "DATA tag in middle of chunk, file may be broken.\n");
  571. }
  572. if(state > (unsigned)0xFFFF || state <= 12)
  573. continue;
  574. len=state - 12;
  575. state= 0xFFFFFFFF;
  576. num = avio_rb16(pb);
  577. *timestamp = avio_rb32(pb);
  578. avio_r8(pb); /* reserved */
  579. *flags = avio_r8(pb); /* flags */
  580. }
  581. for(i=0;i<s->nb_streams;i++) {
  582. st = s->streams[i];
  583. if (num == st->id)
  584. break;
  585. }
  586. if (i == s->nb_streams) {
  587. skip:
  588. /* skip packet if unknown number */
  589. avio_skip(pb, len);
  590. rm->remaining_len = 0;
  591. continue;
  592. }
  593. *stream_index= i;
  594. return len;
  595. }
  596. return -1;
  597. }
  598. static int rm_assemble_video_frame(AVFormatContext *s, AVIOContext *pb,
  599. RMDemuxContext *rm, RMStream *vst,
  600. AVPacket *pkt, int len, int *pseq,
  601. int64_t *timestamp)
  602. {
  603. int hdr, seq, pic_num, len2, pos;
  604. int type;
  605. hdr = avio_r8(pb); len--;
  606. type = hdr >> 6;
  607. if(type != 3){ // not frame as a part of packet
  608. seq = avio_r8(pb); len--;
  609. }
  610. if(type != 1){ // not whole frame
  611. len2 = get_num(pb, &len);
  612. pos = get_num(pb, &len);
  613. pic_num = avio_r8(pb); len--;
  614. }
  615. if(len<0)
  616. return -1;
  617. rm->remaining_len = len;
  618. if(type&1){ // frame, not slice
  619. if(type == 3){ // frame as a part of packet
  620. len= len2;
  621. *timestamp = pos;
  622. }
  623. if(rm->remaining_len < len)
  624. return -1;
  625. rm->remaining_len -= len;
  626. if(av_new_packet(pkt, len + 9) < 0)
  627. return AVERROR(EIO);
  628. pkt->data[0] = 0;
  629. AV_WL32(pkt->data + 1, 1);
  630. AV_WL32(pkt->data + 5, 0);
  631. avio_read(pb, pkt->data + 9, len);
  632. return 0;
  633. }
  634. //now we have to deal with single slice
  635. *pseq = seq;
  636. if((seq & 0x7F) == 1 || vst->curpic_num != pic_num){
  637. vst->slices = ((hdr & 0x3F) << 1) + 1;
  638. vst->videobufsize = len2 + 8*vst->slices + 1;
  639. av_free_packet(&vst->pkt); //FIXME this should be output.
  640. if(av_new_packet(&vst->pkt, vst->videobufsize) < 0)
  641. return AVERROR(ENOMEM);
  642. vst->videobufpos = 8*vst->slices + 1;
  643. vst->cur_slice = 0;
  644. vst->curpic_num = pic_num;
  645. vst->pktpos = avio_tell(pb);
  646. }
  647. if(type == 2)
  648. len = FFMIN(len, pos);
  649. if(++vst->cur_slice > vst->slices)
  650. return 1;
  651. AV_WL32(vst->pkt.data - 7 + 8*vst->cur_slice, 1);
  652. AV_WL32(vst->pkt.data - 3 + 8*vst->cur_slice, vst->videobufpos - 8*vst->slices - 1);
  653. if(vst->videobufpos + len > vst->videobufsize)
  654. return 1;
  655. if (avio_read(pb, vst->pkt.data + vst->videobufpos, len) != len)
  656. return AVERROR(EIO);
  657. vst->videobufpos += len;
  658. rm->remaining_len-= len;
  659. if (type == 2 || vst->videobufpos == vst->videobufsize) {
  660. vst->pkt.data[0] = vst->cur_slice-1;
  661. *pkt= vst->pkt;
  662. vst->pkt.data= NULL;
  663. vst->pkt.size= 0;
  664. if(vst->slices != vst->cur_slice) //FIXME find out how to set slices correct from the begin
  665. memmove(pkt->data + 1 + 8*vst->cur_slice, pkt->data + 1 + 8*vst->slices,
  666. vst->videobufpos - 1 - 8*vst->slices);
  667. pkt->size = vst->videobufpos + 8*(vst->cur_slice - vst->slices);
  668. pkt->pts = AV_NOPTS_VALUE;
  669. pkt->pos = vst->pktpos;
  670. vst->slices = 0;
  671. return 0;
  672. }
  673. return 1;
  674. }
  675. static inline void
  676. rm_ac3_swap_bytes (AVStream *st, AVPacket *pkt)
  677. {
  678. uint8_t *ptr;
  679. int j;
  680. if (st->codec->codec_id == AV_CODEC_ID_AC3) {
  681. ptr = pkt->data;
  682. for (j=0;j<pkt->size;j+=2) {
  683. FFSWAP(int, ptr[0], ptr[1]);
  684. ptr += 2;
  685. }
  686. }
  687. }
  688. int
  689. ff_rm_parse_packet (AVFormatContext *s, AVIOContext *pb,
  690. AVStream *st, RMStream *ast, int len, AVPacket *pkt,
  691. int *seq, int flags, int64_t timestamp)
  692. {
  693. RMDemuxContext *rm = s->priv_data;
  694. if (st->codec->codec_type == AVMEDIA_TYPE_VIDEO) {
  695. rm->current_stream= st->id;
  696. if(rm_assemble_video_frame(s, pb, rm, ast, pkt, len, seq, &timestamp))
  697. return -1; //got partial frame
  698. } else if (st->codec->codec_type == AVMEDIA_TYPE_AUDIO) {
  699. if ((ast->deint_id == DEINT_ID_GENR) ||
  700. (ast->deint_id == DEINT_ID_INT4) ||
  701. (ast->deint_id == DEINT_ID_SIPR)) {
  702. int x;
  703. int sps = ast->sub_packet_size;
  704. int cfs = ast->coded_framesize;
  705. int h = ast->sub_packet_h;
  706. int y = ast->sub_packet_cnt;
  707. int w = ast->audio_framesize;
  708. if (flags & 2)
  709. y = ast->sub_packet_cnt = 0;
  710. if (!y)
  711. ast->audiotimestamp = timestamp;
  712. switch (ast->deint_id) {
  713. case DEINT_ID_INT4:
  714. for (x = 0; x < h/2; x++)
  715. avio_read(pb, ast->pkt.data+x*2*w+y*cfs, cfs);
  716. break;
  717. case DEINT_ID_GENR:
  718. for (x = 0; x < w/sps; x++)
  719. avio_read(pb, ast->pkt.data+sps*(h*x+((h+1)/2)*(y&1)+(y>>1)), sps);
  720. break;
  721. case DEINT_ID_SIPR:
  722. avio_read(pb, ast->pkt.data + y * w, w);
  723. break;
  724. }
  725. if (++(ast->sub_packet_cnt) < h)
  726. return -1;
  727. if (ast->deint_id == DEINT_ID_SIPR)
  728. ff_rm_reorder_sipr_data(ast->pkt.data, h, w);
  729. ast->sub_packet_cnt = 0;
  730. rm->audio_stream_num = st->index;
  731. rm->audio_pkt_cnt = h * w / st->codec->block_align;
  732. } else if ((ast->deint_id == DEINT_ID_VBRF) ||
  733. (ast->deint_id == DEINT_ID_VBRS)) {
  734. int x;
  735. rm->audio_stream_num = st->index;
  736. ast->sub_packet_cnt = (avio_rb16(pb) & 0xf0) >> 4;
  737. if (ast->sub_packet_cnt) {
  738. for (x = 0; x < ast->sub_packet_cnt; x++)
  739. ast->sub_packet_lengths[x] = avio_rb16(pb);
  740. rm->audio_pkt_cnt = ast->sub_packet_cnt;
  741. ast->audiotimestamp = timestamp;
  742. } else
  743. return -1;
  744. } else {
  745. av_get_packet(pb, pkt, len);
  746. rm_ac3_swap_bytes(st, pkt);
  747. }
  748. } else
  749. av_get_packet(pb, pkt, len);
  750. pkt->stream_index = st->index;
  751. #if 0
  752. if (st->codec->codec_type == AVMEDIA_TYPE_VIDEO) {
  753. if(st->codec->codec_id == AV_CODEC_ID_RV20){
  754. int seq= 128*(pkt->data[2]&0x7F) + (pkt->data[3]>>1);
  755. av_log(s, AV_LOG_DEBUG, "%d %"PRId64" %d\n", *timestamp, *timestamp*512LL/25, seq);
  756. seq |= (timestamp&~0x3FFF);
  757. if(seq - timestamp > 0x2000) seq -= 0x4000;
  758. if(seq - timestamp < -0x2000) seq += 0x4000;
  759. }
  760. }
  761. #endif
  762. pkt->pts = timestamp;
  763. if (flags & 2)
  764. pkt->flags |= AV_PKT_FLAG_KEY;
  765. return st->codec->codec_type == AVMEDIA_TYPE_AUDIO ? rm->audio_pkt_cnt : 0;
  766. }
  767. int
  768. ff_rm_retrieve_cache (AVFormatContext *s, AVIOContext *pb,
  769. AVStream *st, RMStream *ast, AVPacket *pkt)
  770. {
  771. RMDemuxContext *rm = s->priv_data;
  772. av_assert0 (rm->audio_pkt_cnt > 0);
  773. if (ast->deint_id == DEINT_ID_VBRF ||
  774. ast->deint_id == DEINT_ID_VBRS)
  775. av_get_packet(pb, pkt, ast->sub_packet_lengths[ast->sub_packet_cnt - rm->audio_pkt_cnt]);
  776. else {
  777. if(av_new_packet(pkt, st->codec->block_align) < 0)
  778. return AVERROR(ENOMEM);
  779. memcpy(pkt->data, ast->pkt.data + st->codec->block_align * //FIXME avoid this
  780. (ast->sub_packet_h * ast->audio_framesize / st->codec->block_align - rm->audio_pkt_cnt),
  781. st->codec->block_align);
  782. }
  783. rm->audio_pkt_cnt--;
  784. if ((pkt->pts = ast->audiotimestamp) != AV_NOPTS_VALUE) {
  785. ast->audiotimestamp = AV_NOPTS_VALUE;
  786. pkt->flags = AV_PKT_FLAG_KEY;
  787. } else
  788. pkt->flags = 0;
  789. pkt->stream_index = st->index;
  790. return rm->audio_pkt_cnt;
  791. }
  792. static int rm_read_packet(AVFormatContext *s, AVPacket *pkt)
  793. {
  794. RMDemuxContext *rm = s->priv_data;
  795. AVStream *st;
  796. int i, len, res, seq = 1;
  797. int64_t timestamp, pos;
  798. int flags;
  799. for (;;) {
  800. if (rm->audio_pkt_cnt) {
  801. // If there are queued audio packet return them first
  802. st = s->streams[rm->audio_stream_num];
  803. res = ff_rm_retrieve_cache(s, s->pb, st, st->priv_data, pkt);
  804. if(res < 0)
  805. return res;
  806. flags = 0;
  807. } else {
  808. if (rm->old_format) {
  809. RMStream *ast;
  810. st = s->streams[0];
  811. ast = st->priv_data;
  812. timestamp = AV_NOPTS_VALUE;
  813. len = !ast->audio_framesize ? RAW_PACKET_SIZE :
  814. ast->coded_framesize * ast->sub_packet_h / 2;
  815. flags = (seq++ == 1) ? 2 : 0;
  816. pos = avio_tell(s->pb);
  817. } else {
  818. len=sync(s, &timestamp, &flags, &i, &pos);
  819. if (len > 0)
  820. st = s->streams[i];
  821. }
  822. if(len<0 || url_feof(s->pb))
  823. return AVERROR(EIO);
  824. res = ff_rm_parse_packet (s, s->pb, st, st->priv_data, len, pkt,
  825. &seq, flags, timestamp);
  826. if((flags&2) && (seq&0x7F) == 1)
  827. av_add_index_entry(st, pos, timestamp, 0, 0, AVINDEX_KEYFRAME);
  828. if (res)
  829. continue;
  830. }
  831. if( (st->discard >= AVDISCARD_NONKEY && !(flags&2))
  832. || st->discard >= AVDISCARD_ALL){
  833. av_free_packet(pkt);
  834. } else
  835. break;
  836. }
  837. return 0;
  838. }
  839. static int rm_read_close(AVFormatContext *s)
  840. {
  841. int i;
  842. for (i=0;i<s->nb_streams;i++)
  843. ff_rm_free_rmstream(s->streams[i]->priv_data);
  844. return 0;
  845. }
  846. static int rm_probe(AVProbeData *p)
  847. {
  848. /* check file header */
  849. if ((p->buf[0] == '.' && p->buf[1] == 'R' &&
  850. p->buf[2] == 'M' && p->buf[3] == 'F' &&
  851. p->buf[4] == 0 && p->buf[5] == 0) ||
  852. (p->buf[0] == '.' && p->buf[1] == 'r' &&
  853. p->buf[2] == 'a' && p->buf[3] == 0xfd))
  854. return AVPROBE_SCORE_MAX;
  855. else
  856. return 0;
  857. }
  858. static int64_t rm_read_dts(AVFormatContext *s, int stream_index,
  859. int64_t *ppos, int64_t pos_limit)
  860. {
  861. RMDemuxContext *rm = s->priv_data;
  862. int64_t pos, dts;
  863. int stream_index2, flags, len, h;
  864. pos = *ppos;
  865. if(rm->old_format)
  866. return AV_NOPTS_VALUE;
  867. if (avio_seek(s->pb, pos, SEEK_SET) < 0)
  868. return AV_NOPTS_VALUE;
  869. rm->remaining_len=0;
  870. for(;;){
  871. int seq=1;
  872. AVStream *st;
  873. len=sync(s, &dts, &flags, &stream_index2, &pos);
  874. if(len<0)
  875. return AV_NOPTS_VALUE;
  876. st = s->streams[stream_index2];
  877. if (st->codec->codec_type == AVMEDIA_TYPE_VIDEO) {
  878. h= avio_r8(s->pb); len--;
  879. if(!(h & 0x40)){
  880. seq = avio_r8(s->pb); len--;
  881. }
  882. }
  883. if((flags&2) && (seq&0x7F) == 1){
  884. av_dlog(s, "%d %d-%d %"PRId64" %d\n",
  885. flags, stream_index2, stream_index, dts, seq);
  886. av_add_index_entry(st, pos, dts, 0, 0, AVINDEX_KEYFRAME);
  887. if(stream_index2 == stream_index)
  888. break;
  889. }
  890. avio_skip(s->pb, len);
  891. }
  892. *ppos = pos;
  893. return dts;
  894. }
  895. AVInputFormat ff_rm_demuxer = {
  896. .name = "rm",
  897. .long_name = NULL_IF_CONFIG_SMALL("RealMedia"),
  898. .priv_data_size = sizeof(RMDemuxContext),
  899. .read_probe = rm_probe,
  900. .read_header = rm_read_header,
  901. .read_packet = rm_read_packet,
  902. .read_close = rm_read_close,
  903. .read_timestamp = rm_read_dts,
  904. };
  905. AVInputFormat ff_rdt_demuxer = {
  906. .name = "rdt",
  907. .long_name = NULL_IF_CONFIG_SMALL("RDT demuxer"),
  908. .priv_data_size = sizeof(RMDemuxContext),
  909. .read_close = rm_read_close,
  910. .flags = AVFMT_NOFILE,
  911. };