You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

973 lines
32KB

  1. /*
  2. * "Real" compatible demuxer.
  3. * Copyright (c) 2000, 2001 Fabrice Bellard
  4. *
  5. * This file is part of Libav.
  6. *
  7. * Libav is free software; you can redistribute it and/or
  8. * modify it under the terms of the GNU Lesser General Public
  9. * License as published by the Free Software Foundation; either
  10. * version 2.1 of the License, or (at your option) any later version.
  11. *
  12. * Libav is distributed in the hope that it will be useful,
  13. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  15. * Lesser General Public License for more details.
  16. *
  17. * You should have received a copy of the GNU Lesser General Public
  18. * License along with Libav; if not, write to the Free Software
  19. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  20. */
  21. #include <inttypes.h>
  22. #include "libavutil/avstring.h"
  23. #include "libavutil/channel_layout.h"
  24. #include "libavutil/internal.h"
  25. #include "libavutil/intreadwrite.h"
  26. #include "libavutil/dict.h"
  27. #include "avformat.h"
  28. #include "internal.h"
  29. #include "rmsipr.h"
  30. #include "rm.h"
/*
 * Audio deinterleaver identifiers.
 * Each one is a four-character tag built with MKTAG.
 */
#define DEINT_ID_GENR MKTAG('g', 'e', 'n', 'r') ///< interleaving for Cooker/ATRAC
#define DEINT_ID_INT0 MKTAG('I', 'n', 't', '0') ///< no interleaving needed
#define DEINT_ID_INT4 MKTAG('I', 'n', 't', '4') ///< interleaving for 28.8
#define DEINT_ID_SIPR MKTAG('s', 'i', 'p', 'r') ///< interleaving for Sipro
#define DEINT_ID_VBRF MKTAG('v', 'b', 'r', 'f') ///< VBR case for AAC
#define DEINT_ID_VBRS MKTAG('v', 'b', 'r', 's') ///< VBR case for AAC
  37. struct RMStream {
  38. AVPacket pkt; ///< place to store merged video frame / reordered audio data
  39. int videobufsize; ///< current assembled frame size
  40. int videobufpos; ///< position for the next slice in the video buffer
  41. int curpic_num; ///< picture number of current frame
  42. int cur_slice, slices;
  43. int64_t pktpos; ///< first slice position in file
  44. /// Audio descrambling matrix parameters
  45. int64_t audiotimestamp; ///< Audio packet timestamp
  46. int sub_packet_cnt; // Subpacket counter, used while reading
  47. int sub_packet_size, sub_packet_h, coded_framesize; ///< Descrambling parameters from container
  48. int audio_framesize; /// Audio frame size from container
  49. int sub_packet_lengths[16]; /// Length of each subpacket
  50. int32_t deint_id; ///< deinterleaver used in audio stream
  51. };
  52. typedef struct {
  53. int nb_packets;
  54. int old_format;
  55. int current_stream;
  56. int remaining_len;
  57. int audio_stream_num; ///< Stream number for audio packets
  58. int audio_pkt_cnt; ///< Output packet counter
  59. } RMDemuxContext;
  60. static inline void get_strl(AVIOContext *pb, char *buf, int buf_size, int len)
  61. {
  62. int i;
  63. char *q, r;
  64. q = buf;
  65. for(i=0;i<len;i++) {
  66. r = avio_r8(pb);
  67. if (i < buf_size - 1)
  68. *q++ = r;
  69. }
  70. if (buf_size > 0) *q = '\0';
  71. }
  72. static void get_str8(AVIOContext *pb, char *buf, int buf_size)
  73. {
  74. get_strl(pb, buf, buf_size, avio_r8(pb));
  75. }
  76. static int rm_read_extradata(AVIOContext *pb, AVCodecContext *avctx, unsigned size)
  77. {
  78. if (size >= 1<<24)
  79. return -1;
  80. avctx->extradata = av_malloc(size + FF_INPUT_BUFFER_PADDING_SIZE);
  81. if (!avctx->extradata)
  82. return AVERROR(ENOMEM);
  83. avctx->extradata_size = avio_read(pb, avctx->extradata, size);
  84. memset(avctx->extradata + avctx->extradata_size, 0, FF_INPUT_BUFFER_PADDING_SIZE);
  85. if (avctx->extradata_size != size)
  86. return AVERROR(EIO);
  87. return 0;
  88. }
  89. static void rm_read_metadata(AVFormatContext *s, AVIOContext *pb, int wide)
  90. {
  91. char buf[1024];
  92. int i;
  93. for (i=0; i<FF_ARRAY_ELEMS(ff_rm_metadata); i++) {
  94. int len = wide ? avio_rb16(pb) : avio_r8(pb);
  95. get_strl(pb, buf, sizeof(buf), len);
  96. av_dict_set(&s->metadata, ff_rm_metadata[i], buf, 0);
  97. }
  98. }
  99. RMStream *ff_rm_alloc_rmstream (void)
  100. {
  101. RMStream *rms = av_mallocz(sizeof(RMStream));
  102. rms->curpic_num = -1;
  103. return rms;
  104. }
  105. void ff_rm_free_rmstream (RMStream *rms)
  106. {
  107. av_free_packet(&rms->pkt);
  108. }
  109. static int rm_read_audio_stream_info(AVFormatContext *s, AVIOContext *pb,
  110. AVStream *st, RMStream *ast, int read_all)
  111. {
  112. char buf[256];
  113. uint32_t version;
  114. int ret;
  115. /* ra type header */
  116. version = avio_rb16(pb); /* version */
  117. if (version == 3) {
  118. int header_size = avio_rb16(pb);
  119. int64_t startpos = avio_tell(pb);
  120. avio_skip(pb, 14);
  121. rm_read_metadata(s, pb, 0);
  122. if ((startpos + header_size) >= avio_tell(pb) + 2) {
  123. // fourcc (should always be "lpcJ")
  124. avio_r8(pb);
  125. get_str8(pb, buf, sizeof(buf));
  126. }
  127. // Skip extra header crap (this should never happen)
  128. if ((startpos + header_size) > avio_tell(pb))
  129. avio_skip(pb, header_size + startpos - avio_tell(pb));
  130. st->codec->sample_rate = 8000;
  131. st->codec->channels = 1;
  132. st->codec->channel_layout = AV_CH_LAYOUT_MONO;
  133. st->codec->codec_type = AVMEDIA_TYPE_AUDIO;
  134. st->codec->codec_id = AV_CODEC_ID_RA_144;
  135. ast->deint_id = DEINT_ID_INT0;
  136. } else {
  137. int flavor, sub_packet_h, coded_framesize, sub_packet_size;
  138. int codecdata_length;
  139. /* old version (4) */
  140. avio_skip(pb, 2); /* unused */
  141. avio_rb32(pb); /* .ra4 */
  142. avio_rb32(pb); /* data size */
  143. avio_rb16(pb); /* version2 */
  144. avio_rb32(pb); /* header size */
  145. flavor= avio_rb16(pb); /* add codec info / flavor */
  146. ast->coded_framesize = coded_framesize = avio_rb32(pb); /* coded frame size */
  147. avio_rb32(pb); /* ??? */
  148. avio_rb32(pb); /* ??? */
  149. avio_rb32(pb); /* ??? */
  150. ast->sub_packet_h = sub_packet_h = avio_rb16(pb); /* 1 */
  151. st->codec->block_align= avio_rb16(pb); /* frame size */
  152. ast->sub_packet_size = sub_packet_size = avio_rb16(pb); /* sub packet size */
  153. avio_rb16(pb); /* ??? */
  154. if (version == 5) {
  155. avio_rb16(pb); avio_rb16(pb); avio_rb16(pb);
  156. }
  157. st->codec->sample_rate = avio_rb16(pb);
  158. avio_rb32(pb);
  159. st->codec->channels = avio_rb16(pb);
  160. if (version == 5) {
  161. ast->deint_id = avio_rl32(pb);
  162. avio_read(pb, buf, 4);
  163. buf[4] = 0;
  164. } else {
  165. get_str8(pb, buf, sizeof(buf)); /* desc */
  166. ast->deint_id = AV_RL32(buf);
  167. get_str8(pb, buf, sizeof(buf)); /* desc */
  168. }
  169. st->codec->codec_type = AVMEDIA_TYPE_AUDIO;
  170. st->codec->codec_tag = AV_RL32(buf);
  171. st->codec->codec_id = ff_codec_get_id(ff_rm_codec_tags,
  172. st->codec->codec_tag);
  173. switch (st->codec->codec_id) {
  174. case AV_CODEC_ID_AC3:
  175. st->need_parsing = AVSTREAM_PARSE_FULL;
  176. break;
  177. case AV_CODEC_ID_RA_288:
  178. st->codec->extradata_size= 0;
  179. ast->audio_framesize = st->codec->block_align;
  180. st->codec->block_align = coded_framesize;
  181. break;
  182. case AV_CODEC_ID_COOK:
  183. st->need_parsing = AVSTREAM_PARSE_HEADERS;
  184. case AV_CODEC_ID_ATRAC3:
  185. case AV_CODEC_ID_SIPR:
  186. avio_rb16(pb); avio_r8(pb);
  187. if (version == 5)
  188. avio_r8(pb);
  189. codecdata_length = avio_rb32(pb);
  190. if(codecdata_length + FF_INPUT_BUFFER_PADDING_SIZE <= (unsigned)codecdata_length){
  191. av_log(s, AV_LOG_ERROR, "codecdata_length too large\n");
  192. return -1;
  193. }
  194. ast->audio_framesize = st->codec->block_align;
  195. if (st->codec->codec_id == AV_CODEC_ID_SIPR) {
  196. if (flavor > 3) {
  197. av_log(s, AV_LOG_ERROR, "bad SIPR file flavor %d\n",
  198. flavor);
  199. return -1;
  200. }
  201. st->codec->block_align = ff_sipr_subpk_size[flavor];
  202. } else {
  203. if(sub_packet_size <= 0){
  204. av_log(s, AV_LOG_ERROR, "sub_packet_size is invalid\n");
  205. return -1;
  206. }
  207. st->codec->block_align = ast->sub_packet_size;
  208. }
  209. if ((ret = rm_read_extradata(pb, st->codec, codecdata_length)) < 0)
  210. return ret;
  211. break;
  212. case AV_CODEC_ID_AAC:
  213. avio_rb16(pb); avio_r8(pb);
  214. if (version == 5)
  215. avio_r8(pb);
  216. codecdata_length = avio_rb32(pb);
  217. if(codecdata_length + FF_INPUT_BUFFER_PADDING_SIZE <= (unsigned)codecdata_length){
  218. av_log(s, AV_LOG_ERROR, "codecdata_length too large\n");
  219. return -1;
  220. }
  221. if (codecdata_length >= 1) {
  222. avio_r8(pb);
  223. if ((ret = rm_read_extradata(pb, st->codec, codecdata_length - 1)) < 0)
  224. return ret;
  225. }
  226. break;
  227. }
  228. if (ast->deint_id == DEINT_ID_INT4 ||
  229. ast->deint_id == DEINT_ID_GENR ||
  230. ast->deint_id == DEINT_ID_SIPR) {
  231. if (st->codec->block_align <= 0 ||
  232. ast->audio_framesize * sub_packet_h > (unsigned)INT_MAX ||
  233. ast->audio_framesize * sub_packet_h < st->codec->block_align)
  234. return AVERROR_INVALIDDATA;
  235. if (av_new_packet(&ast->pkt, ast->audio_framesize * sub_packet_h) < 0)
  236. return AVERROR(ENOMEM);
  237. }
  238. switch (ast->deint_id) {
  239. case DEINT_ID_INT4:
  240. if (ast->coded_framesize > ast->audio_framesize ||
  241. sub_packet_h <= 1 ||
  242. ast->coded_framesize * sub_packet_h > (2 + (sub_packet_h & 1)) * ast->audio_framesize)
  243. return AVERROR_INVALIDDATA;
  244. break;
  245. case DEINT_ID_GENR:
  246. if (ast->sub_packet_size <= 0 ||
  247. ast->sub_packet_size > ast->audio_framesize)
  248. return AVERROR_INVALIDDATA;
  249. break;
  250. case DEINT_ID_SIPR:
  251. case DEINT_ID_INT0:
  252. case DEINT_ID_VBRS:
  253. case DEINT_ID_VBRF:
  254. break;
  255. default:
  256. av_log(NULL, 0 ,"Unknown interleaver %"PRIX32"\n", ast->deint_id);
  257. return AVERROR_INVALIDDATA;
  258. }
  259. if (read_all) {
  260. avio_r8(pb);
  261. avio_r8(pb);
  262. avio_r8(pb);
  263. rm_read_metadata(s, pb, 0);
  264. }
  265. }
  266. return 0;
  267. }
  268. int
  269. ff_rm_read_mdpr_codecdata (AVFormatContext *s, AVIOContext *pb,
  270. AVStream *st, RMStream *rst, int codec_data_size)
  271. {
  272. unsigned int v;
  273. int size;
  274. int64_t codec_pos;
  275. int ret;
  276. avpriv_set_pts_info(st, 64, 1, 1000);
  277. codec_pos = avio_tell(pb);
  278. v = avio_rb32(pb);
  279. if (v == MKTAG(0xfd, 'a', 'r', '.')) {
  280. /* ra type header */
  281. if (rm_read_audio_stream_info(s, pb, st, rst, 0))
  282. return -1;
  283. } else if (v == MKBETAG('L', 'S', 'D', ':')) {
  284. avio_seek(pb, -4, SEEK_CUR);
  285. if ((ret = rm_read_extradata(pb, st->codec, codec_data_size)) < 0)
  286. return ret;
  287. st->codec->codec_type = AVMEDIA_TYPE_AUDIO;
  288. st->codec->codec_tag = AV_RL32(st->codec->extradata);
  289. st->codec->codec_id = ff_codec_get_id(ff_rm_codec_tags,
  290. st->codec->codec_tag);
  291. } else {
  292. int fps;
  293. if (avio_rl32(pb) != MKTAG('V', 'I', 'D', 'O')) {
  294. fail1:
  295. av_log(st->codec, AV_LOG_ERROR, "Unsupported video codec\n");
  296. goto skip;
  297. }
  298. st->codec->codec_tag = avio_rl32(pb);
  299. st->codec->codec_id = ff_codec_get_id(ff_rm_codec_tags,
  300. st->codec->codec_tag);
  301. av_dlog(s, "%X %X\n", st->codec->codec_tag, MKTAG('R', 'V', '2', '0'));
  302. if (st->codec->codec_id == AV_CODEC_ID_NONE)
  303. goto fail1;
  304. st->codec->width = avio_rb16(pb);
  305. st->codec->height = avio_rb16(pb);
  306. avio_skip(pb, 2); // looks like bits per sample
  307. avio_skip(pb, 4); // always zero?
  308. st->codec->codec_type = AVMEDIA_TYPE_VIDEO;
  309. st->need_parsing = AVSTREAM_PARSE_TIMESTAMPS;
  310. fps = avio_rb32(pb);
  311. if ((ret = rm_read_extradata(pb, st->codec, codec_data_size - (avio_tell(pb) - codec_pos))) < 0)
  312. return ret;
  313. if (fps > 0) {
  314. av_reduce(&st->avg_frame_rate.den, &st->avg_frame_rate.num,
  315. 0x10000, fps, (1 << 30) - 1);
  316. } else if (s->error_recognition & AV_EF_EXPLODE) {
  317. av_log(s, AV_LOG_ERROR, "Invalid framerate\n");
  318. return AVERROR_INVALIDDATA;
  319. }
  320. }
  321. skip:
  322. /* skip codec info */
  323. size = avio_tell(pb) - codec_pos;
  324. avio_skip(pb, codec_data_size - size);
  325. return 0;
  326. }
  327. /** this function assumes that the demuxer has already seeked to the start
  328. * of the INDX chunk, and will bail out if not. */
  329. static int rm_read_index(AVFormatContext *s)
  330. {
  331. AVIOContext *pb = s->pb;
  332. unsigned int size, n_pkts, str_id, next_off, n, pos, pts;
  333. AVStream *st;
  334. do {
  335. if (avio_rl32(pb) != MKTAG('I','N','D','X'))
  336. return -1;
  337. size = avio_rb32(pb);
  338. if (size < 20)
  339. return -1;
  340. avio_skip(pb, 2);
  341. n_pkts = avio_rb32(pb);
  342. str_id = avio_rb16(pb);
  343. next_off = avio_rb32(pb);
  344. for (n = 0; n < s->nb_streams; n++)
  345. if (s->streams[n]->id == str_id) {
  346. st = s->streams[n];
  347. break;
  348. }
  349. if (n == s->nb_streams) {
  350. av_log(s, AV_LOG_ERROR,
  351. "Invalid stream index %d for index at pos %"PRId64"\n",
  352. str_id, avio_tell(pb));
  353. goto skip;
  354. } else if ((avio_size(pb) - avio_tell(pb)) / 14 < n_pkts) {
  355. av_log(s, AV_LOG_ERROR,
  356. "Nr. of packets in packet index for stream index %d "
  357. "exceeds filesize (%"PRId64" at %"PRId64" = %"PRId64")\n",
  358. str_id, avio_size(pb), avio_tell(pb),
  359. (avio_size(pb) - avio_tell(pb)) / 14);
  360. goto skip;
  361. }
  362. for (n = 0; n < n_pkts; n++) {
  363. avio_skip(pb, 2);
  364. pts = avio_rb32(pb);
  365. pos = avio_rb32(pb);
  366. avio_skip(pb, 4); /* packet no. */
  367. av_add_index_entry(st, pos, pts, 0, 0, AVINDEX_KEYFRAME);
  368. }
  369. skip:
  370. if (next_off && avio_tell(pb) < next_off &&
  371. avio_seek(pb, next_off, SEEK_SET) < 0) {
  372. av_log(s, AV_LOG_ERROR,
  373. "Non-linear index detected, not supported\n");
  374. return -1;
  375. }
  376. } while (next_off);
  377. return 0;
  378. }
  379. static int rm_read_header_old(AVFormatContext *s)
  380. {
  381. RMDemuxContext *rm = s->priv_data;
  382. AVStream *st;
  383. rm->old_format = 1;
  384. st = avformat_new_stream(s, NULL);
  385. if (!st)
  386. return -1;
  387. st->priv_data = ff_rm_alloc_rmstream();
  388. return rm_read_audio_stream_info(s, s->pb, st, st->priv_data, 1);
  389. }
  390. static int rm_read_header(AVFormatContext *s)
  391. {
  392. RMDemuxContext *rm = s->priv_data;
  393. AVStream *st;
  394. AVIOContext *pb = s->pb;
  395. unsigned int tag;
  396. int tag_size;
  397. unsigned int start_time, duration;
  398. unsigned int data_off = 0, indx_off = 0;
  399. char buf[128];
  400. int flags = 0;
  401. tag = avio_rl32(pb);
  402. if (tag == MKTAG('.', 'r', 'a', 0xfd)) {
  403. /* very old .ra format */
  404. return rm_read_header_old(s);
  405. } else if (tag != MKTAG('.', 'R', 'M', 'F')) {
  406. return AVERROR(EIO);
  407. }
  408. tag_size = avio_rb32(pb);
  409. avio_skip(pb, tag_size - 8);
  410. for(;;) {
  411. if (pb->eof_reached)
  412. return -1;
  413. tag = avio_rl32(pb);
  414. tag_size = avio_rb32(pb);
  415. avio_rb16(pb);
  416. av_dlog(s, "tag=%c%c%c%c (%08x) size=%d\n",
  417. (tag ) & 0xff,
  418. (tag >> 8) & 0xff,
  419. (tag >> 16) & 0xff,
  420. (tag >> 24) & 0xff,
  421. tag,
  422. tag_size);
  423. if (tag_size < 10 && tag != MKTAG('D', 'A', 'T', 'A'))
  424. return -1;
  425. switch(tag) {
  426. case MKTAG('P', 'R', 'O', 'P'):
  427. /* file header */
  428. avio_rb32(pb); /* max bit rate */
  429. avio_rb32(pb); /* avg bit rate */
  430. avio_rb32(pb); /* max packet size */
  431. avio_rb32(pb); /* avg packet size */
  432. avio_rb32(pb); /* nb packets */
  433. avio_rb32(pb); /* duration */
  434. avio_rb32(pb); /* preroll */
  435. indx_off = avio_rb32(pb); /* index offset */
  436. data_off = avio_rb32(pb); /* data offset */
  437. avio_rb16(pb); /* nb streams */
  438. flags = avio_rb16(pb); /* flags */
  439. break;
  440. case MKTAG('C', 'O', 'N', 'T'):
  441. rm_read_metadata(s, pb, 1);
  442. break;
  443. case MKTAG('M', 'D', 'P', 'R'):
  444. st = avformat_new_stream(s, NULL);
  445. if (!st)
  446. return AVERROR(ENOMEM);
  447. st->id = avio_rb16(pb);
  448. avio_rb32(pb); /* max bit rate */
  449. st->codec->bit_rate = avio_rb32(pb); /* bit rate */
  450. avio_rb32(pb); /* max packet size */
  451. avio_rb32(pb); /* avg packet size */
  452. start_time = avio_rb32(pb); /* start time */
  453. avio_rb32(pb); /* preroll */
  454. duration = avio_rb32(pb); /* duration */
  455. st->start_time = start_time;
  456. st->duration = duration;
  457. get_str8(pb, buf, sizeof(buf)); /* desc */
  458. get_str8(pb, buf, sizeof(buf)); /* mimetype */
  459. st->codec->codec_type = AVMEDIA_TYPE_DATA;
  460. st->priv_data = ff_rm_alloc_rmstream();
  461. if (ff_rm_read_mdpr_codecdata(s, s->pb, st, st->priv_data,
  462. avio_rb32(pb)) < 0)
  463. return -1;
  464. break;
  465. case MKTAG('D', 'A', 'T', 'A'):
  466. goto header_end;
  467. default:
  468. /* unknown tag: skip it */
  469. avio_skip(pb, tag_size - 10);
  470. break;
  471. }
  472. }
  473. header_end:
  474. rm->nb_packets = avio_rb32(pb); /* number of packets */
  475. if (!rm->nb_packets && (flags & 4))
  476. rm->nb_packets = 3600 * 25;
  477. avio_rb32(pb); /* next data header */
  478. if (!data_off)
  479. data_off = avio_tell(pb) - 18;
  480. if (indx_off && pb->seekable && !(s->flags & AVFMT_FLAG_IGNIDX) &&
  481. avio_seek(pb, indx_off, SEEK_SET) >= 0) {
  482. rm_read_index(s);
  483. avio_seek(pb, data_off + 18, SEEK_SET);
  484. }
  485. return 0;
  486. }
  487. static int get_num(AVIOContext *pb, int *len)
  488. {
  489. int n, n1;
  490. n = avio_rb16(pb);
  491. (*len)-=2;
  492. n &= 0x7FFF;
  493. if (n >= 0x4000) {
  494. return n - 0x4000;
  495. } else {
  496. n1 = avio_rb16(pb);
  497. (*len)-=2;
  498. return (n << 16) | n1;
  499. }
  500. }
/* Packet size used when reading raw old-format audio that announces no
 * frame size; multiple of 20 bytes for ra144 (ugly) */
#define RAW_PACKET_SIZE 1000
  503. static int sync(AVFormatContext *s, int64_t *timestamp, int *flags, int *stream_index, int64_t *pos){
  504. RMDemuxContext *rm = s->priv_data;
  505. AVIOContext *pb = s->pb;
  506. AVStream *st;
  507. uint32_t state=0xFFFFFFFF;
  508. while(!pb->eof_reached){
  509. int len, num, i;
  510. *pos= avio_tell(pb) - 3;
  511. if(rm->remaining_len > 0){
  512. num= rm->current_stream;
  513. len= rm->remaining_len;
  514. *timestamp = AV_NOPTS_VALUE;
  515. *flags= 0;
  516. }else{
  517. state= (state<<8) + avio_r8(pb);
  518. if(state == MKBETAG('I', 'N', 'D', 'X')){
  519. int n_pkts, expected_len;
  520. len = avio_rb32(pb);
  521. avio_skip(pb, 2);
  522. n_pkts = avio_rb32(pb);
  523. expected_len = 20 + n_pkts * 14;
  524. if (len == 20)
  525. /* some files don't add index entries to chunk size... */
  526. len = expected_len;
  527. else if (len != expected_len)
  528. av_log(s, AV_LOG_WARNING,
  529. "Index size %d (%d pkts) is wrong, should be %d.\n",
  530. len, n_pkts, expected_len);
  531. len -= 14; // we already read part of the index header
  532. if(len<0)
  533. continue;
  534. goto skip;
  535. } else if (state == MKBETAG('D','A','T','A')) {
  536. av_log(s, AV_LOG_WARNING,
  537. "DATA tag in middle of chunk, file may be broken.\n");
  538. }
  539. if(state > (unsigned)0xFFFF || state <= 12)
  540. continue;
  541. len=state - 12;
  542. state= 0xFFFFFFFF;
  543. num = avio_rb16(pb);
  544. *timestamp = avio_rb32(pb);
  545. avio_r8(pb); /* reserved */
  546. *flags = avio_r8(pb); /* flags */
  547. }
  548. for(i=0;i<s->nb_streams;i++) {
  549. st = s->streams[i];
  550. if (num == st->id)
  551. break;
  552. }
  553. if (i == s->nb_streams) {
  554. skip:
  555. /* skip packet if unknown number */
  556. avio_skip(pb, len);
  557. rm->remaining_len = 0;
  558. continue;
  559. }
  560. *stream_index= i;
  561. return len;
  562. }
  563. return -1;
  564. }
  565. static int rm_assemble_video_frame(AVFormatContext *s, AVIOContext *pb,
  566. RMDemuxContext *rm, RMStream *vst,
  567. AVPacket *pkt, int len, int *pseq,
  568. int64_t *timestamp)
  569. {
  570. int hdr, seq, pic_num, len2, pos;
  571. int type;
  572. hdr = avio_r8(pb); len--;
  573. type = hdr >> 6;
  574. if(type != 3){ // not frame as a part of packet
  575. seq = avio_r8(pb); len--;
  576. }
  577. if(type != 1){ // not whole frame
  578. len2 = get_num(pb, &len);
  579. pos = get_num(pb, &len);
  580. pic_num = avio_r8(pb); len--;
  581. }
  582. if(len<0)
  583. return -1;
  584. rm->remaining_len = len;
  585. if(type&1){ // frame, not slice
  586. if(type == 3){ // frame as a part of packet
  587. len= len2;
  588. *timestamp = pos;
  589. }
  590. if(rm->remaining_len < len)
  591. return -1;
  592. rm->remaining_len -= len;
  593. if(av_new_packet(pkt, len + 9) < 0)
  594. return AVERROR(EIO);
  595. pkt->data[0] = 0;
  596. AV_WL32(pkt->data + 1, 1);
  597. AV_WL32(pkt->data + 5, 0);
  598. avio_read(pb, pkt->data + 9, len);
  599. return 0;
  600. }
  601. //now we have to deal with single slice
  602. *pseq = seq;
  603. if((seq & 0x7F) == 1 || vst->curpic_num != pic_num){
  604. vst->slices = ((hdr & 0x3F) << 1) + 1;
  605. vst->videobufsize = len2 + 8*vst->slices + 1;
  606. av_free_packet(&vst->pkt); //FIXME this should be output.
  607. if(av_new_packet(&vst->pkt, vst->videobufsize) < 0)
  608. return AVERROR(ENOMEM);
  609. vst->videobufpos = 8*vst->slices + 1;
  610. vst->cur_slice = 0;
  611. vst->curpic_num = pic_num;
  612. vst->pktpos = avio_tell(pb);
  613. }
  614. if(type == 2)
  615. len = FFMIN(len, pos);
  616. if(++vst->cur_slice > vst->slices)
  617. return 1;
  618. AV_WL32(vst->pkt.data - 7 + 8*vst->cur_slice, 1);
  619. AV_WL32(vst->pkt.data - 3 + 8*vst->cur_slice, vst->videobufpos - 8*vst->slices - 1);
  620. if(vst->videobufpos + len > vst->videobufsize)
  621. return 1;
  622. if (avio_read(pb, vst->pkt.data + vst->videobufpos, len) != len)
  623. return AVERROR(EIO);
  624. vst->videobufpos += len;
  625. rm->remaining_len-= len;
  626. if (type == 2 || vst->videobufpos == vst->videobufsize) {
  627. vst->pkt.data[0] = vst->cur_slice-1;
  628. *pkt= vst->pkt;
  629. vst->pkt.data= NULL;
  630. vst->pkt.size= 0;
  631. vst->pkt.buf = NULL;
  632. #if FF_API_DESTRUCT_PACKET
  633. FF_DISABLE_DEPRECATION_WARNINGS
  634. vst->pkt.destruct = NULL;
  635. FF_ENABLE_DEPRECATION_WARNINGS
  636. #endif
  637. if(vst->slices != vst->cur_slice) //FIXME find out how to set slices correct from the begin
  638. memmove(pkt->data + 1 + 8*vst->cur_slice, pkt->data + 1 + 8*vst->slices,
  639. vst->videobufpos - 1 - 8*vst->slices);
  640. pkt->size = vst->videobufpos + 8*(vst->cur_slice - vst->slices);
  641. pkt->pts = AV_NOPTS_VALUE;
  642. pkt->pos = vst->pktpos;
  643. vst->slices = 0;
  644. return 0;
  645. }
  646. return 1;
  647. }
  648. static inline void
  649. rm_ac3_swap_bytes (AVStream *st, AVPacket *pkt)
  650. {
  651. uint8_t *ptr;
  652. int j;
  653. if (st->codec->codec_id == AV_CODEC_ID_AC3) {
  654. ptr = pkt->data;
  655. for (j=0;j<pkt->size;j+=2) {
  656. FFSWAP(int, ptr[0], ptr[1]);
  657. ptr += 2;
  658. }
  659. }
  660. }
  661. int
  662. ff_rm_parse_packet (AVFormatContext *s, AVIOContext *pb,
  663. AVStream *st, RMStream *ast, int len, AVPacket *pkt,
  664. int *seq, int flags, int64_t timestamp)
  665. {
  666. RMDemuxContext *rm = s->priv_data;
  667. if (st->codec->codec_type == AVMEDIA_TYPE_VIDEO) {
  668. rm->current_stream= st->id;
  669. if(rm_assemble_video_frame(s, pb, rm, ast, pkt, len, seq, &timestamp))
  670. return -1; //got partial frame
  671. } else if (st->codec->codec_type == AVMEDIA_TYPE_AUDIO) {
  672. if ((ast->deint_id == DEINT_ID_GENR) ||
  673. (ast->deint_id == DEINT_ID_INT4) ||
  674. (ast->deint_id == DEINT_ID_SIPR)) {
  675. int x;
  676. int sps = ast->sub_packet_size;
  677. int cfs = ast->coded_framesize;
  678. int h = ast->sub_packet_h;
  679. int y = ast->sub_packet_cnt;
  680. int w = ast->audio_framesize;
  681. if (flags & 2)
  682. y = ast->sub_packet_cnt = 0;
  683. if (!y)
  684. ast->audiotimestamp = timestamp;
  685. switch (ast->deint_id) {
  686. case DEINT_ID_INT4:
  687. for (x = 0; x < h/2; x++)
  688. avio_read(pb, ast->pkt.data+x*2*w+y*cfs, cfs);
  689. break;
  690. case DEINT_ID_GENR:
  691. for (x = 0; x < w/sps; x++)
  692. avio_read(pb, ast->pkt.data+sps*(h*x+((h+1)/2)*(y&1)+(y>>1)), sps);
  693. break;
  694. case DEINT_ID_SIPR:
  695. avio_read(pb, ast->pkt.data + y * w, w);
  696. break;
  697. }
  698. if (++(ast->sub_packet_cnt) < h)
  699. return -1;
  700. if (ast->deint_id == DEINT_ID_SIPR)
  701. ff_rm_reorder_sipr_data(ast->pkt.data, h, w);
  702. ast->sub_packet_cnt = 0;
  703. rm->audio_stream_num = st->index;
  704. rm->audio_pkt_cnt = h * w / st->codec->block_align;
  705. } else if ((ast->deint_id == DEINT_ID_VBRF) ||
  706. (ast->deint_id == DEINT_ID_VBRS)) {
  707. int x;
  708. rm->audio_stream_num = st->index;
  709. ast->sub_packet_cnt = (avio_rb16(pb) & 0xf0) >> 4;
  710. if (ast->sub_packet_cnt) {
  711. for (x = 0; x < ast->sub_packet_cnt; x++)
  712. ast->sub_packet_lengths[x] = avio_rb16(pb);
  713. rm->audio_pkt_cnt = ast->sub_packet_cnt;
  714. ast->audiotimestamp = timestamp;
  715. } else
  716. return -1;
  717. } else {
  718. av_get_packet(pb, pkt, len);
  719. rm_ac3_swap_bytes(st, pkt);
  720. }
  721. } else
  722. av_get_packet(pb, pkt, len);
  723. pkt->stream_index = st->index;
  724. #if 0
  725. if (st->codec->codec_type == AVMEDIA_TYPE_VIDEO) {
  726. if(st->codec->codec_id == AV_CODEC_ID_RV20){
  727. int seq= 128*(pkt->data[2]&0x7F) + (pkt->data[3]>>1);
  728. av_log(s, AV_LOG_DEBUG, "%d %"PRId64" %d\n", *timestamp, *timestamp*512LL/25, seq);
  729. seq |= (timestamp&~0x3FFF);
  730. if(seq - timestamp > 0x2000) seq -= 0x4000;
  731. if(seq - timestamp < -0x2000) seq += 0x4000;
  732. }
  733. }
  734. #endif
  735. pkt->pts = timestamp;
  736. if (flags & 2)
  737. pkt->flags |= AV_PKT_FLAG_KEY;
  738. return st->codec->codec_type == AVMEDIA_TYPE_AUDIO ? rm->audio_pkt_cnt : 0;
  739. }
  740. int
  741. ff_rm_retrieve_cache (AVFormatContext *s, AVIOContext *pb,
  742. AVStream *st, RMStream *ast, AVPacket *pkt)
  743. {
  744. RMDemuxContext *rm = s->priv_data;
  745. assert (rm->audio_pkt_cnt > 0);
  746. if (ast->deint_id == DEINT_ID_VBRF ||
  747. ast->deint_id == DEINT_ID_VBRS)
  748. av_get_packet(pb, pkt, ast->sub_packet_lengths[ast->sub_packet_cnt - rm->audio_pkt_cnt]);
  749. else {
  750. av_new_packet(pkt, st->codec->block_align);
  751. memcpy(pkt->data, ast->pkt.data + st->codec->block_align * //FIXME avoid this
  752. (ast->sub_packet_h * ast->audio_framesize / st->codec->block_align - rm->audio_pkt_cnt),
  753. st->codec->block_align);
  754. }
  755. rm->audio_pkt_cnt--;
  756. if ((pkt->pts = ast->audiotimestamp) != AV_NOPTS_VALUE) {
  757. ast->audiotimestamp = AV_NOPTS_VALUE;
  758. pkt->flags = AV_PKT_FLAG_KEY;
  759. } else
  760. pkt->flags = 0;
  761. pkt->stream_index = st->index;
  762. return rm->audio_pkt_cnt;
  763. }
  764. static int rm_read_packet(AVFormatContext *s, AVPacket *pkt)
  765. {
  766. RMDemuxContext *rm = s->priv_data;
  767. AVStream *st;
  768. int i, len, res, seq = 1;
  769. int64_t timestamp, pos;
  770. int flags;
  771. for (;;) {
  772. if (rm->audio_pkt_cnt) {
  773. // If there are queued audio packet return them first
  774. st = s->streams[rm->audio_stream_num];
  775. ff_rm_retrieve_cache(s, s->pb, st, st->priv_data, pkt);
  776. flags = 0;
  777. } else {
  778. if (rm->old_format) {
  779. RMStream *ast;
  780. st = s->streams[0];
  781. ast = st->priv_data;
  782. timestamp = AV_NOPTS_VALUE;
  783. len = !ast->audio_framesize ? RAW_PACKET_SIZE :
  784. ast->coded_framesize * ast->sub_packet_h / 2;
  785. flags = (seq++ == 1) ? 2 : 0;
  786. pos = avio_tell(s->pb);
  787. } else {
  788. len=sync(s, &timestamp, &flags, &i, &pos);
  789. if (len > 0)
  790. st = s->streams[i];
  791. }
  792. if(len<0 || s->pb->eof_reached)
  793. return AVERROR(EIO);
  794. res = ff_rm_parse_packet (s, s->pb, st, st->priv_data, len, pkt,
  795. &seq, flags, timestamp);
  796. if((flags&2) && (seq&0x7F) == 1)
  797. av_add_index_entry(st, pos, timestamp, 0, 0, AVINDEX_KEYFRAME);
  798. if (res)
  799. continue;
  800. }
  801. if( (st->discard >= AVDISCARD_NONKEY && !(flags&2))
  802. || st->discard >= AVDISCARD_ALL){
  803. av_free_packet(pkt);
  804. } else
  805. break;
  806. }
  807. return 0;
  808. }
  809. static int rm_read_close(AVFormatContext *s)
  810. {
  811. int i;
  812. for (i=0;i<s->nb_streams;i++)
  813. ff_rm_free_rmstream(s->streams[i]->priv_data);
  814. return 0;
  815. }
  816. static int rm_probe(AVProbeData *p)
  817. {
  818. /* check file header */
  819. if ((p->buf[0] == '.' && p->buf[1] == 'R' &&
  820. p->buf[2] == 'M' && p->buf[3] == 'F' &&
  821. p->buf[4] == 0 && p->buf[5] == 0) ||
  822. (p->buf[0] == '.' && p->buf[1] == 'r' &&
  823. p->buf[2] == 'a' && p->buf[3] == 0xfd))
  824. return AVPROBE_SCORE_MAX;
  825. else
  826. return 0;
  827. }
  828. static int64_t rm_read_dts(AVFormatContext *s, int stream_index,
  829. int64_t *ppos, int64_t pos_limit)
  830. {
  831. RMDemuxContext *rm = s->priv_data;
  832. int64_t pos, dts;
  833. int stream_index2, flags, len, h;
  834. pos = *ppos;
  835. if(rm->old_format)
  836. return AV_NOPTS_VALUE;
  837. avio_seek(s->pb, pos, SEEK_SET);
  838. rm->remaining_len=0;
  839. for(;;){
  840. int seq=1;
  841. AVStream *st;
  842. len=sync(s, &dts, &flags, &stream_index2, &pos);
  843. if(len<0)
  844. return AV_NOPTS_VALUE;
  845. st = s->streams[stream_index2];
  846. if (st->codec->codec_type == AVMEDIA_TYPE_VIDEO) {
  847. h= avio_r8(s->pb); len--;
  848. if(!(h & 0x40)){
  849. seq = avio_r8(s->pb); len--;
  850. }
  851. }
  852. if((flags&2) && (seq&0x7F) == 1){
  853. av_dlog(s, "%d %d-%d %"PRId64" %d\n",
  854. flags, stream_index2, stream_index, dts, seq);
  855. av_add_index_entry(st, pos, dts, 0, 0, AVINDEX_KEYFRAME);
  856. if(stream_index2 == stream_index)
  857. break;
  858. }
  859. avio_skip(s->pb, len);
  860. }
  861. *ppos = pos;
  862. return dts;
  863. }
  864. AVInputFormat ff_rm_demuxer = {
  865. .name = "rm",
  866. .long_name = NULL_IF_CONFIG_SMALL("RealMedia"),
  867. .priv_data_size = sizeof(RMDemuxContext),
  868. .read_probe = rm_probe,
  869. .read_header = rm_read_header,
  870. .read_packet = rm_read_packet,
  871. .read_close = rm_read_close,
  872. .read_timestamp = rm_read_dts,
  873. };
  874. AVInputFormat ff_rdt_demuxer = {
  875. .name = "rdt",
  876. .long_name = NULL_IF_CONFIG_SMALL("RDT demuxer"),
  877. .priv_data_size = sizeof(RMDemuxContext),
  878. .read_close = rm_read_close,
  879. .flags = AVFMT_NOFILE,
  880. };