You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

980 lines
32KB

  1. /*
  2. * "Real" compatible demuxer.
  3. * Copyright (c) 2000, 2001 Fabrice Bellard
  4. *
  5. * This file is part of Libav.
  6. *
  7. * Libav is free software; you can redistribute it and/or
  8. * modify it under the terms of the GNU Lesser General Public
  9. * License as published by the Free Software Foundation; either
  10. * version 2.1 of the License, or (at your option) any later version.
  11. *
  12. * Libav is distributed in the hope that it will be useful,
  13. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  15. * Lesser General Public License for more details.
  16. *
  17. * You should have received a copy of the GNU Lesser General Public
  18. * License along with Libav; if not, write to the Free Software
  19. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  20. */
  21. #include <inttypes.h>
  22. #include "libavutil/avstring.h"
  23. #include "libavutil/channel_layout.h"
  24. #include "libavutil/internal.h"
  25. #include "libavutil/intreadwrite.h"
  26. #include "libavutil/dict.h"
  27. #include "avformat.h"
  28. #include "internal.h"
  29. #include "rmsipr.h"
  30. #include "rm.h"
  /* Audio deinterleaver identifiers; RMStream.deint_id is compared against these tags. */
  #define DEINT_ID_GENR   MKTAG('g', 'e', 'n', 'r')   ///< interleaving for Cooker/ATRAC
  #define DEINT_ID_INT0   MKTAG('I', 'n', 't', '0')   ///< no interleaving needed
  #define DEINT_ID_INT4   MKTAG('I', 'n', 't', '4')   ///< interleaving for 28.8
  #define DEINT_ID_SIPR   MKTAG('s', 'i', 'p', 'r')   ///< interleaving for Sipro
  #define DEINT_ID_VBRF   MKTAG('v', 'b', 'r', 'f')   ///< VBR case for AAC
  #define DEINT_ID_VBRS   MKTAG('v', 'b', 'r', 's')   ///< VBR case for AAC
  37. struct RMStream {
  38. AVPacket pkt; ///< place to store merged video frame / reordered audio data
  39. int videobufsize; ///< current assembled frame size
  40. int videobufpos; ///< position for the next slice in the video buffer
  41. int curpic_num; ///< picture number of current frame
  42. int cur_slice, slices;
  43. int64_t pktpos; ///< first slice position in file
  44. /// Audio descrambling matrix parameters
  45. int64_t audiotimestamp; ///< Audio packet timestamp
  46. int sub_packet_cnt; // Subpacket counter, used while reading
  47. int sub_packet_size, sub_packet_h, coded_framesize; ///< Descrambling parameters from container
  48. int audio_framesize; /// Audio frame size from container
  49. int sub_packet_lengths[16]; /// Length of each subpacket
  50. int32_t deint_id; ///< deinterleaver used in audio stream
  51. };
  /** Demuxer-wide state shared by all streams of one RealMedia input. */
  typedef struct RMDemuxContext {
      int nb_packets;        ///< packet count read from the DATA chunk header
      int old_format;        ///< set to 1 when the input is a legacy ".ra" file
      int current_stream;    ///< id of the stream whose packet is partially consumed
      int remaining_len;     ///< bytes still unread in the current container packet
      int audio_stream_num;  ///< Stream number for audio packets
      int audio_pkt_cnt;     ///< Output packet counter
  } RMDemuxContext;
  60. static inline void get_strl(AVIOContext *pb, char *buf, int buf_size, int len)
  61. {
  62. int i;
  63. char *q, r;
  64. q = buf;
  65. for(i=0;i<len;i++) {
  66. r = avio_r8(pb);
  67. if (i < buf_size - 1)
  68. *q++ = r;
  69. }
  70. if (buf_size > 0) *q = '\0';
  71. }
  72. static void get_str8(AVIOContext *pb, char *buf, int buf_size)
  73. {
  74. get_strl(pb, buf, buf_size, avio_r8(pb));
  75. }
  76. static int rm_read_extradata(AVIOContext *pb, AVCodecContext *avctx, unsigned size)
  77. {
  78. if (size >= 1<<24)
  79. return -1;
  80. avctx->extradata = av_mallocz(size + FF_INPUT_BUFFER_PADDING_SIZE);
  81. if (!avctx->extradata)
  82. return AVERROR(ENOMEM);
  83. avctx->extradata_size = avio_read(pb, avctx->extradata, size);
  84. if (avctx->extradata_size != size)
  85. return AVERROR(EIO);
  86. return 0;
  87. }
  88. static void rm_read_metadata(AVFormatContext *s, AVIOContext *pb, int wide)
  89. {
  90. char buf[1024];
  91. int i;
  92. for (i=0; i<FF_ARRAY_ELEMS(ff_rm_metadata); i++) {
  93. int len = wide ? avio_rb16(pb) : avio_r8(pb);
  94. get_strl(pb, buf, sizeof(buf), len);
  95. av_dict_set(&s->metadata, ff_rm_metadata[i], buf, 0);
  96. }
  97. }
  98. RMStream *ff_rm_alloc_rmstream (void)
  99. {
  100. RMStream *rms = av_mallocz(sizeof(RMStream));
  101. if (!rms)
  102. return NULL;
  103. rms->curpic_num = -1;
  104. return rms;
  105. }
  106. void ff_rm_free_rmstream (RMStream *rms)
  107. {
  108. av_free_packet(&rms->pkt);
  109. }
  110. static int rm_read_audio_stream_info(AVFormatContext *s, AVIOContext *pb,
  111. AVStream *st, RMStream *ast, int read_all)
  112. {
  113. char buf[256];
  114. uint32_t version;
  115. int ret;
  116. /* ra type header */
  117. version = avio_rb16(pb); /* version */
  118. if (version == 3) {
  119. int header_size = avio_rb16(pb);
  120. int64_t startpos = avio_tell(pb);
  121. avio_skip(pb, 14);
  122. rm_read_metadata(s, pb, 0);
  123. if ((startpos + header_size) >= avio_tell(pb) + 2) {
  124. // fourcc (should always be "lpcJ")
  125. avio_r8(pb);
  126. get_str8(pb, buf, sizeof(buf));
  127. }
  128. // Skip extra header crap (this should never happen)
  129. if ((startpos + header_size) > avio_tell(pb))
  130. avio_skip(pb, header_size + startpos - avio_tell(pb));
  131. st->codec->sample_rate = 8000;
  132. st->codec->channels = 1;
  133. st->codec->channel_layout = AV_CH_LAYOUT_MONO;
  134. st->codec->codec_type = AVMEDIA_TYPE_AUDIO;
  135. st->codec->codec_id = AV_CODEC_ID_RA_144;
  136. ast->deint_id = DEINT_ID_INT0;
  137. } else {
  138. int flavor, sub_packet_h, coded_framesize, sub_packet_size;
  139. int codecdata_length;
  140. /* old version (4) */
  141. avio_skip(pb, 2); /* unused */
  142. avio_rb32(pb); /* .ra4 */
  143. avio_rb32(pb); /* data size */
  144. avio_rb16(pb); /* version2 */
  145. avio_rb32(pb); /* header size */
  146. flavor= avio_rb16(pb); /* add codec info / flavor */
  147. ast->coded_framesize = coded_framesize = avio_rb32(pb); /* coded frame size */
  148. avio_rb32(pb); /* ??? */
  149. avio_rb32(pb); /* ??? */
  150. avio_rb32(pb); /* ??? */
  151. ast->sub_packet_h = sub_packet_h = avio_rb16(pb); /* 1 */
  152. st->codec->block_align= avio_rb16(pb); /* frame size */
  153. ast->sub_packet_size = sub_packet_size = avio_rb16(pb); /* sub packet size */
  154. avio_rb16(pb); /* ??? */
  155. if (version == 5) {
  156. avio_rb16(pb); avio_rb16(pb); avio_rb16(pb);
  157. }
  158. st->codec->sample_rate = avio_rb16(pb);
  159. avio_rb32(pb);
  160. st->codec->channels = avio_rb16(pb);
  161. if (version == 5) {
  162. ast->deint_id = avio_rl32(pb);
  163. avio_read(pb, buf, 4);
  164. buf[4] = 0;
  165. } else {
  166. get_str8(pb, buf, sizeof(buf)); /* desc */
  167. ast->deint_id = AV_RL32(buf);
  168. get_str8(pb, buf, sizeof(buf)); /* desc */
  169. }
  170. st->codec->codec_type = AVMEDIA_TYPE_AUDIO;
  171. st->codec->codec_tag = AV_RL32(buf);
  172. st->codec->codec_id = ff_codec_get_id(ff_rm_codec_tags,
  173. st->codec->codec_tag);
  174. switch (st->codec->codec_id) {
  175. case AV_CODEC_ID_AC3:
  176. st->need_parsing = AVSTREAM_PARSE_FULL;
  177. break;
  178. case AV_CODEC_ID_RA_288:
  179. st->codec->extradata_size= 0;
  180. ast->audio_framesize = st->codec->block_align;
  181. st->codec->block_align = coded_framesize;
  182. break;
  183. case AV_CODEC_ID_COOK:
  184. st->need_parsing = AVSTREAM_PARSE_HEADERS;
  185. case AV_CODEC_ID_ATRAC3:
  186. case AV_CODEC_ID_SIPR:
  187. avio_rb16(pb); avio_r8(pb);
  188. if (version == 5)
  189. avio_r8(pb);
  190. codecdata_length = avio_rb32(pb);
  191. if(codecdata_length + FF_INPUT_BUFFER_PADDING_SIZE <= (unsigned)codecdata_length){
  192. av_log(s, AV_LOG_ERROR, "codecdata_length too large\n");
  193. return -1;
  194. }
  195. ast->audio_framesize = st->codec->block_align;
  196. if (st->codec->codec_id == AV_CODEC_ID_SIPR) {
  197. if (flavor > 3) {
  198. av_log(s, AV_LOG_ERROR, "bad SIPR file flavor %d\n",
  199. flavor);
  200. return -1;
  201. }
  202. st->codec->block_align = ff_sipr_subpk_size[flavor];
  203. } else {
  204. if(sub_packet_size <= 0){
  205. av_log(s, AV_LOG_ERROR, "sub_packet_size is invalid\n");
  206. return -1;
  207. }
  208. st->codec->block_align = ast->sub_packet_size;
  209. }
  210. if ((ret = rm_read_extradata(pb, st->codec, codecdata_length)) < 0)
  211. return ret;
  212. break;
  213. case AV_CODEC_ID_AAC:
  214. avio_rb16(pb); avio_r8(pb);
  215. if (version == 5)
  216. avio_r8(pb);
  217. codecdata_length = avio_rb32(pb);
  218. if(codecdata_length + FF_INPUT_BUFFER_PADDING_SIZE <= (unsigned)codecdata_length){
  219. av_log(s, AV_LOG_ERROR, "codecdata_length too large\n");
  220. return -1;
  221. }
  222. if (codecdata_length >= 1) {
  223. avio_r8(pb);
  224. if ((ret = rm_read_extradata(pb, st->codec, codecdata_length - 1)) < 0)
  225. return ret;
  226. }
  227. break;
  228. }
  229. if (ast->deint_id == DEINT_ID_INT4 ||
  230. ast->deint_id == DEINT_ID_GENR ||
  231. ast->deint_id == DEINT_ID_SIPR) {
  232. if (st->codec->block_align <= 0 ||
  233. ast->audio_framesize * sub_packet_h > (unsigned)INT_MAX ||
  234. ast->audio_framesize * sub_packet_h < st->codec->block_align)
  235. return AVERROR_INVALIDDATA;
  236. if (av_new_packet(&ast->pkt, ast->audio_framesize * sub_packet_h) < 0)
  237. return AVERROR(ENOMEM);
  238. }
  239. switch (ast->deint_id) {
  240. case DEINT_ID_INT4:
  241. if (ast->coded_framesize > ast->audio_framesize ||
  242. sub_packet_h <= 1 ||
  243. ast->coded_framesize * sub_packet_h > (2 + (sub_packet_h & 1)) * ast->audio_framesize)
  244. return AVERROR_INVALIDDATA;
  245. break;
  246. case DEINT_ID_GENR:
  247. if (ast->sub_packet_size <= 0 ||
  248. ast->sub_packet_size > ast->audio_framesize)
  249. return AVERROR_INVALIDDATA;
  250. break;
  251. case DEINT_ID_SIPR:
  252. case DEINT_ID_INT0:
  253. case DEINT_ID_VBRS:
  254. case DEINT_ID_VBRF:
  255. break;
  256. default:
  257. av_log(NULL, 0 ,"Unknown interleaver %"PRIX32"\n", ast->deint_id);
  258. return AVERROR_INVALIDDATA;
  259. }
  260. if (read_all) {
  261. avio_r8(pb);
  262. avio_r8(pb);
  263. avio_r8(pb);
  264. rm_read_metadata(s, pb, 0);
  265. }
  266. }
  267. return 0;
  268. }
  269. int ff_rm_read_mdpr_codecdata(AVFormatContext *s, AVIOContext *pb,
  270. AVStream *st, RMStream *rst,
  271. unsigned int codec_data_size)
  272. {
  273. unsigned int v;
  274. int size;
  275. int64_t codec_pos;
  276. int ret;
  277. avpriv_set_pts_info(st, 64, 1, 1000);
  278. codec_pos = avio_tell(pb);
  279. v = avio_rb32(pb);
  280. if (v == MKTAG(0xfd, 'a', 'r', '.')) {
  281. /* ra type header */
  282. if (rm_read_audio_stream_info(s, pb, st, rst, 0))
  283. return -1;
  284. } else if (v == MKBETAG('L', 'S', 'D', ':')) {
  285. avio_seek(pb, -4, SEEK_CUR);
  286. if ((ret = rm_read_extradata(pb, st->codec, codec_data_size)) < 0)
  287. return ret;
  288. st->codec->codec_type = AVMEDIA_TYPE_AUDIO;
  289. st->codec->codec_tag = AV_RL32(st->codec->extradata);
  290. st->codec->codec_id = ff_codec_get_id(ff_rm_codec_tags,
  291. st->codec->codec_tag);
  292. } else {
  293. int fps;
  294. if (avio_rl32(pb) != MKTAG('V', 'I', 'D', 'O')) {
  295. fail1:
  296. av_log(st->codec, AV_LOG_ERROR, "Unsupported video codec\n");
  297. goto skip;
  298. }
  299. st->codec->codec_tag = avio_rl32(pb);
  300. st->codec->codec_id = ff_codec_get_id(ff_rm_codec_tags,
  301. st->codec->codec_tag);
  302. av_dlog(s, "%X %X\n", st->codec->codec_tag, MKTAG('R', 'V', '2', '0'));
  303. if (st->codec->codec_id == AV_CODEC_ID_NONE)
  304. goto fail1;
  305. st->codec->width = avio_rb16(pb);
  306. st->codec->height = avio_rb16(pb);
  307. avio_skip(pb, 2); // looks like bits per sample
  308. avio_skip(pb, 4); // always zero?
  309. st->codec->codec_type = AVMEDIA_TYPE_VIDEO;
  310. st->need_parsing = AVSTREAM_PARSE_TIMESTAMPS;
  311. fps = avio_rb32(pb);
  312. if ((ret = rm_read_extradata(pb, st->codec, codec_data_size - (avio_tell(pb) - codec_pos))) < 0)
  313. return ret;
  314. if (fps > 0) {
  315. av_reduce(&st->avg_frame_rate.den, &st->avg_frame_rate.num,
  316. 0x10000, fps, (1 << 30) - 1);
  317. } else if (s->error_recognition & AV_EF_EXPLODE) {
  318. av_log(s, AV_LOG_ERROR, "Invalid framerate\n");
  319. return AVERROR_INVALIDDATA;
  320. }
  321. }
  322. skip:
  323. /* skip codec info */
  324. size = avio_tell(pb) - codec_pos;
  325. avio_skip(pb, codec_data_size - size);
  326. return 0;
  327. }
  328. /** this function assumes that the demuxer has already seeked to the start
  329. * of the INDX chunk, and will bail out if not. */
  330. static int rm_read_index(AVFormatContext *s)
  331. {
  332. AVIOContext *pb = s->pb;
  333. unsigned int size, n_pkts, str_id, next_off, n, pos, pts;
  334. AVStream *st;
  335. do {
  336. if (avio_rl32(pb) != MKTAG('I','N','D','X'))
  337. return -1;
  338. size = avio_rb32(pb);
  339. if (size < 20)
  340. return -1;
  341. avio_skip(pb, 2);
  342. n_pkts = avio_rb32(pb);
  343. str_id = avio_rb16(pb);
  344. next_off = avio_rb32(pb);
  345. for (n = 0; n < s->nb_streams; n++)
  346. if (s->streams[n]->id == str_id) {
  347. st = s->streams[n];
  348. break;
  349. }
  350. if (n == s->nb_streams) {
  351. av_log(s, AV_LOG_ERROR,
  352. "Invalid stream index %d for index at pos %"PRId64"\n",
  353. str_id, avio_tell(pb));
  354. goto skip;
  355. } else if ((avio_size(pb) - avio_tell(pb)) / 14 < n_pkts) {
  356. av_log(s, AV_LOG_ERROR,
  357. "Nr. of packets in packet index for stream index %d "
  358. "exceeds filesize (%"PRId64" at %"PRId64" = %"PRId64")\n",
  359. str_id, avio_size(pb), avio_tell(pb),
  360. (avio_size(pb) - avio_tell(pb)) / 14);
  361. goto skip;
  362. }
  363. for (n = 0; n < n_pkts; n++) {
  364. avio_skip(pb, 2);
  365. pts = avio_rb32(pb);
  366. pos = avio_rb32(pb);
  367. avio_skip(pb, 4); /* packet no. */
  368. av_add_index_entry(st, pos, pts, 0, 0, AVINDEX_KEYFRAME);
  369. }
  370. skip:
  371. if (next_off && avio_tell(pb) < next_off &&
  372. avio_seek(pb, next_off, SEEK_SET) < 0) {
  373. av_log(s, AV_LOG_ERROR,
  374. "Non-linear index detected, not supported\n");
  375. return -1;
  376. }
  377. } while (next_off);
  378. return 0;
  379. }
  380. static int rm_read_header_old(AVFormatContext *s)
  381. {
  382. RMDemuxContext *rm = s->priv_data;
  383. AVStream *st;
  384. rm->old_format = 1;
  385. st = avformat_new_stream(s, NULL);
  386. if (!st)
  387. return -1;
  388. st->priv_data = ff_rm_alloc_rmstream();
  389. if (!st->priv_data)
  390. return AVERROR(ENOMEM);
  391. return rm_read_audio_stream_info(s, s->pb, st, st->priv_data, 1);
  392. }
  393. static int rm_read_header(AVFormatContext *s)
  394. {
  395. RMDemuxContext *rm = s->priv_data;
  396. AVStream *st;
  397. AVIOContext *pb = s->pb;
  398. unsigned int tag;
  399. int tag_size;
  400. unsigned int start_time, duration;
  401. unsigned int data_off = 0, indx_off = 0;
  402. char buf[128];
  403. int flags = 0;
  404. tag = avio_rl32(pb);
  405. if (tag == MKTAG('.', 'r', 'a', 0xfd)) {
  406. /* very old .ra format */
  407. return rm_read_header_old(s);
  408. } else if (tag != MKTAG('.', 'R', 'M', 'F')) {
  409. return AVERROR(EIO);
  410. }
  411. tag_size = avio_rb32(pb);
  412. avio_skip(pb, tag_size - 8);
  413. for(;;) {
  414. if (pb->eof_reached)
  415. return -1;
  416. tag = avio_rl32(pb);
  417. tag_size = avio_rb32(pb);
  418. avio_rb16(pb);
  419. av_dlog(s, "tag=%c%c%c%c (%08x) size=%d\n",
  420. (tag ) & 0xff,
  421. (tag >> 8) & 0xff,
  422. (tag >> 16) & 0xff,
  423. (tag >> 24) & 0xff,
  424. tag,
  425. tag_size);
  426. if (tag_size < 10 && tag != MKTAG('D', 'A', 'T', 'A'))
  427. return -1;
  428. switch(tag) {
  429. case MKTAG('P', 'R', 'O', 'P'):
  430. /* file header */
  431. avio_rb32(pb); /* max bit rate */
  432. avio_rb32(pb); /* avg bit rate */
  433. avio_rb32(pb); /* max packet size */
  434. avio_rb32(pb); /* avg packet size */
  435. avio_rb32(pb); /* nb packets */
  436. avio_rb32(pb); /* duration */
  437. avio_rb32(pb); /* preroll */
  438. indx_off = avio_rb32(pb); /* index offset */
  439. data_off = avio_rb32(pb); /* data offset */
  440. avio_rb16(pb); /* nb streams */
  441. flags = avio_rb16(pb); /* flags */
  442. break;
  443. case MKTAG('C', 'O', 'N', 'T'):
  444. rm_read_metadata(s, pb, 1);
  445. break;
  446. case MKTAG('M', 'D', 'P', 'R'):
  447. st = avformat_new_stream(s, NULL);
  448. if (!st)
  449. return AVERROR(ENOMEM);
  450. st->id = avio_rb16(pb);
  451. avio_rb32(pb); /* max bit rate */
  452. st->codec->bit_rate = avio_rb32(pb); /* bit rate */
  453. avio_rb32(pb); /* max packet size */
  454. avio_rb32(pb); /* avg packet size */
  455. start_time = avio_rb32(pb); /* start time */
  456. avio_rb32(pb); /* preroll */
  457. duration = avio_rb32(pb); /* duration */
  458. st->start_time = start_time;
  459. st->duration = duration;
  460. get_str8(pb, buf, sizeof(buf)); /* desc */
  461. get_str8(pb, buf, sizeof(buf)); /* mimetype */
  462. st->codec->codec_type = AVMEDIA_TYPE_DATA;
  463. st->priv_data = ff_rm_alloc_rmstream();
  464. if (!st->priv_data)
  465. return AVERROR(ENOMEM);
  466. if (ff_rm_read_mdpr_codecdata(s, s->pb, st, st->priv_data,
  467. avio_rb32(pb)) < 0)
  468. return -1;
  469. break;
  470. case MKTAG('D', 'A', 'T', 'A'):
  471. goto header_end;
  472. default:
  473. /* unknown tag: skip it */
  474. avio_skip(pb, tag_size - 10);
  475. break;
  476. }
  477. }
  478. header_end:
  479. rm->nb_packets = avio_rb32(pb); /* number of packets */
  480. if (!rm->nb_packets && (flags & 4))
  481. rm->nb_packets = 3600 * 25;
  482. avio_rb32(pb); /* next data header */
  483. if (!data_off)
  484. data_off = avio_tell(pb) - 18;
  485. if (indx_off && pb->seekable && !(s->flags & AVFMT_FLAG_IGNIDX) &&
  486. avio_seek(pb, indx_off, SEEK_SET) >= 0) {
  487. rm_read_index(s);
  488. avio_seek(pb, data_off + 18, SEEK_SET);
  489. }
  490. return 0;
  491. }
  492. static int get_num(AVIOContext *pb, int *len)
  493. {
  494. int n, n1;
  495. n = avio_rb16(pb);
  496. (*len)-=2;
  497. n &= 0x7FFF;
  498. if (n >= 0x4000) {
  499. return n - 0x4000;
  500. } else {
  501. n1 = avio_rb16(pb);
  502. (*len)-=2;
  503. return (n << 16) | n1;
  504. }
  505. }
  /* Packet size used for old-format files when no audio frame size is known;
   * kept a multiple of 20 bytes for ra144 (ugly). */
  #define RAW_PACKET_SIZE 1000
  508. static int sync(AVFormatContext *s, int64_t *timestamp, int *flags, int *stream_index, int64_t *pos){
  509. RMDemuxContext *rm = s->priv_data;
  510. AVIOContext *pb = s->pb;
  511. AVStream *st;
  512. uint32_t state=0xFFFFFFFF;
  513. while(!pb->eof_reached){
  514. int len, num, i;
  515. *pos= avio_tell(pb) - 3;
  516. if(rm->remaining_len > 0){
  517. num= rm->current_stream;
  518. len= rm->remaining_len;
  519. *timestamp = AV_NOPTS_VALUE;
  520. *flags= 0;
  521. }else{
  522. state= (state<<8) + avio_r8(pb);
  523. if(state == MKBETAG('I', 'N', 'D', 'X')){
  524. int n_pkts, expected_len;
  525. len = avio_rb32(pb);
  526. avio_skip(pb, 2);
  527. n_pkts = avio_rb32(pb);
  528. expected_len = 20 + n_pkts * 14;
  529. if (len == 20)
  530. /* some files don't add index entries to chunk size... */
  531. len = expected_len;
  532. else if (len != expected_len)
  533. av_log(s, AV_LOG_WARNING,
  534. "Index size %d (%d pkts) is wrong, should be %d.\n",
  535. len, n_pkts, expected_len);
  536. len -= 14; // we already read part of the index header
  537. if(len<0)
  538. continue;
  539. goto skip;
  540. } else if (state == MKBETAG('D','A','T','A')) {
  541. av_log(s, AV_LOG_WARNING,
  542. "DATA tag in middle of chunk, file may be broken.\n");
  543. }
  544. if(state > (unsigned)0xFFFF || state <= 12)
  545. continue;
  546. len=state - 12;
  547. state= 0xFFFFFFFF;
  548. num = avio_rb16(pb);
  549. *timestamp = avio_rb32(pb);
  550. avio_r8(pb); /* reserved */
  551. *flags = avio_r8(pb); /* flags */
  552. }
  553. for(i=0;i<s->nb_streams;i++) {
  554. st = s->streams[i];
  555. if (num == st->id)
  556. break;
  557. }
  558. if (i == s->nb_streams) {
  559. skip:
  560. /* skip packet if unknown number */
  561. avio_skip(pb, len);
  562. rm->remaining_len = 0;
  563. continue;
  564. }
  565. *stream_index= i;
  566. return len;
  567. }
  568. return -1;
  569. }
  570. static int rm_assemble_video_frame(AVFormatContext *s, AVIOContext *pb,
  571. RMDemuxContext *rm, RMStream *vst,
  572. AVPacket *pkt, int len, int *pseq,
  573. int64_t *timestamp)
  574. {
  575. int hdr, seq, pic_num, len2, pos;
  576. int type;
  577. hdr = avio_r8(pb); len--;
  578. type = hdr >> 6;
  579. if(type != 3){ // not frame as a part of packet
  580. seq = avio_r8(pb); len--;
  581. }
  582. if(type != 1){ // not whole frame
  583. len2 = get_num(pb, &len);
  584. pos = get_num(pb, &len);
  585. pic_num = avio_r8(pb); len--;
  586. }
  587. if(len<0)
  588. return -1;
  589. rm->remaining_len = len;
  590. if(type&1){ // frame, not slice
  591. if(type == 3){ // frame as a part of packet
  592. len= len2;
  593. *timestamp = pos;
  594. }
  595. if(rm->remaining_len < len)
  596. return -1;
  597. rm->remaining_len -= len;
  598. if(av_new_packet(pkt, len + 9) < 0)
  599. return AVERROR(EIO);
  600. pkt->data[0] = 0;
  601. AV_WL32(pkt->data + 1, 1);
  602. AV_WL32(pkt->data + 5, 0);
  603. avio_read(pb, pkt->data + 9, len);
  604. return 0;
  605. }
  606. //now we have to deal with single slice
  607. *pseq = seq;
  608. if((seq & 0x7F) == 1 || vst->curpic_num != pic_num){
  609. vst->slices = ((hdr & 0x3F) << 1) + 1;
  610. vst->videobufsize = len2 + 8*vst->slices + 1;
  611. av_free_packet(&vst->pkt); //FIXME this should be output.
  612. if(av_new_packet(&vst->pkt, vst->videobufsize) < 0)
  613. return AVERROR(ENOMEM);
  614. vst->videobufpos = 8*vst->slices + 1;
  615. vst->cur_slice = 0;
  616. vst->curpic_num = pic_num;
  617. vst->pktpos = avio_tell(pb);
  618. }
  619. if(type == 2)
  620. len = FFMIN(len, pos);
  621. if(++vst->cur_slice > vst->slices)
  622. return 1;
  623. AV_WL32(vst->pkt.data - 7 + 8*vst->cur_slice, 1);
  624. AV_WL32(vst->pkt.data - 3 + 8*vst->cur_slice, vst->videobufpos - 8*vst->slices - 1);
  625. if(vst->videobufpos + len > vst->videobufsize)
  626. return 1;
  627. if (avio_read(pb, vst->pkt.data + vst->videobufpos, len) != len)
  628. return AVERROR(EIO);
  629. vst->videobufpos += len;
  630. rm->remaining_len-= len;
  631. if (type == 2 || vst->videobufpos == vst->videobufsize) {
  632. vst->pkt.data[0] = vst->cur_slice-1;
  633. *pkt= vst->pkt;
  634. vst->pkt.data= NULL;
  635. vst->pkt.size= 0;
  636. vst->pkt.buf = NULL;
  637. #if FF_API_DESTRUCT_PACKET
  638. FF_DISABLE_DEPRECATION_WARNINGS
  639. vst->pkt.destruct = NULL;
  640. FF_ENABLE_DEPRECATION_WARNINGS
  641. #endif
  642. if(vst->slices != vst->cur_slice) //FIXME find out how to set slices correct from the begin
  643. memmove(pkt->data + 1 + 8*vst->cur_slice, pkt->data + 1 + 8*vst->slices,
  644. vst->videobufpos - 1 - 8*vst->slices);
  645. pkt->size = vst->videobufpos + 8*(vst->cur_slice - vst->slices);
  646. pkt->pts = AV_NOPTS_VALUE;
  647. pkt->pos = vst->pktpos;
  648. vst->slices = 0;
  649. return 0;
  650. }
  651. return 1;
  652. }
  653. static inline void
  654. rm_ac3_swap_bytes (AVStream *st, AVPacket *pkt)
  655. {
  656. uint8_t *ptr;
  657. int j;
  658. if (st->codec->codec_id == AV_CODEC_ID_AC3) {
  659. ptr = pkt->data;
  660. for (j=0;j<pkt->size;j+=2) {
  661. FFSWAP(int, ptr[0], ptr[1]);
  662. ptr += 2;
  663. }
  664. }
  665. }
  666. int
  667. ff_rm_parse_packet (AVFormatContext *s, AVIOContext *pb,
  668. AVStream *st, RMStream *ast, int len, AVPacket *pkt,
  669. int *seq, int flags, int64_t timestamp)
  670. {
  671. RMDemuxContext *rm = s->priv_data;
  672. if (st->codec->codec_type == AVMEDIA_TYPE_VIDEO) {
  673. rm->current_stream= st->id;
  674. if(rm_assemble_video_frame(s, pb, rm, ast, pkt, len, seq, &timestamp))
  675. return -1; //got partial frame
  676. } else if (st->codec->codec_type == AVMEDIA_TYPE_AUDIO) {
  677. if ((ast->deint_id == DEINT_ID_GENR) ||
  678. (ast->deint_id == DEINT_ID_INT4) ||
  679. (ast->deint_id == DEINT_ID_SIPR)) {
  680. int x;
  681. int sps = ast->sub_packet_size;
  682. int cfs = ast->coded_framesize;
  683. int h = ast->sub_packet_h;
  684. int y = ast->sub_packet_cnt;
  685. int w = ast->audio_framesize;
  686. if (flags & 2)
  687. y = ast->sub_packet_cnt = 0;
  688. if (!y)
  689. ast->audiotimestamp = timestamp;
  690. switch (ast->deint_id) {
  691. case DEINT_ID_INT4:
  692. for (x = 0; x < h/2; x++)
  693. avio_read(pb, ast->pkt.data+x*2*w+y*cfs, cfs);
  694. break;
  695. case DEINT_ID_GENR:
  696. for (x = 0; x < w/sps; x++)
  697. avio_read(pb, ast->pkt.data+sps*(h*x+((h+1)/2)*(y&1)+(y>>1)), sps);
  698. break;
  699. case DEINT_ID_SIPR:
  700. avio_read(pb, ast->pkt.data + y * w, w);
  701. break;
  702. }
  703. if (++(ast->sub_packet_cnt) < h)
  704. return -1;
  705. if (ast->deint_id == DEINT_ID_SIPR)
  706. ff_rm_reorder_sipr_data(ast->pkt.data, h, w);
  707. ast->sub_packet_cnt = 0;
  708. rm->audio_stream_num = st->index;
  709. rm->audio_pkt_cnt = h * w / st->codec->block_align;
  710. } else if ((ast->deint_id == DEINT_ID_VBRF) ||
  711. (ast->deint_id == DEINT_ID_VBRS)) {
  712. int x;
  713. rm->audio_stream_num = st->index;
  714. ast->sub_packet_cnt = (avio_rb16(pb) & 0xf0) >> 4;
  715. if (ast->sub_packet_cnt) {
  716. for (x = 0; x < ast->sub_packet_cnt; x++)
  717. ast->sub_packet_lengths[x] = avio_rb16(pb);
  718. rm->audio_pkt_cnt = ast->sub_packet_cnt;
  719. ast->audiotimestamp = timestamp;
  720. } else
  721. return -1;
  722. } else {
  723. av_get_packet(pb, pkt, len);
  724. rm_ac3_swap_bytes(st, pkt);
  725. }
  726. } else
  727. av_get_packet(pb, pkt, len);
  728. pkt->stream_index = st->index;
  729. #if 0
  730. if (st->codec->codec_type == AVMEDIA_TYPE_VIDEO) {
  731. if(st->codec->codec_id == AV_CODEC_ID_RV20){
  732. int seq= 128*(pkt->data[2]&0x7F) + (pkt->data[3]>>1);
  733. av_log(s, AV_LOG_DEBUG, "%d %"PRId64" %d\n", *timestamp, *timestamp*512LL/25, seq);
  734. seq |= (timestamp&~0x3FFF);
  735. if(seq - timestamp > 0x2000) seq -= 0x4000;
  736. if(seq - timestamp < -0x2000) seq += 0x4000;
  737. }
  738. }
  739. #endif
  740. pkt->pts = timestamp;
  741. if (flags & 2)
  742. pkt->flags |= AV_PKT_FLAG_KEY;
  743. return st->codec->codec_type == AVMEDIA_TYPE_AUDIO ? rm->audio_pkt_cnt : 0;
  744. }
  745. int
  746. ff_rm_retrieve_cache (AVFormatContext *s, AVIOContext *pb,
  747. AVStream *st, RMStream *ast, AVPacket *pkt)
  748. {
  749. RMDemuxContext *rm = s->priv_data;
  750. assert (rm->audio_pkt_cnt > 0);
  751. if (ast->deint_id == DEINT_ID_VBRF ||
  752. ast->deint_id == DEINT_ID_VBRS)
  753. av_get_packet(pb, pkt, ast->sub_packet_lengths[ast->sub_packet_cnt - rm->audio_pkt_cnt]);
  754. else {
  755. int ret = av_new_packet(pkt, st->codec->block_align);
  756. if (ret < 0)
  757. return ret;
  758. memcpy(pkt->data, ast->pkt.data + st->codec->block_align * //FIXME avoid this
  759. (ast->sub_packet_h * ast->audio_framesize / st->codec->block_align - rm->audio_pkt_cnt),
  760. st->codec->block_align);
  761. }
  762. rm->audio_pkt_cnt--;
  763. if ((pkt->pts = ast->audiotimestamp) != AV_NOPTS_VALUE) {
  764. ast->audiotimestamp = AV_NOPTS_VALUE;
  765. pkt->flags = AV_PKT_FLAG_KEY;
  766. } else
  767. pkt->flags = 0;
  768. pkt->stream_index = st->index;
  769. return rm->audio_pkt_cnt;
  770. }
  771. static int rm_read_packet(AVFormatContext *s, AVPacket *pkt)
  772. {
  773. RMDemuxContext *rm = s->priv_data;
  774. AVStream *st;
  775. int i, len, res, seq = 1;
  776. int64_t timestamp, pos;
  777. int flags;
  778. for (;;) {
  779. if (rm->audio_pkt_cnt) {
  780. // If there are queued audio packet return them first
  781. st = s->streams[rm->audio_stream_num];
  782. ff_rm_retrieve_cache(s, s->pb, st, st->priv_data, pkt);
  783. flags = 0;
  784. } else {
  785. if (rm->old_format) {
  786. RMStream *ast;
  787. st = s->streams[0];
  788. ast = st->priv_data;
  789. timestamp = AV_NOPTS_VALUE;
  790. len = !ast->audio_framesize ? RAW_PACKET_SIZE :
  791. ast->coded_framesize * ast->sub_packet_h / 2;
  792. flags = (seq++ == 1) ? 2 : 0;
  793. pos = avio_tell(s->pb);
  794. } else {
  795. len=sync(s, &timestamp, &flags, &i, &pos);
  796. if (len > 0)
  797. st = s->streams[i];
  798. }
  799. if (len <= 0 || s->pb->eof_reached)
  800. return AVERROR(EIO);
  801. res = ff_rm_parse_packet (s, s->pb, st, st->priv_data, len, pkt,
  802. &seq, flags, timestamp);
  803. if((flags&2) && (seq&0x7F) == 1)
  804. av_add_index_entry(st, pos, timestamp, 0, 0, AVINDEX_KEYFRAME);
  805. if (res)
  806. continue;
  807. }
  808. if( (st->discard >= AVDISCARD_NONKEY && !(flags&2))
  809. || st->discard >= AVDISCARD_ALL){
  810. av_free_packet(pkt);
  811. } else
  812. break;
  813. }
  814. return 0;
  815. }
  816. static int rm_read_close(AVFormatContext *s)
  817. {
  818. int i;
  819. for (i=0;i<s->nb_streams;i++)
  820. ff_rm_free_rmstream(s->streams[i]->priv_data);
  821. return 0;
  822. }
  823. static int rm_probe(AVProbeData *p)
  824. {
  825. /* check file header */
  826. if ((p->buf[0] == '.' && p->buf[1] == 'R' &&
  827. p->buf[2] == 'M' && p->buf[3] == 'F' &&
  828. p->buf[4] == 0 && p->buf[5] == 0) ||
  829. (p->buf[0] == '.' && p->buf[1] == 'r' &&
  830. p->buf[2] == 'a' && p->buf[3] == 0xfd))
  831. return AVPROBE_SCORE_MAX;
  832. else
  833. return 0;
  834. }
  835. static int64_t rm_read_dts(AVFormatContext *s, int stream_index,
  836. int64_t *ppos, int64_t pos_limit)
  837. {
  838. RMDemuxContext *rm = s->priv_data;
  839. int64_t pos, dts;
  840. int stream_index2, flags, len, h;
  841. pos = *ppos;
  842. if(rm->old_format)
  843. return AV_NOPTS_VALUE;
  844. avio_seek(s->pb, pos, SEEK_SET);
  845. rm->remaining_len=0;
  846. for(;;){
  847. int seq=1;
  848. AVStream *st;
  849. len=sync(s, &dts, &flags, &stream_index2, &pos);
  850. if(len<0)
  851. return AV_NOPTS_VALUE;
  852. st = s->streams[stream_index2];
  853. if (st->codec->codec_type == AVMEDIA_TYPE_VIDEO) {
  854. h= avio_r8(s->pb); len--;
  855. if(!(h & 0x40)){
  856. seq = avio_r8(s->pb); len--;
  857. }
  858. }
  859. if((flags&2) && (seq&0x7F) == 1){
  860. av_dlog(s, "%d %d-%d %"PRId64" %d\n",
  861. flags, stream_index2, stream_index, dts, seq);
  862. av_add_index_entry(st, pos, dts, 0, 0, AVINDEX_KEYFRAME);
  863. if(stream_index2 == stream_index)
  864. break;
  865. }
  866. avio_skip(s->pb, len);
  867. }
  868. *ppos = pos;
  869. return dts;
  870. }
  871. AVInputFormat ff_rm_demuxer = {
  872. .name = "rm",
  873. .long_name = NULL_IF_CONFIG_SMALL("RealMedia"),
  874. .priv_data_size = sizeof(RMDemuxContext),
  875. .read_probe = rm_probe,
  876. .read_header = rm_read_header,
  877. .read_packet = rm_read_packet,
  878. .read_close = rm_read_close,
  879. .read_timestamp = rm_read_dts,
  880. };
  881. AVInputFormat ff_rdt_demuxer = {
  882. .name = "rdt",
  883. .long_name = NULL_IF_CONFIG_SMALL("RDT demuxer"),
  884. .priv_data_size = sizeof(RMDemuxContext),
  885. .read_close = rm_read_close,
  886. .flags = AVFMT_NOFILE,
  887. };