You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

1124 lines
37KB

  1. /*
  2. * "Real" compatible demuxer.
  3. * Copyright (c) 2000, 2001 Fabrice Bellard
  4. *
  5. * This file is part of FFmpeg.
  6. *
  7. * FFmpeg is free software; you can redistribute it and/or
  8. * modify it under the terms of the GNU Lesser General Public
  9. * License as published by the Free Software Foundation; either
  10. * version 2.1 of the License, or (at your option) any later version.
  11. *
  12. * FFmpeg is distributed in the hope that it will be useful,
  13. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  15. * Lesser General Public License for more details.
  16. *
  17. * You should have received a copy of the GNU Lesser General Public
  18. * License along with FFmpeg; if not, write to the Free Software
  19. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  20. */
  21. #include <inttypes.h>
  22. #include "libavutil/avassert.h"
  23. #include "libavutil/avstring.h"
  24. #include "libavutil/channel_layout.h"
  25. #include "libavutil/internal.h"
  26. #include "libavutil/intreadwrite.h"
  27. #include "libavutil/dict.h"
  28. #include "avformat.h"
  29. #include "avio_internal.h"
  30. #include "internal.h"
  31. #include "rmsipr.h"
  32. #include "rm.h"
  /*
   * Deinterleaver identifiers. RMStream.deint_id is compared against these
   * four-character tags after being read from the audio stream header.
   */
  #define DEINT_ID_GENR MKTAG('g', 'e', 'n', 'r') ///< interleaving for Cooker/ATRAC
  #define DEINT_ID_INT0 MKTAG('I', 'n', 't', '0') ///< no interleaving needed
  #define DEINT_ID_INT4 MKTAG('I', 'n', 't', '4') ///< interleaving for 28.8
  #define DEINT_ID_SIPR MKTAG('s', 'i', 'p', 'r') ///< interleaving for Sipro
  #define DEINT_ID_VBRF MKTAG('v', 'b', 'r', 'f') ///< VBR case for AAC
  #define DEINT_ID_VBRS MKTAG('v', 'b', 'r', 's') ///< VBR case for AAC
  /**
   * Per-stream demuxer state, allocated with ff_rm_alloc_rmstream().
   * Holds the video frame being reassembled from slices and the buffer and
   * parameters used to de-interleave audio.
   */
  struct RMStream {
      AVPacket pkt; ///< place to store merged video frame / reordered audio data
      int videobufsize; ///< current assembled frame size
      int videobufpos; ///< position for the next slice in the video buffer
      int curpic_num; ///< picture number of current frame
      int cur_slice, slices; ///< slices stored so far / slice count derived from the slice header
      int64_t pktpos; ///< first slice position in file
      /* Audio descrambling matrix parameters */
      int64_t audiotimestamp; ///< Audio packet timestamp
      int sub_packet_cnt; ///< Subpacket counter, used while reading
      int sub_packet_size, sub_packet_h, coded_framesize; ///< Descrambling parameters from container
      int audio_framesize; ///< Audio frame size from container
      int sub_packet_lengths[16]; ///< Length of each subpacket
      int32_t deint_id; ///< deinterleaver used in audio stream
  };
  /** Demuxer-wide private state, stored in AVFormatContext.priv_data. */
  typedef struct RMDemuxContext {
      int nb_packets; ///< packet count read from the DATA chunk header (or a fallback value)
      int old_format; ///< set to 1 by rm_read_header_old() for the old ".ra" layout
      int current_stream; ///< id of the stream the pending remaining_len bytes belong to
      int remaining_len; ///< bytes of the current packet not consumed yet
      int audio_stream_num; ///< Stream number for audio packets
      int audio_pkt_cnt; ///< Output packet counter
  } RMDemuxContext;
  62. static int rm_read_close(AVFormatContext *s);
  63. static inline void get_strl(AVIOContext *pb, char *buf, int buf_size, int len)
  64. {
  65. int i;
  66. char *q, r;
  67. q = buf;
  68. for(i=0;i<len;i++) {
  69. r = avio_r8(pb);
  70. if (i < buf_size - 1)
  71. *q++ = r;
  72. }
  73. if (buf_size > 0) *q = '\0';
  74. }
  75. static void get_str8(AVIOContext *pb, char *buf, int buf_size)
  76. {
  77. get_strl(pb, buf, buf_size, avio_r8(pb));
  78. }
  79. static int rm_read_extradata(AVIOContext *pb, AVCodecContext *avctx, unsigned size)
  80. {
  81. if (size >= 1<<24) {
  82. av_log(avctx, AV_LOG_ERROR, "extradata size %u too large\n", size);
  83. return -1;
  84. }
  85. if (ff_get_extradata(avctx, pb, size) < 0)
  86. return AVERROR(ENOMEM);
  87. return 0;
  88. }
  89. static void rm_read_metadata(AVFormatContext *s, AVIOContext *pb, int wide)
  90. {
  91. char buf[1024];
  92. int i;
  93. for (i=0; i<FF_ARRAY_ELEMS(ff_rm_metadata); i++) {
  94. int len = wide ? avio_rb16(pb) : avio_r8(pb);
  95. get_strl(pb, buf, sizeof(buf), len);
  96. av_dict_set(&s->metadata, ff_rm_metadata[i], buf, 0);
  97. }
  98. }
  99. RMStream *ff_rm_alloc_rmstream (void)
  100. {
  101. RMStream *rms = av_mallocz(sizeof(RMStream));
  102. if (!rms)
  103. return NULL;
  104. rms->curpic_num = -1;
  105. return rms;
  106. }
  107. void ff_rm_free_rmstream (RMStream *rms)
  108. {
  109. av_free_packet(&rms->pkt);
  110. }
  111. static int rm_read_audio_stream_info(AVFormatContext *s, AVIOContext *pb,
  112. AVStream *st, RMStream *ast, int read_all)
  113. {
  114. char buf[256];
  115. uint32_t version;
  116. int ret;
  117. /* ra type header */
  118. version = avio_rb16(pb); /* version */
  119. if (version == 3) {
  120. unsigned bytes_per_minute;
  121. int header_size = avio_rb16(pb);
  122. int64_t startpos = avio_tell(pb);
  123. avio_skip(pb, 8);
  124. bytes_per_minute = avio_rb16(pb);
  125. avio_skip(pb, 4);
  126. rm_read_metadata(s, pb, 0);
  127. if ((startpos + header_size) >= avio_tell(pb) + 2) {
  128. // fourcc (should always be "lpcJ")
  129. avio_r8(pb);
  130. get_str8(pb, buf, sizeof(buf));
  131. }
  132. // Skip extra header crap (this should never happen)
  133. if ((startpos + header_size) > avio_tell(pb))
  134. avio_skip(pb, header_size + startpos - avio_tell(pb));
  135. if (bytes_per_minute)
  136. st->codec->bit_rate = 8LL * bytes_per_minute / 60;
  137. st->codec->sample_rate = 8000;
  138. st->codec->channels = 1;
  139. st->codec->channel_layout = AV_CH_LAYOUT_MONO;
  140. st->codec->codec_type = AVMEDIA_TYPE_AUDIO;
  141. st->codec->codec_id = AV_CODEC_ID_RA_144;
  142. ast->deint_id = DEINT_ID_INT0;
  143. } else {
  144. int flavor, sub_packet_h, coded_framesize, sub_packet_size;
  145. int codecdata_length;
  146. unsigned bytes_per_minute;
  147. /* old version (4) */
  148. avio_skip(pb, 2); /* unused */
  149. avio_rb32(pb); /* .ra4 */
  150. avio_rb32(pb); /* data size */
  151. avio_rb16(pb); /* version2 */
  152. avio_rb32(pb); /* header size */
  153. flavor= avio_rb16(pb); /* add codec info / flavor */
  154. ast->coded_framesize = coded_framesize = avio_rb32(pb); /* coded frame size */
  155. avio_rb32(pb); /* ??? */
  156. bytes_per_minute = avio_rb32(pb);
  157. if (version == 4) {
  158. if (bytes_per_minute)
  159. st->codec->bit_rate = 8LL * bytes_per_minute / 60;
  160. }
  161. avio_rb32(pb); /* ??? */
  162. ast->sub_packet_h = sub_packet_h = avio_rb16(pb); /* 1 */
  163. st->codec->block_align= avio_rb16(pb); /* frame size */
  164. ast->sub_packet_size = sub_packet_size = avio_rb16(pb); /* sub packet size */
  165. avio_rb16(pb); /* ??? */
  166. if (version == 5) {
  167. avio_rb16(pb); avio_rb16(pb); avio_rb16(pb);
  168. }
  169. st->codec->sample_rate = avio_rb16(pb);
  170. avio_rb32(pb);
  171. st->codec->channels = avio_rb16(pb);
  172. if (version == 5) {
  173. ast->deint_id = avio_rl32(pb);
  174. avio_read(pb, buf, 4);
  175. buf[4] = 0;
  176. } else {
  177. AV_WL32(buf, 0);
  178. get_str8(pb, buf, sizeof(buf)); /* desc */
  179. ast->deint_id = AV_RL32(buf);
  180. get_str8(pb, buf, sizeof(buf)); /* desc */
  181. }
  182. st->codec->codec_type = AVMEDIA_TYPE_AUDIO;
  183. st->codec->codec_tag = AV_RL32(buf);
  184. st->codec->codec_id = ff_codec_get_id(ff_rm_codec_tags,
  185. st->codec->codec_tag);
  186. switch (st->codec->codec_id) {
  187. case AV_CODEC_ID_AC3:
  188. st->need_parsing = AVSTREAM_PARSE_FULL;
  189. break;
  190. case AV_CODEC_ID_RA_288:
  191. st->codec->extradata_size= 0;
  192. ast->audio_framesize = st->codec->block_align;
  193. st->codec->block_align = coded_framesize;
  194. break;
  195. case AV_CODEC_ID_COOK:
  196. st->need_parsing = AVSTREAM_PARSE_HEADERS;
  197. case AV_CODEC_ID_ATRAC3:
  198. case AV_CODEC_ID_SIPR:
  199. if (read_all) {
  200. codecdata_length = 0;
  201. } else {
  202. avio_rb16(pb); avio_r8(pb);
  203. if (version == 5)
  204. avio_r8(pb);
  205. codecdata_length = avio_rb32(pb);
  206. if(codecdata_length + FF_INPUT_BUFFER_PADDING_SIZE <= (unsigned)codecdata_length){
  207. av_log(s, AV_LOG_ERROR, "codecdata_length too large\n");
  208. return -1;
  209. }
  210. }
  211. ast->audio_framesize = st->codec->block_align;
  212. if (st->codec->codec_id == AV_CODEC_ID_SIPR) {
  213. if (flavor > 3) {
  214. av_log(s, AV_LOG_ERROR, "bad SIPR file flavor %d\n",
  215. flavor);
  216. return -1;
  217. }
  218. st->codec->block_align = ff_sipr_subpk_size[flavor];
  219. } else {
  220. if(sub_packet_size <= 0){
  221. av_log(s, AV_LOG_ERROR, "sub_packet_size is invalid\n");
  222. return -1;
  223. }
  224. st->codec->block_align = ast->sub_packet_size;
  225. }
  226. if ((ret = rm_read_extradata(pb, st->codec, codecdata_length)) < 0)
  227. return ret;
  228. break;
  229. case AV_CODEC_ID_AAC:
  230. avio_rb16(pb); avio_r8(pb);
  231. if (version == 5)
  232. avio_r8(pb);
  233. codecdata_length = avio_rb32(pb);
  234. if(codecdata_length + FF_INPUT_BUFFER_PADDING_SIZE <= (unsigned)codecdata_length){
  235. av_log(s, AV_LOG_ERROR, "codecdata_length too large\n");
  236. return -1;
  237. }
  238. if (codecdata_length >= 1) {
  239. avio_r8(pb);
  240. if ((ret = rm_read_extradata(pb, st->codec, codecdata_length - 1)) < 0)
  241. return ret;
  242. }
  243. break;
  244. }
  245. switch (ast->deint_id) {
  246. case DEINT_ID_INT4:
  247. if (ast->coded_framesize > ast->audio_framesize ||
  248. sub_packet_h <= 1 ||
  249. ast->coded_framesize * sub_packet_h > (2 + (sub_packet_h & 1)) * ast->audio_framesize)
  250. return AVERROR_INVALIDDATA;
  251. if (ast->coded_framesize * sub_packet_h != 2*ast->audio_framesize) {
  252. avpriv_request_sample(s, "mismatching interleaver parameters");
  253. return AVERROR_INVALIDDATA;
  254. }
  255. break;
  256. case DEINT_ID_GENR:
  257. if (ast->sub_packet_size <= 0 ||
  258. ast->sub_packet_size > ast->audio_framesize)
  259. return AVERROR_INVALIDDATA;
  260. if (ast->audio_framesize % ast->sub_packet_size)
  261. return AVERROR_INVALIDDATA;
  262. break;
  263. case DEINT_ID_SIPR:
  264. case DEINT_ID_INT0:
  265. case DEINT_ID_VBRS:
  266. case DEINT_ID_VBRF:
  267. break;
  268. default:
  269. av_log(s, AV_LOG_ERROR ,"Unknown interleaver %"PRIX32"\n", ast->deint_id);
  270. return AVERROR_INVALIDDATA;
  271. }
  272. if (ast->deint_id == DEINT_ID_INT4 ||
  273. ast->deint_id == DEINT_ID_GENR ||
  274. ast->deint_id == DEINT_ID_SIPR) {
  275. if (st->codec->block_align <= 0 ||
  276. ast->audio_framesize * sub_packet_h > (unsigned)INT_MAX ||
  277. ast->audio_framesize * sub_packet_h < st->codec->block_align)
  278. return AVERROR_INVALIDDATA;
  279. if (av_new_packet(&ast->pkt, ast->audio_framesize * sub_packet_h) < 0)
  280. return AVERROR(ENOMEM);
  281. }
  282. if (read_all) {
  283. avio_r8(pb);
  284. avio_r8(pb);
  285. avio_r8(pb);
  286. rm_read_metadata(s, pb, 0);
  287. }
  288. }
  289. return 0;
  290. }
  291. int ff_rm_read_mdpr_codecdata(AVFormatContext *s, AVIOContext *pb,
  292. AVStream *st, RMStream *rst,
  293. unsigned int codec_data_size, const uint8_t *mime)
  294. {
  295. unsigned int v;
  296. int size;
  297. int64_t codec_pos;
  298. int ret;
  299. if (codec_data_size > INT_MAX)
  300. return AVERROR_INVALIDDATA;
  301. avpriv_set_pts_info(st, 64, 1, 1000);
  302. codec_pos = avio_tell(pb);
  303. v = avio_rb32(pb);
  304. if (v == MKBETAG('M', 'L', 'T', 'I')) {
  305. int number_of_streams = avio_rb16(pb);
  306. int number_of_mdpr;
  307. int i;
  308. for (i = 0; i<number_of_streams; i++)
  309. avio_rb16(pb);
  310. number_of_mdpr = avio_rb16(pb);
  311. if (number_of_mdpr != 1) {
  312. avpriv_request_sample(s, "MLTI with multiple MDPR");
  313. }
  314. avio_rb32(pb);
  315. v = avio_rb32(pb);
  316. }
  317. if (v == MKTAG(0xfd, 'a', 'r', '.')) {
  318. /* ra type header */
  319. if (rm_read_audio_stream_info(s, pb, st, rst, 0))
  320. return -1;
  321. } else if (v == MKBETAG('L', 'S', 'D', ':')) {
  322. avio_seek(pb, -4, SEEK_CUR);
  323. if ((ret = rm_read_extradata(pb, st->codec, codec_data_size)) < 0)
  324. return ret;
  325. st->codec->codec_type = AVMEDIA_TYPE_AUDIO;
  326. st->codec->codec_tag = AV_RL32(st->codec->extradata);
  327. st->codec->codec_id = ff_codec_get_id(ff_rm_codec_tags,
  328. st->codec->codec_tag);
  329. } else if(mime && !strcmp(mime, "logical-fileinfo")){
  330. int stream_count, rule_count, property_count, i;
  331. ff_free_stream(s, st);
  332. if (avio_rb16(pb) != 0) {
  333. av_log(s, AV_LOG_WARNING, "Unsupported version\n");
  334. goto skip;
  335. }
  336. stream_count = avio_rb16(pb);
  337. avio_skip(pb, 6*stream_count);
  338. rule_count = avio_rb16(pb);
  339. avio_skip(pb, 2*rule_count);
  340. property_count = avio_rb16(pb);
  341. for(i=0; i<property_count; i++){
  342. uint8_t name[128], val[128];
  343. avio_rb32(pb);
  344. if (avio_rb16(pb) != 0) {
  345. av_log(s, AV_LOG_WARNING, "Unsupported Name value property version\n");
  346. goto skip; //FIXME skip just this one
  347. }
  348. get_str8(pb, name, sizeof(name));
  349. switch(avio_rb32(pb)) {
  350. case 2: get_strl(pb, val, sizeof(val), avio_rb16(pb));
  351. av_dict_set(&s->metadata, name, val, 0);
  352. break;
  353. default: avio_skip(pb, avio_rb16(pb));
  354. }
  355. }
  356. } else {
  357. int fps;
  358. if (avio_rl32(pb) != MKTAG('V', 'I', 'D', 'O')) {
  359. fail1:
  360. av_log(s, AV_LOG_WARNING, "Unsupported stream type %08x\n", v);
  361. goto skip;
  362. }
  363. st->codec->codec_tag = avio_rl32(pb);
  364. st->codec->codec_id = ff_codec_get_id(ff_rm_codec_tags,
  365. st->codec->codec_tag);
  366. av_dlog(s, "%X %X\n", st->codec->codec_tag, MKTAG('R', 'V', '2', '0'));
  367. if (st->codec->codec_id == AV_CODEC_ID_NONE)
  368. goto fail1;
  369. st->codec->width = avio_rb16(pb);
  370. st->codec->height = avio_rb16(pb);
  371. avio_skip(pb, 2); // looks like bits per sample
  372. avio_skip(pb, 4); // always zero?
  373. st->codec->codec_type = AVMEDIA_TYPE_VIDEO;
  374. st->need_parsing = AVSTREAM_PARSE_TIMESTAMPS;
  375. fps = avio_rb32(pb);
  376. if ((ret = rm_read_extradata(pb, st->codec, codec_data_size - (avio_tell(pb) - codec_pos))) < 0)
  377. return ret;
  378. if (fps > 0) {
  379. av_reduce(&st->avg_frame_rate.den, &st->avg_frame_rate.num,
  380. 0x10000, fps, (1 << 30) - 1);
  381. #if FF_API_R_FRAME_RATE
  382. st->r_frame_rate = st->avg_frame_rate;
  383. #endif
  384. } else if (s->error_recognition & AV_EF_EXPLODE) {
  385. av_log(s, AV_LOG_ERROR, "Invalid framerate\n");
  386. return AVERROR_INVALIDDATA;
  387. }
  388. }
  389. skip:
  390. /* skip codec info */
  391. size = avio_tell(pb) - codec_pos;
  392. if (codec_data_size >= size) {
  393. avio_skip(pb, codec_data_size - size);
  394. } else {
  395. av_log(s, AV_LOG_WARNING, "codec_data_size %u < size %d\n", codec_data_size, size);
  396. }
  397. return 0;
  398. }
  399. /** this function assumes that the demuxer has already seeked to the start
  400. * of the INDX chunk, and will bail out if not. */
  401. static int rm_read_index(AVFormatContext *s)
  402. {
  403. AVIOContext *pb = s->pb;
  404. unsigned int size, n_pkts, str_id, next_off, n, pos, pts;
  405. AVStream *st;
  406. do {
  407. if (avio_rl32(pb) != MKTAG('I','N','D','X'))
  408. return -1;
  409. size = avio_rb32(pb);
  410. if (size < 20)
  411. return -1;
  412. avio_skip(pb, 2);
  413. n_pkts = avio_rb32(pb);
  414. str_id = avio_rb16(pb);
  415. next_off = avio_rb32(pb);
  416. for (n = 0; n < s->nb_streams; n++)
  417. if (s->streams[n]->id == str_id) {
  418. st = s->streams[n];
  419. break;
  420. }
  421. if (n == s->nb_streams) {
  422. av_log(s, AV_LOG_ERROR,
  423. "Invalid stream index %d for index at pos %"PRId64"\n",
  424. str_id, avio_tell(pb));
  425. goto skip;
  426. } else if ((avio_size(pb) - avio_tell(pb)) / 14 < n_pkts) {
  427. av_log(s, AV_LOG_ERROR,
  428. "Nr. of packets in packet index for stream index %d "
  429. "exceeds filesize (%"PRId64" at %"PRId64" = %"PRId64")\n",
  430. str_id, avio_size(pb), avio_tell(pb),
  431. (avio_size(pb) - avio_tell(pb)) / 14);
  432. goto skip;
  433. }
  434. for (n = 0; n < n_pkts; n++) {
  435. avio_skip(pb, 2);
  436. pts = avio_rb32(pb);
  437. pos = avio_rb32(pb);
  438. avio_skip(pb, 4); /* packet no. */
  439. av_add_index_entry(st, pos, pts, 0, 0, AVINDEX_KEYFRAME);
  440. }
  441. skip:
  442. if (next_off && avio_tell(pb) < next_off &&
  443. avio_seek(pb, next_off, SEEK_SET) < 0) {
  444. av_log(s, AV_LOG_ERROR,
  445. "Non-linear index detected, not supported\n");
  446. return -1;
  447. }
  448. } while (next_off);
  449. return 0;
  450. }
  451. static int rm_read_header_old(AVFormatContext *s)
  452. {
  453. RMDemuxContext *rm = s->priv_data;
  454. AVStream *st;
  455. rm->old_format = 1;
  456. st = avformat_new_stream(s, NULL);
  457. if (!st)
  458. return -1;
  459. st->priv_data = ff_rm_alloc_rmstream();
  460. if (!st->priv_data)
  461. return AVERROR(ENOMEM);
  462. return rm_read_audio_stream_info(s, s->pb, st, st->priv_data, 1);
  463. }
  464. static int rm_read_header(AVFormatContext *s)
  465. {
  466. RMDemuxContext *rm = s->priv_data;
  467. AVStream *st;
  468. AVIOContext *pb = s->pb;
  469. unsigned int tag;
  470. int tag_size;
  471. unsigned int start_time, duration;
  472. unsigned int data_off = 0, indx_off = 0;
  473. char buf[128], mime[128];
  474. int flags = 0;
  475. int ret = -1;
  476. tag = avio_rl32(pb);
  477. if (tag == MKTAG('.', 'r', 'a', 0xfd)) {
  478. /* very old .ra format */
  479. return rm_read_header_old(s);
  480. } else if (tag != MKTAG('.', 'R', 'M', 'F')) {
  481. return AVERROR(EIO);
  482. }
  483. tag_size = avio_rb32(pb);
  484. avio_skip(pb, tag_size - 8);
  485. for(;;) {
  486. if (avio_feof(pb))
  487. goto fail;
  488. tag = avio_rl32(pb);
  489. tag_size = avio_rb32(pb);
  490. avio_rb16(pb);
  491. av_dlog(s, "tag=%c%c%c%c (%08x) size=%d\n",
  492. (tag ) & 0xff,
  493. (tag >> 8) & 0xff,
  494. (tag >> 16) & 0xff,
  495. (tag >> 24) & 0xff,
  496. tag,
  497. tag_size);
  498. if (tag_size < 10 && tag != MKTAG('D', 'A', 'T', 'A'))
  499. goto fail;
  500. switch(tag) {
  501. case MKTAG('P', 'R', 'O', 'P'):
  502. /* file header */
  503. avio_rb32(pb); /* max bit rate */
  504. avio_rb32(pb); /* avg bit rate */
  505. avio_rb32(pb); /* max packet size */
  506. avio_rb32(pb); /* avg packet size */
  507. avio_rb32(pb); /* nb packets */
  508. duration = avio_rb32(pb); /* duration */
  509. s->duration = av_rescale(duration, AV_TIME_BASE, 1000);
  510. avio_rb32(pb); /* preroll */
  511. indx_off = avio_rb32(pb); /* index offset */
  512. data_off = avio_rb32(pb); /* data offset */
  513. avio_rb16(pb); /* nb streams */
  514. flags = avio_rb16(pb); /* flags */
  515. break;
  516. case MKTAG('C', 'O', 'N', 'T'):
  517. rm_read_metadata(s, pb, 1);
  518. break;
  519. case MKTAG('M', 'D', 'P', 'R'):
  520. st = avformat_new_stream(s, NULL);
  521. if (!st) {
  522. ret = AVERROR(ENOMEM);
  523. goto fail;
  524. }
  525. st->id = avio_rb16(pb);
  526. avio_rb32(pb); /* max bit rate */
  527. st->codec->bit_rate = avio_rb32(pb); /* bit rate */
  528. avio_rb32(pb); /* max packet size */
  529. avio_rb32(pb); /* avg packet size */
  530. start_time = avio_rb32(pb); /* start time */
  531. avio_rb32(pb); /* preroll */
  532. duration = avio_rb32(pb); /* duration */
  533. st->start_time = start_time;
  534. st->duration = duration;
  535. if(duration>0)
  536. s->duration = AV_NOPTS_VALUE;
  537. get_str8(pb, buf, sizeof(buf)); /* desc */
  538. get_str8(pb, mime, sizeof(mime)); /* mimetype */
  539. st->codec->codec_type = AVMEDIA_TYPE_DATA;
  540. st->priv_data = ff_rm_alloc_rmstream();
  541. if (!st->priv_data)
  542. return AVERROR(ENOMEM);
  543. if (ff_rm_read_mdpr_codecdata(s, s->pb, st, st->priv_data,
  544. avio_rb32(pb), mime) < 0)
  545. goto fail;
  546. break;
  547. case MKTAG('D', 'A', 'T', 'A'):
  548. goto header_end;
  549. default:
  550. /* unknown tag: skip it */
  551. avio_skip(pb, tag_size - 10);
  552. break;
  553. }
  554. }
  555. header_end:
  556. rm->nb_packets = avio_rb32(pb); /* number of packets */
  557. if (!rm->nb_packets && (flags & 4))
  558. rm->nb_packets = 3600 * 25;
  559. avio_rb32(pb); /* next data header */
  560. if (!data_off)
  561. data_off = avio_tell(pb) - 18;
  562. if (indx_off && pb->seekable && !(s->flags & AVFMT_FLAG_IGNIDX) &&
  563. avio_seek(pb, indx_off, SEEK_SET) >= 0) {
  564. rm_read_index(s);
  565. avio_seek(pb, data_off + 18, SEEK_SET);
  566. }
  567. return 0;
  568. fail:
  569. rm_read_close(s);
  570. return ret;
  571. }
  572. static int get_num(AVIOContext *pb, int *len)
  573. {
  574. int n, n1;
  575. n = avio_rb16(pb);
  576. (*len)-=2;
  577. n &= 0x7FFF;
  578. if (n >= 0x4000) {
  579. return n - 0x4000;
  580. } else {
  581. n1 = avio_rb16(pb);
  582. (*len)-=2;
  583. return (n << 16) | n1;
  584. }
  585. }
  /* Read size used by rm_read_packet() for old-format streams that carry no
   * audio frame size; multiple of 20 bytes for ra144 (ugly) */
  #define RAW_PACKET_SIZE 1000
  588. static int rm_sync(AVFormatContext *s, int64_t *timestamp, int *flags, int *stream_index, int64_t *pos){
  589. RMDemuxContext *rm = s->priv_data;
  590. AVIOContext *pb = s->pb;
  591. AVStream *st;
  592. uint32_t state=0xFFFFFFFF;
  593. while(!avio_feof(pb)){
  594. int len, num, i;
  595. *pos= avio_tell(pb) - 3;
  596. if(rm->remaining_len > 0){
  597. num= rm->current_stream;
  598. len= rm->remaining_len;
  599. *timestamp = AV_NOPTS_VALUE;
  600. *flags= 0;
  601. }else{
  602. state= (state<<8) + avio_r8(pb);
  603. if(state == MKBETAG('I', 'N', 'D', 'X')){
  604. int n_pkts, expected_len;
  605. len = avio_rb32(pb);
  606. avio_skip(pb, 2);
  607. n_pkts = avio_rb32(pb);
  608. expected_len = 20 + n_pkts * 14;
  609. if (len == 20)
  610. /* some files don't add index entries to chunk size... */
  611. len = expected_len;
  612. else if (len != expected_len)
  613. av_log(s, AV_LOG_WARNING,
  614. "Index size %d (%d pkts) is wrong, should be %d.\n",
  615. len, n_pkts, expected_len);
  616. len -= 14; // we already read part of the index header
  617. if(len<0)
  618. continue;
  619. goto skip;
  620. } else if (state == MKBETAG('D','A','T','A')) {
  621. av_log(s, AV_LOG_WARNING,
  622. "DATA tag in middle of chunk, file may be broken.\n");
  623. }
  624. if(state > (unsigned)0xFFFF || state <= 12)
  625. continue;
  626. len=state - 12;
  627. state= 0xFFFFFFFF;
  628. num = avio_rb16(pb);
  629. *timestamp = avio_rb32(pb);
  630. avio_r8(pb); /* reserved */
  631. *flags = avio_r8(pb); /* flags */
  632. }
  633. for(i=0;i<s->nb_streams;i++) {
  634. st = s->streams[i];
  635. if (num == st->id)
  636. break;
  637. }
  638. if (i == s->nb_streams) {
  639. skip:
  640. /* skip packet if unknown number */
  641. avio_skip(pb, len);
  642. rm->remaining_len = 0;
  643. continue;
  644. }
  645. *stream_index= i;
  646. return len;
  647. }
  648. return -1;
  649. }
  650. static int rm_assemble_video_frame(AVFormatContext *s, AVIOContext *pb,
  651. RMDemuxContext *rm, RMStream *vst,
  652. AVPacket *pkt, int len, int *pseq,
  653. int64_t *timestamp)
  654. {
  655. int hdr;
  656. int seq = 0, pic_num = 0, len2 = 0, pos = 0; //init to silcense compiler warning
  657. int type;
  658. int ret;
  659. hdr = avio_r8(pb); len--;
  660. type = hdr >> 6;
  661. if(type != 3){ // not frame as a part of packet
  662. seq = avio_r8(pb); len--;
  663. }
  664. if(type != 1){ // not whole frame
  665. len2 = get_num(pb, &len);
  666. pos = get_num(pb, &len);
  667. pic_num = avio_r8(pb); len--;
  668. }
  669. if(len<0) {
  670. av_log(s, AV_LOG_ERROR, "Insufficient data\n");
  671. return -1;
  672. }
  673. rm->remaining_len = len;
  674. if(type&1){ // frame, not slice
  675. if(type == 3){ // frame as a part of packet
  676. len= len2;
  677. *timestamp = pos;
  678. }
  679. if(rm->remaining_len < len) {
  680. av_log(s, AV_LOG_ERROR, "Insufficient remaining len\n");
  681. return -1;
  682. }
  683. rm->remaining_len -= len;
  684. if(av_new_packet(pkt, len + 9) < 0)
  685. return AVERROR(EIO);
  686. pkt->data[0] = 0;
  687. AV_WL32(pkt->data + 1, 1);
  688. AV_WL32(pkt->data + 5, 0);
  689. if ((ret = avio_read(pb, pkt->data + 9, len)) != len) {
  690. av_free_packet(pkt);
  691. av_log(s, AV_LOG_ERROR, "Failed to read %d bytes\n", len);
  692. return ret < 0 ? ret : AVERROR(EIO);
  693. }
  694. return 0;
  695. }
  696. //now we have to deal with single slice
  697. *pseq = seq;
  698. if((seq & 0x7F) == 1 || vst->curpic_num != pic_num){
  699. if (len2 > ffio_limit(pb, len2)) {
  700. av_log(s, AV_LOG_ERROR, "Impossibly sized packet\n");
  701. return AVERROR_INVALIDDATA;
  702. }
  703. vst->slices = ((hdr & 0x3F) << 1) + 1;
  704. vst->videobufsize = len2 + 8*vst->slices + 1;
  705. av_free_packet(&vst->pkt); //FIXME this should be output.
  706. if(av_new_packet(&vst->pkt, vst->videobufsize) < 0)
  707. return AVERROR(ENOMEM);
  708. memset(vst->pkt.data, 0, vst->pkt.size);
  709. vst->videobufpos = 8*vst->slices + 1;
  710. vst->cur_slice = 0;
  711. vst->curpic_num = pic_num;
  712. vst->pktpos = avio_tell(pb);
  713. }
  714. if(type == 2)
  715. len = FFMIN(len, pos);
  716. if(++vst->cur_slice > vst->slices) {
  717. av_log(s, AV_LOG_ERROR, "cur slice %d, too large\n", vst->cur_slice);
  718. return 1;
  719. }
  720. if(!vst->pkt.data)
  721. return AVERROR(ENOMEM);
  722. AV_WL32(vst->pkt.data - 7 + 8*vst->cur_slice, 1);
  723. AV_WL32(vst->pkt.data - 3 + 8*vst->cur_slice, vst->videobufpos - 8*vst->slices - 1);
  724. if(vst->videobufpos + len > vst->videobufsize) {
  725. av_log(s, AV_LOG_ERROR, "outside videobufsize\n");
  726. return 1;
  727. }
  728. if (avio_read(pb, vst->pkt.data + vst->videobufpos, len) != len)
  729. return AVERROR(EIO);
  730. vst->videobufpos += len;
  731. rm->remaining_len-= len;
  732. if (type == 2 || vst->videobufpos == vst->videobufsize) {
  733. vst->pkt.data[0] = vst->cur_slice-1;
  734. *pkt= vst->pkt;
  735. vst->pkt.data= NULL;
  736. vst->pkt.size= 0;
  737. vst->pkt.buf = NULL;
  738. #if FF_API_DESTRUCT_PACKET
  739. FF_DISABLE_DEPRECATION_WARNINGS
  740. vst->pkt.destruct = NULL;
  741. FF_ENABLE_DEPRECATION_WARNINGS
  742. #endif
  743. if(vst->slices != vst->cur_slice) //FIXME find out how to set slices correct from the begin
  744. memmove(pkt->data + 1 + 8*vst->cur_slice, pkt->data + 1 + 8*vst->slices,
  745. vst->videobufpos - 1 - 8*vst->slices);
  746. pkt->size = vst->videobufpos + 8*(vst->cur_slice - vst->slices);
  747. pkt->pts = AV_NOPTS_VALUE;
  748. pkt->pos = vst->pktpos;
  749. vst->slices = 0;
  750. return 0;
  751. }
  752. return 1;
  753. }
  754. static inline void
  755. rm_ac3_swap_bytes (AVStream *st, AVPacket *pkt)
  756. {
  757. uint8_t *ptr;
  758. int j;
  759. if (st->codec->codec_id == AV_CODEC_ID_AC3) {
  760. ptr = pkt->data;
  761. for (j=0;j<pkt->size;j+=2) {
  762. FFSWAP(int, ptr[0], ptr[1]);
  763. ptr += 2;
  764. }
  765. }
  766. }
  767. static int readfull(AVFormatContext *s, AVIOContext *pb, uint8_t *dst, int n) {
  768. int ret = avio_read(pb, dst, n);
  769. if (ret != n) {
  770. if (ret >= 0) memset(dst + ret, 0, n - ret);
  771. else memset(dst , 0, n);
  772. av_log(s, AV_LOG_ERROR, "Failed to fully read block\n");
  773. }
  774. return ret;
  775. }
  776. int
  777. ff_rm_parse_packet (AVFormatContext *s, AVIOContext *pb,
  778. AVStream *st, RMStream *ast, int len, AVPacket *pkt,
  779. int *seq, int flags, int64_t timestamp)
  780. {
  781. RMDemuxContext *rm = s->priv_data;
  782. int ret;
  783. if (st->codec->codec_type == AVMEDIA_TYPE_VIDEO) {
  784. rm->current_stream= st->id;
  785. ret = rm_assemble_video_frame(s, pb, rm, ast, pkt, len, seq, &timestamp);
  786. if(ret)
  787. return ret < 0 ? ret : -1; //got partial frame or error
  788. } else if (st->codec->codec_type == AVMEDIA_TYPE_AUDIO) {
  789. if ((ast->deint_id == DEINT_ID_GENR) ||
  790. (ast->deint_id == DEINT_ID_INT4) ||
  791. (ast->deint_id == DEINT_ID_SIPR)) {
  792. int x;
  793. int sps = ast->sub_packet_size;
  794. int cfs = ast->coded_framesize;
  795. int h = ast->sub_packet_h;
  796. int y = ast->sub_packet_cnt;
  797. int w = ast->audio_framesize;
  798. if (flags & 2)
  799. y = ast->sub_packet_cnt = 0;
  800. if (!y)
  801. ast->audiotimestamp = timestamp;
  802. switch (ast->deint_id) {
  803. case DEINT_ID_INT4:
  804. for (x = 0; x < h/2; x++)
  805. readfull(s, pb, ast->pkt.data+x*2*w+y*cfs, cfs);
  806. break;
  807. case DEINT_ID_GENR:
  808. for (x = 0; x < w/sps; x++)
  809. readfull(s, pb, ast->pkt.data+sps*(h*x+((h+1)/2)*(y&1)+(y>>1)), sps);
  810. break;
  811. case DEINT_ID_SIPR:
  812. readfull(s, pb, ast->pkt.data + y * w, w);
  813. break;
  814. }
  815. if (++(ast->sub_packet_cnt) < h)
  816. return -1;
  817. if (ast->deint_id == DEINT_ID_SIPR)
  818. ff_rm_reorder_sipr_data(ast->pkt.data, h, w);
  819. ast->sub_packet_cnt = 0;
  820. rm->audio_stream_num = st->index;
  821. rm->audio_pkt_cnt = h * w / st->codec->block_align;
  822. } else if ((ast->deint_id == DEINT_ID_VBRF) ||
  823. (ast->deint_id == DEINT_ID_VBRS)) {
  824. int x;
  825. rm->audio_stream_num = st->index;
  826. ast->sub_packet_cnt = (avio_rb16(pb) & 0xf0) >> 4;
  827. if (ast->sub_packet_cnt) {
  828. for (x = 0; x < ast->sub_packet_cnt; x++)
  829. ast->sub_packet_lengths[x] = avio_rb16(pb);
  830. rm->audio_pkt_cnt = ast->sub_packet_cnt;
  831. ast->audiotimestamp = timestamp;
  832. } else
  833. return -1;
  834. } else {
  835. if ((ret = av_get_packet(pb, pkt, len)) < 0)
  836. return ret;
  837. rm_ac3_swap_bytes(st, pkt);
  838. }
  839. } else {
  840. if ((ret = av_get_packet(pb, pkt, len)) < 0)
  841. return ret;
  842. }
  843. pkt->stream_index = st->index;
  844. #if 0
  845. if (st->codec->codec_type == AVMEDIA_TYPE_VIDEO) {
  846. if(st->codec->codec_id == AV_CODEC_ID_RV20){
  847. int seq= 128*(pkt->data[2]&0x7F) + (pkt->data[3]>>1);
  848. av_log(s, AV_LOG_DEBUG, "%d %"PRId64" %d\n", *timestamp, *timestamp*512LL/25, seq);
  849. seq |= (timestamp&~0x3FFF);
  850. if(seq - timestamp > 0x2000) seq -= 0x4000;
  851. if(seq - timestamp < -0x2000) seq += 0x4000;
  852. }
  853. }
  854. #endif
  855. pkt->pts = timestamp;
  856. if (flags & 2)
  857. pkt->flags |= AV_PKT_FLAG_KEY;
  858. return st->codec->codec_type == AVMEDIA_TYPE_AUDIO ? rm->audio_pkt_cnt : 0;
  859. }
  860. int
  861. ff_rm_retrieve_cache (AVFormatContext *s, AVIOContext *pb,
  862. AVStream *st, RMStream *ast, AVPacket *pkt)
  863. {
  864. RMDemuxContext *rm = s->priv_data;
  865. av_assert0 (rm->audio_pkt_cnt > 0);
  866. if (ast->deint_id == DEINT_ID_VBRF ||
  867. ast->deint_id == DEINT_ID_VBRS) {
  868. int ret = av_get_packet(pb, pkt, ast->sub_packet_lengths[ast->sub_packet_cnt - rm->audio_pkt_cnt]);
  869. if (ret < 0)
  870. return ret;
  871. } else {
  872. int ret = av_new_packet(pkt, st->codec->block_align);
  873. if (ret < 0)
  874. return ret;
  875. memcpy(pkt->data, ast->pkt.data + st->codec->block_align * //FIXME avoid this
  876. (ast->sub_packet_h * ast->audio_framesize / st->codec->block_align - rm->audio_pkt_cnt),
  877. st->codec->block_align);
  878. }
  879. rm->audio_pkt_cnt--;
  880. if ((pkt->pts = ast->audiotimestamp) != AV_NOPTS_VALUE) {
  881. ast->audiotimestamp = AV_NOPTS_VALUE;
  882. pkt->flags = AV_PKT_FLAG_KEY;
  883. } else
  884. pkt->flags = 0;
  885. pkt->stream_index = st->index;
  886. return rm->audio_pkt_cnt;
  887. }
  888. static int rm_read_packet(AVFormatContext *s, AVPacket *pkt)
  889. {
  890. RMDemuxContext *rm = s->priv_data;
  891. AVStream *st = NULL; // init to silence compiler warning
  892. int i, len, res, seq = 1;
  893. int64_t timestamp, pos;
  894. int flags;
  895. for (;;) {
  896. if (rm->audio_pkt_cnt) {
  897. // If there are queued audio packet return them first
  898. st = s->streams[rm->audio_stream_num];
  899. res = ff_rm_retrieve_cache(s, s->pb, st, st->priv_data, pkt);
  900. if(res < 0)
  901. return res;
  902. flags = 0;
  903. } else {
  904. if (rm->old_format) {
  905. RMStream *ast;
  906. st = s->streams[0];
  907. ast = st->priv_data;
  908. timestamp = AV_NOPTS_VALUE;
  909. len = !ast->audio_framesize ? RAW_PACKET_SIZE :
  910. ast->coded_framesize * ast->sub_packet_h / 2;
  911. flags = (seq++ == 1) ? 2 : 0;
  912. pos = avio_tell(s->pb);
  913. } else {
  914. len = rm_sync(s, &timestamp, &flags, &i, &pos);
  915. if (len > 0)
  916. st = s->streams[i];
  917. }
  918. if (len <= 0 || avio_feof(s->pb))
  919. return AVERROR(EIO);
  920. res = ff_rm_parse_packet (s, s->pb, st, st->priv_data, len, pkt,
  921. &seq, flags, timestamp);
  922. if (res < -1)
  923. return res;
  924. if((flags&2) && (seq&0x7F) == 1)
  925. av_add_index_entry(st, pos, timestamp, 0, 0, AVINDEX_KEYFRAME);
  926. if (res)
  927. continue;
  928. }
  929. if( (st->discard >= AVDISCARD_NONKEY && !(flags&2))
  930. || st->discard >= AVDISCARD_ALL){
  931. av_free_packet(pkt);
  932. } else
  933. break;
  934. }
  935. return 0;
  936. }
  937. static int rm_read_close(AVFormatContext *s)
  938. {
  939. int i;
  940. for (i=0;i<s->nb_streams;i++)
  941. ff_rm_free_rmstream(s->streams[i]->priv_data);
  942. return 0;
  943. }
  944. static int rm_probe(AVProbeData *p)
  945. {
  946. /* check file header */
  947. if ((p->buf[0] == '.' && p->buf[1] == 'R' &&
  948. p->buf[2] == 'M' && p->buf[3] == 'F' &&
  949. p->buf[4] == 0 && p->buf[5] == 0) ||
  950. (p->buf[0] == '.' && p->buf[1] == 'r' &&
  951. p->buf[2] == 'a' && p->buf[3] == 0xfd))
  952. return AVPROBE_SCORE_MAX;
  953. else
  954. return 0;
  955. }
  956. static int64_t rm_read_dts(AVFormatContext *s, int stream_index,
  957. int64_t *ppos, int64_t pos_limit)
  958. {
  959. RMDemuxContext *rm = s->priv_data;
  960. int64_t pos, dts;
  961. int stream_index2, flags, len, h;
  962. pos = *ppos;
  963. if(rm->old_format)
  964. return AV_NOPTS_VALUE;
  965. if (avio_seek(s->pb, pos, SEEK_SET) < 0)
  966. return AV_NOPTS_VALUE;
  967. rm->remaining_len=0;
  968. for(;;){
  969. int seq=1;
  970. AVStream *st;
  971. len = rm_sync(s, &dts, &flags, &stream_index2, &pos);
  972. if(len<0)
  973. return AV_NOPTS_VALUE;
  974. st = s->streams[stream_index2];
  975. if (st->codec->codec_type == AVMEDIA_TYPE_VIDEO) {
  976. h= avio_r8(s->pb); len--;
  977. if(!(h & 0x40)){
  978. seq = avio_r8(s->pb); len--;
  979. }
  980. }
  981. if((flags&2) && (seq&0x7F) == 1){
  982. av_dlog(s, "%d %d-%d %"PRId64" %d\n",
  983. flags, stream_index2, stream_index, dts, seq);
  984. av_add_index_entry(st, pos, dts, 0, 0, AVINDEX_KEYFRAME);
  985. if(stream_index2 == stream_index)
  986. break;
  987. }
  988. avio_skip(s->pb, len);
  989. }
  990. *ppos = pos;
  991. return dts;
  992. }
  993. static int rm_read_seek(AVFormatContext *s, int stream_index,
  994. int64_t pts, int flags)
  995. {
  996. RMDemuxContext *rm = s->priv_data;
  997. if (ff_seek_frame_binary(s, stream_index, pts, flags) < 0)
  998. return -1;
  999. rm->audio_pkt_cnt = 0;
  1000. return 0;
  1001. }
  /** RealMedia demuxer: wires the probe, header, packet, close, timestamp and
   *  seek callbacks defined in this file. */
  AVInputFormat ff_rm_demuxer = {
      .name = "rm",
      .long_name = NULL_IF_CONFIG_SMALL("RealMedia"),
      .priv_data_size = sizeof(RMDemuxContext),
      .read_probe = rm_probe,
      .read_header = rm_read_header,
      .read_packet = rm_read_packet,
      .read_close = rm_read_close,
      .read_timestamp = rm_read_dts,
      .read_seek = rm_read_seek,
  };
  /** RDT demuxer entry: shares RMDemuxContext and the close callback with the
   *  RealMedia demuxer and is flagged AVFMT_NOFILE; no probe, header or
   *  packet callbacks are set here. */
  AVInputFormat ff_rdt_demuxer = {
      .name = "rdt",
      .long_name = NULL_IF_CONFIG_SMALL("RDT demuxer"),
      .priv_data_size = sizeof(RMDemuxContext),
      .read_close = rm_read_close,
      .flags = AVFMT_NOFILE,
  };