You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

1147 lines
38KB

  1. /*
  2. * "Real" compatible muxer and demuxer.
  3. * Copyright (c) 2000, 2001 Fabrice Bellard.
  4. *
  5. * This file is part of FFmpeg.
  6. *
  7. * FFmpeg is free software; you can redistribute it and/or
  8. * modify it under the terms of the GNU Lesser General Public
  9. * License as published by the Free Software Foundation; either
  10. * version 2.1 of the License, or (at your option) any later version.
  11. *
  12. * FFmpeg is distributed in the hope that it will be useful,
  13. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  15. * Lesser General Public License for more details.
  16. *
  17. * You should have received a copy of the GNU Lesser General Public
  18. * License along with FFmpeg; if not, write to the Free Software
  19. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  20. */
  21. #include "avformat.h"
  22. /* in ms */
  23. #define BUFFER_DURATION 0
  24. typedef struct {
  25. int nb_packets;
  26. int packet_total_size;
  27. int packet_max_size;
  28. /* codec related output */
  29. int bit_rate;
  30. float frame_rate;
  31. int nb_frames; /* current frame number */
  32. int total_frames; /* total number of frames */
  33. int num;
  34. AVCodecContext *enc;
  35. } StreamInfo;
  36. typedef struct {
  37. StreamInfo streams[2];
  38. StreamInfo *audio_stream, *video_stream;
  39. int data_pos; /* position of the data after the header */
  40. int nb_packets;
  41. int old_format;
  42. int current_stream;
  43. int remaining_len;
  44. /// Audio descrambling matrix parameters
  45. uint8_t *audiobuf; ///< place to store reordered audio data
  46. int64_t audiotimestamp; ///< Audio packet timestamp
  47. int sub_packet_cnt; // Subpacket counter, used while reading
  48. int sub_packet_size, sub_packet_h, coded_framesize; ///< Descrambling parameters from container
  49. int audio_stream_num; ///< Stream number for audio packets
  50. int audio_pkt_cnt; ///< Output packet counter
  51. int audio_framesize; /// Audio frame size from container
  52. int sub_packet_lengths[16]; /// Length of each aac subpacket
  53. } RMContext;
  54. #ifdef CONFIG_MUXERS
  55. static void put_str(ByteIOContext *s, const char *tag)
  56. {
  57. put_be16(s,strlen(tag));
  58. while (*tag) {
  59. put_byte(s, *tag++);
  60. }
  61. }
  62. static void put_str8(ByteIOContext *s, const char *tag)
  63. {
  64. put_byte(s, strlen(tag));
  65. while (*tag) {
  66. put_byte(s, *tag++);
  67. }
  68. }
  69. static void rv10_write_header(AVFormatContext *ctx,
  70. int data_size, int index_pos)
  71. {
  72. RMContext *rm = ctx->priv_data;
  73. ByteIOContext *s = &ctx->pb;
  74. StreamInfo *stream;
  75. unsigned char *data_offset_ptr, *start_ptr;
  76. const char *desc, *mimetype;
  77. int nb_packets, packet_total_size, packet_max_size, size, packet_avg_size, i;
  78. int bit_rate, v, duration, flags, data_pos;
  79. start_ptr = s->buf_ptr;
  80. put_tag(s, ".RMF");
  81. put_be32(s,18); /* header size */
  82. put_be16(s,0);
  83. put_be32(s,0);
  84. put_be32(s,4 + ctx->nb_streams); /* num headers */
  85. put_tag(s,"PROP");
  86. put_be32(s, 50);
  87. put_be16(s, 0);
  88. packet_max_size = 0;
  89. packet_total_size = 0;
  90. nb_packets = 0;
  91. bit_rate = 0;
  92. duration = 0;
  93. for(i=0;i<ctx->nb_streams;i++) {
  94. StreamInfo *stream = &rm->streams[i];
  95. bit_rate += stream->bit_rate;
  96. if (stream->packet_max_size > packet_max_size)
  97. packet_max_size = stream->packet_max_size;
  98. nb_packets += stream->nb_packets;
  99. packet_total_size += stream->packet_total_size;
  100. /* select maximum duration */
  101. v = (int) (1000.0 * (float)stream->total_frames / stream->frame_rate);
  102. if (v > duration)
  103. duration = v;
  104. }
  105. put_be32(s, bit_rate); /* max bit rate */
  106. put_be32(s, bit_rate); /* avg bit rate */
  107. put_be32(s, packet_max_size); /* max packet size */
  108. if (nb_packets > 0)
  109. packet_avg_size = packet_total_size / nb_packets;
  110. else
  111. packet_avg_size = 0;
  112. put_be32(s, packet_avg_size); /* avg packet size */
  113. put_be32(s, nb_packets); /* num packets */
  114. put_be32(s, duration); /* duration */
  115. put_be32(s, BUFFER_DURATION); /* preroll */
  116. put_be32(s, index_pos); /* index offset */
  117. /* computation of data the data offset */
  118. data_offset_ptr = s->buf_ptr;
  119. put_be32(s, 0); /* data offset : will be patched after */
  120. put_be16(s, ctx->nb_streams); /* num streams */
  121. flags = 1 | 2; /* save allowed & perfect play */
  122. if (url_is_streamed(s))
  123. flags |= 4; /* live broadcast */
  124. put_be16(s, flags);
  125. /* comments */
  126. put_tag(s,"CONT");
  127. size = strlen(ctx->title) + strlen(ctx->author) + strlen(ctx->copyright) +
  128. strlen(ctx->comment) + 4 * 2 + 10;
  129. put_be32(s,size);
  130. put_be16(s,0);
  131. put_str(s, ctx->title);
  132. put_str(s, ctx->author);
  133. put_str(s, ctx->copyright);
  134. put_str(s, ctx->comment);
  135. for(i=0;i<ctx->nb_streams;i++) {
  136. int codec_data_size;
  137. stream = &rm->streams[i];
  138. if (stream->enc->codec_type == CODEC_TYPE_AUDIO) {
  139. desc = "The Audio Stream";
  140. mimetype = "audio/x-pn-realaudio";
  141. codec_data_size = 73;
  142. } else {
  143. desc = "The Video Stream";
  144. mimetype = "video/x-pn-realvideo";
  145. codec_data_size = 34;
  146. }
  147. put_tag(s,"MDPR");
  148. size = 10 + 9 * 4 + strlen(desc) + strlen(mimetype) + codec_data_size;
  149. put_be32(s, size);
  150. put_be16(s, 0);
  151. put_be16(s, i); /* stream number */
  152. put_be32(s, stream->bit_rate); /* max bit rate */
  153. put_be32(s, stream->bit_rate); /* avg bit rate */
  154. put_be32(s, stream->packet_max_size); /* max packet size */
  155. if (stream->nb_packets > 0)
  156. packet_avg_size = stream->packet_total_size /
  157. stream->nb_packets;
  158. else
  159. packet_avg_size = 0;
  160. put_be32(s, packet_avg_size); /* avg packet size */
  161. put_be32(s, 0); /* start time */
  162. put_be32(s, BUFFER_DURATION); /* preroll */
  163. /* duration */
  164. if (url_is_streamed(s) || !stream->total_frames)
  165. put_be32(s, (int)(3600 * 1000));
  166. else
  167. put_be32(s, (int)(stream->total_frames * 1000 / stream->frame_rate));
  168. put_str8(s, desc);
  169. put_str8(s, mimetype);
  170. put_be32(s, codec_data_size);
  171. if (stream->enc->codec_type == CODEC_TYPE_AUDIO) {
  172. int coded_frame_size, fscode, sample_rate;
  173. sample_rate = stream->enc->sample_rate;
  174. coded_frame_size = (stream->enc->bit_rate *
  175. stream->enc->frame_size) / (8 * sample_rate);
  176. /* audio codec info */
  177. put_tag(s, ".ra");
  178. put_byte(s, 0xfd);
  179. put_be32(s, 0x00040000); /* version */
  180. put_tag(s, ".ra4");
  181. put_be32(s, 0x01b53530); /* stream length */
  182. put_be16(s, 4); /* unknown */
  183. put_be32(s, 0x39); /* header size */
  184. switch(sample_rate) {
  185. case 48000:
  186. case 24000:
  187. case 12000:
  188. fscode = 1;
  189. break;
  190. default:
  191. case 44100:
  192. case 22050:
  193. case 11025:
  194. fscode = 2;
  195. break;
  196. case 32000:
  197. case 16000:
  198. case 8000:
  199. fscode = 3;
  200. }
  201. put_be16(s, fscode); /* codec additional info, for AC3, seems
  202. to be a frequency code */
  203. /* special hack to compensate rounding errors... */
  204. if (coded_frame_size == 557)
  205. coded_frame_size--;
  206. put_be32(s, coded_frame_size); /* frame length */
  207. put_be32(s, 0x51540); /* unknown */
  208. put_be32(s, 0x249f0); /* unknown */
  209. put_be32(s, 0x249f0); /* unknown */
  210. put_be16(s, 0x01);
  211. /* frame length : seems to be very important */
  212. put_be16(s, coded_frame_size);
  213. put_be32(s, 0); /* unknown */
  214. put_be16(s, stream->enc->sample_rate); /* sample rate */
  215. put_be32(s, 0x10); /* unknown */
  216. put_be16(s, stream->enc->channels);
  217. put_str8(s, "Int0"); /* codec name */
  218. put_str8(s, "dnet"); /* codec name */
  219. put_be16(s, 0); /* title length */
  220. put_be16(s, 0); /* author length */
  221. put_be16(s, 0); /* copyright length */
  222. put_byte(s, 0); /* end of header */
  223. } else {
  224. /* video codec info */
  225. put_be32(s,34); /* size */
  226. if(stream->enc->codec_id == CODEC_ID_RV10)
  227. put_tag(s,"VIDORV10");
  228. else
  229. put_tag(s,"VIDORV20");
  230. put_be16(s, stream->enc->width);
  231. put_be16(s, stream->enc->height);
  232. put_be16(s, (int) stream->frame_rate); /* frames per seconds ? */
  233. put_be32(s,0); /* unknown meaning */
  234. put_be16(s, (int) stream->frame_rate); /* unknown meaning */
  235. put_be32(s,0); /* unknown meaning */
  236. put_be16(s, 8); /* unknown meaning */
  237. /* Seems to be the codec version: only use basic H263. The next
  238. versions seems to add a diffential DC coding as in
  239. MPEG... nothing new under the sun */
  240. if(stream->enc->codec_id == CODEC_ID_RV10)
  241. put_be32(s,0x10000000);
  242. else
  243. put_be32(s,0x20103001);
  244. //put_be32(s,0x10003000);
  245. }
  246. }
  247. /* patch data offset field */
  248. data_pos = s->buf_ptr - start_ptr;
  249. rm->data_pos = data_pos;
  250. data_offset_ptr[0] = data_pos >> 24;
  251. data_offset_ptr[1] = data_pos >> 16;
  252. data_offset_ptr[2] = data_pos >> 8;
  253. data_offset_ptr[3] = data_pos;
  254. /* data stream */
  255. put_tag(s,"DATA");
  256. put_be32(s,data_size + 10 + 8);
  257. put_be16(s,0);
  258. put_be32(s, nb_packets); /* number of packets */
  259. put_be32(s,0); /* next data header */
  260. }
  261. static void write_packet_header(AVFormatContext *ctx, StreamInfo *stream,
  262. int length, int key_frame)
  263. {
  264. int timestamp;
  265. ByteIOContext *s = &ctx->pb;
  266. stream->nb_packets++;
  267. stream->packet_total_size += length;
  268. if (length > stream->packet_max_size)
  269. stream->packet_max_size = length;
  270. put_be16(s,0); /* version */
  271. put_be16(s,length + 12);
  272. put_be16(s, stream->num); /* stream number */
  273. timestamp = (1000 * (float)stream->nb_frames) / stream->frame_rate;
  274. put_be32(s, timestamp); /* timestamp */
  275. put_byte(s, 0); /* reserved */
  276. put_byte(s, key_frame ? 2 : 0); /* flags */
  277. }
  278. static int rm_write_header(AVFormatContext *s)
  279. {
  280. RMContext *rm = s->priv_data;
  281. StreamInfo *stream;
  282. int n;
  283. AVCodecContext *codec;
  284. for(n=0;n<s->nb_streams;n++) {
  285. s->streams[n]->id = n;
  286. codec = s->streams[n]->codec;
  287. stream = &rm->streams[n];
  288. memset(stream, 0, sizeof(StreamInfo));
  289. stream->num = n;
  290. stream->bit_rate = codec->bit_rate;
  291. stream->enc = codec;
  292. switch(codec->codec_type) {
  293. case CODEC_TYPE_AUDIO:
  294. rm->audio_stream = stream;
  295. stream->frame_rate = (float)codec->sample_rate / (float)codec->frame_size;
  296. /* XXX: dummy values */
  297. stream->packet_max_size = 1024;
  298. stream->nb_packets = 0;
  299. stream->total_frames = stream->nb_packets;
  300. break;
  301. case CODEC_TYPE_VIDEO:
  302. rm->video_stream = stream;
  303. stream->frame_rate = (float)codec->time_base.den / (float)codec->time_base.num;
  304. /* XXX: dummy values */
  305. stream->packet_max_size = 4096;
  306. stream->nb_packets = 0;
  307. stream->total_frames = stream->nb_packets;
  308. break;
  309. default:
  310. return -1;
  311. }
  312. }
  313. rv10_write_header(s, 0, 0);
  314. put_flush_packet(&s->pb);
  315. return 0;
  316. }
  317. static int rm_write_audio(AVFormatContext *s, const uint8_t *buf, int size, int flags)
  318. {
  319. uint8_t *buf1;
  320. RMContext *rm = s->priv_data;
  321. ByteIOContext *pb = &s->pb;
  322. StreamInfo *stream = rm->audio_stream;
  323. int i;
  324. /* XXX: suppress this malloc */
  325. buf1= (uint8_t*) av_malloc( size * sizeof(uint8_t) );
  326. write_packet_header(s, stream, size, !!(flags & PKT_FLAG_KEY));
  327. /* for AC3, the words seems to be reversed */
  328. for(i=0;i<size;i+=2) {
  329. buf1[i] = buf[i+1];
  330. buf1[i+1] = buf[i];
  331. }
  332. put_buffer(pb, buf1, size);
  333. put_flush_packet(pb);
  334. stream->nb_frames++;
  335. av_free(buf1);
  336. return 0;
  337. }
  338. static int rm_write_video(AVFormatContext *s, const uint8_t *buf, int size, int flags)
  339. {
  340. RMContext *rm = s->priv_data;
  341. ByteIOContext *pb = &s->pb;
  342. StreamInfo *stream = rm->video_stream;
  343. int key_frame = !!(flags & PKT_FLAG_KEY);
  344. /* XXX: this is incorrect: should be a parameter */
  345. /* Well, I spent some time finding the meaning of these bits. I am
  346. not sure I understood everything, but it works !! */
  347. #if 1
  348. write_packet_header(s, stream, size + 7, key_frame);
  349. /* bit 7: '1' if final packet of a frame converted in several packets */
  350. put_byte(pb, 0x81);
  351. /* bit 7: '1' if I frame. bits 6..0 : sequence number in current
  352. frame starting from 1 */
  353. if (key_frame) {
  354. put_byte(pb, 0x81);
  355. } else {
  356. put_byte(pb, 0x01);
  357. }
  358. put_be16(pb, 0x4000 + (size)); /* total frame size */
  359. put_be16(pb, 0x4000 + (size)); /* offset from the start or the end */
  360. #else
  361. /* full frame */
  362. write_packet_header(s, size + 6);
  363. put_byte(pb, 0xc0);
  364. put_be16(pb, 0x4000 + size); /* total frame size */
  365. put_be16(pb, 0x4000 + packet_number * 126); /* position in stream */
  366. #endif
  367. put_byte(pb, stream->nb_frames & 0xff);
  368. put_buffer(pb, buf, size);
  369. put_flush_packet(pb);
  370. stream->nb_frames++;
  371. return 0;
  372. }
  373. static int rm_write_packet(AVFormatContext *s, AVPacket *pkt)
  374. {
  375. if (s->streams[pkt->stream_index]->codec->codec_type ==
  376. CODEC_TYPE_AUDIO)
  377. return rm_write_audio(s, pkt->data, pkt->size, pkt->flags);
  378. else
  379. return rm_write_video(s, pkt->data, pkt->size, pkt->flags);
  380. }
  381. static int rm_write_trailer(AVFormatContext *s)
  382. {
  383. RMContext *rm = s->priv_data;
  384. int data_size, index_pos, i;
  385. ByteIOContext *pb = &s->pb;
  386. if (!url_is_streamed(&s->pb)) {
  387. /* end of file: finish to write header */
  388. index_pos = url_fseek(pb, 0, SEEK_CUR);
  389. data_size = index_pos - rm->data_pos;
  390. /* index */
  391. put_tag(pb, "INDX");
  392. put_be32(pb, 10 + 10 * s->nb_streams);
  393. put_be16(pb, 0);
  394. for(i=0;i<s->nb_streams;i++) {
  395. put_be32(pb, 0); /* zero indices */
  396. put_be16(pb, i); /* stream number */
  397. put_be32(pb, 0); /* next index */
  398. }
  399. /* undocumented end header */
  400. put_be32(pb, 0);
  401. put_be32(pb, 0);
  402. url_fseek(pb, 0, SEEK_SET);
  403. for(i=0;i<s->nb_streams;i++)
  404. rm->streams[i].total_frames = rm->streams[i].nb_frames;
  405. rv10_write_header(s, data_size, index_pos);
  406. } else {
  407. /* undocumented end header */
  408. put_be32(pb, 0);
  409. put_be32(pb, 0);
  410. }
  411. put_flush_packet(pb);
  412. return 0;
  413. }
  414. #endif //CONFIG_MUXERS
  415. /***************************************************/
  416. static void get_str(ByteIOContext *pb, char *buf, int buf_size)
  417. {
  418. int len, i;
  419. char *q;
  420. len = get_be16(pb);
  421. q = buf;
  422. for(i=0;i<len;i++) {
  423. if (i < buf_size - 1)
  424. *q++ = get_byte(pb);
  425. }
  426. *q = '\0';
  427. }
  428. static void get_str8(ByteIOContext *pb, char *buf, int buf_size)
  429. {
  430. int len, i;
  431. char *q;
  432. len = get_byte(pb);
  433. q = buf;
  434. for(i=0;i<len;i++) {
  435. if (i < buf_size - 1)
  436. *q++ = get_byte(pb);
  437. }
  438. *q = '\0';
  439. }
  440. static int rm_read_audio_stream_info(AVFormatContext *s, AVStream *st,
  441. int read_all)
  442. {
  443. RMContext *rm = s->priv_data;
  444. ByteIOContext *pb = &s->pb;
  445. char buf[256];
  446. uint32_t version;
  447. int i;
  448. /* ra type header */
  449. version = get_be32(pb); /* version */
  450. if (((version >> 16) & 0xff) == 3) {
  451. int64_t startpos = url_ftell(pb);
  452. /* very old version */
  453. for(i = 0; i < 14; i++)
  454. get_byte(pb);
  455. get_str8(pb, s->title, sizeof(s->title));
  456. get_str8(pb, s->author, sizeof(s->author));
  457. get_str8(pb, s->copyright, sizeof(s->copyright));
  458. get_str8(pb, s->comment, sizeof(s->comment));
  459. if ((startpos + (version & 0xffff)) >= url_ftell(pb) + 2) {
  460. // fourcc (should always be "lpcJ")
  461. get_byte(pb);
  462. get_str8(pb, buf, sizeof(buf));
  463. }
  464. // Skip extra header crap (this should never happen)
  465. if ((startpos + (version & 0xffff)) > url_ftell(pb))
  466. url_fskip(pb, (version & 0xffff) + startpos - url_ftell(pb));
  467. st->codec->sample_rate = 8000;
  468. st->codec->channels = 1;
  469. st->codec->codec_type = CODEC_TYPE_AUDIO;
  470. st->codec->codec_id = CODEC_ID_RA_144;
  471. } else {
  472. int flavor, sub_packet_h, coded_framesize, sub_packet_size;
  473. /* old version (4) */
  474. get_be32(pb); /* .ra4 */
  475. get_be32(pb); /* data size */
  476. get_be16(pb); /* version2 */
  477. get_be32(pb); /* header size */
  478. flavor= get_be16(pb); /* add codec info / flavor */
  479. rm->coded_framesize = coded_framesize = get_be32(pb); /* coded frame size */
  480. get_be32(pb); /* ??? */
  481. get_be32(pb); /* ??? */
  482. get_be32(pb); /* ??? */
  483. rm->sub_packet_h = sub_packet_h = get_be16(pb); /* 1 */
  484. st->codec->block_align= get_be16(pb); /* frame size */
  485. rm->sub_packet_size = sub_packet_size = get_be16(pb); /* sub packet size */
  486. get_be16(pb); /* ??? */
  487. if (((version >> 16) & 0xff) == 5) {
  488. get_be16(pb); get_be16(pb); get_be16(pb); }
  489. st->codec->sample_rate = get_be16(pb);
  490. get_be32(pb);
  491. st->codec->channels = get_be16(pb);
  492. if (((version >> 16) & 0xff) == 5) {
  493. get_be32(pb);
  494. buf[0] = get_byte(pb);
  495. buf[1] = get_byte(pb);
  496. buf[2] = get_byte(pb);
  497. buf[3] = get_byte(pb);
  498. buf[4] = 0;
  499. } else {
  500. get_str8(pb, buf, sizeof(buf)); /* desc */
  501. get_str8(pb, buf, sizeof(buf)); /* desc */
  502. }
  503. st->codec->codec_type = CODEC_TYPE_AUDIO;
  504. if (!strcmp(buf, "dnet")) {
  505. st->codec->codec_id = CODEC_ID_AC3;
  506. } else if (!strcmp(buf, "28_8")) {
  507. st->codec->codec_id = CODEC_ID_RA_288;
  508. st->codec->extradata_size= 0;
  509. rm->audio_framesize = st->codec->block_align;
  510. st->codec->block_align = coded_framesize;
  511. if(rm->audio_framesize >= UINT_MAX / sub_packet_h){
  512. av_log(s, AV_LOG_ERROR, "rm->audio_framesize * sub_packet_h too large\n");
  513. return -1;
  514. }
  515. rm->audiobuf = av_malloc(rm->audio_framesize * sub_packet_h);
  516. } else if (!strcmp(buf, "cook")) {
  517. int codecdata_length, i;
  518. get_be16(pb); get_byte(pb);
  519. if (((version >> 16) & 0xff) == 5)
  520. get_byte(pb);
  521. codecdata_length = get_be32(pb);
  522. if(codecdata_length + FF_INPUT_BUFFER_PADDING_SIZE <= (unsigned)codecdata_length){
  523. av_log(s, AV_LOG_ERROR, "codecdata_length too large\n");
  524. return -1;
  525. }
  526. st->codec->codec_id = CODEC_ID_COOK;
  527. st->codec->extradata_size= codecdata_length;
  528. st->codec->extradata= av_mallocz(st->codec->extradata_size + FF_INPUT_BUFFER_PADDING_SIZE);
  529. for(i = 0; i < codecdata_length; i++)
  530. ((uint8_t*)st->codec->extradata)[i] = get_byte(pb);
  531. rm->audio_framesize = st->codec->block_align;
  532. st->codec->block_align = rm->sub_packet_size;
  533. if(rm->audio_framesize >= UINT_MAX / sub_packet_h){
  534. av_log(s, AV_LOG_ERROR, "rm->audio_framesize * sub_packet_h too large\n");
  535. return -1;
  536. }
  537. rm->audiobuf = av_malloc(rm->audio_framesize * sub_packet_h);
  538. } else if (!strcmp(buf, "raac") || !strcmp(buf, "racp")) {
  539. int codecdata_length, i;
  540. get_be16(pb); get_byte(pb);
  541. if (((version >> 16) & 0xff) == 5)
  542. get_byte(pb);
  543. st->codec->codec_id = CODEC_ID_AAC;
  544. codecdata_length = get_be32(pb);
  545. if(codecdata_length + FF_INPUT_BUFFER_PADDING_SIZE <= (unsigned)codecdata_length){
  546. av_log(s, AV_LOG_ERROR, "codecdata_length too large\n");
  547. return -1;
  548. }
  549. if (codecdata_length >= 1) {
  550. st->codec->extradata_size = codecdata_length - 1;
  551. st->codec->extradata = av_mallocz(st->codec->extradata_size + FF_INPUT_BUFFER_PADDING_SIZE);
  552. get_byte(pb);
  553. for(i = 0; i < st->codec->extradata_size; i++)
  554. ((uint8_t*)st->codec->extradata)[i] = get_byte(pb);
  555. }
  556. } else {
  557. st->codec->codec_id = CODEC_ID_NONE;
  558. pstrcpy(st->codec->codec_name, sizeof(st->codec->codec_name),
  559. buf);
  560. }
  561. if (read_all) {
  562. get_byte(pb);
  563. get_byte(pb);
  564. get_byte(pb);
  565. get_str8(pb, s->title, sizeof(s->title));
  566. get_str8(pb, s->author, sizeof(s->author));
  567. get_str8(pb, s->copyright, sizeof(s->copyright));
  568. get_str8(pb, s->comment, sizeof(s->comment));
  569. }
  570. }
  571. return 0;
  572. }
  573. static int rm_read_header_old(AVFormatContext *s, AVFormatParameters *ap)
  574. {
  575. RMContext *rm = s->priv_data;
  576. AVStream *st;
  577. rm->old_format = 1;
  578. st = av_new_stream(s, 0);
  579. if (!st)
  580. return -1;
  581. return rm_read_audio_stream_info(s, st, 1);
  582. }
  583. static int rm_read_header(AVFormatContext *s, AVFormatParameters *ap)
  584. {
  585. RMContext *rm = s->priv_data;
  586. AVStream *st;
  587. ByteIOContext *pb = &s->pb;
  588. unsigned int tag, v;
  589. int tag_size, size, codec_data_size, i;
  590. int64_t codec_pos;
  591. unsigned int start_time, duration;
  592. char buf[128];
  593. int flags = 0;
  594. tag = get_le32(pb);
  595. if (tag == MKTAG('.', 'r', 'a', 0xfd)) {
  596. /* very old .ra format */
  597. return rm_read_header_old(s, ap);
  598. } else if (tag != MKTAG('.', 'R', 'M', 'F')) {
  599. return AVERROR_IO;
  600. }
  601. get_be32(pb); /* header size */
  602. get_be16(pb);
  603. get_be32(pb);
  604. get_be32(pb); /* number of headers */
  605. for(;;) {
  606. if (url_feof(pb))
  607. goto fail;
  608. tag = get_le32(pb);
  609. tag_size = get_be32(pb);
  610. get_be16(pb);
  611. #if 0
  612. printf("tag=%c%c%c%c (%08x) size=%d\n",
  613. (tag) & 0xff,
  614. (tag >> 8) & 0xff,
  615. (tag >> 16) & 0xff,
  616. (tag >> 24) & 0xff,
  617. tag,
  618. tag_size);
  619. #endif
  620. if (tag_size < 10 && tag != MKTAG('D', 'A', 'T', 'A'))
  621. goto fail;
  622. switch(tag) {
  623. case MKTAG('P', 'R', 'O', 'P'):
  624. /* file header */
  625. get_be32(pb); /* max bit rate */
  626. get_be32(pb); /* avg bit rate */
  627. get_be32(pb); /* max packet size */
  628. get_be32(pb); /* avg packet size */
  629. get_be32(pb); /* nb packets */
  630. get_be32(pb); /* duration */
  631. get_be32(pb); /* preroll */
  632. get_be32(pb); /* index offset */
  633. get_be32(pb); /* data offset */
  634. get_be16(pb); /* nb streams */
  635. flags = get_be16(pb); /* flags */
  636. break;
  637. case MKTAG('C', 'O', 'N', 'T'):
  638. get_str(pb, s->title, sizeof(s->title));
  639. get_str(pb, s->author, sizeof(s->author));
  640. get_str(pb, s->copyright, sizeof(s->copyright));
  641. get_str(pb, s->comment, sizeof(s->comment));
  642. break;
  643. case MKTAG('M', 'D', 'P', 'R'):
  644. st = av_new_stream(s, 0);
  645. if (!st)
  646. goto fail;
  647. st->id = get_be16(pb);
  648. get_be32(pb); /* max bit rate */
  649. st->codec->bit_rate = get_be32(pb); /* bit rate */
  650. get_be32(pb); /* max packet size */
  651. get_be32(pb); /* avg packet size */
  652. start_time = get_be32(pb); /* start time */
  653. get_be32(pb); /* preroll */
  654. duration = get_be32(pb); /* duration */
  655. st->start_time = start_time;
  656. st->duration = duration;
  657. get_str8(pb, buf, sizeof(buf)); /* desc */
  658. get_str8(pb, buf, sizeof(buf)); /* mimetype */
  659. codec_data_size = get_be32(pb);
  660. codec_pos = url_ftell(pb);
  661. st->codec->codec_type = CODEC_TYPE_DATA;
  662. av_set_pts_info(st, 64, 1, 1000);
  663. v = get_be32(pb);
  664. if (v == MKTAG(0xfd, 'a', 'r', '.')) {
  665. /* ra type header */
  666. if (rm_read_audio_stream_info(s, st, 0))
  667. return -1;
  668. } else {
  669. int fps, fps2;
  670. if (get_le32(pb) != MKTAG('V', 'I', 'D', 'O')) {
  671. fail1:
  672. av_log(st->codec, AV_LOG_ERROR, "Unsupported video codec\n");
  673. goto skip;
  674. }
  675. st->codec->codec_tag = get_le32(pb);
  676. // av_log(NULL, AV_LOG_DEBUG, "%X %X\n", st->codec->codec_tag, MKTAG('R', 'V', '2', '0'));
  677. if ( st->codec->codec_tag != MKTAG('R', 'V', '1', '0')
  678. && st->codec->codec_tag != MKTAG('R', 'V', '2', '0')
  679. && st->codec->codec_tag != MKTAG('R', 'V', '3', '0')
  680. && st->codec->codec_tag != MKTAG('R', 'V', '4', '0'))
  681. goto fail1;
  682. st->codec->width = get_be16(pb);
  683. st->codec->height = get_be16(pb);
  684. st->codec->time_base.num= 1;
  685. fps= get_be16(pb);
  686. st->codec->codec_type = CODEC_TYPE_VIDEO;
  687. get_be32(pb);
  688. fps2= get_be16(pb);
  689. get_be16(pb);
  690. st->codec->extradata_size= codec_data_size - (url_ftell(pb) - codec_pos);
  691. if(st->codec->extradata_size + FF_INPUT_BUFFER_PADDING_SIZE <= (unsigned)st->codec->extradata_size){
  692. //check is redundant as get_buffer() will catch this
  693. av_log(s, AV_LOG_ERROR, "st->codec->extradata_size too large\n");
  694. return -1;
  695. }
  696. st->codec->extradata= av_mallocz(st->codec->extradata_size + FF_INPUT_BUFFER_PADDING_SIZE);
  697. get_buffer(pb, st->codec->extradata, st->codec->extradata_size);
  698. // av_log(NULL, AV_LOG_DEBUG, "fps= %d fps2= %d\n", fps, fps2);
  699. st->codec->time_base.den = fps * st->codec->time_base.num;
  700. switch(((uint8_t*)st->codec->extradata)[4]>>4){
  701. case 1: st->codec->codec_id = CODEC_ID_RV10; break;
  702. case 2: st->codec->codec_id = CODEC_ID_RV20; break;
  703. case 3: st->codec->codec_id = CODEC_ID_RV30; break;
  704. case 4: st->codec->codec_id = CODEC_ID_RV40; break;
  705. default: goto fail1;
  706. }
  707. }
  708. skip:
  709. /* skip codec info */
  710. size = url_ftell(pb) - codec_pos;
  711. url_fskip(pb, codec_data_size - size);
  712. break;
  713. case MKTAG('D', 'A', 'T', 'A'):
  714. goto header_end;
  715. default:
  716. /* unknown tag: skip it */
  717. url_fskip(pb, tag_size - 10);
  718. break;
  719. }
  720. }
  721. header_end:
  722. rm->nb_packets = get_be32(pb); /* number of packets */
  723. if (!rm->nb_packets && (flags & 4))
  724. rm->nb_packets = 3600 * 25;
  725. get_be32(pb); /* next data header */
  726. return 0;
  727. fail:
  728. for(i=0;i<s->nb_streams;i++) {
  729. av_free(s->streams[i]);
  730. }
  731. return AVERROR_IO;
  732. }
  733. static int get_num(ByteIOContext *pb, int *len)
  734. {
  735. int n, n1;
  736. n = get_be16(pb);
  737. (*len)-=2;
  738. if (n >= 0x4000) {
  739. return n - 0x4000;
  740. } else {
  741. n1 = get_be16(pb);
  742. (*len)-=2;
  743. return (n << 16) | n1;
  744. }
  745. }
  746. /* multiple of 20 bytes for ra144 (ugly) */
  747. #define RAW_PACKET_SIZE 1000
  748. static int sync(AVFormatContext *s, int64_t *timestamp, int *flags, int *stream_index, int64_t *pos){
  749. RMContext *rm = s->priv_data;
  750. ByteIOContext *pb = &s->pb;
  751. int len, num, res, i;
  752. AVStream *st;
  753. uint32_t state=0xFFFFFFFF;
  754. while(!url_feof(pb)){
  755. *pos= url_ftell(pb);
  756. if(rm->remaining_len > 0){
  757. num= rm->current_stream;
  758. len= rm->remaining_len;
  759. *timestamp = AV_NOPTS_VALUE;
  760. *flags= 0;
  761. }else{
  762. state= (state<<8) + get_byte(pb);
  763. if(state == MKBETAG('I', 'N', 'D', 'X')){
  764. len = get_be16(pb) - 6;
  765. if(len<0)
  766. continue;
  767. goto skip;
  768. }
  769. if(state > (unsigned)0xFFFF || state < 12)
  770. continue;
  771. len=state;
  772. state= 0xFFFFFFFF;
  773. num = get_be16(pb);
  774. *timestamp = get_be32(pb);
  775. res= get_byte(pb); /* reserved */
  776. *flags = get_byte(pb); /* flags */
  777. len -= 12;
  778. }
  779. for(i=0;i<s->nb_streams;i++) {
  780. st = s->streams[i];
  781. if (num == st->id)
  782. break;
  783. }
  784. if (i == s->nb_streams) {
  785. skip:
  786. /* skip packet if unknown number */
  787. url_fskip(pb, len);
  788. rm->remaining_len -= len;
  789. continue;
  790. }
  791. *stream_index= i;
  792. return len;
  793. }
  794. return -1;
  795. }
  796. static int rm_read_packet(AVFormatContext *s, AVPacket *pkt)
  797. {
  798. RMContext *rm = s->priv_data;
  799. ByteIOContext *pb = &s->pb;
  800. AVStream *st;
  801. int i, len, tmp, j;
  802. int64_t timestamp, pos;
  803. uint8_t *ptr;
  804. int flags;
  805. if (rm->audio_pkt_cnt) {
  806. // If there are queued audio packet return them first
  807. st = s->streams[rm->audio_stream_num];
  808. if (st->codec->codec_id == CODEC_ID_AAC)
  809. av_get_packet(pb, pkt, rm->sub_packet_lengths[rm->sub_packet_cnt - rm->audio_pkt_cnt]);
  810. else {
  811. av_new_packet(pkt, st->codec->block_align);
  812. memcpy(pkt->data, rm->audiobuf + st->codec->block_align *
  813. (rm->sub_packet_h * rm->audio_framesize / st->codec->block_align - rm->audio_pkt_cnt),
  814. st->codec->block_align);
  815. }
  816. rm->audio_pkt_cnt--;
  817. pkt->flags = 0;
  818. pkt->stream_index = rm->audio_stream_num;
  819. } else if (rm->old_format) {
  820. st = s->streams[0];
  821. if (st->codec->codec_id == CODEC_ID_RA_288) {
  822. int x, y;
  823. for (y = 0; y < rm->sub_packet_h; y++)
  824. for (x = 0; x < rm->sub_packet_h/2; x++)
  825. if (get_buffer(pb, rm->audiobuf+x*2*rm->audio_framesize+y*rm->coded_framesize, rm->coded_framesize) <= 0)
  826. return AVERROR_IO;
  827. rm->audio_stream_num = 0;
  828. rm->audio_pkt_cnt = rm->sub_packet_h * rm->audio_framesize / st->codec->block_align - 1;
  829. // Release first audio packet
  830. av_new_packet(pkt, st->codec->block_align);
  831. memcpy(pkt->data, rm->audiobuf, st->codec->block_align);
  832. pkt->flags |= PKT_FLAG_KEY; // Mark first packet as keyframe
  833. pkt->stream_index = 0;
  834. } else {
  835. /* just read raw bytes */
  836. len = RAW_PACKET_SIZE;
  837. len= av_get_packet(pb, pkt, len);
  838. pkt->stream_index = 0;
  839. if (len <= 0) {
  840. return AVERROR_IO;
  841. }
  842. pkt->size = len;
  843. }
  844. } else {
  845. int seq=1;
  846. resync:
  847. len=sync(s, &timestamp, &flags, &i, &pos);
  848. if(len<0)
  849. return AVERROR_IO;
  850. st = s->streams[i];
  851. if (st->codec->codec_type == CODEC_TYPE_VIDEO) {
  852. int h, pic_num, len2, pos;
  853. h= get_byte(pb); len--;
  854. if(!(h & 0x40)){
  855. seq = get_byte(pb); len--;
  856. }
  857. if((h & 0xc0) == 0x40){
  858. len2= pos= 0;
  859. }else{
  860. len2 = get_num(pb, &len);
  861. pos = get_num(pb, &len);
  862. }
  863. /* picture number */
  864. pic_num= get_byte(pb); len--;
  865. rm->remaining_len= len;
  866. rm->current_stream= st->id;
  867. // av_log(NULL, AV_LOG_DEBUG, "%X len:%d pos:%d len2:%d pic_num:%d\n",h, len, pos, len2, pic_num);
  868. if(len2 && len2<len)
  869. len=len2;
  870. rm->remaining_len-= len;
  871. av_get_packet(pb, pkt, len);
  872. }
  873. if (st->codec->codec_type == CODEC_TYPE_AUDIO) {
  874. if ((st->codec->codec_id == CODEC_ID_RA_288) ||
  875. (st->codec->codec_id == CODEC_ID_COOK)) {
  876. int x;
  877. int sps = rm->sub_packet_size;
  878. int cfs = rm->coded_framesize;
  879. int h = rm->sub_packet_h;
  880. int y = rm->sub_packet_cnt;
  881. int w = rm->audio_framesize;
  882. if (flags & 2)
  883. y = rm->sub_packet_cnt = 0;
  884. if (!y)
  885. rm->audiotimestamp = timestamp;
  886. switch(st->codec->codec_id) {
  887. case CODEC_ID_RA_288:
  888. for (x = 0; x < h/2; x++)
  889. get_buffer(pb, rm->audiobuf+x*2*w+y*cfs, cfs);
  890. break;
  891. case CODEC_ID_COOK:
  892. for (x = 0; x < w/sps; x++)
  893. get_buffer(pb, rm->audiobuf+sps*(h*x+((h+1)/2)*(y&1)+(y>>1)), sps);
  894. break;
  895. }
  896. if (++(rm->sub_packet_cnt) < h)
  897. goto resync;
  898. else {
  899. rm->sub_packet_cnt = 0;
  900. rm->audio_stream_num = i;
  901. rm->audio_pkt_cnt = h * w / st->codec->block_align - 1;
  902. // Release first audio packet
  903. av_new_packet(pkt, st->codec->block_align);
  904. memcpy(pkt->data, rm->audiobuf, st->codec->block_align);
  905. timestamp = rm->audiotimestamp;
  906. flags = 2; // Mark first packet as keyframe
  907. }
  908. } else if (st->codec->codec_id == CODEC_ID_AAC) {
  909. int x;
  910. rm->audio_stream_num = i;
  911. rm->sub_packet_cnt = (get_be16(pb) & 0xf0) >> 4;
  912. if (rm->sub_packet_cnt) {
  913. for (x = 0; x < rm->sub_packet_cnt; x++)
  914. rm->sub_packet_lengths[x] = get_be16(pb);
  915. // Release first audio packet
  916. rm->audio_pkt_cnt = rm->sub_packet_cnt - 1;
  917. av_get_packet(pb, pkt, rm->sub_packet_lengths[0]);
  918. flags = 2; // Mark first packet as keyframe
  919. }
  920. } else
  921. av_get_packet(pb, pkt, len);
  922. }
  923. if( (st->discard >= AVDISCARD_NONKEY && !(flags&2))
  924. || st->discard >= AVDISCARD_ALL){
  925. av_free_packet(pkt);
  926. goto resync;
  927. }
  928. pkt->stream_index = i;
  929. #if 0
  930. if (st->codec->codec_type == CODEC_TYPE_VIDEO) {
  931. if(st->codec->codec_id == CODEC_ID_RV20){
  932. int seq= 128*(pkt->data[2]&0x7F) + (pkt->data[3]>>1);
  933. av_log(NULL, AV_LOG_DEBUG, "%d %"PRId64" %d\n", timestamp, timestamp*512LL/25, seq);
  934. seq |= (timestamp&~0x3FFF);
  935. if(seq - timestamp > 0x2000) seq -= 0x4000;
  936. if(seq - timestamp < -0x2000) seq += 0x4000;
  937. }
  938. }
  939. #endif
  940. pkt->pts= timestamp;
  941. if(flags&2){
  942. pkt->flags |= PKT_FLAG_KEY;
  943. if((seq&0x7F) == 1)
  944. av_add_index_entry(st, pos, timestamp, 0, 0, AVINDEX_KEYFRAME);
  945. }
  946. }
  947. /* for AC3, needs to swap bytes */
  948. if (st->codec->codec_id == CODEC_ID_AC3) {
  949. ptr = pkt->data;
  950. for(j=0;j<len;j+=2) {
  951. tmp = ptr[0];
  952. ptr[0] = ptr[1];
  953. ptr[1] = tmp;
  954. ptr += 2;
  955. }
  956. }
  957. return 0;
  958. }
  959. static int rm_read_close(AVFormatContext *s)
  960. {
  961. RMContext *rm = s->priv_data;
  962. av_free(rm->audiobuf);
  963. return 0;
  964. }
  965. static int rm_probe(AVProbeData *p)
  966. {
  967. /* check file header */
  968. if (p->buf_size <= 32)
  969. return 0;
  970. if ((p->buf[0] == '.' && p->buf[1] == 'R' &&
  971. p->buf[2] == 'M' && p->buf[3] == 'F' &&
  972. p->buf[4] == 0 && p->buf[5] == 0) ||
  973. (p->buf[0] == '.' && p->buf[1] == 'r' &&
  974. p->buf[2] == 'a' && p->buf[3] == 0xfd))
  975. return AVPROBE_SCORE_MAX;
  976. else
  977. return 0;
  978. }
  979. static int64_t rm_read_dts(AVFormatContext *s, int stream_index,
  980. int64_t *ppos, int64_t pos_limit)
  981. {
  982. RMContext *rm = s->priv_data;
  983. int64_t pos, dts;
  984. int stream_index2, flags, len, h;
  985. pos = *ppos;
  986. if(rm->old_format)
  987. return AV_NOPTS_VALUE;
  988. url_fseek(&s->pb, pos, SEEK_SET);
  989. rm->remaining_len=0;
  990. for(;;){
  991. int seq=1;
  992. AVStream *st;
  993. len=sync(s, &dts, &flags, &stream_index2, &pos);
  994. if(len<0)
  995. return AV_NOPTS_VALUE;
  996. st = s->streams[stream_index2];
  997. if (st->codec->codec_type == CODEC_TYPE_VIDEO) {
  998. h= get_byte(&s->pb); len--;
  999. if(!(h & 0x40)){
  1000. seq = get_byte(&s->pb); len--;
  1001. }
  1002. }
  1003. if((flags&2) && (seq&0x7F) == 1){
  1004. // av_log(s, AV_LOG_DEBUG, "%d %d-%d %"PRId64" %d\n", flags, stream_index2, stream_index, dts, seq);
  1005. av_add_index_entry(st, pos, dts, 0, 0, AVINDEX_KEYFRAME);
  1006. if(stream_index2 == stream_index)
  1007. break;
  1008. }
  1009. url_fskip(&s->pb, len);
  1010. }
  1011. *ppos = pos;
  1012. return dts;
  1013. }
  #if defined(CONFIG_RM_DEMUXER)
  /*
   * Registration entry for the RM demuxer. The initializer is positional, so
   * the values below must stay in the field order of AVInputFormat.
   */
  AVInputFormat rm_demuxer = {
      "rm",                /* format name */
      "rm format",         /* descriptive name */
      sizeof (RMContext),  /* size of the private context */
      rm_probe,            /* signature check */
      rm_read_header,
      rm_read_packet,
      rm_read_close,
      NULL,                /* slot left empty -- presumably the seek hook; confirm against AVInputFormat */
      rm_read_dts,         /* timestamp lookup */
  };
  #endif /* CONFIG_RM_DEMUXER */
  #if defined(CONFIG_RM_MUXER)
  /*
   * Registration entry for the RM muxer. The initializer is positional, so
   * the values below must stay in the field order of AVOutputFormat.
   */
  AVOutputFormat rm_muxer = {
      "rm",                            /* format name */
      "rm format",                     /* descriptive name */
      "application/vnd.rn-realmedia",  /* MIME type */
      "rm,ra",                         /* presumably the file extensions; confirm against AVOutputFormat */
      sizeof (RMContext),              /* size of the private context */
      CODEC_ID_AC3,                    /* presumably the default audio codec; confirm */
      CODEC_ID_RV10,                   /* presumably the default video codec; confirm */
      rm_write_header,
      rm_write_packet,
      rm_write_trailer,
  };
  #endif /* CONFIG_RM_MUXER */