You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

473 lines
15KB

  1. /*
  2. * "Real" compatible muxer.
  3. * Copyright (c) 2000, 2001 Fabrice Bellard
  4. *
  5. * This file is part of FFmpeg.
  6. *
  7. * FFmpeg is free software; you can redistribute it and/or
  8. * modify it under the terms of the GNU Lesser General Public
  9. * License as published by the Free Software Foundation; either
  10. * version 2.1 of the License, or (at your option) any later version.
  11. *
  12. * FFmpeg is distributed in the hope that it will be useful,
  13. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  15. * Lesser General Public License for more details.
  16. *
  17. * You should have received a copy of the GNU Lesser General Public
  18. * License along with FFmpeg; if not, write to the Free Software
  19. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  20. */
  21. #include "avformat.h"
  22. #include "rm.h"
  23. typedef struct {
  24. int nb_packets;
  25. int packet_total_size;
  26. int packet_max_size;
  27. /* codec related output */
  28. int bit_rate;
  29. float frame_rate;
  30. int nb_frames; /* current frame number */
  31. int total_frames; /* total number of frames */
  32. int num;
  33. AVCodecContext *enc;
  34. } StreamInfo;
  35. typedef struct {
  36. StreamInfo streams[2];
  37. StreamInfo *audio_stream, *video_stream;
  38. int data_pos; /* position of the data after the header */
  39. } RMMuxContext;
  /* Value written into the "preroll" fields of the PROP and MDPR headers, in ms. */
  #define BUFFER_DURATION 0
  42. static void put_str(ByteIOContext *s, const char *tag)
  43. {
  44. put_be16(s,strlen(tag));
  45. while (*tag) {
  46. put_byte(s, *tag++);
  47. }
  48. }
  49. static void put_str8(ByteIOContext *s, const char *tag)
  50. {
  51. put_byte(s, strlen(tag));
  52. while (*tag) {
  53. put_byte(s, *tag++);
  54. }
  55. }
  56. static int rv10_write_header(AVFormatContext *ctx,
  57. int data_size, int index_pos)
  58. {
  59. RMMuxContext *rm = ctx->priv_data;
  60. ByteIOContext *s = ctx->pb;
  61. StreamInfo *stream;
  62. unsigned char *data_offset_ptr, *start_ptr;
  63. const char *desc, *mimetype;
  64. int nb_packets, packet_total_size, packet_max_size, size, packet_avg_size, i;
  65. int bit_rate, v, duration, flags, data_pos;
  66. AVMetadataTag *tag;
  67. start_ptr = s->buf_ptr;
  68. put_tag(s, ".RMF");
  69. put_be32(s,18); /* header size */
  70. put_be16(s,0);
  71. put_be32(s,0);
  72. put_be32(s,4 + ctx->nb_streams); /* num headers */
  73. put_tag(s,"PROP");
  74. put_be32(s, 50);
  75. put_be16(s, 0);
  76. packet_max_size = 0;
  77. packet_total_size = 0;
  78. nb_packets = 0;
  79. bit_rate = 0;
  80. duration = 0;
  81. for(i=0;i<ctx->nb_streams;i++) {
  82. StreamInfo *stream = &rm->streams[i];
  83. bit_rate += stream->bit_rate;
  84. if (stream->packet_max_size > packet_max_size)
  85. packet_max_size = stream->packet_max_size;
  86. nb_packets += stream->nb_packets;
  87. packet_total_size += stream->packet_total_size;
  88. /* select maximum duration */
  89. v = (int) (1000.0 * (float)stream->total_frames / stream->frame_rate);
  90. if (v > duration)
  91. duration = v;
  92. }
  93. put_be32(s, bit_rate); /* max bit rate */
  94. put_be32(s, bit_rate); /* avg bit rate */
  95. put_be32(s, packet_max_size); /* max packet size */
  96. if (nb_packets > 0)
  97. packet_avg_size = packet_total_size / nb_packets;
  98. else
  99. packet_avg_size = 0;
  100. put_be32(s, packet_avg_size); /* avg packet size */
  101. put_be32(s, nb_packets); /* num packets */
  102. put_be32(s, duration); /* duration */
  103. put_be32(s, BUFFER_DURATION); /* preroll */
  104. put_be32(s, index_pos); /* index offset */
  105. /* computation of data the data offset */
  106. data_offset_ptr = s->buf_ptr;
  107. put_be32(s, 0); /* data offset : will be patched after */
  108. put_be16(s, ctx->nb_streams); /* num streams */
  109. flags = 1 | 2; /* save allowed & perfect play */
  110. if (url_is_streamed(s))
  111. flags |= 4; /* live broadcast */
  112. put_be16(s, flags);
  113. /* comments */
  114. put_tag(s,"CONT");
  115. size = 4 * 2 + 10;
  116. for(i=0; i<FF_ARRAY_ELEMS(ff_rm_metadata); i++) {
  117. tag = av_metadata_get(ctx->metadata, ff_rm_metadata[i], NULL, 0);
  118. if(tag) size += strlen(tag->value);
  119. }
  120. put_be32(s,size);
  121. put_be16(s,0);
  122. for(i=0; i<FF_ARRAY_ELEMS(ff_rm_metadata); i++) {
  123. tag = av_metadata_get(ctx->metadata, ff_rm_metadata[i], NULL, 0);
  124. put_str(s, tag ? tag->value : "");
  125. }
  126. for(i=0;i<ctx->nb_streams;i++) {
  127. int codec_data_size;
  128. stream = &rm->streams[i];
  129. if (stream->enc->codec_type == AVMEDIA_TYPE_AUDIO) {
  130. desc = "The Audio Stream";
  131. mimetype = "audio/x-pn-realaudio";
  132. codec_data_size = 73;
  133. } else {
  134. desc = "The Video Stream";
  135. mimetype = "video/x-pn-realvideo";
  136. codec_data_size = 34;
  137. }
  138. put_tag(s,"MDPR");
  139. size = 10 + 9 * 4 + strlen(desc) + strlen(mimetype) + codec_data_size;
  140. put_be32(s, size);
  141. put_be16(s, 0);
  142. put_be16(s, i); /* stream number */
  143. put_be32(s, stream->bit_rate); /* max bit rate */
  144. put_be32(s, stream->bit_rate); /* avg bit rate */
  145. put_be32(s, stream->packet_max_size); /* max packet size */
  146. if (stream->nb_packets > 0)
  147. packet_avg_size = stream->packet_total_size /
  148. stream->nb_packets;
  149. else
  150. packet_avg_size = 0;
  151. put_be32(s, packet_avg_size); /* avg packet size */
  152. put_be32(s, 0); /* start time */
  153. put_be32(s, BUFFER_DURATION); /* preroll */
  154. /* duration */
  155. if (url_is_streamed(s) || !stream->total_frames)
  156. put_be32(s, (int)(3600 * 1000));
  157. else
  158. put_be32(s, (int)(stream->total_frames * 1000 / stream->frame_rate));
  159. put_str8(s, desc);
  160. put_str8(s, mimetype);
  161. put_be32(s, codec_data_size);
  162. if (stream->enc->codec_type == AVMEDIA_TYPE_AUDIO) {
  163. int coded_frame_size, fscode, sample_rate;
  164. sample_rate = stream->enc->sample_rate;
  165. coded_frame_size = (stream->enc->bit_rate *
  166. stream->enc->frame_size) / (8 * sample_rate);
  167. /* audio codec info */
  168. put_tag(s, ".ra");
  169. put_byte(s, 0xfd);
  170. put_be32(s, 0x00040000); /* version */
  171. put_tag(s, ".ra4");
  172. put_be32(s, 0x01b53530); /* stream length */
  173. put_be16(s, 4); /* unknown */
  174. put_be32(s, 0x39); /* header size */
  175. switch(sample_rate) {
  176. case 48000:
  177. case 24000:
  178. case 12000:
  179. fscode = 1;
  180. break;
  181. default:
  182. case 44100:
  183. case 22050:
  184. case 11025:
  185. fscode = 2;
  186. break;
  187. case 32000:
  188. case 16000:
  189. case 8000:
  190. fscode = 3;
  191. }
  192. put_be16(s, fscode); /* codec additional info, for AC-3, seems
  193. to be a frequency code */
  194. /* special hack to compensate rounding errors... */
  195. if (coded_frame_size == 557)
  196. coded_frame_size--;
  197. put_be32(s, coded_frame_size); /* frame length */
  198. put_be32(s, 0x51540); /* unknown */
  199. put_be32(s, 0x249f0); /* unknown */
  200. put_be32(s, 0x249f0); /* unknown */
  201. put_be16(s, 0x01);
  202. /* frame length : seems to be very important */
  203. put_be16(s, coded_frame_size);
  204. put_be32(s, 0); /* unknown */
  205. put_be16(s, stream->enc->sample_rate); /* sample rate */
  206. put_be32(s, 0x10); /* unknown */
  207. put_be16(s, stream->enc->channels);
  208. put_str8(s, "Int0"); /* codec name */
  209. if (stream->enc->codec_tag) {
  210. put_byte(s, 4); /* tag length */
  211. put_le32(s, stream->enc->codec_tag);
  212. } else {
  213. av_log(ctx, AV_LOG_ERROR, "Invalid codec tag\n");
  214. return -1;
  215. }
  216. put_be16(s, 0); /* title length */
  217. put_be16(s, 0); /* author length */
  218. put_be16(s, 0); /* copyright length */
  219. put_byte(s, 0); /* end of header */
  220. } else {
  221. /* video codec info */
  222. put_be32(s,34); /* size */
  223. if(stream->enc->codec_id == CODEC_ID_RV10)
  224. put_tag(s,"VIDORV10");
  225. else
  226. put_tag(s,"VIDORV20");
  227. put_be16(s, stream->enc->width);
  228. put_be16(s, stream->enc->height);
  229. put_be16(s, (int) stream->frame_rate); /* frames per seconds ? */
  230. put_be32(s,0); /* unknown meaning */
  231. put_be16(s, (int) stream->frame_rate); /* unknown meaning */
  232. put_be32(s,0); /* unknown meaning */
  233. put_be16(s, 8); /* unknown meaning */
  234. /* Seems to be the codec version: only use basic H263. The next
  235. versions seems to add a diffential DC coding as in
  236. MPEG... nothing new under the sun */
  237. if(stream->enc->codec_id == CODEC_ID_RV10)
  238. put_be32(s,0x10000000);
  239. else
  240. put_be32(s,0x20103001);
  241. //put_be32(s,0x10003000);
  242. }
  243. }
  244. /* patch data offset field */
  245. data_pos = s->buf_ptr - start_ptr;
  246. rm->data_pos = data_pos;
  247. data_offset_ptr[0] = data_pos >> 24;
  248. data_offset_ptr[1] = data_pos >> 16;
  249. data_offset_ptr[2] = data_pos >> 8;
  250. data_offset_ptr[3] = data_pos;
  251. /* data stream */
  252. put_tag(s,"DATA");
  253. put_be32(s,data_size + 10 + 8);
  254. put_be16(s,0);
  255. put_be32(s, nb_packets); /* number of packets */
  256. put_be32(s,0); /* next data header */
  257. return 0;
  258. }
  259. static void write_packet_header(AVFormatContext *ctx, StreamInfo *stream,
  260. int length, int key_frame)
  261. {
  262. int timestamp;
  263. ByteIOContext *s = ctx->pb;
  264. stream->nb_packets++;
  265. stream->packet_total_size += length;
  266. if (length > stream->packet_max_size)
  267. stream->packet_max_size = length;
  268. put_be16(s,0); /* version */
  269. put_be16(s,length + 12);
  270. put_be16(s, stream->num); /* stream number */
  271. timestamp = (1000 * (float)stream->nb_frames) / stream->frame_rate;
  272. put_be32(s, timestamp); /* timestamp */
  273. put_byte(s, 0); /* reserved */
  274. put_byte(s, key_frame ? 2 : 0); /* flags */
  275. }
  276. static int rm_write_header(AVFormatContext *s)
  277. {
  278. RMMuxContext *rm = s->priv_data;
  279. StreamInfo *stream;
  280. int n;
  281. AVCodecContext *codec;
  282. for(n=0;n<s->nb_streams;n++) {
  283. s->streams[n]->id = n;
  284. codec = s->streams[n]->codec;
  285. stream = &rm->streams[n];
  286. memset(stream, 0, sizeof(StreamInfo));
  287. stream->num = n;
  288. stream->bit_rate = codec->bit_rate;
  289. stream->enc = codec;
  290. switch(codec->codec_type) {
  291. case AVMEDIA_TYPE_AUDIO:
  292. rm->audio_stream = stream;
  293. stream->frame_rate = (float)codec->sample_rate / (float)codec->frame_size;
  294. /* XXX: dummy values */
  295. stream->packet_max_size = 1024;
  296. stream->nb_packets = 0;
  297. stream->total_frames = stream->nb_packets;
  298. break;
  299. case AVMEDIA_TYPE_VIDEO:
  300. rm->video_stream = stream;
  301. stream->frame_rate = (float)codec->time_base.den / (float)codec->time_base.num;
  302. /* XXX: dummy values */
  303. stream->packet_max_size = 4096;
  304. stream->nb_packets = 0;
  305. stream->total_frames = stream->nb_packets;
  306. break;
  307. default:
  308. return -1;
  309. }
  310. }
  311. if (rv10_write_header(s, 0, 0))
  312. return AVERROR_INVALIDDATA;
  313. put_flush_packet(s->pb);
  314. return 0;
  315. }
  316. static int rm_write_audio(AVFormatContext *s, const uint8_t *buf, int size, int flags)
  317. {
  318. uint8_t *buf1;
  319. RMMuxContext *rm = s->priv_data;
  320. ByteIOContext *pb = s->pb;
  321. StreamInfo *stream = rm->audio_stream;
  322. int i;
  323. /* XXX: suppress this malloc */
  324. buf1= (uint8_t*) av_malloc( size * sizeof(uint8_t) );
  325. write_packet_header(s, stream, size, !!(flags & AV_PKT_FLAG_KEY));
  326. if (stream->enc->codec_id == CODEC_ID_AC3) {
  327. /* for AC-3, the words seem to be reversed */
  328. for(i=0;i<size;i+=2) {
  329. buf1[i] = buf[i+1];
  330. buf1[i+1] = buf[i];
  331. }
  332. put_buffer(pb, buf1, size);
  333. } else {
  334. put_buffer(pb, buf, size);
  335. }
  336. put_flush_packet(pb);
  337. stream->nb_frames++;
  338. av_free(buf1);
  339. return 0;
  340. }
  341. static int rm_write_video(AVFormatContext *s, const uint8_t *buf, int size, int flags)
  342. {
  343. RMMuxContext *rm = s->priv_data;
  344. ByteIOContext *pb = s->pb;
  345. StreamInfo *stream = rm->video_stream;
  346. int key_frame = !!(flags & AV_PKT_FLAG_KEY);
  347. /* XXX: this is incorrect: should be a parameter */
  348. /* Well, I spent some time finding the meaning of these bits. I am
  349. not sure I understood everything, but it works !! */
  350. #if 1
  351. write_packet_header(s, stream, size + 7 + (size >= 0x4000)*4, key_frame);
  352. /* bit 7: '1' if final packet of a frame converted in several packets */
  353. put_byte(pb, 0x81);
  354. /* bit 7: '1' if I frame. bits 6..0 : sequence number in current
  355. frame starting from 1 */
  356. if (key_frame) {
  357. put_byte(pb, 0x81);
  358. } else {
  359. put_byte(pb, 0x01);
  360. }
  361. if(size >= 0x4000){
  362. put_be32(pb, size); /* total frame size */
  363. put_be32(pb, size); /* offset from the start or the end */
  364. }else{
  365. put_be16(pb, 0x4000 | size); /* total frame size */
  366. put_be16(pb, 0x4000 | size); /* offset from the start or the end */
  367. }
  368. #else
  369. /* full frame */
  370. write_packet_header(s, size + 6);
  371. put_byte(pb, 0xc0);
  372. put_be16(pb, 0x4000 + size); /* total frame size */
  373. put_be16(pb, 0x4000 + packet_number * 126); /* position in stream */
  374. #endif
  375. put_byte(pb, stream->nb_frames & 0xff);
  376. put_buffer(pb, buf, size);
  377. put_flush_packet(pb);
  378. stream->nb_frames++;
  379. return 0;
  380. }
  381. static int rm_write_packet(AVFormatContext *s, AVPacket *pkt)
  382. {
  383. if (s->streams[pkt->stream_index]->codec->codec_type ==
  384. AVMEDIA_TYPE_AUDIO)
  385. return rm_write_audio(s, pkt->data, pkt->size, pkt->flags);
  386. else
  387. return rm_write_video(s, pkt->data, pkt->size, pkt->flags);
  388. }
  389. static int rm_write_trailer(AVFormatContext *s)
  390. {
  391. RMMuxContext *rm = s->priv_data;
  392. int data_size, index_pos, i;
  393. ByteIOContext *pb = s->pb;
  394. if (!url_is_streamed(s->pb)) {
  395. /* end of file: finish to write header */
  396. index_pos = url_fseek(pb, 0, SEEK_CUR);
  397. data_size = index_pos - rm->data_pos;
  398. /* FIXME: write index */
  399. /* undocumented end header */
  400. put_be32(pb, 0);
  401. put_be32(pb, 0);
  402. url_fseek(pb, 0, SEEK_SET);
  403. for(i=0;i<s->nb_streams;i++)
  404. rm->streams[i].total_frames = rm->streams[i].nb_frames;
  405. rv10_write_header(s, data_size, 0);
  406. } else {
  407. /* undocumented end header */
  408. put_be32(pb, 0);
  409. put_be32(pb, 0);
  410. }
  411. put_flush_packet(pb);
  412. return 0;
  413. }
  /*
   * Muxer description for the "rm" output format.
   * All members but the last are initialized positionally; their meaning is
   * given by the AVOutputFormat declaration, which is not part of this file
   * (NOTE(review): the per-line remarks below are presumed from the values).
   */
  AVOutputFormat rm_muxer = {
      "rm",                                       /* presumably the short format name */
      NULL_IF_CONFIG_SMALL("RealMedia format"),   /* presumably the descriptive name */
      "application/vnd.rn-realmedia",             /* presumably the MIME type */
      "rm,ra",                                    /* presumably the file extensions */
      sizeof(RMMuxContext),                       /* size of the private context */
      CODEC_ID_AC3,                               /* presumably the default audio codec */
      CODEC_ID_RV10,                              /* presumably the default video codec */
      rm_write_header,
      rm_write_packet,
      rm_write_trailer,
      .codec_tag= (const AVCodecTag* const []){ff_rm_codec_tags, 0},
  };