You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

474 lines
16KB

  1. /*
  2. * "Real" compatible muxer.
  3. * Copyright (c) 2000, 2001 Fabrice Bellard
  4. *
  5. * This file is part of Libav.
  6. *
  7. * Libav is free software; you can redistribute it and/or
  8. * modify it under the terms of the GNU Lesser General Public
  9. * License as published by the Free Software Foundation; either
  10. * version 2.1 of the License, or (at your option) any later version.
  11. *
  12. * Libav is distributed in the hope that it will be useful,
  13. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  15. * Lesser General Public License for more details.
  16. *
  17. * You should have received a copy of the GNU Lesser General Public
  18. * License along with Libav; if not, write to the Free Software
  19. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  20. */
  21. #include "avformat.h"
  22. #include "avio_internal.h"
  23. #include "rm.h"
  24. #include "libavutil/dict.h"
  25. typedef struct StreamInfo {
  26. int nb_packets;
  27. int packet_total_size;
  28. int packet_max_size;
  29. /* codec related output */
  30. int bit_rate;
  31. float frame_rate;
  32. int nb_frames; /* current frame number */
  33. int total_frames; /* total number of frames */
  34. int num;
  35. AVCodecParameters *par;
  36. } StreamInfo;
  37. typedef struct RMMuxContext {
  38. StreamInfo streams[2];
  39. StreamInfo *audio_stream, *video_stream;
  40. int data_pos; /* position of the data after the header */
  41. } RMMuxContext;
  42. /* in ms */
  43. #define BUFFER_DURATION 0
  44. /* the header needs at most 7 + 4 + 12 B */
  45. #define MAX_HEADER_SIZE (7 + 4 + 12)
  46. /* UINT16_MAX is the maximal chunk size */
  47. #define MAX_PACKET_SIZE (UINT16_MAX - MAX_HEADER_SIZE)
  48. static void put_str(AVIOContext *s, const char *tag)
  49. {
  50. avio_wb16(s,strlen(tag));
  51. while (*tag) {
  52. avio_w8(s, *tag++);
  53. }
  54. }
  55. static void put_str8(AVIOContext *s, const char *tag)
  56. {
  57. avio_w8(s, strlen(tag));
  58. while (*tag) {
  59. avio_w8(s, *tag++);
  60. }
  61. }
  62. static int rv10_write_header(AVFormatContext *ctx,
  63. int data_size, int index_pos)
  64. {
  65. RMMuxContext *rm = ctx->priv_data;
  66. AVIOContext *s = ctx->pb;
  67. StreamInfo *stream;
  68. unsigned char *data_offset_ptr, *start_ptr;
  69. const char *desc, *mimetype;
  70. int nb_packets, packet_total_size, packet_max_size, size, packet_avg_size, i;
  71. int bit_rate, v, duration, flags, data_pos;
  72. AVDictionaryEntry *tag;
  73. start_ptr = s->buf_ptr;
  74. ffio_wfourcc(s, ".RMF");
  75. avio_wb32(s,18); /* header size */
  76. avio_wb16(s,0);
  77. avio_wb32(s,0);
  78. avio_wb32(s,4 + ctx->nb_streams); /* num headers */
  79. ffio_wfourcc(s,"PROP");
  80. avio_wb32(s, 50);
  81. avio_wb16(s, 0);
  82. packet_max_size = 0;
  83. packet_total_size = 0;
  84. nb_packets = 0;
  85. bit_rate = 0;
  86. duration = 0;
  87. for(i=0;i<ctx->nb_streams;i++) {
  88. StreamInfo *stream = &rm->streams[i];
  89. bit_rate += stream->bit_rate;
  90. if (stream->packet_max_size > packet_max_size)
  91. packet_max_size = stream->packet_max_size;
  92. nb_packets += stream->nb_packets;
  93. packet_total_size += stream->packet_total_size;
  94. /* select maximum duration */
  95. v = (int) (1000.0 * (float)stream->total_frames / stream->frame_rate);
  96. if (v > duration)
  97. duration = v;
  98. }
  99. avio_wb32(s, bit_rate); /* max bit rate */
  100. avio_wb32(s, bit_rate); /* avg bit rate */
  101. avio_wb32(s, packet_max_size); /* max packet size */
  102. if (nb_packets > 0)
  103. packet_avg_size = packet_total_size / nb_packets;
  104. else
  105. packet_avg_size = 0;
  106. avio_wb32(s, packet_avg_size); /* avg packet size */
  107. avio_wb32(s, nb_packets); /* num packets */
  108. avio_wb32(s, duration); /* duration */
  109. avio_wb32(s, BUFFER_DURATION); /* preroll */
  110. avio_wb32(s, index_pos); /* index offset */
  111. /* computation of data the data offset */
  112. data_offset_ptr = s->buf_ptr;
  113. avio_wb32(s, 0); /* data offset : will be patched after */
  114. avio_wb16(s, ctx->nb_streams); /* num streams */
  115. flags = 1 | 2; /* save allowed & perfect play */
  116. if (!(s->seekable & AVIO_SEEKABLE_NORMAL))
  117. flags |= 4; /* live broadcast */
  118. avio_wb16(s, flags);
  119. /* comments */
  120. ffio_wfourcc(s,"CONT");
  121. size = 4 * 2 + 10;
  122. for(i=0; i<FF_ARRAY_ELEMS(ff_rm_metadata); i++) {
  123. tag = av_dict_get(ctx->metadata, ff_rm_metadata[i], NULL, 0);
  124. if(tag) size += strlen(tag->value);
  125. }
  126. avio_wb32(s,size);
  127. avio_wb16(s,0);
  128. for(i=0; i<FF_ARRAY_ELEMS(ff_rm_metadata); i++) {
  129. tag = av_dict_get(ctx->metadata, ff_rm_metadata[i], NULL, 0);
  130. put_str(s, tag ? tag->value : "");
  131. }
  132. for(i=0;i<ctx->nb_streams;i++) {
  133. int codec_data_size;
  134. stream = &rm->streams[i];
  135. if (stream->par->codec_type == AVMEDIA_TYPE_AUDIO) {
  136. desc = "The Audio Stream";
  137. mimetype = "audio/x-pn-realaudio";
  138. codec_data_size = 73;
  139. } else {
  140. desc = "The Video Stream";
  141. mimetype = "video/x-pn-realvideo";
  142. codec_data_size = 34;
  143. }
  144. ffio_wfourcc(s,"MDPR");
  145. size = 10 + 9 * 4 + strlen(desc) + strlen(mimetype) + codec_data_size;
  146. avio_wb32(s, size);
  147. avio_wb16(s, 0);
  148. avio_wb16(s, i); /* stream number */
  149. avio_wb32(s, stream->bit_rate); /* max bit rate */
  150. avio_wb32(s, stream->bit_rate); /* avg bit rate */
  151. avio_wb32(s, stream->packet_max_size); /* max packet size */
  152. if (stream->nb_packets > 0)
  153. packet_avg_size = stream->packet_total_size /
  154. stream->nb_packets;
  155. else
  156. packet_avg_size = 0;
  157. avio_wb32(s, packet_avg_size); /* avg packet size */
  158. avio_wb32(s, 0); /* start time */
  159. avio_wb32(s, BUFFER_DURATION); /* preroll */
  160. /* duration */
  161. if (!(s->seekable & AVIO_SEEKABLE_NORMAL) || !stream->total_frames)
  162. avio_wb32(s, (int)(3600 * 1000));
  163. else
  164. avio_wb32(s, (int)(stream->total_frames * 1000 / stream->frame_rate));
  165. put_str8(s, desc);
  166. put_str8(s, mimetype);
  167. avio_wb32(s, codec_data_size);
  168. if (stream->par->codec_type == AVMEDIA_TYPE_AUDIO) {
  169. int coded_frame_size, fscode, sample_rate;
  170. int frame_size = av_get_audio_frame_duration2(stream->par, 0);
  171. sample_rate = stream->par->sample_rate;
  172. coded_frame_size = (stream->par->bit_rate *
  173. frame_size) / (8 * sample_rate);
  174. /* audio codec info */
  175. avio_write(s, ".ra", 3);
  176. avio_w8(s, 0xfd);
  177. avio_wb32(s, 0x00040000); /* version */
  178. ffio_wfourcc(s, ".ra4");
  179. avio_wb32(s, 0x01b53530); /* stream length */
  180. avio_wb16(s, 4); /* unknown */
  181. avio_wb32(s, 0x39); /* header size */
  182. switch(sample_rate) {
  183. case 48000:
  184. case 24000:
  185. case 12000:
  186. fscode = 1;
  187. break;
  188. default:
  189. case 44100:
  190. case 22050:
  191. case 11025:
  192. fscode = 2;
  193. break;
  194. case 32000:
  195. case 16000:
  196. case 8000:
  197. fscode = 3;
  198. }
  199. avio_wb16(s, fscode); /* codec additional info, for AC-3, seems
  200. to be a frequency code */
  201. /* special hack to compensate rounding errors... */
  202. if (coded_frame_size == 557)
  203. coded_frame_size--;
  204. avio_wb32(s, coded_frame_size); /* frame length */
  205. avio_wb32(s, 0x51540); /* unknown */
  206. avio_wb32(s, 0x249f0); /* unknown */
  207. avio_wb32(s, 0x249f0); /* unknown */
  208. avio_wb16(s, 0x01);
  209. /* frame length : seems to be very important */
  210. avio_wb16(s, coded_frame_size);
  211. avio_wb32(s, 0); /* unknown */
  212. avio_wb16(s, stream->par->sample_rate); /* sample rate */
  213. avio_wb32(s, 0x10); /* unknown */
  214. avio_wb16(s, stream->par->channels);
  215. put_str8(s, "Int0"); /* codec name */
  216. if (stream->par->codec_tag) {
  217. avio_w8(s, 4); /* tag length */
  218. avio_wl32(s, stream->par->codec_tag);
  219. } else {
  220. av_log(ctx, AV_LOG_ERROR, "Invalid codec tag\n");
  221. return -1;
  222. }
  223. avio_wb16(s, 0); /* title length */
  224. avio_wb16(s, 0); /* author length */
  225. avio_wb16(s, 0); /* copyright length */
  226. avio_w8(s, 0); /* end of header */
  227. } else {
  228. /* video codec info */
  229. avio_wb32(s,34); /* size */
  230. ffio_wfourcc(s, "VIDO");
  231. if(stream->par->codec_id == AV_CODEC_ID_RV10)
  232. ffio_wfourcc(s,"RV10");
  233. else
  234. ffio_wfourcc(s,"RV20");
  235. avio_wb16(s, stream->par->width);
  236. avio_wb16(s, stream->par->height);
  237. avio_wb16(s, (int) stream->frame_rate); /* frames per seconds ? */
  238. avio_wb32(s,0); /* unknown meaning */
  239. avio_wb16(s, (int) stream->frame_rate); /* unknown meaning */
  240. avio_wb32(s,0); /* unknown meaning */
  241. avio_wb16(s, 8); /* unknown meaning */
  242. /* Seems to be the codec version: only use basic H.263. The next
  243. versions seems to add a differential DC coding as in
  244. MPEG... nothing new under the sun. */
  245. if(stream->par->codec_id == AV_CODEC_ID_RV10)
  246. avio_wb32(s,0x10000000);
  247. else
  248. avio_wb32(s,0x20103001);
  249. //avio_wb32(s,0x10003000);
  250. }
  251. }
  252. /* patch data offset field */
  253. data_pos = s->buf_ptr - start_ptr;
  254. rm->data_pos = data_pos;
  255. data_offset_ptr[0] = data_pos >> 24;
  256. data_offset_ptr[1] = data_pos >> 16;
  257. data_offset_ptr[2] = data_pos >> 8;
  258. data_offset_ptr[3] = data_pos;
  259. /* data stream */
  260. ffio_wfourcc(s, "DATA");
  261. avio_wb32(s,data_size + 10 + 8);
  262. avio_wb16(s,0);
  263. avio_wb32(s, nb_packets); /* number of packets */
  264. avio_wb32(s,0); /* next data header */
  265. return 0;
  266. }
  267. static void write_packet_header(AVFormatContext *ctx, StreamInfo *stream,
  268. int length, int key_frame)
  269. {
  270. int timestamp;
  271. AVIOContext *s = ctx->pb;
  272. stream->nb_packets++;
  273. stream->packet_total_size += length;
  274. if (length > stream->packet_max_size)
  275. stream->packet_max_size = length;
  276. avio_wb16(s,0); /* version */
  277. avio_wb16(s,length + 12);
  278. avio_wb16(s, stream->num); /* stream number */
  279. timestamp = (1000 * (float)stream->nb_frames) / stream->frame_rate;
  280. avio_wb32(s, timestamp); /* timestamp */
  281. avio_w8(s, 0); /* reserved */
  282. avio_w8(s, key_frame ? 2 : 0); /* flags */
  283. }
  284. static int rm_write_header(AVFormatContext *s)
  285. {
  286. RMMuxContext *rm = s->priv_data;
  287. StreamInfo *stream;
  288. int n;
  289. AVCodecParameters *par;
  290. for(n=0;n<s->nb_streams;n++) {
  291. AVStream *st = s->streams[n];
  292. int frame_size;
  293. s->streams[n]->id = n;
  294. par = s->streams[n]->codecpar;
  295. stream = &rm->streams[n];
  296. memset(stream, 0, sizeof(StreamInfo));
  297. stream->num = n;
  298. stream->bit_rate = par->bit_rate;
  299. stream->par = par;
  300. switch (par->codec_type) {
  301. case AVMEDIA_TYPE_AUDIO:
  302. rm->audio_stream = stream;
  303. frame_size = av_get_audio_frame_duration2(par, 0);
  304. stream->frame_rate = (float)par->sample_rate / (float)frame_size;
  305. /* XXX: dummy values */
  306. stream->packet_max_size = 1024;
  307. stream->nb_packets = 0;
  308. stream->total_frames = stream->nb_packets;
  309. break;
  310. case AVMEDIA_TYPE_VIDEO:
  311. rm->video_stream = stream;
  312. // TODO: should be avg_frame_rate
  313. stream->frame_rate = (float)st->time_base.den / (float)st->time_base.num;
  314. /* XXX: dummy values */
  315. stream->packet_max_size = 4096;
  316. stream->nb_packets = 0;
  317. stream->total_frames = stream->nb_packets;
  318. break;
  319. default:
  320. return -1;
  321. }
  322. }
  323. if (rv10_write_header(s, 0, 0))
  324. return AVERROR_INVALIDDATA;
  325. avio_flush(s->pb);
  326. return 0;
  327. }
  328. static int rm_write_audio(AVFormatContext *s, const uint8_t *buf, int size, int flags)
  329. {
  330. RMMuxContext *rm = s->priv_data;
  331. AVIOContext *pb = s->pb;
  332. StreamInfo *stream = rm->audio_stream;
  333. int i;
  334. write_packet_header(s, stream, size, !!(flags & AV_PKT_FLAG_KEY));
  335. if (stream->par->codec_id == AV_CODEC_ID_AC3) {
  336. /* for AC-3, the words seem to be reversed */
  337. for (i = 0; i < size; i += 2) {
  338. avio_w8(pb, buf[i + 1]);
  339. avio_w8(pb, buf[i]);
  340. }
  341. } else {
  342. avio_write(pb, buf, size);
  343. }
  344. stream->nb_frames++;
  345. return 0;
  346. }
  347. static int rm_write_video(AVFormatContext *s, const uint8_t *buf, int size, int flags)
  348. {
  349. RMMuxContext *rm = s->priv_data;
  350. AVIOContext *pb = s->pb;
  351. StreamInfo *stream = rm->video_stream;
  352. int key_frame = !!(flags & AV_PKT_FLAG_KEY);
  353. /* XXX: this is incorrect: should be a parameter */
  354. /* Well, I spent some time finding the meaning of these bits. I am
  355. not sure I understood everything, but it works !! */
  356. if (size > MAX_PACKET_SIZE) {
  357. avpriv_report_missing_feature(s, "Muxing packets larger than 64 kB");
  358. return AVERROR(ENOSYS);
  359. }
  360. write_packet_header(s, stream, size + 7 + (size >= 0x4000)*4, key_frame);
  361. /* bit 7: '1' if final packet of a frame converted in several packets */
  362. avio_w8(pb, 0x81);
  363. /* bit 7: '1' if I-frame. bits 6..0 : sequence number in current
  364. frame starting from 1 */
  365. if (key_frame) {
  366. avio_w8(pb, 0x81);
  367. } else {
  368. avio_w8(pb, 0x01);
  369. }
  370. if(size >= 0x4000){
  371. avio_wb32(pb, size); /* total frame size */
  372. avio_wb32(pb, size); /* offset from the start or the end */
  373. }else{
  374. avio_wb16(pb, 0x4000 | size); /* total frame size */
  375. avio_wb16(pb, 0x4000 | size); /* offset from the start or the end */
  376. }
  377. avio_w8(pb, stream->nb_frames & 0xff);
  378. avio_write(pb, buf, size);
  379. stream->nb_frames++;
  380. return 0;
  381. }
  382. static int rm_write_packet(AVFormatContext *s, AVPacket *pkt)
  383. {
  384. if (s->streams[pkt->stream_index]->codecpar->codec_type ==
  385. AVMEDIA_TYPE_AUDIO)
  386. return rm_write_audio(s, pkt->data, pkt->size, pkt->flags);
  387. else
  388. return rm_write_video(s, pkt->data, pkt->size, pkt->flags);
  389. }
  390. static int rm_write_trailer(AVFormatContext *s)
  391. {
  392. RMMuxContext *rm = s->priv_data;
  393. int data_size, index_pos, i;
  394. AVIOContext *pb = s->pb;
  395. if (s->pb->seekable & AVIO_SEEKABLE_NORMAL) {
  396. /* end of file: finish to write header */
  397. index_pos = avio_tell(pb);
  398. data_size = index_pos - rm->data_pos;
  399. /* FIXME: write index */
  400. /* undocumented end header */
  401. avio_wb32(pb, 0);
  402. avio_wb32(pb, 0);
  403. avio_seek(pb, 0, SEEK_SET);
  404. for(i=0;i<s->nb_streams;i++)
  405. rm->streams[i].total_frames = rm->streams[i].nb_frames;
  406. rv10_write_header(s, data_size, 0);
  407. } else {
  408. /* undocumented end header */
  409. avio_wb32(pb, 0);
  410. avio_wb32(pb, 0);
  411. }
  412. return 0;
  413. }
  414. AVOutputFormat ff_rm_muxer = {
  415. .name = "rm",
  416. .long_name = NULL_IF_CONFIG_SMALL("RealMedia"),
  417. .mime_type = "application/vnd.rn-realmedia",
  418. .extensions = "rm,ra",
  419. .priv_data_size = sizeof(RMMuxContext),
  420. .audio_codec = AV_CODEC_ID_AC3,
  421. .video_codec = AV_CODEC_ID_RV10,
  422. .write_header = rm_write_header,
  423. .write_packet = rm_write_packet,
  424. .write_trailer = rm_write_trailer,
  425. .codec_tag = (const AVCodecTag* const []){ ff_rm_codec_tags, 0 },
  426. };