You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

1952 lines
63KB

  1. /*
  2. * MOV, 3GP, MP4 muxer
  3. * Copyright (c) 2003 Thomas Raivio
  4. * Copyright (c) 2004 Gildas Bazin <gbazin at videolan dot org>
  5. *
  6. * This file is part of FFmpeg.
  7. *
  8. * FFmpeg is free software; you can redistribute it and/or
  9. * modify it under the terms of the GNU Lesser General Public
  10. * License as published by the Free Software Foundation; either
  11. * version 2.1 of the License, or (at your option) any later version.
  12. *
  13. * FFmpeg is distributed in the hope that it will be useful,
  14. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  15. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  16. * Lesser General Public License for more details.
  17. *
  18. * You should have received a copy of the GNU Lesser General Public
  19. * License along with FFmpeg; if not, write to the Free Software
  20. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  21. */
  22. #include "avformat.h"
  23. #include "riff.h"
  24. #include "avio.h"
  25. #include "isom.h"
  26. #include "avc.h"
  27. #include "libavcodec/bitstream.h"
  28. #undef NDEBUG
  29. #include <assert.h>
#define MOV_INDEX_CLUSTER_SIZE 16384
#define globalTimescale 1000

/* Muxer flavours. Each one is a distinct bit, so a mode can be compared
 * for equality or tested with a mask (both forms are used in this file). */
#define MODE_MP4 0x01
#define MODE_MOV 0x02
#define MODE_3GP 0x04
#define MODE_PSP 0x08 // example working PSP command line:
// ffmpeg -i testinput.avi -f psp -r 14.985 -s 320x240 -b 768 -ar 24000 -ab 32 M4V00001.MP4
#define MODE_3G2 0x10
#define MODE_IPOD 0x20
/**
 * One record of a track's cluster index. The sample-table writers in this
 * file iterate over these records to emit stco, stsz, stsc, stss, ctts and
 * stts.
 */
typedef struct MOVIentry {
    unsigned int flags, size;    ///< size: byte size of the record; stsz divides it by entries to get the per-sample size
    uint64_t pos;                ///< written as the chunk offset in stco/co64
    unsigned int samplesInChunk; ///< samples-per-chunk value written to stsc
    char key_frame;              ///< a value of 1 makes the record a sync sample in stss
    unsigned int entries;        ///< number of samples covered by this record
    int64_t cts;                 ///< value written as the ctts offset of the record
    int64_t dts;                 ///< stts durations are differences between consecutive dts values
} MOVIentry;
/**
 * Per-track muxing state. Note that the struct tag is MOVIndex while the
 * typedef name used throughout the file is MOVTrack.
 */
typedef struct MOVIndex {
    int mode;               ///< one of the MODE_* values
    int entry;              ///< number of valid records in cluster
    long timescale;         ///< written as the time scale field of the audio sample description
    long time;
    int64_t trackDuration;  ///< used by stts to derive the duration of the last record
    long sampleCount;       ///< sample count written to stts for non-VBR audio
    long sampleSize;        ///< written as "bytes per frame" in the V1 sound description
    int hasKeyframes;       ///< stss is written only if this is non-zero and smaller than entry
    int hasBframes;         ///< ctts is written for video tracks when this is non-zero
    int language;
    int trackID;            ///< written as the ES id in esds
    int tag; ///< stsd fourcc
    AVCodecContext *enc;    ///< codec parameters of the stream being muxed
    int vosLen;             ///< length in bytes of vosData
    uint8_t *vosData;       ///< codec setup data, written into esds/glbl/avcC and parsed for dac3
    MOVIentry *cluster;     ///< index records, entry of them are valid
    int audio_vbr;          ///< selects V1 sound description and per-record stts entries for audio
    int height; ///< active picture (w/o VBI) height for D-10/IMX
} MOVTrack;
/** Muxer-wide state: the output flavour plus one MOVTrack per stream. */
typedef struct MOVMuxContext {
    int mode;                    ///< presumably one of the MODE_* values, like MOVTrack.mode -- TODO confirm
    int64_t time;
    int nb_streams;              ///< presumably the number of used slots in tracks -- TODO confirm
    int64_t mdat_pos;
    uint64_t mdat_size;
    long timescale;
    MOVTrack tracks[MAX_STREAMS];
} MOVMuxContext;
  77. //FIXME support 64 bit variant with wide placeholders
  78. static int64_t updateSize(ByteIOContext *pb, int64_t pos)
  79. {
  80. int64_t curpos = url_ftell(pb);
  81. url_fseek(pb, pos, SEEK_SET);
  82. put_be32(pb, curpos - pos); /* rewrite size */
  83. url_fseek(pb, curpos, SEEK_SET);
  84. return curpos - pos;
  85. }
  86. /* Chunk offset atom */
  87. static int mov_write_stco_tag(ByteIOContext *pb, MOVTrack *track)
  88. {
  89. int i;
  90. int mode64 = 0; // use 32 bit size variant if possible
  91. int64_t pos = url_ftell(pb);
  92. put_be32(pb, 0); /* size */
  93. if (pos > UINT32_MAX) {
  94. mode64 = 1;
  95. put_tag(pb, "co64");
  96. } else
  97. put_tag(pb, "stco");
  98. put_be32(pb, 0); /* version & flags */
  99. put_be32(pb, track->entry); /* entry count */
  100. for (i=0; i<track->entry; i++) {
  101. if(mode64 == 1)
  102. put_be64(pb, track->cluster[i].pos);
  103. else
  104. put_be32(pb, track->cluster[i].pos);
  105. }
  106. return updateSize(pb, pos);
  107. }
  108. /* Sample size atom */
  109. static int mov_write_stsz_tag(ByteIOContext *pb, MOVTrack *track)
  110. {
  111. int equalChunks = 1;
  112. int i, j, entries = 0, tst = -1, oldtst = -1;
  113. int64_t pos = url_ftell(pb);
  114. put_be32(pb, 0); /* size */
  115. put_tag(pb, "stsz");
  116. put_be32(pb, 0); /* version & flags */
  117. for (i=0; i<track->entry; i++) {
  118. tst = track->cluster[i].size/track->cluster[i].entries;
  119. if(oldtst != -1 && tst != oldtst) {
  120. equalChunks = 0;
  121. }
  122. oldtst = tst;
  123. entries += track->cluster[i].entries;
  124. }
  125. if (equalChunks) {
  126. int sSize = track->cluster[0].size/track->cluster[0].entries;
  127. put_be32(pb, sSize); // sample size
  128. put_be32(pb, entries); // sample count
  129. }
  130. else {
  131. put_be32(pb, 0); // sample size
  132. put_be32(pb, entries); // sample count
  133. for (i=0; i<track->entry; i++) {
  134. for (j=0; j<track->cluster[i].entries; j++) {
  135. put_be32(pb, track->cluster[i].size /
  136. track->cluster[i].entries);
  137. }
  138. }
  139. }
  140. return updateSize(pb, pos);
  141. }
  142. /* Sample to chunk atom */
  143. static int mov_write_stsc_tag(ByteIOContext *pb, MOVTrack *track)
  144. {
  145. int index = 0, oldval = -1, i;
  146. int64_t entryPos, curpos;
  147. int64_t pos = url_ftell(pb);
  148. put_be32(pb, 0); /* size */
  149. put_tag(pb, "stsc");
  150. put_be32(pb, 0); // version & flags
  151. entryPos = url_ftell(pb);
  152. put_be32(pb, track->entry); // entry count
  153. for (i=0; i<track->entry; i++) {
  154. if(oldval != track->cluster[i].samplesInChunk)
  155. {
  156. put_be32(pb, i+1); // first chunk
  157. put_be32(pb, track->cluster[i].samplesInChunk); // samples per chunk
  158. put_be32(pb, 0x1); // sample description index
  159. oldval = track->cluster[i].samplesInChunk;
  160. index++;
  161. }
  162. }
  163. curpos = url_ftell(pb);
  164. url_fseek(pb, entryPos, SEEK_SET);
  165. put_be32(pb, index); // rewrite size
  166. url_fseek(pb, curpos, SEEK_SET);
  167. return updateSize(pb, pos);
  168. }
  169. /* Sync sample atom */
  170. static int mov_write_stss_tag(ByteIOContext *pb, MOVTrack *track)
  171. {
  172. int64_t curpos, entryPos;
  173. int i, index = 0;
  174. int64_t pos = url_ftell(pb);
  175. put_be32(pb, 0); // size
  176. put_tag(pb, "stss");
  177. put_be32(pb, 0); // version & flags
  178. entryPos = url_ftell(pb);
  179. put_be32(pb, track->entry); // entry count
  180. for (i=0; i<track->entry; i++) {
  181. if(track->cluster[i].key_frame == 1) {
  182. put_be32(pb, i+1);
  183. index++;
  184. }
  185. }
  186. curpos = url_ftell(pb);
  187. url_fseek(pb, entryPos, SEEK_SET);
  188. put_be32(pb, index); // rewrite size
  189. url_fseek(pb, curpos, SEEK_SET);
  190. return updateSize(pb, pos);
  191. }
  192. static int mov_write_amr_tag(ByteIOContext *pb, MOVTrack *track)
  193. {
  194. put_be32(pb, 0x11); /* size */
  195. if (track->mode == MODE_MOV) put_tag(pb, "samr");
  196. else put_tag(pb, "damr");
  197. put_tag(pb, "FFMP");
  198. put_byte(pb, 0); /* decoder version */
  199. put_be16(pb, 0x81FF); /* Mode set (all modes for AMR_NB) */
  200. put_byte(pb, 0x00); /* Mode change period (no restriction) */
  201. put_byte(pb, 0x01); /* Frames per sample */
  202. return 0x11;
  203. }
  204. static int mov_write_ac3_tag(ByteIOContext *pb, MOVTrack *track)
  205. {
  206. GetBitContext gbc;
  207. PutBitContext pbc;
  208. uint8_t buf[3];
  209. int fscod, bsid, bsmod, acmod, lfeon, frmsizecod;
  210. if (track->vosLen < 7)
  211. return -1;
  212. put_be32(pb, 11);
  213. put_tag(pb, "dac3");
  214. init_get_bits(&gbc, track->vosData+4, track->vosLen-4);
  215. fscod = get_bits(&gbc, 2);
  216. frmsizecod = get_bits(&gbc, 6);
  217. bsid = get_bits(&gbc, 5);
  218. bsmod = get_bits(&gbc, 3);
  219. acmod = get_bits(&gbc, 3);
  220. if (acmod == 2) {
  221. skip_bits(&gbc, 2); // dsurmod
  222. } else {
  223. if ((acmod & 1) && acmod != 1)
  224. skip_bits(&gbc, 2); // cmixlev
  225. if (acmod & 4)
  226. skip_bits(&gbc, 2); // surmixlev
  227. }
  228. lfeon = get_bits1(&gbc);
  229. init_put_bits(&pbc, buf, sizeof(buf));
  230. put_bits(&pbc, 2, fscod);
  231. put_bits(&pbc, 5, bsid);
  232. put_bits(&pbc, 3, bsmod);
  233. put_bits(&pbc, 3, acmod);
  234. put_bits(&pbc, 1, lfeon);
  235. put_bits(&pbc, 5, frmsizecod>>1); // bit_rate_code
  236. put_bits(&pbc, 5, 0); // reserved
  237. flush_put_bits(&pbc);
  238. put_buffer(pb, buf, sizeof(buf));
  239. return 11;
  240. }
  241. /**
  242. * This function writes extradata "as is".
  243. * Extradata must be formated like a valid atom (with size and tag)
  244. */
  245. static int mov_write_extradata_tag(ByteIOContext *pb, MOVTrack *track)
  246. {
  247. put_buffer(pb, track->enc->extradata, track->enc->extradata_size);
  248. return track->enc->extradata_size;
  249. }
  250. static int mov_write_enda_tag(ByteIOContext *pb)
  251. {
  252. put_be32(pb, 10);
  253. put_tag(pb, "enda");
  254. put_be16(pb, 1); /* little endian */
  255. return 10;
  256. }
  257. static unsigned int descrLength(unsigned int len)
  258. {
  259. int i;
  260. for(i=1; len>>(7*i); i++);
  261. return len + 1 + i;
  262. }
  263. static void putDescr(ByteIOContext *pb, int tag, unsigned int size)
  264. {
  265. int i= descrLength(size) - size - 2;
  266. put_byte(pb, tag);
  267. for(; i>0; i--)
  268. put_byte(pb, (size>>(7*i)) | 0x80);
  269. put_byte(pb, size & 0x7F);
  270. }
  271. static int mov_write_esds_tag(ByteIOContext *pb, MOVTrack *track) // Basic
  272. {
  273. int64_t pos = url_ftell(pb);
  274. int decoderSpecificInfoLen = track->vosLen ? descrLength(track->vosLen):0;
  275. put_be32(pb, 0); // size
  276. put_tag(pb, "esds");
  277. put_be32(pb, 0); // Version
  278. // ES descriptor
  279. putDescr(pb, 0x03, 3 + descrLength(13 + decoderSpecificInfoLen) +
  280. descrLength(1));
  281. put_be16(pb, track->trackID);
  282. put_byte(pb, 0x00); // flags (= no flags)
  283. // DecoderConfig descriptor
  284. putDescr(pb, 0x04, 13 + decoderSpecificInfoLen);
  285. // Object type indication
  286. if ((track->enc->codec_id == CODEC_ID_MP2 ||
  287. track->enc->codec_id == CODEC_ID_MP3) &&
  288. track->enc->sample_rate > 24000)
  289. put_byte(pb, 0x6B); // 11172-3
  290. else
  291. put_byte(pb, codec_get_tag(ff_mp4_obj_type, track->enc->codec_id));
  292. // the following fields is made of 6 bits to identify the streamtype (4 for video, 5 for audio)
  293. // plus 1 bit to indicate upstream and 1 bit set to 1 (reserved)
  294. if(track->enc->codec_type == CODEC_TYPE_AUDIO)
  295. put_byte(pb, 0x15); // flags (= Audiostream)
  296. else
  297. put_byte(pb, 0x11); // flags (= Visualstream)
  298. put_byte(pb, track->enc->rc_buffer_size>>(3+16)); // Buffersize DB (24 bits)
  299. put_be16(pb, (track->enc->rc_buffer_size>>3)&0xFFFF); // Buffersize DB
  300. put_be32(pb, FFMAX(track->enc->bit_rate, track->enc->rc_max_rate)); // maxbitrate (FIXME should be max rate in any 1 sec window)
  301. if(track->enc->rc_max_rate != track->enc->rc_min_rate || track->enc->rc_min_rate==0)
  302. put_be32(pb, 0); // vbr
  303. else
  304. put_be32(pb, track->enc->rc_max_rate); // avg bitrate
  305. if (track->vosLen) {
  306. // DecoderSpecific info descriptor
  307. putDescr(pb, 0x05, track->vosLen);
  308. put_buffer(pb, track->vosData, track->vosLen);
  309. }
  310. // SL descriptor
  311. putDescr(pb, 0x06, 1);
  312. put_byte(pb, 0x02);
  313. return updateSize(pb, pos);
  314. }
  315. static int mov_write_wave_tag(ByteIOContext *pb, MOVTrack *track)
  316. {
  317. int64_t pos = url_ftell(pb);
  318. put_be32(pb, 0); /* size */
  319. put_tag(pb, "wave");
  320. put_be32(pb, 12); /* size */
  321. put_tag(pb, "frma");
  322. put_le32(pb, track->tag);
  323. if (track->enc->codec_id == CODEC_ID_AAC) {
  324. /* useless atom needed by mplayer, ipod, not needed by quicktime */
  325. put_be32(pb, 12); /* size */
  326. put_tag(pb, "mp4a");
  327. put_be32(pb, 0);
  328. mov_write_esds_tag(pb, track);
  329. } else if (track->enc->codec_id == CODEC_ID_PCM_S24LE ||
  330. track->enc->codec_id == CODEC_ID_PCM_S32LE) {
  331. mov_write_enda_tag(pb);
  332. } else if (track->enc->codec_id == CODEC_ID_AMR_NB) {
  333. mov_write_amr_tag(pb, track);
  334. } else if (track->enc->codec_id == CODEC_ID_AC3) {
  335. mov_write_ac3_tag(pb, track);
  336. } else if (track->enc->codec_id == CODEC_ID_ALAC) {
  337. mov_write_extradata_tag(pb, track);
  338. }
  339. put_be32(pb, 8); /* size */
  340. put_be32(pb, 0); /* null tag */
  341. return updateSize(pb, pos);
  342. }
  343. static int mov_write_glbl_tag(ByteIOContext *pb, MOVTrack *track)
  344. {
  345. put_be32(pb, track->vosLen+8);
  346. put_tag(pb, "glbl");
  347. put_buffer(pb, track->vosData, track->vosLen);
  348. return 8+track->vosLen;
  349. }
  350. static int mov_write_audio_tag(ByteIOContext *pb, MOVTrack *track)
  351. {
  352. int64_t pos = url_ftell(pb);
  353. int version = track->mode == MODE_MOV &&
  354. (track->audio_vbr ||
  355. track->enc->codec_id == CODEC_ID_PCM_S32LE ||
  356. track->enc->codec_id == CODEC_ID_PCM_S24LE);
  357. put_be32(pb, 0); /* size */
  358. put_le32(pb, track->tag); // store it byteswapped
  359. put_be32(pb, 0); /* Reserved */
  360. put_be16(pb, 0); /* Reserved */
  361. put_be16(pb, 1); /* Data-reference index, XXX == 1 */
  362. /* SoundDescription */
  363. put_be16(pb, version); /* Version */
  364. put_be16(pb, 0); /* Revision level */
  365. put_be32(pb, 0); /* Reserved */
  366. if (track->mode == MODE_MOV) {
  367. put_be16(pb, track->enc->channels);
  368. if (track->enc->codec_id == CODEC_ID_PCM_U8 ||
  369. track->enc->codec_id == CODEC_ID_PCM_S8)
  370. put_be16(pb, 8); /* bits per sample */
  371. else
  372. put_be16(pb, 16);
  373. put_be16(pb, track->audio_vbr ? -2 : 0); /* compression ID */
  374. } else { /* reserved for mp4/3gp */
  375. put_be16(pb, 2);
  376. put_be16(pb, 16);
  377. put_be16(pb, 0);
  378. }
  379. put_be16(pb, 0); /* packet size (= 0) */
  380. put_be16(pb, track->timescale); /* Time scale */
  381. put_be16(pb, 0); /* Reserved */
  382. if(version == 1) { /* SoundDescription V1 extended info */
  383. put_be32(pb, track->enc->frame_size); /* Samples per packet */
  384. put_be32(pb, track->sampleSize / track->enc->channels); /* Bytes per packet */
  385. put_be32(pb, track->sampleSize); /* Bytes per frame */
  386. put_be32(pb, 2); /* Bytes per sample */
  387. }
  388. if(track->mode == MODE_MOV &&
  389. (track->enc->codec_id == CODEC_ID_AAC ||
  390. track->enc->codec_id == CODEC_ID_AC3 ||
  391. track->enc->codec_id == CODEC_ID_AMR_NB ||
  392. track->enc->codec_id == CODEC_ID_PCM_S24LE ||
  393. track->enc->codec_id == CODEC_ID_PCM_S32LE ||
  394. track->enc->codec_id == CODEC_ID_ALAC))
  395. mov_write_wave_tag(pb, track);
  396. else if(track->tag == MKTAG('m','p','4','a'))
  397. mov_write_esds_tag(pb, track);
  398. else if(track->enc->codec_id == CODEC_ID_AMR_NB)
  399. mov_write_amr_tag(pb, track);
  400. else if(track->enc->codec_id == CODEC_ID_AC3)
  401. mov_write_ac3_tag(pb, track);
  402. else if(track->enc->codec_id == CODEC_ID_ALAC)
  403. mov_write_extradata_tag(pb, track);
  404. else if(track->vosLen > 0)
  405. mov_write_glbl_tag(pb, track);
  406. return updateSize(pb, pos);
  407. }
  408. static int mov_write_d263_tag(ByteIOContext *pb)
  409. {
  410. put_be32(pb, 0xf); /* size */
  411. put_tag(pb, "d263");
  412. put_tag(pb, "FFMP");
  413. put_byte(pb, 0); /* decoder version */
  414. /* FIXME use AVCodecContext level/profile, when encoder will set values */
  415. put_byte(pb, 0xa); /* level */
  416. put_byte(pb, 0); /* profile */
  417. return 0xf;
  418. }
  419. /* TODO: No idea about these values */
  420. static int mov_write_svq3_tag(ByteIOContext *pb)
  421. {
  422. put_be32(pb, 0x15);
  423. put_tag(pb, "SMI ");
  424. put_tag(pb, "SEQH");
  425. put_be32(pb, 0x5);
  426. put_be32(pb, 0xe2c0211d);
  427. put_be32(pb, 0xc0000000);
  428. put_byte(pb, 0);
  429. return 0x15;
  430. }
  431. static int mov_write_avcc_tag(ByteIOContext *pb, MOVTrack *track)
  432. {
  433. int64_t pos = url_ftell(pb);
  434. put_be32(pb, 0);
  435. put_tag(pb, "avcC");
  436. ff_isom_write_avcc(pb, track->vosData, track->vosLen);
  437. return updateSize(pb, pos);
  438. }
  439. /* also used by all avid codecs (dv, imx, meridien) and their variants */
  440. static int mov_write_avid_tag(ByteIOContext *pb, MOVTrack *track)
  441. {
  442. int i;
  443. put_be32(pb, 24); /* size */
  444. put_tag(pb, "ACLR");
  445. put_tag(pb, "ACLR");
  446. put_tag(pb, "0001");
  447. put_be32(pb, 1); /* yuv 1 / rgb 2 ? */
  448. put_be32(pb, 0); /* unknown */
  449. put_be32(pb, 24); /* size */
  450. put_tag(pb, "APRG");
  451. put_tag(pb, "APRG");
  452. put_tag(pb, "0001");
  453. put_be32(pb, 1); /* unknown */
  454. put_be32(pb, 0); /* unknown */
  455. put_be32(pb, 120); /* size */
  456. put_tag(pb, "ARES");
  457. put_tag(pb, "ARES");
  458. put_tag(pb, "0001");
  459. put_be32(pb, AV_RB32(track->vosData + 0x28)); /* dnxhd cid, some id ? */
  460. put_be32(pb, track->enc->width);
  461. /* values below are based on samples created with quicktime and avid codecs */
  462. if (track->vosData[5] & 2) { // interlaced
  463. put_be32(pb, track->enc->height/2);
  464. put_be32(pb, 2); /* unknown */
  465. put_be32(pb, 0); /* unknown */
  466. put_be32(pb, 4); /* unknown */
  467. } else {
  468. put_be32(pb, track->enc->height);
  469. put_be32(pb, 1); /* unknown */
  470. put_be32(pb, 0); /* unknown */
  471. if (track->enc->height == 1080)
  472. put_be32(pb, 5); /* unknown */
  473. else
  474. put_be32(pb, 6); /* unknown */
  475. }
  476. /* padding */
  477. for (i = 0; i < 10; i++)
  478. put_be64(pb, 0);
  479. /* extra padding for stsd needed */
  480. put_be32(pb, 0);
  481. return 0;
  482. }
/* Codec id -> fourcc table used by mov_find_codec_tag() for tracks whose
 * mode has the MODE_3GP bit set. Terminated by a CODEC_ID_NONE entry. */
static const AVCodecTag codec_3gp_tags[] = {
    { CODEC_ID_H263, MKTAG('s','2','6','3') },
    { CODEC_ID_H264, MKTAG('a','v','c','1') },
    { CODEC_ID_MPEG4, MKTAG('m','p','4','v') },
    { CODEC_ID_AAC, MKTAG('m','p','4','a') },
    { CODEC_ID_AMR_NB, MKTAG('s','a','m','r') },
    { CODEC_ID_AMR_WB, MKTAG('s','a','w','b') },
    { CODEC_ID_MOV_TEXT, MKTAG('t','x','3','g') },
    { CODEC_ID_NONE, 0 },
};
  493. static const AVCodecTag mov_pix_fmt_tags[] = {
  494. { PIX_FMT_YUYV422, MKTAG('y','u','v','s') },
  495. { PIX_FMT_UYVY422, MKTAG('2','v','u','y') },
  496. { PIX_FMT_BGR555, MKTAG('r','a','w',' ') },
  497. { PIX_FMT_RGB24, MKTAG('r','a','w',' ') },
  498. { PIX_FMT_BGR32_1, MKTAG('r','a','w',' ') },
  499. };
/* Codec id -> fourcc table used by mov_find_codec_tag() in MODE_IPOD.
 * CODEC_ID_MOV_TEXT is listed twice ('tx3g' and 'text');
 * mov_find_codec_tag() keeps either of those tags for subtitle streams
 * without consulting this table. Terminated by a CODEC_ID_NONE entry. */
static const AVCodecTag codec_ipod_tags[] = {
    { CODEC_ID_H264, MKTAG('a','v','c','1') },
    { CODEC_ID_MPEG4, MKTAG('m','p','4','v') },
    { CODEC_ID_AAC, MKTAG('m','p','4','a') },
    { CODEC_ID_ALAC, MKTAG('a','l','a','c') },
    { CODEC_ID_AC3, MKTAG('a','c','-','3') },
    { CODEC_ID_MOV_TEXT, MKTAG('t','x','3','g') },
    { CODEC_ID_MOV_TEXT, MKTAG('t','e','x','t') },
    { CODEC_ID_NONE, 0 },
};
  510. static int mov_find_codec_tag(AVFormatContext *s, MOVTrack *track)
  511. {
  512. int tag = track->enc->codec_tag;
  513. if (track->mode == MODE_MP4 || track->mode == MODE_PSP) {
  514. if (!codec_get_tag(ff_mp4_obj_type, track->enc->codec_id))
  515. return 0;
  516. if (track->enc->codec_id == CODEC_ID_H264) tag = MKTAG('a','v','c','1');
  517. else if (track->enc->codec_id == CODEC_ID_AC3) tag = MKTAG('a','c','-','3');
  518. else if (track->enc->codec_id == CODEC_ID_DIRAC) tag = MKTAG('d','r','a','c');
  519. else if (track->enc->codec_id == CODEC_ID_MOV_TEXT) tag = MKTAG('t','x','3','g');
  520. else if (track->enc->codec_type == CODEC_TYPE_VIDEO) tag = MKTAG('m','p','4','v');
  521. else if (track->enc->codec_type == CODEC_TYPE_AUDIO) tag = MKTAG('m','p','4','a');
  522. } else if (track->mode == MODE_IPOD) {
  523. if (track->enc->codec_type == CODEC_TYPE_SUBTITLE &&
  524. (tag == MKTAG('t','x','3','g') ||
  525. tag == MKTAG('t','e','x','t')))
  526. track->tag = tag; // keep original tag
  527. else
  528. tag = codec_get_tag(codec_ipod_tags, track->enc->codec_id);
  529. if (!match_ext(s->filename, "m4a") && !match_ext(s->filename, "m4v"))
  530. av_log(s, AV_LOG_WARNING, "Warning, extension is not .m4a nor .m4v "
  531. "Quicktime/Ipod might not play the file\n");
  532. } else if (track->mode & MODE_3GP) {
  533. tag = codec_get_tag(codec_3gp_tags, track->enc->codec_id);
  534. } else if (!tag || (track->enc->strict_std_compliance >= FF_COMPLIANCE_NORMAL &&
  535. (tag == MKTAG('d','v','c','p') ||
  536. track->enc->codec_id == CODEC_ID_RAWVIDEO))) {
  537. if (track->enc->codec_id == CODEC_ID_DVVIDEO) {
  538. if (track->enc->height == 480) /* NTSC */
  539. if (track->enc->pix_fmt == PIX_FMT_YUV422P) tag = MKTAG('d','v','5','n');
  540. else tag = MKTAG('d','v','c',' ');
  541. else if (track->enc->pix_fmt == PIX_FMT_YUV422P) tag = MKTAG('d','v','5','p');
  542. else if (track->enc->pix_fmt == PIX_FMT_YUV420P) tag = MKTAG('d','v','c','p');
  543. else tag = MKTAG('d','v','p','p');
  544. } else if (track->enc->codec_id == CODEC_ID_RAWVIDEO) {
  545. tag = codec_get_tag(mov_pix_fmt_tags, track->enc->pix_fmt);
  546. if (!tag) // restore tag
  547. tag = track->enc->codec_tag;
  548. } else {
  549. if (track->enc->codec_type == CODEC_TYPE_VIDEO) {
  550. tag = codec_get_tag(codec_movvideo_tags, track->enc->codec_id);
  551. if (!tag) { // if no mac fcc found, try with Microsoft tags
  552. tag = codec_get_tag(codec_bmp_tags, track->enc->codec_id);
  553. if (tag)
  554. av_log(s, AV_LOG_INFO, "Warning, using MS style video codec tag, "
  555. "the file may be unplayable!\n");
  556. }
  557. } else if (track->enc->codec_type == CODEC_TYPE_AUDIO) {
  558. tag = codec_get_tag(codec_movaudio_tags, track->enc->codec_id);
  559. if (!tag) { // if no mac fcc found, try with Microsoft tags
  560. int ms_tag = codec_get_tag(codec_wav_tags, track->enc->codec_id);
  561. if (ms_tag) {
  562. tag = MKTAG('m', 's', ((ms_tag >> 8) & 0xff), (ms_tag & 0xff));
  563. av_log(s, AV_LOG_INFO, "Warning, using MS style audio codec tag, "
  564. "the file may be unplayable!\n");
  565. }
  566. }
  567. } else if (track->enc->codec_type == CODEC_TYPE_SUBTITLE) {
  568. tag = codec_get_tag(ff_codec_movsubtitle_tags, track->enc->codec_id);
  569. }
  570. }
  571. }
  572. return tag;
  573. }
  574. /** Write uuid atom.
  575. * Needed to make file play in iPods running newest firmware
  576. * goes after avcC atom in moov.trak.mdia.minf.stbl.stsd.avc1
  577. */
  578. static int mov_write_uuid_tag_ipod(ByteIOContext *pb)
  579. {
  580. put_be32(pb, 28);
  581. put_tag(pb, "uuid");
  582. put_be32(pb, 0x6b6840f2);
  583. put_be32(pb, 0x5f244fc5);
  584. put_be32(pb, 0xba39a51b);
  585. put_be32(pb, 0xcf0323f3);
  586. put_be32(pb, 0x0);
  587. return 28;
  588. }
  589. static int mov_write_subtitle_tag(ByteIOContext *pb, MOVTrack *track)
  590. {
  591. int64_t pos = url_ftell(pb);
  592. put_be32(pb, 0); /* size */
  593. put_le32(pb, track->tag); // store it byteswapped
  594. put_be32(pb, 0); /* Reserved */
  595. put_be16(pb, 0); /* Reserved */
  596. put_be16(pb, 1); /* Data-reference index */
  597. if (track->enc->extradata_size)
  598. put_buffer(pb, track->enc->extradata, track->enc->extradata_size);
  599. return updateSize(pb, pos);
  600. }
  601. static int mov_write_video_tag(ByteIOContext *pb, MOVTrack *track)
  602. {
  603. int64_t pos = url_ftell(pb);
  604. char compressor_name[32];
  605. put_be32(pb, 0); /* size */
  606. put_le32(pb, track->tag); // store it byteswapped
  607. put_be32(pb, 0); /* Reserved */
  608. put_be16(pb, 0); /* Reserved */
  609. put_be16(pb, 1); /* Data-reference index */
  610. put_be16(pb, 0); /* Codec stream version */
  611. put_be16(pb, 0); /* Codec stream revision (=0) */
  612. if (track->mode == MODE_MOV) {
  613. put_tag(pb, "FFMP"); /* Vendor */
  614. if(track->enc->codec_id == CODEC_ID_RAWVIDEO) {
  615. put_be32(pb, 0); /* Temporal Quality */
  616. put_be32(pb, 0x400); /* Spatial Quality = lossless*/
  617. } else {
  618. put_be32(pb, 0x200); /* Temporal Quality = normal */
  619. put_be32(pb, 0x200); /* Spatial Quality = normal */
  620. }
  621. } else {
  622. put_be32(pb, 0); /* Reserved */
  623. put_be32(pb, 0); /* Reserved */
  624. put_be32(pb, 0); /* Reserved */
  625. }
  626. put_be16(pb, track->enc->width); /* Video width */
  627. put_be16(pb, track->height); /* Video height */
  628. put_be32(pb, 0x00480000); /* Horizontal resolution 72dpi */
  629. put_be32(pb, 0x00480000); /* Vertical resolution 72dpi */
  630. put_be32(pb, 0); /* Data size (= 0) */
  631. put_be16(pb, 1); /* Frame count (= 1) */
  632. memset(compressor_name,0,32);
  633. /* FIXME not sure, ISO 14496-1 draft where it shall be set to 0 */
  634. if (track->mode == MODE_MOV && track->enc->codec && track->enc->codec->name)
  635. strncpy(compressor_name,track->enc->codec->name,31);
  636. put_byte(pb, strlen(compressor_name));
  637. put_buffer(pb, compressor_name, 31);
  638. if (track->mode == MODE_MOV && track->enc->bits_per_coded_sample)
  639. put_be16(pb, track->enc->bits_per_coded_sample);
  640. else
  641. put_be16(pb, 0x18); /* Reserved */
  642. put_be16(pb, 0xffff); /* Reserved */
  643. if(track->tag == MKTAG('m','p','4','v'))
  644. mov_write_esds_tag(pb, track);
  645. else if(track->enc->codec_id == CODEC_ID_H263)
  646. mov_write_d263_tag(pb);
  647. else if(track->enc->codec_id == CODEC_ID_SVQ3)
  648. mov_write_svq3_tag(pb);
  649. else if(track->enc->codec_id == CODEC_ID_DNXHD)
  650. mov_write_avid_tag(pb, track);
  651. else if(track->enc->codec_id == CODEC_ID_H264) {
  652. mov_write_avcc_tag(pb, track);
  653. if(track->mode == MODE_IPOD)
  654. mov_write_uuid_tag_ipod(pb);
  655. } else if(track->vosLen > 0)
  656. mov_write_glbl_tag(pb, track);
  657. return updateSize(pb, pos);
  658. }
  659. static int mov_write_stsd_tag(ByteIOContext *pb, MOVTrack *track)
  660. {
  661. int64_t pos = url_ftell(pb);
  662. put_be32(pb, 0); /* size */
  663. put_tag(pb, "stsd");
  664. put_be32(pb, 0); /* version & flags */
  665. put_be32(pb, 1); /* entry count */
  666. if (track->enc->codec_type == CODEC_TYPE_VIDEO)
  667. mov_write_video_tag(pb, track);
  668. else if (track->enc->codec_type == CODEC_TYPE_AUDIO)
  669. mov_write_audio_tag(pb, track);
  670. else if (track->enc->codec_type == CODEC_TYPE_SUBTITLE)
  671. mov_write_subtitle_tag(pb, track);
  672. return updateSize(pb, pos);
  673. }
  674. static int mov_write_ctts_tag(ByteIOContext *pb, MOVTrack *track)
  675. {
  676. MOVStts *ctts_entries;
  677. uint32_t entries = 0;
  678. uint32_t atom_size;
  679. int i;
  680. ctts_entries = av_malloc((track->entry + 1) * sizeof(*ctts_entries)); /* worst case */
  681. ctts_entries[0].count = 1;
  682. ctts_entries[0].duration = track->cluster[0].cts;
  683. for (i=1; i<track->entry; i++) {
  684. if (track->cluster[i].cts == ctts_entries[entries].duration) {
  685. ctts_entries[entries].count++; /* compress */
  686. } else {
  687. entries++;
  688. ctts_entries[entries].duration = track->cluster[i].cts;
  689. ctts_entries[entries].count = 1;
  690. }
  691. }
  692. entries++; /* last one */
  693. atom_size = 16 + (entries * 8);
  694. put_be32(pb, atom_size); /* size */
  695. put_tag(pb, "ctts");
  696. put_be32(pb, 0); /* version & flags */
  697. put_be32(pb, entries); /* entry count */
  698. for (i=0; i<entries; i++) {
  699. put_be32(pb, ctts_entries[i].count);
  700. put_be32(pb, ctts_entries[i].duration);
  701. }
  702. av_free(ctts_entries);
  703. return atom_size;
  704. }
  705. /* Time to sample atom */
  706. static int mov_write_stts_tag(ByteIOContext *pb, MOVTrack *track)
  707. {
  708. MOVStts *stts_entries;
  709. uint32_t entries = -1;
  710. uint32_t atom_size;
  711. int i;
  712. if (track->enc->codec_type == CODEC_TYPE_AUDIO && !track->audio_vbr) {
  713. stts_entries = av_malloc(sizeof(*stts_entries)); /* one entry */
  714. stts_entries[0].count = track->sampleCount;
  715. stts_entries[0].duration = 1;
  716. entries = 1;
  717. } else {
  718. stts_entries = av_malloc(track->entry * sizeof(*stts_entries)); /* worst case */
  719. for (i=0; i<track->entry; i++) {
  720. int64_t duration = i + 1 == track->entry ?
  721. track->trackDuration - track->cluster[i].dts + track->cluster[0].dts : /* readjusting */
  722. track->cluster[i+1].dts - track->cluster[i].dts;
  723. if (i && duration == stts_entries[entries].duration) {
  724. stts_entries[entries].count++; /* compress */
  725. } else {
  726. entries++;
  727. stts_entries[entries].duration = duration;
  728. stts_entries[entries].count = 1;
  729. }
  730. }
  731. entries++; /* last one */
  732. }
  733. atom_size = 16 + (entries * 8);
  734. put_be32(pb, atom_size); /* size */
  735. put_tag(pb, "stts");
  736. put_be32(pb, 0); /* version & flags */
  737. put_be32(pb, entries); /* entry count */
  738. for (i=0; i<entries; i++) {
  739. put_be32(pb, stts_entries[i].count);
  740. put_be32(pb, stts_entries[i].duration);
  741. }
  742. av_free(stts_entries);
  743. return atom_size;
  744. }
  745. static int mov_write_dref_tag(ByteIOContext *pb)
  746. {
  747. put_be32(pb, 28); /* size */
  748. put_tag(pb, "dref");
  749. put_be32(pb, 0); /* version & flags */
  750. put_be32(pb, 1); /* entry count */
  751. put_be32(pb, 0xc); /* size */
  752. put_tag(pb, "url ");
  753. put_be32(pb, 1); /* version & flags */
  754. return 28;
  755. }
  756. static int mov_write_stbl_tag(ByteIOContext *pb, MOVTrack *track)
  757. {
  758. int64_t pos = url_ftell(pb);
  759. put_be32(pb, 0); /* size */
  760. put_tag(pb, "stbl");
  761. mov_write_stsd_tag(pb, track);
  762. mov_write_stts_tag(pb, track);
  763. if (track->enc->codec_type == CODEC_TYPE_VIDEO &&
  764. track->hasKeyframes && track->hasKeyframes < track->entry)
  765. mov_write_stss_tag(pb, track);
  766. if (track->enc->codec_type == CODEC_TYPE_VIDEO &&
  767. track->hasBframes)
  768. mov_write_ctts_tag(pb, track);
  769. mov_write_stsc_tag(pb, track);
  770. mov_write_stsz_tag(pb, track);
  771. mov_write_stco_tag(pb, track);
  772. return updateSize(pb, pos);
  773. }
  774. static int mov_write_dinf_tag(ByteIOContext *pb)
  775. {
  776. int64_t pos = url_ftell(pb);
  777. put_be32(pb, 0); /* size */
  778. put_tag(pb, "dinf");
  779. mov_write_dref_tag(pb);
  780. return updateSize(pb, pos);
  781. }
  782. static int mov_write_nmhd_tag(ByteIOContext *pb)
  783. {
  784. put_be32(pb, 12);
  785. put_tag(pb, "nmhd");
  786. put_be32(pb, 0);
  787. return 12;
  788. }
  789. static int mov_write_gmhd_tag(ByteIOContext *pb)
  790. {
  791. put_be32(pb, 0x20); /* size */
  792. put_tag(pb, "gmhd");
  793. put_be32(pb, 0x18); /* gmin size */
  794. put_tag(pb, "gmin"); /* generic media info */
  795. put_be32(pb, 0); /* version & flags */
  796. put_be16(pb, 0x40); /* graphics mode = */
  797. put_be16(pb, 0x8000); /* opColor (r?) */
  798. put_be16(pb, 0x8000); /* opColor (g?) */
  799. put_be16(pb, 0x8000); /* opColor (b?) */
  800. put_be16(pb, 0); /* balance */
  801. put_be16(pb, 0); /* reserved */
  802. return 0x20;
  803. }
  804. static int mov_write_smhd_tag(ByteIOContext *pb)
  805. {
  806. put_be32(pb, 16); /* size */
  807. put_tag(pb, "smhd");
  808. put_be32(pb, 0); /* version & flags */
  809. put_be16(pb, 0); /* reserved (balance, normally = 0) */
  810. put_be16(pb, 0); /* reserved */
  811. return 16;
  812. }
  813. static int mov_write_vmhd_tag(ByteIOContext *pb)
  814. {
  815. put_be32(pb, 0x14); /* size (always 0x14) */
  816. put_tag(pb, "vmhd");
  817. put_be32(pb, 0x01); /* version & flags */
  818. put_be64(pb, 0); /* reserved (graphics mode = copy) */
  819. return 0x14;
  820. }
  821. static int mov_write_hdlr_tag(ByteIOContext *pb, MOVTrack *track)
  822. {
  823. const char *hdlr, *descr = NULL, *hdlr_type = NULL;
  824. int64_t pos = url_ftell(pb);
  825. if (!track) { /* no media --> data handler */
  826. hdlr = "dhlr";
  827. hdlr_type = "url ";
  828. descr = "DataHandler";
  829. } else {
  830. hdlr = (track->mode == MODE_MOV) ? "mhlr" : "\0\0\0\0";
  831. if (track->enc->codec_type == CODEC_TYPE_VIDEO) {
  832. hdlr_type = "vide";
  833. descr = "VideoHandler";
  834. } else if (track->enc->codec_type == CODEC_TYPE_AUDIO) {
  835. hdlr_type = "soun";
  836. descr = "SoundHandler";
  837. } else if (track->enc->codec_type == CODEC_TYPE_SUBTITLE) {
  838. if (track->tag == MKTAG('t','x','3','g')) hdlr_type = "sbtl";
  839. else hdlr_type = "text";
  840. descr = "SubtitleHandler";
  841. }
  842. }
  843. put_be32(pb, 0); /* size */
  844. put_tag(pb, "hdlr");
  845. put_be32(pb, 0); /* Version & flags */
  846. put_buffer(pb, hdlr, 4); /* handler */
  847. put_tag(pb, hdlr_type); /* handler type */
  848. put_be32(pb ,0); /* reserved */
  849. put_be32(pb ,0); /* reserved */
  850. put_be32(pb ,0); /* reserved */
  851. put_byte(pb, strlen(descr)); /* string counter */
  852. put_buffer(pb, descr, strlen(descr)); /* handler description */
  853. return updateSize(pb, pos);
  854. }
  855. static int mov_write_minf_tag(ByteIOContext *pb, MOVTrack *track)
  856. {
  857. int64_t pos = url_ftell(pb);
  858. put_be32(pb, 0); /* size */
  859. put_tag(pb, "minf");
  860. if(track->enc->codec_type == CODEC_TYPE_VIDEO)
  861. mov_write_vmhd_tag(pb);
  862. else if (track->enc->codec_type == CODEC_TYPE_AUDIO)
  863. mov_write_smhd_tag(pb);
  864. else if (track->enc->codec_type == CODEC_TYPE_SUBTITLE) {
  865. if (track->tag == MKTAG('t','e','x','t')) mov_write_gmhd_tag(pb);
  866. else mov_write_nmhd_tag(pb);
  867. }
  868. if (track->mode == MODE_MOV) /* FIXME: Why do it for MODE_MOV only ? */
  869. mov_write_hdlr_tag(pb, NULL);
  870. mov_write_dinf_tag(pb);
  871. mov_write_stbl_tag(pb, track);
  872. return updateSize(pb, pos);
  873. }
  874. static int mov_write_mdhd_tag(ByteIOContext *pb, MOVTrack *track)
  875. {
  876. int version = track->trackDuration < INT32_MAX ? 0 : 1;
  877. (version == 1) ? put_be32(pb, 44) : put_be32(pb, 32); /* size */
  878. put_tag(pb, "mdhd");
  879. put_byte(pb, version);
  880. put_be24(pb, 0); /* flags */
  881. if (version == 1) {
  882. put_be64(pb, track->time);
  883. put_be64(pb, track->time);
  884. } else {
  885. put_be32(pb, track->time); /* creation time */
  886. put_be32(pb, track->time); /* modification time */
  887. }
  888. put_be32(pb, track->timescale); /* time scale (sample rate for audio) */
  889. (version == 1) ? put_be64(pb, track->trackDuration) : put_be32(pb, track->trackDuration); /* duration */
  890. put_be16(pb, track->language); /* language */
  891. put_be16(pb, 0); /* reserved (quality) */
  892. if(version!=0 && track->mode == MODE_MOV){
  893. av_log(NULL, AV_LOG_ERROR,
  894. "FATAL error, file duration too long for timebase, this file will not be\n"
  895. "playable with quicktime. Choose a different timebase or a different\n"
  896. "container format\n");
  897. }
  898. return 32;
  899. }
  900. static int mov_write_mdia_tag(ByteIOContext *pb, MOVTrack *track)
  901. {
  902. int64_t pos = url_ftell(pb);
  903. put_be32(pb, 0); /* size */
  904. put_tag(pb, "mdia");
  905. mov_write_mdhd_tag(pb, track);
  906. mov_write_hdlr_tag(pb, track);
  907. mov_write_minf_tag(pb, track);
  908. return updateSize(pb, pos);
  909. }
  910. static int mov_write_tkhd_tag(ByteIOContext *pb, MOVTrack *track, AVStream *st)
  911. {
  912. int64_t duration = av_rescale_rnd(track->trackDuration, globalTimescale, track->timescale, AV_ROUND_UP);
  913. int version = duration < INT32_MAX ? 0 : 1;
  914. (version == 1) ? put_be32(pb, 104) : put_be32(pb, 92); /* size */
  915. put_tag(pb, "tkhd");
  916. put_byte(pb, version);
  917. put_be24(pb, 0xf); /* flags (track enabled) */
  918. if (version == 1) {
  919. put_be64(pb, track->time);
  920. put_be64(pb, track->time);
  921. } else {
  922. put_be32(pb, track->time); /* creation time */
  923. put_be32(pb, track->time); /* modification time */
  924. }
  925. put_be32(pb, track->trackID); /* track-id */
  926. put_be32(pb, 0); /* reserved */
  927. (version == 1) ? put_be64(pb, duration) : put_be32(pb, duration);
  928. put_be32(pb, 0); /* reserved */
  929. put_be32(pb, 0); /* reserved */
  930. put_be32(pb, 0x0); /* reserved (Layer & Alternate group) */
  931. /* Volume, only for audio */
  932. if(track->enc->codec_type == CODEC_TYPE_AUDIO)
  933. put_be16(pb, 0x0100);
  934. else
  935. put_be16(pb, 0);
  936. put_be16(pb, 0); /* reserved */
  937. /* Matrix structure */
  938. put_be32(pb, 0x00010000); /* reserved */
  939. put_be32(pb, 0x0); /* reserved */
  940. put_be32(pb, 0x0); /* reserved */
  941. put_be32(pb, 0x0); /* reserved */
  942. put_be32(pb, 0x00010000); /* reserved */
  943. put_be32(pb, 0x0); /* reserved */
  944. put_be32(pb, 0x0); /* reserved */
  945. put_be32(pb, 0x0); /* reserved */
  946. put_be32(pb, 0x40000000); /* reserved */
  947. /* Track width and height, for visual only */
  948. if(track->enc->codec_type == CODEC_TYPE_VIDEO ||
  949. track->enc->codec_type == CODEC_TYPE_SUBTITLE) {
  950. double sample_aspect_ratio = av_q2d(st->sample_aspect_ratio);
  951. if(!sample_aspect_ratio || track->height != track->enc->height)
  952. sample_aspect_ratio = 1;
  953. put_be32(pb, sample_aspect_ratio * track->enc->width*0x10000);
  954. put_be32(pb, track->height*0x10000);
  955. }
  956. else {
  957. put_be32(pb, 0);
  958. put_be32(pb, 0);
  959. }
  960. return 0x5c;
  961. }
  962. // This box seems important for the psp playback ... without it the movie seems to hang
  963. static int mov_write_edts_tag(ByteIOContext *pb, MOVTrack *track)
  964. {
  965. put_be32(pb, 0x24); /* size */
  966. put_tag(pb, "edts");
  967. put_be32(pb, 0x1c); /* size */
  968. put_tag(pb, "elst");
  969. put_be32(pb, 0x0);
  970. put_be32(pb, 0x1);
  971. put_be32(pb, av_rescale_rnd(track->trackDuration, globalTimescale, track->timescale, AV_ROUND_UP)); /* duration ... doesn't seem to effect psp */
  972. put_be32(pb, track->cluster[0].cts); /* first pts is cts since dts is 0 */
  973. put_be32(pb, 0x00010000);
  974. return 0x24;
  975. }
  976. // goes at the end of each track! ... Critical for PSP playback ("Incompatible data" without it)
  977. static int mov_write_uuid_tag_psp(ByteIOContext *pb, MOVTrack *mov)
  978. {
  979. put_be32(pb, 0x34); /* size ... reports as 28 in mp4box! */
  980. put_tag(pb, "uuid");
  981. put_tag(pb, "USMT");
  982. put_be32(pb, 0x21d24fce);
  983. put_be32(pb, 0xbb88695c);
  984. put_be32(pb, 0xfac9c740);
  985. put_be32(pb, 0x1c); // another size here!
  986. put_tag(pb, "MTDT");
  987. put_be32(pb, 0x00010012);
  988. put_be32(pb, 0x0a);
  989. put_be32(pb, 0x55c40000);
  990. put_be32(pb, 0x1);
  991. put_be32(pb, 0x0);
  992. return 0x34;
  993. }
  994. static int mov_write_trak_tag(ByteIOContext *pb, MOVTrack *track, AVStream *st)
  995. {
  996. int64_t pos = url_ftell(pb);
  997. put_be32(pb, 0); /* size */
  998. put_tag(pb, "trak");
  999. mov_write_tkhd_tag(pb, track, st);
  1000. if (track->mode == MODE_PSP || track->hasBframes)
  1001. mov_write_edts_tag(pb, track); // PSP Movies require edts box
  1002. mov_write_mdia_tag(pb, track);
  1003. if (track->mode == MODE_PSP)
  1004. mov_write_uuid_tag_psp(pb,track); // PSP Movies require this uuid box
  1005. return updateSize(pb, pos);
  1006. }
  #if 0
  /* TODO: Not sorted out, but not necessary either */
  /* Disabled: would write a fixed 0x15-byte 'iods' box; mov is not read. */
  static int mov_write_iods_tag(ByteIOContext *pb, MOVMuxContext *mov)
  {
      const int box_size = 0x15;

      put_be32(pb, box_size);
      put_tag(pb, "iods");
      put_be32(pb, 0);        /* version & flags */
      put_be16(pb, 0x1007);
      put_byte(pb, 0);
      put_be16(pb, 0x4fff);
      put_be16(pb, 0xfffe);
      put_be16(pb, 0x01ff);

      return box_size;
  }
  #endif
  1022. static int mov_write_mvhd_tag(ByteIOContext *pb, MOVMuxContext *mov)
  1023. {
  1024. int maxTrackID = 1, i;
  1025. int64_t maxTrackLenTemp, maxTrackLen = 0;
  1026. int version;
  1027. for (i=0; i<mov->nb_streams; i++) {
  1028. if(mov->tracks[i].entry > 0) {
  1029. maxTrackLenTemp = av_rescale_rnd(mov->tracks[i].trackDuration, globalTimescale, mov->tracks[i].timescale, AV_ROUND_UP);
  1030. if(maxTrackLen < maxTrackLenTemp)
  1031. maxTrackLen = maxTrackLenTemp;
  1032. if(maxTrackID < mov->tracks[i].trackID)
  1033. maxTrackID = mov->tracks[i].trackID;
  1034. }
  1035. }
  1036. version = maxTrackLen < UINT32_MAX ? 0 : 1;
  1037. (version == 1) ? put_be32(pb, 120) : put_be32(pb, 108); /* size */
  1038. put_tag(pb, "mvhd");
  1039. put_byte(pb, version);
  1040. put_be24(pb, 0); /* flags */
  1041. if (version == 1) {
  1042. put_be64(pb, mov->time);
  1043. put_be64(pb, mov->time);
  1044. } else {
  1045. put_be32(pb, mov->time); /* creation time */
  1046. put_be32(pb, mov->time); /* modification time */
  1047. }
  1048. put_be32(pb, mov->timescale); /* timescale */
  1049. (version == 1) ? put_be64(pb, maxTrackLen) : put_be32(pb, maxTrackLen); /* duration of longest track */
  1050. put_be32(pb, 0x00010000); /* reserved (preferred rate) 1.0 = normal */
  1051. put_be16(pb, 0x0100); /* reserved (preferred volume) 1.0 = normal */
  1052. put_be16(pb, 0); /* reserved */
  1053. put_be32(pb, 0); /* reserved */
  1054. put_be32(pb, 0); /* reserved */
  1055. /* Matrix structure */
  1056. put_be32(pb, 0x00010000); /* reserved */
  1057. put_be32(pb, 0x0); /* reserved */
  1058. put_be32(pb, 0x0); /* reserved */
  1059. put_be32(pb, 0x0); /* reserved */
  1060. put_be32(pb, 0x00010000); /* reserved */
  1061. put_be32(pb, 0x0); /* reserved */
  1062. put_be32(pb, 0x0); /* reserved */
  1063. put_be32(pb, 0x0); /* reserved */
  1064. put_be32(pb, 0x40000000); /* reserved */
  1065. put_be32(pb, 0); /* reserved (preview time) */
  1066. put_be32(pb, 0); /* reserved (preview duration) */
  1067. put_be32(pb, 0); /* reserved (poster time) */
  1068. put_be32(pb, 0); /* reserved (selection time) */
  1069. put_be32(pb, 0); /* reserved (selection duration) */
  1070. put_be32(pb, 0); /* reserved (current time) */
  1071. put_be32(pb, maxTrackID+1); /* Next track id */
  1072. return 0x6c;
  1073. }
  1074. static int mov_write_itunes_hdlr_tag(ByteIOContext *pb, MOVMuxContext *mov,
  1075. AVFormatContext *s)
  1076. {
  1077. int64_t pos = url_ftell(pb);
  1078. put_be32(pb, 0); /* size */
  1079. put_tag(pb, "hdlr");
  1080. put_be32(pb, 0);
  1081. put_be32(pb, 0);
  1082. put_tag(pb, "mdir");
  1083. put_tag(pb, "appl");
  1084. put_be32(pb, 0);
  1085. put_be32(pb, 0);
  1086. put_be16(pb, 0);
  1087. return updateSize(pb, pos);
  1088. }
  1089. /* helper function to write a data tag with the specified string as data */
  1090. static int mov_write_string_data_tag(ByteIOContext *pb, const char *data, int lang, int long_style)
  1091. {
  1092. if(long_style){
  1093. int64_t pos = url_ftell(pb);
  1094. put_be32(pb, 0); /* size */
  1095. put_tag(pb, "data");
  1096. put_be32(pb, 1);
  1097. put_be32(pb, 0);
  1098. put_buffer(pb, data, strlen(data));
  1099. return updateSize(pb, pos);
  1100. }else{
  1101. put_be16(pb, strlen(data)); /* string length */
  1102. put_be16(pb, lang);
  1103. put_buffer(pb, data, strlen(data));
  1104. return strlen(data) + 4;
  1105. }
  1106. }
  1107. static int mov_write_string_tag(ByteIOContext *pb, const char *name, const char *value, int lang, int long_style){
  1108. int size = 0;
  1109. if (value && value[0]) {
  1110. int64_t pos = url_ftell(pb);
  1111. put_be32(pb, 0); /* size */
  1112. put_tag(pb, name);
  1113. mov_write_string_data_tag(pb, value, lang, long_style);
  1114. size= updateSize(pb, pos);
  1115. }
  1116. return size;
  1117. }
  1118. static int mov_write_string_metadata(AVFormatContext *s, ByteIOContext *pb,
  1119. const char *name, const char *tag,
  1120. int long_style)
  1121. {
  1122. int l, lang = 0, len, len2;
  1123. AVMetadataTag *t, *t2 = NULL;
  1124. char tag2[16];
  1125. if (!(t = av_metadata_get(s->metadata, tag, NULL, 0)))
  1126. return 0;
  1127. len = strlen(t->key);
  1128. snprintf(tag2, sizeof(tag2), "%s-", tag);
  1129. while ((t2 = av_metadata_get(s->metadata, tag2, t2, AV_METADATA_IGNORE_SUFFIX))) {
  1130. len2 = strlen(t2->key);
  1131. if (len2 == len+4 && !strcmp(t->value, t2->value)
  1132. && (l=ff_mov_iso639_to_lang(&t2->key[len2-3], 0)) >= 0) {
  1133. lang = l;
  1134. break;
  1135. }
  1136. }
  1137. return mov_write_string_tag(pb, name, t->value, lang, long_style);
  1138. }
  1139. /* iTunes track number */
  1140. static int mov_write_trkn_tag(ByteIOContext *pb, MOVMuxContext *mov,
  1141. AVFormatContext *s)
  1142. {
  1143. AVMetadataTag *t = av_metadata_get(s->metadata, "track", NULL, 0);
  1144. int size = 0, track = t ? atoi(t->value) : 0;
  1145. if (track) {
  1146. int64_t pos = url_ftell(pb);
  1147. put_be32(pb, 0); /* size */
  1148. put_tag(pb, "trkn");
  1149. {
  1150. int64_t pos = url_ftell(pb);
  1151. put_be32(pb, 0); /* size */
  1152. put_tag(pb, "data");
  1153. put_be32(pb, 0); // 8 bytes empty
  1154. put_be32(pb, 0);
  1155. put_be16(pb, 0); // empty
  1156. put_be16(pb, track); // track number
  1157. put_be16(pb, 0); // total track number
  1158. put_be16(pb, 0); // empty
  1159. updateSize(pb, pos);
  1160. }
  1161. size = updateSize(pb, pos);
  1162. }
  1163. return size;
  1164. }
  1165. /* iTunes meta data list */
  1166. static int mov_write_ilst_tag(ByteIOContext *pb, MOVMuxContext *mov,
  1167. AVFormatContext *s)
  1168. {
  1169. int64_t pos = url_ftell(pb);
  1170. put_be32(pb, 0); /* size */
  1171. put_tag(pb, "ilst");
  1172. mov_write_string_metadata(s, pb, "\251nam", "title" , 1);
  1173. mov_write_string_metadata(s, pb, "\251ART", "author" , 1);
  1174. mov_write_string_metadata(s, pb, "\251wrt", "author" , 1);
  1175. mov_write_string_metadata(s, pb, "\251alb", "album" , 1);
  1176. mov_write_string_metadata(s, pb, "\251day", "year" , 1);
  1177. mov_write_string_tag(pb, "\251too", LIBAVFORMAT_IDENT, 0, 1);
  1178. mov_write_string_metadata(s, pb, "\251cmt", "comment" , 1);
  1179. mov_write_string_metadata(s, pb, "\251gen", "genre" , 1);
  1180. mov_write_string_metadata(s, pb, "\251cpy", "copyright", 1);
  1181. mov_write_trkn_tag(pb, mov, s);
  1182. return updateSize(pb, pos);
  1183. }
  1184. /* iTunes meta data tag */
  1185. static int mov_write_meta_tag(ByteIOContext *pb, MOVMuxContext *mov,
  1186. AVFormatContext *s)
  1187. {
  1188. int size = 0;
  1189. int64_t pos = url_ftell(pb);
  1190. put_be32(pb, 0); /* size */
  1191. put_tag(pb, "meta");
  1192. put_be32(pb, 0);
  1193. mov_write_itunes_hdlr_tag(pb, mov, s);
  1194. mov_write_ilst_tag(pb, mov, s);
  1195. size = updateSize(pb, pos);
  1196. return size;
  1197. }
  1198. static int utf8len(const uint8_t *b)
  1199. {
  1200. int len=0;
  1201. int val;
  1202. while(*b){
  1203. GET_UTF8(val, *b++, return -1;)
  1204. len++;
  1205. }
  1206. return len;
  1207. }
  1208. static int ascii_to_wc(ByteIOContext *pb, const uint8_t *b)
  1209. {
  1210. int val;
  1211. while(*b){
  1212. GET_UTF8(val, *b++, return -1;)
  1213. put_be16(pb, val);
  1214. }
  1215. put_be16(pb, 0x00);
  1216. return 0;
  1217. }
  /*
   * Pack the first three characters of str into a 15-bit code: each
   * character contributes the low five bits of (character - 0x60), the
   * first character ending up in the most significant position.
   */
  static uint16_t language_code(const char *str)
  {
      unsigned packed = 0;
      int i;

      for (i = 0; i < 3; i++)
          packed = (packed << 5) + ((str[i] - 0x60) & 0x1F);

      return packed;
  }
  1222. static int mov_write_3gp_udta_tag(ByteIOContext *pb, AVFormatContext *s,
  1223. const char *tag, const char *str)
  1224. {
  1225. int64_t pos = url_ftell(pb);
  1226. AVMetadataTag *t = av_metadata_get(s->metadata, str, NULL, 0);
  1227. if (!t || !utf8len(t->value))
  1228. return 0;
  1229. put_be32(pb, 0); /* size */
  1230. put_tag (pb, tag); /* type */
  1231. put_be32(pb, 0); /* version + flags */
  1232. if (!strcmp(tag, "yrrc"))
  1233. put_be16(pb, atoi(t->value));
  1234. else {
  1235. put_be16(pb, language_code("eng")); /* language */
  1236. ascii_to_wc(pb, t->value);
  1237. if (!strcmp(tag, "albm") &&
  1238. (t = av_metadata_get(s->metadata, "year", NULL, 0)))
  1239. put_byte(pb, atoi(t->value));
  1240. }
  1241. return updateSize(pb, pos);
  1242. }
  1243. static int mov_write_udta_tag(ByteIOContext *pb, MOVMuxContext *mov,
  1244. AVFormatContext *s)
  1245. {
  1246. ByteIOContext *pb_buf;
  1247. int i, ret, size;
  1248. uint8_t *buf;
  1249. for (i = 0; i < s->nb_streams; i++)
  1250. if (mov->tracks[i].enc->flags & CODEC_FLAG_BITEXACT) {
  1251. return 0;
  1252. }
  1253. ret = url_open_dyn_buf(&pb_buf);
  1254. if(ret < 0)
  1255. return ret;
  1256. if (mov->mode & MODE_3GP) {
  1257. mov_write_3gp_udta_tag(pb_buf, s, "titl", "title");
  1258. mov_write_3gp_udta_tag(pb_buf, s, "auth", "author");
  1259. mov_write_3gp_udta_tag(pb_buf, s, "gnre", "genre");
  1260. mov_write_3gp_udta_tag(pb_buf, s, "dscp", "comment");
  1261. mov_write_3gp_udta_tag(pb_buf, s, "albm", "album");
  1262. mov_write_3gp_udta_tag(pb_buf, s, "cprt", "copyright");
  1263. mov_write_3gp_udta_tag(pb_buf, s, "yrrc", "year");
  1264. } else if (mov->mode == MODE_MOV) { // the title field breaks gtkpod with mp4 and my suspicion is that stuff is not valid in mp4
  1265. mov_write_string_metadata(s, pb_buf, "\251nam", "title" , 0);
  1266. mov_write_string_metadata(s, pb_buf, "\251aut", "author" , 0);
  1267. mov_write_string_metadata(s, pb_buf, "\251alb", "album" , 0);
  1268. mov_write_string_metadata(s, pb_buf, "\251day", "year" , 0);
  1269. mov_write_string_tag(pb_buf, "\251enc", LIBAVFORMAT_IDENT, 0, 0);
  1270. mov_write_string_metadata(s, pb_buf, "\251des", "comment" , 0);
  1271. mov_write_string_metadata(s, pb_buf, "\251gen", "genre" , 0);
  1272. mov_write_string_metadata(s, pb_buf, "\251cpy", "copyright" , 0);
  1273. } else {
  1274. /* iTunes meta data */
  1275. mov_write_meta_tag(pb_buf, mov, s);
  1276. }
  1277. if ((size = url_close_dyn_buf(pb_buf, &buf)) > 0) {
  1278. put_be32(pb, size+8);
  1279. put_tag(pb, "udta");
  1280. put_buffer(pb, buf, size);
  1281. av_free(buf);
  1282. }
  1283. return 0;
  1284. }
  1285. static void mov_write_psp_udta_tag(ByteIOContext *pb,
  1286. const char *str, const char *lang, int type)
  1287. {
  1288. int len = utf8len(str)+1;
  1289. if(len<=0)
  1290. return;
  1291. put_be16(pb, len*2+10); /* size */
  1292. put_be32(pb, type); /* type */
  1293. put_be16(pb, language_code(lang)); /* language */
  1294. put_be16(pb, 0x01); /* ? */
  1295. ascii_to_wc(pb, str);
  1296. }
  1297. static int mov_write_uuidusmt_tag(ByteIOContext *pb, AVFormatContext *s)
  1298. {
  1299. AVMetadataTag *title = av_metadata_get(s->metadata, "title", NULL, 0);
  1300. int64_t pos, pos2;
  1301. if (title) {
  1302. pos = url_ftell(pb);
  1303. put_be32(pb, 0); /* size placeholder*/
  1304. put_tag(pb, "uuid");
  1305. put_tag(pb, "USMT");
  1306. put_be32(pb, 0x21d24fce); /* 96 bit UUID */
  1307. put_be32(pb, 0xbb88695c);
  1308. put_be32(pb, 0xfac9c740);
  1309. pos2 = url_ftell(pb);
  1310. put_be32(pb, 0); /* size placeholder*/
  1311. put_tag(pb, "MTDT");
  1312. put_be16(pb, 4);
  1313. // ?
  1314. put_be16(pb, 0x0C); /* size */
  1315. put_be32(pb, 0x0B); /* type */
  1316. put_be16(pb, language_code("und")); /* language */
  1317. put_be16(pb, 0x0); /* ? */
  1318. put_be16(pb, 0x021C); /* data */
  1319. mov_write_psp_udta_tag(pb, LIBAVCODEC_IDENT, "eng", 0x04);
  1320. mov_write_psp_udta_tag(pb, title->value, "eng", 0x01);
  1321. // snprintf(dt,32,"%04d/%02d/%02d %02d:%02d:%02d",t_st->tm_year+1900,t_st->tm_mon+1,t_st->tm_mday,t_st->tm_hour,t_st->tm_min,t_st->tm_sec);
  1322. mov_write_psp_udta_tag(pb, "2006/04/01 11:11:11", "und", 0x03);
  1323. updateSize(pb, pos2);
  1324. return updateSize(pb, pos);
  1325. }
  1326. return 0;
  1327. }
  1328. static int mov_write_moov_tag(ByteIOContext *pb, MOVMuxContext *mov,
  1329. AVFormatContext *s)
  1330. {
  1331. int i;
  1332. int64_t pos = url_ftell(pb);
  1333. put_be32(pb, 0); /* size placeholder*/
  1334. put_tag(pb, "moov");
  1335. mov->timescale = globalTimescale;
  1336. for (i=0; i<mov->nb_streams; i++) {
  1337. if(mov->tracks[i].entry <= 0) continue;
  1338. mov->tracks[i].time = mov->time;
  1339. mov->tracks[i].trackID = i+1;
  1340. }
  1341. mov_write_mvhd_tag(pb, mov);
  1342. //mov_write_iods_tag(pb, mov);
  1343. for (i=0; i<mov->nb_streams; i++) {
  1344. if(mov->tracks[i].entry > 0) {
  1345. mov_write_trak_tag(pb, &(mov->tracks[i]), s->streams[i]);
  1346. }
  1347. }
  1348. if (mov->mode == MODE_PSP)
  1349. mov_write_uuidusmt_tag(pb, s);
  1350. else
  1351. mov_write_udta_tag(pb, mov, s);
  1352. return updateSize(pb, pos);
  1353. }
  1354. static int mov_write_mdat_tag(ByteIOContext *pb, MOVMuxContext *mov)
  1355. {
  1356. put_be32(pb, 8); // placeholder for extended size field (64 bit)
  1357. put_tag(pb, mov->mode == MODE_MOV ? "wide" : "free");
  1358. mov->mdat_pos = url_ftell(pb);
  1359. put_be32(pb, 0); /* size placeholder*/
  1360. put_tag(pb, "mdat");
  1361. return 0;
  1362. }
  1363. /* TODO: This needs to be more general */
  1364. static int mov_write_ftyp_tag(ByteIOContext *pb, AVFormatContext *s)
  1365. {
  1366. MOVMuxContext *mov = s->priv_data;
  1367. int64_t pos = url_ftell(pb);
  1368. int has_h264 = 0, has_video = 0;
  1369. int minor = 0x200;
  1370. int i;
  1371. for (i = 0; i < s->nb_streams; i++) {
  1372. AVStream *st = s->streams[i];
  1373. if (st->codec->codec_type == CODEC_TYPE_VIDEO)
  1374. has_video = 1;
  1375. if (st->codec->codec_id == CODEC_ID_H264)
  1376. has_h264 = 1;
  1377. }
  1378. put_be32(pb, 0); /* size */
  1379. put_tag(pb, "ftyp");
  1380. if (mov->mode == MODE_3GP) {
  1381. put_tag(pb, has_h264 ? "3gp6" : "3gp4");
  1382. minor = has_h264 ? 0x100 : 0x200;
  1383. } else if (mov->mode & MODE_3G2) {
  1384. put_tag(pb, has_h264 ? "3g2b" : "3g2a");
  1385. minor = has_h264 ? 0x20000 : 0x10000;
  1386. }else if (mov->mode == MODE_PSP)
  1387. put_tag(pb, "MSNV");
  1388. else if (mov->mode == MODE_MP4)
  1389. put_tag(pb, "isom");
  1390. else if (mov->mode == MODE_IPOD)
  1391. put_tag(pb, has_video ? "M4V ":"M4A ");
  1392. else
  1393. put_tag(pb, "qt ");
  1394. put_be32(pb, minor);
  1395. if(mov->mode == MODE_MOV)
  1396. put_tag(pb, "qt ");
  1397. else{
  1398. put_tag(pb, "isom");
  1399. put_tag(pb, "iso2");
  1400. if(has_h264)
  1401. put_tag(pb, "avc1");
  1402. }
  1403. if (mov->mode == MODE_3GP)
  1404. put_tag(pb, has_h264 ? "3gp6":"3gp4");
  1405. else if (mov->mode & MODE_3G2)
  1406. put_tag(pb, has_h264 ? "3g2b":"3g2a");
  1407. else if (mov->mode == MODE_PSP)
  1408. put_tag(pb, "MSNV");
  1409. else if (mov->mode == MODE_MP4)
  1410. put_tag(pb, "mp41");
  1411. return updateSize(pb, pos);
  1412. }
  1413. static void mov_write_uuidprof_tag(ByteIOContext *pb, AVFormatContext *s)
  1414. {
  1415. AVCodecContext *VideoCodec = s->streams[0]->codec;
  1416. AVCodecContext *AudioCodec = s->streams[1]->codec;
  1417. int AudioRate = AudioCodec->sample_rate;
  1418. int FrameRate = ((VideoCodec->time_base.den) * (0x10000))/ (VideoCodec->time_base.num);
  1419. int audio_kbitrate= AudioCodec->bit_rate / 1000;
  1420. int video_kbitrate= FFMIN(VideoCodec->bit_rate / 1000, 800 - audio_kbitrate);
  1421. put_be32(pb, 0x94); /* size */
  1422. put_tag(pb, "uuid");
  1423. put_tag(pb, "PROF");
  1424. put_be32(pb, 0x21d24fce); /* 96 bit UUID */
  1425. put_be32(pb, 0xbb88695c);
  1426. put_be32(pb, 0xfac9c740);
  1427. put_be32(pb, 0x0); /* ? */
  1428. put_be32(pb, 0x3); /* 3 sections ? */
  1429. put_be32(pb, 0x14); /* size */
  1430. put_tag(pb, "FPRF");
  1431. put_be32(pb, 0x0); /* ? */
  1432. put_be32(pb, 0x0); /* ? */
  1433. put_be32(pb, 0x0); /* ? */
  1434. put_be32(pb, 0x2c); /* size */
  1435. put_tag(pb, "APRF"); /* audio */
  1436. put_be32(pb, 0x0);
  1437. put_be32(pb, 0x2); /* TrackID */
  1438. put_tag(pb, "mp4a");
  1439. put_be32(pb, 0x20f);
  1440. put_be32(pb, 0x0);
  1441. put_be32(pb, audio_kbitrate);
  1442. put_be32(pb, audio_kbitrate);
  1443. put_be32(pb, AudioRate);
  1444. put_be32(pb, AudioCodec->channels);
  1445. put_be32(pb, 0x34); /* size */
  1446. put_tag(pb, "VPRF"); /* video */
  1447. put_be32(pb, 0x0);
  1448. put_be32(pb, 0x1); /* TrackID */
  1449. if (VideoCodec->codec_id == CODEC_ID_H264) {
  1450. put_tag(pb, "avc1");
  1451. put_be16(pb, 0x014D);
  1452. put_be16(pb, 0x0015);
  1453. } else {
  1454. put_tag(pb, "mp4v");
  1455. put_be16(pb, 0x0000);
  1456. put_be16(pb, 0x0103);
  1457. }
  1458. put_be32(pb, 0x0);
  1459. put_be32(pb, video_kbitrate);
  1460. put_be32(pb, video_kbitrate);
  1461. put_be32(pb, FrameRate);
  1462. put_be32(pb, FrameRate);
  1463. put_be16(pb, VideoCodec->width);
  1464. put_be16(pb, VideoCodec->height);
  1465. put_be32(pb, 0x010001); /* ? */
  1466. }
  1467. static int mov_write_header(AVFormatContext *s)
  1468. {
  1469. ByteIOContext *pb = s->pb;
  1470. MOVMuxContext *mov = s->priv_data;
  1471. int i;
  1472. if (url_is_streamed(s->pb)) {
  1473. av_log(s, AV_LOG_ERROR, "muxer does not support non seekable output\n");
  1474. return -1;
  1475. }
  1476. /* Default mode == MP4 */
  1477. mov->mode = MODE_MP4;
  1478. if (s->oformat != NULL) {
  1479. if (!strcmp("3gp", s->oformat->name)) mov->mode = MODE_3GP;
  1480. else if (!strcmp("3g2", s->oformat->name)) mov->mode = MODE_3GP|MODE_3G2;
  1481. else if (!strcmp("mov", s->oformat->name)) mov->mode = MODE_MOV;
  1482. else if (!strcmp("psp", s->oformat->name)) mov->mode = MODE_PSP;
  1483. else if (!strcmp("ipod",s->oformat->name)) mov->mode = MODE_IPOD;
  1484. mov_write_ftyp_tag(pb,s);
  1485. if (mov->mode == MODE_PSP) {
  1486. if (s->nb_streams != 2) {
  1487. av_log(s, AV_LOG_ERROR, "PSP mode need one video and one audio stream\n");
  1488. return -1;
  1489. }
  1490. mov_write_uuidprof_tag(pb,s);
  1491. }
  1492. }
  1493. for(i=0; i<s->nb_streams; i++){
  1494. AVStream *st= s->streams[i];
  1495. MOVTrack *track= &mov->tracks[i];
  1496. AVMetadataTag *lang = av_metadata_get(st->metadata, "language", NULL,0);
  1497. track->enc = st->codec;
  1498. track->language = ff_mov_iso639_to_lang(lang?lang->value:"und", mov->mode!=MODE_MOV);
  1499. if (track->language < 0)
  1500. track->language = 0;
  1501. track->mode = mov->mode;
  1502. track->tag = mov_find_codec_tag(s, track);
  1503. if (!track->tag) {
  1504. av_log(s, AV_LOG_ERROR, "track %d: could not find tag, "
  1505. "codec not currently supported in container\n", i);
  1506. return -1;
  1507. }
  1508. if(st->codec->codec_type == CODEC_TYPE_VIDEO){
  1509. if (track->tag == MKTAG('m','x','3','p') || track->tag == MKTAG('m','x','3','n') ||
  1510. track->tag == MKTAG('m','x','4','p') || track->tag == MKTAG('m','x','4','n') ||
  1511. track->tag == MKTAG('m','x','5','p') || track->tag == MKTAG('m','x','5','n')) {
  1512. if (st->codec->width != 720 || (st->codec->height != 608 && st->codec->height != 512)) {
  1513. av_log(s, AV_LOG_ERROR, "D-10/IMX must use 720x608 or 720x512 video resolution\n");
  1514. return -1;
  1515. }
  1516. track->height = track->tag>>24 == 'n' ? 486 : 576;
  1517. }
  1518. track->timescale = st->codec->time_base.den;
  1519. av_set_pts_info(st, 64, 1, st->codec->time_base.den);
  1520. if (track->mode == MODE_MOV && track->timescale > 100000)
  1521. av_log(s, AV_LOG_WARNING,
  1522. "WARNING codec timebase is very high. If duration is too long,\n"
  1523. "file may not be playable by quicktime. Specify a shorter timebase\n"
  1524. "or choose different container.\n");
  1525. }else if(st->codec->codec_type == CODEC_TYPE_AUDIO){
  1526. track->timescale = st->codec->sample_rate;
  1527. av_set_pts_info(st, 64, 1, st->codec->sample_rate);
  1528. if(!st->codec->frame_size && !av_get_bits_per_sample(st->codec->codec_id)) {
  1529. av_log(s, AV_LOG_ERROR, "track %d: codec frame size is not set\n", i);
  1530. return -1;
  1531. }else if(st->codec->frame_size > 1){ /* assume compressed audio */
  1532. track->audio_vbr = 1;
  1533. }else{
  1534. st->codec->frame_size = 1;
  1535. track->sampleSize = (av_get_bits_per_sample(st->codec->codec_id) >> 3) * st->codec->channels;
  1536. }
  1537. if(track->mode != MODE_MOV &&
  1538. track->enc->codec_id == CODEC_ID_MP3 && track->enc->sample_rate < 16000){
  1539. av_log(s, AV_LOG_ERROR, "track %d: muxing mp3 at %dhz is not supported\n",
  1540. i, track->enc->sample_rate);
  1541. return -1;
  1542. }
  1543. }else if(st->codec->codec_type == CODEC_TYPE_SUBTITLE){
  1544. track->timescale = st->codec->time_base.den;
  1545. av_set_pts_info(st, 64, 1, st->codec->time_base.den);
  1546. }
  1547. if (!track->height)
  1548. track->height = st->codec->height;
  1549. }
  1550. mov_write_mdat_tag(pb, mov);
  1551. mov->time = s->timestamp + 0x7C25B080; //1970 based -> 1904 based
  1552. mov->nb_streams = s->nb_streams;
  1553. put_flush_packet(pb);
  1554. return 0;
  1555. }
  1556. static int mov_write_packet(AVFormatContext *s, AVPacket *pkt)
  1557. {
  1558. MOVMuxContext *mov = s->priv_data;
  1559. ByteIOContext *pb = s->pb;
  1560. MOVTrack *trk = &mov->tracks[pkt->stream_index];
  1561. AVCodecContext *enc = trk->enc;
  1562. unsigned int samplesInChunk = 0;
  1563. int size= pkt->size;
  1564. if (url_is_streamed(s->pb)) return 0; /* Can't handle that */
  1565. if (!size) return 0; /* Discard 0 sized packets */
  1566. if (enc->codec_id == CODEC_ID_AMR_NB) {
  1567. /* We must find out how many AMR blocks there are in one packet */
  1568. static uint16_t packed_size[16] =
  1569. {13, 14, 16, 18, 20, 21, 27, 32, 6, 0, 0, 0, 0, 0, 0, 0};
  1570. int len = 0;
  1571. while (len < size && samplesInChunk < 100) {
  1572. len += packed_size[(pkt->data[len] >> 3) & 0x0F];
  1573. samplesInChunk++;
  1574. }
  1575. if(samplesInChunk > 1){
  1576. av_log(s, AV_LOG_ERROR, "fatal error, input is not a single packet, implement a AVParser for it\n");
  1577. return -1;
  1578. }
  1579. } else if (trk->sampleSize)
  1580. samplesInChunk = size/trk->sampleSize;
  1581. else
  1582. samplesInChunk = 1;
  1583. /* copy extradata if it exists */
  1584. if (trk->vosLen == 0 && enc->extradata_size > 0) {
  1585. trk->vosLen = enc->extradata_size;
  1586. trk->vosData = av_malloc(trk->vosLen);
  1587. memcpy(trk->vosData, enc->extradata, trk->vosLen);
  1588. }
  1589. if (enc->codec_id == CODEC_ID_H264 && trk->vosLen > 0 && *(uint8_t *)trk->vosData != 1) {
  1590. /* from x264 or from bytestream h264 */
  1591. /* nal reformating needed */
  1592. size = ff_avc_parse_nal_units(pb, pkt->data, pkt->size);
  1593. } else {
  1594. put_buffer(pb, pkt->data, size);
  1595. }
  1596. if ((enc->codec_id == CODEC_ID_DNXHD ||
  1597. enc->codec_id == CODEC_ID_AC3) && !trk->vosLen) {
  1598. /* copy frame to create needed atoms */
  1599. trk->vosLen = size;
  1600. trk->vosData = av_malloc(size);
  1601. if (!trk->vosData)
  1602. return AVERROR(ENOMEM);
  1603. memcpy(trk->vosData, pkt->data, size);
  1604. }
  1605. if (!(trk->entry % MOV_INDEX_CLUSTER_SIZE)) {
  1606. trk->cluster = av_realloc(trk->cluster, (trk->entry + MOV_INDEX_CLUSTER_SIZE) * sizeof(*trk->cluster));
  1607. if (!trk->cluster)
  1608. return -1;
  1609. }
  1610. trk->cluster[trk->entry].pos = url_ftell(pb) - size;
  1611. trk->cluster[trk->entry].samplesInChunk = samplesInChunk;
  1612. trk->cluster[trk->entry].size = size;
  1613. trk->cluster[trk->entry].entries = samplesInChunk;
  1614. trk->cluster[trk->entry].dts = pkt->dts;
  1615. trk->trackDuration = pkt->dts - trk->cluster[0].dts + pkt->duration;
  1616. if (pkt->pts == AV_NOPTS_VALUE) {
  1617. av_log(s, AV_LOG_WARNING, "pts has no value\n");
  1618. pkt->pts = pkt->dts;
  1619. }
  1620. if (pkt->dts != pkt->pts)
  1621. trk->hasBframes = 1;
  1622. trk->cluster[trk->entry].cts = pkt->pts - pkt->dts;
  1623. trk->cluster[trk->entry].key_frame = !!(pkt->flags & PKT_FLAG_KEY);
  1624. if(trk->cluster[trk->entry].key_frame)
  1625. trk->hasKeyframes++;
  1626. trk->entry++;
  1627. trk->sampleCount += samplesInChunk;
  1628. mov->mdat_size += size;
  1629. put_flush_packet(pb);
  1630. return 0;
  1631. }
  1632. static int mov_write_trailer(AVFormatContext *s)
  1633. {
  1634. MOVMuxContext *mov = s->priv_data;
  1635. ByteIOContext *pb = s->pb;
  1636. int res = 0;
  1637. int i;
  1638. int64_t moov_pos = url_ftell(pb);
  1639. /* Write size of mdat tag */
  1640. if (mov->mdat_size+8 <= UINT32_MAX) {
  1641. url_fseek(pb, mov->mdat_pos, SEEK_SET);
  1642. put_be32(pb, mov->mdat_size+8);
  1643. } else {
  1644. /* overwrite 'wide' placeholder atom */
  1645. url_fseek(pb, mov->mdat_pos - 8, SEEK_SET);
  1646. put_be32(pb, 1); /* special value: real atom size will be 64 bit value after tag field */
  1647. put_tag(pb, "mdat");
  1648. put_be64(pb, mov->mdat_size+16);
  1649. }
  1650. url_fseek(pb, moov_pos, SEEK_SET);
  1651. mov_write_moov_tag(pb, mov, s);
  1652. for (i=0; i<mov->nb_streams; i++) {
  1653. av_freep(&mov->tracks[i].cluster);
  1654. if(mov->tracks[i].vosLen) av_free(mov->tracks[i].vosData);
  1655. }
  1656. put_flush_packet(pb);
  1657. return res;
  1658. }
  #if CONFIG_MOV_MUXER
  /* Output format descriptor for the "mov" muxer.
   * NOTE(review): field names follow AVOutputFormat as declared in
   * avformat.h (not visible in this file) - confirm against that header. */
  AVOutputFormat mov_muxer = {
      .name           = "mov",
      .long_name      = NULL_IF_CONFIG_SMALL("MOV format"),
      .mime_type      = NULL,
      .extensions     = "mov",
      .priv_data_size = sizeof(MOVMuxContext),
      .audio_codec    = CODEC_ID_AAC,
      .video_codec    = CODEC_ID_MPEG4,
      .write_header   = mov_write_header,
      .write_packet   = mov_write_packet,
      .write_trailer  = mov_write_trailer,
      .flags          = AVFMT_GLOBALHEADER | AVFMT_VARIABLE_FPS,
      .codec_tag      = (const AVCodecTag* const []){codec_movvideo_tags, codec_movaudio_tags, 0},
  };
  #endif
  #if CONFIG_TGP_MUXER
  /* Output format descriptor for the "3gp" muxer.
   * NOTE(review): field names follow AVOutputFormat as declared in
   * avformat.h (not visible in this file) - confirm against that header. */
  AVOutputFormat tgp_muxer = {
      .name           = "3gp",
      .long_name      = NULL_IF_CONFIG_SMALL("3GP format"),
      .mime_type      = NULL,
      .extensions     = "3gp",
      .priv_data_size = sizeof(MOVMuxContext),
      .audio_codec    = CODEC_ID_AMR_NB,
      .video_codec    = CODEC_ID_H263,
      .write_header   = mov_write_header,
      .write_packet   = mov_write_packet,
      .write_trailer  = mov_write_trailer,
      .flags          = AVFMT_GLOBALHEADER,
      .codec_tag      = (const AVCodecTag* const []){codec_3gp_tags, 0},
  };
  #endif
  #if CONFIG_MP4_MUXER
  /* Output format descriptor for the "mp4" muxer.
   * NOTE(review): field names follow AVOutputFormat as declared in
   * avformat.h (not visible in this file) - confirm against that header. */
  AVOutputFormat mp4_muxer = {
      .name           = "mp4",
      .long_name      = NULL_IF_CONFIG_SMALL("MP4 format"),
      .mime_type      = "application/mp4",
      .extensions     = "mp4",
      .priv_data_size = sizeof(MOVMuxContext),
      .audio_codec    = CODEC_ID_AAC,
      .video_codec    = CODEC_ID_MPEG4,
      .write_header   = mov_write_header,
      .write_packet   = mov_write_packet,
      .write_trailer  = mov_write_trailer,
      .flags          = AVFMT_GLOBALHEADER | AVFMT_VARIABLE_FPS,
      .codec_tag      = (const AVCodecTag* const []){ff_mp4_obj_type, 0},
  };
  #endif
  #if CONFIG_PSP_MUXER
  /* Output format descriptor for the "psp" muxer.
   * NOTE(review): field names follow AVOutputFormat as declared in
   * avformat.h (not visible in this file) - confirm against that header. */
  AVOutputFormat psp_muxer = {
      .name           = "psp",
      .long_name      = NULL_IF_CONFIG_SMALL("PSP MP4 format"),
      .mime_type      = NULL,
      .extensions     = "mp4,psp",
      .priv_data_size = sizeof(MOVMuxContext),
      .audio_codec    = CODEC_ID_AAC,
      .video_codec    = CODEC_ID_MPEG4,
      .write_header   = mov_write_header,
      .write_packet   = mov_write_packet,
      .write_trailer  = mov_write_trailer,
      .flags          = AVFMT_GLOBALHEADER,
      .codec_tag      = (const AVCodecTag* const []){ff_mp4_obj_type, 0},
  };
  #endif
  #if CONFIG_TG2_MUXER
  /* Output format descriptor for the "3g2" muxer.
   * NOTE(review): field names follow AVOutputFormat as declared in
   * avformat.h (not visible in this file) - confirm against that header. */
  AVOutputFormat tg2_muxer = {
      .name           = "3g2",
      .long_name      = NULL_IF_CONFIG_SMALL("3GP2 format"),
      .mime_type      = NULL,
      .extensions     = "3g2",
      .priv_data_size = sizeof(MOVMuxContext),
      .audio_codec    = CODEC_ID_AMR_NB,
      .video_codec    = CODEC_ID_H263,
      .write_header   = mov_write_header,
      .write_packet   = mov_write_packet,
      .write_trailer  = mov_write_trailer,
      .flags          = AVFMT_GLOBALHEADER,
      .codec_tag      = (const AVCodecTag* const []){codec_3gp_tags, 0},
  };
  #endif
  #if CONFIG_IPOD_MUXER
  /* Output format descriptor for the "ipod" muxer.
   * NOTE(review): field names follow AVOutputFormat as declared in
   * avformat.h (not visible in this file) - confirm against that header. */
  AVOutputFormat ipod_muxer = {
      .name           = "ipod",
      .long_name      = NULL_IF_CONFIG_SMALL("iPod H.264 MP4 format"),
      .mime_type      = "application/mp4",
      .extensions     = "m4v,m4a",
      .priv_data_size = sizeof(MOVMuxContext),
      .audio_codec    = CODEC_ID_AAC,
      .video_codec    = CODEC_ID_H264,
      .write_header   = mov_write_header,
      .write_packet   = mov_write_packet,
      .write_trailer  = mov_write_trailer,
      .flags          = AVFMT_GLOBALHEADER,
      .codec_tag      = (const AVCodecTag* const []){codec_ipod_tags, 0},
  };
  #endif