You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

1873 lines
62KB

  1. /*
  2. * Matroska muxer
  3. * Copyright (c) 2007 David Conrad
  4. *
  5. * This file is part of Libav.
  6. *
  7. * Libav is free software; you can redistribute it and/or
  8. * modify it under the terms of the GNU Lesser General Public
  9. * License as published by the Free Software Foundation; either
  10. * version 2.1 of the License, or (at your option) any later version.
  11. *
  12. * Libav is distributed in the hope that it will be useful,
  13. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  15. * Lesser General Public License for more details.
  16. *
  17. * You should have received a copy of the GNU Lesser General Public
  18. * License along with Libav; if not, write to the Free Software
  19. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  20. */
  21. #include <stdint.h>
  22. #include "avc.h"
  23. #include "hevc.h"
  24. #include "avformat.h"
  25. #include "avlanguage.h"
  26. #include "flacenc.h"
  27. #include "internal.h"
  28. #include "isom.h"
  29. #include "matroska.h"
  30. #include "riff.h"
  31. #include "vorbiscomment.h"
  32. #include "wv.h"
  33. #include "libavutil/avstring.h"
  34. #include "libavutil/channel_layout.h"
  35. #include "libavutil/dict.h"
  36. #include "libavutil/intfloat.h"
  37. #include "libavutil/intreadwrite.h"
  38. #include "libavutil/lfg.h"
  39. #include "libavutil/mathematics.h"
  40. #include "libavutil/opt.h"
  41. #include "libavutil/random_seed.h"
  42. #include "libavutil/samplefmt.h"
  43. #include "libavutil/stereo3d.h"
  44. #include "libavcodec/xiph.h"
  45. #include "libavcodec/mpeg4audio.h"
  /**
   * Handle for an EBML master element that has been opened with
   * start_ebml_master() and still needs its size patched in by
   * end_ebml_master().
   */
  typedef struct ebml_master {
      int64_t pos;       ///< absolute offset in the file where the master's elements start
      int     sizebytes; ///< how many bytes were reserved for the size
  } ebml_master;
  /** A single entry of a seek head: which element, and where it is. */
  typedef struct mkv_seekhead_entry {
      unsigned int elementid;  ///< EBML ID of the indexed element
      uint64_t     segmentpos; ///< position of the element relative to the segment offset
  } mkv_seekhead_entry;

  /** In-memory seek head that is filled while muxing and written out later. */
  typedef struct mkv_seekhead {
      int64_t             filepos;        ///< file offset of the space reserved for the seek head
      int64_t             segment_offset; ///< the file offset to the beginning of the segment
      int                 reserved_size;  ///< -1 if appending to file
      int                 max_entries;    ///< entry limit; values <= 0 disable the limit check
      mkv_seekhead_entry *entries;
      int                 num_entries;
  } mkv_seekhead;
  /** One cue: a timestamp on a track and the cluster that contains it. */
  typedef struct mkv_cuepoint {
      uint64_t pts;
      int      tracknum;    ///< stream index + 1
      int64_t  cluster_pos; ///< file offset of the cluster containing the block
  } mkv_cuepoint;

  /** Growable list of cue points collected while muxing. */
  typedef struct mkv_cues {
      int64_t       segment_offset; ///< subtracted from every cluster position that is added
      mkv_cuepoint *entries;
      int           num_entries;
  } mkv_cues;
  /** Per-stream muxer state. */
  typedef struct mkv_track {
      int     write_dts; ///< set for video tracks written in V_MS/VFW/FOURCC mode
      int64_t ts_offset; ///< audio initial padding rescaled to the stream time base
  } mkv_track;
  76. #define MODE_MATROSKAv2 0x01
  77. #define MODE_WEBM 0x02
  78. typedef struct MatroskaMuxContext {
  79. const AVClass *class;
  80. int mode;
  81. AVIOContext *dyn_bc;
  82. ebml_master segment;
  83. int64_t segment_offset;
  84. ebml_master cluster;
  85. int64_t cluster_pos; ///< file offset of the current cluster
  86. int64_t cluster_pts;
  87. int64_t duration_offset;
  88. int64_t duration;
  89. mkv_seekhead *main_seekhead;
  90. mkv_cues *cues;
  91. mkv_track *tracks;
  92. AVPacket cur_audio_pkt;
  93. int have_attachments;
  94. int reserve_cues_space;
  95. int cluster_size_limit;
  96. int64_t cues_pos;
  97. int64_t cluster_time_limit;
  98. int wrote_chapters;
  99. } MatroskaMuxContext;
  /** 2 bytes * 3 for EBML IDs, 3 1-byte EBML lengths, 8 bytes for 64 bit
   * offset, 4 bytes for target EBML ID */
  #define MAX_SEEKENTRY_SIZE 21

  /** per-cuepoint-track - 3 1-byte EBML IDs, 3 1-byte EBML sizes, 2
   * 8-byte uint max */
  #define MAX_CUETRACKPOS_SIZE 22

  /** per-cuepoint - 2 1-byte EBML IDs, 2 1-byte EBML sizes, 8-byte uint max.
   *
   * Both the argument and the whole expansion are parenthesized so that the
   * macro yields the intended value inside larger expressions and when it is
   * given a compound argument such as `a + b`. */
  #define MAX_CUEPOINT_SIZE(num_tracks) (12 + MAX_CUETRACKPOS_SIZE * (num_tracks))
  /**
   * Compute how many bytes put_ebml_id() emits for the given element ID.
   */
  static int ebml_id_size(unsigned int id)
  {
      const int top_bit = av_log2(id + 1);

      return (top_bit - 1) / 7 + 1;
  }
  112. static void put_ebml_id(AVIOContext *pb, unsigned int id)
  113. {
  114. int i = ebml_id_size(id);
  115. while (i--)
  116. avio_w8(pb, id >> (i * 8));
  117. }
  118. /**
  119. * Write an EBML size meaning "unknown size".
  120. *
  121. * @param bytes The number of bytes the size should occupy (maximum: 8).
  122. */
  123. static void put_ebml_size_unknown(AVIOContext *pb, int bytes)
  124. {
  125. assert(bytes <= 8);
  126. avio_w8(pb, 0x1ff >> bytes);
  127. while (--bytes)
  128. avio_w8(pb, 0xff);
  129. }
  /**
   * Calculate how many bytes are needed to represent a given number in EBML.
   *
   * Each EBML byte contributes 7 payload bits, and the all-ones payload is
   * not usable for a value, hence the test against num + 1.
   *
   * @param num The number to be stored.
   * @return The minimum number of bytes (at least 1). The result never
   *         exceeds 10, because the loop stops before the shift count
   *         reaches the width of uint64_t.
   */
  static int ebml_num_size(uint64_t num)
  {
      int bytes = 1;

      // Shifting a 64-bit value by 64 or more bits is undefined behaviour,
      // so stop as soon as the next shift count would get there.
      while (bytes * 7 < 64 && (num + 1) >> (bytes * 7))
          bytes++;
      return bytes;
  }
  140. /**
  141. * Write a number in EBML variable length format.
  142. *
  143. * @param bytes The number of bytes that need to be used to write the number.
  144. * If zero, any number of bytes can be used.
  145. */
  146. static void put_ebml_num(AVIOContext *pb, uint64_t num, int bytes)
  147. {
  148. int i, needed_bytes = ebml_num_size(num);
  149. // sizes larger than this are currently undefined in EBML
  150. assert(num < (1ULL << 56) - 1);
  151. if (bytes == 0)
  152. // don't care how many bytes are used, so use the min
  153. bytes = needed_bytes;
  154. // the bytes needed to write the given size would exceed the bytes
  155. // that we need to use, so write unknown size. This shouldn't happen.
  156. assert(bytes >= needed_bytes);
  157. num |= 1ULL << bytes * 7;
  158. for (i = bytes - 1; i >= 0; i--)
  159. avio_w8(pb, num >> i * 8);
  160. }
  161. static void put_ebml_uint(AVIOContext *pb, unsigned int elementid, uint64_t val)
  162. {
  163. int i, bytes = 1;
  164. uint64_t tmp = val;
  165. while (tmp >>= 8)
  166. bytes++;
  167. put_ebml_id(pb, elementid);
  168. put_ebml_num(pb, bytes, 0);
  169. for (i = bytes - 1; i >= 0; i--)
  170. avio_w8(pb, val >> i * 8);
  171. }
  172. static void put_ebml_float(AVIOContext *pb, unsigned int elementid, double val)
  173. {
  174. put_ebml_id(pb, elementid);
  175. put_ebml_num(pb, 8, 0);
  176. avio_wb64(pb, av_double2int(val));
  177. }
  178. static void put_ebml_binary(AVIOContext *pb, unsigned int elementid,
  179. const void *buf, int size)
  180. {
  181. put_ebml_id(pb, elementid);
  182. put_ebml_num(pb, size, 0);
  183. avio_write(pb, buf, size);
  184. }
  185. static void put_ebml_string(AVIOContext *pb, unsigned int elementid,
  186. const char *str)
  187. {
  188. put_ebml_binary(pb, elementid, str, strlen(str));
  189. }
  190. /**
  191. * Write a void element of a given size. Useful for reserving space in
  192. * the file to be written to later.
  193. *
  194. * @param size The number of bytes to reserve, which must be at least 2.
  195. */
  196. static void put_ebml_void(AVIOContext *pb, uint64_t size)
  197. {
  198. int64_t currentpos = avio_tell(pb);
  199. assert(size >= 2);
  200. put_ebml_id(pb, EBML_ID_VOID);
  201. // we need to subtract the length needed to store the size from the
  202. // size we need to reserve so 2 cases, we use 8 bytes to store the
  203. // size if possible, 1 byte otherwise
  204. if (size < 10)
  205. put_ebml_num(pb, size - 1, 0);
  206. else
  207. put_ebml_num(pb, size - 9, 8);
  208. while (avio_tell(pb) < currentpos + size)
  209. avio_w8(pb, 0);
  210. }
  211. static ebml_master start_ebml_master(AVIOContext *pb, unsigned int elementid,
  212. uint64_t expectedsize)
  213. {
  214. int bytes = expectedsize ? ebml_num_size(expectedsize) : 8;
  215. put_ebml_id(pb, elementid);
  216. put_ebml_size_unknown(pb, bytes);
  217. return (ebml_master) {avio_tell(pb), bytes };
  218. }
  219. static void end_ebml_master(AVIOContext *pb, ebml_master master)
  220. {
  221. int64_t pos = avio_tell(pb);
  222. if (avio_seek(pb, master.pos - master.sizebytes, SEEK_SET) < 0)
  223. return;
  224. put_ebml_num(pb, pos - master.pos, master.sizebytes);
  225. avio_seek(pb, pos, SEEK_SET);
  226. }
  227. static void put_xiph_size(AVIOContext *pb, int size)
  228. {
  229. int i;
  230. for (i = 0; i < size / 255; i++)
  231. avio_w8(pb, 255);
  232. avio_w8(pb, size % 255);
  233. }
  234. /**
  235. * Initialize a mkv_seekhead element to be ready to index level 1 Matroska
  236. * elements. If a maximum number of elements is specified, enough space
  237. * will be reserved at the current file location to write a seek head of
  238. * that size.
  239. *
  240. * @param segment_offset The absolute offset to the position in the file
  241. * where the segment begins.
  242. * @param numelements The maximum number of elements that will be indexed
  243. * by this seek head, 0 if unlimited.
  244. */
  245. static mkv_seekhead *mkv_start_seekhead(AVIOContext *pb, int64_t segment_offset,
  246. int numelements)
  247. {
  248. mkv_seekhead *new_seekhead = av_mallocz(sizeof(mkv_seekhead));
  249. if (!new_seekhead)
  250. return NULL;
  251. new_seekhead->segment_offset = segment_offset;
  252. if (numelements > 0) {
  253. new_seekhead->filepos = avio_tell(pb);
  254. // 21 bytes max for a seek entry, 10 bytes max for the SeekHead ID
  255. // and size, and 3 bytes to guarantee that an EBML void element
  256. // will fit afterwards
  257. new_seekhead->reserved_size = numelements * MAX_SEEKENTRY_SIZE + 13;
  258. new_seekhead->max_entries = numelements;
  259. put_ebml_void(pb, new_seekhead->reserved_size);
  260. }
  261. return new_seekhead;
  262. }
  263. static int mkv_add_seekhead_entry(mkv_seekhead *seekhead, unsigned int elementid, uint64_t filepos)
  264. {
  265. int err;
  266. // don't store more elements than we reserved space for
  267. if (seekhead->max_entries > 0 && seekhead->max_entries <= seekhead->num_entries)
  268. return -1;
  269. if ((err = av_reallocp_array(&seekhead->entries, seekhead->num_entries + 1,
  270. sizeof(*seekhead->entries))) < 0) {
  271. seekhead->num_entries = 0;
  272. return err;
  273. }
  274. seekhead->entries[seekhead->num_entries].elementid = elementid;
  275. seekhead->entries[seekhead->num_entries++].segmentpos = filepos - seekhead->segment_offset;
  276. return 0;
  277. }
  278. /**
  279. * Write the seek head to the file and free it. If a maximum number of
  280. * elements was specified to mkv_start_seekhead(), the seek head will
  281. * be written at the location reserved for it. Otherwise, it is written
  282. * at the current location in the file.
  283. *
  284. * @return The file offset where the seekhead was written,
  285. * -1 if an error occurred.
  286. */
  287. static int64_t mkv_write_seekhead(AVIOContext *pb, mkv_seekhead *seekhead)
  288. {
  289. ebml_master metaseek, seekentry;
  290. int64_t currentpos;
  291. int i;
  292. currentpos = avio_tell(pb);
  293. if (seekhead->reserved_size > 0) {
  294. if (avio_seek(pb, seekhead->filepos, SEEK_SET) < 0) {
  295. currentpos = -1;
  296. goto fail;
  297. }
  298. }
  299. metaseek = start_ebml_master(pb, MATROSKA_ID_SEEKHEAD, seekhead->reserved_size);
  300. for (i = 0; i < seekhead->num_entries; i++) {
  301. mkv_seekhead_entry *entry = &seekhead->entries[i];
  302. seekentry = start_ebml_master(pb, MATROSKA_ID_SEEKENTRY, MAX_SEEKENTRY_SIZE);
  303. put_ebml_id(pb, MATROSKA_ID_SEEKID);
  304. put_ebml_num(pb, ebml_id_size(entry->elementid), 0);
  305. put_ebml_id(pb, entry->elementid);
  306. put_ebml_uint(pb, MATROSKA_ID_SEEKPOSITION, entry->segmentpos);
  307. end_ebml_master(pb, seekentry);
  308. }
  309. end_ebml_master(pb, metaseek);
  310. if (seekhead->reserved_size > 0) {
  311. uint64_t remaining = seekhead->filepos + seekhead->reserved_size - avio_tell(pb);
  312. put_ebml_void(pb, remaining);
  313. avio_seek(pb, currentpos, SEEK_SET);
  314. currentpos = seekhead->filepos;
  315. }
  316. fail:
  317. av_free(seekhead->entries);
  318. av_free(seekhead);
  319. return currentpos;
  320. }
  321. static mkv_cues *mkv_start_cues(int64_t segment_offset)
  322. {
  323. mkv_cues *cues = av_mallocz(sizeof(mkv_cues));
  324. if (!cues)
  325. return NULL;
  326. cues->segment_offset = segment_offset;
  327. return cues;
  328. }
  329. static int mkv_add_cuepoint(mkv_cues *cues, int stream, int64_t ts, int64_t cluster_pos)
  330. {
  331. int err;
  332. if (ts < 0)
  333. return 0;
  334. if ((err = av_reallocp_array(&cues->entries, cues->num_entries + 1,
  335. sizeof(*cues->entries))) < 0) {
  336. cues->num_entries = 0;
  337. return err;
  338. }
  339. cues->entries[cues->num_entries].pts = ts;
  340. cues->entries[cues->num_entries].tracknum = stream + 1;
  341. cues->entries[cues->num_entries++].cluster_pos = cluster_pos - cues->segment_offset;
  342. return 0;
  343. }
  344. static int64_t mkv_write_cues(AVIOContext *pb, mkv_cues *cues, int num_tracks)
  345. {
  346. ebml_master cues_element;
  347. int64_t currentpos;
  348. int i, j;
  349. currentpos = avio_tell(pb);
  350. cues_element = start_ebml_master(pb, MATROSKA_ID_CUES, 0);
  351. for (i = 0; i < cues->num_entries; i++) {
  352. ebml_master cuepoint, track_positions;
  353. mkv_cuepoint *entry = &cues->entries[i];
  354. uint64_t pts = entry->pts;
  355. cuepoint = start_ebml_master(pb, MATROSKA_ID_POINTENTRY, MAX_CUEPOINT_SIZE(num_tracks));
  356. put_ebml_uint(pb, MATROSKA_ID_CUETIME, pts);
  357. // put all the entries from different tracks that have the exact same
  358. // timestamp into the same CuePoint
  359. for (j = 0; j < cues->num_entries - i && entry[j].pts == pts; j++) {
  360. track_positions = start_ebml_master(pb, MATROSKA_ID_CUETRACKPOSITION, MAX_CUETRACKPOS_SIZE);
  361. put_ebml_uint(pb, MATROSKA_ID_CUETRACK , entry[j].tracknum );
  362. put_ebml_uint(pb, MATROSKA_ID_CUECLUSTERPOSITION, entry[j].cluster_pos);
  363. end_ebml_master(pb, track_positions);
  364. }
  365. i += j - 1;
  366. end_ebml_master(pb, cuepoint);
  367. }
  368. end_ebml_master(pb, cues_element);
  369. return currentpos;
  370. }
  371. static int put_xiph_codecpriv(AVFormatContext *s, AVIOContext *pb, AVCodecParameters *par)
  372. {
  373. uint8_t *header_start[3];
  374. int header_len[3];
  375. int first_header_size;
  376. int j;
  377. if (par->codec_id == AV_CODEC_ID_VORBIS)
  378. first_header_size = 30;
  379. else
  380. first_header_size = 42;
  381. if (avpriv_split_xiph_headers(par->extradata, par->extradata_size,
  382. first_header_size, header_start, header_len) < 0) {
  383. av_log(s, AV_LOG_ERROR, "Extradata corrupt.\n");
  384. return -1;
  385. }
  386. avio_w8(pb, 2); // number packets - 1
  387. for (j = 0; j < 2; j++) {
  388. put_xiph_size(pb, header_len[j]);
  389. }
  390. for (j = 0; j < 3; j++)
  391. avio_write(pb, header_start[j], header_len[j]);
  392. return 0;
  393. }
  394. static int put_wv_codecpriv(AVIOContext *pb, AVCodecParameters *par)
  395. {
  396. if (par->extradata && par->extradata_size == 2)
  397. avio_write(pb, par->extradata, 2);
  398. else
  399. avio_wl16(pb, 0x403); // fallback to the version mentioned in matroska specs
  400. return 0;
  401. }
  402. static int put_flac_codecpriv(AVFormatContext *s,
  403. AVIOContext *pb, AVCodecParameters *par)
  404. {
  405. int write_comment = (par->channel_layout &&
  406. !(par->channel_layout & ~0x3ffffULL) &&
  407. !ff_flac_is_native_layout(par->channel_layout));
  408. int ret = ff_flac_write_header(pb, par->extradata, par->extradata_size,
  409. !write_comment);
  410. if (ret < 0)
  411. return ret;
  412. if (write_comment) {
  413. const char *vendor = (s->flags & AVFMT_FLAG_BITEXACT) ?
  414. "Libav" : LIBAVFORMAT_IDENT;
  415. AVDictionary *dict = NULL;
  416. uint8_t buf[32], *data, *p;
  417. int len;
  418. snprintf(buf, sizeof(buf), "0x%"PRIx64, par->channel_layout);
  419. av_dict_set(&dict, "WAVEFORMATEXTENSIBLE_CHANNEL_MASK", buf, 0);
  420. len = ff_vorbiscomment_length(dict, vendor);
  421. data = av_malloc(len + 4);
  422. if (!data) {
  423. av_dict_free(&dict);
  424. return AVERROR(ENOMEM);
  425. }
  426. data[0] = 0x84;
  427. AV_WB24(data + 1, len);
  428. p = data + 4;
  429. ff_vorbiscomment_write(&p, &dict, vendor);
  430. avio_write(pb, data, len + 4);
  431. av_freep(&data);
  432. av_dict_free(&dict);
  433. }
  434. return 0;
  435. }
  436. static int get_aac_sample_rates(AVFormatContext *s, AVCodecParameters *par,
  437. int *sample_rate, int *output_sample_rate)
  438. {
  439. MPEG4AudioConfig mp4ac;
  440. if (avpriv_mpeg4audio_get_config(&mp4ac, par->extradata,
  441. par->extradata_size * 8, 1) < 0) {
  442. av_log(s, AV_LOG_ERROR,
  443. "Error parsing AAC extradata, unable to determine samplerate.\n");
  444. return AVERROR(EINVAL);
  445. }
  446. *sample_rate = mp4ac.sample_rate;
  447. *output_sample_rate = mp4ac.ext_sample_rate;
  448. return 0;
  449. }
  450. static int mkv_write_native_codecprivate(AVFormatContext *s,
  451. AVCodecParameters *par,
  452. AVIOContext *dyn_cp)
  453. {
  454. switch (par->codec_id) {
  455. case AV_CODEC_ID_VORBIS:
  456. case AV_CODEC_ID_THEORA:
  457. return put_xiph_codecpriv(s, dyn_cp, par);
  458. case AV_CODEC_ID_FLAC:
  459. return put_flac_codecpriv(s, dyn_cp, par);
  460. case AV_CODEC_ID_WAVPACK:
  461. return put_wv_codecpriv(dyn_cp, par);
  462. case AV_CODEC_ID_H264:
  463. return ff_isom_write_avcc(dyn_cp, par->extradata,
  464. par->extradata_size);
  465. case AV_CODEC_ID_HEVC:
  466. return ff_isom_write_hvcc(dyn_cp, par->extradata,
  467. par->extradata_size, 0);
  468. case AV_CODEC_ID_ALAC:
  469. if (par->extradata_size < 36) {
  470. av_log(s, AV_LOG_ERROR,
  471. "Invalid extradata found, ALAC expects a 36-byte "
  472. "QuickTime atom.");
  473. return AVERROR_INVALIDDATA;
  474. } else
  475. avio_write(dyn_cp, par->extradata + 12,
  476. par->extradata_size - 12);
  477. break;
  478. default:
  479. if (par->extradata_size)
  480. avio_write(dyn_cp, par->extradata, par->extradata_size);
  481. }
  482. return 0;
  483. }
  484. static int mkv_write_codecprivate(AVFormatContext *s, AVIOContext *pb,
  485. AVCodecParameters *par,
  486. int native_id, int qt_id)
  487. {
  488. AVIOContext *dyn_cp;
  489. uint8_t *codecpriv;
  490. int ret, codecpriv_size;
  491. ret = avio_open_dyn_buf(&dyn_cp);
  492. if (ret < 0)
  493. return ret;
  494. if (native_id) {
  495. ret = mkv_write_native_codecprivate(s, par, dyn_cp);
  496. } else if (par->codec_type == AVMEDIA_TYPE_VIDEO) {
  497. if (qt_id) {
  498. if (!par->codec_tag)
  499. par->codec_tag = ff_codec_get_tag(ff_codec_movvideo_tags,
  500. par->codec_id);
  501. if (par->extradata_size)
  502. avio_write(dyn_cp, par->extradata, par->extradata_size);
  503. } else {
  504. if (!par->codec_tag)
  505. par->codec_tag = ff_codec_get_tag(ff_codec_bmp_tags,
  506. par->codec_id);
  507. if (!par->codec_tag) {
  508. av_log(s, AV_LOG_ERROR, "No bmp codec ID found.\n");
  509. ret = -1;
  510. }
  511. ff_put_bmp_header(dyn_cp, par, ff_codec_bmp_tags, 0);
  512. }
  513. } else if (par->codec_type == AVMEDIA_TYPE_AUDIO) {
  514. unsigned int tag;
  515. tag = ff_codec_get_tag(ff_codec_wav_tags, par->codec_id);
  516. if (!tag) {
  517. av_log(s, AV_LOG_ERROR, "No wav codec ID found.\n");
  518. ret = -1;
  519. }
  520. if (!par->codec_tag)
  521. par->codec_tag = tag;
  522. ff_put_wav_header(s, dyn_cp, par);
  523. }
  524. codecpriv_size = avio_close_dyn_buf(dyn_cp, &codecpriv);
  525. if (codecpriv_size)
  526. put_ebml_binary(pb, MATROSKA_ID_CODECPRIVATE, codecpriv,
  527. codecpriv_size);
  528. av_free(codecpriv);
  529. return ret;
  530. }
  531. static void mkv_write_field_order(AVIOContext *pb,
  532. enum AVFieldOrder field_order)
  533. {
  534. switch (field_order) {
  535. case AV_FIELD_UNKNOWN:
  536. put_ebml_uint(pb, MATROSKA_ID_VIDEOFLAGINTERLACED,
  537. MATROSKA_VIDEO_INTERLACE_FLAG_UNDETERMINED);
  538. break;
  539. case AV_FIELD_PROGRESSIVE:
  540. put_ebml_uint(pb, MATROSKA_ID_VIDEOFLAGINTERLACED,
  541. MATROSKA_VIDEO_INTERLACE_FLAG_PROGRESSIVE);
  542. break;
  543. case AV_FIELD_TT:
  544. case AV_FIELD_BB:
  545. case AV_FIELD_TB:
  546. case AV_FIELD_BT:
  547. put_ebml_uint(pb, MATROSKA_ID_VIDEOFLAGINTERLACED,
  548. MATROSKA_VIDEO_INTERLACE_FLAG_INTERLACED);
  549. switch (field_order) {
  550. case AV_FIELD_TT:
  551. put_ebml_uint(pb, MATROSKA_ID_VIDEOFIELDORDER,
  552. MATROSKA_VIDEO_FIELDORDER_TT);
  553. break;
  554. case AV_FIELD_BB:
  555. put_ebml_uint(pb, MATROSKA_ID_VIDEOFIELDORDER,
  556. MATROSKA_VIDEO_FIELDORDER_BB);
  557. break;
  558. case AV_FIELD_TB:
  559. put_ebml_uint(pb, MATROSKA_ID_VIDEOFIELDORDER,
  560. MATROSKA_VIDEO_FIELDORDER_TB);
  561. break;
  562. case AV_FIELD_BT:
  563. put_ebml_uint(pb, MATROSKA_ID_VIDEOFIELDORDER,
  564. MATROSKA_VIDEO_FIELDORDER_BT);
  565. break;
  566. }
  567. }
  568. }
  569. static int mkv_write_stereo_mode(AVFormatContext *s, AVIOContext *pb,
  570. AVStream *st, int mode)
  571. {
  572. int i;
  573. int display_width, display_height;
  574. int h_width = 1, h_height = 1;
  575. AVCodecParameters *par = st->codecpar;
  576. AVDictionaryEntry *tag;
  577. MatroskaVideoStereoModeType format = MATROSKA_VIDEO_STEREOMODE_TYPE_NB;
  578. // convert metadata into proper side data and add it to the stream
  579. if ((tag = av_dict_get(s->metadata, "stereo_mode", NULL, 0))) {
  580. int stereo_mode = atoi(tag->value);
  581. if (stereo_mode < MATROSKA_VIDEO_STEREOMODE_TYPE_NB &&
  582. stereo_mode != 10 && stereo_mode != 12) {
  583. int ret = ff_mkv_stereo3d_conv(st, stereo_mode);
  584. if (ret < 0)
  585. return ret;
  586. }
  587. }
  588. // iterate to find the stereo3d side data
  589. for (i = 0; i < st->nb_side_data; i++) {
  590. AVPacketSideData sd = st->side_data[i];
  591. if (sd.type == AV_PKT_DATA_STEREO3D) {
  592. AVStereo3D *stereo = (AVStereo3D *)sd.data;
  593. switch (stereo->type) {
  594. case AV_STEREO3D_2D:
  595. format = MATROSKA_VIDEO_STEREOMODE_TYPE_MONO;
  596. break;
  597. case AV_STEREO3D_SIDEBYSIDE:
  598. format = (stereo->flags & AV_STEREO3D_FLAG_INVERT)
  599. ? MATROSKA_VIDEO_STEREOMODE_TYPE_RIGHT_LEFT
  600. : MATROSKA_VIDEO_STEREOMODE_TYPE_LEFT_RIGHT;
  601. h_width = 2;
  602. break;
  603. case AV_STEREO3D_TOPBOTTOM:
  604. format = MATROSKA_VIDEO_STEREOMODE_TYPE_TOP_BOTTOM;
  605. if (stereo->flags & AV_STEREO3D_FLAG_INVERT)
  606. format--;
  607. h_height = 2;
  608. break;
  609. case AV_STEREO3D_CHECKERBOARD:
  610. format = MATROSKA_VIDEO_STEREOMODE_TYPE_CHECKERBOARD_LR;
  611. if (stereo->flags & AV_STEREO3D_FLAG_INVERT)
  612. format--;
  613. break;
  614. case AV_STEREO3D_LINES:
  615. format = MATROSKA_VIDEO_STEREOMODE_TYPE_ROW_INTERLEAVED_LR;
  616. if (stereo->flags & AV_STEREO3D_FLAG_INVERT)
  617. format--;
  618. h_height = 2;
  619. break;
  620. case AV_STEREO3D_COLUMNS:
  621. format = MATROSKA_VIDEO_STEREOMODE_TYPE_COL_INTERLEAVED_LR;
  622. if (stereo->flags & AV_STEREO3D_FLAG_INVERT)
  623. format--;
  624. h_width = 2;
  625. break;
  626. case AV_STEREO3D_FRAMESEQUENCE:
  627. format = MATROSKA_VIDEO_STEREOMODE_TYPE_BOTH_EYES_BLOCK_LR;
  628. if (stereo->flags & AV_STEREO3D_FLAG_INVERT)
  629. format++;
  630. break;
  631. }
  632. break;
  633. }
  634. }
  635. // if webm, do not write unsupported modes
  636. if (mode == MODE_WEBM &&
  637. (format > MATROSKA_VIDEO_STEREOMODE_TYPE_TOP_BOTTOM &&
  638. format != MATROSKA_VIDEO_STEREOMODE_TYPE_RIGHT_LEFT))
  639. format = MATROSKA_VIDEO_STEREOMODE_TYPE_NB;
  640. // write StereoMode if format is valid
  641. if (format < MATROSKA_VIDEO_STEREOMODE_TYPE_NB)
  642. put_ebml_uint(pb, MATROSKA_ID_VIDEOSTEREOMODE, format);
  643. // write DisplayWidth and DisplayHeight, they contain the size of
  644. // a single source view and/or the display aspect ratio
  645. display_width = par->width / h_width;
  646. display_height = par->height / h_height;
  647. if (st->sample_aspect_ratio.num) {
  648. display_width *= av_q2d(st->sample_aspect_ratio);
  649. put_ebml_uint(pb, MATROSKA_ID_VIDEODISPLAYUNIT, 3); // DAR
  650. }
  651. if (st->sample_aspect_ratio.num ||
  652. format < MATROSKA_VIDEO_STEREOMODE_TYPE_NB) {
  653. put_ebml_uint(pb, MATROSKA_ID_VIDEODISPLAYWIDTH, display_width);
  654. put_ebml_uint(pb, MATROSKA_ID_VIDEODISPLAYHEIGHT, display_height);
  655. }
  656. return 0;
  657. }
  658. static int mkv_write_track(AVFormatContext *s, MatroskaMuxContext *mkv,
  659. int i, AVIOContext *pb)
  660. {
  661. AVStream *st = s->streams[i];
  662. AVCodecParameters *par = st->codecpar;
  663. ebml_master subinfo, track;
  664. int native_id = 0;
  665. int qt_id = 0;
  666. int bit_depth = av_get_bits_per_sample(par->codec_id);
  667. int sample_rate = par->sample_rate;
  668. int output_sample_rate = 0;
  669. int j, ret;
  670. AVDictionaryEntry *tag;
  671. // ms precision is the de-facto standard timescale for mkv files
  672. avpriv_set_pts_info(st, 64, 1, 1000);
  673. if (par->codec_type == AVMEDIA_TYPE_ATTACHMENT) {
  674. mkv->have_attachments = 1;
  675. return 0;
  676. }
  677. if (!bit_depth)
  678. bit_depth = av_get_bytes_per_sample(par->format) << 3;
  679. if (par->codec_id == AV_CODEC_ID_AAC) {
  680. ret = get_aac_sample_rates(s, par, &sample_rate, &output_sample_rate);
  681. if (ret < 0)
  682. return ret;
  683. }
  684. track = start_ebml_master(pb, MATROSKA_ID_TRACKENTRY, 0);
  685. put_ebml_uint (pb, MATROSKA_ID_TRACKNUMBER , i + 1);
  686. put_ebml_uint (pb, MATROSKA_ID_TRACKUID , i + 1);
  687. put_ebml_uint (pb, MATROSKA_ID_TRACKFLAGLACING , 0); // no lacing (yet)
  688. if ((tag = av_dict_get(st->metadata, "title", NULL, 0)))
  689. put_ebml_string(pb, MATROSKA_ID_TRACKNAME, tag->value);
  690. tag = av_dict_get(st->metadata, "language", NULL, 0);
  691. put_ebml_string(pb, MATROSKA_ID_TRACKLANGUAGE, tag ? tag->value:"und");
  692. // The default value for TRACKFLAGDEFAULT is 1, so add element
  693. // if we need to clear it.
  694. if (!(st->disposition & AV_DISPOSITION_DEFAULT))
  695. put_ebml_uint(pb, MATROSKA_ID_TRACKFLAGDEFAULT, !!(st->disposition & AV_DISPOSITION_DEFAULT));
  696. if (st->disposition & AV_DISPOSITION_FORCED)
  697. put_ebml_uint(pb, MATROSKA_ID_TRACKFLAGFORCED, !!(st->disposition & AV_DISPOSITION_FORCED));
  698. if (par->codec_type == AVMEDIA_TYPE_AUDIO && par->initial_padding) {
  699. mkv->tracks[i].ts_offset = av_rescale_q(par->initial_padding,
  700. (AVRational){ 1, par->sample_rate },
  701. st->time_base);
  702. put_ebml_uint(pb, MATROSKA_ID_CODECDELAY,
  703. av_rescale_q(par->initial_padding,
  704. (AVRational){ 1, par->sample_rate },
  705. (AVRational){ 1, 1000000000 }));
  706. }
  707. // look for a codec ID string specific to mkv to use,
  708. // if none are found, use AVI codes
  709. for (j = 0; ff_mkv_codec_tags[j].id != AV_CODEC_ID_NONE; j++) {
  710. if (ff_mkv_codec_tags[j].id == par->codec_id) {
  711. put_ebml_string(pb, MATROSKA_ID_CODECID, ff_mkv_codec_tags[j].str);
  712. native_id = 1;
  713. break;
  714. }
  715. }
  716. if (mkv->mode == MODE_WEBM && !(par->codec_id == AV_CODEC_ID_VP8 ||
  717. par->codec_id == AV_CODEC_ID_VP9 ||
  718. par->codec_id == AV_CODEC_ID_OPUS ||
  719. par->codec_id == AV_CODEC_ID_VORBIS)) {
  720. av_log(s, AV_LOG_ERROR,
  721. "Only VP8 or VP9 video and Vorbis or Opus audio are supported for WebM.\n");
  722. return AVERROR(EINVAL);
  723. }
  724. switch (par->codec_type) {
  725. case AVMEDIA_TYPE_VIDEO:
  726. put_ebml_uint(pb, MATROSKA_ID_TRACKTYPE, MATROSKA_TRACK_TYPE_VIDEO);
  727. if (st->avg_frame_rate.num > 0 && st->avg_frame_rate.den > 0)
  728. put_ebml_uint(pb, MATROSKA_ID_TRACKDEFAULTDURATION, 1E9 / av_q2d(st->avg_frame_rate));
  729. if (!native_id &&
  730. ff_codec_get_tag(ff_codec_movvideo_tags, par->codec_id) &&
  731. (!ff_codec_get_tag(ff_codec_bmp_tags, par->codec_id) ||
  732. par->codec_id == AV_CODEC_ID_SVQ1 ||
  733. par->codec_id == AV_CODEC_ID_SVQ3 ||
  734. par->codec_id == AV_CODEC_ID_CINEPAK))
  735. qt_id = 1;
  736. if (qt_id)
  737. put_ebml_string(pb, MATROSKA_ID_CODECID, "V_QUICKTIME");
  738. else if (!native_id) {
  739. // if there is no mkv-specific codec ID, use VFW mode
  740. put_ebml_string(pb, MATROSKA_ID_CODECID, "V_MS/VFW/FOURCC");
  741. mkv->tracks[i].write_dts = 1;
  742. }
  743. subinfo = start_ebml_master(pb, MATROSKA_ID_TRACKVIDEO, 0);
  744. put_ebml_uint (pb, MATROSKA_ID_VIDEOPIXELWIDTH , par->width);
  745. put_ebml_uint (pb, MATROSKA_ID_VIDEOPIXELHEIGHT, par->height);
  746. mkv_write_field_order(pb, par->field_order);
  747. // check both side data and metadata for stereo information,
  748. // write the result to the bitstream if any is found
  749. ret = mkv_write_stereo_mode(s, pb, st, mkv->mode);
  750. if (ret < 0)
  751. return ret;
  752. end_ebml_master(pb, subinfo);
  753. break;
  754. case AVMEDIA_TYPE_AUDIO:
  755. put_ebml_uint(pb, MATROSKA_ID_TRACKTYPE, MATROSKA_TRACK_TYPE_AUDIO);
  756. if (!native_id)
  757. // no mkv-specific ID, use ACM mode
  758. put_ebml_string(pb, MATROSKA_ID_CODECID, "A_MS/ACM");
  759. subinfo = start_ebml_master(pb, MATROSKA_ID_TRACKAUDIO, 0);
  760. put_ebml_uint (pb, MATROSKA_ID_AUDIOCHANNELS , par->channels);
  761. put_ebml_float (pb, MATROSKA_ID_AUDIOSAMPLINGFREQ, sample_rate);
  762. if (output_sample_rate)
  763. put_ebml_float(pb, MATROSKA_ID_AUDIOOUTSAMPLINGFREQ, output_sample_rate);
  764. if (bit_depth)
  765. put_ebml_uint(pb, MATROSKA_ID_AUDIOBITDEPTH, bit_depth);
  766. end_ebml_master(pb, subinfo);
  767. break;
  768. case AVMEDIA_TYPE_SUBTITLE:
  769. put_ebml_uint(pb, MATROSKA_ID_TRACKTYPE, MATROSKA_TRACK_TYPE_SUBTITLE);
  770. if (!native_id) {
  771. av_log(s, AV_LOG_ERROR, "Subtitle codec %d is not supported.\n", par->codec_id);
  772. return AVERROR(ENOSYS);
  773. }
  774. break;
  775. default:
  776. av_log(s, AV_LOG_ERROR, "Only audio, video, and subtitles are supported for Matroska.\n");
  777. break;
  778. }
  779. ret = mkv_write_codecprivate(s, pb, par, native_id, qt_id);
  780. if (ret < 0)
  781. return ret;
  782. end_ebml_master(pb, track);
  783. return 0;
  784. }
  785. static int mkv_write_tracks(AVFormatContext *s)
  786. {
  787. MatroskaMuxContext *mkv = s->priv_data;
  788. AVIOContext *pb = s->pb;
  789. ebml_master tracks;
  790. int i, ret;
  791. ret = mkv_add_seekhead_entry(mkv->main_seekhead, MATROSKA_ID_TRACKS, avio_tell(pb));
  792. if (ret < 0)
  793. return ret;
  794. tracks = start_ebml_master(pb, MATROSKA_ID_TRACKS, 0);
  795. for (i = 0; i < s->nb_streams; i++) {
  796. ret = mkv_write_track(s, mkv, i, pb);
  797. if (ret < 0)
  798. return ret;
  799. }
  800. end_ebml_master(pb, tracks);
  801. return 0;
  802. }
  803. static int mkv_write_chapters(AVFormatContext *s)
  804. {
  805. MatroskaMuxContext *mkv = s->priv_data;
  806. AVIOContext *pb = s->pb;
  807. ebml_master chapters, editionentry;
  808. AVRational scale = {1, 1E9};
  809. int i, ret;
  810. if (!s->nb_chapters || mkv->wrote_chapters)
  811. return 0;
  812. ret = mkv_add_seekhead_entry(mkv->main_seekhead, MATROSKA_ID_CHAPTERS, avio_tell(pb));
  813. if (ret < 0) return ret;
  814. chapters = start_ebml_master(pb, MATROSKA_ID_CHAPTERS , 0);
  815. editionentry = start_ebml_master(pb, MATROSKA_ID_EDITIONENTRY, 0);
  816. put_ebml_uint(pb, MATROSKA_ID_EDITIONFLAGDEFAULT, 1);
  817. put_ebml_uint(pb, MATROSKA_ID_EDITIONFLAGHIDDEN , 0);
  818. for (i = 0; i < s->nb_chapters; i++) {
  819. ebml_master chapteratom, chapterdisplay;
  820. AVChapter *c = s->chapters[i];
  821. int64_t chapterstart = av_rescale_q(c->start, c->time_base, scale);
  822. int64_t chapterend = av_rescale_q(c->end, c->time_base, scale);
  823. AVDictionaryEntry *t = NULL;
  824. if (chapterstart < 0 || chapterstart > chapterend || chapterend < 0) {
  825. av_log(s, AV_LOG_ERROR,
  826. "Invalid chapter start (%"PRId64") or end (%"PRId64").\n",
  827. chapterstart, chapterend);
  828. return AVERROR_INVALIDDATA;
  829. }
  830. chapteratom = start_ebml_master(pb, MATROSKA_ID_CHAPTERATOM, 0);
  831. put_ebml_uint(pb, MATROSKA_ID_CHAPTERUID, c->id);
  832. put_ebml_uint(pb, MATROSKA_ID_CHAPTERTIMESTART, chapterstart);
  833. put_ebml_uint(pb, MATROSKA_ID_CHAPTERTIMEEND, chapterend);
  834. put_ebml_uint(pb, MATROSKA_ID_CHAPTERFLAGHIDDEN , 0);
  835. put_ebml_uint(pb, MATROSKA_ID_CHAPTERFLAGENABLED, 1);
  836. if ((t = av_dict_get(c->metadata, "title", NULL, 0))) {
  837. chapterdisplay = start_ebml_master(pb, MATROSKA_ID_CHAPTERDISPLAY, 0);
  838. put_ebml_string(pb, MATROSKA_ID_CHAPSTRING, t->value);
  839. put_ebml_string(pb, MATROSKA_ID_CHAPLANG , "und");
  840. end_ebml_master(pb, chapterdisplay);
  841. }
  842. end_ebml_master(pb, chapteratom);
  843. }
  844. end_ebml_master(pb, editionentry);
  845. end_ebml_master(pb, chapters);
  846. mkv->wrote_chapters = 1;
  847. return 0;
  848. }
  849. static int mkv_write_simpletag(AVIOContext *pb, AVDictionaryEntry *t)
  850. {
  851. uint8_t *key = av_strdup(t->key);
  852. uint8_t *p = key;
  853. const uint8_t *lang = NULL;
  854. ebml_master tag;
  855. if (!key)
  856. return AVERROR(ENOMEM);
  857. if ((p = strrchr(p, '-')) &&
  858. (lang = av_convert_lang_to(p + 1, AV_LANG_ISO639_2_BIBL)))
  859. *p = 0;
  860. p = key;
  861. while (*p) {
  862. if (*p == ' ')
  863. *p = '_';
  864. else if (*p >= 'a' && *p <= 'z')
  865. *p -= 'a' - 'A';
  866. p++;
  867. }
  868. tag = start_ebml_master(pb, MATROSKA_ID_SIMPLETAG, 0);
  869. put_ebml_string(pb, MATROSKA_ID_TAGNAME, key);
  870. if (lang)
  871. put_ebml_string(pb, MATROSKA_ID_TAGLANG, lang);
  872. put_ebml_string(pb, MATROSKA_ID_TAGSTRING, t->value);
  873. end_ebml_master(pb, tag);
  874. av_freep(&key);
  875. return 0;
  876. }
  877. static int mkv_write_tag(AVFormatContext *s, AVDictionary *m, unsigned int elementid,
  878. unsigned int uid, ebml_master *tags)
  879. {
  880. MatroskaMuxContext *mkv = s->priv_data;
  881. ebml_master tag, targets;
  882. AVDictionaryEntry *t = NULL;
  883. int ret;
  884. if (!tags->pos) {
  885. ret = mkv_add_seekhead_entry(mkv->main_seekhead, MATROSKA_ID_TAGS, avio_tell(s->pb));
  886. if (ret < 0) return ret;
  887. *tags = start_ebml_master(s->pb, MATROSKA_ID_TAGS, 0);
  888. }
  889. tag = start_ebml_master(s->pb, MATROSKA_ID_TAG, 0);
  890. targets = start_ebml_master(s->pb, MATROSKA_ID_TAGTARGETS, 0);
  891. if (elementid)
  892. put_ebml_uint(s->pb, elementid, uid);
  893. end_ebml_master(s->pb, targets);
  894. while ((t = av_dict_get(m, "", t, AV_DICT_IGNORE_SUFFIX))) {
  895. if (av_strcasecmp(t->key, "title") &&
  896. av_strcasecmp(t->key, "encoding_tool") &&
  897. (elementid != MATROSKA_ID_TAGTARGETS_TRACKUID ||
  898. av_strcasecmp(t->key, "language"))) {
  899. ret = mkv_write_simpletag(s->pb, t);
  900. if (ret < 0)
  901. return ret;
  902. }
  903. }
  904. end_ebml_master(s->pb, tag);
  905. return 0;
  906. }
  907. static int mkv_write_tags(AVFormatContext *s)
  908. {
  909. ebml_master tags = {0};
  910. int i, ret;
  911. ff_metadata_conv_ctx(s, ff_mkv_metadata_conv, NULL);
  912. if (av_dict_get(s->metadata, "", NULL, AV_DICT_IGNORE_SUFFIX)) {
  913. ret = mkv_write_tag(s, s->metadata, 0, 0, &tags);
  914. if (ret < 0) return ret;
  915. }
  916. for (i = 0; i < s->nb_streams; i++) {
  917. AVStream *st = s->streams[i];
  918. if (!av_dict_get(st->metadata, "", 0, AV_DICT_IGNORE_SUFFIX))
  919. continue;
  920. ret = mkv_write_tag(s, st->metadata, MATROSKA_ID_TAGTARGETS_TRACKUID, i + 1, &tags);
  921. if (ret < 0) return ret;
  922. }
  923. for (i = 0; i < s->nb_chapters; i++) {
  924. AVChapter *ch = s->chapters[i];
  925. if (!av_dict_get(ch->metadata, "", NULL, AV_DICT_IGNORE_SUFFIX))
  926. continue;
  927. ret = mkv_write_tag(s, ch->metadata, MATROSKA_ID_TAGTARGETS_CHAPTERUID, ch->id, &tags);
  928. if (ret < 0) return ret;
  929. }
  930. if (tags.pos)
  931. end_ebml_master(s->pb, tags);
  932. return 0;
  933. }
  934. static int mkv_write_attachments(AVFormatContext *s)
  935. {
  936. MatroskaMuxContext *mkv = s->priv_data;
  937. AVIOContext *pb = s->pb;
  938. ebml_master attachments;
  939. AVLFG c;
  940. int i, ret;
  941. if (!mkv->have_attachments)
  942. return 0;
  943. av_lfg_init(&c, av_get_random_seed());
  944. ret = mkv_add_seekhead_entry(mkv->main_seekhead, MATROSKA_ID_ATTACHMENTS, avio_tell(pb));
  945. if (ret < 0) return ret;
  946. attachments = start_ebml_master(pb, MATROSKA_ID_ATTACHMENTS, 0);
  947. for (i = 0; i < s->nb_streams; i++) {
  948. AVStream *st = s->streams[i];
  949. ebml_master attached_file;
  950. AVDictionaryEntry *t;
  951. const char *mimetype = NULL;
  952. if (st->codecpar->codec_type != AVMEDIA_TYPE_ATTACHMENT)
  953. continue;
  954. attached_file = start_ebml_master(pb, MATROSKA_ID_ATTACHEDFILE, 0);
  955. if (t = av_dict_get(st->metadata, "title", NULL, 0))
  956. put_ebml_string(pb, MATROSKA_ID_FILEDESC, t->value);
  957. if (!(t = av_dict_get(st->metadata, "filename", NULL, 0))) {
  958. av_log(s, AV_LOG_ERROR, "Attachment stream %d has no filename tag.\n", i);
  959. return AVERROR(EINVAL);
  960. }
  961. put_ebml_string(pb, MATROSKA_ID_FILENAME, t->value);
  962. if (t = av_dict_get(st->metadata, "mimetype", NULL, 0))
  963. mimetype = t->value;
  964. else if (st->codecpar->codec_id != AV_CODEC_ID_NONE ) {
  965. int i;
  966. for (i = 0; ff_mkv_mime_tags[i].id != AV_CODEC_ID_NONE; i++)
  967. if (ff_mkv_mime_tags[i].id == st->codecpar->codec_id) {
  968. mimetype = ff_mkv_mime_tags[i].str;
  969. break;
  970. }
  971. for (i = 0; ff_mkv_image_mime_tags[i].id != AV_CODEC_ID_NONE; i++)
  972. if (ff_mkv_image_mime_tags[i].id == st->codecpar->codec_id) {
  973. mimetype = ff_mkv_image_mime_tags[i].str;
  974. break;
  975. }
  976. }
  977. if (!mimetype) {
  978. av_log(s, AV_LOG_ERROR, "Attachment stream %d has no mimetype tag and "
  979. "it cannot be deduced from the codec id.\n", i);
  980. return AVERROR(EINVAL);
  981. }
  982. put_ebml_string(pb, MATROSKA_ID_FILEMIMETYPE, mimetype);
  983. put_ebml_binary(pb, MATROSKA_ID_FILEDATA, st->codecpar->extradata, st->codecpar->extradata_size);
  984. put_ebml_uint(pb, MATROSKA_ID_FILEUID, av_lfg_get(&c));
  985. end_ebml_master(pb, attached_file);
  986. }
  987. end_ebml_master(pb, attachments);
  988. return 0;
  989. }
  990. static int mkv_write_header(AVFormatContext *s)
  991. {
  992. MatroskaMuxContext *mkv = s->priv_data;
  993. AVIOContext *pb = s->pb;
  994. ebml_master ebml_header, segment_info;
  995. AVDictionaryEntry *tag;
  996. int ret, i;
  997. if (!strcmp(s->oformat->name, "webm"))
  998. mkv->mode = MODE_WEBM;
  999. else
  1000. mkv->mode = MODE_MATROSKAv2;
  1001. mkv->tracks = av_mallocz(s->nb_streams * sizeof(*mkv->tracks));
  1002. if (!mkv->tracks)
  1003. return AVERROR(ENOMEM);
  1004. ebml_header = start_ebml_master(pb, EBML_ID_HEADER, 0);
  1005. put_ebml_uint (pb, EBML_ID_EBMLVERSION , 1);
  1006. put_ebml_uint (pb, EBML_ID_EBMLREADVERSION , 1);
  1007. put_ebml_uint (pb, EBML_ID_EBMLMAXIDLENGTH , 4);
  1008. put_ebml_uint (pb, EBML_ID_EBMLMAXSIZELENGTH , 8);
  1009. put_ebml_string (pb, EBML_ID_DOCTYPE , s->oformat->name);
  1010. put_ebml_uint (pb, EBML_ID_DOCTYPEVERSION , 4);
  1011. put_ebml_uint (pb, EBML_ID_DOCTYPEREADVERSION , 2);
  1012. end_ebml_master(pb, ebml_header);
  1013. mkv->segment = start_ebml_master(pb, MATROSKA_ID_SEGMENT, 0);
  1014. mkv->segment_offset = avio_tell(pb);
  1015. // we write 2 seek heads - one at the end of the file to point to each
  1016. // cluster, and one at the beginning to point to all other level one
  1017. // elements (including the seek head at the end of the file), which
  1018. // isn't more than 10 elements if we only write one of each other
  1019. // currently defined level 1 element
  1020. mkv->main_seekhead = mkv_start_seekhead(pb, mkv->segment_offset, 10);
  1021. if (!mkv->main_seekhead)
  1022. return AVERROR(ENOMEM);
  1023. ret = mkv_add_seekhead_entry(mkv->main_seekhead, MATROSKA_ID_INFO, avio_tell(pb));
  1024. if (ret < 0) return ret;
  1025. segment_info = start_ebml_master(pb, MATROSKA_ID_INFO, 0);
  1026. put_ebml_uint(pb, MATROSKA_ID_TIMECODESCALE, 1000000);
  1027. if ((tag = av_dict_get(s->metadata, "title", NULL, 0)))
  1028. put_ebml_string(pb, MATROSKA_ID_TITLE, tag->value);
  1029. if (!(s->flags & AVFMT_FLAG_BITEXACT)) {
  1030. uint32_t segment_uid[4];
  1031. AVLFG lfg;
  1032. av_lfg_init(&lfg, av_get_random_seed());
  1033. for (i = 0; i < 4; i++)
  1034. segment_uid[i] = av_lfg_get(&lfg);
  1035. put_ebml_string(pb, MATROSKA_ID_MUXINGAPP, LIBAVFORMAT_IDENT);
  1036. if ((tag = av_dict_get(s->metadata, "encoding_tool", NULL, 0)))
  1037. put_ebml_string(pb, MATROSKA_ID_WRITINGAPP, tag->value);
  1038. else
  1039. put_ebml_string(pb, MATROSKA_ID_WRITINGAPP, LIBAVFORMAT_IDENT);
  1040. put_ebml_binary(pb, MATROSKA_ID_SEGMENTUID, segment_uid, 16);
  1041. }
  1042. // reserve space for the duration
  1043. mkv->duration = 0;
  1044. mkv->duration_offset = avio_tell(pb);
  1045. put_ebml_void(pb, 11); // assumes double-precision float to be written
  1046. end_ebml_master(pb, segment_info);
  1047. ret = mkv_write_tracks(s);
  1048. if (ret < 0)
  1049. return ret;
  1050. if (mkv->mode != MODE_WEBM) {
  1051. ret = mkv_write_chapters(s);
  1052. if (ret < 0)
  1053. return ret;
  1054. ret = mkv_write_tags(s);
  1055. if (ret < 0)
  1056. return ret;
  1057. ret = mkv_write_attachments(s);
  1058. if (ret < 0)
  1059. return ret;
  1060. }
  1061. if (!s->pb->seekable)
  1062. mkv_write_seekhead(pb, mkv->main_seekhead);
  1063. mkv->cues = mkv_start_cues(mkv->segment_offset);
  1064. if (!mkv->cues)
  1065. return AVERROR(ENOMEM);
  1066. if (pb->seekable && mkv->reserve_cues_space) {
  1067. mkv->cues_pos = avio_tell(pb);
  1068. put_ebml_void(pb, mkv->reserve_cues_space);
  1069. }
  1070. av_init_packet(&mkv->cur_audio_pkt);
  1071. mkv->cur_audio_pkt.size = 0;
  1072. avio_flush(pb);
  1073. // start a new cluster every 5 MB or 5 sec, or 32k / 1 sec for streaming or
  1074. // after 4k and on a keyframe
  1075. if (pb->seekable) {
  1076. if (mkv->cluster_time_limit < 0)
  1077. mkv->cluster_time_limit = 5000;
  1078. if (mkv->cluster_size_limit < 0)
  1079. mkv->cluster_size_limit = 5 * 1024 * 1024;
  1080. } else {
  1081. if (mkv->cluster_time_limit < 0)
  1082. mkv->cluster_time_limit = 1000;
  1083. if (mkv->cluster_size_limit < 0)
  1084. mkv->cluster_size_limit = 32 * 1024;
  1085. }
  1086. return 0;
  1087. }
  1088. static int mkv_blockgroup_size(int pkt_size)
  1089. {
  1090. int size = pkt_size + 4;
  1091. size += ebml_num_size(size);
  1092. size += 2; // EBML ID for block and block duration
  1093. size += 8; // max size of block duration
  1094. size += ebml_num_size(size);
  1095. size += 1; // blockgroup EBML ID
  1096. return size;
  1097. }
  1098. static int ass_get_duration(AVFormatContext *s, const uint8_t *p)
  1099. {
  1100. int sh, sm, ss, sc, eh, em, es, ec;
  1101. uint64_t start, end;
  1102. if (sscanf(p, "%*[^,],%d:%d:%d%*c%d,%d:%d:%d%*c%d",
  1103. &sh, &sm, &ss, &sc, &eh, &em, &es, &ec) != 8)
  1104. return 0;
  1105. if (sh > 9 || sm > 59 || ss > 59 || sc > 99 ||
  1106. eh > 9 || em > 59 || es > 59 || ec > 99) {
  1107. av_log(s, AV_LOG_WARNING,
  1108. "Non-standard time reference %d:%d:%d.%d,%d:%d:%d.%d\n",
  1109. sh, sm, ss, sc, eh, em, es, ec);
  1110. return 0;
  1111. }
  1112. start = 3600000 * sh + 60000 * sm + 1000 * ss + 10 * sc;
  1113. end = 3600000 * eh + 60000 * em + 1000 * es + 10 * ec;
  1114. if (start > end) {
  1115. av_log(s, AV_LOG_WARNING,
  1116. "Unexpected time reference %d:%d:%d.%d,%d:%d:%d.%d\n",
  1117. sh, sm, ss, sc, eh, em, es, ec);
  1118. return 0;
  1119. }
  1120. return end - start;
  1121. }
  1122. static int mkv_write_ass_blocks(AVFormatContext *s, AVIOContext *pb,
  1123. AVPacket *pkt)
  1124. {
  1125. MatroskaMuxContext *mkv = s->priv_data;
  1126. int i, layer = 0, max_duration = 0, size, line_size, data_size = pkt->size;
  1127. uint8_t *start, *end, *data = pkt->data;
  1128. ebml_master blockgroup;
  1129. char buffer[2048];
  1130. while (data_size) {
  1131. int duration = ass_get_duration(s, data);
  1132. max_duration = FFMAX(duration, max_duration);
  1133. end = memchr(data, '\n', data_size);
  1134. size = line_size = end ? end - data + 1 : data_size;
  1135. size -= end ? (end[-1] == '\r') + 1 : 0;
  1136. start = data;
  1137. for (i = 0; i < 3; i++, start++)
  1138. if (!(start = memchr(start, ',', size - (start - data))))
  1139. return max_duration;
  1140. size -= start - data;
  1141. sscanf(data, "Dialogue: %d,", &layer);
  1142. i = snprintf(buffer, sizeof(buffer), "%" PRId64 ",%d,",
  1143. s->streams[pkt->stream_index]->nb_frames, layer);
  1144. size = FFMIN(i + size, sizeof(buffer));
  1145. memcpy(buffer + i, start, size - i);
  1146. av_log(s, AV_LOG_DEBUG,
  1147. "Writing block at offset %" PRIu64 ", size %d, "
  1148. "pts %" PRId64 ", duration %d\n",
  1149. avio_tell(pb), size, pkt->pts, duration);
  1150. blockgroup = start_ebml_master(pb, MATROSKA_ID_BLOCKGROUP,
  1151. mkv_blockgroup_size(size));
  1152. put_ebml_id(pb, MATROSKA_ID_BLOCK);
  1153. put_ebml_num(pb, size + 4, 0);
  1154. // this assumes stream_index is less than 126
  1155. avio_w8(pb, 0x80 | (pkt->stream_index + 1));
  1156. avio_wb16(pb, pkt->pts - mkv->cluster_pts);
  1157. avio_w8(pb, 0);
  1158. avio_write(pb, buffer, size);
  1159. put_ebml_uint(pb, MATROSKA_ID_BLOCKDURATION, duration);
  1160. end_ebml_master(pb, blockgroup);
  1161. data += line_size;
  1162. data_size -= line_size;
  1163. }
  1164. return max_duration;
  1165. }
  1166. static int mkv_strip_wavpack(const uint8_t *src, uint8_t **pdst, int *size)
  1167. {
  1168. uint8_t *dst;
  1169. int srclen = *size;
  1170. int offset = 0;
  1171. int ret;
  1172. dst = av_malloc(srclen);
  1173. if (!dst)
  1174. return AVERROR(ENOMEM);
  1175. while (srclen >= WV_HEADER_SIZE) {
  1176. WvHeader header;
  1177. ret = ff_wv_parse_header(&header, src);
  1178. if (ret < 0)
  1179. goto fail;
  1180. src += WV_HEADER_SIZE;
  1181. srclen -= WV_HEADER_SIZE;
  1182. if (srclen < header.blocksize) {
  1183. ret = AVERROR_INVALIDDATA;
  1184. goto fail;
  1185. }
  1186. if (header.initial) {
  1187. AV_WL32(dst + offset, header.samples);
  1188. offset += 4;
  1189. }
  1190. AV_WL32(dst + offset, header.flags);
  1191. AV_WL32(dst + offset + 4, header.crc);
  1192. offset += 8;
  1193. if (!(header.initial && header.final)) {
  1194. AV_WL32(dst + offset, header.blocksize);
  1195. offset += 4;
  1196. }
  1197. memcpy(dst + offset, src, header.blocksize);
  1198. src += header.blocksize;
  1199. srclen -= header.blocksize;
  1200. offset += header.blocksize;
  1201. }
  1202. *pdst = dst;
  1203. *size = offset;
  1204. return 0;
  1205. fail:
  1206. av_freep(&dst);
  1207. return ret;
  1208. }
  1209. static void mkv_write_block(AVFormatContext *s, AVIOContext *pb,
  1210. unsigned int blockid, AVPacket *pkt, int flags)
  1211. {
  1212. MatroskaMuxContext *mkv = s->priv_data;
  1213. AVCodecParameters *par = s->streams[pkt->stream_index]->codecpar;
  1214. uint8_t *data = NULL;
  1215. int offset = 0, size = pkt->size;
  1216. int64_t ts = mkv->tracks[pkt->stream_index].write_dts ? pkt->dts : pkt->pts;
  1217. av_log(s, AV_LOG_DEBUG, "Writing block at offset %" PRIu64 ", size %d, "
  1218. "pts %" PRId64 ", dts %" PRId64 ", duration %" PRId64 ", flags %d\n",
  1219. avio_tell(pb), pkt->size, pkt->pts, pkt->dts, pkt->duration, flags);
  1220. if (par->codec_id == AV_CODEC_ID_H264 && par->extradata_size > 0 &&
  1221. (AV_RB24(par->extradata) == 1 || AV_RB32(par->extradata) == 1))
  1222. ff_avc_parse_nal_units_buf(pkt->data, &data, &size);
  1223. else if (par->codec_id == AV_CODEC_ID_HEVC && par->extradata_size > 6 &&
  1224. (AV_RB24(par->extradata) == 1 || AV_RB32(par->extradata) == 1))
  1225. /* extradata is Annex B, assume the bitstream is too and convert it */
  1226. ff_hevc_annexb2mp4_buf(pkt->data, &data, &size, 0, NULL);
  1227. else if (par->codec_id == AV_CODEC_ID_WAVPACK) {
  1228. int ret = mkv_strip_wavpack(pkt->data, &data, &size);
  1229. if (ret < 0) {
  1230. av_log(s, AV_LOG_ERROR, "Error stripping a WavPack packet.\n");
  1231. return;
  1232. }
  1233. } else
  1234. data = pkt->data;
  1235. if (par->codec_id == AV_CODEC_ID_PRORES) {
  1236. /* Matroska specification requires to remove the first QuickTime atom
  1237. */
  1238. size -= 8;
  1239. offset = 8;
  1240. }
  1241. put_ebml_id(pb, blockid);
  1242. put_ebml_num(pb, size + 4, 0);
  1243. // this assumes stream_index is less than 126
  1244. avio_w8(pb, 0x80 | (pkt->stream_index + 1));
  1245. avio_wb16(pb, ts - mkv->cluster_pts);
  1246. avio_w8(pb, flags);
  1247. avio_write(pb, data + offset, size);
  1248. if (data != pkt->data)
  1249. av_free(data);
  1250. }
  1251. static int srt_get_duration(uint8_t **buf)
  1252. {
  1253. int i, duration = 0;
  1254. for (i = 0; i < 2 && !duration; i++) {
  1255. int s_hour, s_min, s_sec, s_hsec, e_hour, e_min, e_sec, e_hsec;
  1256. if (sscanf(*buf, "%d:%2d:%2d%*1[,.]%3d --> %d:%2d:%2d%*1[,.]%3d",
  1257. &s_hour, &s_min, &s_sec, &s_hsec,
  1258. &e_hour, &e_min, &e_sec, &e_hsec) == 8) {
  1259. s_min += 60 * s_hour;
  1260. e_min += 60 * e_hour;
  1261. s_sec += 60 * s_min;
  1262. e_sec += 60 * e_min;
  1263. s_hsec += 1000 * s_sec;
  1264. e_hsec += 1000 * e_sec;
  1265. duration = e_hsec - s_hsec;
  1266. }
  1267. *buf += strcspn(*buf, "\n") + 1;
  1268. }
  1269. return duration;
  1270. }
  1271. static int mkv_write_srt_blocks(AVFormatContext *s, AVIOContext *pb,
  1272. AVPacket *pkt)
  1273. {
  1274. ebml_master blockgroup;
  1275. AVPacket pkt2 = *pkt;
  1276. int64_t duration = srt_get_duration(&pkt2.data);
  1277. pkt2.size -= pkt2.data - pkt->data;
  1278. blockgroup = start_ebml_master(pb, MATROSKA_ID_BLOCKGROUP,
  1279. mkv_blockgroup_size(pkt2.size));
  1280. mkv_write_block(s, pb, MATROSKA_ID_BLOCK, &pkt2, 0);
  1281. put_ebml_uint(pb, MATROSKA_ID_BLOCKDURATION, duration);
  1282. end_ebml_master(pb, blockgroup);
  1283. return duration;
  1284. }
  1285. static void mkv_flush_dynbuf(AVFormatContext *s)
  1286. {
  1287. MatroskaMuxContext *mkv = s->priv_data;
  1288. int bufsize;
  1289. uint8_t *dyn_buf;
  1290. if (!mkv->dyn_bc)
  1291. return;
  1292. bufsize = avio_close_dyn_buf(mkv->dyn_bc, &dyn_buf);
  1293. avio_write(s->pb, dyn_buf, bufsize);
  1294. av_free(dyn_buf);
  1295. mkv->dyn_bc = NULL;
  1296. }
  1297. static int mkv_write_packet_internal(AVFormatContext *s, AVPacket *pkt)
  1298. {
  1299. MatroskaMuxContext *mkv = s->priv_data;
  1300. AVIOContext *pb = s->pb;
  1301. AVCodecParameters *par = s->streams[pkt->stream_index]->codecpar;
  1302. int keyframe = !!(pkt->flags & AV_PKT_FLAG_KEY);
  1303. int duration = pkt->duration;
  1304. int ret;
  1305. int64_t ts = mkv->tracks[pkt->stream_index].write_dts ? pkt->dts : pkt->pts;
  1306. if (ts == AV_NOPTS_VALUE) {
  1307. av_log(s, AV_LOG_ERROR, "Can't write packet with unknown timestamp\n");
  1308. return AVERROR(EINVAL);
  1309. }
  1310. ts += mkv->tracks[pkt->stream_index].ts_offset;
  1311. if (!s->pb->seekable) {
  1312. if (!mkv->dyn_bc) {
  1313. ret = avio_open_dyn_buf(&mkv->dyn_bc);
  1314. if (ret < 0)
  1315. return ret;
  1316. }
  1317. pb = mkv->dyn_bc;
  1318. }
  1319. if (!mkv->cluster_pos) {
  1320. mkv->cluster_pos = avio_tell(s->pb);
  1321. mkv->cluster = start_ebml_master(pb, MATROSKA_ID_CLUSTER, 0);
  1322. put_ebml_uint(pb, MATROSKA_ID_CLUSTERTIMECODE, FFMAX(0, ts));
  1323. mkv->cluster_pts = FFMAX(0, ts);
  1324. }
  1325. if (par->codec_type != AVMEDIA_TYPE_SUBTITLE) {
  1326. mkv_write_block(s, pb, MATROSKA_ID_SIMPLEBLOCK, pkt, keyframe << 7);
  1327. } else if (par->codec_id == AV_CODEC_ID_SSA) {
  1328. duration = mkv_write_ass_blocks(s, pb, pkt);
  1329. } else if (par->codec_id == AV_CODEC_ID_SRT) {
  1330. duration = mkv_write_srt_blocks(s, pb, pkt);
  1331. } else {
  1332. ebml_master blockgroup = start_ebml_master(pb, MATROSKA_ID_BLOCKGROUP,
  1333. mkv_blockgroup_size(pkt->size));
  1334. duration = pkt->duration;
  1335. #if FF_API_CONVERGENCE_DURATION
  1336. FF_DISABLE_DEPRECATION_WARNINGS
  1337. if (pkt->convergence_duration)
  1338. duration = pkt->convergence_duration;
  1339. FF_ENABLE_DEPRECATION_WARNINGS
  1340. #endif
  1341. mkv_write_block(s, pb, MATROSKA_ID_BLOCK, pkt, 0);
  1342. put_ebml_uint(pb, MATROSKA_ID_BLOCKDURATION, duration);
  1343. end_ebml_master(pb, blockgroup);
  1344. }
  1345. if (par->codec_type == AVMEDIA_TYPE_VIDEO && keyframe) {
  1346. ret = mkv_add_cuepoint(mkv->cues, pkt->stream_index, ts,
  1347. mkv->cluster_pos);
  1348. if (ret < 0)
  1349. return ret;
  1350. }
  1351. mkv->duration = FFMAX(mkv->duration, ts + duration);
  1352. return 0;
  1353. }
  1354. static int mkv_write_packet(AVFormatContext *s, AVPacket *pkt)
  1355. {
  1356. MatroskaMuxContext *mkv = s->priv_data;
  1357. int codec_type = s->streams[pkt->stream_index]->codecpar->codec_type;
  1358. int keyframe = !!(pkt->flags & AV_PKT_FLAG_KEY);
  1359. int cluster_size;
  1360. int64_t cluster_time;
  1361. AVIOContext *pb;
  1362. int ret;
  1363. if (mkv->tracks[pkt->stream_index].write_dts)
  1364. cluster_time = pkt->dts - mkv->cluster_pts;
  1365. else
  1366. cluster_time = pkt->pts - mkv->cluster_pts;
  1367. cluster_time += mkv->tracks[pkt->stream_index].ts_offset;
  1368. // start a new cluster every 5 MB or 5 sec, or 32k / 1 sec for streaming or
  1369. // after 4k and on a keyframe
  1370. if (s->pb->seekable) {
  1371. pb = s->pb;
  1372. cluster_size = avio_tell(pb) - mkv->cluster_pos;
  1373. } else {
  1374. pb = mkv->dyn_bc;
  1375. cluster_size = avio_tell(pb);
  1376. }
  1377. if (mkv->cluster_pos &&
  1378. (cluster_size > mkv->cluster_size_limit ||
  1379. cluster_time > mkv->cluster_time_limit ||
  1380. (codec_type == AVMEDIA_TYPE_VIDEO && keyframe &&
  1381. cluster_size > 4 * 1024))) {
  1382. av_log(s, AV_LOG_DEBUG,
  1383. "Starting new cluster at offset %" PRIu64 " bytes, "
  1384. "pts %" PRIu64 "dts %" PRIu64 "\n",
  1385. avio_tell(pb), pkt->pts, pkt->dts);
  1386. end_ebml_master(pb, mkv->cluster);
  1387. mkv->cluster_pos = 0;
  1388. if (mkv->dyn_bc)
  1389. mkv_flush_dynbuf(s);
  1390. avio_flush(s->pb);
  1391. }
  1392. // check if we have an audio packet cached
  1393. if (mkv->cur_audio_pkt.size > 0) {
  1394. ret = mkv_write_packet_internal(s, &mkv->cur_audio_pkt);
  1395. av_packet_unref(&mkv->cur_audio_pkt);
  1396. if (ret < 0) {
  1397. av_log(s, AV_LOG_ERROR,
  1398. "Could not write cached audio packet ret:%d\n", ret);
  1399. return ret;
  1400. }
  1401. }
  1402. // buffer an audio packet to ensure the packet containing the video
  1403. // keyframe's timecode is contained in the same cluster for WebM
  1404. if (codec_type == AVMEDIA_TYPE_AUDIO) {
  1405. ret = av_packet_ref(&mkv->cur_audio_pkt, pkt);
  1406. } else
  1407. ret = mkv_write_packet_internal(s, pkt);
  1408. return ret;
  1409. }
  1410. static int mkv_write_flush_packet(AVFormatContext *s, AVPacket *pkt)
  1411. {
  1412. MatroskaMuxContext *mkv = s->priv_data;
  1413. AVIOContext *pb;
  1414. if (s->pb->seekable)
  1415. pb = s->pb;
  1416. else
  1417. pb = mkv->dyn_bc;
  1418. if (!pkt) {
  1419. if (mkv->cluster_pos) {
  1420. av_log(s, AV_LOG_DEBUG,
  1421. "Flushing cluster at offset %" PRIu64 " bytes\n",
  1422. avio_tell(pb));
  1423. end_ebml_master(pb, mkv->cluster);
  1424. mkv->cluster_pos = 0;
  1425. if (mkv->dyn_bc)
  1426. mkv_flush_dynbuf(s);
  1427. avio_flush(s->pb);
  1428. }
  1429. return 1;
  1430. }
  1431. return mkv_write_packet(s, pkt);
  1432. }
  1433. static int mkv_write_trailer(AVFormatContext *s)
  1434. {
  1435. MatroskaMuxContext *mkv = s->priv_data;
  1436. AVIOContext *pb = s->pb;
  1437. int64_t currentpos, cuespos;
  1438. int ret;
  1439. // check if we have an audio packet cached
  1440. if (mkv->cur_audio_pkt.size > 0) {
  1441. ret = mkv_write_packet_internal(s, &mkv->cur_audio_pkt);
  1442. av_packet_unref(&mkv->cur_audio_pkt);
  1443. if (ret < 0) {
  1444. av_log(s, AV_LOG_ERROR,
  1445. "Could not write cached audio packet ret:%d\n", ret);
  1446. return ret;
  1447. }
  1448. }
  1449. if (mkv->dyn_bc) {
  1450. end_ebml_master(mkv->dyn_bc, mkv->cluster);
  1451. mkv_flush_dynbuf(s);
  1452. } else if (mkv->cluster_pos) {
  1453. end_ebml_master(pb, mkv->cluster);
  1454. }
  1455. if (mkv->mode != MODE_WEBM) {
  1456. ret = mkv_write_chapters(s);
  1457. if (ret < 0)
  1458. return ret;
  1459. }
  1460. if (pb->seekable) {
  1461. if (mkv->cues->num_entries) {
  1462. if (mkv->reserve_cues_space) {
  1463. int64_t cues_end;
  1464. currentpos = avio_tell(pb);
  1465. avio_seek(pb, mkv->cues_pos, SEEK_SET);
  1466. cuespos = mkv_write_cues(pb, mkv->cues, s->nb_streams);
  1467. cues_end = avio_tell(pb);
  1468. if (cues_end > cuespos + mkv->reserve_cues_space) {
  1469. av_log(s, AV_LOG_ERROR,
  1470. "Insufficient space reserved for cues: %d "
  1471. "(needed: %" PRId64 ").\n",
  1472. mkv->reserve_cues_space, cues_end - cuespos);
  1473. return AVERROR(EINVAL);
  1474. }
  1475. if (cues_end < cuespos + mkv->reserve_cues_space)
  1476. put_ebml_void(pb, mkv->reserve_cues_space -
  1477. (cues_end - cuespos));
  1478. avio_seek(pb, currentpos, SEEK_SET);
  1479. } else {
  1480. cuespos = mkv_write_cues(pb, mkv->cues, s->nb_streams);
  1481. }
  1482. ret = mkv_add_seekhead_entry(mkv->main_seekhead, MATROSKA_ID_CUES,
  1483. cuespos);
  1484. if (ret < 0)
  1485. return ret;
  1486. }
  1487. mkv_write_seekhead(pb, mkv->main_seekhead);
  1488. // update the duration
  1489. av_log(s, AV_LOG_DEBUG, "end duration = %" PRIu64 "\n", mkv->duration);
  1490. currentpos = avio_tell(pb);
  1491. avio_seek(pb, mkv->duration_offset, SEEK_SET);
  1492. put_ebml_float(pb, MATROSKA_ID_DURATION, mkv->duration);
  1493. avio_seek(pb, currentpos, SEEK_SET);
  1494. }
  1495. end_ebml_master(pb, mkv->segment);
  1496. av_free(mkv->tracks);
  1497. av_freep(&mkv->cues->entries);
  1498. av_freep(&mkv->cues);
  1499. return 0;
  1500. }
  1501. static int mkv_query_codec(enum AVCodecID codec_id, int std_compliance)
  1502. {
  1503. int i;
  1504. for (i = 0; ff_mkv_codec_tags[i].id != AV_CODEC_ID_NONE; i++)
  1505. if (ff_mkv_codec_tags[i].id == codec_id)
  1506. return 1;
  1507. if (std_compliance < FF_COMPLIANCE_NORMAL) {
  1508. enum AVMediaType type = avcodec_get_type(codec_id);
  1509. // mkv theoretically supports any video/audio through VFW/ACM
  1510. if (type == AVMEDIA_TYPE_VIDEO || type == AVMEDIA_TYPE_AUDIO)
  1511. return 1;
  1512. }
  1513. return 0;
  1514. }
  1515. #define OFFSET(x) offsetof(MatroskaMuxContext, x)
  1516. #define FLAGS AV_OPT_FLAG_ENCODING_PARAM
  1517. static const AVOption options[] = {
  1518. { "reserve_index_space", "Reserve a given amount of space (in bytes) at the beginning of the file for the index (cues).", OFFSET(reserve_cues_space), AV_OPT_TYPE_INT, { .i64 = 0 }, 0, INT_MAX, FLAGS },
  1519. { "cluster_size_limit", "Store at most the provided amount of bytes in a cluster. ", OFFSET(cluster_size_limit), AV_OPT_TYPE_INT , { .i64 = -1 }, -1, INT_MAX, FLAGS },
  1520. { "cluster_time_limit", "Store at most the provided number of milliseconds in a cluster.", OFFSET(cluster_time_limit), AV_OPT_TYPE_INT64, { .i64 = -1 }, -1, INT64_MAX, FLAGS },
  1521. { NULL },
  1522. };
  1523. #if CONFIG_MATROSKA_MUXER
  1524. static const AVClass matroska_class = {
  1525. .class_name = "matroska muxer",
  1526. .item_name = av_default_item_name,
  1527. .option = options,
  1528. .version = LIBAVUTIL_VERSION_INT,
  1529. };
  1530. AVOutputFormat ff_matroska_muxer = {
  1531. .name = "matroska",
  1532. .long_name = NULL_IF_CONFIG_SMALL("Matroska"),
  1533. .mime_type = "video/x-matroska",
  1534. .extensions = "mkv",
  1535. .priv_data_size = sizeof(MatroskaMuxContext),
  1536. .audio_codec = CONFIG_LIBVORBIS_ENCODER ?
  1537. AV_CODEC_ID_VORBIS : AV_CODEC_ID_AC3,
  1538. .video_codec = CONFIG_LIBX264_ENCODER ?
  1539. AV_CODEC_ID_H264 : AV_CODEC_ID_MPEG4,
  1540. .write_header = mkv_write_header,
  1541. .write_packet = mkv_write_flush_packet,
  1542. .write_trailer = mkv_write_trailer,
  1543. .flags = AVFMT_GLOBALHEADER | AVFMT_VARIABLE_FPS |
  1544. AVFMT_TS_NONSTRICT | AVFMT_ALLOW_FLUSH,
  1545. .codec_tag = (const AVCodecTag* const []){
  1546. ff_codec_bmp_tags, ff_codec_wav_tags, 0
  1547. },
  1548. .subtitle_codec = AV_CODEC_ID_SSA,
  1549. .query_codec = mkv_query_codec,
  1550. .priv_class = &matroska_class,
  1551. };
  1552. #endif
  1553. #if CONFIG_WEBM_MUXER
  1554. static const AVClass webm_class = {
  1555. .class_name = "webm muxer",
  1556. .item_name = av_default_item_name,
  1557. .option = options,
  1558. .version = LIBAVUTIL_VERSION_INT,
  1559. };
  1560. AVOutputFormat ff_webm_muxer = {
  1561. .name = "webm",
  1562. .long_name = NULL_IF_CONFIG_SMALL("WebM"),
  1563. .mime_type = "video/webm",
  1564. .extensions = "webm",
  1565. .priv_data_size = sizeof(MatroskaMuxContext),
  1566. .audio_codec = CONFIG_LIBOPUS_ENCODER ? AV_CODEC_ID_OPUS : AV_CODEC_ID_VORBIS,
  1567. .video_codec = CONFIG_LIBVPX_VP9_ENCODER? AV_CODEC_ID_VP9 : AV_CODEC_ID_VP8,
  1568. .write_header = mkv_write_header,
  1569. .write_packet = mkv_write_flush_packet,
  1570. .write_trailer = mkv_write_trailer,
  1571. .flags = AVFMT_GLOBALHEADER | AVFMT_VARIABLE_FPS |
  1572. AVFMT_TS_NONSTRICT | AVFMT_ALLOW_FLUSH,
  1573. .priv_class = &webm_class,
  1574. };
  1575. #endif
  1576. #if CONFIG_MATROSKA_AUDIO_MUXER
  1577. static const AVClass mka_class = {
  1578. .class_name = "matroska audio muxer",
  1579. .item_name = av_default_item_name,
  1580. .option = options,
  1581. .version = LIBAVUTIL_VERSION_INT,
  1582. };
  1583. AVOutputFormat ff_matroska_audio_muxer = {
  1584. .name = "matroska",
  1585. .long_name = NULL_IF_CONFIG_SMALL("Matroska"),
  1586. .mime_type = "audio/x-matroska",
  1587. .extensions = "mka",
  1588. .priv_data_size = sizeof(MatroskaMuxContext),
  1589. .audio_codec = CONFIG_LIBVORBIS_ENCODER ?
  1590. AV_CODEC_ID_VORBIS : AV_CODEC_ID_AC3,
  1591. .video_codec = AV_CODEC_ID_NONE,
  1592. .write_header = mkv_write_header,
  1593. .write_packet = mkv_write_flush_packet,
  1594. .write_trailer = mkv_write_trailer,
  1595. .flags = AVFMT_GLOBALHEADER | AVFMT_TS_NONSTRICT |
  1596. AVFMT_ALLOW_FLUSH,
  1597. .codec_tag = (const AVCodecTag* const []){ ff_codec_wav_tags, 0 },
  1598. .priv_class = &mka_class,
  1599. };
  1600. #endif