You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

1013 lines
38KB

  1. /*
  2. * MXF demuxer.
  3. * Copyright (c) 2006 SmartJog S.A., Baptiste Coudurier <baptiste dot coudurier at smartjog dot com>
  4. *
  5. * This file is part of FFmpeg.
  6. *
  7. * FFmpeg is free software; you can redistribute it and/or
  8. * modify it under the terms of the GNU Lesser General Public
  9. * License as published by the Free Software Foundation; either
  10. * version 2.1 of the License, or (at your option) any later version.
  11. *
  12. * FFmpeg is distributed in the hope that it will be useful,
  13. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  15. * Lesser General Public License for more details.
  16. *
  17. * You should have received a copy of the GNU Lesser General Public
  18. * License along with FFmpeg; if not, write to the Free Software
  19. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  20. */
  21. /*
  22. * References
  23. * SMPTE 336M KLV Data Encoding Protocol Using Key-Length-Value
  24. * SMPTE 377M MXF File Format Specifications
  25. * SMPTE 378M Operational Pattern 1a
  26. * SMPTE 379M MXF Generic Container
  27. * SMPTE 381M Mapping MPEG Streams into the MXF Generic Container
  28. * SMPTE 382M Mapping AES3 and Broadcast Wave Audio into the MXF Generic Container
  29. * SMPTE 383M Mapping DV-DIF Data to the MXF Generic Container
  30. *
  31. * Principle
  32. * Search for Track numbers which will identify essence element KLV packets.
  33. * Search for SourcePackages, which define tracks that contain Track numbers.
  34. * The Material Package contains tracks that reference SourcePackage tracks.
  35. * Search for Descriptors (Picture, Sound), which contain codec info and parameters.
  36. * Assign Descriptors to correct Tracks.
  37. *
  38. * Metadata reading functions read Local Tags, get InstanceUID(0x3C0A) then add MetaDataSet to MXFContext.
  39. * Metadata parsing resolves Strong References to objects.
  40. *
  41. * Simple demuxer, only OP1A supported and some files might not work at all.
  42. * Only tracks with associated descriptors will be decoded. "Highly Desirable" SMPTE 377M D.1
  43. */
  44. //#define DEBUG
  45. #include "libavutil/aes.h"
  46. #include "libavcodec/bytestream.h"
  47. #include "avformat.h"
  48. #include "mxf.h"
  49. typedef struct {
  50. UID uid;
  51. enum MXFMetadataSetType type;
  52. UID source_container_ul;
  53. } MXFCryptoContext;
  54. typedef struct {
  55. UID uid;
  56. enum MXFMetadataSetType type;
  57. UID source_package_uid;
  58. UID data_definition_ul;
  59. int64_t duration;
  60. int64_t start_position;
  61. int source_track_id;
  62. } MXFStructuralComponent;
  63. typedef struct {
  64. UID uid;
  65. enum MXFMetadataSetType type;
  66. UID data_definition_ul;
  67. UID *structural_components_refs;
  68. int structural_components_count;
  69. int64_t duration;
  70. } MXFSequence;
  71. typedef struct {
  72. UID uid;
  73. enum MXFMetadataSetType type;
  74. MXFSequence *sequence; /* mandatory, and only one */
  75. UID sequence_ref;
  76. int track_id;
  77. uint8_t track_number[4];
  78. AVRational edit_rate;
  79. } MXFTrack;
  80. typedef struct {
  81. UID uid;
  82. enum MXFMetadataSetType type;
  83. UID essence_container_ul;
  84. UID essence_codec_ul;
  85. AVRational sample_rate;
  86. AVRational aspect_ratio;
  87. int width;
  88. int height;
  89. int channels;
  90. int bits_per_sample;
  91. UID *sub_descriptors_refs;
  92. int sub_descriptors_count;
  93. int linked_track_id;
  94. uint8_t *extradata;
  95. int extradata_size;
  96. enum PixelFormat pix_fmt;
  97. } MXFDescriptor;
  98. typedef struct {
  99. UID uid;
  100. enum MXFMetadataSetType type;
  101. } MXFIndexTableSegment;
  102. typedef struct {
  103. UID uid;
  104. enum MXFMetadataSetType type;
  105. UID package_uid;
  106. UID *tracks_refs;
  107. int tracks_count;
  108. MXFDescriptor *descriptor; /* only one */
  109. UID descriptor_ref;
  110. } MXFPackage;
  111. typedef struct {
  112. UID uid;
  113. enum MXFMetadataSetType type;
  114. } MXFMetadataSet;
  115. typedef struct {
  116. UID *packages_refs;
  117. int packages_count;
  118. MXFMetadataSet **metadata_sets;
  119. int metadata_sets_count;
  120. AVFormatContext *fc;
  121. struct AVAES *aesc;
  122. uint8_t *local_tags;
  123. int local_tags_count;
  124. } MXFContext;
  125. enum MXFWrappingScheme {
  126. Frame,
  127. Clip,
  128. };
  129. typedef struct {
  130. const UID key;
  131. int (*read)();
  132. int ctx_size;
  133. enum MXFMetadataSetType type;
  134. } MXFMetadataReadTableEntry;
  135. /* partial keys to match */
  136. static const uint8_t mxf_header_partition_pack_key[] = { 0x06,0x0e,0x2b,0x34,0x02,0x05,0x01,0x01,0x0d,0x01,0x02,0x01,0x01,0x02 };
  137. static const uint8_t mxf_essence_element_key[] = { 0x06,0x0e,0x2b,0x34,0x01,0x02,0x01,0x01,0x0d,0x01,0x03,0x01 };
  138. static const uint8_t mxf_klv_key[] = { 0x06,0x0e,0x2b,0x34 };
  139. /* complete keys to match */
  140. static const uint8_t mxf_crypto_source_container_ul[] = { 0x06,0x0e,0x2b,0x34,0x01,0x01,0x01,0x09,0x06,0x01,0x01,0x02,0x02,0x00,0x00,0x00 };
  141. static const uint8_t mxf_encrypted_triplet_key[] = { 0x06,0x0e,0x2b,0x34,0x02,0x04,0x01,0x07,0x0d,0x01,0x03,0x01,0x02,0x7e,0x01,0x00 };
  142. static const uint8_t mxf_encrypted_essence_container[] = { 0x06,0x0e,0x2b,0x34,0x04,0x01,0x01,0x07,0x0d,0x01,0x03,0x01,0x02,0x0b,0x01,0x00 };
  143. static const uint8_t mxf_sony_mpeg4_extradata[] = { 0x06,0x0e,0x2b,0x34,0x04,0x01,0x01,0x01,0x0e,0x06,0x06,0x02,0x02,0x01,0x00,0x00 };
  144. #define IS_KLV_KEY(x, y) (!memcmp(x, y, sizeof(y)))
  145. static int64_t klv_decode_ber_length(ByteIOContext *pb)
  146. {
  147. uint64_t size = get_byte(pb);
  148. if (size & 0x80) { /* long form */
  149. int bytes_num = size & 0x7f;
  150. /* SMPTE 379M 5.3.4 guarantee that bytes_num must not exceed 8 bytes */
  151. if (bytes_num > 8)
  152. return -1;
  153. size = 0;
  154. while (bytes_num--)
  155. size = size << 8 | get_byte(pb);
  156. }
  157. return size;
  158. }
  159. static int mxf_read_sync(ByteIOContext *pb, const uint8_t *key, unsigned size)
  160. {
  161. int i, b;
  162. for (i = 0; i < size && !url_feof(pb); i++) {
  163. b = get_byte(pb);
  164. if (b == key[0])
  165. i = 0;
  166. else if (b != key[i])
  167. i = -1;
  168. }
  169. return i == size;
  170. }
  171. static int klv_read_packet(KLVPacket *klv, ByteIOContext *pb)
  172. {
  173. if (!mxf_read_sync(pb, mxf_klv_key, 4))
  174. return -1;
  175. klv->offset = url_ftell(pb) - 4;
  176. memcpy(klv->key, mxf_klv_key, 4);
  177. get_buffer(pb, klv->key + 4, 12);
  178. klv->length = klv_decode_ber_length(pb);
  179. return klv->length == -1 ? -1 : 0;
  180. }
  181. static int mxf_get_stream_index(AVFormatContext *s, KLVPacket *klv)
  182. {
  183. int i;
  184. for (i = 0; i < s->nb_streams; i++) {
  185. MXFTrack *track = s->streams[i]->priv_data;
  186. /* SMPTE 379M 7.3 */
  187. if (!memcmp(klv->key + sizeof(mxf_essence_element_key), track->track_number, sizeof(track->track_number)))
  188. return i;
  189. }
  190. /* return 0 if only one stream, for OP Atom files with 0 as track number */
  191. return s->nb_streams == 1 ? 0 : -1;
  192. }
  193. /* XXX: use AVBitStreamFilter */
  194. static int mxf_get_d10_aes3_packet(ByteIOContext *pb, AVStream *st, AVPacket *pkt, int64_t length)
  195. {
  196. const uint8_t *buf_ptr, *end_ptr;
  197. uint8_t *data_ptr;
  198. int i;
  199. if (length > 61444) /* worst case PAL 1920 samples 8 channels */
  200. return -1;
  201. av_new_packet(pkt, length);
  202. get_buffer(pb, pkt->data, length);
  203. data_ptr = pkt->data;
  204. end_ptr = pkt->data + length;
  205. buf_ptr = pkt->data + 4; /* skip SMPTE 331M header */
  206. for (; buf_ptr < end_ptr; ) {
  207. for (i = 0; i < st->codec->channels; i++) {
  208. uint32_t sample = bytestream_get_le32(&buf_ptr);
  209. if (st->codec->bits_per_coded_sample == 24)
  210. bytestream_put_le24(&data_ptr, (sample >> 4) & 0xffffff);
  211. else
  212. bytestream_put_le16(&data_ptr, (sample >> 12) & 0xffff);
  213. }
  214. buf_ptr += 32 - st->codec->channels*4; // always 8 channels stored SMPTE 331M
  215. }
  216. pkt->size = data_ptr - pkt->data;
  217. return 0;
  218. }
  219. static int mxf_decrypt_triplet(AVFormatContext *s, AVPacket *pkt, KLVPacket *klv)
  220. {
  221. static const uint8_t checkv[16] = {0x43, 0x48, 0x55, 0x4b, 0x43, 0x48, 0x55, 0x4b, 0x43, 0x48, 0x55, 0x4b, 0x43, 0x48, 0x55, 0x4b};
  222. MXFContext *mxf = s->priv_data;
  223. ByteIOContext *pb = s->pb;
  224. int64_t end = url_ftell(pb) + klv->length;
  225. uint64_t size;
  226. uint64_t orig_size;
  227. uint64_t plaintext_size;
  228. uint8_t ivec[16];
  229. uint8_t tmpbuf[16];
  230. int index;
  231. if (!mxf->aesc && s->key && s->keylen == 16) {
  232. mxf->aesc = av_malloc(av_aes_size);
  233. if (!mxf->aesc)
  234. return -1;
  235. av_aes_init(mxf->aesc, s->key, 128, 1);
  236. }
  237. // crypto context
  238. url_fskip(pb, klv_decode_ber_length(pb));
  239. // plaintext offset
  240. klv_decode_ber_length(pb);
  241. plaintext_size = get_be64(pb);
  242. // source klv key
  243. klv_decode_ber_length(pb);
  244. get_buffer(pb, klv->key, 16);
  245. if (!IS_KLV_KEY(klv, mxf_essence_element_key))
  246. return -1;
  247. index = mxf_get_stream_index(s, klv);
  248. if (index < 0)
  249. return -1;
  250. // source size
  251. klv_decode_ber_length(pb);
  252. orig_size = get_be64(pb);
  253. if (orig_size < plaintext_size)
  254. return -1;
  255. // enc. code
  256. size = klv_decode_ber_length(pb);
  257. if (size < 32 || size - 32 < orig_size)
  258. return -1;
  259. get_buffer(pb, ivec, 16);
  260. get_buffer(pb, tmpbuf, 16);
  261. if (mxf->aesc)
  262. av_aes_crypt(mxf->aesc, tmpbuf, tmpbuf, 1, ivec, 1);
  263. if (memcmp(tmpbuf, checkv, 16))
  264. av_log(s, AV_LOG_ERROR, "probably incorrect decryption key\n");
  265. size -= 32;
  266. av_get_packet(pb, pkt, size);
  267. size -= plaintext_size;
  268. if (mxf->aesc)
  269. av_aes_crypt(mxf->aesc, &pkt->data[plaintext_size],
  270. &pkt->data[plaintext_size], size >> 4, ivec, 1);
  271. pkt->size = orig_size;
  272. pkt->stream_index = index;
  273. url_fskip(pb, end - url_ftell(pb));
  274. return 0;
  275. }
  276. static int mxf_read_packet(AVFormatContext *s, AVPacket *pkt)
  277. {
  278. KLVPacket klv;
  279. while (!url_feof(s->pb)) {
  280. if (klv_read_packet(&klv, s->pb) < 0)
  281. return -1;
  282. PRINT_KEY(s, "read packet", klv.key);
  283. dprintf(s, "size %lld offset %#llx\n", klv.length, klv.offset);
  284. if (IS_KLV_KEY(klv.key, mxf_encrypted_triplet_key)) {
  285. int res = mxf_decrypt_triplet(s, pkt, &klv);
  286. if (res < 0) {
  287. av_log(s, AV_LOG_ERROR, "invalid encoded triplet\n");
  288. return -1;
  289. }
  290. return 0;
  291. }
  292. if (IS_KLV_KEY(klv.key, mxf_essence_element_key)) {
  293. int index = mxf_get_stream_index(s, &klv);
  294. if (index < 0) {
  295. av_log(s, AV_LOG_ERROR, "error getting stream index %d\n", AV_RB32(klv.key+12));
  296. goto skip;
  297. }
  298. if (s->streams[index]->discard == AVDISCARD_ALL)
  299. goto skip;
  300. /* check for 8 channels AES3 element */
  301. if (klv.key[12] == 0x06 && klv.key[13] == 0x01 && klv.key[14] == 0x10) {
  302. if (mxf_get_d10_aes3_packet(s->pb, s->streams[index], pkt, klv.length) < 0) {
  303. av_log(s, AV_LOG_ERROR, "error reading D-10 aes3 frame\n");
  304. return -1;
  305. }
  306. } else
  307. av_get_packet(s->pb, pkt, klv.length);
  308. pkt->stream_index = index;
  309. pkt->pos = klv.offset;
  310. return 0;
  311. } else
  312. skip:
  313. url_fskip(s->pb, klv.length);
  314. }
  315. return AVERROR_EOF;
  316. }
  317. static int mxf_read_primer_pack(MXFContext *mxf)
  318. {
  319. ByteIOContext *pb = mxf->fc->pb;
  320. int item_num = get_be32(pb);
  321. int item_len = get_be32(pb);
  322. if (item_len != 18) {
  323. av_log(mxf->fc, AV_LOG_ERROR, "unsupported primer pack item length\n");
  324. return -1;
  325. }
  326. if (item_num > UINT_MAX / item_len)
  327. return -1;
  328. mxf->local_tags_count = item_num;
  329. mxf->local_tags = av_malloc(item_num*item_len);
  330. if (!mxf->local_tags)
  331. return -1;
  332. get_buffer(pb, mxf->local_tags, item_num*item_len);
  333. return 0;
  334. }
  335. static int mxf_add_metadata_set(MXFContext *mxf, void *metadata_set)
  336. {
  337. if (mxf->metadata_sets_count+1 >= UINT_MAX / sizeof(*mxf->metadata_sets))
  338. return AVERROR(ENOMEM);
  339. mxf->metadata_sets = av_realloc(mxf->metadata_sets, (mxf->metadata_sets_count + 1) * sizeof(*mxf->metadata_sets));
  340. if (!mxf->metadata_sets)
  341. return -1;
  342. mxf->metadata_sets[mxf->metadata_sets_count] = metadata_set;
  343. mxf->metadata_sets_count++;
  344. return 0;
  345. }
  346. static int mxf_read_cryptographic_context(MXFCryptoContext *cryptocontext, ByteIOContext *pb, int tag, int size, UID uid)
  347. {
  348. if (size != 16)
  349. return -1;
  350. if (IS_KLV_KEY(uid, mxf_crypto_source_container_ul))
  351. get_buffer(pb, cryptocontext->source_container_ul, 16);
  352. return 0;
  353. }
  354. static int mxf_read_content_storage(MXFContext *mxf, ByteIOContext *pb, int tag)
  355. {
  356. switch (tag) {
  357. case 0x1901:
  358. mxf->packages_count = get_be32(pb);
  359. if (mxf->packages_count >= UINT_MAX / sizeof(UID))
  360. return -1;
  361. mxf->packages_refs = av_malloc(mxf->packages_count * sizeof(UID));
  362. if (!mxf->packages_refs)
  363. return -1;
  364. url_fskip(pb, 4); /* useless size of objects, always 16 according to specs */
  365. get_buffer(pb, (uint8_t *)mxf->packages_refs, mxf->packages_count * sizeof(UID));
  366. break;
  367. }
  368. return 0;
  369. }
  370. static int mxf_read_source_clip(MXFStructuralComponent *source_clip, ByteIOContext *pb, int tag)
  371. {
  372. switch(tag) {
  373. case 0x0202:
  374. source_clip->duration = get_be64(pb);
  375. break;
  376. case 0x1201:
  377. source_clip->start_position = get_be64(pb);
  378. break;
  379. case 0x1101:
  380. /* UMID, only get last 16 bytes */
  381. url_fskip(pb, 16);
  382. get_buffer(pb, source_clip->source_package_uid, 16);
  383. break;
  384. case 0x1102:
  385. source_clip->source_track_id = get_be32(pb);
  386. break;
  387. }
  388. return 0;
  389. }
  390. static int mxf_read_material_package(MXFPackage *package, ByteIOContext *pb, int tag)
  391. {
  392. switch(tag) {
  393. case 0x4403:
  394. package->tracks_count = get_be32(pb);
  395. if (package->tracks_count >= UINT_MAX / sizeof(UID))
  396. return -1;
  397. package->tracks_refs = av_malloc(package->tracks_count * sizeof(UID));
  398. if (!package->tracks_refs)
  399. return -1;
  400. url_fskip(pb, 4); /* useless size of objects, always 16 according to specs */
  401. get_buffer(pb, (uint8_t *)package->tracks_refs, package->tracks_count * sizeof(UID));
  402. break;
  403. }
  404. return 0;
  405. }
  406. static int mxf_read_track(MXFTrack *track, ByteIOContext *pb, int tag)
  407. {
  408. switch(tag) {
  409. case 0x4801:
  410. track->track_id = get_be32(pb);
  411. break;
  412. case 0x4804:
  413. get_buffer(pb, track->track_number, 4);
  414. break;
  415. case 0x4B01:
  416. track->edit_rate.den = get_be32(pb);
  417. track->edit_rate.num = get_be32(pb);
  418. break;
  419. case 0x4803:
  420. get_buffer(pb, track->sequence_ref, 16);
  421. break;
  422. }
  423. return 0;
  424. }
  425. static int mxf_read_sequence(MXFSequence *sequence, ByteIOContext *pb, int tag)
  426. {
  427. switch(tag) {
  428. case 0x0202:
  429. sequence->duration = get_be64(pb);
  430. break;
  431. case 0x0201:
  432. get_buffer(pb, sequence->data_definition_ul, 16);
  433. break;
  434. case 0x1001:
  435. sequence->structural_components_count = get_be32(pb);
  436. if (sequence->structural_components_count >= UINT_MAX / sizeof(UID))
  437. return -1;
  438. sequence->structural_components_refs = av_malloc(sequence->structural_components_count * sizeof(UID));
  439. if (!sequence->structural_components_refs)
  440. return -1;
  441. url_fskip(pb, 4); /* useless size of objects, always 16 according to specs */
  442. get_buffer(pb, (uint8_t *)sequence->structural_components_refs, sequence->structural_components_count * sizeof(UID));
  443. break;
  444. }
  445. return 0;
  446. }
  447. static int mxf_read_source_package(MXFPackage *package, ByteIOContext *pb, int tag)
  448. {
  449. switch(tag) {
  450. case 0x4403:
  451. package->tracks_count = get_be32(pb);
  452. if (package->tracks_count >= UINT_MAX / sizeof(UID))
  453. return -1;
  454. package->tracks_refs = av_malloc(package->tracks_count * sizeof(UID));
  455. if (!package->tracks_refs)
  456. return -1;
  457. url_fskip(pb, 4); /* useless size of objects, always 16 according to specs */
  458. get_buffer(pb, (uint8_t *)package->tracks_refs, package->tracks_count * sizeof(UID));
  459. break;
  460. case 0x4401:
  461. /* UMID, only get last 16 bytes */
  462. url_fskip(pb, 16);
  463. get_buffer(pb, package->package_uid, 16);
  464. break;
  465. case 0x4701:
  466. get_buffer(pb, package->descriptor_ref, 16);
  467. break;
  468. }
  469. return 0;
  470. }
  471. static int mxf_read_index_table_segment(MXFIndexTableSegment *segment, ByteIOContext *pb, int tag)
  472. {
  473. switch(tag) {
  474. case 0x3F05: dprintf(NULL, "EditUnitByteCount %d\n", get_be32(pb)); break;
  475. case 0x3F06: dprintf(NULL, "IndexSID %d\n", get_be32(pb)); break;
  476. case 0x3F07: dprintf(NULL, "BodySID %d\n", get_be32(pb)); break;
  477. case 0x3F0B: dprintf(NULL, "IndexEditRate %d/%d\n", get_be32(pb), get_be32(pb)); break;
  478. case 0x3F0C: dprintf(NULL, "IndexStartPosition %lld\n", get_be64(pb)); break;
  479. case 0x3F0D: dprintf(NULL, "IndexDuration %lld\n", get_be64(pb)); break;
  480. }
  481. return 0;
  482. }
  483. static void mxf_read_pixel_layout(ByteIOContext *pb, MXFDescriptor *descriptor)
  484. {
  485. int code, value, ofs = 0;
  486. char layout[16] = {};
  487. do {
  488. code = get_byte(pb);
  489. value = get_byte(pb);
  490. dprintf(NULL, "pixel layout: code %#x\n", code);
  491. if (ofs < 16) {
  492. layout[ofs++] = code;
  493. layout[ofs++] = value;
  494. }
  495. } while (code != 0); /* SMPTE 377M E.2.46 */
  496. ff_mxf_decode_pixel_layout(layout, &descriptor->pix_fmt);
  497. }
  498. static int mxf_read_generic_descriptor(MXFDescriptor *descriptor, ByteIOContext *pb, int tag, int size, UID uid)
  499. {
  500. switch(tag) {
  501. case 0x3F01:
  502. descriptor->sub_descriptors_count = get_be32(pb);
  503. if (descriptor->sub_descriptors_count >= UINT_MAX / sizeof(UID))
  504. return -1;
  505. descriptor->sub_descriptors_refs = av_malloc(descriptor->sub_descriptors_count * sizeof(UID));
  506. if (!descriptor->sub_descriptors_refs)
  507. return -1;
  508. url_fskip(pb, 4); /* useless size of objects, always 16 according to specs */
  509. get_buffer(pb, (uint8_t *)descriptor->sub_descriptors_refs, descriptor->sub_descriptors_count * sizeof(UID));
  510. break;
  511. case 0x3004:
  512. get_buffer(pb, descriptor->essence_container_ul, 16);
  513. break;
  514. case 0x3006:
  515. descriptor->linked_track_id = get_be32(pb);
  516. break;
  517. case 0x3201: /* PictureEssenceCoding */
  518. get_buffer(pb, descriptor->essence_codec_ul, 16);
  519. break;
  520. case 0x3203:
  521. descriptor->width = get_be32(pb);
  522. break;
  523. case 0x3202:
  524. descriptor->height = get_be32(pb);
  525. break;
  526. case 0x320E:
  527. descriptor->aspect_ratio.num = get_be32(pb);
  528. descriptor->aspect_ratio.den = get_be32(pb);
  529. break;
  530. case 0x3D03:
  531. descriptor->sample_rate.num = get_be32(pb);
  532. descriptor->sample_rate.den = get_be32(pb);
  533. break;
  534. case 0x3D06: /* SoundEssenceCompression */
  535. get_buffer(pb, descriptor->essence_codec_ul, 16);
  536. break;
  537. case 0x3D07:
  538. descriptor->channels = get_be32(pb);
  539. break;
  540. case 0x3D01:
  541. descriptor->bits_per_sample = get_be32(pb);
  542. break;
  543. case 0x3401:
  544. mxf_read_pixel_layout(pb, descriptor);
  545. break;
  546. default:
  547. /* Private uid used by SONY C0023S01.mxf */
  548. if (IS_KLV_KEY(uid, mxf_sony_mpeg4_extradata)) {
  549. descriptor->extradata = av_malloc(size);
  550. if (!descriptor->extradata)
  551. return -1;
  552. descriptor->extradata_size = size;
  553. get_buffer(pb, descriptor->extradata, size);
  554. }
  555. break;
  556. }
  557. return 0;
  558. }
  559. /*
  560. * Match an uid independently of the version byte and up to len common bytes
  561. * Returns: boolean
  562. */
  563. static int mxf_match_uid(const UID key, const UID uid, int len)
  564. {
  565. int i;
  566. for (i = 0; i < len; i++) {
  567. if (i != 7 && key[i] != uid[i])
  568. return 0;
  569. }
  570. return 1;
  571. }
  572. static const MXFCodecUL *mxf_get_codec_ul(const MXFCodecUL *uls, UID *uid)
  573. {
  574. while (uls->uid[0]) {
  575. if(mxf_match_uid(uls->uid, *uid, uls->matching_len))
  576. break;
  577. uls++;
  578. }
  579. return uls;
  580. }
  581. static void *mxf_resolve_strong_ref(MXFContext *mxf, UID *strong_ref, enum MXFMetadataSetType type)
  582. {
  583. int i;
  584. if (!strong_ref)
  585. return NULL;
  586. for (i = 0; i < mxf->metadata_sets_count; i++) {
  587. if (!memcmp(*strong_ref, mxf->metadata_sets[i]->uid, 16) &&
  588. (type == AnyType || mxf->metadata_sets[i]->type == type)) {
  589. return mxf->metadata_sets[i];
  590. }
  591. }
  592. return NULL;
  593. }
  594. static const MXFCodecUL mxf_essence_container_uls[] = {
  595. // video essence container uls
  596. { { 0x06,0x0E,0x2B,0x34,0x04,0x01,0x01,0x02,0x0D,0x01,0x03,0x01,0x02,0x04,0x60,0x01 }, 14, CODEC_ID_MPEG2VIDEO }, /* MPEG-ES Frame wrapped */
  597. { { 0x06,0x0E,0x2B,0x34,0x04,0x01,0x01,0x01,0x0D,0x01,0x03,0x01,0x02,0x02,0x41,0x01 }, 14, CODEC_ID_DVVIDEO }, /* DV 625 25mbps */
  598. // sound essence container uls
  599. { { 0x06,0x0E,0x2B,0x34,0x04,0x01,0x01,0x01,0x0D,0x01,0x03,0x01,0x02,0x06,0x01,0x00 }, 14, CODEC_ID_PCM_S16LE }, /* BWF Frame wrapped */
  600. { { 0x06,0x0E,0x2B,0x34,0x04,0x01,0x01,0x02,0x0D,0x01,0x03,0x01,0x02,0x04,0x40,0x01 }, 14, CODEC_ID_MP2 }, /* MPEG-ES Frame wrapped, 0x40 ??? stream id */
  601. { { 0x06,0x0E,0x2B,0x34,0x04,0x01,0x01,0x01,0x0D,0x01,0x03,0x01,0x02,0x01,0x01,0x01 }, 14, CODEC_ID_PCM_S16LE }, /* D-10 Mapping 50Mbps PAL Extended Template */
  602. { { 0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00 }, 0, CODEC_ID_NONE },
  603. };
  604. static int mxf_parse_structural_metadata(MXFContext *mxf)
  605. {
  606. MXFPackage *material_package = NULL;
  607. MXFPackage *temp_package = NULL;
  608. int i, j, k;
  609. dprintf(mxf->fc, "metadata sets count %d\n", mxf->metadata_sets_count);
  610. /* TODO: handle multiple material packages (OP3x) */
  611. for (i = 0; i < mxf->packages_count; i++) {
  612. material_package = mxf_resolve_strong_ref(mxf, &mxf->packages_refs[i], MaterialPackage);
  613. if (material_package) break;
  614. }
  615. if (!material_package) {
  616. av_log(mxf->fc, AV_LOG_ERROR, "no material package found\n");
  617. return -1;
  618. }
  619. for (i = 0; i < material_package->tracks_count; i++) {
  620. MXFPackage *source_package = NULL;
  621. MXFTrack *material_track = NULL;
  622. MXFTrack *source_track = NULL;
  623. MXFTrack *temp_track = NULL;
  624. MXFDescriptor *descriptor = NULL;
  625. MXFStructuralComponent *component = NULL;
  626. UID *essence_container_ul = NULL;
  627. const MXFCodecUL *codec_ul = NULL;
  628. const MXFCodecUL *container_ul = NULL;
  629. AVStream *st;
  630. if (!(material_track = mxf_resolve_strong_ref(mxf, &material_package->tracks_refs[i], Track))) {
  631. av_log(mxf->fc, AV_LOG_ERROR, "could not resolve material track strong ref\n");
  632. continue;
  633. }
  634. if (!(material_track->sequence = mxf_resolve_strong_ref(mxf, &material_track->sequence_ref, Sequence))) {
  635. av_log(mxf->fc, AV_LOG_ERROR, "could not resolve material track sequence strong ref\n");
  636. continue;
  637. }
  638. /* TODO: handle multiple source clips */
  639. for (j = 0; j < material_track->sequence->structural_components_count; j++) {
  640. /* TODO: handle timecode component */
  641. component = mxf_resolve_strong_ref(mxf, &material_track->sequence->structural_components_refs[j], SourceClip);
  642. if (!component)
  643. continue;
  644. for (k = 0; k < mxf->packages_count; k++) {
  645. temp_package = mxf_resolve_strong_ref(mxf, &mxf->packages_refs[k], SourcePackage);
  646. if (!temp_package)
  647. continue;
  648. if (!memcmp(temp_package->package_uid, component->source_package_uid, 16)) {
  649. source_package = temp_package;
  650. break;
  651. }
  652. }
  653. if (!source_package) {
  654. av_log(mxf->fc, AV_LOG_ERROR, "material track %d: no corresponding source package found\n", material_track->track_id);
  655. break;
  656. }
  657. for (k = 0; k < source_package->tracks_count; k++) {
  658. if (!(temp_track = mxf_resolve_strong_ref(mxf, &source_package->tracks_refs[k], Track))) {
  659. av_log(mxf->fc, AV_LOG_ERROR, "could not resolve source track strong ref\n");
  660. return -1;
  661. }
  662. if (temp_track->track_id == component->source_track_id) {
  663. source_track = temp_track;
  664. break;
  665. }
  666. }
  667. if (!source_track) {
  668. av_log(mxf->fc, AV_LOG_ERROR, "material track %d: no corresponding source track found\n", material_track->track_id);
  669. break;
  670. }
  671. }
  672. if (!source_track)
  673. continue;
  674. st = av_new_stream(mxf->fc, source_track->track_id);
  675. if (!st) {
  676. av_log(mxf->fc, AV_LOG_ERROR, "could not allocate stream\n");
  677. return -1;
  678. }
  679. st->priv_data = source_track;
  680. st->duration = component->duration;
  681. if (st->duration == -1)
  682. st->duration = AV_NOPTS_VALUE;
  683. st->start_time = component->start_position;
  684. av_set_pts_info(st, 64, material_track->edit_rate.num, material_track->edit_rate.den);
  685. if (!(source_track->sequence = mxf_resolve_strong_ref(mxf, &source_track->sequence_ref, Sequence))) {
  686. av_log(mxf->fc, AV_LOG_ERROR, "could not resolve source track sequence strong ref\n");
  687. return -1;
  688. }
  689. PRINT_KEY(mxf->fc, "data definition ul", source_track->sequence->data_definition_ul);
  690. codec_ul = mxf_get_codec_ul(ff_mxf_data_definition_uls, &source_track->sequence->data_definition_ul);
  691. st->codec->codec_type = codec_ul->id;
  692. source_package->descriptor = mxf_resolve_strong_ref(mxf, &source_package->descriptor_ref, AnyType);
  693. if (source_package->descriptor) {
  694. if (source_package->descriptor->type == MultipleDescriptor) {
  695. for (j = 0; j < source_package->descriptor->sub_descriptors_count; j++) {
  696. MXFDescriptor *sub_descriptor = mxf_resolve_strong_ref(mxf, &source_package->descriptor->sub_descriptors_refs[j], Descriptor);
  697. if (!sub_descriptor) {
  698. av_log(mxf->fc, AV_LOG_ERROR, "could not resolve sub descriptor strong ref\n");
  699. continue;
  700. }
  701. if (sub_descriptor->linked_track_id == source_track->track_id) {
  702. descriptor = sub_descriptor;
  703. break;
  704. }
  705. }
  706. } else if (source_package->descriptor->type == Descriptor)
  707. descriptor = source_package->descriptor;
  708. }
  709. if (!descriptor) {
  710. av_log(mxf->fc, AV_LOG_INFO, "source track %d: stream %d, no descriptor found\n", source_track->track_id, st->index);
  711. continue;
  712. }
  713. PRINT_KEY(mxf->fc, "essence codec ul", descriptor->essence_codec_ul);
  714. PRINT_KEY(mxf->fc, "essence container ul", descriptor->essence_container_ul);
  715. essence_container_ul = &descriptor->essence_container_ul;
  716. /* HACK: replacing the original key with mxf_encrypted_essence_container
  717. * is not allowed according to s429-6, try to find correct information anyway */
  718. if (IS_KLV_KEY(essence_container_ul, mxf_encrypted_essence_container)) {
  719. av_log(mxf->fc, AV_LOG_INFO, "broken encrypted mxf file\n");
  720. for (k = 0; k < mxf->metadata_sets_count; k++) {
  721. MXFMetadataSet *metadata = mxf->metadata_sets[k];
  722. if (metadata->type == CryptoContext) {
  723. essence_container_ul = &((MXFCryptoContext *)metadata)->source_container_ul;
  724. break;
  725. }
  726. }
  727. }
  728. /* TODO: drop PictureEssenceCoding and SoundEssenceCompression, only check EssenceContainer */
  729. codec_ul = mxf_get_codec_ul(ff_mxf_codec_uls, &descriptor->essence_codec_ul);
  730. st->codec->codec_id = codec_ul->id;
  731. if (descriptor->extradata) {
  732. st->codec->extradata = descriptor->extradata;
  733. st->codec->extradata_size = descriptor->extradata_size;
  734. }
  735. if (st->codec->codec_type == AVMEDIA_TYPE_VIDEO) {
  736. container_ul = mxf_get_codec_ul(mxf_essence_container_uls, essence_container_ul);
  737. if (st->codec->codec_id == CODEC_ID_NONE)
  738. st->codec->codec_id = container_ul->id;
  739. st->codec->width = descriptor->width;
  740. st->codec->height = descriptor->height;
  741. if (st->codec->codec_id == CODEC_ID_RAWVIDEO)
  742. st->codec->pix_fmt = descriptor->pix_fmt;
  743. st->need_parsing = AVSTREAM_PARSE_HEADERS;
  744. } else if (st->codec->codec_type == AVMEDIA_TYPE_AUDIO) {
  745. container_ul = mxf_get_codec_ul(mxf_essence_container_uls, essence_container_ul);
  746. if (st->codec->codec_id == CODEC_ID_NONE)
  747. st->codec->codec_id = container_ul->id;
  748. st->codec->channels = descriptor->channels;
  749. st->codec->bits_per_coded_sample = descriptor->bits_per_sample;
  750. st->codec->sample_rate = descriptor->sample_rate.num / descriptor->sample_rate.den;
  751. /* TODO: implement CODEC_ID_RAWAUDIO */
  752. if (st->codec->codec_id == CODEC_ID_PCM_S16LE) {
  753. if (descriptor->bits_per_sample == 24)
  754. st->codec->codec_id = CODEC_ID_PCM_S24LE;
  755. else if (descriptor->bits_per_sample == 32)
  756. st->codec->codec_id = CODEC_ID_PCM_S32LE;
  757. } else if (st->codec->codec_id == CODEC_ID_PCM_S16BE) {
  758. if (descriptor->bits_per_sample == 24)
  759. st->codec->codec_id = CODEC_ID_PCM_S24BE;
  760. else if (descriptor->bits_per_sample == 32)
  761. st->codec->codec_id = CODEC_ID_PCM_S32BE;
  762. } else if (st->codec->codec_id == CODEC_ID_MP2) {
  763. st->need_parsing = AVSTREAM_PARSE_FULL;
  764. }
  765. }
  766. if (st->codec->codec_type != AVMEDIA_TYPE_DATA && (*essence_container_ul)[15] > 0x01) {
  767. av_log(mxf->fc, AV_LOG_WARNING, "only frame wrapped mappings are correctly supported\n");
  768. st->need_parsing = AVSTREAM_PARSE_FULL;
  769. }
  770. }
  771. return 0;
  772. }
  773. static const MXFMetadataReadTableEntry mxf_metadata_read_table[] = {
  774. { { 0x06,0x0E,0x2B,0x34,0x02,0x05,0x01,0x01,0x0d,0x01,0x02,0x01,0x01,0x05,0x01,0x00 }, mxf_read_primer_pack },
  775. { { 0x06,0x0E,0x2B,0x34,0x02,0x53,0x01,0x01,0x0d,0x01,0x01,0x01,0x01,0x01,0x18,0x00 }, mxf_read_content_storage, 0, AnyType },
  776. { { 0x06,0x0E,0x2B,0x34,0x02,0x53,0x01,0x01,0x0d,0x01,0x01,0x01,0x01,0x01,0x37,0x00 }, mxf_read_source_package, sizeof(MXFPackage), SourcePackage },
  777. { { 0x06,0x0E,0x2B,0x34,0x02,0x53,0x01,0x01,0x0d,0x01,0x01,0x01,0x01,0x01,0x36,0x00 }, mxf_read_material_package, sizeof(MXFPackage), MaterialPackage },
  778. { { 0x06,0x0E,0x2B,0x34,0x02,0x53,0x01,0x01,0x0d,0x01,0x01,0x01,0x01,0x01,0x0F,0x00 }, mxf_read_sequence, sizeof(MXFSequence), Sequence },
  779. { { 0x06,0x0E,0x2B,0x34,0x02,0x53,0x01,0x01,0x0d,0x01,0x01,0x01,0x01,0x01,0x11,0x00 }, mxf_read_source_clip, sizeof(MXFStructuralComponent), SourceClip },
  780. { { 0x06,0x0E,0x2B,0x34,0x02,0x53,0x01,0x01,0x0d,0x01,0x01,0x01,0x01,0x01,0x44,0x00 }, mxf_read_generic_descriptor, sizeof(MXFDescriptor), MultipleDescriptor },
  781. { { 0x06,0x0E,0x2B,0x34,0x02,0x53,0x01,0x01,0x0d,0x01,0x01,0x01,0x01,0x01,0x42,0x00 }, mxf_read_generic_descriptor, sizeof(MXFDescriptor), Descriptor }, /* Generic Sound */
  782. { { 0x06,0x0E,0x2B,0x34,0x02,0x53,0x01,0x01,0x0d,0x01,0x01,0x01,0x01,0x01,0x28,0x00 }, mxf_read_generic_descriptor, sizeof(MXFDescriptor), Descriptor }, /* CDCI */
  783. { { 0x06,0x0E,0x2B,0x34,0x02,0x53,0x01,0x01,0x0d,0x01,0x01,0x01,0x01,0x01,0x29,0x00 }, mxf_read_generic_descriptor, sizeof(MXFDescriptor), Descriptor }, /* RGBA */
  784. { { 0x06,0x0E,0x2B,0x34,0x02,0x53,0x01,0x01,0x0d,0x01,0x01,0x01,0x01,0x01,0x51,0x00 }, mxf_read_generic_descriptor, sizeof(MXFDescriptor), Descriptor }, /* MPEG 2 Video */
  785. { { 0x06,0x0E,0x2B,0x34,0x02,0x53,0x01,0x01,0x0d,0x01,0x01,0x01,0x01,0x01,0x48,0x00 }, mxf_read_generic_descriptor, sizeof(MXFDescriptor), Descriptor }, /* Wave */
  786. { { 0x06,0x0E,0x2B,0x34,0x02,0x53,0x01,0x01,0x0d,0x01,0x01,0x01,0x01,0x01,0x47,0x00 }, mxf_read_generic_descriptor, sizeof(MXFDescriptor), Descriptor }, /* AES3 */
  787. { { 0x06,0x0E,0x2B,0x34,0x02,0x53,0x01,0x01,0x0d,0x01,0x01,0x01,0x01,0x01,0x3A,0x00 }, mxf_read_track, sizeof(MXFTrack), Track }, /* Static Track */
  788. { { 0x06,0x0E,0x2B,0x34,0x02,0x53,0x01,0x01,0x0d,0x01,0x01,0x01,0x01,0x01,0x3B,0x00 }, mxf_read_track, sizeof(MXFTrack), Track }, /* Generic Track */
  789. { { 0x06,0x0E,0x2B,0x34,0x02,0x53,0x01,0x01,0x0d,0x01,0x04,0x01,0x02,0x02,0x00,0x00 }, mxf_read_cryptographic_context, sizeof(MXFCryptoContext), CryptoContext },
  790. { { 0x06,0x0E,0x2B,0x34,0x02,0x53,0x01,0x01,0x0d,0x01,0x02,0x01,0x01,0x10,0x01,0x00 }, mxf_read_index_table_segment, sizeof(MXFIndexTableSegment), IndexTableSegment },
  791. { { 0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00 }, NULL, 0, AnyType },
  792. };
  793. static int mxf_read_local_tags(MXFContext *mxf, KLVPacket *klv, int (*read_child)(), int ctx_size, enum MXFMetadataSetType type)
  794. {
  795. ByteIOContext *pb = mxf->fc->pb;
  796. MXFMetadataSet *ctx = ctx_size ? av_mallocz(ctx_size) : mxf;
  797. uint64_t klv_end = url_ftell(pb) + klv->length;
  798. if (!ctx)
  799. return -1;
  800. while (url_ftell(pb) + 4 < klv_end) {
  801. int tag = get_be16(pb);
  802. int size = get_be16(pb); /* KLV specified by 0x53 */
  803. uint64_t next = url_ftell(pb) + size;
  804. UID uid = {0};
  805. dprintf(mxf->fc, "local tag %#04x size %d\n", tag, size);
  806. if (!size) { /* ignore empty tag, needed for some files with empty UMID tag */
  807. av_log(mxf->fc, AV_LOG_ERROR, "local tag %#04x with 0 size\n", tag);
  808. continue;
  809. }
  810. if (tag > 0x7FFF) { /* dynamic tag */
  811. int i;
  812. for (i = 0; i < mxf->local_tags_count; i++) {
  813. int local_tag = AV_RB16(mxf->local_tags+i*18);
  814. if (local_tag == tag) {
  815. memcpy(uid, mxf->local_tags+i*18+2, 16);
  816. dprintf(mxf->fc, "local tag %#04x\n", local_tag);
  817. PRINT_KEY(mxf->fc, "uid", uid);
  818. }
  819. }
  820. }
  821. if (ctx_size && tag == 0x3C0A)
  822. get_buffer(pb, ctx->uid, 16);
  823. else if (read_child(ctx, pb, tag, size, uid) < 0)
  824. return -1;
  825. url_fseek(pb, next, SEEK_SET);
  826. }
  827. if (ctx_size) ctx->type = type;
  828. return ctx_size ? mxf_add_metadata_set(mxf, ctx) : 0;
  829. }
  830. static int mxf_read_header(AVFormatContext *s, AVFormatParameters *ap)
  831. {
  832. MXFContext *mxf = s->priv_data;
  833. KLVPacket klv;
  834. if (!mxf_read_sync(s->pb, mxf_header_partition_pack_key, 14)) {
  835. av_log(s, AV_LOG_ERROR, "could not find header partition pack key\n");
  836. return -1;
  837. }
  838. url_fseek(s->pb, -14, SEEK_CUR);
  839. mxf->fc = s;
  840. while (!url_feof(s->pb)) {
  841. const MXFMetadataReadTableEntry *metadata;
  842. if (klv_read_packet(&klv, s->pb) < 0)
  843. return -1;
  844. PRINT_KEY(s, "read header", klv.key);
  845. dprintf(s, "size %lld offset %#llx\n", klv.length, klv.offset);
  846. if (IS_KLV_KEY(klv.key, mxf_encrypted_triplet_key) ||
  847. IS_KLV_KEY(klv.key, mxf_essence_element_key)) {
  848. /* FIXME avoid seek */
  849. url_fseek(s->pb, klv.offset, SEEK_SET);
  850. break;
  851. }
  852. for (metadata = mxf_metadata_read_table; metadata->read; metadata++) {
  853. if (IS_KLV_KEY(klv.key, metadata->key)) {
  854. int (*read)() = klv.key[5] == 0x53 ? mxf_read_local_tags : metadata->read;
  855. if (read(mxf, &klv, metadata->read, metadata->ctx_size, metadata->type) < 0) {
  856. av_log(s, AV_LOG_ERROR, "error reading header metadata\n");
  857. return -1;
  858. }
  859. break;
  860. }
  861. }
  862. if (!metadata->read)
  863. url_fskip(s->pb, klv.length);
  864. }
  865. return mxf_parse_structural_metadata(mxf);
  866. }
  867. static int mxf_read_close(AVFormatContext *s)
  868. {
  869. MXFContext *mxf = s->priv_data;
  870. int i;
  871. av_freep(&mxf->packages_refs);
  872. for (i = 0; i < s->nb_streams; i++)
  873. s->streams[i]->priv_data = NULL;
  874. for (i = 0; i < mxf->metadata_sets_count; i++) {
  875. switch (mxf->metadata_sets[i]->type) {
  876. case MultipleDescriptor:
  877. av_freep(&((MXFDescriptor *)mxf->metadata_sets[i])->sub_descriptors_refs);
  878. break;
  879. case Sequence:
  880. av_freep(&((MXFSequence *)mxf->metadata_sets[i])->structural_components_refs);
  881. break;
  882. case SourcePackage:
  883. case MaterialPackage:
  884. av_freep(&((MXFPackage *)mxf->metadata_sets[i])->tracks_refs);
  885. break;
  886. default:
  887. break;
  888. }
  889. av_freep(&mxf->metadata_sets[i]);
  890. }
  891. av_freep(&mxf->metadata_sets);
  892. av_freep(&mxf->aesc);
  893. av_freep(&mxf->local_tags);
  894. return 0;
  895. }
  896. static int mxf_probe(AVProbeData *p) {
  897. uint8_t *bufp = p->buf;
  898. uint8_t *end = p->buf + p->buf_size;
  899. if (p->buf_size < sizeof(mxf_header_partition_pack_key))
  900. return 0;
  901. /* Must skip Run-In Sequence and search for MXF header partition pack key SMPTE 377M 5.5 */
  902. end -= sizeof(mxf_header_partition_pack_key);
  903. for (; bufp < end; bufp++) {
  904. if (IS_KLV_KEY(bufp, mxf_header_partition_pack_key))
  905. return AVPROBE_SCORE_MAX;
  906. }
  907. return 0;
  908. }
  909. /* rudimentary byte seek */
  910. /* XXX: use MXF Index */
  911. static int mxf_read_seek(AVFormatContext *s, int stream_index, int64_t sample_time, int flags)
  912. {
  913. AVStream *st = s->streams[stream_index];
  914. int64_t seconds;
  915. if (!s->bit_rate)
  916. return -1;
  917. if (sample_time < 0)
  918. sample_time = 0;
  919. seconds = av_rescale(sample_time, st->time_base.num, st->time_base.den);
  920. url_fseek(s->pb, (s->bit_rate * seconds) >> 3, SEEK_SET);
  921. av_update_cur_dts(s, st, sample_time);
  922. return 0;
  923. }
  924. AVInputFormat mxf_demuxer = {
  925. "mxf",
  926. NULL_IF_CONFIG_SMALL("Material eXchange Format"),
  927. sizeof(MXFContext),
  928. mxf_probe,
  929. mxf_read_header,
  930. mxf_read_packet,
  931. mxf_read_close,
  932. mxf_read_seek,
  933. };