You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

997 lines
36KB

  1. /*
  2. * MXF demuxer.
  3. * Copyright (c) 2006 SmartJog S.A., Baptiste Coudurier <baptiste dot coudurier at smartjog dot com>.
  4. *
  5. * This file is part of FFmpeg.
  6. *
  7. * FFmpeg is free software; you can redistribute it and/or
  8. * modify it under the terms of the GNU Lesser General Public
  9. * License as published by the Free Software Foundation; either
  10. * version 2.1 of the License, or (at your option) any later version.
  11. *
  12. * FFmpeg is distributed in the hope that it will be useful,
  13. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  15. * Lesser General Public License for more details.
  16. *
  17. * You should have received a copy of the GNU Lesser General Public
  18. * License along with FFmpeg; if not, write to the Free Software
  19. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  20. */
  21. /*
  22. * References
  23. * SMPTE 336M KLV Data Encoding Protocol Using Key-Length-Value
  24. * SMPTE 377M MXF File Format Specifications
  25. * SMPTE 378M Operational Pattern 1a
  26. * SMPTE 379M MXF Generic Container
  27. * SMPTE 381M Mapping MPEG Streams into the MXF Generic Container
  28. * SMPTE 382M Mapping AES3 and Broadcast Wave Audio into the MXF Generic Container
  29. * SMPTE 383M Mapping DV-DIF Data to the MXF Generic Container
  30. *
  31. * Principle
  32. * Search for Track numbers, which identify essence element KLV packets.
  33. * Search for SourcePackages, which define the tracks that contain Track numbers.
  34. * The Material Package contains tracks that reference SourcePackage tracks.
  35. * Search for Descriptors (Picture, Sound), which contain codec info and parameters.
  36. * Assign Descriptors to correct Tracks.
  37. *
  38. * Metadata reading functions read Local Tags, get InstanceUID(0x3C0A) then add MetaDataSet to MXFContext.
  39. * Metadata parsing resolves Strong References to objects.
  40. *
  41. * Simple demuxer, only OP1A supported and some files might not work at all.
  42. * Only tracks with associated descriptors will be decoded. "Highly Desirable" SMPTE 377M D.1
  43. */
  44. //#define DEBUG
  45. #include "libavutil/aes.h"
  46. #include "mxf.h"
  47. typedef struct {
  48. UID uid;
  49. enum MXFMetadataSetType type;
  50. UID source_container_ul;
  51. } MXFCryptoContext;
  52. typedef struct {
  53. UID uid;
  54. enum MXFMetadataSetType type;
  55. UID source_package_uid;
  56. UID data_definition_ul;
  57. int64_t duration;
  58. int64_t start_position;
  59. int source_track_id;
  60. } MXFStructuralComponent;
  61. typedef struct {
  62. UID uid;
  63. enum MXFMetadataSetType type;
  64. UID data_definition_ul;
  65. UID *structural_components_refs;
  66. int structural_components_count;
  67. int64_t duration;
  68. } MXFSequence;
  69. typedef struct {
  70. UID uid;
  71. enum MXFMetadataSetType type;
  72. MXFSequence *sequence; /* mandatory, and only one */
  73. UID sequence_ref;
  74. int track_id;
  75. uint8_t track_number[4];
  76. AVRational edit_rate;
  77. } MXFTrack;
  78. typedef struct {
  79. UID uid;
  80. enum MXFMetadataSetType type;
  81. UID essence_container_ul;
  82. UID essence_codec_ul;
  83. AVRational sample_rate;
  84. AVRational aspect_ratio;
  85. int width;
  86. int height;
  87. int channels;
  88. int bits_per_sample;
  89. UID *sub_descriptors_refs;
  90. int sub_descriptors_count;
  91. int linked_track_id;
  92. uint8_t *extradata;
  93. int extradata_size;
  94. } MXFDescriptor;
  95. typedef struct {
  96. UID uid;
  97. enum MXFMetadataSetType type;
  98. UID package_uid;
  99. UID *tracks_refs;
  100. int tracks_count;
  101. MXFDescriptor *descriptor; /* only one */
  102. UID descriptor_ref;
  103. } MXFPackage;
  104. typedef struct {
  105. UID uid;
  106. enum MXFMetadataSetType type;
  107. } MXFMetadataSet;
  108. typedef struct {
  109. UID *packages_refs;
  110. int packages_count;
  111. MXFMetadataSet **metadata_sets;
  112. int metadata_sets_count;
  113. AVFormatContext *fc;
  114. struct AVAES *aesc;
  115. uint8_t *local_tags;
  116. int local_tags_count;
  117. } MXFContext;
  118. enum MXFWrappingScheme {
  119. Frame,
  120. Clip,
  121. };
  122. typedef struct {
  123. const UID key;
  124. int (*read)();
  125. int ctx_size;
  126. enum MXFMetadataSetType type;
  127. } MXFMetadataReadTableEntry;
  128. /* partial keys to match */
  129. static const uint8_t mxf_header_partition_pack_key[] = { 0x06,0x0e,0x2b,0x34,0x02,0x05,0x01,0x01,0x0d,0x01,0x02,0x01,0x01,0x02 };
  130. static const uint8_t mxf_essence_element_key[] = { 0x06,0x0e,0x2b,0x34,0x01,0x02,0x01,0x01,0x0d,0x01,0x03,0x01 };
  131. static const uint8_t mxf_klv_key[] = { 0x06,0x0e,0x2b,0x34 };
  132. /* complete keys to match */
  133. static const uint8_t mxf_crypto_source_container_ul[] = { 0x06,0x0e,0x2b,0x34,0x01,0x01,0x01,0x09,0x06,0x01,0x01,0x02,0x02,0x00,0x00,0x00 };
  134. static const uint8_t mxf_encrypted_triplet_key[] = { 0x06,0x0e,0x2b,0x34,0x02,0x04,0x01,0x07,0x0d,0x01,0x03,0x01,0x02,0x7e,0x01,0x00 };
  135. static const uint8_t mxf_encrypted_essence_container[] = { 0x06,0x0e,0x2b,0x34,0x04,0x01,0x01,0x07,0x0d,0x01,0x03,0x01,0x02,0x0b,0x01,0x00 };
  136. static const uint8_t mxf_sony_mpeg4_extradata[] = { 0x06,0x0e,0x2b,0x34,0x04,0x01,0x01,0x01,0x0e,0x06,0x06,0x02,0x02,0x01,0x00,0x00 };
  137. #define IS_KLV_KEY(x, y) (!memcmp(x, y, sizeof(y)))
  138. static int64_t klv_decode_ber_length(ByteIOContext *pb)
  139. {
  140. uint64_t size = get_byte(pb);
  141. if (size & 0x80) { /* long form */
  142. int bytes_num = size & 0x7f;
  143. /* SMPTE 379M 5.3.4 guarantee that bytes_num must not exceed 8 bytes */
  144. if (bytes_num > 8)
  145. return -1;
  146. size = 0;
  147. while (bytes_num--)
  148. size = size << 8 | get_byte(pb);
  149. }
  150. return size;
  151. }
  152. static int mxf_read_sync(ByteIOContext *pb, const uint8_t *key, unsigned size)
  153. {
  154. int i, b;
  155. for (i = 0; i < size && !url_feof(pb); i++) {
  156. b = get_byte(pb);
  157. if (b == key[0])
  158. i = 0;
  159. else if (b != key[i])
  160. i = -1;
  161. }
  162. return i == size;
  163. }
  164. static int klv_read_packet(KLVPacket *klv, ByteIOContext *pb)
  165. {
  166. if (!mxf_read_sync(pb, mxf_klv_key, 4))
  167. return -1;
  168. klv->offset = url_ftell(pb) - 4;
  169. memcpy(klv->key, mxf_klv_key, 4);
  170. get_buffer(pb, klv->key + 4, 12);
  171. klv->length = klv_decode_ber_length(pb);
  172. return klv->length == -1 ? -1 : 0;
  173. }
  174. static int mxf_get_stream_index(AVFormatContext *s, KLVPacket *klv)
  175. {
  176. int i;
  177. for (i = 0; i < s->nb_streams; i++) {
  178. MXFTrack *track = s->streams[i]->priv_data;
  179. /* SMPTE 379M 7.3 */
  180. if (!memcmp(klv->key + sizeof(mxf_essence_element_key), track->track_number, sizeof(track->track_number)))
  181. return i;
  182. }
  183. /* return 0 if only one stream, for OP Atom files with 0 as track number */
  184. return s->nb_streams == 1 ? 0 : -1;
  185. }
  186. /* XXX: use AVBitStreamFilter */
  187. static int mxf_get_d10_aes3_packet(ByteIOContext *pb, AVStream *st, AVPacket *pkt, int64_t length)
  188. {
  189. uint8_t buffer[61444];
  190. const uint8_t *buf_ptr, *end_ptr;
  191. uint8_t *data_ptr;
  192. int i;
  193. if (length > 61444) /* worst case PAL 1920 samples 8 channels */
  194. return -1;
  195. get_buffer(pb, buffer, length);
  196. av_new_packet(pkt, length);
  197. data_ptr = pkt->data;
  198. end_ptr = buffer + length;
  199. buf_ptr = buffer + 4; /* skip SMPTE 331M header */
  200. for (; buf_ptr < end_ptr; ) {
  201. for (i = 0; i < st->codec->channels; i++) {
  202. uint32_t sample = bytestream_get_le32(&buf_ptr);
  203. if (st->codec->bits_per_sample == 24)
  204. bytestream_put_le24(&data_ptr, (sample >> 4) & 0xffffff);
  205. else
  206. bytestream_put_le16(&data_ptr, (sample >> 12) & 0xffff);
  207. }
  208. buf_ptr += 32 - st->codec->channels*4; // always 8 channels stored SMPTE 331M
  209. }
  210. pkt->size = data_ptr - pkt->data;
  211. return 0;
  212. }
  213. static int mxf_decrypt_triplet(AVFormatContext *s, AVPacket *pkt, KLVPacket *klv)
  214. {
  215. static const uint8_t checkv[16] = {0x43, 0x48, 0x55, 0x4b, 0x43, 0x48, 0x55, 0x4b, 0x43, 0x48, 0x55, 0x4b, 0x43, 0x48, 0x55, 0x4b};
  216. MXFContext *mxf = s->priv_data;
  217. ByteIOContext *pb = s->pb;
  218. offset_t end = url_ftell(pb) + klv->length;
  219. uint64_t size;
  220. uint64_t orig_size;
  221. uint64_t plaintext_size;
  222. uint8_t ivec[16];
  223. uint8_t tmpbuf[16];
  224. int index;
  225. if (!mxf->aesc && s->key && s->keylen == 16) {
  226. mxf->aesc = av_malloc(av_aes_size);
  227. if (!mxf->aesc)
  228. return -1;
  229. av_aes_init(mxf->aesc, s->key, 128, 1);
  230. }
  231. // crypto context
  232. url_fskip(pb, klv_decode_ber_length(pb));
  233. // plaintext offset
  234. klv_decode_ber_length(pb);
  235. plaintext_size = get_be64(pb);
  236. // source klv key
  237. klv_decode_ber_length(pb);
  238. get_buffer(pb, klv->key, 16);
  239. if (!IS_KLV_KEY(klv, mxf_essence_element_key))
  240. return -1;
  241. index = mxf_get_stream_index(s, klv);
  242. if (index < 0)
  243. return -1;
  244. // source size
  245. klv_decode_ber_length(pb);
  246. orig_size = get_be64(pb);
  247. if (orig_size < plaintext_size)
  248. return -1;
  249. // enc. code
  250. size = klv_decode_ber_length(pb);
  251. if (size < 32 || size - 32 < orig_size)
  252. return -1;
  253. get_buffer(pb, ivec, 16);
  254. get_buffer(pb, tmpbuf, 16);
  255. if (mxf->aesc)
  256. av_aes_crypt(mxf->aesc, tmpbuf, tmpbuf, 1, ivec, 1);
  257. if (memcmp(tmpbuf, checkv, 16))
  258. av_log(s, AV_LOG_ERROR, "probably incorrect decryption key\n");
  259. size -= 32;
  260. av_get_packet(pb, pkt, size);
  261. size -= plaintext_size;
  262. if (mxf->aesc)
  263. av_aes_crypt(mxf->aesc, &pkt->data[plaintext_size],
  264. &pkt->data[plaintext_size], size >> 4, ivec, 1);
  265. pkt->size = orig_size;
  266. pkt->stream_index = index;
  267. url_fskip(pb, end - url_ftell(pb));
  268. return 0;
  269. }
  270. static int mxf_read_packet(AVFormatContext *s, AVPacket *pkt)
  271. {
  272. KLVPacket klv;
  273. while (!url_feof(s->pb)) {
  274. if (klv_read_packet(&klv, s->pb) < 0)
  275. return -1;
  276. #ifdef DEBUG
  277. PRINT_KEY(s, "read packet", klv.key);
  278. #endif
  279. if (IS_KLV_KEY(klv.key, mxf_encrypted_triplet_key)) {
  280. int res = mxf_decrypt_triplet(s, pkt, &klv);
  281. if (res < 0) {
  282. av_log(s, AV_LOG_ERROR, "invalid encoded triplet\n");
  283. return -1;
  284. }
  285. return 0;
  286. }
  287. if (IS_KLV_KEY(klv.key, mxf_essence_element_key)) {
  288. int index = mxf_get_stream_index(s, &klv);
  289. if (index < 0) {
  290. av_log(s, AV_LOG_ERROR, "error getting stream index %x\n", AV_RB32(klv.key+12));
  291. goto skip;
  292. }
  293. if (s->streams[index]->discard == AVDISCARD_ALL)
  294. goto skip;
  295. /* check for 8 channels AES3 element */
  296. if (klv.key[12] == 0x06 && klv.key[13] == 0x01 && klv.key[14] == 0x10) {
  297. if (mxf_get_d10_aes3_packet(s->pb, s->streams[index], pkt, klv.length) < 0) {
  298. av_log(s, AV_LOG_ERROR, "error reading D-10 aes3 frame\n");
  299. return -1;
  300. }
  301. } else
  302. av_get_packet(s->pb, pkt, klv.length);
  303. pkt->stream_index = index;
  304. pkt->pos = klv.offset;
  305. return 0;
  306. } else
  307. skip:
  308. url_fskip(s->pb, klv.length);
  309. }
  310. return AVERROR(EIO);
  311. }
  312. static int mxf_read_primer_pack(MXFContext *mxf)
  313. {
  314. ByteIOContext *pb = mxf->fc->pb;
  315. int item_num = get_be32(pb);
  316. int item_len = get_be32(pb);
  317. if (item_len != 18) {
  318. av_log(mxf->fc, AV_LOG_ERROR, "unsupported primer pack item length\n");
  319. return -1;
  320. }
  321. if (item_num > UINT_MAX / item_len)
  322. return -1;
  323. mxf->local_tags_count = item_num;
  324. mxf->local_tags = av_malloc(item_num*item_len);
  325. if (!mxf->local_tags)
  326. return -1;
  327. get_buffer(pb, mxf->local_tags, item_num*item_len);
  328. return 0;
  329. }
  330. static int mxf_add_metadata_set(MXFContext *mxf, void *metadata_set)
  331. {
  332. mxf->metadata_sets = av_realloc(mxf->metadata_sets, (mxf->metadata_sets_count + 1) * sizeof(*mxf->metadata_sets));
  333. if (!mxf->metadata_sets)
  334. return -1;
  335. mxf->metadata_sets[mxf->metadata_sets_count] = metadata_set;
  336. mxf->metadata_sets_count++;
  337. return 0;
  338. }
  339. static int mxf_read_cryptographic_context(MXFCryptoContext *cryptocontext, ByteIOContext *pb, int tag, int size, UID uid)
  340. {
  341. if (size != 16)
  342. return -1;
  343. if (IS_KLV_KEY(uid, mxf_crypto_source_container_ul))
  344. get_buffer(pb, cryptocontext->source_container_ul, 16);
  345. return 0;
  346. }
  347. static int mxf_read_content_storage(MXFContext *mxf, ByteIOContext *pb, int tag)
  348. {
  349. switch (tag) {
  350. case 0x1901:
  351. mxf->packages_count = get_be32(pb);
  352. if (mxf->packages_count >= UINT_MAX / sizeof(UID))
  353. return -1;
  354. mxf->packages_refs = av_malloc(mxf->packages_count * sizeof(UID));
  355. if (!mxf->packages_refs)
  356. return -1;
  357. url_fskip(pb, 4); /* useless size of objects, always 16 according to specs */
  358. get_buffer(pb, (uint8_t *)mxf->packages_refs, mxf->packages_count * sizeof(UID));
  359. break;
  360. }
  361. return 0;
  362. }
  363. static int mxf_read_source_clip(MXFStructuralComponent *source_clip, ByteIOContext *pb, int tag)
  364. {
  365. switch(tag) {
  366. case 0x0202:
  367. source_clip->duration = get_be64(pb);
  368. break;
  369. case 0x1201:
  370. source_clip->start_position = get_be64(pb);
  371. break;
  372. case 0x1101:
  373. /* UMID, only get last 16 bytes */
  374. url_fskip(pb, 16);
  375. get_buffer(pb, source_clip->source_package_uid, 16);
  376. break;
  377. case 0x1102:
  378. source_clip->source_track_id = get_be32(pb);
  379. break;
  380. }
  381. return 0;
  382. }
  383. static int mxf_read_material_package(MXFPackage *package, ByteIOContext *pb, int tag)
  384. {
  385. switch(tag) {
  386. case 0x4403:
  387. package->tracks_count = get_be32(pb);
  388. if (package->tracks_count >= UINT_MAX / sizeof(UID))
  389. return -1;
  390. package->tracks_refs = av_malloc(package->tracks_count * sizeof(UID));
  391. if (!package->tracks_refs)
  392. return -1;
  393. url_fskip(pb, 4); /* useless size of objects, always 16 according to specs */
  394. get_buffer(pb, (uint8_t *)package->tracks_refs, package->tracks_count * sizeof(UID));
  395. break;
  396. }
  397. return 0;
  398. }
  399. static int mxf_read_track(MXFTrack *track, ByteIOContext *pb, int tag)
  400. {
  401. switch(tag) {
  402. case 0x4801:
  403. track->track_id = get_be32(pb);
  404. break;
  405. case 0x4804:
  406. get_buffer(pb, track->track_number, 4);
  407. break;
  408. case 0x4B01:
  409. track->edit_rate.den = get_be32(pb);
  410. track->edit_rate.num = get_be32(pb);
  411. break;
  412. case 0x4803:
  413. get_buffer(pb, track->sequence_ref, 16);
  414. break;
  415. }
  416. return 0;
  417. }
  418. static int mxf_read_sequence(MXFSequence *sequence, ByteIOContext *pb, int tag)
  419. {
  420. switch(tag) {
  421. case 0x0202:
  422. sequence->duration = get_be64(pb);
  423. break;
  424. case 0x0201:
  425. get_buffer(pb, sequence->data_definition_ul, 16);
  426. break;
  427. case 0x1001:
  428. sequence->structural_components_count = get_be32(pb);
  429. if (sequence->structural_components_count >= UINT_MAX / sizeof(UID))
  430. return -1;
  431. sequence->structural_components_refs = av_malloc(sequence->structural_components_count * sizeof(UID));
  432. if (!sequence->structural_components_refs)
  433. return -1;
  434. url_fskip(pb, 4); /* useless size of objects, always 16 according to specs */
  435. get_buffer(pb, (uint8_t *)sequence->structural_components_refs, sequence->structural_components_count * sizeof(UID));
  436. break;
  437. }
  438. return 0;
  439. }
  440. static int mxf_read_source_package(MXFPackage *package, ByteIOContext *pb, int tag)
  441. {
  442. switch(tag) {
  443. case 0x4403:
  444. package->tracks_count = get_be32(pb);
  445. if (package->tracks_count >= UINT_MAX / sizeof(UID))
  446. return -1;
  447. package->tracks_refs = av_malloc(package->tracks_count * sizeof(UID));
  448. if (!package->tracks_refs)
  449. return -1;
  450. url_fskip(pb, 4); /* useless size of objects, always 16 according to specs */
  451. get_buffer(pb, (uint8_t *)package->tracks_refs, package->tracks_count * sizeof(UID));
  452. break;
  453. case 0x4401:
  454. /* UMID, only get last 16 bytes */
  455. url_fskip(pb, 16);
  456. get_buffer(pb, package->package_uid, 16);
  457. break;
  458. case 0x4701:
  459. get_buffer(pb, package->descriptor_ref, 16);
  460. break;
  461. }
  462. return 0;
  463. }
  464. static void mxf_read_pixel_layout(ByteIOContext *pb, MXFDescriptor *descriptor)
  465. {
  466. int code;
  467. do {
  468. code = get_byte(pb);
  469. dprintf(NULL, "pixel layout: code 0x%x\n", code);
  470. switch (code) {
  471. case 0x52: /* R */
  472. descriptor->bits_per_sample += get_byte(pb);
  473. break;
  474. case 0x47: /* G */
  475. descriptor->bits_per_sample += get_byte(pb);
  476. break;
  477. case 0x42: /* B */
  478. descriptor->bits_per_sample += get_byte(pb);
  479. break;
  480. default:
  481. get_byte(pb);
  482. }
  483. } while (code != 0); /* SMPTE 377M E.2.46 */
  484. }
  485. static int mxf_read_generic_descriptor(MXFDescriptor *descriptor, ByteIOContext *pb, int tag, int size, UID uid)
  486. {
  487. switch(tag) {
  488. case 0x3F01:
  489. descriptor->sub_descriptors_count = get_be32(pb);
  490. if (descriptor->sub_descriptors_count >= UINT_MAX / sizeof(UID))
  491. return -1;
  492. descriptor->sub_descriptors_refs = av_malloc(descriptor->sub_descriptors_count * sizeof(UID));
  493. if (!descriptor->sub_descriptors_refs)
  494. return -1;
  495. url_fskip(pb, 4); /* useless size of objects, always 16 according to specs */
  496. get_buffer(pb, (uint8_t *)descriptor->sub_descriptors_refs, descriptor->sub_descriptors_count * sizeof(UID));
  497. break;
  498. case 0x3004:
  499. get_buffer(pb, descriptor->essence_container_ul, 16);
  500. break;
  501. case 0x3006:
  502. descriptor->linked_track_id = get_be32(pb);
  503. break;
  504. case 0x3201: /* PictureEssenceCoding */
  505. get_buffer(pb, descriptor->essence_codec_ul, 16);
  506. break;
  507. case 0x3203:
  508. descriptor->width = get_be32(pb);
  509. break;
  510. case 0x3202:
  511. descriptor->height = get_be32(pb);
  512. break;
  513. case 0x320E:
  514. descriptor->aspect_ratio.num = get_be32(pb);
  515. descriptor->aspect_ratio.den = get_be32(pb);
  516. break;
  517. case 0x3D03:
  518. descriptor->sample_rate.num = get_be32(pb);
  519. descriptor->sample_rate.den = get_be32(pb);
  520. break;
  521. case 0x3D06: /* SoundEssenceCompression */
  522. get_buffer(pb, descriptor->essence_codec_ul, 16);
  523. break;
  524. case 0x3D07:
  525. descriptor->channels = get_be32(pb);
  526. break;
  527. case 0x3D01:
  528. descriptor->bits_per_sample = get_be32(pb);
  529. break;
  530. case 0x3401:
  531. mxf_read_pixel_layout(pb, descriptor);
  532. break;
  533. default:
  534. /* Private uid used by SONY C0023S01.mxf */
  535. if (IS_KLV_KEY(uid, mxf_sony_mpeg4_extradata)) {
  536. descriptor->extradata = av_malloc(size);
  537. if (!descriptor->extradata)
  538. return -1;
  539. descriptor->extradata_size = size;
  540. get_buffer(pb, descriptor->extradata, size);
  541. }
  542. break;
  543. }
  544. return 0;
  545. }
  546. /*
  547. * Match an uid independently of the version byte and up to len common bytes
  548. * Returns: boolean
  549. */
  550. static int mxf_match_uid(const UID key, const UID uid, int len)
  551. {
  552. int i;
  553. for (i = 0; i < len; i++) {
  554. if (i != 7 && key[i] != uid[i])
  555. return 0;
  556. }
  557. return 1;
  558. }
  559. static const MXFCodecUL *mxf_get_codec_ul(const MXFCodecUL *uls, UID *uid)
  560. {
  561. while (uls->id != CODEC_ID_NONE) {
  562. if(mxf_match_uid(uls->uid, *uid, uls->matching_len))
  563. break;
  564. uls++;
  565. }
  566. return uls;
  567. }
  568. static enum CodecType mxf_get_codec_type(const MXFDataDefinitionUL *uls, UID *uid)
  569. {
  570. while (uls->type != CODEC_TYPE_DATA) {
  571. if(mxf_match_uid(uls->uid, *uid, 16))
  572. break;
  573. uls++;
  574. }
  575. return uls->type;
  576. }
  577. static void *mxf_resolve_strong_ref(MXFContext *mxf, UID *strong_ref, enum MXFMetadataSetType type)
  578. {
  579. int i;
  580. if (!strong_ref)
  581. return NULL;
  582. for (i = 0; i < mxf->metadata_sets_count; i++) {
  583. if (!memcmp(*strong_ref, mxf->metadata_sets[i]->uid, 16) &&
  584. (type == AnyType || mxf->metadata_sets[i]->type == type)) {
  585. return mxf->metadata_sets[i];
  586. }
  587. }
  588. return NULL;
  589. }
  590. static int mxf_parse_structural_metadata(MXFContext *mxf)
  591. {
  592. MXFPackage *material_package = NULL;
  593. MXFPackage *temp_package = NULL;
  594. int i, j, k;
  595. dprintf(mxf->fc, "metadata sets count %d\n", mxf->metadata_sets_count);
  596. /* TODO: handle multiple material packages (OP3x) */
  597. for (i = 0; i < mxf->packages_count; i++) {
  598. material_package = mxf_resolve_strong_ref(mxf, &mxf->packages_refs[i], MaterialPackage);
  599. if (material_package) break;
  600. }
  601. if (!material_package) {
  602. av_log(mxf->fc, AV_LOG_ERROR, "no material package found\n");
  603. return -1;
  604. }
  605. for (i = 0; i < material_package->tracks_count; i++) {
  606. MXFPackage *source_package = NULL;
  607. MXFTrack *material_track = NULL;
  608. MXFTrack *source_track = NULL;
  609. MXFTrack *temp_track = NULL;
  610. MXFDescriptor *descriptor = NULL;
  611. MXFStructuralComponent *component = NULL;
  612. UID *essence_container_ul = NULL;
  613. const MXFCodecUL *codec_ul = NULL;
  614. const MXFCodecUL *container_ul = NULL;
  615. AVStream *st;
  616. if (!(material_track = mxf_resolve_strong_ref(mxf, &material_package->tracks_refs[i], Track))) {
  617. av_log(mxf->fc, AV_LOG_ERROR, "could not resolve material track strong ref\n");
  618. continue;
  619. }
  620. if (!(material_track->sequence = mxf_resolve_strong_ref(mxf, &material_track->sequence_ref, Sequence))) {
  621. av_log(mxf->fc, AV_LOG_ERROR, "could not resolve material track sequence strong ref\n");
  622. return -1;
  623. }
  624. /* TODO: handle multiple source clips */
  625. for (j = 0; j < material_track->sequence->structural_components_count; j++) {
  626. /* TODO: handle timecode component */
  627. component = mxf_resolve_strong_ref(mxf, &material_track->sequence->structural_components_refs[j], SourceClip);
  628. if (!component)
  629. continue;
  630. for (k = 0; k < mxf->packages_count; k++) {
  631. temp_package = mxf_resolve_strong_ref(mxf, &mxf->packages_refs[k], SourcePackage);
  632. if (!temp_package)
  633. continue;
  634. if (!memcmp(temp_package->package_uid, component->source_package_uid, 16)) {
  635. source_package = temp_package;
  636. break;
  637. }
  638. }
  639. if (!source_package) {
  640. av_log(mxf->fc, AV_LOG_ERROR, "material track %d: no corresponding source package found\n", material_track->track_id);
  641. break;
  642. }
  643. for (k = 0; k < source_package->tracks_count; k++) {
  644. if (!(temp_track = mxf_resolve_strong_ref(mxf, &source_package->tracks_refs[k], Track))) {
  645. av_log(mxf->fc, AV_LOG_ERROR, "could not resolve source track strong ref\n");
  646. return -1;
  647. }
  648. if (temp_track->track_id == component->source_track_id) {
  649. source_track = temp_track;
  650. break;
  651. }
  652. }
  653. if (!source_track) {
  654. av_log(mxf->fc, AV_LOG_ERROR, "material track %d: no corresponding source track found\n", material_track->track_id);
  655. break;
  656. }
  657. }
  658. if (!source_track)
  659. continue;
  660. st = av_new_stream(mxf->fc, source_track->track_id);
  661. if (!st) {
  662. av_log(mxf->fc, AV_LOG_ERROR, "could not allocate stream\n");
  663. return -1;
  664. }
  665. st->priv_data = source_track;
  666. st->duration = component->duration;
  667. if (st->duration == -1)
  668. st->duration = AV_NOPTS_VALUE;
  669. st->start_time = component->start_position;
  670. av_set_pts_info(st, 64, material_track->edit_rate.num, material_track->edit_rate.den);
  671. if (!(source_track->sequence = mxf_resolve_strong_ref(mxf, &source_track->sequence_ref, Sequence))) {
  672. av_log(mxf->fc, AV_LOG_ERROR, "could not resolve source track sequence strong ref\n");
  673. return -1;
  674. }
  675. #ifdef DEBUG
  676. PRINT_KEY(mxf->fc, "data definition ul", source_track->sequence->data_definition_ul);
  677. #endif
  678. st->codec->codec_type = mxf_get_codec_type(ff_mxf_data_definition_uls, &source_track->sequence->data_definition_ul);
  679. source_package->descriptor = mxf_resolve_strong_ref(mxf, &source_package->descriptor_ref, AnyType);
  680. if (source_package->descriptor) {
  681. if (source_package->descriptor->type == MultipleDescriptor) {
  682. for (j = 0; j < source_package->descriptor->sub_descriptors_count; j++) {
  683. MXFDescriptor *sub_descriptor = mxf_resolve_strong_ref(mxf, &source_package->descriptor->sub_descriptors_refs[j], Descriptor);
  684. if (!sub_descriptor) {
  685. av_log(mxf->fc, AV_LOG_ERROR, "could not resolve sub descriptor strong ref\n");
  686. continue;
  687. }
  688. if (sub_descriptor->linked_track_id == source_track->track_id) {
  689. descriptor = sub_descriptor;
  690. break;
  691. }
  692. }
  693. } else if (source_package->descriptor->type == Descriptor)
  694. descriptor = source_package->descriptor;
  695. }
  696. if (!descriptor) {
  697. av_log(mxf->fc, AV_LOG_INFO, "source track %d: stream %d, no descriptor found\n", source_track->track_id, st->index);
  698. continue;
  699. }
  700. #ifdef DEBUG
  701. PRINT_KEY(mxf->fc, "essence codec ul", descriptor->essence_codec_ul);
  702. PRINT_KEY(mxf->fc, "essence container ul", descriptor->essence_container_ul);
  703. #endif
  704. essence_container_ul = &descriptor->essence_container_ul;
  705. /* HACK: replacing the original key with mxf_encrypted_essence_container
  706. * is not allowed according to s429-6, try to find correct information anyway */
  707. if (IS_KLV_KEY(essence_container_ul, mxf_encrypted_essence_container)) {
  708. av_log(mxf->fc, AV_LOG_INFO, "broken encrypted mxf file\n");
  709. for (k = 0; k < mxf->metadata_sets_count; k++) {
  710. MXFMetadataSet *metadata = mxf->metadata_sets[k];
  711. if (metadata->type == CryptoContext) {
  712. essence_container_ul = &((MXFCryptoContext *)metadata)->source_container_ul;
  713. break;
  714. }
  715. }
  716. }
  717. /* TODO: drop PictureEssenceCoding and SoundEssenceCompression, only check EssenceContainer */
  718. codec_ul = mxf_get_codec_ul(ff_mxf_codec_uls, &descriptor->essence_codec_ul);
  719. st->codec->codec_id = codec_ul->id;
  720. if (descriptor->extradata) {
  721. st->codec->extradata = descriptor->extradata;
  722. st->codec->extradata_size = descriptor->extradata_size;
  723. }
  724. if (st->codec->codec_type == CODEC_TYPE_VIDEO) {
  725. container_ul = mxf_get_codec_ul(ff_mxf_essence_container_uls, essence_container_ul);
  726. if (st->codec->codec_id == CODEC_ID_NONE)
  727. st->codec->codec_id = container_ul->id;
  728. st->codec->width = descriptor->width;
  729. st->codec->height = descriptor->height;
  730. st->codec->bits_per_sample = descriptor->bits_per_sample; /* Uncompressed */
  731. st->need_parsing = AVSTREAM_PARSE_HEADERS;
  732. } else if (st->codec->codec_type == CODEC_TYPE_AUDIO) {
  733. container_ul = mxf_get_codec_ul(ff_mxf_essence_container_uls, essence_container_ul);
  734. if (st->codec->codec_id == CODEC_ID_NONE)
  735. st->codec->codec_id = container_ul->id;
  736. st->codec->channels = descriptor->channels;
  737. st->codec->bits_per_sample = descriptor->bits_per_sample;
  738. st->codec->sample_rate = descriptor->sample_rate.num / descriptor->sample_rate.den;
  739. /* TODO: implement CODEC_ID_RAWAUDIO */
  740. if (st->codec->codec_id == CODEC_ID_PCM_S16LE) {
  741. if (descriptor->bits_per_sample == 24)
  742. st->codec->codec_id = CODEC_ID_PCM_S24LE;
  743. else if (descriptor->bits_per_sample == 32)
  744. st->codec->codec_id = CODEC_ID_PCM_S32LE;
  745. } else if (st->codec->codec_id == CODEC_ID_PCM_S16BE) {
  746. if (descriptor->bits_per_sample == 24)
  747. st->codec->codec_id = CODEC_ID_PCM_S24BE;
  748. else if (descriptor->bits_per_sample == 32)
  749. st->codec->codec_id = CODEC_ID_PCM_S32BE;
  750. } else if (st->codec->codec_id == CODEC_ID_MP2) {
  751. st->need_parsing = AVSTREAM_PARSE_FULL;
  752. }
  753. }
  754. if (st->codec->codec_type != CODEC_TYPE_DATA && (*essence_container_ul)[15] > 0x01) {
  755. av_log(mxf->fc, AV_LOG_WARNING, "only frame wrapped mappings are correctly supported\n");
  756. st->need_parsing = AVSTREAM_PARSE_FULL;
  757. }
  758. }
  759. return 0;
  760. }
  761. static const MXFMetadataReadTableEntry mxf_metadata_read_table[] = {
  762. { { 0x06,0x0E,0x2B,0x34,0x02,0x05,0x01,0x01,0x0d,0x01,0x02,0x01,0x01,0x05,0x01,0x00 }, mxf_read_primer_pack },
  763. { { 0x06,0x0E,0x2B,0x34,0x02,0x53,0x01,0x01,0x0d,0x01,0x01,0x01,0x01,0x01,0x18,0x00 }, mxf_read_content_storage, 0, AnyType },
  764. { { 0x06,0x0E,0x2B,0x34,0x02,0x53,0x01,0x01,0x0d,0x01,0x01,0x01,0x01,0x01,0x37,0x00 }, mxf_read_source_package, sizeof(MXFPackage), SourcePackage },
  765. { { 0x06,0x0E,0x2B,0x34,0x02,0x53,0x01,0x01,0x0d,0x01,0x01,0x01,0x01,0x01,0x36,0x00 }, mxf_read_material_package, sizeof(MXFPackage), MaterialPackage },
  766. { { 0x06,0x0E,0x2B,0x34,0x02,0x53,0x01,0x01,0x0d,0x01,0x01,0x01,0x01,0x01,0x0F,0x00 }, mxf_read_sequence, sizeof(MXFSequence), Sequence },
  767. { { 0x06,0x0E,0x2B,0x34,0x02,0x53,0x01,0x01,0x0d,0x01,0x01,0x01,0x01,0x01,0x11,0x00 }, mxf_read_source_clip, sizeof(MXFStructuralComponent), SourceClip },
  768. { { 0x06,0x0E,0x2B,0x34,0x02,0x53,0x01,0x01,0x0d,0x01,0x01,0x01,0x01,0x01,0x44,0x00 }, mxf_read_generic_descriptor, sizeof(MXFDescriptor), MultipleDescriptor },
  769. { { 0x06,0x0E,0x2B,0x34,0x02,0x53,0x01,0x01,0x0d,0x01,0x01,0x01,0x01,0x01,0x42,0x00 }, mxf_read_generic_descriptor, sizeof(MXFDescriptor), Descriptor }, /* Generic Sound */
  770. { { 0x06,0x0E,0x2B,0x34,0x02,0x53,0x01,0x01,0x0d,0x01,0x01,0x01,0x01,0x01,0x28,0x00 }, mxf_read_generic_descriptor, sizeof(MXFDescriptor), Descriptor }, /* CDCI */
  771. { { 0x06,0x0E,0x2B,0x34,0x02,0x53,0x01,0x01,0x0d,0x01,0x01,0x01,0x01,0x01,0x29,0x00 }, mxf_read_generic_descriptor, sizeof(MXFDescriptor), Descriptor }, /* RGBA */
  772. { { 0x06,0x0E,0x2B,0x34,0x02,0x53,0x01,0x01,0x0d,0x01,0x01,0x01,0x01,0x01,0x51,0x00 }, mxf_read_generic_descriptor, sizeof(MXFDescriptor), Descriptor }, /* MPEG 2 Video */
  773. { { 0x06,0x0E,0x2B,0x34,0x02,0x53,0x01,0x01,0x0d,0x01,0x01,0x01,0x01,0x01,0x48,0x00 }, mxf_read_generic_descriptor, sizeof(MXFDescriptor), Descriptor }, /* Wave */
  774. { { 0x06,0x0E,0x2B,0x34,0x02,0x53,0x01,0x01,0x0d,0x01,0x01,0x01,0x01,0x01,0x47,0x00 }, mxf_read_generic_descriptor, sizeof(MXFDescriptor), Descriptor }, /* AES3 */
  775. { { 0x06,0x0E,0x2B,0x34,0x02,0x53,0x01,0x01,0x0d,0x01,0x01,0x01,0x01,0x01,0x3A,0x00 }, mxf_read_track, sizeof(MXFTrack), Track }, /* Static Track */
  776. { { 0x06,0x0E,0x2B,0x34,0x02,0x53,0x01,0x01,0x0d,0x01,0x01,0x01,0x01,0x01,0x3B,0x00 }, mxf_read_track, sizeof(MXFTrack), Track }, /* Generic Track */
  777. { { 0x06,0x0E,0x2B,0x34,0x02,0x53,0x01,0x01,0x0d,0x01,0x04,0x01,0x02,0x02,0x00,0x00 }, mxf_read_cryptographic_context, sizeof(MXFCryptoContext), CryptoContext },
  778. { { 0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00 }, NULL, 0, AnyType },
  779. };
  780. static int mxf_read_local_tags(MXFContext *mxf, KLVPacket *klv, int (*read_child)(), int ctx_size, enum MXFMetadataSetType type)
  781. {
  782. ByteIOContext *pb = mxf->fc->pb;
  783. MXFMetadataSet *ctx = ctx_size ? av_mallocz(ctx_size) : mxf;
  784. uint64_t klv_end = url_ftell(pb) + klv->length;
  785. if (!ctx)
  786. return -1;
  787. while (url_ftell(pb) + 4 < klv_end) {
  788. int tag = get_be16(pb);
  789. int size = get_be16(pb); /* KLV specified by 0x53 */
  790. uint64_t next = url_ftell(pb) + size;
  791. UID uid = {0};
  792. if (!size) { /* ignore empty tag, needed for some files with empty UMID tag */
  793. av_log(mxf->fc, AV_LOG_ERROR, "local tag 0x%04X with 0 size\n", tag);
  794. continue;
  795. }
  796. if (tag > 0x7FFF) { /* dynamic tag */
  797. int i;
  798. for (i = 0; i < mxf->local_tags_count; i++) {
  799. int local_tag = AV_RB16(mxf->local_tags+i*18);
  800. if (local_tag == tag) {
  801. memcpy(uid, mxf->local_tags+i*18+2, 16);
  802. dprintf(mxf->fc, "local tag 0x%04X\n", local_tag);
  803. #ifdef DEBUG
  804. PRINT_KEY(mxf->fc, "uid", uid);
  805. #endif
  806. }
  807. }
  808. }
  809. if (ctx_size && tag == 0x3C0A)
  810. get_buffer(pb, ctx->uid, 16);
  811. else if (read_child(ctx, pb, tag, size, uid) < 0)
  812. return -1;
  813. url_fseek(pb, next, SEEK_SET);
  814. }
  815. if (ctx_size) ctx->type = type;
  816. return ctx_size ? mxf_add_metadata_set(mxf, ctx) : 0;
  817. }
  818. static int mxf_read_header(AVFormatContext *s, AVFormatParameters *ap)
  819. {
  820. MXFContext *mxf = s->priv_data;
  821. KLVPacket klv;
  822. if (!mxf_read_sync(s->pb, mxf_header_partition_pack_key, 14)) {
  823. av_log(s, AV_LOG_ERROR, "could not find header partition pack key\n");
  824. return -1;
  825. }
  826. url_fseek(s->pb, -14, SEEK_CUR);
  827. mxf->fc = s;
  828. while (!url_feof(s->pb)) {
  829. const MXFMetadataReadTableEntry *metadata;
  830. if (klv_read_packet(&klv, s->pb) < 0)
  831. return -1;
  832. #ifdef DEBUG
  833. PRINT_KEY(s, "read header", klv.key);
  834. #endif
  835. if (IS_KLV_KEY(klv.key, mxf_encrypted_triplet_key) ||
  836. IS_KLV_KEY(klv.key, mxf_essence_element_key)) {
  837. /* FIXME avoid seek */
  838. url_fseek(s->pb, klv.offset, SEEK_SET);
  839. break;
  840. }
  841. for (metadata = mxf_metadata_read_table; metadata->read; metadata++) {
  842. if (IS_KLV_KEY(klv.key, metadata->key)) {
  843. int (*read)() = klv.key[5] == 0x53 ? mxf_read_local_tags : metadata->read;
  844. if (read(mxf, &klv, metadata->read, metadata->ctx_size, metadata->type) < 0) {
  845. av_log(s, AV_LOG_ERROR, "error reading header metadata\n");
  846. return -1;
  847. }
  848. break;
  849. }
  850. }
  851. if (!metadata->read)
  852. url_fskip(s->pb, klv.length);
  853. }
  854. return mxf_parse_structural_metadata(mxf);
  855. }
  856. static int mxf_read_close(AVFormatContext *s)
  857. {
  858. MXFContext *mxf = s->priv_data;
  859. int i;
  860. av_freep(&mxf->packages_refs);
  861. for (i = 0; i < mxf->metadata_sets_count; i++) {
  862. switch (mxf->metadata_sets[i]->type) {
  863. case MultipleDescriptor:
  864. av_freep(&((MXFDescriptor *)mxf->metadata_sets[i])->sub_descriptors_refs);
  865. break;
  866. case Sequence:
  867. av_freep(&((MXFSequence *)mxf->metadata_sets[i])->structural_components_refs);
  868. break;
  869. case SourcePackage:
  870. case MaterialPackage:
  871. av_freep(&((MXFPackage *)mxf->metadata_sets[i])->tracks_refs);
  872. break;
  873. case Track:
  874. mxf->metadata_sets[i] = NULL; /* will be freed later */
  875. break;
  876. default:
  877. break;
  878. }
  879. av_freep(&mxf->metadata_sets[i]);
  880. }
  881. av_freep(&mxf->metadata_sets);
  882. av_freep(&mxf->aesc);
  883. av_freep(&mxf->local_tags);
  884. return 0;
  885. }
  886. static int mxf_probe(AVProbeData *p) {
  887. uint8_t *bufp = p->buf;
  888. uint8_t *end = p->buf + p->buf_size;
  889. if (p->buf_size < sizeof(mxf_header_partition_pack_key))
  890. return 0;
  891. /* Must skip Run-In Sequence and search for MXF header partition pack key SMPTE 377M 5.5 */
  892. end -= sizeof(mxf_header_partition_pack_key);
  893. for (; bufp < end; bufp++) {
  894. if (IS_KLV_KEY(bufp, mxf_header_partition_pack_key))
  895. return AVPROBE_SCORE_MAX;
  896. }
  897. return 0;
  898. }
  899. /* rudimentary byte seek */
  900. /* XXX: use MXF Index */
  901. static int mxf_read_seek(AVFormatContext *s, int stream_index, int64_t sample_time, int flags)
  902. {
  903. AVStream *st = s->streams[stream_index];
  904. int64_t seconds;
  905. if (!s->bit_rate)
  906. return -1;
  907. if (sample_time < 0)
  908. sample_time = 0;
  909. seconds = av_rescale(sample_time, st->time_base.num, st->time_base.den);
  910. url_fseek(s->pb, (s->bit_rate * seconds) >> 3, SEEK_SET);
  911. av_update_cur_dts(s, st, sample_time);
  912. return 0;
  913. }
  914. AVInputFormat mxf_demuxer = {
  915. "mxf",
  916. NULL_IF_CONFIG_SMALL("Material eXchange Format"),
  917. sizeof(MXFContext),
  918. mxf_probe,
  919. mxf_read_header,
  920. mxf_read_packet,
  921. mxf_read_close,
  922. mxf_read_seek,
  923. };