You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

593 lines
19KB

  1. /*
  2. * GXF demuxer.
  3. * Copyright (c) 2006 Reimar Doeffinger
  4. *
  5. * This file is part of FFmpeg.
  6. *
  7. * FFmpeg is free software; you can redistribute it and/or
  8. * modify it under the terms of the GNU Lesser General Public
  9. * License as published by the Free Software Foundation; either
  10. * version 2.1 of the License, or (at your option) any later version.
  11. *
  12. * FFmpeg is distributed in the hope that it will be useful,
  13. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  15. * Lesser General Public License for more details.
  16. *
  17. * You should have received a copy of the GNU Lesser General Public
  18. * License along with FFmpeg; if not, write to the Free Software
  19. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  20. */
  21. #include "libavutil/common.h"
  22. #include "avformat.h"
  23. #include "internal.h"
  24. #include "gxf.h"
  25. #include "libavcodec/mpeg12data.h"
/**
 * Demuxer private data (allocated via priv_data_size): values collected
 * from the material and track tag sections of the map packet.
 * The track related fields are reset each time a track's tags are parsed,
 * so they describe the most recently parsed track.
 */
struct gxf_stream_info {
    int64_t first_field;          ///< MAT_FIRST_FIELD tag value, AV_NOPTS_VALUE if not present
    int64_t last_field;           ///< MAT_LAST_FIELD tag value, AV_NOPTS_VALUE if not present
    AVRational frames_per_second; ///< converted TRACK_FPS tag, 0/0 if not present
    int32_t fields_per_frame;     ///< TRACK_FPF tag value (1 or 2), 0 if not present or invalid
    int64_t track_aux_data;       ///< TRACK_AUX tag payload, 0x80000000 if not present
};
  33. /**
  34. * @brief parse gxf timecode and add it to metadata
  35. */
  36. static int add_timecode_metadata(AVDictionary **pm, const char *key, uint32_t timecode, int fields_per_frame)
  37. {
  38. char tmp[128];
  39. int field = timecode & 0xff;
  40. int frame = fields_per_frame ? field / fields_per_frame : field;
  41. int second = (timecode >> 8) & 0xff;
  42. int minute = (timecode >> 16) & 0xff;
  43. int hour = (timecode >> 24) & 0x1f;
  44. int drop = (timecode >> 29) & 1;
  45. // bit 30: color_frame, unused
  46. // ignore invalid time code
  47. if (timecode >> 31)
  48. return 0;
  49. snprintf(tmp, sizeof(tmp), "%02d:%02d:%02d%c%02d",
  50. hour, minute, second, drop ? ';' : ':', frame);
  51. return av_dict_set(pm, key, tmp, 0);
  52. }
  53. /**
  54. * @brief parses a packet header, extracting type and length
  55. * @param pb AVIOContext to read header from
  56. * @param type detected packet type is stored here
  57. * @param length detected packet length, excluding header is stored here
  58. * @return 0 if header not found or contains invalid data, 1 otherwise
  59. */
  60. static int parse_packet_header(AVIOContext *pb, GXFPktType *type, int *length) {
  61. if (avio_rb32(pb))
  62. return 0;
  63. if (avio_r8(pb) != 1)
  64. return 0;
  65. *type = avio_r8(pb);
  66. *length = avio_rb32(pb);
  67. if ((*length >> 24) || *length < 16)
  68. return 0;
  69. *length -= 16;
  70. if (avio_rb32(pb))
  71. return 0;
  72. if (avio_r8(pb) != 0xe1)
  73. return 0;
  74. if (avio_r8(pb) != 0xe2)
  75. return 0;
  76. return 1;
  77. }
  78. /**
  79. * @brief check if file starts with a PKT_MAP header
  80. */
  81. static int gxf_probe(AVProbeData *p) {
  82. static const uint8_t startcode[] = {0, 0, 0, 0, 1, 0xbc}; // start with map packet
  83. static const uint8_t endcode[] = {0, 0, 0, 0, 0xe1, 0xe2};
  84. if (!memcmp(p->buf, startcode, sizeof(startcode)) &&
  85. !memcmp(&p->buf[16 - sizeof(endcode)], endcode, sizeof(endcode)))
  86. return AVPROBE_SCORE_MAX;
  87. return 0;
  88. }
  89. /**
  90. * @brief gets the stream index for the track with the specified id, creates new
  91. * stream if not found
  92. * @param id id of stream to find / add
  93. * @param format stream format identifier
  94. */
  95. static int get_sindex(AVFormatContext *s, int id, int format) {
  96. int i;
  97. AVStream *st = NULL;
  98. i = ff_find_stream_index(s, id);
  99. if (i >= 0)
  100. return i;
  101. st = avformat_new_stream(s, NULL);
  102. if (!st)
  103. return AVERROR(ENOMEM);
  104. st->id = id;
  105. switch (format) {
  106. case 3:
  107. case 4:
  108. st->codec->codec_type = AVMEDIA_TYPE_VIDEO;
  109. st->codec->codec_id = AV_CODEC_ID_MJPEG;
  110. break;
  111. case 13:
  112. case 15:
  113. st->codec->codec_type = AVMEDIA_TYPE_VIDEO;
  114. st->codec->codec_id = AV_CODEC_ID_DVVIDEO;
  115. break;
  116. case 14:
  117. case 16:
  118. st->codec->codec_type = AVMEDIA_TYPE_VIDEO;
  119. st->codec->codec_id = AV_CODEC_ID_DVVIDEO;
  120. break;
  121. case 11:
  122. case 12:
  123. case 20:
  124. st->codec->codec_type = AVMEDIA_TYPE_VIDEO;
  125. st->codec->codec_id = AV_CODEC_ID_MPEG2VIDEO;
  126. st->need_parsing = AVSTREAM_PARSE_HEADERS; //get keyframe flag etc.
  127. break;
  128. case 22:
  129. case 23:
  130. st->codec->codec_type = AVMEDIA_TYPE_VIDEO;
  131. st->codec->codec_id = AV_CODEC_ID_MPEG1VIDEO;
  132. st->need_parsing = AVSTREAM_PARSE_HEADERS; //get keyframe flag etc.
  133. break;
  134. case 9:
  135. st->codec->codec_type = AVMEDIA_TYPE_AUDIO;
  136. st->codec->codec_id = AV_CODEC_ID_PCM_S24LE;
  137. st->codec->channels = 1;
  138. st->codec->sample_rate = 48000;
  139. st->codec->bit_rate = 3 * 1 * 48000 * 8;
  140. st->codec->block_align = 3 * 1;
  141. st->codec->bits_per_coded_sample = 24;
  142. break;
  143. case 10:
  144. st->codec->codec_type = AVMEDIA_TYPE_AUDIO;
  145. st->codec->codec_id = AV_CODEC_ID_PCM_S16LE;
  146. st->codec->channels = 1;
  147. st->codec->sample_rate = 48000;
  148. st->codec->bit_rate = 2 * 1 * 48000 * 8;
  149. st->codec->block_align = 2 * 1;
  150. st->codec->bits_per_coded_sample = 16;
  151. break;
  152. case 17:
  153. st->codec->codec_type = AVMEDIA_TYPE_AUDIO;
  154. st->codec->codec_id = AV_CODEC_ID_AC3;
  155. st->codec->channels = 2;
  156. st->codec->sample_rate = 48000;
  157. break;
  158. // timecode tracks:
  159. case 7:
  160. case 8:
  161. case 24:
  162. st->codec->codec_type = AVMEDIA_TYPE_DATA;
  163. st->codec->codec_id = AV_CODEC_ID_NONE;
  164. break;
  165. default:
  166. st->codec->codec_type = AVMEDIA_TYPE_UNKNOWN;
  167. st->codec->codec_id = AV_CODEC_ID_NONE;
  168. break;
  169. }
  170. return s->nb_streams - 1;
  171. }
  172. /**
  173. * @brief filters out interesting tags from material information.
  174. * @param len length of tag section, will be adjusted to contain remaining bytes
  175. * @param si struct to store collected information into
  176. */
  177. static void gxf_material_tags(AVIOContext *pb, int *len, struct gxf_stream_info *si) {
  178. si->first_field = AV_NOPTS_VALUE;
  179. si->last_field = AV_NOPTS_VALUE;
  180. while (*len >= 2) {
  181. GXFMatTag tag = avio_r8(pb);
  182. int tlen = avio_r8(pb);
  183. *len -= 2;
  184. if (tlen > *len)
  185. return;
  186. *len -= tlen;
  187. if (tlen == 4) {
  188. uint32_t value = avio_rb32(pb);
  189. if (tag == MAT_FIRST_FIELD)
  190. si->first_field = value;
  191. else if (tag == MAT_LAST_FIELD)
  192. si->last_field = value;
  193. } else
  194. avio_skip(pb, tlen);
  195. }
  196. }
/**
 * Frame rates selectable by the fps track tag; tag value n (1-based) maps to
 * entry n - 1. The final 0/0 entry stands for "unknown".
 */
static const AVRational frame_rate_tab[] = {
    {   60,    1},
    {60000, 1001},
    {   50,    1},
    {   30,    1},
    {30000, 1001},
    {   25,    1},
    {   24,    1},
    {24000, 1001},
    {    0,    0},
};
  208. /**
  209. * @brief convert fps tag value to AVRational fps
  210. * @param fps fps value from tag
  211. * @return fps as AVRational, or 0 / 0 if unknown
  212. */
  213. static AVRational fps_tag2avr(int32_t fps) {
  214. if (fps < 1 || fps > 9) fps = 9;
  215. return frame_rate_tab[fps - 1];
  216. }
  217. /**
  218. * @brief convert UMF attributes flags to AVRational fps
  219. * @param flags UMF flags to convert
  220. * @return fps as AVRational, or 0 / 0 if unknown
  221. */
  222. static AVRational fps_umf2avr(uint32_t flags) {
  223. static const AVRational map[] = {{50, 1}, {60000, 1001}, {24, 1},
  224. {25, 1}, {30000, 1001}};
  225. int idx = av_log2((flags & 0x7c0) >> 6);
  226. return map[idx];
  227. }
  228. /**
  229. * @brief filters out interesting tags from track information.
  230. * @param len length of tag section, will be adjusted to contain remaining bytes
  231. * @param si struct to store collected information into
  232. */
  233. static void gxf_track_tags(AVIOContext *pb, int *len, struct gxf_stream_info *si) {
  234. si->frames_per_second = (AVRational){0, 0};
  235. si->fields_per_frame = 0;
  236. si->track_aux_data = 0x80000000;
  237. while (*len >= 2) {
  238. GXFTrackTag tag = avio_r8(pb);
  239. int tlen = avio_r8(pb);
  240. *len -= 2;
  241. if (tlen > *len)
  242. return;
  243. *len -= tlen;
  244. if (tlen == 4) {
  245. uint32_t value = avio_rb32(pb);
  246. if (tag == TRACK_FPS)
  247. si->frames_per_second = fps_tag2avr(value);
  248. else if (tag == TRACK_FPF && (value == 1 || value == 2))
  249. si->fields_per_frame = value;
  250. } else if (tlen == 8 && tag == TRACK_AUX)
  251. si->track_aux_data = avio_rl64(pb);
  252. else
  253. avio_skip(pb, tlen);
  254. }
  255. }
  256. /**
  257. * @brief read index from FLT packet into stream 0 av_index
  258. */
  259. static void gxf_read_index(AVFormatContext *s, int pkt_len) {
  260. AVIOContext *pb = s->pb;
  261. AVStream *st;
  262. uint32_t fields_per_map = avio_rl32(pb);
  263. uint32_t map_cnt = avio_rl32(pb);
  264. int i;
  265. pkt_len -= 8;
  266. if ((s->flags & AVFMT_FLAG_IGNIDX) || !s->streams) {
  267. avio_skip(pb, pkt_len);
  268. return;
  269. }
  270. st = s->streams[0];
  271. if (map_cnt > 1000) {
  272. av_log(s, AV_LOG_ERROR, "too many index entries %u (%x)\n", map_cnt, map_cnt);
  273. map_cnt = 1000;
  274. }
  275. if (pkt_len < 4 * map_cnt) {
  276. av_log(s, AV_LOG_ERROR, "invalid index length\n");
  277. avio_skip(pb, pkt_len);
  278. return;
  279. }
  280. pkt_len -= 4 * map_cnt;
  281. av_add_index_entry(st, 0, 0, 0, 0, 0);
  282. for (i = 0; i < map_cnt; i++)
  283. av_add_index_entry(st, (uint64_t)avio_rl32(pb) * 1024,
  284. i * (uint64_t)fields_per_map + 1, 0, 0, 0);
  285. avio_skip(pb, pkt_len);
  286. }
  287. static int gxf_header(AVFormatContext *s) {
  288. AVIOContext *pb = s->pb;
  289. GXFPktType pkt_type;
  290. int map_len;
  291. int len;
  292. AVRational main_timebase = {0, 0};
  293. struct gxf_stream_info *si = s->priv_data;
  294. int i;
  295. if (!parse_packet_header(pb, &pkt_type, &map_len) || pkt_type != PKT_MAP) {
  296. av_log(s, AV_LOG_ERROR, "map packet not found\n");
  297. return 0;
  298. }
  299. map_len -= 2;
  300. if (avio_r8(pb) != 0x0e0 || avio_r8(pb) != 0xff) {
  301. av_log(s, AV_LOG_ERROR, "unknown version or invalid map preamble\n");
  302. return 0;
  303. }
  304. map_len -= 2;
  305. len = avio_rb16(pb); // length of material data section
  306. if (len > map_len) {
  307. av_log(s, AV_LOG_ERROR, "material data longer than map data\n");
  308. return 0;
  309. }
  310. map_len -= len;
  311. gxf_material_tags(pb, &len, si);
  312. avio_skip(pb, len);
  313. map_len -= 2;
  314. len = avio_rb16(pb); // length of track description
  315. if (len > map_len) {
  316. av_log(s, AV_LOG_ERROR, "track description longer than map data\n");
  317. return 0;
  318. }
  319. map_len -= len;
  320. while (len > 0) {
  321. int track_type, track_id, track_len;
  322. AVStream *st;
  323. int idx;
  324. len -= 4;
  325. track_type = avio_r8(pb);
  326. track_id = avio_r8(pb);
  327. track_len = avio_rb16(pb);
  328. len -= track_len;
  329. if (!(track_type & 0x80)) {
  330. av_log(s, AV_LOG_ERROR, "invalid track type %x\n", track_type);
  331. continue;
  332. }
  333. track_type &= 0x7f;
  334. if ((track_id & 0xc0) != 0xc0) {
  335. av_log(s, AV_LOG_ERROR, "invalid track id %x\n", track_id);
  336. continue;
  337. }
  338. track_id &= 0x3f;
  339. gxf_track_tags(pb, &track_len, si);
  340. // check for timecode tracks
  341. if (track_type == 7 || track_type == 8 || track_type == 24) {
  342. add_timecode_metadata(&s->metadata, "timecode",
  343. si->track_aux_data & 0xffffffff,
  344. si->fields_per_frame);
  345. }
  346. avio_skip(pb, track_len);
  347. idx = get_sindex(s, track_id, track_type);
  348. if (idx < 0) continue;
  349. st = s->streams[idx];
  350. if (!main_timebase.num || !main_timebase.den) {
  351. main_timebase.num = si->frames_per_second.den;
  352. main_timebase.den = si->frames_per_second.num * 2;
  353. }
  354. st->start_time = si->first_field;
  355. if (si->first_field != AV_NOPTS_VALUE && si->last_field != AV_NOPTS_VALUE)
  356. st->duration = si->last_field - si->first_field;
  357. }
  358. if (len < 0)
  359. av_log(s, AV_LOG_ERROR, "invalid track description length specified\n");
  360. if (map_len)
  361. avio_skip(pb, map_len);
  362. if (!parse_packet_header(pb, &pkt_type, &len)) {
  363. av_log(s, AV_LOG_ERROR, "sync lost in header\n");
  364. return -1;
  365. }
  366. if (pkt_type == PKT_FLT) {
  367. gxf_read_index(s, len);
  368. if (!parse_packet_header(pb, &pkt_type, &len)) {
  369. av_log(s, AV_LOG_ERROR, "sync lost in header\n");
  370. return -1;
  371. }
  372. }
  373. if (pkt_type == PKT_UMF) {
  374. if (len >= 0x39) {
  375. AVRational fps;
  376. len -= 0x39;
  377. avio_skip(pb, 5); // preamble
  378. avio_skip(pb, 0x30); // payload description
  379. fps = fps_umf2avr(avio_rl32(pb));
  380. if (!main_timebase.num || !main_timebase.den) {
  381. av_log(s, AV_LOG_WARNING, "No FPS track tag, using UMF fps tag."
  382. " This might give wrong results.\n");
  383. // this may not always be correct, but simply the best we can get
  384. main_timebase.num = fps.den;
  385. main_timebase.den = fps.num * 2;
  386. }
  387. if (len >= 0x18) {
  388. len -= 0x18;
  389. avio_skip(pb, 0x10);
  390. add_timecode_metadata(&s->metadata, "timecode_at_mark_in",
  391. avio_rl32(pb), si->fields_per_frame);
  392. add_timecode_metadata(&s->metadata, "timecode_at_mark_out",
  393. avio_rl32(pb), si->fields_per_frame);
  394. }
  395. } else
  396. av_log(s, AV_LOG_INFO, "UMF packet too short\n");
  397. } else
  398. av_log(s, AV_LOG_INFO, "UMF packet missing\n");
  399. avio_skip(pb, len);
  400. // set a fallback value, 60000/1001 is specified for audio-only files
  401. // so use that regardless of why we do not know the video frame rate.
  402. if (!main_timebase.num || !main_timebase.den)
  403. main_timebase = (AVRational){1001, 60000};
  404. for (i = 0; i < s->nb_streams; i++) {
  405. AVStream *st = s->streams[i];
  406. avpriv_set_pts_info(st, 32, main_timebase.num, main_timebase.den);
  407. }
  408. return 0;
  409. }
/**
 * Shift one more input byte into the 32 bit window "tmp".
 * Jumps to the label "out" instead when the byte budget "max_interval" is
 * used up or the end of the input has been reached.
 * Expects "tmp", "max_interval", "pb" and the label "out" to exist where
 * the macro is expanded.
 */
#define READ_ONE() \
    { \
        if (!max_interval-- || url_feof(pb)) \
            goto out; \
        tmp = tmp << 8 | avio_r8(pb); \
    }
/**
 * @brief resync the stream on the next media packet with specified properties
 *
 * Scans byte by byte for a packet leader (four zero bytes followed by 1),
 * then tries to parse a full packet header at that position. On return the
 * read position is at the start of the last media packet whose header was
 * parsed successfully, if there was one.
 *
 * @param max_interval how many bytes to search for matching packet at most
 * @param track track id the media packet must belong to, -1 for any
 * @param timestamp minimum timestamp (== field number) the packet must have, -1 for any
 * @return timestamp of the last media packet header that was parsed, even
 *         if it did not satisfy track / timestamp; AV_NOPTS_VALUE if no
 *         media packet header was parsed at all
 */
static int64_t gxf_resync_media(AVFormatContext *s, uint64_t max_interval, int track, int timestamp) {
    uint32_t tmp;
    uint64_t last_pos;
    uint64_t last_found_pos = 0;
    int cur_track;
    int64_t cur_timestamp = AV_NOPTS_VALUE;
    int len;
    AVIOContext *pb = s->pb;
    GXFPktType type;
    tmp = avio_rb32(pb);
start:
    // tmp holds the last four bytes read: scan on until all of them are zero
    while (tmp)
        READ_ONE();
    // the byte following the four zeros has to be 1
    READ_ONE();
    if (tmp != 1)
        goto start;
    // remember where to continue scanning if this is not the wanted packet
    last_pos = avio_tell(pb);
    // step back over the 5 leader bytes so the whole header can be parsed
    if (avio_seek(pb, -5, SEEK_CUR) < 0)
        goto out;
    if (!parse_packet_header(pb, &type, &len) || type != PKT_MEDIA) {
        if (avio_seek(pb, last_pos, SEEK_SET) < 0)
            goto out;
        goto start;
    }
    // start of the media payload: one byte is skipped, then track id and
    // 32 bit field number are read
    avio_r8(pb);
    cur_track = avio_r8(pb);
    cur_timestamp = avio_rb32(pb);
    // start of this packet: 16 header bytes plus the 6 bytes read just above
    last_found_pos = avio_tell(pb) - 16 - 6;
    if ((track >= 0 && track != cur_track) || (timestamp >= 0 && timestamp > cur_timestamp)) {
        // not the packet asked for: keep scanning behind its leader
        if (avio_seek(pb, last_pos, SEEK_SET) >= 0)
            goto start;
    }
out:
    // reposition to the start of the last media packet that was found
    if (last_found_pos)
        avio_seek(pb, last_found_pos, SEEK_SET);
    return cur_timestamp;
}
  460. static int gxf_packet(AVFormatContext *s, AVPacket *pkt) {
  461. AVIOContext *pb = s->pb;
  462. GXFPktType pkt_type;
  463. int pkt_len;
  464. struct gxf_stream_info *si = s->priv_data;
  465. while (!pb->eof_reached) {
  466. AVStream *st;
  467. int track_type, track_id, ret;
  468. int field_nr, field_info, skip = 0;
  469. int stream_index;
  470. if (!parse_packet_header(pb, &pkt_type, &pkt_len)) {
  471. if (!url_feof(pb))
  472. av_log(s, AV_LOG_ERROR, "sync lost\n");
  473. return -1;
  474. }
  475. if (pkt_type == PKT_FLT) {
  476. gxf_read_index(s, pkt_len);
  477. continue;
  478. }
  479. if (pkt_type != PKT_MEDIA) {
  480. avio_skip(pb, pkt_len);
  481. continue;
  482. }
  483. if (pkt_len < 16) {
  484. av_log(s, AV_LOG_ERROR, "invalid media packet length\n");
  485. continue;
  486. }
  487. pkt_len -= 16;
  488. track_type = avio_r8(pb);
  489. track_id = avio_r8(pb);
  490. stream_index = get_sindex(s, track_id, track_type);
  491. if (stream_index < 0)
  492. return stream_index;
  493. st = s->streams[stream_index];
  494. field_nr = avio_rb32(pb);
  495. field_info = avio_rb32(pb);
  496. avio_rb32(pb); // "timeline" field number
  497. avio_r8(pb); // flags
  498. avio_r8(pb); // reserved
  499. if (st->codec->codec_id == AV_CODEC_ID_PCM_S24LE ||
  500. st->codec->codec_id == AV_CODEC_ID_PCM_S16LE) {
  501. int first = field_info >> 16;
  502. int last = field_info & 0xffff; // last is exclusive
  503. int bps = av_get_bits_per_sample(st->codec->codec_id)>>3;
  504. if (first <= last && last*bps <= pkt_len) {
  505. avio_skip(pb, first*bps);
  506. skip = pkt_len - last*bps;
  507. pkt_len = (last-first)*bps;
  508. } else
  509. av_log(s, AV_LOG_ERROR, "invalid first and last sample values\n");
  510. }
  511. ret = av_get_packet(pb, pkt, pkt_len);
  512. if (skip)
  513. avio_skip(pb, skip);
  514. pkt->stream_index = stream_index;
  515. pkt->dts = field_nr;
  516. //set duration manually for DV or else lavf misdetects the frame rate
  517. if (st->codec->codec_id == AV_CODEC_ID_DVVIDEO)
  518. pkt->duration = si->fields_per_frame;
  519. return ret;
  520. }
  521. return AVERROR_EOF;
  522. }
  523. static int gxf_seek(AVFormatContext *s, int stream_index, int64_t timestamp, int flags) {
  524. int res = 0;
  525. uint64_t pos;
  526. uint64_t maxlen = 100 * 1024 * 1024;
  527. AVStream *st = s->streams[0];
  528. int64_t start_time = s->streams[stream_index]->start_time;
  529. int64_t found;
  530. int idx;
  531. if (timestamp < start_time) timestamp = start_time;
  532. idx = av_index_search_timestamp(st, timestamp - start_time,
  533. AVSEEK_FLAG_ANY | AVSEEK_FLAG_BACKWARD);
  534. if (idx < 0)
  535. return -1;
  536. pos = st->index_entries[idx].pos;
  537. if (idx < st->nb_index_entries - 2)
  538. maxlen = st->index_entries[idx + 2].pos - pos;
  539. maxlen = FFMAX(maxlen, 200 * 1024);
  540. res = avio_seek(s->pb, pos, SEEK_SET);
  541. if (res < 0)
  542. return res;
  543. found = gxf_resync_media(s, maxlen, -1, timestamp);
  544. if (FFABS(found - timestamp) > 4)
  545. return -1;
  546. return 0;
  547. }
  548. static int64_t gxf_read_timestamp(AVFormatContext *s, int stream_index,
  549. int64_t *pos, int64_t pos_limit) {
  550. AVIOContext *pb = s->pb;
  551. int64_t res;
  552. if (avio_seek(pb, *pos, SEEK_SET) < 0)
  553. return AV_NOPTS_VALUE;
  554. res = gxf_resync_media(s, pos_limit - *pos, -1, -1);
  555. *pos = avio_tell(pb);
  556. return res;
  557. }
/**
 * Demuxer registration: wires the callbacks defined in this file into the
 * AVInputFormat structure. The private data is one struct gxf_stream_info.
 */
AVInputFormat ff_gxf_demuxer = {
    .name           = "gxf",
    .long_name      = NULL_IF_CONFIG_SMALL("GXF (General eXchange Format)"),
    .priv_data_size = sizeof(struct gxf_stream_info),
    .read_probe     = gxf_probe,
    .read_header    = gxf_header,
    .read_packet    = gxf_packet,
    .read_seek      = gxf_seek,
    .read_timestamp = gxf_read_timestamp,
};