You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

592 lines
19KB

  1. /*
  2. * GXF demuxer.
  3. * Copyright (c) 2006 Reimar Doeffinger
  4. *
  5. * This file is part of FFmpeg.
  6. *
  7. * FFmpeg is free software; you can redistribute it and/or
  8. * modify it under the terms of the GNU Lesser General Public
  9. * License as published by the Free Software Foundation; either
  10. * version 2.1 of the License, or (at your option) any later version.
  11. *
  12. * FFmpeg is distributed in the hope that it will be useful,
  13. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  15. * Lesser General Public License for more details.
  16. *
  17. * You should have received a copy of the GNU Lesser General Public
  18. * License along with FFmpeg; if not, write to the Free Software
  19. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  20. */
  21. #include "libavutil/common.h"
  22. #include "avformat.h"
  23. #include "internal.h"
  24. #include "gxf.h"
  25. #include "libavcodec/mpeg12data.h"
  26. struct gxf_stream_info {
  27. int64_t first_field;
  28. int64_t last_field;
  29. AVRational frames_per_second;
  30. int32_t fields_per_frame;
  31. int64_t track_aux_data;
  32. };
  33. /**
  34. * @brief parse gxf timecode and add it to metadata
  35. */
  36. static int add_timecode_metadata(AVDictionary **pm, const char *key, uint32_t timecode, int fields_per_frame)
  37. {
  38. char tmp[128];
  39. int field = timecode & 0xff;
  40. int frame = fields_per_frame ? field / fields_per_frame : field;
  41. int second = (timecode >> 8) & 0xff;
  42. int minute = (timecode >> 16) & 0xff;
  43. int hour = (timecode >> 24) & 0x1f;
  44. int drop = (timecode >> 29) & 1;
  45. // bit 30: color_frame, unused
  46. // ignore invalid time code
  47. if (timecode >> 31)
  48. return 0;
  49. snprintf(tmp, sizeof(tmp), "%02d:%02d:%02d%c%02d",
  50. hour, minute, second, drop ? ';' : ':', frame);
  51. return av_dict_set(pm, key, tmp, 0);
  52. }
  53. /**
  54. * @brief parses a packet header, extracting type and length
  55. * @param pb AVIOContext to read header from
  56. * @param type detected packet type is stored here
  57. * @param length detected packet length, excluding header is stored here
  58. * @return 0 if header not found or contains invalid data, 1 otherwise
  59. */
  60. static int parse_packet_header(AVIOContext *pb, GXFPktType *type, int *length) {
  61. if (avio_rb32(pb))
  62. return 0;
  63. if (avio_r8(pb) != 1)
  64. return 0;
  65. *type = avio_r8(pb);
  66. *length = avio_rb32(pb);
  67. if ((*length >> 24) || *length < 16)
  68. return 0;
  69. *length -= 16;
  70. if (avio_rb32(pb))
  71. return 0;
  72. if (avio_r8(pb) != 0xe1)
  73. return 0;
  74. if (avio_r8(pb) != 0xe2)
  75. return 0;
  76. return 1;
  77. }
  78. /**
  79. * @brief check if file starts with a PKT_MAP header
  80. */
  81. static int gxf_probe(AVProbeData *p) {
  82. static const uint8_t startcode[] = {0, 0, 0, 0, 1, 0xbc}; // start with map packet
  83. static const uint8_t endcode[] = {0, 0, 0, 0, 0xe1, 0xe2};
  84. if (!memcmp(p->buf, startcode, sizeof(startcode)) &&
  85. !memcmp(&p->buf[16 - sizeof(endcode)], endcode, sizeof(endcode)))
  86. return AVPROBE_SCORE_MAX;
  87. return 0;
  88. }
  89. /**
  90. * @brief gets the stream index for the track with the specified id, creates new
  91. * stream if not found
  92. * @param id id of stream to find / add
  93. * @param format stream format identifier
  94. */
  95. static int get_sindex(AVFormatContext *s, int id, int format) {
  96. int i;
  97. AVStream *st = NULL;
  98. i = ff_find_stream_index(s, id);
  99. if (i >= 0)
  100. return i;
  101. st = avformat_new_stream(s, NULL);
  102. if (!st)
  103. return AVERROR(ENOMEM);
  104. st->id = id;
  105. switch (format) {
  106. case 3:
  107. case 4:
  108. st->codec->codec_type = AVMEDIA_TYPE_VIDEO;
  109. st->codec->codec_id = AV_CODEC_ID_MJPEG;
  110. break;
  111. case 13:
  112. case 15:
  113. st->codec->codec_type = AVMEDIA_TYPE_VIDEO;
  114. st->codec->codec_id = AV_CODEC_ID_DVVIDEO;
  115. break;
  116. case 14:
  117. case 16:
  118. st->codec->codec_type = AVMEDIA_TYPE_VIDEO;
  119. st->codec->codec_id = AV_CODEC_ID_DVVIDEO;
  120. break;
  121. case 11:
  122. case 12:
  123. case 20:
  124. st->codec->codec_type = AVMEDIA_TYPE_VIDEO;
  125. st->codec->codec_id = AV_CODEC_ID_MPEG2VIDEO;
  126. st->need_parsing = AVSTREAM_PARSE_HEADERS; //get keyframe flag etc.
  127. break;
  128. case 22:
  129. case 23:
  130. st->codec->codec_type = AVMEDIA_TYPE_VIDEO;
  131. st->codec->codec_id = AV_CODEC_ID_MPEG1VIDEO;
  132. st->need_parsing = AVSTREAM_PARSE_HEADERS; //get keyframe flag etc.
  133. break;
  134. case 9:
  135. st->codec->codec_type = AVMEDIA_TYPE_AUDIO;
  136. st->codec->codec_id = AV_CODEC_ID_PCM_S24LE;
  137. st->codec->channels = 1;
  138. st->codec->sample_rate = 48000;
  139. st->codec->bit_rate = 3 * 1 * 48000 * 8;
  140. st->codec->block_align = 3 * 1;
  141. st->codec->bits_per_coded_sample = 24;
  142. break;
  143. case 10:
  144. st->codec->codec_type = AVMEDIA_TYPE_AUDIO;
  145. st->codec->codec_id = AV_CODEC_ID_PCM_S16LE;
  146. st->codec->channels = 1;
  147. st->codec->sample_rate = 48000;
  148. st->codec->bit_rate = 2 * 1 * 48000 * 8;
  149. st->codec->block_align = 2 * 1;
  150. st->codec->bits_per_coded_sample = 16;
  151. break;
  152. case 17:
  153. st->codec->codec_type = AVMEDIA_TYPE_AUDIO;
  154. st->codec->codec_id = AV_CODEC_ID_AC3;
  155. st->codec->channels = 2;
  156. st->codec->sample_rate = 48000;
  157. break;
  158. // timecode tracks:
  159. case 7:
  160. case 8:
  161. case 24:
  162. st->codec->codec_type = AVMEDIA_TYPE_DATA;
  163. st->codec->codec_id = AV_CODEC_ID_NONE;
  164. break;
  165. default:
  166. st->codec->codec_type = AVMEDIA_TYPE_UNKNOWN;
  167. st->codec->codec_id = AV_CODEC_ID_NONE;
  168. break;
  169. }
  170. return s->nb_streams - 1;
  171. }
  172. /**
  173. * @brief filters out interesting tags from material information.
  174. * @param len length of tag section, will be adjusted to contain remaining bytes
  175. * @param si struct to store collected information into
  176. */
  177. static void gxf_material_tags(AVIOContext *pb, int *len, struct gxf_stream_info *si) {
  178. si->first_field = AV_NOPTS_VALUE;
  179. si->last_field = AV_NOPTS_VALUE;
  180. while (*len >= 2) {
  181. GXFMatTag tag = avio_r8(pb);
  182. int tlen = avio_r8(pb);
  183. *len -= 2;
  184. if (tlen > *len)
  185. return;
  186. *len -= tlen;
  187. if (tlen == 4) {
  188. uint32_t value = avio_rb32(pb);
  189. if (tag == MAT_FIRST_FIELD)
  190. si->first_field = value;
  191. else if (tag == MAT_LAST_FIELD)
  192. si->last_field = value;
  193. } else
  194. avio_skip(pb, tlen);
  195. }
  196. }
  197. static const AVRational frame_rate_tab[] = {
  198. { 60, 1},
  199. {60000, 1001},
  200. { 50, 1},
  201. { 30, 1},
  202. {30000, 1001},
  203. { 25, 1},
  204. { 24, 1},
  205. {24000, 1001},
  206. { 0, 0},
  207. };
  208. /**
  209. * @brief convert fps tag value to AVRational fps
  210. * @param fps fps value from tag
  211. * @return fps as AVRational, or 0 / 0 if unknown
  212. */
  213. static AVRational fps_tag2avr(int32_t fps) {
  214. if (fps < 1 || fps > 9) fps = 9;
  215. return frame_rate_tab[fps - 1];
  216. }
  217. /**
  218. * @brief convert UMF attributes flags to AVRational fps
  219. * @param flags UMF flags to convert
  220. * @return fps as AVRational, or 0 / 0 if unknown
  221. */
  222. static AVRational fps_umf2avr(uint32_t flags) {
  223. static const AVRational map[] = {{50, 1}, {60000, 1001}, {24, 1},
  224. {25, 1}, {30000, 1001}};
  225. int idx = av_log2((flags & 0x7c0) >> 6);
  226. return map[idx];
  227. }
  228. /**
  229. * @brief filters out interesting tags from track information.
  230. * @param len length of tag section, will be adjusted to contain remaining bytes
  231. * @param si struct to store collected information into
  232. */
  233. static void gxf_track_tags(AVIOContext *pb, int *len, struct gxf_stream_info *si) {
  234. si->frames_per_second = (AVRational){0, 0};
  235. si->fields_per_frame = 0;
  236. si->track_aux_data = 0x80000000;
  237. while (*len >= 2) {
  238. GXFTrackTag tag = avio_r8(pb);
  239. int tlen = avio_r8(pb);
  240. *len -= 2;
  241. if (tlen > *len)
  242. return;
  243. *len -= tlen;
  244. if (tlen == 4) {
  245. uint32_t value = avio_rb32(pb);
  246. if (tag == TRACK_FPS)
  247. si->frames_per_second = fps_tag2avr(value);
  248. else if (tag == TRACK_FPF && (value == 1 || value == 2))
  249. si->fields_per_frame = value;
  250. } else if (tlen == 8 && tag == TRACK_AUX)
  251. si->track_aux_data = avio_rl64(pb);
  252. else
  253. avio_skip(pb, tlen);
  254. }
  255. }
  256. /**
  257. * @brief read index from FLT packet into stream 0 av_index
  258. */
  259. static void gxf_read_index(AVFormatContext *s, int pkt_len) {
  260. AVIOContext *pb = s->pb;
  261. AVStream *st = s->streams[0];
  262. uint32_t fields_per_map = avio_rl32(pb);
  263. uint32_t map_cnt = avio_rl32(pb);
  264. int i;
  265. pkt_len -= 8;
  266. if (s->flags & AVFMT_FLAG_IGNIDX) {
  267. avio_skip(pb, pkt_len);
  268. return;
  269. }
  270. if (map_cnt > 1000) {
  271. av_log(s, AV_LOG_ERROR, "too many index entries %u (%x)\n", map_cnt, map_cnt);
  272. map_cnt = 1000;
  273. }
  274. if (pkt_len < 4 * map_cnt) {
  275. av_log(s, AV_LOG_ERROR, "invalid index length\n");
  276. avio_skip(pb, pkt_len);
  277. return;
  278. }
  279. pkt_len -= 4 * map_cnt;
  280. av_add_index_entry(st, 0, 0, 0, 0, 0);
  281. for (i = 0; i < map_cnt; i++)
  282. av_add_index_entry(st, (uint64_t)avio_rl32(pb) * 1024,
  283. i * (uint64_t)fields_per_map + 1, 0, 0, 0);
  284. avio_skip(pb, pkt_len);
  285. }
  286. static int gxf_header(AVFormatContext *s) {
  287. AVIOContext *pb = s->pb;
  288. GXFPktType pkt_type;
  289. int map_len;
  290. int len;
  291. AVRational main_timebase = {0, 0};
  292. struct gxf_stream_info *si = s->priv_data;
  293. int i;
  294. if (!parse_packet_header(pb, &pkt_type, &map_len) || pkt_type != PKT_MAP) {
  295. av_log(s, AV_LOG_ERROR, "map packet not found\n");
  296. return 0;
  297. }
  298. map_len -= 2;
  299. if (avio_r8(pb) != 0x0e0 || avio_r8(pb) != 0xff) {
  300. av_log(s, AV_LOG_ERROR, "unknown version or invalid map preamble\n");
  301. return 0;
  302. }
  303. map_len -= 2;
  304. len = avio_rb16(pb); // length of material data section
  305. if (len > map_len) {
  306. av_log(s, AV_LOG_ERROR, "material data longer than map data\n");
  307. return 0;
  308. }
  309. map_len -= len;
  310. gxf_material_tags(pb, &len, si);
  311. avio_skip(pb, len);
  312. map_len -= 2;
  313. len = avio_rb16(pb); // length of track description
  314. if (len > map_len) {
  315. av_log(s, AV_LOG_ERROR, "track description longer than map data\n");
  316. return 0;
  317. }
  318. map_len -= len;
  319. while (len > 0) {
  320. int track_type, track_id, track_len;
  321. AVStream *st;
  322. int idx;
  323. len -= 4;
  324. track_type = avio_r8(pb);
  325. track_id = avio_r8(pb);
  326. track_len = avio_rb16(pb);
  327. len -= track_len;
  328. if (!(track_type & 0x80)) {
  329. av_log(s, AV_LOG_ERROR, "invalid track type %x\n", track_type);
  330. continue;
  331. }
  332. track_type &= 0x7f;
  333. if ((track_id & 0xc0) != 0xc0) {
  334. av_log(s, AV_LOG_ERROR, "invalid track id %x\n", track_id);
  335. continue;
  336. }
  337. track_id &= 0x3f;
  338. gxf_track_tags(pb, &track_len, si);
  339. // check for timecode tracks
  340. if (track_type == 7 || track_type == 8 || track_type == 24) {
  341. add_timecode_metadata(&s->metadata, "timecode",
  342. si->track_aux_data & 0xffffffff,
  343. si->fields_per_frame);
  344. }
  345. avio_skip(pb, track_len);
  346. idx = get_sindex(s, track_id, track_type);
  347. if (idx < 0) continue;
  348. st = s->streams[idx];
  349. if (!main_timebase.num || !main_timebase.den) {
  350. main_timebase.num = si->frames_per_second.den;
  351. main_timebase.den = si->frames_per_second.num * 2;
  352. }
  353. st->start_time = si->first_field;
  354. if (si->first_field != AV_NOPTS_VALUE && si->last_field != AV_NOPTS_VALUE)
  355. st->duration = si->last_field - si->first_field;
  356. }
  357. if (len < 0)
  358. av_log(s, AV_LOG_ERROR, "invalid track description length specified\n");
  359. if (map_len)
  360. avio_skip(pb, map_len);
  361. if (!parse_packet_header(pb, &pkt_type, &len)) {
  362. av_log(s, AV_LOG_ERROR, "sync lost in header\n");
  363. return -1;
  364. }
  365. if (pkt_type == PKT_FLT) {
  366. gxf_read_index(s, len);
  367. if (!parse_packet_header(pb, &pkt_type, &len)) {
  368. av_log(s, AV_LOG_ERROR, "sync lost in header\n");
  369. return -1;
  370. }
  371. }
  372. if (pkt_type == PKT_UMF) {
  373. if (len >= 0x39) {
  374. AVRational fps;
  375. len -= 0x39;
  376. avio_skip(pb, 5); // preamble
  377. avio_skip(pb, 0x30); // payload description
  378. fps = fps_umf2avr(avio_rl32(pb));
  379. if (!main_timebase.num || !main_timebase.den) {
  380. av_log(s, AV_LOG_WARNING, "No FPS track tag, using UMF fps tag."
  381. " This might give wrong results.\n");
  382. // this may not always be correct, but simply the best we can get
  383. main_timebase.num = fps.den;
  384. main_timebase.den = fps.num * 2;
  385. }
  386. if (len >= 0x18) {
  387. len -= 0x18;
  388. avio_skip(pb, 0x10);
  389. add_timecode_metadata(&s->metadata, "timecode_at_mark_in",
  390. avio_rl32(pb), si->fields_per_frame);
  391. add_timecode_metadata(&s->metadata, "timecode_at_mark_out",
  392. avio_rl32(pb), si->fields_per_frame);
  393. }
  394. } else
  395. av_log(s, AV_LOG_INFO, "UMF packet too short\n");
  396. } else
  397. av_log(s, AV_LOG_INFO, "UMF packet missing\n");
  398. avio_skip(pb, len);
  399. // set a fallback value, 60000/1001 is specified for audio-only files
  400. // so use that regardless of why we do not know the video frame rate.
  401. if (!main_timebase.num || !main_timebase.den)
  402. main_timebase = (AVRational){1001, 60000};
  403. for (i = 0; i < s->nb_streams; i++) {
  404. AVStream *st = s->streams[i];
  405. avpriv_set_pts_info(st, 32, main_timebase.num, main_timebase.den);
  406. }
  407. return 0;
  408. }
  409. #define READ_ONE() \
  410. { \
  411. if (!max_interval-- || url_feof(pb)) \
  412. goto out; \
  413. tmp = tmp << 8 | avio_r8(pb); \
  414. }
  415. /**
  416. * @brief resync the stream on the next media packet with specified properties
  417. * @param max_interval how many bytes to search for matching packet at most
  418. * @param track track id the media packet must belong to, -1 for any
  419. * @param timestamp minimum timestamp (== field number) the packet must have, -1 for any
  420. * @return timestamp of packet found
  421. */
  422. static int64_t gxf_resync_media(AVFormatContext *s, uint64_t max_interval, int track, int timestamp) {
  423. uint32_t tmp;
  424. uint64_t last_pos;
  425. uint64_t last_found_pos = 0;
  426. int cur_track;
  427. int64_t cur_timestamp = AV_NOPTS_VALUE;
  428. int len;
  429. AVIOContext *pb = s->pb;
  430. GXFPktType type;
  431. tmp = avio_rb32(pb);
  432. start:
  433. while (tmp)
  434. READ_ONE();
  435. READ_ONE();
  436. if (tmp != 1)
  437. goto start;
  438. last_pos = avio_tell(pb);
  439. if (avio_seek(pb, -5, SEEK_CUR) < 0)
  440. goto out;
  441. if (!parse_packet_header(pb, &type, &len) || type != PKT_MEDIA) {
  442. if (avio_seek(pb, last_pos, SEEK_SET) < 0)
  443. goto out;
  444. goto start;
  445. }
  446. avio_r8(pb);
  447. cur_track = avio_r8(pb);
  448. cur_timestamp = avio_rb32(pb);
  449. last_found_pos = avio_tell(pb) - 16 - 6;
  450. if ((track >= 0 && track != cur_track) || (timestamp >= 0 && timestamp > cur_timestamp)) {
  451. if (avio_seek(pb, last_pos, SEEK_SET) >= 0)
  452. goto start;
  453. }
  454. out:
  455. if (last_found_pos)
  456. avio_seek(pb, last_found_pos, SEEK_SET);
  457. return cur_timestamp;
  458. }
  459. static int gxf_packet(AVFormatContext *s, AVPacket *pkt) {
  460. AVIOContext *pb = s->pb;
  461. GXFPktType pkt_type;
  462. int pkt_len;
  463. struct gxf_stream_info *si = s->priv_data;
  464. while (!pb->eof_reached) {
  465. AVStream *st;
  466. int track_type, track_id, ret;
  467. int field_nr, field_info, skip = 0;
  468. int stream_index;
  469. if (!parse_packet_header(pb, &pkt_type, &pkt_len)) {
  470. if (!url_feof(pb))
  471. av_log(s, AV_LOG_ERROR, "sync lost\n");
  472. return -1;
  473. }
  474. if (pkt_type == PKT_FLT) {
  475. gxf_read_index(s, pkt_len);
  476. continue;
  477. }
  478. if (pkt_type != PKT_MEDIA) {
  479. avio_skip(pb, pkt_len);
  480. continue;
  481. }
  482. if (pkt_len < 16) {
  483. av_log(s, AV_LOG_ERROR, "invalid media packet length\n");
  484. continue;
  485. }
  486. pkt_len -= 16;
  487. track_type = avio_r8(pb);
  488. track_id = avio_r8(pb);
  489. stream_index = get_sindex(s, track_id, track_type);
  490. if (stream_index < 0)
  491. return stream_index;
  492. st = s->streams[stream_index];
  493. field_nr = avio_rb32(pb);
  494. field_info = avio_rb32(pb);
  495. avio_rb32(pb); // "timeline" field number
  496. avio_r8(pb); // flags
  497. avio_r8(pb); // reserved
  498. if (st->codec->codec_id == AV_CODEC_ID_PCM_S24LE ||
  499. st->codec->codec_id == AV_CODEC_ID_PCM_S16LE) {
  500. int first = field_info >> 16;
  501. int last = field_info & 0xffff; // last is exclusive
  502. int bps = av_get_bits_per_sample(st->codec->codec_id)>>3;
  503. if (first <= last && last*bps <= pkt_len) {
  504. avio_skip(pb, first*bps);
  505. skip = pkt_len - last*bps;
  506. pkt_len = (last-first)*bps;
  507. } else
  508. av_log(s, AV_LOG_ERROR, "invalid first and last sample values\n");
  509. }
  510. ret = av_get_packet(pb, pkt, pkt_len);
  511. if (skip)
  512. avio_skip(pb, skip);
  513. pkt->stream_index = stream_index;
  514. pkt->dts = field_nr;
  515. //set duration manually for DV or else lavf misdetects the frame rate
  516. if (st->codec->codec_id == AV_CODEC_ID_DVVIDEO)
  517. pkt->duration = si->fields_per_frame;
  518. return ret;
  519. }
  520. return AVERROR_EOF;
  521. }
  522. static int gxf_seek(AVFormatContext *s, int stream_index, int64_t timestamp, int flags) {
  523. int res = 0;
  524. uint64_t pos;
  525. uint64_t maxlen = 100 * 1024 * 1024;
  526. AVStream *st = s->streams[0];
  527. int64_t start_time = s->streams[stream_index]->start_time;
  528. int64_t found;
  529. int idx;
  530. if (timestamp < start_time) timestamp = start_time;
  531. idx = av_index_search_timestamp(st, timestamp - start_time,
  532. AVSEEK_FLAG_ANY | AVSEEK_FLAG_BACKWARD);
  533. if (idx < 0)
  534. return -1;
  535. pos = st->index_entries[idx].pos;
  536. if (idx < st->nb_index_entries - 2)
  537. maxlen = st->index_entries[idx + 2].pos - pos;
  538. maxlen = FFMAX(maxlen, 200 * 1024);
  539. res = avio_seek(s->pb, pos, SEEK_SET);
  540. if (res < 0)
  541. return res;
  542. found = gxf_resync_media(s, maxlen, -1, timestamp);
  543. if (FFABS(found - timestamp) > 4)
  544. return -1;
  545. return 0;
  546. }
  547. static int64_t gxf_read_timestamp(AVFormatContext *s, int stream_index,
  548. int64_t *pos, int64_t pos_limit) {
  549. AVIOContext *pb = s->pb;
  550. int64_t res;
  551. if (avio_seek(pb, *pos, SEEK_SET) < 0)
  552. return AV_NOPTS_VALUE;
  553. res = gxf_resync_media(s, pos_limit - *pos, -1, -1);
  554. *pos = avio_tell(pb);
  555. return res;
  556. }
  557. AVInputFormat ff_gxf_demuxer = {
  558. .name = "gxf",
  559. .long_name = NULL_IF_CONFIG_SMALL("GXF (General eXchange Format)"),
  560. .priv_data_size = sizeof(struct gxf_stream_info),
  561. .read_probe = gxf_probe,
  562. .read_header = gxf_header,
  563. .read_packet = gxf_packet,
  564. .read_seek = gxf_seek,
  565. .read_timestamp = gxf_read_timestamp,
  566. };