You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

1000 lines
31KB

  1. /*
  2. * GXF muxer.
  3. * Copyright (c) 2006 SmartJog S.A., Baptiste Coudurier <baptiste dot coudurier at smartjog dot com>
  4. *
  5. * This file is part of FFmpeg.
  6. *
  7. * FFmpeg is free software; you can redistribute it and/or
  8. * modify it under the terms of the GNU Lesser General Public
  9. * License as published by the Free Software Foundation; either
  10. * version 2.1 of the License, or (at your option) any later version.
  11. *
  12. * FFmpeg is distributed in the hope that it will be useful,
  13. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  15. * Lesser General Public License for more details.
  16. *
  17. * You should have received a copy of the GNU Lesser General Public
  18. * License along with FFmpeg; if not, write to the Free Software
  19. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  20. */
  21. #include "libavutil/avassert.h"
  22. #include "libavutil/intfloat.h"
  23. #include "libavutil/opt.h"
  24. #include "libavutil/mathematics.h"
  25. #include "libavutil/timecode.h"
  26. #include "avformat.h"
  27. #include "internal.h"
  28. #include "gxf.h"
  29. #include "audiointerleave.h"
  /** Size in bytes that the payload of every audio media packet is padded to. */
  #define GXF_AUDIO_PACKET_SIZE 65536

  /**
   * Pack timecode components into a single word: color flag at bit 30,
   * drop flag at bit 29, hours from bit 24, minutes from bit 16,
   * seconds from bit 8 and the frame/field count in the low bits.
   */
  #define GXF_TIMECODE(c, d, h, m, s, f) \
      (((c) << 30) | ((d) << 29) | ((h) << 24) | ((m) << 16) | ((s) << 8) | (f))
  /**
   * Timecode split into its components.
   *
   * Filled in by gxf_init_timecode() from an "hh:mm:ss[:;.]ff" string.
   */
  typedef struct GXFTimecode {
      int hh;     ///< hours
      int mm;     ///< minutes
      int ss;     ///< seconds
      int ff;     ///< frame count, doubled by the parser when the video has 2 fields
      int color;  ///< color flag, always set to 0 by the parser
      int drop;   ///< non-zero when the separator before the frame count is not ':'
  } GXFTimecode;
  41. typedef struct GXFStreamContext {
  42. AudioInterleaveContext aic;
  43. uint32_t track_type;
  44. uint32_t sample_size;
  45. uint32_t sample_rate;
  46. uint16_t media_type;
  47. uint16_t media_info;
  48. int frame_rate_index;
  49. int lines_index;
  50. int fields;
  51. int iframes;
  52. int pframes;
  53. int bframes;
  54. int p_per_gop;
  55. int b_per_i_or_p; ///< number of B frames per I frame or P frame
  56. int first_gop_closed;
  57. unsigned order; ///< interleaving order
  58. } GXFStreamContext;
  59. typedef struct GXFContext {
  60. AVClass *av_class;
  61. uint32_t nb_fields;
  62. uint16_t audio_tracks;
  63. uint16_t mpeg_tracks;
  64. int64_t creation_time;
  65. uint32_t umf_start_offset;
  66. uint32_t umf_track_offset;
  67. uint32_t umf_media_offset;
  68. uint32_t umf_length;
  69. uint16_t umf_track_size;
  70. uint16_t umf_media_size;
  71. AVRational time_base;
  72. int flags;
  73. GXFStreamContext timecode_track;
  74. unsigned *flt_entries; ///< offsets of packets /1024, starts after 2nd video field
  75. unsigned flt_entries_nb;
  76. uint64_t *map_offsets; ///< offset of map packets
  77. unsigned map_offsets_nb;
  78. unsigned packet_count;
  79. GXFTimecode tc;
  80. } GXFContext;
  /** Maps a picture height to the index written in the TRACK_LINES tag. */
  static const struct {
      int height, index;
  } gxf_lines_tab[] = {
      { .height =  480, .index = 1 }, /* NTSC */
      { .height =  512, .index = 1 }, /* NTSC + VBI */
      { .height =  576, .index = 2 }, /* PAL */
      { .height =  608, .index = 2 }, /* PAL + VBI */
      { .height = 1080, .index = 4 },
      { .height =  720, .index = 6 },
  };
  91. static const AVCodecTag gxf_media_types[] = {
  92. { AV_CODEC_ID_MJPEG , 3 }, /* NTSC */
  93. { AV_CODEC_ID_MJPEG , 4 }, /* PAL */
  94. { AV_CODEC_ID_PCM_S24LE , 9 },
  95. { AV_CODEC_ID_PCM_S16LE , 10 },
  96. { AV_CODEC_ID_MPEG2VIDEO, 11 }, /* NTSC */
  97. { AV_CODEC_ID_MPEG2VIDEO, 12 }, /* PAL */
  98. { AV_CODEC_ID_DVVIDEO , 13 }, /* NTSC */
  99. { AV_CODEC_ID_DVVIDEO , 14 }, /* PAL */
  100. { AV_CODEC_ID_DVVIDEO , 15 }, /* 50M NTSC */
  101. { AV_CODEC_ID_DVVIDEO , 16 }, /* 50M PAL */
  102. { AV_CODEC_ID_AC3 , 17 },
  103. //{ AV_CODEC_ID_NONE, , 18 }, /* Non compressed 24 bit audio */
  104. { AV_CODEC_ID_MPEG2VIDEO, 20 }, /* MPEG HD */
  105. { AV_CODEC_ID_MPEG1VIDEO, 22 }, /* NTSC */
  106. { AV_CODEC_ID_MPEG1VIDEO, 23 }, /* PAL */
  107. { AV_CODEC_ID_NONE, 0 },
  108. };
  /** Path prefix written in front of the material name. */
  #define SERVER_PATH     "EXT:/PDR/default/"
  /** Prefix of every elementary stream name; the 2-byte media info follows it. */
  #define ES_NAME_PATTERN SERVER_PATH "ES."
  111. static int gxf_find_lines_index(AVStream *st)
  112. {
  113. GXFStreamContext *sc = st->priv_data;
  114. int i;
  115. for (i = 0; i < 6; ++i) {
  116. if (st->codec->height == gxf_lines_tab[i].height) {
  117. sc->lines_index = gxf_lines_tab[i].index;
  118. return 0;
  119. }
  120. }
  121. return -1;
  122. }
  123. static void gxf_write_padding(AVIOContext *pb, int64_t to_pad)
  124. {
  125. for (; to_pad > 0; to_pad--) {
  126. avio_w8(pb, 0);
  127. }
  128. }
  129. static int64_t updatePacketSize(AVIOContext *pb, int64_t pos)
  130. {
  131. int64_t curpos;
  132. int size;
  133. size = avio_tell(pb) - pos;
  134. if (size % 4) {
  135. gxf_write_padding(pb, 4 - size % 4);
  136. size = avio_tell(pb) - pos;
  137. }
  138. curpos = avio_tell(pb);
  139. avio_seek(pb, pos + 6, SEEK_SET);
  140. avio_wb32(pb, size);
  141. avio_seek(pb, curpos, SEEK_SET);
  142. return curpos - pos;
  143. }
  144. static int64_t updateSize(AVIOContext *pb, int64_t pos)
  145. {
  146. int64_t curpos;
  147. curpos = avio_tell(pb);
  148. avio_seek(pb, pos, SEEK_SET);
  149. avio_wb16(pb, curpos - pos - 2);
  150. avio_seek(pb, curpos, SEEK_SET);
  151. return curpos - pos;
  152. }
  153. static void gxf_write_packet_header(AVIOContext *pb, GXFPktType type)
  154. {
  155. avio_wb32(pb, 0); /* packet leader for synchro */
  156. avio_w8(pb, 1);
  157. avio_w8(pb, type); /* map packet */
  158. avio_wb32(pb, 0); /* size */
  159. avio_wb32(pb, 0); /* reserved */
  160. avio_w8(pb, 0xE1); /* trailer 1 */
  161. avio_w8(pb, 0xE2); /* trailer 2 */
  162. }
  163. static int gxf_write_mpeg_auxiliary(AVIOContext *pb, AVStream *st)
  164. {
  165. GXFStreamContext *sc = st->priv_data;
  166. char buffer[1024];
  167. int size, starting_line;
  168. if (sc->iframes) {
  169. sc->p_per_gop = sc->pframes / sc->iframes;
  170. if (sc->pframes % sc->iframes)
  171. sc->p_per_gop++;
  172. if (sc->pframes) {
  173. sc->b_per_i_or_p = sc->bframes / sc->pframes;
  174. if (sc->bframes % sc->pframes)
  175. sc->b_per_i_or_p++;
  176. }
  177. if (sc->p_per_gop > 9)
  178. sc->p_per_gop = 9; /* ensure value won't take more than one char */
  179. if (sc->b_per_i_or_p > 9)
  180. sc->b_per_i_or_p = 9; /* ensure value won't take more than one char */
  181. }
  182. if (st->codec->height == 512 || st->codec->height == 608)
  183. starting_line = 7; // VBI
  184. else if (st->codec->height == 480)
  185. starting_line = 20;
  186. else
  187. starting_line = 23; // default PAL
  188. size = snprintf(buffer, sizeof(buffer), "Ver 1\nBr %.6f\nIpg 1\nPpi %d\nBpiop %d\n"
  189. "Pix 0\nCf %d\nCg %d\nSl %d\nnl16 %d\nVi 1\nf1 1\n",
  190. (float)st->codec->bit_rate, sc->p_per_gop, sc->b_per_i_or_p,
  191. st->codec->pix_fmt == AV_PIX_FMT_YUV422P ? 2 : 1, sc->first_gop_closed == 1,
  192. starting_line, (st->codec->height + 15) / 16);
  193. av_assert0(size < sizeof(buffer));
  194. avio_w8(pb, TRACK_MPG_AUX);
  195. avio_w8(pb, size + 1);
  196. avio_write(pb, (uint8_t *)buffer, size + 1);
  197. return size + 3;
  198. }
  199. static int gxf_write_timecode_auxiliary(AVIOContext *pb, GXFContext *gxf)
  200. {
  201. uint32_t timecode = GXF_TIMECODE(gxf->tc.color, gxf->tc.drop,
  202. gxf->tc.hh, gxf->tc.mm,
  203. gxf->tc.ss, gxf->tc.ff);
  204. avio_wl32(pb, timecode);
  205. /* reserved */
  206. avio_wl32(pb, 0);
  207. return 8;
  208. }
  209. static int gxf_write_track_description(AVFormatContext *s, GXFStreamContext *sc, int index)
  210. {
  211. GXFContext *gxf = s->priv_data;
  212. AVIOContext *pb = s->pb;
  213. int64_t pos;
  214. int mpeg = sc->track_type == 4 || sc->track_type == 9;
  215. /* track description section */
  216. avio_w8(pb, sc->media_type + 0x80);
  217. avio_w8(pb, index + 0xC0);
  218. pos = avio_tell(pb);
  219. avio_wb16(pb, 0); /* size */
  220. /* media file name */
  221. avio_w8(pb, TRACK_NAME);
  222. avio_w8(pb, strlen(ES_NAME_PATTERN) + 3);
  223. avio_write(pb, ES_NAME_PATTERN, sizeof(ES_NAME_PATTERN) - 1);
  224. avio_wb16(pb, sc->media_info);
  225. avio_w8(pb, 0);
  226. if (!mpeg) {
  227. /* auxiliary information */
  228. avio_w8(pb, TRACK_AUX);
  229. avio_w8(pb, 8);
  230. if (sc->track_type == 3)
  231. gxf_write_timecode_auxiliary(pb, gxf);
  232. else
  233. avio_wl64(pb, 0);
  234. }
  235. /* file system version */
  236. avio_w8(pb, TRACK_VER);
  237. avio_w8(pb, 4);
  238. avio_wb32(pb, 0);
  239. if (mpeg)
  240. gxf_write_mpeg_auxiliary(pb, s->streams[index]);
  241. /* frame rate */
  242. avio_w8(pb, TRACK_FPS);
  243. avio_w8(pb, 4);
  244. avio_wb32(pb, sc->frame_rate_index);
  245. /* lines per frame */
  246. avio_w8(pb, TRACK_LINES);
  247. avio_w8(pb, 4);
  248. avio_wb32(pb, sc->lines_index);
  249. /* fields per frame */
  250. avio_w8(pb, TRACK_FPF);
  251. avio_w8(pb, 4);
  252. avio_wb32(pb, sc->fields);
  253. return updateSize(pb, pos);
  254. }
  255. static int gxf_write_material_data_section(AVFormatContext *s)
  256. {
  257. GXFContext *gxf = s->priv_data;
  258. AVIOContext *pb = s->pb;
  259. int64_t pos;
  260. int len;
  261. const char *filename = strrchr(s->filename, '/');
  262. pos = avio_tell(pb);
  263. avio_wb16(pb, 0); /* size */
  264. /* name */
  265. if (filename)
  266. filename++;
  267. else
  268. filename = s->filename;
  269. len = strlen(filename);
  270. avio_w8(pb, MAT_NAME);
  271. avio_w8(pb, strlen(SERVER_PATH) + len + 1);
  272. avio_write(pb, SERVER_PATH, sizeof(SERVER_PATH) - 1);
  273. avio_write(pb, filename, len);
  274. avio_w8(pb, 0);
  275. /* first field */
  276. avio_w8(pb, MAT_FIRST_FIELD);
  277. avio_w8(pb, 4);
  278. avio_wb32(pb, 0);
  279. /* last field */
  280. avio_w8(pb, MAT_LAST_FIELD);
  281. avio_w8(pb, 4);
  282. avio_wb32(pb, gxf->nb_fields);
  283. /* reserved */
  284. avio_w8(pb, MAT_MARK_IN);
  285. avio_w8(pb, 4);
  286. avio_wb32(pb, 0);
  287. avio_w8(pb, MAT_MARK_OUT);
  288. avio_w8(pb, 4);
  289. avio_wb32(pb, gxf->nb_fields);
  290. /* estimated size */
  291. avio_w8(pb, MAT_SIZE);
  292. avio_w8(pb, 4);
  293. avio_wb32(pb, avio_size(pb) / 1024);
  294. return updateSize(pb, pos);
  295. }
  296. static int gxf_write_track_description_section(AVFormatContext *s)
  297. {
  298. GXFContext *gxf = s->priv_data;
  299. AVIOContext *pb = s->pb;
  300. int64_t pos;
  301. int i;
  302. pos = avio_tell(pb);
  303. avio_wb16(pb, 0); /* size */
  304. for (i = 0; i < s->nb_streams; ++i)
  305. gxf_write_track_description(s, s->streams[i]->priv_data, i);
  306. gxf_write_track_description(s, &gxf->timecode_track, s->nb_streams);
  307. return updateSize(pb, pos);
  308. }
  309. static int gxf_write_map_packet(AVFormatContext *s, int rewrite)
  310. {
  311. GXFContext *gxf = s->priv_data;
  312. AVIOContext *pb = s->pb;
  313. int64_t pos = avio_tell(pb);
  314. if (!rewrite) {
  315. if (!(gxf->map_offsets_nb % 30)) {
  316. gxf->map_offsets = av_realloc_f(gxf->map_offsets,
  317. sizeof(*gxf->map_offsets),
  318. gxf->map_offsets_nb+30);
  319. if (!gxf->map_offsets) {
  320. av_log(s, AV_LOG_ERROR, "could not realloc map offsets\n");
  321. return -1;
  322. }
  323. }
  324. gxf->map_offsets[gxf->map_offsets_nb++] = pos; // do not increment here
  325. }
  326. gxf_write_packet_header(pb, PKT_MAP);
  327. /* preamble */
  328. avio_w8(pb, 0xE0); /* version */
  329. avio_w8(pb, 0xFF); /* reserved */
  330. gxf_write_material_data_section(s);
  331. gxf_write_track_description_section(s);
  332. return updatePacketSize(pb, pos);
  333. }
  334. static int gxf_write_flt_packet(AVFormatContext *s)
  335. {
  336. GXFContext *gxf = s->priv_data;
  337. AVIOContext *pb = s->pb;
  338. int64_t pos = avio_tell(pb);
  339. int fields_per_flt = (gxf->nb_fields+1) / 1000 + 1;
  340. int flt_entries = gxf->nb_fields / fields_per_flt;
  341. int i = 0;
  342. gxf_write_packet_header(pb, PKT_FLT);
  343. avio_wl32(pb, fields_per_flt); /* number of fields */
  344. avio_wl32(pb, flt_entries); /* number of active flt entries */
  345. if (gxf->flt_entries) {
  346. for (i = 0; i < flt_entries; i++)
  347. avio_wl32(pb, gxf->flt_entries[(i*fields_per_flt)>>1]);
  348. }
  349. for (; i < 1000; i++)
  350. avio_wl32(pb, 0);
  351. return updatePacketSize(pb, pos);
  352. }
  353. static int gxf_write_umf_material_description(AVFormatContext *s)
  354. {
  355. GXFContext *gxf = s->priv_data;
  356. AVIOContext *pb = s->pb;
  357. int timecode_base = gxf->time_base.den == 60000 ? 60 : 50;
  358. int64_t timestamp = 0;
  359. AVDictionaryEntry *t;
  360. uint64_t nb_fields;
  361. uint32_t timecode_in; // timecode at mark in
  362. uint32_t timecode_out; // timecode at mark out
  363. if (t = av_dict_get(s->metadata, "creation_time", NULL, 0))
  364. timestamp = ff_iso8601_to_unix_time(t->value);
  365. timecode_in = GXF_TIMECODE(gxf->tc.color, gxf->tc.drop,
  366. gxf->tc.hh, gxf->tc.mm,
  367. gxf->tc.ss, gxf->tc.ff);
  368. nb_fields = gxf->nb_fields +
  369. gxf->tc.hh * (timecode_base * 3600) +
  370. gxf->tc.mm * (timecode_base * 60) +
  371. gxf->tc.ss * timecode_base +
  372. gxf->tc.ff;
  373. timecode_out = GXF_TIMECODE(gxf->tc.color, gxf->tc.drop,
  374. nb_fields / (timecode_base * 3600) % 24,
  375. nb_fields / (timecode_base * 60) % 60,
  376. nb_fields / timecode_base % 60,
  377. nb_fields % timecode_base);
  378. avio_wl32(pb, gxf->flags);
  379. avio_wl32(pb, gxf->nb_fields); /* length of the longest track */
  380. avio_wl32(pb, gxf->nb_fields); /* length of the shortest track */
  381. avio_wl32(pb, 0); /* mark in */
  382. avio_wl32(pb, gxf->nb_fields); /* mark out */
  383. avio_wl32(pb, timecode_in); /* timecode mark in */
  384. avio_wl32(pb, timecode_out); /* timecode mark out */
  385. avio_wl64(pb, timestamp); /* modification time */
  386. avio_wl64(pb, timestamp); /* creation time */
  387. avio_wl16(pb, 0); /* reserved */
  388. avio_wl16(pb, 0); /* reserved */
  389. avio_wl16(pb, gxf->audio_tracks);
  390. avio_wl16(pb, 1); /* timecode track count */
  391. avio_wl16(pb, 0); /* reserved */
  392. avio_wl16(pb, gxf->mpeg_tracks);
  393. return 48;
  394. }
  395. static int gxf_write_umf_payload(AVFormatContext *s)
  396. {
  397. GXFContext *gxf = s->priv_data;
  398. AVIOContext *pb = s->pb;
  399. avio_wl32(pb, gxf->umf_length); /* total length of the umf data */
  400. avio_wl32(pb, 3); /* version */
  401. avio_wl32(pb, s->nb_streams+1);
  402. avio_wl32(pb, gxf->umf_track_offset); /* umf track section offset */
  403. avio_wl32(pb, gxf->umf_track_size);
  404. avio_wl32(pb, s->nb_streams+1);
  405. avio_wl32(pb, gxf->umf_media_offset);
  406. avio_wl32(pb, gxf->umf_media_size);
  407. avio_wl32(pb, gxf->umf_length); /* user data offset */
  408. avio_wl32(pb, 0); /* user data size */
  409. avio_wl32(pb, 0); /* reserved */
  410. avio_wl32(pb, 0); /* reserved */
  411. return 48;
  412. }
  413. static int gxf_write_umf_track_description(AVFormatContext *s)
  414. {
  415. AVIOContext *pb = s->pb;
  416. GXFContext *gxf = s->priv_data;
  417. int64_t pos = avio_tell(pb);
  418. int i;
  419. gxf->umf_track_offset = pos - gxf->umf_start_offset;
  420. for (i = 0; i < s->nb_streams; ++i) {
  421. GXFStreamContext *sc = s->streams[i]->priv_data;
  422. avio_wl16(pb, sc->media_info);
  423. avio_wl16(pb, 1);
  424. }
  425. avio_wl16(pb, gxf->timecode_track.media_info);
  426. avio_wl16(pb, 1);
  427. return avio_tell(pb) - pos;
  428. }
  429. static int gxf_write_umf_media_mpeg(AVIOContext *pb, AVStream *st)
  430. {
  431. GXFStreamContext *sc = st->priv_data;
  432. if (st->codec->pix_fmt == AV_PIX_FMT_YUV422P)
  433. avio_wl32(pb, 2);
  434. else
  435. avio_wl32(pb, 1); /* default to 420 */
  436. avio_wl32(pb, sc->first_gop_closed == 1); /* closed = 1, open = 0, unknown = 255 */
  437. avio_wl32(pb, 3); /* top = 1, bottom = 2, frame = 3, unknown = 0 */
  438. avio_wl32(pb, 1); /* I picture per GOP */
  439. avio_wl32(pb, sc->p_per_gop);
  440. avio_wl32(pb, sc->b_per_i_or_p);
  441. if (st->codec->codec_id == AV_CODEC_ID_MPEG2VIDEO)
  442. avio_wl32(pb, 2);
  443. else if (st->codec->codec_id == AV_CODEC_ID_MPEG1VIDEO)
  444. avio_wl32(pb, 1);
  445. else
  446. avio_wl32(pb, 0);
  447. avio_wl32(pb, 0); /* reserved */
  448. return 32;
  449. }
  450. static int gxf_write_umf_media_timecode(AVIOContext *pb, int drop)
  451. {
  452. avio_wl32(pb, drop); /* drop frame */
  453. avio_wl32(pb, 0); /* reserved */
  454. avio_wl32(pb, 0); /* reserved */
  455. avio_wl32(pb, 0); /* reserved */
  456. avio_wl32(pb, 0); /* reserved */
  457. avio_wl32(pb, 0); /* reserved */
  458. avio_wl32(pb, 0); /* reserved */
  459. avio_wl32(pb, 0); /* reserved */
  460. return 32;
  461. }
  462. static int gxf_write_umf_media_dv(AVIOContext *pb, GXFStreamContext *sc)
  463. {
  464. int i;
  465. for (i = 0; i < 8; i++) {
  466. avio_wb32(pb, 0);
  467. }
  468. return 32;
  469. }
  470. static int gxf_write_umf_media_audio(AVIOContext *pb, GXFStreamContext *sc)
  471. {
  472. avio_wl64(pb, av_double2int(1)); /* sound level to begin to */
  473. avio_wl64(pb, av_double2int(1)); /* sound level to begin to */
  474. avio_wl32(pb, 0); /* number of fields over which to ramp up sound level */
  475. avio_wl32(pb, 0); /* number of fields over which to ramp down sound level */
  476. avio_wl32(pb, 0); /* reserved */
  477. avio_wl32(pb, 0); /* reserved */
  478. return 32;
  479. }
  480. static int gxf_write_umf_media_description(AVFormatContext *s)
  481. {
  482. GXFContext *gxf = s->priv_data;
  483. AVIOContext *pb = s->pb;
  484. int64_t pos;
  485. int i, j;
  486. pos = avio_tell(pb);
  487. gxf->umf_media_offset = pos - gxf->umf_start_offset;
  488. for (i = 0; i <= s->nb_streams; ++i) {
  489. GXFStreamContext *sc;
  490. int64_t startpos, curpos;
  491. if (i == s->nb_streams)
  492. sc = &gxf->timecode_track;
  493. else
  494. sc = s->streams[i]->priv_data;
  495. startpos = avio_tell(pb);
  496. avio_wl16(pb, 0); /* length */
  497. avio_wl16(pb, sc->media_info);
  498. avio_wl16(pb, 0); /* reserved */
  499. avio_wl16(pb, 0); /* reserved */
  500. avio_wl32(pb, gxf->nb_fields);
  501. avio_wl32(pb, 0); /* attributes rw, ro */
  502. avio_wl32(pb, 0); /* mark in */
  503. avio_wl32(pb, gxf->nb_fields); /* mark out */
  504. avio_write(pb, ES_NAME_PATTERN, strlen(ES_NAME_PATTERN));
  505. avio_wb16(pb, sc->media_info);
  506. for (j = strlen(ES_NAME_PATTERN)+2; j < 88; j++)
  507. avio_w8(pb, 0);
  508. avio_wl32(pb, sc->track_type);
  509. avio_wl32(pb, sc->sample_rate);
  510. avio_wl32(pb, sc->sample_size);
  511. avio_wl32(pb, 0); /* reserved */
  512. if (sc == &gxf->timecode_track)
  513. gxf_write_umf_media_timecode(pb, gxf->tc.drop);
  514. else {
  515. AVStream *st = s->streams[i];
  516. switch (st->codec->codec_id) {
  517. case AV_CODEC_ID_MPEG1VIDEO:
  518. case AV_CODEC_ID_MPEG2VIDEO:
  519. gxf_write_umf_media_mpeg(pb, st);
  520. break;
  521. case AV_CODEC_ID_PCM_S16LE:
  522. gxf_write_umf_media_audio(pb, sc);
  523. break;
  524. case AV_CODEC_ID_DVVIDEO:
  525. gxf_write_umf_media_dv(pb, sc);
  526. break;
  527. }
  528. }
  529. curpos = avio_tell(pb);
  530. avio_seek(pb, startpos, SEEK_SET);
  531. avio_wl16(pb, curpos - startpos);
  532. avio_seek(pb, curpos, SEEK_SET);
  533. }
  534. return avio_tell(pb) - pos;
  535. }
  536. static int gxf_write_umf_packet(AVFormatContext *s)
  537. {
  538. GXFContext *gxf = s->priv_data;
  539. AVIOContext *pb = s->pb;
  540. int64_t pos = avio_tell(pb);
  541. gxf_write_packet_header(pb, PKT_UMF);
  542. /* preamble */
  543. avio_w8(pb, 3); /* first and last (only) packet */
  544. avio_wb32(pb, gxf->umf_length); /* data length */
  545. gxf->umf_start_offset = avio_tell(pb);
  546. gxf_write_umf_payload(s);
  547. gxf_write_umf_material_description(s);
  548. gxf->umf_track_size = gxf_write_umf_track_description(s);
  549. gxf->umf_media_size = gxf_write_umf_media_description(s);
  550. gxf->umf_length = avio_tell(pb) - gxf->umf_start_offset;
  551. return updatePacketSize(pb, pos);
  552. }
  /** Samples per audio chunk handed to ff_audio_interleave_init(); the list ends with 0. */
  static const int GXF_samples_per_frame[] = {
      32768,
      0,
  };
  554. static void gxf_init_timecode_track(GXFStreamContext *sc, GXFStreamContext *vsc)
  555. {
  556. if (!vsc)
  557. return;
  558. sc->media_type = vsc->sample_rate == 60 ? 7 : 8;
  559. sc->sample_rate = vsc->sample_rate;
  560. sc->media_info = ('T'<<8) | '0';
  561. sc->track_type = 3;
  562. sc->frame_rate_index = vsc->frame_rate_index;
  563. sc->lines_index = vsc->lines_index;
  564. sc->sample_size = 16;
  565. sc->fields = vsc->fields;
  566. }
  567. static int gxf_init_timecode(AVFormatContext *s, GXFTimecode *tc, const char *tcstr, int fields)
  568. {
  569. char c;
  570. if (sscanf(tcstr, "%d:%d:%d%c%d", &tc->hh, &tc->mm, &tc->ss, &c, &tc->ff) != 5) {
  571. av_log(s, AV_LOG_ERROR, "unable to parse timecode, "
  572. "syntax: hh:mm:ss[:;.]ff\n");
  573. return -1;
  574. }
  575. tc->color = 0;
  576. tc->drop = c != ':';
  577. if (fields == 2)
  578. tc->ff = tc->ff * 2;
  579. return 0;
  580. }
  581. static int gxf_write_header(AVFormatContext *s)
  582. {
  583. AVIOContext *pb = s->pb;
  584. GXFContext *gxf = s->priv_data;
  585. GXFStreamContext *vsc = NULL;
  586. uint8_t tracks[255] = {0};
  587. int i, media_info = 0;
  588. AVDictionaryEntry *tcr = av_dict_get(s->metadata, "timecode", NULL, 0);
  589. if (!pb->seekable) {
  590. av_log(s, AV_LOG_ERROR, "gxf muxer does not support streamed output, patch welcome\n");
  591. return -1;
  592. }
  593. gxf->flags |= 0x00080000; /* material is simple clip */
  594. for (i = 0; i < s->nb_streams; ++i) {
  595. AVStream *st = s->streams[i];
  596. GXFStreamContext *sc = av_mallocz(sizeof(*sc));
  597. if (!sc)
  598. return AVERROR(ENOMEM);
  599. st->priv_data = sc;
  600. sc->media_type = ff_codec_get_tag(gxf_media_types, st->codec->codec_id);
  601. if (st->codec->codec_type == AVMEDIA_TYPE_AUDIO) {
  602. if (st->codec->codec_id != AV_CODEC_ID_PCM_S16LE) {
  603. av_log(s, AV_LOG_ERROR, "only 16 BIT PCM LE allowed for now\n");
  604. return -1;
  605. }
  606. if (st->codec->sample_rate != 48000) {
  607. av_log(s, AV_LOG_ERROR, "only 48000hz sampling rate is allowed\n");
  608. return -1;
  609. }
  610. if (st->codec->channels != 1) {
  611. av_log(s, AV_LOG_ERROR, "only mono tracks are allowed\n");
  612. return -1;
  613. }
  614. sc->track_type = 2;
  615. sc->sample_rate = st->codec->sample_rate;
  616. avpriv_set_pts_info(st, 64, 1, sc->sample_rate);
  617. sc->sample_size = 16;
  618. sc->frame_rate_index = -2;
  619. sc->lines_index = -2;
  620. sc->fields = -2;
  621. gxf->audio_tracks++;
  622. gxf->flags |= 0x04000000; /* audio is 16 bit pcm */
  623. media_info = 'A';
  624. } else if (st->codec->codec_type == AVMEDIA_TYPE_VIDEO) {
  625. if (i != 0) {
  626. av_log(s, AV_LOG_ERROR, "video stream must be the first track\n");
  627. return -1;
  628. }
  629. /* FIXME check from time_base ? */
  630. if (st->codec->height == 480 || st->codec->height == 512) { /* NTSC or NTSC+VBI */
  631. sc->frame_rate_index = 5;
  632. sc->sample_rate = 60;
  633. gxf->flags |= 0x00000080;
  634. gxf->time_base = (AVRational){ 1001, 60000 };
  635. } else if (st->codec->height == 576 || st->codec->height == 608) { /* PAL or PAL+VBI */
  636. sc->frame_rate_index = 6;
  637. sc->media_type++;
  638. sc->sample_rate = 50;
  639. gxf->flags |= 0x00000040;
  640. gxf->time_base = (AVRational){ 1, 50 };
  641. } else {
  642. av_log(s, AV_LOG_ERROR, "unsupported video resolution, "
  643. "gxf muxer only accepts PAL or NTSC resolutions currently\n");
  644. return -1;
  645. }
  646. if (!tcr)
  647. tcr = av_dict_get(st->metadata, "timecode", NULL, 0);
  648. avpriv_set_pts_info(st, 64, gxf->time_base.num, gxf->time_base.den);
  649. if (gxf_find_lines_index(st) < 0)
  650. sc->lines_index = -1;
  651. sc->sample_size = st->codec->bit_rate;
  652. sc->fields = 2; /* interlaced */
  653. vsc = sc;
  654. switch (st->codec->codec_id) {
  655. case AV_CODEC_ID_MJPEG:
  656. sc->track_type = 1;
  657. gxf->flags |= 0x00004000;
  658. media_info = 'J';
  659. break;
  660. case AV_CODEC_ID_MPEG1VIDEO:
  661. sc->track_type = 9;
  662. gxf->mpeg_tracks++;
  663. media_info = 'L';
  664. break;
  665. case AV_CODEC_ID_MPEG2VIDEO:
  666. sc->first_gop_closed = -1;
  667. sc->track_type = 4;
  668. gxf->mpeg_tracks++;
  669. gxf->flags |= 0x00008000;
  670. media_info = 'M';
  671. break;
  672. case AV_CODEC_ID_DVVIDEO:
  673. if (st->codec->pix_fmt == AV_PIX_FMT_YUV422P) {
  674. sc->media_type += 2;
  675. sc->track_type = 6;
  676. gxf->flags |= 0x00002000;
  677. media_info = 'E';
  678. } else {
  679. sc->track_type = 5;
  680. gxf->flags |= 0x00001000;
  681. media_info = 'D';
  682. }
  683. break;
  684. default:
  685. av_log(s, AV_LOG_ERROR, "video codec not supported\n");
  686. return -1;
  687. }
  688. }
  689. /* FIXME first 10 audio tracks are 0 to 9 next 22 are A to V */
  690. sc->media_info = media_info<<8 | ('0'+tracks[media_info]++);
  691. sc->order = s->nb_streams - st->index;
  692. }
  693. if (ff_audio_interleave_init(s, GXF_samples_per_frame, (AVRational){ 1, 48000 }) < 0)
  694. return -1;
  695. if (tcr && vsc)
  696. gxf_init_timecode(s, &gxf->tc, tcr->value, vsc->fields);
  697. gxf_init_timecode_track(&gxf->timecode_track, vsc);
  698. gxf->flags |= 0x200000; // time code track is non-drop frame
  699. gxf_write_map_packet(s, 0);
  700. gxf_write_flt_packet(s);
  701. gxf_write_umf_packet(s);
  702. gxf->packet_count = 3;
  703. avio_flush(pb);
  704. return 0;
  705. }
  706. static int gxf_write_eos_packet(AVIOContext *pb)
  707. {
  708. int64_t pos = avio_tell(pb);
  709. gxf_write_packet_header(pb, PKT_EOS);
  710. return updatePacketSize(pb, pos);
  711. }
  712. static int gxf_write_trailer(AVFormatContext *s)
  713. {
  714. GXFContext *gxf = s->priv_data;
  715. AVIOContext *pb = s->pb;
  716. int64_t end;
  717. int i;
  718. ff_audio_interleave_close(s);
  719. gxf_write_eos_packet(pb);
  720. end = avio_tell(pb);
  721. avio_seek(pb, 0, SEEK_SET);
  722. /* overwrite map, flt and umf packets with new values */
  723. gxf_write_map_packet(s, 1);
  724. gxf_write_flt_packet(s);
  725. gxf_write_umf_packet(s);
  726. avio_flush(pb);
  727. /* update duration in all map packets */
  728. for (i = 1; i < gxf->map_offsets_nb; i++) {
  729. avio_seek(pb, gxf->map_offsets[i], SEEK_SET);
  730. gxf_write_map_packet(s, 1);
  731. avio_flush(pb);
  732. }
  733. avio_seek(pb, end, SEEK_SET);
  734. av_freep(&gxf->flt_entries);
  735. av_freep(&gxf->map_offsets);
  736. return 0;
  737. }
  738. static int gxf_parse_mpeg_frame(GXFStreamContext *sc, const uint8_t *buf, int size)
  739. {
  740. uint32_t c=-1;
  741. int i;
  742. for(i=0; i<size-4 && c!=0x100; i++){
  743. c = (c<<8) + buf[i];
  744. if(c == 0x1B8 && sc->first_gop_closed == -1) /* GOP start code */
  745. sc->first_gop_closed= (buf[i+4]>>6)&1;
  746. }
  747. return (buf[i+1]>>3)&7;
  748. }
  749. static int gxf_write_media_preamble(AVFormatContext *s, AVPacket *pkt, int size)
  750. {
  751. GXFContext *gxf = s->priv_data;
  752. AVIOContext *pb = s->pb;
  753. AVStream *st = s->streams[pkt->stream_index];
  754. GXFStreamContext *sc = st->priv_data;
  755. unsigned field_nb;
  756. /* If the video is frame-encoded, the frame numbers shall be represented by
  757. * even field numbers.
  758. * see SMPTE360M-2004 6.4.2.1.3 Media field number */
  759. if (st->codec->codec_type == AVMEDIA_TYPE_VIDEO) {
  760. field_nb = gxf->nb_fields;
  761. } else {
  762. field_nb = av_rescale_rnd(pkt->dts, gxf->time_base.den,
  763. (int64_t)48000*gxf->time_base.num, AV_ROUND_UP);
  764. }
  765. avio_w8(pb, sc->media_type);
  766. avio_w8(pb, st->index);
  767. avio_wb32(pb, field_nb);
  768. if (st->codec->codec_type == AVMEDIA_TYPE_AUDIO) {
  769. avio_wb16(pb, 0);
  770. avio_wb16(pb, size / 2);
  771. } else if (st->codec->codec_id == AV_CODEC_ID_MPEG2VIDEO) {
  772. int frame_type = gxf_parse_mpeg_frame(sc, pkt->data, pkt->size);
  773. if (frame_type == AV_PICTURE_TYPE_I) {
  774. avio_w8(pb, 0x0d);
  775. sc->iframes++;
  776. } else if (frame_type == AV_PICTURE_TYPE_B) {
  777. avio_w8(pb, 0x0f);
  778. sc->bframes++;
  779. } else {
  780. avio_w8(pb, 0x0e);
  781. sc->pframes++;
  782. }
  783. avio_wb24(pb, size);
  784. } else if (st->codec->codec_id == AV_CODEC_ID_DVVIDEO) {
  785. avio_w8(pb, size / 4096);
  786. avio_wb24(pb, 0);
  787. } else
  788. avio_wb32(pb, size);
  789. avio_wb32(pb, field_nb);
  790. avio_w8(pb, 1); /* flags */
  791. avio_w8(pb, 0); /* reserved */
  792. return 16;
  793. }
  794. static int gxf_write_packet(AVFormatContext *s, AVPacket *pkt)
  795. {
  796. GXFContext *gxf = s->priv_data;
  797. AVIOContext *pb = s->pb;
  798. AVStream *st = s->streams[pkt->stream_index];
  799. int64_t pos = avio_tell(pb);
  800. int padding = 0;
  801. int packet_start_offset = avio_tell(pb) / 1024;
  802. gxf_write_packet_header(pb, PKT_MEDIA);
  803. if (st->codec->codec_id == AV_CODEC_ID_MPEG2VIDEO && pkt->size % 4) /* MPEG-2 frames must be padded */
  804. padding = 4 - pkt->size % 4;
  805. else if (st->codec->codec_type == AVMEDIA_TYPE_AUDIO)
  806. padding = GXF_AUDIO_PACKET_SIZE - pkt->size;
  807. gxf_write_media_preamble(s, pkt, pkt->size + padding);
  808. avio_write(pb, pkt->data, pkt->size);
  809. gxf_write_padding(pb, padding);
  810. if (st->codec->codec_type == AVMEDIA_TYPE_VIDEO) {
  811. if (!(gxf->flt_entries_nb % 500)) {
  812. gxf->flt_entries = av_realloc_f(gxf->flt_entries,
  813. sizeof(*gxf->flt_entries),
  814. gxf->flt_entries_nb+500);
  815. if (!gxf->flt_entries) {
  816. av_log(s, AV_LOG_ERROR, "could not reallocate flt entries\n");
  817. return -1;
  818. }
  819. }
  820. gxf->flt_entries[gxf->flt_entries_nb++] = packet_start_offset;
  821. gxf->nb_fields += 2; // count fields
  822. }
  823. updatePacketSize(pb, pos);
  824. gxf->packet_count++;
  825. if (gxf->packet_count == 100) {
  826. gxf_write_map_packet(s, 0);
  827. gxf->packet_count = 0;
  828. }
  829. avio_flush(pb);
  830. return 0;
  831. }
  832. static int gxf_compare_field_nb(AVFormatContext *s, AVPacket *next, AVPacket *cur)
  833. {
  834. GXFContext *gxf = s->priv_data;
  835. AVPacket *pkt[2] = { cur, next };
  836. int i, field_nb[2];
  837. GXFStreamContext *sc[2];
  838. for (i = 0; i < 2; i++) {
  839. AVStream *st = s->streams[pkt[i]->stream_index];
  840. sc[i] = st->priv_data;
  841. if (st->codec->codec_type == AVMEDIA_TYPE_AUDIO) {
  842. field_nb[i] = av_rescale_rnd(pkt[i]->dts, gxf->time_base.den,
  843. (int64_t)48000*gxf->time_base.num, AV_ROUND_UP);
  844. field_nb[i] &= ~1; // compare against even field number because audio must be before video
  845. } else
  846. field_nb[i] = pkt[i]->dts; // dts are field based
  847. }
  848. return field_nb[1] > field_nb[0] ||
  849. (field_nb[1] == field_nb[0] && sc[1]->order > sc[0]->order);
  850. }
  851. static int gxf_interleave_packet(AVFormatContext *s, AVPacket *out, AVPacket *pkt, int flush)
  852. {
  853. if (pkt && s->streams[pkt->stream_index]->codec->codec_type == AVMEDIA_TYPE_VIDEO)
  854. pkt->duration = 2; // enforce 2 fields
  855. return ff_audio_rechunk_interleave(s, out, pkt, flush,
  856. ff_interleave_packet_per_dts, gxf_compare_field_nb);
  857. }
  858. AVOutputFormat ff_gxf_muxer = {
  859. .name = "gxf",
  860. .long_name = NULL_IF_CONFIG_SMALL("GXF (General eXchange Format)"),
  861. .extensions = "gxf",
  862. .priv_data_size = sizeof(GXFContext),
  863. .audio_codec = AV_CODEC_ID_PCM_S16LE,
  864. .video_codec = AV_CODEC_ID_MPEG2VIDEO,
  865. .write_header = gxf_write_header,
  866. .write_packet = gxf_write_packet,
  867. .write_trailer = gxf_write_trailer,
  868. .interleave_packet = gxf_interleave_packet,
  869. };