You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

958 lines
29KB

  1. /*
  2. * GXF muxer.
  3. * Copyright (c) 2006 SmartJog S.A., Baptiste Coudurier <baptiste dot coudurier at smartjog dot com>
  4. *
  5. * This file is part of Libav.
  6. *
  7. * Libav is free software; you can redistribute it and/or
  8. * modify it under the terms of the GNU Lesser General Public
  9. * License as published by the Free Software Foundation; either
  10. * version 2.1 of the License, or (at your option) any later version.
  11. *
  12. * Libav is distributed in the hope that it will be useful,
  13. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  15. * Lesser General Public License for more details.
  16. *
  17. * You should have received a copy of the GNU Lesser General Public
  18. * License along with Libav; if not, write to the Free Software
  19. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  20. */
  21. #include "libavutil/intfloat_readwrite.h"
  22. #include "libavutil/mathematics.h"
  23. #include "avformat.h"
  24. #include "gxf.h"
  25. #include "riff.h"
  26. #include "audiointerleave.h"
  27. #define GXF_AUDIO_PACKET_SIZE 65536
  28. typedef struct GXFStreamContext {
  29. AudioInterleaveContext aic;
  30. uint32_t track_type;
  31. uint32_t sample_size;
  32. uint32_t sample_rate;
  33. uint16_t media_type;
  34. uint16_t media_info;
  35. int frame_rate_index;
  36. int lines_index;
  37. int fields;
  38. int iframes;
  39. int pframes;
  40. int bframes;
  41. int p_per_gop;
  42. int b_per_i_or_p; ///< number of B frames per I frame or P frame
  43. int first_gop_closed;
  44. unsigned order; ///< interleaving order
  45. } GXFStreamContext;
  46. typedef struct GXFContext {
  47. uint32_t nb_fields;
  48. uint16_t audio_tracks;
  49. uint16_t mpeg_tracks;
  50. int64_t creation_time;
  51. uint32_t umf_start_offset;
  52. uint32_t umf_track_offset;
  53. uint32_t umf_media_offset;
  54. uint32_t umf_length;
  55. uint16_t umf_track_size;
  56. uint16_t umf_media_size;
  57. AVRational time_base;
  58. int flags;
  59. GXFStreamContext timecode_track;
  60. unsigned *flt_entries; ///< offsets of packets /1024, starts after 2nd video field
  61. unsigned flt_entries_nb;
  62. uint64_t *map_offsets; ///< offset of map packets
  63. unsigned map_offsets_nb;
  64. unsigned packet_count;
  65. } GXFContext;
  66. static const struct {
  67. int height, index;
  68. } gxf_lines_tab[] = {
  69. { 480, 1 }, /* NTSC */
  70. { 512, 1 }, /* NTSC + VBI */
  71. { 576, 2 }, /* PAL */
  72. { 608, 2 }, /* PAL + VBI */
  73. { 1080, 4 },
  74. { 720, 6 },
  75. };
  76. static const AVCodecTag gxf_media_types[] = {
  77. { CODEC_ID_MJPEG , 3 }, /* NTSC */
  78. { CODEC_ID_MJPEG , 4 }, /* PAL */
  79. { CODEC_ID_PCM_S24LE , 9 },
  80. { CODEC_ID_PCM_S16LE , 10 },
  81. { CODEC_ID_MPEG2VIDEO, 11 }, /* NTSC */
  82. { CODEC_ID_MPEG2VIDEO, 12 }, /* PAL */
  83. { CODEC_ID_DVVIDEO , 13 }, /* NTSC */
  84. { CODEC_ID_DVVIDEO , 14 }, /* PAL */
  85. { CODEC_ID_DVVIDEO , 15 }, /* 50M NTSC */
  86. { CODEC_ID_DVVIDEO , 16 }, /* 50M PAL */
  87. { CODEC_ID_AC3 , 17 },
  88. //{ CODEC_ID_NONE, , 18 }, /* Non compressed 24 bit audio */
  89. { CODEC_ID_MPEG2VIDEO, 20 }, /* MPEG HD */
  90. { CODEC_ID_MPEG1VIDEO, 22 }, /* NTSC */
  91. { CODEC_ID_MPEG1VIDEO, 23 }, /* PAL */
  92. { CODEC_ID_NONE, 0 },
  93. };
  94. #define SERVER_PATH "EXT:/PDR/default/"
  95. #define ES_NAME_PATTERN "EXT:/PDR/default/ES."
  96. static int gxf_find_lines_index(AVStream *st)
  97. {
  98. GXFStreamContext *sc = st->priv_data;
  99. int i;
  100. for (i = 0; i < 6; ++i) {
  101. if (st->codec->height == gxf_lines_tab[i].height) {
  102. sc->lines_index = gxf_lines_tab[i].index;
  103. return 0;
  104. }
  105. }
  106. return -1;
  107. }
  108. static void gxf_write_padding(AVIOContext *pb, int64_t to_pad)
  109. {
  110. for (; to_pad > 0; to_pad--) {
  111. avio_w8(pb, 0);
  112. }
  113. }
  114. static int64_t updatePacketSize(AVIOContext *pb, int64_t pos)
  115. {
  116. int64_t curpos;
  117. int size;
  118. size = avio_tell(pb) - pos;
  119. if (size % 4) {
  120. gxf_write_padding(pb, 4 - size % 4);
  121. size = avio_tell(pb) - pos;
  122. }
  123. curpos = avio_tell(pb);
  124. avio_seek(pb, pos + 6, SEEK_SET);
  125. avio_wb32(pb, size);
  126. avio_seek(pb, curpos, SEEK_SET);
  127. return curpos - pos;
  128. }
  129. static int64_t updateSize(AVIOContext *pb, int64_t pos)
  130. {
  131. int64_t curpos;
  132. curpos = avio_tell(pb);
  133. avio_seek(pb, pos, SEEK_SET);
  134. avio_wb16(pb, curpos - pos - 2);
  135. avio_seek(pb, curpos, SEEK_SET);
  136. return curpos - pos;
  137. }
  138. static void gxf_write_packet_header(AVIOContext *pb, GXFPktType type)
  139. {
  140. avio_wb32(pb, 0); /* packet leader for synchro */
  141. avio_w8(pb, 1);
  142. avio_w8(pb, type); /* map packet */
  143. avio_wb32(pb, 0); /* size */
  144. avio_wb32(pb, 0); /* reserved */
  145. avio_w8(pb, 0xE1); /* trailer 1 */
  146. avio_w8(pb, 0xE2); /* trailer 2 */
  147. }
  148. static int gxf_write_mpeg_auxiliary(AVIOContext *pb, AVStream *st)
  149. {
  150. GXFStreamContext *sc = st->priv_data;
  151. char buffer[1024];
  152. int size, starting_line;
  153. if (sc->iframes) {
  154. sc->p_per_gop = sc->pframes / sc->iframes;
  155. if (sc->pframes % sc->iframes)
  156. sc->p_per_gop++;
  157. if (sc->pframes) {
  158. sc->b_per_i_or_p = sc->bframes / sc->pframes;
  159. if (sc->bframes % sc->pframes)
  160. sc->b_per_i_or_p++;
  161. }
  162. if (sc->p_per_gop > 9)
  163. sc->p_per_gop = 9; /* ensure value won't take more than one char */
  164. if (sc->b_per_i_or_p > 9)
  165. sc->b_per_i_or_p = 9; /* ensure value won't take more than one char */
  166. }
  167. if (st->codec->height == 512 || st->codec->height == 608)
  168. starting_line = 7; // VBI
  169. else if (st->codec->height == 480)
  170. starting_line = 20;
  171. else
  172. starting_line = 23; // default PAL
  173. size = snprintf(buffer, 1024, "Ver 1\nBr %.6f\nIpg 1\nPpi %d\nBpiop %d\n"
  174. "Pix 0\nCf %d\nCg %d\nSl %d\nnl16 %d\nVi 1\nf1 1\n",
  175. (float)st->codec->bit_rate, sc->p_per_gop, sc->b_per_i_or_p,
  176. st->codec->pix_fmt == PIX_FMT_YUV422P ? 2 : 1, sc->first_gop_closed == 1,
  177. starting_line, (st->codec->height + 15) / 16);
  178. avio_w8(pb, TRACK_MPG_AUX);
  179. avio_w8(pb, size + 1);
  180. avio_write(pb, (uint8_t *)buffer, size + 1);
  181. return size + 3;
  182. }
  183. static int gxf_write_timecode_auxiliary(AVIOContext *pb, GXFStreamContext *sc)
  184. {
  185. avio_w8(pb, 0); /* fields */
  186. avio_w8(pb, 0); /* seconds */
  187. avio_w8(pb, 0); /* minutes */
  188. avio_w8(pb, 0); /* flags + hours */
  189. /* reserved */
  190. avio_wb32(pb, 0);
  191. return 8;
  192. }
  193. static int gxf_write_track_description(AVFormatContext *s, GXFStreamContext *sc, int index)
  194. {
  195. AVIOContext *pb = s->pb;
  196. int64_t pos;
  197. int mpeg = sc->track_type == 4 || sc->track_type == 9;
  198. /* track description section */
  199. avio_w8(pb, sc->media_type + 0x80);
  200. avio_w8(pb, index + 0xC0);
  201. pos = avio_tell(pb);
  202. avio_wb16(pb, 0); /* size */
  203. /* media file name */
  204. avio_w8(pb, TRACK_NAME);
  205. avio_w8(pb, strlen(ES_NAME_PATTERN) + 3);
  206. avio_write(pb, ES_NAME_PATTERN, sizeof(ES_NAME_PATTERN) - 1);
  207. avio_wb16(pb, sc->media_info);
  208. avio_w8(pb, 0);
  209. if (!mpeg) {
  210. /* auxiliary information */
  211. avio_w8(pb, TRACK_AUX);
  212. avio_w8(pb, 8);
  213. if (sc->track_type == 3)
  214. gxf_write_timecode_auxiliary(pb, sc);
  215. else
  216. avio_wl64(pb, 0);
  217. }
  218. /* file system version */
  219. avio_w8(pb, TRACK_VER);
  220. avio_w8(pb, 4);
  221. avio_wb32(pb, 0);
  222. if (mpeg)
  223. gxf_write_mpeg_auxiliary(pb, s->streams[index]);
  224. /* frame rate */
  225. avio_w8(pb, TRACK_FPS);
  226. avio_w8(pb, 4);
  227. avio_wb32(pb, sc->frame_rate_index);
  228. /* lines per frame */
  229. avio_w8(pb, TRACK_LINES);
  230. avio_w8(pb, 4);
  231. avio_wb32(pb, sc->lines_index);
  232. /* fields per frame */
  233. avio_w8(pb, TRACK_FPF);
  234. avio_w8(pb, 4);
  235. avio_wb32(pb, sc->fields);
  236. return updateSize(pb, pos);
  237. }
  238. static int gxf_write_material_data_section(AVFormatContext *s)
  239. {
  240. GXFContext *gxf = s->priv_data;
  241. AVIOContext *pb = s->pb;
  242. int64_t pos;
  243. int len;
  244. const char *filename = strrchr(s->filename, '/');
  245. pos = avio_tell(pb);
  246. avio_wb16(pb, 0); /* size */
  247. /* name */
  248. if (filename)
  249. filename++;
  250. else
  251. filename = s->filename;
  252. len = strlen(filename);
  253. avio_w8(pb, MAT_NAME);
  254. avio_w8(pb, strlen(SERVER_PATH) + len + 1);
  255. avio_write(pb, SERVER_PATH, sizeof(SERVER_PATH) - 1);
  256. avio_write(pb, filename, len);
  257. avio_w8(pb, 0);
  258. /* first field */
  259. avio_w8(pb, MAT_FIRST_FIELD);
  260. avio_w8(pb, 4);
  261. avio_wb32(pb, 0);
  262. /* last field */
  263. avio_w8(pb, MAT_LAST_FIELD);
  264. avio_w8(pb, 4);
  265. avio_wb32(pb, gxf->nb_fields);
  266. /* reserved */
  267. avio_w8(pb, MAT_MARK_IN);
  268. avio_w8(pb, 4);
  269. avio_wb32(pb, 0);
  270. avio_w8(pb, MAT_MARK_OUT);
  271. avio_w8(pb, 4);
  272. avio_wb32(pb, gxf->nb_fields);
  273. /* estimated size */
  274. avio_w8(pb, MAT_SIZE);
  275. avio_w8(pb, 4);
  276. avio_wb32(pb, avio_size(pb) / 1024);
  277. return updateSize(pb, pos);
  278. }
  279. static int gxf_write_track_description_section(AVFormatContext *s)
  280. {
  281. GXFContext *gxf = s->priv_data;
  282. AVIOContext *pb = s->pb;
  283. int64_t pos;
  284. int i;
  285. pos = avio_tell(pb);
  286. avio_wb16(pb, 0); /* size */
  287. for (i = 0; i < s->nb_streams; ++i)
  288. gxf_write_track_description(s, s->streams[i]->priv_data, i);
  289. gxf_write_track_description(s, &gxf->timecode_track, s->nb_streams);
  290. return updateSize(pb, pos);
  291. }
  292. static int gxf_write_map_packet(AVFormatContext *s, int rewrite)
  293. {
  294. GXFContext *gxf = s->priv_data;
  295. AVIOContext *pb = s->pb;
  296. int64_t pos = avio_tell(pb);
  297. if (!rewrite) {
  298. if (!(gxf->map_offsets_nb % 30)) {
  299. gxf->map_offsets = av_realloc(gxf->map_offsets,
  300. (gxf->map_offsets_nb+30)*sizeof(*gxf->map_offsets));
  301. if (!gxf->map_offsets) {
  302. av_log(s, AV_LOG_ERROR, "could not realloc map offsets\n");
  303. return -1;
  304. }
  305. }
  306. gxf->map_offsets[gxf->map_offsets_nb++] = pos; // do not increment here
  307. }
  308. gxf_write_packet_header(pb, PKT_MAP);
  309. /* preamble */
  310. avio_w8(pb, 0xE0); /* version */
  311. avio_w8(pb, 0xFF); /* reserved */
  312. gxf_write_material_data_section(s);
  313. gxf_write_track_description_section(s);
  314. return updatePacketSize(pb, pos);
  315. }
  316. static int gxf_write_flt_packet(AVFormatContext *s)
  317. {
  318. GXFContext *gxf = s->priv_data;
  319. AVIOContext *pb = s->pb;
  320. int64_t pos = avio_tell(pb);
  321. int fields_per_flt = (gxf->nb_fields+1) / 1000 + 1;
  322. int flt_entries = gxf->nb_fields / fields_per_flt;
  323. int i = 0;
  324. gxf_write_packet_header(pb, PKT_FLT);
  325. avio_wl32(pb, fields_per_flt); /* number of fields */
  326. avio_wl32(pb, flt_entries); /* number of active flt entries */
  327. if (gxf->flt_entries) {
  328. for (i = 0; i < flt_entries; i++)
  329. avio_wl32(pb, gxf->flt_entries[(i*fields_per_flt)>>1]);
  330. }
  331. for (; i < 1000; i++)
  332. avio_wl32(pb, 0);
  333. return updatePacketSize(pb, pos);
  334. }
  335. static int gxf_write_umf_material_description(AVFormatContext *s)
  336. {
  337. GXFContext *gxf = s->priv_data;
  338. AVIOContext *pb = s->pb;
  339. int timecode_base = gxf->time_base.den == 60000 ? 60 : 50;
  340. int64_t timestamp = 0;
  341. AVDictionaryEntry *t;
  342. uint32_t timecode;
  343. #if FF_API_TIMESTAMP
  344. if (s->timestamp)
  345. timestamp = s->timestamp;
  346. else
  347. #endif
  348. if (t = av_dict_get(s->metadata, "creation_time", NULL, 0))
  349. timestamp = ff_iso8601_to_unix_time(t->value);
  350. // XXX drop frame
  351. timecode =
  352. gxf->nb_fields / (timecode_base * 3600) % 24 << 24 | // hours
  353. gxf->nb_fields / (timecode_base * 60) % 60 << 16 | // minutes
  354. gxf->nb_fields / timecode_base % 60 << 8 | // seconds
  355. gxf->nb_fields % timecode_base; // fields
  356. avio_wl32(pb, gxf->flags);
  357. avio_wl32(pb, gxf->nb_fields); /* length of the longest track */
  358. avio_wl32(pb, gxf->nb_fields); /* length of the shortest track */
  359. avio_wl32(pb, 0); /* mark in */
  360. avio_wl32(pb, gxf->nb_fields); /* mark out */
  361. avio_wl32(pb, 0); /* timecode mark in */
  362. avio_wl32(pb, timecode); /* timecode mark out */
  363. avio_wl64(pb, timestamp); /* modification time */
  364. avio_wl64(pb, timestamp); /* creation time */
  365. avio_wl16(pb, 0); /* reserved */
  366. avio_wl16(pb, 0); /* reserved */
  367. avio_wl16(pb, gxf->audio_tracks);
  368. avio_wl16(pb, 1); /* timecode track count */
  369. avio_wl16(pb, 0); /* reserved */
  370. avio_wl16(pb, gxf->mpeg_tracks);
  371. return 48;
  372. }
  373. static int gxf_write_umf_payload(AVFormatContext *s)
  374. {
  375. GXFContext *gxf = s->priv_data;
  376. AVIOContext *pb = s->pb;
  377. avio_wl32(pb, gxf->umf_length); /* total length of the umf data */
  378. avio_wl32(pb, 3); /* version */
  379. avio_wl32(pb, s->nb_streams+1);
  380. avio_wl32(pb, gxf->umf_track_offset); /* umf track section offset */
  381. avio_wl32(pb, gxf->umf_track_size);
  382. avio_wl32(pb, s->nb_streams+1);
  383. avio_wl32(pb, gxf->umf_media_offset);
  384. avio_wl32(pb, gxf->umf_media_size);
  385. avio_wl32(pb, gxf->umf_length); /* user data offset */
  386. avio_wl32(pb, 0); /* user data size */
  387. avio_wl32(pb, 0); /* reserved */
  388. avio_wl32(pb, 0); /* reserved */
  389. return 48;
  390. }
  391. static int gxf_write_umf_track_description(AVFormatContext *s)
  392. {
  393. AVIOContext *pb = s->pb;
  394. GXFContext *gxf = s->priv_data;
  395. int64_t pos = avio_tell(pb);
  396. int i;
  397. gxf->umf_track_offset = pos - gxf->umf_start_offset;
  398. for (i = 0; i < s->nb_streams; ++i) {
  399. GXFStreamContext *sc = s->streams[i]->priv_data;
  400. avio_wl16(pb, sc->media_info);
  401. avio_wl16(pb, 1);
  402. }
  403. avio_wl16(pb, gxf->timecode_track.media_info);
  404. avio_wl16(pb, 1);
  405. return avio_tell(pb) - pos;
  406. }
  407. static int gxf_write_umf_media_mpeg(AVIOContext *pb, AVStream *st)
  408. {
  409. GXFStreamContext *sc = st->priv_data;
  410. if (st->codec->pix_fmt == PIX_FMT_YUV422P)
  411. avio_wl32(pb, 2);
  412. else
  413. avio_wl32(pb, 1); /* default to 420 */
  414. avio_wl32(pb, sc->first_gop_closed == 1); /* closed = 1, open = 0, unknown = 255 */
  415. avio_wl32(pb, 3); /* top = 1, bottom = 2, frame = 3, unknown = 0 */
  416. avio_wl32(pb, 1); /* I picture per GOP */
  417. avio_wl32(pb, sc->p_per_gop);
  418. avio_wl32(pb, sc->b_per_i_or_p);
  419. if (st->codec->codec_id == CODEC_ID_MPEG2VIDEO)
  420. avio_wl32(pb, 2);
  421. else if (st->codec->codec_id == CODEC_ID_MPEG1VIDEO)
  422. avio_wl32(pb, 1);
  423. else
  424. avio_wl32(pb, 0);
  425. avio_wl32(pb, 0); /* reserved */
  426. return 32;
  427. }
  428. static int gxf_write_umf_media_timecode(AVIOContext *pb, GXFStreamContext *sc)
  429. {
  430. avio_wl32(pb, 1); /* non drop frame */
  431. avio_wl32(pb, 0); /* reserved */
  432. avio_wl32(pb, 0); /* reserved */
  433. avio_wl32(pb, 0); /* reserved */
  434. avio_wl32(pb, 0); /* reserved */
  435. avio_wl32(pb, 0); /* reserved */
  436. avio_wl32(pb, 0); /* reserved */
  437. avio_wl32(pb, 0); /* reserved */
  438. return 32;
  439. }
  440. static int gxf_write_umf_media_dv(AVIOContext *pb, GXFStreamContext *sc)
  441. {
  442. int i;
  443. for (i = 0; i < 8; i++) {
  444. avio_wb32(pb, 0);
  445. }
  446. return 32;
  447. }
  448. static int gxf_write_umf_media_audio(AVIOContext *pb, GXFStreamContext *sc)
  449. {
  450. avio_wl64(pb, av_dbl2int(1)); /* sound level to begin to */
  451. avio_wl64(pb, av_dbl2int(1)); /* sound level to begin to */
  452. avio_wl32(pb, 0); /* number of fields over which to ramp up sound level */
  453. avio_wl32(pb, 0); /* number of fields over which to ramp down sound level */
  454. avio_wl32(pb, 0); /* reserved */
  455. avio_wl32(pb, 0); /* reserved */
  456. return 32;
  457. }
  458. #if 0
  459. static int gxf_write_umf_media_mjpeg(AVIOContext *pb, GXFStreamContext *sc)
  460. {
  461. avio_wb64(pb, 0); /* FIXME FLOAT max chroma quant level */
  462. avio_wb64(pb, 0); /* FIXME FLOAT max luma quant level */
  463. avio_wb64(pb, 0); /* FIXME FLOAT min chroma quant level */
  464. avio_wb64(pb, 0); /* FIXME FLOAT min luma quant level */
  465. return 32;
  466. }
  467. #endif
  468. static int gxf_write_umf_media_description(AVFormatContext *s)
  469. {
  470. GXFContext *gxf = s->priv_data;
  471. AVIOContext *pb = s->pb;
  472. int64_t pos;
  473. int i, j;
  474. pos = avio_tell(pb);
  475. gxf->umf_media_offset = pos - gxf->umf_start_offset;
  476. for (i = 0; i <= s->nb_streams; ++i) {
  477. GXFStreamContext *sc;
  478. int64_t startpos, curpos;
  479. if (i == s->nb_streams)
  480. sc = &gxf->timecode_track;
  481. else
  482. sc = s->streams[i]->priv_data;
  483. startpos = avio_tell(pb);
  484. avio_wl16(pb, 0); /* length */
  485. avio_wl16(pb, sc->media_info);
  486. avio_wl16(pb, 0); /* reserved */
  487. avio_wl16(pb, 0); /* reserved */
  488. avio_wl32(pb, gxf->nb_fields);
  489. avio_wl32(pb, 0); /* attributes rw, ro */
  490. avio_wl32(pb, 0); /* mark in */
  491. avio_wl32(pb, gxf->nb_fields); /* mark out */
  492. avio_write(pb, ES_NAME_PATTERN, strlen(ES_NAME_PATTERN));
  493. avio_wb16(pb, sc->media_info);
  494. for (j = strlen(ES_NAME_PATTERN)+2; j < 88; j++)
  495. avio_w8(pb, 0);
  496. avio_wl32(pb, sc->track_type);
  497. avio_wl32(pb, sc->sample_rate);
  498. avio_wl32(pb, sc->sample_size);
  499. avio_wl32(pb, 0); /* reserved */
  500. if (sc == &gxf->timecode_track)
  501. gxf_write_umf_media_timecode(pb, sc); /* 8 0bytes */
  502. else {
  503. AVStream *st = s->streams[i];
  504. switch (st->codec->codec_id) {
  505. case CODEC_ID_MPEG1VIDEO:
  506. case CODEC_ID_MPEG2VIDEO:
  507. gxf_write_umf_media_mpeg(pb, st);
  508. break;
  509. case CODEC_ID_PCM_S16LE:
  510. gxf_write_umf_media_audio(pb, sc);
  511. break;
  512. case CODEC_ID_DVVIDEO:
  513. gxf_write_umf_media_dv(pb, sc);
  514. break;
  515. }
  516. }
  517. curpos = avio_tell(pb);
  518. avio_seek(pb, startpos, SEEK_SET);
  519. avio_wl16(pb, curpos - startpos);
  520. avio_seek(pb, curpos, SEEK_SET);
  521. }
  522. return avio_tell(pb) - pos;
  523. }
  524. static int gxf_write_umf_packet(AVFormatContext *s)
  525. {
  526. GXFContext *gxf = s->priv_data;
  527. AVIOContext *pb = s->pb;
  528. int64_t pos = avio_tell(pb);
  529. gxf_write_packet_header(pb, PKT_UMF);
  530. /* preamble */
  531. avio_w8(pb, 3); /* first and last (only) packet */
  532. avio_wb32(pb, gxf->umf_length); /* data length */
  533. gxf->umf_start_offset = avio_tell(pb);
  534. gxf_write_umf_payload(s);
  535. gxf_write_umf_material_description(s);
  536. gxf->umf_track_size = gxf_write_umf_track_description(s);
  537. gxf->umf_media_size = gxf_write_umf_media_description(s);
  538. gxf->umf_length = avio_tell(pb) - gxf->umf_start_offset;
  539. return updatePacketSize(pb, pos);
  540. }
  541. static const int GXF_samples_per_frame[] = { 32768, 0 };
  542. static void gxf_init_timecode_track(GXFStreamContext *sc, GXFStreamContext *vsc)
  543. {
  544. if (!vsc)
  545. return;
  546. sc->media_type = vsc->sample_rate == 60 ? 7 : 8;
  547. sc->sample_rate = vsc->sample_rate;
  548. sc->media_info = ('T'<<8) | '0';
  549. sc->track_type = 3;
  550. sc->frame_rate_index = vsc->frame_rate_index;
  551. sc->lines_index = vsc->lines_index;
  552. sc->sample_size = 16;
  553. sc->fields = vsc->fields;
  554. }
  555. static int gxf_write_header(AVFormatContext *s)
  556. {
  557. AVIOContext *pb = s->pb;
  558. GXFContext *gxf = s->priv_data;
  559. GXFStreamContext *vsc = NULL;
  560. uint8_t tracks[255] = {0};
  561. int i, media_info = 0;
  562. if (!pb->seekable) {
  563. av_log(s, AV_LOG_ERROR, "gxf muxer does not support streamed output, patch welcome");
  564. return -1;
  565. }
  566. gxf->flags |= 0x00080000; /* material is simple clip */
  567. for (i = 0; i < s->nb_streams; ++i) {
  568. AVStream *st = s->streams[i];
  569. GXFStreamContext *sc = av_mallocz(sizeof(*sc));
  570. if (!sc)
  571. return AVERROR(ENOMEM);
  572. st->priv_data = sc;
  573. sc->media_type = ff_codec_get_tag(gxf_media_types, st->codec->codec_id);
  574. if (st->codec->codec_type == AVMEDIA_TYPE_AUDIO) {
  575. if (st->codec->codec_id != CODEC_ID_PCM_S16LE) {
  576. av_log(s, AV_LOG_ERROR, "only 16 BIT PCM LE allowed for now\n");
  577. return -1;
  578. }
  579. if (st->codec->sample_rate != 48000) {
  580. av_log(s, AV_LOG_ERROR, "only 48000hz sampling rate is allowed\n");
  581. return -1;
  582. }
  583. if (st->codec->channels != 1) {
  584. av_log(s, AV_LOG_ERROR, "only mono tracks are allowed\n");
  585. return -1;
  586. }
  587. sc->track_type = 2;
  588. sc->sample_rate = st->codec->sample_rate;
  589. av_set_pts_info(st, 64, 1, sc->sample_rate);
  590. sc->sample_size = 16;
  591. sc->frame_rate_index = -2;
  592. sc->lines_index = -2;
  593. sc->fields = -2;
  594. gxf->audio_tracks++;
  595. gxf->flags |= 0x04000000; /* audio is 16 bit pcm */
  596. media_info = 'A';
  597. } else if (st->codec->codec_type == AVMEDIA_TYPE_VIDEO) {
  598. if (i != 0) {
  599. av_log(s, AV_LOG_ERROR, "video stream must be the first track\n");
  600. return -1;
  601. }
  602. /* FIXME check from time_base ? */
  603. if (st->codec->height == 480 || st->codec->height == 512) { /* NTSC or NTSC+VBI */
  604. sc->frame_rate_index = 5;
  605. sc->sample_rate = 60;
  606. gxf->flags |= 0x00000080;
  607. gxf->time_base = (AVRational){ 1001, 60000 };
  608. } else if (st->codec->height == 576 || st->codec->height == 608) { /* PAL or PAL+VBI */
  609. sc->frame_rate_index = 6;
  610. sc->media_type++;
  611. sc->sample_rate = 50;
  612. gxf->flags |= 0x00000040;
  613. gxf->time_base = (AVRational){ 1, 50 };
  614. } else {
  615. av_log(s, AV_LOG_ERROR, "unsupported video resolution, "
  616. "gxf muxer only accepts PAL or NTSC resolutions currently\n");
  617. return -1;
  618. }
  619. av_set_pts_info(st, 64, gxf->time_base.num, gxf->time_base.den);
  620. if (gxf_find_lines_index(st) < 0)
  621. sc->lines_index = -1;
  622. sc->sample_size = st->codec->bit_rate;
  623. sc->fields = 2; /* interlaced */
  624. vsc = sc;
  625. switch (st->codec->codec_id) {
  626. case CODEC_ID_MJPEG:
  627. sc->track_type = 1;
  628. gxf->flags |= 0x00004000;
  629. media_info = 'J';
  630. break;
  631. case CODEC_ID_MPEG1VIDEO:
  632. sc->track_type = 9;
  633. gxf->mpeg_tracks++;
  634. media_info = 'L';
  635. break;
  636. case CODEC_ID_MPEG2VIDEO:
  637. sc->first_gop_closed = -1;
  638. sc->track_type = 4;
  639. gxf->mpeg_tracks++;
  640. gxf->flags |= 0x00008000;
  641. media_info = 'M';
  642. break;
  643. case CODEC_ID_DVVIDEO:
  644. if (st->codec->pix_fmt == PIX_FMT_YUV422P) {
  645. sc->media_type += 2;
  646. sc->track_type = 6;
  647. gxf->flags |= 0x00002000;
  648. media_info = 'E';
  649. } else {
  650. sc->track_type = 5;
  651. gxf->flags |= 0x00001000;
  652. media_info = 'D';
  653. }
  654. break;
  655. default:
  656. av_log(s, AV_LOG_ERROR, "video codec not supported\n");
  657. return -1;
  658. }
  659. }
  660. /* FIXME first 10 audio tracks are 0 to 9 next 22 are A to V */
  661. sc->media_info = media_info<<8 | ('0'+tracks[media_info]++);
  662. sc->order = s->nb_streams - st->index;
  663. }
  664. if (ff_audio_interleave_init(s, GXF_samples_per_frame, (AVRational){ 1, 48000 }) < 0)
  665. return -1;
  666. gxf_init_timecode_track(&gxf->timecode_track, vsc);
  667. gxf->flags |= 0x200000; // time code track is non-drop frame
  668. gxf_write_map_packet(s, 0);
  669. gxf_write_flt_packet(s);
  670. gxf_write_umf_packet(s);
  671. gxf->packet_count = 3;
  672. avio_flush(pb);
  673. return 0;
  674. }
  675. static int gxf_write_eos_packet(AVIOContext *pb)
  676. {
  677. int64_t pos = avio_tell(pb);
  678. gxf_write_packet_header(pb, PKT_EOS);
  679. return updatePacketSize(pb, pos);
  680. }
  681. static int gxf_write_trailer(AVFormatContext *s)
  682. {
  683. GXFContext *gxf = s->priv_data;
  684. AVIOContext *pb = s->pb;
  685. int64_t end;
  686. int i;
  687. ff_audio_interleave_close(s);
  688. gxf_write_eos_packet(pb);
  689. end = avio_tell(pb);
  690. avio_seek(pb, 0, SEEK_SET);
  691. /* overwrite map, flt and umf packets with new values */
  692. gxf_write_map_packet(s, 1);
  693. gxf_write_flt_packet(s);
  694. gxf_write_umf_packet(s);
  695. avio_flush(pb);
  696. /* update duration in all map packets */
  697. for (i = 1; i < gxf->map_offsets_nb; i++) {
  698. avio_seek(pb, gxf->map_offsets[i], SEEK_SET);
  699. gxf_write_map_packet(s, 1);
  700. avio_flush(pb);
  701. }
  702. avio_seek(pb, end, SEEK_SET);
  703. av_freep(&gxf->flt_entries);
  704. av_freep(&gxf->map_offsets);
  705. return 0;
  706. }
  707. static int gxf_parse_mpeg_frame(GXFStreamContext *sc, const uint8_t *buf, int size)
  708. {
  709. uint32_t c=-1;
  710. int i;
  711. for(i=0; i<size-4 && c!=0x100; i++){
  712. c = (c<<8) + buf[i];
  713. if(c == 0x1B8 && sc->first_gop_closed == -1) /* GOP start code */
  714. sc->first_gop_closed= (buf[i+4]>>6)&1;
  715. }
  716. return (buf[i+1]>>3)&7;
  717. }
  718. static int gxf_write_media_preamble(AVFormatContext *s, AVPacket *pkt, int size)
  719. {
  720. GXFContext *gxf = s->priv_data;
  721. AVIOContext *pb = s->pb;
  722. AVStream *st = s->streams[pkt->stream_index];
  723. GXFStreamContext *sc = st->priv_data;
  724. unsigned field_nb;
  725. /* If the video is frame-encoded, the frame numbers shall be represented by
  726. * even field numbers.
  727. * see SMPTE360M-2004 6.4.2.1.3 Media field number */
  728. if (st->codec->codec_type == AVMEDIA_TYPE_VIDEO) {
  729. field_nb = gxf->nb_fields;
  730. } else {
  731. field_nb = av_rescale_rnd(pkt->dts, gxf->time_base.den,
  732. (int64_t)48000*gxf->time_base.num, AV_ROUND_UP);
  733. }
  734. avio_w8(pb, sc->media_type);
  735. avio_w8(pb, st->index);
  736. avio_wb32(pb, field_nb);
  737. if (st->codec->codec_type == AVMEDIA_TYPE_AUDIO) {
  738. avio_wb16(pb, 0);
  739. avio_wb16(pb, size / 2);
  740. } else if (st->codec->codec_id == CODEC_ID_MPEG2VIDEO) {
  741. int frame_type = gxf_parse_mpeg_frame(sc, pkt->data, pkt->size);
  742. if (frame_type == AV_PICTURE_TYPE_I) {
  743. avio_w8(pb, 0x0d);
  744. sc->iframes++;
  745. } else if (frame_type == AV_PICTURE_TYPE_B) {
  746. avio_w8(pb, 0x0f);
  747. sc->bframes++;
  748. } else {
  749. avio_w8(pb, 0x0e);
  750. sc->pframes++;
  751. }
  752. avio_wb24(pb, size);
  753. } else if (st->codec->codec_id == CODEC_ID_DVVIDEO) {
  754. avio_w8(pb, size / 4096);
  755. avio_wb24(pb, 0);
  756. } else
  757. avio_wb32(pb, size);
  758. avio_wb32(pb, field_nb);
  759. avio_w8(pb, 1); /* flags */
  760. avio_w8(pb, 0); /* reserved */
  761. return 16;
  762. }
  763. static int gxf_write_packet(AVFormatContext *s, AVPacket *pkt)
  764. {
  765. GXFContext *gxf = s->priv_data;
  766. AVIOContext *pb = s->pb;
  767. AVStream *st = s->streams[pkt->stream_index];
  768. int64_t pos = avio_tell(pb);
  769. int padding = 0;
  770. int packet_start_offset = avio_tell(pb) / 1024;
  771. gxf_write_packet_header(pb, PKT_MEDIA);
  772. if (st->codec->codec_id == CODEC_ID_MPEG2VIDEO && pkt->size % 4) /* MPEG-2 frames must be padded */
  773. padding = 4 - pkt->size % 4;
  774. else if (st->codec->codec_type == AVMEDIA_TYPE_AUDIO)
  775. padding = GXF_AUDIO_PACKET_SIZE - pkt->size;
  776. gxf_write_media_preamble(s, pkt, pkt->size + padding);
  777. avio_write(pb, pkt->data, pkt->size);
  778. gxf_write_padding(pb, padding);
  779. if (st->codec->codec_type == AVMEDIA_TYPE_VIDEO) {
  780. if (!(gxf->flt_entries_nb % 500)) {
  781. gxf->flt_entries = av_realloc(gxf->flt_entries,
  782. (gxf->flt_entries_nb+500)*sizeof(*gxf->flt_entries));
  783. if (!gxf->flt_entries) {
  784. av_log(s, AV_LOG_ERROR, "could not reallocate flt entries\n");
  785. return -1;
  786. }
  787. }
  788. gxf->flt_entries[gxf->flt_entries_nb++] = packet_start_offset;
  789. gxf->nb_fields += 2; // count fields
  790. }
  791. updatePacketSize(pb, pos);
  792. gxf->packet_count++;
  793. if (gxf->packet_count == 100) {
  794. gxf_write_map_packet(s, 0);
  795. gxf->packet_count = 0;
  796. }
  797. avio_flush(pb);
  798. return 0;
  799. }
  800. static int gxf_compare_field_nb(AVFormatContext *s, AVPacket *next, AVPacket *cur)
  801. {
  802. GXFContext *gxf = s->priv_data;
  803. AVPacket *pkt[2] = { cur, next };
  804. int i, field_nb[2];
  805. GXFStreamContext *sc[2];
  806. for (i = 0; i < 2; i++) {
  807. AVStream *st = s->streams[pkt[i]->stream_index];
  808. sc[i] = st->priv_data;
  809. if (st->codec->codec_type == AVMEDIA_TYPE_AUDIO) {
  810. field_nb[i] = av_rescale_rnd(pkt[i]->dts, gxf->time_base.den,
  811. (int64_t)48000*gxf->time_base.num, AV_ROUND_UP);
  812. field_nb[i] &= ~1; // compare against even field number because audio must be before video
  813. } else
  814. field_nb[i] = pkt[i]->dts; // dts are field based
  815. }
  816. return field_nb[1] > field_nb[0] ||
  817. (field_nb[1] == field_nb[0] && sc[1]->order > sc[0]->order);
  818. }
  819. static int gxf_interleave_packet(AVFormatContext *s, AVPacket *out, AVPacket *pkt, int flush)
  820. {
  821. if (pkt && s->streams[pkt->stream_index]->codec->codec_type == AVMEDIA_TYPE_VIDEO)
  822. pkt->duration = 2; // enforce 2 fields
  823. return ff_audio_rechunk_interleave(s, out, pkt, flush,
  824. av_interleave_packet_per_dts, gxf_compare_field_nb);
  825. }
  826. AVOutputFormat ff_gxf_muxer = {
  827. .name = "gxf",
  828. .long_name = NULL_IF_CONFIG_SMALL("GXF format"),
  829. .extensions = "gxf",
  830. .priv_data_size = sizeof(GXFContext),
  831. .audio_codec = CODEC_ID_PCM_S16LE,
  832. .video_codec = CODEC_ID_MPEG2VIDEO,
  833. .write_header = gxf_write_header,
  834. .write_packet = gxf_write_packet,
  835. .write_trailer = gxf_write_trailer,
  836. .interleave_packet = gxf_interleave_packet,
  837. };