You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

481 lines
17KB

  1. /*
  2. * ISO Media common code
  3. * Copyright (c) 2001 Fabrice Bellard
  4. * Copyright (c) 2002 Francois Revol <revol@free.fr>
  5. * Copyright (c) 2006 Baptiste Coudurier <baptiste.coudurier@free.fr>
  6. *
  7. * This file is part of FFmpeg.
  8. *
  9. * FFmpeg is free software; you can redistribute it and/or
  10. * modify it under the terms of the GNU Lesser General Public
  11. * License as published by the Free Software Foundation; either
  12. * version 2.1 of the License, or (at your option) any later version.
  13. *
  14. * FFmpeg is distributed in the hope that it will be useful,
  15. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  16. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  17. * Lesser General Public License for more details.
  18. *
  19. * You should have received a copy of the GNU Lesser General Public
  20. * License along with FFmpeg; if not, write to the Free Software
  21. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  22. */
  23. #include "avformat.h"
  24. #include "internal.h"
  25. #include "isom.h"
  26. #include "libavcodec/mpeg4audio.h"
  27. #include "libavcodec/mpegaudiodata.h"
  28. #include "libavutil/avstring.h"
  29. #include "libavutil/intreadwrite.h"
  30. /* http://www.mp4ra.org */
  31. /* ordered by muxing preference */
  32. const AVCodecTag ff_mp4_obj_type[] = {
  33. { AV_CODEC_ID_MOV_TEXT , 0x08 },
  34. { AV_CODEC_ID_MPEG4 , 0x20 },
  35. { AV_CODEC_ID_H264 , 0x21 },
  36. { AV_CODEC_ID_HEVC , 0x23 },
  37. { AV_CODEC_ID_AAC , 0x40 },
  38. { AV_CODEC_ID_MP4ALS , 0x40 }, /* 14496-3 ALS */
  39. { AV_CODEC_ID_MPEG2VIDEO , 0x61 }, /* MPEG-2 Main */
  40. { AV_CODEC_ID_MPEG2VIDEO , 0x60 }, /* MPEG-2 Simple */
  41. { AV_CODEC_ID_MPEG2VIDEO , 0x62 }, /* MPEG-2 SNR */
  42. { AV_CODEC_ID_MPEG2VIDEO , 0x63 }, /* MPEG-2 Spatial */
  43. { AV_CODEC_ID_MPEG2VIDEO , 0x64 }, /* MPEG-2 High */
  44. { AV_CODEC_ID_MPEG2VIDEO , 0x65 }, /* MPEG-2 422 */
  45. { AV_CODEC_ID_AAC , 0x66 }, /* MPEG-2 AAC Main */
  46. { AV_CODEC_ID_AAC , 0x67 }, /* MPEG-2 AAC Low */
  47. { AV_CODEC_ID_AAC , 0x68 }, /* MPEG-2 AAC SSR */
  48. { AV_CODEC_ID_MP3 , 0x69 }, /* 13818-3 */
  49. { AV_CODEC_ID_MP2 , 0x69 }, /* 11172-3 */
  50. { AV_CODEC_ID_MPEG1VIDEO , 0x6A }, /* 11172-2 */
  51. { AV_CODEC_ID_MP3 , 0x6B }, /* 11172-3 */
  52. { AV_CODEC_ID_MJPEG , 0x6C }, /* 10918-1 */
  53. { AV_CODEC_ID_PNG , 0x6D },
  54. { AV_CODEC_ID_JPEG2000 , 0x6E }, /* 15444-1 */
  55. { AV_CODEC_ID_VC1 , 0xA3 },
  56. { AV_CODEC_ID_DIRAC , 0xA4 },
  57. { AV_CODEC_ID_AC3 , 0xA5 },
  58. { AV_CODEC_ID_EAC3 , 0xA6 },
  59. { AV_CODEC_ID_DTS , 0xA9 }, /* mp4ra.org */
  60. { AV_CODEC_ID_OPUS , 0xAD }, /* mp4ra.org */
  61. { AV_CODEC_ID_VP9 , 0xB1 }, /* mp4ra.org */
  62. { AV_CODEC_ID_FLAC , 0xC1 }, /* nonstandard, update when there is a standard value */
  63. { AV_CODEC_ID_TSCC2 , 0xD0 }, /* nonstandard, camtasia uses it */
  64. { AV_CODEC_ID_EVRC , 0xD1 }, /* nonstandard, pvAuthor uses it */
  65. { AV_CODEC_ID_VORBIS , 0xDD }, /* nonstandard, gpac uses it */
  66. { AV_CODEC_ID_DVD_SUBTITLE, 0xE0 }, /* nonstandard, see unsupported-embedded-subs-2.mp4 */
  67. { AV_CODEC_ID_QCELP , 0xE1 },
  68. { AV_CODEC_ID_MPEG4SYSTEMS, 0x01 },
  69. { AV_CODEC_ID_MPEG4SYSTEMS, 0x02 },
  70. { AV_CODEC_ID_NONE , 0 },
  71. };
  72. const AVCodecTag ff_codec_movsubtitle_tags[] = {
  73. { AV_CODEC_ID_MOV_TEXT, MKTAG('t', 'e', 'x', 't') },
  74. { AV_CODEC_ID_MOV_TEXT, MKTAG('t', 'x', '3', 'g') },
  75. { AV_CODEC_ID_EIA_608, MKTAG('c', '6', '0', '8') },
  76. { AV_CODEC_ID_NONE, 0 },
  77. };
  78. const AVCodecTag ff_codec_movdata_tags[] = {
  79. { AV_CODEC_ID_BIN_DATA, MKTAG('g', 'p', 'm', 'd') },
  80. { AV_CODEC_ID_NONE, 0 },
  81. };
  /*
   * Maps the numeric language codes of the mdhd atom to ISO 639 strings.
   * The array index is the numeric code itself.
   *
   * cf. QTFileFormat.pdf p253, qtff.pdf p205
   * http://developer.apple.com/documentation/mac/Text/Text-368.html
   *
   * This numbering is deprecated by putting the code as 3*5 bits ASCII.
   *
   * Entries that are "" (written out or left implicit) have no string in
   * this table. Some entries are two letters padded with a space.
   */
  static const char mov_mdhd_language_map[][4] = {
      [  0] = "eng", /* English */
      [  1] = "fra", /* French */
      [  2] = "ger", /* German */
      [  3] = "ita", /* Italian */
      [  4] = "dut", /* Dutch */
      [  5] = "sve", /* Swedish */
      [  6] = "spa", /* Spanish */
      [  7] = "dan", /* Danish */
      [  8] = "por", /* Portuguese */
      [  9] = "nor", /* Norwegian */
      [ 10] = "heb", /* Hebrew */
      [ 11] = "jpn", /* Japanese */
      [ 12] = "ara", /* Arabic */
      [ 13] = "fin", /* Finnish */
      [ 14] = "gre", /* Greek */
      [ 15] = "ice", /* Icelandic */
      [ 16] = "mlt", /* Maltese */
      [ 17] = "tur", /* Turkish */
      [ 18] = "hr ", /* Croatian */
      [ 19] = "chi", /* Traditional Chinese */
      [ 20] = "urd", /* Urdu */
      [ 21] = "hin", /* Hindi */
      [ 22] = "tha", /* Thai */
      [ 23] = "kor", /* Korean */
      [ 24] = "lit", /* Lithuanian */
      [ 25] = "pol", /* Polish */
      [ 26] = "hun", /* Hungarian */
      [ 27] = "est", /* Estonian */
      [ 28] = "lav", /* Latvian */
      [ 29] = "",    /* Sami */
      [ 30] = "fo ", /* Faroese */
      [ 31] = "",    /* Farsi */
      [ 32] = "rus", /* Russian */
      [ 33] = "chi", /* Simplified Chinese */
      [ 34] = "",    /* Flemish */
      [ 35] = "iri", /* Irish */
      [ 36] = "alb", /* Albanian */
      [ 37] = "ron", /* Romanian */
      [ 38] = "ces", /* Czech */
      [ 39] = "slk", /* Slovak */
      [ 40] = "slv", /* Slovenian */
      [ 41] = "yid", /* Yiddish */
      [ 42] = "sr ", /* Serbian */
      [ 43] = "mac", /* Macedonian */
      [ 44] = "bul", /* Bulgarian */
      [ 45] = "ukr", /* Ukrainian */
      [ 46] = "bel", /* Belarusian */
      [ 47] = "uzb", /* Uzbek */
      [ 48] = "kaz", /* Kazakh */
      [ 49] = "aze", /* Azerbaijani */
      [ 50] = "aze", /* AzerbaijanAr */
      [ 51] = "arm", /* Armenian */
      [ 52] = "geo", /* Georgian */
      [ 53] = "mol", /* Moldavian */
      [ 54] = "kir", /* Kirghiz */
      [ 55] = "tgk", /* Tajiki */
      [ 56] = "tuk", /* Turkmen */
      [ 57] = "mon", /* Mongolian */
      [ 58] = "",    /* MongolianCyr */
      [ 59] = "pus", /* Pashto */
      [ 60] = "kur", /* Kurdish */
      [ 61] = "kas", /* Kashmiri */
      [ 62] = "snd", /* Sindhi */
      [ 63] = "tib", /* Tibetan */
      [ 64] = "nep", /* Nepali */
      [ 65] = "san", /* Sanskrit */
      [ 66] = "mar", /* Marathi */
      [ 67] = "ben", /* Bengali */
      [ 68] = "asm", /* Assamese */
      [ 69] = "guj", /* Gujarati */
      [ 70] = "pa ", /* Punjabi */
      [ 71] = "ori", /* Oriya */
      [ 72] = "mal", /* Malayalam */
      [ 73] = "kan", /* Kannada */
      [ 74] = "tam", /* Tamil */
      [ 75] = "tel", /* Telugu */
      [ 76] = "",    /* Sinhala */
      [ 77] = "bur", /* Burmese */
      [ 78] = "khm", /* Khmer */
      [ 79] = "lao", /* Lao */
      [ 80] = "vie", /* Vietnamese */
      [ 81] = "ind", /* Indonesian */
      [ 82] = "tgl", /* Tagalog */
      [ 83] = "may", /* MalayRoman */
      [ 84] = "may", /* MalayArabic */
      [ 85] = "amh", /* Amharic */
      [ 86] = "tir", /* Galla; NOTE(review): "tir" looks like the ISO 639-2 code for Tigrinya - confirm label */
      [ 87] = "orm", /* Oromo */
      [ 88] = "som", /* Somali */
      [ 89] = "swa", /* Swahili */
      [ 90] = "",    /* Kinyarwanda */
      [ 91] = "run", /* Rundi */
      [ 92] = "",    /* Nyanja */
      [ 93] = "mlg", /* Malagasy */
      [ 94] = "epo", /* Esperanto */
      /* 95 .. 127 carry no language; they are implicitly initialized to "" */
      [128] = "wel", /* Welsh */
      [129] = "baq", /* Basque */
      [130] = "cat", /* Catalan */
      [131] = "lat", /* Latin */
      [132] = "que", /* Quechua */
      [133] = "grn", /* Guarani */
      [134] = "aym", /* Aymara */
      [135] = "tat", /* Tatar */
      [136] = "uig", /* Uighur */
      [137] = "dzo", /* Dzongkha */
      [138] = "jav", /* JavaneseRom */
  };
  227. int ff_mov_iso639_to_lang(const char lang[4], int mp4)
  228. {
  229. int i, code = 0;
  230. /* old way, only for QT? */
  231. for (i = 0; lang[0] && !mp4 && i < FF_ARRAY_ELEMS(mov_mdhd_language_map); i++) {
  232. if (!strcmp(lang, mov_mdhd_language_map[i]))
  233. return i;
  234. }
  235. /* XXX:can we do that in mov too? */
  236. if (!mp4)
  237. return -1;
  238. /* handle undefined as such */
  239. if (lang[0] == '\0')
  240. lang = "und";
  241. /* 5 bits ASCII */
  242. for (i = 0; i < 3; i++) {
  243. uint8_t c = lang[i];
  244. c -= 0x60;
  245. if (c > 0x1f)
  246. return -1;
  247. code <<= 5;
  248. code |= c;
  249. }
  250. return code;
  251. }
  252. int ff_mov_lang_to_iso639(unsigned code, char to[4])
  253. {
  254. int i;
  255. memset(to, 0, 4);
  256. /* is it the mangled iso code? */
  257. /* see http://www.geocities.com/xhelmboyx/quicktime/formats/mp4-layout.txt */
  258. if (code >= 0x400 && code != 0x7fff) {
  259. for (i = 2; i >= 0; i--) {
  260. to[i] = 0x60 + (code & 0x1f);
  261. code >>= 5;
  262. }
  263. return 1;
  264. }
  265. /* old fashion apple lang code */
  266. if (code >= FF_ARRAY_ELEMS(mov_mdhd_language_map))
  267. return 0;
  268. if (!mov_mdhd_language_map[code][0])
  269. return 0;
  270. memcpy(to, mov_mdhd_language_map[code], 4);
  271. return 1;
  272. }
  273. int ff_mp4_read_descr_len(AVIOContext *pb)
  274. {
  275. int len = 0;
  276. int count = 4;
  277. while (count--) {
  278. int c = avio_r8(pb);
  279. len = (len << 7) | (c & 0x7f);
  280. if (!(c & 0x80))
  281. break;
  282. }
  283. return len;
  284. }
  285. int ff_mp4_read_descr(AVFormatContext *fc, AVIOContext *pb, int *tag)
  286. {
  287. int len;
  288. *tag = avio_r8(pb);
  289. len = ff_mp4_read_descr_len(pb);
  290. av_log(fc, AV_LOG_TRACE, "MPEG-4 description: tag=0x%02x len=%d\n", *tag, len);
  291. return len;
  292. }
  293. void ff_mp4_parse_es_descr(AVIOContext *pb, int *es_id)
  294. {
  295. int flags;
  296. if (es_id) *es_id = avio_rb16(pb);
  297. else avio_rb16(pb);
  298. flags = avio_r8(pb);
  299. if (flags & 0x80) //streamDependenceFlag
  300. avio_rb16(pb);
  301. if (flags & 0x40) { //URL_Flag
  302. int len = avio_r8(pb);
  303. avio_skip(pb, len);
  304. }
  305. if (flags & 0x20) //OCRstreamFlag
  306. avio_rb16(pb);
  307. }
  308. static const AVCodecTag mp4_audio_types[] = {
  309. { AV_CODEC_ID_MP3ON4, AOT_PS }, /* old mp3on4 draft */
  310. { AV_CODEC_ID_MP3ON4, AOT_L1 }, /* layer 1 */
  311. { AV_CODEC_ID_MP3ON4, AOT_L2 }, /* layer 2 */
  312. { AV_CODEC_ID_MP3ON4, AOT_L3 }, /* layer 3 */
  313. { AV_CODEC_ID_MP4ALS, AOT_ALS }, /* MPEG-4 ALS */
  314. { AV_CODEC_ID_NONE, AOT_NULL },
  315. };
  316. int ff_mp4_read_dec_config_descr(AVFormatContext *fc, AVStream *st, AVIOContext *pb)
  317. {
  318. enum AVCodecID codec_id;
  319. unsigned v;
  320. int len, tag;
  321. int ret;
  322. int object_type_id = avio_r8(pb);
  323. avio_r8(pb); /* stream type */
  324. avio_rb24(pb); /* buffer size db */
  325. v = avio_rb32(pb);
  326. // TODO: fix this with codecpar
  327. #if FF_API_LAVF_AVCTX
  328. FF_DISABLE_DEPRECATION_WARNINGS
  329. if (v < INT32_MAX)
  330. st->codec->rc_max_rate = v;
  331. FF_ENABLE_DEPRECATION_WARNINGS
  332. #endif
  333. st->codecpar->bit_rate = avio_rb32(pb); /* avg bitrate */
  334. codec_id= ff_codec_get_id(ff_mp4_obj_type, object_type_id);
  335. if (codec_id)
  336. st->codecpar->codec_id = codec_id;
  337. av_log(fc, AV_LOG_TRACE, "esds object type id 0x%02x\n", object_type_id);
  338. len = ff_mp4_read_descr(fc, pb, &tag);
  339. if (tag == MP4DecSpecificDescrTag) {
  340. av_log(fc, AV_LOG_TRACE, "Specific MPEG-4 header len=%d\n", len);
  341. /* As per 14496-3:2009 9.D.2.2, No decSpecificInfo is defined
  342. for MPEG-1 Audio or MPEG-2 Audio; MPEG-2 AAC excluded. */
  343. if (object_type_id == 0x69 || object_type_id == 0x6b)
  344. return 0;
  345. if (!len || (uint64_t)len > (1<<30))
  346. return AVERROR_INVALIDDATA;
  347. if ((ret = ff_get_extradata(fc, st->codecpar, pb, len)) < 0)
  348. return ret;
  349. if (st->codecpar->codec_id == AV_CODEC_ID_AAC) {
  350. MPEG4AudioConfig cfg = {0};
  351. ret = avpriv_mpeg4audio_get_config2(&cfg, st->codecpar->extradata,
  352. st->codecpar->extradata_size, 1, fc);
  353. if (ret < 0)
  354. return ret;
  355. st->codecpar->channels = cfg.channels;
  356. if (cfg.object_type == 29 && cfg.sampling_index < 3) // old mp3on4
  357. st->codecpar->sample_rate = avpriv_mpa_freq_tab[cfg.sampling_index];
  358. else if (cfg.ext_sample_rate)
  359. st->codecpar->sample_rate = cfg.ext_sample_rate;
  360. else
  361. st->codecpar->sample_rate = cfg.sample_rate;
  362. av_log(fc, AV_LOG_TRACE, "mp4a config channels %d obj %d ext obj %d "
  363. "sample rate %d ext sample rate %d\n", st->codecpar->channels,
  364. cfg.object_type, cfg.ext_object_type,
  365. cfg.sample_rate, cfg.ext_sample_rate);
  366. if (!(st->codecpar->codec_id = ff_codec_get_id(mp4_audio_types,
  367. cfg.object_type)))
  368. st->codecpar->codec_id = AV_CODEC_ID_AAC;
  369. }
  370. }
  371. return 0;
  372. }
  /* One row of the channel layout <-> container layout tag table. */
  struct MovChannelLayout {
      int64_t  channel_layout; /* channel layout mask (AV_CH_LAYOUT_* values) */
      uint32_t layout_tag;     /* container tag, written as (id << 16) | channels */
  };
  typedef struct MovChannelLayout MovChannelLayout;
  377. static const MovChannelLayout mov_channel_layout[] = {
  378. { AV_CH_LAYOUT_MONO, (100<<16) | 1}, // kCAFChannelLayoutTag_Mono
  379. { AV_CH_LAYOUT_STEREO, (101<<16) | 2}, // kCAFChannelLayoutTag_Stereo
  380. { AV_CH_LAYOUT_STEREO, (102<<16) | 2}, // kCAFChannelLayoutTag_StereoHeadphones
  381. { AV_CH_LAYOUT_2_1, (131<<16) | 3}, // kCAFChannelLayoutTag_ITU_2_1
  382. { AV_CH_LAYOUT_QUAD, (132<<16) | 4}, // kCAFChannelLayoutTag_ITU_2_2
  383. { AV_CH_LAYOUT_2_2, (132<<16) | 4}, // kCAFChannelLayoutTag_ITU_2_2
  384. { AV_CH_LAYOUT_QUAD, (108<<16) | 4}, // kCAFChannelLayoutTag_Quadraphonic
  385. { AV_CH_LAYOUT_SURROUND, (113<<16) | 3}, // kCAFChannelLayoutTag_MPEG_3_0_A
  386. { AV_CH_LAYOUT_4POINT0, (115<<16) | 4}, // kCAFChannelLayoutTag_MPEG_4_0_A
  387. { AV_CH_LAYOUT_5POINT0_BACK, (117<<16) | 5}, // kCAFChannelLayoutTag_MPEG_5_0_A
  388. { AV_CH_LAYOUT_5POINT0, (117<<16) | 5}, // kCAFChannelLayoutTag_MPEG_5_0_A
  389. { AV_CH_LAYOUT_5POINT1_BACK, (121<<16) | 6}, // kCAFChannelLayoutTag_MPEG_5_1_A
  390. { AV_CH_LAYOUT_5POINT1, (121<<16) | 6}, // kCAFChannelLayoutTag_MPEG_5_1_A
  391. { AV_CH_LAYOUT_7POINT1, (128<<16) | 8}, // kCAFChannelLayoutTag_MPEG_7_1_C
  392. { AV_CH_LAYOUT_7POINT1_WIDE, (126<<16) | 8}, // kCAFChannelLayoutTag_MPEG_7_1_A
  393. { AV_CH_LAYOUT_5POINT1_BACK|AV_CH_LAYOUT_STEREO_DOWNMIX, (130<<16) | 8}, // kCAFChannelLayoutTag_SMPTE_DTV
  394. { AV_CH_LAYOUT_STEREO|AV_CH_LOW_FREQUENCY, (133<<16) | 3}, // kCAFChannelLayoutTag_DVD_4
  395. { AV_CH_LAYOUT_2_1|AV_CH_LOW_FREQUENCY, (134<<16) | 4}, // kCAFChannelLayoutTag_DVD_5
  396. { AV_CH_LAYOUT_QUAD|AV_CH_LOW_FREQUENCY, (135<<16) | 4}, // kCAFChannelLayoutTag_DVD_6
  397. { AV_CH_LAYOUT_2_2|AV_CH_LOW_FREQUENCY, (135<<16) | 4}, // kCAFChannelLayoutTag_DVD_6
  398. { AV_CH_LAYOUT_SURROUND|AV_CH_LOW_FREQUENCY, (136<<16) | 4}, // kCAFChannelLayoutTag_DVD_10
  399. { AV_CH_LAYOUT_4POINT0|AV_CH_LOW_FREQUENCY, (137<<16) | 5}, // kCAFChannelLayoutTag_DVD_11
  400. { 0, 0},
  401. };
  /* The reader below is compiled out by the surrounding #if 0. */
  #if 0
  /**
   * Read a channel layout description of 'size' bytes from s->pb and store
   * the resulting layout in the stream's codec context.
   *
   * @return 0 on success, AVERROR_INVALIDDATA if size is smaller than 12
   */
  int ff_mov_read_chan(AVFormatContext *s, AVStream *st, int64_t size)
  {
      AVCodecContext *avctx = st->codec;
      AVIOContext *pb = s->pb;
      const MovChannelLayout *entry;
      uint32_t layout_tag;

      if (size < 12)
          return AVERROR_INVALIDDATA;

      layout_tag = avio_rb32(pb);
      size -= 4;

      if (layout_tag == 0) { // kCAFChannelLayoutTag_UseChannelDescriptions
          // Channel descriptions not implemented
          av_log_ask_for_sample(s, "Unimplemented container channel layout.\n");
          avio_skip(pb, size);
          return 0;
      }

      if (layout_tag == 0x10000) { // kCAFChannelLayoutTag_UseChannelBitmap
          codec->channel_layout = avio_rb32(pb);
          size -= 4;
          avio_skip(pb, size);
          return 0;
      }

      /* look the tag up in the table; stop at the first match */
      for (entry = mov_channel_layout; entry->channel_layout; entry++) {
          if (entry->layout_tag == layout_tag) {
              avctx->channel_layout = entry->channel_layout;
              break;
          }
      }

      if (!avctx->channel_layout)
          av_log(s, AV_LOG_WARNING, "Unknown container channel layout.\n");

      avio_skip(pb, size);
      return 0;
  }
  #endif
  438. void ff_mov_write_chan(AVIOContext *pb, int64_t channel_layout)
  439. {
  440. const MovChannelLayout *layouts;
  441. uint32_t layout_tag = 0;
  442. for (layouts = mov_channel_layout; layouts->channel_layout; layouts++)
  443. if (channel_layout == layouts->channel_layout) {
  444. layout_tag = layouts->layout_tag;
  445. break;
  446. }
  447. if (layout_tag) {
  448. avio_wb32(pb, layout_tag); // mChannelLayoutTag
  449. avio_wb32(pb, 0); // mChannelBitmap
  450. } else {
  451. avio_wb32(pb, 0x10000); // kCAFChannelLayoutTag_UseChannelBitmap
  452. avio_wb32(pb, channel_layout);
  453. }
  454. avio_wb32(pb, 0); // mNumberChannelDescriptions
  455. }