You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

280 lines
9.2KB

  1. /*
  2. * Core Audio Format muxer
  3. * Copyright (c) 2011 Carl Eugen Hoyos
  4. *
  5. * This file is part of FFmpeg.
  6. *
  7. * FFmpeg is free software; you can redistribute it and/or
  8. * modify it under the terms of the GNU Lesser General Public
  9. * License as published by the Free Software Foundation; either
  10. * version 2.1 of the License, or (at your option) any later version.
  11. *
  12. * FFmpeg is distributed in the hope that it will be useful,
  13. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  15. * Lesser General Public License for more details.
  16. *
  17. * You should have received a copy of the GNU Lesser General Public
  18. * License along with FFmpeg; if not, write to the Free Software
  19. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  20. */
  21. #include "avformat.h"
  22. #include "caf.h"
  23. #include "isom.h"
  24. #include "avio_internal.h"
  25. #include "libavutil/intfloat.h"
  26. #include "libavutil/dict.h"
  27. typedef struct {
  28. int64_t data;
  29. uint8_t *pkt_sizes;
  30. int size_buffer_size;
  31. int size_entries_used;
  32. int packets;
  33. } CAFContext;
  34. static uint32_t codec_flags(enum AVCodecID codec_id) {
  35. switch (codec_id) {
  36. case AV_CODEC_ID_PCM_F32BE:
  37. case AV_CODEC_ID_PCM_F64BE:
  38. return 1; //< kCAFLinearPCMFormatFlagIsFloat
  39. case AV_CODEC_ID_PCM_S16LE:
  40. case AV_CODEC_ID_PCM_S24LE:
  41. case AV_CODEC_ID_PCM_S32LE:
  42. return 2; //< kCAFLinearPCMFormatFlagIsLittleEndian
  43. case AV_CODEC_ID_PCM_F32LE:
  44. case AV_CODEC_ID_PCM_F64LE:
  45. return 3; //< kCAFLinearPCMFormatFlagIsFloat | kCAFLinearPCMFormatFlagIsLittleEndian
  46. default:
  47. return 0;
  48. }
  49. }
  50. static uint32_t samples_per_packet(enum AVCodecID codec_id, int channels) {
  51. switch (codec_id) {
  52. case AV_CODEC_ID_PCM_S8:
  53. case AV_CODEC_ID_PCM_S16LE:
  54. case AV_CODEC_ID_PCM_S16BE:
  55. case AV_CODEC_ID_PCM_S24LE:
  56. case AV_CODEC_ID_PCM_S24BE:
  57. case AV_CODEC_ID_PCM_S32LE:
  58. case AV_CODEC_ID_PCM_S32BE:
  59. case AV_CODEC_ID_PCM_F32LE:
  60. case AV_CODEC_ID_PCM_F32BE:
  61. case AV_CODEC_ID_PCM_F64LE:
  62. case AV_CODEC_ID_PCM_F64BE:
  63. case AV_CODEC_ID_PCM_ALAW:
  64. case AV_CODEC_ID_PCM_MULAW:
  65. return 1;
  66. case AV_CODEC_ID_MACE3:
  67. case AV_CODEC_ID_MACE6:
  68. return 6;
  69. case AV_CODEC_ID_ADPCM_IMA_QT:
  70. return 64;
  71. case AV_CODEC_ID_AMR_NB:
  72. case AV_CODEC_ID_GSM:
  73. case AV_CODEC_ID_ILBC:
  74. case AV_CODEC_ID_QCELP:
  75. return 160;
  76. case AV_CODEC_ID_GSM_MS:
  77. return 320;
  78. case AV_CODEC_ID_MP1:
  79. return 384;
  80. case AV_CODEC_ID_MP2:
  81. case AV_CODEC_ID_MP3:
  82. return 1152;
  83. case AV_CODEC_ID_AC3:
  84. return 1536;
  85. case AV_CODEC_ID_ALAC:
  86. case AV_CODEC_ID_QDM2:
  87. return 4096;
  88. case AV_CODEC_ID_ADPCM_IMA_WAV:
  89. return (1024 - 4 * channels) * 8 / (4 * channels) + 1;
  90. case AV_CODEC_ID_ADPCM_MS:
  91. return (1024 - 7 * channels) * 2 / channels + 2;
  92. default:
  93. return 0;
  94. }
  95. }
  96. static int caf_write_header(AVFormatContext *s)
  97. {
  98. AVIOContext *pb = s->pb;
  99. AVCodecContext *enc = s->streams[0]->codec;
  100. CAFContext *caf = s->priv_data;
  101. AVDictionaryEntry *t = NULL;
  102. unsigned int codec_tag = ff_codec_get_tag(ff_codec_caf_tags, enc->codec_id);
  103. int64_t chunk_size = 0;
  104. switch (enc->codec_id) {
  105. case AV_CODEC_ID_AAC:
  106. case AV_CODEC_ID_AC3:
  107. av_log(s, AV_LOG_ERROR, "muxing codec currently unsupported\n");
  108. return AVERROR_PATCHWELCOME;
  109. }
  110. switch (enc->codec_id) {
  111. case AV_CODEC_ID_PCM_S8:
  112. case AV_CODEC_ID_PCM_S16LE:
  113. case AV_CODEC_ID_PCM_S16BE:
  114. case AV_CODEC_ID_PCM_S24LE:
  115. case AV_CODEC_ID_PCM_S24BE:
  116. case AV_CODEC_ID_PCM_S32LE:
  117. case AV_CODEC_ID_PCM_S32BE:
  118. case AV_CODEC_ID_PCM_F32LE:
  119. case AV_CODEC_ID_PCM_F32BE:
  120. case AV_CODEC_ID_PCM_F64LE:
  121. case AV_CODEC_ID_PCM_F64BE:
  122. case AV_CODEC_ID_PCM_ALAW:
  123. case AV_CODEC_ID_PCM_MULAW:
  124. codec_tag = MKTAG('l','p','c','m');
  125. }
  126. if (!codec_tag) {
  127. av_log(s, AV_LOG_ERROR, "unsupported codec\n");
  128. return AVERROR_INVALIDDATA;
  129. }
  130. if (!enc->block_align && !pb->seekable) {
  131. av_log(s, AV_LOG_ERROR, "Muxing variable packet size not supported on non seekable output\n");
  132. return AVERROR_INVALIDDATA;
  133. }
  134. ffio_wfourcc(pb, "caff"); //< mFileType
  135. avio_wb16(pb, 1); //< mFileVersion
  136. avio_wb16(pb, 0); //< mFileFlags
  137. ffio_wfourcc(pb, "desc"); //< Audio Description chunk
  138. avio_wb64(pb, 32); //< mChunkSize
  139. avio_wb64(pb, av_double2int(enc->sample_rate)); //< mSampleRate
  140. avio_wl32(pb, codec_tag); //< mFormatID
  141. avio_wb32(pb, codec_flags(enc->codec_id)); //< mFormatFlags
  142. avio_wb32(pb, enc->block_align); //< mBytesPerPacket
  143. avio_wb32(pb, samples_per_packet(enc->codec_id, enc->channels)); //< mFramesPerPacket
  144. avio_wb32(pb, enc->channels); //< mChannelsPerFrame
  145. avio_wb32(pb, av_get_bits_per_sample(enc->codec_id)); //< mBitsPerChannel
  146. if (enc->channel_layout) {
  147. ffio_wfourcc(pb, "chan");
  148. avio_wb64(pb, 12);
  149. ff_mov_write_chan(pb, enc->channel_layout);
  150. }
  151. if (enc->codec_id == AV_CODEC_ID_ALAC) {
  152. ffio_wfourcc(pb, "kuki");
  153. avio_wb64(pb, 12 + enc->extradata_size);
  154. avio_write(pb, "\0\0\0\14frmaalac", 12);
  155. avio_write(pb, enc->extradata, enc->extradata_size);
  156. } else if (enc->codec_id == AV_CODEC_ID_AMR_NB) {
  157. ffio_wfourcc(pb, "kuki");
  158. avio_wb64(pb, 29);
  159. avio_write(pb, "\0\0\0\14frmasamr", 12);
  160. avio_wb32(pb, 0x11); /* size */
  161. avio_write(pb, "samrFFMP", 8);
  162. avio_w8(pb, 0); /* decoder version */
  163. avio_wb16(pb, 0x81FF); /* Mode set (all modes for AMR_NB) */
  164. avio_w8(pb, 0x00); /* Mode change period (no restriction) */
  165. avio_w8(pb, 0x01); /* Frames per sample */
  166. } else if (enc->codec_id == AV_CODEC_ID_QDM2) {
  167. ffio_wfourcc(pb, "kuki");
  168. avio_wb64(pb, enc->extradata_size);
  169. avio_write(pb, enc->extradata, enc->extradata_size);
  170. }
  171. if (av_dict_count(s->metadata)) {
  172. ffio_wfourcc(pb, "info"); //< Information chunk
  173. while ((t = av_dict_get(s->metadata, "", t, AV_DICT_IGNORE_SUFFIX))) {
  174. chunk_size += strlen(t->key) + strlen(t->value) + 2;
  175. }
  176. avio_wb64(pb, chunk_size + 4);
  177. avio_wb32(pb, av_dict_count(s->metadata));
  178. t = NULL;
  179. while ((t = av_dict_get(s->metadata, "", t, AV_DICT_IGNORE_SUFFIX))) {
  180. avio_put_str(pb, t->key);
  181. avio_put_str(pb, t->value);
  182. }
  183. }
  184. ffio_wfourcc(pb, "data"); //< Audio Data chunk
  185. caf->data = avio_tell(pb);
  186. avio_wb64(pb, -1); //< mChunkSize
  187. avio_wb32(pb, 0); //< mEditCount
  188. avio_flush(pb);
  189. return 0;
  190. }
  191. static int caf_write_packet(AVFormatContext *s, AVPacket *pkt)
  192. {
  193. CAFContext *caf = s->priv_data;
  194. avio_write(s->pb, pkt->data, pkt->size);
  195. if (!s->streams[0]->codec->block_align) {
  196. void *pkt_sizes = caf->pkt_sizes;
  197. int i, alloc_size = caf->size_entries_used + 5;
  198. if (alloc_size < 0) {
  199. caf->pkt_sizes = NULL;
  200. } else {
  201. caf->pkt_sizes = av_fast_realloc(caf->pkt_sizes,
  202. &caf->size_buffer_size,
  203. alloc_size);
  204. }
  205. if (!caf->pkt_sizes) {
  206. av_free(pkt_sizes);
  207. return AVERROR(ENOMEM);
  208. }
  209. for (i = 4; i > 0; i--) {
  210. unsigned top = pkt->size >> i * 7;
  211. if (top)
  212. caf->pkt_sizes[caf->size_entries_used++] = 128 | top;
  213. }
  214. caf->pkt_sizes[caf->size_entries_used++] = pkt->size & 127;
  215. caf->packets++;
  216. }
  217. return 0;
  218. }
  219. static int caf_write_trailer(AVFormatContext *s)
  220. {
  221. AVIOContext *pb = s->pb;
  222. AVCodecContext *enc = s->streams[0]->codec;
  223. if (pb->seekable) {
  224. CAFContext *caf = s->priv_data;
  225. int64_t file_size = avio_tell(pb);
  226. avio_seek(pb, caf->data, SEEK_SET);
  227. avio_wb64(pb, file_size - caf->data - 8);
  228. avio_seek(pb, file_size, SEEK_SET);
  229. if (!enc->block_align) {
  230. ffio_wfourcc(pb, "pakt");
  231. avio_wb64(pb, caf->size_entries_used + 24);
  232. avio_wb64(pb, caf->packets); ///< mNumberPackets
  233. avio_wb64(pb, caf->packets * samples_per_packet(enc->codec_id, enc->channels)); ///< mNumberValidFrames
  234. avio_wb32(pb, 0); ///< mPrimingFrames
  235. avio_wb32(pb, 0); ///< mRemainderFrames
  236. avio_write(pb, caf->pkt_sizes, caf->size_entries_used);
  237. av_freep(&caf->pkt_sizes);
  238. caf->size_buffer_size = 0;
  239. }
  240. avio_flush(pb);
  241. }
  242. return 0;
  243. }
  244. AVOutputFormat ff_caf_muxer = {
  245. .name = "caf",
  246. .long_name = NULL_IF_CONFIG_SMALL("Apple CAF (Core Audio Format)"),
  247. .mime_type = "audio/x-caf",
  248. .extensions = "caf",
  249. .priv_data_size = sizeof(CAFContext),
  250. .audio_codec = AV_CODEC_ID_PCM_S16BE,
  251. .video_codec = AV_CODEC_ID_NONE,
  252. .write_header = caf_write_header,
  253. .write_packet = caf_write_packet,
  254. .write_trailer = caf_write_trailer,
  255. .codec_tag = (const AVCodecTag* const []){ff_codec_caf_tags, 0},
  256. };