You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

273 lines
9.1KB

  1. /*
  2. * Core Audio Format muxer
  3. * Copyright (c) 2011 Carl Eugen Hoyos
  4. *
  5. * This file is part of FFmpeg.
  6. *
  7. * FFmpeg is free software; you can redistribute it and/or
  8. * modify it under the terms of the GNU Lesser General Public
  9. * License as published by the Free Software Foundation; either
  10. * version 2.1 of the License, or (at your option) any later version.
  11. *
  12. * FFmpeg is distributed in the hope that it will be useful,
  13. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  15. * Lesser General Public License for more details.
  16. *
  17. * You should have received a copy of the GNU Lesser General Public
  18. * License along with FFmpeg; if not, write to the Free Software
  19. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  20. */
  21. #include "avformat.h"
  22. #include "caf.h"
  23. #include "isom.h"
  24. #include "avio_internal.h"
  25. #include "libavutil/intfloat.h"
  26. #include "libavutil/dict.h"
  /**
   * Private muxer state kept in AVFormatContext.priv_data.
   */
  typedef struct CAFContext {
      /** File offset recorded just before the size field of the "data" chunk
       *  is written; the trailer seeks back here to patch the real size. */
      int64_t data;
      /** Growable byte buffer holding the variable-length encoded size of
       *  every packet (only filled when the codec has no fixed block_align). */
      uint8_t *pkt_sizes;
      /** Allocated size of pkt_sizes, as maintained by av_fast_realloc(). */
      int size_buffer_size;
      /** Number of bytes of pkt_sizes that are currently in use. */
      int size_entries_used;
      /** Number of packets whose size has been recorded in pkt_sizes. */
      int packets;
  } CAFContext;
  34. static uint32_t codec_flags(enum AVCodecID codec_id) {
  35. switch (codec_id) {
  36. case AV_CODEC_ID_PCM_F32BE:
  37. case AV_CODEC_ID_PCM_F64BE:
  38. return 1; //< kCAFLinearPCMFormatFlagIsFloat
  39. case AV_CODEC_ID_PCM_S16LE:
  40. case AV_CODEC_ID_PCM_S24LE:
  41. case AV_CODEC_ID_PCM_S32LE:
  42. return 2; //< kCAFLinearPCMFormatFlagIsLittleEndian
  43. case AV_CODEC_ID_PCM_F32LE:
  44. case AV_CODEC_ID_PCM_F64LE:
  45. return 3; //< kCAFLinearPCMFormatFlagIsFloat | kCAFLinearPCMFormatFlagIsLittleEndian
  46. default:
  47. return 0;
  48. }
  49. }
  50. static uint32_t samples_per_packet(enum AVCodecID codec_id, int channels, int block_align) {
  51. switch (codec_id) {
  52. case AV_CODEC_ID_PCM_S8:
  53. case AV_CODEC_ID_PCM_S16LE:
  54. case AV_CODEC_ID_PCM_S16BE:
  55. case AV_CODEC_ID_PCM_S24LE:
  56. case AV_CODEC_ID_PCM_S24BE:
  57. case AV_CODEC_ID_PCM_S32LE:
  58. case AV_CODEC_ID_PCM_S32BE:
  59. case AV_CODEC_ID_PCM_F32LE:
  60. case AV_CODEC_ID_PCM_F32BE:
  61. case AV_CODEC_ID_PCM_F64LE:
  62. case AV_CODEC_ID_PCM_F64BE:
  63. case AV_CODEC_ID_PCM_ALAW:
  64. case AV_CODEC_ID_PCM_MULAW:
  65. return 1;
  66. case AV_CODEC_ID_MACE3:
  67. case AV_CODEC_ID_MACE6:
  68. return 6;
  69. case AV_CODEC_ID_ADPCM_IMA_QT:
  70. return 64;
  71. case AV_CODEC_ID_AMR_NB:
  72. case AV_CODEC_ID_GSM:
  73. case AV_CODEC_ID_ILBC:
  74. case AV_CODEC_ID_QCELP:
  75. return 160;
  76. case AV_CODEC_ID_GSM_MS:
  77. return 320;
  78. case AV_CODEC_ID_MP1:
  79. return 384;
  80. case AV_CODEC_ID_MP2:
  81. case AV_CODEC_ID_MP3:
  82. return 1152;
  83. case AV_CODEC_ID_AC3:
  84. return 1536;
  85. case AV_CODEC_ID_QDM2:
  86. return 2048 * channels;
  87. case AV_CODEC_ID_ALAC:
  88. return 4096;
  89. case AV_CODEC_ID_ADPCM_IMA_WAV:
  90. return (block_align - 4 * channels) * 8 / (4 * channels) + 1;
  91. case AV_CODEC_ID_ADPCM_MS:
  92. return (block_align - 7 * channels) * 2 / channels + 2;
  93. default:
  94. return 0;
  95. }
  96. }
  97. static int caf_write_header(AVFormatContext *s)
  98. {
  99. AVIOContext *pb = s->pb;
  100. AVCodecContext *enc = s->streams[0]->codec;
  101. CAFContext *caf = s->priv_data;
  102. AVDictionaryEntry *t = NULL;
  103. unsigned int codec_tag = ff_codec_get_tag(ff_codec_caf_tags, enc->codec_id);
  104. int64_t chunk_size = 0;
  105. int frame_size = enc->frame_size;
  106. if (s->nb_streams != 1) {
  107. av_log(s, AV_LOG_ERROR, "CAF files have exactly one stream\n");
  108. return AVERROR(EINVAL);
  109. }
  110. switch (enc->codec_id) {
  111. case AV_CODEC_ID_AAC:
  112. av_log(s, AV_LOG_ERROR, "muxing codec currently unsupported\n");
  113. return AVERROR_PATCHWELCOME;
  114. }
  115. if (!codec_tag) {
  116. av_log(s, AV_LOG_ERROR, "unsupported codec\n");
  117. return AVERROR_INVALIDDATA;
  118. }
  119. if (!enc->block_align && !pb->seekable) {
  120. av_log(s, AV_LOG_ERROR, "Muxing variable packet size not supported on non seekable output\n");
  121. return AVERROR_INVALIDDATA;
  122. }
  123. if (enc->codec_id != AV_CODEC_ID_MP3 || frame_size != 576)
  124. frame_size = samples_per_packet(enc->codec_id, enc->channels, enc->block_align);
  125. ffio_wfourcc(pb, "caff"); //< mFileType
  126. avio_wb16(pb, 1); //< mFileVersion
  127. avio_wb16(pb, 0); //< mFileFlags
  128. ffio_wfourcc(pb, "desc"); //< Audio Description chunk
  129. avio_wb64(pb, 32); //< mChunkSize
  130. avio_wb64(pb, av_double2int(enc->sample_rate)); //< mSampleRate
  131. avio_wl32(pb, codec_tag); //< mFormatID
  132. avio_wb32(pb, codec_flags(enc->codec_id)); //< mFormatFlags
  133. avio_wb32(pb, enc->block_align); //< mBytesPerPacket
  134. avio_wb32(pb, frame_size); //< mFramesPerPacket
  135. avio_wb32(pb, enc->channels); //< mChannelsPerFrame
  136. avio_wb32(pb, av_get_bits_per_sample(enc->codec_id)); //< mBitsPerChannel
  137. if (enc->channel_layout) {
  138. ffio_wfourcc(pb, "chan");
  139. avio_wb64(pb, 12);
  140. ff_mov_write_chan(pb, enc->channel_layout);
  141. }
  142. if (enc->codec_id == AV_CODEC_ID_ALAC) {
  143. ffio_wfourcc(pb, "kuki");
  144. avio_wb64(pb, 12 + enc->extradata_size);
  145. avio_write(pb, "\0\0\0\14frmaalac", 12);
  146. avio_write(pb, enc->extradata, enc->extradata_size);
  147. } else if (enc->codec_id == AV_CODEC_ID_AMR_NB) {
  148. ffio_wfourcc(pb, "kuki");
  149. avio_wb64(pb, 29);
  150. avio_write(pb, "\0\0\0\14frmasamr", 12);
  151. avio_wb32(pb, 0x11); /* size */
  152. avio_write(pb, "samrFFMP", 8);
  153. avio_w8(pb, 0); /* decoder version */
  154. avio_wb16(pb, 0x81FF); /* Mode set (all modes for AMR_NB) */
  155. avio_w8(pb, 0x00); /* Mode change period (no restriction) */
  156. avio_w8(pb, 0x01); /* Frames per sample */
  157. } else if (enc->codec_id == AV_CODEC_ID_QDM2) {
  158. ffio_wfourcc(pb, "kuki");
  159. avio_wb64(pb, enc->extradata_size);
  160. avio_write(pb, enc->extradata, enc->extradata_size);
  161. }
  162. ff_standardize_creation_time(s);
  163. if (av_dict_count(s->metadata)) {
  164. ffio_wfourcc(pb, "info"); //< Information chunk
  165. while ((t = av_dict_get(s->metadata, "", t, AV_DICT_IGNORE_SUFFIX))) {
  166. chunk_size += strlen(t->key) + strlen(t->value) + 2;
  167. }
  168. avio_wb64(pb, chunk_size + 4);
  169. avio_wb32(pb, av_dict_count(s->metadata));
  170. t = NULL;
  171. while ((t = av_dict_get(s->metadata, "", t, AV_DICT_IGNORE_SUFFIX))) {
  172. avio_put_str(pb, t->key);
  173. avio_put_str(pb, t->value);
  174. }
  175. }
  176. ffio_wfourcc(pb, "data"); //< Audio Data chunk
  177. caf->data = avio_tell(pb);
  178. avio_wb64(pb, -1); //< mChunkSize
  179. avio_wb32(pb, 0); //< mEditCount
  180. avio_flush(pb);
  181. return 0;
  182. }
  183. static int caf_write_packet(AVFormatContext *s, AVPacket *pkt)
  184. {
  185. CAFContext *caf = s->priv_data;
  186. avio_write(s->pb, pkt->data, pkt->size);
  187. if (!s->streams[0]->codec->block_align) {
  188. void *pkt_sizes = caf->pkt_sizes;
  189. int i, alloc_size = caf->size_entries_used + 5;
  190. if (alloc_size < 0) {
  191. caf->pkt_sizes = NULL;
  192. } else {
  193. caf->pkt_sizes = av_fast_realloc(caf->pkt_sizes,
  194. &caf->size_buffer_size,
  195. alloc_size);
  196. }
  197. if (!caf->pkt_sizes) {
  198. av_free(pkt_sizes);
  199. return AVERROR(ENOMEM);
  200. }
  201. for (i = 4; i > 0; i--) {
  202. unsigned top = pkt->size >> i * 7;
  203. if (top)
  204. caf->pkt_sizes[caf->size_entries_used++] = 128 | top;
  205. }
  206. caf->pkt_sizes[caf->size_entries_used++] = pkt->size & 127;
  207. caf->packets++;
  208. }
  209. return 0;
  210. }
  211. static int caf_write_trailer(AVFormatContext *s)
  212. {
  213. CAFContext *caf = s->priv_data;
  214. AVIOContext *pb = s->pb;
  215. AVCodecContext *enc = s->streams[0]->codec;
  216. if (pb->seekable) {
  217. int64_t file_size = avio_tell(pb);
  218. avio_seek(pb, caf->data, SEEK_SET);
  219. avio_wb64(pb, file_size - caf->data - 8);
  220. avio_seek(pb, file_size, SEEK_SET);
  221. if (!enc->block_align) {
  222. ffio_wfourcc(pb, "pakt");
  223. avio_wb64(pb, caf->size_entries_used + 24);
  224. avio_wb64(pb, caf->packets); ///< mNumberPackets
  225. avio_wb64(pb, caf->packets * samples_per_packet(enc->codec_id, enc->channels, enc->block_align)); ///< mNumberValidFrames
  226. avio_wb32(pb, 0); ///< mPrimingFrames
  227. avio_wb32(pb, 0); ///< mRemainderFrames
  228. avio_write(pb, caf->pkt_sizes, caf->size_entries_used);
  229. caf->size_buffer_size = 0;
  230. }
  231. avio_flush(pb);
  232. }
  233. av_freep(&caf->pkt_sizes);
  234. return 0;
  235. }
  236. AVOutputFormat ff_caf_muxer = {
  237. .name = "caf",
  238. .long_name = NULL_IF_CONFIG_SMALL("Apple CAF (Core Audio Format)"),
  239. .mime_type = "audio/x-caf",
  240. .extensions = "caf",
  241. .priv_data_size = sizeof(CAFContext),
  242. .audio_codec = AV_CODEC_ID_PCM_S16BE,
  243. .video_codec = AV_CODEC_ID_NONE,
  244. .write_header = caf_write_header,
  245. .write_packet = caf_write_packet,
  246. .write_trailer = caf_write_trailer,
  247. .codec_tag = (const AVCodecTag* const []){ff_codec_caf_tags, 0},
  248. };