You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

157 lines
4.9KB

  1. /*
  2. * AMR Audio encoder stub
  3. * Copyright (c) 2003 the ffmpeg project
  4. *
  5. * This file is part of Libav.
  6. *
  7. * Libav is free software; you can redistribute it and/or
  8. * modify it under the terms of the GNU Lesser General Public
  9. * License as published by the Free Software Foundation; either
  10. * version 2.1 of the License, or (at your option) any later version.
  11. *
  12. * Libav is distributed in the hope that it will be useful,
  13. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  15. * Lesser General Public License for more details.
  16. *
  17. * You should have received a copy of the GNU Lesser General Public
  18. * License along with Libav; if not, write to the Free Software
  19. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  20. */
  21. #include <vo-amrwbenc/enc_if.h>
  22. #include "libavutil/avstring.h"
  23. #include "libavutil/opt.h"
  24. #include "avcodec.h"
  25. #include "internal.h"
  /*
   * Upper bound, in bytes, on one encoded frame: one leading byte plus
   * 477 bits rounded up to whole bytes (1 + 60 = 61 bytes).
   * NOTE(review): 477 bits equals the highest rate listed in this file
   * (23850 bit/s) over one 320-sample frame at 16000 Hz - confirm against
   * the vo-amrwbenc documentation.
   */
  #define MAX_PACKET_SIZE (1 + (477 + 7) / 8)
  /*
   * Private encoder context; the functions in this file obtain it from
   * AVCodecContext.priv_data.
   */
  typedef struct AMRWBContext {
      /* Class pointer for the private options.
       * NOTE(review): presumably has to remain the first member - confirm. */
      AVClass *av_class;
      /* Encoder handle returned by E_IF_init() and released by E_IF_exit(). */
      void *state;
      /* Mode index produced by get_wb_bitrate_mode(), passed to E_IF_encode(). */
      int mode;
      /* avctx->bit_rate value that `mode` was last derived from. */
      int last_bitrate;
      /* Value of the "dtx" option (0 or 1), passed to E_IF_encode(). */
      int allow_dtx;
  } AMRWBContext;
  /*
   * Private options of this encoder. The single entry, "dtx", is an integer
   * limited to the range [0, 1] and stored in AMRWBContext.allow_dtx; the
   * table is terminated by a NULL entry.
   */
  static const AVOption options[] = {
      { "dtx", "Allow DTX (generate comfort noise)", offsetof(AMRWBContext, allow_dtx), AV_OPT_TYPE_INT, { 0 }, 0, 1, AV_OPT_FLAG_AUDIO_PARAM | AV_OPT_FLAG_ENCODING_PARAM },
      { NULL }
  };
  38. static const AVClass class = {
  39. "libvo_amrwbenc", av_default_item_name, options, LIBAVUTIL_VERSION_INT
  40. };
  41. static int get_wb_bitrate_mode(int bitrate, void *log_ctx)
  42. {
  43. /* make the correspondance between bitrate and mode */
  44. static const int rates[] = { 6600, 8850, 12650, 14250, 15850, 18250,
  45. 19850, 23050, 23850 };
  46. int i, best = -1, min_diff = 0;
  47. char log_buf[200];
  48. for (i = 0; i < 9; i++) {
  49. if (rates[i] == bitrate)
  50. return i;
  51. if (best < 0 || abs(rates[i] - bitrate) < min_diff) {
  52. best = i;
  53. min_diff = abs(rates[i] - bitrate);
  54. }
  55. }
  56. /* no bitrate matching exactly, log a warning */
  57. snprintf(log_buf, sizeof(log_buf), "bitrate not supported: use one of ");
  58. for (i = 0; i < 9; i++)
  59. av_strlcatf(log_buf, sizeof(log_buf), "%.2fk, ", rates[i] / 1000.f);
  60. av_strlcatf(log_buf, sizeof(log_buf), "using %.2fk", rates[best] / 1000.f);
  61. av_log(log_ctx, AV_LOG_WARNING, "%s\n", log_buf);
  62. return best;
  63. }
  64. static av_cold int amr_wb_encode_init(AVCodecContext *avctx)
  65. {
  66. AMRWBContext *s = avctx->priv_data;
  67. if (avctx->sample_rate != 16000) {
  68. av_log(avctx, AV_LOG_ERROR, "Only 16000Hz sample rate supported\n");
  69. return AVERROR(ENOSYS);
  70. }
  71. if (avctx->channels != 1) {
  72. av_log(avctx, AV_LOG_ERROR, "Only mono supported\n");
  73. return AVERROR(ENOSYS);
  74. }
  75. s->mode = get_wb_bitrate_mode(avctx->bit_rate, avctx);
  76. s->last_bitrate = avctx->bit_rate;
  77. avctx->frame_size = 320;
  78. avctx->delay = 80;
  79. #if FF_API_OLD_ENCODE_AUDIO
  80. avctx->coded_frame = avcodec_alloc_frame();
  81. if (!avctx->coded_frame)
  82. return AVERROR(ENOMEM);
  83. #endif
  84. s->state = E_IF_init();
  85. return 0;
  86. }
  87. static int amr_wb_encode_close(AVCodecContext *avctx)
  88. {
  89. AMRWBContext *s = avctx->priv_data;
  90. E_IF_exit(s->state);
  91. av_freep(&avctx->coded_frame);
  92. return 0;
  93. }
  94. static int amr_wb_encode_frame(AVCodecContext *avctx, AVPacket *avpkt,
  95. const AVFrame *frame, int *got_packet_ptr)
  96. {
  97. AMRWBContext *s = avctx->priv_data;
  98. const int16_t *samples = (const int16_t *)frame->data[0];
  99. int size, ret;
  100. if ((ret = ff_alloc_packet(avpkt, MAX_PACKET_SIZE))) {
  101. av_log(avctx, AV_LOG_ERROR, "Error getting output packet\n");
  102. return ret;
  103. }
  104. if (s->last_bitrate != avctx->bit_rate) {
  105. s->mode = get_wb_bitrate_mode(avctx->bit_rate, avctx);
  106. s->last_bitrate = avctx->bit_rate;
  107. }
  108. size = E_IF_encode(s->state, s->mode, samples, avpkt->data, s->allow_dtx);
  109. if (size <= 0 || size > MAX_PACKET_SIZE) {
  110. av_log(avctx, AV_LOG_ERROR, "Error encoding frame\n");
  111. return AVERROR(EINVAL);
  112. }
  113. if (frame->pts != AV_NOPTS_VALUE)
  114. avpkt->pts = frame->pts - ff_samples_to_time_base(avctx, avctx->delay);
  115. avpkt->size = size;
  116. *got_packet_ptr = 1;
  117. return 0;
  118. }
  /*
   * Codec descriptor for the "libvo_amrwbenc" audio encoder
   * (CODEC_ID_AMR_WB). It wires up the init/encode2/close callbacks defined
   * in this file, lists AV_SAMPLE_FMT_S16 as the only accepted sample
   * format, and exposes the private options through `class`.
   */
  AVCodec ff_libvo_amrwbenc_encoder = {
      .name = "libvo_amrwbenc",
      .type = AVMEDIA_TYPE_AUDIO,
      .id = CODEC_ID_AMR_WB,
      .priv_data_size = sizeof(AMRWBContext),
      .init = amr_wb_encode_init,
      .encode2 = amr_wb_encode_frame,
      .close = amr_wb_encode_close,
      /* List terminated by AV_SAMPLE_FMT_NONE. */
      .sample_fmts = (const enum AVSampleFormat[]){ AV_SAMPLE_FMT_S16,
                                                    AV_SAMPLE_FMT_NONE },
      .long_name = NULL_IF_CONFIG_SMALL("Android VisualOn Adaptive "
                                        "Multi-Rate (AMR) Wide-Band"),
      .priv_class = &class,
  };