You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

161 lines
5.0KB

  1. /*
  2. * AMR Audio encoder stub
  3. * Copyright (c) 2003 the ffmpeg project
  4. *
  5. * This file is part of Libav.
  6. *
  7. * Libav is free software; you can redistribute it and/or
  8. * modify it under the terms of the GNU Lesser General Public
  9. * License as published by the Free Software Foundation; either
  10. * version 2.1 of the License, or (at your option) any later version.
  11. *
  12. * Libav is distributed in the hope that it will be useful,
  13. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  15. * Lesser General Public License for more details.
  16. *
  17. * You should have received a copy of the GNU Lesser General Public
  18. * License along with Libav; if not, write to the Free Software
  19. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  20. */
  21. #include <vo-amrwbenc/enc_if.h>
  22. #include <stdio.h>
  23. #include <stdlib.h>
  24. #include "libavutil/avstring.h"
  25. #include "libavutil/internal.h"
  26. #include "libavutil/mem.h"
  27. #include "libavutil/opt.h"
  28. #include "avcodec.h"
  29. #include "internal.h"
  30. #define MAX_PACKET_SIZE (1 + (477 + 7) / 8)
  31. typedef struct AMRWBContext {
  32. AVClass *av_class;
  33. void *state;
  34. int mode;
  35. int last_bitrate;
  36. int allow_dtx;
  37. } AMRWBContext;
  38. static const AVOption options[] = {
  39. { "dtx", "Allow DTX (generate comfort noise)", offsetof(AMRWBContext, allow_dtx), AV_OPT_TYPE_INT, { .i64 = 0 }, 0, 1, AV_OPT_FLAG_AUDIO_PARAM | AV_OPT_FLAG_ENCODING_PARAM },
  40. { NULL }
  41. };
  42. static const AVClass class = {
  43. "libvo_amrwbenc", av_default_item_name, options, LIBAVUTIL_VERSION_INT
  44. };
  45. static int get_wb_bitrate_mode(int bitrate, void *log_ctx)
  46. {
  47. /* make the correspondance between bitrate and mode */
  48. static const int rates[] = { 6600, 8850, 12650, 14250, 15850, 18250,
  49. 19850, 23050, 23850 };
  50. int i, best = -1, min_diff = 0;
  51. char log_buf[200];
  52. for (i = 0; i < 9; i++) {
  53. if (rates[i] == bitrate)
  54. return i;
  55. if (best < 0 || abs(rates[i] - bitrate) < min_diff) {
  56. best = i;
  57. min_diff = abs(rates[i] - bitrate);
  58. }
  59. }
  60. /* no bitrate matching exactly, log a warning */
  61. snprintf(log_buf, sizeof(log_buf), "bitrate not supported: use one of ");
  62. for (i = 0; i < 9; i++)
  63. av_strlcatf(log_buf, sizeof(log_buf), "%.2fk, ", rates[i] / 1000.f);
  64. av_strlcatf(log_buf, sizeof(log_buf), "using %.2fk", rates[best] / 1000.f);
  65. av_log(log_ctx, AV_LOG_WARNING, "%s\n", log_buf);
  66. return best;
  67. }
  68. static av_cold int amr_wb_encode_init(AVCodecContext *avctx)
  69. {
  70. AMRWBContext *s = avctx->priv_data;
  71. if (avctx->sample_rate != 16000) {
  72. av_log(avctx, AV_LOG_ERROR, "Only 16000Hz sample rate supported\n");
  73. return AVERROR(ENOSYS);
  74. }
  75. if (avctx->channels != 1) {
  76. av_log(avctx, AV_LOG_ERROR, "Only mono supported\n");
  77. return AVERROR(ENOSYS);
  78. }
  79. s->mode = get_wb_bitrate_mode(avctx->bit_rate, avctx);
  80. s->last_bitrate = avctx->bit_rate;
  81. avctx->frame_size = 320;
  82. avctx->delay = 80;
  83. #if FF_API_OLD_ENCODE_AUDIO
  84. avctx->coded_frame = avcodec_alloc_frame();
  85. if (!avctx->coded_frame)
  86. return AVERROR(ENOMEM);
  87. #endif
  88. s->state = E_IF_init();
  89. return 0;
  90. }
  91. static int amr_wb_encode_close(AVCodecContext *avctx)
  92. {
  93. AMRWBContext *s = avctx->priv_data;
  94. E_IF_exit(s->state);
  95. av_freep(&avctx->coded_frame);
  96. return 0;
  97. }
  98. static int amr_wb_encode_frame(AVCodecContext *avctx, AVPacket *avpkt,
  99. const AVFrame *frame, int *got_packet_ptr)
  100. {
  101. AMRWBContext *s = avctx->priv_data;
  102. const int16_t *samples = (const int16_t *)frame->data[0];
  103. int size, ret;
  104. if ((ret = ff_alloc_packet(avpkt, MAX_PACKET_SIZE))) {
  105. av_log(avctx, AV_LOG_ERROR, "Error getting output packet\n");
  106. return ret;
  107. }
  108. if (s->last_bitrate != avctx->bit_rate) {
  109. s->mode = get_wb_bitrate_mode(avctx->bit_rate, avctx);
  110. s->last_bitrate = avctx->bit_rate;
  111. }
  112. size = E_IF_encode(s->state, s->mode, samples, avpkt->data, s->allow_dtx);
  113. if (size <= 0 || size > MAX_PACKET_SIZE) {
  114. av_log(avctx, AV_LOG_ERROR, "Error encoding frame\n");
  115. return AVERROR(EINVAL);
  116. }
  117. if (frame->pts != AV_NOPTS_VALUE)
  118. avpkt->pts = frame->pts - ff_samples_to_time_base(avctx, avctx->delay);
  119. avpkt->size = size;
  120. *got_packet_ptr = 1;
  121. return 0;
  122. }
  123. AVCodec ff_libvo_amrwbenc_encoder = {
  124. .name = "libvo_amrwbenc",
  125. .type = AVMEDIA_TYPE_AUDIO,
  126. .id = AV_CODEC_ID_AMR_WB,
  127. .priv_data_size = sizeof(AMRWBContext),
  128. .init = amr_wb_encode_init,
  129. .encode2 = amr_wb_encode_frame,
  130. .close = amr_wb_encode_close,
  131. .sample_fmts = (const enum AVSampleFormat[]){ AV_SAMPLE_FMT_S16,
  132. AV_SAMPLE_FMT_NONE },
  133. .long_name = NULL_IF_CONFIG_SMALL("Android VisualOn AMR-WB "
  134. "(Adaptive Multi-Rate Wide-Band)"),
  135. .priv_class = &class,
  136. };