You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

159 lines
5.0KB

  1. /*
  2. * AMR Audio encoder stub
  3. * Copyright (c) 2003 The FFmpeg project
  4. *
  5. * This file is part of Libav.
  6. *
  7. * Libav is free software; you can redistribute it and/or
  8. * modify it under the terms of the GNU Lesser General Public
  9. * License as published by the Free Software Foundation; either
  10. * version 2.1 of the License, or (at your option) any later version.
  11. *
  12. * Libav is distributed in the hope that it will be useful,
  13. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  15. * Lesser General Public License for more details.
  16. *
  17. * You should have received a copy of the GNU Lesser General Public
  18. * License along with Libav; if not, write to the Free Software
  19. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  20. */
  21. #include <vo-amrwbenc/enc_if.h>
  22. #include <stdio.h>
  23. #include <stdlib.h>
  24. #include "libavutil/avstring.h"
  25. #include "libavutil/internal.h"
  26. #include "libavutil/mem.h"
  27. #include "libavutil/opt.h"
  28. #include "avcodec.h"
  29. #include "internal.h"
/*
 * Size in bytes of the output buffer requested for every encoded frame and
 * the upper bound accepted for the encoder's reported output size:
 * 477 bits rounded up to whole bytes (60) plus one extra byte = 61.
 * NOTE(review): 477 is presumably the payload bit count of the largest
 * AMR-WB frame and the extra byte a frame header - confirm against the
 * codec specification.
 */
#define MAX_PACKET_SIZE (1 + (477 + 7) / 8)
/* Private encoder state, stored in AVCodecContext.priv_data. */
typedef struct AMRWBContext {
AVClass *av_class;  /* class pointer for the private options; NOTE(review): presumably must remain the first member - confirm */
void *state;        /* opaque handle obtained from E_IF_init(), passed to E_IF_encode() and E_IF_exit() */
int mode;           /* rate-table index returned by get_wb_bitrate_mode() */
int last_bitrate;   /* avctx->bit_rate value that 'mode' was computed for; used to detect bit rate changes */
int allow_dtx;      /* value of the "dtx" option, forwarded to E_IF_encode() */
} AMRWBContext;
/*
 * Private options of the encoder.
 * "dtx" is an integer option limited to the range 0..1 with default 0; its
 * value is written to AMRWBContext.allow_dtx. The table is terminated by an
 * entry whose name is NULL.
 */
static const AVOption options[] = {
{ "dtx", "Allow DTX (generate comfort noise)", offsetof(AMRWBContext, allow_dtx), AV_OPT_TYPE_INT, { .i64 = 0 }, 0, 1, AV_OPT_FLAG_AUDIO_PARAM | AV_OPT_FLAG_ENCODING_PARAM },
{ NULL }
};
  42. static const AVClass class = {
  43. .class_name = "libvo_amrwbenc",
  44. .item_name = av_default_item_name,
  45. .option = options,
  46. .version = LIBAVUTIL_VERSION_INT,
  47. };
  48. static int get_wb_bitrate_mode(int bitrate, void *log_ctx)
  49. {
  50. /* make the correspondence between bitrate and mode */
  51. static const int rates[] = { 6600, 8850, 12650, 14250, 15850, 18250,
  52. 19850, 23050, 23850 };
  53. int i, best = -1, min_diff = 0;
  54. char log_buf[200];
  55. for (i = 0; i < 9; i++) {
  56. if (rates[i] == bitrate)
  57. return i;
  58. if (best < 0 || abs(rates[i] - bitrate) < min_diff) {
  59. best = i;
  60. min_diff = abs(rates[i] - bitrate);
  61. }
  62. }
  63. /* no bitrate matching exactly, log a warning */
  64. snprintf(log_buf, sizeof(log_buf), "bitrate not supported: use one of ");
  65. for (i = 0; i < 9; i++)
  66. av_strlcatf(log_buf, sizeof(log_buf), "%.2fk, ", rates[i] / 1000.f);
  67. av_strlcatf(log_buf, sizeof(log_buf), "using %.2fk", rates[best] / 1000.f);
  68. av_log(log_ctx, AV_LOG_WARNING, "%s\n", log_buf);
  69. return best;
  70. }
  71. static av_cold int amr_wb_encode_init(AVCodecContext *avctx)
  72. {
  73. AMRWBContext *s = avctx->priv_data;
  74. if (avctx->sample_rate != 16000) {
  75. av_log(avctx, AV_LOG_ERROR, "Only 16000Hz sample rate supported\n");
  76. return AVERROR(ENOSYS);
  77. }
  78. if (avctx->channels != 1) {
  79. av_log(avctx, AV_LOG_ERROR, "Only mono supported\n");
  80. return AVERROR(ENOSYS);
  81. }
  82. s->mode = get_wb_bitrate_mode(avctx->bit_rate, avctx);
  83. s->last_bitrate = avctx->bit_rate;
  84. avctx->frame_size = 320;
  85. avctx->initial_padding = 80;
  86. s->state = E_IF_init();
  87. return 0;
  88. }
  89. static int amr_wb_encode_close(AVCodecContext *avctx)
  90. {
  91. AMRWBContext *s = avctx->priv_data;
  92. E_IF_exit(s->state);
  93. return 0;
  94. }
  95. static int amr_wb_encode_frame(AVCodecContext *avctx, AVPacket *avpkt,
  96. const AVFrame *frame, int *got_packet_ptr)
  97. {
  98. AMRWBContext *s = avctx->priv_data;
  99. const int16_t *samples = (const int16_t *)frame->data[0];
  100. int size, ret;
  101. if ((ret = ff_alloc_packet(avpkt, MAX_PACKET_SIZE))) {
  102. av_log(avctx, AV_LOG_ERROR, "Error getting output packet\n");
  103. return ret;
  104. }
  105. if (s->last_bitrate != avctx->bit_rate) {
  106. s->mode = get_wb_bitrate_mode(avctx->bit_rate, avctx);
  107. s->last_bitrate = avctx->bit_rate;
  108. }
  109. size = E_IF_encode(s->state, s->mode, samples, avpkt->data, s->allow_dtx);
  110. if (size <= 0 || size > MAX_PACKET_SIZE) {
  111. av_log(avctx, AV_LOG_ERROR, "Error encoding frame\n");
  112. return AVERROR(EINVAL);
  113. }
  114. if (frame->pts != AV_NOPTS_VALUE)
  115. avpkt->pts = frame->pts - ff_samples_to_time_base(avctx, avctx->initial_padding);
  116. avpkt->size = size;
  117. *got_packet_ptr = 1;
  118. return 0;
  119. }
  120. AVCodec ff_libvo_amrwbenc_encoder = {
  121. .name = "libvo_amrwbenc",
  122. .long_name = NULL_IF_CONFIG_SMALL("Android VisualOn AMR-WB "
  123. "(Adaptive Multi-Rate Wide-Band)"),
  124. .type = AVMEDIA_TYPE_AUDIO,
  125. .id = AV_CODEC_ID_AMR_WB,
  126. .priv_data_size = sizeof(AMRWBContext),
  127. .init = amr_wb_encode_init,
  128. .encode2 = amr_wb_encode_frame,
  129. .close = amr_wb_encode_close,
  130. .sample_fmts = (const enum AVSampleFormat[]){ AV_SAMPLE_FMT_S16,
  131. AV_SAMPLE_FMT_NONE },
  132. .priv_class = &class,
  133. .wrapper_name = "libvo_amrwbenc",
  134. };