You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

145 lines
5.9KB

  1. /*
  2. * AAC encoder
  3. * Copyright (C) 2008 Konstantin Shishkov
  4. *
  5. * This file is part of FFmpeg.
  6. *
  7. * FFmpeg is free software; you can redistribute it and/or
  8. * modify it under the terms of the GNU Lesser General Public
  9. * License as published by the Free Software Foundation; either
  10. * version 2.1 of the License, or (at your option) any later version.
  11. *
  12. * FFmpeg is distributed in the hope that it will be useful,
  13. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  15. * Lesser General Public License for more details.
  16. *
  17. * You should have received a copy of the GNU Lesser General Public
  18. * License along with FFmpeg; if not, write to the Free Software
  19. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  20. */
  21. #ifndef AVCODEC_AACENC_H
  22. #define AVCODEC_AACENC_H
  23. #include "libavutil/float_dsp.h"
  24. #include "avcodec.h"
  25. #include "put_bits.h"
  26. #include "aac.h"
  27. #include "audio_frame_queue.h"
  28. #include "psymodel.h"
  29. #include "lpc.h"
  30. typedef enum AACCoder {
  31. AAC_CODER_ANMR = 0,
  32. AAC_CODER_TWOLOOP,
  33. AAC_CODER_FAST,
  34. AAC_CODER_NB,
  35. }AACCoder;
  36. typedef struct AACEncOptions {
  37. int coder;
  38. int pns;
  39. int tns;
  40. int ltp;
  41. int pred;
  42. int mid_side;
  43. int intensity_stereo;
  44. } AACEncOptions;
  45. struct AACEncContext;
  46. typedef struct AACCoefficientsEncoder {
  47. void (*search_for_quantizers)(AVCodecContext *avctx, struct AACEncContext *s,
  48. SingleChannelElement *sce, const float lambda);
  49. void (*encode_window_bands_info)(struct AACEncContext *s, SingleChannelElement *sce,
  50. int win, int group_len, const float lambda);
  51. void (*quantize_and_encode_band)(struct AACEncContext *s, PutBitContext *pb, const float *in, float *out, int size,
  52. int scale_idx, int cb, const float lambda, int rtz);
  53. void (*encode_tns_info)(struct AACEncContext *s, SingleChannelElement *sce);
  54. void (*encode_ltp_info)(struct AACEncContext *s, SingleChannelElement *sce, int common_window);
  55. void (*encode_main_pred)(struct AACEncContext *s, SingleChannelElement *sce);
  56. void (*adjust_common_pred)(struct AACEncContext *s, ChannelElement *cpe);
  57. void (*adjust_common_ltp)(struct AACEncContext *s, ChannelElement *cpe);
  58. void (*apply_main_pred)(struct AACEncContext *s, SingleChannelElement *sce);
  59. void (*apply_tns_filt)(struct AACEncContext *s, SingleChannelElement *sce);
  60. void (*update_ltp)(struct AACEncContext *s, SingleChannelElement *sce);
  61. void (*ltp_insert_new_frame)(struct AACEncContext *s);
  62. void (*set_special_band_scalefactors)(struct AACEncContext *s, SingleChannelElement *sce);
  63. void (*search_for_pns)(struct AACEncContext *s, AVCodecContext *avctx, SingleChannelElement *sce);
  64. void (*mark_pns)(struct AACEncContext *s, AVCodecContext *avctx, SingleChannelElement *sce);
  65. void (*search_for_tns)(struct AACEncContext *s, SingleChannelElement *sce);
  66. void (*search_for_ltp)(struct AACEncContext *s, SingleChannelElement *sce, int common_window);
  67. void (*search_for_ms)(struct AACEncContext *s, ChannelElement *cpe);
  68. void (*search_for_is)(struct AACEncContext *s, AVCodecContext *avctx, ChannelElement *cpe);
  69. void (*search_for_pred)(struct AACEncContext *s, SingleChannelElement *sce);
  70. } AACCoefficientsEncoder;
  71. extern const AACCoefficientsEncoder ff_aac_coders[];
  72. typedef struct AACQuantizeBandCostCacheEntry {
  73. float rd;
  74. float energy;
  75. int bits;
  76. char cb;
  77. char rtz;
  78. uint16_t generation;
  79. } AACQuantizeBandCostCacheEntry;
  80. /**
  81. * AAC encoder context
  82. */
  83. typedef struct AACEncContext {
  84. AVClass *av_class;
  85. AACEncOptions options; ///< encoding options
  86. PutBitContext pb;
  87. FFTContext mdct1024; ///< long (1024 samples) frame transform context
  88. FFTContext mdct128; ///< short (128 samples) frame transform context
  89. AVFloatDSPContext *fdsp;
  90. float *planar_samples[8]; ///< saved preprocessed input
  91. int profile; ///< copied from avctx
  92. LPCContext lpc; ///< used by TNS
  93. int samplerate_index; ///< MPEG-4 samplerate index
  94. int channels; ///< channel count
  95. const uint8_t *chan_map; ///< channel configuration map
  96. ChannelElement *cpe; ///< channel elements
  97. FFPsyContext psy;
  98. struct FFPsyPreprocessContext* psypp;
  99. const AACCoefficientsEncoder *coder;
  100. int cur_channel; ///< current channel for coder context
  101. int random_state;
  102. float lambda;
  103. int last_frame_pb_count; ///< number of bits for the previous frame
  104. float lambda_sum; ///< sum(lambda), for Qvg reporting
  105. int lambda_count; ///< count(lambda), for Qvg reporting
  106. enum RawDataBlockType cur_type; ///< channel group type cur_channel belongs to
  107. AudioFrameQueue afq;
  108. DECLARE_ALIGNED(16, int, qcoefs)[96]; ///< quantized coefficients
  109. DECLARE_ALIGNED(32, float, scoefs)[1024]; ///< scaled coefficients
  110. uint16_t quantize_band_cost_cache_generation;
  111. AACQuantizeBandCostCacheEntry quantize_band_cost_cache[256][128]; ///< memoization area for quantize_band_cost
  112. void (*abs_pow34)(float *out, const float *in, const int size);
  113. void (*quant_bands)(int *out, const float *in, const float *scaled,
  114. int size, int is_signed, int maxval, const float Q34,
  115. const float rounding);
  116. struct {
  117. float *samples;
  118. } buffer;
  119. } AACEncContext;
  120. void ff_aac_dsp_init_x86(AACEncContext *s);
  121. void ff_aac_coder_init_mips(AACEncContext *c);
  122. void ff_quantize_band_cost_cache_init(struct AACEncContext *s);
  123. #endif /* AVCODEC_AACENC_H */