You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

235 lines
7.7KB

  1. /*
  2. * NellyMoser audio decoder
  3. * Copyright (c) 2007 a840bda5870ba11f19698ff6eb9581dfb0f95fa5,
  4. * 539459aeb7d425140b62a3ec7dbf6dc8e408a306, and
  5. * 520e17cd55896441042b14df2566a6eb610ed444
  6. * Copyright (c) 2007 Loic Minier <lool at dooz.org>
  7. * Benjamin Larsson
  8. *
  9. * Permission is hereby granted, free of charge, to any person obtaining a
  10. * copy of this software and associated documentation files (the "Software"),
  11. * to deal in the Software without restriction, including without limitation
  12. * the rights to use, copy, modify, merge, publish, distribute, sublicense,
  13. * and/or sell copies of the Software, and to permit persons to whom the
  14. * Software is furnished to do so, subject to the following conditions:
  15. *
  16. * The above copyright notice and this permission notice shall be included in
  17. * all copies or substantial portions of the Software.
  18. *
  19. * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  20. * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  21. * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
  22. * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
  23. * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
  24. * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
  25. * DEALINGS IN THE SOFTWARE.
  26. */
  27. /**
  28. * @file
  29. * The 3 alphanumeric copyright notices are md5summed; they are from the original
  30. * implementors. The original code is available from http://code.google.com/p/nelly2pcm/
  31. */
  32. #include "nellymoser.h"
  33. #include "libavutil/lfg.h"
  34. #include "libavutil/random_seed.h"
  35. #include "libavutil/audioconvert.h"
  36. #include "avcodec.h"
  37. #include "dsputil.h"
  38. #include "fft.h"
  39. #include "fmtconvert.h"
  40. #include "sinewin.h"
  41. #define BITSTREAM_READER_LE
  42. #include "get_bits.h"
  43. typedef struct NellyMoserDecodeContext {
  44. AVCodecContext* avctx;
  45. AVFrame frame;
  46. float *float_buf;
  47. AVLFG random_state;
  48. GetBitContext gb;
  49. float scale_bias;
  50. DSPContext dsp;
  51. FFTContext imdct_ctx;
  52. FmtConvertContext fmt_conv;
  53. DECLARE_ALIGNED(32, float, imdct_buf)[2][NELLY_BUF_LEN];
  54. float *imdct_out;
  55. float *imdct_prev;
  56. } NellyMoserDecodeContext;
  57. static void nelly_decode_block(NellyMoserDecodeContext *s,
  58. const unsigned char block[NELLY_BLOCK_LEN],
  59. float audio[NELLY_SAMPLES])
  60. {
  61. int i,j;
  62. float buf[NELLY_FILL_LEN], pows[NELLY_FILL_LEN];
  63. float *aptr, *bptr, *pptr, val, pval;
  64. int bits[NELLY_BUF_LEN];
  65. unsigned char v;
  66. init_get_bits(&s->gb, block, NELLY_BLOCK_LEN * 8);
  67. bptr = buf;
  68. pptr = pows;
  69. val = ff_nelly_init_table[get_bits(&s->gb, 6)];
  70. for (i=0 ; i<NELLY_BANDS ; i++) {
  71. if (i > 0)
  72. val += ff_nelly_delta_table[get_bits(&s->gb, 5)];
  73. pval = -pow(2, val/2048) * s->scale_bias;
  74. for (j = 0; j < ff_nelly_band_sizes_table[i]; j++) {
  75. *bptr++ = val;
  76. *pptr++ = pval;
  77. }
  78. }
  79. ff_nelly_get_sample_bits(buf, bits);
  80. for (i = 0; i < 2; i++) {
  81. aptr = audio + i * NELLY_BUF_LEN;
  82. init_get_bits(&s->gb, block, NELLY_BLOCK_LEN * 8);
  83. skip_bits_long(&s->gb, NELLY_HEADER_BITS + i*NELLY_DETAIL_BITS);
  84. for (j = 0; j < NELLY_FILL_LEN; j++) {
  85. if (bits[j] <= 0) {
  86. aptr[j] = M_SQRT1_2*pows[j];
  87. if (av_lfg_get(&s->random_state) & 1)
  88. aptr[j] *= -1.0;
  89. } else {
  90. v = get_bits(&s->gb, bits[j]);
  91. aptr[j] = ff_nelly_dequantization_table[(1<<bits[j])-1+v]*pows[j];
  92. }
  93. }
  94. memset(&aptr[NELLY_FILL_LEN], 0,
  95. (NELLY_BUF_LEN - NELLY_FILL_LEN) * sizeof(float));
  96. s->imdct_ctx.imdct_half(&s->imdct_ctx, s->imdct_out, aptr);
  97. s->dsp.vector_fmul_window(aptr, s->imdct_prev + NELLY_BUF_LEN/2, s->imdct_out, ff_sine_128, NELLY_BUF_LEN/2);
  98. FFSWAP(float *, s->imdct_out, s->imdct_prev);
  99. }
  100. }
  101. static av_cold int decode_init(AVCodecContext * avctx) {
  102. NellyMoserDecodeContext *s = avctx->priv_data;
  103. s->avctx = avctx;
  104. s->imdct_out = s->imdct_buf[0];
  105. s->imdct_prev = s->imdct_buf[1];
  106. av_lfg_init(&s->random_state, 0);
  107. ff_mdct_init(&s->imdct_ctx, 8, 1, 1.0);
  108. ff_dsputil_init(&s->dsp, avctx);
  109. if (avctx->request_sample_fmt == AV_SAMPLE_FMT_FLT) {
  110. s->scale_bias = 1.0/(32768*8);
  111. avctx->sample_fmt = AV_SAMPLE_FMT_FLT;
  112. } else {
  113. s->scale_bias = 1.0/(1*8);
  114. avctx->sample_fmt = AV_SAMPLE_FMT_S16;
  115. ff_fmt_convert_init(&s->fmt_conv, avctx);
  116. s->float_buf = av_mallocz(NELLY_SAMPLES * sizeof(*s->float_buf));
  117. if (!s->float_buf) {
  118. av_log(avctx, AV_LOG_ERROR, "error allocating float buffer\n");
  119. return AVERROR(ENOMEM);
  120. }
  121. }
  122. /* Generate overlap window */
  123. if (!ff_sine_128[127])
  124. ff_init_ff_sine_windows(7);
  125. avctx->channel_layout = AV_CH_LAYOUT_MONO;
  126. avcodec_get_frame_defaults(&s->frame);
  127. avctx->coded_frame = &s->frame;
  128. return 0;
  129. }
  130. static int decode_tag(AVCodecContext *avctx, void *data,
  131. int *got_frame_ptr, AVPacket *avpkt)
  132. {
  133. const uint8_t *buf = avpkt->data;
  134. const uint8_t *side=av_packet_get_side_data(avpkt, 'F', NULL);
  135. int buf_size = avpkt->size;
  136. NellyMoserDecodeContext *s = avctx->priv_data;
  137. int blocks, i, ret;
  138. int16_t *samples_s16;
  139. float *samples_flt;
  140. blocks = buf_size / NELLY_BLOCK_LEN;
  141. if (blocks <= 0) {
  142. av_log(avctx, AV_LOG_ERROR, "Packet is too small\n");
  143. return AVERROR_INVALIDDATA;
  144. }
  145. if (buf_size % NELLY_BLOCK_LEN) {
  146. av_log(avctx, AV_LOG_WARNING, "Leftover bytes: %d.\n",
  147. buf_size % NELLY_BLOCK_LEN);
  148. }
  149. /* Normal numbers of blocks for sample rates:
  150. * 8000 Hz - 1
  151. * 11025 Hz - 2
  152. * 16000 Hz - 3
  153. * 22050 Hz - 4
  154. * 44100 Hz - 8
  155. */
  156. if(side && blocks>1 && avctx->sample_rate%11025==0 && (1<<((side[0]>>2)&3)) == blocks)
  157. avctx->sample_rate= 11025*(blocks/2);
  158. /* get output buffer */
  159. s->frame.nb_samples = NELLY_SAMPLES * blocks;
  160. if ((ret = avctx->get_buffer(avctx, &s->frame)) < 0) {
  161. av_log(avctx, AV_LOG_ERROR, "get_buffer() failed\n");
  162. return ret;
  163. }
  164. samples_s16 = (int16_t *)s->frame.data[0];
  165. samples_flt = (float *)s->frame.data[0];
  166. for (i=0 ; i<blocks ; i++) {
  167. if (avctx->sample_fmt == AV_SAMPLE_FMT_FLT) {
  168. nelly_decode_block(s, buf, samples_flt);
  169. samples_flt += NELLY_SAMPLES;
  170. } else {
  171. nelly_decode_block(s, buf, s->float_buf);
  172. s->fmt_conv.float_to_int16(samples_s16, s->float_buf, NELLY_SAMPLES);
  173. samples_s16 += NELLY_SAMPLES;
  174. }
  175. buf += NELLY_BLOCK_LEN;
  176. }
  177. *got_frame_ptr = 1;
  178. *(AVFrame *)data = s->frame;
  179. return buf_size;
  180. }
  181. static av_cold int decode_end(AVCodecContext * avctx) {
  182. NellyMoserDecodeContext *s = avctx->priv_data;
  183. av_freep(&s->float_buf);
  184. ff_mdct_end(&s->imdct_ctx);
  185. return 0;
  186. }
  187. AVCodec ff_nellymoser_decoder = {
  188. .name = "nellymoser",
  189. .type = AVMEDIA_TYPE_AUDIO,
  190. .id = AV_CODEC_ID_NELLYMOSER,
  191. .priv_data_size = sizeof(NellyMoserDecodeContext),
  192. .init = decode_init,
  193. .close = decode_end,
  194. .decode = decode_tag,
  195. .capabilities = CODEC_CAP_DR1 | CODEC_CAP_PARAM_CHANGE,
  196. .long_name = NULL_IF_CONFIG_SMALL("Nellymoser Asao"),
  197. .sample_fmts = (const enum AVSampleFormat[]) { AV_SAMPLE_FMT_FLT,
  198. AV_SAMPLE_FMT_S16,
  199. AV_SAMPLE_FMT_NONE },
  200. };