You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

273 lines
7.7KB

  1. /*
  2. * RealAudio 2.0 (28.8K)
  3. * Copyright (c) 2003 the ffmpeg project
  4. *
  5. * This file is part of FFmpeg.
  6. *
  7. * FFmpeg is free software; you can redistribute it and/or
  8. * modify it under the terms of the GNU Lesser General Public
  9. * License as published by the Free Software Foundation; either
  10. * version 2.1 of the License, or (at your option) any later version.
  11. *
  12. * FFmpeg is distributed in the hope that it will be useful,
  13. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  15. * Lesser General Public License for more details.
  16. *
  17. * You should have received a copy of the GNU Lesser General Public
  18. * License along with FFmpeg; if not, write to the Free Software
  19. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  20. */
  21. #include "avcodec.h"
  22. #define ALT_BITSTREAM_READER_LE
  23. #include "bitstream.h"
  24. #include "ra288.h"
  25. typedef struct {
  26. float sp_lpc[36]; ///< LPC coefficients for speech data (spec: A)
  27. float gain_lpc[10]; ///< LPC coefficients for gain (spec: GB)
  28. float sp_hist[111]; ///< Speech data history (spec: SB)
  29. /** Speech part of the gain autocorrelation (spec: REXP) */
  30. float sp_rec[37];
  31. float gain_hist[38]; ///< Log-gain history (spec: SBLG)
  32. /** Recursive part of the gain autocorrelation (spec: REXPLG) */
  33. float gain_rec[11];
  34. float sp_block[41]; ///< Speech data of four blocks (spec: STTMP)
  35. float gain_block[10]; ///< Gain data of four blocks (spec: GSTATE)
  36. } RA288Context;
  37. static av_cold int ra288_decode_init(AVCodecContext *avctx)
  38. {
  39. avctx->sample_fmt = SAMPLE_FMT_S16;
  40. return 0;
  41. }
  42. static inline float scalar_product_float(const float * v1, const float * v2,
  43. int size)
  44. {
  45. float res = 0.;
  46. while (size--)
  47. res += *v1++ * *v2++;
  48. return res;
  49. }
  50. static void colmult(float *tgt, const float *m1, const float *m2, int n)
  51. {
  52. while (n--)
  53. *tgt++ = *m1++ * *m2++;
  54. }
  55. static void decode(RA288Context *ractx, float gain, int cb_coef)
  56. {
  57. int i, j;
  58. double sumsum;
  59. float sum, buffer[5];
  60. memmove(ractx->sp_block + 5, ractx->sp_block, 36*sizeof(*ractx->sp_block));
  61. for (i=4; i >= 0; i--)
  62. ractx->sp_block[i] = -scalar_product_float(ractx->sp_block + i + 1,
  63. ractx->sp_lpc, 36);
  64. /* block 46 of G.728 spec */
  65. sum = 32. - scalar_product_float(ractx->gain_lpc, ractx->gain_block, 10);
  66. /* block 47 of G.728 spec */
  67. sum = av_clipf(sum, 0, 60);
  68. /* block 48 of G.728 spec */
  69. sumsum = exp(sum * 0.1151292546497) * gain; /* pow(10.0,sum/20)*gain */
  70. for (i=0; i < 5; i++)
  71. buffer[i] = codetable[cb_coef][i] * sumsum;
  72. sum = scalar_product_float(buffer, buffer, 5) / 5;
  73. sum = FFMAX(sum, 1);
  74. /* shift and store */
  75. memmove(ractx->gain_block, ractx->gain_block - 1,
  76. 10 * sizeof(*ractx->gain_block));
  77. *ractx->gain_block = 10 * log10(sum) - 32;
  78. for (i=1; i < 5; i++)
  79. for (j=i-1; j >= 0; j--)
  80. buffer[i] -= ractx->sp_lpc[i-j-1] * buffer[j];
  81. /* output */
  82. for (i=0; i < 5; i++)
  83. ractx->sp_block[4-i] =
  84. av_clipf(ractx->sp_block[4-i] + buffer[i], -4095, 4095);
  85. }
  86. /**
  87. * Converts autocorrelation coefficients to LPC coefficients using the
  88. * Levinson-Durbin algorithm. See blocks 37 and 50 of the G.728 specification.
  89. *
  90. * @return 0 if success, -1 if fail
  91. */
  92. static int eval_lpc_coeffs(const float *in, float *tgt, int n)
  93. {
  94. int i, j;
  95. double f0, f1, f2;
  96. if (in[n] == 0)
  97. return -1;
  98. if ((f0 = *in) <= 0)
  99. return -1;
  100. in--; // To avoid a -1 subtraction in the inner loop
  101. for (i=1; i <= n; i++) {
  102. f1 = in[i+1];
  103. for (j=0; j < i - 1; j++)
  104. f1 += in[i-j]*tgt[j];
  105. tgt[i-1] = f2 = -f1/f0;
  106. for (j=0; j < i >> 1; j++) {
  107. float temp = tgt[j] + tgt[i-j-2]*f2;
  108. tgt[i-j-2] += tgt[j]*f2;
  109. tgt[j] = temp;
  110. }
  111. if ((f0 += f1*f2) < 0)
  112. return -1;
  113. }
  114. return 0;
  115. }
  116. static void prodsum(float *tgt, const float *src, int len, int n)
  117. {
  118. for (; n >= 0; n--)
  119. tgt[n] = scalar_product_float(src, src - n, len);
  120. }
  121. /**
  122. * Hybrid window filtering. See blocks 36 and 49 of the G.728 specification.
  123. *
  124. * @note This function is slightly different from that described in the spec.
  125. * It expects in[0] to be the newest sample and in[n-1] to be the oldest
  126. * one stored. The spec has in the more ordinary way (in[0] the oldest
  127. * and in[n-1] the newest).
  128. *
  129. * @param order the order of the filter
  130. * @param n the length of the input
  131. * @param non_rec the number of non-recursive samples
  132. * @param out the filter output
  133. * @param in pointer to the input of the filter
  134. * @param hist pointer to the input history of the filter. It is updated by
  135. * this function.
  136. * @param out pointer to the non-recursive part of the output
  137. * @param out2 pointer to the recursive part of the output
  138. * @param window pointer to the windowing function table
  139. */
  140. static void do_hybrid_window(int order, int n, int non_rec, const float *in,
  141. float *out, float *hist, float *out2,
  142. const float *window)
  143. {
  144. int i;
  145. float buffer1[order + 1];
  146. float buffer2[order + 1];
  147. float work[order + n + non_rec];
  148. /* update history */
  149. memmove(hist, hist + n, (order + non_rec)*sizeof(*hist));
  150. for (i=0; i < n; i++)
  151. hist[order + non_rec + i] = in[n-i-1];
  152. colmult(work, window, hist, order + n + non_rec);
  153. prodsum(buffer1, work + order , n , order);
  154. prodsum(buffer2, work + order + n, non_rec, order);
  155. for (i=0; i <= order; i++) {
  156. out2[i] = out2[i] * 0.5625 + buffer1[i];
  157. out [i] = out2[i] + buffer2[i];
  158. }
  159. /* Multiply by the white noise correcting factor (WNCF) */
  160. *out *= 257./256.;
  161. }
  162. /**
  163. * Backward synthesis filter. Find the LPC coefficients from past speech data.
  164. */
  165. static void backward_filter(RA288Context *ractx)
  166. {
  167. float temp1[37]; // RTMP in the spec
  168. float temp2[11]; // GPTPMP in the spec
  169. do_hybrid_window(36, 40, 35, ractx->sp_block, temp1, ractx->sp_hist,
  170. ractx->sp_rec, syn_window);
  171. if (!eval_lpc_coeffs(temp1, ractx->sp_lpc, 36))
  172. colmult(ractx->sp_lpc, ractx->sp_lpc, syn_bw_tab, 36);
  173. do_hybrid_window(10, 8, 20, ractx->gain_block, temp2, ractx->gain_hist,
  174. ractx->gain_rec, gain_window);
  175. if (!eval_lpc_coeffs(temp2, ractx->gain_lpc, 10))
  176. colmult(ractx->gain_lpc, ractx->gain_lpc, gain_bw_tab, 10);
  177. }
  178. static int ra288_decode_frame(AVCodecContext * avctx, void *data,
  179. int *data_size, const uint8_t * buf,
  180. int buf_size)
  181. {
  182. int16_t *out = data;
  183. int i, j;
  184. RA288Context *ractx = avctx->priv_data;
  185. GetBitContext gb;
  186. if (buf_size < avctx->block_align) {
  187. av_log(avctx, AV_LOG_ERROR,
  188. "Error! Input buffer is too small [%d<%d]\n",
  189. buf_size, avctx->block_align);
  190. return 0;
  191. }
  192. init_get_bits(&gb, buf, avctx->block_align * 8);
  193. for (i=0; i < 32; i++) {
  194. float gain = amptable[get_bits(&gb, 3)];
  195. int cb_coef = get_bits(&gb, 6 + (i&1));
  196. decode(ractx, gain, cb_coef);
  197. for (j=0; j < 5; j++)
  198. *(out++) = 8 * ractx->sp_block[4 - j];
  199. if ((i & 7) == 3)
  200. backward_filter(ractx);
  201. }
  202. *data_size = (char *)out - (char *)data;
  203. return avctx->block_align;
  204. }
  205. AVCodec ra_288_decoder =
  206. {
  207. "real_288",
  208. CODEC_TYPE_AUDIO,
  209. CODEC_ID_RA_288,
  210. sizeof(RA288Context),
  211. ra288_decode_init,
  212. NULL,
  213. NULL,
  214. ra288_decode_frame,
  215. .long_name = NULL_IF_CONFIG_SMALL("RealAudio 2.0 (28.8K)"),
  216. };