You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

227 lines
5.2KB

  1. /*
  2. * (I)DCT Transforms
  3. * Copyright (c) 2009 Peter Ross <pross@xvid.org>
  4. * Copyright (c) 2010 Alex Converse <alex.converse@gmail.com>
  5. * Copyright (c) 2010 Vitor Sessak
  6. *
  7. * This file is part of FFmpeg.
  8. *
  9. * FFmpeg is free software; you can redistribute it and/or
  10. * modify it under the terms of the GNU Lesser General Public
  11. * License as published by the Free Software Foundation; either
  12. * version 2.1 of the License, or (at your option) any later version.
  13. *
  14. * FFmpeg is distributed in the hope that it will be useful,
  15. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  16. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  17. * Lesser General Public License for more details.
  18. *
  19. * You should have received a copy of the GNU Lesser General Public
  20. * License along with FFmpeg; if not, write to the Free Software
  21. * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA
  22. */
  23. /**
  24. * @file
  25. * (Inverse) Discrete Cosine Transforms. These are also known as the
  26. * type II and type III DCTs respectively.
  27. */
  28. #include <math.h>
  29. #include "libavutil/mathematics.h"
  30. #include "fft.h"
  31. #include "x86/fft.h"
  32. #define DCT32_FLOAT
  33. #include "dct32.c"
  34. /* sin((M_PI * x / (2*n)) */
  35. #define SIN(s,n,x) (s->costab[(n) - (x)])
  36. /* cos((M_PI * x / (2*n)) */
  37. #define COS(s,n,x) (s->costab[x])
  38. static void ff_dst_calc_I_c(DCTContext *ctx, FFTSample *data)
  39. {
  40. int n = 1 << ctx->nbits;
  41. int i;
  42. data[0] = 0;
  43. for(i = 1; i < n/2; i++) {
  44. float tmp1 = data[i ];
  45. float tmp2 = data[n - i];
  46. float s = SIN(ctx, n, 2*i);
  47. s *= tmp1 + tmp2;
  48. tmp1 = (tmp1 - tmp2) * 0.5f;
  49. data[i ] = s + tmp1;
  50. data[n - i] = s - tmp1;
  51. }
  52. data[n/2] *= 2;
  53. ff_rdft_calc(&ctx->rdft, data);
  54. data[0] *= 0.5f;
  55. for(i = 1; i < n-2; i += 2) {
  56. data[i + 1] += data[i - 1];
  57. data[i ] = -data[i + 2];
  58. }
  59. data[n-1] = 0;
  60. }
  61. static void ff_dct_calc_I_c(DCTContext *ctx, FFTSample *data)
  62. {
  63. int n = 1 << ctx->nbits;
  64. int i;
  65. float next = -0.5f * (data[0] - data[n]);
  66. for(i = 0; i < n/2; i++) {
  67. float tmp1 = data[i ];
  68. float tmp2 = data[n - i];
  69. float s = SIN(ctx, n, 2*i);
  70. float c = COS(ctx, n, 2*i);
  71. c *= tmp1 - tmp2;
  72. s *= tmp1 - tmp2;
  73. next += c;
  74. tmp1 = (tmp1 + tmp2) * 0.5f;
  75. data[i ] = tmp1 - s;
  76. data[n - i] = tmp1 + s;
  77. }
  78. ff_rdft_calc(&ctx->rdft, data);
  79. data[n] = data[1];
  80. data[1] = next;
  81. for(i = 3; i <= n; i += 2)
  82. data[i] = data[i - 2] - data[i];
  83. }
  84. static void ff_dct_calc_III_c(DCTContext *ctx, FFTSample *data)
  85. {
  86. int n = 1 << ctx->nbits;
  87. int i;
  88. float next = data[n - 1];
  89. float inv_n = 1.0f / n;
  90. for (i = n - 2; i >= 2; i -= 2) {
  91. float val1 = data[i ];
  92. float val2 = data[i - 1] - data[i + 1];
  93. float c = COS(ctx, n, i);
  94. float s = SIN(ctx, n, i);
  95. data[i ] = c * val1 + s * val2;
  96. data[i + 1] = s * val1 - c * val2;
  97. }
  98. data[1] = 2 * next;
  99. ff_rdft_calc(&ctx->rdft, data);
  100. for (i = 0; i < n / 2; i++) {
  101. float tmp1 = data[i ] * inv_n;
  102. float tmp2 = data[n - i - 1] * inv_n;
  103. float csc = ctx->csc2[i] * (tmp1 - tmp2);
  104. tmp1 += tmp2;
  105. data[i ] = tmp1 + csc;
  106. data[n - i - 1] = tmp1 - csc;
  107. }
  108. }
  109. static void ff_dct_calc_II_c(DCTContext *ctx, FFTSample *data)
  110. {
  111. int n = 1 << ctx->nbits;
  112. int i;
  113. float next;
  114. for (i=0; i < n/2; i++) {
  115. float tmp1 = data[i ];
  116. float tmp2 = data[n - i - 1];
  117. float s = SIN(ctx, n, 2*i + 1);
  118. s *= tmp1 - tmp2;
  119. tmp1 = (tmp1 + tmp2) * 0.5f;
  120. data[i ] = tmp1 + s;
  121. data[n-i-1] = tmp1 - s;
  122. }
  123. ff_rdft_calc(&ctx->rdft, data);
  124. next = data[1] * 0.5;
  125. data[1] *= -1;
  126. for (i = n - 2; i >= 0; i -= 2) {
  127. float inr = data[i ];
  128. float ini = data[i + 1];
  129. float c = COS(ctx, n, i);
  130. float s = SIN(ctx, n, i);
  131. data[i ] = c * inr + s * ini;
  132. data[i+1] = next;
  133. next += s * inr - c * ini;
  134. }
  135. }
  136. static void dct32_func(DCTContext *ctx, FFTSample *data)
  137. {
  138. ctx->dct32(data, data);
  139. }
  140. void ff_dct_calc(DCTContext *s, FFTSample *data)
  141. {
  142. s->dct_calc(s, data);
  143. }
  144. av_cold int ff_dct_init(DCTContext *s, int nbits, enum DCTTransformType inverse)
  145. {
  146. int n = 1 << nbits;
  147. int i;
  148. s->nbits = nbits;
  149. s->inverse = inverse;
  150. ff_init_ff_cos_tabs(nbits+2);
  151. s->costab = ff_cos_tabs[nbits+2];
  152. s->csc2 = av_malloc(n/2 * sizeof(FFTSample));
  153. if (ff_rdft_init(&s->rdft, nbits, inverse == DCT_III) < 0) {
  154. av_free(s->csc2);
  155. return -1;
  156. }
  157. for (i = 0; i < n/2; i++)
  158. s->csc2[i] = 0.5 / sin((M_PI / (2*n) * (2*i + 1)));
  159. switch(inverse) {
  160. case DCT_I : s->dct_calc = ff_dct_calc_I_c; break;
  161. case DCT_II : s->dct_calc = ff_dct_calc_II_c ; break;
  162. case DCT_III: s->dct_calc = ff_dct_calc_III_c; break;
  163. case DST_I : s->dct_calc = ff_dst_calc_I_c; break;
  164. }
  165. if (inverse == DCT_II && nbits == 5)
  166. s->dct_calc = dct32_func;
  167. s->dct32 = dct32;
  168. if (HAVE_MMX) ff_dct_init_mmx(s);
  169. return 0;
  170. }
  171. av_cold void ff_dct_end(DCTContext *s)
  172. {
  173. ff_rdft_end(&s->rdft);
  174. av_free(s->csc2);
  175. }