You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

87 lines
2.7KB

  1. /*
  2. * This file is part of Libav.
  3. *
  4. * Libav is free software; you can redistribute it and/or
  5. * modify it under the terms of the GNU Lesser General Public
  6. * License as published by the Free Software Foundation; either
  7. * version 2.1 of the License, or (at your option) any later version.
  8. *
  9. * Libav is distributed in the hope that it will be useful,
  10. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  11. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  12. * Lesser General Public License for more details.
  13. *
  14. * You should have received a copy of the GNU Lesser General Public
  15. * License along with Libav; if not, write to the Free Software
  16. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  17. */
  18. #include "config.h"
  19. #include "fdct.h"
  20. #include "xvididct.h"
  21. #include "simple_idct.h"
  22. static const struct algo fdct_tab_arch[] = {
  23. #if HAVE_MMX_INLINE
  24. { "MMX", ff_fdct_mmx, FF_IDCT_PERM_NONE, AV_CPU_FLAG_MMX },
  25. #endif
  26. #if HAVE_MMXEXT_INLINE
  27. { "MMXEXT", ff_fdct_mmxext, FF_IDCT_PERM_NONE, AV_CPU_FLAG_MMXEXT },
  28. #endif
  29. #if HAVE_SSE2_INLINE
  30. { "SSE2", ff_fdct_sse2, FF_IDCT_PERM_NONE, AV_CPU_FLAG_SSE2 },
  31. #endif
  32. { 0 }
  33. };
  34. static const struct algo idct_tab_arch[] = {
  35. #if HAVE_MMX_INLINE
  36. { "SIMPLE-MMX", ff_simple_idct_mmx, FF_IDCT_PERM_SIMPLE, AV_CPU_FLAG_MMX },
  37. #endif
  38. #if CONFIG_MPEG4_DECODER
  39. #if HAVE_MMX_INLINE
  40. { "XVID-MMX", ff_xvid_idct_mmx, FF_IDCT_PERM_NONE, AV_CPU_FLAG_MMX, 1 },
  41. #endif
  42. #if HAVE_MMXEXT_INLINE
  43. { "XVID-MMXEXT", ff_xvid_idct_mmxext, FF_IDCT_PERM_NONE, AV_CPU_FLAG_MMXEXT, 1 },
  44. #endif
  45. #if HAVE_SSE2_INLINE
  46. { "XVID-SSE2", ff_xvid_idct_sse2, FF_IDCT_PERM_SSE2, AV_CPU_FLAG_SSE2, 1 },
  47. #endif
  48. #endif /* CONFIG_MPEG4_DECODER */
  49. { 0 }
  50. };
  51. static short idct_simple_mmx_perm[64] = {
  52. 0x00, 0x08, 0x04, 0x09, 0x01, 0x0C, 0x05, 0x0D,
  53. 0x10, 0x18, 0x14, 0x19, 0x11, 0x1C, 0x15, 0x1D,
  54. 0x20, 0x28, 0x24, 0x29, 0x21, 0x2C, 0x25, 0x2D,
  55. 0x12, 0x1A, 0x16, 0x1B, 0x13, 0x1E, 0x17, 0x1F,
  56. 0x02, 0x0A, 0x06, 0x0B, 0x03, 0x0E, 0x07, 0x0F,
  57. 0x30, 0x38, 0x34, 0x39, 0x31, 0x3C, 0x35, 0x3D,
  58. 0x22, 0x2A, 0x26, 0x2B, 0x23, 0x2E, 0x27, 0x2F,
  59. 0x32, 0x3A, 0x36, 0x3B, 0x33, 0x3E, 0x37, 0x3F,
  60. };
  61. static const uint8_t idct_sse2_row_perm[8] = { 0, 4, 1, 5, 2, 6, 3, 7 };
  62. static int permute_x86(int16_t dst[64], const int16_t src[64],
  63. enum idct_permutation_type perm_type)
  64. {
  65. int i;
  66. switch (perm_type) {
  67. case FF_IDCT_PERM_SIMPLE:
  68. for (i = 0; i < 64; i++)
  69. dst[idct_simple_mmx_perm[i]] = src[i];
  70. return 1;
  71. case FF_IDCT_PERM_SSE2:
  72. for (i = 0; i < 64; i++)
  73. dst[(i & 0x38) | idct_sse2_row_perm[i & 7]] = src[i];
  74. return 1;
  75. }
  76. return 0;
  77. }