You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

74 lines
2.1KB

  1. /*
  2. * This file is part of Libav.
  3. *
  4. * Libav is free software; you can redistribute it and/or
  5. * modify it under the terms of the GNU Lesser General Public
  6. * License as published by the Free Software Foundation; either
  7. * version 2.1 of the License, or (at your option) any later version.
  8. *
  9. * Libav is distributed in the hope that it will be useful,
  10. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  11. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  12. * Lesser General Public License for more details.
  13. *
  14. * You should have received a copy of the GNU Lesser General Public
  15. * License along with Libav; if not, write to the Free Software
  16. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  17. */
  18. #include "config.h"
  19. #include "libavutil/attributes.h"
  20. #include "libavutil/cpu.h"
  21. #include "libavutil/x86/asm.h"
  22. #include "libavutil/x86/cpu.h"
  23. #include "libavcodec/svq1enc.h"
  24. #if HAVE_INLINE_ASM
  25. static int ssd_int8_vs_int16_mmx(const int8_t *pix1, const int16_t *pix2,
  26. int size)
  27. {
  28. int sum;
  29. x86_reg i = size;
  30. __asm__ volatile (
  31. "pxor %%mm4, %%mm4 \n"
  32. "1: \n"
  33. "sub $8, %0 \n"
  34. "movq (%2, %0), %%mm2 \n"
  35. "movq (%3, %0, 2), %%mm0 \n"
  36. "movq 8(%3, %0, 2), %%mm1 \n"
  37. "punpckhbw %%mm2, %%mm3 \n"
  38. "punpcklbw %%mm2, %%mm2 \n"
  39. "psraw $8, %%mm3 \n"
  40. "psraw $8, %%mm2 \n"
  41. "psubw %%mm3, %%mm1 \n"
  42. "psubw %%mm2, %%mm0 \n"
  43. "pmaddwd %%mm1, %%mm1 \n"
  44. "pmaddwd %%mm0, %%mm0 \n"
  45. "paddd %%mm1, %%mm4 \n"
  46. "paddd %%mm0, %%mm4 \n"
  47. "jg 1b \n"
  48. "movq %%mm4, %%mm3 \n"
  49. "psrlq $32, %%mm3 \n"
  50. "paddd %%mm3, %%mm4 \n"
  51. "movd %%mm4, %1 \n"
  52. : "+r" (i), "=r" (sum)
  53. : "r" (pix1), "r" (pix2));
  54. return sum;
  55. }
  56. #endif /* HAVE_INLINE_ASM */
  57. av_cold void ff_svq1enc_init_x86(SVQ1EncContext *c)
  58. {
  59. #if HAVE_INLINE_ASM
  60. int cpu_flags = av_get_cpu_flags();
  61. if (INLINE_MMX(cpu_flags)) {
  62. c->ssd_int8_vs_int16 = ssd_int8_vs_int16_mmx;
  63. }
  64. #endif /* HAVE_INLINE_ASM */
  65. }