You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

127 lines
5.3KB

  1. /*
  2. * ARM optimized DSP utils
  3. * Copyright (c) 2001 Lionel Ulmer
  4. *
  5. * This file is part of FFmpeg.
  6. *
  7. * FFmpeg is free software; you can redistribute it and/or
  8. * modify it under the terms of the GNU Lesser General Public
  9. * License as published by the Free Software Foundation; either
  10. * version 2.1 of the License, or (at your option) any later version.
  11. *
  12. * FFmpeg is distributed in the hope that it will be useful,
  13. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  15. * Lesser General Public License for more details.
  16. *
  17. * You should have received a copy of the GNU Lesser General Public
  18. * License along with FFmpeg; if not, write to the Free Software
  19. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  20. */
  21. #include "libavcodec/dsputil.h"
  22. #include "dsputil_arm.h"
  23. void ff_j_rev_dct_arm(DCTELEM *data);
  24. void ff_simple_idct_arm(DCTELEM *data);
  25. /* XXX: local hack */
  26. static void (*ff_put_pixels_clamped)(const DCTELEM *block, uint8_t *pixels, int line_size);
  27. static void (*ff_add_pixels_clamped)(const DCTELEM *block, uint8_t *pixels, int line_size);
  28. void ff_put_pixels8_arm(uint8_t *block, const uint8_t *pixels, int line_size, int h);
  29. void ff_put_pixels8_x2_arm(uint8_t *block, const uint8_t *pixels, int line_size, int h);
  30. void ff_put_pixels8_y2_arm(uint8_t *block, const uint8_t *pixels, int line_size, int h);
  31. void ff_put_pixels8_xy2_arm(uint8_t *block, const uint8_t *pixels, int line_size, int h);
  32. void ff_put_no_rnd_pixels8_x2_arm(uint8_t *block, const uint8_t *pixels, int line_size, int h);
  33. void ff_put_no_rnd_pixels8_y2_arm(uint8_t *block, const uint8_t *pixels, int line_size, int h);
  34. void ff_put_no_rnd_pixels8_xy2_arm(uint8_t *block, const uint8_t *pixels, int line_size, int h);
  35. void ff_put_pixels16_arm(uint8_t *block, const uint8_t *pixels, int line_size, int h);
  36. CALL_2X_PIXELS(ff_put_pixels16_x2_arm, ff_put_pixels8_x2_arm, 8)
  37. CALL_2X_PIXELS(ff_put_pixels16_y2_arm, ff_put_pixels8_y2_arm, 8)
  38. CALL_2X_PIXELS(ff_put_pixels16_xy2_arm, ff_put_pixels8_xy2_arm, 8)
  39. CALL_2X_PIXELS(ff_put_no_rnd_pixels16_x2_arm, ff_put_no_rnd_pixels8_x2_arm, 8)
  40. CALL_2X_PIXELS(ff_put_no_rnd_pixels16_y2_arm, ff_put_no_rnd_pixels8_y2_arm, 8)
  41. CALL_2X_PIXELS(ff_put_no_rnd_pixels16_xy2_arm, ff_put_no_rnd_pixels8_xy2_arm,8)
  42. void ff_add_pixels_clamped_arm(const DCTELEM *block, uint8_t *dest,
  43. int line_size);
  44. /* XXX: those functions should be suppressed ASAP when all IDCTs are
  45. converted */
  46. static void j_rev_dct_arm_put(uint8_t *dest, int line_size, DCTELEM *block)
  47. {
  48. ff_j_rev_dct_arm (block);
  49. ff_put_pixels_clamped(block, dest, line_size);
  50. }
  51. static void j_rev_dct_arm_add(uint8_t *dest, int line_size, DCTELEM *block)
  52. {
  53. ff_j_rev_dct_arm (block);
  54. ff_add_pixels_clamped(block, dest, line_size);
  55. }
  56. static void simple_idct_arm_put(uint8_t *dest, int line_size, DCTELEM *block)
  57. {
  58. ff_simple_idct_arm (block);
  59. ff_put_pixels_clamped(block, dest, line_size);
  60. }
  61. static void simple_idct_arm_add(uint8_t *dest, int line_size, DCTELEM *block)
  62. {
  63. ff_simple_idct_arm (block);
  64. ff_add_pixels_clamped(block, dest, line_size);
  65. }
  66. int mm_support(void)
  67. {
  68. return HAVE_IWMMXT * FF_MM_IWMMXT;
  69. }
  70. void dsputil_init_arm(DSPContext* c, AVCodecContext *avctx)
  71. {
  72. ff_put_pixels_clamped = c->put_pixels_clamped;
  73. ff_add_pixels_clamped = c->add_pixels_clamped;
  74. if (!avctx->lowres) {
  75. if(avctx->idct_algo == FF_IDCT_AUTO ||
  76. avctx->idct_algo == FF_IDCT_ARM){
  77. c->idct_put = j_rev_dct_arm_put;
  78. c->idct_add = j_rev_dct_arm_add;
  79. c->idct = ff_j_rev_dct_arm;
  80. c->idct_permutation_type = FF_LIBMPEG2_IDCT_PERM;
  81. } else if (avctx->idct_algo == FF_IDCT_SIMPLEARM){
  82. c->idct_put = simple_idct_arm_put;
  83. c->idct_add = simple_idct_arm_add;
  84. c->idct = ff_simple_idct_arm;
  85. c->idct_permutation_type = FF_NO_IDCT_PERM;
  86. }
  87. }
  88. c->add_pixels_clamped = ff_add_pixels_clamped_arm;
  89. c->put_pixels_tab[0][0] = ff_put_pixels16_arm;
  90. c->put_pixels_tab[0][1] = ff_put_pixels16_x2_arm;
  91. c->put_pixels_tab[0][2] = ff_put_pixels16_y2_arm;
  92. c->put_pixels_tab[0][3] = ff_put_pixels16_xy2_arm;
  93. c->put_pixels_tab[1][0] = ff_put_pixels8_arm;
  94. c->put_pixels_tab[1][1] = ff_put_pixels8_x2_arm;
  95. c->put_pixels_tab[1][2] = ff_put_pixels8_y2_arm;
  96. c->put_pixels_tab[1][3] = ff_put_pixels8_xy2_arm;
  97. c->put_no_rnd_pixels_tab[0][0] = ff_put_pixels16_arm;
  98. c->put_no_rnd_pixels_tab[0][1] = ff_put_no_rnd_pixels16_x2_arm;
  99. c->put_no_rnd_pixels_tab[0][2] = ff_put_no_rnd_pixels16_y2_arm;
  100. c->put_no_rnd_pixels_tab[0][3] = ff_put_no_rnd_pixels16_xy2_arm;
  101. c->put_no_rnd_pixels_tab[1][0] = ff_put_pixels8_arm;
  102. c->put_no_rnd_pixels_tab[1][1] = ff_put_no_rnd_pixels8_x2_arm;
  103. c->put_no_rnd_pixels_tab[1][2] = ff_put_no_rnd_pixels8_y2_arm;
  104. c->put_no_rnd_pixels_tab[1][3] = ff_put_no_rnd_pixels8_xy2_arm;
  105. if (HAVE_ARMV5TE) ff_dsputil_init_armv5te(c, avctx);
  106. if (HAVE_ARMV6) ff_dsputil_init_armv6(c, avctx);
  107. if (HAVE_IWMMXT) ff_dsputil_init_iwmmxt(c, avctx);
  108. if (HAVE_ARMVFP) ff_dsputil_init_vfp(c, avctx);
  109. if (HAVE_NEON) ff_dsputil_init_neon(c, avctx);
  110. }