You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

131 lines
5.0KB

  1. /*
  2. * ARM optimized DSP utils
  3. * Copyright (c) 2001 Lionel Ulmer
  4. *
  5. * This file is part of FFmpeg.
  6. *
  7. * FFmpeg is free software; you can redistribute it and/or
  8. * modify it under the terms of the GNU Lesser General Public
  9. * License as published by the Free Software Foundation; either
  10. * version 2.1 of the License, or (at your option) any later version.
  11. *
  12. * FFmpeg is distributed in the hope that it will be useful,
  13. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  15. * Lesser General Public License for more details.
  16. *
  17. * You should have received a copy of the GNU Lesser General Public
  18. * License along with FFmpeg; if not, write to the Free Software
  19. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  20. */
  21. #include "libavcodec/dsputil.h"
  22. #include "dsputil_arm.h"
  23. void j_rev_dct_ARM(DCTELEM *data);
  24. void simple_idct_ARM(DCTELEM *data);
  25. /* XXX: local hack */
  26. static void (*ff_put_pixels_clamped)(const DCTELEM *block, uint8_t *pixels, int line_size);
  27. static void (*ff_add_pixels_clamped)(const DCTELEM *block, uint8_t *pixels, int line_size);
  /* Pixel routines that are only declared here (no definition is visible in
   * this file). All share one signature: destination block, source pixels,
   * line size and height. */
  void put_pixels8_arm(uint8_t *block, const uint8_t *pixels,
                       int line_size, int h);
  void put_pixels8_x2_arm(uint8_t *block, const uint8_t *pixels,
                          int line_size, int h);
  void put_pixels8_y2_arm(uint8_t *block, const uint8_t *pixels,
                          int line_size, int h);
  void put_pixels8_xy2_arm(uint8_t *block, const uint8_t *pixels,
                           int line_size, int h);

  void put_no_rnd_pixels8_x2_arm(uint8_t *block, const uint8_t *pixels,
                                 int line_size, int h);
  void put_no_rnd_pixels8_y2_arm(uint8_t *block, const uint8_t *pixels,
                                 int line_size, int h);
  void put_no_rnd_pixels8_xy2_arm(uint8_t *block, const uint8_t *pixels,
                                  int line_size, int h);

  void put_pixels16_arm(uint8_t *block, const uint8_t *pixels,
                        int line_size, int h);
  36. CALL_2X_PIXELS(put_pixels16_x2_arm , put_pixels8_x2_arm , 8)
  37. CALL_2X_PIXELS(put_pixels16_y2_arm , put_pixels8_y2_arm , 8)
  38. CALL_2X_PIXELS(put_pixels16_xy2_arm, put_pixels8_xy2_arm, 8)
  39. CALL_2X_PIXELS(put_no_rnd_pixels16_x2_arm , put_no_rnd_pixels8_x2_arm , 8)
  40. CALL_2X_PIXELS(put_no_rnd_pixels16_y2_arm , put_no_rnd_pixels8_y2_arm , 8)
  41. CALL_2X_PIXELS(put_no_rnd_pixels16_xy2_arm, put_no_rnd_pixels8_xy2_arm, 8)
  /* Declared here only; nothing in the visible part of this file calls it. */
  void ff_add_pixels_clamped_ARM(short *block,
                                 unsigned char *dest,
                                 int line_size);
  44. /* XXX: these wrapper functions should be removed as soon as all IDCTs
  45. have been converted */
  46. static void j_rev_dct_ARM_put(uint8_t *dest, int line_size, DCTELEM *block)
  47. {
  48. j_rev_dct_ARM (block);
  49. ff_put_pixels_clamped(block, dest, line_size);
  50. }
  51. static void j_rev_dct_ARM_add(uint8_t *dest, int line_size, DCTELEM *block)
  52. {
  53. j_rev_dct_ARM (block);
  54. ff_add_pixels_clamped(block, dest, line_size);
  55. }
  56. static void simple_idct_ARM_put(uint8_t *dest, int line_size, DCTELEM *block)
  57. {
  58. simple_idct_ARM (block);
  59. ff_put_pixels_clamped(block, dest, line_size);
  60. }
  61. static void simple_idct_ARM_add(uint8_t *dest, int line_size, DCTELEM *block)
  62. {
  63. simple_idct_ARM (block);
  64. ff_add_pixels_clamped(block, dest, line_size);
  65. }
  66. int mm_support(void)
  67. {
  68. return HAVE_IWMMXT * FF_MM_IWMMXT;
  69. }
  70. void dsputil_init_arm(DSPContext* c, AVCodecContext *avctx)
  71. {
  72. ff_put_pixels_clamped = c->put_pixels_clamped;
  73. ff_add_pixels_clamped = c->add_pixels_clamped;
  74. if (avctx->lowres == 0) {
  75. if(avctx->idct_algo == FF_IDCT_AUTO ||
  76. avctx->idct_algo == FF_IDCT_ARM){
  77. c->idct_put= j_rev_dct_ARM_put;
  78. c->idct_add= j_rev_dct_ARM_add;
  79. c->idct = j_rev_dct_ARM;
  80. c->idct_permutation_type= FF_LIBMPEG2_IDCT_PERM;
  81. } else if (avctx->idct_algo==FF_IDCT_SIMPLEARM){
  82. c->idct_put= simple_idct_ARM_put;
  83. c->idct_add= simple_idct_ARM_add;
  84. c->idct = simple_idct_ARM;
  85. c->idct_permutation_type= FF_NO_IDCT_PERM;
  86. }
  87. }
  88. c->put_pixels_tab[0][0] = put_pixels16_arm;
  89. c->put_pixels_tab[0][1] = put_pixels16_x2_arm;
  90. c->put_pixels_tab[0][2] = put_pixels16_y2_arm;
  91. c->put_pixels_tab[0][3] = put_pixels16_xy2_arm;
  92. c->put_no_rnd_pixels_tab[0][0] = put_pixels16_arm;
  93. c->put_no_rnd_pixels_tab[0][1] = put_no_rnd_pixels16_x2_arm;
  94. c->put_no_rnd_pixels_tab[0][2] = put_no_rnd_pixels16_y2_arm;
  95. c->put_no_rnd_pixels_tab[0][3] = put_no_rnd_pixels16_xy2_arm;
  96. c->put_pixels_tab[1][0] = put_pixels8_arm;
  97. c->put_pixels_tab[1][1] = put_pixels8_x2_arm;
  98. c->put_pixels_tab[1][2] = put_pixels8_y2_arm;
  99. c->put_pixels_tab[1][3] = put_pixels8_xy2_arm;
  100. c->put_no_rnd_pixels_tab[1][0] = put_pixels8_arm;
  101. c->put_no_rnd_pixels_tab[1][1] = put_no_rnd_pixels8_x2_arm;
  102. c->put_no_rnd_pixels_tab[1][2] = put_no_rnd_pixels8_y2_arm;
  103. c->put_no_rnd_pixels_tab[1][3] = put_no_rnd_pixels8_xy2_arm;
  104. if (HAVE_ARMV5TE) ff_dsputil_init_armv5te(c, avctx);
  105. if (HAVE_ARMV6) ff_dsputil_init_armv6(c, avctx);
  106. #if HAVE_IWMMXT
  107. dsputil_init_iwmmxt(c, avctx);
  108. #endif
  109. #if HAVE_ARMVFP
  110. ff_float_init_arm_vfp(c, avctx);
  111. #endif
  112. #if HAVE_NEON
  113. ff_dsputil_init_neon(c, avctx);
  114. #endif
  115. }