You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

122 lines
5.2KB

  1. /*
  2. * ARM optimized DSP utils
  3. * Copyright (c) 2001 Lionel Ulmer
  4. *
  5. * This file is part of FFmpeg.
  6. *
  7. * FFmpeg is free software; you can redistribute it and/or
  8. * modify it under the terms of the GNU Lesser General Public
  9. * License as published by the Free Software Foundation; either
  10. * version 2.1 of the License, or (at your option) any later version.
  11. *
  12. * FFmpeg is distributed in the hope that it will be useful,
  13. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  15. * Lesser General Public License for more details.
  16. *
  17. * You should have received a copy of the GNU Lesser General Public
  18. * License along with FFmpeg; if not, write to the Free Software
  19. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  20. */
  21. #include "libavcodec/dsputil.h"
  22. #include "dsputil_arm.h"
  23. void ff_j_rev_dct_arm(DCTELEM *data);
  24. void ff_simple_idct_arm(DCTELEM *data);
  25. /* XXX: local hack */
  26. static void (*ff_put_pixels_clamped)(const DCTELEM *block, uint8_t *pixels, int line_size);
  27. static void (*ff_add_pixels_clamped)(const DCTELEM *block, uint8_t *pixels, int line_size);
  28. void ff_put_pixels8_arm(uint8_t *block, const uint8_t *pixels, int line_size, int h);
  29. void ff_put_pixels8_x2_arm(uint8_t *block, const uint8_t *pixels, int line_size, int h);
  30. void ff_put_pixels8_y2_arm(uint8_t *block, const uint8_t *pixels, int line_size, int h);
  31. void ff_put_pixels8_xy2_arm(uint8_t *block, const uint8_t *pixels, int line_size, int h);
  32. void ff_put_no_rnd_pixels8_x2_arm(uint8_t *block, const uint8_t *pixels, int line_size, int h);
  33. void ff_put_no_rnd_pixels8_y2_arm(uint8_t *block, const uint8_t *pixels, int line_size, int h);
  34. void ff_put_no_rnd_pixels8_xy2_arm(uint8_t *block, const uint8_t *pixels, int line_size, int h);
  35. void ff_put_pixels16_arm(uint8_t *block, const uint8_t *pixels, int line_size, int h);
  36. CALL_2X_PIXELS(ff_put_pixels16_x2_arm, ff_put_pixels8_x2_arm, 8)
  37. CALL_2X_PIXELS(ff_put_pixels16_y2_arm, ff_put_pixels8_y2_arm, 8)
  38. CALL_2X_PIXELS(ff_put_pixels16_xy2_arm, ff_put_pixels8_xy2_arm, 8)
  39. CALL_2X_PIXELS(ff_put_no_rnd_pixels16_x2_arm, ff_put_no_rnd_pixels8_x2_arm, 8)
  40. CALL_2X_PIXELS(ff_put_no_rnd_pixels16_y2_arm, ff_put_no_rnd_pixels8_y2_arm, 8)
  41. CALL_2X_PIXELS(ff_put_no_rnd_pixels16_xy2_arm, ff_put_no_rnd_pixels8_xy2_arm,8)
  42. void ff_add_pixels_clamped_arm(const DCTELEM *block, uint8_t *dest,
  43. int line_size);
  44. /* XXX: those functions should be suppressed ASAP when all IDCTs are
  45. converted */
  46. static void j_rev_dct_arm_put(uint8_t *dest, int line_size, DCTELEM *block)
  47. {
  48. ff_j_rev_dct_arm (block);
  49. ff_put_pixels_clamped(block, dest, line_size);
  50. }
  51. static void j_rev_dct_arm_add(uint8_t *dest, int line_size, DCTELEM *block)
  52. {
  53. ff_j_rev_dct_arm (block);
  54. ff_add_pixels_clamped(block, dest, line_size);
  55. }
  56. static void simple_idct_arm_put(uint8_t *dest, int line_size, DCTELEM *block)
  57. {
  58. ff_simple_idct_arm (block);
  59. ff_put_pixels_clamped(block, dest, line_size);
  60. }
  61. static void simple_idct_arm_add(uint8_t *dest, int line_size, DCTELEM *block)
  62. {
  63. ff_simple_idct_arm (block);
  64. ff_add_pixels_clamped(block, dest, line_size);
  65. }
  66. void dsputil_init_arm(DSPContext* c, AVCodecContext *avctx)
  67. {
  68. ff_put_pixels_clamped = c->put_pixels_clamped;
  69. ff_add_pixels_clamped = c->add_pixels_clamped;
  70. if (!avctx->lowres) {
  71. if(avctx->idct_algo == FF_IDCT_AUTO ||
  72. avctx->idct_algo == FF_IDCT_ARM){
  73. c->idct_put = j_rev_dct_arm_put;
  74. c->idct_add = j_rev_dct_arm_add;
  75. c->idct = ff_j_rev_dct_arm;
  76. c->idct_permutation_type = FF_LIBMPEG2_IDCT_PERM;
  77. } else if (avctx->idct_algo == FF_IDCT_SIMPLEARM){
  78. c->idct_put = simple_idct_arm_put;
  79. c->idct_add = simple_idct_arm_add;
  80. c->idct = ff_simple_idct_arm;
  81. c->idct_permutation_type = FF_NO_IDCT_PERM;
  82. }
  83. }
  84. c->add_pixels_clamped = ff_add_pixels_clamped_arm;
  85. c->put_pixels_tab[0][0] = ff_put_pixels16_arm;
  86. c->put_pixels_tab[0][1] = ff_put_pixels16_x2_arm;
  87. c->put_pixels_tab[0][2] = ff_put_pixels16_y2_arm;
  88. c->put_pixels_tab[0][3] = ff_put_pixels16_xy2_arm;
  89. c->put_pixels_tab[1][0] = ff_put_pixels8_arm;
  90. c->put_pixels_tab[1][1] = ff_put_pixels8_x2_arm;
  91. c->put_pixels_tab[1][2] = ff_put_pixels8_y2_arm;
  92. c->put_pixels_tab[1][3] = ff_put_pixels8_xy2_arm;
  93. c->put_no_rnd_pixels_tab[0][0] = ff_put_pixels16_arm;
  94. c->put_no_rnd_pixels_tab[0][1] = ff_put_no_rnd_pixels16_x2_arm;
  95. c->put_no_rnd_pixels_tab[0][2] = ff_put_no_rnd_pixels16_y2_arm;
  96. c->put_no_rnd_pixels_tab[0][3] = ff_put_no_rnd_pixels16_xy2_arm;
  97. c->put_no_rnd_pixels_tab[1][0] = ff_put_pixels8_arm;
  98. c->put_no_rnd_pixels_tab[1][1] = ff_put_no_rnd_pixels8_x2_arm;
  99. c->put_no_rnd_pixels_tab[1][2] = ff_put_no_rnd_pixels8_y2_arm;
  100. c->put_no_rnd_pixels_tab[1][3] = ff_put_no_rnd_pixels8_xy2_arm;
  101. if (HAVE_ARMV5TE) ff_dsputil_init_armv5te(c, avctx);
  102. if (HAVE_ARMV6) ff_dsputil_init_armv6(c, avctx);
  103. if (HAVE_IWMMXT) ff_dsputil_init_iwmmxt(c, avctx);
  104. if (HAVE_ARMVFP) ff_dsputil_init_vfp(c, avctx);
  105. if (HAVE_NEON) ff_dsputil_init_neon(c, avctx);
  106. }