You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

126 lines
5.3KB

  1. /*
  2. * ARM optimized DSP utils
  3. * Copyright (c) 2001 Lionel Ulmer
  4. *
  5. * This file is part of Libav.
  6. *
  7. * Libav is free software; you can redistribute it and/or
  8. * modify it under the terms of the GNU Lesser General Public
  9. * License as published by the Free Software Foundation; either
  10. * version 2.1 of the License, or (at your option) any later version.
  11. *
  12. * Libav is distributed in the hope that it will be useful,
  13. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  15. * Lesser General Public License for more details.
  16. *
  17. * You should have received a copy of the GNU Lesser General Public
  18. * License along with Libav; if not, write to the Free Software
  19. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  20. */
  21. #include "libavutil/arm/cpu.h"
  22. #include "libavcodec/dsputil.h"
  23. #include "dsputil_arm.h"
  24. void ff_j_rev_dct_arm(int16_t *data);
  25. void ff_simple_idct_arm(int16_t *data);
  26. /* XXX: local hack */
  27. static void (*ff_put_pixels_clamped)(const int16_t *block, uint8_t *pixels, int line_size);
  28. static void (*ff_add_pixels_clamped)(const int16_t *block, uint8_t *pixels, int line_size);
  29. void ff_put_pixels8_arm(uint8_t *block, const uint8_t *pixels, int line_size, int h);
  30. void ff_put_pixels8_x2_arm(uint8_t *block, const uint8_t *pixels, int line_size, int h);
  31. void ff_put_pixels8_y2_arm(uint8_t *block, const uint8_t *pixels, int line_size, int h);
  32. void ff_put_pixels8_xy2_arm(uint8_t *block, const uint8_t *pixels, int line_size, int h);
  33. void ff_put_no_rnd_pixels8_x2_arm(uint8_t *block, const uint8_t *pixels, int line_size, int h);
  34. void ff_put_no_rnd_pixels8_y2_arm(uint8_t *block, const uint8_t *pixels, int line_size, int h);
  35. void ff_put_no_rnd_pixels8_xy2_arm(uint8_t *block, const uint8_t *pixels, int line_size, int h);
  36. void ff_put_pixels16_arm(uint8_t *block, const uint8_t *pixels, int line_size, int h);
  37. CALL_2X_PIXELS(ff_put_pixels16_x2_arm, ff_put_pixels8_x2_arm, 8)
  38. CALL_2X_PIXELS(ff_put_pixels16_y2_arm, ff_put_pixels8_y2_arm, 8)
  39. CALL_2X_PIXELS(ff_put_pixels16_xy2_arm, ff_put_pixels8_xy2_arm, 8)
  40. CALL_2X_PIXELS(ff_put_no_rnd_pixels16_x2_arm, ff_put_no_rnd_pixels8_x2_arm, 8)
  41. CALL_2X_PIXELS(ff_put_no_rnd_pixels16_y2_arm, ff_put_no_rnd_pixels8_y2_arm, 8)
  42. CALL_2X_PIXELS(ff_put_no_rnd_pixels16_xy2_arm, ff_put_no_rnd_pixels8_xy2_arm,8)
  43. void ff_add_pixels_clamped_arm(const int16_t *block, uint8_t *dest,
  44. int line_size);
/* XXX: these wrapper functions should be removed as soon as all IDCTs
   are converted */
  47. static void j_rev_dct_arm_put(uint8_t *dest, int line_size, int16_t *block)
  48. {
  49. ff_j_rev_dct_arm (block);
  50. ff_put_pixels_clamped(block, dest, line_size);
  51. }
  52. static void j_rev_dct_arm_add(uint8_t *dest, int line_size, int16_t *block)
  53. {
  54. ff_j_rev_dct_arm (block);
  55. ff_add_pixels_clamped(block, dest, line_size);
  56. }
  57. static void simple_idct_arm_put(uint8_t *dest, int line_size, int16_t *block)
  58. {
  59. ff_simple_idct_arm (block);
  60. ff_put_pixels_clamped(block, dest, line_size);
  61. }
  62. static void simple_idct_arm_add(uint8_t *dest, int line_size, int16_t *block)
  63. {
  64. ff_simple_idct_arm (block);
  65. ff_add_pixels_clamped(block, dest, line_size);
  66. }
  67. void ff_dsputil_init_arm(DSPContext* c, AVCodecContext *avctx)
  68. {
  69. const int high_bit_depth = avctx->bits_per_raw_sample > 8;
  70. int cpu_flags = av_get_cpu_flags();
  71. ff_put_pixels_clamped = c->put_pixels_clamped;
  72. ff_add_pixels_clamped = c->add_pixels_clamped;
  73. if (avctx->bits_per_raw_sample <= 8) {
  74. if(avctx->idct_algo == FF_IDCT_AUTO ||
  75. avctx->idct_algo == FF_IDCT_ARM){
  76. c->idct_put = j_rev_dct_arm_put;
  77. c->idct_add = j_rev_dct_arm_add;
  78. c->idct = ff_j_rev_dct_arm;
  79. c->idct_permutation_type = FF_LIBMPEG2_IDCT_PERM;
  80. } else if (avctx->idct_algo == FF_IDCT_SIMPLEARM){
  81. c->idct_put = simple_idct_arm_put;
  82. c->idct_add = simple_idct_arm_add;
  83. c->idct = ff_simple_idct_arm;
  84. c->idct_permutation_type = FF_NO_IDCT_PERM;
  85. }
  86. }
  87. c->add_pixels_clamped = ff_add_pixels_clamped_arm;
  88. if (!high_bit_depth) {
  89. c->put_pixels_tab[0][0] = ff_put_pixels16_arm;
  90. c->put_pixels_tab[0][1] = ff_put_pixels16_x2_arm;
  91. c->put_pixels_tab[0][2] = ff_put_pixels16_y2_arm;
  92. c->put_pixels_tab[0][3] = ff_put_pixels16_xy2_arm;
  93. c->put_pixels_tab[1][0] = ff_put_pixels8_arm;
  94. c->put_pixels_tab[1][1] = ff_put_pixels8_x2_arm;
  95. c->put_pixels_tab[1][2] = ff_put_pixels8_y2_arm;
  96. c->put_pixels_tab[1][3] = ff_put_pixels8_xy2_arm;
  97. c->put_no_rnd_pixels_tab[0][0] = ff_put_pixels16_arm;
  98. c->put_no_rnd_pixels_tab[0][1] = ff_put_no_rnd_pixels16_x2_arm;
  99. c->put_no_rnd_pixels_tab[0][2] = ff_put_no_rnd_pixels16_y2_arm;
  100. c->put_no_rnd_pixels_tab[0][3] = ff_put_no_rnd_pixels16_xy2_arm;
  101. c->put_no_rnd_pixels_tab[1][0] = ff_put_pixels8_arm;
  102. c->put_no_rnd_pixels_tab[1][1] = ff_put_no_rnd_pixels8_x2_arm;
  103. c->put_no_rnd_pixels_tab[1][2] = ff_put_no_rnd_pixels8_y2_arm;
  104. c->put_no_rnd_pixels_tab[1][3] = ff_put_no_rnd_pixels8_xy2_arm;
  105. }
  106. if (have_armv5te(cpu_flags)) ff_dsputil_init_armv5te(c, avctx);
  107. if (have_armv6(cpu_flags)) ff_dsputil_init_armv6(c, avctx);
  108. if (have_neon(cpu_flags)) ff_dsputil_init_neon(c, avctx);
  109. }