You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

219 lines
7.6KB

  1. /**
  2. * Copyright (C) 2010 Mans Rullgard
  3. *
  4. * This file is part of Libav.
  5. *
  6. * Libav is free software; you can redistribute it and/or
  7. * modify it under the terms of the GNU Lesser General Public
  8. * License as published by the Free Software Foundation; either
  9. * version 2.1 of the License, or (at your option) any later version.
  10. *
  11. * Libav is distributed in the hope that it will be useful,
  12. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  13. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  14. * Lesser General Public License for more details.
  15. *
  16. * You should have received a copy of the GNU Lesser General Public
  17. * License along with Libav; if not, write to the Free Software
  18. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  19. */
  20. #include "asm.S"
  /*
   * rac_get_prob h, bs, buf, cw, pr, t0, t1
   *
   * Decodes one binary decision against the probability in pr.
   * NOTE(review): judging by the name this is one step of the range coder;
   * confirm against the C reference implementation.
   *
   *   h    in: current range value; out: size of the selected sub-range
   *   bs   in/out: bit counter; t0 is added to it, and 16 is subtracted
   *        whenever that addition produces a carry
   *   buf  in/out: input pointer; advanced by 2 when a halfword is fetched
   *   cw   in/out: code word
   *   pr   in: probability (callers in this file pass a byte value)
   *   t0   in: shift count; out: h << shift
   *   t1   scratch: receives the fetched halfword
   *
   * With H = h << t0 and split = ((H - 1) * pr + 256) >> 8, on exit:
   *   flags LT (cw <  split << 16, signed): h = split,     cw unchanged
   *   flags GE (cw >= split << 16, signed): h = H - split, cw -= split << 16
   * The flags of the final cmp are left set; callers in this file branch or
   * predicate on them right after the macro.
   */
  21. .macro rac_get_prob h, bs, buf, cw, pr, t0, t1
  22. adds \bs, \bs, \t0 /* bs += shift; the carry drives every cs-predicated instruction below */
  23. lsl \cw, \cw, \t0 /* cw <<= shift */
  24. lsl \t0, \h, \t0 /* t0 = H = h << shift */
  25. rsb \h, \pr, #256 /* h = 256 - pr */
  26. ldrhcs \t1, [\buf], #2 /* on carry: fetch a halfword and advance buf by 2 */
  27. smlabb \h, \t0, \pr, \h /* h = H * pr + (256 - pr), low halfwords of t0 and pr multiplied */
  28. rev16cs \t1, \t1 /* on carry: swap the two bytes of the fetched halfword */
  29. orrcs \cw, \cw, \t1, lsl \bs /* on carry: merge the new bits into cw at bit position bs */
  30. subcs \bs, \bs, #16 /* on carry: account for the 16 bits just added */
  31. lsr \h, \h, #8 /* h = split */
  32. cmp \cw, \h, lsl #16 /* compare cw with split << 16 */
  33. subge \cw, \cw, \h, lsl #16 /* GE: cw -= split << 16 */
  34. subge \h, \t0, \h /* GE: h = H - split */
  35. .endm
  /*
   * rac_get_128 h, bs, buf, cw, t0, t1
   *
   * Same sequence as rac_get_prob but without a probability operand: the
   * split is computed from the constant 128 instead.
   *
   *   h    in: current range value; out: size of the selected sub-range
   *   bs   in/out: bit counter; t0 is added to it, and 16 is subtracted
   *        whenever that addition produces a carry
   *   buf  in/out: input pointer; advanced by 2 when a halfword is fetched
   *   cw   in/out: code word
   *   t0   in: shift count; out: h << shift
   *   t1   scratch: receives the fetched halfword
   *
   * With H = h << t0 and split = (128 + (H << 7)) >> 8, on exit:
   *   flags LT (cw <  split << 16, signed): h = split,     cw unchanged
   *   flags GE (cw >= split << 16, signed): h = H - split, cw -= split << 16
   * The flags of the final cmp are left set for the caller.
   */
  36. .macro rac_get_128 h, bs, buf, cw, t0, t1
  37. adds \bs, \bs, \t0 /* bs += shift; the carry drives every cs-predicated instruction below */
  38. lsl \cw, \cw, \t0 /* cw <<= shift */
  39. lsl \t0, \h, \t0 /* t0 = H = h << shift */
  40. ldrhcs \t1, [\buf], #2 /* on carry: fetch a halfword and advance buf by 2 */
  41. mov \h, #128
  42. rev16cs \t1, \t1 /* on carry: swap the two bytes of the fetched halfword */
  43. add \h, \h, \t0, lsl #7 /* h = 128 + (H << 7) */
  44. orrcs \cw, \cw, \t1, lsl \bs /* on carry: merge the new bits into cw at bit position bs */
  45. subcs \bs, \bs, #16 /* on carry: account for the 16 bits just added */
  46. lsr \h, \h, #8 /* h = split */
  47. cmp \cw, \h, lsl #16 /* compare cw with split << 16 */
  48. subge \cw, \cw, \h, lsl #16 /* GE: cw -= split << 16 */
  49. subge \h, \t0, \h /* GE: h = H - split */
  50. .endm
  /*
   * ff_decode_block_coeffs_armv6
   *
   * Reads tokens with rac_get_prob / rac_get_128 and stores signed, scaled
   * 16-bit values through r1, until the index in r3 reaches 16 or the
   * decision at label 5 comes out LT.
   *
   * On entry (as used by the code below):
   *   r0        pointer to the decoder state; fields accessed here are
   *             +0 high, +4 bits, +8 buf, +12 a limit that buf is clamped
   *             to on exit, +16 code_word
   *             NOTE(review): +12 is presumably the end of the input buffer
   *   r1        base address for the halfword stores
   *   r2        base of a byte table addressed as r2 + 33 * i + {0, 11, 22}
   *             NOTE(review): looks like probs[i][3][11] - confirm with caller
   *   r3        starting index i
   *   stack     two words: token_prob pointer and qmul pointer
   * Returns r0 = final value of r3.
   *
   * Register roles inside the function:
   *   r4   pointer to the probability bytes for the next decisions
   *   r5 = high, r6 = bits, r7 = buf, r8 = code_word
   *   r9   shift count ff_vp56_norm_shift[r5], reloaded after every decode
   *        step; also scratch
   *   r10  scratch
   *   r11  word loaded from qmul; its low halfword is the current multiplier
   *   r12  value being decoded
   *   lr   address of ff_vp56_norm_shift
   *
   * Numeric local labels 1, 2 and 3 are each defined more than once; every
   * Nf / Nb reference binds to the nearest definition in that direction.
   * NOTE(review): flags are kept live across movrel in two places; movrel
   * comes from asm.S and is assumed not to alter the flags.
   */
  51. function ff_decode_block_coeffs_armv6, export=1
  52. push {r0,r1,r4-r11,lr} /* 11 words = 44 bytes; r0 and r1 are reloaded from [sp] and [sp, #4] later */
  53. movrel lr, X(ff_vp56_norm_shift)
  /* The stack arguments of the caller now sit 44 bytes above sp. */
  54. ldrd r4, r5, [sp, #44] @ token_prob, qmul
  55. cmp r3, #0 /* flags are consumed by pkhtbne below */
  56. ldr r11, [r5] /* r11 = 32-bit word at qmul */
  57. ldm r0, {r5-r7} @ high, bits, buf
  58. pkhtbne r11, r11, r11, asr #16 /* if i != 0: copy the top halfword of r11 into its bottom halfword */
  59. ldr r8, [r0, #16] @ code_word
  60. 0: /* loop head, one pass per index */
  61. ldrb r9, [lr, r5] /* r9 = ff_vp56_norm_shift[high] */
  62. add r3, r3, #1 /* i++; the zigzag lookups below therefore use zigzag_scan - 1 */
  63. ldrb r0, [r4, #1]
  64. rac_get_prob r5, r6, r7, r8, r0, r9, r10
  65. blt 2f /* LT: nothing is stored for this index (label 2 after the epilogue) */
  66. ldrb r9, [lr, r5]
  67. ldrb r0, [r4, #2]
  68. rac_get_prob r5, r6, r7, r8, r0, r9, r10
  69. ldrb r9, [lr, r5]
  70. bge 3f /* GE: larger values, decoded from label 3 after the epilogue */
  /*
   * LT: the magnitude is 1, so the stored value is the multiplier itself,
   * possibly negated. Lines 74-88 of the listing are the rac_get_128
   * sequence (h=r5, bs=r6, buf=r7, cw=r8, t0=r9, t1=r10) expanded inline and
   * interleaved with the r4 update and the zigzag lookup.
   */
  71. add r4, r3, r3, lsl #5 /* r4 = 33 * i */
  72. sxth r12, r11 /* r12 = sign-extended low halfword of r11 */
  73. add r4, r2, r4
  74. adds r6, r6, r9
  75. add r4, r4, #11 /* r4 = r2 + 33 * i + 11 */
  76. lsl r8, r8, r9
  77. ldrhcs r10, [r7], #2
  78. lsl r9, r5, r9
  79. mov r5, #128
  80. rev16cs r10, r10
  81. add r5, r5, r9, lsl #7
  82. orrcs r8, r8, r10, lsl r6
  83. subcs r6, r6, #16
  84. lsr r5, r5, #8
  85. cmp r8, r5, lsl #16 /* these flags stay live down to rsbge */
  86. movrel r10, zigzag_scan-1
  87. subge r8, r8, r5, lsl #16
  88. subge r5, r9, r5
  89. ldrb r10, [r10, r3] /* r10 = zigzag_scan[i - 1], a byte offset */
  90. rsbge r12, r12, #0 /* GE: negate the value */
  91. cmp r3, #16
  92. strh r12, [r1, r10]
  93. bge 6f /* i >= 16: finish */
  94. 5: /* after a stored value: decide whether to continue */
  95. ldrb r9, [lr, r5]
  96. ldrb r0, [r4]
  97. rac_get_prob r5, r6, r7, r8, r0, r9, r10
  98. pkhtb r11, r11, r11, asr #16 /* from now on the low halfword of r11 equals its top halfword */
  99. bge 0b /* GE: decode another token; LT: fall through and finish */
  100. 6: /* write the decoder state back and return */
  101. ldr r0, [sp] /* r0 = state pointer saved by the push */
  102. ldr r9, [r0, #12]
  103. cmp r7, r9
  104. movhi r7, r9 /* clamp buf to the limit at offset 12 (unsigned compare) */
  105. stm r0, {r5-r7} @ high, bits, buf
  106. str r8, [r0, #16] @ code_word
  107. add sp, sp, #8 /* drop the saved r0 and r1 */
  108. mov r0, r3 /* return value = i */
  109. pop {r4-r11,pc}
  110. 2: /* reached from line 65 of the listing: no value stored */
  111. add r4, r3, r3, lsl #5
  112. cmp r3, #16 /* flags are consumed by bne below */
  113. add r4, r2, r4 /* r4 = r2 + 33 * i */
  114. pkhtb r11, r11, r11, asr #16 /* switch the multiplier to the top halfword */
  115. bne 0b /* i != 16: next token */
  116. b 6b
  117. 3: /* reached from line 70 of the listing: magnitude is at least 2 */
  118. ldrb r0, [r4, #3]
  119. rac_get_prob r5, r6, r7, r8, r0, r9, r10
  120. ldrb r9, [lr, r5]
  121. bge 1f
  122. mov r12, #2 /* magnitude 2, 3 or 4 */
  123. ldrb r0, [r4, #4]
  124. rac_get_prob r5, r6, r7, r8, r0, r9, r10
  125. addge r12, #1
  126. ldrb r9, [lr, r5]
  127. blt 4f /* LT: magnitude is 2 */
  128. ldrb r0, [r4, #5]
  129. rac_get_prob r5, r6, r7, r8, r0, r9, r10
  130. addge r12, #1 /* magnitude 3 or 4 */
  131. ldrb r9, [lr, r5]
  132. b 4f
  133. 1: /* reached from line 121 of the listing */
  134. ldrb r0, [r4, #6]
  135. rac_get_prob r5, r6, r7, r8, r0, r9, r10
  136. ldrb r9, [lr, r5]
  137. bge 3f /* GE: table-driven path (second label 3) */
  138. ldrb r0, [r4, #7]
  139. rac_get_prob r5, r6, r7, r8, r0, r9, r10
  140. ldrb r9, [lr, r5]
  141. bge 2f
  142. mov r12, #5 /* magnitude 5 or 6: one extra decision with fixed probability 159 */
  143. mov r0, #159
  144. rac_get_prob r5, r6, r7, r8, r0, r9, r10
  145. addge r12, r12, #1
  146. ldrb r9, [lr, r5]
  147. b 4f
  148. 2: /* reached from line 141 of the listing: magnitude 7..10 */
  149. mov r12, #7
  150. mov r0, #165 /* first extra decision, fixed probability 165, adds 2 */
  151. rac_get_prob r5, r6, r7, r8, r0, r9, r10
  152. addge r12, r12, #2
  153. ldrb r9, [lr, r5]
  154. mov r0, #145 /* second extra decision, fixed probability 145, adds 1 */
  155. rac_get_prob r5, r6, r7, r8, r0, r9, r10
  156. addge r12, r12, #1
  157. ldrb r9, [lr, r5]
  158. b 4f
  159. 3: /* reached from line 137 of the listing: two decisions select a table index 0..3 */
  160. ldrb r0, [r4, #8]
  161. rac_get_prob r5, r6, r7, r8, r0, r9, r10
  162. addge r4, r4, #1 /* GE: the next load reads offset 10 instead of 9 */
  163. ldrb r9, [lr, r5]
  164. movge r12, #2
  165. movlt r12, #0
  166. ldrb r0, [r4, #9]
  167. rac_get_prob r5, r6, r7, r8, r0, r9, r10
  168. mov r9, #8
  169. addge r12, r12, #1 /* r12 = table index 0..3 */
  170. movrel r4, X(ff_vp8_dct_cat_prob)
  171. lsl r9, r9, r12 /* r9 = 8 << index */
  172. ldr r4, [r4, r12, lsl #2] /* r4 = ff_vp8_dct_cat_prob[index], a pointer to probability bytes */
  173. add r12, r9, #3 /* base magnitude = 3 + (8 << index) */
  174. mov r1, #0 /* r1 is reused as the extra-bits accumulator, restored below */
  175. ldrb r0, [r4], #1 /* first probability of the list */
  176. 1: /* one decision per probability byte until a zero byte is read */
  177. ldrb r9, [lr, r5]
  178. lsl r1, r1, #1
  179. rac_get_prob r5, r6, r7, r8, r0, r9, r10
  180. ldrb r0, [r4], #1 /* next probability; ldrb leaves the macro flags intact */
  181. addge r1, r1, #1 /* GE: set the low bit of the accumulator */
  182. cmp r0, #0
  183. bne 1b
  184. ldrb r9, [lr, r5]
  185. add r12, r12, r1 /* magnitude = base + extra bits */
  186. ldr r1, [sp, #4] /* restore the store base saved by the push */
  187. 4: /* common tail: r12 = magnitude, r9 = shift for the next decode step */
  188. add r4, r3, r3, lsl #5
  189. add r4, r2, r4
  190. add r4, r4, #22 /* r4 = r2 + 33 * i + 22 */
  191. rac_get_128 r5, r6, r7, r8, r9, r10
  192. rsbge r12, r12, #0 /* GE: negate the value */
  193. smulbb r12, r12, r11 /* scale by the low halfword of r11 */
  194. movrel r9, zigzag_scan-1
  195. ldrb r9, [r9, r3] /* r9 = zigzag_scan[i - 1], a byte offset */
  196. cmp r3, #16
  197. strh r12, [r1, r9]
  198. bge 6b /* i >= 16: finish */
  199. b 5b
  200. endfunc
  /*
   * Byte offsets used by the strh stores in ff_decode_block_coeffs_armv6,
   * which reads this table as zigzag_scan - 1 + r3 after r3 has already been
   * incremented, i.e. entry r3 - 1.
   * NOTE(review): the values look like 2 * the usual 4x4 zigzag order
   * (16-bit elements) - confirm against the C table.
   */
  201. .section .rodata
  202. zigzag_scan:
  203. .byte 0, 2, 8, 16
  204. .byte 10, 4, 6, 12
  205. .byte 18, 24, 26, 20
  206. .byte 14, 22, 28, 30