You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

221 lines
7.6KB

  1. /**
  2. * Copyright (C) 2010 Mans Rullgard
  3. *
  4. * This file is part of FFmpeg.
  5. *
  6. * FFmpeg is free software; you can redistribute it and/or
  7. * modify it under the terms of the GNU Lesser General Public
  8. * License as published by the Free Software Foundation; either
  9. * version 2.1 of the License, or (at your option) any later version.
  10. *
  11. * FFmpeg is distributed in the hope that it will be useful,
  12. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  13. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  14. * Lesser General Public License for more details.
  15. *
  16. * You should have received a copy of the GNU Lesser General Public
  17. * License along with FFmpeg; if not, write to the Free Software
  18. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  19. */
  20. #include "asm.S"
  21. .syntax unified
  @ rac_get_prob: shift the coder state by a caller-supplied count, refill
  @ the code word when needed, and decode one bit against probability pr.
  @   h    in/out  range value; on exit the split (LT) or (h << shift) - split (GE)
  @   bs   in/out  bit counter; shift is added, 16 is subtracted after a refill
  @   buf  in/out  input pointer; post-incremented by 2 on a refill
  @   cw   in/out  code word
  @   pr   in      probability; the multiply uses its bottom halfword
  @   t0   in/out  in: shift count, out: h << shift
  @   t1   scratch receives the refill halfword
  @ split = (256 - pr + lo16(h << shift) * lo16(pr)) >> 8
  @ On exit the flags are those of the final cmp (signed): GE means the split
  @ was subtracted from cw, LT means cw was left alone. The call sites in this
  @ file branch or predicate on GE/LT right after the macro.
  @ NOTE(review): the refill is keyed on the carry out of the bs update, so bs
  @ is presumably kept negative while buffered bits remain - confirm against
  @ the C range coder.
  22. .macro rac_get_prob h, bs, buf, cw, pr, t0, t1
  23. adds \bs, \bs, \t0 @ bs += shift; carry set selects the refill path
  24. lsl \cw, \cw, \t0 @ cw <<= shift
  25. lsl \t0, \h, \t0 @ t0 = h << shift
  26. rsb \h, \pr, #256 @ h = 256 - pr
  27. ldrhcs \t1, [\buf], #2 @ refill: fetch one halfword, advance buf by 2
  28. smlabb \h, \t0, \pr, \h @ h += lo16(t0) * lo16(pr)
  29. rev16cs \t1, \t1 @ refill: swap the two bytes of the halfword
  30. orrcs \cw, \cw, \t1, lsl \bs @ refill: merge the new bits into cw at position bs
  31. subcs \bs, \bs, #16 @ refill: account for the 16 bits just added
  32. lsr \h, \h, #8 @ h = split
  33. cmp \cw, \h, lsl #16 @ compare cw with split << 16; flags stay live past the macro
  34. subge \cw, \cw, \h, lsl #16 @ GE: remove the split from cw
  35. subge \h, \t0, \h @ GE: h = (h << shift) - split
  36. .endm
  @ rac_get_128: same sequence as rac_get_prob with the probability fixed at
  @ 128, so the multiply becomes a shift and no pr argument is needed.
  @   h    in/out  range value; on exit the split (LT) or (h << shift) - split (GE)
  @   bs   in/out  bit counter; shift is added, 16 is subtracted after a refill
  @   buf  in/out  input pointer; post-incremented by 2 on a refill
  @   cw   in/out  code word
  @   t0   in/out  in: shift count, out: h << shift
  @   t1   scratch receives the refill halfword
  @ split = (128 + ((h << shift) << 7)) >> 8
  @ On exit the flags are those of the final cmp (signed): GE means the split
  @ was subtracted from cw, LT means cw was left alone.
  37. .macro rac_get_128 h, bs, buf, cw, t0, t1
  38. adds \bs, \bs, \t0 @ bs += shift; carry set selects the refill path
  39. lsl \cw, \cw, \t0 @ cw <<= shift
  40. lsl \t0, \h, \t0 @ t0 = h << shift
  41. ldrhcs \t1, [\buf], #2 @ refill: fetch one halfword, advance buf by 2
  42. mov \h, #128 @ 256 - 128
  43. rev16cs \t1, \t1 @ refill: swap the two bytes of the halfword
  44. add \h, \h, \t0, lsl #7 @ h = 128 + t0 * 128
  45. orrcs \cw, \cw, \t1, lsl \bs @ refill: merge the new bits into cw at position bs
  46. subcs \bs, \bs, #16 @ refill: account for the 16 bits just added
  47. lsr \h, \h, #8 @ h = split
  48. cmp \cw, \h, lsl #16 @ compare cw with split << 16; flags stay live past the macro
  49. subge \cw, \cw, \h, lsl #16 @ GE: remove the split from cw
  50. subge \h, \t0, \h @ GE: h = (h << shift) - split
  51. .endm
  @ ff_decode_block_coeffs_armv6
  @
  @ Decodes coefficient values with the range coder macros above and stores
  @ them as halfwords at r1 + zigzag_scan[index], until a stop bit is decoded
  @ or the index reaches 16.
  @
  @ Register arguments, as used by the code below:
  @   r0  pointer to the coder state: words at +0, +4, +8 are high, bits, buf;
  @       the word at +12 is the upper limit applied to buf on exit
  @       (presumably the end of the input - confirm); +16 is code_word
  @   r1  base address for the coefficient stores
  @   r2  base of the probability bytes; after each coefficient r4 is rebuilt
  @       as r2 + 33*r3 + 0, 11 or 22 depending on the value just decoded
  @   r3  starting index
  @ Stack arguments (found at sp+44 once the 11 registers are pushed):
  @   token_prob  initial probability pointer (r4)
  @   qmul        pointer to one word holding two 16-bit factors
  @ Returns the final index in r0 and writes high, bits, buf and code_word
  @ back to the state.
  @
  @ Register roles inside the loop:
  @   r3 index            r4 probability pointer   r5 high      r6 bits
  @   r7 buf              r8 code_word             r9 shift count / scratch
  @   r10 scratch         r11 packed factors (the bottom halfword is in use)
  @   r12 coefficient value                        lr ff_vp56_norm_shift
  @ After every macro use, GE/LT is the decoded decision; the ldrb, mov-free
  @ loads and stores placed between a macro and its consumer do not touch
  @ the flags.
  @ The numeric labels 1, 2 and 3 are each defined twice; every f/b reference
  @ binds to the nearest definition in that direction.
  52. function ff_decode_block_coeffs_armv6, export=1
  53. push {r0,r1,r4-r11,lr} @ 44 bytes; saved r0 sits at sp+0, saved r1 at sp+4
  54. movrel lr, X(ff_vp56_norm_shift)
  55. ldrd r4, r5, [sp, #44] @ token_prob, qmul
  56. cmp r3, #0 @ flags are consumed by pkhtbne below
  57. ldr r11, [r5] @ r11 = both 16-bit factors
  58. ldm r0, {r5-r7} @ high, bits, buf
  59. pkhtbne r11, r11, r11, asr #16 @ nonzero start index: copy the top factor into the bottom half
  60. ldr r8, [r0, #16] @ code_word
  61. 0:
  62. ldrb r9, [lr, r5] @ shift = ff_vp56_norm_shift[high]
  63. add r3, r3, #1 @ index is pre-incremented, hence the zigzag_scan-1 base later
  64. ldrb r0, [r4, #1]
  65. rac_get_prob r5, r6, r7, r8, r0, r9, r10
  66. blt 2f @ LT: nothing is stored for this index
  67. ldrb r9, [lr, r5]
  68. ldrb r0, [r4, #2]
  69. rac_get_prob r5, r6, r7, r8, r0, r9, r10
  70. ldrb r9, [lr, r5] @ shift for the next decode
  71. bge 3f @ GE: value is 2 or more
  72. add r4, r3, r3, lsl #5 @ r4 = 33 * r3
  73. sxth r12, r11 @ value 1 times the bottom factor
  74. add r4, r2, r4
  75. adds r6, r6, r9 @ from here to the second subge: rac_get_128 written out inline
  76. add r4, r4, #11 @ r4 = r2 + 33*r3 + 11
  77. lsl r8, r8, r9
  78. ldrhcs r10, [r7], #2
  79. lsl r9, r5, r9
  80. mov r5, #128
  81. rev16cs r10, r10
  82. add r5, r5, r9, lsl #7
  83. orrcs r8, r8, r10, lsl r6
  84. subcs r6, r6, #16
  85. lsr r5, r5, #8
  86. cmp r8, r5, lsl #16
  87. movrel r10, zigzag_scan-1 @ NOTE(review): relies on movrel from asm.S leaving the flags alone
  88. subge r8, r8, r5, lsl #16
  89. subge r5, r9, r5
  90. ldrb r10, [r10, r3] @ byte offset for this index
  91. rsbge r12, r12, #0 @ GE from the inline decode: negate the value
  92. cmp r3, #16
  93. strh r12, [r1, r10]
  94. bge 6f @ index reached 16: finish
  95. 5:
  96. ldrb r9, [lr, r5]
  97. ldrb r0, [r4]
  98. rac_get_prob r5, r6, r7, r8, r0, r9, r10
  99. pkhtb r11, r11, r11, asr #16 @ from now on the bottom factor equals the top factor
  100. bge 0b @ GE: decode another value; LT falls through to the exit
  101. 6:
  102. ldr r0, [sp] @ reload the saved state pointer
  103. ldr r9, [r0, #12]
  104. cmp r7, r9
  105. movhi r7, r9 @ unsigned clamp of buf to the word at +12
  106. stm r0, {r5-r7} @ high, bits, buf
  107. str r8, [r0, #16] @ code_word
  108. add sp, sp, #8 @ drop the saved r0 and r1
  109. mov r0, r3 @ return the index
  110. pop {r4-r11,pc}
  111. 2:
  112. add r4, r3, r3, lsl #5
  113. cmp r3, #16
  114. add r4, r2, r4 @ r4 = r2 + 33*r3 + 0
  115. pkhtb r11, r11, r11, asr #16
  116. bne 0b @ label 0 starts at r4[1], so r4[0] is not tested on this path
  117. b 6b
  118. 3:
  119. ldrb r0, [r4, #3]
  120. rac_get_prob r5, r6, r7, r8, r0, r9, r10
  121. ldrb r9, [lr, r5]
  122. bge 1f @ GE: value is 5 or more
  123. mov r12, #2
  124. ldrb r0, [r4, #4]
  125. rac_get_prob r5, r6, r7, r8, r0, r9, r10
  126. addge r12, #1
  127. ldrb r9, [lr, r5]
  128. blt 4f @ LT: value 2
  129. ldrb r0, [r4, #5]
  130. rac_get_prob r5, r6, r7, r8, r0, r9, r10
  131. addge r12, #1 @ value 3 or 4
  132. ldrb r9, [lr, r5]
  133. b 4f
  134. 1:
  135. ldrb r0, [r4, #6]
  136. rac_get_prob r5, r6, r7, r8, r0, r9, r10
  137. ldrb r9, [lr, r5]
  138. bge 3f @ GE: value is built from ff_vp8_dct_cat_prob
  139. ldrb r0, [r4, #7]
  140. rac_get_prob r5, r6, r7, r8, r0, r9, r10
  141. ldrb r9, [lr, r5]
  142. bge 2f
  143. mov r12, #5
  144. mov r0, #159 @ fixed probability for the extra bit
  145. rac_get_prob r5, r6, r7, r8, r0, r9, r10
  146. addge r12, r12, #1 @ value 5 or 6
  147. ldrb r9, [lr, r5]
  148. b 4f
  149. 2:
  150. mov r12, #7
  151. mov r0, #165 @ fixed probability for the first extra bit
  152. rac_get_prob r5, r6, r7, r8, r0, r9, r10
  153. addge r12, r12, #2
  154. ldrb r9, [lr, r5]
  155. mov r0, #145 @ fixed probability for the second extra bit
  156. rac_get_prob r5, r6, r7, r8, r0, r9, r10
  157. addge r12, r12, #1 @ value 7 to 10
  158. ldrb r9, [lr, r5]
  159. b 4f
  160. 3:
  161. ldrb r0, [r4, #8]
  162. rac_get_prob r5, r6, r7, r8, r0, r9, r10
  163. addge r4, r4, #1 @ GE: the next probability is read one byte further on
  164. ldrb r9, [lr, r5]
  165. movge r12, #2
  166. movlt r12, #0
  167. ldrb r0, [r4, #9]
  168. rac_get_prob r5, r6, r7, r8, r0, r9, r10
  169. mov r9, #8
  170. addge r12, r12, #1 @ r12 = table index 0 to 3
  171. movrel r4, X(ff_vp8_dct_cat_prob)
  172. lsl r9, r9, r12 @ 8 << index
  173. ldr r4, [r4, r12, lsl #2] @ word number r12 of the table, used below as a byte pointer
  174. add r12, r9, #3 @ base value 11, 19, 35 or 67
  175. mov r1, #0 @ r1 is borrowed as the bit accumulator; reloaded from the stack below
  176. ldrb r0, [r4], #1
  177. 1:
  178. ldrb r9, [lr, r5]
  179. lsl r1, r1, #1
  180. rac_get_prob r5, r6, r7, r8, r0, r9, r10
  181. ldrb r0, [r4], #1 @ fetch the next probability
  182. addge r1, r1, #1
  183. cmp r0, #0 @ a zero byte ends the probability list
  184. bne 1b
  185. ldrb r9, [lr, r5]
  186. add r12, r12, r1 @ value = base + decoded bits
  187. ldr r1, [sp, #4] @ restore r1 from the pushed copy
  188. 4:
  189. add r4, r3, r3, lsl #5
  190. add r4, r2, r4
  191. add r4, r4, #22 @ r4 = r2 + 33*r3 + 22
  192. rac_get_128 r5, r6, r7, r8, r9, r10
  193. rsbge r12, r12, #0 @ GE: negate the value
  194. smulbb r12, r12, r11 @ multiply by the bottom factor
  195. movrel r9, zigzag_scan-1
  196. ldrb r9, [r9, r3] @ byte offset for this index
  197. cmp r3, #16
  198. strh r12, [r1, r9]
  199. bge 6b @ index reached 16: finish
  200. b 5b
  201. endfunc
  @ zigzag_scan: 16 byte offsets used by the strh stores in
  @ ff_decode_block_coeffs_armv6. The function addresses the table as
  @ zigzag_scan-1 plus its pre-incremented index. Every entry is even,
  @ matching the 2-byte stores; halved, the entries read
  @ 0 1 4 8 5 2 3 6 9 12 13 10 7 11 14 15.
  202. .section .rodata
  203. zigzag_scan:
  204. .byte 0, 2, 8, 16
  205. .byte 10, 4, 6, 12
  206. .byte 18, 24, 26, 20
  207. .byte 14, 22, 28, 30