You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

337 lines
19KB

  1. /*
  2. * Copyright (c) 2015 Parag Salasakar (Parag.Salasakar@imgtec.com)
  3. *
  4. * This file is part of FFmpeg.
  5. *
  6. * FFmpeg is free software; you can redistribute it and/or
  7. * modify it under the terms of the GNU Lesser General Public
  8. * License as published by the Free Software Foundation; either
  9. * version 2.1 of the License, or (at your option) any later version.
  10. *
  11. * FFmpeg is distributed in the hope that it will be useful,
  12. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  13. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  14. * Lesser General Public License for more details.
  15. *
  16. * You should have received a copy of the GNU Lesser General Public
  17. * License along with FFmpeg; if not, write to the Free Software
  18. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  19. */
  20. #ifndef H264_DSP_MIPS_H
  21. #define H264_DSP_MIPS_H
  22. #include "libavcodec/h264.h"
  /*
   * Seven prototypes that share the parameter list
   * (src, stride, alpha, beta, tc0) and return void. Only declarations
   * appear in this header; the bodies are defined elsewhere.
   *
   * NOTE(review): the first four spell stride, alpha and beta as plain int,
   * while the chroma422 and mbaff ones spell them as int32_t. Presumably the
   * two are the same type on the intended targets; confirm against the
   * definitions.
   * NOTE(review): judging by the names only, "h" and "v" select the filter
   * direction and tc0 is a per-edge clipping table; verify in the
   * implementation before relying on this.
   */
  23. void ff_h264_h_lpf_luma_inter_msa(uint8_t *src, int stride,
  24. int alpha, int beta, int8_t *tc0);
  25. void ff_h264_v_lpf_luma_inter_msa(uint8_t *src, int stride,
  26. int alpha, int beta, int8_t *tc0);
  27. void ff_h264_h_lpf_chroma_inter_msa(uint8_t *src, int stride,
  28. int alpha, int beta, int8_t *tc0);
  29. void ff_h264_v_lpf_chroma_inter_msa(uint8_t *src, int stride,
  30. int alpha, int beta, int8_t *tc0);
  31. void ff_h264_h_loop_filter_chroma422_msa(uint8_t *src, int32_t stride,
  32. int32_t alpha, int32_t beta,
  33. int8_t *tc0);
  34. void ff_h264_h_loop_filter_chroma422_mbaff_msa(uint8_t *src, int32_t stride,
  35. int32_t alpha, int32_t beta,
  36. int8_t *tc0);
  37. void ff_h264_h_loop_filter_luma_mbaff_msa(uint8_t *src, int32_t stride,
  38. int32_t alpha, int32_t beta,
  39. int8_t *tc0);
  /*
   * Ten prototypes whose names contain "idct"; all return void and take
   * int16_t coefficient pointers. Bodies are defined elsewhere.
   *
   * Points visible in the signatures:
   *  - The add16, add16_intra, add8, add8_422 and idct8_add4 variants take a
   *    const blk_offset pointer and a trailing nnzc parameter. nnzc is
   *    written as an array of 15 * 8 bytes, but as a C function parameter it
   *    is an ordinary const uint8_t pointer; the size is not enforced.
   *  - ff_h264_idct_add8_msa and ff_h264_idct_add8_422_msa take
   *    "uint8_t **dst" (pointer to pointer); every other prototype here takes
   *    a single "uint8_t *dst" or "int16_t *dst".
   *  - ff_h264_deq_idct_luma_dc_msa writes to an int16_t destination and
   *    takes de_q_val instead of a stride.
   *
   * NOTE(review): ff_h264_idct8_add4_msa spells blk_offset and dst_stride
   * with plain int while its siblings use int32_t; confirm this matches the
   * definition.
   */
  40. void ff_h264_idct_add_msa(uint8_t *dst, int16_t *src, int32_t dst_stride);
  41. void ff_h264_idct4x4_addblk_dc_msa(uint8_t *dst, int16_t *src,
  42. int32_t dst_stride);
  43. void ff_h264_deq_idct_luma_dc_msa(int16_t *dst, int16_t *src,
  44. int32_t de_q_val);
  45. void ff_h264_idct_add16_msa(uint8_t *dst, const int32_t *blk_offset,
  46. int16_t *block, int32_t stride,
  47. const uint8_t nnzc[15 * 8]);
  48. void ff_h264_idct_add16_intra_msa(uint8_t *dst, const int32_t *blk_offset,
  49. int16_t *block, int32_t dst_stride,
  50. const uint8_t nnzc[15 * 8]);
  51. void ff_h264_idct_add8_msa(uint8_t **dst, const int32_t *blk_offset,
  52. int16_t *block, int32_t dst_stride,
  53. const uint8_t nnzc[15 * 8]);
  54. void ff_h264_idct_add8_422_msa(uint8_t **dst, const int32_t *blk_offset,
  55. int16_t *block, int32_t dst_stride,
  56. const uint8_t nnzc[15 * 8]);
  57. void ff_h264_idct8_addblk_msa(uint8_t *dst, int16_t *src, int32_t dst_stride);
  58. void ff_h264_idct8_dc_addblk_msa(uint8_t *dst, int16_t *src,
  59. int32_t dst_stride);
  60. void ff_h264_idct8_add4_msa(uint8_t *dst, const int *blk_offset,
  61. int16_t *blk, int dst_stride,
  62. const uint8_t nnzc[15 * 8]);
  /*
   * Five "intra" prototypes taking (src, stride, alpha, beta) and returning
   * void. Unlike the "inter" declarations in this header they have no tc0
   * parameter. src is a non-const pointer.
   * NOTE(review): the non-const src suggests the buffer is modified in
   * place; confirm in the implementation.
   */
  63. void ff_h264_h_lpf_luma_intra_msa(uint8_t *src, int stride,
  64. int alpha, int beta);
  65. void ff_h264_v_lpf_luma_intra_msa(uint8_t *src, int stride,
  66. int alpha, int beta);
  67. void ff_h264_h_lpf_chroma_intra_msa(uint8_t *src, int stride,
  68. int alpha, int beta);
  69. void ff_h264_v_lpf_chroma_intra_msa(uint8_t *src, int stride,
  70. int alpha, int beta);
  71. void ff_h264_h_loop_filter_luma_mbaff_intra_msa(uint8_t *src, int stride,
  72. int alpha, int beta);
  /*
   * Weight and biweight prototypes with the _msa suffix, declared for the
   * size tags 16, 8 and 4.
   *
   *  - biweight: takes two pixel pointers (dst, src) and two weights
   *    (weightd, weights), plus stride, height, log2_denom and offset.
   *  - weight: takes a single pixel pointer (src) and a single weight, plus
   *    stride, height, log2_denom and offset.
   *
   * NOTE(review): the "_8" in each name presumably denotes 8-bit samples,
   * and weightd/weights presumably apply to dst and src respectively; verify
   * against the implementation.
   */
  73. void ff_biweight_h264_pixels16_8_msa(uint8_t *dst, uint8_t *src,
  74. int stride, int height, int log2_denom,
  75. int weightd, int weights, int offset);
  76. void ff_biweight_h264_pixels8_8_msa(uint8_t *dst, uint8_t *src,
  77. int stride, int height, int log2_denom,
  78. int weightd, int weights, int offset);
  79. void ff_biweight_h264_pixels4_8_msa(uint8_t *dst, uint8_t *src,
  80. int stride, int height, int log2_denom,
  81. int weightd, int weights, int offset);
  82. void ff_weight_h264_pixels16_8_msa(uint8_t *src, int stride, int height,
  83. int log2_denom, int weight, int offset);
  84. void ff_weight_h264_pixels8_8_msa(uint8_t *src, int stride, int height,
  85. int log2_denom, int weight, int offset);
  86. void ff_weight_h264_pixels4_8_msa(uint8_t *src, int stride, int height,
  87. int log2_denom, int weight, int offset);
  /*
   * 48 "put" prototypes: three size tags (qpel16, qpel8, qpel4) times
   * sixteen mcXY suffixes, with X and Y each running from 0 to 3.
   * Every one has the identical signature
   *     void f(uint8_t *dst, const uint8_t *src, ptrdiff_t dst_stride);
   * so src is read-only and dst is writable.
   *
   * NOTE(review): mcXY presumably encodes the quarter-sample offset in x and
   * y; this is inferred from the naming, not from code visible here.
   * NOTE(review): only one stride is declared and it is named dst_stride;
   * whether src is walked with the same stride cannot be told from this
   * header, so check the implementation.
   */
  88. void ff_put_h264_qpel16_mc00_msa(uint8_t *dst, const uint8_t *src,
  89. ptrdiff_t dst_stride);
  90. void ff_put_h264_qpel16_mc10_msa(uint8_t *dst, const uint8_t *src,
  91. ptrdiff_t dst_stride);
  92. void ff_put_h264_qpel16_mc20_msa(uint8_t *dst, const uint8_t *src,
  93. ptrdiff_t dst_stride);
  94. void ff_put_h264_qpel16_mc30_msa(uint8_t *dst, const uint8_t *src,
  95. ptrdiff_t dst_stride);
  96. void ff_put_h264_qpel16_mc01_msa(uint8_t *dst, const uint8_t *src,
  97. ptrdiff_t dst_stride);
  98. void ff_put_h264_qpel16_mc11_msa(uint8_t *dst, const uint8_t *src,
  99. ptrdiff_t dst_stride);
  100. void ff_put_h264_qpel16_mc21_msa(uint8_t *dst, const uint8_t *src,
  101. ptrdiff_t dst_stride);
  102. void ff_put_h264_qpel16_mc31_msa(uint8_t *dst, const uint8_t *src,
  103. ptrdiff_t dst_stride);
  104. void ff_put_h264_qpel16_mc02_msa(uint8_t *dst, const uint8_t *src,
  105. ptrdiff_t dst_stride);
  106. void ff_put_h264_qpel16_mc12_msa(uint8_t *dst, const uint8_t *src,
  107. ptrdiff_t dst_stride);
  108. void ff_put_h264_qpel16_mc22_msa(uint8_t *dst, const uint8_t *src,
  109. ptrdiff_t dst_stride);
  110. void ff_put_h264_qpel16_mc32_msa(uint8_t *dst, const uint8_t *src,
  111. ptrdiff_t dst_stride);
  112. void ff_put_h264_qpel16_mc03_msa(uint8_t *dst, const uint8_t *src,
  113. ptrdiff_t dst_stride);
  114. void ff_put_h264_qpel16_mc13_msa(uint8_t *dst, const uint8_t *src,
  115. ptrdiff_t dst_stride);
  116. void ff_put_h264_qpel16_mc23_msa(uint8_t *dst, const uint8_t *src,
  117. ptrdiff_t dst_stride);
  118. void ff_put_h264_qpel16_mc33_msa(uint8_t *dst, const uint8_t *src,
  119. ptrdiff_t dst_stride);
  120. void ff_put_h264_qpel8_mc00_msa(uint8_t *dst, const uint8_t *src,
  121. ptrdiff_t dst_stride);
  122. void ff_put_h264_qpel8_mc10_msa(uint8_t *dst, const uint8_t *src,
  123. ptrdiff_t dst_stride);
  124. void ff_put_h264_qpel8_mc20_msa(uint8_t *dst, const uint8_t *src,
  125. ptrdiff_t dst_stride);
  126. void ff_put_h264_qpel8_mc30_msa(uint8_t *dst, const uint8_t *src,
  127. ptrdiff_t dst_stride);
  128. void ff_put_h264_qpel8_mc01_msa(uint8_t *dst, const uint8_t *src,
  129. ptrdiff_t dst_stride);
  130. void ff_put_h264_qpel8_mc11_msa(uint8_t *dst, const uint8_t *src,
  131. ptrdiff_t dst_stride);
  132. void ff_put_h264_qpel8_mc21_msa(uint8_t *dst, const uint8_t *src,
  133. ptrdiff_t dst_stride);
  134. void ff_put_h264_qpel8_mc31_msa(uint8_t *dst, const uint8_t *src,
  135. ptrdiff_t dst_stride);
  136. void ff_put_h264_qpel8_mc02_msa(uint8_t *dst, const uint8_t *src,
  137. ptrdiff_t dst_stride);
  138. void ff_put_h264_qpel8_mc12_msa(uint8_t *dst, const uint8_t *src,
  139. ptrdiff_t dst_stride);
  140. void ff_put_h264_qpel8_mc22_msa(uint8_t *dst, const uint8_t *src,
  141. ptrdiff_t dst_stride);
  142. void ff_put_h264_qpel8_mc32_msa(uint8_t *dst, const uint8_t *src,
  143. ptrdiff_t dst_stride);
  144. void ff_put_h264_qpel8_mc03_msa(uint8_t *dst, const uint8_t *src,
  145. ptrdiff_t dst_stride);
  146. void ff_put_h264_qpel8_mc13_msa(uint8_t *dst, const uint8_t *src,
  147. ptrdiff_t dst_stride);
  148. void ff_put_h264_qpel8_mc23_msa(uint8_t *dst, const uint8_t *src,
  149. ptrdiff_t dst_stride);
  150. void ff_put_h264_qpel8_mc33_msa(uint8_t *dst, const uint8_t *src,
  151. ptrdiff_t dst_stride);
  152. void ff_put_h264_qpel4_mc00_msa(uint8_t *dst, const uint8_t *src,
  153. ptrdiff_t dst_stride);
  154. void ff_put_h264_qpel4_mc10_msa(uint8_t *dst, const uint8_t *src,
  155. ptrdiff_t dst_stride);
  156. void ff_put_h264_qpel4_mc20_msa(uint8_t *dst, const uint8_t *src,
  157. ptrdiff_t dst_stride);
  158. void ff_put_h264_qpel4_mc30_msa(uint8_t *dst, const uint8_t *src,
  159. ptrdiff_t dst_stride);
  160. void ff_put_h264_qpel4_mc01_msa(uint8_t *dst, const uint8_t *src,
  161. ptrdiff_t dst_stride);
  162. void ff_put_h264_qpel4_mc11_msa(uint8_t *dst, const uint8_t *src,
  163. ptrdiff_t dst_stride);
  164. void ff_put_h264_qpel4_mc21_msa(uint8_t *dst, const uint8_t *src,
  165. ptrdiff_t dst_stride);
  166. void ff_put_h264_qpel4_mc31_msa(uint8_t *dst, const uint8_t *src,
  167. ptrdiff_t dst_stride);
  168. void ff_put_h264_qpel4_mc02_msa(uint8_t *dst, const uint8_t *src,
  169. ptrdiff_t dst_stride);
  170. void ff_put_h264_qpel4_mc12_msa(uint8_t *dst, const uint8_t *src,
  171. ptrdiff_t dst_stride);
  172. void ff_put_h264_qpel4_mc22_msa(uint8_t *dst, const uint8_t *src,
  173. ptrdiff_t dst_stride);
  174. void ff_put_h264_qpel4_mc32_msa(uint8_t *dst, const uint8_t *src,
  175. ptrdiff_t dst_stride);
  176. void ff_put_h264_qpel4_mc03_msa(uint8_t *dst, const uint8_t *src,
  177. ptrdiff_t dst_stride);
  178. void ff_put_h264_qpel4_mc13_msa(uint8_t *dst, const uint8_t *src,
  179. ptrdiff_t dst_stride);
  180. void ff_put_h264_qpel4_mc23_msa(uint8_t *dst, const uint8_t *src,
  181. ptrdiff_t dst_stride);
  182. void ff_put_h264_qpel4_mc33_msa(uint8_t *dst, const uint8_t *src,
  183. ptrdiff_t dst_stride);
  /*
   * 48 "avg" prototypes: three size tags (qpel16, qpel8, qpel4) times
   * sixteen mcXY suffixes, with X and Y each running from 0 to 3.
   * Every one has the identical signature
   *     void f(uint8_t *dst, const uint8_t *src, ptrdiff_t dst_stride);
   * which is also the signature of the ff_put_h264_qpel* declarations.
   *
   * NOTE(review): "avg" presumably means the result is averaged with the
   * existing contents of dst rather than overwriting it; this is inferred
   * from the name and must be confirmed in the implementation.
   * NOTE(review): only one stride is declared and it is named dst_stride;
   * how src is strided cannot be told from this header.
   */
  184. void ff_avg_h264_qpel16_mc00_msa(uint8_t *dst, const uint8_t *src,
  185. ptrdiff_t dst_stride);
  186. void ff_avg_h264_qpel16_mc10_msa(uint8_t *dst, const uint8_t *src,
  187. ptrdiff_t dst_stride);
  188. void ff_avg_h264_qpel16_mc20_msa(uint8_t *dst, const uint8_t *src,
  189. ptrdiff_t dst_stride);
  190. void ff_avg_h264_qpel16_mc30_msa(uint8_t *dst, const uint8_t *src,
  191. ptrdiff_t dst_stride);
  192. void ff_avg_h264_qpel16_mc01_msa(uint8_t *dst, const uint8_t *src,
  193. ptrdiff_t dst_stride);
  194. void ff_avg_h264_qpel16_mc11_msa(uint8_t *dst, const uint8_t *src,
  195. ptrdiff_t dst_stride);
  196. void ff_avg_h264_qpel16_mc21_msa(uint8_t *dst, const uint8_t *src,
  197. ptrdiff_t dst_stride);
  198. void ff_avg_h264_qpel16_mc31_msa(uint8_t *dst, const uint8_t *src,
  199. ptrdiff_t dst_stride);
  200. void ff_avg_h264_qpel16_mc02_msa(uint8_t *dst, const uint8_t *src,
  201. ptrdiff_t dst_stride);
  202. void ff_avg_h264_qpel16_mc12_msa(uint8_t *dst, const uint8_t *src,
  203. ptrdiff_t dst_stride);
  204. void ff_avg_h264_qpel16_mc22_msa(uint8_t *dst, const uint8_t *src,
  205. ptrdiff_t dst_stride);
  206. void ff_avg_h264_qpel16_mc32_msa(uint8_t *dst, const uint8_t *src,
  207. ptrdiff_t dst_stride);
  208. void ff_avg_h264_qpel16_mc03_msa(uint8_t *dst, const uint8_t *src,
  209. ptrdiff_t dst_stride);
  210. void ff_avg_h264_qpel16_mc13_msa(uint8_t *dst, const uint8_t *src,
  211. ptrdiff_t dst_stride);
  212. void ff_avg_h264_qpel16_mc23_msa(uint8_t *dst, const uint8_t *src,
  213. ptrdiff_t dst_stride);
  214. void ff_avg_h264_qpel16_mc33_msa(uint8_t *dst, const uint8_t *src,
  215. ptrdiff_t dst_stride);
  216. void ff_avg_h264_qpel8_mc00_msa(uint8_t *dst, const uint8_t *src,
  217. ptrdiff_t dst_stride);
  218. void ff_avg_h264_qpel8_mc10_msa(uint8_t *dst, const uint8_t *src,
  219. ptrdiff_t dst_stride);
  220. void ff_avg_h264_qpel8_mc20_msa(uint8_t *dst, const uint8_t *src,
  221. ptrdiff_t dst_stride);
  222. void ff_avg_h264_qpel8_mc30_msa(uint8_t *dst, const uint8_t *src,
  223. ptrdiff_t dst_stride);
  224. void ff_avg_h264_qpel8_mc01_msa(uint8_t *dst, const uint8_t *src,
  225. ptrdiff_t dst_stride);
  226. void ff_avg_h264_qpel8_mc11_msa(uint8_t *dst, const uint8_t *src,
  227. ptrdiff_t dst_stride);
  228. void ff_avg_h264_qpel8_mc21_msa(uint8_t *dst, const uint8_t *src,
  229. ptrdiff_t dst_stride);
  230. void ff_avg_h264_qpel8_mc31_msa(uint8_t *dst, const uint8_t *src,
  231. ptrdiff_t dst_stride);
  232. void ff_avg_h264_qpel8_mc02_msa(uint8_t *dst, const uint8_t *src,
  233. ptrdiff_t dst_stride);
  234. void ff_avg_h264_qpel8_mc12_msa(uint8_t *dst, const uint8_t *src,
  235. ptrdiff_t dst_stride);
  236. void ff_avg_h264_qpel8_mc22_msa(uint8_t *dst, const uint8_t *src,
  237. ptrdiff_t dst_stride);
  238. void ff_avg_h264_qpel8_mc32_msa(uint8_t *dst, const uint8_t *src,
  239. ptrdiff_t dst_stride);
  240. void ff_avg_h264_qpel8_mc03_msa(uint8_t *dst, const uint8_t *src,
  241. ptrdiff_t dst_stride);
  242. void ff_avg_h264_qpel8_mc13_msa(uint8_t *dst, const uint8_t *src,
  243. ptrdiff_t dst_stride);
  244. void ff_avg_h264_qpel8_mc23_msa(uint8_t *dst, const uint8_t *src,
  245. ptrdiff_t dst_stride);
  246. void ff_avg_h264_qpel8_mc33_msa(uint8_t *dst, const uint8_t *src,
  247. ptrdiff_t dst_stride);
  248. void ff_avg_h264_qpel4_mc00_msa(uint8_t *dst, const uint8_t *src,
  249. ptrdiff_t dst_stride);
  250. void ff_avg_h264_qpel4_mc10_msa(uint8_t *dst, const uint8_t *src,
  251. ptrdiff_t dst_stride);
  252. void ff_avg_h264_qpel4_mc20_msa(uint8_t *dst, const uint8_t *src,
  253. ptrdiff_t dst_stride);
  254. void ff_avg_h264_qpel4_mc30_msa(uint8_t *dst, const uint8_t *src,
  255. ptrdiff_t dst_stride);
  256. void ff_avg_h264_qpel4_mc01_msa(uint8_t *dst, const uint8_t *src,
  257. ptrdiff_t dst_stride);
  258. void ff_avg_h264_qpel4_mc11_msa(uint8_t *dst, const uint8_t *src,
  259. ptrdiff_t dst_stride);
  260. void ff_avg_h264_qpel4_mc21_msa(uint8_t *dst, const uint8_t *src,
  261. ptrdiff_t dst_stride);
  262. void ff_avg_h264_qpel4_mc31_msa(uint8_t *dst, const uint8_t *src,
  263. ptrdiff_t dst_stride);
  264. void ff_avg_h264_qpel4_mc02_msa(uint8_t *dst, const uint8_t *src,
  265. ptrdiff_t dst_stride);
  266. void ff_avg_h264_qpel4_mc12_msa(uint8_t *dst, const uint8_t *src,
  267. ptrdiff_t dst_stride);
  268. void ff_avg_h264_qpel4_mc22_msa(uint8_t *dst, const uint8_t *src,
  269. ptrdiff_t dst_stride);
  270. void ff_avg_h264_qpel4_mc32_msa(uint8_t *dst, const uint8_t *src,
  271. ptrdiff_t dst_stride);
  272. void ff_avg_h264_qpel4_mc03_msa(uint8_t *dst, const uint8_t *src,
  273. ptrdiff_t dst_stride);
  274. void ff_avg_h264_qpel4_mc13_msa(uint8_t *dst, const uint8_t *src,
  275. ptrdiff_t dst_stride);
  276. void ff_avg_h264_qpel4_mc23_msa(uint8_t *dst, const uint8_t *src,
  277. ptrdiff_t dst_stride);
  278. void ff_avg_h264_qpel4_mc33_msa(uint8_t *dst, const uint8_t *src,
  279. ptrdiff_t dst_stride);
  /*
   * Prediction prototypes with the _msa suffix. All 22 share the signature
   *     void f(uint8_t *src, ptrdiff_t stride);
   * with a non-const src pointer. The names carry an 8x8 or 16x16 size tag.
   *
   * Two naming schemes appear side by side: ff_h264_intra_predict_* and
   * ff_h264_intra_pred_*. The last four declarations use an ff_vp8_ prefix
   * even though the include guard of this header is named for H.264.
   *
   * NOTE(review): the non-const src suggests the block is written in place
   * from neighbouring samples reachable through src and stride; confirm in
   * the implementation.
   */
  280. void ff_h264_intra_predict_plane_8x8_msa(uint8_t *src, ptrdiff_t stride);
  281. void ff_h264_intra_predict_dc_4blk_8x8_msa(uint8_t *src, ptrdiff_t stride);
  282. void ff_h264_intra_predict_hor_dc_8x8_msa(uint8_t *src, ptrdiff_t stride);
  283. void ff_h264_intra_predict_vert_dc_8x8_msa(uint8_t *src, ptrdiff_t stride);
  284. void ff_h264_intra_predict_mad_cow_dc_l0t_8x8_msa(uint8_t *src,
  285. ptrdiff_t stride);
  286. void ff_h264_intra_predict_mad_cow_dc_0lt_8x8_msa(uint8_t *src,
  287. ptrdiff_t stride);
  288. void ff_h264_intra_predict_mad_cow_dc_l00_8x8_msa(uint8_t *src,
  289. ptrdiff_t stride);
  290. void ff_h264_intra_predict_mad_cow_dc_0l0_8x8_msa(uint8_t *src,
  291. ptrdiff_t stride);
  292. void ff_h264_intra_predict_plane_16x16_msa(uint8_t *src, ptrdiff_t stride);
  293. void ff_h264_intra_pred_vert_8x8_msa(uint8_t *src, ptrdiff_t stride);
  294. void ff_h264_intra_pred_horiz_8x8_msa(uint8_t *src, ptrdiff_t stride);
  295. void ff_h264_intra_pred_dc_16x16_msa(uint8_t *src, ptrdiff_t stride);
  296. void ff_h264_intra_pred_vert_16x16_msa(uint8_t *src, ptrdiff_t stride);
  297. void ff_h264_intra_pred_horiz_16x16_msa(uint8_t *src, ptrdiff_t stride);
  298. void ff_h264_intra_pred_dc_left_16x16_msa(uint8_t *src, ptrdiff_t stride);
  299. void ff_h264_intra_pred_dc_top_16x16_msa(uint8_t *src, ptrdiff_t stride);
  300. void ff_h264_intra_pred_dc_128_8x8_msa(uint8_t *src, ptrdiff_t stride);
  301. void ff_h264_intra_pred_dc_128_16x16_msa(uint8_t *src, ptrdiff_t stride);
  302. void ff_vp8_pred8x8_127_dc_8_msa(uint8_t *src, ptrdiff_t stride);
  303. void ff_vp8_pred8x8_129_dc_8_msa(uint8_t *src, ptrdiff_t stride);
  304. void ff_vp8_pred16x16_127_dc_8_msa(uint8_t *src, ptrdiff_t stride);
  305. void ff_vp8_pred16x16_129_dc_8_msa(uint8_t *src, ptrdiff_t stride);
  /*
   * Weight and biweight prototypes with the _mmi suffix, for the size tags
   * 16, 8 and 4. Their parameter types match the _msa weight and biweight
   * declarations in this header: weight takes one pixel pointer and one
   * weight, biweight takes (dst, src) and (weightd, weights).
   *
   * Differences from the _msa siblings that are visible here:
   *  - the name order is ff_h264_weight_ and ff_h264_biweight_ rather than
   *    ff_weight_h264_ and ff_biweight_h264_;
   *  - the single pixel pointer of the weight functions is named block
   *    instead of src.
   * Take care not to mix the two spellings when wiring up function pointers.
   */
  306. void ff_h264_weight_pixels16_8_mmi(uint8_t *block, int stride, int height,
  307. int log2_denom, int weight, int offset);
  308. void ff_h264_biweight_pixels16_8_mmi(uint8_t *dst, uint8_t *src,
  309. int stride, int height, int log2_denom, int weightd, int weights,
  310. int offset);
  311. void ff_h264_weight_pixels8_8_mmi(uint8_t *block, int stride, int height,
  312. int log2_denom, int weight, int offset);
  313. void ff_h264_biweight_pixels8_8_mmi(uint8_t *dst, uint8_t *src,
  314. int stride, int height, int log2_denom, int weightd, int weights,
  315. int offset);
  316. void ff_h264_weight_pixels4_8_mmi(uint8_t *block, int stride, int height,
  317. int log2_denom, int weight, int offset);
  318. void ff_h264_biweight_pixels4_8_mmi(uint8_t *dst, uint8_t *src,
  319. int stride, int height, int log2_denom, int weightd, int weights,
  320. int offset);
  321. #endif // #ifndef H264_DSP_MIPS_H