You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

604 lines
22KB

  1. /*
  2. * H.26L/H.264/AVC/JVT/14496-10/... encoder/decoder
  3. * Copyright (c) 2003 Michael Niedermayer <michaelni@gmx.at>
  4. *
  5. * This file is part of FFmpeg.
  6. *
  7. * FFmpeg is free software; you can redistribute it and/or
  8. * modify it under the terms of the GNU Lesser General Public
  9. * License as published by the Free Software Foundation; either
  10. * version 2.1 of the License, or (at your option) any later version.
  11. *
  12. * FFmpeg is distributed in the hope that it will be useful,
  13. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  15. * Lesser General Public License for more details.
  16. *
  17. * You should have received a copy of the GNU Lesser General Public
  18. * License along with FFmpeg; if not, write to the Free Software
  19. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  20. */
  21. /**
  22. * @file
  23. * H.264 / AVC / MPEG-4 part10 prediction functions.
  24. * @author Michael Niedermayer <michaelni@gmx.at>
  25. */
  26. #include "libavutil/attributes.h"
  27. #include "libavutil/avassert.h"
  28. #include "libavutil/intreadwrite.h"
  29. #include "avcodec.h"
  30. #include "h264pred.h"
  31. #define BIT_DEPTH 8
  32. #include "h264pred_template.c"
  33. #undef BIT_DEPTH
  34. #define BIT_DEPTH 9
  35. #include "h264pred_template.c"
  36. #undef BIT_DEPTH
  37. #define BIT_DEPTH 10
  38. #include "h264pred_template.c"
  39. #undef BIT_DEPTH
  40. #define BIT_DEPTH 12
  41. #include "h264pred_template.c"
  42. #undef BIT_DEPTH
  43. #define BIT_DEPTH 14
  44. #include "h264pred_template.c"
  45. #undef BIT_DEPTH
  46. static void pred4x4_vertical_vp8_c(uint8_t *src, const uint8_t *topright,
  47. ptrdiff_t stride)
  48. {
  49. const unsigned lt = src[-1-1*stride];
  50. LOAD_TOP_EDGE
  51. LOAD_TOP_RIGHT_EDGE
  52. uint32_t v = PACK_4U8((lt + 2*t0 + t1 + 2) >> 2,
  53. (t0 + 2*t1 + t2 + 2) >> 2,
  54. (t1 + 2*t2 + t3 + 2) >> 2,
  55. (t2 + 2*t3 + t4 + 2) >> 2);
  56. AV_WN32A(src+0*stride, v);
  57. AV_WN32A(src+1*stride, v);
  58. AV_WN32A(src+2*stride, v);
  59. AV_WN32A(src+3*stride, v);
  60. }
  61. static void pred4x4_horizontal_vp8_c(uint8_t *src, const uint8_t *topright,
  62. ptrdiff_t stride)
  63. {
  64. const unsigned lt = src[-1-1*stride];
  65. LOAD_LEFT_EDGE
  66. AV_WN32A(src+0*stride, ((lt + 2*l0 + l1 + 2) >> 2)*0x01010101);
  67. AV_WN32A(src+1*stride, ((l0 + 2*l1 + l2 + 2) >> 2)*0x01010101);
  68. AV_WN32A(src+2*stride, ((l1 + 2*l2 + l3 + 2) >> 2)*0x01010101);
  69. AV_WN32A(src+3*stride, ((l2 + 2*l3 + l3 + 2) >> 2)*0x01010101);
  70. }
  71. static void pred4x4_down_left_svq3_c(uint8_t *src, const uint8_t *topright,
  72. ptrdiff_t stride)
  73. {
  74. LOAD_TOP_EDGE
  75. LOAD_LEFT_EDGE
  76. src[0+0*stride]=(l1 + t1)>>1;
  77. src[1+0*stride]=
  78. src[0+1*stride]=(l2 + t2)>>1;
  79. src[2+0*stride]=
  80. src[1+1*stride]=
  81. src[0+2*stride]=
  82. src[3+0*stride]=
  83. src[2+1*stride]=
  84. src[1+2*stride]=
  85. src[0+3*stride]=
  86. src[3+1*stride]=
  87. src[2+2*stride]=
  88. src[1+3*stride]=
  89. src[3+2*stride]=
  90. src[2+3*stride]=
  91. src[3+3*stride]=(l3 + t3)>>1;
  92. }
  93. static void pred4x4_down_left_rv40_c(uint8_t *src, const uint8_t *topright,
  94. ptrdiff_t stride)
  95. {
  96. LOAD_TOP_EDGE
  97. LOAD_TOP_RIGHT_EDGE
  98. LOAD_LEFT_EDGE
  99. LOAD_DOWN_LEFT_EDGE
  100. src[0+0*stride]=(t0 + t2 + 2*t1 + 2 + l0 + l2 + 2*l1 + 2)>>3;
  101. src[1+0*stride]=
  102. src[0+1*stride]=(t1 + t3 + 2*t2 + 2 + l1 + l3 + 2*l2 + 2)>>3;
  103. src[2+0*stride]=
  104. src[1+1*stride]=
  105. src[0+2*stride]=(t2 + t4 + 2*t3 + 2 + l2 + l4 + 2*l3 + 2)>>3;
  106. src[3+0*stride]=
  107. src[2+1*stride]=
  108. src[1+2*stride]=
  109. src[0+3*stride]=(t3 + t5 + 2*t4 + 2 + l3 + l5 + 2*l4 + 2)>>3;
  110. src[3+1*stride]=
  111. src[2+2*stride]=
  112. src[1+3*stride]=(t4 + t6 + 2*t5 + 2 + l4 + l6 + 2*l5 + 2)>>3;
  113. src[3+2*stride]=
  114. src[2+3*stride]=(t5 + t7 + 2*t6 + 2 + l5 + l7 + 2*l6 + 2)>>3;
  115. src[3+3*stride]=(t6 + t7 + 1 + l6 + l7 + 1)>>2;
  116. }
  117. static void pred4x4_down_left_rv40_nodown_c(uint8_t *src,
  118. const uint8_t *topright,
  119. ptrdiff_t stride)
  120. {
  121. LOAD_TOP_EDGE
  122. LOAD_TOP_RIGHT_EDGE
  123. LOAD_LEFT_EDGE
  124. src[0+0*stride]=(t0 + t2 + 2*t1 + 2 + l0 + l2 + 2*l1 + 2)>>3;
  125. src[1+0*stride]=
  126. src[0+1*stride]=(t1 + t3 + 2*t2 + 2 + l1 + l3 + 2*l2 + 2)>>3;
  127. src[2+0*stride]=
  128. src[1+1*stride]=
  129. src[0+2*stride]=(t2 + t4 + 2*t3 + 2 + l2 + 3*l3 + 2)>>3;
  130. src[3+0*stride]=
  131. src[2+1*stride]=
  132. src[1+2*stride]=
  133. src[0+3*stride]=(t3 + t5 + 2*t4 + 2 + l3*4 + 2)>>3;
  134. src[3+1*stride]=
  135. src[2+2*stride]=
  136. src[1+3*stride]=(t4 + t6 + 2*t5 + 2 + l3*4 + 2)>>3;
  137. src[3+2*stride]=
  138. src[2+3*stride]=(t5 + t7 + 2*t6 + 2 + l3*4 + 2)>>3;
  139. src[3+3*stride]=(t6 + t7 + 1 + 2*l3 + 1)>>2;
  140. }
  141. static void pred4x4_vertical_left_rv40(uint8_t *src, const uint8_t *topright,
  142. ptrdiff_t stride,
  143. const int l0, const int l1, const int l2,
  144. const int l3, const int l4)
  145. {
  146. LOAD_TOP_EDGE
  147. LOAD_TOP_RIGHT_EDGE
  148. src[0+0*stride]=(2*t0 + 2*t1 + l1 + 2*l2 + l3 + 4)>>3;
  149. src[1+0*stride]=
  150. src[0+2*stride]=(t1 + t2 + 1)>>1;
  151. src[2+0*stride]=
  152. src[1+2*stride]=(t2 + t3 + 1)>>1;
  153. src[3+0*stride]=
  154. src[2+2*stride]=(t3 + t4+ 1)>>1;
  155. src[3+2*stride]=(t4 + t5+ 1)>>1;
  156. src[0+1*stride]=(t0 + 2*t1 + t2 + l2 + 2*l3 + l4 + 4)>>3;
  157. src[1+1*stride]=
  158. src[0+3*stride]=(t1 + 2*t2 + t3 + 2)>>2;
  159. src[2+1*stride]=
  160. src[1+3*stride]=(t2 + 2*t3 + t4 + 2)>>2;
  161. src[3+1*stride]=
  162. src[2+3*stride]=(t3 + 2*t4 + t5 + 2)>>2;
  163. src[3+3*stride]=(t4 + 2*t5 + t6 + 2)>>2;
  164. }
  165. static void pred4x4_vertical_left_rv40_c(uint8_t *src, const uint8_t *topright,
  166. ptrdiff_t stride)
  167. {
  168. LOAD_LEFT_EDGE
  169. LOAD_DOWN_LEFT_EDGE
  170. pred4x4_vertical_left_rv40(src, topright, stride, l0, l1, l2, l3, l4);
  171. }
  172. static void pred4x4_vertical_left_rv40_nodown_c(uint8_t *src,
  173. const uint8_t *topright,
  174. ptrdiff_t stride)
  175. {
  176. LOAD_LEFT_EDGE
  177. pred4x4_vertical_left_rv40(src, topright, stride, l0, l1, l2, l3, l3);
  178. }
  179. static void pred4x4_vertical_left_vp8_c(uint8_t *src, const uint8_t *topright,
  180. ptrdiff_t stride)
  181. {
  182. LOAD_TOP_EDGE
  183. LOAD_TOP_RIGHT_EDGE
  184. src[0+0*stride]=(t0 + t1 + 1)>>1;
  185. src[1+0*stride]=
  186. src[0+2*stride]=(t1 + t2 + 1)>>1;
  187. src[2+0*stride]=
  188. src[1+2*stride]=(t2 + t3 + 1)>>1;
  189. src[3+0*stride]=
  190. src[2+2*stride]=(t3 + t4 + 1)>>1;
  191. src[0+1*stride]=(t0 + 2*t1 + t2 + 2)>>2;
  192. src[1+1*stride]=
  193. src[0+3*stride]=(t1 + 2*t2 + t3 + 2)>>2;
  194. src[2+1*stride]=
  195. src[1+3*stride]=(t2 + 2*t3 + t4 + 2)>>2;
  196. src[3+1*stride]=
  197. src[2+3*stride]=(t3 + 2*t4 + t5 + 2)>>2;
  198. src[3+2*stride]=(t4 + 2*t5 + t6 + 2)>>2;
  199. src[3+3*stride]=(t5 + 2*t6 + t7 + 2)>>2;
  200. }
  201. static void pred4x4_horizontal_up_rv40_c(uint8_t *src, const uint8_t *topright,
  202. ptrdiff_t stride)
  203. {
  204. LOAD_LEFT_EDGE
  205. LOAD_DOWN_LEFT_EDGE
  206. LOAD_TOP_EDGE
  207. LOAD_TOP_RIGHT_EDGE
  208. src[0+0*stride]=(t1 + 2*t2 + t3 + 2*l0 + 2*l1 + 4)>>3;
  209. src[1+0*stride]=(t2 + 2*t3 + t4 + l0 + 2*l1 + l2 + 4)>>3;
  210. src[2+0*stride]=
  211. src[0+1*stride]=(t3 + 2*t4 + t5 + 2*l1 + 2*l2 + 4)>>3;
  212. src[3+0*stride]=
  213. src[1+1*stride]=(t4 + 2*t5 + t6 + l1 + 2*l2 + l3 + 4)>>3;
  214. src[2+1*stride]=
  215. src[0+2*stride]=(t5 + 2*t6 + t7 + 2*l2 + 2*l3 + 4)>>3;
  216. src[3+1*stride]=
  217. src[1+2*stride]=(t6 + 3*t7 + l2 + 3*l3 + 4)>>3;
  218. src[3+2*stride]=
  219. src[1+3*stride]=(l3 + 2*l4 + l5 + 2)>>2;
  220. src[0+3*stride]=
  221. src[2+2*stride]=(t6 + t7 + l3 + l4 + 2)>>2;
  222. src[2+3*stride]=(l4 + l5 + 1)>>1;
  223. src[3+3*stride]=(l4 + 2*l5 + l6 + 2)>>2;
  224. }
  225. static void pred4x4_horizontal_up_rv40_nodown_c(uint8_t *src,
  226. const uint8_t *topright,
  227. ptrdiff_t stride)
  228. {
  229. LOAD_LEFT_EDGE
  230. LOAD_TOP_EDGE
  231. LOAD_TOP_RIGHT_EDGE
  232. src[0+0*stride]=(t1 + 2*t2 + t3 + 2*l0 + 2*l1 + 4)>>3;
  233. src[1+0*stride]=(t2 + 2*t3 + t4 + l0 + 2*l1 + l2 + 4)>>3;
  234. src[2+0*stride]=
  235. src[0+1*stride]=(t3 + 2*t4 + t5 + 2*l1 + 2*l2 + 4)>>3;
  236. src[3+0*stride]=
  237. src[1+1*stride]=(t4 + 2*t5 + t6 + l1 + 2*l2 + l3 + 4)>>3;
  238. src[2+1*stride]=
  239. src[0+2*stride]=(t5 + 2*t6 + t7 + 2*l2 + 2*l3 + 4)>>3;
  240. src[3+1*stride]=
  241. src[1+2*stride]=(t6 + 3*t7 + l2 + 3*l3 + 4)>>3;
  242. src[3+2*stride]=
  243. src[1+3*stride]=l3;
  244. src[0+3*stride]=
  245. src[2+2*stride]=(t6 + t7 + 2*l3 + 2)>>2;
  246. src[2+3*stride]=
  247. src[3+3*stride]=l3;
  248. }
  249. static void pred4x4_tm_vp8_c(uint8_t *src, const uint8_t *topright,
  250. ptrdiff_t stride)
  251. {
  252. const uint8_t *cm = ff_crop_tab + MAX_NEG_CROP - src[-1-stride];
  253. uint8_t *top = src-stride;
  254. int y;
  255. for (y = 0; y < 4; y++) {
  256. const uint8_t *cm_in = cm + src[-1];
  257. src[0] = cm_in[top[0]];
  258. src[1] = cm_in[top[1]];
  259. src[2] = cm_in[top[2]];
  260. src[3] = cm_in[top[3]];
  261. src += stride;
  262. }
  263. }
  264. static void pred16x16_plane_svq3_c(uint8_t *src, ptrdiff_t stride)
  265. {
  266. pred16x16_plane_compat_8_c(src, stride, 1, 0);
  267. }
  268. static void pred16x16_plane_rv40_c(uint8_t *src, ptrdiff_t stride)
  269. {
  270. pred16x16_plane_compat_8_c(src, stride, 0, 1);
  271. }
  272. static void pred16x16_tm_vp8_c(uint8_t *src, ptrdiff_t stride)
  273. {
  274. const uint8_t *cm = ff_crop_tab + MAX_NEG_CROP - src[-1-stride];
  275. uint8_t *top = src-stride;
  276. int y;
  277. for (y = 0; y < 16; y++) {
  278. const uint8_t *cm_in = cm + src[-1];
  279. src[0] = cm_in[top[0]];
  280. src[1] = cm_in[top[1]];
  281. src[2] = cm_in[top[2]];
  282. src[3] = cm_in[top[3]];
  283. src[4] = cm_in[top[4]];
  284. src[5] = cm_in[top[5]];
  285. src[6] = cm_in[top[6]];
  286. src[7] = cm_in[top[7]];
  287. src[8] = cm_in[top[8]];
  288. src[9] = cm_in[top[9]];
  289. src[10] = cm_in[top[10]];
  290. src[11] = cm_in[top[11]];
  291. src[12] = cm_in[top[12]];
  292. src[13] = cm_in[top[13]];
  293. src[14] = cm_in[top[14]];
  294. src[15] = cm_in[top[15]];
  295. src += stride;
  296. }
  297. }
  298. static void pred8x8_left_dc_rv40_c(uint8_t *src, ptrdiff_t stride)
  299. {
  300. int i;
  301. unsigned dc0;
  302. dc0=0;
  303. for(i=0;i<8; i++)
  304. dc0+= src[-1+i*stride];
  305. dc0= 0x01010101*((dc0 + 4)>>3);
  306. for(i=0; i<8; i++){
  307. ((uint32_t*)(src+i*stride))[0]=
  308. ((uint32_t*)(src+i*stride))[1]= dc0;
  309. }
  310. }
  311. static void pred8x8_top_dc_rv40_c(uint8_t *src, ptrdiff_t stride)
  312. {
  313. int i;
  314. unsigned dc0;
  315. dc0=0;
  316. for(i=0;i<8; i++)
  317. dc0+= src[i-stride];
  318. dc0= 0x01010101*((dc0 + 4)>>3);
  319. for(i=0; i<8; i++){
  320. ((uint32_t*)(src+i*stride))[0]=
  321. ((uint32_t*)(src+i*stride))[1]= dc0;
  322. }
  323. }
  324. static void pred8x8_dc_rv40_c(uint8_t *src, ptrdiff_t stride)
  325. {
  326. int i;
  327. unsigned dc0 = 0;
  328. for(i=0;i<4; i++){
  329. dc0+= src[-1+i*stride] + src[i-stride];
  330. dc0+= src[4+i-stride];
  331. dc0+= src[-1+(i+4)*stride];
  332. }
  333. dc0= 0x01010101*((dc0 + 8)>>4);
  334. for(i=0; i<4; i++){
  335. ((uint32_t*)(src+i*stride))[0]= dc0;
  336. ((uint32_t*)(src+i*stride))[1]= dc0;
  337. }
  338. for(i=4; i<8; i++){
  339. ((uint32_t*)(src+i*stride))[0]= dc0;
  340. ((uint32_t*)(src+i*stride))[1]= dc0;
  341. }
  342. }
  343. static void pred8x8_tm_vp8_c(uint8_t *src, ptrdiff_t stride)
  344. {
  345. const uint8_t *cm = ff_crop_tab + MAX_NEG_CROP - src[-1-stride];
  346. uint8_t *top = src-stride;
  347. int y;
  348. for (y = 0; y < 8; y++) {
  349. const uint8_t *cm_in = cm + src[-1];
  350. src[0] = cm_in[top[0]];
  351. src[1] = cm_in[top[1]];
  352. src[2] = cm_in[top[2]];
  353. src[3] = cm_in[top[3]];
  354. src[4] = cm_in[top[4]];
  355. src[5] = cm_in[top[5]];
  356. src[6] = cm_in[top[6]];
  357. src[7] = cm_in[top[7]];
  358. src += stride;
  359. }
  360. }
  361. /**
  362. * Set the intra prediction function pointers.
  363. */
  364. av_cold void ff_h264_pred_init(H264PredContext *h, int codec_id,
  365. const int bit_depth,
  366. int chroma_format_idc)
  367. {
  368. #undef FUNC
  369. #undef FUNCC
  370. #define FUNC(a, depth) a ## _ ## depth
  371. #define FUNCC(a, depth) a ## _ ## depth ## _c
  372. #define FUNCD(a) a ## _c
  373. #define H264_PRED(depth) \
  374. if(codec_id != AV_CODEC_ID_RV40){\
  375. if (codec_id == AV_CODEC_ID_VP7 || codec_id == AV_CODEC_ID_VP8) {\
  376. h->pred4x4[VERT_PRED ]= FUNCD(pred4x4_vertical_vp8);\
  377. h->pred4x4[HOR_PRED ]= FUNCD(pred4x4_horizontal_vp8);\
  378. } else {\
  379. h->pred4x4[VERT_PRED ]= FUNCC(pred4x4_vertical , depth);\
  380. h->pred4x4[HOR_PRED ]= FUNCC(pred4x4_horizontal , depth);\
  381. }\
  382. h->pred4x4[DC_PRED ]= FUNCC(pred4x4_dc , depth);\
  383. if(codec_id == AV_CODEC_ID_SVQ3)\
  384. h->pred4x4[DIAG_DOWN_LEFT_PRED ]= FUNCD(pred4x4_down_left_svq3);\
  385. else\
  386. h->pred4x4[DIAG_DOWN_LEFT_PRED ]= FUNCC(pred4x4_down_left , depth);\
  387. h->pred4x4[DIAG_DOWN_RIGHT_PRED]= FUNCC(pred4x4_down_right , depth);\
  388. h->pred4x4[VERT_RIGHT_PRED ]= FUNCC(pred4x4_vertical_right , depth);\
  389. h->pred4x4[HOR_DOWN_PRED ]= FUNCC(pred4x4_horizontal_down , depth);\
  390. if (codec_id == AV_CODEC_ID_VP7 || codec_id == AV_CODEC_ID_VP8) {\
  391. h->pred4x4[VERT_LEFT_PRED ]= FUNCD(pred4x4_vertical_left_vp8);\
  392. } else\
  393. h->pred4x4[VERT_LEFT_PRED ]= FUNCC(pred4x4_vertical_left , depth);\
  394. h->pred4x4[HOR_UP_PRED ]= FUNCC(pred4x4_horizontal_up , depth);\
  395. if (codec_id != AV_CODEC_ID_VP7 && codec_id != AV_CODEC_ID_VP8) {\
  396. h->pred4x4[LEFT_DC_PRED ]= FUNCC(pred4x4_left_dc , depth);\
  397. h->pred4x4[TOP_DC_PRED ]= FUNCC(pred4x4_top_dc , depth);\
  398. } else {\
  399. h->pred4x4[TM_VP8_PRED ]= FUNCD(pred4x4_tm_vp8);\
  400. h->pred4x4[DC_127_PRED ]= FUNCC(pred4x4_127_dc , depth);\
  401. h->pred4x4[DC_129_PRED ]= FUNCC(pred4x4_129_dc , depth);\
  402. h->pred4x4[VERT_VP8_PRED ]= FUNCC(pred4x4_vertical , depth);\
  403. h->pred4x4[HOR_VP8_PRED ]= FUNCC(pred4x4_horizontal , depth);\
  404. }\
  405. if (codec_id != AV_CODEC_ID_VP8)\
  406. h->pred4x4[DC_128_PRED ]= FUNCC(pred4x4_128_dc , depth);\
  407. }else{\
  408. h->pred4x4[VERT_PRED ]= FUNCC(pred4x4_vertical , depth);\
  409. h->pred4x4[HOR_PRED ]= FUNCC(pred4x4_horizontal , depth);\
  410. h->pred4x4[DC_PRED ]= FUNCC(pred4x4_dc , depth);\
  411. h->pred4x4[DIAG_DOWN_LEFT_PRED ]= FUNCD(pred4x4_down_left_rv40);\
  412. h->pred4x4[DIAG_DOWN_RIGHT_PRED]= FUNCC(pred4x4_down_right , depth);\
  413. h->pred4x4[VERT_RIGHT_PRED ]= FUNCC(pred4x4_vertical_right , depth);\
  414. h->pred4x4[HOR_DOWN_PRED ]= FUNCC(pred4x4_horizontal_down , depth);\
  415. h->pred4x4[VERT_LEFT_PRED ]= FUNCD(pred4x4_vertical_left_rv40);\
  416. h->pred4x4[HOR_UP_PRED ]= FUNCD(pred4x4_horizontal_up_rv40);\
  417. h->pred4x4[LEFT_DC_PRED ]= FUNCC(pred4x4_left_dc , depth);\
  418. h->pred4x4[TOP_DC_PRED ]= FUNCC(pred4x4_top_dc , depth);\
  419. h->pred4x4[DC_128_PRED ]= FUNCC(pred4x4_128_dc , depth);\
  420. h->pred4x4[DIAG_DOWN_LEFT_PRED_RV40_NODOWN]= FUNCD(pred4x4_down_left_rv40_nodown);\
  421. h->pred4x4[HOR_UP_PRED_RV40_NODOWN]= FUNCD(pred4x4_horizontal_up_rv40_nodown);\
  422. h->pred4x4[VERT_LEFT_PRED_RV40_NODOWN]= FUNCD(pred4x4_vertical_left_rv40_nodown);\
  423. }\
  424. \
  425. h->pred8x8l[VERT_PRED ]= FUNCC(pred8x8l_vertical , depth);\
  426. h->pred8x8l[HOR_PRED ]= FUNCC(pred8x8l_horizontal , depth);\
  427. h->pred8x8l[DC_PRED ]= FUNCC(pred8x8l_dc , depth);\
  428. h->pred8x8l[DIAG_DOWN_LEFT_PRED ]= FUNCC(pred8x8l_down_left , depth);\
  429. h->pred8x8l[DIAG_DOWN_RIGHT_PRED]= FUNCC(pred8x8l_down_right , depth);\
  430. h->pred8x8l[VERT_RIGHT_PRED ]= FUNCC(pred8x8l_vertical_right , depth);\
  431. h->pred8x8l[HOR_DOWN_PRED ]= FUNCC(pred8x8l_horizontal_down , depth);\
  432. h->pred8x8l[VERT_LEFT_PRED ]= FUNCC(pred8x8l_vertical_left , depth);\
  433. h->pred8x8l[HOR_UP_PRED ]= FUNCC(pred8x8l_horizontal_up , depth);\
  434. h->pred8x8l[LEFT_DC_PRED ]= FUNCC(pred8x8l_left_dc , depth);\
  435. h->pred8x8l[TOP_DC_PRED ]= FUNCC(pred8x8l_top_dc , depth);\
  436. h->pred8x8l[DC_128_PRED ]= FUNCC(pred8x8l_128_dc , depth);\
  437. \
  438. if (chroma_format_idc <= 1) {\
  439. h->pred8x8[VERT_PRED8x8 ]= FUNCC(pred8x8_vertical , depth);\
  440. h->pred8x8[HOR_PRED8x8 ]= FUNCC(pred8x8_horizontal , depth);\
  441. } else {\
  442. h->pred8x8[VERT_PRED8x8 ]= FUNCC(pred8x16_vertical , depth);\
  443. h->pred8x8[HOR_PRED8x8 ]= FUNCC(pred8x16_horizontal , depth);\
  444. }\
  445. if (codec_id != AV_CODEC_ID_VP7 && codec_id != AV_CODEC_ID_VP8) {\
  446. if (chroma_format_idc <= 1) {\
  447. h->pred8x8[PLANE_PRED8x8]= FUNCC(pred8x8_plane , depth);\
  448. } else {\
  449. h->pred8x8[PLANE_PRED8x8]= FUNCC(pred8x16_plane , depth);\
  450. }\
  451. } else\
  452. h->pred8x8[PLANE_PRED8x8]= FUNCD(pred8x8_tm_vp8);\
  453. if (codec_id != AV_CODEC_ID_RV40 && codec_id != AV_CODEC_ID_VP7 && \
  454. codec_id != AV_CODEC_ID_VP8) {\
  455. if (chroma_format_idc <= 1) {\
  456. h->pred8x8[DC_PRED8x8 ]= FUNCC(pred8x8_dc , depth);\
  457. h->pred8x8[LEFT_DC_PRED8x8]= FUNCC(pred8x8_left_dc , depth);\
  458. h->pred8x8[TOP_DC_PRED8x8 ]= FUNCC(pred8x8_top_dc , depth);\
  459. h->pred8x8[ALZHEIMER_DC_L0T_PRED8x8 ]= FUNC(pred8x8_mad_cow_dc_l0t, depth);\
  460. h->pred8x8[ALZHEIMER_DC_0LT_PRED8x8 ]= FUNC(pred8x8_mad_cow_dc_0lt, depth);\
  461. h->pred8x8[ALZHEIMER_DC_L00_PRED8x8 ]= FUNC(pred8x8_mad_cow_dc_l00, depth);\
  462. h->pred8x8[ALZHEIMER_DC_0L0_PRED8x8 ]= FUNC(pred8x8_mad_cow_dc_0l0, depth);\
  463. } else {\
  464. h->pred8x8[DC_PRED8x8 ]= FUNCC(pred8x16_dc , depth);\
  465. h->pred8x8[LEFT_DC_PRED8x8]= FUNCC(pred8x16_left_dc , depth);\
  466. h->pred8x8[TOP_DC_PRED8x8 ]= FUNCC(pred8x16_top_dc , depth);\
  467. h->pred8x8[ALZHEIMER_DC_L0T_PRED8x8 ]= FUNC(pred8x16_mad_cow_dc_l0t, depth);\
  468. h->pred8x8[ALZHEIMER_DC_0LT_PRED8x8 ]= FUNC(pred8x16_mad_cow_dc_0lt, depth);\
  469. h->pred8x8[ALZHEIMER_DC_L00_PRED8x8 ]= FUNC(pred8x16_mad_cow_dc_l00, depth);\
  470. h->pred8x8[ALZHEIMER_DC_0L0_PRED8x8 ]= FUNC(pred8x16_mad_cow_dc_0l0, depth);\
  471. }\
  472. }else{\
  473. h->pred8x8[DC_PRED8x8 ]= FUNCD(pred8x8_dc_rv40);\
  474. h->pred8x8[LEFT_DC_PRED8x8]= FUNCD(pred8x8_left_dc_rv40);\
  475. h->pred8x8[TOP_DC_PRED8x8 ]= FUNCD(pred8x8_top_dc_rv40);\
  476. if (codec_id == AV_CODEC_ID_VP7 || codec_id == AV_CODEC_ID_VP8) {\
  477. h->pred8x8[DC_127_PRED8x8]= FUNCC(pred8x8_127_dc , depth);\
  478. h->pred8x8[DC_129_PRED8x8]= FUNCC(pred8x8_129_dc , depth);\
  479. }\
  480. }\
  481. if (chroma_format_idc <= 1) {\
  482. h->pred8x8[DC_128_PRED8x8 ]= FUNCC(pred8x8_128_dc , depth);\
  483. } else {\
  484. h->pred8x8[DC_128_PRED8x8 ]= FUNCC(pred8x16_128_dc , depth);\
  485. }\
  486. \
  487. h->pred16x16[DC_PRED8x8 ]= FUNCC(pred16x16_dc , depth);\
  488. h->pred16x16[VERT_PRED8x8 ]= FUNCC(pred16x16_vertical , depth);\
  489. h->pred16x16[HOR_PRED8x8 ]= FUNCC(pred16x16_horizontal , depth);\
  490. switch(codec_id){\
  491. case AV_CODEC_ID_SVQ3:\
  492. h->pred16x16[PLANE_PRED8x8 ]= FUNCD(pred16x16_plane_svq3);\
  493. break;\
  494. case AV_CODEC_ID_RV40:\
  495. h->pred16x16[PLANE_PRED8x8 ]= FUNCD(pred16x16_plane_rv40);\
  496. break;\
  497. case AV_CODEC_ID_VP7:\
  498. case AV_CODEC_ID_VP8:\
  499. h->pred16x16[PLANE_PRED8x8 ]= FUNCD(pred16x16_tm_vp8);\
  500. h->pred16x16[DC_127_PRED8x8]= FUNCC(pred16x16_127_dc , depth);\
  501. h->pred16x16[DC_129_PRED8x8]= FUNCC(pred16x16_129_dc , depth);\
  502. break;\
  503. default:\
  504. h->pred16x16[PLANE_PRED8x8 ]= FUNCC(pred16x16_plane , depth);\
  505. break;\
  506. }\
  507. h->pred16x16[LEFT_DC_PRED8x8]= FUNCC(pred16x16_left_dc , depth);\
  508. h->pred16x16[TOP_DC_PRED8x8 ]= FUNCC(pred16x16_top_dc , depth);\
  509. h->pred16x16[DC_128_PRED8x8 ]= FUNCC(pred16x16_128_dc , depth);\
  510. \
  511. /* special lossless h/v prediction for H.264 */ \
  512. h->pred4x4_add [VERT_PRED ]= FUNCC(pred4x4_vertical_add , depth);\
  513. h->pred4x4_add [ HOR_PRED ]= FUNCC(pred4x4_horizontal_add , depth);\
  514. h->pred8x8l_add [VERT_PRED ]= FUNCC(pred8x8l_vertical_add , depth);\
  515. h->pred8x8l_add [ HOR_PRED ]= FUNCC(pred8x8l_horizontal_add , depth);\
  516. h->pred8x8l_filter_add [VERT_PRED ]= FUNCC(pred8x8l_vertical_filter_add , depth);\
  517. h->pred8x8l_filter_add [ HOR_PRED ]= FUNCC(pred8x8l_horizontal_filter_add , depth);\
  518. if (chroma_format_idc <= 1) {\
  519. h->pred8x8_add [VERT_PRED8x8]= FUNCC(pred8x8_vertical_add , depth);\
  520. h->pred8x8_add [ HOR_PRED8x8]= FUNCC(pred8x8_horizontal_add , depth);\
  521. } else {\
  522. h->pred8x8_add [VERT_PRED8x8]= FUNCC(pred8x16_vertical_add , depth);\
  523. h->pred8x8_add [ HOR_PRED8x8]= FUNCC(pred8x16_horizontal_add , depth);\
  524. }\
  525. h->pred16x16_add[VERT_PRED8x8]= FUNCC(pred16x16_vertical_add , depth);\
  526. h->pred16x16_add[ HOR_PRED8x8]= FUNCC(pred16x16_horizontal_add , depth);\
  527. switch (bit_depth) {
  528. case 9:
  529. H264_PRED(9)
  530. break;
  531. case 10:
  532. H264_PRED(10)
  533. break;
  534. case 12:
  535. H264_PRED(12)
  536. break;
  537. case 14:
  538. H264_PRED(14)
  539. break;
  540. default:
  541. av_assert0(bit_depth<=8);
  542. H264_PRED(8)
  543. break;
  544. }
  545. if (ARCH_AARCH64)
  546. ff_h264_pred_init_aarch64(h, codec_id, bit_depth, chroma_format_idc);
  547. if (ARCH_ARM)
  548. ff_h264_pred_init_arm(h, codec_id, bit_depth, chroma_format_idc);
  549. if (ARCH_X86)
  550. ff_h264_pred_init_x86(h, codec_id, bit_depth, chroma_format_idc);
  551. if (ARCH_MIPS)
  552. ff_h264_pred_init_mips(h, codec_id, bit_depth, chroma_format_idc);
  553. }