You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

574 lines
21KB

  1. /*
  2. * H.26L/H.264/AVC/JVT/14496-10/... encoder/decoder
  3. * Copyright (c) 2003 Michael Niedermayer <michaelni@gmx.at>
  4. *
  5. * This file is part of Libav.
  6. *
  7. * Libav is free software; you can redistribute it and/or
  8. * modify it under the terms of the GNU Lesser General Public
  9. * License as published by the Free Software Foundation; either
  10. * version 2.1 of the License, or (at your option) any later version.
  11. *
  12. * Libav is distributed in the hope that it will be useful,
  13. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  15. * Lesser General Public License for more details.
  16. *
  17. * You should have received a copy of the GNU Lesser General Public
  18. * License along with Libav; if not, write to the Free Software
  19. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  20. */
  21. /**
  22. * @file
  23. * H.264 / AVC / MPEG4 part10 prediction functions.
  24. * @author Michael Niedermayer <michaelni@gmx.at>
  25. */
  26. #include "dsputil.h"
  27. #include "h264pred.h"
  28. #define BIT_DEPTH 8
  29. #include "h264pred_template.c"
  30. #undef BIT_DEPTH
  31. #define BIT_DEPTH 9
  32. #include "h264pred_template.c"
  33. #undef BIT_DEPTH
  34. #define BIT_DEPTH 10
  35. #include "h264pred_template.c"
  36. #undef BIT_DEPTH
  37. static void pred4x4_vertical_vp8_c(uint8_t *src, const uint8_t *topright,
  38. ptrdiff_t stride)
  39. {
  40. const unsigned lt = src[-1-1*stride];
  41. LOAD_TOP_EDGE
  42. LOAD_TOP_RIGHT_EDGE
  43. uint32_t v = PACK_4U8((lt + 2*t0 + t1 + 2) >> 2,
  44. (t0 + 2*t1 + t2 + 2) >> 2,
  45. (t1 + 2*t2 + t3 + 2) >> 2,
  46. (t2 + 2*t3 + t4 + 2) >> 2);
  47. AV_WN32A(src+0*stride, v);
  48. AV_WN32A(src+1*stride, v);
  49. AV_WN32A(src+2*stride, v);
  50. AV_WN32A(src+3*stride, v);
  51. }
  52. static void pred4x4_horizontal_vp8_c(uint8_t *src, const uint8_t *topright,
  53. ptrdiff_t stride)
  54. {
  55. const unsigned lt = src[-1-1*stride];
  56. LOAD_LEFT_EDGE
  57. AV_WN32A(src+0*stride, ((lt + 2*l0 + l1 + 2) >> 2)*0x01010101);
  58. AV_WN32A(src+1*stride, ((l0 + 2*l1 + l2 + 2) >> 2)*0x01010101);
  59. AV_WN32A(src+2*stride, ((l1 + 2*l2 + l3 + 2) >> 2)*0x01010101);
  60. AV_WN32A(src+3*stride, ((l2 + 2*l3 + l3 + 2) >> 2)*0x01010101);
  61. }
  62. static void pred4x4_down_left_svq3_c(uint8_t *src, const uint8_t *topright,
  63. ptrdiff_t stride)
  64. {
  65. LOAD_TOP_EDGE
  66. LOAD_LEFT_EDGE
  67. src[0+0*stride]=(l1 + t1)>>1;
  68. src[1+0*stride]=
  69. src[0+1*stride]=(l2 + t2)>>1;
  70. src[2+0*stride]=
  71. src[1+1*stride]=
  72. src[0+2*stride]=
  73. src[3+0*stride]=
  74. src[2+1*stride]=
  75. src[1+2*stride]=
  76. src[0+3*stride]=
  77. src[3+1*stride]=
  78. src[2+2*stride]=
  79. src[1+3*stride]=
  80. src[3+2*stride]=
  81. src[2+3*stride]=
  82. src[3+3*stride]=(l3 + t3)>>1;
  83. }
  84. static void pred4x4_down_left_rv40_c(uint8_t *src, const uint8_t *topright,
  85. ptrdiff_t stride)
  86. {
  87. LOAD_TOP_EDGE
  88. LOAD_TOP_RIGHT_EDGE
  89. LOAD_LEFT_EDGE
  90. LOAD_DOWN_LEFT_EDGE
  91. src[0+0*stride]=(t0 + t2 + 2*t1 + 2 + l0 + l2 + 2*l1 + 2)>>3;
  92. src[1+0*stride]=
  93. src[0+1*stride]=(t1 + t3 + 2*t2 + 2 + l1 + l3 + 2*l2 + 2)>>3;
  94. src[2+0*stride]=
  95. src[1+1*stride]=
  96. src[0+2*stride]=(t2 + t4 + 2*t3 + 2 + l2 + l4 + 2*l3 + 2)>>3;
  97. src[3+0*stride]=
  98. src[2+1*stride]=
  99. src[1+2*stride]=
  100. src[0+3*stride]=(t3 + t5 + 2*t4 + 2 + l3 + l5 + 2*l4 + 2)>>3;
  101. src[3+1*stride]=
  102. src[2+2*stride]=
  103. src[1+3*stride]=(t4 + t6 + 2*t5 + 2 + l4 + l6 + 2*l5 + 2)>>3;
  104. src[3+2*stride]=
  105. src[2+3*stride]=(t5 + t7 + 2*t6 + 2 + l5 + l7 + 2*l6 + 2)>>3;
  106. src[3+3*stride]=(t6 + t7 + 1 + l6 + l7 + 1)>>2;
  107. }
  108. static void pred4x4_down_left_rv40_nodown_c(uint8_t *src,
  109. const uint8_t *topright,
  110. ptrdiff_t stride)
  111. {
  112. LOAD_TOP_EDGE
  113. LOAD_TOP_RIGHT_EDGE
  114. LOAD_LEFT_EDGE
  115. src[0+0*stride]=(t0 + t2 + 2*t1 + 2 + l0 + l2 + 2*l1 + 2)>>3;
  116. src[1+0*stride]=
  117. src[0+1*stride]=(t1 + t3 + 2*t2 + 2 + l1 + l3 + 2*l2 + 2)>>3;
  118. src[2+0*stride]=
  119. src[1+1*stride]=
  120. src[0+2*stride]=(t2 + t4 + 2*t3 + 2 + l2 + 3*l3 + 2)>>3;
  121. src[3+0*stride]=
  122. src[2+1*stride]=
  123. src[1+2*stride]=
  124. src[0+3*stride]=(t3 + t5 + 2*t4 + 2 + l3*4 + 2)>>3;
  125. src[3+1*stride]=
  126. src[2+2*stride]=
  127. src[1+3*stride]=(t4 + t6 + 2*t5 + 2 + l3*4 + 2)>>3;
  128. src[3+2*stride]=
  129. src[2+3*stride]=(t5 + t7 + 2*t6 + 2 + l3*4 + 2)>>3;
  130. src[3+3*stride]=(t6 + t7 + 1 + 2*l3 + 1)>>2;
  131. }
  132. static void pred4x4_vertical_left_rv40(uint8_t *src, const uint8_t *topright,
  133. ptrdiff_t stride,
  134. const int l0, const int l1, const int l2,
  135. const int l3, const int l4)
  136. {
  137. LOAD_TOP_EDGE
  138. LOAD_TOP_RIGHT_EDGE
  139. src[0+0*stride]=(2*t0 + 2*t1 + l1 + 2*l2 + l3 + 4)>>3;
  140. src[1+0*stride]=
  141. src[0+2*stride]=(t1 + t2 + 1)>>1;
  142. src[2+0*stride]=
  143. src[1+2*stride]=(t2 + t3 + 1)>>1;
  144. src[3+0*stride]=
  145. src[2+2*stride]=(t3 + t4+ 1)>>1;
  146. src[3+2*stride]=(t4 + t5+ 1)>>1;
  147. src[0+1*stride]=(t0 + 2*t1 + t2 + l2 + 2*l3 + l4 + 4)>>3;
  148. src[1+1*stride]=
  149. src[0+3*stride]=(t1 + 2*t2 + t3 + 2)>>2;
  150. src[2+1*stride]=
  151. src[1+3*stride]=(t2 + 2*t3 + t4 + 2)>>2;
  152. src[3+1*stride]=
  153. src[2+3*stride]=(t3 + 2*t4 + t5 + 2)>>2;
  154. src[3+3*stride]=(t4 + 2*t5 + t6 + 2)>>2;
  155. }
  156. static void pred4x4_vertical_left_rv40_c(uint8_t *src, const uint8_t *topright,
  157. ptrdiff_t stride)
  158. {
  159. LOAD_LEFT_EDGE
  160. LOAD_DOWN_LEFT_EDGE
  161. pred4x4_vertical_left_rv40(src, topright, stride, l0, l1, l2, l3, l4);
  162. }
  163. static void pred4x4_vertical_left_rv40_nodown_c(uint8_t *src,
  164. const uint8_t *topright,
  165. ptrdiff_t stride)
  166. {
  167. LOAD_LEFT_EDGE
  168. pred4x4_vertical_left_rv40(src, topright, stride, l0, l1, l2, l3, l3);
  169. }
  170. static void pred4x4_vertical_left_vp8_c(uint8_t *src, const uint8_t *topright,
  171. ptrdiff_t stride)
  172. {
  173. LOAD_TOP_EDGE
  174. LOAD_TOP_RIGHT_EDGE
  175. src[0+0*stride]=(t0 + t1 + 1)>>1;
  176. src[1+0*stride]=
  177. src[0+2*stride]=(t1 + t2 + 1)>>1;
  178. src[2+0*stride]=
  179. src[1+2*stride]=(t2 + t3 + 1)>>1;
  180. src[3+0*stride]=
  181. src[2+2*stride]=(t3 + t4 + 1)>>1;
  182. src[0+1*stride]=(t0 + 2*t1 + t2 + 2)>>2;
  183. src[1+1*stride]=
  184. src[0+3*stride]=(t1 + 2*t2 + t3 + 2)>>2;
  185. src[2+1*stride]=
  186. src[1+3*stride]=(t2 + 2*t3 + t4 + 2)>>2;
  187. src[3+1*stride]=
  188. src[2+3*stride]=(t3 + 2*t4 + t5 + 2)>>2;
  189. src[3+2*stride]=(t4 + 2*t5 + t6 + 2)>>2;
  190. src[3+3*stride]=(t5 + 2*t6 + t7 + 2)>>2;
  191. }
  192. static void pred4x4_horizontal_up_rv40_c(uint8_t *src, const uint8_t *topright,
  193. ptrdiff_t stride)
  194. {
  195. LOAD_LEFT_EDGE
  196. LOAD_DOWN_LEFT_EDGE
  197. LOAD_TOP_EDGE
  198. LOAD_TOP_RIGHT_EDGE
  199. src[0+0*stride]=(t1 + 2*t2 + t3 + 2*l0 + 2*l1 + 4)>>3;
  200. src[1+0*stride]=(t2 + 2*t3 + t4 + l0 + 2*l1 + l2 + 4)>>3;
  201. src[2+0*stride]=
  202. src[0+1*stride]=(t3 + 2*t4 + t5 + 2*l1 + 2*l2 + 4)>>3;
  203. src[3+0*stride]=
  204. src[1+1*stride]=(t4 + 2*t5 + t6 + l1 + 2*l2 + l3 + 4)>>3;
  205. src[2+1*stride]=
  206. src[0+2*stride]=(t5 + 2*t6 + t7 + 2*l2 + 2*l3 + 4)>>3;
  207. src[3+1*stride]=
  208. src[1+2*stride]=(t6 + 3*t7 + l2 + 3*l3 + 4)>>3;
  209. src[3+2*stride]=
  210. src[1+3*stride]=(l3 + 2*l4 + l5 + 2)>>2;
  211. src[0+3*stride]=
  212. src[2+2*stride]=(t6 + t7 + l3 + l4 + 2)>>2;
  213. src[2+3*stride]=(l4 + l5 + 1)>>1;
  214. src[3+3*stride]=(l4 + 2*l5 + l6 + 2)>>2;
  215. }
  216. static void pred4x4_horizontal_up_rv40_nodown_c(uint8_t *src,
  217. const uint8_t *topright,
  218. ptrdiff_t stride)
  219. {
  220. LOAD_LEFT_EDGE
  221. LOAD_TOP_EDGE
  222. LOAD_TOP_RIGHT_EDGE
  223. src[0+0*stride]=(t1 + 2*t2 + t3 + 2*l0 + 2*l1 + 4)>>3;
  224. src[1+0*stride]=(t2 + 2*t3 + t4 + l0 + 2*l1 + l2 + 4)>>3;
  225. src[2+0*stride]=
  226. src[0+1*stride]=(t3 + 2*t4 + t5 + 2*l1 + 2*l2 + 4)>>3;
  227. src[3+0*stride]=
  228. src[1+1*stride]=(t4 + 2*t5 + t6 + l1 + 2*l2 + l3 + 4)>>3;
  229. src[2+1*stride]=
  230. src[0+2*stride]=(t5 + 2*t6 + t7 + 2*l2 + 2*l3 + 4)>>3;
  231. src[3+1*stride]=
  232. src[1+2*stride]=(t6 + 3*t7 + l2 + 3*l3 + 4)>>3;
  233. src[3+2*stride]=
  234. src[1+3*stride]=l3;
  235. src[0+3*stride]=
  236. src[2+2*stride]=(t6 + t7 + 2*l3 + 2)>>2;
  237. src[2+3*stride]=
  238. src[3+3*stride]=l3;
  239. }
  240. static void pred4x4_tm_vp8_c(uint8_t *src, const uint8_t *topright,
  241. ptrdiff_t stride)
  242. {
  243. uint8_t *cm = ff_cropTbl + MAX_NEG_CROP - src[-1-stride];
  244. uint8_t *top = src-stride;
  245. int y;
  246. for (y = 0; y < 4; y++) {
  247. uint8_t *cm_in = cm + src[-1];
  248. src[0] = cm_in[top[0]];
  249. src[1] = cm_in[top[1]];
  250. src[2] = cm_in[top[2]];
  251. src[3] = cm_in[top[3]];
  252. src += stride;
  253. }
  254. }
  255. static void pred16x16_plane_svq3_c(uint8_t *src, ptrdiff_t stride)
  256. {
  257. pred16x16_plane_compat_8_c(src, stride, 1, 0);
  258. }
  259. static void pred16x16_plane_rv40_c(uint8_t *src, ptrdiff_t stride)
  260. {
  261. pred16x16_plane_compat_8_c(src, stride, 0, 1);
  262. }
  263. static void pred16x16_tm_vp8_c(uint8_t *src, ptrdiff_t stride)
  264. {
  265. uint8_t *cm = ff_cropTbl + MAX_NEG_CROP - src[-1-stride];
  266. uint8_t *top = src-stride;
  267. int y;
  268. for (y = 0; y < 16; y++) {
  269. uint8_t *cm_in = cm + src[-1];
  270. src[0] = cm_in[top[0]];
  271. src[1] = cm_in[top[1]];
  272. src[2] = cm_in[top[2]];
  273. src[3] = cm_in[top[3]];
  274. src[4] = cm_in[top[4]];
  275. src[5] = cm_in[top[5]];
  276. src[6] = cm_in[top[6]];
  277. src[7] = cm_in[top[7]];
  278. src[8] = cm_in[top[8]];
  279. src[9] = cm_in[top[9]];
  280. src[10] = cm_in[top[10]];
  281. src[11] = cm_in[top[11]];
  282. src[12] = cm_in[top[12]];
  283. src[13] = cm_in[top[13]];
  284. src[14] = cm_in[top[14]];
  285. src[15] = cm_in[top[15]];
  286. src += stride;
  287. }
  288. }
  289. static void pred8x8_left_dc_rv40_c(uint8_t *src, ptrdiff_t stride)
  290. {
  291. int i;
  292. unsigned dc0;
  293. dc0=0;
  294. for(i=0;i<8; i++)
  295. dc0+= src[-1+i*stride];
  296. dc0= 0x01010101*((dc0 + 4)>>3);
  297. for(i=0; i<8; i++){
  298. ((uint32_t*)(src+i*stride))[0]=
  299. ((uint32_t*)(src+i*stride))[1]= dc0;
  300. }
  301. }
  302. static void pred8x8_top_dc_rv40_c(uint8_t *src, ptrdiff_t stride)
  303. {
  304. int i;
  305. unsigned dc0;
  306. dc0=0;
  307. for(i=0;i<8; i++)
  308. dc0+= src[i-stride];
  309. dc0= 0x01010101*((dc0 + 4)>>3);
  310. for(i=0; i<8; i++){
  311. ((uint32_t*)(src+i*stride))[0]=
  312. ((uint32_t*)(src+i*stride))[1]= dc0;
  313. }
  314. }
  315. static void pred8x8_dc_rv40_c(uint8_t *src, ptrdiff_t stride)
  316. {
  317. int i;
  318. unsigned dc0 = 0;
  319. for(i=0;i<4; i++){
  320. dc0+= src[-1+i*stride] + src[i-stride];
  321. dc0+= src[4+i-stride];
  322. dc0+= src[-1+(i+4)*stride];
  323. }
  324. dc0= 0x01010101*((dc0 + 8)>>4);
  325. for(i=0; i<4; i++){
  326. ((uint32_t*)(src+i*stride))[0]= dc0;
  327. ((uint32_t*)(src+i*stride))[1]= dc0;
  328. }
  329. for(i=4; i<8; i++){
  330. ((uint32_t*)(src+i*stride))[0]= dc0;
  331. ((uint32_t*)(src+i*stride))[1]= dc0;
  332. }
  333. }
  334. static void pred8x8_tm_vp8_c(uint8_t *src, ptrdiff_t stride)
  335. {
  336. uint8_t *cm = ff_cropTbl + MAX_NEG_CROP - src[-1-stride];
  337. uint8_t *top = src-stride;
  338. int y;
  339. for (y = 0; y < 8; y++) {
  340. uint8_t *cm_in = cm + src[-1];
  341. src[0] = cm_in[top[0]];
  342. src[1] = cm_in[top[1]];
  343. src[2] = cm_in[top[2]];
  344. src[3] = cm_in[top[3]];
  345. src[4] = cm_in[top[4]];
  346. src[5] = cm_in[top[5]];
  347. src[6] = cm_in[top[6]];
  348. src[7] = cm_in[top[7]];
  349. src += stride;
  350. }
  351. }
  352. /**
  353. * Set the intra prediction function pointers.
  354. */
  355. void ff_h264_pred_init(H264PredContext *h, int codec_id, const int bit_depth,
  356. const int chroma_format_idc)
  357. {
  358. #undef FUNC
  359. #undef FUNCC
  360. #define FUNC(a, depth) a ## _ ## depth
  361. #define FUNCC(a, depth) a ## _ ## depth ## _c
  362. #define FUNCD(a) a ## _c
  363. #define H264_PRED(depth) \
  364. if(codec_id != AV_CODEC_ID_RV40){\
  365. if(codec_id == AV_CODEC_ID_VP8) {\
  366. h->pred4x4[VERT_PRED ]= FUNCD(pred4x4_vertical_vp8);\
  367. h->pred4x4[HOR_PRED ]= FUNCD(pred4x4_horizontal_vp8);\
  368. } else {\
  369. h->pred4x4[VERT_PRED ]= FUNCC(pred4x4_vertical , depth);\
  370. h->pred4x4[HOR_PRED ]= FUNCC(pred4x4_horizontal , depth);\
  371. }\
  372. h->pred4x4[DC_PRED ]= FUNCC(pred4x4_dc , depth);\
  373. if(codec_id == AV_CODEC_ID_SVQ3)\
  374. h->pred4x4[DIAG_DOWN_LEFT_PRED ]= FUNCD(pred4x4_down_left_svq3);\
  375. else\
  376. h->pred4x4[DIAG_DOWN_LEFT_PRED ]= FUNCC(pred4x4_down_left , depth);\
  377. h->pred4x4[DIAG_DOWN_RIGHT_PRED]= FUNCC(pred4x4_down_right , depth);\
  378. h->pred4x4[VERT_RIGHT_PRED ]= FUNCC(pred4x4_vertical_right , depth);\
  379. h->pred4x4[HOR_DOWN_PRED ]= FUNCC(pred4x4_horizontal_down , depth);\
  380. if (codec_id == AV_CODEC_ID_VP8) {\
  381. h->pred4x4[VERT_LEFT_PRED ]= FUNCD(pred4x4_vertical_left_vp8);\
  382. } else\
  383. h->pred4x4[VERT_LEFT_PRED ]= FUNCC(pred4x4_vertical_left , depth);\
  384. h->pred4x4[HOR_UP_PRED ]= FUNCC(pred4x4_horizontal_up , depth);\
  385. if(codec_id != AV_CODEC_ID_VP8) {\
  386. h->pred4x4[LEFT_DC_PRED ]= FUNCC(pred4x4_left_dc , depth);\
  387. h->pred4x4[TOP_DC_PRED ]= FUNCC(pred4x4_top_dc , depth);\
  388. h->pred4x4[DC_128_PRED ]= FUNCC(pred4x4_128_dc , depth);\
  389. } else {\
  390. h->pred4x4[TM_VP8_PRED ]= FUNCD(pred4x4_tm_vp8);\
  391. h->pred4x4[DC_127_PRED ]= FUNCC(pred4x4_127_dc , depth);\
  392. h->pred4x4[DC_129_PRED ]= FUNCC(pred4x4_129_dc , depth);\
  393. h->pred4x4[VERT_VP8_PRED ]= FUNCC(pred4x4_vertical , depth);\
  394. h->pred4x4[HOR_VP8_PRED ]= FUNCC(pred4x4_horizontal , depth);\
  395. }\
  396. }else{\
  397. h->pred4x4[VERT_PRED ]= FUNCC(pred4x4_vertical , depth);\
  398. h->pred4x4[HOR_PRED ]= FUNCC(pred4x4_horizontal , depth);\
  399. h->pred4x4[DC_PRED ]= FUNCC(pred4x4_dc , depth);\
  400. h->pred4x4[DIAG_DOWN_LEFT_PRED ]= FUNCD(pred4x4_down_left_rv40);\
  401. h->pred4x4[DIAG_DOWN_RIGHT_PRED]= FUNCC(pred4x4_down_right , depth);\
  402. h->pred4x4[VERT_RIGHT_PRED ]= FUNCC(pred4x4_vertical_right , depth);\
  403. h->pred4x4[HOR_DOWN_PRED ]= FUNCC(pred4x4_horizontal_down , depth);\
  404. h->pred4x4[VERT_LEFT_PRED ]= FUNCD(pred4x4_vertical_left_rv40);\
  405. h->pred4x4[HOR_UP_PRED ]= FUNCD(pred4x4_horizontal_up_rv40);\
  406. h->pred4x4[LEFT_DC_PRED ]= FUNCC(pred4x4_left_dc , depth);\
  407. h->pred4x4[TOP_DC_PRED ]= FUNCC(pred4x4_top_dc , depth);\
  408. h->pred4x4[DC_128_PRED ]= FUNCC(pred4x4_128_dc , depth);\
  409. h->pred4x4[DIAG_DOWN_LEFT_PRED_RV40_NODOWN]= FUNCD(pred4x4_down_left_rv40_nodown);\
  410. h->pred4x4[HOR_UP_PRED_RV40_NODOWN]= FUNCD(pred4x4_horizontal_up_rv40_nodown);\
  411. h->pred4x4[VERT_LEFT_PRED_RV40_NODOWN]= FUNCD(pred4x4_vertical_left_rv40_nodown);\
  412. }\
  413. \
  414. h->pred8x8l[VERT_PRED ]= FUNCC(pred8x8l_vertical , depth);\
  415. h->pred8x8l[HOR_PRED ]= FUNCC(pred8x8l_horizontal , depth);\
  416. h->pred8x8l[DC_PRED ]= FUNCC(pred8x8l_dc , depth);\
  417. h->pred8x8l[DIAG_DOWN_LEFT_PRED ]= FUNCC(pred8x8l_down_left , depth);\
  418. h->pred8x8l[DIAG_DOWN_RIGHT_PRED]= FUNCC(pred8x8l_down_right , depth);\
  419. h->pred8x8l[VERT_RIGHT_PRED ]= FUNCC(pred8x8l_vertical_right , depth);\
  420. h->pred8x8l[HOR_DOWN_PRED ]= FUNCC(pred8x8l_horizontal_down , depth);\
  421. h->pred8x8l[VERT_LEFT_PRED ]= FUNCC(pred8x8l_vertical_left , depth);\
  422. h->pred8x8l[HOR_UP_PRED ]= FUNCC(pred8x8l_horizontal_up , depth);\
  423. h->pred8x8l[LEFT_DC_PRED ]= FUNCC(pred8x8l_left_dc , depth);\
  424. h->pred8x8l[TOP_DC_PRED ]= FUNCC(pred8x8l_top_dc , depth);\
  425. h->pred8x8l[DC_128_PRED ]= FUNCC(pred8x8l_128_dc , depth);\
  426. \
  427. if (chroma_format_idc == 1) {\
  428. h->pred8x8[VERT_PRED8x8 ]= FUNCC(pred8x8_vertical , depth);\
  429. h->pred8x8[HOR_PRED8x8 ]= FUNCC(pred8x8_horizontal , depth);\
  430. } else {\
  431. h->pred8x8[VERT_PRED8x8 ]= FUNCC(pred8x16_vertical , depth);\
  432. h->pred8x8[HOR_PRED8x8 ]= FUNCC(pred8x16_horizontal , depth);\
  433. }\
  434. if (codec_id != AV_CODEC_ID_VP8) {\
  435. if (chroma_format_idc == 1) {\
  436. h->pred8x8[PLANE_PRED8x8]= FUNCC(pred8x8_plane , depth);\
  437. } else {\
  438. h->pred8x8[PLANE_PRED8x8]= FUNCC(pred8x16_plane , depth);\
  439. }\
  440. } else\
  441. h->pred8x8[PLANE_PRED8x8]= FUNCD(pred8x8_tm_vp8);\
  442. if(codec_id != AV_CODEC_ID_RV40 && codec_id != AV_CODEC_ID_VP8){\
  443. if (chroma_format_idc == 1) {\
  444. h->pred8x8[DC_PRED8x8 ]= FUNCC(pred8x8_dc , depth);\
  445. h->pred8x8[LEFT_DC_PRED8x8]= FUNCC(pred8x8_left_dc , depth);\
  446. h->pred8x8[TOP_DC_PRED8x8 ]= FUNCC(pred8x8_top_dc , depth);\
  447. h->pred8x8[ALZHEIMER_DC_L0T_PRED8x8 ]= FUNC(pred8x8_mad_cow_dc_l0t, depth);\
  448. h->pred8x8[ALZHEIMER_DC_0LT_PRED8x8 ]= FUNC(pred8x8_mad_cow_dc_0lt, depth);\
  449. h->pred8x8[ALZHEIMER_DC_L00_PRED8x8 ]= FUNC(pred8x8_mad_cow_dc_l00, depth);\
  450. h->pred8x8[ALZHEIMER_DC_0L0_PRED8x8 ]= FUNC(pred8x8_mad_cow_dc_0l0, depth);\
  451. } else {\
  452. h->pred8x8[DC_PRED8x8 ]= FUNCC(pred8x16_dc , depth);\
  453. h->pred8x8[LEFT_DC_PRED8x8]= FUNCC(pred8x16_left_dc , depth);\
  454. h->pred8x8[TOP_DC_PRED8x8 ]= FUNCC(pred8x16_top_dc , depth);\
  455. h->pred8x8[ALZHEIMER_DC_L0T_PRED8x8 ]= FUNC(pred8x16_mad_cow_dc_l0t, depth);\
  456. h->pred8x8[ALZHEIMER_DC_0LT_PRED8x8 ]= FUNC(pred8x16_mad_cow_dc_0lt, depth);\
  457. h->pred8x8[ALZHEIMER_DC_L00_PRED8x8 ]= FUNC(pred8x16_mad_cow_dc_l00, depth);\
  458. h->pred8x8[ALZHEIMER_DC_0L0_PRED8x8 ]= FUNC(pred8x16_mad_cow_dc_0l0, depth);\
  459. }\
  460. }else{\
  461. h->pred8x8[DC_PRED8x8 ]= FUNCD(pred8x8_dc_rv40);\
  462. h->pred8x8[LEFT_DC_PRED8x8]= FUNCD(pred8x8_left_dc_rv40);\
  463. h->pred8x8[TOP_DC_PRED8x8 ]= FUNCD(pred8x8_top_dc_rv40);\
  464. if (codec_id == AV_CODEC_ID_VP8) {\
  465. h->pred8x8[DC_127_PRED8x8]= FUNCC(pred8x8_127_dc , depth);\
  466. h->pred8x8[DC_129_PRED8x8]= FUNCC(pred8x8_129_dc , depth);\
  467. }\
  468. }\
  469. if (chroma_format_idc == 1) {\
  470. h->pred8x8[DC_128_PRED8x8 ]= FUNCC(pred8x8_128_dc , depth);\
  471. } else {\
  472. h->pred8x8[DC_128_PRED8x8 ]= FUNCC(pred8x16_128_dc , depth);\
  473. }\
  474. \
  475. h->pred16x16[DC_PRED8x8 ]= FUNCC(pred16x16_dc , depth);\
  476. h->pred16x16[VERT_PRED8x8 ]= FUNCC(pred16x16_vertical , depth);\
  477. h->pred16x16[HOR_PRED8x8 ]= FUNCC(pred16x16_horizontal , depth);\
  478. switch(codec_id){\
  479. case AV_CODEC_ID_SVQ3:\
  480. h->pred16x16[PLANE_PRED8x8 ]= FUNCD(pred16x16_plane_svq3);\
  481. break;\
  482. case AV_CODEC_ID_RV40:\
  483. h->pred16x16[PLANE_PRED8x8 ]= FUNCD(pred16x16_plane_rv40);\
  484. break;\
  485. case AV_CODEC_ID_VP8:\
  486. h->pred16x16[PLANE_PRED8x8 ]= FUNCD(pred16x16_tm_vp8);\
  487. h->pred16x16[DC_127_PRED8x8]= FUNCC(pred16x16_127_dc , depth);\
  488. h->pred16x16[DC_129_PRED8x8]= FUNCC(pred16x16_129_dc , depth);\
  489. break;\
  490. default:\
  491. h->pred16x16[PLANE_PRED8x8 ]= FUNCC(pred16x16_plane , depth);\
  492. break;\
  493. }\
  494. h->pred16x16[LEFT_DC_PRED8x8]= FUNCC(pred16x16_left_dc , depth);\
  495. h->pred16x16[TOP_DC_PRED8x8 ]= FUNCC(pred16x16_top_dc , depth);\
  496. h->pred16x16[DC_128_PRED8x8 ]= FUNCC(pred16x16_128_dc , depth);\
  497. \
  498. /* special lossless h/v prediction for h264 */ \
  499. h->pred4x4_add [VERT_PRED ]= FUNCC(pred4x4_vertical_add , depth);\
  500. h->pred4x4_add [ HOR_PRED ]= FUNCC(pred4x4_horizontal_add , depth);\
  501. h->pred8x8l_add [VERT_PRED ]= FUNCC(pred8x8l_vertical_add , depth);\
  502. h->pred8x8l_add [ HOR_PRED ]= FUNCC(pred8x8l_horizontal_add , depth);\
  503. if (chroma_format_idc == 1) {\
  504. h->pred8x8_add [VERT_PRED8x8]= FUNCC(pred8x8_vertical_add , depth);\
  505. h->pred8x8_add [ HOR_PRED8x8]= FUNCC(pred8x8_horizontal_add , depth);\
  506. } else {\
  507. h->pred8x8_add [VERT_PRED8x8]= FUNCC(pred8x16_vertical_add , depth);\
  508. h->pred8x8_add [ HOR_PRED8x8]= FUNCC(pred8x16_horizontal_add , depth);\
  509. }\
  510. h->pred16x16_add[VERT_PRED8x8]= FUNCC(pred16x16_vertical_add , depth);\
  511. h->pred16x16_add[ HOR_PRED8x8]= FUNCC(pred16x16_horizontal_add , depth);\
  512. switch (bit_depth) {
  513. case 9:
  514. H264_PRED(9)
  515. break;
  516. case 10:
  517. H264_PRED(10)
  518. break;
  519. default:
  520. H264_PRED(8)
  521. break;
  522. }
  523. if (ARCH_ARM) ff_h264_pred_init_arm(h, codec_id, bit_depth, chroma_format_idc);
  524. if (ARCH_X86) ff_h264_pred_init_x86(h, codec_id, bit_depth, chroma_format_idc);
  525. }