You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

535 lines
20KB

  1. /*
  2. * H.26L/H.264/AVC/JVT/14496-10/... encoder/decoder
  3. * Copyright (c) 2003 Michael Niedermayer <michaelni@gmx.at>
  4. *
  5. * This file is part of FFmpeg.
  6. *
  7. * FFmpeg is free software; you can redistribute it and/or
  8. * modify it under the terms of the GNU Lesser General Public
  9. * License as published by the Free Software Foundation; either
  10. * version 2.1 of the License, or (at your option) any later version.
  11. *
  12. * FFmpeg is distributed in the hope that it will be useful,
  13. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  15. * Lesser General Public License for more details.
  16. *
  17. * You should have received a copy of the GNU Lesser General Public
  18. * License along with FFmpeg; if not, write to the Free Software
  19. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  20. */
  21. /**
  22. * @file
  23. * H.264 / AVC / MPEG4 part10 prediction functions.
  24. * @author Michael Niedermayer <michaelni@gmx.at>
  25. */
  26. #include "h264pred.h"
  27. #define BIT_DEPTH 8
  28. #include "h264pred_template.c"
  29. #undef BIT_DEPTH
  30. #define BIT_DEPTH 9
  31. #include "h264pred_template.c"
  32. #undef BIT_DEPTH
  33. #define BIT_DEPTH 10
  34. #include "h264pred_template.c"
  35. #undef BIT_DEPTH
  36. static void pred4x4_vertical_vp8_c(uint8_t *src, const uint8_t *topright, int stride){
  37. const int lt= src[-1-1*stride];
  38. LOAD_TOP_EDGE
  39. LOAD_TOP_RIGHT_EDGE
  40. uint32_t v = PACK_4U8((lt + 2*t0 + t1 + 2) >> 2,
  41. (t0 + 2*t1 + t2 + 2) >> 2,
  42. (t1 + 2*t2 + t3 + 2) >> 2,
  43. (t2 + 2*t3 + t4 + 2) >> 2);
  44. AV_WN32A(src+0*stride, v);
  45. AV_WN32A(src+1*stride, v);
  46. AV_WN32A(src+2*stride, v);
  47. AV_WN32A(src+3*stride, v);
  48. }
  49. static void pred4x4_horizontal_vp8_c(uint8_t *src, const uint8_t *topright, int stride){
  50. const int lt= src[-1-1*stride];
  51. LOAD_LEFT_EDGE
  52. AV_WN32A(src+0*stride, ((lt + 2*l0 + l1 + 2) >> 2)*0x01010101);
  53. AV_WN32A(src+1*stride, ((l0 + 2*l1 + l2 + 2) >> 2)*0x01010101);
  54. AV_WN32A(src+2*stride, ((l1 + 2*l2 + l3 + 2) >> 2)*0x01010101);
  55. AV_WN32A(src+3*stride, ((l2 + 2*l3 + l3 + 2) >> 2)*0x01010101);
  56. }
  57. static void pred4x4_down_left_svq3_c(uint8_t *src, const uint8_t *topright, int stride){
  58. LOAD_TOP_EDGE
  59. LOAD_LEFT_EDGE
  60. const av_unused int unu0= t0;
  61. const av_unused int unu1= l0;
  62. src[0+0*stride]=(l1 + t1)>>1;
  63. src[1+0*stride]=
  64. src[0+1*stride]=(l2 + t2)>>1;
  65. src[2+0*stride]=
  66. src[1+1*stride]=
  67. src[0+2*stride]=
  68. src[3+0*stride]=
  69. src[2+1*stride]=
  70. src[1+2*stride]=
  71. src[0+3*stride]=
  72. src[3+1*stride]=
  73. src[2+2*stride]=
  74. src[1+3*stride]=
  75. src[3+2*stride]=
  76. src[2+3*stride]=
  77. src[3+3*stride]=(l3 + t3)>>1;
  78. }
  79. static void pred4x4_down_left_rv40_c(uint8_t *src, const uint8_t *topright, int stride){
  80. LOAD_TOP_EDGE
  81. LOAD_TOP_RIGHT_EDGE
  82. LOAD_LEFT_EDGE
  83. LOAD_DOWN_LEFT_EDGE
  84. src[0+0*stride]=(t0 + t2 + 2*t1 + 2 + l0 + l2 + 2*l1 + 2)>>3;
  85. src[1+0*stride]=
  86. src[0+1*stride]=(t1 + t3 + 2*t2 + 2 + l1 + l3 + 2*l2 + 2)>>3;
  87. src[2+0*stride]=
  88. src[1+1*stride]=
  89. src[0+2*stride]=(t2 + t4 + 2*t3 + 2 + l2 + l4 + 2*l3 + 2)>>3;
  90. src[3+0*stride]=
  91. src[2+1*stride]=
  92. src[1+2*stride]=
  93. src[0+3*stride]=(t3 + t5 + 2*t4 + 2 + l3 + l5 + 2*l4 + 2)>>3;
  94. src[3+1*stride]=
  95. src[2+2*stride]=
  96. src[1+3*stride]=(t4 + t6 + 2*t5 + 2 + l4 + l6 + 2*l5 + 2)>>3;
  97. src[3+2*stride]=
  98. src[2+3*stride]=(t5 + t7 + 2*t6 + 2 + l5 + l7 + 2*l6 + 2)>>3;
  99. src[3+3*stride]=(t6 + t7 + 1 + l6 + l7 + 1)>>2;
  100. }
  101. static void pred4x4_down_left_rv40_nodown_c(uint8_t *src, const uint8_t *topright, int stride){
  102. LOAD_TOP_EDGE
  103. LOAD_TOP_RIGHT_EDGE
  104. LOAD_LEFT_EDGE
  105. src[0+0*stride]=(t0 + t2 + 2*t1 + 2 + l0 + l2 + 2*l1 + 2)>>3;
  106. src[1+0*stride]=
  107. src[0+1*stride]=(t1 + t3 + 2*t2 + 2 + l1 + l3 + 2*l2 + 2)>>3;
  108. src[2+0*stride]=
  109. src[1+1*stride]=
  110. src[0+2*stride]=(t2 + t4 + 2*t3 + 2 + l2 + 3*l3 + 2)>>3;
  111. src[3+0*stride]=
  112. src[2+1*stride]=
  113. src[1+2*stride]=
  114. src[0+3*stride]=(t3 + t5 + 2*t4 + 2 + l3*4 + 2)>>3;
  115. src[3+1*stride]=
  116. src[2+2*stride]=
  117. src[1+3*stride]=(t4 + t6 + 2*t5 + 2 + l3*4 + 2)>>3;
  118. src[3+2*stride]=
  119. src[2+3*stride]=(t5 + t7 + 2*t6 + 2 + l3*4 + 2)>>3;
  120. src[3+3*stride]=(t6 + t7 + 1 + 2*l3 + 1)>>2;
  121. }
  122. static void pred4x4_vertical_left_rv40(uint8_t *src, const uint8_t *topright, int stride,
  123. const int l0, const int l1, const int l2, const int l3, const int l4){
  124. LOAD_TOP_EDGE
  125. LOAD_TOP_RIGHT_EDGE
  126. src[0+0*stride]=(2*t0 + 2*t1 + l1 + 2*l2 + l3 + 4)>>3;
  127. src[1+0*stride]=
  128. src[0+2*stride]=(t1 + t2 + 1)>>1;
  129. src[2+0*stride]=
  130. src[1+2*stride]=(t2 + t3 + 1)>>1;
  131. src[3+0*stride]=
  132. src[2+2*stride]=(t3 + t4+ 1)>>1;
  133. src[3+2*stride]=(t4 + t5+ 1)>>1;
  134. src[0+1*stride]=(t0 + 2*t1 + t2 + l2 + 2*l3 + l4 + 4)>>3;
  135. src[1+1*stride]=
  136. src[0+3*stride]=(t1 + 2*t2 + t3 + 2)>>2;
  137. src[2+1*stride]=
  138. src[1+3*stride]=(t2 + 2*t3 + t4 + 2)>>2;
  139. src[3+1*stride]=
  140. src[2+3*stride]=(t3 + 2*t4 + t5 + 2)>>2;
  141. src[3+3*stride]=(t4 + 2*t5 + t6 + 2)>>2;
  142. }
  143. static void pred4x4_vertical_left_rv40_c(uint8_t *src, const uint8_t *topright, int stride){
  144. LOAD_LEFT_EDGE
  145. LOAD_DOWN_LEFT_EDGE
  146. pred4x4_vertical_left_rv40(src, topright, stride, l0, l1, l2, l3, l4);
  147. }
  148. static void pred4x4_vertical_left_rv40_nodown_c(uint8_t *src, const uint8_t *topright, int stride){
  149. LOAD_LEFT_EDGE
  150. pred4x4_vertical_left_rv40(src, topright, stride, l0, l1, l2, l3, l3);
  151. }
  152. static void pred4x4_vertical_left_vp8_c(uint8_t *src, const uint8_t *topright, int stride){
  153. LOAD_TOP_EDGE
  154. LOAD_TOP_RIGHT_EDGE
  155. src[0+0*stride]=(t0 + t1 + 1)>>1;
  156. src[1+0*stride]=
  157. src[0+2*stride]=(t1 + t2 + 1)>>1;
  158. src[2+0*stride]=
  159. src[1+2*stride]=(t2 + t3 + 1)>>1;
  160. src[3+0*stride]=
  161. src[2+2*stride]=(t3 + t4 + 1)>>1;
  162. src[0+1*stride]=(t0 + 2*t1 + t2 + 2)>>2;
  163. src[1+1*stride]=
  164. src[0+3*stride]=(t1 + 2*t2 + t3 + 2)>>2;
  165. src[2+1*stride]=
  166. src[1+3*stride]=(t2 + 2*t3 + t4 + 2)>>2;
  167. src[3+1*stride]=
  168. src[2+3*stride]=(t3 + 2*t4 + t5 + 2)>>2;
  169. src[3+2*stride]=(t4 + 2*t5 + t6 + 2)>>2;
  170. src[3+3*stride]=(t5 + 2*t6 + t7 + 2)>>2;
  171. }
  172. static void pred4x4_horizontal_up_rv40_c(uint8_t *src, const uint8_t *topright, int stride){
  173. LOAD_LEFT_EDGE
  174. LOAD_DOWN_LEFT_EDGE
  175. LOAD_TOP_EDGE
  176. LOAD_TOP_RIGHT_EDGE
  177. src[0+0*stride]=(t1 + 2*t2 + t3 + 2*l0 + 2*l1 + 4)>>3;
  178. src[1+0*stride]=(t2 + 2*t3 + t4 + l0 + 2*l1 + l2 + 4)>>3;
  179. src[2+0*stride]=
  180. src[0+1*stride]=(t3 + 2*t4 + t5 + 2*l1 + 2*l2 + 4)>>3;
  181. src[3+0*stride]=
  182. src[1+1*stride]=(t4 + 2*t5 + t6 + l1 + 2*l2 + l3 + 4)>>3;
  183. src[2+1*stride]=
  184. src[0+2*stride]=(t5 + 2*t6 + t7 + 2*l2 + 2*l3 + 4)>>3;
  185. src[3+1*stride]=
  186. src[1+2*stride]=(t6 + 3*t7 + l2 + 3*l3 + 4)>>3;
  187. src[3+2*stride]=
  188. src[1+3*stride]=(l3 + 2*l4 + l5 + 2)>>2;
  189. src[0+3*stride]=
  190. src[2+2*stride]=(t6 + t7 + l3 + l4 + 2)>>2;
  191. src[2+3*stride]=(l4 + l5 + 1)>>1;
  192. src[3+3*stride]=(l4 + 2*l5 + l6 + 2)>>2;
  193. }
  194. static void pred4x4_horizontal_up_rv40_nodown_c(uint8_t *src, const uint8_t *topright, int stride){
  195. LOAD_LEFT_EDGE
  196. LOAD_TOP_EDGE
  197. LOAD_TOP_RIGHT_EDGE
  198. src[0+0*stride]=(t1 + 2*t2 + t3 + 2*l0 + 2*l1 + 4)>>3;
  199. src[1+0*stride]=(t2 + 2*t3 + t4 + l0 + 2*l1 + l2 + 4)>>3;
  200. src[2+0*stride]=
  201. src[0+1*stride]=(t3 + 2*t4 + t5 + 2*l1 + 2*l2 + 4)>>3;
  202. src[3+0*stride]=
  203. src[1+1*stride]=(t4 + 2*t5 + t6 + l1 + 2*l2 + l3 + 4)>>3;
  204. src[2+1*stride]=
  205. src[0+2*stride]=(t5 + 2*t6 + t7 + 2*l2 + 2*l3 + 4)>>3;
  206. src[3+1*stride]=
  207. src[1+2*stride]=(t6 + 3*t7 + l2 + 3*l3 + 4)>>3;
  208. src[3+2*stride]=
  209. src[1+3*stride]=l3;
  210. src[0+3*stride]=
  211. src[2+2*stride]=(t6 + t7 + 2*l3 + 2)>>2;
  212. src[2+3*stride]=
  213. src[3+3*stride]=l3;
  214. }
  215. static void pred4x4_tm_vp8_c(uint8_t *src, const uint8_t *topright, int stride){
  216. uint8_t *cm = ff_cropTbl + MAX_NEG_CROP - src[-1-stride];
  217. uint8_t *top = src-stride;
  218. int y;
  219. for (y = 0; y < 4; y++) {
  220. uint8_t *cm_in = cm + src[-1];
  221. src[0] = cm_in[top[0]];
  222. src[1] = cm_in[top[1]];
  223. src[2] = cm_in[top[2]];
  224. src[3] = cm_in[top[3]];
  225. src += stride;
  226. }
  227. }
  /**
   * 16x16 plane prediction for SVQ3: forwards to the shared 8-bit
   * "compat" plane predictor with the flag pair (1, 0).
   * NOTE(review): the meaning of the two trailing arguments is defined in the
   * template file, not here; the local names are inferred from the wrapper
   * names — confirm against pred16x16_plane_compat.
   */
  static void pred16x16_plane_svq3_c(uint8_t *src, int stride){
      const int svq3_flag = 1;
      const int rv40_flag = 0;

      pred16x16_plane_compat_8_c(src, stride, svq3_flag, rv40_flag);
  }
  /**
   * 16x16 plane prediction for RV40: forwards to the shared 8-bit
   * "compat" plane predictor with the flag pair (0, 1).
   * NOTE(review): the meaning of the two trailing arguments is defined in the
   * template file, not here; the local names are inferred from the wrapper
   * names — confirm against pred16x16_plane_compat.
   */
  static void pred16x16_plane_rv40_c(uint8_t *src, int stride){
      const int svq3_flag = 0;
      const int rv40_flag = 1;

      pred16x16_plane_compat_8_c(src, stride, svq3_flag, rv40_flag);
  }
  234. static void pred16x16_tm_vp8_c(uint8_t *src, int stride){
  235. uint8_t *cm = ff_cropTbl + MAX_NEG_CROP - src[-1-stride];
  236. uint8_t *top = src-stride;
  237. int y;
  238. for (y = 0; y < 16; y++) {
  239. uint8_t *cm_in = cm + src[-1];
  240. src[0] = cm_in[top[0]];
  241. src[1] = cm_in[top[1]];
  242. src[2] = cm_in[top[2]];
  243. src[3] = cm_in[top[3]];
  244. src[4] = cm_in[top[4]];
  245. src[5] = cm_in[top[5]];
  246. src[6] = cm_in[top[6]];
  247. src[7] = cm_in[top[7]];
  248. src[8] = cm_in[top[8]];
  249. src[9] = cm_in[top[9]];
  250. src[10] = cm_in[top[10]];
  251. src[11] = cm_in[top[11]];
  252. src[12] = cm_in[top[12]];
  253. src[13] = cm_in[top[13]];
  254. src[14] = cm_in[top[14]];
  255. src[15] = cm_in[top[15]];
  256. src += stride;
  257. }
  258. }
  /**
   * 8x8 DC prediction from the left column only (RV40 variant).
   *
   * Computes the rounded mean of the eight pixels immediately left of the
   * block and fills the whole 8x8 block with it.
   *
   * @param src    top-left pixel of the block to fill; src[-1 + y*stride] is
   *               read for y = 0..7
   * @param stride offset between vertically adjacent pixels of src
   */
  static void pred8x8_left_dc_rv40_c(uint8_t *src, int stride){
      unsigned sum = 0;
      uint8_t dc;
      int x, y;

      for (y = 0; y < 8; y++)
          sum += src[-1 + y*stride];
      dc = (sum + 4) >> 3;

      /*
       * Stored byte by byte: splatting with 0x01010101 * dc in a signed int
       * overflows for dc >= 128, and byte stores need neither 4-byte
       * alignment nor a uint32_t view of the pixel buffer.
       */
      for (y = 0; y < 8; y++) {
          uint8_t *const row = src + y*stride;

          for (x = 0; x < 8; x++)
              row[x] = dc;
      }
  }
  /**
   * 8x8 DC prediction from the top row only (RV40 variant).
   *
   * Computes the rounded mean of the eight pixels immediately above the
   * block and fills the whole 8x8 block with it.
   *
   * @param src    top-left pixel of the block to fill; src[x - stride] is
   *               read for x = 0..7
   * @param stride offset between vertically adjacent pixels of src
   */
  static void pred8x8_top_dc_rv40_c(uint8_t *src, int stride){
      unsigned sum = 0;
      uint8_t dc;
      int x, y;

      for (x = 0; x < 8; x++)
          sum += src[x - stride];
      dc = (sum + 4) >> 3;

      /*
       * Stored byte by byte: splatting with 0x01010101 * dc in a signed int
       * overflows for dc >= 128, and byte stores need neither 4-byte
       * alignment nor a uint32_t view of the pixel buffer.
       */
      for (y = 0; y < 8; y++) {
          uint8_t *const row = src + y*stride;

          for (x = 0; x < 8; x++)
              row[x] = dc;
      }
  }
  /**
   * 8x8 DC prediction from both edges (RV40 variant).
   *
   * Computes the rounded mean of the eight pixels left of the block and the
   * eight pixels above it, and fills the whole 8x8 block with that value.
   *
   * @param src    top-left pixel of the block to fill; src[-1 + y*stride] and
   *               src[x - stride] are read for x, y = 0..7
   * @param stride offset between vertically adjacent pixels of src
   */
  static void pred8x8_dc_rv40_c(uint8_t *src, int stride){
      unsigned sum = 0;
      uint8_t dc;
      int i, x, y;

      for (i = 0; i < 8; i++)
          sum += src[-1 + i*stride] + src[i - stride];
      dc = (sum + 8) >> 4;

      /*
       * Stored byte by byte: splatting with 0x01010101 * dc in a signed int
       * overflows for dc >= 128, and byte stores need neither 4-byte
       * alignment nor a uint32_t view of the pixel buffer.
       */
      for (y = 0; y < 8; y++) {
          uint8_t *const row = src + y*stride;

          for (x = 0; x < 8; x++)
              row[x] = dc;
      }
  }
  301. static void pred8x8_tm_vp8_c(uint8_t *src, int stride){
  302. uint8_t *cm = ff_cropTbl + MAX_NEG_CROP - src[-1-stride];
  303. uint8_t *top = src-stride;
  304. int y;
  305. for (y = 0; y < 8; y++) {
  306. uint8_t *cm_in = cm + src[-1];
  307. src[0] = cm_in[top[0]];
  308. src[1] = cm_in[top[1]];
  309. src[2] = cm_in[top[2]];
  310. src[3] = cm_in[top[3]];
  311. src[4] = cm_in[top[4]];
  312. src[5] = cm_in[top[5]];
  313. src[6] = cm_in[top[6]];
  314. src[7] = cm_in[top[7]];
  315. src += stride;
  316. }
  317. }
  318. /**
  319. * Set the intra prediction function pointers.
  320. */
  321. void ff_h264_pred_init(H264PredContext *h, int codec_id, const int bit_depth, const int chroma_format_idc){
  322. // MpegEncContext * const s = &h->s;
  323. #undef FUNC
  324. #undef FUNCC
  325. #define FUNC(a, depth) a ## _ ## depth
  326. #define FUNCC(a, depth) a ## _ ## depth ## _c
  327. #define FUNCD(a) a ## _c
  328. #define H264_PRED(depth) \
  329. if(codec_id != CODEC_ID_RV40){\
  330. if(codec_id == CODEC_ID_VP8) {\
  331. h->pred4x4[VERT_PRED ]= FUNCD(pred4x4_vertical_vp8);\
  332. h->pred4x4[HOR_PRED ]= FUNCD(pred4x4_horizontal_vp8);\
  333. } else {\
  334. h->pred4x4[VERT_PRED ]= FUNCC(pred4x4_vertical , depth);\
  335. h->pred4x4[HOR_PRED ]= FUNCC(pred4x4_horizontal , depth);\
  336. }\
  337. h->pred4x4[DC_PRED ]= FUNCC(pred4x4_dc , depth);\
  338. if(codec_id == CODEC_ID_SVQ3)\
  339. h->pred4x4[DIAG_DOWN_LEFT_PRED ]= FUNCD(pred4x4_down_left_svq3);\
  340. else\
  341. h->pred4x4[DIAG_DOWN_LEFT_PRED ]= FUNCC(pred4x4_down_left , depth);\
  342. h->pred4x4[DIAG_DOWN_RIGHT_PRED]= FUNCC(pred4x4_down_right , depth);\
  343. h->pred4x4[VERT_RIGHT_PRED ]= FUNCC(pred4x4_vertical_right , depth);\
  344. h->pred4x4[HOR_DOWN_PRED ]= FUNCC(pred4x4_horizontal_down , depth);\
  345. if (codec_id == CODEC_ID_VP8) {\
  346. h->pred4x4[VERT_LEFT_PRED ]= FUNCD(pred4x4_vertical_left_vp8);\
  347. } else\
  348. h->pred4x4[VERT_LEFT_PRED ]= FUNCC(pred4x4_vertical_left , depth);\
  349. h->pred4x4[HOR_UP_PRED ]= FUNCC(pred4x4_horizontal_up , depth);\
  350. if(codec_id != CODEC_ID_VP8) {\
  351. h->pred4x4[LEFT_DC_PRED ]= FUNCC(pred4x4_left_dc , depth);\
  352. h->pred4x4[TOP_DC_PRED ]= FUNCC(pred4x4_top_dc , depth);\
  353. h->pred4x4[DC_128_PRED ]= FUNCC(pred4x4_128_dc , depth);\
  354. } else {\
  355. h->pred4x4[TM_VP8_PRED ]= FUNCD(pred4x4_tm_vp8);\
  356. h->pred4x4[DC_127_PRED ]= FUNCC(pred4x4_127_dc , depth);\
  357. h->pred4x4[DC_129_PRED ]= FUNCC(pred4x4_129_dc , depth);\
  358. h->pred4x4[VERT_VP8_PRED ]= FUNCC(pred4x4_vertical , depth);\
  359. h->pred4x4[HOR_VP8_PRED ]= FUNCC(pred4x4_horizontal , depth);\
  360. }\
  361. }else{\
  362. h->pred4x4[VERT_PRED ]= FUNCC(pred4x4_vertical , depth);\
  363. h->pred4x4[HOR_PRED ]= FUNCC(pred4x4_horizontal , depth);\
  364. h->pred4x4[DC_PRED ]= FUNCC(pred4x4_dc , depth);\
  365. h->pred4x4[DIAG_DOWN_LEFT_PRED ]= FUNCD(pred4x4_down_left_rv40);\
  366. h->pred4x4[DIAG_DOWN_RIGHT_PRED]= FUNCC(pred4x4_down_right , depth);\
  367. h->pred4x4[VERT_RIGHT_PRED ]= FUNCC(pred4x4_vertical_right , depth);\
  368. h->pred4x4[HOR_DOWN_PRED ]= FUNCC(pred4x4_horizontal_down , depth);\
  369. h->pred4x4[VERT_LEFT_PRED ]= FUNCD(pred4x4_vertical_left_rv40);\
  370. h->pred4x4[HOR_UP_PRED ]= FUNCD(pred4x4_horizontal_up_rv40);\
  371. h->pred4x4[LEFT_DC_PRED ]= FUNCC(pred4x4_left_dc , depth);\
  372. h->pred4x4[TOP_DC_PRED ]= FUNCC(pred4x4_top_dc , depth);\
  373. h->pred4x4[DC_128_PRED ]= FUNCC(pred4x4_128_dc , depth);\
  374. h->pred4x4[DIAG_DOWN_LEFT_PRED_RV40_NODOWN]= FUNCD(pred4x4_down_left_rv40_nodown);\
  375. h->pred4x4[HOR_UP_PRED_RV40_NODOWN]= FUNCD(pred4x4_horizontal_up_rv40_nodown);\
  376. h->pred4x4[VERT_LEFT_PRED_RV40_NODOWN]= FUNCD(pred4x4_vertical_left_rv40_nodown);\
  377. }\
  378. \
  379. h->pred8x8l[VERT_PRED ]= FUNCC(pred8x8l_vertical , depth);\
  380. h->pred8x8l[HOR_PRED ]= FUNCC(pred8x8l_horizontal , depth);\
  381. h->pred8x8l[DC_PRED ]= FUNCC(pred8x8l_dc , depth);\
  382. h->pred8x8l[DIAG_DOWN_LEFT_PRED ]= FUNCC(pred8x8l_down_left , depth);\
  383. h->pred8x8l[DIAG_DOWN_RIGHT_PRED]= FUNCC(pred8x8l_down_right , depth);\
  384. h->pred8x8l[VERT_RIGHT_PRED ]= FUNCC(pred8x8l_vertical_right , depth);\
  385. h->pred8x8l[HOR_DOWN_PRED ]= FUNCC(pred8x8l_horizontal_down , depth);\
  386. h->pred8x8l[VERT_LEFT_PRED ]= FUNCC(pred8x8l_vertical_left , depth);\
  387. h->pred8x8l[HOR_UP_PRED ]= FUNCC(pred8x8l_horizontal_up , depth);\
  388. h->pred8x8l[LEFT_DC_PRED ]= FUNCC(pred8x8l_left_dc , depth);\
  389. h->pred8x8l[TOP_DC_PRED ]= FUNCC(pred8x8l_top_dc , depth);\
  390. h->pred8x8l[DC_128_PRED ]= FUNCC(pred8x8l_128_dc , depth);\
  391. \
  392. if (chroma_format_idc == 1) {\
  393. h->pred8x8[VERT_PRED8x8 ]= FUNCC(pred8x8_vertical , depth);\
  394. h->pred8x8[HOR_PRED8x8 ]= FUNCC(pred8x8_horizontal , depth);\
  395. } else {\
  396. h->pred8x8[VERT_PRED8x8 ]= FUNCC(pred8x16_vertical , depth);\
  397. h->pred8x8[HOR_PRED8x8 ]= FUNCC(pred8x16_horizontal , depth);\
  398. }\
  399. if (codec_id != CODEC_ID_VP8) {\
  400. if (chroma_format_idc == 1) {\
  401. h->pred8x8[PLANE_PRED8x8]= FUNCC(pred8x8_plane , depth);\
  402. } else {\
  403. h->pred8x8[PLANE_PRED8x8]= FUNCC(pred8x16_plane , depth);\
  404. }\
  405. } else\
  406. h->pred8x8[PLANE_PRED8x8]= FUNCD(pred8x8_tm_vp8);\
  407. if(codec_id != CODEC_ID_RV40 && codec_id != CODEC_ID_VP8){\
  408. if (chroma_format_idc == 1) {\
  409. h->pred8x8[DC_PRED8x8 ]= FUNCC(pred8x8_dc , depth);\
  410. h->pred8x8[LEFT_DC_PRED8x8]= FUNCC(pred8x8_left_dc , depth);\
  411. h->pred8x8[TOP_DC_PRED8x8 ]= FUNCC(pred8x8_top_dc , depth);\
  412. h->pred8x8[ALZHEIMER_DC_L0T_PRED8x8 ]= FUNC(pred8x8_mad_cow_dc_l0t, depth);\
  413. h->pred8x8[ALZHEIMER_DC_0LT_PRED8x8 ]= FUNC(pred8x8_mad_cow_dc_0lt, depth);\
  414. h->pred8x8[ALZHEIMER_DC_L00_PRED8x8 ]= FUNC(pred8x8_mad_cow_dc_l00, depth);\
  415. h->pred8x8[ALZHEIMER_DC_0L0_PRED8x8 ]= FUNC(pred8x8_mad_cow_dc_0l0, depth);\
  416. } else {\
  417. h->pred8x8[DC_PRED8x8 ]= FUNCC(pred8x16_dc , depth);\
  418. h->pred8x8[LEFT_DC_PRED8x8]= FUNCC(pred8x16_left_dc , depth);\
  419. h->pred8x8[TOP_DC_PRED8x8 ]= FUNCC(pred8x16_top_dc , depth);\
  420. h->pred8x8[ALZHEIMER_DC_L0T_PRED8x8 ]= FUNC(pred8x8_mad_cow_dc_l0t, depth);\
  421. h->pred8x8[ALZHEIMER_DC_0LT_PRED8x8 ]= FUNC(pred8x8_mad_cow_dc_0lt, depth);\
  422. h->pred8x8[ALZHEIMER_DC_L00_PRED8x8 ]= FUNC(pred8x8_mad_cow_dc_l00, depth);\
  423. h->pred8x8[ALZHEIMER_DC_0L0_PRED8x8 ]= FUNC(pred8x8_mad_cow_dc_0l0, depth);\
  424. }\
  425. }else{\
  426. h->pred8x8[DC_PRED8x8 ]= FUNCD(pred8x8_dc_rv40);\
  427. h->pred8x8[LEFT_DC_PRED8x8]= FUNCD(pred8x8_left_dc_rv40);\
  428. h->pred8x8[TOP_DC_PRED8x8 ]= FUNCD(pred8x8_top_dc_rv40);\
  429. if (codec_id == CODEC_ID_VP8) {\
  430. h->pred8x8[DC_127_PRED8x8]= FUNCC(pred8x8_127_dc , depth);\
  431. h->pred8x8[DC_129_PRED8x8]= FUNCC(pred8x8_129_dc , depth);\
  432. }\
  433. }\
  434. if (chroma_format_idc == 1) {\
  435. h->pred8x8[DC_128_PRED8x8 ]= FUNCC(pred8x8_128_dc , depth);\
  436. } else {\
  437. h->pred8x8[DC_128_PRED8x8 ]= FUNCC(pred8x16_128_dc , depth);\
  438. }\
  439. \
  440. h->pred16x16[DC_PRED8x8 ]= FUNCC(pred16x16_dc , depth);\
  441. h->pred16x16[VERT_PRED8x8 ]= FUNCC(pred16x16_vertical , depth);\
  442. h->pred16x16[HOR_PRED8x8 ]= FUNCC(pred16x16_horizontal , depth);\
  443. switch(codec_id){\
  444. case CODEC_ID_SVQ3:\
  445. h->pred16x16[PLANE_PRED8x8 ]= FUNCD(pred16x16_plane_svq3);\
  446. break;\
  447. case CODEC_ID_RV40:\
  448. h->pred16x16[PLANE_PRED8x8 ]= FUNCD(pred16x16_plane_rv40);\
  449. break;\
  450. case CODEC_ID_VP8:\
  451. h->pred16x16[PLANE_PRED8x8 ]= FUNCD(pred16x16_tm_vp8);\
  452. h->pred16x16[DC_127_PRED8x8]= FUNCC(pred16x16_127_dc , depth);\
  453. h->pred16x16[DC_129_PRED8x8]= FUNCC(pred16x16_129_dc , depth);\
  454. break;\
  455. default:\
  456. h->pred16x16[PLANE_PRED8x8 ]= FUNCC(pred16x16_plane , depth);\
  457. break;\
  458. }\
  459. h->pred16x16[LEFT_DC_PRED8x8]= FUNCC(pred16x16_left_dc , depth);\
  460. h->pred16x16[TOP_DC_PRED8x8 ]= FUNCC(pred16x16_top_dc , depth);\
  461. h->pred16x16[DC_128_PRED8x8 ]= FUNCC(pred16x16_128_dc , depth);\
  462. \
  463. /* special lossless h/v prediction for h264 */ \
  464. h->pred4x4_add [VERT_PRED ]= FUNCC(pred4x4_vertical_add , depth);\
  465. h->pred4x4_add [ HOR_PRED ]= FUNCC(pred4x4_horizontal_add , depth);\
  466. h->pred8x8l_add [VERT_PRED ]= FUNCC(pred8x8l_vertical_add , depth);\
  467. h->pred8x8l_add [ HOR_PRED ]= FUNCC(pred8x8l_horizontal_add , depth);\
  468. h->pred8x8_add [VERT_PRED8x8]= FUNCC(pred8x8_vertical_add , depth);\
  469. h->pred8x8_add [ HOR_PRED8x8]= FUNCC(pred8x8_horizontal_add , depth);\
  470. h->pred16x16_add[VERT_PRED8x8]= FUNCC(pred16x16_vertical_add , depth);\
  471. h->pred16x16_add[ HOR_PRED8x8]= FUNCC(pred16x16_horizontal_add , depth);\
  472. switch (bit_depth) {
  473. case 9:
  474. H264_PRED(9)
  475. break;
  476. case 10:
  477. H264_PRED(10)
  478. break;
  479. default:
  480. H264_PRED(8)
  481. break;
  482. }
  483. if (ARCH_ARM) ff_h264_pred_init_arm(h, codec_id, bit_depth, chroma_format_idc);
  484. if (HAVE_MMX) ff_h264_pred_init_x86(h, codec_id, bit_depth, chroma_format_idc);
  485. }