You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

748 lines
22KB

  1. /*
  2. * software YUV to RGB converter
  3. *
  4. * Copyright (C) 2009 Konstantin Shishkov
  5. *
  6. * 1,4,8bpp support and context / deglobalize stuff
  7. * by Michael Niedermayer (michaelni@gmx.at)
  8. *
  9. * This file is part of FFmpeg.
  10. *
  11. * FFmpeg is free software; you can redistribute it and/or
  12. * modify it under the terms of the GNU Lesser General Public
  13. * License as published by the Free Software Foundation; either
  14. * version 2.1 of the License, or (at your option) any later version.
  15. *
  16. * FFmpeg is distributed in the hope that it will be useful,
  17. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  18. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  19. * Lesser General Public License for more details.
  20. *
  21. * You should have received a copy of the GNU Lesser General Public
  22. * License along with FFmpeg; if not, write to the Free Software
  23. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  24. */
  25. #include <stdio.h>
  26. #include <stdlib.h>
  27. #include <inttypes.h>
  28. #include <assert.h>
  29. #include "config.h"
  30. #include "rgb2rgb.h"
  31. #include "swscale.h"
  32. #include "swscale_internal.h"
  33. #include "libavutil/x86_cpu.h"
  34. extern const uint8_t dither_8x8_32[8][8];
  35. extern const uint8_t dither_8x8_73[8][8];
  36. extern const uint8_t dither_8x8_220[8][8];
  /*
   * Fixed-point YUV->RGB coefficient sets, one row per colorspace index
   * (the trailing comment on each row names the colorspace).
   * ff_yuv2rgb_c_init_tables() reads an array of this row shape as
   * { crv, cbu, cgu, cgv } and negates the two green entries; presumably
   * callers hand it one of these rows -- confirm against the call sites.
   */
  const int32_t ff_yuv2rgb_coeffs[8][4] = {
      [0] = { 117504, 138453, 13954, 34903 }, /* no sequence_display_extension */
      [1] = { 117504, 138453, 13954, 34903 }, /* ITU-R Rec. 709 (1990) */
      [2] = { 104597, 132201, 25675, 53279 }, /* unspecified */
      [3] = { 104597, 132201, 25675, 53279 }, /* reserved */
      [4] = { 104448, 132798, 24759, 53109 }, /* FCC */
      [5] = { 104597, 132201, 25675, 53279 }, /* ITU-R Rec. 624-4 System B, G */
      [6] = { 104597, 132201, 25675, 53279 }, /* SMPTE 170M */
      [7] = { 117579, 136230, 16907, 35559 }, /* SMPTE 240M (1987) */
  };
  /*
   * Fetch the i-th U and V sample of the current chroma row and point r, g
   * and b at the lookup tables those samples select.  The green table is the
   * U-selected pointer displaced by the V-selected offset.
   * Expects c, pu, pv, U, V, r, g and b to exist in the invoking scope.
   */
  #define LOADCHROMA(i)                                      \
      do {                                                   \
          U = pu[(i)];                                       \
          V = pv[(i)];                                       \
          r = (void *)c->table_rV[V];                        \
          g = (void *)(c->table_gU[U] + c->table_gV[V]);     \
          b = (void *)c->table_bU[U];                        \
      } while (0)
  /*
   * Convert the i-th pair of luma samples of one row into two packed pixels.
   * Each pixel is the sum of the r, g and b table entries selected by its luma
   * value (the tables are chosen beforehand by LOADCHROMA).
   *
   * o (0 or 1) only selects which pixel of the pair is processed first.  The
   * store index follows the load index, so the pixel at position 2*i+k is
   * always produced from the luma sample at position 2*i+k.  Storing to the
   * fixed positions 2*i / 2*i+1 would swap the two pixels whenever o is 1.
   *
   * Expects Y, r, g and b to exist in the invoking scope.
   */
  #define PUTRGB(dst,src,i,o)                                  \
      do {                                                     \
          Y = (src)[2*(i)+(o)];                                \
          (dst)[2*(i)+(o)]   = r[Y] + g[Y] + b[Y];             \
          Y = (src)[2*(i)+1-(o)];                              \
          (dst)[2*(i)+1-(o)] = r[Y] + g[Y] + b[Y];             \
      } while (0)
  /*
   * Convert the i-th pair of luma samples of one row into two 3-byte pixels
   * stored in R, G, B byte order (6 output bytes starting at dst[6*i]).
   * Expects Y, r, g and b to exist in the invoking scope.
   */
  #define PUTRGB24(dst,src,i)                                  \
      do {                                                     \
          Y = (src)[2*(i)];                                    \
          (dst)[6*(i)+0] = r[Y];                               \
          (dst)[6*(i)+1] = g[Y];                               \
          (dst)[6*(i)+2] = b[Y];                               \
          Y = (src)[2*(i)+1];                                  \
          (dst)[6*(i)+3] = r[Y];                               \
          (dst)[6*(i)+4] = g[Y];                               \
          (dst)[6*(i)+5] = b[Y];                               \
      } while (0)
  /*
   * Convert the i-th pair of luma samples of one row into two 3-byte pixels
   * stored in B, G, R byte order (6 output bytes starting at dst[6*i]).
   * Expects Y, r, g and b to exist in the invoking scope.
   */
  #define PUTBGR24(dst,src,i)                                  \
      do {                                                     \
          Y = (src)[2*(i)];                                    \
          (dst)[6*(i)+0] = b[Y];                               \
          (dst)[6*(i)+1] = g[Y];                               \
          (dst)[6*(i)+2] = r[Y];                               \
          Y = (src)[2*(i)+1];                                  \
          (dst)[6*(i)+3] = b[Y];                               \
          (dst)[6*(i)+4] = g[Y];                               \
          (dst)[6*(i)+5] = r[Y];                               \
      } while (0)
  /*
   * Convert the i-th pair of luma samples of one row into two packed 32-bit
   * pixels and merge in the matching alpha samples, shifted left by s bits.
   *
   * o (0 or 1) only selects which pixel of the pair is processed first.  The
   * luma load, the alpha load and the store all use the same position, so the
   * pixel at 2*i+k is always built from luma and alpha sample 2*i+k.  Storing
   * to the fixed positions 2*i / 2*i+1 would swap the colours of the two
   * pixels whenever o is 1.
   *
   * The alpha sample is widened to uint32_t before shifting: shifting the
   * promoted int by 24 would overflow into the sign bit.
   *
   * Expects Y, r, g and b to exist in the invoking scope.
   */
  #define PUTRGBA(dst,ysrc,asrc,i,o,s)                                        \
      do {                                                                    \
          Y = (ysrc)[2*(i)+(o)];                                              \
          (dst)[2*(i)+(o)]   = r[Y] + g[Y] + b[Y]                             \
                             + ((uint32_t)(asrc)[2*(i)+(o)]   << (s));        \
          Y = (ysrc)[2*(i)+1-(o)];                                            \
          (dst)[2*(i)+1-(o)] = r[Y] + g[Y] + b[Y]                             \
                             + ((uint32_t)(asrc)[2*(i)+1-(o)] << (s));        \
      } while (0)
  /*
   * Convert the i-th pair of luma samples of one row into two 6-byte pixels
   * (12 output bytes starting at dst[12*i]).  Every 8-bit component value is
   * written to two consecutive bytes, in R, G, B order.
   * Expects Y, r, g and b to exist in the invoking scope.
   */
  #define PUTRGB48(dst,src,i)                                  \
      do {                                                     \
          Y = (src)[2*(i)];                                    \
          (dst)[12*(i)+ 1] = r[Y];                             \
          (dst)[12*(i)+ 0] = (dst)[12*(i)+ 1];                 \
          (dst)[12*(i)+ 3] = g[Y];                             \
          (dst)[12*(i)+ 2] = (dst)[12*(i)+ 3];                 \
          (dst)[12*(i)+ 5] = b[Y];                             \
          (dst)[12*(i)+ 4] = (dst)[12*(i)+ 5];                 \
          Y = (src)[2*(i)+1];                                  \
          (dst)[12*(i)+ 7] = r[Y];                             \
          (dst)[12*(i)+ 6] = (dst)[12*(i)+ 7];                 \
          (dst)[12*(i)+ 9] = g[Y];                             \
          (dst)[12*(i)+ 8] = (dst)[12*(i)+ 9];                 \
          (dst)[12*(i)+11] = b[Y];                             \
          (dst)[12*(i)+10] = (dst)[12*(i)+11];                 \
      } while (0)
  /*
   * Skeleton shared by every C converter in this file.  A converter is written
   * as
   *
   *     YUV2RGBFUNC(name, dst_type, alpha)
   *         ...statements converting 8 pixels of two rows...
   *     ENDYUV2RGBLINE(dst_delta)
   *         ...statements converting the 4-pixel tail (run when dstW & 4)...
   *     ENDYUV2RGBFUNC()
   *
   * or, with an empty tail section, as YUV2RGBFUNC ... CLOSEYUV2RGBFUNC(dst_delta).
   *
   * YUV2RGBFUNC opens the function, the loop over row pairs and the loop over
   * 8-pixel blocks (dstW >> 3 of them per row pair).  Inside the block loop the
   * statements may use: dst_1/dst_2 (the two output rows), py_1/py_2 (the two
   * luma rows), pu/pv (the chroma row shared by both), pa_1/pa_2 (alpha rows,
   * only assigned when alpha is non-zero), the table pointers r, g, b and the
   * scratch variables Y, U, V.
   *
   * When alpha is zero and the source format is PIX_FMT_YUV422P the chroma
   * strides in the caller's srcStride array are doubled in place.
   *
   * The generated function returns srcSliceH.
   */
  #define YUV2RGBFUNC(func_name, dst_type, alpha) \
  static int func_name(SwsContext *c, uint8_t* src[], int srcStride[], int srcSliceY, \
                       int srcSliceH, uint8_t* dst[], int dstStride[]) \
  { \
      int y; \
      if (!alpha && c->srcFormat == PIX_FMT_YUV422P) { \
          srcStride[1] *= 2; \
          srcStride[2] *= 2; \
      } \
      for (y = 0; y < srcSliceH; y += 2) { \
          dst_type *dst_1 = (dst_type*)(dst[0] + (y+srcSliceY  )*dstStride[0]); \
          dst_type *dst_2 = (dst_type*)(dst[0] + (y+srcSliceY+1)*dstStride[0]); \
          dst_type av_unused *r, *b; \
          dst_type *g; \
          uint8_t *py_1 = src[0] + y*srcStride[0]; \
          uint8_t *py_2 = py_1   +   srcStride[0]; \
          uint8_t *pu   = src[1] + (y>>1)*srcStride[1]; \
          uint8_t *pv   = src[2] + (y>>1)*srcStride[2]; \
          uint8_t av_unused *pa_1, *pa_2; \
          unsigned int blocks_left; \
          if (alpha) { \
              pa_1 = src[3] + y*srcStride[3]; \
              pa_2 = pa_1   +   srcStride[3]; \
          } \
          for (blocks_left = c->dstW>>3; blocks_left; blocks_left--) { \
              int av_unused U, V; \
              int Y;

  /*
   * Ends the 8-pixel block: advances the chroma pointers by 4 samples, the luma
   * pointers by 8 samples and both output pointers by dst_delta elements of
   * dst_type, closes the block loop and opens the tail section that runs once
   * per row pair when dstW & 4 is set.
   */
  #define ENDYUV2RGBLINE(dst_delta) \
              pu    += 4; \
              pv    += 4; \
              py_1  += 8; \
              py_2  += 8; \
              dst_1 += dst_delta; \
              dst_2 += dst_delta; \
          } \
          if (c->dstW & 4) { \
              int av_unused Y, U, V;

  /* Closes the tail section, the row-pair loop and the function. */
  #define ENDYUV2RGBFUNC() \
          } \
      } \
      return srcSliceH; \
  }

  /* Ends a converter that has no tail-section statements. */
  #define CLOSEYUV2RGBFUNC(dst_delta) \
      ENDYUV2RGBLINE(dst_delta) \
      ENDYUV2RGBFUNC()
  127. YUV2RGBFUNC(yuv2rgb_c_48, uint8_t, 0)
  128. LOADCHROMA(0);
  129. PUTRGB48(dst_1,py_1,0);
  130. PUTRGB48(dst_2,py_2,0);
  131. LOADCHROMA(1);
  132. PUTRGB48(dst_2,py_2,1);
  133. PUTRGB48(dst_1,py_1,1);
  134. LOADCHROMA(2);
  135. PUTRGB48(dst_1,py_1,2);
  136. PUTRGB48(dst_2,py_2,2);
  137. LOADCHROMA(3);
  138. PUTRGB48(dst_2,py_2,3);
  139. PUTRGB48(dst_1,py_1,3);
  140. ENDYUV2RGBLINE(48)
  141. LOADCHROMA(0);
  142. PUTRGB48(dst_1,py_1,0);
  143. PUTRGB48(dst_2,py_2,0);
  144. LOADCHROMA(1);
  145. PUTRGB48(dst_2,py_2,1);
  146. PUTRGB48(dst_1,py_1,1);
  147. ENDYUV2RGBFUNC()
  148. YUV2RGBFUNC(yuv2rgb_c_32, uint32_t, 0)
  149. LOADCHROMA(0);
  150. PUTRGB(dst_1,py_1,0,0);
  151. PUTRGB(dst_2,py_2,0,1);
  152. LOADCHROMA(1);
  153. PUTRGB(dst_2,py_2,1,1);
  154. PUTRGB(dst_1,py_1,1,0);
  155. LOADCHROMA(2);
  156. PUTRGB(dst_1,py_1,2,0);
  157. PUTRGB(dst_2,py_2,2,1);
  158. LOADCHROMA(3);
  159. PUTRGB(dst_2,py_2,3,1);
  160. PUTRGB(dst_1,py_1,3,0);
  161. ENDYUV2RGBLINE(8)
  162. LOADCHROMA(0);
  163. PUTRGB(dst_1,py_1,0,0);
  164. PUTRGB(dst_2,py_2,0,1);
  165. LOADCHROMA(1);
  166. PUTRGB(dst_2,py_2,1,1);
  167. PUTRGB(dst_1,py_1,1,0);
  168. ENDYUV2RGBFUNC()
  169. YUV2RGBFUNC(yuva2rgba_c, uint32_t, 1)
  170. LOADCHROMA(0);
  171. PUTRGBA(dst_1,py_1,pa_1,0,0,24);
  172. PUTRGBA(dst_2,py_2,pa_2,0,1,24);
  173. LOADCHROMA(1);
  174. PUTRGBA(dst_2,py_2,pa_1,1,1,24);
  175. PUTRGBA(dst_1,py_1,pa_2,1,0,24);
  176. LOADCHROMA(2);
  177. PUTRGBA(dst_1,py_1,pa_1,2,0,24);
  178. PUTRGBA(dst_2,py_2,pa_2,2,1,24);
  179. LOADCHROMA(3);
  180. PUTRGBA(dst_2,py_2,pa_1,3,1,24);
  181. PUTRGBA(dst_1,py_1,pa_2,3,0,24);
  182. pa_1 += 8;\
  183. pa_2 += 8;\
  184. ENDYUV2RGBLINE(8)
  185. LOADCHROMA(0);
  186. PUTRGBA(dst_1,py_1,pa_1,0,0,24);
  187. PUTRGBA(dst_2,py_2,pa_2,0,1,24);
  188. LOADCHROMA(1);
  189. PUTRGBA(dst_2,py_2,pa_1,1,1,24);
  190. PUTRGBA(dst_1,py_1,pa_2,1,0,24);
  191. ENDYUV2RGBFUNC()
  192. YUV2RGBFUNC(yuva2argb_c, uint32_t, 1)
  193. LOADCHROMA(0);
  194. PUTRGBA(dst_1,py_1,pa_1,0,0,0);
  195. PUTRGBA(dst_2,py_2,pa_2,0,1,0);
  196. LOADCHROMA(1);
  197. PUTRGBA(dst_2,py_2,pa_2,1,1,0);
  198. PUTRGBA(dst_1,py_1,pa_1,1,0,0);
  199. LOADCHROMA(2);
  200. PUTRGBA(dst_1,py_1,pa_1,2,0,0);
  201. PUTRGBA(dst_2,py_2,pa_2,2,1,0);
  202. LOADCHROMA(3);
  203. PUTRGBA(dst_2,py_2,pa_2,3,1,0);
  204. PUTRGBA(dst_1,py_1,pa_1,3,0,0);
  205. pa_1 += 8;\
  206. pa_2 += 8;\
  207. ENDYUV2RGBLINE(8)
  208. LOADCHROMA(0);
  209. PUTRGBA(dst_1,py_1,pa_1,0,0,0);
  210. PUTRGBA(dst_2,py_2,pa_2,0,1,0);
  211. LOADCHROMA(1);
  212. PUTRGBA(dst_2,py_2,pa_2,1,1,0);
  213. PUTRGBA(dst_1,py_1,pa_1,1,0,0);
  214. ENDYUV2RGBFUNC()
  215. YUV2RGBFUNC(yuv2rgb_c_24_rgb, uint8_t, 0)
  216. LOADCHROMA(0);
  217. PUTRGB24(dst_1,py_1,0);
  218. PUTRGB24(dst_2,py_2,0);
  219. LOADCHROMA(1);
  220. PUTRGB24(dst_2,py_2,1);
  221. PUTRGB24(dst_1,py_1,1);
  222. LOADCHROMA(2);
  223. PUTRGB24(dst_1,py_1,2);
  224. PUTRGB24(dst_2,py_2,2);
  225. LOADCHROMA(3);
  226. PUTRGB24(dst_2,py_2,3);
  227. PUTRGB24(dst_1,py_1,3);
  228. ENDYUV2RGBLINE(24)
  229. LOADCHROMA(0);
  230. PUTRGB24(dst_1,py_1,0);
  231. PUTRGB24(dst_2,py_2,0);
  232. LOADCHROMA(1);
  233. PUTRGB24(dst_2,py_2,1);
  234. PUTRGB24(dst_1,py_1,1);
  235. ENDYUV2RGBFUNC()
  236. // only trivial mods from yuv2rgb_c_24_rgb
  237. YUV2RGBFUNC(yuv2rgb_c_24_bgr, uint8_t, 0)
  238. LOADCHROMA(0);
  239. PUTBGR24(dst_1,py_1,0);
  240. PUTBGR24(dst_2,py_2,0);
  241. LOADCHROMA(1);
  242. PUTBGR24(dst_2,py_2,1);
  243. PUTBGR24(dst_1,py_1,1);
  244. LOADCHROMA(2);
  245. PUTBGR24(dst_1,py_1,2);
  246. PUTBGR24(dst_2,py_2,2);
  247. LOADCHROMA(3);
  248. PUTBGR24(dst_2,py_2,3);
  249. PUTBGR24(dst_1,py_1,3);
  250. ENDYUV2RGBLINE(24)
  251. LOADCHROMA(0);
  252. PUTBGR24(dst_1,py_1,0);
  253. PUTBGR24(dst_2,py_2,0);
  254. LOADCHROMA(1);
  255. PUTBGR24(dst_2,py_2,1);
  256. PUTBGR24(dst_1,py_1,1);
  257. ENDYUV2RGBFUNC()
  258. // This is exactly the same code as yuv2rgb_c_32 except for the types of
  259. // r, g, b, dst_1, dst_2
  260. YUV2RGBFUNC(yuv2rgb_c_16, uint16_t, 0)
  261. LOADCHROMA(0);
  262. PUTRGB(dst_1,py_1,0,0);
  263. PUTRGB(dst_2,py_2,0,1);
  264. LOADCHROMA(1);
  265. PUTRGB(dst_2,py_2,1,1);
  266. PUTRGB(dst_1,py_1,1,0);
  267. LOADCHROMA(2);
  268. PUTRGB(dst_1,py_1,2,0);
  269. PUTRGB(dst_2,py_2,2,1);
  270. LOADCHROMA(3);
  271. PUTRGB(dst_2,py_2,3,1);
  272. PUTRGB(dst_1,py_1,3,0);
  273. CLOSEYUV2RGBFUNC(8)
  274. // This is exactly the same code as yuv2rgb_c_32 except for the types of
  275. // r, g, b, dst_1, dst_2
  276. YUV2RGBFUNC(yuv2rgb_c_8, uint8_t, 0)
  277. LOADCHROMA(0);
  278. PUTRGB(dst_1,py_1,0,0);
  279. PUTRGB(dst_2,py_2,0,1);
  280. LOADCHROMA(1);
  281. PUTRGB(dst_2,py_2,1,1);
  282. PUTRGB(dst_1,py_1,1,0);
  283. LOADCHROMA(2);
  284. PUTRGB(dst_1,py_1,2,0);
  285. PUTRGB(dst_2,py_2,2,1);
  286. LOADCHROMA(3);
  287. PUTRGB(dst_2,py_2,3,1);
  288. PUTRGB(dst_1,py_1,3,0);
  289. CLOSEYUV2RGBFUNC(8)
  290. // r, g, b, dst_1, dst_2
  291. YUV2RGBFUNC(yuv2rgb_c_8_ordered_dither, uint8_t, 0)
  292. const uint8_t *d32 = dither_8x8_32[y&7];
  293. const uint8_t *d64 = dither_8x8_73[y&7];
  294. #define PUTRGB8(dst,src,i,o) \
  295. Y = src[2*i]; \
  296. dst[2*i] = r[Y+d32[0+o]] + g[Y+d32[0+o]] + b[Y+d64[0+o]]; \
  297. Y = src[2*i+1]; \
  298. dst[2*i+1] = r[Y+d32[1+o]] + g[Y+d32[1+o]] + b[Y+d64[1+o]];
  299. LOADCHROMA(0);
  300. PUTRGB8(dst_1,py_1,0,0);
  301. PUTRGB8(dst_2,py_2,0,0+8);
  302. LOADCHROMA(1);
  303. PUTRGB8(dst_2,py_2,1,2+8);
  304. PUTRGB8(dst_1,py_1,1,2);
  305. LOADCHROMA(2);
  306. PUTRGB8(dst_1,py_1,2,4);
  307. PUTRGB8(dst_2,py_2,2,4+8);
  308. LOADCHROMA(3);
  309. PUTRGB8(dst_2,py_2,3,6+8);
  310. PUTRGB8(dst_1,py_1,3,6);
  311. CLOSEYUV2RGBFUNC(8)
  312. // This is exactly the same code as yuv2rgb_c_32 except for the types of
  313. // r, g, b, dst_1, dst_2
  314. YUV2RGBFUNC(yuv2rgb_c_4, uint8_t, 0)
  315. int acc;
  316. #define PUTRGB4(dst,src,i) \
  317. Y = src[2*i]; \
  318. acc = r[Y] + g[Y] + b[Y]; \
  319. Y = src[2*i+1]; \
  320. acc |= (r[Y] + g[Y] + b[Y])<<4; \
  321. dst[i] = acc;
  322. LOADCHROMA(0);
  323. PUTRGB4(dst_1,py_1,0);
  324. PUTRGB4(dst_2,py_2,0);
  325. LOADCHROMA(1);
  326. PUTRGB4(dst_2,py_2,1);
  327. PUTRGB4(dst_1,py_1,1);
  328. LOADCHROMA(2);
  329. PUTRGB4(dst_1,py_1,2);
  330. PUTRGB4(dst_2,py_2,2);
  331. LOADCHROMA(3);
  332. PUTRGB4(dst_2,py_2,3);
  333. PUTRGB4(dst_1,py_1,3);
  334. CLOSEYUV2RGBFUNC(4)
  335. YUV2RGBFUNC(yuv2rgb_c_4_ordered_dither, uint8_t, 0)
  336. const uint8_t *d64 = dither_8x8_73[y&7];
  337. const uint8_t *d128 = dither_8x8_220[y&7];
  338. int acc;
  339. #define PUTRGB4D(dst,src,i,o) \
  340. Y = src[2*i]; \
  341. acc = r[Y+d128[0+o]] + g[Y+d64[0+o]] + b[Y+d128[0+o]]; \
  342. Y = src[2*i+1]; \
  343. acc |= (r[Y+d128[1+o]] + g[Y+d64[1+o]] + b[Y+d128[1+o]])<<4; \
  344. dst[i]= acc;
  345. LOADCHROMA(0);
  346. PUTRGB4D(dst_1,py_1,0,0);
  347. PUTRGB4D(dst_2,py_2,0,0+8);
  348. LOADCHROMA(1);
  349. PUTRGB4D(dst_2,py_2,1,2+8);
  350. PUTRGB4D(dst_1,py_1,1,2);
  351. LOADCHROMA(2);
  352. PUTRGB4D(dst_1,py_1,2,4);
  353. PUTRGB4D(dst_2,py_2,2,4+8);
  354. LOADCHROMA(3);
  355. PUTRGB4D(dst_2,py_2,3,6+8);
  356. PUTRGB4D(dst_1,py_1,3,6);
  357. CLOSEYUV2RGBFUNC(4)
  358. // This is exactly the same code as yuv2rgb_c_32 except for the types of
  359. // r, g, b, dst_1, dst_2
  360. YUV2RGBFUNC(yuv2rgb_c_4b, uint8_t, 0)
  361. LOADCHROMA(0);
  362. PUTRGB(dst_1,py_1,0,0);
  363. PUTRGB(dst_2,py_2,0,1);
  364. LOADCHROMA(1);
  365. PUTRGB(dst_2,py_2,1,1);
  366. PUTRGB(dst_1,py_1,1,0);
  367. LOADCHROMA(2);
  368. PUTRGB(dst_1,py_1,2,0);
  369. PUTRGB(dst_2,py_2,2,1);
  370. LOADCHROMA(3);
  371. PUTRGB(dst_2,py_2,3,1);
  372. PUTRGB(dst_1,py_1,3,0);
  373. CLOSEYUV2RGBFUNC(8)
  374. YUV2RGBFUNC(yuv2rgb_c_4b_ordered_dither, uint8_t, 0)
  375. const uint8_t *d64 = dither_8x8_73[y&7];
  376. const uint8_t *d128 = dither_8x8_220[y&7];
  377. #define PUTRGB4DB(dst,src,i,o) \
  378. Y = src[2*i]; \
  379. dst[2*i] = r[Y+d128[0+o]] + g[Y+d64[0+o]] + b[Y+d128[0+o]]; \
  380. Y = src[2*i+1]; \
  381. dst[2*i+1] = r[Y+d128[1+o]] + g[Y+d64[1+o]] + b[Y+d128[1+o]];
  382. LOADCHROMA(0);
  383. PUTRGB4DB(dst_1,py_1,0,0);
  384. PUTRGB4DB(dst_2,py_2,0,0+8);
  385. LOADCHROMA(1);
  386. PUTRGB4DB(dst_2,py_2,1,2+8);
  387. PUTRGB4DB(dst_1,py_1,1,2);
  388. LOADCHROMA(2);
  389. PUTRGB4DB(dst_1,py_1,2,4);
  390. PUTRGB4DB(dst_2,py_2,2,4+8);
  391. LOADCHROMA(3);
  392. PUTRGB4DB(dst_2,py_2,3,6+8);
  393. PUTRGB4DB(dst_1,py_1,3,6);
  394. CLOSEYUV2RGBFUNC(8)
  395. YUV2RGBFUNC(yuv2rgb_c_1_ordered_dither, uint8_t, 0)
  396. const uint8_t *d128 = dither_8x8_220[y&7];
  397. char out_1 = 0, out_2 = 0;
  398. g= c->table_gU[128] + c->table_gV[128];
  399. #define PUTRGB1(out,src,i,o) \
  400. Y = src[2*i]; \
  401. out+= out + g[Y+d128[0+o]]; \
  402. Y = src[2*i+1]; \
  403. out+= out + g[Y+d128[1+o]];
  404. PUTRGB1(out_1,py_1,0,0);
  405. PUTRGB1(out_2,py_2,0,0+8);
  406. PUTRGB1(out_2,py_2,1,2+8);
  407. PUTRGB1(out_1,py_1,1,2);
  408. PUTRGB1(out_1,py_1,2,4);
  409. PUTRGB1(out_2,py_2,2,4+8);
  410. PUTRGB1(out_2,py_2,3,6+8);
  411. PUTRGB1(out_1,py_1,3,6);
  412. dst_1[0]= out_1;
  413. dst_2[0]= out_2;
  414. CLOSEYUV2RGBFUNC(1)
  415. SwsFunc ff_yuv2rgb_get_func_ptr(SwsContext *c)
  416. {
  417. SwsFunc t = NULL;
  418. #if (HAVE_MMX2 || HAVE_MMX) && CONFIG_GPL
  419. t = ff_yuv2rgb_init_mmx(c);
  420. #endif
  421. #if HAVE_VIS
  422. t = ff_yuv2rgb_init_vis(c);
  423. #endif
  424. #if CONFIG_MLIB
  425. t = ff_yuv2rgb_init_mlib(c);
  426. #endif
  427. #if HAVE_ALTIVEC && CONFIG_GPL
  428. if (c->flags & SWS_CPU_CAPS_ALTIVEC)
  429. t = ff_yuv2rgb_init_altivec(c);
  430. #endif
  431. #if ARCH_BFIN
  432. if (c->flags & SWS_CPU_CAPS_BFIN)
  433. t = ff_yuv2rgb_get_func_ptr_bfin(c);
  434. #endif
  435. if (t)
  436. return t;
  437. av_log(c, AV_LOG_WARNING, "No accelerated colorspace conversion found.\n");
  438. switch (c->dstFormat) {
  439. case PIX_FMT_RGB48BE:
  440. case PIX_FMT_RGB48LE: return yuv2rgb_c_48;
  441. case PIX_FMT_ARGB:
  442. case PIX_FMT_ABGR: if (CONFIG_SWSCALE_ALPHA && c->srcFormat == PIX_FMT_YUVA420P) return yuva2argb_c;
  443. case PIX_FMT_RGBA:
  444. case PIX_FMT_BGRA: return (CONFIG_SWSCALE_ALPHA && c->srcFormat == PIX_FMT_YUVA420P) ? yuva2rgba_c : yuv2rgb_c_32;
  445. case PIX_FMT_RGB24: return yuv2rgb_c_24_rgb;
  446. case PIX_FMT_BGR24: return yuv2rgb_c_24_bgr;
  447. case PIX_FMT_RGB565:
  448. case PIX_FMT_BGR565:
  449. case PIX_FMT_RGB555:
  450. case PIX_FMT_BGR555: return yuv2rgb_c_16;
  451. case PIX_FMT_RGB8:
  452. case PIX_FMT_BGR8: return yuv2rgb_c_8_ordered_dither;
  453. case PIX_FMT_RGB4:
  454. case PIX_FMT_BGR4: return yuv2rgb_c_4_ordered_dither;
  455. case PIX_FMT_RGB4_BYTE:
  456. case PIX_FMT_BGR4_BYTE: return yuv2rgb_c_4b_ordered_dither;
  457. case PIX_FMT_MONOBLACK: return yuv2rgb_c_1_ordered_dither;
  458. default:
  459. assert(0);
  460. }
  461. return NULL;
  462. }
  /*
   * Fill a 256-entry table of pointers into a luma lookup table.
   *
   * Entry i is y_table displaced by elemsize * ((i * inc >> 16) - (inc >> 9))
   * bytes, i.e. a 16.16 fixed-point ramp with step inc whose value at i = 128
   * is (up to rounding) y_table itself.
   *
   * table     receives the 256 pointers
   * elemsize  size in bytes of one lookup-table element
   * inc       16.16 fixed-point step per chroma value
   * y_table   address corresponding to a chroma value of 128
   */
  static void fill_table(uint8_t* table[256], const int elemsize, const int inc, uint8_t *y_table)
  {
      uint8_t *const origin = y_table - elemsize * (inc >> 9);
      int64_t ramp = 0;
      int idx = 0;

      while (idx < 256) {
          table[idx++] = origin + elemsize * (ramp >> 16);
          ramp += inc;
      }
  }
  /*
   * Fill a 256-entry table of byte offsets.
   *
   * Entry i is elemsize * ((i * inc >> 16) - (inc >> 9)): the same 16.16
   * fixed-point ramp fill_table() uses, but stored as a plain offset instead of
   * being applied to a base pointer.
   *
   * table     receives the 256 offsets
   * elemsize  size in bytes of one lookup-table element
   * inc       16.16 fixed-point step per chroma value
   */
  static void fill_gv_table(int table[256], const int elemsize, const int inc)
  {
      const int bias = -(inc >> 9);
      int64_t ramp = 0;
      int idx = 0;

      while (idx < 256) {
          table[idx++] = elemsize * (bias + (ramp >> 16));
          ramp += inc;
      }
  }
  483. av_cold int ff_yuv2rgb_c_init_tables(SwsContext *c, const int inv_table[4], int fullRange,
  484. int brightness, int contrast, int saturation)
  485. {
  486. const int isRgb = c->dstFormat==PIX_FMT_RGB32
  487. || c->dstFormat==PIX_FMT_RGB32_1
  488. || c->dstFormat==PIX_FMT_BGR24
  489. || c->dstFormat==PIX_FMT_RGB565
  490. || c->dstFormat==PIX_FMT_RGB555
  491. || c->dstFormat==PIX_FMT_RGB8
  492. || c->dstFormat==PIX_FMT_RGB4
  493. || c->dstFormat==PIX_FMT_RGB4_BYTE
  494. || c->dstFormat==PIX_FMT_MONOBLACK;
  495. const int bpp = fmt_depth(c->dstFormat);
  496. uint8_t *y_table;
  497. uint16_t *y_table16;
  498. uint32_t *y_table32;
  499. int i, base, rbase, gbase, bbase, abase, needAlpha;
  500. const int yoffs = fullRange ? 384 : 326;
  501. int64_t crv = inv_table[0];
  502. int64_t cbu = inv_table[1];
  503. int64_t cgu = -inv_table[2];
  504. int64_t cgv = -inv_table[3];
  505. int64_t cy = 1<<16;
  506. int64_t oy = 0;
  507. int64_t yb = 0;
  508. if (!fullRange) {
  509. cy = (cy*255) / 219;
  510. oy = 16<<16;
  511. } else {
  512. crv = (crv*224) / 255;
  513. cbu = (cbu*224) / 255;
  514. cgu = (cgu*224) / 255;
  515. cgv = (cgv*224) / 255;
  516. }
  517. cy = (cy *contrast ) >> 16;
  518. crv = (crv*contrast * saturation) >> 32;
  519. cbu = (cbu*contrast * saturation) >> 32;
  520. cgu = (cgu*contrast * saturation) >> 32;
  521. cgv = (cgv*contrast * saturation) >> 32;
  522. oy -= 256*brightness;
  523. //scale coefficients by cy
  524. crv = ((crv << 16) + 0x8000) / cy;
  525. cbu = ((cbu << 16) + 0x8000) / cy;
  526. cgu = ((cgu << 16) + 0x8000) / cy;
  527. cgv = ((cgv << 16) + 0x8000) / cy;
  528. av_free(c->yuvTable);
  529. switch (bpp) {
  530. case 1:
  531. c->yuvTable = av_malloc(1024);
  532. y_table = c->yuvTable;
  533. yb = -(384<<16) - oy;
  534. for (i = 0; i < 1024-110; i++) {
  535. y_table[i+110] = av_clip_uint8((yb + 0x8000) >> 16) >> 7;
  536. yb += cy;
  537. }
  538. fill_table(c->table_gU, 1, cgu, y_table + yoffs);
  539. fill_gv_table(c->table_gV, 1, cgv);
  540. break;
  541. case 4:
  542. case 4|128:
  543. rbase = isRgb ? 3 : 0;
  544. gbase = 1;
  545. bbase = isRgb ? 0 : 3;
  546. c->yuvTable = av_malloc(1024*3);
  547. y_table = c->yuvTable;
  548. yb = -(384<<16) - oy;
  549. for (i = 0; i < 1024-110; i++) {
  550. int yval = av_clip_uint8((yb + 0x8000) >> 16);
  551. y_table[i+110 ] = (yval >> 7) << rbase;
  552. y_table[i+ 37+1024] = ((yval + 43) / 85) << gbase;
  553. y_table[i+110+2048] = (yval >> 7) << bbase;
  554. yb += cy;
  555. }
  556. fill_table(c->table_rV, 1, crv, y_table + yoffs);
  557. fill_table(c->table_gU, 1, cgu, y_table + yoffs + 1024);
  558. fill_table(c->table_bU, 1, cbu, y_table + yoffs + 2048);
  559. fill_gv_table(c->table_gV, 1, cgv);
  560. break;
  561. case 8:
  562. rbase = isRgb ? 5 : 0;
  563. gbase = isRgb ? 2 : 3;
  564. bbase = isRgb ? 0 : 6;
  565. c->yuvTable = av_malloc(1024*3);
  566. y_table = c->yuvTable;
  567. yb = -(384<<16) - oy;
  568. for (i = 0; i < 1024-38; i++) {
  569. int yval = av_clip_uint8((yb + 0x8000) >> 16);
  570. y_table[i+16 ] = ((yval + 18) / 36) << rbase;
  571. y_table[i+16+1024] = ((yval + 18) / 36) << gbase;
  572. y_table[i+37+2048] = ((yval + 43) / 85) << bbase;
  573. yb += cy;
  574. }
  575. fill_table(c->table_rV, 1, crv, y_table + yoffs);
  576. fill_table(c->table_gU, 1, cgu, y_table + yoffs + 1024);
  577. fill_table(c->table_bU, 1, cbu, y_table + yoffs + 2048);
  578. fill_gv_table(c->table_gV, 1, cgv);
  579. break;
  580. case 15:
  581. case 16:
  582. rbase = isRgb ? bpp - 5 : 0;
  583. gbase = 5;
  584. bbase = isRgb ? 0 : (bpp - 5);
  585. c->yuvTable = av_malloc(1024*3*2);
  586. y_table16 = c->yuvTable;
  587. yb = -(384<<16) - oy;
  588. for (i = 0; i < 1024; i++) {
  589. uint8_t yval = av_clip_uint8((yb + 0x8000) >> 16);
  590. y_table16[i ] = (yval >> 3) << rbase;
  591. y_table16[i+1024] = (yval >> (18 - bpp)) << gbase;
  592. y_table16[i+2048] = (yval >> 3) << bbase;
  593. yb += cy;
  594. }
  595. fill_table(c->table_rV, 2, crv, y_table16 + yoffs);
  596. fill_table(c->table_gU, 2, cgu, y_table16 + yoffs + 1024);
  597. fill_table(c->table_bU, 2, cbu, y_table16 + yoffs + 2048);
  598. fill_gv_table(c->table_gV, 2, cgv);
  599. break;
  600. case 24:
  601. case 48:
  602. c->yuvTable = av_malloc(1024);
  603. y_table = c->yuvTable;
  604. yb = -(384<<16) - oy;
  605. for (i = 0; i < 1024; i++) {
  606. y_table[i] = av_clip_uint8((yb + 0x8000) >> 16);
  607. yb += cy;
  608. }
  609. fill_table(c->table_rV, 1, crv, y_table + yoffs);
  610. fill_table(c->table_gU, 1, cgu, y_table + yoffs);
  611. fill_table(c->table_bU, 1, cbu, y_table + yoffs);
  612. fill_gv_table(c->table_gV, 1, cgv);
  613. break;
  614. case 32:
  615. base = (c->dstFormat == PIX_FMT_RGB32_1 || c->dstFormat == PIX_FMT_BGR32_1) ? 8 : 0;
  616. rbase = base + (isRgb ? 16 : 0);
  617. gbase = base + 8;
  618. bbase = base + (isRgb ? 0 : 16);
  619. needAlpha = CONFIG_SWSCALE_ALPHA && isALPHA(c->srcFormat);
  620. if (!needAlpha)
  621. abase = (base + 24) & 31;
  622. c->yuvTable = av_malloc(1024*3*4);
  623. y_table32 = c->yuvTable;
  624. yb = -(384<<16) - oy;
  625. for (i = 0; i < 1024; i++) {
  626. uint8_t yval = av_clip_uint8((yb + 0x8000) >> 16);
  627. y_table32[i ] = (yval << rbase) + (needAlpha ? 0 : (255 << abase));
  628. y_table32[i+1024] = yval << gbase;
  629. y_table32[i+2048] = yval << bbase;
  630. yb += cy;
  631. }
  632. fill_table(c->table_rV, 4, crv, y_table32 + yoffs);
  633. fill_table(c->table_gU, 4, cgu, y_table32 + yoffs + 1024);
  634. fill_table(c->table_bU, 4, cbu, y_table32 + yoffs + 2048);
  635. fill_gv_table(c->table_gV, 4, cgv);
  636. break;
  637. default:
  638. c->yuvTable = NULL;
  639. av_log(c, AV_LOG_ERROR, "%ibpp not supported by yuv2rgb\n", bpp);
  640. return -1;
  641. }
  642. return 0;
  643. }