You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

709 lines
21KB

  1. /*
  2. * software YUV to RGB converter
  3. *
  4. * Copyright (C) 2009 Konstantin Shishkov
  5. *
  6. * 1,4,8bpp support and context / deglobalize stuff
  7. * by Michael Niedermayer (michaelni@gmx.at)
  8. *
  9. * This file is part of FFmpeg.
  10. *
  11. * FFmpeg is free software; you can redistribute it and/or
  12. * modify it under the terms of the GNU Lesser General Public
  13. * License as published by the Free Software Foundation; either
  14. * version 2.1 of the License, or (at your option) any later version.
  15. *
  16. * FFmpeg is distributed in the hope that it will be useful,
  17. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  18. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  19. * Lesser General Public License for more details.
  20. *
  21. * You should have received a copy of the GNU Lesser General Public
  22. * License along with FFmpeg; if not, write to the Free Software
  23. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  24. */
  25. #include <stdio.h>
  26. #include <stdlib.h>
  27. #include <inttypes.h>
  28. #include <assert.h>
  29. #include "config.h"
  30. #include "rgb2rgb.h"
  31. #include "swscale.h"
  32. #include "swscale_internal.h"
  33. #include "libavutil/x86_cpu.h"
/*
 * 8x8 ordered-dither matrices, defined in another translation unit.
 * The dithered converters below pick a row with (y & 7) and add the
 * selected entries to the luma index before the table lookup.
 */
extern const uint8_t dither_8x8_32[8][8];
extern const uint8_t dither_8x8_73[8][8];
extern const uint8_t dither_8x8_220[8][8];

/**
 * YUV -> RGB conversion coefficient sets: eight rows of four values each.
 *
 * ff_yuv2rgb_c_init_tables() consumes a four-entry table of this shape as
 * { crv, cbu, -cgu, -cgv } (entries 2 and 3 are negated when read).
 * NOTE(review): the row order appears to follow the MPEG-2
 * matrix_coefficients numbering named in the per-row comments, and the
 * values appear to be 16.16 fixed point -- confirm against the callers.
 */
const int32_t ff_yuv2rgb_coeffs[8][4] = {
    {117504, 138453, 13954, 34903}, /* no sequence_display_extension */
    {117504, 138453, 13954, 34903}, /* ITU-R Rec. 709 (1990) */
    {104597, 132201, 25675, 53279}, /* unspecified */
    {104597, 132201, 25675, 53279}, /* reserved */
    {104448, 132798, 24759, 53109}, /* FCC */
    {104597, 132201, 25675, 53279}, /* ITU-R Rec. 624-4 System B, G */
    {104597, 132201, 25675, 53279}, /* SMPTE 170M */
    {117579, 136230, 16907, 35559}  /* SMPTE 240M (1987) */
};
  47. #define LOADCHROMA(i) \
  48. U = pu[i]; \
  49. V = pv[i]; \
  50. r = (void *)c->table_rV[V]; \
  51. g = (void *)(c->table_gU[U] + c->table_gV[V]); \
  52. b = (void *)c->table_bU[U];
  53. #define PUTRGB(dst,src,i,o) \
  54. Y = src[2*i+o]; \
  55. dst[2*i ] = r[Y] + g[Y] + b[Y]; \
  56. Y = src[2*i+1-o]; \
  57. dst[2*i+1] = r[Y] + g[Y] + b[Y];
  58. #define PUTRGB24(dst,src,i) \
  59. Y = src[2*i]; \
  60. dst[6*i+0] = r[Y]; dst[6*i+1] = g[Y]; dst[6*i+2] = b[Y]; \
  61. Y = src[2*i+1]; \
  62. dst[6*i+3] = r[Y]; dst[6*i+4] = g[Y]; dst[6*i+5] = b[Y];
  63. #define PUTBGR24(dst,src,i) \
  64. Y = src[2*i]; \
  65. dst[6*i+0] = b[Y]; dst[6*i+1] = g[Y]; dst[6*i+2] = r[Y]; \
  66. Y = src[2*i+1]; \
  67. dst[6*i+3] = b[Y]; dst[6*i+4] = g[Y]; dst[6*i+5] = r[Y];
  68. #define PUTRGBA(dst,ysrc,asrc,i,o,s) \
  69. Y = ysrc[2*i+o]; \
  70. dst[2*i ] = r[Y] + g[Y] + b[Y] + (asrc[2*i ]<<s); \
  71. Y = ysrc[2*i+1-o]; \
  72. dst[2*i+1] = r[Y] + g[Y] + b[Y] + (asrc[2*i+1]<<s);
  73. #define YUV2RGBFUNC(func_name, dst_type, alpha) \
  74. static int func_name(SwsContext *c, uint8_t* src[], int srcStride[], int srcSliceY, \
  75. int srcSliceH, uint8_t* dst[], int dstStride[]){\
  76. int y;\
  77. \
  78. if (!alpha && c->srcFormat == PIX_FMT_YUV422P) {\
  79. srcStride[1] *= 2;\
  80. srcStride[2] *= 2;\
  81. }\
  82. for (y=0; y<srcSliceH; y+=2) {\
  83. dst_type *dst_1 = (dst_type*)(dst[0] + (y+srcSliceY )*dstStride[0]);\
  84. dst_type *dst_2 = (dst_type*)(dst[0] + (y+srcSliceY+1)*dstStride[0]);\
  85. dst_type av_unused *r, *b;\
  86. dst_type *g;\
  87. uint8_t *py_1 = src[0] + y*srcStride[0];\
  88. uint8_t *py_2 = py_1 + srcStride[0];\
  89. uint8_t *pu = src[1] + (y>>1)*srcStride[1];\
  90. uint8_t *pv = src[2] + (y>>1)*srcStride[2];\
  91. uint8_t av_unused *pa_1, *pa_2;\
  92. unsigned int h_size = c->dstW>>3;\
  93. if (alpha){\
  94. pa_1 = src[3] + y*srcStride[3];\
  95. pa_2 = pa_1 + srcStride[3];\
  96. }\
  97. while (h_size--) {\
  98. int av_unused U, V;\
  99. int Y;\
  100. #define ENDYUV2RGBLINE(dst_delta)\
  101. pu += 4;\
  102. pv += 4;\
  103. py_1 += 8;\
  104. py_2 += 8;\
  105. dst_1 += dst_delta;\
  106. dst_2 += dst_delta;\
  107. }\
  108. if (c->dstW & 4) {\
  109. int av_unused Y, U, V;\
  110. #define ENDYUV2RGBFUNC()\
  111. }\
  112. }\
  113. return srcSliceH;\
  114. }
  115. #define CLOSEYUV2RGBFUNC(dst_delta)\
  116. ENDYUV2RGBLINE(dst_delta)\
  117. ENDYUV2RGBFUNC()
/*
 * yuv2rgb_c_32: planar YUV to packed 32-bit pixels (dst_type uint32_t).
 *
 * Each LOADCHROMA(i) selects the r/g/b tables for chroma sample i; the two
 * PUTRGB calls that follow emit the matching 2x2 block of pixels (two on
 * row dst_1, two on row dst_2). The first part converts a group of 8
 * pixels per row; the part after ENDYUV2RGBLINE converts a trailing group
 * of 4 pixels per row and runs only when (dstW & 4) is set.
 */
YUV2RGBFUNC(yuv2rgb_c_32, uint32_t, 0)
    LOADCHROMA(0);
    PUTRGB(dst_1,py_1,0,0);
    PUTRGB(dst_2,py_2,0,1);
    LOADCHROMA(1);
    PUTRGB(dst_2,py_2,1,1);
    PUTRGB(dst_1,py_1,1,0);
    LOADCHROMA(2);
    PUTRGB(dst_1,py_1,2,0);
    PUTRGB(dst_2,py_2,2,1);
    LOADCHROMA(3);
    PUTRGB(dst_2,py_2,3,1);
    PUTRGB(dst_1,py_1,3,0);
ENDYUV2RGBLINE(8)
    /* trailing 4 pixels per row */
    LOADCHROMA(0);
    PUTRGB(dst_1,py_1,0,0);
    PUTRGB(dst_2,py_2,0,1);
    LOADCHROMA(1);
    PUTRGB(dst_2,py_2,1,1);
    PUTRGB(dst_1,py_1,1,0);
ENDYUV2RGBFUNC()
  139. YUV2RGBFUNC(yuva2rgba_c, uint32_t, 1)
  140. LOADCHROMA(0);
  141. PUTRGBA(dst_1,py_1,pa_1,0,0,24);
  142. PUTRGBA(dst_2,py_2,pa_2,0,1,24);
  143. LOADCHROMA(1);
  144. PUTRGBA(dst_2,py_2,pa_1,1,1,24);
  145. PUTRGBA(dst_1,py_1,pa_2,1,0,24);
  146. LOADCHROMA(2);
  147. PUTRGBA(dst_1,py_1,pa_1,2,0,24);
  148. PUTRGBA(dst_2,py_2,pa_2,2,1,24);
  149. LOADCHROMA(3);
  150. PUTRGBA(dst_2,py_2,pa_1,3,1,24);
  151. PUTRGBA(dst_1,py_1,pa_2,3,0,24);
  152. pa_1 += 8;\
  153. pa_2 += 8;\
  154. ENDYUV2RGBLINE(8)
  155. LOADCHROMA(0);
  156. PUTRGBA(dst_1,py_1,pa_1,0,0,24);
  157. PUTRGBA(dst_2,py_2,pa_2,0,1,24);
  158. LOADCHROMA(1);
  159. PUTRGBA(dst_2,py_2,pa_1,1,1,24);
  160. PUTRGBA(dst_1,py_1,pa_2,1,0,24);
  161. ENDYUV2RGBFUNC()
/*
 * yuva2argb_c: planar YUV with an alpha plane to packed 32-bit pixels, the
 * alpha byte being added unshifted (shift argument 0).
 *
 * One LOADCHROMA per 2x2 pixel block, then one PUTRGBA per row; dst_1 uses
 * py_1/pa_1 and dst_2 uses py_2/pa_2. The alpha pointers advance by 8
 * samples per 8-pixel group. The part after ENDYUV2RGBLINE converts a
 * trailing group of 4 pixels per row when (dstW & 4) is set.
 */
YUV2RGBFUNC(yuva2argb_c, uint32_t, 1)
    LOADCHROMA(0);
    PUTRGBA(dst_1,py_1,pa_1,0,0,0);
    PUTRGBA(dst_2,py_2,pa_2,0,1,0);
    LOADCHROMA(1);
    PUTRGBA(dst_2,py_2,pa_2,1,1,0);
    PUTRGBA(dst_1,py_1,pa_1,1,0,0);
    LOADCHROMA(2);
    PUTRGBA(dst_1,py_1,pa_1,2,0,0);
    PUTRGBA(dst_2,py_2,pa_2,2,1,0);
    LOADCHROMA(3);
    PUTRGBA(dst_2,py_2,pa_2,3,1,0);
    PUTRGBA(dst_1,py_1,pa_1,3,0,0);
    /* the trailing backslashes below merely splice these lines together */
    pa_1 += 8;\
    pa_2 += 8;\
ENDYUV2RGBLINE(8)
    LOADCHROMA(0);
    PUTRGBA(dst_1,py_1,pa_1,0,0,0);
    PUTRGBA(dst_2,py_2,pa_2,0,1,0);
    LOADCHROMA(1);
    PUTRGBA(dst_2,py_2,pa_2,1,1,0);
    PUTRGBA(dst_1,py_1,pa_1,1,0,0);
ENDYUV2RGBFUNC()
/*
 * yuv2rgb_c_24_rgb: planar YUV to packed 24-bit pixels, bytes in R,G,B
 * order (dst_type uint8_t, three bytes per pixel).
 *
 * PUTRGB24 writes two pixels (six bytes) per call, so a group of 8 pixels
 * advances the destination by 24 bytes. The part after ENDYUV2RGBLINE
 * converts a trailing group of 4 pixels per row when (dstW & 4) is set.
 */
YUV2RGBFUNC(yuv2rgb_c_24_rgb, uint8_t, 0)
    LOADCHROMA(0);
    PUTRGB24(dst_1,py_1,0);
    PUTRGB24(dst_2,py_2,0);
    LOADCHROMA(1);
    PUTRGB24(dst_2,py_2,1);
    PUTRGB24(dst_1,py_1,1);
    LOADCHROMA(2);
    PUTRGB24(dst_1,py_1,2);
    PUTRGB24(dst_2,py_2,2);
    LOADCHROMA(3);
    PUTRGB24(dst_2,py_2,3);
    PUTRGB24(dst_1,py_1,3);
ENDYUV2RGBLINE(24)
    LOADCHROMA(0);
    PUTRGB24(dst_1,py_1,0);
    PUTRGB24(dst_2,py_2,0);
    LOADCHROMA(1);
    PUTRGB24(dst_2,py_2,1);
    PUTRGB24(dst_1,py_1,1);
ENDYUV2RGBFUNC()
/*
 * yuv2rgb_c_24_bgr: planar YUV to packed 24-bit pixels, bytes in B,G,R
 * order. Identical to yuv2rgb_c_24_rgb except that PUTBGR24 is used in
 * place of PUTRGB24.
 */
YUV2RGBFUNC(yuv2rgb_c_24_bgr, uint8_t, 0)
    LOADCHROMA(0);
    PUTBGR24(dst_1,py_1,0);
    PUTBGR24(dst_2,py_2,0);
    LOADCHROMA(1);
    PUTBGR24(dst_2,py_2,1);
    PUTBGR24(dst_1,py_1,1);
    LOADCHROMA(2);
    PUTBGR24(dst_1,py_1,2);
    PUTBGR24(dst_2,py_2,2);
    LOADCHROMA(3);
    PUTBGR24(dst_2,py_2,3);
    PUTBGR24(dst_1,py_1,3);
ENDYUV2RGBLINE(24)
    LOADCHROMA(0);
    PUTBGR24(dst_1,py_1,0);
    PUTBGR24(dst_2,py_2,0);
    LOADCHROMA(1);
    PUTBGR24(dst_2,py_2,1);
    PUTBGR24(dst_1,py_1,1);
ENDYUV2RGBFUNC()
/*
 * yuv2rgb_c_16: planar YUV to packed 16-bit pixels (dst_type uint16_t).
 *
 * The 8-pixel group is the same code as in yuv2rgb_c_32, only the types of
 * r, g, b, dst_1 and dst_2 differ. Unlike yuv2rgb_c_32 it is closed with
 * CLOSEYUV2RGBFUNC, so the (dstW & 4) block is empty and a trailing group
 * of 4 pixels is not converted here.
 */
YUV2RGBFUNC(yuv2rgb_c_16, uint16_t, 0)
    LOADCHROMA(0);
    PUTRGB(dst_1,py_1,0,0);
    PUTRGB(dst_2,py_2,0,1);
    LOADCHROMA(1);
    PUTRGB(dst_2,py_2,1,1);
    PUTRGB(dst_1,py_1,1,0);
    LOADCHROMA(2);
    PUTRGB(dst_1,py_1,2,0);
    PUTRGB(dst_2,py_2,2,1);
    LOADCHROMA(3);
    PUTRGB(dst_2,py_2,3,1);
    PUTRGB(dst_1,py_1,3,0);
CLOSEYUV2RGBFUNC(8)
/*
 * yuv2rgb_c_8: planar YUV to one byte per pixel (dst_type uint8_t),
 * without dithering.
 *
 * The 8-pixel group is the same code as in yuv2rgb_c_32, only the types of
 * r, g, b, dst_1 and dst_2 differ. It is closed with CLOSEYUV2RGBFUNC, so
 * a trailing group of 4 pixels (dstW & 4) is not converted here.
 */
YUV2RGBFUNC(yuv2rgb_c_8, uint8_t, 0)
    LOADCHROMA(0);
    PUTRGB(dst_1,py_1,0,0);
    PUTRGB(dst_2,py_2,0,1);
    LOADCHROMA(1);
    PUTRGB(dst_2,py_2,1,1);
    PUTRGB(dst_1,py_1,1,0);
    LOADCHROMA(2);
    PUTRGB(dst_1,py_1,2,0);
    PUTRGB(dst_2,py_2,2,1);
    LOADCHROMA(3);
    PUTRGB(dst_2,py_2,3,1);
    PUTRGB(dst_1,py_1,3,0);
CLOSEYUV2RGBFUNC(8)
/*
 * yuv2rgb_c_8_ordered_dither: planar YUV to one byte per pixel with
 * ordered dithering.
 *
 * d32 and d64 point at row (y & 7) of dither_8x8_32 and dither_8x8_73
 * (note that d64 is taken from the "73" matrix despite its name). The
 * dither value is added to the luma index before the table lookup: red and
 * green use d32, blue uses d64.
 *
 * The last PUTRGB8 argument is the dither column of the first pixel of the
 * pair. For the second row (dst_2) it is offset by 8, which steps past the
 * 8-entry row into the following matrix row, i.e. the row for line y+1.
 * No trailing 4-pixel group is handled (CLOSEYUV2RGBFUNC).
 */
YUV2RGBFUNC(yuv2rgb_c_8_ordered_dither, uint8_t, 0)
    const uint8_t *d32 = dither_8x8_32[y&7];
    const uint8_t *d64 = dither_8x8_73[y&7];
#define PUTRGB8(dst,src,i,o) \
    Y = src[2*i]; \
    dst[2*i] = r[Y+d32[0+o]] + g[Y+d32[0+o]] + b[Y+d64[0+o]]; \
    Y = src[2*i+1]; \
    dst[2*i+1] = r[Y+d32[1+o]] + g[Y+d32[1+o]] + b[Y+d64[1+o]];

    LOADCHROMA(0);
    PUTRGB8(dst_1,py_1,0,0);
    PUTRGB8(dst_2,py_2,0,0+8);
    LOADCHROMA(1);
    PUTRGB8(dst_2,py_2,1,2+8);
    PUTRGB8(dst_1,py_1,1,2);
    LOADCHROMA(2);
    PUTRGB8(dst_1,py_1,2,4);
    PUTRGB8(dst_2,py_2,2,4+8);
    LOADCHROMA(3);
    PUTRGB8(dst_2,py_2,3,6+8);
    PUTRGB8(dst_1,py_1,3,6);
CLOSEYUV2RGBFUNC(8)
/*
 * yuv2rgb_c_4: planar YUV to packed 4-bit pixels, two pixels per byte,
 * without dithering.
 *
 * PUTRGB4 builds one output byte from two pixels: the first pixel of the
 * pair occupies the low bits, the second is shifted left by 4. A group of
 * 8 pixels therefore advances the destination by 4 bytes. No trailing
 * 4-pixel group is handled (CLOSEYUV2RGBFUNC).
 */
YUV2RGBFUNC(yuv2rgb_c_4, uint8_t, 0)
    int acc;
#define PUTRGB4(dst,src,i) \
    Y = src[2*i]; \
    acc = r[Y] + g[Y] + b[Y]; \
    Y = src[2*i+1]; \
    acc |= (r[Y] + g[Y] + b[Y])<<4; \
    dst[i] = acc;

    LOADCHROMA(0);
    PUTRGB4(dst_1,py_1,0);
    PUTRGB4(dst_2,py_2,0);
    LOADCHROMA(1);
    PUTRGB4(dst_2,py_2,1);
    PUTRGB4(dst_1,py_1,1);
    LOADCHROMA(2);
    PUTRGB4(dst_1,py_1,2);
    PUTRGB4(dst_2,py_2,2);
    LOADCHROMA(3);
    PUTRGB4(dst_2,py_2,3);
    PUTRGB4(dst_1,py_1,3);
CLOSEYUV2RGBFUNC(4)
/*
 * yuv2rgb_c_4_ordered_dither: planar YUV to packed 4-bit pixels, two
 * pixels per byte, with ordered dithering.
 *
 * d64 and d128 point at row (y & 7) of dither_8x8_73 and dither_8x8_220.
 * Red and blue lookups are offset by d128, green by d64. As in
 * yuv2rgb_c_4, the first pixel of a pair lands in the low bits and the
 * second is shifted left by 4. The last PUTRGB4D argument is the dither
 * column; "+8" selects the following matrix row for the second line.
 * No trailing 4-pixel group is handled (CLOSEYUV2RGBFUNC).
 */
YUV2RGBFUNC(yuv2rgb_c_4_ordered_dither, uint8_t, 0)
    const uint8_t *d64 = dither_8x8_73[y&7];
    const uint8_t *d128 = dither_8x8_220[y&7];
    int acc;

#define PUTRGB4D(dst,src,i,o) \
    Y = src[2*i]; \
    acc = r[Y+d128[0+o]] + g[Y+d64[0+o]] + b[Y+d128[0+o]]; \
    Y = src[2*i+1]; \
    acc |= (r[Y+d128[1+o]] + g[Y+d64[1+o]] + b[Y+d128[1+o]])<<4; \
    dst[i]= acc;

    LOADCHROMA(0);
    PUTRGB4D(dst_1,py_1,0,0);
    PUTRGB4D(dst_2,py_2,0,0+8);
    LOADCHROMA(1);
    PUTRGB4D(dst_2,py_2,1,2+8);
    PUTRGB4D(dst_1,py_1,1,2);
    LOADCHROMA(2);
    PUTRGB4D(dst_1,py_1,2,4);
    PUTRGB4D(dst_2,py_2,2,4+8);
    LOADCHROMA(3);
    PUTRGB4D(dst_2,py_2,3,6+8);
    PUTRGB4D(dst_1,py_1,3,6);
CLOSEYUV2RGBFUNC(4)
/*
 * yuv2rgb_c_4b: planar YUV to 4-bit colour stored one pixel per byte,
 * without dithering.
 *
 * The 8-pixel group is the same code as in yuv2rgb_c_32, only the types of
 * r, g, b, dst_1 and dst_2 differ. It is closed with CLOSEYUV2RGBFUNC, so
 * a trailing group of 4 pixels (dstW & 4) is not converted here.
 */
YUV2RGBFUNC(yuv2rgb_c_4b, uint8_t, 0)
    LOADCHROMA(0);
    PUTRGB(dst_1,py_1,0,0);
    PUTRGB(dst_2,py_2,0,1);
    LOADCHROMA(1);
    PUTRGB(dst_2,py_2,1,1);
    PUTRGB(dst_1,py_1,1,0);
    LOADCHROMA(2);
    PUTRGB(dst_1,py_1,2,0);
    PUTRGB(dst_2,py_2,2,1);
    LOADCHROMA(3);
    PUTRGB(dst_2,py_2,3,1);
    PUTRGB(dst_1,py_1,3,0);
CLOSEYUV2RGBFUNC(8)
/*
 * yuv2rgb_c_4b_ordered_dither: planar YUV to 4-bit colour stored one pixel
 * per byte, with ordered dithering.
 *
 * Uses the same dither offsets as yuv2rgb_c_4_ordered_dither (d128 for red
 * and blue, d64 for green) but writes each pixel to its own byte instead
 * of packing two per byte. The last PUTRGB4DB argument is the dither
 * column; "+8" selects the following matrix row for the second line.
 * No trailing 4-pixel group is handled (CLOSEYUV2RGBFUNC).
 */
YUV2RGBFUNC(yuv2rgb_c_4b_ordered_dither, uint8_t, 0)
    const uint8_t *d64 = dither_8x8_73[y&7];
    const uint8_t *d128 = dither_8x8_220[y&7];

#define PUTRGB4DB(dst,src,i,o) \
    Y = src[2*i]; \
    dst[2*i] = r[Y+d128[0+o]] + g[Y+d64[0+o]] + b[Y+d128[0+o]]; \
    Y = src[2*i+1]; \
    dst[2*i+1] = r[Y+d128[1+o]] + g[Y+d64[1+o]] + b[Y+d128[1+o]];

    LOADCHROMA(0);
    PUTRGB4DB(dst_1,py_1,0,0);
    PUTRGB4DB(dst_2,py_2,0,0+8);
    LOADCHROMA(1);
    PUTRGB4DB(dst_2,py_2,1,2+8);
    PUTRGB4DB(dst_1,py_1,1,2);
    LOADCHROMA(2);
    PUTRGB4DB(dst_1,py_1,2,4);
    PUTRGB4DB(dst_2,py_2,2,4+8);
    LOADCHROMA(3);
    PUTRGB4DB(dst_2,py_2,3,6+8);
    PUTRGB4DB(dst_1,py_1,3,6);
CLOSEYUV2RGBFUNC(8)
/*
 * yuv2rgb_c_1_ordered_dither: planar YUV to 1 bit per pixel with ordered
 * dithering; chroma is ignored.
 *
 * Only the g table is used, fixed once per group to the entry for
 * U = V = 128 (no LOADCHROMA). PUTRGB1 doubles the accumulator and adds the
 * table entry for the dithered luma, so after eight pixels out_1/out_2 each
 * hold one byte built from eight table values, first pixel in the highest
 * position. One byte per row is stored per 8-pixel group (dst_delta 1).
 * NOTE(review): this assumes the table entries are 0 or 1 -- confirm
 * against the bpp == 1 case of ff_yuv2rgb_c_init_tables().
 * No trailing 4-pixel group is handled (CLOSEYUV2RGBFUNC).
 */
YUV2RGBFUNC(yuv2rgb_c_1_ordered_dither, uint8_t, 0)
        const uint8_t *d128 = dither_8x8_220[y&7];
        char out_1 = 0, out_2 = 0;
        g= c->table_gU[128] + c->table_gV[128];

#define PUTRGB1(out,src,i,o) \
    Y = src[2*i]; \
    out+= out + g[Y+d128[0+o]]; \
    Y = src[2*i+1]; \
    out+= out + g[Y+d128[1+o]];

    PUTRGB1(out_1,py_1,0,0);
    PUTRGB1(out_2,py_2,0,0+8);

    PUTRGB1(out_2,py_2,1,2+8);
    PUTRGB1(out_1,py_1,1,2);

    PUTRGB1(out_1,py_1,2,4);
    PUTRGB1(out_2,py_2,2,4+8);

    PUTRGB1(out_2,py_2,3,6+8);
    PUTRGB1(out_1,py_1,3,6);

    dst_1[0]= out_1;
    dst_2[0]= out_2;
CLOSEYUV2RGBFUNC(1)
  385. SwsFunc ff_yuv2rgb_get_func_ptr(SwsContext *c)
  386. {
  387. SwsFunc t = NULL;
  388. #if (HAVE_MMX2 || HAVE_MMX) && CONFIG_GPL
  389. t = ff_yuv2rgb_init_mmx(c);
  390. #endif
  391. #if HAVE_VIS
  392. t = ff_yuv2rgb_init_vis(c);
  393. #endif
  394. #if CONFIG_MLIB
  395. t = ff_yuv2rgb_init_mlib(c);
  396. #endif
  397. #if HAVE_ALTIVEC && CONFIG_GPL
  398. if (c->flags & SWS_CPU_CAPS_ALTIVEC)
  399. t = ff_yuv2rgb_init_altivec(c);
  400. #endif
  401. #if ARCH_BFIN
  402. if (c->flags & SWS_CPU_CAPS_BFIN)
  403. t = ff_yuv2rgb_get_func_ptr_bfin(c);
  404. #endif
  405. if (t)
  406. return t;
  407. av_log(c, AV_LOG_WARNING, "No accelerated colorspace conversion found.\n");
  408. switch (c->dstFormat) {
  409. case PIX_FMT_ARGB:
  410. case PIX_FMT_ABGR: if (CONFIG_SWSCALE_ALPHA && c->srcFormat == PIX_FMT_YUVA420P) return yuva2argb_c;
  411. case PIX_FMT_RGBA:
  412. case PIX_FMT_BGRA: return (CONFIG_SWSCALE_ALPHA && c->srcFormat == PIX_FMT_YUVA420P) ? yuva2rgba_c : yuv2rgb_c_32;
  413. case PIX_FMT_RGB24: return yuv2rgb_c_24_rgb;
  414. case PIX_FMT_BGR24: return yuv2rgb_c_24_bgr;
  415. case PIX_FMT_RGB565:
  416. case PIX_FMT_BGR565:
  417. case PIX_FMT_RGB555:
  418. case PIX_FMT_BGR555: return yuv2rgb_c_16;
  419. case PIX_FMT_RGB8:
  420. case PIX_FMT_BGR8: return yuv2rgb_c_8_ordered_dither;
  421. case PIX_FMT_RGB4:
  422. case PIX_FMT_BGR4: return yuv2rgb_c_4_ordered_dither;
  423. case PIX_FMT_RGB4_BYTE:
  424. case PIX_FMT_BGR4_BYTE: return yuv2rgb_c_4b_ordered_dither;
  425. case PIX_FMT_MONOBLACK: return yuv2rgb_c_1_ordered_dither;
  426. default:
  427. assert(0);
  428. }
  429. return NULL;
  430. }
  431. static void fill_table(uint8_t* table[256], const int elemsize, const int inc, uint8_t *y_table)
  432. {
  433. int i;
  434. int64_t cb = 0;
  435. y_table -= elemsize * (inc >> 9);
  436. for (i = 0; i < 256; i++) {
  437. table[i] = y_table + elemsize * (cb >> 16);
  438. cb += inc;
  439. }
  440. }
  441. static void fill_gv_table(int table[256], const int elemsize, const int inc)
  442. {
  443. int i;
  444. int64_t cb = 0;
  445. int off = -(inc >> 9);
  446. for (i = 0; i < 256; i++) {
  447. table[i] = elemsize * (off + (cb >> 16));
  448. cb += inc;
  449. }
  450. }
  451. av_cold int ff_yuv2rgb_c_init_tables(SwsContext *c, const int inv_table[4], int fullRange,
  452. int brightness, int contrast, int saturation)
  453. {
  454. const int isRgb = c->dstFormat==PIX_FMT_RGB32
  455. || c->dstFormat==PIX_FMT_RGB32_1
  456. || c->dstFormat==PIX_FMT_BGR24
  457. || c->dstFormat==PIX_FMT_RGB565
  458. || c->dstFormat==PIX_FMT_RGB555
  459. || c->dstFormat==PIX_FMT_RGB8
  460. || c->dstFormat==PIX_FMT_RGB4
  461. || c->dstFormat==PIX_FMT_RGB4_BYTE
  462. || c->dstFormat==PIX_FMT_MONOBLACK;
  463. const int bpp = fmt_depth(c->dstFormat);
  464. uint8_t *y_table;
  465. uint16_t *y_table16;
  466. uint32_t *y_table32;
  467. int i, base, rbase, gbase, bbase, abase, needAlpha;
  468. const int yoffs = fullRange ? 384 : 326;
  469. int64_t crv = inv_table[0];
  470. int64_t cbu = inv_table[1];
  471. int64_t cgu = -inv_table[2];
  472. int64_t cgv = -inv_table[3];
  473. int64_t cy = 1<<16;
  474. int64_t oy = 0;
  475. int64_t yb = 0;
  476. if (!fullRange) {
  477. cy = (cy*255) / 219;
  478. oy = 16<<16;
  479. } else {
  480. crv = (crv*224) / 255;
  481. cbu = (cbu*224) / 255;
  482. cgu = (cgu*224) / 255;
  483. cgv = (cgv*224) / 255;
  484. }
  485. cy = (cy *contrast ) >> 16;
  486. crv = (crv*contrast * saturation) >> 32;
  487. cbu = (cbu*contrast * saturation) >> 32;
  488. cgu = (cgu*contrast * saturation) >> 32;
  489. cgv = (cgv*contrast * saturation) >> 32;
  490. oy -= 256*brightness;
  491. //scale coefficients by cy
  492. crv = ((crv << 16) + 0x8000) / cy;
  493. cbu = ((cbu << 16) + 0x8000) / cy;
  494. cgu = ((cgu << 16) + 0x8000) / cy;
  495. cgv = ((cgv << 16) + 0x8000) / cy;
  496. av_free(c->yuvTable);
  497. switch (bpp) {
  498. case 1:
  499. c->yuvTable = av_malloc(1024);
  500. y_table = c->yuvTable;
  501. yb = -(384<<16) - oy;
  502. for (i = 0; i < 1024-110; i++) {
  503. y_table[i+110] = av_clip_uint8((yb + 0x8000) >> 16) >> 7;
  504. yb += cy;
  505. }
  506. fill_table(c->table_gU, 1, cgu, y_table + yoffs);
  507. fill_gv_table(c->table_gV, 1, cgv);
  508. break;
  509. case 4:
  510. case 4|128:
  511. rbase = isRgb ? 3 : 0;
  512. gbase = 1;
  513. bbase = isRgb ? 0 : 3;
  514. c->yuvTable = av_malloc(1024*3);
  515. y_table = c->yuvTable;
  516. yb = -(384<<16) - oy;
  517. for (i = 0; i < 1024-110; i++) {
  518. int yval = av_clip_uint8((yb + 0x8000) >> 16);
  519. y_table[i+110 ] = (yval >> 7) << rbase;
  520. y_table[i+ 37+1024] = ((yval + 43) / 85) << gbase;
  521. y_table[i+110+2048] = (yval >> 7) << bbase;
  522. yb += cy;
  523. }
  524. fill_table(c->table_rV, 1, crv, y_table + yoffs);
  525. fill_table(c->table_gU, 1, cgu, y_table + yoffs + 1024);
  526. fill_table(c->table_bU, 1, cbu, y_table + yoffs + 2048);
  527. fill_gv_table(c->table_gV, 1, cgv);
  528. break;
  529. case 8:
  530. rbase = isRgb ? 5 : 0;
  531. gbase = isRgb ? 2 : 3;
  532. bbase = isRgb ? 0 : 6;
  533. c->yuvTable = av_malloc(1024*3);
  534. y_table = c->yuvTable;
  535. yb = -(384<<16) - oy;
  536. for (i = 0; i < 1024-38; i++) {
  537. int yval = av_clip_uint8((yb + 0x8000) >> 16);
  538. y_table[i+16 ] = ((yval + 18) / 36) << rbase;
  539. y_table[i+16+1024] = ((yval + 18) / 36) << gbase;
  540. y_table[i+37+2048] = ((yval + 43) / 85) << bbase;
  541. yb += cy;
  542. }
  543. fill_table(c->table_rV, 1, crv, y_table + yoffs);
  544. fill_table(c->table_gU, 1, cgu, y_table + yoffs + 1024);
  545. fill_table(c->table_bU, 1, cbu, y_table + yoffs + 2048);
  546. fill_gv_table(c->table_gV, 1, cgv);
  547. break;
  548. case 15:
  549. case 16:
  550. rbase = isRgb ? bpp - 5 : 0;
  551. gbase = 5;
  552. bbase = isRgb ? 0 : (bpp - 5);
  553. c->yuvTable = av_malloc(1024*3*2);
  554. y_table16 = c->yuvTable;
  555. yb = -(384<<16) - oy;
  556. for (i = 0; i < 1024; i++) {
  557. uint8_t yval = av_clip_uint8((yb + 0x8000) >> 16);
  558. y_table16[i ] = (yval >> 3) << rbase;
  559. y_table16[i+1024] = (yval >> (18 - bpp)) << gbase;
  560. y_table16[i+2048] = (yval >> 3) << bbase;
  561. yb += cy;
  562. }
  563. fill_table(c->table_rV, 2, crv, y_table16 + yoffs);
  564. fill_table(c->table_gU, 2, cgu, y_table16 + yoffs + 1024);
  565. fill_table(c->table_bU, 2, cbu, y_table16 + yoffs + 2048);
  566. fill_gv_table(c->table_gV, 2, cgv);
  567. break;
  568. case 24:
  569. c->yuvTable = av_malloc(1024);
  570. y_table = c->yuvTable;
  571. yb = -(384<<16) - oy;
  572. for (i = 0; i < 1024; i++) {
  573. y_table[i] = av_clip_uint8((yb + 0x8000) >> 16);
  574. yb += cy;
  575. }
  576. fill_table(c->table_rV, 1, crv, y_table + yoffs);
  577. fill_table(c->table_gU, 1, cgu, y_table + yoffs);
  578. fill_table(c->table_bU, 1, cbu, y_table + yoffs);
  579. fill_gv_table(c->table_gV, 1, cgv);
  580. break;
  581. case 32:
  582. base = (c->dstFormat == PIX_FMT_RGB32_1 || c->dstFormat == PIX_FMT_BGR32_1) ? 8 : 0;
  583. rbase = base + (isRgb ? 16 : 0);
  584. gbase = base + 8;
  585. bbase = base + (isRgb ? 0 : 16);
  586. needAlpha = CONFIG_SWSCALE_ALPHA && isALPHA(c->srcFormat);
  587. if (!needAlpha)
  588. abase = (base + 24) & 31;
  589. c->yuvTable = av_malloc(1024*3*4);
  590. y_table32 = c->yuvTable;
  591. yb = -(384<<16) - oy;
  592. for (i = 0; i < 1024; i++) {
  593. uint8_t yval = av_clip_uint8((yb + 0x8000) >> 16);
  594. y_table32[i ] = (yval << rbase) + (needAlpha ? 0 : (255 << abase));
  595. y_table32[i+1024] = yval << gbase;
  596. y_table32[i+2048] = yval << bbase;
  597. yb += cy;
  598. }
  599. fill_table(c->table_rV, 4, crv, y_table32 + yoffs);
  600. fill_table(c->table_gU, 4, cgu, y_table32 + yoffs + 1024);
  601. fill_table(c->table_bU, 4, cbu, y_table32 + yoffs + 2048);
  602. fill_gv_table(c->table_gV, 4, cgv);
  603. break;
  604. default:
  605. c->yuvTable = NULL;
  606. av_log(c, AV_LOG_ERROR, "%ibpp not supported by yuv2rgb\n", bpp);
  607. return -1;
  608. }
  609. return 0;
  610. }