You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

895 lines
30KB

  1. /*
  2. * software YUV to RGB converter
  3. *
  4. * Copyright (C) 2009 Konstantin Shishkov
  5. *
  6. * 1,4,8bpp support and context / deglobalize stuff
  7. * by Michael Niedermayer (michaelni@gmx.at)
  8. *
  9. * This file is part of FFmpeg.
  10. *
  11. * FFmpeg is free software; you can redistribute it and/or
  12. * modify it under the terms of the GNU Lesser General Public
  13. * License as published by the Free Software Foundation; either
  14. * version 2.1 of the License, or (at your option) any later version.
  15. *
  16. * FFmpeg is distributed in the hope that it will be useful,
  17. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  18. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  19. * Lesser General Public License for more details.
  20. *
  21. * You should have received a copy of the GNU Lesser General Public
  22. * License along with FFmpeg; if not, write to the Free Software
  23. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  24. */
  25. #include <stdio.h>
  26. #include <stdlib.h>
  27. #include <inttypes.h>
  28. #include "libavutil/cpu.h"
  29. #include "libavutil/bswap.h"
  30. #include "config.h"
  31. #include "rgb2rgb.h"
  32. #include "swscale.h"
  33. #include "swscale_internal.h"
  34. #include "libavutil/pixdesc.h"
  /*
   * Ordered-dither threshold matrices read by the *_ordered_dither converters
   * in this file. They are only declared here; their contents are defined
   * elsewhere.
   */
  35. extern const uint8_t dither_2x2_4[2][8];
  36. extern const uint8_t dither_2x2_8[2][8];
  37. extern const uint8_t dither_4x4_16[4][8];
  38. extern const uint8_t dither_8x8_32[8][8];
  39. extern const uint8_t dither_8x8_73[8][8];
  40. extern const uint8_t dither_8x8_220[8][8];
  /*
   * YUV -> RGB conversion coefficients, one row of four values per colorspace
   * index (0..7). sws_getCoefficients() hands out pointers to these rows.
   *
   * When a row is passed to ff_yuv2rgb_c_init_tables() as inv_table, the
   * columns are consumed as: [0] V->R, [1] U->B, [2] U->G and [3] V->G
   * (the two green terms are negated there).
   */
  const int32_t ff_yuv2rgb_coeffs[8][4] = {
      [0] = { 117504, 138453, 13954, 34903 }, /* no sequence_display_extension */
      [1] = { 117504, 138453, 13954, 34903 }, /* ITU-R Rec. 709 (1990) */
      [2] = { 104597, 132201, 25675, 53279 }, /* unspecified */
      [3] = { 104597, 132201, 25675, 53279 }, /* reserved */
      [4] = { 104448, 132798, 24759, 53109 }, /* FCC */
      [5] = { 104597, 132201, 25675, 53279 }, /* ITU-R Rec. 624-4 System B, G */
      [6] = { 104597, 132201, 25675, 53279 }, /* SMPTE 170M */
      [7] = { 117579, 136230, 16907, 35559 }, /* SMPTE 240M (1987) */
  };
  51. const int *sws_getCoefficients(int colorspace)
  52. {
  53. if (colorspace > 7 || colorspace < 0)
  54. colorspace = SWS_CS_DEFAULT;
  55. return ff_yuv2rgb_coeffs[colorspace];
  56. }
  /*
   * LOADCHROMA(i): read chroma sample i from pu/pv into U and V and point the
   * caller's r, g and b at the per-chroma lookup tables.
   *
   * r comes from c->table_rV[V], b from c->table_bU[U]; g is the pointer from
   * c->table_gU[U] plus the integer offset stored in c->table_gV[V]. All
   * indices are biased by YUVRGB_TABLE_HEADROOM. The (void *) casts let the
   * results be assigned to whatever dst_type the enclosing function uses.
   *
   * Expands to several statements and relies on the locals U, V, r, g, b, pu,
   * pv and c of the enclosing YUV2RGBFUNC body.
   */
  57. #define LOADCHROMA(i) \
  58. U = pu[i]; \
  59. V = pv[i]; \
  60. r = (void *)c->table_rV[V+YUVRGB_TABLE_HEADROOM]; \
  61. g = (void *)(c->table_gU[U+YUVRGB_TABLE_HEADROOM] + c->table_gV[V+YUVRGB_TABLE_HEADROOM]); \
  62. b = (void *)c->table_bU[U+YUVRGB_TABLE_HEADROOM];
  /*
   * PUTRGB(dst, src, i): write output pixels 2*i and 2*i+1. Each pixel is the
   * sum of the r, g and b table entries selected by the luma sample at the
   * same position in src. Uses the caller's Y, r, g and b.
   */
  63. #define PUTRGB(dst, src, i) \
  64. Y = src[2 * i]; \
  65. dst[2 * i] = r[Y] + g[Y] + b[Y]; \
  66. Y = src[2 * i + 1]; \
  67. dst[2 * i + 1] = r[Y] + g[Y] + b[Y];
  /*
   * PUTRGB24(dst, src, i): write two 3-byte pixels (6 bytes starting at
   * dst[6*i]) in r, g, b byte order, one per luma sample src[2*i] and
   * src[2*i+1]. Uses the caller's Y, r, g and b.
   */
  68. #define PUTRGB24(dst, src, i) \
  69. Y = src[2 * i]; \
  70. dst[6 * i + 0] = r[Y]; \
  71. dst[6 * i + 1] = g[Y]; \
  72. dst[6 * i + 2] = b[Y]; \
  73. Y = src[2 * i + 1]; \
  74. dst[6 * i + 3] = r[Y]; \
  75. dst[6 * i + 4] = g[Y]; \
  76. dst[6 * i + 5] = b[Y];
  /*
   * PUTBGR24(dst, src, i): same as PUTRGB24 but with the bytes of each pixel
   * stored in b, g, r order.
   */
  77. #define PUTBGR24(dst, src, i) \
  78. Y = src[2 * i]; \
  79. dst[6 * i + 0] = b[Y]; \
  80. dst[6 * i + 1] = g[Y]; \
  81. dst[6 * i + 2] = r[Y]; \
  82. Y = src[2 * i + 1]; \
  83. dst[6 * i + 3] = b[Y]; \
  84. dst[6 * i + 4] = g[Y]; \
  85. dst[6 * i + 5] = r[Y];
  /*
   * PUTRGBA(dst, ysrc, asrc, i, s): like PUTRGB, but additionally adds the
   * alpha sample from asrc at the same position, shifted left by s bits, to
   * each of the two output pixels. ysrc and asrc should refer to the same
   * image row as dst.
   */
  86. #define PUTRGBA(dst, ysrc, asrc, i, s) \
  87. Y = ysrc[2 * i]; \
  88. dst[2 * i] = r[Y] + g[Y] + b[Y] + (asrc[2 * i] << s); \
  89. Y = ysrc[2 * i + 1]; \
  90. dst[2 * i + 1] = r[Y] + g[Y] + b[Y] + (asrc[2 * i + 1] << s);
  /*
   * PUTRGB48(dst, src, i): write two 6-byte pixels (12 bytes starting at
   * dst[12*i]) in r, g, b component order. Every component occupies two
   * bytes and both bytes receive the same 8-bit table value.
   */
  91. #define PUTRGB48(dst, src, i) \
  92. Y = src[ 2 * i]; \
  93. dst[12 * i + 0] = dst[12 * i + 1] = r[Y]; \
  94. dst[12 * i + 2] = dst[12 * i + 3] = g[Y]; \
  95. dst[12 * i + 4] = dst[12 * i + 5] = b[Y]; \
  96. Y = src[ 2 * i + 1]; \
  97. dst[12 * i + 6] = dst[12 * i + 7] = r[Y]; \
  98. dst[12 * i + 8] = dst[12 * i + 9] = g[Y]; \
  99. dst[12 * i + 10] = dst[12 * i + 11] = b[Y];
  /*
   * PUTBGR48(dst, src, i): same as PUTRGB48 but with the components of each
   * pixel stored in b, g, r order.
   */
  100. #define PUTBGR48(dst, src, i) \
  101. Y = src[2 * i]; \
  102. dst[12 * i + 0] = dst[12 * i + 1] = b[Y]; \
  103. dst[12 * i + 2] = dst[12 * i + 3] = g[Y]; \
  104. dst[12 * i + 4] = dst[12 * i + 5] = r[Y]; \
  105. Y = src[2 * i + 1]; \
  106. dst[12 * i + 6] = dst[12 * i + 7] = b[Y]; \
  107. dst[12 * i + 8] = dst[12 * i + 9] = g[Y]; \
  108. dst[12 * i + 10] = dst[12 * i + 11] = r[Y];
  /*
   * Function-template macros for the C converters. They must be used
   * together because each one leaves scopes open that another one closes.
   *
   * YUV2RGBFUNC(func_name, dst_type, alpha)
   *   Opens a static function and two nested scopes: a loop over the slice
   *   that handles two rows per iteration (y += 2), and inside it a while
   *   loop that runs c->dstW >> 3 times. The code written after the macro
   *   invocation becomes the body of that while loop. Per iteration the
   *   pointers advance by 8 luma samples per row (py_1/py_2) and 4 chroma
   *   samples (pu/pv), with output going to dst_1/dst_2.
   *   - If alpha is 0 and the source format is PIX_FMT_YUV422P, the chroma
   *     strides are doubled in place in the srcStride array that was passed
   *     in, on every call.
   *   - pa_1/pa_2 are only assigned when alpha is non-zero.
   *
   * ENDYUV2RGBLINE(dst_delta)
   *   Advances pu/pv by 4, py_1/py_2 by 8 and dst_1/dst_2 by dst_delta
   *   elements of dst_type, closes the while loop and opens an
   *   `if (c->dstW & 4)` block; code following it handles a 4-pixel tail.
   *   It does not advance pa_1/pa_2, so alpha converters must do that
   *   themselves before invoking it.
   *
   * ENDYUV2RGBFUNC()
   *   Closes the tail block and the row loop, then returns srcSliceH.
   *
   * CLOSEYUV2RGBFUNC(dst_delta)
   *   ENDYUV2RGBLINE immediately followed by ENDYUV2RGBFUNC, i.e. a function
   *   whose tail block is empty.
   */
  109. #define YUV2RGBFUNC(func_name, dst_type, alpha) \
  110. static int func_name(SwsContext *c, const uint8_t *src[], \
  111. int srcStride[], int srcSliceY, int srcSliceH, \
  112. uint8_t *dst[], int dstStride[]) \
  113. { \
  114. int y; \
  115. \
  116. if (!alpha && c->srcFormat == PIX_FMT_YUV422P) { \
  117. srcStride[1] *= 2; \
  118. srcStride[2] *= 2; \
  119. } \
  120. for (y = 0; y < srcSliceH; y += 2) { \
  121. dst_type *dst_1 = \
  122. (dst_type *)(dst[0] + (y + srcSliceY) * dstStride[0]); \
  123. dst_type *dst_2 = \
  124. (dst_type *)(dst[0] + (y + srcSliceY + 1) * dstStride[0]); \
  125. dst_type av_unused *r, *g, *b; \
  126. const uint8_t *py_1 = src[0] + y * srcStride[0]; \
  127. const uint8_t *py_2 = py_1 + srcStride[0]; \
  128. const uint8_t *pu = src[1] + (y >> 1) * srcStride[1]; \
  129. const uint8_t *pv = src[2] + (y >> 1) * srcStride[2]; \
  130. const uint8_t av_unused *pa_1, *pa_2; \
  131. unsigned int h_size = c->dstW >> 3; \
  132. if (alpha) { \
  133. pa_1 = src[3] + y * srcStride[3]; \
  134. pa_2 = pa_1 + srcStride[3]; \
  135. } \
  136. while (h_size--) { \
  137. int av_unused U, V, Y; \
  138. #define ENDYUV2RGBLINE(dst_delta) \
  139. pu += 4; \
  140. pv += 4; \
  141. py_1 += 8; \
  142. py_2 += 8; \
  143. dst_1 += dst_delta; \
  144. dst_2 += dst_delta; \
  145. } \
  146. if (c->dstW & 4) { \
  147. int av_unused Y, U, V; \
  148. #define ENDYUV2RGBFUNC() \
  149. } \
  150. } \
  151. return srcSliceH; \
  152. }
  153. #define CLOSEYUV2RGBFUNC(dst_delta) \
  154. ENDYUV2RGBLINE(dst_delta) \
  155. ENDYUV2RGBFUNC()
  /*
   * yuv2rgb_c_48: converter to 48 bits per pixel in r, g, b component order
   * (see PUTRGB48). The main loop writes 8 pixels = 48 bytes per row and
   * iteration, hence ENDYUV2RGBLINE(48); the code after it converts the
   * 4-pixel tail that runs when c->dstW & 4 is set.
   */
  156. YUV2RGBFUNC(yuv2rgb_c_48, uint8_t, 0)
  157. LOADCHROMA(0);
  158. PUTRGB48(dst_1, py_1, 0);
  159. PUTRGB48(dst_2, py_2, 0);
  160. LOADCHROMA(1);
  161. PUTRGB48(dst_2, py_2, 1);
  162. PUTRGB48(dst_1, py_1, 1);
  163. LOADCHROMA(2);
  164. PUTRGB48(dst_1, py_1, 2);
  165. PUTRGB48(dst_2, py_2, 2);
  166. LOADCHROMA(3);
  167. PUTRGB48(dst_2, py_2, 3);
  168. PUTRGB48(dst_1, py_1, 3);
  169. ENDYUV2RGBLINE(48)
  170. LOADCHROMA(0);
  171. PUTRGB48(dst_1, py_1, 0);
  172. PUTRGB48(dst_2, py_2, 0);
  173. LOADCHROMA(1);
  174. PUTRGB48(dst_2, py_2, 1);
  175. PUTRGB48(dst_1, py_1, 1);
  176. ENDYUV2RGBFUNC()
  /*
   * yuv2rgb_c_bgr48: same structure as yuv2rgb_c_48, but each pixel is stored
   * in b, g, r component order (see PUTBGR48).
   */
  177. YUV2RGBFUNC(yuv2rgb_c_bgr48, uint8_t, 0)
  178. LOADCHROMA(0);
  179. PUTBGR48(dst_1, py_1, 0);
  180. PUTBGR48(dst_2, py_2, 0);
  181. LOADCHROMA(1);
  182. PUTBGR48(dst_2, py_2, 1);
  183. PUTBGR48(dst_1, py_1, 1);
  184. LOADCHROMA(2);
  185. PUTBGR48(dst_1, py_1, 2);
  186. PUTBGR48(dst_2, py_2, 2);
  187. LOADCHROMA(3);
  188. PUTBGR48(dst_2, py_2, 3);
  189. PUTBGR48(dst_1, py_1, 3);
  190. ENDYUV2RGBLINE(48)
  191. LOADCHROMA(0);
  192. PUTBGR48(dst_1, py_1, 0);
  193. PUTBGR48(dst_2, py_2, 0);
  194. LOADCHROMA(1);
  195. PUTBGR48(dst_2, py_2, 1);
  196. PUTBGR48(dst_1, py_1, 1);
  197. ENDYUV2RGBFUNC()
  /*
   * yuv2rgb_c_32: converter to one uint32_t per pixel without a source alpha
   * plane. Each pixel is the sum of three table entries (see PUTRGB). The
   * main loop writes 8 pixels per row and iteration, hence
   * ENDYUV2RGBLINE(8); the code after it converts the 4-pixel tail.
   */
  198. YUV2RGBFUNC(yuv2rgb_c_32, uint32_t, 0)
  199. LOADCHROMA(0);
  200. PUTRGB(dst_1, py_1, 0);
  201. PUTRGB(dst_2, py_2, 0);
  202. LOADCHROMA(1);
  203. PUTRGB(dst_2, py_2, 1);
  204. PUTRGB(dst_1, py_1, 1);
  205. LOADCHROMA(2);
  206. PUTRGB(dst_1, py_1, 2);
  207. PUTRGB(dst_2, py_2, 2);
  208. LOADCHROMA(3);
  209. PUTRGB(dst_2, py_2, 3);
  210. PUTRGB(dst_1, py_1, 3);
  211. ENDYUV2RGBLINE(8)
  212. LOADCHROMA(0);
  213. PUTRGB(dst_1, py_1, 0);
  214. PUTRGB(dst_2, py_2, 0);
  215. LOADCHROMA(1);
  216. PUTRGB(dst_2, py_2, 1);
  217. PUTRGB(dst_1, py_1, 1);
  218. ENDYUV2RGBFUNC()
  219. YUV2RGBFUNC(yuva2rgba_c, uint32_t, 1)
  220. LOADCHROMA(0);
  221. PUTRGBA(dst_1, py_1, pa_1, 0, 24);
  222. PUTRGBA(dst_2, py_2, pa_2, 0, 24);
  223. LOADCHROMA(1);
  224. PUTRGBA(dst_2, py_2, pa_1, 1, 24);
  225. PUTRGBA(dst_1, py_1, pa_2, 1, 24);
  226. LOADCHROMA(2);
  227. PUTRGBA(dst_1, py_1, pa_1, 2, 24);
  228. PUTRGBA(dst_2, py_2, pa_2, 2, 24);
  229. LOADCHROMA(3);
  230. PUTRGBA(dst_2, py_2, pa_1, 3, 24);
  231. PUTRGBA(dst_1, py_1, pa_2, 3, 24);
  232. pa_1 += 8; \
  233. pa_2 += 8; \
  234. ENDYUV2RGBLINE(8)
  235. LOADCHROMA(0);
  236. PUTRGBA(dst_1, py_1, pa_1, 0, 24);
  237. PUTRGBA(dst_2, py_2, pa_2, 0, 24);
  238. LOADCHROMA(1);
  239. PUTRGBA(dst_2, py_2, pa_1, 1, 24);
  240. PUTRGBA(dst_1, py_1, pa_2, 1, 24);
  241. ENDYUV2RGBFUNC()
  242. YUV2RGBFUNC(yuva2argb_c, uint32_t, 1)
  243. LOADCHROMA(0);
  244. PUTRGBA(dst_1, py_1, pa_1, 0, 0);
  245. PUTRGBA(dst_2, py_2, pa_2, 0, 0);
  246. LOADCHROMA(1);
  247. PUTRGBA(dst_2, py_2, pa_2, 1, 0);
  248. PUTRGBA(dst_1, py_1, pa_1, 1, 0);
  249. LOADCHROMA(2);
  250. PUTRGBA(dst_1, py_1, pa_1, 2, 0);
  251. PUTRGBA(dst_2, py_2, pa_2, 2, 0);
  252. LOADCHROMA(3);
  253. PUTRGBA(dst_2, py_2, pa_2, 3, 0);
  254. PUTRGBA(dst_1, py_1, pa_1, 3, 0);
  255. pa_1 += 8; \
  256. pa_2 += 8; \
  257. ENDYUV2RGBLINE(8)
  258. LOADCHROMA(0);
  259. PUTRGBA(dst_1, py_1, pa_1, 0, 0);
  260. PUTRGBA(dst_2, py_2, pa_2, 0, 0);
  261. LOADCHROMA(1);
  262. PUTRGBA(dst_2, py_2, pa_2, 1, 0);
  263. PUTRGBA(dst_1, py_1, pa_1, 1, 0);
  264. ENDYUV2RGBFUNC()
  /*
   * yuv2rgb_c_24_rgb: converter to 3 bytes per pixel in r, g, b byte order
   * (see PUTRGB24). The main loop writes 8 pixels = 24 bytes per row and
   * iteration, hence ENDYUV2RGBLINE(24); the code after it converts the
   * 4-pixel tail.
   */
  265. YUV2RGBFUNC(yuv2rgb_c_24_rgb, uint8_t, 0)
  266. LOADCHROMA(0);
  267. PUTRGB24(dst_1, py_1, 0);
  268. PUTRGB24(dst_2, py_2, 0);
  269. LOADCHROMA(1);
  270. PUTRGB24(dst_2, py_2, 1);
  271. PUTRGB24(dst_1, py_1, 1);
  272. LOADCHROMA(2);
  273. PUTRGB24(dst_1, py_1, 2);
  274. PUTRGB24(dst_2, py_2, 2);
  275. LOADCHROMA(3);
  276. PUTRGB24(dst_2, py_2, 3);
  277. PUTRGB24(dst_1, py_1, 3);
  278. ENDYUV2RGBLINE(24)
  279. LOADCHROMA(0);
  280. PUTRGB24(dst_1, py_1, 0);
  281. PUTRGB24(dst_2, py_2, 0);
  282. LOADCHROMA(1);
  283. PUTRGB24(dst_2, py_2, 1);
  284. PUTRGB24(dst_1, py_1, 1);
  285. ENDYUV2RGBFUNC()
  /*
   * yuv2rgb_c_24_bgr: converter to 3 bytes per pixel in b, g, r byte order
   * (see PUTBGR24). Identical in structure to yuv2rgb_c_24_rgb; only the
   * store macro differs.
   */
  286. // only trivial mods from yuv2rgb_c_24_rgb
  287. YUV2RGBFUNC(yuv2rgb_c_24_bgr, uint8_t, 0)
  288. LOADCHROMA(0);
  289. PUTBGR24(dst_1, py_1, 0);
  290. PUTBGR24(dst_2, py_2, 0);
  291. LOADCHROMA(1);
  292. PUTBGR24(dst_2, py_2, 1);
  293. PUTBGR24(dst_1, py_1, 1);
  294. LOADCHROMA(2);
  295. PUTBGR24(dst_1, py_1, 2);
  296. PUTBGR24(dst_2, py_2, 2);
  297. LOADCHROMA(3);
  298. PUTBGR24(dst_2, py_2, 3);
  299. PUTBGR24(dst_1, py_1, 3);
  300. ENDYUV2RGBLINE(24)
  301. LOADCHROMA(0);
  302. PUTBGR24(dst_1, py_1, 0);
  303. PUTBGR24(dst_2, py_2, 0);
  304. LOADCHROMA(1);
  305. PUTBGR24(dst_2, py_2, 1);
  306. PUTBGR24(dst_1, py_1, 1);
  307. ENDYUV2RGBFUNC()
  /*
   * yuv2rgb_c_16_ordered_dither: converter to one uint16_t per pixel with
   * ordered dithering; selected for PIX_FMT_RGB565/BGR565.
   *
   * PUTRGB16 adds a dither value to the luma sample before each table
   * lookup: d16 (dither_2x2_8, row y & 1) for r, e16 (dither_2x2_4, row
   * y & 1) for g and f16 (dither_2x2_8, the other row) for b.
   *
   * The calls for the second image row pass offsets of 8 and above, which
   * index past the 8 entries of the selected matrix row and into whatever
   * follows it. NOTE(review): presumably the matrices are defined with a
   * spare row for this purpose -- confirm against their definition.
   *
   * CLOSEYUV2RGBFUNC leaves the `c->dstW & 4` tail block empty, so a trailing
   * group of 4 pixels is not converted by this function.
   */
  308. YUV2RGBFUNC(yuv2rgb_c_16_ordered_dither, uint16_t, 0)
  309. const uint8_t *d16 = dither_2x2_8[y & 1];
  310. const uint8_t *e16 = dither_2x2_4[y & 1];
  311. const uint8_t *f16 = dither_2x2_8[(y & 1)^1];
  312. #define PUTRGB16(dst, src, i, o) \
  313. Y = src[2 * i]; \
  314. dst[2 * i] = r[Y + d16[0 + o]] + \
  315. g[Y + e16[0 + o]] + \
  316. b[Y + f16[0 + o]]; \
  317. Y = src[2 * i + 1]; \
  318. dst[2 * i + 1] = r[Y + d16[1 + o]] + \
  319. g[Y + e16[1 + o]] + \
  320. b[Y + f16[1 + o]];
  321. LOADCHROMA(0);
  322. PUTRGB16(dst_1, py_1, 0, 0);
  323. PUTRGB16(dst_2, py_2, 0, 0 + 8);
  324. LOADCHROMA(1);
  325. PUTRGB16(dst_2, py_2, 1, 2 + 8);
  326. PUTRGB16(dst_1, py_1, 1, 2);
  327. LOADCHROMA(2);
  328. PUTRGB16(dst_1, py_1, 2, 4);
  329. PUTRGB16(dst_2, py_2, 2, 4 + 8);
  330. LOADCHROMA(3);
  331. PUTRGB16(dst_2, py_2, 3, 6 + 8);
  332. PUTRGB16(dst_1, py_1, 3, 6);
  333. CLOSEYUV2RGBFUNC(8)
  /*
   * yuv2rgb_c_15_ordered_dither: converter to one uint16_t per pixel with
   * ordered dithering; selected for PIX_FMT_RGB555/BGR555.
   *
   * PUTRGB15 takes the r and g dither values from d16 (dither_2x2_8, row
   * y & 1), using swapped neighbouring entries for g, and the b dither value
   * from e16 (the other row of dither_2x2_8).
   *
   * As in the 16-bit variant, second-row calls pass offsets of 8 and above,
   * which index past the selected 8-entry matrix row. NOTE(review): confirm
   * that the matrix definition provides the extra entries.
   *
   * CLOSEYUV2RGBFUNC leaves the `c->dstW & 4` tail block empty.
   */
  334. YUV2RGBFUNC(yuv2rgb_c_15_ordered_dither, uint16_t, 0)
  335. const uint8_t *d16 = dither_2x2_8[y & 1];
  336. const uint8_t *e16 = dither_2x2_8[(y & 1)^1];
  337. #define PUTRGB15(dst, src, i, o) \
  338. Y = src[2 * i]; \
  339. dst[2 * i] = r[Y + d16[0 + o]] + \
  340. g[Y + d16[1 + o]] + \
  341. b[Y + e16[0 + o]]; \
  342. Y = src[2 * i + 1]; \
  343. dst[2 * i + 1] = r[Y + d16[1 + o]] + \
  344. g[Y + d16[0 + o]] + \
  345. b[Y + e16[1 + o]];
  346. LOADCHROMA(0);
  347. PUTRGB15(dst_1, py_1, 0, 0);
  348. PUTRGB15(dst_2, py_2, 0, 0 + 8);
  349. LOADCHROMA(1);
  350. PUTRGB15(dst_2, py_2, 1, 2 + 8);
  351. PUTRGB15(dst_1, py_1, 1, 2);
  352. LOADCHROMA(2);
  353. PUTRGB15(dst_1, py_1, 2, 4);
  354. PUTRGB15(dst_2, py_2, 2, 4 + 8);
  355. LOADCHROMA(3);
  356. PUTRGB15(dst_2, py_2, 3, 6 + 8);
  357. PUTRGB15(dst_1, py_1, 3, 6);
  358. CLOSEYUV2RGBFUNC(8)
  /*
   * yuv2rgb_c_12_ordered_dither: converter to one uint16_t per pixel with
   * ordered dithering; selected for PIX_FMT_RGB444/BGR444.
   *
   * PUTRGB12 adds the same dither value, taken from d16 (dither_4x4_16, row
   * y & 3), to the luma sample for all three component lookups. Second-row
   * calls pass offsets of 8 and above, which index past the selected
   * 8-entry row into the rows that follow it.
   *
   * CLOSEYUV2RGBFUNC leaves the `c->dstW & 4` tail block empty.
   */
  359. // r, g, b, dst_1, dst_2
  360. YUV2RGBFUNC(yuv2rgb_c_12_ordered_dither, uint16_t, 0)
  361. const uint8_t *d16 = dither_4x4_16[y & 3];
  362. #define PUTRGB12(dst, src, i, o) \
  363. Y = src[2 * i]; \
  364. dst[2 * i] = r[Y + d16[0 + o]] + \
  365. g[Y + d16[0 + o]] + \
  366. b[Y + d16[0 + o]]; \
  367. Y = src[2 * i + 1]; \
  368. dst[2 * i + 1] = r[Y + d16[1 + o]] + \
  369. g[Y + d16[1 + o]] + \
  370. b[Y + d16[1 + o]];
  371. LOADCHROMA(0);
  372. PUTRGB12(dst_1, py_1, 0, 0);
  373. PUTRGB12(dst_2, py_2, 0, 0 + 8);
  374. LOADCHROMA(1);
  375. PUTRGB12(dst_2, py_2, 1, 2 + 8);
  376. PUTRGB12(dst_1, py_1, 1, 2);
  377. LOADCHROMA(2);
  378. PUTRGB12(dst_1, py_1, 2, 4);
  379. PUTRGB12(dst_2, py_2, 2, 4 + 8);
  380. LOADCHROMA(3);
  381. PUTRGB12(dst_2, py_2, 3, 6 + 8);
  382. PUTRGB12(dst_1, py_1, 3, 6);
  383. CLOSEYUV2RGBFUNC(8)
  /*
   * yuv2rgb_c_8_ordered_dither: converter to one byte per pixel with ordered
   * dithering; selected for PIX_FMT_RGB8/BGR8.
   *
   * PUTRGB8 dithers the r and g lookups with d32 (dither_8x8_32, row y & 7)
   * and the b lookup with d64 (dither_8x8_73, row y & 7). Second-row calls
   * pass offsets of 8 and above, which index into the matrix row that
   * follows the selected one.
   *
   * CLOSEYUV2RGBFUNC leaves the `c->dstW & 4` tail block empty.
   */
  384. // r, g, b, dst_1, dst_2
  385. YUV2RGBFUNC(yuv2rgb_c_8_ordered_dither, uint8_t, 0)
  386. const uint8_t *d32 = dither_8x8_32[y & 7];
  387. const uint8_t *d64 = dither_8x8_73[y & 7];
  388. #define PUTRGB8(dst, src, i, o) \
  389. Y = src[2 * i]; \
  390. dst[2 * i] = r[Y + d32[0 + o]] + \
  391. g[Y + d32[0 + o]] + \
  392. b[Y + d64[0 + o]]; \
  393. Y = src[2 * i + 1]; \
  394. dst[2 * i + 1] = r[Y + d32[1 + o]] + \
  395. g[Y + d32[1 + o]] + \
  396. b[Y + d64[1 + o]];
  397. LOADCHROMA(0);
  398. PUTRGB8(dst_1, py_1, 0, 0);
  399. PUTRGB8(dst_2, py_2, 0, 0 + 8);
  400. LOADCHROMA(1);
  401. PUTRGB8(dst_2, py_2, 1, 2 + 8);
  402. PUTRGB8(dst_1, py_1, 1, 2);
  403. LOADCHROMA(2);
  404. PUTRGB8(dst_1, py_1, 2, 4);
  405. PUTRGB8(dst_2, py_2, 2, 4 + 8);
  406. LOADCHROMA(3);
  407. PUTRGB8(dst_2, py_2, 3, 6 + 8);
  408. PUTRGB8(dst_1, py_1, 3, 6);
  409. CLOSEYUV2RGBFUNC(8)
  /*
   * yuv2rgb_c_4_ordered_dither: converter to packed 4-bit pixels with ordered
   * dithering; selected for PIX_FMT_RGB4/BGR4.
   *
   * PUTRGB4D builds one output byte from two pixels: the first pixel goes
   * into the low nibble and the second is shifted left by 4 into the high
   * nibble. r and b lookups are dithered with d128 (dither_8x8_220), g with
   * d64 (dither_8x8_73), both from row y & 7. Eight pixels therefore occupy
   * 4 bytes, hence CLOSEYUV2RGBFUNC(4).
   *
   * Second-row calls pass offsets of 8 and above, which index into the
   * matrix row that follows the selected one. The `c->dstW & 4` tail block
   * is empty.
   */
  410. YUV2RGBFUNC(yuv2rgb_c_4_ordered_dither, uint8_t, 0)
  411. const uint8_t * d64 = dither_8x8_73[y & 7];
  412. const uint8_t *d128 = dither_8x8_220[y & 7];
  413. int acc;
  414. #define PUTRGB4D(dst, src, i, o) \
  415. Y = src[2 * i]; \
  416. acc = r[Y + d128[0 + o]] + \
  417. g[Y + d64[0 + o]] + \
  418. b[Y + d128[0 + o]]; \
  419. Y = src[2 * i + 1]; \
  420. acc |= (r[Y + d128[1 + o]] + \
  421. g[Y + d64[1 + o]] + \
  422. b[Y + d128[1 + o]]) << 4; \
  423. dst[i] = acc;
  424. LOADCHROMA(0);
  425. PUTRGB4D(dst_1, py_1, 0, 0);
  426. PUTRGB4D(dst_2, py_2, 0, 0 + 8);
  427. LOADCHROMA(1);
  428. PUTRGB4D(dst_2, py_2, 1, 2 + 8);
  429. PUTRGB4D(dst_1, py_1, 1, 2);
  430. LOADCHROMA(2);
  431. PUTRGB4D(dst_1, py_1, 2, 4);
  432. PUTRGB4D(dst_2, py_2, 2, 4 + 8);
  433. LOADCHROMA(3);
  434. PUTRGB4D(dst_2, py_2, 3, 6 + 8);
  435. PUTRGB4D(dst_1, py_1, 3, 6);
  436. CLOSEYUV2RGBFUNC(4)
  /*
   * yuv2rgb_c_4b_ordered_dither: converter with the same dithering as
   * yuv2rgb_c_4_ordered_dither, but every pixel is stored in its own byte
   * instead of two pixels sharing one; selected for
   * PIX_FMT_RGB4_BYTE/BGR4_BYTE. Eight pixels occupy 8 bytes, hence
   * CLOSEYUV2RGBFUNC(8).
   *
   * Second-row calls pass offsets of 8 and above, which index into the
   * matrix row that follows the selected one. The `c->dstW & 4` tail block
   * is empty.
   */
  437. YUV2RGBFUNC(yuv2rgb_c_4b_ordered_dither, uint8_t, 0)
  438. const uint8_t *d64 = dither_8x8_73[y & 7];
  439. const uint8_t *d128 = dither_8x8_220[y & 7];
  440. #define PUTRGB4DB(dst, src, i, o) \
  441. Y = src[2 * i]; \
  442. dst[2 * i] = r[Y + d128[0 + o]] + \
  443. g[Y + d64[0 + o]] + \
  444. b[Y + d128[0 + o]]; \
  445. Y = src[2 * i + 1]; \
  446. dst[2 * i + 1] = r[Y + d128[1 + o]] + \
  447. g[Y + d64[1 + o]] + \
  448. b[Y + d128[1 + o]];
  449. LOADCHROMA(0);
  450. PUTRGB4DB(dst_1, py_1, 0, 0);
  451. PUTRGB4DB(dst_2, py_2, 0, 0 + 8);
  452. LOADCHROMA(1);
  453. PUTRGB4DB(dst_2, py_2, 1, 2 + 8);
  454. PUTRGB4DB(dst_1, py_1, 1, 2);
  455. LOADCHROMA(2);
  456. PUTRGB4DB(dst_1, py_1, 2, 4);
  457. PUTRGB4DB(dst_2, py_2, 2, 4 + 8);
  458. LOADCHROMA(3);
  459. PUTRGB4DB(dst_2, py_2, 3, 6 + 8);
  460. PUTRGB4DB(dst_1, py_1, 3, 6);
  461. CLOSEYUV2RGBFUNC(8)
  /*
   * yuv2rgb_c_1_ordered_dither: converter to 1 bit per pixel with ordered
   * dithering; selected for PIX_FMT_MONOBLACK.
   *
   * Chroma is ignored: g is fixed to the table entry for U = V = 128, so
   * only luma plus the d128 dither value (dither_8x8_220, row y & 7)
   * selects the output bit. PUTRGB1 shifts the accumulator left by one
   * (out += out) and adds the looked-up value, twice per call; four calls
   * per row collect 8 pixels into out_1/out_2, which are then stored as one
   * byte per row (hence CLOSEYUV2RGBFUNC(1)).
   *
   * Second-row calls pass offsets of 8 and above, which index into the
   * matrix row that follows the selected one. The `c->dstW & 4` tail block
   * is empty.
   */
  462. YUV2RGBFUNC(yuv2rgb_c_1_ordered_dither, uint8_t, 0)
  463. const uint8_t *d128 = dither_8x8_220[y & 7];
  464. char out_1 = 0, out_2 = 0;
  465. g = c->table_gU[128 + YUVRGB_TABLE_HEADROOM] + c->table_gV[128 + YUVRGB_TABLE_HEADROOM];
  466. #define PUTRGB1(out, src, i, o) \
  467. Y = src[2 * i]; \
  468. out += out + g[Y + d128[0 + o]]; \
  469. Y = src[2 * i + 1]; \
  470. out += out + g[Y + d128[1 + o]];
  471. PUTRGB1(out_1, py_1, 0, 0);
  472. PUTRGB1(out_2, py_2, 0, 0 + 8);
  473. PUTRGB1(out_2, py_2, 1, 2 + 8);
  474. PUTRGB1(out_1, py_1, 1, 2);
  475. PUTRGB1(out_1, py_1, 2, 4);
  476. PUTRGB1(out_2, py_2, 2, 4 + 8);
  477. PUTRGB1(out_2, py_2, 3, 6 + 8);
  478. PUTRGB1(out_1, py_1, 3, 6);
  479. dst_1[0] = out_1;
  480. dst_2[0] = out_2;
  481. CLOSEYUV2RGBFUNC(1)
  482. SwsFunc ff_yuv2rgb_get_func_ptr(SwsContext *c)
  483. {
  484. SwsFunc t = NULL;
  485. if (HAVE_MMX)
  486. t = ff_yuv2rgb_init_mmx(c);
  487. else if (HAVE_VIS)
  488. t = ff_yuv2rgb_init_vis(c);
  489. else if (HAVE_ALTIVEC)
  490. t = ff_yuv2rgb_init_altivec(c);
  491. else if (ARCH_BFIN)
  492. t = ff_yuv2rgb_get_func_ptr_bfin(c);
  493. if (t)
  494. return t;
  495. av_log(c, AV_LOG_WARNING,
  496. "No accelerated colorspace conversion found from %s to %s.\n",
  497. av_get_pix_fmt_name(c->srcFormat), av_get_pix_fmt_name(c->dstFormat));
  498. switch (c->dstFormat) {
  499. case PIX_FMT_BGR48BE:
  500. case PIX_FMT_BGR48LE:
  501. return yuv2rgb_c_bgr48;
  502. case PIX_FMT_RGB48BE:
  503. case PIX_FMT_RGB48LE:
  504. return yuv2rgb_c_48;
  505. case PIX_FMT_ARGB:
  506. case PIX_FMT_ABGR:
  507. if (CONFIG_SWSCALE_ALPHA && isALPHA(c->srcFormat))
  508. return yuva2argb_c;
  509. case PIX_FMT_RGBA:
  510. case PIX_FMT_BGRA:
  511. return (CONFIG_SWSCALE_ALPHA && isALPHA(c->srcFormat)) ? yuva2rgba_c : yuv2rgb_c_32;
  512. case PIX_FMT_RGB24:
  513. return yuv2rgb_c_24_rgb;
  514. case PIX_FMT_BGR24:
  515. return yuv2rgb_c_24_bgr;
  516. case PIX_FMT_RGB565:
  517. case PIX_FMT_BGR565:
  518. return yuv2rgb_c_16_ordered_dither;
  519. case PIX_FMT_RGB555:
  520. case PIX_FMT_BGR555:
  521. return yuv2rgb_c_15_ordered_dither;
  522. case PIX_FMT_RGB444:
  523. case PIX_FMT_BGR444:
  524. return yuv2rgb_c_12_ordered_dither;
  525. case PIX_FMT_RGB8:
  526. case PIX_FMT_BGR8:
  527. return yuv2rgb_c_8_ordered_dither;
  528. case PIX_FMT_RGB4:
  529. case PIX_FMT_BGR4:
  530. return yuv2rgb_c_4_ordered_dither;
  531. case PIX_FMT_RGB4_BYTE:
  532. case PIX_FMT_BGR4_BYTE:
  533. return yuv2rgb_c_4b_ordered_dither;
  534. case PIX_FMT_MONOBLACK:
  535. return yuv2rgb_c_1_ordered_dither;
  536. }
  537. return NULL;
  538. }
  539. static void fill_table(uint8_t* table[256 + 2*YUVRGB_TABLE_HEADROOM], const int elemsize,
  540. const int inc, void *y_tab)
  541. {
  542. int i;
  543. uint8_t *y_table = y_tab;
  544. y_table -= elemsize * (inc >> 9);
  545. for (i = 0; i < 256 + 2*YUVRGB_TABLE_HEADROOM; i++) {
  546. int64_t cb = av_clip(i-YUVRGB_TABLE_HEADROOM, 0, 255)*inc;
  547. table[i] = y_table + elemsize * (cb >> 16);
  548. }
  549. }
  550. static void fill_gv_table(int table[256 + 2*YUVRGB_TABLE_HEADROOM], const int elemsize, const int inc)
  551. {
  552. int i;
  553. int off = -(inc >> 9);
  554. for (i = 0; i < 256 + 2*YUVRGB_TABLE_HEADROOM; i++) {
  555. int64_t cb = av_clip(i-YUVRGB_TABLE_HEADROOM, 0, 255)*inc;
  556. table[i] = elemsize * (off + (cb >> 16));
  557. }
  558. }
  /*
   * Round a 16.16 fixed-point value to the nearest integer and saturate the
   * result to the signed 16-bit range.
   *
   * @param f value scaled by 1 << 16
   * @return the rounded value as a 16-bit two's-complement bit pattern:
   *         0x7FFF for results above 0x7FFF, 0x8000 for results below
   *         -0x7FFF, otherwise the low 16 bits of the rounded value
   */
  static uint16_t roundToInt16(int64_t f)
  {
      /* Keep the rounded value in 64 bits so the range checks see its true
       * magnitude; narrowing to int first would let huge inputs wrap back
       * into range (or flip sign) and skip the saturation. */
      const int64_t r = (f + (1 << 15)) >> 16;

      if (r < -0x7FFF)
          return 0x8000;
      if (r > 0x7FFF)
          return 0x7FFF;
      return (uint16_t)r;
  }
  569. av_cold int ff_yuv2rgb_c_init_tables(SwsContext *c, const int inv_table[4],
  570. int fullRange, int brightness,
  571. int contrast, int saturation)
  572. {
  573. const int isRgb = c->dstFormat == PIX_FMT_RGB32 ||
  574. c->dstFormat == PIX_FMT_RGB32_1 ||
  575. c->dstFormat == PIX_FMT_BGR24 ||
  576. c->dstFormat == PIX_FMT_RGB565BE ||
  577. c->dstFormat == PIX_FMT_RGB565LE ||
  578. c->dstFormat == PIX_FMT_RGB555BE ||
  579. c->dstFormat == PIX_FMT_RGB555LE ||
  580. c->dstFormat == PIX_FMT_RGB444BE ||
  581. c->dstFormat == PIX_FMT_RGB444LE ||
  582. c->dstFormat == PIX_FMT_RGB8 ||
  583. c->dstFormat == PIX_FMT_RGB4 ||
  584. c->dstFormat == PIX_FMT_RGB4_BYTE ||
  585. c->dstFormat == PIX_FMT_MONOBLACK;
  586. const int isNotNe = c->dstFormat == PIX_FMT_NE(RGB565LE, RGB565BE) ||
  587. c->dstFormat == PIX_FMT_NE(RGB555LE, RGB555BE) ||
  588. c->dstFormat == PIX_FMT_NE(RGB444LE, RGB444BE) ||
  589. c->dstFormat == PIX_FMT_NE(BGR565LE, BGR565BE) ||
  590. c->dstFormat == PIX_FMT_NE(BGR555LE, BGR555BE) ||
  591. c->dstFormat == PIX_FMT_NE(BGR444LE, BGR444BE);
  592. const int bpp = c->dstFormatBpp;
  593. uint8_t *y_table;
  594. uint16_t *y_table16;
  595. uint32_t *y_table32;
  596. int i, base, rbase, gbase, bbase, av_uninit(abase), needAlpha;
  597. const int yoffs = fullRange ? 384 : 326;
  598. int64_t crv = inv_table[0];
  599. int64_t cbu = inv_table[1];
  600. int64_t cgu = -inv_table[2];
  601. int64_t cgv = -inv_table[3];
  602. int64_t cy = 1 << 16;
  603. int64_t oy = 0;
  604. int64_t yb = 0;
  605. if (!fullRange) {
  606. cy = (cy * 255) / 219;
  607. oy = 16 << 16;
  608. } else {
  609. crv = (crv * 224) / 255;
  610. cbu = (cbu * 224) / 255;
  611. cgu = (cgu * 224) / 255;
  612. cgv = (cgv * 224) / 255;
  613. }
  614. cy = (cy * contrast) >> 16;
  615. crv = (crv * contrast * saturation) >> 32;
  616. cbu = (cbu * contrast * saturation) >> 32;
  617. cgu = (cgu * contrast * saturation) >> 32;
  618. cgv = (cgv * contrast * saturation) >> 32;
  619. oy -= 256 * brightness;
  620. c->uOffset = 0x0400040004000400LL;
  621. c->vOffset = 0x0400040004000400LL;
  622. c->yCoeff = roundToInt16(cy * 8192) * 0x0001000100010001ULL;
  623. c->vrCoeff = roundToInt16(crv * 8192) * 0x0001000100010001ULL;
  624. c->ubCoeff = roundToInt16(cbu * 8192) * 0x0001000100010001ULL;
  625. c->vgCoeff = roundToInt16(cgv * 8192) * 0x0001000100010001ULL;
  626. c->ugCoeff = roundToInt16(cgu * 8192) * 0x0001000100010001ULL;
  627. c->yOffset = roundToInt16(oy * 8) * 0x0001000100010001ULL;
  628. c->yuv2rgb_y_coeff = (int16_t)roundToInt16(cy << 13);
  629. c->yuv2rgb_y_offset = (int16_t)roundToInt16(oy << 9);
  630. c->yuv2rgb_v2r_coeff = (int16_t)roundToInt16(crv << 13);
  631. c->yuv2rgb_v2g_coeff = (int16_t)roundToInt16(cgv << 13);
  632. c->yuv2rgb_u2g_coeff = (int16_t)roundToInt16(cgu << 13);
  633. c->yuv2rgb_u2b_coeff = (int16_t)roundToInt16(cbu << 13);
  634. //scale coefficients by cy
  635. crv = ((crv << 16) + 0x8000) / cy;
  636. cbu = ((cbu << 16) + 0x8000) / cy;
  637. cgu = ((cgu << 16) + 0x8000) / cy;
  638. cgv = ((cgv << 16) + 0x8000) / cy;
  639. av_free(c->yuvTable);
  640. switch (bpp) {
  641. case 1:
  642. c->yuvTable = av_malloc(1024);
  643. y_table = c->yuvTable;
  644. yb = -(384 << 16) - oy;
  645. for (i = 0; i < 1024 - 110; i++) {
  646. y_table[i + 110] = av_clip_uint8((yb + 0x8000) >> 16) >> 7;
  647. yb += cy;
  648. }
  649. fill_table(c->table_gU, 1, cgu, y_table + yoffs);
  650. fill_gv_table(c->table_gV, 1, cgv);
  651. break;
  652. case 4:
  653. case 4 | 128:
  654. rbase = isRgb ? 3 : 0;
  655. gbase = 1;
  656. bbase = isRgb ? 0 : 3;
  657. c->yuvTable = av_malloc(1024 * 3);
  658. y_table = c->yuvTable;
  659. yb = -(384 << 16) - oy;
  660. for (i = 0; i < 1024 - 110; i++) {
  661. int yval = av_clip_uint8((yb + 0x8000) >> 16);
  662. y_table[i + 110] = (yval >> 7) << rbase;
  663. y_table[i + 37 + 1024] = ((yval + 43) / 85) << gbase;
  664. y_table[i + 110 + 2048] = (yval >> 7) << bbase;
  665. yb += cy;
  666. }
  667. fill_table(c->table_rV, 1, crv, y_table + yoffs);
  668. fill_table(c->table_gU, 1, cgu, y_table + yoffs + 1024);
  669. fill_table(c->table_bU, 1, cbu, y_table + yoffs + 2048);
  670. fill_gv_table(c->table_gV, 1, cgv);
  671. break;
  672. case 8:
  673. rbase = isRgb ? 5 : 0;
  674. gbase = isRgb ? 2 : 3;
  675. bbase = isRgb ? 0 : 6;
  676. c->yuvTable = av_malloc(1024 * 3);
  677. y_table = c->yuvTable;
  678. yb = -(384 << 16) - oy;
  679. for (i = 0; i < 1024 - 38; i++) {
  680. int yval = av_clip_uint8((yb + 0x8000) >> 16);
  681. y_table[i + 16] = ((yval + 18) / 36) << rbase;
  682. y_table[i + 16 + 1024] = ((yval + 18) / 36) << gbase;
  683. y_table[i + 37 + 2048] = ((yval + 43) / 85) << bbase;
  684. yb += cy;
  685. }
  686. fill_table(c->table_rV, 1, crv, y_table + yoffs);
  687. fill_table(c->table_gU, 1, cgu, y_table + yoffs + 1024);
  688. fill_table(c->table_bU, 1, cbu, y_table + yoffs + 2048);
  689. fill_gv_table(c->table_gV, 1, cgv);
  690. break;
  691. case 12:
  692. rbase = isRgb ? 8 : 0;
  693. gbase = 4;
  694. bbase = isRgb ? 0 : 8;
  695. c->yuvTable = av_malloc(1024 * 3 * 2);
  696. y_table16 = c->yuvTable;
  697. yb = -(384 << 16) - oy;
  698. for (i = 0; i < 1024; i++) {
  699. uint8_t yval = av_clip_uint8((yb + 0x8000) >> 16);
  700. y_table16[i] = (yval >> 4) << rbase;
  701. y_table16[i + 1024] = (yval >> 4) << gbase;
  702. y_table16[i + 2048] = (yval >> 4) << bbase;
  703. yb += cy;
  704. }
  705. if (isNotNe)
  706. for (i = 0; i < 1024 * 3; i++)
  707. y_table16[i] = av_bswap16(y_table16[i]);
  708. fill_table(c->table_rV, 2, crv, y_table16 + yoffs);
  709. fill_table(c->table_gU, 2, cgu, y_table16 + yoffs + 1024);
  710. fill_table(c->table_bU, 2, cbu, y_table16 + yoffs + 2048);
  711. fill_gv_table(c->table_gV, 2, cgv);
  712. break;
  713. case 15:
  714. case 16:
  715. rbase = isRgb ? bpp - 5 : 0;
  716. gbase = 5;
  717. bbase = isRgb ? 0 : (bpp - 5);
  718. c->yuvTable = av_malloc(1024 * 3 * 2);
  719. y_table16 = c->yuvTable;
  720. yb = -(384 << 16) - oy;
  721. for (i = 0; i < 1024; i++) {
  722. uint8_t yval = av_clip_uint8((yb + 0x8000) >> 16);
  723. y_table16[i] = (yval >> 3) << rbase;
  724. y_table16[i + 1024] = (yval >> (18 - bpp)) << gbase;
  725. y_table16[i + 2048] = (yval >> 3) << bbase;
  726. yb += cy;
  727. }
  728. if (isNotNe)
  729. for (i = 0; i < 1024 * 3; i++)
  730. y_table16[i] = av_bswap16(y_table16[i]);
  731. fill_table(c->table_rV, 2, crv, y_table16 + yoffs);
  732. fill_table(c->table_gU, 2, cgu, y_table16 + yoffs + 1024);
  733. fill_table(c->table_bU, 2, cbu, y_table16 + yoffs + 2048);
  734. fill_gv_table(c->table_gV, 2, cgv);
  735. break;
  736. case 24:
  737. case 48:
  738. c->yuvTable = av_malloc(1024);
  739. y_table = c->yuvTable;
  740. yb = -(384 << 16) - oy;
  741. for (i = 0; i < 1024; i++) {
  742. y_table[i] = av_clip_uint8((yb + 0x8000) >> 16);
  743. yb += cy;
  744. }
  745. fill_table(c->table_rV, 1, crv, y_table + yoffs);
  746. fill_table(c->table_gU, 1, cgu, y_table + yoffs);
  747. fill_table(c->table_bU, 1, cbu, y_table + yoffs);
  748. fill_gv_table(c->table_gV, 1, cgv);
  749. break;
  750. case 32:
  751. base = (c->dstFormat == PIX_FMT_RGB32_1 ||
  752. c->dstFormat == PIX_FMT_BGR32_1) ? 8 : 0;
  753. rbase = base + (isRgb ? 16 : 0);
  754. gbase = base + 8;
  755. bbase = base + (isRgb ? 0 : 16);
  756. needAlpha = CONFIG_SWSCALE_ALPHA && isALPHA(c->srcFormat);
  757. if (!needAlpha)
  758. abase = (base + 24) & 31;
  759. c->yuvTable = av_malloc(1024 * 3 * 4);
  760. y_table32 = c->yuvTable;
  761. yb = -(384 << 16) - oy;
  762. for (i = 0; i < 1024; i++) {
  763. unsigned yval = av_clip_uint8((yb + 0x8000) >> 16);
  764. y_table32[i] = (yval << rbase) +
  765. (needAlpha ? 0 : (255u << abase));
  766. y_table32[i + 1024] = yval << gbase;
  767. y_table32[i + 2048] = yval << bbase;
  768. yb += cy;
  769. }
  770. fill_table(c->table_rV, 4, crv, y_table32 + yoffs);
  771. fill_table(c->table_gU, 4, cgu, y_table32 + yoffs + 1024);
  772. fill_table(c->table_bU, 4, cbu, y_table32 + yoffs + 2048);
  773. fill_gv_table(c->table_gV, 4, cgv);
  774. break;
  775. default:
  776. c->yuvTable = NULL;
  777. av_log(c, AV_LOG_ERROR, "%ibpp not supported by yuv2rgb\n", bpp);
  778. return -1;
  779. }
  780. return 0;
  781. }