You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

886 lines
29KB

  1. /*
  2. * software YUV to RGB converter
  3. *
  4. * Copyright (C) 2009 Konstantin Shishkov
  5. *
  6. * 1,4,8bpp support and context / deglobalize stuff
  7. * by Michael Niedermayer (michaelni@gmx.at)
  8. *
  9. * This file is part of Libav.
  10. *
  11. * Libav is free software; you can redistribute it and/or
  12. * modify it under the terms of the GNU Lesser General Public
  13. * License as published by the Free Software Foundation; either
  14. * version 2.1 of the License, or (at your option) any later version.
  15. *
  16. * Libav is distributed in the hope that it will be useful,
  17. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  18. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  19. * Lesser General Public License for more details.
  20. *
  21. * You should have received a copy of the GNU Lesser General Public
  22. * License along with Libav; if not, write to the Free Software
  23. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  24. */
  25. #include <stdio.h>
  26. #include <stdlib.h>
  27. #include <inttypes.h>
  28. #include <assert.h>
  29. #include "libavutil/cpu.h"
  30. #include "libavutil/bswap.h"
  31. #include "config.h"
  32. #include "rgb2rgb.h"
  33. #include "swscale.h"
  34. #include "swscale_internal.h"
  35. const int32_t ff_yuv2rgb_coeffs[8][4] = {
  36. { 117504, 138453, 13954, 34903 }, /* no sequence_display_extension */
  37. { 117504, 138453, 13954, 34903 }, /* ITU-R Rec. 709 (1990) */
  38. { 104597, 132201, 25675, 53279 }, /* unspecified */
  39. { 104597, 132201, 25675, 53279 }, /* reserved */
  40. { 104448, 132798, 24759, 53109 }, /* FCC */
  41. { 104597, 132201, 25675, 53279 }, /* ITU-R Rec. 624-4 System B, G */
  42. { 104597, 132201, 25675, 53279 }, /* SMPTE 170M */
  43. { 117579, 136230, 16907, 35559 } /* SMPTE 240M (1987) */
  44. };
  45. const int *sws_getCoefficients(int colorspace)
  46. {
  47. if (colorspace > 7 || colorspace < 0)
  48. colorspace = SWS_CS_DEFAULT;
  49. return ff_yuv2rgb_coeffs[colorspace];
  50. }
  51. #define LOADCHROMA(i) \
  52. U = pu[i]; \
  53. V = pv[i]; \
  54. r = (void *)c->table_rV[V]; \
  55. g = (void *)(c->table_gU[U] + c->table_gV[V]); \
  56. b = (void *)c->table_bU[U];
  57. #define PUTRGB(dst, src, i) \
  58. Y = src[2 * i]; \
  59. dst[2 * i] = r[Y] + g[Y] + b[Y]; \
  60. Y = src[2 * i + 1]; \
  61. dst[2 * i + 1] = r[Y] + g[Y] + b[Y];
  62. #define PUTRGB24(dst, src, i) \
  63. Y = src[2 * i]; \
  64. dst[6 * i + 0] = r[Y]; \
  65. dst[6 * i + 1] = g[Y]; \
  66. dst[6 * i + 2] = b[Y]; \
  67. Y = src[2 * i + 1]; \
  68. dst[6 * i + 3] = r[Y]; \
  69. dst[6 * i + 4] = g[Y]; \
  70. dst[6 * i + 5] = b[Y];
  71. #define PUTBGR24(dst, src, i) \
  72. Y = src[2 * i]; \
  73. dst[6 * i + 0] = b[Y]; \
  74. dst[6 * i + 1] = g[Y]; \
  75. dst[6 * i + 2] = r[Y]; \
  76. Y = src[2 * i + 1]; \
  77. dst[6 * i + 3] = b[Y]; \
  78. dst[6 * i + 4] = g[Y]; \
  79. dst[6 * i + 5] = r[Y];
  80. #define PUTRGBA(dst, ysrc, asrc, i, s) \
  81. Y = ysrc[2 * i]; \
  82. dst[2 * i] = r[Y] + g[Y] + b[Y] + (asrc[2 * i] << s); \
  83. Y = ysrc[2 * i + 1]; \
  84. dst[2 * i + 1] = r[Y] + g[Y] + b[Y] + (asrc[2 * i + 1] << s);
  85. #define PUTRGB48(dst, src, i) \
  86. Y = src[ 2 * i]; \
  87. dst[12 * i + 0] = dst[12 * i + 1] = r[Y]; \
  88. dst[12 * i + 2] = dst[12 * i + 3] = g[Y]; \
  89. dst[12 * i + 4] = dst[12 * i + 5] = b[Y]; \
  90. Y = src[ 2 * i + 1]; \
  91. dst[12 * i + 6] = dst[12 * i + 7] = r[Y]; \
  92. dst[12 * i + 8] = dst[12 * i + 9] = g[Y]; \
  93. dst[12 * i + 10] = dst[12 * i + 11] = b[Y];
  94. #define PUTBGR48(dst, src, i) \
  95. Y = src[2 * i]; \
  96. dst[12 * i + 0] = dst[12 * i + 1] = b[Y]; \
  97. dst[12 * i + 2] = dst[12 * i + 3] = g[Y]; \
  98. dst[12 * i + 4] = dst[12 * i + 5] = r[Y]; \
  99. Y = src[2 * i + 1]; \
  100. dst[12 * i + 6] = dst[12 * i + 7] = b[Y]; \
  101. dst[12 * i + 8] = dst[12 * i + 9] = g[Y]; \
  102. dst[12 * i + 10] = dst[12 * i + 11] = r[Y];
  103. #define YUV2RGBFUNC(func_name, dst_type, alpha) \
  104. static int func_name(SwsContext *c, const uint8_t *src[], \
  105. int srcStride[], int srcSliceY, int srcSliceH, \
  106. uint8_t *dst[], int dstStride[]) \
  107. { \
  108. int y; \
  109. \
  110. if (!alpha && c->srcFormat == AV_PIX_FMT_YUV422P) { \
  111. srcStride[1] *= 2; \
  112. srcStride[2] *= 2; \
  113. } \
  114. for (y = 0; y < srcSliceH; y += 2) { \
  115. dst_type *dst_1 = \
  116. (dst_type *)(dst[0] + (y + srcSliceY) * dstStride[0]); \
  117. dst_type *dst_2 = \
  118. (dst_type *)(dst[0] + (y + srcSliceY + 1) * dstStride[0]); \
  119. dst_type av_unused *r, *g, *b; \
  120. const uint8_t *py_1 = src[0] + y * srcStride[0]; \
  121. const uint8_t *py_2 = py_1 + srcStride[0]; \
  122. const uint8_t *pu = src[1] + (y >> 1) * srcStride[1]; \
  123. const uint8_t *pv = src[2] + (y >> 1) * srcStride[2]; \
  124. const uint8_t av_unused *pa_1, *pa_2; \
  125. unsigned int h_size = c->dstW >> 3; \
  126. if (alpha) { \
  127. pa_1 = src[3] + y * srcStride[3]; \
  128. pa_2 = pa_1 + srcStride[3]; \
  129. } \
  130. while (h_size--) { \
  131. int av_unused U, V, Y; \
  132. #define ENDYUV2RGBLINE(dst_delta, ss) \
  133. pu += 4 >> ss; \
  134. pv += 4 >> ss; \
  135. py_1 += 8 >> ss; \
  136. py_2 += 8 >> ss; \
  137. dst_1 += dst_delta >> ss; \
  138. dst_2 += dst_delta >> ss; \
  139. } \
  140. if (c->dstW & (4 >> ss)) { \
  141. int av_unused Y, U, V; \
  142. #define ENDYUV2RGBFUNC() \
  143. } \
  144. } \
  145. return srcSliceH; \
  146. }
  147. #define CLOSEYUV2RGBFUNC(dst_delta) \
  148. ENDYUV2RGBLINE(dst_delta, 0) \
  149. ENDYUV2RGBFUNC()
  150. YUV2RGBFUNC(yuv2rgb_c_48, uint8_t, 0)
  151. LOADCHROMA(0);
  152. PUTRGB48(dst_1, py_1, 0);
  153. PUTRGB48(dst_2, py_2, 0);
  154. LOADCHROMA(1);
  155. PUTRGB48(dst_2, py_2, 1);
  156. PUTRGB48(dst_1, py_1, 1);
  157. LOADCHROMA(2);
  158. PUTRGB48(dst_1, py_1, 2);
  159. PUTRGB48(dst_2, py_2, 2);
  160. LOADCHROMA(3);
  161. PUTRGB48(dst_2, py_2, 3);
  162. PUTRGB48(dst_1, py_1, 3);
  163. ENDYUV2RGBLINE(48, 0)
  164. LOADCHROMA(0);
  165. PUTRGB48(dst_1, py_1, 0);
  166. PUTRGB48(dst_2, py_2, 0);
  167. LOADCHROMA(1);
  168. PUTRGB48(dst_2, py_2, 1);
  169. PUTRGB48(dst_1, py_1, 1);
  170. ENDYUV2RGBLINE(48, 1)
  171. LOADCHROMA(0);
  172. PUTRGB48(dst_1, py_1, 0);
  173. PUTRGB48(dst_2, py_2, 0);
  174. ENDYUV2RGBFUNC()
  175. YUV2RGBFUNC(yuv2rgb_c_bgr48, uint8_t, 0)
  176. LOADCHROMA(0);
  177. PUTBGR48(dst_1, py_1, 0);
  178. PUTBGR48(dst_2, py_2, 0);
  179. LOADCHROMA(1);
  180. PUTBGR48(dst_2, py_2, 1);
  181. PUTBGR48(dst_1, py_1, 1);
  182. LOADCHROMA(2);
  183. PUTBGR48(dst_1, py_1, 2);
  184. PUTBGR48(dst_2, py_2, 2);
  185. LOADCHROMA(3);
  186. PUTBGR48(dst_2, py_2, 3);
  187. PUTBGR48(dst_1, py_1, 3);
  188. ENDYUV2RGBLINE(48, 0)
  189. LOADCHROMA(0);
  190. PUTBGR48(dst_1, py_1, 0);
  191. PUTBGR48(dst_2, py_2, 0);
  192. LOADCHROMA(1);
  193. PUTBGR48(dst_2, py_2, 1);
  194. PUTBGR48(dst_1, py_1, 1);
  195. ENDYUV2RGBLINE(48, 1)
  196. LOADCHROMA(0);
  197. PUTBGR48(dst_1, py_1, 0);
  198. PUTBGR48(dst_2, py_2, 0);
  199. ENDYUV2RGBFUNC()
  200. YUV2RGBFUNC(yuv2rgb_c_32, uint32_t, 0)
  201. LOADCHROMA(0);
  202. PUTRGB(dst_1, py_1, 0);
  203. PUTRGB(dst_2, py_2, 0);
  204. LOADCHROMA(1);
  205. PUTRGB(dst_2, py_2, 1);
  206. PUTRGB(dst_1, py_1, 1);
  207. LOADCHROMA(2);
  208. PUTRGB(dst_1, py_1, 2);
  209. PUTRGB(dst_2, py_2, 2);
  210. LOADCHROMA(3);
  211. PUTRGB(dst_2, py_2, 3);
  212. PUTRGB(dst_1, py_1, 3);
  213. ENDYUV2RGBLINE(8, 0)
  214. LOADCHROMA(0);
  215. PUTRGB(dst_1, py_1, 0);
  216. PUTRGB(dst_2, py_2, 0);
  217. LOADCHROMA(1);
  218. PUTRGB(dst_2, py_2, 1);
  219. PUTRGB(dst_1, py_1, 1);
  220. ENDYUV2RGBLINE(8, 1)
  221. LOADCHROMA(0);
  222. PUTRGB(dst_1, py_1, 0);
  223. PUTRGB(dst_2, py_2, 0);
  224. ENDYUV2RGBFUNC()
  225. YUV2RGBFUNC(yuva2rgba_c, uint32_t, 1)
  226. LOADCHROMA(0);
  227. PUTRGBA(dst_1, py_1, pa_1, 0, 24);
  228. PUTRGBA(dst_2, py_2, pa_2, 0, 24);
  229. LOADCHROMA(1);
  230. PUTRGBA(dst_2, py_2, pa_2, 1, 24);
  231. PUTRGBA(dst_1, py_1, pa_1, 1, 24);
  232. LOADCHROMA(2);
  233. PUTRGBA(dst_1, py_1, pa_1, 2, 24);
  234. PUTRGBA(dst_2, py_2, pa_2, 2, 24);
  235. LOADCHROMA(3);
  236. PUTRGBA(dst_2, py_2, pa_2, 3, 24);
  237. PUTRGBA(dst_1, py_1, pa_1, 3, 24);
  238. pa_1 += 8;
  239. pa_2 += 8;
  240. ENDYUV2RGBLINE(8, 0)
  241. LOADCHROMA(0);
  242. PUTRGBA(dst_1, py_1, pa_1, 0, 24);
  243. PUTRGBA(dst_2, py_2, pa_2, 0, 24);
  244. LOADCHROMA(1);
  245. PUTRGBA(dst_2, py_2, pa_2, 1, 24);
  246. PUTRGBA(dst_1, py_1, pa_1, 1, 24);
  247. pa_1 += 4;
  248. pa_2 += 4;
  249. ENDYUV2RGBLINE(8, 1)
  250. LOADCHROMA(0);
  251. PUTRGBA(dst_1, py_1, pa_1, 0, 24);
  252. PUTRGBA(dst_2, py_2, pa_2, 0, 24);
  253. ENDYUV2RGBFUNC()
  254. YUV2RGBFUNC(yuva2argb_c, uint32_t, 1)
  255. LOADCHROMA(0);
  256. PUTRGBA(dst_1, py_1, pa_1, 0, 0);
  257. PUTRGBA(dst_2, py_2, pa_2, 0, 0);
  258. LOADCHROMA(1);
  259. PUTRGBA(dst_2, py_2, pa_2, 1, 0);
  260. PUTRGBA(dst_1, py_1, pa_1, 1, 0);
  261. LOADCHROMA(2);
  262. PUTRGBA(dst_1, py_1, pa_1, 2, 0);
  263. PUTRGBA(dst_2, py_2, pa_2, 2, 0);
  264. LOADCHROMA(3);
  265. PUTRGBA(dst_2, py_2, pa_2, 3, 0);
  266. PUTRGBA(dst_1, py_1, pa_1, 3, 0);
  267. pa_1 += 8;
  268. pa_2 += 8;
  269. ENDYUV2RGBLINE(8, 0)
  270. LOADCHROMA(0);
  271. PUTRGBA(dst_1, py_1, pa_1, 0, 0);
  272. PUTRGBA(dst_2, py_2, pa_2, 0, 0);
  273. LOADCHROMA(1);
  274. PUTRGBA(dst_2, py_2, pa_2, 1, 0);
  275. PUTRGBA(dst_1, py_1, pa_1, 1, 0);
  276. pa_1 += 4;
  277. pa_2 += 4;
  278. ENDYUV2RGBLINE(8, 1)
  279. LOADCHROMA(0);
  280. PUTRGBA(dst_1, py_1, pa_1, 0, 0);
  281. PUTRGBA(dst_2, py_2, pa_2, 0, 0);
  282. ENDYUV2RGBFUNC()
  283. YUV2RGBFUNC(yuv2rgb_c_24_rgb, uint8_t, 0)
  284. LOADCHROMA(0);
  285. PUTRGB24(dst_1, py_1, 0);
  286. PUTRGB24(dst_2, py_2, 0);
  287. LOADCHROMA(1);
  288. PUTRGB24(dst_2, py_2, 1);
  289. PUTRGB24(dst_1, py_1, 1);
  290. LOADCHROMA(2);
  291. PUTRGB24(dst_1, py_1, 2);
  292. PUTRGB24(dst_2, py_2, 2);
  293. LOADCHROMA(3);
  294. PUTRGB24(dst_2, py_2, 3);
  295. PUTRGB24(dst_1, py_1, 3);
  296. ENDYUV2RGBLINE(24, 0)
  297. LOADCHROMA(0);
  298. PUTRGB24(dst_1, py_1, 0);
  299. PUTRGB24(dst_2, py_2, 0);
  300. LOADCHROMA(1);
  301. PUTRGB24(dst_2, py_2, 1);
  302. PUTRGB24(dst_1, py_1, 1);
  303. ENDYUV2RGBLINE(24, 1)
  304. LOADCHROMA(0);
  305. PUTRGB24(dst_1, py_1, 0);
  306. PUTRGB24(dst_2, py_2, 0);
  307. ENDYUV2RGBFUNC()
  308. // only trivial mods from yuv2rgb_c_24_rgb
  309. YUV2RGBFUNC(yuv2rgb_c_24_bgr, uint8_t, 0)
  310. LOADCHROMA(0);
  311. PUTBGR24(dst_1, py_1, 0);
  312. PUTBGR24(dst_2, py_2, 0);
  313. LOADCHROMA(1);
  314. PUTBGR24(dst_2, py_2, 1);
  315. PUTBGR24(dst_1, py_1, 1);
  316. LOADCHROMA(2);
  317. PUTBGR24(dst_1, py_1, 2);
  318. PUTBGR24(dst_2, py_2, 2);
  319. LOADCHROMA(3);
  320. PUTBGR24(dst_2, py_2, 3);
  321. PUTBGR24(dst_1, py_1, 3);
  322. ENDYUV2RGBLINE(24, 0)
  323. LOADCHROMA(0);
  324. PUTBGR24(dst_1, py_1, 0);
  325. PUTBGR24(dst_2, py_2, 0);
  326. LOADCHROMA(1);
  327. PUTBGR24(dst_2, py_2, 1);
  328. PUTBGR24(dst_1, py_1, 1);
  329. ENDYUV2RGBLINE(24, 1)
  330. LOADCHROMA(0);
  331. PUTBGR24(dst_1, py_1, 0);
  332. PUTBGR24(dst_2, py_2, 0);
  333. ENDYUV2RGBFUNC()
  334. // This is exactly the same code as yuv2rgb_c_32 except for the types of
  335. // r, g, b, dst_1, dst_2
  336. YUV2RGBFUNC(yuv2rgb_c_16, uint16_t, 0)
  337. LOADCHROMA(0);
  338. PUTRGB(dst_1, py_1, 0);
  339. PUTRGB(dst_2, py_2, 0);
  340. LOADCHROMA(1);
  341. PUTRGB(dst_2, py_2, 1);
  342. PUTRGB(dst_1, py_1, 1);
  343. LOADCHROMA(2);
  344. PUTRGB(dst_1, py_1, 2);
  345. PUTRGB(dst_2, py_2, 2);
  346. LOADCHROMA(3);
  347. PUTRGB(dst_2, py_2, 3);
  348. PUTRGB(dst_1, py_1, 3);
  349. CLOSEYUV2RGBFUNC(8)
  350. // r, g, b, dst_1, dst_2
  351. YUV2RGBFUNC(yuv2rgb_c_12_ordered_dither, uint16_t, 0)
  352. const uint8_t *d16 = ff_dither_4x4_16[y & 3];
  353. #define PUTRGB12(dst, src, i, o) \
  354. Y = src[2 * i]; \
  355. dst[2 * i] = r[Y + d16[0 + o]] + \
  356. g[Y + d16[0 + o]] + \
  357. b[Y + d16[0 + o]]; \
  358. Y = src[2 * i + 1]; \
  359. dst[2 * i + 1] = r[Y + d16[1 + o]] + \
  360. g[Y + d16[1 + o]] + \
  361. b[Y + d16[1 + o]];
  362. LOADCHROMA(0);
  363. PUTRGB12(dst_1, py_1, 0, 0);
  364. PUTRGB12(dst_2, py_2, 0, 0 + 8);
  365. LOADCHROMA(1);
  366. PUTRGB12(dst_2, py_2, 1, 2 + 8);
  367. PUTRGB12(dst_1, py_1, 1, 2);
  368. LOADCHROMA(2);
  369. PUTRGB12(dst_1, py_1, 2, 4);
  370. PUTRGB12(dst_2, py_2, 2, 4 + 8);
  371. LOADCHROMA(3);
  372. PUTRGB12(dst_2, py_2, 3, 6 + 8);
  373. PUTRGB12(dst_1, py_1, 3, 6);
  374. CLOSEYUV2RGBFUNC(8)
  375. // r, g, b, dst_1, dst_2
  376. YUV2RGBFUNC(yuv2rgb_c_8_ordered_dither, uint8_t, 0)
  377. const uint8_t *d32 = ff_dither_8x8_32[y & 7];
  378. const uint8_t *d64 = ff_dither_8x8_73[y & 7];
  379. #define PUTRGB8(dst, src, i, o) \
  380. Y = src[2 * i]; \
  381. dst[2 * i] = r[Y + d32[0 + o]] + \
  382. g[Y + d32[0 + o]] + \
  383. b[Y + d64[0 + o]]; \
  384. Y = src[2 * i + 1]; \
  385. dst[2 * i + 1] = r[Y + d32[1 + o]] + \
  386. g[Y + d32[1 + o]] + \
  387. b[Y + d64[1 + o]];
  388. LOADCHROMA(0);
  389. PUTRGB8(dst_1, py_1, 0, 0);
  390. PUTRGB8(dst_2, py_2, 0, 0 + 8);
  391. LOADCHROMA(1);
  392. PUTRGB8(dst_2, py_2, 1, 2 + 8);
  393. PUTRGB8(dst_1, py_1, 1, 2);
  394. LOADCHROMA(2);
  395. PUTRGB8(dst_1, py_1, 2, 4);
  396. PUTRGB8(dst_2, py_2, 2, 4 + 8);
  397. LOADCHROMA(3);
  398. PUTRGB8(dst_2, py_2, 3, 6 + 8);
  399. PUTRGB8(dst_1, py_1, 3, 6);
  400. CLOSEYUV2RGBFUNC(8)
  401. YUV2RGBFUNC(yuv2rgb_c_4_ordered_dither, uint8_t, 0)
  402. const uint8_t * d64 = ff_dither_8x8_73[y & 7];
  403. const uint8_t *d128 = ff_dither_8x8_220[y & 7];
  404. int acc;
  405. #define PUTRGB4D(dst, src, i, o) \
  406. Y = src[2 * i]; \
  407. acc = r[Y + d128[0 + o]] + \
  408. g[Y + d64[0 + o]] + \
  409. b[Y + d128[0 + o]]; \
  410. Y = src[2 * i + 1]; \
  411. acc |= (r[Y + d128[1 + o]] + \
  412. g[Y + d64[1 + o]] + \
  413. b[Y + d128[1 + o]]) << 4; \
  414. dst[i] = acc;
  415. LOADCHROMA(0);
  416. PUTRGB4D(dst_1, py_1, 0, 0);
  417. PUTRGB4D(dst_2, py_2, 0, 0 + 8);
  418. LOADCHROMA(1);
  419. PUTRGB4D(dst_2, py_2, 1, 2 + 8);
  420. PUTRGB4D(dst_1, py_1, 1, 2);
  421. LOADCHROMA(2);
  422. PUTRGB4D(dst_1, py_1, 2, 4);
  423. PUTRGB4D(dst_2, py_2, 2, 4 + 8);
  424. LOADCHROMA(3);
  425. PUTRGB4D(dst_2, py_2, 3, 6 + 8);
  426. PUTRGB4D(dst_1, py_1, 3, 6);
  427. CLOSEYUV2RGBFUNC(4)
  428. YUV2RGBFUNC(yuv2rgb_c_4b_ordered_dither, uint8_t, 0)
  429. const uint8_t *d64 = ff_dither_8x8_73[y & 7];
  430. const uint8_t *d128 = ff_dither_8x8_220[y & 7];
  431. #define PUTRGB4DB(dst, src, i, o) \
  432. Y = src[2 * i]; \
  433. dst[2 * i] = r[Y + d128[0 + o]] + \
  434. g[Y + d64[0 + o]] + \
  435. b[Y + d128[0 + o]]; \
  436. Y = src[2 * i + 1]; \
  437. dst[2 * i + 1] = r[Y + d128[1 + o]] + \
  438. g[Y + d64[1 + o]] + \
  439. b[Y + d128[1 + o]];
  440. LOADCHROMA(0);
  441. PUTRGB4DB(dst_1, py_1, 0, 0);
  442. PUTRGB4DB(dst_2, py_2, 0, 0 + 8);
  443. LOADCHROMA(1);
  444. PUTRGB4DB(dst_2, py_2, 1, 2 + 8);
  445. PUTRGB4DB(dst_1, py_1, 1, 2);
  446. LOADCHROMA(2);
  447. PUTRGB4DB(dst_1, py_1, 2, 4);
  448. PUTRGB4DB(dst_2, py_2, 2, 4 + 8);
  449. LOADCHROMA(3);
  450. PUTRGB4DB(dst_2, py_2, 3, 6 + 8);
  451. PUTRGB4DB(dst_1, py_1, 3, 6);
  452. CLOSEYUV2RGBFUNC(8)
  453. YUV2RGBFUNC(yuv2rgb_c_1_ordered_dither, uint8_t, 0)
  454. const uint8_t *d128 = ff_dither_8x8_220[y & 7];
  455. char out_1 = 0, out_2 = 0;
  456. g = c->table_gU[128] + c->table_gV[128];
  457. #define PUTRGB1(out, src, i, o) \
  458. Y = src[2 * i]; \
  459. out += out + g[Y + d128[0 + o]]; \
  460. Y = src[2 * i + 1]; \
  461. out += out + g[Y + d128[1 + o]];
  462. PUTRGB1(out_1, py_1, 0, 0);
  463. PUTRGB1(out_2, py_2, 0, 0 + 8);
  464. PUTRGB1(out_2, py_2, 1, 2 + 8);
  465. PUTRGB1(out_1, py_1, 1, 2);
  466. PUTRGB1(out_1, py_1, 2, 4);
  467. PUTRGB1(out_2, py_2, 2, 4 + 8);
  468. PUTRGB1(out_2, py_2, 3, 6 + 8);
  469. PUTRGB1(out_1, py_1, 3, 6);
  470. dst_1[0] = out_1;
  471. dst_2[0] = out_2;
  472. CLOSEYUV2RGBFUNC(1)
  473. SwsFunc ff_yuv2rgb_get_func_ptr(SwsContext *c)
  474. {
  475. SwsFunc t = NULL;
  476. if (ARCH_PPC)
  477. t = ff_yuv2rgb_init_ppc(c);
  478. if (ARCH_X86)
  479. t = ff_yuv2rgb_init_x86(c);
  480. if (t)
  481. return t;
  482. av_log(c, AV_LOG_WARNING,
  483. "No accelerated colorspace conversion found from %s to %s.\n",
  484. sws_format_name(c->srcFormat), sws_format_name(c->dstFormat));
  485. switch (c->dstFormat) {
  486. case AV_PIX_FMT_BGR48BE:
  487. case AV_PIX_FMT_BGR48LE:
  488. return yuv2rgb_c_bgr48;
  489. case AV_PIX_FMT_RGB48BE:
  490. case AV_PIX_FMT_RGB48LE:
  491. return yuv2rgb_c_48;
  492. case AV_PIX_FMT_ARGB:
  493. case AV_PIX_FMT_ABGR:
  494. if (CONFIG_SWSCALE_ALPHA && c->srcFormat == AV_PIX_FMT_YUVA420P)
  495. return yuva2argb_c;
  496. case AV_PIX_FMT_RGBA:
  497. case AV_PIX_FMT_BGRA:
  498. if (CONFIG_SWSCALE_ALPHA && c->srcFormat == AV_PIX_FMT_YUVA420P)
  499. return yuva2rgba_c;
  500. else
  501. return yuv2rgb_c_32;
  502. case AV_PIX_FMT_RGB24:
  503. return yuv2rgb_c_24_rgb;
  504. case AV_PIX_FMT_BGR24:
  505. return yuv2rgb_c_24_bgr;
  506. case AV_PIX_FMT_RGB565:
  507. case AV_PIX_FMT_BGR565:
  508. case AV_PIX_FMT_RGB555:
  509. case AV_PIX_FMT_BGR555:
  510. return yuv2rgb_c_16;
  511. case AV_PIX_FMT_RGB444:
  512. case AV_PIX_FMT_BGR444:
  513. return yuv2rgb_c_12_ordered_dither;
  514. case AV_PIX_FMT_RGB8:
  515. case AV_PIX_FMT_BGR8:
  516. return yuv2rgb_c_8_ordered_dither;
  517. case AV_PIX_FMT_RGB4:
  518. case AV_PIX_FMT_BGR4:
  519. return yuv2rgb_c_4_ordered_dither;
  520. case AV_PIX_FMT_RGB4_BYTE:
  521. case AV_PIX_FMT_BGR4_BYTE:
  522. return yuv2rgb_c_4b_ordered_dither;
  523. case AV_PIX_FMT_MONOBLACK:
  524. return yuv2rgb_c_1_ordered_dither;
  525. default:
  526. assert(0);
  527. }
  528. return NULL;
  529. }
  530. static void fill_table(uint8_t *table[256], const int elemsize,
  531. const int inc, void *y_tab)
  532. {
  533. int i;
  534. int64_t cb = 0;
  535. uint8_t *y_table = y_tab;
  536. y_table -= elemsize * (inc >> 9);
  537. for (i = 0; i < 256; i++) {
  538. table[i] = y_table + elemsize * (cb >> 16);
  539. cb += inc;
  540. }
  541. }
  542. static void fill_gv_table(int table[256], const int elemsize, const int inc)
  543. {
  544. int i;
  545. int64_t cb = 0;
  546. int off = -(inc >> 9);
  547. for (i = 0; i < 256; i++) {
  548. table[i] = elemsize * (off + (cb >> 16));
  549. cb += inc;
  550. }
  551. }
  552. static uint16_t roundToInt16(int64_t f)
  553. {
  554. int r = (f + (1 << 15)) >> 16;
  555. if (r < -0x7FFF)
  556. return 0x8000;
  557. else if (r > 0x7FFF)
  558. return 0x7FFF;
  559. else
  560. return r;
  561. }
  562. av_cold int ff_yuv2rgb_c_init_tables(SwsContext *c, const int inv_table[4],
  563. int fullRange, int brightness,
  564. int contrast, int saturation)
  565. {
  566. const int isRgb = c->dstFormat == AV_PIX_FMT_RGB32 ||
  567. c->dstFormat == AV_PIX_FMT_RGB32_1 ||
  568. c->dstFormat == AV_PIX_FMT_BGR24 ||
  569. c->dstFormat == AV_PIX_FMT_RGB565BE ||
  570. c->dstFormat == AV_PIX_FMT_RGB565LE ||
  571. c->dstFormat == AV_PIX_FMT_RGB555BE ||
  572. c->dstFormat == AV_PIX_FMT_RGB555LE ||
  573. c->dstFormat == AV_PIX_FMT_RGB444BE ||
  574. c->dstFormat == AV_PIX_FMT_RGB444LE ||
  575. c->dstFormat == AV_PIX_FMT_RGB8 ||
  576. c->dstFormat == AV_PIX_FMT_RGB4 ||
  577. c->dstFormat == AV_PIX_FMT_RGB4_BYTE ||
  578. c->dstFormat == AV_PIX_FMT_MONOBLACK;
  579. const int isNotNe = c->dstFormat == AV_PIX_FMT_NE(RGB565LE, RGB565BE) ||
  580. c->dstFormat == AV_PIX_FMT_NE(RGB555LE, RGB555BE) ||
  581. c->dstFormat == AV_PIX_FMT_NE(RGB444LE, RGB444BE) ||
  582. c->dstFormat == AV_PIX_FMT_NE(BGR565LE, BGR565BE) ||
  583. c->dstFormat == AV_PIX_FMT_NE(BGR555LE, BGR555BE) ||
  584. c->dstFormat == AV_PIX_FMT_NE(BGR444LE, BGR444BE);
  585. const int bpp = c->dstFormatBpp;
  586. uint8_t *y_table;
  587. uint16_t *y_table16;
  588. uint32_t *y_table32;
  589. int i, base, rbase, gbase, bbase, abase, needAlpha;
  590. const int yoffs = fullRange ? 384 : 326;
  591. int64_t crv = inv_table[0];
  592. int64_t cbu = inv_table[1];
  593. int64_t cgu = -inv_table[2];
  594. int64_t cgv = -inv_table[3];
  595. int64_t cy = 1 << 16;
  596. int64_t oy = 0;
  597. int64_t yb = 0;
  598. if (!fullRange) {
  599. cy = (cy * 255) / 219;
  600. oy = 16 << 16;
  601. } else {
  602. crv = (crv * 224) / 255;
  603. cbu = (cbu * 224) / 255;
  604. cgu = (cgu * 224) / 255;
  605. cgv = (cgv * 224) / 255;
  606. }
  607. cy = (cy * contrast) >> 16;
  608. crv = (crv * contrast * saturation) >> 32;
  609. cbu = (cbu * contrast * saturation) >> 32;
  610. cgu = (cgu * contrast * saturation) >> 32;
  611. cgv = (cgv * contrast * saturation) >> 32;
  612. oy -= 256 * brightness;
  613. c->uOffset = 0x0400040004000400LL;
  614. c->vOffset = 0x0400040004000400LL;
  615. c->yCoeff = roundToInt16(cy * 8192) * 0x0001000100010001ULL;
  616. c->vrCoeff = roundToInt16(crv * 8192) * 0x0001000100010001ULL;
  617. c->ubCoeff = roundToInt16(cbu * 8192) * 0x0001000100010001ULL;
  618. c->vgCoeff = roundToInt16(cgv * 8192) * 0x0001000100010001ULL;
  619. c->ugCoeff = roundToInt16(cgu * 8192) * 0x0001000100010001ULL;
  620. c->yOffset = roundToInt16(oy * 8) * 0x0001000100010001ULL;
  621. c->yuv2rgb_y_coeff = (int16_t)roundToInt16(cy << 13);
  622. c->yuv2rgb_y_offset = (int16_t)roundToInt16(oy << 9);
  623. c->yuv2rgb_v2r_coeff = (int16_t)roundToInt16(crv << 13);
  624. c->yuv2rgb_v2g_coeff = (int16_t)roundToInt16(cgv << 13);
  625. c->yuv2rgb_u2g_coeff = (int16_t)roundToInt16(cgu << 13);
  626. c->yuv2rgb_u2b_coeff = (int16_t)roundToInt16(cbu << 13);
  627. //scale coefficients by cy
  628. crv = ((crv << 16) + 0x8000) / cy;
  629. cbu = ((cbu << 16) + 0x8000) / cy;
  630. cgu = ((cgu << 16) + 0x8000) / cy;
  631. cgv = ((cgv << 16) + 0x8000) / cy;
  632. av_free(c->yuvTable);
  633. #define ALLOC_YUV_TABLE(x) \
  634. c->yuvTable = av_malloc(x); \
  635. if (!c->yuvTable) \
  636. return AVERROR(ENOMEM);
  637. switch (bpp) {
  638. case 1:
  639. ALLOC_YUV_TABLE(1024);
  640. y_table = c->yuvTable;
  641. yb = -(384 << 16) - oy;
  642. for (i = 0; i < 1024 - 110; i++) {
  643. y_table[i + 110] = av_clip_uint8((yb + 0x8000) >> 16) >> 7;
  644. yb += cy;
  645. }
  646. fill_table(c->table_gU, 1, cgu, y_table + yoffs);
  647. fill_gv_table(c->table_gV, 1, cgv);
  648. break;
  649. case 4:
  650. case 4 | 128:
  651. rbase = isRgb ? 3 : 0;
  652. gbase = 1;
  653. bbase = isRgb ? 0 : 3;
  654. ALLOC_YUV_TABLE(1024 * 3);
  655. y_table = c->yuvTable;
  656. yb = -(384 << 16) - oy;
  657. for (i = 0; i < 1024 - 110; i++) {
  658. int yval = av_clip_uint8((yb + 0x8000) >> 16);
  659. y_table[i + 110] = (yval >> 7) << rbase;
  660. y_table[i + 37 + 1024] = ((yval + 43) / 85) << gbase;
  661. y_table[i + 110 + 2048] = (yval >> 7) << bbase;
  662. yb += cy;
  663. }
  664. fill_table(c->table_rV, 1, crv, y_table + yoffs);
  665. fill_table(c->table_gU, 1, cgu, y_table + yoffs + 1024);
  666. fill_table(c->table_bU, 1, cbu, y_table + yoffs + 2048);
  667. fill_gv_table(c->table_gV, 1, cgv);
  668. break;
  669. case 8:
  670. rbase = isRgb ? 5 : 0;
  671. gbase = isRgb ? 2 : 3;
  672. bbase = isRgb ? 0 : 6;
  673. ALLOC_YUV_TABLE(1024 * 3);
  674. y_table = c->yuvTable;
  675. yb = -(384 << 16) - oy;
  676. for (i = 0; i < 1024 - 38; i++) {
  677. int yval = av_clip_uint8((yb + 0x8000) >> 16);
  678. y_table[i + 16] = ((yval + 18) / 36) << rbase;
  679. y_table[i + 16 + 1024] = ((yval + 18) / 36) << gbase;
  680. y_table[i + 37 + 2048] = ((yval + 43) / 85) << bbase;
  681. yb += cy;
  682. }
  683. fill_table(c->table_rV, 1, crv, y_table + yoffs);
  684. fill_table(c->table_gU, 1, cgu, y_table + yoffs + 1024);
  685. fill_table(c->table_bU, 1, cbu, y_table + yoffs + 2048);
  686. fill_gv_table(c->table_gV, 1, cgv);
  687. break;
  688. case 12:
  689. rbase = isRgb ? 8 : 0;
  690. gbase = 4;
  691. bbase = isRgb ? 0 : 8;
  692. ALLOC_YUV_TABLE(1024 * 3 * 2);
  693. y_table16 = c->yuvTable;
  694. yb = -(384 << 16) - oy;
  695. for (i = 0; i < 1024; i++) {
  696. uint8_t yval = av_clip_uint8((yb + 0x8000) >> 16);
  697. y_table16[i] = (yval >> 4) << rbase;
  698. y_table16[i + 1024] = (yval >> 4) << gbase;
  699. y_table16[i + 2048] = (yval >> 4) << bbase;
  700. yb += cy;
  701. }
  702. if (isNotNe)
  703. for (i = 0; i < 1024 * 3; i++)
  704. y_table16[i] = av_bswap16(y_table16[i]);
  705. fill_table(c->table_rV, 2, crv, y_table16 + yoffs);
  706. fill_table(c->table_gU, 2, cgu, y_table16 + yoffs + 1024);
  707. fill_table(c->table_bU, 2, cbu, y_table16 + yoffs + 2048);
  708. fill_gv_table(c->table_gV, 2, cgv);
  709. break;
  710. case 15:
  711. case 16:
  712. rbase = isRgb ? bpp - 5 : 0;
  713. gbase = 5;
  714. bbase = isRgb ? 0 : (bpp - 5);
  715. ALLOC_YUV_TABLE(1024 * 3 * 2);
  716. y_table16 = c->yuvTable;
  717. yb = -(384 << 16) - oy;
  718. for (i = 0; i < 1024; i++) {
  719. uint8_t yval = av_clip_uint8((yb + 0x8000) >> 16);
  720. y_table16[i] = (yval >> 3) << rbase;
  721. y_table16[i + 1024] = (yval >> (18 - bpp)) << gbase;
  722. y_table16[i + 2048] = (yval >> 3) << bbase;
  723. yb += cy;
  724. }
  725. if (isNotNe)
  726. for (i = 0; i < 1024 * 3; i++)
  727. y_table16[i] = av_bswap16(y_table16[i]);
  728. fill_table(c->table_rV, 2, crv, y_table16 + yoffs);
  729. fill_table(c->table_gU, 2, cgu, y_table16 + yoffs + 1024);
  730. fill_table(c->table_bU, 2, cbu, y_table16 + yoffs + 2048);
  731. fill_gv_table(c->table_gV, 2, cgv);
  732. break;
  733. case 24:
  734. case 48:
  735. ALLOC_YUV_TABLE(1024);
  736. y_table = c->yuvTable;
  737. yb = -(384 << 16) - oy;
  738. for (i = 0; i < 1024; i++) {
  739. y_table[i] = av_clip_uint8((yb + 0x8000) >> 16);
  740. yb += cy;
  741. }
  742. fill_table(c->table_rV, 1, crv, y_table + yoffs);
  743. fill_table(c->table_gU, 1, cgu, y_table + yoffs);
  744. fill_table(c->table_bU, 1, cbu, y_table + yoffs);
  745. fill_gv_table(c->table_gV, 1, cgv);
  746. break;
  747. case 32:
  748. base = (c->dstFormat == AV_PIX_FMT_RGB32_1 ||
  749. c->dstFormat == AV_PIX_FMT_BGR32_1) ? 8 : 0;
  750. rbase = base + (isRgb ? 16 : 0);
  751. gbase = base + 8;
  752. bbase = base + (isRgb ? 0 : 16);
  753. needAlpha = CONFIG_SWSCALE_ALPHA && isALPHA(c->srcFormat);
  754. if (!needAlpha)
  755. abase = (base + 24) & 31;
  756. ALLOC_YUV_TABLE(1024 * 3 * 4);
  757. y_table32 = c->yuvTable;
  758. yb = -(384 << 16) - oy;
  759. for (i = 0; i < 1024; i++) {
  760. unsigned yval = av_clip_uint8((yb + 0x8000) >> 16);
  761. y_table32[i] = (yval << rbase) +
  762. (needAlpha ? 0 : (255u << abase));
  763. y_table32[i + 1024] = yval << gbase;
  764. y_table32[i + 2048] = yval << bbase;
  765. yb += cy;
  766. }
  767. fill_table(c->table_rV, 4, crv, y_table32 + yoffs);
  768. fill_table(c->table_gU, 4, cgu, y_table32 + yoffs + 1024);
  769. fill_table(c->table_bU, 4, cbu, y_table32 + yoffs + 2048);
  770. fill_gv_table(c->table_gV, 4, cgv);
  771. break;
  772. default:
  773. c->yuvTable = NULL;
  774. if(!isPlanar(c->dstFormat) || bpp <= 24)
  775. av_log(c, AV_LOG_ERROR, "%ibpp not supported by yuv2rgb\n", bpp);
  776. return -1;
  777. }
  778. return 0;
  779. }