You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

858 lines
29KB

  1. /*
  2. * software YUV to RGB converter
  3. *
  4. * Copyright (C) 2009 Konstantin Shishkov
  5. *
  6. * 1,4,8bpp support and context / deglobalize stuff
  7. * by Michael Niedermayer (michaelni@gmx.at)
  8. *
  9. * This file is part of Libav.
  10. *
  11. * Libav is free software; you can redistribute it and/or
  12. * modify it under the terms of the GNU Lesser General Public
  13. * License as published by the Free Software Foundation; either
  14. * version 2.1 of the License, or (at your option) any later version.
  15. *
  16. * Libav is distributed in the hope that it will be useful,
  17. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  18. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  19. * Lesser General Public License for more details.
  20. *
  21. * You should have received a copy of the GNU Lesser General Public
  22. * License along with Libav; if not, write to the Free Software
  23. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  24. */
  25. #include <stdio.h>
  26. #include <stdlib.h>
  27. #include <inttypes.h>
  28. #include <assert.h>
  29. #include "libavutil/cpu.h"
  30. #include "libavutil/bswap.h"
  31. #include "config.h"
  32. #include "rgb2rgb.h"
  33. #include "swscale.h"
  34. #include "swscale_internal.h"
  35. extern const uint8_t dither_4x4_16[4][8];
  36. extern const uint8_t dither_8x8_32[8][8];
  37. extern const uint8_t dither_8x8_73[8][8];
  38. extern const uint8_t dither_8x8_220[8][8];
  /*
   * Inverse (YUV -> RGB) colour matrix coefficients, one row per colorspace id
   * (rows are handed out by sws_getCoefficients()).
   *
   * Column order as consumed by ff_yuv2rgb_c_init_tables():
   *   [0] V -> R, [1] U -> B, [2] U -> G (stored positive, negated on use),
   *   [3] V -> G (stored positive, negated on use).
   * The values look like 16.16 fixed point (104597 / 65536 ~= 1.596) -- TODO
   * confirm against the callers that pass custom tables.
   */
  const int32_t ff_yuv2rgb_coeffs[8][4] = {
      /* 0: no sequence_display_extension */ { 117504, 138453, 13954, 34903 },
      /* 1: ITU-R Rec. 709 (1990)         */ { 117504, 138453, 13954, 34903 },
      /* 2: unspecified                   */ { 104597, 132201, 25675, 53279 },
      /* 3: reserved                      */ { 104597, 132201, 25675, 53279 },
      /* 4: FCC                           */ { 104448, 132798, 24759, 53109 },
      /* 5: ITU-R Rec. 624-4 System B, G  */ { 104597, 132201, 25675, 53279 },
      /* 6: SMPTE 170M                    */ { 104597, 132201, 25675, 53279 },
      /* 7: SMPTE 240M (1987)             */ { 117579, 136230, 16907, 35559 },
  };
  49. const int *sws_getCoefficients(int colorspace)
  50. {
  51. if (colorspace > 7 || colorspace < 0)
  52. colorspace = SWS_CS_DEFAULT;
  53. return ff_yuv2rgb_coeffs[colorspace];
  54. }
  /*
   * Fetch chroma sample pair i from pu/pv and point r, g, b at the per-chroma
   * lookup tables of the context c.  The luma value is later used as the index
   * into those tables.  g is the U table pointer advanced by the V offset.
   * Expects U, V, r, g, b, pu, pv and c to be in scope at the expansion site.
   */
  #define LOADCHROMA(i)                                   \
      U = pu[(i)];                                        \
      V = pv[(i)];                                        \
      r = (void *)c->table_rV[V];                         \
      g = (void *)(c->table_gU[U] + c->table_gV[V]);      \
      b = (void *)c->table_bU[U];
  /*
   * Write output pixels 2*i and 2*i+1 of one row: each is the sum of the three
   * table entries selected by the corresponding luma sample of src.
   * Expects Y, r, g and b to be in scope at the expansion site.
   */
  #define PUTRGB(dst, src, i)                             \
      Y                  = (src)[2 * (i)];                \
      (dst)[2 * (i)]     = r[Y] + g[Y] + b[Y];            \
      Y                  = (src)[2 * (i) + 1];            \
      (dst)[2 * (i) + 1] = r[Y] + g[Y] + b[Y];
  /*
   * Write two packed 3-byte pixels (byte order R, G, B) for luma samples 2*i
   * and 2*i+1 of src.  Expects Y, r, g and b in scope.
   */
  #define PUTRGB24(dst, src, i)                           \
      Y                  = (src)[2 * (i)];                \
      (dst)[6 * (i) + 0] = r[Y];                          \
      (dst)[6 * (i) + 1] = g[Y];                          \
      (dst)[6 * (i) + 2] = b[Y];                          \
      Y                  = (src)[2 * (i) + 1];            \
      (dst)[6 * (i) + 3] = r[Y];                          \
      (dst)[6 * (i) + 4] = g[Y];                          \
      (dst)[6 * (i) + 5] = b[Y];
  /*
   * Write two packed 3-byte pixels (byte order B, G, R) for luma samples 2*i
   * and 2*i+1 of src.  Expects Y, r, g and b in scope.
   */
  #define PUTBGR24(dst, src, i)                           \
      Y                  = (src)[2 * (i)];                \
      (dst)[6 * (i) + 0] = b[Y];                          \
      (dst)[6 * (i) + 1] = g[Y];                          \
      (dst)[6 * (i) + 2] = r[Y];                          \
      Y                  = (src)[2 * (i) + 1];            \
      (dst)[6 * (i) + 3] = b[Y];                          \
      (dst)[6 * (i) + 4] = g[Y];                          \
      (dst)[6 * (i) + 5] = r[Y];
  /*
   * Write output pixels 2*i and 2*i+1 of one row: the sum of the three table
   * entries selected by the luma sample from ysrc, plus the alpha sample from
   * asrc shifted left by s bits.
   *
   * The alpha byte is widened to uint32_t before shifting: as a promoted
   * (signed) int, "alpha << 24" with alpha >= 128 would shift into the sign
   * bit, which is undefined behaviour.
   * Expects Y, r, g and b in scope.
   */
  #define PUTRGBA(dst, ysrc, asrc, i, s)                                      \
      Y              = ysrc[2 * i];                                           \
      dst[2 * i]     = r[Y] + g[Y] + b[Y] + ((uint32_t)asrc[2 * i] << s);     \
      Y              = ysrc[2 * i + 1];                                       \
      dst[2 * i + 1] = r[Y] + g[Y] + b[Y] + ((uint32_t)asrc[2 * i + 1] << s);
  /*
   * Write two 6-byte pixels (component order R, G, B) for luma samples 2*i and
   * 2*i+1 of src.  Each 8-bit table value is stored into both bytes of its
   * 2-byte component.  Expects Y, r, g and b in scope.
   */
  #define PUTRGB48(dst, src, i)                                       \
      Y                    = (src)[2 * (i)];                          \
      (dst)[12 * (i) +  0] = (dst)[12 * (i) +  1] = r[Y];             \
      (dst)[12 * (i) +  2] = (dst)[12 * (i) +  3] = g[Y];             \
      (dst)[12 * (i) +  4] = (dst)[12 * (i) +  5] = b[Y];             \
      Y                    = (src)[2 * (i) + 1];                      \
      (dst)[12 * (i) +  6] = (dst)[12 * (i) +  7] = r[Y];             \
      (dst)[12 * (i) +  8] = (dst)[12 * (i) +  9] = g[Y];             \
      (dst)[12 * (i) + 10] = (dst)[12 * (i) + 11] = b[Y];
  /*
   * Write two 6-byte pixels (component order B, G, R) for luma samples 2*i and
   * 2*i+1 of src.  Each 8-bit table value is stored into both bytes of its
   * 2-byte component.  Expects Y, r, g and b in scope.
   */
  #define PUTBGR48(dst, src, i)                                       \
      Y                    = (src)[2 * (i)];                          \
      (dst)[12 * (i) +  0] = (dst)[12 * (i) +  1] = b[Y];             \
      (dst)[12 * (i) +  2] = (dst)[12 * (i) +  3] = g[Y];             \
      (dst)[12 * (i) +  4] = (dst)[12 * (i) +  5] = r[Y];             \
      Y                    = (src)[2 * (i) + 1];                      \
      (dst)[12 * (i) +  6] = (dst)[12 * (i) +  7] = b[Y];             \
      (dst)[12 * (i) +  8] = (dst)[12 * (i) +  9] = g[Y];             \
      (dst)[12 * (i) + 10] = (dst)[12 * (i) + 11] = r[Y];
  /*
   * Function template for the C converters.  A converter is written as
   *
   *     YUV2RGBFUNC(name, dst_type, alpha)
   *         ...statements converting one 8-pixel-wide, 2-row block...
   *     ENDYUV2RGBLINE(dst_delta)
   *         ...statements converting the 4-pixel remainder (dstW & 4)...
   *     ENDYUV2RGBFUNC()
   *
   * YUV2RGBFUNC opens the function, the loop over row pairs and the loop over
   * 8-pixel blocks (dstW >> 3 iterations).  It sets up:
   *   dst_1/dst_2  output rows y + srcSliceY and y + srcSliceY + 1,
   *   py_1/py_2    the two luma rows, pu/pv the chroma row (y >> 1),
   *   pa_1/pa_2    the two alpha rows (only assigned when alpha is non-zero),
   *   r, g, b, U, V, Y scratch variables for LOADCHROMA / PUT* macros.
   * For non-alpha converters with a PIX_FMT_YUV422P source, the chroma strides
   * in the caller's srcStride[] array are doubled in place.
   *
   * ENDYUV2RGBLINE advances chroma by 4, luma by 8 and both output rows by
   * dst_delta elements, closes the block loop and opens the remainder branch.
   * ENDYUV2RGBFUNC closes everything and returns srcSliceH.
   * CLOSEYUV2RGBFUNC is the two closers back to back, i.e. an empty remainder
   * branch.
   */
  #define YUV2RGBFUNC(func_name, dst_type, alpha)                               \
      static int func_name(SwsContext *c, const uint8_t *src[],                 \
                           int srcStride[], int srcSliceY, int srcSliceH,       \
                           uint8_t *dst[], int dstStride[])                     \
      {                                                                         \
          int y;                                                                \
                                                                                \
          if (!alpha && c->srcFormat == PIX_FMT_YUV422P) {                      \
              srcStride[1] *= 2;                                                \
              srcStride[2] *= 2;                                                \
          }                                                                     \
          for (y = 0; y < srcSliceH; y += 2) {                                  \
              dst_type *dst_1 =                                                 \
                  (dst_type *)(dst[0] + (y + srcSliceY) * dstStride[0]);        \
              dst_type *dst_2 =                                                 \
                  (dst_type *)(dst[0] + (y + srcSliceY + 1) * dstStride[0]);    \
              dst_type av_unused *r, *g, *b;                                    \
              const uint8_t *py_1 = src[0] + y * srcStride[0];                  \
              const uint8_t *py_2 = py_1 + srcStride[0];                        \
              const uint8_t *pu = src[1] + (y >> 1) * srcStride[1];             \
              const uint8_t *pv = src[2] + (y >> 1) * srcStride[2];             \
              const uint8_t av_unused *pa_1, *pa_2;                             \
              unsigned int blocks_left = c->dstW >> 3;                          \
              if (alpha) {                                                      \
                  pa_1 = src[3] + y * srcStride[3];                             \
                  pa_2 = pa_1 + srcStride[3];                                   \
              }                                                                 \
              while (blocks_left--) {                                           \
                  int av_unused U, V, Y;

  #define ENDYUV2RGBLINE(dst_delta)                                             \
                  pu    += 4;                                                   \
                  pv    += 4;                                                   \
                  py_1  += 8;                                                   \
                  py_2  += 8;                                                   \
                  dst_1 += dst_delta;                                           \
                  dst_2 += dst_delta;                                           \
              }                                                                 \
              if (c->dstW & 4) {                                                \
                  int av_unused Y, U, V;

  #define ENDYUV2RGBFUNC()                                                      \
              }                                                                 \
          }                                                                     \
          return srcSliceH;                                                     \
      }

  #define CLOSEYUV2RGBFUNC(dst_delta)                                           \
      ENDYUV2RGBLINE(dst_delta)                                                 \
      ENDYUV2RGBFUNC()
  154. YUV2RGBFUNC(yuv2rgb_c_48, uint8_t, 0)
  155. LOADCHROMA(0);
  156. PUTRGB48(dst_1, py_1, 0);
  157. PUTRGB48(dst_2, py_2, 0);
  158. LOADCHROMA(1);
  159. PUTRGB48(dst_2, py_2, 1);
  160. PUTRGB48(dst_1, py_1, 1);
  161. LOADCHROMA(2);
  162. PUTRGB48(dst_1, py_1, 2);
  163. PUTRGB48(dst_2, py_2, 2);
  164. LOADCHROMA(3);
  165. PUTRGB48(dst_2, py_2, 3);
  166. PUTRGB48(dst_1, py_1, 3);
  167. ENDYUV2RGBLINE(48)
  168. LOADCHROMA(0);
  169. PUTRGB48(dst_1, py_1, 0);
  170. PUTRGB48(dst_2, py_2, 0);
  171. LOADCHROMA(1);
  172. PUTRGB48(dst_2, py_2, 1);
  173. PUTRGB48(dst_1, py_1, 1);
  174. ENDYUV2RGBFUNC()
  175. YUV2RGBFUNC(yuv2rgb_c_bgr48, uint8_t, 0)
  176. LOADCHROMA(0);
  177. PUTBGR48(dst_1, py_1, 0);
  178. PUTBGR48(dst_2, py_2, 0);
  179. LOADCHROMA(1);
  180. PUTBGR48(dst_2, py_2, 1);
  181. PUTBGR48(dst_1, py_1, 1);
  182. LOADCHROMA(2);
  183. PUTBGR48(dst_1, py_1, 2);
  184. PUTBGR48(dst_2, py_2, 2);
  185. LOADCHROMA(3);
  186. PUTBGR48(dst_2, py_2, 3);
  187. PUTBGR48(dst_1, py_1, 3);
  188. ENDYUV2RGBLINE(48)
  189. LOADCHROMA(0);
  190. PUTBGR48(dst_1, py_1, 0);
  191. PUTBGR48(dst_2, py_2, 0);
  192. LOADCHROMA(1);
  193. PUTBGR48(dst_2, py_2, 1);
  194. PUTBGR48(dst_1, py_1, 1);
  195. ENDYUV2RGBFUNC()
  196. YUV2RGBFUNC(yuv2rgb_c_32, uint32_t, 0)
  197. LOADCHROMA(0);
  198. PUTRGB(dst_1, py_1, 0);
  199. PUTRGB(dst_2, py_2, 0);
  200. LOADCHROMA(1);
  201. PUTRGB(dst_2, py_2, 1);
  202. PUTRGB(dst_1, py_1, 1);
  203. LOADCHROMA(2);
  204. PUTRGB(dst_1, py_1, 2);
  205. PUTRGB(dst_2, py_2, 2);
  206. LOADCHROMA(3);
  207. PUTRGB(dst_2, py_2, 3);
  208. PUTRGB(dst_1, py_1, 3);
  209. ENDYUV2RGBLINE(8)
  210. LOADCHROMA(0);
  211. PUTRGB(dst_1, py_1, 0);
  212. PUTRGB(dst_2, py_2, 0);
  213. LOADCHROMA(1);
  214. PUTRGB(dst_2, py_2, 1);
  215. PUTRGB(dst_1, py_1, 1);
  216. ENDYUV2RGBFUNC()
  217. YUV2RGBFUNC(yuva2rgba_c, uint32_t, 1)
  218. LOADCHROMA(0);
  219. PUTRGBA(dst_1, py_1, pa_1, 0, 24);
  220. PUTRGBA(dst_2, py_2, pa_2, 0, 24);
  221. LOADCHROMA(1);
  222. PUTRGBA(dst_2, py_2, pa_1, 1, 24);
  223. PUTRGBA(dst_1, py_1, pa_2, 1, 24);
  224. LOADCHROMA(2);
  225. PUTRGBA(dst_1, py_1, pa_1, 2, 24);
  226. PUTRGBA(dst_2, py_2, pa_2, 2, 24);
  227. LOADCHROMA(3);
  228. PUTRGBA(dst_2, py_2, pa_1, 3, 24);
  229. PUTRGBA(dst_1, py_1, pa_2, 3, 24);
  230. pa_1 += 8; \
  231. pa_2 += 8; \
  232. ENDYUV2RGBLINE(8)
  233. LOADCHROMA(0);
  234. PUTRGBA(dst_1, py_1, pa_1, 0, 24);
  235. PUTRGBA(dst_2, py_2, pa_2, 0, 24);
  236. LOADCHROMA(1);
  237. PUTRGBA(dst_2, py_2, pa_1, 1, 24);
  238. PUTRGBA(dst_1, py_1, pa_2, 1, 24);
  239. ENDYUV2RGBFUNC()
  240. YUV2RGBFUNC(yuva2argb_c, uint32_t, 1)
  241. LOADCHROMA(0);
  242. PUTRGBA(dst_1, py_1, pa_1, 0, 0);
  243. PUTRGBA(dst_2, py_2, pa_2, 0, 0);
  244. LOADCHROMA(1);
  245. PUTRGBA(dst_2, py_2, pa_2, 1, 0);
  246. PUTRGBA(dst_1, py_1, pa_1, 1, 0);
  247. LOADCHROMA(2);
  248. PUTRGBA(dst_1, py_1, pa_1, 2, 0);
  249. PUTRGBA(dst_2, py_2, pa_2, 2, 0);
  250. LOADCHROMA(3);
  251. PUTRGBA(dst_2, py_2, pa_2, 3, 0);
  252. PUTRGBA(dst_1, py_1, pa_1, 3, 0);
  253. pa_1 += 8; \
  254. pa_2 += 8; \
  255. ENDYUV2RGBLINE(8)
  256. LOADCHROMA(0);
  257. PUTRGBA(dst_1, py_1, pa_1, 0, 0);
  258. PUTRGBA(dst_2, py_2, pa_2, 0, 0);
  259. LOADCHROMA(1);
  260. PUTRGBA(dst_2, py_2, pa_2, 1, 0);
  261. PUTRGBA(dst_1, py_1, pa_1, 1, 0);
  262. ENDYUV2RGBFUNC()
  263. YUV2RGBFUNC(yuv2rgb_c_24_rgb, uint8_t, 0)
  264. LOADCHROMA(0);
  265. PUTRGB24(dst_1, py_1, 0);
  266. PUTRGB24(dst_2, py_2, 0);
  267. LOADCHROMA(1);
  268. PUTRGB24(dst_2, py_2, 1);
  269. PUTRGB24(dst_1, py_1, 1);
  270. LOADCHROMA(2);
  271. PUTRGB24(dst_1, py_1, 2);
  272. PUTRGB24(dst_2, py_2, 2);
  273. LOADCHROMA(3);
  274. PUTRGB24(dst_2, py_2, 3);
  275. PUTRGB24(dst_1, py_1, 3);
  276. ENDYUV2RGBLINE(24)
  277. LOADCHROMA(0);
  278. PUTRGB24(dst_1, py_1, 0);
  279. PUTRGB24(dst_2, py_2, 0);
  280. LOADCHROMA(1);
  281. PUTRGB24(dst_2, py_2, 1);
  282. PUTRGB24(dst_1, py_1, 1);
  283. ENDYUV2RGBFUNC()
  284. // only trivial mods from yuv2rgb_c_24_rgb
  285. YUV2RGBFUNC(yuv2rgb_c_24_bgr, uint8_t, 0)
  286. LOADCHROMA(0);
  287. PUTBGR24(dst_1, py_1, 0);
  288. PUTBGR24(dst_2, py_2, 0);
  289. LOADCHROMA(1);
  290. PUTBGR24(dst_2, py_2, 1);
  291. PUTBGR24(dst_1, py_1, 1);
  292. LOADCHROMA(2);
  293. PUTBGR24(dst_1, py_1, 2);
  294. PUTBGR24(dst_2, py_2, 2);
  295. LOADCHROMA(3);
  296. PUTBGR24(dst_2, py_2, 3);
  297. PUTBGR24(dst_1, py_1, 3);
  298. ENDYUV2RGBLINE(24)
  299. LOADCHROMA(0);
  300. PUTBGR24(dst_1, py_1, 0);
  301. PUTBGR24(dst_2, py_2, 0);
  302. LOADCHROMA(1);
  303. PUTBGR24(dst_2, py_2, 1);
  304. PUTBGR24(dst_1, py_1, 1);
  305. ENDYUV2RGBFUNC()
  306. // This is exactly the same code as yuv2rgb_c_32 except for the types of
  307. // r, g, b, dst_1, dst_2
  308. YUV2RGBFUNC(yuv2rgb_c_16, uint16_t, 0)
  309. LOADCHROMA(0);
  310. PUTRGB(dst_1, py_1, 0);
  311. PUTRGB(dst_2, py_2, 0);
  312. LOADCHROMA(1);
  313. PUTRGB(dst_2, py_2, 1);
  314. PUTRGB(dst_1, py_1, 1);
  315. LOADCHROMA(2);
  316. PUTRGB(dst_1, py_1, 2);
  317. PUTRGB(dst_2, py_2, 2);
  318. LOADCHROMA(3);
  319. PUTRGB(dst_2, py_2, 3);
  320. PUTRGB(dst_1, py_1, 3);
  321. CLOSEYUV2RGBFUNC(8)
  322. // r, g, b, dst_1, dst_2
  323. YUV2RGBFUNC(yuv2rgb_c_12_ordered_dither, uint16_t, 0)
  324. const uint8_t *d16 = dither_4x4_16[y & 3];
  325. #define PUTRGB12(dst, src, i, o) \
  326. Y = src[2 * i]; \
  327. dst[2 * i] = r[Y + d16[0 + o]] + \
  328. g[Y + d16[0 + o]] + \
  329. b[Y + d16[0 + o]]; \
  330. Y = src[2 * i + 1]; \
  331. dst[2 * i + 1] = r[Y + d16[1 + o]] + \
  332. g[Y + d16[1 + o]] + \
  333. b[Y + d16[1 + o]];
  334. LOADCHROMA(0);
  335. PUTRGB12(dst_1, py_1, 0, 0);
  336. PUTRGB12(dst_2, py_2, 0, 0 + 8);
  337. LOADCHROMA(1);
  338. PUTRGB12(dst_2, py_2, 1, 2 + 8);
  339. PUTRGB12(dst_1, py_1, 1, 2);
  340. LOADCHROMA(2);
  341. PUTRGB12(dst_1, py_1, 2, 4);
  342. PUTRGB12(dst_2, py_2, 2, 4 + 8);
  343. LOADCHROMA(3);
  344. PUTRGB12(dst_2, py_2, 3, 6 + 8);
  345. PUTRGB12(dst_1, py_1, 3, 6);
  346. CLOSEYUV2RGBFUNC(8)
  347. // r, g, b, dst_1, dst_2
  348. YUV2RGBFUNC(yuv2rgb_c_8_ordered_dither, uint8_t, 0)
  349. const uint8_t *d32 = dither_8x8_32[y & 7];
  350. const uint8_t *d64 = dither_8x8_73[y & 7];
  351. #define PUTRGB8(dst, src, i, o) \
  352. Y = src[2 * i]; \
  353. dst[2 * i] = r[Y + d32[0 + o]] + \
  354. g[Y + d32[0 + o]] + \
  355. b[Y + d64[0 + o]]; \
  356. Y = src[2 * i + 1]; \
  357. dst[2 * i + 1] = r[Y + d32[1 + o]] + \
  358. g[Y + d32[1 + o]] + \
  359. b[Y + d64[1 + o]];
  360. LOADCHROMA(0);
  361. PUTRGB8(dst_1, py_1, 0, 0);
  362. PUTRGB8(dst_2, py_2, 0, 0 + 8);
  363. LOADCHROMA(1);
  364. PUTRGB8(dst_2, py_2, 1, 2 + 8);
  365. PUTRGB8(dst_1, py_1, 1, 2);
  366. LOADCHROMA(2);
  367. PUTRGB8(dst_1, py_1, 2, 4);
  368. PUTRGB8(dst_2, py_2, 2, 4 + 8);
  369. LOADCHROMA(3);
  370. PUTRGB8(dst_2, py_2, 3, 6 + 8);
  371. PUTRGB8(dst_1, py_1, 3, 6);
  372. CLOSEYUV2RGBFUNC(8)
  373. YUV2RGBFUNC(yuv2rgb_c_4_ordered_dither, uint8_t, 0)
  374. const uint8_t * d64 = dither_8x8_73[y & 7];
  375. const uint8_t *d128 = dither_8x8_220[y & 7];
  376. int acc;
  377. #define PUTRGB4D(dst, src, i, o) \
  378. Y = src[2 * i]; \
  379. acc = r[Y + d128[0 + o]] + \
  380. g[Y + d64[0 + o]] + \
  381. b[Y + d128[0 + o]]; \
  382. Y = src[2 * i + 1]; \
  383. acc |= (r[Y + d128[1 + o]] + \
  384. g[Y + d64[1 + o]] + \
  385. b[Y + d128[1 + o]]) << 4; \
  386. dst[i] = acc;
  387. LOADCHROMA(0);
  388. PUTRGB4D(dst_1, py_1, 0, 0);
  389. PUTRGB4D(dst_2, py_2, 0, 0 + 8);
  390. LOADCHROMA(1);
  391. PUTRGB4D(dst_2, py_2, 1, 2 + 8);
  392. PUTRGB4D(dst_1, py_1, 1, 2);
  393. LOADCHROMA(2);
  394. PUTRGB4D(dst_1, py_1, 2, 4);
  395. PUTRGB4D(dst_2, py_2, 2, 4 + 8);
  396. LOADCHROMA(3);
  397. PUTRGB4D(dst_2, py_2, 3, 6 + 8);
  398. PUTRGB4D(dst_1, py_1, 3, 6);
  399. CLOSEYUV2RGBFUNC(4)
  400. YUV2RGBFUNC(yuv2rgb_c_4b_ordered_dither, uint8_t, 0)
  401. const uint8_t *d64 = dither_8x8_73[y & 7];
  402. const uint8_t *d128 = dither_8x8_220[y & 7];
  403. #define PUTRGB4DB(dst, src, i, o) \
  404. Y = src[2 * i]; \
  405. dst[2 * i] = r[Y + d128[0 + o]] + \
  406. g[Y + d64[0 + o]] + \
  407. b[Y + d128[0 + o]]; \
  408. Y = src[2 * i + 1]; \
  409. dst[2 * i + 1] = r[Y + d128[1 + o]] + \
  410. g[Y + d64[1 + o]] + \
  411. b[Y + d128[1 + o]];
  412. LOADCHROMA(0);
  413. PUTRGB4DB(dst_1, py_1, 0, 0);
  414. PUTRGB4DB(dst_2, py_2, 0, 0 + 8);
  415. LOADCHROMA(1);
  416. PUTRGB4DB(dst_2, py_2, 1, 2 + 8);
  417. PUTRGB4DB(dst_1, py_1, 1, 2);
  418. LOADCHROMA(2);
  419. PUTRGB4DB(dst_1, py_1, 2, 4);
  420. PUTRGB4DB(dst_2, py_2, 2, 4 + 8);
  421. LOADCHROMA(3);
  422. PUTRGB4DB(dst_2, py_2, 3, 6 + 8);
  423. PUTRGB4DB(dst_1, py_1, 3, 6);
  424. CLOSEYUV2RGBFUNC(8)
  425. YUV2RGBFUNC(yuv2rgb_c_1_ordered_dither, uint8_t, 0)
  426. const uint8_t *d128 = dither_8x8_220[y & 7];
  427. char out_1 = 0, out_2 = 0;
  428. g = c->table_gU[128] + c->table_gV[128];
  429. #define PUTRGB1(out, src, i, o) \
  430. Y = src[2 * i]; \
  431. out += out + g[Y + d128[0 + o]]; \
  432. Y = src[2 * i + 1]; \
  433. out += out + g[Y + d128[1 + o]];
  434. PUTRGB1(out_1, py_1, 0, 0);
  435. PUTRGB1(out_2, py_2, 0, 0 + 8);
  436. PUTRGB1(out_2, py_2, 1, 2 + 8);
  437. PUTRGB1(out_1, py_1, 1, 2);
  438. PUTRGB1(out_1, py_1, 2, 4);
  439. PUTRGB1(out_2, py_2, 2, 4 + 8);
  440. PUTRGB1(out_2, py_2, 3, 6 + 8);
  441. PUTRGB1(out_1, py_1, 3, 6);
  442. dst_1[0] = out_1;
  443. dst_2[0] = out_2;
  444. CLOSEYUV2RGBFUNC(1)
  445. SwsFunc ff_yuv2rgb_get_func_ptr(SwsContext *c)
  446. {
  447. SwsFunc t = NULL;
  448. if (HAVE_MMX)
  449. t = ff_yuv2rgb_init_mmx(c);
  450. else if (HAVE_VIS)
  451. t = ff_yuv2rgb_init_vis(c);
  452. else if (HAVE_ALTIVEC)
  453. t = ff_yuv2rgb_init_altivec(c);
  454. else if (ARCH_BFIN)
  455. t = ff_yuv2rgb_get_func_ptr_bfin(c);
  456. if (t)
  457. return t;
  458. av_log(c, AV_LOG_WARNING,
  459. "No accelerated colorspace conversion found from %s to %s.\n",
  460. sws_format_name(c->srcFormat), sws_format_name(c->dstFormat));
  461. switch (c->dstFormat) {
  462. case PIX_FMT_BGR48BE:
  463. case PIX_FMT_BGR48LE:
  464. return yuv2rgb_c_bgr48;
  465. case PIX_FMT_RGB48BE:
  466. case PIX_FMT_RGB48LE:
  467. return yuv2rgb_c_48;
  468. case PIX_FMT_ARGB:
  469. case PIX_FMT_ABGR:
  470. if (CONFIG_SWSCALE_ALPHA && c->srcFormat == PIX_FMT_YUVA420P)
  471. return yuva2argb_c;
  472. case PIX_FMT_RGBA:
  473. case PIX_FMT_BGRA:
  474. if (CONFIG_SWSCALE_ALPHA && c->srcFormat == PIX_FMT_YUVA420P)
  475. return yuva2rgba_c;
  476. else
  477. return yuv2rgb_c_32;
  478. case PIX_FMT_RGB24:
  479. return yuv2rgb_c_24_rgb;
  480. case PIX_FMT_BGR24:
  481. return yuv2rgb_c_24_bgr;
  482. case PIX_FMT_RGB565:
  483. case PIX_FMT_BGR565:
  484. case PIX_FMT_RGB555:
  485. case PIX_FMT_BGR555:
  486. return yuv2rgb_c_16;
  487. case PIX_FMT_RGB444:
  488. case PIX_FMT_BGR444:
  489. return yuv2rgb_c_12_ordered_dither;
  490. case PIX_FMT_RGB8:
  491. case PIX_FMT_BGR8:
  492. return yuv2rgb_c_8_ordered_dither;
  493. case PIX_FMT_RGB4:
  494. case PIX_FMT_BGR4:
  495. return yuv2rgb_c_4_ordered_dither;
  496. case PIX_FMT_RGB4_BYTE:
  497. case PIX_FMT_BGR4_BYTE:
  498. return yuv2rgb_c_4b_ordered_dither;
  499. case PIX_FMT_MONOBLACK:
  500. return yuv2rgb_c_1_ordered_dither;
  501. default:
  502. assert(0);
  503. }
  504. return NULL;
  505. }
  /**
   * Fill a 256-entry table of pointers into a lookup table.
   *
   * Entry i points at y_tab + elemsize * ((i * inc >> 16) - (inc >> 9)),
   * i.e. the accumulated increment in whole units, recentred so that entry
   * 128 lands (up to rounding) on y_tab itself.
   *
   * @param table    receives the 256 pointers
   * @param elemsize size in bytes of one element of the lookup table
   * @param inc      per-entry increment; its upper bits (>> 16) are the
   *                 whole-element step
   * @param y_tab    reference position inside the lookup table
   */
  static void fill_table(uint8_t *table[256], const int elemsize,
                         const int inc, void *y_tab)
  {
      uint8_t *const origin = (uint8_t *)y_tab - elemsize * (inc >> 9);
      int64_t acc = 0;
      int idx;

      for (idx = 0; idx < 256; idx++, acc += inc)
          table[idx] = origin + elemsize * (acc >> 16);
  }
  /**
   * Fill a 256-entry table of byte offsets.
   *
   * Entry i is elemsize * ((i * inc >> 16) - (inc >> 9)): the same stepping
   * as fill_table(), but stored as an integer offset instead of a pointer.
   *
   * @param table    receives the 256 offsets
   * @param elemsize size in bytes of one element of the lookup table
   * @param inc      per-entry increment; its upper bits (>> 16) are the
   *                 whole-element step
   */
  static void fill_gv_table(int table[256], const int elemsize, const int inc)
  {
      const int bias = -(inc >> 9);
      int64_t acc = 0;
      int idx;

      for (idx = 0; idx < 256; idx++, acc += inc)
          table[idx] = elemsize * (bias + (acc >> 16));
  }
  /**
   * Convert a 16.16 fixed-point value to a saturated 16-bit integer.
   *
   * The value is rounded by adding 0.5 (1 << 15) and shifting right by 16.
   * Results below -0x7FFF yield 0x8000 and results above 0x7FFF yield 0x7FFF;
   * everything else is returned as its 16-bit two's-complement pattern.
   *
   * The shifted value is kept in 64 bits while clamping.  Narrowing it to int
   * first (as was done before) wraps large magnitudes, e.g. 1 << 48 became 0
   * instead of saturating to 0x7FFF.
   *
   * @param f value in 16.16 fixed point
   * @return rounded, saturated value as a uint16_t bit pattern
   */
  static uint16_t roundToInt16(int64_t f)
  {
      const int64_t r = (f + (1 << 15)) >> 16;

      if (r < -0x7FFF)
          return 0x8000;
      else if (r > 0x7FFF)
          return 0x7FFF;
      else
          return (uint16_t)r;
  }
  538. av_cold int ff_yuv2rgb_c_init_tables(SwsContext *c, const int inv_table[4],
  539. int fullRange, int brightness,
  540. int contrast, int saturation)
  541. {
  542. const int isRgb = c->dstFormat == PIX_FMT_RGB32 ||
  543. c->dstFormat == PIX_FMT_RGB32_1 ||
  544. c->dstFormat == PIX_FMT_BGR24 ||
  545. c->dstFormat == PIX_FMT_RGB565BE ||
  546. c->dstFormat == PIX_FMT_RGB565LE ||
  547. c->dstFormat == PIX_FMT_RGB555BE ||
  548. c->dstFormat == PIX_FMT_RGB555LE ||
  549. c->dstFormat == PIX_FMT_RGB444BE ||
  550. c->dstFormat == PIX_FMT_RGB444LE ||
  551. c->dstFormat == PIX_FMT_RGB8 ||
  552. c->dstFormat == PIX_FMT_RGB4 ||
  553. c->dstFormat == PIX_FMT_RGB4_BYTE ||
  554. c->dstFormat == PIX_FMT_MONOBLACK;
  555. const int isNotNe = c->dstFormat == PIX_FMT_NE(RGB565LE, RGB565BE) ||
  556. c->dstFormat == PIX_FMT_NE(RGB555LE, RGB555BE) ||
  557. c->dstFormat == PIX_FMT_NE(RGB444LE, RGB444BE) ||
  558. c->dstFormat == PIX_FMT_NE(BGR565LE, BGR565BE) ||
  559. c->dstFormat == PIX_FMT_NE(BGR555LE, BGR555BE) ||
  560. c->dstFormat == PIX_FMT_NE(BGR444LE, BGR444BE);
  561. const int bpp = c->dstFormatBpp;
  562. uint8_t *y_table;
  563. uint16_t *y_table16;
  564. uint32_t *y_table32;
  565. int i, base, rbase, gbase, bbase, abase, needAlpha;
  566. const int yoffs = fullRange ? 384 : 326;
  567. int64_t crv = inv_table[0];
  568. int64_t cbu = inv_table[1];
  569. int64_t cgu = -inv_table[2];
  570. int64_t cgv = -inv_table[3];
  571. int64_t cy = 1 << 16;
  572. int64_t oy = 0;
  573. int64_t yb = 0;
  574. if (!fullRange) {
  575. cy = (cy * 255) / 219;
  576. oy = 16 << 16;
  577. } else {
  578. crv = (crv * 224) / 255;
  579. cbu = (cbu * 224) / 255;
  580. cgu = (cgu * 224) / 255;
  581. cgv = (cgv * 224) / 255;
  582. }
  583. cy = (cy * contrast) >> 16;
  584. crv = (crv * contrast * saturation) >> 32;
  585. cbu = (cbu * contrast * saturation) >> 32;
  586. cgu = (cgu * contrast * saturation) >> 32;
  587. cgv = (cgv * contrast * saturation) >> 32;
  588. oy -= 256 * brightness;
  589. c->uOffset = 0x0400040004000400LL;
  590. c->vOffset = 0x0400040004000400LL;
  591. c->yCoeff = roundToInt16(cy * 8192) * 0x0001000100010001ULL;
  592. c->vrCoeff = roundToInt16(crv * 8192) * 0x0001000100010001ULL;
  593. c->ubCoeff = roundToInt16(cbu * 8192) * 0x0001000100010001ULL;
  594. c->vgCoeff = roundToInt16(cgv * 8192) * 0x0001000100010001ULL;
  595. c->ugCoeff = roundToInt16(cgu * 8192) * 0x0001000100010001ULL;
  596. c->yOffset = roundToInt16(oy * 8) * 0x0001000100010001ULL;
  597. c->yuv2rgb_y_coeff = (int16_t)roundToInt16(cy << 13);
  598. c->yuv2rgb_y_offset = (int16_t)roundToInt16(oy << 9);
  599. c->yuv2rgb_v2r_coeff = (int16_t)roundToInt16(crv << 13);
  600. c->yuv2rgb_v2g_coeff = (int16_t)roundToInt16(cgv << 13);
  601. c->yuv2rgb_u2g_coeff = (int16_t)roundToInt16(cgu << 13);
  602. c->yuv2rgb_u2b_coeff = (int16_t)roundToInt16(cbu << 13);
  603. //scale coefficients by cy
  604. crv = ((crv << 16) + 0x8000) / cy;
  605. cbu = ((cbu << 16) + 0x8000) / cy;
  606. cgu = ((cgu << 16) + 0x8000) / cy;
  607. cgv = ((cgv << 16) + 0x8000) / cy;
  608. av_free(c->yuvTable);
  609. switch (bpp) {
  610. case 1:
  611. c->yuvTable = av_malloc(1024);
  612. y_table = c->yuvTable;
  613. yb = -(384 << 16) - oy;
  614. for (i = 0; i < 1024 - 110; i++) {
  615. y_table[i + 110] = av_clip_uint8((yb + 0x8000) >> 16) >> 7;
  616. yb += cy;
  617. }
  618. fill_table(c->table_gU, 1, cgu, y_table + yoffs);
  619. fill_gv_table(c->table_gV, 1, cgv);
  620. break;
  621. case 4:
  622. case 4 | 128:
  623. rbase = isRgb ? 3 : 0;
  624. gbase = 1;
  625. bbase = isRgb ? 0 : 3;
  626. c->yuvTable = av_malloc(1024 * 3);
  627. y_table = c->yuvTable;
  628. yb = -(384 << 16) - oy;
  629. for (i = 0; i < 1024 - 110; i++) {
  630. int yval = av_clip_uint8((yb + 0x8000) >> 16);
  631. y_table[i + 110] = (yval >> 7) << rbase;
  632. y_table[i + 37 + 1024] = ((yval + 43) / 85) << gbase;
  633. y_table[i + 110 + 2048] = (yval >> 7) << bbase;
  634. yb += cy;
  635. }
  636. fill_table(c->table_rV, 1, crv, y_table + yoffs);
  637. fill_table(c->table_gU, 1, cgu, y_table + yoffs + 1024);
  638. fill_table(c->table_bU, 1, cbu, y_table + yoffs + 2048);
  639. fill_gv_table(c->table_gV, 1, cgv);
  640. break;
  641. case 8:
  642. rbase = isRgb ? 5 : 0;
  643. gbase = isRgb ? 2 : 3;
  644. bbase = isRgb ? 0 : 6;
  645. c->yuvTable = av_malloc(1024 * 3);
  646. y_table = c->yuvTable;
  647. yb = -(384 << 16) - oy;
  648. for (i = 0; i < 1024 - 38; i++) {
  649. int yval = av_clip_uint8((yb + 0x8000) >> 16);
  650. y_table[i + 16] = ((yval + 18) / 36) << rbase;
  651. y_table[i + 16 + 1024] = ((yval + 18) / 36) << gbase;
  652. y_table[i + 37 + 2048] = ((yval + 43) / 85) << bbase;
  653. yb += cy;
  654. }
  655. fill_table(c->table_rV, 1, crv, y_table + yoffs);
  656. fill_table(c->table_gU, 1, cgu, y_table + yoffs + 1024);
  657. fill_table(c->table_bU, 1, cbu, y_table + yoffs + 2048);
  658. fill_gv_table(c->table_gV, 1, cgv);
  659. break;
  660. case 12:
  661. rbase = isRgb ? 8 : 0;
  662. gbase = 4;
  663. bbase = isRgb ? 0 : 8;
  664. c->yuvTable = av_malloc(1024 * 3 * 2);
  665. y_table16 = c->yuvTable;
  666. yb = -(384 << 16) - oy;
  667. for (i = 0; i < 1024; i++) {
  668. uint8_t yval = av_clip_uint8((yb + 0x8000) >> 16);
  669. y_table16[i] = (yval >> 4) << rbase;
  670. y_table16[i + 1024] = (yval >> 4) << gbase;
  671. y_table16[i + 2048] = (yval >> 4) << bbase;
  672. yb += cy;
  673. }
  674. if (isNotNe)
  675. for (i = 0; i < 1024 * 3; i++)
  676. y_table16[i] = av_bswap16(y_table16[i]);
  677. fill_table(c->table_rV, 2, crv, y_table16 + yoffs);
  678. fill_table(c->table_gU, 2, cgu, y_table16 + yoffs + 1024);
  679. fill_table(c->table_bU, 2, cbu, y_table16 + yoffs + 2048);
  680. fill_gv_table(c->table_gV, 2, cgv);
  681. break;
  682. case 15:
  683. case 16:
  684. rbase = isRgb ? bpp - 5 : 0;
  685. gbase = 5;
  686. bbase = isRgb ? 0 : (bpp - 5);
  687. c->yuvTable = av_malloc(1024 * 3 * 2);
  688. y_table16 = c->yuvTable;
  689. yb = -(384 << 16) - oy;
  690. for (i = 0; i < 1024; i++) {
  691. uint8_t yval = av_clip_uint8((yb + 0x8000) >> 16);
  692. y_table16[i] = (yval >> 3) << rbase;
  693. y_table16[i + 1024] = (yval >> (18 - bpp)) << gbase;
  694. y_table16[i + 2048] = (yval >> 3) << bbase;
  695. yb += cy;
  696. }
  697. if (isNotNe)
  698. for (i = 0; i < 1024 * 3; i++)
  699. y_table16[i] = av_bswap16(y_table16[i]);
  700. fill_table(c->table_rV, 2, crv, y_table16 + yoffs);
  701. fill_table(c->table_gU, 2, cgu, y_table16 + yoffs + 1024);
  702. fill_table(c->table_bU, 2, cbu, y_table16 + yoffs + 2048);
  703. fill_gv_table(c->table_gV, 2, cgv);
  704. break;
  705. case 24:
  706. case 48:
  707. c->yuvTable = av_malloc(1024);
  708. y_table = c->yuvTable;
  709. yb = -(384 << 16) - oy;
  710. for (i = 0; i < 1024; i++) {
  711. y_table[i] = av_clip_uint8((yb + 0x8000) >> 16);
  712. yb += cy;
  713. }
  714. fill_table(c->table_rV, 1, crv, y_table + yoffs);
  715. fill_table(c->table_gU, 1, cgu, y_table + yoffs);
  716. fill_table(c->table_bU, 1, cbu, y_table + yoffs);
  717. fill_gv_table(c->table_gV, 1, cgv);
  718. break;
  719. case 32:
  720. base = (c->dstFormat == PIX_FMT_RGB32_1 ||
  721. c->dstFormat == PIX_FMT_BGR32_1) ? 8 : 0;
  722. rbase = base + (isRgb ? 16 : 0);
  723. gbase = base + 8;
  724. bbase = base + (isRgb ? 0 : 16);
  725. needAlpha = CONFIG_SWSCALE_ALPHA && isALPHA(c->srcFormat);
  726. if (!needAlpha)
  727. abase = (base + 24) & 31;
  728. c->yuvTable = av_malloc(1024 * 3 * 4);
  729. y_table32 = c->yuvTable;
  730. yb = -(384 << 16) - oy;
  731. for (i = 0; i < 1024; i++) {
  732. unsigned yval = av_clip_uint8((yb + 0x8000) >> 16);
  733. y_table32[i] = (yval << rbase) +
  734. (needAlpha ? 0 : (255u << abase));
  735. y_table32[i + 1024] = yval << gbase;
  736. y_table32[i + 2048] = yval << bbase;
  737. yb += cy;
  738. }
  739. fill_table(c->table_rV, 4, crv, y_table32 + yoffs);
  740. fill_table(c->table_gU, 4, cgu, y_table32 + yoffs + 1024);
  741. fill_table(c->table_bU, 4, cbu, y_table32 + yoffs + 2048);
  742. fill_gv_table(c->table_gV, 4, cgv);
  743. break;
  744. default:
  745. c->yuvTable = NULL;
  746. av_log(c, AV_LOG_ERROR, "%ibpp not supported by yuv2rgb\n", bpp);
  747. return -1;
  748. }
  749. return 0;
  750. }