You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

760 lines
24KB

  1. /*
  2. * This file is part of FFmpeg.
  3. *
  4. * Copyright (C) 2011, 2012 Hyllian/Jararaca - sergiogdb@gmail.com
  5. *
  6. * Copyright (c) 2014 Arwa Arif <arwaarif1994@gmail.com>
  7. *
  8. * FFmpeg is free software; you can redistribute it and/or modify
  9. * it under the terms of the GNU General Public License as published by
  10. * the Free Software Foundation; either version 2 of the License, or
  11. * (at your option) any later version.
  12. *
  13. * FFmpeg is distributed in the hope that it will be useful,
  14. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  15. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  16. * GNU General Public License for more details.
  17. *
  18. * You should have received a copy of the GNU General Public License along
  19. * with FFmpeg; if not, write to the Free Software Foundation, Inc.,
  20. * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
  21. */
  22. /**
  23. * @file
  24. * XBR Filter is used for depixelization of image.
  25. * This is based on Hyllian's xBR shader.
  26. *
  27. * @see http://www.libretro.com/forums/viewtopic.php?f=6&t=134
  28. * @see https://github.com/yoyofr/iFBA/blob/master/fba_src/src/intf/video/scalers/xbr.cpp
  29. *
  30. * @todo add threading and FATE test
  31. */
  32. #include "libavutil/opt.h"
  33. #include "libavutil/avassert.h"
  34. #include "libavutil/pixdesc.h"
  35. #include "internal.h"
  36. #define RGB_MASK 0x00FFFFFF
  37. #define LB_MASK 0x00FEFEFE
  38. #define RED_BLUE_MASK 0x00FF00FF
  39. #define GREEN_MASK 0x0000FF00
  40. typedef struct {
  41. const AVClass *class;
  42. int n;
  43. uint32_t rgbtoyuv[1<<24];
  44. } XBRContext;
  45. #define OFFSET(x) offsetof(XBRContext, x)
  46. static const AVOption xbr_options[] = {
  47. { "n", "set scale factor", OFFSET(n), AV_OPT_TYPE_INT, {.i64 = 3}, 2, 4, },
  48. { NULL }
  49. };
  50. AVFILTER_DEFINE_CLASS(xbr);
  51. static uint32_t df(uint32_t x, uint32_t y, const uint32_t *r2y)
  52. {
  53. #define YMASK 0xff0000
  54. #define UMASK 0x00ff00
  55. #define VMASK 0x0000ff
  56. uint32_t yuv1 = r2y[x & 0xffffff];
  57. uint32_t yuv2 = r2y[y & 0xffffff];
  58. return (abs((yuv1 & YMASK) - (yuv2 & YMASK)) >> 16) +
  59. (abs((yuv1 & UMASK) - (yuv2 & UMASK)) >> 8) +
  60. abs((yuv1 & VMASK) - (yuv2 & VMASK));
  61. }
  62. #define ALPHA_BLEND_128_W(dst, src) dst = ((src & LB_MASK) >> 1) + ((dst & LB_MASK) >> 1)
  63. #define ALPHA_BLEND_32_W(dst, src) \
  64. dst = ((RED_BLUE_MASK & ((dst & RED_BLUE_MASK) + ((((src & RED_BLUE_MASK) - \
  65. (dst & RED_BLUE_MASK))) >>3))) | (GREEN_MASK & ((dst & GREEN_MASK) + \
  66. ((((src & GREEN_MASK) - (dst & GREEN_MASK))) >>3))))
  67. #define ALPHA_BLEND_64_W(dst, src) \
  68. dst = ((RED_BLUE_MASK & ((dst & RED_BLUE_MASK) + ((((src & RED_BLUE_MASK) - \
  69. (dst & RED_BLUE_MASK))) >>2))) | (GREEN_MASK & ((dst & GREEN_MASK) + \
  70. ((((src & GREEN_MASK) - (dst & GREEN_MASK))) >>2))))
  71. #define ALPHA_BLEND_192_W(dst, src) \
  72. dst = ((RED_BLUE_MASK & ((dst & RED_BLUE_MASK) + ((((src & RED_BLUE_MASK) - \
  73. (dst & RED_BLUE_MASK)) * 3) >>2))) | (GREEN_MASK & ((dst & GREEN_MASK) + \
  74. ((((src & GREEN_MASK) - (dst & GREEN_MASK)) * 3) >>2))))
  75. #define ALPHA_BLEND_224_W(dst, src) \
  76. dst = ((RED_BLUE_MASK & ((dst & RED_BLUE_MASK) + ((((src & RED_BLUE_MASK) - \
  77. (dst & RED_BLUE_MASK)) * 7) >>3))) | (GREEN_MASK & ((dst & GREEN_MASK) + \
  78. ((((src & GREEN_MASK) - (dst & GREEN_MASK)) * 7) >>3))))
  79. #define LEFT_UP_2_2X(N3, N2, N1, PIXEL)\
  80. ALPHA_BLEND_224_W(E[N3], PIXEL); \
  81. ALPHA_BLEND_64_W( E[N2], PIXEL); \
  82. E[N1] = E[N2]; \
  83. #define LEFT_2_2X(N3, N2, PIXEL)\
  84. ALPHA_BLEND_192_W(E[N3], PIXEL); \
  85. ALPHA_BLEND_64_W( E[N2], PIXEL); \
  86. #define UP_2_2X(N3, N1, PIXEL)\
  87. ALPHA_BLEND_192_W(E[N3], PIXEL); \
  88. ALPHA_BLEND_64_W( E[N1], PIXEL); \
  89. #define DIA_2X(N3, PIXEL)\
  90. ALPHA_BLEND_128_W(E[N3], PIXEL); \
  91. #define eq(A, B, r2y)\
  92. (df(A, B, r2y) < 155)\
  93. #define FILTRO(PE, PI, PH, PF, PG, PC, PD, PB, PA, G5, C4, G0, D0, C1, B1, F4, I4, H5, I5, A0, A1, N0, N1, N2, N3,r2y) \
  94. ex = (PE!=PH && PE!=PF); \
  95. if ( ex )\
  96. {\
  97. e = (df(PE,PC,r2y)+df(PE,PG,r2y)+df(PI,H5,r2y)+df(PI,F4,r2y))+(df(PH,PF,r2y)<<2); \
  98. i = (df(PH,PD,r2y)+df(PH,I5,r2y)+df(PF,I4,r2y)+df(PF,PB,r2y))+(df(PE,PI,r2y)<<2); \
  99. if ((e<i) && ( !eq(PF,PB,r2y) && !eq(PH,PD,r2y) || eq(PE,PI,r2y) && (!eq(PF,I4,r2y) && !eq(PH,I5,r2y)) || eq(PE,PG,r2y) || eq(PE,PC,r2y)) )\
  100. {\
  101. ke=df(PF,PG,r2y); ki=df(PH,PC,r2y); \
  102. ex2 = (PE!=PC && PB!=PC); ex3 = (PE!=PG && PD!=PG); px = (df(PE,PF,r2y) <= df(PE,PH,r2y)) ? PF : PH; \
  103. if ( ((ke<<1)<=ki) && ex3 && (ke>=(ki<<1)) && ex2 ) \
  104. {\
  105. LEFT_UP_2_2X(N3, N2, N1, px)\
  106. }\
  107. else if ( ((ke<<1)<=ki) && ex3 ) \
  108. {\
  109. LEFT_2_2X(N3, N2, px);\
  110. }\
  111. else if ( (ke>=(ki<<1)) && ex2 ) \
  112. {\
  113. UP_2_2X(N3, N1, px);\
  114. }\
  115. else \
  116. {\
  117. DIA_2X(N3, px);\
  118. }\
  119. }\
  120. else if (e<=i)\
  121. {\
  122. ALPHA_BLEND_128_W( E[N3], ((df(PE,PF,r2y) <= df(PE,PH,r2y)) ? PF : PH)); \
  123. }\
  124. }\
  125. static void xbr2x(AVFrame * input, AVFrame * output, const uint32_t * r2y)
  126. {
  127. unsigned int e, i,px;
  128. unsigned int ex, ex2, ex3;
  129. unsigned int ke, ki;
  130. int x,y;
  131. int next_line = output->linesize[0]>>2;
  132. for (y = 0; y < input->height; y++) {
  133. uint32_t pprev;
  134. uint32_t pprev2;
  135. uint32_t * E = (uint32_t *)(output->data[0] + y * output->linesize[0] * 2);
  136. /* middle. Offset of -8 is given */
  137. uint32_t * sa2 = (uint32_t *)(input->data[0] + y * input->linesize[0] - 8);
  138. /* up one */
  139. uint32_t * sa1 = sa2 - (input->linesize[0]>>2);
  140. /* up two */
  141. uint32_t * sa0 = sa1 - (input->linesize[0]>>2);
  142. /* down one */
  143. uint32_t * sa3 = sa2 + (input->linesize[0]>>2);
  144. /* down two */
  145. uint32_t * sa4 = sa3 + (input->linesize[0]>>2);
  146. if (y <= 1) {
  147. sa0 = sa1;
  148. if (y == 0) {
  149. sa0 = sa1 = sa2;
  150. }
  151. }
  152. if (y >= input->height - 2) {
  153. sa4 = sa3;
  154. if (y == input->height - 1) {
  155. sa4 = sa3 = sa2;
  156. }
  157. }
  158. pprev = pprev2 = 2;
  159. for (x = 0; x < input->width; x++) {
  160. uint32_t B1 = sa0[2];
  161. uint32_t PB = sa1[2];
  162. uint32_t PE = sa2[2];
  163. uint32_t PH = sa3[2];
  164. uint32_t H5 = sa4[2];
  165. uint32_t A1 = sa0[pprev];
  166. uint32_t PA = sa1[pprev];
  167. uint32_t PD = sa2[pprev];
  168. uint32_t PG = sa3[pprev];
  169. uint32_t G5 = sa4[pprev];
  170. uint32_t A0 = sa1[pprev2];
  171. uint32_t D0 = sa2[pprev2];
  172. uint32_t G0 = sa3[pprev2];
  173. uint32_t C1 = 0;
  174. uint32_t PC = 0;
  175. uint32_t PF = 0;
  176. uint32_t PI = 0;
  177. uint32_t I5 = 0;
  178. uint32_t C4 = 0;
  179. uint32_t F4 = 0;
  180. uint32_t I4 = 0;
  181. if (x >= input->width - 2) {
  182. if (x == input->width - 1) {
  183. C1 = sa0[2];
  184. PC = sa1[2];
  185. PF = sa2[2];
  186. PI = sa3[2];
  187. I5 = sa4[2];
  188. C4 = sa1[2];
  189. F4 = sa2[2];
  190. I4 = sa3[2];
  191. } else {
  192. C1 = sa0[3];
  193. PC = sa1[3];
  194. PF = sa2[3];
  195. PI = sa3[3];
  196. I5 = sa4[3];
  197. C4 = sa1[3];
  198. F4 = sa2[3];
  199. I4 = sa3[3];
  200. }
  201. } else {
  202. C1 = sa0[3];
  203. PC = sa1[3];
  204. PF = sa2[3];
  205. PI = sa3[3];
  206. I5 = sa4[3];
  207. C4 = sa1[4];
  208. F4 = sa2[4];
  209. I4 = sa3[4];
  210. }
  211. E[0] = E[1] = E[next_line] = E[next_line + 1] = PE; // 0, 1, 2, 3
  212. FILTRO(PE, PI, PH, PF, PG, PC, PD, PB, PA, G5, C4, G0, D0, C1, B1, F4, I4, H5, I5, A0, A1, 0, 1, next_line, next_line+1,r2y);
  213. FILTRO(PE, PC, PF, PB, PI, PA, PH, PD, PG, I4, A1, I5, H5, A0, D0, B1, C1, F4, C4, G5, G0, next_line, 0, next_line+1, 1,r2y);
  214. FILTRO(PE, PA, PB, PD, PC, PG, PF, PH, PI, C1, G0, C4, F4, G5, H5, D0, A0, B1, A1, I4, I5, next_line+1, next_line, 1, 0,r2y);
  215. FILTRO(PE, PG, PD, PH, PA, PI, PB, PF, PC, A0, I5, A1, B1, I4, F4, H5, G5, D0, G0, C1, C4, 1, next_line+1, 0, next_line,r2y);
  216. sa0 += 1;
  217. sa1 += 1;
  218. sa2 += 1;
  219. sa3 += 1;
  220. sa4 += 1;
  221. E += 2;
  222. if (pprev2){
  223. pprev2--;
  224. pprev = 1;
  225. }
  226. }
  227. }
  228. }
  229. #undef FILTRO
  230. #define LEFT_UP_2_3X(N7, N5, N6, N2, N8, PIXEL)\
  231. ALPHA_BLEND_192_W(E[N7], PIXEL); \
  232. ALPHA_BLEND_64_W( E[N6], PIXEL); \
  233. E[N5] = E[N7]; \
  234. E[N2] = E[N6]; \
  235. E[N8] = PIXEL;\
  236. #define LEFT_2_3X(N7, N5, N6, N8, PIXEL)\
  237. ALPHA_BLEND_192_W(E[N7], PIXEL); \
  238. ALPHA_BLEND_64_W( E[N5], PIXEL); \
  239. ALPHA_BLEND_64_W( E[N6], PIXEL); \
  240. E[N8] = PIXEL;\
  241. #define UP_2_3X(N5, N7, N2, N8, PIXEL)\
  242. ALPHA_BLEND_192_W(E[N5], PIXEL); \
  243. ALPHA_BLEND_64_W( E[N7], PIXEL); \
  244. ALPHA_BLEND_64_W( E[N2], PIXEL); \
  245. E[N8] = PIXEL;\
  246. #define DIA_3X(N8, N5, N7, PIXEL)\
  247. ALPHA_BLEND_224_W(E[N8], PIXEL); \
  248. ALPHA_BLEND_32_W(E[N5], PIXEL); \
  249. ALPHA_BLEND_32_W(E[N7], PIXEL); \
  250. #define FILTRO(PE, PI, PH, PF, PG, PC, PD, PB, PA, G5, C4, G0, D0, C1, B1, F4, I4, H5, I5, A0, A1, N0, N1, N2, N3, N4, N5, N6, N7, N8,r2y) \
  251. ex = (PE!=PH && PE!=PF); \
  252. if ( ex )\
  253. {\
  254. e = (df(PE,PC,r2y)+df(PE,PG,r2y)+df(PI,H5,r2y)+df(PI,F4,r2y))+(df(PH,PF,r2y)<<2); \
  255. i = (df(PH,PD,r2y)+df(PH,I5,r2y)+df(PF,I4,r2y)+df(PF,PB,r2y))+(df(PE,PI,r2y)<<2); \
  256. if ((e<i) && ( !eq(PF,PB,r2y) && !eq(PF,PC,r2y) || !eq(PH,PD,r2y) && !eq(PH,PG,r2y) || eq(PE,PI,r2y) && (!eq(PF,F4,r2y) && !eq(PF,I4,r2y) || !eq(PH,H5,r2y) && !eq(PH,I5,r2y)) || eq(PE,PG,r2y) || eq(PE,PC,r2y)) )\
  257. {\
  258. ke=df(PF,PG,r2y); ki=df(PH,PC,r2y); \
  259. ex2 = (PE!=PC && PB!=PC); ex3 = (PE!=PG && PD!=PG); px = (df(PE,PF,r2y) <= df(PE,PH,r2y)) ? PF : PH; \
  260. if ( ((ke<<1)<=ki) && ex3 && (ke>=(ki<<1)) && ex2 ) \
  261. {\
  262. LEFT_UP_2_3X(N7, N5, N6, N2, N8, px)\
  263. }\
  264. else if ( ((ke<<1)<=ki) && ex3 ) \
  265. {\
  266. LEFT_2_3X(N7, N5, N6, N8, px);\
  267. }\
  268. else if ( (ke>=(ki<<1)) && ex2 ) \
  269. {\
  270. UP_2_3X(N5, N7, N2, N8, px);\
  271. }\
  272. else \
  273. {\
  274. DIA_3X(N8, N5, N7, px);\
  275. }\
  276. }\
  277. else if (e<=i)\
  278. {\
  279. ALPHA_BLEND_128_W( E[N8], ((df(PE,PF,r2y) <= df(PE,PH,r2y)) ? PF : PH)); \
  280. }\
  281. }\
  282. static void xbr3x(AVFrame *input, AVFrame *output, const uint32_t *r2y)
  283. {
  284. const int nl = output->linesize[0]>>2;
  285. const int nl1 = nl + nl;
  286. unsigned int e, i,px;
  287. unsigned int ex, ex2, ex3;
  288. unsigned int ke, ki;
  289. uint32_t pprev;
  290. uint32_t pprev2;
  291. int x,y;
  292. for (y = 0; y < input->height; y++) {
  293. uint32_t * E = (uint32_t *)(output->data[0] + y * output->linesize[0] * 3);
  294. /* middle. Offset of -8 is given */
  295. uint32_t * sa2 = (uint32_t *)(input->data[0] + y * input->linesize[0] - 8);
  296. /* up one */
  297. uint32_t * sa1 = sa2 - (input->linesize[0]>>2);
  298. /* up two */
  299. uint32_t * sa0 = sa1 - (input->linesize[0]>>2);
  300. /* down one */
  301. uint32_t * sa3 = sa2 + (input->linesize[0]>>2);
  302. /* down two */
  303. uint32_t * sa4 = sa3 + (input->linesize[0]>>2);
  304. if (y <= 1){
  305. sa0 = sa1;
  306. if (y == 0){
  307. sa0 = sa1 = sa2;
  308. }
  309. }
  310. if (y >= input->height - 2){
  311. sa4 = sa3;
  312. if (y == input->height - 1){
  313. sa4 = sa3 = sa2;
  314. }
  315. }
  316. pprev = pprev2 = 2;
  317. for (x = 0; x < input->width; x++){
  318. uint32_t B1 = sa0[2];
  319. uint32_t PB = sa1[2];
  320. uint32_t PE = sa2[2];
  321. uint32_t PH = sa3[2];
  322. uint32_t H5 = sa4[2];
  323. uint32_t A1 = sa0[pprev];
  324. uint32_t PA = sa1[pprev];
  325. uint32_t PD = sa2[pprev];
  326. uint32_t PG = sa3[pprev];
  327. uint32_t G5 = sa4[pprev];
  328. uint32_t A0 = sa1[pprev2];
  329. uint32_t D0 = sa2[pprev2];
  330. uint32_t G0 = sa3[pprev2];
  331. uint32_t C1 = 0;
  332. uint32_t PC = 0;
  333. uint32_t PF = 0;
  334. uint32_t PI = 0;
  335. uint32_t I5 = 0;
  336. uint32_t C4 = 0;
  337. uint32_t F4 = 0;
  338. uint32_t I4 = 0;
  339. if (x >= input->width - 2){
  340. if (x == input->width - 1){
  341. C1 = sa0[2];
  342. PC = sa1[2];
  343. PF = sa2[2];
  344. PI = sa3[2];
  345. I5 = sa4[2];
  346. C4 = sa1[2];
  347. F4 = sa2[2];
  348. I4 = sa3[2];
  349. } else {
  350. C1 = sa0[3];
  351. PC = sa1[3];
  352. PF = sa2[3];
  353. PI = sa3[3];
  354. I5 = sa4[3];
  355. C4 = sa1[3];
  356. F4 = sa2[3];
  357. I4 = sa3[3];
  358. }
  359. } else {
  360. C1 = sa0[3];
  361. PC = sa1[3];
  362. PF = sa2[3];
  363. PI = sa3[3];
  364. I5 = sa4[3];
  365. C4 = sa1[4];
  366. F4 = sa2[4];
  367. I4 = sa3[4];
  368. }
  369. E[0] = E[1] = E[2] = PE;
  370. E[nl] = E[nl+1] = E[nl+2] = PE; // 3, 4, 5
  371. E[nl1] = E[nl1+1] = E[nl1+2] = PE; // 6, 7, 8
  372. FILTRO(PE, PI, PH, PF, PG, PC, PD, PB, PA, G5, C4, G0, D0, C1, B1, F4, I4, H5, I5, A0, A1, 0, 1, 2, nl, nl+1, nl+2, nl1, nl1+1, nl1+2,r2y);
  373. FILTRO(PE, PC, PF, PB, PI, PA, PH, PD, PG, I4, A1, I5, H5, A0, D0, B1, C1, F4, C4, G5, G0, nl1, nl, 0, nl1+1, nl+1, 1, nl1+2, nl+2, 2,r2y);
  374. FILTRO(PE, PA, PB, PD, PC, PG, PF, PH, PI, C1, G0, C4, F4, G5, H5, D0, A0, B1, A1, I4, I5, nl1+2, nl1+1, nl1, nl+2, nl+1, nl, 2, 1, 0,r2y);
  375. FILTRO(PE, PG, PD, PH, PA, PI, PB, PF, PC, A0, I5, A1, B1, I4, F4, H5, G5, D0, G0, C1, C4, 2, nl+2, nl1+2, 1, nl+1, nl1+1, 0, nl, nl1,r2y);
  376. sa0 += 1;
  377. sa1 += 1;
  378. sa2 += 1;
  379. sa3 += 1;
  380. sa4 += 1;
  381. E += 3;
  382. if (pprev2){
  383. pprev2--;
  384. pprev = 1;
  385. }
  386. }
  387. }
  388. }
  389. #undef FILTRO
  390. #define LEFT_UP_2(N15, N14, N11, N13, N12, N10, N7, N3, PIXEL)\
  391. ALPHA_BLEND_192_W(E[N13], PIXEL); \
  392. ALPHA_BLEND_64_W( E[N12], PIXEL); \
  393. E[N15] = E[N14] = E[N11] = PIXEL; \
  394. E[N10] = E[N3] = E[N12]; \
  395. E[N7] = E[N13]; \
  396. #define LEFT_2(N15, N14, N11, N13, N12, N10, PIXEL)\
  397. ALPHA_BLEND_192_W(E[N11], PIXEL); \
  398. ALPHA_BLEND_192_W(E[N13], PIXEL); \
  399. ALPHA_BLEND_64_W( E[N10], PIXEL); \
  400. ALPHA_BLEND_64_W( E[N12], PIXEL); \
  401. E[N14] = PIXEL; \
  402. E[N15] = PIXEL; \
  403. #define UP_2(N15, N14, N11, N3, N7, N10, PIXEL)\
  404. ALPHA_BLEND_192_W(E[N14], PIXEL); \
  405. ALPHA_BLEND_192_W(E[N7 ], PIXEL); \
  406. ALPHA_BLEND_64_W( E[N10], PIXEL); \
  407. ALPHA_BLEND_64_W( E[N3 ], PIXEL); \
  408. E[N11] = PIXEL; \
  409. E[N15] = PIXEL; \
  410. #define DIA(N15, N14, N11, PIXEL)\
  411. ALPHA_BLEND_128_W(E[N11], PIXEL); \
  412. ALPHA_BLEND_128_W(E[N14], PIXEL); \
  413. E[N15] = PIXEL; \
  414. #define FILTRO(PE, PI, PH, PF, PG, PC, PD, PB, PA, G5, C4, G0, D0, C1, B1, F4, I4, H5, I5, A0, A1, N15, N14, N11, N3, N7, N10, N13, N12, N9, N6, N2, N1, N5, N8, N4, N0,r2y) \
  415. ex = (PE!=PH && PE!=PF); \
  416. if ( ex )\
  417. {\
  418. e = (df(PE,PC,r2y)+df(PE,PG,r2y)+df(PI,H5,r2y)+df(PI,F4,r2y))+(df(PH,PF,r2y)<<2); \
  419. i = (df(PH,PD,r2y)+df(PH,I5,r2y)+df(PF,I4,r2y)+df(PF,PB,r2y))+(df(PE,PI,r2y)<<2); \
  420. if ((e<i) && ( !eq(PF,PB,r2y) && !eq(PH,PD,r2y) || eq(PE,PI,r2y) && (!eq(PF,I4,r2y) && !eq(PH,I5,r2y)) || eq(PE,PG,r2y) || eq(PE,PC,r2y)) )\
  421. {\
  422. ke=df(PF,PG,r2y); ki=df(PH,PC,r2y); \
  423. ex2 = (PE!=PC && PB!=PC); ex3 = (PE!=PG && PD!=PG); px = (df(PE,PF,r2y) <= df(PE,PH,r2y)) ? PF : PH; \
  424. if ( ((ke<<1)<=ki) && ex3 && (ke>=(ki<<1)) && ex2 ) \
  425. {\
  426. LEFT_UP_2(N15, N14, N11, N13, N12, N10, N7, N3, px)\
  427. }\
  428. else if ( ((ke<<1)<=ki) && ex3 ) \
  429. {\
  430. LEFT_2(N15, N14, N11, N13, N12, N10, px)\
  431. }\
  432. else if ( (ke>=(ki<<1)) && ex2 ) \
  433. {\
  434. UP_2(N15, N14, N11, N3, N7, N10, px)\
  435. }\
  436. else \
  437. {\
  438. DIA(N15, N14, N11, px)\
  439. }\
  440. }\
  441. else if (e<=i)\
  442. {\
  443. ALPHA_BLEND_128_W( E[N15], ((df(PE,PF,r2y) <= df(PE,PH,r2y)) ? PF : PH)); \
  444. }\
  445. }\
  446. static void xbr4x(AVFrame *input, AVFrame *output, const uint32_t *r2y)
  447. {
  448. const int nl = output->linesize[0]>>2;
  449. const int nl1 = nl + nl;
  450. const int nl2 = nl1 + nl;
  451. unsigned int e, i, px;
  452. unsigned int ex, ex2, ex3;
  453. unsigned int ke, ki;
  454. uint32_t pprev;
  455. uint32_t pprev2;
  456. int x, y;
  457. for (y = 0; y < input->height; y++) {
  458. uint32_t * E = (uint32_t *)(output->data[0] + y * output->linesize[0] * 4);
  459. /* middle. Offset of -8 is given */
  460. uint32_t * sa2 = (uint32_t *)(input->data[0] + y * input->linesize[0] - 8);
  461. /* up one */
  462. uint32_t * sa1 = sa2 - (input->linesize[0]>>2);
  463. /* up two */
  464. uint32_t * sa0 = sa1 - (input->linesize[0]>>2);
  465. /* down one */
  466. uint32_t * sa3 = sa2 + (input->linesize[0]>>2);
  467. /* down two */
  468. uint32_t * sa4 = sa3 + (input->linesize[0]>>2);
  469. if (y <= 1) {
  470. sa0 = sa1;
  471. if (y == 0) {
  472. sa0 = sa1 = sa2;
  473. }
  474. }
  475. if (y >= input->height - 2) {
  476. sa4 = sa3;
  477. if (y == input->height - 1) {
  478. sa4 = sa3 = sa2;
  479. }
  480. }
  481. pprev = pprev2 = 2;
  482. for (x = 0; x < input->width; x++) {
  483. uint32_t B1 = sa0[2];
  484. uint32_t PB = sa1[2];
  485. uint32_t PE = sa2[2];
  486. uint32_t PH = sa3[2];
  487. uint32_t H5 = sa4[2];
  488. uint32_t A1 = sa0[pprev];
  489. uint32_t PA = sa1[pprev];
  490. uint32_t PD = sa2[pprev];
  491. uint32_t PG = sa3[pprev];
  492. uint32_t G5 = sa4[pprev];
  493. uint32_t A0 = sa1[pprev2];
  494. uint32_t D0 = sa2[pprev2];
  495. uint32_t G0 = sa3[pprev2];
  496. uint32_t C1 = 0;
  497. uint32_t PC = 0;
  498. uint32_t PF = 0;
  499. uint32_t PI = 0;
  500. uint32_t I5 = 0;
  501. uint32_t C4 = 0;
  502. uint32_t F4 = 0;
  503. uint32_t I4 = 0;
  504. if (x >= input->width - 2) {
  505. if (x == input->width - 1) {
  506. C1 = sa0[2];
  507. PC = sa1[2];
  508. PF = sa2[2];
  509. PI = sa3[2];
  510. I5 = sa4[2];
  511. C4 = sa1[2];
  512. F4 = sa2[2];
  513. I4 = sa3[2];
  514. } else {
  515. C1 = sa0[3];
  516. PC = sa1[3];
  517. PF = sa2[3];
  518. PI = sa3[3];
  519. I5 = sa4[3];
  520. C4 = sa1[3];
  521. F4 = sa2[3];
  522. I4 = sa3[3];
  523. }
  524. } else {
  525. C1 = sa0[3];
  526. PC = sa1[3];
  527. PF = sa2[3];
  528. PI = sa3[3];
  529. I5 = sa4[3];
  530. C4 = sa1[4];
  531. F4 = sa2[4];
  532. I4 = sa3[4];
  533. }
  534. E[0] = E[1] = E[2] = E[3] = PE;
  535. E[nl] = E[nl+1] = E[nl+2] = E[nl+3] = PE; // 4, 5, 6, 7
  536. E[nl1] = E[nl1+1] = E[nl1+2] = E[nl1+3] = PE; // 8, 9, 10, 11
  537. E[nl2] = E[nl2+1] = E[nl2+2] = E[nl2+3] = PE; // 12, 13, 14, 15
  538. FILTRO(PE, PI, PH, PF, PG, PC, PD, PB, PA, G5, C4, G0, D0, C1, B1, F4, I4, H5, I5, A0, A1, nl2+3, nl2+2, nl1+3, 3, nl+3, nl1+2, nl2+1, nl2, nl1+1, nl+2, 2, 1, nl+1, nl1, nl, 0,r2y);
  539. FILTRO(PE, PC, PF, PB, PI, PA, PH, PD, PG, I4, A1, I5, H5, A0, D0, B1, C1, F4, C4, G5, G0, 3, nl+3, 2, 0, 1, nl+2, nl1+3, nl2+3, nl1+2, nl+1, nl, nl1, nl1+1,nl2+2,nl2+1,nl2,r2y);
  540. FILTRO(PE, PA, PB, PD, PC, PG, PF, PH, PI, C1, G0, C4, F4, G5, H5, D0, A0, B1, A1, I4, I5, 0, 1, nl, nl2, nl1, nl+1, 2, 3, nl+2, nl1+1, nl2+1,nl2+2,nl1+2, nl+3,nl1+3,nl2+3,r2y);
  541. FILTRO(PE, PG, PD, PH, PA, PI, PB, PF, PC, A0, I5, A1, B1, I4, F4, H5, G5, D0, G0, C1, C4, nl2, nl1, nl2+1, nl2+3, nl2+2, nl1+1, nl, 0, nl+1, nl1+2, nl1+3, nl+3, nl+2, 1, 2, 3,r2y);
  542. sa0 += 1;
  543. sa1 += 1;
  544. sa2 += 1;
  545. sa3 += 1;
  546. sa4 += 1;
  547. E += 4;
  548. if (pprev2){
  549. pprev2--;
  550. pprev = 1;
  551. }
  552. }
  553. }
  554. }
  555. #undef FILTRO
  556. static int config_output(AVFilterLink *outlink)
  557. {
  558. AVFilterContext *ctx = outlink->src;
  559. XBRContext *xbr = ctx->priv;
  560. AVFilterLink *inlink = ctx->inputs[0];
  561. outlink->w = inlink->w * xbr->n;
  562. outlink->h = inlink->h * xbr->n;
  563. return 0;
  564. }
  565. static int query_formats(AVFilterContext *ctx)
  566. {
  567. static const enum AVPixelFormat pix_fmts[] = {
  568. AV_PIX_FMT_0RGB32, AV_PIX_FMT_NONE,
  569. };
  570. ff_set_common_formats(ctx, ff_make_format_list(pix_fmts));
  571. return 0;
  572. }
  573. static int filter_frame(AVFilterLink *inlink, AVFrame *in)
  574. {
  575. AVFilterContext *ctx = inlink->dst;
  576. AVFilterLink *outlink = ctx->outputs[0];
  577. XBRContext *xbr = ctx->priv;
  578. const uint32_t *r2y = xbr->rgbtoyuv;
  579. AVFrame *out = ff_get_video_buffer(outlink, outlink->w, outlink->h);
  580. if (!out) {
  581. av_frame_free(&in);
  582. return AVERROR(ENOMEM);
  583. }
  584. av_frame_copy_props(out, in);
  585. if (xbr->n == 4)
  586. xbr4x(in, out, r2y);
  587. else if (xbr->n == 3)
  588. xbr3x(in, out, r2y);
  589. else
  590. xbr2x(in, out, r2y);
  591. out->width = outlink->w;
  592. out->height = outlink->h;
  593. av_frame_free(&in);
  594. return ff_filter_frame(outlink, out);
  595. }
  596. static int init(AVFilterContext *ctx)
  597. {
  598. XBRContext *xbr = ctx->priv;
  599. uint32_t c;
  600. int bg, rg, g;
  601. for (bg = -255; bg < 256; bg++) {
  602. for (rg = -255; rg < 256; rg++) {
  603. const uint32_t u = (uint32_t)((-169*rg + 500*bg)/1000) + 128;
  604. const uint32_t v = (uint32_t)(( 500*rg - 81*bg)/1000) + 128;
  605. int startg = FFMAX3(-bg, -rg, 0);
  606. int endg = FFMIN3(255-bg, 255-rg, 255);
  607. uint32_t y = (uint32_t)(( 299*rg + 1000*startg + 114*bg)/1000);
  608. c = bg + (rg<<16) + 0x010101 * startg;
  609. for (g = startg; g <= endg; g++) {
  610. xbr->rgbtoyuv[c] = ((y++) << 16) + (u << 8) + v;
  611. c+= 0x010101;
  612. }
  613. }
  614. }
  615. return 0;
  616. }
  617. static const AVFilterPad xbr_inputs[] = {
  618. {
  619. .name = "default",
  620. .type = AVMEDIA_TYPE_VIDEO,
  621. .filter_frame = filter_frame,
  622. },
  623. { NULL }
  624. };
  625. static const AVFilterPad xbr_outputs[] = {
  626. {
  627. .name = "default",
  628. .type = AVMEDIA_TYPE_VIDEO,
  629. .config_props = config_output,
  630. },
  631. { NULL }
  632. };
  633. AVFilter ff_vf_xbr = {
  634. .name = "xbr",
  635. .description = NULL_IF_CONFIG_SMALL("Scale the input using xBR algorithm."),
  636. .inputs = xbr_inputs,
  637. .outputs = xbr_outputs,
  638. .query_formats = query_formats,
  639. .priv_size = sizeof(XBRContext),
  640. .priv_class = &xbr_class,
  641. .init = init,
  642. };