You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

228 lines
6.0KB

  1. /*
  2. Copyright (C) 2003 Michael Niedermayer <michaelni@gmx.at>
  3. This program is free software; you can redistribute it and/or modify
  4. it under the terms of the GNU General Public License as published by
  5. the Free Software Foundation; either version 2 of the License, or
  6. (at your option) any later version.
  7. This program is distributed in the hope that it will be useful,
  8. but WITHOUT ANY WARRANTY; without even the implied warranty of
  9. MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  10. GNU General Public License for more details.
  11. You should have received a copy of the GNU General Public License
  12. along with this program; if not, write to the Free Software
  13. Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA
  14. */
  15. #include <stdio.h>
  16. #include <stdlib.h>
  17. #include <string.h>
  18. #include <inttypes.h>
  19. #include <stdarg.h>
  20. #undef HAVE_AV_CONFIG_H
  21. #include "avutil.h"
  22. #include "swscale.h"
  23. #include "swscale_internal.h"
  24. #include "rgb2rgb.h"
  /**
   * Sum of squared differences between two 8-bit sample planes.
   *
   * @param src1    first plane
   * @param src2    second plane
   * @param stride1 distance, in samples, between consecutive rows of src1
   * @param stride2 distance, in samples, between consecutive rows of src2
   * @param w       number of samples compared per row
   * @param h       number of rows compared
   * @return the sum over the w x h area of (src1 - src2)^2; 0 when w or h is
   *         not positive
   */
  static uint64_t getSSD(uint8_t *src1, uint8_t *src2, int stride1, int stride2, int w, int h){
      uint64_t total = 0;
      int row;

      for (row = 0; row < h; row++) {
          /* Offsets of the first sample of this row in each plane. */
          const int base1 = row * stride1;
          const int base2 = row * stride2;
          int col;

          for (col = 0; col < w; col++) {
              /* Both samples are promoted to int, so the difference is signed. */
              const int diff = src1[col + base1] - src2[col + base2];
              total += diff * diff;
          }
      }

      return total;
  }
  39. // test by ref -> src -> dst -> out & compare out against ref
  40. // ref & out are YV12
  41. static int doTest(uint8_t *ref[3], int refStride[3], int w, int h, int srcFormat, int dstFormat,
  42. int srcW, int srcH, int dstW, int dstH, int flags){
  43. uint8_t *src[3];
  44. uint8_t *dst[3];
  45. uint8_t *out[3];
  46. int srcStride[3], dstStride[3];
  47. int i;
  48. uint64_t ssdY, ssdU, ssdV;
  49. struct SwsContext *srcContext, *dstContext, *outContext;
  50. int res;
  51. res = 0;
  52. for(i=0; i<3; i++){
  53. // avoid stride % bpp != 0
  54. if(srcFormat==PIX_FMT_RGB24 || srcFormat==PIX_FMT_BGR24)
  55. srcStride[i]= srcW*3;
  56. else
  57. srcStride[i]= srcW*4;
  58. if(dstFormat==PIX_FMT_RGB24 || dstFormat==PIX_FMT_BGR24)
  59. dstStride[i]= dstW*3;
  60. else
  61. dstStride[i]= dstW*4;
  62. src[i]= (uint8_t*) malloc(srcStride[i]*srcH);
  63. dst[i]= (uint8_t*) malloc(dstStride[i]*dstH);
  64. out[i]= (uint8_t*) malloc(refStride[i]*h);
  65. if ((src[i] == NULL) || (dst[i] == NULL) || (out[i] == NULL)) {
  66. perror("Malloc");
  67. res = -1;
  68. goto end;
  69. }
  70. }
  71. dstContext = outContext = NULL;
  72. srcContext= sws_getContext(w, h, PIX_FMT_YUV420P, srcW, srcH, srcFormat, flags, NULL, NULL, NULL);
  73. if (srcContext == NULL) {
  74. fprintf(stderr, "Failed to get %s ---> %s\n",
  75. sws_format_name(PIX_FMT_YUV420P),
  76. sws_format_name(srcFormat));
  77. res = -1;
  78. goto end;
  79. }
  80. dstContext= sws_getContext(srcW, srcH, srcFormat, dstW, dstH, dstFormat, flags, NULL, NULL, NULL);
  81. if (dstContext == NULL) {
  82. fprintf(stderr, "Failed to get %s ---> %s\n",
  83. sws_format_name(srcFormat),
  84. sws_format_name(dstFormat));
  85. res = -1;
  86. goto end;
  87. }
  88. outContext= sws_getContext(dstW, dstH, dstFormat, w, h, PIX_FMT_YUV420P, flags, NULL, NULL, NULL);
  89. if (outContext == NULL) {
  90. fprintf(stderr, "Failed to get %s ---> %s\n",
  91. sws_format_name(dstFormat),
  92. sws_format_name(PIX_FMT_YUV420P));
  93. res = -1;
  94. goto end;
  95. }
  96. // printf("test %X %X %X -> %X %X %X\n", (int)ref[0], (int)ref[1], (int)ref[2],
  97. // (int)src[0], (int)src[1], (int)src[2]);
  98. sws_scale(srcContext, ref, refStride, 0, h , src, srcStride);
  99. sws_scale(dstContext, src, srcStride, 0, srcH, dst, dstStride);
  100. sws_scale(outContext, dst, dstStride, 0, dstH, out, refStride);
  101. #if defined(ARCH_X86) || defined(ARCH_X86_64)
  102. asm volatile ("emms\n\t");
  103. #endif
  104. ssdY= getSSD(ref[0], out[0], refStride[0], refStride[0], w, h);
  105. ssdU= getSSD(ref[1], out[1], refStride[1], refStride[1], (w+1)>>1, (h+1)>>1);
  106. ssdV= getSSD(ref[2], out[2], refStride[2], refStride[2], (w+1)>>1, (h+1)>>1);
  107. if(srcFormat == PIX_FMT_GRAY8 || dstFormat==PIX_FMT_GRAY8) ssdU=ssdV=0; //FIXME check that output is really gray
  108. ssdY/= w*h;
  109. ssdU/= w*h/4;
  110. ssdV/= w*h/4;
  111. if(ssdY>100 || ssdU>100 || ssdV>100){
  112. printf(" %s %dx%d -> %s %4dx%4d flags=%2d SSD=%5lld,%5lld,%5lld\n",
  113. sws_format_name(srcFormat), srcW, srcH,
  114. sws_format_name(dstFormat), dstW, dstH,
  115. flags,
  116. ssdY, ssdU, ssdV);
  117. }
  118. end:
  119. sws_freeContext(srcContext);
  120. sws_freeContext(dstContext);
  121. sws_freeContext(outContext);
  122. for(i=0; i<3; i++){
  123. free(src[i]);
  124. free(dst[i]);
  125. free(out[i]);
  126. }
  127. return res;
  128. }
  /**
   * Copy s bytes from b to a by delegating to the standard memcpy().
   *
   * FIXME: marked as provisional in the original source.
   * NOTE(review): presumably exists so that code referring to fast_memcpy
   * links in this test build -- confirm against the callers.
   *
   * @param a destination buffer
   * @param b source buffer
   * @param s number of bytes to copy
   */
  void fast_memcpy(void *a, void *b, int s)
  {
      void *const target = a;
      const void *const origin = b;

      memcpy(target, origin, s);
  }
  132. static void selfTest(uint8_t *src[3], int stride[3], int w, int h){
  133. enum PixelFormat srcFormat, dstFormat;
  134. int srcW, srcH, dstW, dstH;
  135. int flags;
  136. for(srcFormat = 0; srcFormat < PIX_FMT_NB; srcFormat++) {
  137. for(dstFormat = 0; dstFormat < PIX_FMT_NB; dstFormat++) {
  138. printf("%s -> %s\n",
  139. sws_format_name(srcFormat),
  140. sws_format_name(dstFormat));
  141. srcW= w;
  142. srcH= h;
  143. for(dstW=w - w/3; dstW<= 4*w/3; dstW+= w/3){
  144. for(dstH=h - h/3; dstH<= 4*h/3; dstH+= h/3){
  145. for(flags=1; flags<33; flags*=2) {
  146. int res;
  147. res = doTest(src, stride, w, h, srcFormat, dstFormat,
  148. srcW, srcH, dstW, dstH, flags);
  149. if (res < 0) {
  150. dstW = 4 * w / 3;
  151. dstH = 4 * h / 3;
  152. flags = 33;
  153. }
  154. }
  155. }
  156. }
  157. }
  158. }
  159. }
  160. #define W 96
  161. #define H 96
  162. int main(int argc, char **argv){
  163. uint8_t rgb_data[W*H*4];
  164. uint8_t *rgb_src[3]= {rgb_data, NULL, NULL};
  165. int rgb_stride[3]={4*W, 0, 0};
  166. uint8_t data[3][W*H];
  167. uint8_t *src[3]= {data[0], data[1], data[2]};
  168. int stride[3]={W, W, W};
  169. int x, y;
  170. struct SwsContext *sws;
  171. sws= sws_getContext(W/12, H/12, PIX_FMT_RGB32, W, H, PIX_FMT_YUV420P, 2, NULL, NULL, NULL);
  172. for(y=0; y<H; y++){
  173. for(x=0; x<W*4; x++){
  174. rgb_data[ x + y*4*W]= random();
  175. }
  176. }
  177. #if defined(ARCH_X86) || defined(ARCH_X86_64)
  178. sws_rgb2rgb_init(SWS_CPU_CAPS_MMX*0);
  179. #else
  180. sws_rgb2rgb_init(0);
  181. #endif
  182. sws_scale(sws, rgb_src, rgb_stride, 0, H , src, stride);
  183. #if defined(ARCH_X86) || defined(ARCH_X86_64)
  184. asm volatile ("emms\n\t");
  185. #endif
  186. selfTest(src, stride, W, H);
  187. return 123;
  188. }