|
- /*
- * Misc image conversion routines
- * Copyright (c) 2001, 2002 Fabrice Bellard.
- *
- * This library is free software; you can redistribute it and/or
- * modify it under the terms of the GNU Lesser General Public
- * License as published by the Free Software Foundation; either
- * version 2 of the License, or (at your option) any later version.
- *
- * This library is distributed in the hope that it will be useful,
- * but WITHOUT ANY WARRANTY; without even the implied warranty of
- * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
- * Lesser General Public License for more details.
- *
- * You should have received a copy of the GNU Lesser General Public
- * License along with this library; if not, write to the Free Software
- * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
- */
- #include "avcodec.h"
- #include "dsputil.h"
-
- #ifdef USE_FASTMEMCPY
- #include "fastmemcpy.h"
- #endif
-
- #ifdef HAVE_MMX
- #include "i386/mmx.h"
- #endif
- /* XXX: totally non optimized */
-
/**
 * Convert a packed 4:2:2 image (bytes ordered Y0 Cb Y1 Cr) to planar 4:2:0.
 *
 * Rows are consumed in pairs: the first row of each pair supplies luma and
 * chroma, the second supplies luma only (its chroma bytes are skipped, no
 * vertical filtering is done). All pointers advance contiguously, i.e. no
 * line stride is applied to either the source or the destination planes.
 *
 * @param lum    destination luma plane
 * @param cb     destination Cb plane
 * @param cr     destination Cr plane
 * @param src    packed source pixels
 * @param width  picture width in pixels (processed two pixels at a time)
 * @param height picture height in pixels (processed two rows at a time)
 */
static void yuv422_to_yuv420p(UINT8 *lum, UINT8 *cb, UINT8 *cr,
                              UINT8 *src, int width, int height)
{
    const UINT8 *in = src;
    int row, col;

    for (row = 0; row < height; row += 2) {
        /* first row of the pair: keep luma and chroma */
        for (col = 0; col < width; col += 2) {
            *lum++ = in[0];
            *cb++  = in[1];
            *lum++ = in[2];
            *cr++  = in[3];
            in += 4;
        }
        /* second row of the pair: keep luma only */
        for (col = 0; col < width; col += 2) {
            *lum++ = in[0];
            *lum++ = in[2];
            in += 4;
        }
    }
}
-
/* Fixed-point helpers used by the RGB -> YCbCr converters. */
#define SCALEBITS 8                                     /* number of fractional bits */
#define ONE_HALF  (1 << (SCALEBITS - 1))                /* 0.5 in fixed point, added for rounding */
#define FIX(x)    ((int) ((x) * (1L<<SCALEBITS) + 0.5)) /* real constant -> rounded fixed point */
-
- static void rgb24_to_yuv420p(UINT8 *lum, UINT8 *cb, UINT8 *cr,
- UINT8 *src, int width, int height)
- {
- int wrap, wrap3, x, y;
- int r, g, b, r1, g1, b1;
- UINT8 *p;
-
- wrap = width;
- wrap3 = width * 3;
- p = src;
- for(y=0;y<height;y+=2) {
- for(x=0;x<width;x+=2) {
- r = p[0];
- g = p[1];
- b = p[2];
- r1 = r;
- g1 = g;
- b1 = b;
- lum[0] = (FIX(0.29900) * r + FIX(0.58700) * g +
- FIX(0.11400) * b + ONE_HALF) >> SCALEBITS;
- r = p[3];
- g = p[4];
- b = p[5];
- r1 += r;
- g1 += g;
- b1 += b;
- lum[1] = (FIX(0.29900) * r + FIX(0.58700) * g +
- FIX(0.11400) * b + ONE_HALF) >> SCALEBITS;
- p += wrap3;
- lum += wrap;
-
- r = p[0];
- g = p[1];
- b = p[2];
- r1 += r;
- g1 += g;
- b1 += b;
- lum[0] = (FIX(0.29900) * r + FIX(0.58700) * g +
- FIX(0.11400) * b + ONE_HALF) >> SCALEBITS;
- r = p[3];
- g = p[4];
- b = p[5];
- r1 += r;
- g1 += g;
- b1 += b;
- lum[1] = (FIX(0.29900) * r + FIX(0.58700) * g +
- FIX(0.11400) * b + ONE_HALF) >> SCALEBITS;
-
- cb[0] = ((- FIX(0.16874) * r1 - FIX(0.33126) * g1 +
- FIX(0.50000) * b1 + 4 * ONE_HALF - 1) >> (SCALEBITS + 2)) + 128;
- cr[0] = ((FIX(0.50000) * r1 - FIX(0.41869) * g1 -
- FIX(0.08131) * b1 + 4 * ONE_HALF - 1) >> (SCALEBITS + 2)) + 128;
-
- cb++;
- cr++;
- p += -wrap3 + 2 * 3;
- lum += -wrap + 2;
- }
- p += wrap3;
- lum += wrap;
- }
- }
-
- static void rgba32_to_yuv420p(UINT8 *lum, UINT8 *cb, UINT8 *cr,
- UINT8 *src, int width, int height)
- {
- int wrap, wrap4, x, y;
- int r, g, b, r1, g1, b1;
- UINT8 *p;
-
- wrap = width;
- wrap4 = width * 4;
- p = src;
- for(y=0;y<height;y+=2) {
- for(x=0;x<width;x+=2) {
- r = p[0];
- g = p[1];
- b = p[2];
- r1 = r;
- g1 = g;
- b1 = b;
- lum[0] = (FIX(0.29900) * r + FIX(0.58700) * g +
- FIX(0.11400) * b + ONE_HALF) >> SCALEBITS;
- r = p[4];
- g = p[5];
- b = p[6];
- r1 += r;
- g1 += g;
- b1 += b;
- lum[1] = (FIX(0.29900) * r + FIX(0.58700) * g +
- FIX(0.11400) * b + ONE_HALF) >> SCALEBITS;
- p += wrap4;
- lum += wrap;
-
- r = p[0];
- g = p[1];
- b = p[2];
- r1 += r;
- g1 += g;
- b1 += b;
- lum[0] = (FIX(0.29900) * r + FIX(0.58700) * g +
- FIX(0.11400) * b + ONE_HALF) >> SCALEBITS;
- r = p[4];
- g = p[5];
- b = p[6];
- r1 += r;
- g1 += g;
- b1 += b;
- lum[1] = (FIX(0.29900) * r + FIX(0.58700) * g +
- FIX(0.11400) * b + ONE_HALF) >> SCALEBITS;
-
- cb[0] = ((- FIX(0.16874) * r1 - FIX(0.33126) * g1 +
- FIX(0.50000) * b1 + 4 * ONE_HALF - 1) >> (SCALEBITS + 2)) + 128;
- cr[0] = ((FIX(0.50000) * r1 - FIX(0.41869) * g1 -
- FIX(0.08131) * b1 + 4 * ONE_HALF - 1) >> (SCALEBITS + 2)) + 128;
-
- cb++;
- cr++;
- p += -wrap4 + 2 * 4;
- lum += -wrap + 2;
- }
- p += wrap4;
- lum += wrap;
- }
- }
-
/*
 * 16-bit packed formats -> YUV 4:2:0, all implemented by rgbmisc_to_yuv420p().
 * The trailing arguments are, for R, G and B in that order, the value of the
 * channel's lowest bit within the 16-bit pixel followed by the channel's
 * maximum value (31 for a 5-bit field, 63 for a 6-bit field).
 *
 * gbr565 places blue at 0x0020 (bits 5..10). It previously used 0x0040, which
 * made the 6-bit blue field overlap green's lowest bit (0x0800) and left bit 5
 * unused, unlike every other layout in this table.
 */
#define rgb565_to_yuv420p(lum,cb,cr,src,width,height) \
    rgbmisc_to_yuv420p((lum),(cb),(cr),(src),(width),(height), \
                       0x0800,31, 0x0020,63, 0x0001,31)
#define rgb555_to_yuv420p(lum,cb,cr,src,width,height) \
    rgbmisc_to_yuv420p((lum),(cb),(cr),(src),(width),(height), \
                       0x0400,31, 0x0020,31, 0x0001,31)
#define rgb5551_to_yuv420p(lum,cb,cr,src,width,height) \
    rgbmisc_to_yuv420p((lum),(cb),(cr),(src),(width),(height), \
                       0x0800,31, 0x0040,31, 0x0002,31)
#define bgr565_to_yuv420p(lum,cb,cr,src,width,height) \
    rgbmisc_to_yuv420p((lum),(cb),(cr),(src),(width),(height), \
                       0x0001,31, 0x0020,63, 0x0800,31)
#define bgr555_to_yuv420p(lum,cb,cr,src,width,height) \
    rgbmisc_to_yuv420p((lum),(cb),(cr),(src),(width),(height), \
                       0x0001,31, 0x0020,31, 0x0400,31)
#define gbr565_to_yuv420p(lum,cb,cr,src,width,height) \
    rgbmisc_to_yuv420p((lum),(cb),(cr),(src),(width),(height), \
                       0x0001,31, 0x0800,31, 0x0020,63)
#define gbr555_to_yuv420p(lum,cb,cr,src,width,height) \
    rgbmisc_to_yuv420p((lum),(cb),(cr),(src),(width),(height), \
                       0x0001,31, 0x0400,31, 0x0020,31)
-
- static void rgbmisc_to_yuv420p
- (UINT8 *lum, UINT8 *cb, UINT8 *cr,
- UINT8 *src, int width, int height,
-
- UINT16 R_LOWMASK, UINT16 R_MAX,
- UINT16 G_LOWMASK, UINT16 G_MAX,
- UINT16 B_LOWMASK, UINT16 B_MAX
- )
- {
- int wrap, wrap2, x, y;
- int r, g, b, r1, g1, b1;
- UINT8 *p;
- UINT16 pixel;
-
- wrap = width;
- wrap2 = width * 2;
- p = src;
- for(y=0;y<height;y+=2) {
- for(x=0;x<width;x+=2) {
- pixel = p[0] | (p[1]<<8);
- r = (((pixel/R_LOWMASK) & R_MAX) * (0x100 / (R_MAX+1)));
- g = (((pixel/G_LOWMASK) & G_MAX) * (0x100 / (G_MAX+1)));
- b = (((pixel/B_LOWMASK) & B_MAX) * (0x100 / (B_MAX+1)));
- r1 = r;
- g1 = g;
- b1 = b;
- lum[0] = (FIX(0.29900) * r + FIX(0.58700) * g +
- FIX(0.11400) * b + ONE_HALF) >> SCALEBITS;
-
- pixel = p[2] | (p[3]<<8);
- r = (((pixel/R_LOWMASK) & R_MAX) * (0x100 / (R_MAX+1)));
- g = (((pixel/G_LOWMASK) & G_MAX) * (0x100 / (G_MAX+1)));
- b = (((pixel/B_LOWMASK) & B_MAX) * (0x100 / (B_MAX+1)));
- r1 += r;
- g1 += g;
- b1 += b;
- lum[1] = (FIX(0.29900) * r + FIX(0.58700) * g +
- FIX(0.11400) * b + ONE_HALF) >> SCALEBITS;
- p += wrap2;
- lum += wrap;
-
- pixel = p[0] | (p[1]<<8);
- r = (((pixel/R_LOWMASK) & R_MAX) * (0x100 / (R_MAX+1)));
- g = (((pixel/G_LOWMASK) & G_MAX) * (0x100 / (G_MAX+1)));
- b = (((pixel/B_LOWMASK) & B_MAX) * (0x100 / (B_MAX+1)));
- r1 += r;
- g1 += g;
- b1 += b;
- lum[0] = (FIX(0.29900) * r + FIX(0.58700) * g +
- FIX(0.11400) * b + ONE_HALF) >> SCALEBITS;
- pixel = p[2] | (p[3]<<8);
- r = (((pixel/R_LOWMASK) & R_MAX) * (0x100 / (R_MAX+1)));
- g = (((pixel/G_LOWMASK) & G_MAX) * (0x100 / (G_MAX+1)));
- b = (((pixel/B_LOWMASK) & B_MAX) * (0x100 / (B_MAX+1)));
- r1 += r;
- g1 += g;
- b1 += b;
- lum[1] = (FIX(0.29900) * r + FIX(0.58700) * g +
- FIX(0.11400) * b + ONE_HALF) >> SCALEBITS;
-
- cb[0] = ((- FIX(0.16874) * r1 - FIX(0.33126) * g1 +
- FIX(0.50000) * b1 + 4 * ONE_HALF - 1) >> (SCALEBITS + 2)) + 128;
- cr[0] = ((FIX(0.50000) * r1 - FIX(0.41869) * g1 -
- FIX(0.08131) * b1 + 4 * ONE_HALF - 1) >> (SCALEBITS + 2)) + 128;
-
- cb++;
- cr++;
- p += -wrap2 + 2 * 2;
- lum += -wrap + 2;
- }
- p += wrap2;
- lum += wrap;
- }
- }
-
-
- static void bgr24_to_yuv420p(UINT8 *lum, UINT8 *cb, UINT8 *cr,
- UINT8 *src, int width, int height)
- {
- int wrap, wrap3, x, y;
- int r, g, b, r1, g1, b1;
- UINT8 *p;
-
- wrap = width;
- wrap3 = width * 3;
- p = src;
- for(y=0;y<height;y+=2) {
- for(x=0;x<width;x+=2) {
- b = p[0];
- g = p[1];
- r = p[2];
- r1 = r;
- g1 = g;
- b1 = b;
- lum[0] = (FIX(0.29900) * r + FIX(0.58700) * g +
- FIX(0.11400) * b + ONE_HALF) >> SCALEBITS;
- b = p[3];
- g = p[4];
- r = p[5];
- r1 += r;
- g1 += g;
- b1 += b;
- lum[1] = (FIX(0.29900) * r + FIX(0.58700) * g +
- FIX(0.11400) * b + ONE_HALF) >> SCALEBITS;
- p += wrap3;
- lum += wrap;
-
- b = p[0];
- g = p[1];
- r = p[2];
- r1 += r;
- g1 += g;
- b1 += b;
- lum[0] = (FIX(0.29900) * r + FIX(0.58700) * g +
- FIX(0.11400) * b + ONE_HALF) >> SCALEBITS;
- b = p[3];
- g = p[4];
- r = p[5];
- r1 += r;
- g1 += g;
- b1 += b;
- lum[1] = (FIX(0.29900) * r + FIX(0.58700) * g +
- FIX(0.11400) * b + ONE_HALF) >> SCALEBITS;
-
- cb[0] = ((- FIX(0.16874) * r1 - FIX(0.33126) * g1 +
- FIX(0.50000) * b1 + 4 * ONE_HALF - 1) >> (SCALEBITS + 2)) + 128;
- cr[0] = ((FIX(0.50000) * r1 - FIX(0.41869) * g1 -
- FIX(0.08131) * b1 + 4 * ONE_HALF - 1) >> (SCALEBITS + 2)) + 128;
-
- cb++;
- cr++;
- p += -wrap3 + 2 * 3;
- lum += -wrap + 2;
- }
- p += wrap3;
- lum += wrap;
- }
- }
-
- static void bgra32_to_yuv420p(UINT8 *lum, UINT8 *cb, UINT8 *cr,
- UINT8 *src, int width, int height)
- {
- int wrap, wrap4, x, y;
- int r, g, b, r1, g1, b1;
- UINT8 *p;
-
- wrap = width;
- wrap4 = width * 4;
- p = src;
- for(y=0;y<height;y+=2) {
- for(x=0;x<width;x+=2) {
- b = p[0];
- g = p[1];
- r = p[2];
- r1 = r;
- g1 = g;
- b1 = b;
- lum[0] = (FIX(0.29900) * r + FIX(0.58700) * g +
- FIX(0.11400) * b + ONE_HALF) >> SCALEBITS;
- b = p[4];
- g = p[5];
- r = p[6];
- r1 += r;
- g1 += g;
- b1 += b;
- lum[1] = (FIX(0.29900) * r + FIX(0.58700) * g +
- FIX(0.11400) * b + ONE_HALF) >> SCALEBITS;
- p += wrap4;
- lum += wrap;
-
- b = p[0];
- g = p[1];
- r = p[2];
- r1 += r;
- g1 += g;
- b1 += b;
- lum[0] = (FIX(0.29900) * r + FIX(0.58700) * g +
- FIX(0.11400) * b + ONE_HALF) >> SCALEBITS;
- b = p[4];
- g = p[5];
- r = p[6];
- r1 += r;
- g1 += g;
- b1 += b;
- lum[1] = (FIX(0.29900) * r + FIX(0.58700) * g +
- FIX(0.11400) * b + ONE_HALF) >> SCALEBITS;
-
- cb[0] = ((- FIX(0.16874) * r1 - FIX(0.33126) * g1 +
- FIX(0.50000) * b1 + 4 * ONE_HALF - 1) >> (SCALEBITS + 2)) + 128;
- cr[0] = ((FIX(0.50000) * r1 - FIX(0.41869) * g1 -
- FIX(0.08131) * b1 + 4 * ONE_HALF - 1) >> (SCALEBITS + 2)) + 128;
-
- cb++;
- cr++;
- p += -wrap4 + 2 * 4;
- lum += -wrap + 2;
- }
- p += wrap4;
- lum += wrap;
- }
- }
-
/* XXX: use generic filter ? */
/**
 * 1x2 -> 1x1: halve a plane vertically.
 *
 * Every output sample is the truncated mean of the two vertically adjacent
 * source samples, (a + b) >> 1.
 *
 * @param dst      destination plane
 * @param dst_wrap bytes between consecutive destination rows
 * @param src      source plane
 * @param src_wrap bytes between consecutive source rows
 * @param width    number of samples per output row
 * @param height   number of output rows (two source rows are read for each)
 */
static void shrink2(UINT8 *dst, int dst_wrap,
                    UINT8 *src, int src_wrap,
                    int width, int height)
{
    int row, col;

    for (row = 0; row < height; row++) {
        const UINT8 *upper = src;
        const UINT8 *lower = src + src_wrap;

        for (col = 0; col < width; col++)
            dst[col] = (upper[col] + lower[col]) >> 1;

        src += 2 * src_wrap;
        dst += dst_wrap;
    }
}
-
/**
 * 2x2 -> 1x1: halve a plane in both directions.
 *
 * Every output sample is the rounded mean of a 2x2 block of source samples:
 * (a + b + c + d + 2) >> 2. The shift must be 2 because four samples are
 * summed; a shift of 1 yields values up to 511 that wrap when stored in a
 * byte.
 *
 * @param dst      destination plane
 * @param dst_wrap bytes between consecutive destination rows
 * @param src      source plane
 * @param src_wrap bytes between consecutive source rows
 * @param width    number of samples per output row (2 * width source samples are read)
 * @param height   number of output rows (two source rows are read for each)
 */
static void shrink22(UINT8 *dst, int dst_wrap,
                     UINT8 *src, int src_wrap,
                     int width, int height)
{
    int row, col;

    for (row = 0; row < height; row++) {
        const UINT8 *upper = src;
        const UINT8 *lower = src + src_wrap;

        for (col = 0; col < width; col++) {
            dst[col] = (upper[0] + upper[1] + lower[0] + lower[1] + 2) >> 2;
            upper += 2;
            lower += 2;
        }
        src += 2 * src_wrap;
        dst += dst_wrap;
    }
}
-
/**
 * 1x1 -> 2x2: double a plane in both directions by sample replication.
 *
 * Output sample (x, y) is source sample (x / 2, y / 2). Two earlier defects
 * are avoided here: the trailing width % 4 output samples were copied 1:1
 * from the source instead of being duplicated (which also read past the
 * needed source samples), and the vertical pairing depended on the parity of
 * the total height instead of starting at the top row.
 *
 * @param dst      destination plane
 * @param dst_wrap bytes between consecutive destination rows
 * @param src      source plane
 * @param src_wrap bytes between consecutive source rows
 * @param width    number of samples per output row
 * @param height   number of output rows
 */
static void grow22(UINT8 *dst, int dst_wrap,
                   UINT8 *src, int src_wrap,
                   int width, int height)
{
    int row, col;

    for (row = 0; row < height; row++) {
        for (col = 0; col < width; col++)
            dst[col] = src[col >> 1];

        /* move to the next source row after every second output row */
        if (row & 1)
            src += src_wrap;
        dst += dst_wrap;
    }
}
-
/**
 * 1x2 -> 2x1: halve a plane vertically and double it horizontally.
 *
 * Each pair of vertically adjacent source samples is averaged ((a + b) >> 1)
 * and the result is written twice, side by side.
 *
 * @param dst      destination plane
 * @param dst_wrap bytes between consecutive destination rows
 * @param src      source plane
 * @param src_wrap bytes between consecutive source rows
 * @param width    width of the source plane in samples
 * @param height   height of the source plane in rows (consumed two at a time)
 */
static void conv411(UINT8 *dst, int dst_wrap,
                    UINT8 *src, int src_wrap,
                    int width, int height)
{
    int row, col;

    for (row = 0; row < height; row += 2) {
        const UINT8 *upper = src;
        const UINT8 *lower = src + src_wrap;
        UINT8 *out = dst;

        for (col = 0; col < width; col++) {
            const int mean = (upper[col] + lower[col]) >> 1;

            *out++ = mean;
            *out++ = mean;
        }
        src += src_wrap * 2;
        dst += dst_wrap;
    }
}
-
/**
 * Copy a rectangle of bytes row by row between two planes whose row strides
 * may differ.
 *
 * @param dst      destination plane
 * @param dst_wrap bytes between consecutive destination rows
 * @param src      source plane
 * @param src_wrap bytes between consecutive source rows
 * @param width    number of bytes copied per row
 * @param height   number of rows copied
 */
static void img_copy(UINT8 *dst, int dst_wrap,
                     UINT8 *src, int src_wrap,
                     int width, int height)
{
    int row;

    for (row = 0; row < height; row++) {
        memcpy(dst, src, width);
        src += src_wrap;
        dst += dst_wrap;
    }
}
-
/* Number of fractional bits used by the YCbCr -> RGB converters. */
#define SCALE_BITS 10

/*
 * Conversion coefficients, written with 16 fractional bits and reduced to
 * SCALE_BITS fractional bits (e.g. 76309 / 65536 is about 1.164).
 */
#define C_Y  (76309 >> (16 - SCALE_BITS))   /* luma gain */
#define C_RV (117504 >> (16 - SCALE_BITS))  /* Cr contribution to red */
#define C_BU (138453 >> (16 - SCALE_BITS))  /* Cb contribution to blue */
#define C_GU (13954 >> (16 - SCALE_BITS))   /* Cb contribution to green (subtracted) */
#define C_GV (34903 >> (16 - SCALE_BITS))   /* Cr contribution to green (subtracted) */

/*
 * Produce one RGB triple from the luma sample y1.
 *
 * Relies on these names being in scope at the point of use: an int `y`
 * (scratch), ints `r_add`, `g_add`, `b_add` (chroma contributions with the
 * rounding term already included) and the lookup table pointer `cm`.
 *
 * Wrapped in do { } while (0) so that "RGBOUT(...);" is a single statement
 * (safe in an unbraced if/else), and y1 is parenthesised so that a compound
 * expression can be passed.
 */
#define RGBOUT(r, g, b, y1)\
do {\
    y = ((y1) - 16) * C_Y;\
    (r) = cm[(y + r_add) >> SCALE_BITS];\
    (g) = cm[(y + g_add) >> SCALE_BITS];\
    (b) = cm[(y + b_add) >> SCALE_BITS];\
} while (0)
-
- /* XXX: no chroma interpolating is done */
- static void yuv420p_to_bgra32(AVPicture *dst, AVPicture *src,
- int width, int height)
- {
- UINT8 *y1_ptr, *y2_ptr, *cb_ptr, *cr_ptr, *d, *d1, *d2;
- int w, y, cb, cr, r_add, g_add, b_add, width2;
- UINT8 *cm = cropTbl + MAX_NEG_CROP;
-
- d = dst->data[0];
- y1_ptr = src->data[0];
- cb_ptr = src->data[1];
- cr_ptr = src->data[2];
- width2 = width >> 1;
- for(;height > 0; height -= 2) {
- d1 = d;
- d2 = d + dst->linesize[0];
- y2_ptr = y1_ptr + src->linesize[0];
- for(w = width2; w > 0; w --) {
- cb = cb_ptr[0] - 128;
- cr = cr_ptr[0] - 128;
- r_add = C_RV * cr + (1 << (SCALE_BITS - 1));
- g_add = - C_GU * cb - C_GV * cr + (1 << (SCALE_BITS - 1));
- b_add = C_BU * cb + (1 << (SCALE_BITS - 1));
-
- /* output 4 pixels */
- RGBOUT(d1[2], d1[1], d1[0], y1_ptr[0]);
- RGBOUT(d1[6], d1[5], d1[4], y1_ptr[1]);
- RGBOUT(d2[2], d2[1], d2[0], y2_ptr[0]);
- RGBOUT(d2[6], d2[5], d2[4], y2_ptr[1]);
-
- d1[3] = d1[7] = d2[3] = d2[7] = 255;
-
- d1 += 8;
- d2 += 8;
- y1_ptr += 2;
- y2_ptr += 2;
- cb_ptr++;
- cr_ptr++;
- }
- d += 2 * dst->linesize[0];
- y1_ptr += 2 * src->linesize[0] - width;
- cb_ptr += src->linesize[1] - width2;
- cr_ptr += src->linesize[2] - width2;
- }
- }
-
- /* XXX: no chroma interpolating is done */
- static void yuv420p_to_rgba32(AVPicture *dst, AVPicture *src,
- int width, int height)
- {
- UINT8 *y1_ptr, *y2_ptr, *cb_ptr, *cr_ptr, *d, *d1, *d2;
- int w, y, cb, cr, r_add, g_add, b_add, width2;
- UINT8 *cm = cropTbl + MAX_NEG_CROP;
-
- d = dst->data[0];
- y1_ptr = src->data[0];
- cb_ptr = src->data[1];
- cr_ptr = src->data[2];
- width2 = width >> 1;
- for(;height > 0; height -= 2) {
- d1 = d;
- d2 = d + dst->linesize[0];
- y2_ptr = y1_ptr + src->linesize[0];
- for(w = width2; w > 0; w --) {
- cb = cb_ptr[0] - 128;
- cr = cr_ptr[0] - 128;
- r_add = C_RV * cr + (1 << (SCALE_BITS - 1));
- g_add = - C_GU * cb - C_GV * cr + (1 << (SCALE_BITS - 1));
- b_add = C_BU * cb + (1 << (SCALE_BITS - 1));
-
- /* output 4 pixels */
- RGBOUT(d1[0], d1[1], d1[2], y1_ptr[0]);
- RGBOUT(d1[4], d1[5], d1[6], y1_ptr[1]);
- RGBOUT(d2[0], d2[1], d2[2], y2_ptr[0]);
- RGBOUT(d2[4], d2[5], d2[6], y2_ptr[1]);
-
- d1[3] = d1[7] = d2[3] = d2[7] = 255;
-
- d1 += 8;
- d2 += 8;
- y1_ptr += 2;
- y2_ptr += 2;
- cb_ptr++;
- cr_ptr++;
- }
- d += 2 * dst->linesize[0];
- y1_ptr += 2 * src->linesize[0] - width;
- cb_ptr += src->linesize[1] - width2;
- cr_ptr += src->linesize[2] - width2;
- }
- }
-
- /* XXX: no chroma interpolating is done */
- static void yuv420p_to_rgb24(AVPicture *dst, AVPicture *src,
- int width, int height)
- {
- UINT8 *y1_ptr, *y2_ptr, *cb_ptr, *cr_ptr, *d, *d1, *d2;
- int w, y, cb, cr, r_add, g_add, b_add, width2;
- UINT8 *cm = cropTbl + MAX_NEG_CROP;
-
- d = dst->data[0];
- y1_ptr = src->data[0];
- cb_ptr = src->data[1];
- cr_ptr = src->data[2];
- width2 = width >> 1;
- for(;height > 0; height -= 2) {
- d1 = d;
- d2 = d + dst->linesize[0];
- y2_ptr = y1_ptr + src->linesize[0];
- for(w = width2; w > 0; w --) {
- cb = cb_ptr[0] - 128;
- cr = cr_ptr[0] - 128;
- r_add = C_RV * cr + (1 << (SCALE_BITS - 1));
- g_add = - C_GU * cb - C_GV * cr + (1 << (SCALE_BITS - 1));
- b_add = C_BU * cb + (1 << (SCALE_BITS - 1));
-
- /* output 4 pixels */
- RGBOUT(d1[0], d1[1], d1[2], y1_ptr[0]);
- RGBOUT(d1[3], d1[4], d1[5], y1_ptr[1]);
- RGBOUT(d2[0], d2[1], d2[2], y2_ptr[0]);
- RGBOUT(d2[3], d2[4], d2[5], y2_ptr[1]);
-
- d1 += 6;
- d2 += 6;
- y1_ptr += 2;
- y2_ptr += 2;
- cb_ptr++;
- cr_ptr++;
- }
- d += 2 * dst->linesize[0];
- y1_ptr += 2 * src->linesize[0] - width;
- cb_ptr += src->linesize[1] - width2;
- cr_ptr += src->linesize[2] - width2;
- }
- }
-
- /* XXX: no chroma interpolating is done */
- static void yuv422p_to_rgb24(AVPicture *dst, AVPicture *src,
- int width, int height)
- {
- UINT8 *y1_ptr, *cb_ptr, *cr_ptr, *d, *d1;
- int w, y, cb, cr, r_add, g_add, b_add, width2;
- UINT8 *cm = cropTbl + MAX_NEG_CROP;
-
- d = dst->data[0];
- y1_ptr = src->data[0];
- cb_ptr = src->data[1];
- cr_ptr = src->data[2];
- width2 = width >> 1;
- for(;height > 0; height --) {
- d1 = d;
- for(w = width2; w > 0; w --) {
- cb = cb_ptr[0] - 128;
- cr = cr_ptr[0] - 128;
- r_add = C_RV * cr + (1 << (SCALE_BITS - 1));
- g_add = - C_GU * cb - C_GV * cr + (1 << (SCALE_BITS - 1));
- b_add = C_BU * cb + (1 << (SCALE_BITS - 1));
-
- /* output 2 pixels */
- RGBOUT(d1[0], d1[1], d1[2], y1_ptr[0]);
- RGBOUT(d1[3], d1[4], d1[5], y1_ptr[1]);
-
- d1 += 6;
- y1_ptr += 2;
- cb_ptr++;
- cr_ptr++;
- }
- d += dst->linesize[0];
- y1_ptr += src->linesize[0] - width;
- cb_ptr += src->linesize[1] - width2;
- cr_ptr += src->linesize[2] - width2;
- }
- }
-
- /* XXX: always use linesize. Return -1 if not supported */
- int img_convert(AVPicture *dst, int dst_pix_fmt,
- AVPicture *src, int pix_fmt,
- int width, int height)
- {
- int i;
-
- assert(pix_fmt != PIX_FMT_ANY && dst_pix_fmt != PIX_FMT_ANY);
-
- if (dst_pix_fmt == pix_fmt) {
- switch(pix_fmt) {
- case PIX_FMT_YUV420P:
- for(i=0;i<3;i++) {
- if (i == 1) {
- width >>= 1;
- height >>= 1;
- }
- img_copy(dst->data[i], dst->linesize[i],
- src->data[i], src->linesize[i],
- width, height);
- }
- break;
- default:
- return -1;
- }
- } else if (dst_pix_fmt == PIX_FMT_YUV420P) {
-
- switch(pix_fmt) {
- case PIX_FMT_YUV411P:
- img_copy(dst->data[0], dst->linesize[0],
- src->data[0], src->linesize[0],
- width, height);
- conv411(dst->data[1], dst->linesize[1],
- src->data[1], src->linesize[1],
- width / 4, height);
- conv411(dst->data[2], dst->linesize[2],
- src->data[2], src->linesize[2],
- width / 4, height);
- break;
- case PIX_FMT_YUV410P:
- img_copy(dst->data[0], dst->linesize[0],
- src->data[0], src->linesize[0],
- width, height);
- grow22(dst->data[1], dst->linesize[1],
- src->data[1], src->linesize[1],
- width/2, height/2);
- grow22(dst->data[2], dst->linesize[2],
- src->data[2], src->linesize[2],
- width/2, height/2);
- break;
- case PIX_FMT_YUV420P:
- for(i=0;i<3;i++) {
- img_copy(dst->data[i], dst->linesize[i],
- src->data[i], src->linesize[i],
- width, height);
- }
- break;
- case PIX_FMT_YUV422P:
- img_copy(dst->data[0], dst->linesize[0],
- src->data[0], src->linesize[0],
- width, height);
- width >>= 1;
- height >>= 1;
- for(i=1;i<3;i++) {
- shrink2(dst->data[i], dst->linesize[i],
- src->data[i], src->linesize[i],
- width, height);
- }
- break;
- case PIX_FMT_YUV444P:
- img_copy(dst->data[0], dst->linesize[0],
- src->data[0], src->linesize[0],
- width, height);
- width >>= 1;
- height >>= 1;
- for(i=1;i<3;i++) {
- shrink22(dst->data[i], dst->linesize[i],
- src->data[i], src->linesize[i],
- width, height);
- }
- break;
- case PIX_FMT_YUV422:
- yuv422_to_yuv420p(dst->data[0], dst->data[1], dst->data[2],
- src->data[0], width, height);
- break;
- case PIX_FMT_RGB24:
- rgb24_to_yuv420p(dst->data[0], dst->data[1], dst->data[2],
- src->data[0], width, height);
- break;
- case PIX_FMT_RGBA32:
- rgba32_to_yuv420p(dst->data[0], dst->data[1], dst->data[2],
- src->data[0], width, height);
- break;
- case PIX_FMT_BGR24:
- bgr24_to_yuv420p(dst->data[0], dst->data[1], dst->data[2],
- src->data[0], width, height);
- break;
- case PIX_FMT_BGRA32:
- bgra32_to_yuv420p(dst->data[0], dst->data[1], dst->data[2],
- src->data[0], width, height);
- break;
- case PIX_FMT_RGB565:
- rgb565_to_yuv420p(dst->data[0], dst->data[1], dst->data[2],
- src->data[0], width, height);
- break;
- case PIX_FMT_RGB555:
- rgb555_to_yuv420p(dst->data[0], dst->data[1], dst->data[2],
- src->data[0], width, height);
- break;
- /* case PIX_FMT_RGB5551:
- rgb5551_to_yuv420p(dst->data[0], dst->data[1], dst->data[2],
- src->data[0], width, height);
- break;*/
- case PIX_FMT_BGR565:
- bgr565_to_yuv420p(dst->data[0], dst->data[1], dst->data[2],
- src->data[0], width, height);
- break;
- case PIX_FMT_BGR555:
- bgr555_to_yuv420p(dst->data[0], dst->data[1], dst->data[2],
- src->data[0], width, height);
- break;
- /* case PIX_FMT_GBR565:
- gbr565_to_yuv420p(dst->data[0], dst->data[1], dst->data[2],
- src->data[0], width, height);
- break;
- case PIX_FMT_GBR555:
- gbr555_to_yuv420p(dst->data[0], dst->data[1], dst->data[2],
- src->data[0], width, height);
- break;*/
- default:
- return -1;
- }
- } else if (dst_pix_fmt == PIX_FMT_RGB24) {
- switch(pix_fmt) {
- case PIX_FMT_YUV420P:
- yuv420p_to_rgb24(dst, src, width, height);
- break;
- case PIX_FMT_YUV422P:
- yuv422p_to_rgb24(dst, src, width, height);
- break;
- default:
- return -1;
- }
- } else if (dst_pix_fmt == PIX_FMT_RGBA32) {
- switch(pix_fmt) {
- case PIX_FMT_YUV420P:
- yuv420p_to_rgba32(dst, src, width, height);
- break;
- default:
- return -1;
- }
- } else if (dst_pix_fmt == PIX_FMT_BGRA32) {
- switch(pix_fmt) {
- case PIX_FMT_YUV420P:
- yuv420p_to_bgra32(dst, src, width, height);
- break;
- default:
- return -1;
- }
- } else {
- return -1;
- }
- return 0;
- }
-
-
#ifdef HAVE_MMX
/*
 * MMX building blocks for the [-1 4 2 4 -1] / 8 deinterlacing filter, four
 * samples per expansion. The code that expands them must have cleared mm7
 * and loaded the rounding words into mm6 beforehand.
 */

/* Load four bytes from each of the five input lines into mm0..mm4. */
#define DEINT_MMX_LOAD_TAPS \
    movd_m2r(lum_m4[0],mm0);\
    movd_m2r(lum_m3[0],mm1);\
    movd_m2r(lum_m2[0],mm2);\
    movd_m2r(lum_m1[0],mm3);\
    movd_m2r(lum[0],mm4);

/* Widen mm0..mm4 to words, apply the filter, pack four result bytes in mm1. */
#define DEINT_MMX_FILTER \
    punpcklbw_r2r(mm7,mm0);\
    punpcklbw_r2r(mm7,mm1);\
    punpcklbw_r2r(mm7,mm2);\
    punpcklbw_r2r(mm7,mm3);\
    punpcklbw_r2r(mm7,mm4);\
    paddw_r2r(mm3,mm1);     /* mm1 = m3 + m1 */\
    psllw_i2r(1,mm2);       /* mm2 = 2 * m2 */\
    paddw_r2r(mm4,mm0);     /* mm0 = m4 + lum (the two negative taps) */\
    psllw_i2r(2,mm1);       /* mm1 = 4 * (m3 + m1) */\
    paddw_r2r(mm6,mm2);     /* add the rounding words */\
    paddw_r2r(mm2,mm1);\
    psubusw_r2r(mm0,mm1);   /* subtract with unsigned saturation */\
    psrlw_i2r(3,mm1);       /* divide by 8 */\
    packuswb_r2r(mm7,mm1);  /* back to bytes with unsigned saturation */

/* In place: save the unfiltered lum_m2 bytes into lum_m4, write the result to lum_m2. */
#define DEINT_INPLACE_LINE_LUM \
    DEINT_MMX_LOAD_TAPS \
    movd_r2m(mm2,lum_m4[0]);\
    DEINT_MMX_FILTER \
    movd_r2m(mm1,lum_m2[0]);

/* Out of place: write the result to dst. */
#define DEINT_LINE_LUM \
    DEINT_MMX_LOAD_TAPS \
    DEINT_MMX_FILTER \
    movd_r2m(mm1,dst[0]);
#endif
-
- /* filter parameters: [-1 4 2 4 -1] // 8 */
- static void deinterlace_line(UINT8 *dst, UINT8 *lum_m4, UINT8 *lum_m3, UINT8 *lum_m2, UINT8 *lum_m1, UINT8 *lum,
- int size)
- {
- #ifndef HAVE_MMX
- UINT8 *cm = cropTbl + MAX_NEG_CROP;
- int sum;
-
- for(;size > 0;size--) {
- sum = -lum_m4[0];
- sum += lum_m3[0] << 2;
- sum += lum_m2[0] << 1;
- sum += lum_m1[0] << 2;
- sum += -lum[0];
- dst[0] = cm[(sum + 4) >> 3];
- lum_m4++;
- lum_m3++;
- lum_m2++;
- lum_m1++;
- lum++;
- dst++;
- }
- #else
-
- for (;size > 3; size-=4) {
- DEINT_LINE_LUM
- lum_m4+=4;
- lum_m3+=4;
- lum_m2+=4;
- lum_m1+=4;
- lum+=4;
- dst+=4;
- }
- #endif
- }
- static void deinterlace_line_inplace(UINT8 *lum_m4, UINT8 *lum_m3, UINT8 *lum_m2, UINT8 *lum_m1, UINT8 *lum,
- int size)
- {
- #ifndef HAVE_MMX
- UINT8 *cm = cropTbl + MAX_NEG_CROP;
- int sum;
-
- for(;size > 0;size--) {
- sum = -lum_m4[0];
- sum += lum_m3[0] << 2;
- sum += lum_m2[0] << 1;
- lum_m4[0]=lum_m2[0];
- sum += lum_m1[0] << 2;
- sum += -lum[0];
- lum_m2[0] = cm[(sum + 4) >> 3];
- lum_m4++;
- lum_m3++;
- lum_m2++;
- lum_m1++;
- lum++;
- }
- #else
-
- for (;size > 3; size-=4) {
- DEINT_INPLACE_LINE_LUM
- lum_m4+=4;
- lum_m3+=4;
- lum_m2+=4;
- lum_m1+=4;
- lum+=4;
- }
- #endif
- }
-
- /* deinterlacing : 2 temporal taps, 3 spatial taps linear filter. The
- top field is copied as is, but the bottom field is deinterlaced
- against the top field. */
- static void deinterlace_bottom_field(UINT8 *dst, int dst_wrap,
- UINT8 *src1, int src_wrap,
- int width, int height)
- {
- UINT8 *src_m2, *src_m1, *src_0, *src_p1, *src_p2;
- int y;
-
- src_m2 = src1;
- src_m1 = src1;
- src_0=&src_m1[src_wrap];
- src_p1=&src_0[src_wrap];
- src_p2=&src_p1[src_wrap];
- for(y=0;y<(height-2);y+=2) {
- memcpy(dst,src_m1,width);
- dst += dst_wrap;
- deinterlace_line(dst,src_m2,src_m1,src_0,src_p1,src_p2,width);
- src_m2 = src_0;
- src_m1 = src_p1;
- src_0 = src_p2;
- src_p1 += 2*src_wrap;
- src_p2 += 2*src_wrap;
- dst += dst_wrap;
- }
- memcpy(dst,src_m1,width);
- dst += dst_wrap;
- /* do last line */
- deinterlace_line(dst,src_m2,src_m1,src_0,src_0,src_0,width);
- }
-
- static void deinterlace_bottom_field_inplace(UINT8 *src1, int src_wrap,
- int width, int height)
- {
- UINT8 *src_m1, *src_0, *src_p1, *src_p2;
- int y;
- UINT8 *buf;
- buf = (UINT8*)av_malloc(width);
-
- src_m1 = src1;
- memcpy(buf,src_m1,width);
- src_0=&src_m1[src_wrap];
- src_p1=&src_0[src_wrap];
- src_p2=&src_p1[src_wrap];
- for(y=0;y<(height-2);y+=2) {
- deinterlace_line_inplace(buf,src_m1,src_0,src_p1,src_p2,width);
- src_m1 = src_p1;
- src_0 = src_p2;
- src_p1 += 2*src_wrap;
- src_p2 += 2*src_wrap;
- }
- /* do last line */
- deinterlace_line_inplace(buf,src_m1,src_0,src_0,src_0,width);
- av_free(buf);
- }
-
-
- /* deinterlace - if not supported return -1 */
- int avpicture_deinterlace(AVPicture *dst, AVPicture *src,
- int pix_fmt, int width, int height)
- {
- int i;
-
- if (pix_fmt != PIX_FMT_YUV420P &&
- pix_fmt != PIX_FMT_YUV422P &&
- pix_fmt != PIX_FMT_YUV444P)
- return -1;
- if ((width & 3) != 0 || (height & 3) != 0)
- return -1;
-
- #ifdef HAVE_MMX
- {
- mmx_t rounder;
- rounder.uw[0]=4;
- rounder.uw[1]=4;
- rounder.uw[2]=4;
- rounder.uw[3]=4;
- pxor_r2r(mm7,mm7);
- movq_m2r(rounder,mm6);
- }
- #endif
-
-
- for(i=0;i<3;i++) {
- if (i == 1) {
- switch(pix_fmt) {
- case PIX_FMT_YUV420P:
- width >>= 1;
- height >>= 1;
- break;
- case PIX_FMT_YUV422P:
- width >>= 1;
- break;
- default:
- break;
- }
- }
- if (src == dst) {
- deinterlace_bottom_field_inplace(src->data[i], src->linesize[i],
- width, height);
- } else {
- deinterlace_bottom_field(dst->data[i],dst->linesize[i],
- src->data[i], src->linesize[i],
- width, height);
- }
- }
- #ifdef HAVE_MMX
- emms();
- #endif
- return 0;
- }
-
- #undef FIX
|