|
|
@@ -1612,16 +1612,26 @@ void ff_avg_vc1_mspel_mc00_mmxext(uint8_t *dst, const uint8_t *src, |
|
|
|
#define DIRAC_PIXOP(OPNAME2, OPNAME, EXT)\ |
|
|
|
void ff_ ## OPNAME2 ## _dirac_pixels8_ ## EXT(uint8_t *dst, const uint8_t *src[5], int stride, int h)\ |
|
|
|
{\ |
|
|
|
OPNAME ## _pixels8_ ## EXT(dst, src[0], stride, h);\ |
|
|
|
if (h&3)\ |
|
|
|
ff_ ## OPNAME2 ## _dirac_pixels8_c(dst, src, stride, h);\ |
|
|
|
else\ |
|
|
|
OPNAME ## _pixels8_ ## EXT(dst, src[0], stride, h);\ |
|
|
|
}\ |
|
|
|
void ff_ ## OPNAME2 ## _dirac_pixels16_ ## EXT(uint8_t *dst, const uint8_t *src[5], int stride, int h)\ |
|
|
|
{\ |
|
|
|
OPNAME ## _pixels16_ ## EXT(dst, src[0], stride, h);\ |
|
|
|
if (h&3)\ |
|
|
|
ff_ ## OPNAME2 ## _dirac_pixels16_c(dst, src, stride, h);\ |
|
|
|
else\ |
|
|
|
OPNAME ## _pixels16_ ## EXT(dst, src[0], stride, h);\ |
|
|
|
}\ |
|
|
|
void ff_ ## OPNAME2 ## _dirac_pixels32_ ## EXT(uint8_t *dst, const uint8_t *src[5], int stride, int h)\ |
|
|
|
{\ |
|
|
|
OPNAME ## _pixels16_ ## EXT(dst , src[0] , stride, h);\ |
|
|
|
OPNAME ## _pixels16_ ## EXT(dst+16, src[0]+16, stride, h);\ |
|
|
|
if (h&3) {\ |
|
|
|
ff_ ## OPNAME2 ## _dirac_pixels32_c(dst, src, stride, h);\ |
|
|
|
} else {\ |
|
|
|
OPNAME ## _pixels16_ ## EXT(dst , src[0] , stride, h);\ |
|
|
|
OPNAME ## _pixels16_ ## EXT(dst+16, src[0]+16, stride, h);\ |
|
|
|
}\ |
|
|
|
} |
|
|
|
|
|
|
|
DIRAC_PIXOP(put, put, mmx) |
|
|
@@ -1631,21 +1641,35 @@ DIRAC_PIXOP(avg, ff_avg, mmxext) |
|
|
|
#if HAVE_YASM |
|
|
|
void ff_put_dirac_pixels16_sse2(uint8_t *dst, const uint8_t *src[5], int stride, int h) |
|
|
|
{ |
|
|
|
if (h&3) |
|
|
|
ff_put_dirac_pixels16_c(dst, src, stride, h); |
|
|
|
else |
|
|
|
ff_put_pixels16_sse2(dst, src[0], stride, h); |
|
|
|
} |
|
|
|
void ff_avg_dirac_pixels16_sse2(uint8_t *dst, const uint8_t *src[5], int stride, int h) |
|
|
|
{ |
|
|
|
if (h&3) |
|
|
|
ff_avg_dirac_pixels16_c(dst, src, stride, h); |
|
|
|
else |
|
|
|
ff_avg_pixels16_sse2(dst, src[0], stride, h); |
|
|
|
} |
|
|
|
void ff_put_dirac_pixels32_sse2(uint8_t *dst, const uint8_t *src[5], int stride, int h) |
|
|
|
{ |
|
|
|
if (h&3) { |
|
|
|
ff_put_dirac_pixels32_c(dst, src, stride, h); |
|
|
|
} else { |
|
|
|
ff_put_pixels16_sse2(dst , src[0] , stride, h); |
|
|
|
ff_put_pixels16_sse2(dst+16, src[0]+16, stride, h); |
|
|
|
} |
|
|
|
} |
|
|
|
void ff_avg_dirac_pixels32_sse2(uint8_t *dst, const uint8_t *src[5], int stride, int h) |
|
|
|
{ |
|
|
|
if (h&3) { |
|
|
|
ff_avg_dirac_pixels32_c(dst, src, stride, h); |
|
|
|
} else { |
|
|
|
ff_avg_pixels16_sse2(dst , src[0] , stride, h); |
|
|
|
ff_avg_pixels16_sse2(dst+16, src[0]+16, stride, h); |
|
|
|
} |
|
|
|
} |
|
|
|
#endif |
|
|
|
#endif |
|
|
|