Originally committed as revision 234 to svn://svn.ffmpeg.org/ffmpeg/trunktags/v0.5
| @@ -6,7 +6,7 @@ LDFLAGS= -g | |||||
| OBJS= common.o utils.o mpegvideo.o h263.o jrevdct.o jfdctfst.o \ | OBJS= common.o utils.o mpegvideo.o h263.o jrevdct.o jfdctfst.o \ | ||||
| mpegaudio.o ac3enc.o mjpeg.o resample.o dsputil.o \ | mpegaudio.o ac3enc.o mjpeg.o resample.o dsputil.o \ | ||||
| motion_est.o imgconvert.o imgresample.o msmpeg4.o \ | motion_est.o imgconvert.o imgresample.o msmpeg4.o \ | ||||
| mpeg12.o h263dec.o rv10.o mpegaudiodec.o pcm.o | |||||
| mpeg12.o h263dec.o rv10.o mpegaudiodec.o pcm.o simple_idct.o | |||||
| ASM_OBJS= | ASM_OBJS= | ||||
| # currently using libac3 for ac3 decoding | # currently using libac3 for ac3 decoding | ||||
| @@ -20,7 +20,8 @@ endif | |||||
| ifeq ($(TARGET_MMX),yes) | ifeq ($(TARGET_MMX),yes) | ||||
| OBJS += i386/fdct_mmx.o i386/cputest.o \ | OBJS += i386/fdct_mmx.o i386/cputest.o \ | ||||
| i386/dsputil_mmx.o i386/mpegvideo_mmx.o \ | i386/dsputil_mmx.o i386/mpegvideo_mmx.o \ | ||||
| i386/idct_mmx.o i386/motion_est_mmx.o | |||||
| i386/idct_mmx.o i386/motion_est_mmx.o \ | |||||
| i386/simple_idct_mmx.o | |||||
| endif | endif | ||||
| # armv4l specific stuff | # armv4l specific stuff | ||||
| @@ -20,6 +20,7 @@ | |||||
| #include <stdio.h> | #include <stdio.h> | ||||
| #include "avcodec.h" | #include "avcodec.h" | ||||
| #include "dsputil.h" | #include "dsputil.h" | ||||
| #include "simple_idct.h" | |||||
| void (*ff_idct)(DCTELEM *block); | void (*ff_idct)(DCTELEM *block); | ||||
| void (*get_pixels)(DCTELEM *block, const UINT8 *pixels, int line_size); | void (*get_pixels)(DCTELEM *block, const UINT8 *pixels, int line_size); | ||||
| @@ -388,6 +389,27 @@ int pix_abs16x16_xy2_c(UINT8 *pix1, UINT8 *pix2, int line_size, int h) | |||||
| /* permute block according so that it corresponds to the MMX idct | /* permute block according so that it corresponds to the MMX idct | ||||
| order */ | order */ | ||||
| #ifdef SIMPLE_IDCT | |||||
| void block_permute(INT16 *block) | |||||
| { | |||||
| int i; | |||||
| INT16 temp[64]; | |||||
| // for(i=0; i<64; i++) temp[i] = block[ block_permute_op(i) ]; | |||||
| for(i=0; i<64; i++) temp[ block_permute_op(i) ] = block[i]; | |||||
| for(i=0; i<64; i++) block[i] = temp[i]; | |||||
| /* | |||||
| for(i=0; i<64; i++) | |||||
| { | |||||
| if((i&7)==0) printf("\n"); | |||||
| printf("%2d ", block[i]); | |||||
| } | |||||
| */ | |||||
| } | |||||
| #else | |||||
| void block_permute(INT16 *block) | void block_permute(INT16 *block) | ||||
| { | { | ||||
| int tmp1, tmp2, tmp3, tmp4, tmp5, tmp6; | int tmp1, tmp2, tmp3, tmp4, tmp5, tmp6; | ||||
| @@ -409,6 +431,7 @@ void block_permute(INT16 *block) | |||||
| block += 8; | block += 8; | ||||
| } | } | ||||
| } | } | ||||
| #endif | |||||
| void dsputil_init(void) | void dsputil_init(void) | ||||
| { | { | ||||
| @@ -425,7 +448,11 @@ void dsputil_init(void) | |||||
| squareTbl[i] = (i - 256) * (i - 256); | squareTbl[i] = (i - 256) * (i - 256); | ||||
| } | } | ||||
| #ifdef SIMPLE_IDCT | |||||
| ff_idct = simple_idct; | |||||
| #else | |||||
| ff_idct = j_rev_dct; | ff_idct = j_rev_dct; | ||||
| #endif | |||||
| get_pixels = get_pixels_c; | get_pixels = get_pixels_c; | ||||
| put_pixels_clamped = put_pixels_clamped_c; | put_pixels_clamped = put_pixels_clamped_c; | ||||
| add_pixels_clamped = add_pixels_clamped_c; | add_pixels_clamped = add_pixels_clamped_c; | ||||
| @@ -449,6 +476,10 @@ void dsputil_init(void) | |||||
| use_permuted_idct = 0; | use_permuted_idct = 0; | ||||
| #endif | #endif | ||||
| #ifdef SIMPLE_IDCT | |||||
| if(ff_idct == simple_idct) use_permuted_idct=0; | |||||
| #endif | |||||
| if (use_permuted_idct) { | if (use_permuted_idct) { | ||||
| /* permute for IDCT */ | /* permute for IDCT */ | ||||
| for(i=0;i<64;i++) { | for(i=0;i<64;i++) { | ||||
| @@ -67,10 +67,33 @@ int pix_abs16x16_x2_c(UINT8 *blk1, UINT8 *blk2, int lx, int h); | |||||
| int pix_abs16x16_y2_c(UINT8 *blk1, UINT8 *blk2, int lx, int h); | int pix_abs16x16_y2_c(UINT8 *blk1, UINT8 *blk2, int lx, int h); | ||||
| int pix_abs16x16_xy2_c(UINT8 *blk1, UINT8 *blk2, int lx, int h); | int pix_abs16x16_xy2_c(UINT8 *blk1, UINT8 *blk2, int lx, int h); | ||||
| #if defined (SIMPLE_IDCT) && defined (HAVE_MMX) | |||||
| static inline int block_permute_op(int j) | |||||
| { | |||||
| static const int table[64]={ | |||||
| 0x00, 0x08, 0x01, 0x09, 0x04, 0x0C, 0x05, 0x0D, | |||||
| 0x10, 0x18, 0x11, 0x19, 0x14, 0x1C, 0x15, 0x1D, | |||||
| 0x02, 0x0A, 0x03, 0x0B, 0x06, 0x0E, 0x07, 0x0F, | |||||
| 0x12, 0x1A, 0x13, 0x1B, 0x16, 0x1E, 0x17, 0x1F, | |||||
| 0x20, 0x28, 0x21, 0x29, 0x24, 0x2C, 0x25, 0x2D, | |||||
| 0x30, 0x38, 0x31, 0x39, 0x34, 0x3C, 0x35, 0x3D, | |||||
| 0x22, 0x2A, 0x23, 0x2B, 0x26, 0x2E, 0x27, 0x2F, | |||||
| 0x32, 0x3A, 0x33, 0x3B, 0x36, 0x3E, 0x37, 0x3F, | |||||
| }; | |||||
| return table[j]; | |||||
| } | |||||
| #elif defined (SIMPLE_IDCT) | |||||
| static inline int block_permute_op(int j) | |||||
| { | |||||
| return j; | |||||
| } | |||||
| #else | |||||
| static inline int block_permute_op(int j) | static inline int block_permute_op(int j) | ||||
| { | { | ||||
| return (j & 0x38) | ((j & 6) >> 1) | ((j & 1) << 2); | return (j & 0x38) | ((j & 6) >> 1) | ((j & 1) << 2); | ||||
| } | } | ||||
| #endif | |||||
| void block_permute(INT16 *block); | void block_permute(INT16 *block); | ||||
| @@ -554,7 +554,7 @@ static int mpeg4_pred_dc(MpegEncContext * s, int n, UINT16 **dc_val_ptr, int *di | |||||
| return pred; | return pred; | ||||
| } | } | ||||
| void mpeg4_pred_ac(MpegEncContext * s, INT16 *block, int n, | |||||
| void mpeg4_pred_ac(MpegEncContext * s, INT16 *block, int n, | |||||
| int dir) | int dir) | ||||
| { | { | ||||
| int x, y, wrap, i; | int x, y, wrap, i; | ||||
| @@ -579,22 +579,22 @@ void mpeg4_pred_ac(MpegEncContext * s, INT16 *block, int n, | |||||
| /* left prediction */ | /* left prediction */ | ||||
| ac_val -= 16; | ac_val -= 16; | ||||
| for(i=1;i<8;i++) { | for(i=1;i<8;i++) { | ||||
| block[i*8] += ac_val[i]; | |||||
| block[block_permute_op(i*8)] += ac_val[i]; | |||||
| } | } | ||||
| } else { | } else { | ||||
| /* top prediction */ | /* top prediction */ | ||||
| ac_val -= 16 * wrap; | ac_val -= 16 * wrap; | ||||
| for(i=1;i<8;i++) { | for(i=1;i<8;i++) { | ||||
| block[i] += ac_val[i + 8]; | |||||
| block[block_permute_op(i)] += ac_val[i + 8]; | |||||
| } | } | ||||
| } | } | ||||
| } | } | ||||
| /* left copy */ | /* left copy */ | ||||
| for(i=1;i<8;i++) | for(i=1;i<8;i++) | ||||
| ac_val1[i] = block[i * 8]; | |||||
| ac_val1[i] = block[block_permute_op(i * 8)]; | |||||
| /* top copy */ | /* top copy */ | ||||
| for(i=1;i<8;i++) | for(i=1;i<8;i++) | ||||
| ac_val1[8 + i] = block[i]; | |||||
| ac_val1[8 + i] = block[block_permute_op(i)]; | |||||
| } | } | ||||
| static inline void mpeg4_encode_dc(MpegEncContext * s, int level, int n, int *dir_ptr) | static inline void mpeg4_encode_dc(MpegEncContext * s, int level, int n, int *dir_ptr) | ||||
| @@ -20,6 +20,7 @@ | |||||
| */ | */ | ||||
| #include "../dsputil.h" | #include "../dsputil.h" | ||||
| #include "../simple_idct.h" | |||||
| int mm_flags; /* multimedia extension flags */ | int mm_flags; /* multimedia extension flags */ | ||||
| @@ -1047,5 +1048,9 @@ void dsputil_init_mmx(void) | |||||
| } else { | } else { | ||||
| ff_idct = ff_mmx_idct; | ff_idct = ff_mmx_idct; | ||||
| } | } | ||||
| #ifdef SIMPLE_IDCT | |||||
| // ff_idct = simple_idct; | |||||
| ff_idct = simple_idct_mmx; | |||||
| #endif | |||||
| } | } | ||||
| } | } | ||||