Browse Source

x86inc: Use SSE instead of SSE2 for copying data

Reduces code size because movaps/movups are each one byte
shorter than movdqa/movdqu (the SSE forms need no 66h/F3h prefix byte).

Signed-off-by: Derek Buitenhuis <derek.buitenhuis@gmail.com>
tags/n2.1
Henrik Gramner Derek Buitenhuis 12 years ago
parent
commit
63f0d62310
1 changed file with 2 additions and 2 deletions
  1. +2
    -2
      libavutil/x86/x86inc.asm

+ 2
- 2
libavutil/x86/x86inc.asm View File

@@ -436,7 +436,7 @@ DECLARE_REG 14, R15, 120
%assign %%i xmm_regs_used
%rep (xmm_regs_used-6)
%assign %%i %%i-1
- movdqa [rsp + (%%i-6)*16 + stack_size + (~stack_offset&8)], xmm %+ %%i
+ movaps [rsp + (%%i-6)*16 + stack_size + (~stack_offset&8)], xmm %+ %%i
%endrep
%endmacro

@@ -454,7 +454,7 @@ DECLARE_REG 14, R15, 120
%assign %%i xmm_regs_used
%rep (xmm_regs_used-6)
%assign %%i %%i-1
- movdqa xmm %+ %%i, [%1 + (%%i-6)*16+stack_size+(~stack_offset&8)]
+ movaps xmm %+ %%i, [%1 + (%%i-6)*16+stack_size+(~stack_offset&8)]
%endrep
%if stack_size_padded == 0
add %1, (xmm_regs_used-6)*16+16


Loading…
Cancel
Save