Skip to content
Snippets Groups Projects
Commit 52b6d962 authored by Michael Niedermayer
Browse files

Merge commit 'a344e5d0'


* commit 'a344e5d0':
  x86: bswapdsp: Don't treat 32-bit integers as 64-bit

Conflicts:
	libavcodec/x86/bswapdsp.asm

Merged-by: Michael Niedermayer <michael@niedermayer.cc>
parents c7c33ab7 a344e5d0
No related branches found
No related tags found
No related merge requests found
...@@ -32,8 +32,8 @@ SECTION_TEXT ...@@ -32,8 +32,8 @@ SECTION_TEXT
; %1 = aligned/unaligned ; %1 = aligned/unaligned
%macro BSWAP_LOOPS 1 %macro BSWAP_LOOPS 1
mov r3, r2 mov r3d, r2d
sar r2, 3 sar r2d, 3
jz .left4_%1 jz .left4_%1
.loop8_%1: .loop8_%1:
mov%1 m0, [r1 + 0] mov%1 m0, [r1 + 0]
...@@ -61,11 +61,11 @@ SECTION_TEXT ...@@ -61,11 +61,11 @@ SECTION_TEXT
%endif %endif
add r0, 32 add r0, 32
add r1, 32 add r1, 32
dec r2 dec r2d
jnz .loop8_%1 jnz .loop8_%1
.left4_%1: .left4_%1:
mov r2, r3 mov r2d, r3d
and r3, 4 test r3d, 4
jz .left jz .left
mov%1 m0, [r1] mov%1 m0, [r1]
%if cpuflag(ssse3) %if cpuflag(ssse3)
...@@ -95,7 +95,7 @@ cglobal bswap32_buf, 3,4,5 ...@@ -95,7 +95,7 @@ cglobal bswap32_buf, 3,4,5
mov r3, r1 mov r3, r1
%endif %endif
or r3, r0 or r3, r0
and r3, 15 test r3, 15
jz .start_align jz .start_align
BSWAP_LOOPS u BSWAP_LOOPS u
jmp .left jmp .left
...@@ -103,8 +103,7 @@ cglobal bswap32_buf, 3,4,5 ...@@ -103,8 +103,7 @@ cglobal bswap32_buf, 3,4,5
BSWAP_LOOPS a BSWAP_LOOPS a
.left: .left:
%if cpuflag(ssse3) %if cpuflag(ssse3)
mov r3, r2 test r2d, 2
and r2, 2
jz .left1 jz .left1
movq m0, [r1] movq m0, [r1]
pshufb m0, m2 pshufb m0, m2
...@@ -112,13 +111,13 @@ cglobal bswap32_buf, 3,4,5 ...@@ -112,13 +111,13 @@ cglobal bswap32_buf, 3,4,5
add r1, 8 add r1, 8
add r0, 8 add r0, 8
.left1: .left1:
and r3, 1 test r2d, 1
jz .end jz .end
mov r2d, [r1] mov r2d, [r1]
bswap r2d bswap r2d
mov [r0], r2d mov [r0], r2d
%else %else
and r2, 3 and r2d, 3
jz .end jz .end
.loop2: .loop2:
mov r3d, [r1] mov r3d, [r1]
...@@ -126,7 +125,7 @@ cglobal bswap32_buf, 3,4,5 ...@@ -126,7 +125,7 @@ cglobal bswap32_buf, 3,4,5
mov [r0], r3d mov [r0], r3d
add r1, 4 add r1, 4
add r0, 4 add r0, 4
dec r2 dec r2d
jnz .loop2 jnz .loop2
%endif %endif
.end: .end:
......
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Please register or sign in to comment