~mdw
/
catacomb
/ blobdiff
commit
grep
author
committer
pickaxe
?
search:
re
summary
|
shortlog
|
log
|
commit
|
commitdiff
|
tree
raw
|
inline
| side by side
math/mpx-mul4-*.S: Use more portable type syntax for ambiguous instructions.
[catacomb]
/
math
/
mpx-mul4-x86-sse2.S
diff --git
a/math/mpx-mul4-x86-sse2.S
b/math/mpx-mul4-x86-sse2.S
index
7e7173f
..
916adef
100644
(file)
--- a/
math/mpx-mul4-x86-sse2.S
+++ b/
math/mpx-mul4-x86-sse2.S
@@
-1054,9
+1054,9
@@
FUNC(mpxmont_redc4_x86_sse2)
// Continue carry propagation until the end of the buffer.
0: add [edi], eax
mov eax, 0 // preserves flags
// Continue carry propagation until the end of the buffer.
0: add [edi], eax
mov eax, 0 // preserves flags
- adcd [edi + 4], 0
- adcd [edi + 8], 0
- adcd [edi + 12], 0
+ adc dword ptr [edi + 4], 0
+ adc dword ptr [edi + 8], 0
+ adc dword ptr [edi + 12], 0
adc eax, 0
add edi, 16
cmp edi, esi
adc eax, 0
add edi, 16
cmp edi, esi
@@
-1286,6
+1286,8
@@
FUNC(test_mmul4)
mov edi, [BP + 28]
movdqa xmm0, [SP + 64]
movdqa xmm1, [SP + 80]
mov edi, [BP + 28]
movdqa xmm0, [SP + 64]
movdqa xmm1, [SP + 80]
+ pshufd xmm0, xmm0, SHUF(0, 2, 1, 3)
+ pshufd xmm1, xmm1, SHUF(0, 2, 1, 3)
movdqu [edi], xmm0
movdqu [edi + 16], xmm1
testcarryout [BP + 24]
movdqu [edi], xmm0
movdqu [edi + 16], xmm1
testcarryout [BP + 24]
@@
-1302,6
+1304,8
@@
FUNC(test_mmla4)
mov edi, [BP + 28]
movdqa xmm0, [SP + 64]
movdqa xmm1, [SP + 80]
mov edi, [BP + 28]
movdqa xmm0, [SP + 64]
movdqa xmm1, [SP + 80]
+ pshufd xmm0, xmm0, SHUF(0, 2, 1, 3)
+ pshufd xmm1, xmm1, SHUF(0, 2, 1, 3)
movdqu [edi], xmm0
movdqu [edi + 16], xmm1
testcarryout [BP + 24]
movdqu [edi], xmm0
movdqu [edi + 16], xmm1
testcarryout [BP + 24]
@@
-1318,6
+1322,8
@@
FUNC(test_mont4)
mov edi, [BP + 28]
movdqa xmm0, [SP + 64]
movdqa xmm1, [SP + 80]
mov edi, [BP + 28]
movdqa xmm0, [SP + 64]
movdqa xmm1, [SP + 80]
+ pshufd xmm0, xmm0, SHUF(0, 2, 1, 3)
+ pshufd xmm1, xmm1, SHUF(0, 2, 1, 3)
movdqu [edi], xmm0
movdqu [edi + 16], xmm1
testcarryout [BP + 24]
movdqu [edi], xmm0
movdqu [edi + 16], xmm1
testcarryout [BP + 24]