X-Git-Url: https://git.distorted.org.uk/~mdw/catacomb/blobdiff_plain/a90d420cbe87490c844ae422c966e746d3134b07..a1a9ee0a7240087e202a7855e470573de0e59c09:/math/mpx-mul4-x86-sse2.S diff --git a/math/mpx-mul4-x86-sse2.S b/math/mpx-mul4-x86-sse2.S index ba7ae6a3..2f7b5ec9 100644 --- a/math/mpx-mul4-x86-sse2.S +++ b/math/mpx-mul4-x86-sse2.S @@ -316,7 +316,6 @@ INTFUNC(carryprop) propout [edi + 8], xmm6, nil endprop [edi + 12], xmm6, xmm4 ret - ENDFUNC INTFUNC(dmul4) @@ -348,7 +347,6 @@ INTFUNC(dmul4) propout [edi + 12], xmm7, xmm4 ret - ENDFUNC INTFUNC(dmla4) @@ -384,7 +382,6 @@ INTFUNC(dmla4) propout [edi + 12], xmm7, xmm4 ret - ENDFUNC INTFUNC(mul4zc) @@ -410,7 +407,6 @@ INTFUNC(mul4zc) propout [edi + 12], xmm7, xmm4 ret - ENDFUNC INTFUNC(mul4) @@ -438,7 +434,6 @@ INTFUNC(mul4) propout [edi + 12], xmm7, xmm4 ret - ENDFUNC INTFUNC(mla4zc) @@ -470,7 +465,6 @@ INTFUNC(mla4zc) propout [edi + 12], xmm7, xmm4 ret - ENDFUNC INTFUNC(mla4) @@ -501,7 +495,6 @@ INTFUNC(mla4) propout [edi + 12], xmm7, xmm4 ret - ENDFUNC INTFUNC(mmul4) @@ -523,7 +516,6 @@ INTFUNC(mmul4) mulcore [eax + 0], ecx, xmm4, xmm5, xmm6, xmm7 propout [edi + 0], xmm4, xmm5 jmp 5f - ENDFUNC INTFUNC(mmla4) @@ -613,7 +605,6 @@ INTFUNC(mmla4) // And, with that, we're done. stfree 48 + 12 ret - ENDFUNC INTFUNC(mont4) @@ -670,7 +661,6 @@ INTFUNC(mont4) // And, with that, we're done. ret - ENDFUNC ///-------------------------------------------------------------------------- @@ -706,8 +696,8 @@ FUNC(mpx_umul4_x86_sse2) pushreg esi pushreg edi setfp + stalloc 32 and SP, ~15 - sub SP, 32 endprologue // Prepare for the first iteration. @@ -781,7 +771,6 @@ FUNC(mpx_umul4_x86_sse2) pop ebx pop BP ret - ENDFUNC FUNC(mpxmont_mul4_x86_avx) @@ -821,8 +810,8 @@ FUNC(mpxmont_mul4_x86_sse2) pushreg esi pushreg edi setfp + stalloc 112 and SP, ~15 - sub SP, 112 endprologue // Establish the expanded operands. @@ -930,7 +919,6 @@ FUNC(mpxmont_mul4_x86_sse2) popreg ebx popreg BP ret - ENDFUNC FUNC(mpxmont_redc4_x86_avx) @@ -968,7 +956,7 @@ FUNC(mpxmont_redc4_x86_sse2) pushreg edi setfp and SP, ~15 - sub SP, 76 + stalloc 76 endprologue // Establish the expanded operands and the blocks-of-4 dv limit. @@ -1064,7 +1052,6 @@ FUNC(mpxmont_redc4_x86_sse2) popreg ebx popreg BP ret - ENDFUNC ///-------------------------------------------------------------------------- @@ -1096,8 +1083,8 @@ ENDFUNC pushreg esi pushreg edi setfp + stalloc 3*32 + 4*4 and SP, ~15 - sub SP, 3*32 + 4*4 endprologue mov eax, \n mov [SP + 104], eax