// of the sum U V + N Y to [EDI], leaving the remaining carry in
// XMM4, XMM5, and XMM6. The registers XMM0, XMM1, XMM2, XMM3, and
// XMM7 are clobbered; the general-purpose registers are preserved.
- stalloc 64 // space for the carries
+ stalloc 48 // space for the carries
endprologue
// Calculate W = U V, and leave it in the destination. Stash the
// carry in XMM4, XMM5, and XMM6. The registers XMM0, XMM1, XMM2,
// XMM3, and XMM7 are clobbered; the general-purpose registers are
// preserved.
- stalloc 64 // space for the carries
+ stalloc 48 // space for the carries
endprologue
movd xmm4, [edi + 0]
paddq xmm6, [esp + 32]
// And, with that, we're done.
- stfree 64
+ stfree 48
ret
ENDFUNC
INTFUNC(mont4)
// On entry, EDI points to the destination buffer holding a packed
- // value A; EBX points to a packed operand N; ESI points to an
+ // value W; EBX points to a packed operand N; ESI points to an
// expanded operand M; and EDX points to a place to store an expanded
// result Y (32 bytes, at a 16-byte boundary).
//