; Don't even think of reading this code
; It was automatically generated by bn-586.pl
; Which is a perl program used to generate the x86 assembler for
; any of elf, a.out, BSDI, Win32, or Solaris
; eric <eay@cryptsoft.com>
;
|
|
TITLE bn-586.asm
|
|
.386
|
|
.model FLAT
|
|
_TEXT SEGMENT
|
|
PUBLIC _bn_mul_add_words
|
|
|
|
;-----------------------------------------------------------------------
; MAW_ROUND disp
; One multiply-accumulate step on the 32-bit word at byte offset `disp`:
;   edx:eax = (word at disp[ebx]) * ebp + esi + (word at disp[edi])
; The low half is written back to disp[edi]; the high half becomes the
; carry in esi for the next step.  Touches eax, edx, esi and flags only,
; so the loop counter in ecx survives.
;-----------------------------------------------------------------------
MAW_ROUND MACRO disp
        mov     eax, DWORD PTR disp[ebx]        ; multiplicand word
        mul     ebp                             ; edx:eax = word * multiplier
        add     eax, esi                        ; + carry from previous step
        mov     esi, DWORD PTR disp[edi]        ; current destination word
        adc     edx, 0
        add     eax, esi                        ; + destination word
        adc     edx, 0
        mov     DWORD PTR disp[edi], eax        ; store low half in place
        mov     esi, edx                        ; high half = next carry
ENDM

;-----------------------------------------------------------------------
; _bn_mul_add_words
; Multiplies an array of 32-bit words by a single word and adds the
; products, with carry propagation, into a second array in place.
;
; Stack arguments (offsets valid after the four pushes below):
;   20[esp]  pointer to the array that is read and updated     -> edi
;   24[esp]  pointer to the array that is multiplied           -> ebx
;   28[esp]  number of words to process                        -> ecx
;   32[esp]  32-bit multiplier                                 -> ebp
; Returns:  eax = carry word left over after the last element.
; Saves and restores ebp, ebx, esi, edi; overwrites eax, ecx, edx, flags.
;
; NOTE(review): OpenSSL declares this routine as
;   BN_ULONG bn_mul_add_words(BN_ULONG *rp, const BN_ULONG *ap,
;                             int num, BN_ULONG w)
; -- confirm against the project's bn header.
;
; The word count is split into (count AND NOT 7) words handled by an
; 8-way unrolled loop and (count AND 7) words handled by a straight-line
; tail.  The loop counter lives in ecx for the whole loop: no instruction
; in MAW_ROUND writes ecx, so it does not need a stack slot.
;-----------------------------------------------------------------------
_bn_mul_add_words PROC NEAR
        push    ebp
        push    ebx
        push    esi
        push    edi

        xor     esi, esi                        ; running carry = 0
        mov     edi, DWORD PTR 20[esp]
        mov     ebx, DWORD PTR 24[esp]
        mov     ebp, DWORD PTR 32[esp]
        mov     ecx, DWORD PTR 28[esp]
        and     ecx, 4294967288                 ; words covered by the unrolled loop
        jz      $L000maw_finish

L001maw_loop:
        MAW_ROUND 0
        MAW_ROUND 4
        MAW_ROUND 8
        MAW_ROUND 12
        MAW_ROUND 16
        MAW_ROUND 20
        MAW_ROUND 24
        MAW_ROUND 28
        add     ebx, 32                         ; advance both pointers by 8 words
        add     edi, 32
        sub     ecx, 8
        jnz     L001maw_loop

$L000maw_finish:
        mov     ecx, DWORD PTR 28[esp]
        and     ecx, 7                          ; 0..7 words remain
        jz      $L003maw_end

        MAW_ROUND 0
        dec     ecx
        jz      $L003maw_end
        MAW_ROUND 4
        dec     ecx
        jz      $L003maw_end
        MAW_ROUND 8
        dec     ecx
        jz      $L003maw_end
        MAW_ROUND 12
        dec     ecx
        jz      $L003maw_end
        MAW_ROUND 16
        dec     ecx
        jz      $L003maw_end
        MAW_ROUND 20
        dec     ecx
        jz      $L003maw_end
        MAW_ROUND 24                            ; seventh and last possible tail word

$L003maw_end:
        mov     eax, esi                        ; return the final carry
        pop     edi
        pop     esi
        pop     ebx
        pop     ebp
        ret
_bn_mul_add_words ENDP
|
|
_TEXT ENDS
|
|
_TEXT SEGMENT
|
|
PUBLIC _bn_mul_words
|
|
|
|
;-----------------------------------------------------------------------
; MW_STEP disp
; One multiply step on the word at byte offset `disp`:
;   edx:eax = (word at disp[ebx]) * ecx + esi
; Low half goes to disp[edi]; high half is kept in esi as the carry.
;-----------------------------------------------------------------------
MW_STEP MACRO disp
        mov     eax, DWORD PTR disp[ebx]
        mul     ecx
        add     eax, esi
        adc     edx, 0
        mov     DWORD PTR disp[edi], eax
        mov     esi, edx
ENDM

;-----------------------------------------------------------------------
; _bn_mul_words
; Multiplies an array of 32-bit words by a single word, writing the low
; halves of the running products to a destination array.
;
; Stack arguments (offsets valid after the four pushes below):
;   20[esp]  destination pointer                  -> edi
;   24[esp]  source pointer                       -> ebx
;   28[esp]  number of words                      -> ebp
;   32[esp]  32-bit multiplier                    -> ecx
; Returns:  eax = carry word after the last element.
; Saves and restores ebp, ebx, esi, edi; overwrites eax, ecx, edx, flags.
;
; Words are processed eight at a time while (count AND NOT 7) lasts,
; then up to seven leftovers are handled one by one.
;-----------------------------------------------------------------------
_bn_mul_words PROC NEAR
        push    ebp
        push    ebx
        push    esi
        push    edi

        mov     edi, DWORD PTR 20[esp]
        mov     ebx, DWORD PTR 24[esp]
        mov     ecx, DWORD PTR 32[esp]
        mov     ebp, DWORD PTR 28[esp]
        xor     esi, esi                        ; carry starts at zero
        and     ebp, 4294967288                 ; words for the unrolled loop
        jz      mw_leftover

mw_unrolled:
        MW_STEP 0
        MW_STEP 4
        MW_STEP 8
        MW_STEP 12
        MW_STEP 16
        MW_STEP 20
        MW_STEP 24
        MW_STEP 28
        add     ebx, 32
        add     edi, 32
        sub     ebp, 8
        jnz     mw_unrolled

mw_leftover:
        mov     ebp, DWORD PTR 28[esp]
        and     ebp, 7                          ; 0..7 words still to do
        jz      mw_done

        MW_STEP 0
        dec     ebp
        jz      mw_done
        MW_STEP 4
        dec     ebp
        jz      mw_done
        MW_STEP 8
        dec     ebp
        jz      mw_done
        MW_STEP 12
        dec     ebp
        jz      mw_done
        MW_STEP 16
        dec     ebp
        jz      mw_done
        MW_STEP 20
        dec     ebp
        jz      mw_done
        MW_STEP 24

mw_done:
        mov     eax, esi                        ; hand back the carry
        pop     edi
        pop     esi
        pop     ebx
        pop     ebp
        ret
_bn_mul_words ENDP
|
|
_TEXT ENDS
|
|
_TEXT SEGMENT
|
|
PUBLIC _bn_sqr_words
|
|
|
|
;-----------------------------------------------------------------------
; SQW_STEP src, dlo, dhi
; Squares the 32-bit word at src[edi] and stores the 64-bit result as
; two words: low half at dlo[esi], high half at dhi[esi].
;-----------------------------------------------------------------------
SQW_STEP MACRO src, dlo, dhi
        mov     eax, DWORD PTR src[edi]
        mul     eax                             ; edx:eax = word * word
        mov     DWORD PTR dlo[esi], eax
        mov     DWORD PTR dhi[esi], edx
ENDM

;-----------------------------------------------------------------------
; _bn_sqr_words
; Squares each 32-bit word of a source array independently and writes
; every 64-bit square as two consecutive words of the destination, so
; the destination receives twice as many words as are read.
;
; Stack arguments (offsets valid after the four pushes below):
;   20[esp]  destination pointer                  -> esi
;   24[esp]  source pointer                       -> edi
;   28[esp]  number of source words               -> ebx
; No return value is set up.
; Saves and restores ebp, ebx, esi, edi; overwrites eax, edx, flags.
;-----------------------------------------------------------------------
_bn_sqr_words PROC NEAR
        push    ebp
        push    ebx
        push    esi
        push    edi

        mov     edi, DWORD PTR 24[esp]
        mov     esi, DWORD PTR 20[esp]
        mov     ebx, DWORD PTR 28[esp]
        and     ebx, 4294967288                 ; source words for the unrolled loop
        jz      sqw_leftover

sqw_unrolled:
        SQW_STEP 0, 0, 4
        SQW_STEP 4, 8, 12
        SQW_STEP 8, 16, 20
        SQW_STEP 12, 24, 28
        SQW_STEP 16, 32, 36
        SQW_STEP 20, 40, 44
        SQW_STEP 24, 48, 52
        SQW_STEP 28, 56, 60
        add     edi, 32                         ; 8 source words consumed
        add     esi, 64                         ; 16 destination words produced
        sub     ebx, 8
        jnz     sqw_unrolled

sqw_leftover:
        mov     ebx, DWORD PTR 28[esp]
        and     ebx, 7                          ; 0..7 source words remain
        jz      sqw_done

        SQW_STEP 0, 0, 4
        dec     ebx
        jz      sqw_done
        SQW_STEP 4, 8, 12
        dec     ebx
        jz      sqw_done
        SQW_STEP 8, 16, 20
        dec     ebx
        jz      sqw_done
        SQW_STEP 12, 24, 28
        dec     ebx
        jz      sqw_done
        SQW_STEP 16, 32, 36
        dec     ebx
        jz      sqw_done
        SQW_STEP 20, 40, 44
        dec     ebx
        jz      sqw_done
        SQW_STEP 24, 48, 52

sqw_done:
        pop     edi
        pop     esi
        pop     ebx
        pop     ebp
        ret
_bn_sqr_words ENDP
|
|
_TEXT ENDS
|
|
_TEXT SEGMENT
|
|
PUBLIC _bn_div_words
|
|
|
|
;-----------------------------------------------------------------------
; _bn_div_words
; Divides the 64-bit value formed by two 32-bit stack arguments by a
; 32-bit divisor using a single DIV instruction.
;
; Stack arguments (no registers are pushed, so offsets are from entry):
;    4[esp]  high word of the dividend            -> edx
;    8[esp]  low word of the dividend             -> eax
;   12[esp]  divisor                              -> ecx
; Returns:  eax = quotient, or 4294967295 (all bits set) when the
;           divisor is zero.
; Overwrites eax, ecx, edx and flags only, the same scratch registers
; the other routines in this file use without saving, so nothing has
; to be saved or restored.
;
; A zero divisor is answered with an all-ones result instead of letting
; DIV raise a divide error.
; NOTE(review): OpenSSL's portable C bn_div_words is understood to
; return BN_MASK2 for d == 0 -- confirm against bn_asm.c.
;
; Precondition that is NOT checked: the high word must be smaller than
; the divisor.  Otherwise the quotient does not fit in 32 bits and DIV
; still raises a divide error.
;-----------------------------------------------------------------------
_bn_div_words PROC NEAR
        mov     ecx, DWORD PTR 12[esp]          ; divisor
        mov     edx, DWORD PTR 4[esp]           ; dividend, high word
        mov     eax, DWORD PTR 8[esp]           ; dividend, low word
        test    ecx, ecx
        jz      dw_zero_divisor
        div     ecx                             ; eax = quotient, edx = remainder
        ret

dw_zero_divisor:
        mov     eax, 4294967295                 ; all-ones marks "no valid quotient"
        ret
_bn_div_words ENDP
|
|
_TEXT ENDS
|
|
_TEXT SEGMENT
|
|
PUBLIC _bn_add_words
|
|
|
|
;-----------------------------------------------------------------------
; ADDW_STEP disp
; Adds the words at disp[esi] and disp[edi] plus the incoming carry in
; eax (0 or 1), stores the 32-bit sum at disp[ebx] and leaves the
; outgoing carry (0 or 1) in eax.
; eax is cleared with MOV rather than XOR because the carry flag from
; the first ADD must still be intact for the following ADC.
;-----------------------------------------------------------------------
ADDW_STEP MACRO disp
        mov     ecx, DWORD PTR disp[esi]
        mov     edx, DWORD PTR disp[edi]
        add     ecx, eax                        ; first operand + carry in
        mov     eax, 0                          ; keeps CF, unlike xor
        adc     eax, eax                        ; eax = carry of that add
        add     ecx, edx                        ; + second operand
        adc     eax, 0                          ; fold in the second carry
        mov     DWORD PTR disp[ebx], ecx
ENDM

;-----------------------------------------------------------------------
; _bn_add_words
; Adds two arrays of 32-bit words element by element with carry
; propagation and stores the sums in a third array.
;
; Stack arguments (offsets valid after the four pushes below):
;   20[esp]  destination pointer                  -> ebx
;   24[esp]  first source pointer                 -> esi
;   28[esp]  second source pointer                -> edi
;   32[esp]  number of words                      -> ebp
; Returns:  eax = carry out of the last word (0 or 1).
; Saves and restores ebp, ebx, esi, edi; overwrites eax, ecx, edx, flags.
;-----------------------------------------------------------------------
_bn_add_words PROC NEAR
        push    ebp
        push    ebx
        push    esi
        push    edi

        mov     esi, DWORD PTR 24[esp]
        mov     edi, DWORD PTR 28[esp]
        mov     ebx, DWORD PTR 20[esp]
        mov     ebp, DWORD PTR 32[esp]
        xor     eax, eax                        ; no carry into the first word
        and     ebp, 4294967288                 ; words for the unrolled loop
        jz      addw_leftover

addw_unrolled:
        ADDW_STEP 0
        ADDW_STEP 4
        ADDW_STEP 8
        ADDW_STEP 12
        ADDW_STEP 16
        ADDW_STEP 20
        ADDW_STEP 24
        ADDW_STEP 28
        add     esi, 32
        add     edi, 32
        add     ebx, 32
        sub     ebp, 8
        jnz     addw_unrolled

addw_leftover:
        mov     ebp, DWORD PTR 32[esp]
        and     ebp, 7                          ; 0..7 words remain
        jz      addw_done

        ADDW_STEP 0
        dec     ebp
        jz      addw_done
        ADDW_STEP 4
        dec     ebp
        jz      addw_done
        ADDW_STEP 8
        dec     ebp
        jz      addw_done
        ADDW_STEP 12
        dec     ebp
        jz      addw_done
        ADDW_STEP 16
        dec     ebp
        jz      addw_done
        ADDW_STEP 20
        dec     ebp
        jz      addw_done
        ADDW_STEP 24

addw_done:
        pop     edi                             ; eax already holds the carry
        pop     esi
        pop     ebx
        pop     ebp
        ret
_bn_add_words ENDP
|
|
_TEXT ENDS
|
|
_TEXT SEGMENT
|
|
PUBLIC _bn_sub_words
|
|
|
|
;-----------------------------------------------------------------------
; SUBW_STEP disp
; Computes (word at disp[esi]) - borrow in eax - (word at disp[edi]),
; stores the 32-bit difference at disp[ebx] and leaves the outgoing
; borrow (0 or 1) in eax.
; eax is cleared with MOV rather than XOR because the carry flag from
; the first SUB must still be intact for the following ADC.
;-----------------------------------------------------------------------
SUBW_STEP MACRO disp
        mov     ecx, DWORD PTR disp[esi]
        mov     edx, DWORD PTR disp[edi]
        sub     ecx, eax                        ; minuend - borrow in
        mov     eax, 0                          ; keeps CF, unlike xor
        adc     eax, eax                        ; eax = borrow of that sub
        sub     ecx, edx                        ; - subtrahend
        adc     eax, 0                          ; fold in the second borrow
        mov     DWORD PTR disp[ebx], ecx
ENDM

;-----------------------------------------------------------------------
; _bn_sub_words
; Subtracts one array of 32-bit words from another element by element
; with borrow propagation and stores the differences in a third array.
;
; Stack arguments (offsets valid after the four pushes below):
;   20[esp]  destination pointer                  -> ebx
;   24[esp]  minuend pointer                      -> esi
;   28[esp]  subtrahend pointer                   -> edi
;   32[esp]  number of words                      -> ebp
; Returns:  eax = borrow out of the last word (0 or 1).
; Saves and restores ebp, ebx, esi, edi; overwrites eax, ecx, edx, flags.
;-----------------------------------------------------------------------
_bn_sub_words PROC NEAR
        push    ebp
        push    ebx
        push    esi
        push    edi

        mov     esi, DWORD PTR 24[esp]
        mov     edi, DWORD PTR 28[esp]
        mov     ebx, DWORD PTR 20[esp]
        mov     ebp, DWORD PTR 32[esp]
        xor     eax, eax                        ; no borrow into the first word
        and     ebp, 4294967288                 ; words for the unrolled loop
        jz      subw_leftover

subw_unrolled:
        SUBW_STEP 0
        SUBW_STEP 4
        SUBW_STEP 8
        SUBW_STEP 12
        SUBW_STEP 16
        SUBW_STEP 20
        SUBW_STEP 24
        SUBW_STEP 28
        add     esi, 32
        add     edi, 32
        add     ebx, 32
        sub     ebp, 8
        jnz     subw_unrolled

subw_leftover:
        mov     ebp, DWORD PTR 32[esp]
        and     ebp, 7                          ; 0..7 words remain
        jz      subw_done

        SUBW_STEP 0
        dec     ebp
        jz      subw_done
        SUBW_STEP 4
        dec     ebp
        jz      subw_done
        SUBW_STEP 8
        dec     ebp
        jz      subw_done
        SUBW_STEP 12
        dec     ebp
        jz      subw_done
        SUBW_STEP 16
        dec     ebp
        jz      subw_done
        SUBW_STEP 20
        dec     ebp
        jz      subw_done
        SUBW_STEP 24

subw_done:
        pop     edi                             ; eax already holds the borrow
        pop     esi
        pop     ebx
        pop     ebp
        ret
_bn_sub_words ENDP
|
|
_TEXT ENDS
|
|
_TEXT SEGMENT
|
|
PUBLIC _bn_mul_comba8
|
|
|
|
;-----------------------------------------------------------------------
; C8_MAC acc0, acc1, acc2, nexta, nextb
; Multiplies the operand pair already sitting in eax and edx, adds the
; 64-bit product into the three-register accumulator acc2:acc1:acc0,
; and, interleaved with the carry chain, preloads the next pair:
; eax from nexta[esi] and edx from nextb[edi].  The MOVs between ADD
; and ADC leave the flags untouched.
;-----------------------------------------------------------------------
C8_MAC MACRO acc0, acc1, acc2, nexta, nextb
        mul     edx
        add     acc0, eax
        mov     eax, DWORD PTR nexta[esi]
        adc     acc1, edx
        mov     edx, DWORD PTR nextb[edi]
        adc     acc2, 0
ENDM

;-----------------------------------------------------------------------
; C8_MAC_STORE acc0, acc1, acc2, roff, nexta, nextb
; Last product of a result column: accumulates like C8_MAC, then writes
; acc0 to byte offset roff of the result array (pointer reloaded from
; 20[esp]) and preloads the first operand pair of the next column.
;-----------------------------------------------------------------------
C8_MAC_STORE MACRO acc0, acc1, acc2, roff, nexta, nextb
        mul     edx
        add     acc0, eax
        mov     eax, DWORD PTR 20[esp]          ; result pointer
        adc     acc1, edx
        mov     edx, DWORD PTR nextb[edi]
        adc     acc2, 0
        mov     DWORD PTR roff[eax], acc0
        mov     eax, DWORD PTR nexta[esi]
ENDM

;-----------------------------------------------------------------------
; _bn_mul_comba8
; Full 8-word by 8-word multiplication producing a 16-word result,
; computed one result column at a time: for column k every product
; a[i]*b[j] with i + j = k is summed into a three-word accumulator and
; the lowest accumulator word is stored as result word k.
;
; Stack arguments (offsets valid after the four pushes below):
;   20[esp]  result pointer (16 words written)
;   24[esp]  first operand pointer,  8 words read  -> esi  ("a")
;   28[esp]  second operand pointer, 8 words read  -> edi  ("b")
; No return value is set up.
; Saves and restores esi, edi, ebp, ebx; overwrites eax, ecx, edx, flags.
;
; ebx, ecx and ebp take turns as the low, middle and high accumulator
; words; the register just stored is cleared and becomes the new high
; word of the next column.
;-----------------------------------------------------------------------
_bn_mul_comba8 PROC NEAR
        push    esi
        push    edi
        push    ebp
        push    ebx
        mov     esi, DWORD PTR 24[esp]
        mov     edi, DWORD PTR 28[esp]
        xor     ebx, ebx
        xor     ecx, ecx
        mov     eax, DWORD PTR [esi]            ; a[0]
        mov     edx, DWORD PTR [edi]            ; b[0]

        ; ---- column 0: a0*b0
        xor     ebp, ebp
        C8_MAC_STORE ebx, ecx, ebp, 0, 4, 0

        ; ---- column 1: a1*b0 a0*b1
        xor     ebx, ebx
        C8_MAC       ecx, ebp, ebx, 0, 4
        C8_MAC_STORE ecx, ebp, ebx, 4, 8, 0

        ; ---- column 2: a2*b0 a1*b1 a0*b2
        xor     ecx, ecx
        C8_MAC       ebp, ebx, ecx, 4, 4
        C8_MAC       ebp, ebx, ecx, 0, 8
        C8_MAC_STORE ebp, ebx, ecx, 8, 12, 0

        ; ---- column 3: a3*b0 .. a0*b3
        xor     ebp, ebp
        C8_MAC       ebx, ecx, ebp, 8, 4
        C8_MAC       ebx, ecx, ebp, 4, 8
        C8_MAC       ebx, ecx, ebp, 0, 12
        C8_MAC_STORE ebx, ecx, ebp, 12, 16, 0

        ; ---- column 4: a4*b0 .. a0*b4
        xor     ebx, ebx
        C8_MAC       ecx, ebp, ebx, 12, 4
        C8_MAC       ecx, ebp, ebx, 8, 8
        C8_MAC       ecx, ebp, ebx, 4, 12
        C8_MAC       ecx, ebp, ebx, 0, 16
        C8_MAC_STORE ecx, ebp, ebx, 16, 20, 0

        ; ---- column 5: a5*b0 .. a0*b5
        xor     ecx, ecx
        C8_MAC       ebp, ebx, ecx, 16, 4
        C8_MAC       ebp, ebx, ecx, 12, 8
        C8_MAC       ebp, ebx, ecx, 8, 12
        C8_MAC       ebp, ebx, ecx, 4, 16
        C8_MAC       ebp, ebx, ecx, 0, 20
        C8_MAC_STORE ebp, ebx, ecx, 20, 24, 0

        ; ---- column 6: a6*b0 .. a0*b6
        xor     ebp, ebp
        C8_MAC       ebx, ecx, ebp, 20, 4
        C8_MAC       ebx, ecx, ebp, 16, 8
        C8_MAC       ebx, ecx, ebp, 12, 12
        C8_MAC       ebx, ecx, ebp, 8, 16
        C8_MAC       ebx, ecx, ebp, 4, 20
        C8_MAC       ebx, ecx, ebp, 0, 24
        C8_MAC_STORE ebx, ecx, ebp, 24, 28, 0

        ; ---- column 7: a7*b0 .. a0*b7
        xor     ebx, ebx
        C8_MAC       ecx, ebp, ebx, 24, 4
        C8_MAC       ecx, ebp, ebx, 20, 8
        C8_MAC       ecx, ebp, ebx, 16, 12
        C8_MAC       ecx, ebp, ebx, 12, 16
        C8_MAC       ecx, ebp, ebx, 8, 20
        C8_MAC       ecx, ebp, ebx, 4, 24
        C8_MAC       ecx, ebp, ebx, 0, 28
        C8_MAC_STORE ecx, ebp, ebx, 28, 28, 4

        ; ---- column 8: a7*b1 .. a1*b7
        xor     ecx, ecx
        C8_MAC       ebp, ebx, ecx, 24, 8
        C8_MAC       ebp, ebx, ecx, 20, 12
        C8_MAC       ebp, ebx, ecx, 16, 16
        C8_MAC       ebp, ebx, ecx, 12, 20
        C8_MAC       ebp, ebx, ecx, 8, 24
        C8_MAC       ebp, ebx, ecx, 4, 28
        C8_MAC_STORE ebp, ebx, ecx, 32, 28, 8

        ; ---- column 9: a7*b2 .. a2*b7
        xor     ebp, ebp
        C8_MAC       ebx, ecx, ebp, 24, 12
        C8_MAC       ebx, ecx, ebp, 20, 16
        C8_MAC       ebx, ecx, ebp, 16, 20
        C8_MAC       ebx, ecx, ebp, 12, 24
        C8_MAC       ebx, ecx, ebp, 8, 28
        C8_MAC_STORE ebx, ecx, ebp, 36, 28, 12

        ; ---- column 10: a7*b3 .. a3*b7
        xor     ebx, ebx
        C8_MAC       ecx, ebp, ebx, 24, 16
        C8_MAC       ecx, ebp, ebx, 20, 20
        C8_MAC       ecx, ebp, ebx, 16, 24
        C8_MAC       ecx, ebp, ebx, 12, 28
        C8_MAC_STORE ecx, ebp, ebx, 40, 28, 16

        ; ---- column 11: a7*b4 .. a4*b7
        xor     ecx, ecx
        C8_MAC       ebp, ebx, ecx, 24, 20
        C8_MAC       ebp, ebx, ecx, 20, 24
        C8_MAC       ebp, ebx, ecx, 16, 28
        C8_MAC_STORE ebp, ebx, ecx, 44, 28, 20

        ; ---- column 12: a7*b5 a6*b6 a5*b7
        xor     ebp, ebp
        C8_MAC       ebx, ecx, ebp, 24, 24
        C8_MAC       ebx, ecx, ebp, 20, 28
        C8_MAC_STORE ebx, ecx, ebp, 48, 28, 24

        ; ---- column 13: a7*b6 a6*b7
        xor     ebx, ebx
        C8_MAC       ecx, ebp, ebx, 24, 28
        C8_MAC_STORE ecx, ebp, ebx, 52, 28, 28

        ; ---- column 14: a7*b7, plus the final carry word (column 15)
        xor     ecx, ecx
        mul     edx
        add     ebp, eax
        mov     eax, DWORD PTR 20[esp]          ; result pointer
        adc     ebx, edx
        adc     ecx, 0
        mov     DWORD PTR 56[eax], ebp          ; result word 14
        mov     DWORD PTR 60[eax], ebx          ; result word 15

        pop     ebx
        pop     ebp
        pop     edi
        pop     esi
        ret
_bn_mul_comba8 ENDP
|
|
_TEXT ENDS
|
|
_TEXT SEGMENT
|
|
PUBLIC _bn_mul_comba4
|
|
|
|
;-----------------------------------------------------------------------
; C4_MAC acc0, acc1, acc2, nexta, nextb
; Multiplies the operand pair already sitting in eax and edx, adds the
; 64-bit product into the three-register accumulator acc2:acc1:acc0,
; and, interleaved with the carry chain, preloads the next pair:
; eax from nexta[esi] and edx from nextb[edi].  The MOVs between ADD
; and ADC leave the flags untouched.
;-----------------------------------------------------------------------
C4_MAC MACRO acc0, acc1, acc2, nexta, nextb
        mul     edx
        add     acc0, eax
        mov     eax, DWORD PTR nexta[esi]
        adc     acc1, edx
        mov     edx, DWORD PTR nextb[edi]
        adc     acc2, 0
ENDM

;-----------------------------------------------------------------------
; C4_MAC_STORE acc0, acc1, acc2, roff, nexta, nextb
; Last product of a result column: accumulates like C4_MAC, then writes
; acc0 to byte offset roff of the result array (pointer reloaded from
; 20[esp]) and preloads the first operand pair of the next column.
;-----------------------------------------------------------------------
C4_MAC_STORE MACRO acc0, acc1, acc2, roff, nexta, nextb
        mul     edx
        add     acc0, eax
        mov     eax, DWORD PTR 20[esp]          ; result pointer
        adc     acc1, edx
        mov     edx, DWORD PTR nextb[edi]
        adc     acc2, 0
        mov     DWORD PTR roff[eax], acc0
        mov     eax, DWORD PTR nexta[esi]
ENDM

;-----------------------------------------------------------------------
; _bn_mul_comba4
; Full 4-word by 4-word multiplication producing an 8-word result,
; computed one result column at a time: for column k every product
; a[i]*b[j] with i + j = k is summed into a three-word accumulator and
; the lowest accumulator word is stored as result word k.
;
; Stack arguments (offsets valid after the four pushes below):
;   20[esp]  result pointer (8 words written)
;   24[esp]  first operand pointer,  4 words read  -> esi  ("a")
;   28[esp]  second operand pointer, 4 words read  -> edi  ("b")
; No return value is set up.
; Saves and restores esi, edi, ebp, ebx; overwrites eax, ecx, edx, flags.
;
; ebx, ecx and ebp take turns as the low, middle and high accumulator
; words; the register just stored is cleared and becomes the new high
; word of the next column.
;-----------------------------------------------------------------------
_bn_mul_comba4 PROC NEAR
        push    esi
        push    edi
        push    ebp
        push    ebx
        mov     esi, DWORD PTR 24[esp]
        mov     edi, DWORD PTR 28[esp]
        xor     ebx, ebx
        xor     ecx, ecx
        mov     eax, DWORD PTR [esi]            ; a[0]
        mov     edx, DWORD PTR [edi]            ; b[0]

        ; ---- column 0: a0*b0
        xor     ebp, ebp
        C4_MAC_STORE ebx, ecx, ebp, 0, 4, 0

        ; ---- column 1: a1*b0 a0*b1
        xor     ebx, ebx
        C4_MAC       ecx, ebp, ebx, 0, 4
        C4_MAC_STORE ecx, ebp, ebx, 4, 8, 0

        ; ---- column 2: a2*b0 a1*b1 a0*b2
        xor     ecx, ecx
        C4_MAC       ebp, ebx, ecx, 4, 4
        C4_MAC       ebp, ebx, ecx, 0, 8
        C4_MAC_STORE ebp, ebx, ecx, 8, 12, 0

        ; ---- column 3: a3*b0 a2*b1 a1*b2 a0*b3
        xor     ebp, ebp
        C4_MAC       ebx, ecx, ebp, 8, 4
        C4_MAC       ebx, ecx, ebp, 4, 8
        C4_MAC       ebx, ecx, ebp, 0, 12
        C4_MAC_STORE ebx, ecx, ebp, 12, 12, 4

        ; ---- column 4: a3*b1 a2*b2 a1*b3
        xor     ebx, ebx
        C4_MAC       ecx, ebp, ebx, 8, 8
        C4_MAC       ecx, ebp, ebx, 4, 12
        C4_MAC_STORE ecx, ebp, ebx, 16, 12, 8

        ; ---- column 5: a3*b2 a2*b3
        xor     ecx, ecx
        C4_MAC       ebp, ebx, ecx, 8, 12
        C4_MAC_STORE ebp, ebx, ecx, 20, 12, 12

        ; ---- column 6: a3*b3, plus the final carry word (column 7)
        xor     ebp, ebp
        mul     edx
        add     ebx, eax
        mov     eax, DWORD PTR 20[esp]          ; result pointer
        adc     ecx, edx
        adc     ebp, 0
        mov     DWORD PTR 24[eax], ebx          ; result word 6
        mov     DWORD PTR 28[eax], ecx          ; result word 7

        pop     ebx
        pop     ebp
        pop     edi
        pop     esi
        ret
_bn_mul_comba4 ENDP
|
|
_TEXT ENDS
|
|
_TEXT SEGMENT
|
|
PUBLIC _bn_sqr_comba8
|
|
|
|
_bn_sqr_comba8 PROC NEAR
; ---------------------------------------------------------------------
; _bn_sqr_comba8: squares the 8-word number at a (32-bit words) and
; writes the 16-word result to r, one result word ("column") at a time.
;
; Stack arguments (read after the four pushes below):
;   20[esp] -> edi = r, destination; words r[0]..r[15] are written
;   24[esp] -> esi = a, source; words a[0]..a[7] are read
; NOTE(review): presumably called as a C function taking (r, a) --
; confirm against the C prototype. The plain `ret` leaves the arguments
; on the stack for the caller to remove.
;
; Register use:
;   eax, edx      - mul operands and the 64-bit product edx:eax
;   ebx, ecx, ebp - three-word running column sum; the roles
;                   (low, mid, high) rotate by one register per column
;   esi, edi, ebp and ebx are saved on entry and restored on exit;
;   eax, ecx and edx are overwritten and not restored.
;
; Each cross product a[i]*a[j] with i != j is computed once and doubled
; (add eax,eax / adc edx,edx / adc high,0) before it is accumulated;
; the squares a[i]*a[i] are accumulated as-is.
; Operand loads for the next product sit between the add/adc
; instructions; mov does not modify the flags, so the carry chain is
; unaffected by them.
; ---------------------------------------------------------------------
|
|
; Save the registers that are restored before returning.
push esi
|
|
push edi
|
|
push ebp
|
|
push ebx
|
|
; 16 bytes of saved registers + 4 bytes of return address = offset 20.
mov edi, DWORD PTR 20[esp]
|
|
mov esi, DWORD PTR 24[esp]
|
|
; Clear the low and mid words of the first column sum.
xor ebx, ebx
|
|
xor ecx, ecx
|
|
; eax = a[0], operand for the first product.
mov eax, DWORD PTR [esi]
|
|
; ############### Calculate word 0
|
|
; r[0] column sum: ebx (low) : ecx (mid) : ebp (high); ebx and ecx were cleared above.
xor ebp, ebp
|
|
; sqr a[0]*a[0]
|
|
mul eax
|
|
add ebx, eax
|
|
adc ecx, edx
|
|
mov edx, DWORD PTR [esi]
|
|
adc ebp, 0
|
|
mov DWORD PTR [edi],ebx
|
|
mov eax, DWORD PTR 4[esi]
|
|
; saved r[0]
|
|
; ############### Calculate word 1
|
|
; r[1] column sum: ecx (low) : ebp (mid) : ebx (high); clear the new high word.
xor ebx, ebx
|
|
; sqr a[1]*a[0]
|
|
mul edx
|
|
; Double the cross product: edx:eax *= 2, the bit shifted out of edx goes to ebx.
add eax, eax
|
|
adc edx, edx
|
|
adc ebx, 0
|
|
; Add the doubled product into the column sum.
add ecx, eax
|
|
adc ebp, edx
|
|
mov eax, DWORD PTR 8[esi]
|
|
adc ebx, 0
|
|
mov DWORD PTR 4[edi],ecx
|
|
mov edx, DWORD PTR [esi]
|
|
; saved r[1]
|
|
; ############### Calculate word 2
|
|
; r[2] column sum: ebp (low) : ebx (mid) : ecx (high); clear the new high word.
xor ecx, ecx
|
|
; sqr a[2]*a[0]
|
|
mul edx
|
|
add eax, eax
|
|
adc edx, edx
|
|
adc ecx, 0
|
|
add ebp, eax
|
|
adc ebx, edx
|
|
mov eax, DWORD PTR 4[esi]
|
|
adc ecx, 0
|
|
; sqr a[1]*a[1]
|
|
; Diagonal term: added once, not doubled.
mul eax
|
|
add ebp, eax
|
|
adc ebx, edx
|
|
mov edx, DWORD PTR [esi]
|
|
adc ecx, 0
|
|
mov DWORD PTR 8[edi],ebp
|
|
mov eax, DWORD PTR 12[esi]
|
|
; saved r[2]
|
|
; ############### Calculate word 3
|
|
; r[3] column sum: ebx (low) : ecx (mid) : ebp (high); clear the new high word.
xor ebp, ebp
|
|
; sqr a[3]*a[0]
|
|
mul edx
|
|
add eax, eax
|
|
adc edx, edx
|
|
adc ebp, 0
|
|
add ebx, eax
|
|
adc ecx, edx
|
|
mov eax, DWORD PTR 8[esi]
|
|
adc ebp, 0
|
|
mov edx, DWORD PTR 4[esi]
|
|
; sqr a[2]*a[1]
|
|
mul edx
|
|
add eax, eax
|
|
adc edx, edx
|
|
adc ebp, 0
|
|
add ebx, eax
|
|
adc ecx, edx
|
|
mov eax, DWORD PTR 16[esi]
|
|
adc ebp, 0
|
|
mov DWORD PTR 12[edi],ebx
|
|
mov edx, DWORD PTR [esi]
|
|
; saved r[3]
|
|
; ############### Calculate word 4
|
|
; r[4] column sum: ecx (low) : ebp (mid) : ebx (high); clear the new high word.
xor ebx, ebx
|
|
; sqr a[4]*a[0]
|
|
mul edx
|
|
add eax, eax
|
|
adc edx, edx
|
|
adc ebx, 0
|
|
add ecx, eax
|
|
adc ebp, edx
|
|
mov eax, DWORD PTR 12[esi]
|
|
adc ebx, 0
|
|
mov edx, DWORD PTR 4[esi]
|
|
; sqr a[3]*a[1]
|
|
mul edx
|
|
add eax, eax
|
|
adc edx, edx
|
|
adc ebx, 0
|
|
add ecx, eax
|
|
adc ebp, edx
|
|
mov eax, DWORD PTR 8[esi]
|
|
adc ebx, 0
|
|
; sqr a[2]*a[2]
|
|
mul eax
|
|
add ecx, eax
|
|
adc ebp, edx
|
|
mov edx, DWORD PTR [esi]
|
|
adc ebx, 0
|
|
mov DWORD PTR 16[edi],ecx
|
|
mov eax, DWORD PTR 20[esi]
|
|
; saved r[4]
|
|
; ############### Calculate word 5
|
|
; r[5] column sum: ebp (low) : ebx (mid) : ecx (high); clear the new high word.
xor ecx, ecx
|
|
; sqr a[5]*a[0]
|
|
mul edx
|
|
add eax, eax
|
|
adc edx, edx
|
|
adc ecx, 0
|
|
add ebp, eax
|
|
adc ebx, edx
|
|
mov eax, DWORD PTR 16[esi]
|
|
adc ecx, 0
|
|
mov edx, DWORD PTR 4[esi]
|
|
; sqr a[4]*a[1]
|
|
mul edx
|
|
add eax, eax
|
|
adc edx, edx
|
|
adc ecx, 0
|
|
add ebp, eax
|
|
adc ebx, edx
|
|
mov eax, DWORD PTR 12[esi]
|
|
adc ecx, 0
|
|
mov edx, DWORD PTR 8[esi]
|
|
; sqr a[3]*a[2]
|
|
mul edx
|
|
add eax, eax
|
|
adc edx, edx
|
|
adc ecx, 0
|
|
add ebp, eax
|
|
adc ebx, edx
|
|
mov eax, DWORD PTR 24[esi]
|
|
adc ecx, 0
|
|
mov DWORD PTR 20[edi],ebp
|
|
mov edx, DWORD PTR [esi]
|
|
; saved r[5]
|
|
; ############### Calculate word 6
|
|
; r[6] column sum: ebx (low) : ecx (mid) : ebp (high); clear the new high word.
xor ebp, ebp
|
|
; sqr a[6]*a[0]
|
|
mul edx
|
|
add eax, eax
|
|
adc edx, edx
|
|
adc ebp, 0
|
|
add ebx, eax
|
|
adc ecx, edx
|
|
mov eax, DWORD PTR 20[esi]
|
|
adc ebp, 0
|
|
mov edx, DWORD PTR 4[esi]
|
|
; sqr a[5]*a[1]
|
|
mul edx
|
|
add eax, eax
|
|
adc edx, edx
|
|
adc ebp, 0
|
|
add ebx, eax
|
|
adc ecx, edx
|
|
mov eax, DWORD PTR 16[esi]
|
|
adc ebp, 0
|
|
mov edx, DWORD PTR 8[esi]
|
|
; sqr a[4]*a[2]
|
|
mul edx
|
|
add eax, eax
|
|
adc edx, edx
|
|
adc ebp, 0
|
|
add ebx, eax
|
|
adc ecx, edx
|
|
mov eax, DWORD PTR 12[esi]
|
|
adc ebp, 0
|
|
; sqr a[3]*a[3]
|
|
mul eax
|
|
add ebx, eax
|
|
adc ecx, edx
|
|
mov edx, DWORD PTR [esi]
|
|
adc ebp, 0
|
|
mov DWORD PTR 24[edi],ebx
|
|
mov eax, DWORD PTR 28[esi]
|
|
; saved r[6]
|
|
; ############### Calculate word 7
|
|
; r[7] column sum: ecx (low) : ebp (mid) : ebx (high); clear the new high word.
xor ebx, ebx
|
|
; sqr a[7]*a[0]
|
|
mul edx
|
|
add eax, eax
|
|
adc edx, edx
|
|
adc ebx, 0
|
|
add ecx, eax
|
|
adc ebp, edx
|
|
mov eax, DWORD PTR 24[esi]
|
|
adc ebx, 0
|
|
mov edx, DWORD PTR 4[esi]
|
|
; sqr a[6]*a[1]
|
|
mul edx
|
|
add eax, eax
|
|
adc edx, edx
|
|
adc ebx, 0
|
|
add ecx, eax
|
|
adc ebp, edx
|
|
mov eax, DWORD PTR 20[esi]
|
|
adc ebx, 0
|
|
mov edx, DWORD PTR 8[esi]
|
|
; sqr a[5]*a[2]
|
|
mul edx
|
|
add eax, eax
|
|
adc edx, edx
|
|
adc ebx, 0
|
|
add ecx, eax
|
|
adc ebp, edx
|
|
mov eax, DWORD PTR 16[esi]
|
|
adc ebx, 0
|
|
mov edx, DWORD PTR 12[esi]
|
|
; sqr a[4]*a[3]
|
|
mul edx
|
|
add eax, eax
|
|
adc edx, edx
|
|
adc ebx, 0
|
|
add ecx, eax
|
|
adc ebp, edx
|
|
mov eax, DWORD PTR 28[esi]
|
|
adc ebx, 0
|
|
mov DWORD PTR 28[edi],ecx
|
|
mov edx, DWORD PTR 4[esi]
|
|
; saved r[7]
|
|
; ############### Calculate word 8
|
|
; r[8] column sum: ebp (low) : ebx (mid) : ecx (high); clear the new high word.
xor ecx, ecx
|
|
; sqr a[7]*a[1]
|
|
mul edx
|
|
add eax, eax
|
|
adc edx, edx
|
|
adc ecx, 0
|
|
add ebp, eax
|
|
adc ebx, edx
|
|
mov eax, DWORD PTR 24[esi]
|
|
adc ecx, 0
|
|
mov edx, DWORD PTR 8[esi]
|
|
; sqr a[6]*a[2]
|
|
mul edx
|
|
add eax, eax
|
|
adc edx, edx
|
|
adc ecx, 0
|
|
add ebp, eax
|
|
adc ebx, edx
|
|
mov eax, DWORD PTR 20[esi]
|
|
adc ecx, 0
|
|
mov edx, DWORD PTR 12[esi]
|
|
; sqr a[5]*a[3]
|
|
mul edx
|
|
add eax, eax
|
|
adc edx, edx
|
|
adc ecx, 0
|
|
add ebp, eax
|
|
adc ebx, edx
|
|
mov eax, DWORD PTR 16[esi]
|
|
adc ecx, 0
|
|
; sqr a[4]*a[4]
|
|
mul eax
|
|
add ebp, eax
|
|
adc ebx, edx
|
|
mov edx, DWORD PTR 8[esi]
|
|
adc ecx, 0
|
|
mov DWORD PTR 32[edi],ebp
|
|
mov eax, DWORD PTR 28[esi]
|
|
; saved r[8]
|
|
; ############### Calculate word 9
|
|
; r[9] column sum: ebx (low) : ecx (mid) : ebp (high); clear the new high word.
xor ebp, ebp
|
|
; sqr a[7]*a[2]
|
|
mul edx
|
|
add eax, eax
|
|
adc edx, edx
|
|
adc ebp, 0
|
|
add ebx, eax
|
|
adc ecx, edx
|
|
mov eax, DWORD PTR 24[esi]
|
|
adc ebp, 0
|
|
mov edx, DWORD PTR 12[esi]
|
|
; sqr a[6]*a[3]
|
|
mul edx
|
|
add eax, eax
|
|
adc edx, edx
|
|
adc ebp, 0
|
|
add ebx, eax
|
|
adc ecx, edx
|
|
mov eax, DWORD PTR 20[esi]
|
|
adc ebp, 0
|
|
mov edx, DWORD PTR 16[esi]
|
|
; sqr a[5]*a[4]
|
|
mul edx
|
|
add eax, eax
|
|
adc edx, edx
|
|
adc ebp, 0
|
|
add ebx, eax
|
|
adc ecx, edx
|
|
mov eax, DWORD PTR 28[esi]
|
|
adc ebp, 0
|
|
mov DWORD PTR 36[edi],ebx
|
|
mov edx, DWORD PTR 12[esi]
|
|
; saved r[9]
|
|
; ############### Calculate word 10
|
|
; r[10] column sum: ecx (low) : ebp (mid) : ebx (high); clear the new high word.
xor ebx, ebx
|
|
; sqr a[7]*a[3]
|
|
mul edx
|
|
add eax, eax
|
|
adc edx, edx
|
|
adc ebx, 0
|
|
add ecx, eax
|
|
adc ebp, edx
|
|
mov eax, DWORD PTR 24[esi]
|
|
adc ebx, 0
|
|
mov edx, DWORD PTR 16[esi]
|
|
; sqr a[6]*a[4]
|
|
mul edx
|
|
add eax, eax
|
|
adc edx, edx
|
|
adc ebx, 0
|
|
add ecx, eax
|
|
adc ebp, edx
|
|
mov eax, DWORD PTR 20[esi]
|
|
adc ebx, 0
|
|
; sqr a[5]*a[5]
|
|
mul eax
|
|
add ecx, eax
|
|
adc ebp, edx
|
|
mov edx, DWORD PTR 16[esi]
|
|
adc ebx, 0
|
|
mov DWORD PTR 40[edi],ecx
|
|
mov eax, DWORD PTR 28[esi]
|
|
; saved r[10]
|
|
; ############### Calculate word 11
|
|
; r[11] column sum: ebp (low) : ebx (mid) : ecx (high); clear the new high word.
xor ecx, ecx
|
|
; sqr a[7]*a[4]
|
|
mul edx
|
|
add eax, eax
|
|
adc edx, edx
|
|
adc ecx, 0
|
|
add ebp, eax
|
|
adc ebx, edx
|
|
mov eax, DWORD PTR 24[esi]
|
|
adc ecx, 0
|
|
mov edx, DWORD PTR 20[esi]
|
|
; sqr a[6]*a[5]
|
|
mul edx
|
|
add eax, eax
|
|
adc edx, edx
|
|
adc ecx, 0
|
|
add ebp, eax
|
|
adc ebx, edx
|
|
mov eax, DWORD PTR 28[esi]
|
|
adc ecx, 0
|
|
mov DWORD PTR 44[edi],ebp
|
|
mov edx, DWORD PTR 20[esi]
|
|
; saved r[11]
|
|
; ############### Calculate word 12
|
|
; r[12] column sum: ebx (low) : ecx (mid) : ebp (high); clear the new high word.
xor ebp, ebp
|
|
; sqr a[7]*a[5]
|
|
mul edx
|
|
add eax, eax
|
|
adc edx, edx
|
|
adc ebp, 0
|
|
add ebx, eax
|
|
adc ecx, edx
|
|
mov eax, DWORD PTR 24[esi]
|
|
adc ebp, 0
|
|
; sqr a[6]*a[6]
|
|
mul eax
|
|
add ebx, eax
|
|
adc ecx, edx
|
|
mov edx, DWORD PTR 24[esi]
|
|
adc ebp, 0
|
|
mov DWORD PTR 48[edi],ebx
|
|
mov eax, DWORD PTR 28[esi]
|
|
; saved r[12]
|
|
; ############### Calculate word 13
|
|
; r[13] column sum: ecx (low) : ebp (mid) : ebx (high); clear the new high word.
xor ebx, ebx
|
|
; sqr a[7]*a[6]
|
|
mul edx
|
|
add eax, eax
|
|
adc edx, edx
|
|
adc ebx, 0
|
|
add ecx, eax
|
|
adc ebp, edx
|
|
mov eax, DWORD PTR 28[esi]
|
|
adc ebx, 0
|
|
mov DWORD PTR 52[edi],ecx
|
|
; saved r[13]
|
|
; ############### Calculate word 14
|
|
; r[14] column sum: ebp (low) : ebx (mid) : ecx (high); clear the new high word.
xor ecx, ecx
|
|
; sqr a[7]*a[7]
|
|
mul eax
|
|
add ebp, eax
|
|
adc ebx, edx
|
|
adc ecx, 0
|
|
mov DWORD PTR 56[edi],ebp
|
|
; saved r[14]
|
|
; save r[15]: the remaining mid word is the top word of the result.
; The carry collected in ecx above is not stored anywhere; the square of
; an 8-word value fits in 16 words, so it is expected to be 0.
mov DWORD PTR 60[edi],ebx
|
|
; Restore the saved registers in reverse push order.
pop ebx
|
|
pop ebp
|
|
pop edi
|
|
pop esi
|
|
ret
|
|
_bn_sqr_comba8 ENDP
|
|
_TEXT ENDS
|
|
_TEXT SEGMENT
|
|
PUBLIC _bn_sqr_comba4
|
|
|
|
_bn_sqr_comba4 PROC NEAR
; ---------------------------------------------------------------------
; _bn_sqr_comba4: squares the 4-word number at a (32-bit words) and
; writes the 8-word result to r, one result word ("column") at a time.
;
; Stack arguments (read after the four pushes below):
;   20[esp] -> edi = r, destination; words r[0]..r[7] are written
;   24[esp] -> esi = a, source; words a[0]..a[3] are read
; NOTE(review): presumably called as a C function taking (r, a) --
; confirm against the C prototype. The plain `ret` leaves the arguments
; on the stack for the caller to remove.
;
; Register use:
;   eax, edx      - mul operands and the 64-bit product edx:eax
;   ebx, ecx, ebp - three-word running column sum; the roles
;                   (low, mid, high) rotate by one register per column
;   esi, edi, ebp and ebx are saved on entry and restored on exit;
;   eax, ecx and edx are overwritten and not restored.
;
; Each cross product a[i]*a[j] with i != j is computed once and doubled
; (add eax,eax / adc edx,edx / adc high,0) before it is accumulated;
; the squares a[i]*a[i] are accumulated as-is.
; Operand loads for the next product sit between the add/adc
; instructions; mov does not modify the flags, so the carry chain is
; unaffected by them.
; ---------------------------------------------------------------------
|
|
; Save the registers that are restored before returning.
push esi
|
|
push edi
|
|
push ebp
|
|
push ebx
|
|
; 16 bytes of saved registers + 4 bytes of return address = offset 20.
mov edi, DWORD PTR 20[esp]
|
|
mov esi, DWORD PTR 24[esp]
|
|
; Clear the low and mid words of the first column sum.
xor ebx, ebx
|
|
xor ecx, ecx
|
|
; eax = a[0], operand for the first product.
mov eax, DWORD PTR [esi]
|
|
; ############### Calculate word 0
|
|
; r[0] column sum: ebx (low) : ecx (mid) : ebp (high); ebx and ecx were cleared above.
xor ebp, ebp
|
|
; sqr a[0]*a[0]
|
|
mul eax
|
|
add ebx, eax
|
|
adc ecx, edx
|
|
mov edx, DWORD PTR [esi]
|
|
adc ebp, 0
|
|
mov DWORD PTR [edi],ebx
|
|
mov eax, DWORD PTR 4[esi]
|
|
; saved r[0]
|
|
; ############### Calculate word 1
|
|
; r[1] column sum: ecx (low) : ebp (mid) : ebx (high); clear the new high word.
xor ebx, ebx
|
|
; sqr a[1]*a[0]
|
|
mul edx
|
|
; Double the cross product: edx:eax *= 2, the bit shifted out of edx goes to ebx.
add eax, eax
|
|
adc edx, edx
|
|
adc ebx, 0
|
|
; Add the doubled product into the column sum.
add ecx, eax
|
|
adc ebp, edx
|
|
mov eax, DWORD PTR 8[esi]
|
|
adc ebx, 0
|
|
mov DWORD PTR 4[edi],ecx
|
|
mov edx, DWORD PTR [esi]
|
|
; saved r[1]
|
|
; ############### Calculate word 2
|
|
; r[2] column sum: ebp (low) : ebx (mid) : ecx (high); clear the new high word.
xor ecx, ecx
|
|
; sqr a[2]*a[0]
|
|
mul edx
|
|
add eax, eax
|
|
adc edx, edx
|
|
adc ecx, 0
|
|
add ebp, eax
|
|
adc ebx, edx
|
|
mov eax, DWORD PTR 4[esi]
|
|
adc ecx, 0
|
|
; sqr a[1]*a[1]
|
|
; Diagonal term: added once, not doubled.
mul eax
|
|
add ebp, eax
|
|
adc ebx, edx
|
|
mov edx, DWORD PTR [esi]
|
|
adc ecx, 0
|
|
mov DWORD PTR 8[edi],ebp
|
|
mov eax, DWORD PTR 12[esi]
|
|
; saved r[2]
|
|
; ############### Calculate word 3
|
|
; r[3] column sum: ebx (low) : ecx (mid) : ebp (high); clear the new high word.
xor ebp, ebp
|
|
; sqr a[3]*a[0]
|
|
mul edx
|
|
add eax, eax
|
|
adc edx, edx
|
|
adc ebp, 0
|
|
add ebx, eax
|
|
adc ecx, edx
|
|
mov eax, DWORD PTR 8[esi]
|
|
adc ebp, 0
|
|
mov edx, DWORD PTR 4[esi]
|
|
; sqr a[2]*a[1]
|
|
mul edx
|
|
add eax, eax
|
|
adc edx, edx
|
|
adc ebp, 0
|
|
add ebx, eax
|
|
adc ecx, edx
|
|
mov eax, DWORD PTR 12[esi]
|
|
adc ebp, 0
|
|
mov DWORD PTR 12[edi],ebx
|
|
mov edx, DWORD PTR 4[esi]
|
|
; saved r[3]
|
|
; ############### Calculate word 4
|
|
; r[4] column sum: ecx (low) : ebp (mid) : ebx (high); clear the new high word.
xor ebx, ebx
|
|
; sqr a[3]*a[1]
|
|
mul edx
|
|
add eax, eax
|
|
adc edx, edx
|
|
adc ebx, 0
|
|
add ecx, eax
|
|
adc ebp, edx
|
|
mov eax, DWORD PTR 8[esi]
|
|
adc ebx, 0
|
|
; sqr a[2]*a[2]
|
|
mul eax
|
|
add ecx, eax
|
|
adc ebp, edx
|
|
mov edx, DWORD PTR 8[esi]
|
|
adc ebx, 0
|
|
mov DWORD PTR 16[edi],ecx
|
|
mov eax, DWORD PTR 12[esi]
|
|
; saved r[4]
|
|
; ############### Calculate word 5
|
|
; r[5] column sum: ebp (low) : ebx (mid) : ecx (high); clear the new high word.
xor ecx, ecx
|
|
; sqr a[3]*a[2]
|
|
mul edx
|
|
add eax, eax
|
|
adc edx, edx
|
|
adc ecx, 0
|
|
add ebp, eax
|
|
adc ebx, edx
|
|
mov eax, DWORD PTR 12[esi]
|
|
adc ecx, 0
|
|
mov DWORD PTR 20[edi],ebp
|
|
; saved r[5]
|
|
; ############### Calculate word 6
|
|
; r[6] column sum: ebx (low) : ecx (mid) : ebp (high); clear the new high word.
xor ebp, ebp
|
|
; sqr a[3]*a[3]
|
|
mul eax
|
|
add ebx, eax
|
|
adc ecx, edx
|
|
adc ebp, 0
|
|
mov DWORD PTR 24[edi],ebx
|
|
; saved r[6]
|
|
; save r[7]: the remaining mid word is the top word of the result.
; The carry collected in ebp above is not stored anywhere; the square of
; a 4-word value fits in 8 words, so it is expected to be 0.
mov DWORD PTR 28[edi],ecx
|
|
; Restore the saved registers in reverse push order.
pop ebx
|
|
pop ebp
|
|
pop edi
|
|
pop esi
|
|
ret
|
|
_bn_sqr_comba4 ENDP
|
|
_TEXT ENDS
|
|
END
|