summaryrefslogtreecommitdiffstats
path: root/third_party/boringssl/win-x86_64
diff options
context:
space:
mode:
Diffstat (limited to 'third_party/boringssl/win-x86_64')
-rw-r--r--third_party/boringssl/win-x86_64/crypto/bn/modexp512-x86_64.asm1885
1 files changed, 0 insertions, 1885 deletions
diff --git a/third_party/boringssl/win-x86_64/crypto/bn/modexp512-x86_64.asm b/third_party/boringssl/win-x86_64/crypto/bn/modexp512-x86_64.asm
deleted file mode 100644
index f3b306e..0000000
--- a/third_party/boringssl/win-x86_64/crypto/bn/modexp512-x86_64.asm
+++ /dev/null
@@ -1,1885 +0,0 @@
-default rel
-%define XMMWORD
-%define YMMWORD
-%define ZMMWORD
-section .text code align=64
-
-
-
-ALIGN 16
-MULADD_128x512:
- mov rax,QWORD[rsi]
- mul rbp
- add r8,rax
- adc rdx,0
- mov QWORD[rcx],r8
- mov rbx,rdx
-
- mov rax,QWORD[8+rsi]
- mul rbp
- add r9,rax
- adc rdx,0
- add r9,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[16+rsi]
- mul rbp
- add r10,rax
- adc rdx,0
- add r10,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[24+rsi]
- mul rbp
- add r11,rax
- adc rdx,0
- add r11,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[32+rsi]
- mul rbp
- add r12,rax
- adc rdx,0
- add r12,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[40+rsi]
- mul rbp
- add r13,rax
- adc rdx,0
- add r13,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[48+rsi]
- mul rbp
- add r14,rax
- adc rdx,0
- add r14,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[56+rsi]
- mul rbp
- add r15,rax
- adc rdx,0
- add r15,rbx
- adc rdx,0
- mov r8,rdx
- mov rbp,QWORD[8+rdi]
- mov rax,QWORD[rsi]
- mul rbp
- add r9,rax
- adc rdx,0
- mov QWORD[8+rcx],r9
- mov rbx,rdx
-
- mov rax,QWORD[8+rsi]
- mul rbp
- add r10,rax
- adc rdx,0
- add r10,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[16+rsi]
- mul rbp
- add r11,rax
- adc rdx,0
- add r11,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[24+rsi]
- mul rbp
- add r12,rax
- adc rdx,0
- add r12,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[32+rsi]
- mul rbp
- add r13,rax
- adc rdx,0
- add r13,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[40+rsi]
- mul rbp
- add r14,rax
- adc rdx,0
- add r14,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[48+rsi]
- mul rbp
- add r15,rax
- adc rdx,0
- add r15,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[56+rsi]
- mul rbp
- add r8,rax
- adc rdx,0
- add r8,rbx
- adc rdx,0
- mov r9,rdx
- DB 0F3h,0C3h ;repret
-
-
-ALIGN 16
-mont_reduce:
- lea rdi,[192+rsp]
- mov rsi,QWORD[32+rsp]
- add rsi,576
- lea rcx,[520+rsp]
-
- mov rbp,QWORD[96+rcx]
- mov rax,QWORD[rsi]
- mul rbp
- mov r8,QWORD[rcx]
- add r8,rax
- adc rdx,0
- mov QWORD[rdi],r8
- mov rbx,rdx
-
- mov rax,QWORD[8+rsi]
- mul rbp
- mov r9,QWORD[8+rcx]
- add r9,rax
- adc rdx,0
- add r9,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[16+rsi]
- mul rbp
- mov r10,QWORD[16+rcx]
- add r10,rax
- adc rdx,0
- add r10,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[24+rsi]
- mul rbp
- mov r11,QWORD[24+rcx]
- add r11,rax
- adc rdx,0
- add r11,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[32+rsi]
- mul rbp
- mov r12,QWORD[32+rcx]
- add r12,rax
- adc rdx,0
- add r12,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[40+rsi]
- mul rbp
- mov r13,QWORD[40+rcx]
- add r13,rax
- adc rdx,0
- add r13,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[48+rsi]
- mul rbp
- mov r14,QWORD[48+rcx]
- add r14,rax
- adc rdx,0
- add r14,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[56+rsi]
- mul rbp
- mov r15,QWORD[56+rcx]
- add r15,rax
- adc rdx,0
- add r15,rbx
- adc rdx,0
- mov r8,rdx
- mov rbp,QWORD[104+rcx]
- mov rax,QWORD[rsi]
- mul rbp
- add r9,rax
- adc rdx,0
- mov QWORD[8+rdi],r9
- mov rbx,rdx
-
- mov rax,QWORD[8+rsi]
- mul rbp
- add r10,rax
- adc rdx,0
- add r10,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[16+rsi]
- mul rbp
- add r11,rax
- adc rdx,0
- add r11,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[24+rsi]
- mul rbp
- add r12,rax
- adc rdx,0
- add r12,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[32+rsi]
- mul rbp
- add r13,rax
- adc rdx,0
- add r13,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[40+rsi]
- mul rbp
- add r14,rax
- adc rdx,0
- add r14,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[48+rsi]
- mul rbp
- add r15,rax
- adc rdx,0
- add r15,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[56+rsi]
- mul rbp
- add r8,rax
- adc rdx,0
- add r8,rbx
- adc rdx,0
- mov r9,rdx
- mov rbp,QWORD[112+rcx]
- mov rax,QWORD[rsi]
- mul rbp
- add r10,rax
- adc rdx,0
- mov QWORD[16+rdi],r10
- mov rbx,rdx
-
- mov rax,QWORD[8+rsi]
- mul rbp
- add r11,rax
- adc rdx,0
- add r11,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[16+rsi]
- mul rbp
- add r12,rax
- adc rdx,0
- add r12,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[24+rsi]
- mul rbp
- add r13,rax
- adc rdx,0
- add r13,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[32+rsi]
- mul rbp
- add r14,rax
- adc rdx,0
- add r14,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[40+rsi]
- mul rbp
- add r15,rax
- adc rdx,0
- add r15,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[48+rsi]
- mul rbp
- add r8,rax
- adc rdx,0
- add r8,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[56+rsi]
- mul rbp
- add r9,rax
- adc rdx,0
- add r9,rbx
- adc rdx,0
- mov r10,rdx
- mov rbp,QWORD[120+rcx]
- mov rax,QWORD[rsi]
- mul rbp
- add r11,rax
- adc rdx,0
- mov QWORD[24+rdi],r11
- mov rbx,rdx
-
- mov rax,QWORD[8+rsi]
- mul rbp
- add r12,rax
- adc rdx,0
- add r12,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[16+rsi]
- mul rbp
- add r13,rax
- adc rdx,0
- add r13,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[24+rsi]
- mul rbp
- add r14,rax
- adc rdx,0
- add r14,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[32+rsi]
- mul rbp
- add r15,rax
- adc rdx,0
- add r15,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[40+rsi]
- mul rbp
- add r8,rax
- adc rdx,0
- add r8,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[48+rsi]
- mul rbp
- add r9,rax
- adc rdx,0
- add r9,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[56+rsi]
- mul rbp
- add r10,rax
- adc rdx,0
- add r10,rbx
- adc rdx,0
- mov r11,rdx
- xor rax,rax
-
- add r8,QWORD[64+rcx]
- adc r9,QWORD[72+rcx]
- adc r10,QWORD[80+rcx]
- adc r11,QWORD[88+rcx]
- adc rax,0
-
-
-
-
- mov QWORD[64+rdi],r8
- mov QWORD[72+rdi],r9
- mov rbp,r10
- mov QWORD[88+rdi],r11
-
- mov QWORD[384+rsp],rax
-
- mov r8,QWORD[rdi]
- mov r9,QWORD[8+rdi]
- mov r10,QWORD[16+rdi]
- mov r11,QWORD[24+rdi]
-
-
-
-
-
-
-
-
- add rdi,8*10
-
- add rsi,64
- lea rcx,[296+rsp]
-
- call MULADD_128x512
-
- mov rax,QWORD[384+rsp]
-
-
- add r8,QWORD[((-16))+rdi]
- adc r9,QWORD[((-8))+rdi]
- mov QWORD[64+rcx],r8
- mov QWORD[72+rcx],r9
-
- adc rax,rax
- mov QWORD[384+rsp],rax
-
- lea rdi,[192+rsp]
- add rsi,64
-
-
-
-
-
- mov r8,QWORD[rsi]
- mov rbx,QWORD[8+rsi]
-
- mov rax,QWORD[rcx]
- mul r8
- mov rbp,rax
- mov r9,rdx
-
- mov rax,QWORD[8+rcx]
- mul r8
- add r9,rax
-
- mov rax,QWORD[rcx]
- mul rbx
- add r9,rax
-
- mov QWORD[8+rdi],r9
-
-
- sub rsi,192
-
- mov r8,QWORD[rcx]
- mov r9,QWORD[8+rcx]
-
- call MULADD_128x512
-
-
-
-
- mov rax,QWORD[rsi]
- mov rbx,QWORD[8+rsi]
- mov rdi,QWORD[16+rsi]
- mov rdx,QWORD[24+rsi]
-
-
- mov rbp,QWORD[384+rsp]
-
- add r8,QWORD[64+rcx]
- adc r9,QWORD[72+rcx]
-
-
- adc rbp,rbp
-
-
-
- shl rbp,3
- mov rcx,QWORD[32+rsp]
- add rbp,rcx
-
-
- xor rsi,rsi
-
- add r10,QWORD[rbp]
- adc r11,QWORD[64+rbp]
- adc r12,QWORD[128+rbp]
- adc r13,QWORD[192+rbp]
- adc r14,QWORD[256+rbp]
- adc r15,QWORD[320+rbp]
- adc r8,QWORD[384+rbp]
- adc r9,QWORD[448+rbp]
-
-
-
- sbb rsi,0
-
-
- and rax,rsi
- and rbx,rsi
- and rdi,rsi
- and rdx,rsi
-
- mov rbp,1
- sub r10,rax
- sbb r11,rbx
- sbb r12,rdi
- sbb r13,rdx
-
-
-
-
- sbb rbp,0
-
-
-
- add rcx,512
- mov rax,QWORD[32+rcx]
- mov rbx,QWORD[40+rcx]
- mov rdi,QWORD[48+rcx]
- mov rdx,QWORD[56+rcx]
-
-
-
- and rax,rsi
- and rbx,rsi
- and rdi,rsi
- and rdx,rsi
-
-
-
- sub rbp,1
-
- sbb r14,rax
- sbb r15,rbx
- sbb r8,rdi
- sbb r9,rdx
-
-
-
- mov rsi,QWORD[144+rsp]
- mov QWORD[rsi],r10
- mov QWORD[8+rsi],r11
- mov QWORD[16+rsi],r12
- mov QWORD[24+rsi],r13
- mov QWORD[32+rsi],r14
- mov QWORD[40+rsi],r15
- mov QWORD[48+rsi],r8
- mov QWORD[56+rsi],r9
-
- DB 0F3h,0C3h ;repret
-
-
-ALIGN 16
-mont_mul_a3b:
-
-
-
-
- mov rbp,QWORD[rdi]
-
- mov rax,r10
- mul rbp
- mov QWORD[520+rsp],rax
- mov r10,rdx
- mov rax,r11
- mul rbp
- add r10,rax
- adc rdx,0
- mov r11,rdx
- mov rax,r12
- mul rbp
- add r11,rax
- adc rdx,0
- mov r12,rdx
- mov rax,r13
- mul rbp
- add r12,rax
- adc rdx,0
- mov r13,rdx
- mov rax,r14
- mul rbp
- add r13,rax
- adc rdx,0
- mov r14,rdx
- mov rax,r15
- mul rbp
- add r14,rax
- adc rdx,0
- mov r15,rdx
- mov rax,r8
- mul rbp
- add r15,rax
- adc rdx,0
- mov r8,rdx
- mov rax,r9
- mul rbp
- add r8,rax
- adc rdx,0
- mov r9,rdx
- mov rbp,QWORD[8+rdi]
- mov rax,QWORD[rsi]
- mul rbp
- add r10,rax
- adc rdx,0
- mov QWORD[528+rsp],r10
- mov rbx,rdx
-
- mov rax,QWORD[8+rsi]
- mul rbp
- add r11,rax
- adc rdx,0
- add r11,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[16+rsi]
- mul rbp
- add r12,rax
- adc rdx,0
- add r12,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[24+rsi]
- mul rbp
- add r13,rax
- adc rdx,0
- add r13,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[32+rsi]
- mul rbp
- add r14,rax
- adc rdx,0
- add r14,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[40+rsi]
- mul rbp
- add r15,rax
- adc rdx,0
- add r15,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[48+rsi]
- mul rbp
- add r8,rax
- adc rdx,0
- add r8,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[56+rsi]
- mul rbp
- add r9,rax
- adc rdx,0
- add r9,rbx
- adc rdx,0
- mov r10,rdx
- mov rbp,QWORD[16+rdi]
- mov rax,QWORD[rsi]
- mul rbp
- add r11,rax
- adc rdx,0
- mov QWORD[536+rsp],r11
- mov rbx,rdx
-
- mov rax,QWORD[8+rsi]
- mul rbp
- add r12,rax
- adc rdx,0
- add r12,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[16+rsi]
- mul rbp
- add r13,rax
- adc rdx,0
- add r13,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[24+rsi]
- mul rbp
- add r14,rax
- adc rdx,0
- add r14,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[32+rsi]
- mul rbp
- add r15,rax
- adc rdx,0
- add r15,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[40+rsi]
- mul rbp
- add r8,rax
- adc rdx,0
- add r8,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[48+rsi]
- mul rbp
- add r9,rax
- adc rdx,0
- add r9,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[56+rsi]
- mul rbp
- add r10,rax
- adc rdx,0
- add r10,rbx
- adc rdx,0
- mov r11,rdx
- mov rbp,QWORD[24+rdi]
- mov rax,QWORD[rsi]
- mul rbp
- add r12,rax
- adc rdx,0
- mov QWORD[544+rsp],r12
- mov rbx,rdx
-
- mov rax,QWORD[8+rsi]
- mul rbp
- add r13,rax
- adc rdx,0
- add r13,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[16+rsi]
- mul rbp
- add r14,rax
- adc rdx,0
- add r14,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[24+rsi]
- mul rbp
- add r15,rax
- adc rdx,0
- add r15,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[32+rsi]
- mul rbp
- add r8,rax
- adc rdx,0
- add r8,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[40+rsi]
- mul rbp
- add r9,rax
- adc rdx,0
- add r9,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[48+rsi]
- mul rbp
- add r10,rax
- adc rdx,0
- add r10,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[56+rsi]
- mul rbp
- add r11,rax
- adc rdx,0
- add r11,rbx
- adc rdx,0
- mov r12,rdx
- mov rbp,QWORD[32+rdi]
- mov rax,QWORD[rsi]
- mul rbp
- add r13,rax
- adc rdx,0
- mov QWORD[552+rsp],r13
- mov rbx,rdx
-
- mov rax,QWORD[8+rsi]
- mul rbp
- add r14,rax
- adc rdx,0
- add r14,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[16+rsi]
- mul rbp
- add r15,rax
- adc rdx,0
- add r15,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[24+rsi]
- mul rbp
- add r8,rax
- adc rdx,0
- add r8,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[32+rsi]
- mul rbp
- add r9,rax
- adc rdx,0
- add r9,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[40+rsi]
- mul rbp
- add r10,rax
- adc rdx,0
- add r10,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[48+rsi]
- mul rbp
- add r11,rax
- adc rdx,0
- add r11,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[56+rsi]
- mul rbp
- add r12,rax
- adc rdx,0
- add r12,rbx
- adc rdx,0
- mov r13,rdx
- mov rbp,QWORD[40+rdi]
- mov rax,QWORD[rsi]
- mul rbp
- add r14,rax
- adc rdx,0
- mov QWORD[560+rsp],r14
- mov rbx,rdx
-
- mov rax,QWORD[8+rsi]
- mul rbp
- add r15,rax
- adc rdx,0
- add r15,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[16+rsi]
- mul rbp
- add r8,rax
- adc rdx,0
- add r8,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[24+rsi]
- mul rbp
- add r9,rax
- adc rdx,0
- add r9,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[32+rsi]
- mul rbp
- add r10,rax
- adc rdx,0
- add r10,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[40+rsi]
- mul rbp
- add r11,rax
- adc rdx,0
- add r11,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[48+rsi]
- mul rbp
- add r12,rax
- adc rdx,0
- add r12,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[56+rsi]
- mul rbp
- add r13,rax
- adc rdx,0
- add r13,rbx
- adc rdx,0
- mov r14,rdx
- mov rbp,QWORD[48+rdi]
- mov rax,QWORD[rsi]
- mul rbp
- add r15,rax
- adc rdx,0
- mov QWORD[568+rsp],r15
- mov rbx,rdx
-
- mov rax,QWORD[8+rsi]
- mul rbp
- add r8,rax
- adc rdx,0
- add r8,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[16+rsi]
- mul rbp
- add r9,rax
- adc rdx,0
- add r9,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[24+rsi]
- mul rbp
- add r10,rax
- adc rdx,0
- add r10,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[32+rsi]
- mul rbp
- add r11,rax
- adc rdx,0
- add r11,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[40+rsi]
- mul rbp
- add r12,rax
- adc rdx,0
- add r12,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[48+rsi]
- mul rbp
- add r13,rax
- adc rdx,0
- add r13,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[56+rsi]
- mul rbp
- add r14,rax
- adc rdx,0
- add r14,rbx
- adc rdx,0
- mov r15,rdx
- mov rbp,QWORD[56+rdi]
- mov rax,QWORD[rsi]
- mul rbp
- add r8,rax
- adc rdx,0
- mov QWORD[576+rsp],r8
- mov rbx,rdx
-
- mov rax,QWORD[8+rsi]
- mul rbp
- add r9,rax
- adc rdx,0
- add r9,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[16+rsi]
- mul rbp
- add r10,rax
- adc rdx,0
- add r10,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[24+rsi]
- mul rbp
- add r11,rax
- adc rdx,0
- add r11,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[32+rsi]
- mul rbp
- add r12,rax
- adc rdx,0
- add r12,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[40+rsi]
- mul rbp
- add r13,rax
- adc rdx,0
- add r13,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[48+rsi]
- mul rbp
- add r14,rax
- adc rdx,0
- add r14,rbx
- adc rdx,0
- mov rbx,rdx
-
- mov rax,QWORD[56+rsi]
- mul rbp
- add r15,rax
- adc rdx,0
- add r15,rbx
- adc rdx,0
- mov r8,rdx
- mov QWORD[584+rsp],r9
- mov QWORD[592+rsp],r10
- mov QWORD[600+rsp],r11
- mov QWORD[608+rsp],r12
- mov QWORD[616+rsp],r13
- mov QWORD[624+rsp],r14
- mov QWORD[632+rsp],r15
- mov QWORD[640+rsp],r8
-
-
-
-
-
- jmp NEAR mont_reduce
-
-
-
-
-ALIGN 16
-sqr_reduce:
- mov rcx,QWORD[16+rsp]
-
-
-
- mov rbx,r10
-
- mov rax,r11
- mul rbx
- mov QWORD[528+rsp],rax
- mov r10,rdx
- mov rax,r12
- mul rbx
- add r10,rax
- adc rdx,0
- mov r11,rdx
- mov rax,r13
- mul rbx
- add r11,rax
- adc rdx,0
- mov r12,rdx
- mov rax,r14
- mul rbx
- add r12,rax
- adc rdx,0
- mov r13,rdx
- mov rax,r15
- mul rbx
- add r13,rax
- adc rdx,0
- mov r14,rdx
- mov rax,r8
- mul rbx
- add r14,rax
- adc rdx,0
- mov r15,rdx
- mov rax,r9
- mul rbx
- add r15,rax
- adc rdx,0
- mov rsi,rdx
-
- mov QWORD[536+rsp],r10
-
-
-
-
-
- mov rbx,QWORD[8+rcx]
-
- mov rax,QWORD[16+rcx]
- mul rbx
- add r11,rax
- adc rdx,0
- mov QWORD[544+rsp],r11
-
- mov r10,rdx
- mov rax,QWORD[24+rcx]
- mul rbx
- add r12,rax
- adc rdx,0
- add r12,r10
- adc rdx,0
- mov QWORD[552+rsp],r12
-
- mov r10,rdx
- mov rax,QWORD[32+rcx]
- mul rbx
- add r13,rax
- adc rdx,0
- add r13,r10
- adc rdx,0
-
- mov r10,rdx
- mov rax,QWORD[40+rcx]
- mul rbx
- add r14,rax
- adc rdx,0
- add r14,r10
- adc rdx,0
-
- mov r10,rdx
- mov rax,r8
- mul rbx
- add r15,rax
- adc rdx,0
- add r15,r10
- adc rdx,0
-
- mov r10,rdx
- mov rax,r9
- mul rbx
- add rsi,rax
- adc rdx,0
- add rsi,r10
- adc rdx,0
-
- mov r11,rdx
-
-
-
-
- mov rbx,QWORD[16+rcx]
-
- mov rax,QWORD[24+rcx]
- mul rbx
- add r13,rax
- adc rdx,0
- mov QWORD[560+rsp],r13
-
- mov r10,rdx
- mov rax,QWORD[32+rcx]
- mul rbx
- add r14,rax
- adc rdx,0
- add r14,r10
- adc rdx,0
- mov QWORD[568+rsp],r14
-
- mov r10,rdx
- mov rax,QWORD[40+rcx]
- mul rbx
- add r15,rax
- adc rdx,0
- add r15,r10
- adc rdx,0
-
- mov r10,rdx
- mov rax,r8
- mul rbx
- add rsi,rax
- adc rdx,0
- add rsi,r10
- adc rdx,0
-
- mov r10,rdx
- mov rax,r9
- mul rbx
- add r11,rax
- adc rdx,0
- add r11,r10
- adc rdx,0
-
- mov r12,rdx
-
-
-
-
-
- mov rbx,QWORD[24+rcx]
-
- mov rax,QWORD[32+rcx]
- mul rbx
- add r15,rax
- adc rdx,0
- mov QWORD[576+rsp],r15
-
- mov r10,rdx
- mov rax,QWORD[40+rcx]
- mul rbx
- add rsi,rax
- adc rdx,0
- add rsi,r10
- adc rdx,0
- mov QWORD[584+rsp],rsi
-
- mov r10,rdx
- mov rax,r8
- mul rbx
- add r11,rax
- adc rdx,0
- add r11,r10
- adc rdx,0
-
- mov r10,rdx
- mov rax,r9
- mul rbx
- add r12,rax
- adc rdx,0
- add r12,r10
- adc rdx,0
-
- mov r15,rdx
-
-
-
-
- mov rbx,QWORD[32+rcx]
-
- mov rax,QWORD[40+rcx]
- mul rbx
- add r11,rax
- adc rdx,0
- mov QWORD[592+rsp],r11
-
- mov r10,rdx
- mov rax,r8
- mul rbx
- add r12,rax
- adc rdx,0
- add r12,r10
- adc rdx,0
- mov QWORD[600+rsp],r12
-
- mov r10,rdx
- mov rax,r9
- mul rbx
- add r15,rax
- adc rdx,0
- add r15,r10
- adc rdx,0
-
- mov r11,rdx
-
-
-
-
- mov rbx,QWORD[40+rcx]
-
- mov rax,r8
- mul rbx
- add r15,rax
- adc rdx,0
- mov QWORD[608+rsp],r15
-
- mov r10,rdx
- mov rax,r9
- mul rbx
- add r11,rax
- adc rdx,0
- add r11,r10
- adc rdx,0
- mov QWORD[616+rsp],r11
-
- mov r12,rdx
-
-
-
-
- mov rbx,r8
-
- mov rax,r9
- mul rbx
- add r12,rax
- adc rdx,0
- mov QWORD[624+rsp],r12
-
- mov QWORD[632+rsp],rdx
-
-
- mov r10,QWORD[528+rsp]
- mov r11,QWORD[536+rsp]
- mov r12,QWORD[544+rsp]
- mov r13,QWORD[552+rsp]
- mov r14,QWORD[560+rsp]
- mov r15,QWORD[568+rsp]
-
- mov rax,QWORD[24+rcx]
- mul rax
- mov rdi,rax
- mov r8,rdx
-
- add r10,r10
- adc r11,r11
- adc r12,r12
- adc r13,r13
- adc r14,r14
- adc r15,r15
- adc r8,0
-
- mov rax,QWORD[rcx]
- mul rax
- mov QWORD[520+rsp],rax
- mov rbx,rdx
-
- mov rax,QWORD[8+rcx]
- mul rax
-
- add r10,rbx
- adc r11,rax
- adc rdx,0
-
- mov rbx,rdx
- mov QWORD[528+rsp],r10
- mov QWORD[536+rsp],r11
-
- mov rax,QWORD[16+rcx]
- mul rax
-
- add r12,rbx
- adc r13,rax
- adc rdx,0
-
- mov rbx,rdx
-
- mov QWORD[544+rsp],r12
- mov QWORD[552+rsp],r13
-
- xor rbp,rbp
- add r14,rbx
- adc r15,rdi
- adc rbp,0
-
- mov QWORD[560+rsp],r14
- mov QWORD[568+rsp],r15
-
-
-
-
- mov r10,QWORD[576+rsp]
- mov r11,QWORD[584+rsp]
- mov r12,QWORD[592+rsp]
- mov r13,QWORD[600+rsp]
- mov r14,QWORD[608+rsp]
- mov r15,QWORD[616+rsp]
- mov rdi,QWORD[624+rsp]
- mov rsi,QWORD[632+rsp]
-
- mov rax,r9
- mul rax
- mov r9,rax
- mov rbx,rdx
-
- add r10,r10
- adc r11,r11
- adc r12,r12
- adc r13,r13
- adc r14,r14
- adc r15,r15
- adc rdi,rdi
- adc rsi,rsi
- adc rbx,0
-
- add r10,rbp
-
- mov rax,QWORD[32+rcx]
- mul rax
-
- add r10,r8
- adc r11,rax
- adc rdx,0
-
- mov rbp,rdx
-
- mov QWORD[576+rsp],r10
- mov QWORD[584+rsp],r11
-
- mov rax,QWORD[40+rcx]
- mul rax
-
- add r12,rbp
- adc r13,rax
- adc rdx,0
-
- mov rbp,rdx
-
- mov QWORD[592+rsp],r12
- mov QWORD[600+rsp],r13
-
- mov rax,QWORD[48+rcx]
- mul rax
-
- add r14,rbp
- adc r15,rax
- adc rdx,0
-
- mov QWORD[608+rsp],r14
- mov QWORD[616+rsp],r15
-
- add rdi,rdx
- adc rsi,r9
- adc rbx,0
-
- mov QWORD[624+rsp],rdi
- mov QWORD[632+rsp],rsi
- mov QWORD[640+rsp],rbx
-
- jmp NEAR mont_reduce
-
-
-
-global mod_exp_512
-
-mod_exp_512:
- mov QWORD[8+rsp],rdi ;WIN64 prologue
- mov QWORD[16+rsp],rsi
- mov rax,rsp
-$L$SEH_begin_mod_exp_512:
- mov rdi,rcx
- mov rsi,rdx
- mov rdx,r8
- mov rcx,r9
-
-
- push rbp
- push rbx
- push r12
- push r13
- push r14
- push r15
-
-
- mov r8,rsp
- sub rsp,2688
- and rsp,-64
-
-
- mov QWORD[rsp],r8
- mov QWORD[8+rsp],rdi
- mov QWORD[16+rsp],rsi
- mov QWORD[24+rsp],rcx
-$L$body:
-
-
-
- pxor xmm4,xmm4
- movdqu xmm0,XMMWORD[rsi]
- movdqu xmm1,XMMWORD[16+rsi]
- movdqu xmm2,XMMWORD[32+rsi]
- movdqu xmm3,XMMWORD[48+rsi]
- movdqa XMMWORD[512+rsp],xmm4
- movdqa XMMWORD[528+rsp],xmm4
- movdqa XMMWORD[608+rsp],xmm4
- movdqa XMMWORD[624+rsp],xmm4
- movdqa XMMWORD[544+rsp],xmm0
- movdqa XMMWORD[560+rsp],xmm1
- movdqa XMMWORD[576+rsp],xmm2
- movdqa XMMWORD[592+rsp],xmm3
-
-
- movdqu xmm0,XMMWORD[rdx]
- movdqu xmm1,XMMWORD[16+rdx]
- movdqu xmm2,XMMWORD[32+rdx]
- movdqu xmm3,XMMWORD[48+rdx]
-
- lea rbx,[384+rsp]
- mov QWORD[136+rsp],rbx
- call mont_reduce
-
-
- lea rcx,[448+rsp]
- xor rax,rax
- mov QWORD[rcx],rax
- mov QWORD[8+rcx],rax
- mov QWORD[24+rcx],rax
- mov QWORD[32+rcx],rax
- mov QWORD[40+rcx],rax
- mov QWORD[48+rcx],rax
- mov QWORD[56+rcx],rax
- mov QWORD[128+rsp],rax
- mov QWORD[16+rcx],1
-
- lea rbp,[640+rsp]
- mov rsi,rcx
- mov rdi,rbp
- mov rax,8
-loop_0:
- mov rbx,QWORD[rcx]
- mov WORD[rdi],bx
- shr rbx,16
- mov WORD[64+rdi],bx
- shr rbx,16
- mov WORD[128+rdi],bx
- shr rbx,16
- mov WORD[192+rdi],bx
- lea rcx,[8+rcx]
- lea rdi,[256+rdi]
- dec rax
- jnz NEAR loop_0
- mov rax,31
- mov QWORD[32+rsp],rax
- mov QWORD[40+rsp],rbp
-
- mov QWORD[136+rsp],rsi
- mov r10,QWORD[rsi]
- mov r11,QWORD[8+rsi]
- mov r12,QWORD[16+rsi]
- mov r13,QWORD[24+rsi]
- mov r14,QWORD[32+rsi]
- mov r15,QWORD[40+rsi]
- mov r8,QWORD[48+rsi]
- mov r9,QWORD[56+rsi]
-init_loop:
- lea rdi,[384+rsp]
- call mont_mul_a3b
- lea rsi,[448+rsp]
- mov rbp,QWORD[40+rsp]
- add rbp,2
- mov QWORD[40+rsp],rbp
- mov rcx,rsi
- mov rax,8
-loop_1:
- mov rbx,QWORD[rcx]
- mov WORD[rbp],bx
- shr rbx,16
- mov WORD[64+rbp],bx
- shr rbx,16
- mov WORD[128+rbp],bx
- shr rbx,16
- mov WORD[192+rbp],bx
- lea rcx,[8+rcx]
- lea rbp,[256+rbp]
- dec rax
- jnz NEAR loop_1
- mov rax,QWORD[32+rsp]
- sub rax,1
- mov QWORD[32+rsp],rax
- jne NEAR init_loop
-
-
-
- movdqa XMMWORD[64+rsp],xmm0
- movdqa XMMWORD[80+rsp],xmm1
- movdqa XMMWORD[96+rsp],xmm2
- movdqa XMMWORD[112+rsp],xmm3
-
-
-
-
-
- mov eax,DWORD[126+rsp]
- mov rdx,rax
- shr rax,11
- and edx,0x07FF
- mov DWORD[126+rsp],edx
- lea rsi,[640+rax*2+rsp]
- mov rdx,QWORD[8+rsp]
- mov rbp,4
-loop_2:
- movzx rbx,WORD[192+rsi]
- movzx rax,WORD[448+rsi]
- shl rbx,16
- shl rax,16
- mov bx,WORD[128+rsi]
- mov ax,WORD[384+rsi]
- shl rbx,16
- shl rax,16
- mov bx,WORD[64+rsi]
- mov ax,WORD[320+rsi]
- shl rbx,16
- shl rax,16
- mov bx,WORD[rsi]
- mov ax,WORD[256+rsi]
- mov QWORD[rdx],rbx
- mov QWORD[8+rdx],rax
- lea rsi,[512+rsi]
- lea rdx,[16+rdx]
- sub rbp,1
- jnz NEAR loop_2
- mov QWORD[48+rsp],505
-
- mov rcx,QWORD[8+rsp]
- mov QWORD[136+rsp],rcx
- mov r10,QWORD[rcx]
- mov r11,QWORD[8+rcx]
- mov r12,QWORD[16+rcx]
- mov r13,QWORD[24+rcx]
- mov r14,QWORD[32+rcx]
- mov r15,QWORD[40+rcx]
- mov r8,QWORD[48+rcx]
- mov r9,QWORD[56+rcx]
- jmp NEAR sqr_2
-
-main_loop_a3b:
- call sqr_reduce
- call sqr_reduce
- call sqr_reduce
-sqr_2:
- call sqr_reduce
- call sqr_reduce
-
-
-
- mov rcx,QWORD[48+rsp]
- mov rax,rcx
- shr rax,4
- mov edx,DWORD[64+rax*2+rsp]
- and rcx,15
- shr rdx,cl
- and rdx,0x1F
-
- lea rsi,[640+rdx*2+rsp]
- lea rdx,[448+rsp]
- mov rdi,rdx
- mov rbp,4
-loop_3:
- movzx rbx,WORD[192+rsi]
- movzx rax,WORD[448+rsi]
- shl rbx,16
- shl rax,16
- mov bx,WORD[128+rsi]
- mov ax,WORD[384+rsi]
- shl rbx,16
- shl rax,16
- mov bx,WORD[64+rsi]
- mov ax,WORD[320+rsi]
- shl rbx,16
- shl rax,16
- mov bx,WORD[rsi]
- mov ax,WORD[256+rsi]
- mov QWORD[rdx],rbx
- mov QWORD[8+rdx],rax
- lea rsi,[512+rsi]
- lea rdx,[16+rdx]
- sub rbp,1
- jnz NEAR loop_3
- mov rsi,QWORD[8+rsp]
- call mont_mul_a3b
-
-
-
- mov rcx,QWORD[48+rsp]
- sub rcx,5
- mov QWORD[48+rsp],rcx
- jge NEAR main_loop_a3b
-
-
-
-end_main_loop_a3b:
-
-
- mov rdx,QWORD[8+rsp]
- pxor xmm4,xmm4
- movdqu xmm0,XMMWORD[rdx]
- movdqu xmm1,XMMWORD[16+rdx]
- movdqu xmm2,XMMWORD[32+rdx]
- movdqu xmm3,XMMWORD[48+rdx]
- movdqa XMMWORD[576+rsp],xmm4
- movdqa XMMWORD[592+rsp],xmm4
- movdqa XMMWORD[608+rsp],xmm4
- movdqa XMMWORD[624+rsp],xmm4
- movdqa XMMWORD[512+rsp],xmm0
- movdqa XMMWORD[528+rsp],xmm1
- movdqa XMMWORD[544+rsp],xmm2
- movdqa XMMWORD[560+rsp],xmm3
- call mont_reduce
-
-
-
- mov rax,QWORD[8+rsp]
- mov r8,QWORD[rax]
- mov r9,QWORD[8+rax]
- mov r10,QWORD[16+rax]
- mov r11,QWORD[24+rax]
- mov r12,QWORD[32+rax]
- mov r13,QWORD[40+rax]
- mov r14,QWORD[48+rax]
- mov r15,QWORD[56+rax]
-
-
- mov rbx,QWORD[24+rsp]
- add rbx,512
-
- sub r8,QWORD[rbx]
- sbb r9,QWORD[8+rbx]
- sbb r10,QWORD[16+rbx]
- sbb r11,QWORD[24+rbx]
- sbb r12,QWORD[32+rbx]
- sbb r13,QWORD[40+rbx]
- sbb r14,QWORD[48+rbx]
- sbb r15,QWORD[56+rbx]
-
-
- mov rsi,QWORD[rax]
- mov rdi,QWORD[8+rax]
- mov rcx,QWORD[16+rax]
- mov rdx,QWORD[24+rax]
- cmovnc rsi,r8
- cmovnc rdi,r9
- cmovnc rcx,r10
- cmovnc rdx,r11
- mov QWORD[rax],rsi
- mov QWORD[8+rax],rdi
- mov QWORD[16+rax],rcx
- mov QWORD[24+rax],rdx
-
- mov rsi,QWORD[32+rax]
- mov rdi,QWORD[40+rax]
- mov rcx,QWORD[48+rax]
- mov rdx,QWORD[56+rax]
- cmovnc rsi,r12
- cmovnc rdi,r13
- cmovnc rcx,r14
- cmovnc rdx,r15
- mov QWORD[32+rax],rsi
- mov QWORD[40+rax],rdi
- mov QWORD[48+rax],rcx
- mov QWORD[56+rax],rdx
-
- mov rsi,QWORD[rsp]
- mov r15,QWORD[rsi]
- mov r14,QWORD[8+rsi]
- mov r13,QWORD[16+rsi]
- mov r12,QWORD[24+rsi]
- mov rbx,QWORD[32+rsi]
- mov rbp,QWORD[40+rsi]
- lea rsp,[48+rsi]
-$L$epilogue:
- mov rdi,QWORD[8+rsp] ;WIN64 epilogue
- mov rsi,QWORD[16+rsp]
- DB 0F3h,0C3h ;repret
-$L$SEH_end_mod_exp_512:
-EXTERN __imp_RtlVirtualUnwind
-
-ALIGN 16
-mod_exp_512_se_handler:
- push rsi
- push rdi
- push rbx
- push rbp
- push r12
- push r13
- push r14
- push r15
- pushfq
- sub rsp,64
-
- mov rax,QWORD[120+r8]
- mov rbx,QWORD[248+r8]
-
- lea r10,[$L$body]
- cmp rbx,r10
- jb NEAR $L$in_prologue
-
- mov rax,QWORD[152+r8]
-
- lea r10,[$L$epilogue]
- cmp rbx,r10
- jae NEAR $L$in_prologue
-
- mov rax,QWORD[rax]
-
- mov rbx,QWORD[32+rax]
- mov rbp,QWORD[40+rax]
- mov r12,QWORD[24+rax]
- mov r13,QWORD[16+rax]
- mov r14,QWORD[8+rax]
- mov r15,QWORD[rax]
- lea rax,[48+rax]
- mov QWORD[144+r8],rbx
- mov QWORD[160+r8],rbp
- mov QWORD[216+r8],r12
- mov QWORD[224+r8],r13
- mov QWORD[232+r8],r14
- mov QWORD[240+r8],r15
-
-$L$in_prologue:
- mov rdi,QWORD[8+rax]
- mov rsi,QWORD[16+rax]
- mov QWORD[152+r8],rax
- mov QWORD[168+r8],rsi
- mov QWORD[176+r8],rdi
-
- mov rdi,QWORD[40+r9]
- mov rsi,r8
- mov ecx,154
- DD 0xa548f3fc
-
- mov rsi,r9
- xor rcx,rcx
- mov rdx,QWORD[8+rsi]
- mov r8,QWORD[rsi]
- mov r9,QWORD[16+rsi]
- mov r10,QWORD[40+rsi]
- lea r11,[56+rsi]
- lea r12,[24+rsi]
- mov QWORD[32+rsp],r10
- mov QWORD[40+rsp],r11
- mov QWORD[48+rsp],r12
- mov QWORD[56+rsp],rcx
- call QWORD[__imp_RtlVirtualUnwind]
-
- mov eax,1
- add rsp,64
- popfq
- pop r15
- pop r14
- pop r13
- pop r12
- pop rbp
- pop rbx
- pop rdi
- pop rsi
- DB 0F3h,0C3h ;repret
-
-
-section .pdata rdata align=4
-ALIGN 4
- DD $L$SEH_begin_mod_exp_512 wrt ..imagebase
- DD $L$SEH_end_mod_exp_512 wrt ..imagebase
- DD $L$SEH_info_mod_exp_512 wrt ..imagebase
-
-section .xdata rdata align=8
-ALIGN 8
-$L$SEH_info_mod_exp_512:
-DB 9,0,0,0
- DD mod_exp_512_se_handler wrt ..imagebase