-rw-r--r-- 71820 lib25519-20240928/crypto_multiscalar/ed25519/amd64-maax-opt/ge25519_multi_scalarmult_process.S raw
#include "crypto_asm_hidden.h" // linker define ge25519_multi_scalarmult_process // linker use EC2D0 EC2D1 EC2D2 EC2D3 mask63 // linker use twoexp8_p0 // linker use twoexp8_p123 // linker use twoexp8_p4 #define EC2D0 CRYPTO_SHARED_NAMESPACE(EC2D0) #define EC2D1 CRYPTO_SHARED_NAMESPACE(EC2D1) #define EC2D2 CRYPTO_SHARED_NAMESPACE(EC2D2) #define EC2D3 CRYPTO_SHARED_NAMESPACE(EC2D3) #define mask63 CRYPTO_SHARED_NAMESPACE(mask63) #define twoexp8_p0 CRYPTO_SHARED_NAMESPACE(twoexp8_p0) #define twoexp8_p123 CRYPTO_SHARED_NAMESPACE(twoexp8_p123) #define twoexp8_p4 CRYPTO_SHARED_NAMESPACE(twoexp8_p4) .p2align 5 ASM_HIDDEN _CRYPTO_SHARED_NAMESPACE(ge25519_multi_scalarmult_process) .globl _CRYPTO_SHARED_NAMESPACE(ge25519_multi_scalarmult_process) ASM_HIDDEN CRYPTO_SHARED_NAMESPACE(ge25519_multi_scalarmult_process) .globl CRYPTO_SHARED_NAMESPACE(ge25519_multi_scalarmult_process) _CRYPTO_SHARED_NAMESPACE(ge25519_multi_scalarmult_process): CRYPTO_SHARED_NAMESPACE(ge25519_multi_scalarmult_process): movq %rsp,%r11 andq $-32,%rsp subq $632,%rsp movq %r11,0(%rsp) movq %r12,8(%rsp) movq %r13,16(%rsp) movq %r14,24(%rsp) movq %r15,32(%rsp) movq %rbx,40(%rsp) movq %rbp,48(%rsp) // p1p1 to 0 movq $0,%rax movq $1,%rbx movq %rax,144(%rsp) movq %rax,152(%rsp) movq %rax,160(%rsp) movq %rax,168(%rsp) movq %rbx,176(%rsp) movq %rax,184(%rsp) movq %rax,192(%rsp) movq %rax,200(%rsp) movq %rbx,208(%rsp) movq %rax,216(%rsp) movq %rax,224(%rsp) movq %rax,232(%rsp) movq %rbx,240(%rsp) movq %rax,248(%rsp) movq %rax,256(%rsp) movq %rax,264(%rsp) movq %rdi,56(%rsp) movq %rsi,64(%rsp) movq %rdx,72(%rsp) movq %rcx,80(%rsp) movq %rax,88(%rsp) movq $128,%rdx mulx %r8,%r8,%r9 movq %r8,96(%rsp) movq $255,104(%rsp) addq 104(%rsp),%rsi movq %rsi,112(%rsp) .L1: movq 88(%rsp),%rax cmpq $0,%rax je .L2 /* p1p1 to p2 */ // mul xorq %r13,%r13 movq 144(%rsp),%rdx mulx 240(%rsp),%r8,%r9 mulx 248(%rsp),%rcx,%r10 adcx %rcx,%r9 mulx 256(%rsp),%rcx,%r11 adcx %rcx,%r10 mulx 264(%rsp),%rcx,%r12 adcx %rcx,%r11 adcx %r13,%r12 xorq %r14,%r14 movq 152(%rsp),%rdx mulx 240(%rsp),%rcx,%rbp adcx %rcx,%r9 adox %rbp,%r10 mulx 248(%rsp),%rcx,%rbp adcx %rcx,%r10 adox %rbp,%r11 mulx 256(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 264(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 adcx %r14,%r13 xorq %r15,%r15 movq 160(%rsp),%rdx mulx 240(%rsp),%rcx,%rbp adcx %rcx,%r10 adox %rbp,%r11 mulx 248(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 256(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 mulx 264(%rsp),%rcx,%rbp adcx %rcx,%r13 adox %rbp,%r14 adcx %r15,%r14 xorq %rax,%rax movq 168(%rsp),%rdx mulx 240(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 248(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 mulx 256(%rsp),%rcx,%rbp adcx %rcx,%r13 adox %rbp,%r14 mulx 264(%rsp),%rcx,%rbp adcx %rcx,%r14 adox %rbp,%r15 adcx %rax,%r15 xorq %rbp,%rbp movq $38,%rdx mulx %r12,%rax,%r12 adcx %rax,%r8 adox %r12,%r9 mulx %r13,%rcx,%r13 adcx %rcx,%r9 adox %r13,%r10 mulx %r14,%rcx,%r14 adcx %rcx,%r10 adox %r14,%r11 mulx %r15,%rcx,%r15 adcx %rcx,%r11 adox %rbp,%r15 adcx %rbp,%r15 shld $1,%r11,%r15 andq mask63(%rip),%r11 imul $19,%r15,%r15 addq %r15,%r8 adcq $0,%r9 adcq $0,%r10 adcq $0,%r11 movq %r8,272(%rsp) movq %r9,280(%rsp) movq %r10,288(%rsp) movq %r11,296(%rsp) // mul xorq %r13,%r13 movq 176(%rsp),%rdx mulx 208(%rsp),%r8,%r9 mulx 216(%rsp),%rcx,%r10 adcx %rcx,%r9 mulx 224(%rsp),%rcx,%r11 adcx %rcx,%r10 mulx 232(%rsp),%rcx,%r12 adcx %rcx,%r11 adcx %r13,%r12 xorq %r14,%r14 movq 184(%rsp),%rdx mulx 208(%rsp),%rcx,%rbp adcx %rcx,%r9 adox %rbp,%r10 mulx 216(%rsp),%rcx,%rbp adcx %rcx,%r10 adox %rbp,%r11 mulx 224(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 232(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 adcx %r14,%r13 xorq %r15,%r15 movq 192(%rsp),%rdx mulx 208(%rsp),%rcx,%rbp adcx %rcx,%r10 adox %rbp,%r11 mulx 216(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 224(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 mulx 232(%rsp),%rcx,%rbp adcx %rcx,%r13 adox %rbp,%r14 adcx %r15,%r14 xorq %rax,%rax movq 200(%rsp),%rdx mulx 208(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 216(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 mulx 224(%rsp),%rcx,%rbp adcx %rcx,%r13 adox %rbp,%r14 mulx 232(%rsp),%rcx,%rbp adcx %rcx,%r14 adox %rbp,%r15 adcx %rax,%r15 xorq %rbp,%rbp movq $38,%rdx mulx %r12,%rax,%r12 adcx %rax,%r8 adox %r12,%r9 mulx %r13,%rcx,%r13 adcx %rcx,%r9 adox %r13,%r10 mulx %r14,%rcx,%r14 adcx %rcx,%r10 adox %r14,%r11 mulx %r15,%rcx,%r15 adcx %rcx,%r11 adox %rbp,%r15 adcx %rbp,%r15 shld $1,%r11,%r15 andq mask63(%rip),%r11 imul $19,%r15,%r15 addq %r15,%r8 adcq $0,%r9 adcq $0,%r10 adcq $0,%r11 movq %r8,304(%rsp) movq %r9,312(%rsp) movq %r10,320(%rsp) movq %r11,328(%rsp) // mul xorq %r13,%r13 movq 176(%rsp),%rdx mulx 240(%rsp),%r8,%r9 mulx 248(%rsp),%rcx,%r10 adcx %rcx,%r9 mulx 256(%rsp),%rcx,%r11 adcx %rcx,%r10 mulx 264(%rsp),%rcx,%r12 adcx %rcx,%r11 adcx %r13,%r12 xorq %r14,%r14 movq 184(%rsp),%rdx mulx 240(%rsp),%rcx,%rbp adcx %rcx,%r9 adox %rbp,%r10 mulx 248(%rsp),%rcx,%rbp adcx %rcx,%r10 adox %rbp,%r11 mulx 256(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 264(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 adcx %r14,%r13 xorq %r15,%r15 movq 192(%rsp),%rdx mulx 240(%rsp),%rcx,%rbp adcx %rcx,%r10 adox %rbp,%r11 mulx 248(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 256(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 mulx 264(%rsp),%rcx,%rbp adcx %rcx,%r13 adox %rbp,%r14 adcx %r15,%r14 xorq %rax,%rax movq 200(%rsp),%rdx mulx 240(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 248(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 mulx 256(%rsp),%rcx,%rbp adcx %rcx,%r13 adox %rbp,%r14 mulx 264(%rsp),%rcx,%rbp adcx %rcx,%r14 adox %rbp,%r15 adcx %rax,%r15 xorq %rbp,%rbp movq $38,%rdx mulx %r12,%rax,%r12 adcx %rax,%r8 adox %r12,%r9 mulx %r13,%rcx,%r13 adcx %rcx,%r9 adox %r13,%r10 mulx %r14,%rcx,%r14 adcx %rcx,%r10 adox %r14,%r11 mulx %r15,%rcx,%r15 adcx %rcx,%r11 adox %rbp,%r15 adcx %rbp,%r15 shld $1,%r11,%r15 andq mask63(%rip),%r11 imul $19,%r15,%r15 addq %r15,%r8 adcq $0,%r9 adcq $0,%r10 adcq $0,%r11 movq %r8,336(%rsp) movq %r9,344(%rsp) movq %r10,352(%rsp) movq %r11,360(%rsp) /* dbl p1p1 */ // square xorq %r13,%r13 movq 336(%rsp),%rdx mulx 344(%rsp),%r9,%r10 mulx 352(%rsp),%rcx,%r11 adcx %rcx,%r10 mulx 360(%rsp),%rcx,%r12 adcx %rcx,%r11 adcx %r13,%r12 movq 344(%rsp),%rdx xorq %r14,%r14 mulx 352(%rsp),%rcx,%rdx adcx %rcx,%r11 adox %rdx,%r12 movq 344(%rsp),%rdx mulx 360(%rsp),%rcx,%rdx adcx %rcx,%r12 adox %rdx,%r13 adcx %r14,%r13 xorq %r15,%r15 movq 352(%rsp),%rdx mulx 360(%rsp),%rcx,%r14 adcx %rcx,%r13 adcx %r15,%r14 shld $1,%r14,%r15 shld $1,%r13,%r14 shld $1,%r12,%r13 shld $1,%r11,%r12 shld $1,%r10,%r11 shld $1,%r9,%r10 shlq $1,%r9 xorq %rdx,%rdx movq 336(%rsp),%rdx mulx %rdx,%r8,%rdx adcx %rdx,%r9 movq 344(%rsp),%rdx mulx %rdx,%rcx,%rdx adcx %rcx,%r10 adcx %rdx,%r11 movq 352(%rsp),%rdx mulx %rdx,%rcx,%rdx adcx %rcx,%r12 adcx %rdx,%r13 movq 360(%rsp),%rdx mulx %rdx,%rcx,%rdx adcx %rcx,%r14 adcx %rdx,%r15 xorq %rbp,%rbp movq $38,%rdx mulx %r12,%rax,%r12 adcx %rax,%r8 adox %r12,%r9 mulx %r13,%rcx,%r13 adcx %rcx,%r9 adox %r13,%r10 mulx %r14,%rcx,%r14 adcx %rcx,%r10 adox %r14,%r11 mulx %r15,%rcx,%r15 adcx %rcx,%r11 adox %rbp,%r15 adcx %rbp,%r15 // double addq %r8,%r8 adcq %r9,%r9 adcq %r10,%r10 adcq %r11,%r11 adcq %r15,%r15 movq %r8,448(%rsp) movq %r9,456(%rsp) movq %r10,464(%rsp) movq %r11,472(%rsp) movq %r15,480(%rsp) // square xorq %r13,%r13 movq 304(%rsp),%rdx mulx 312(%rsp),%r9,%r10 mulx 320(%rsp),%rcx,%r11 adcx %rcx,%r10 mulx 328(%rsp),%rcx,%r12 adcx %rcx,%r11 adcx %r13,%r12 movq 312(%rsp),%rdx xorq %r14,%r14 mulx 320(%rsp),%rcx,%rdx adcx %rcx,%r11 adox %rdx,%r12 movq 312(%rsp),%rdx mulx 328(%rsp),%rcx,%rdx adcx %rcx,%r12 adox %rdx,%r13 adcx %r14,%r13 xorq %r15,%r15 movq 320(%rsp),%rdx mulx 328(%rsp),%rcx,%r14 adcx %rcx,%r13 adcx %r15,%r14 shld $1,%r14,%r15 shld $1,%r13,%r14 shld $1,%r12,%r13 shld $1,%r11,%r12 shld $1,%r10,%r11 shld $1,%r9,%r10 shlq $1,%r9 xorq %rdx,%rdx movq 304(%rsp),%rdx mulx %rdx,%r8,%rdx adcx %rdx,%r9 movq 312(%rsp),%rdx mulx %rdx,%rcx,%rdx adcx %rcx,%r10 adcx %rdx,%r11 movq 320(%rsp),%rdx mulx %rdx,%rcx,%rdx adcx %rcx,%r12 adcx %rdx,%r13 movq 328(%rsp),%rdx mulx %rdx,%rcx,%rdx adcx %rcx,%r14 adcx %rdx,%r15 xorq %rbp,%rbp movq $38,%rdx mulx %r12,%rax,%r12 adcx %rax,%r8 adox %r12,%r9 mulx %r13,%rcx,%r13 adcx %rcx,%r9 adox %r13,%r10 mulx %r14,%rcx,%r14 adcx %rcx,%r10 adox %r14,%r11 mulx %r15,%rcx,%r15 adcx %rcx,%r11 adox %rbp,%r15 adcx %rbp,%r15 movq %r8,408(%rsp) movq %r9,416(%rsp) movq %r10,424(%rsp) movq %r11,432(%rsp) movq %r15,440(%rsp) // square xorq %r13,%r13 movq 272(%rsp),%rdx mulx 280(%rsp),%r9,%r10 mulx 288(%rsp),%rcx,%r11 adcx %rcx,%r10 mulx 296(%rsp),%rcx,%r12 adcx %rcx,%r11 adcx %r13,%r12 movq 280(%rsp),%rdx xorq %r14,%r14 mulx 288(%rsp),%rcx,%rdx adcx %rcx,%r11 adox %rdx,%r12 movq 280(%rsp),%rdx mulx 296(%rsp),%rcx,%rdx adcx %rcx,%r12 adox %rdx,%r13 adcx %r14,%r13 xorq %r15,%r15 movq 288(%rsp),%rdx mulx 296(%rsp),%rcx,%r14 adcx %rcx,%r13 adcx %r15,%r14 shld $1,%r14,%r15 shld $1,%r13,%r14 shld $1,%r12,%r13 shld $1,%r11,%r12 shld $1,%r10,%r11 shld $1,%r9,%r10 shlq $1,%r9 xorq %rdx,%rdx movq 272(%rsp),%rdx mulx %rdx,%r8,%rdx adcx %rdx,%r9 movq 280(%rsp),%rdx mulx %rdx,%rcx,%rdx adcx %rcx,%r10 adcx %rdx,%r11 movq 288(%rsp),%rdx mulx %rdx,%rcx,%rdx adcx %rcx,%r12 adcx %rdx,%r13 movq 296(%rsp),%rdx mulx %rdx,%rcx,%rdx adcx %rcx,%r14 adcx %rdx,%r15 xorq %rbp,%rbp movq $38,%rdx mulx %r12,%rax,%r12 adcx %rax,%r8 adox %r12,%r9 mulx %r13,%rcx,%r13 adcx %rcx,%r9 adox %r13,%r10 mulx %r14,%rcx,%r14 adcx %rcx,%r10 adox %r14,%r11 mulx %r15,%rcx,%r15 adcx %rcx,%r11 adox %rbp,%r15 adcx %rbp,%r15 movq %r8,368(%rsp) movq %r9,376(%rsp) movq %r10,384(%rsp) movq %r11,392(%rsp) movq %r15,400(%rsp) // neg movq twoexp8_p0(%rip),%r12 movq twoexp8_p123(%rip),%r13 movq twoexp8_p123(%rip),%r14 movq twoexp8_p123(%rip),%rax movq twoexp8_p4(%rip),%rbx subq %r8,%r12 sbbq %r9,%r13 sbbq %r10,%r14 sbbq %r11,%rax sbbq %r15,%rbx // add addq 408(%rsp),%r12 adcq 416(%rsp),%r13 adcq 424(%rsp),%r14 adcq 432(%rsp),%rax adcq 440(%rsp),%rbx movq %r12,%r8 movq %r13,%r9 movq %r14,%r10 movq %rax,%r11 movq %rbx,%r15 shld $1,%rax,%rbx andq mask63(%rip),%rax imul $19,%rbx,%rbx addq %rbx,%r12 adcq $0,%r13 adcq $0,%r14 adcq $0,%rax movq %r12,176(%rsp) movq %r13,184(%rsp) movq %r14,192(%rsp) movq %rax,200(%rsp) // sub subq 448(%rsp),%r8 sbbq 456(%rsp),%r9 sbbq 464(%rsp),%r10 sbbq 472(%rsp),%r11 sbbq 480(%rsp),%r15 shld $1,%r11,%r15 andq mask63(%rip),%r11 imul $19,%r15,%r15 addq %r15,%r8 adcq $0,%r9 adcq $0,%r10 adcq $0,%r11 movq %r8,240(%rsp) movq %r9,248(%rsp) movq %r10,256(%rsp) movq %r11,264(%rsp) // neg movq twoexp8_p0(%rip),%r8 movq twoexp8_p123(%rip),%r9 movq twoexp8_p123(%rip),%r10 movq twoexp8_p123(%rip),%r11 movq twoexp8_p4(%rip),%rax subq 408(%rsp),%r8 sbbq 416(%rsp),%r9 sbbq 424(%rsp),%r10 sbbq 432(%rsp),%r11 sbbq 440(%rsp),%rax // sub subq 368(%rsp),%r8 sbbq 376(%rsp),%r9 sbbq 384(%rsp),%r10 sbbq 392(%rsp),%r11 sbbq 400(%rsp),%rax shld $1,%r11,%rax andq mask63(%rip),%r11 imul $19,%rax,%rax addq %rax,%r8 adcq $0,%r9 adcq $0,%r10 adcq $0,%r11 movq %r8,208(%rsp) movq %r9,216(%rsp) movq %r10,224(%rsp) movq %r11,232(%rsp) // add movq 272(%rsp),%rbx movq 280(%rsp),%rbp movq 288(%rsp),%rcx movq 296(%rsp),%rsi addq 304(%rsp),%rbx adcq 312(%rsp),%rbp adcq 320(%rsp),%rcx adcq 328(%rsp),%rsi movq $0,%rdx movq $38,%rax cmovae %rdx,%rax addq %rax,%rbx adcq %rdx,%rbp adcq %rdx,%rcx adcq %rdx,%rsi cmovc %rax,%rdx addq %rdx,%rbx // square xorq %r13,%r13 movq %rbx,%rdx mulx %rbp,%r9,%r10 mulx %rcx,%r8,%r11 adcx %r8,%r10 mulx %rsi,%r8,%r12 adcx %r8,%r11 adcx %r13,%r12 movq %rbp,%rdx xorq %r14,%r14 mulx %rcx,%r8,%rdx adcx %r8,%r11 adox %rdx,%r12 movq %rbp,%rdx mulx %rsi,%r8,%rdx adcx %r8,%r12 adox %rdx,%r13 adcx %r14,%r13 xorq %r15,%r15 movq %rcx,%rdx mulx %rsi,%r8,%r14 adcx %r8,%r13 adcx %r15,%r14 shld $1,%r14,%r15 shld $1,%r13,%r14 shld $1,%r12,%r13 shld $1,%r11,%r12 shld $1,%r10,%r11 shld $1,%r9,%r10 shlq $1,%r9 xorq %rdx,%rdx movq %rbx,%rdx mulx %rdx,%r8,%rdx adcx %rdx,%r9 movq %rbp,%rdx mulx %rdx,%rax,%rdx adcx %rax,%r10 adcx %rdx,%r11 movq %rcx,%rdx mulx %rdx,%rax,%rdx adcx %rax,%r12 adcx %rdx,%r13 movq %rsi,%rdx mulx %rdx,%rax,%rdx adcx %rax,%r14 adcx %rdx,%r15 xorq %rbp,%rbp movq $38,%rdx mulx %r12,%rax,%r12 adcx %rax,%r8 adox %r12,%r9 mulx %r13,%rcx,%r13 adcx %rcx,%r9 adox %r13,%r10 mulx %r14,%rcx,%r14 adcx %rcx,%r10 adox %r14,%r11 mulx %r15,%rcx,%r15 adcx %rcx,%r11 adox %rbp,%r15 adcx %rbp,%r15 // add addq 208(%rsp),%r8 adcq 216(%rsp),%r9 adcq 224(%rsp),%r10 adcq 232(%rsp),%r11 adcq $0,%r15 shld $1,%r11,%r15 andq mask63(%rip),%r11 imul $19,%r15,%r15 addq %r15,%r8 adcq $0,%r9 adcq $0,%r10 adcq $0,%r11 movq %r8,144(%rsp) movq %r9,152(%rsp) movq %r10,160(%rsp) movq %r11,168(%rsp) .L2: movq $0,120(%rsp) movq 112(%rsp),%rsi movq %rsi,128(%rsp) .L3: movb 0(%rsi),%r14b cmpb $0,%r14b jne .L4 addq $256,%rsi movq %rsi,128(%rsp) movq 120(%rsp),%rcx addq $1,%rcx movq %rcx,120(%rsp) cmpq 80(%rsp),%rcx jl .L3 movq 112(%rsp),%rsi decq %rsi movq %rsi,112(%rsp) movq 104(%rsp),%rax decq %rax movq %rax,104(%rsp) cmpq $0,%rax jge .L1 jmp .L8 .L4: movq $1,88(%rsp) movb %r14b,136(%rsp) /* p1p1 to p3 */ // mul xorq %r13,%r13 movq 144(%rsp),%rdx mulx 240(%rsp),%r8,%r9 mulx 248(%rsp),%rcx,%r10 adcx %rcx,%r9 mulx 256(%rsp),%rcx,%r11 adcx %rcx,%r10 mulx 264(%rsp),%rcx,%r12 adcx %rcx,%r11 adcx %r13,%r12 xorq %r14,%r14 movq 152(%rsp),%rdx mulx 240(%rsp),%rcx,%rbp adcx %rcx,%r9 adox %rbp,%r10 mulx 248(%rsp),%rcx,%rbp adcx %rcx,%r10 adox %rbp,%r11 mulx 256(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 264(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 adcx %r14,%r13 xorq %r15,%r15 movq 160(%rsp),%rdx mulx 240(%rsp),%rcx,%rbp adcx %rcx,%r10 adox %rbp,%r11 mulx 248(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 256(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 mulx 264(%rsp),%rcx,%rbp adcx %rcx,%r13 adox %rbp,%r14 adcx %r15,%r14 xorq %rax,%rax movq 168(%rsp),%rdx mulx 240(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 248(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 mulx 256(%rsp),%rcx,%rbp adcx %rcx,%r13 adox %rbp,%r14 mulx 264(%rsp),%rcx,%rbp adcx %rcx,%r14 adox %rbp,%r15 adcx %rax,%r15 xorq %rbp,%rbp movq $38,%rdx mulx %r12,%rax,%r12 adcx %rax,%r8 adox %r12,%r9 mulx %r13,%rcx,%r13 adcx %rcx,%r9 adox %r13,%r10 mulx %r14,%rcx,%r14 adcx %rcx,%r10 adox %r14,%r11 mulx %r15,%rcx,%r15 adcx %rcx,%r11 adox %rbp,%r15 adcx %rbp,%r15 movq %r8,272(%rsp) movq %r9,280(%rsp) movq %r10,288(%rsp) movq %r11,296(%rsp) movq %r15,304(%rsp) // mul xorq %r13,%r13 movq 176(%rsp),%rdx mulx 208(%rsp),%r8,%r9 mulx 216(%rsp),%rcx,%r10 adcx %rcx,%r9 mulx 224(%rsp),%rcx,%r11 adcx %rcx,%r10 mulx 232(%rsp),%rcx,%r12 adcx %rcx,%r11 adcx %r13,%r12 xorq %r14,%r14 movq 184(%rsp),%rdx mulx 208(%rsp),%rcx,%rbp adcx %rcx,%r9 adox %rbp,%r10 mulx 216(%rsp),%rcx,%rbp adcx %rcx,%r10 adox %rbp,%r11 mulx 224(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 232(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 adcx %r14,%r13 xorq %r15,%r15 movq 192(%rsp),%rdx mulx 208(%rsp),%rcx,%rbp adcx %rcx,%r10 adox %rbp,%r11 mulx 216(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 224(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 mulx 232(%rsp),%rcx,%rbp adcx %rcx,%r13 adox %rbp,%r14 adcx %r15,%r14 xorq %rax,%rax movq 200(%rsp),%rdx mulx 208(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 216(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 mulx 224(%rsp),%rcx,%rbp adcx %rcx,%r13 adox %rbp,%r14 mulx 232(%rsp),%rcx,%rbp adcx %rcx,%r14 adox %rbp,%r15 adcx %rax,%r15 xorq %rbp,%rbp movq $38,%rdx mulx %r12,%rax,%r12 adcx %rax,%r8 adox %r12,%r9 mulx %r13,%rcx,%r13 adcx %rcx,%r9 adox %r13,%r10 mulx %r14,%rcx,%r14 adcx %rcx,%r10 adox %r14,%r11 mulx %r15,%rcx,%r15 adcx %rcx,%r11 adox %rbp,%r15 adcx %rbp,%r15 movq %r8,312(%rsp) movq %r9,320(%rsp) movq %r10,328(%rsp) movq %r11,336(%rsp) movq %r15,344(%rsp) // mul xorq %r13,%r13 movq 176(%rsp),%rdx mulx 240(%rsp),%r8,%r9 mulx 248(%rsp),%rcx,%r10 adcx %rcx,%r9 mulx 256(%rsp),%rcx,%r11 adcx %rcx,%r10 mulx 264(%rsp),%rcx,%r12 adcx %rcx,%r11 adcx %r13,%r12 xorq %r14,%r14 movq 184(%rsp),%rdx mulx 240(%rsp),%rcx,%rbp adcx %rcx,%r9 adox %rbp,%r10 mulx 248(%rsp),%rcx,%rbp adcx %rcx,%r10 adox %rbp,%r11 mulx 256(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 264(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 adcx %r14,%r13 xorq %r15,%r15 movq 192(%rsp),%rdx mulx 240(%rsp),%rcx,%rbp adcx %rcx,%r10 adox %rbp,%r11 mulx 248(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 256(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 mulx 264(%rsp),%rcx,%rbp adcx %rcx,%r13 adox %rbp,%r14 adcx %r15,%r14 xorq %rax,%rax movq 200(%rsp),%rdx mulx 240(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 248(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 mulx 256(%rsp),%rcx,%rbp adcx %rcx,%r13 adox %rbp,%r14 mulx 264(%rsp),%rcx,%rbp adcx %rcx,%r14 adox %rbp,%r15 adcx %rax,%r15 xorq %rbp,%rbp movq $38,%rdx mulx %r12,%rax,%r12 adcx %rax,%r8 adox %r12,%r9 mulx %r13,%rcx,%r13 adcx %rcx,%r9 adox %r13,%r10 mulx %r14,%rcx,%r14 adcx %rcx,%r10 adox %r14,%r11 mulx %r15,%rcx,%r15 adcx %rcx,%r11 adox %rbp,%r15 adcx %rbp,%r15 shld $1,%r11,%r15 andq mask63(%rip),%r11 imul $19,%r15,%r15 addq %r15,%r8 adcq $0,%r9 adcq $0,%r10 adcq $0,%r11 movq %r8,352(%rsp) movq %r9,360(%rsp) movq %r10,368(%rsp) movq %r11,376(%rsp) // mul xorq %r13,%r13 movq 144(%rsp),%rdx mulx 208(%rsp),%r8,%r9 mulx 216(%rsp),%rcx,%r10 adcx %rcx,%r9 mulx 224(%rsp),%rcx,%r11 adcx %rcx,%r10 mulx 232(%rsp),%rcx,%r12 adcx %rcx,%r11 adcx %r13,%r12 xorq %r14,%r14 movq 152(%rsp),%rdx mulx 208(%rsp),%rcx,%rbp adcx %rcx,%r9 adox %rbp,%r10 mulx 216(%rsp),%rcx,%rbp adcx %rcx,%r10 adox %rbp,%r11 mulx 224(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 232(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 adcx %r14,%r13 xorq %r15,%r15 movq 160(%rsp),%rdx mulx 208(%rsp),%rcx,%rbp adcx %rcx,%r10 adox %rbp,%r11 mulx 216(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 224(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 mulx 232(%rsp),%rcx,%rbp adcx %rcx,%r13 adox %rbp,%r14 adcx %r15,%r14 xorq %rax,%rax movq 168(%rsp),%rdx mulx 208(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 216(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 mulx 224(%rsp),%rcx,%rbp adcx %rcx,%r13 adox %rbp,%r14 mulx 232(%rsp),%rcx,%rbp adcx %rcx,%r14 adox %rbp,%r15 adcx %rax,%r15 xorq %rbp,%rbp movq $38,%rdx mulx %r12,%rax,%r12 adcx %rax,%r8 adox %r12,%r9 mulx %r13,%rcx,%r13 adcx %rcx,%r9 adox %r13,%r10 mulx %r14,%rcx,%r14 adcx %rcx,%r10 adox %r14,%r11 mulx %r15,%rcx,%r15 adcx %rcx,%r11 adox %rbp,%r15 adcx %rbp,%r15 shld $1,%r11,%r15 andq mask63(%rip),%r11 imul $19,%r15,%r15 addq %r15,%r8 adcq $0,%r9 adcq $0,%r10 adcq $0,%r11 movq %r8,392(%rsp) movq %r9,400(%rsp) movq %r10,408(%rsp) movq %r11,416(%rsp) movq 72(%rsp),%rdi movq 96(%rsp),%rdx mulx 120(%rsp),%r13,%r15 addq %r13,%rdi movb 136(%rsp),%r14b cmpb $0,%r14b jl .L5 shrb $1,%r14b movzbq %r14b,%r14 imul $128,%r14,%r14 addq %r14,%rdi /* pnielsadd p1p1 */ movq 312(%rsp),%r8 movq 320(%rsp),%r9 movq 328(%rsp),%r10 movq 336(%rsp),%r11 movq 344(%rsp),%rax // copy movq %r8,%r12 movq %r9,%r13 movq %r10,%r14 movq %r11,%r15 movq %rax,%rbx // sub addq twoexp8_p0(%rip),%r8 adcq twoexp8_p123(%rip),%r9 adcq twoexp8_p123(%rip),%r10 adcq twoexp8_p123(%rip),%r11 adcq twoexp8_p4(%rip),%rax subq 272(%rsp),%r8 sbbq 280(%rsp),%r9 sbbq 288(%rsp),%r10 sbbq 296(%rsp),%r11 sbbq 304(%rsp),%rax shld $1,%r11,%rax andq mask63(%rip),%r11 imul $19,%rax,%rax addq %rax,%r8 adcq $0,%r9 adcq $0,%r10 adcq $0,%r11 movq %r8,432(%rsp) movq %r9,440(%rsp) movq %r10,448(%rsp) movq %r11,456(%rsp) // add addq 272(%rsp),%r12 adcq 280(%rsp),%r13 adcq 288(%rsp),%r14 adcq 296(%rsp),%r15 adcq 304(%rsp),%rbx shld $1,%r15,%rbx andq mask63(%rip),%r15 imul $19,%rbx,%rbx addq %rbx,%r12 adcq $0,%r13 adcq $0,%r14 adcq $0,%r15 movq %r12,472(%rsp) movq %r13,480(%rsp) movq %r14,488(%rsp) movq %r15,496(%rsp) // mul xorq %r13,%r13 movq 0(%rdi),%rdx mulx 432(%rsp),%r8,%r9 mulx 440(%rsp),%rcx,%r10 adcx %rcx,%r9 mulx 448(%rsp),%rcx,%r11 adcx %rcx,%r10 mulx 456(%rsp),%rcx,%r12 adcx %rcx,%r11 adcx %r13,%r12 xorq %r14,%r14 movq 8(%rdi),%rdx mulx 432(%rsp),%rcx,%rbp adcx %rcx,%r9 adox %rbp,%r10 mulx 440(%rsp),%rcx,%rbp adcx %rcx,%r10 adox %rbp,%r11 mulx 448(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 456(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 adcx %r14,%r13 xorq %r15,%r15 movq 16(%rdi),%rdx mulx 432(%rsp),%rcx,%rbp adcx %rcx,%r10 adox %rbp,%r11 mulx 440(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 448(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 mulx 456(%rsp),%rcx,%rbp adcx %rcx,%r13 adox %rbp,%r14 adcx %r15,%r14 xorq %rax,%rax movq 24(%rdi),%rdx mulx 432(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 440(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 mulx 448(%rsp),%rcx,%rbp adcx %rcx,%r13 adox %rbp,%r14 mulx 456(%rsp),%rcx,%rbp adcx %rcx,%r14 adox %rbp,%r15 adcx %rax,%r15 xorq %rbp,%rbp movq $38,%rdx mulx %r12,%rax,%r12 adcx %rax,%r8 adox %r12,%r9 mulx %r13,%rcx,%r13 adcx %rcx,%r9 adox %r13,%r10 mulx %r14,%rcx,%r14 adcx %rcx,%r10 adox %r14,%r11 mulx %r15,%rcx,%r15 adcx %rcx,%r11 adox %rbp,%r15 adcx %rbp,%r15 movq %r8,432(%rsp) movq %r9,440(%rsp) movq %r10,448(%rsp) movq %r11,456(%rsp) movq %r15,464(%rsp) // mul xorq %r13,%r13 movq 32(%rdi),%rdx mulx 472(%rsp),%r8,%r9 mulx 480(%rsp),%rcx,%r10 adcx %rcx,%r9 mulx 488(%rsp),%rcx,%r11 adcx %rcx,%r10 mulx 496(%rsp),%rcx,%r12 adcx %rcx,%r11 adcx %r13,%r12 xorq %r14,%r14 movq 40(%rdi),%rdx mulx 472(%rsp),%rcx,%rbp adcx %rcx,%r9 adox %rbp,%r10 mulx 480(%rsp),%rcx,%rbp adcx %rcx,%r10 adox %rbp,%r11 mulx 488(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 496(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 adcx %r14,%r13 xorq %r15,%r15 movq 48(%rdi),%rdx mulx 472(%rsp),%rcx,%rbp adcx %rcx,%r10 adox %rbp,%r11 mulx 480(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 488(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 mulx 496(%rsp),%rcx,%rbp adcx %rcx,%r13 adox %rbp,%r14 adcx %r15,%r14 xorq %rax,%rax movq 56(%rdi),%rdx mulx 472(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 480(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 mulx 488(%rsp),%rcx,%rbp adcx %rcx,%r13 adox %rbp,%r14 mulx 496(%rsp),%rcx,%rbp adcx %rcx,%r14 adox %rbp,%r15 adcx %rax,%r15 xorq %rbp,%rbp movq $38,%rdx mulx %r12,%rax,%r12 adcx %rax,%r8 adox %r12,%r9 mulx %r13,%rcx,%r13 adcx %rcx,%r9 adox %r13,%r10 mulx %r14,%rcx,%r14 adcx %rcx,%r10 adox %r14,%r11 mulx %r15,%rcx,%r15 adcx %rcx,%r11 adox %rbp,%r15 adcx %rbp,%r15 // add movq %r8,%r12 movq %r9,%r13 movq %r10,%r14 movq %r11,%rax movq %r15,%rbx addq 432(%rsp),%r8 adcq 440(%rsp),%r9 adcq 448(%rsp),%r10 adcq 456(%rsp),%r11 adcq 464(%rsp),%r15 shld $1,%r11,%r15 andq mask63(%rip),%r11 imul $19,%r15,%r15 addq %r15,%r8 adcq $0,%r9 adcq $0,%r10 adcq $0,%r11 movq %r8,208(%rsp) movq %r9,216(%rsp) movq %r10,224(%rsp) movq %r11,232(%rsp) // sub addq twoexp8_p0(%rip),%r12 adcq twoexp8_p123(%rip),%r13 adcq twoexp8_p123(%rip),%r14 adcq twoexp8_p123(%rip),%rax adcq twoexp8_p4(%rip),%rbx subq 432(%rsp),%r12 sbbq 440(%rsp),%r13 sbbq 448(%rsp),%r14 sbbq 456(%rsp),%rax sbbq 464(%rsp),%rbx shld $1,%rax,%rbx andq mask63(%rip),%rax imul $19,%rbx,%rbx addq %rbx,%r12 adcq $0,%r13 adcq $0,%r14 adcq $0,%rax movq %r12,144(%rsp) movq %r13,152(%rsp) movq %r14,160(%rsp) movq %rax,168(%rsp) // mul xorq %r13,%r13 movq 96(%rdi),%rdx mulx 392(%rsp),%r8,%r9 mulx 400(%rsp),%rcx,%r10 adcx %rcx,%r9 mulx 408(%rsp),%rcx,%r11 adcx %rcx,%r10 mulx 416(%rsp),%rcx,%r12 adcx %rcx,%r11 adcx %r13,%r12 xorq %r14,%r14 movq 104(%rdi),%rdx mulx 392(%rsp),%rcx,%rbp adcx %rcx,%r9 adox %rbp,%r10 mulx 400(%rsp),%rcx,%rbp adcx %rcx,%r10 adox %rbp,%r11 mulx 408(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 416(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 adcx %r14,%r13 xorq %r15,%r15 movq 112(%rdi),%rdx mulx 392(%rsp),%rcx,%rbp adcx %rcx,%r10 adox %rbp,%r11 mulx 400(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 408(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 mulx 416(%rsp),%rcx,%rbp adcx %rcx,%r13 adox %rbp,%r14 adcx %r15,%r14 xorq %rax,%rax movq 120(%rdi),%rdx mulx 392(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 400(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 mulx 408(%rsp),%rcx,%rbp adcx %rcx,%r13 adox %rbp,%r14 mulx 416(%rsp),%rcx,%rbp adcx %rcx,%r14 adox %rbp,%r15 adcx %rax,%r15 xorq %rbp,%rbp movq $38,%rdx mulx %r12,%rax,%r12 adcx %rax,%r8 adox %r12,%r9 mulx %r13,%rcx,%r13 adcx %rcx,%r9 adox %r13,%r10 mulx %r14,%rcx,%r14 adcx %rcx,%r10 adox %r14,%r11 mulx %r15,%rcx,%r15 adcx %rcx,%r11 adox %rbp,%r15 adcx %rbp,%r15 movq %r8,432(%rsp) movq %r9,440(%rsp) movq %r10,448(%rsp) movq %r11,456(%rsp) movq %r15,464(%rsp) // mul xorq %r13,%r13 movq 64(%rdi),%rdx mulx 352(%rsp),%r8,%r9 mulx 360(%rsp),%rcx,%r10 adcx %rcx,%r9 mulx 368(%rsp),%rcx,%r11 adcx %rcx,%r10 mulx 376(%rsp),%rcx,%r12 adcx %rcx,%r11 adcx %r13,%r12 xorq %r14,%r14 movq 72(%rdi),%rdx mulx 352(%rsp),%rcx,%rbp adcx %rcx,%r9 adox %rbp,%r10 mulx 360(%rsp),%rcx,%rbp adcx %rcx,%r10 adox %rbp,%r11 mulx 368(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 376(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 adcx %r14,%r13 xorq %r15,%r15 movq 80(%rdi),%rdx mulx 352(%rsp),%rcx,%rbp adcx %rcx,%r10 adox %rbp,%r11 mulx 360(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 368(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 mulx 376(%rsp),%rcx,%rbp adcx %rcx,%r13 adox %rbp,%r14 adcx %r15,%r14 xorq %rax,%rax movq 88(%rdi),%rdx mulx 352(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 360(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 mulx 368(%rsp),%rcx,%rbp adcx %rcx,%r13 adox %rbp,%r14 mulx 376(%rsp),%rcx,%rbp adcx %rcx,%r14 adox %rbp,%r15 adcx %rax,%r15 xorq %rbp,%rbp movq $38,%rdx mulx %r12,%rax,%r12 adcx %rax,%r8 adox %r12,%r9 mulx %r13,%rcx,%r13 adcx %rcx,%r9 adox %r13,%r10 mulx %r14,%rcx,%r14 adcx %rcx,%r10 adox %r14,%r11 mulx %r15,%rcx,%r15 adcx %rcx,%r11 adox %rbp,%r15 adcx %rbp,%r15 // double addq %r8,%r8 adcq %r9,%r9 adcq %r10,%r10 adcq %r11,%r11 adcq %r15,%r15 // add movq %r8,%r12 movq %r9,%r13 movq %r10,%r14 movq %r11,%rax movq %r15,%rbx addq 432(%rsp),%r8 adcq 440(%rsp),%r9 adcq 448(%rsp),%r10 adcq 456(%rsp),%r11 adcq 464(%rsp),%r15 shld $1,%r11,%r15 andq mask63(%rip),%r11 imul $19,%r15,%r15 addq %r15,%r8 adcq $0,%r9 adcq $0,%r10 adcq $0,%r11 movq %r8,176(%rsp) movq %r9,184(%rsp) movq %r10,192(%rsp) movq %r11,200(%rsp) // sub addq twoexp8_p0(%rip),%r12 adcq twoexp8_p123(%rip),%r13 adcq twoexp8_p123(%rip),%r14 adcq twoexp8_p123(%rip),%rax adcq twoexp8_p4(%rip),%rbx subq 432(%rsp),%r12 sbbq 440(%rsp),%r13 sbbq 448(%rsp),%r14 sbbq 456(%rsp),%rax sbbq 464(%rsp),%rbx shld $1,%rax,%rbx andq mask63(%rip),%rax imul $19,%rbx,%rbx addq %rbx,%r12 adcq $0,%r13 adcq $0,%r14 adcq $0,%rax movq %r12,240(%rsp) movq %r13,248(%rsp) movq %r14,256(%rsp) movq %rax,264(%rsp) jmp .L6 .L5: movb $0,%r15b subb %r14b,%r15b shrb $1,%r15b movzbq %r15b,%r15 imul $128,%r15,%r15 addq %r15,%rdi /* pnielssub p1p1 */ // neg movq $0,%r8 movq $0,%r9 movq $0,%r10 movq $0,%r11 subq 96(%rdi),%r8 sbbq 104(%rdi),%r9 sbbq 112(%rdi),%r10 sbbq 120(%rdi),%r11 movq $0,%rdx movq $38,%rax cmovae %rdx,%rax subq %rax,%r8 sbbq %rdx,%r9 sbbq %rdx,%r10 sbbq %rdx,%r11 cmovc %rax,%rdx subq %rdx,%r8 movq %r8,504(%rsp) movq %r9,512(%rsp) movq %r10,520(%rsp) movq %r11,528(%rsp) movq 312(%rsp),%r8 movq 320(%rsp),%r9 movq 328(%rsp),%r10 movq 336(%rsp),%r11 movq 344(%rsp),%rax // copy movq %r8,%r12 movq %r9,%r13 movq %r10,%r14 movq %r11,%r15 movq %rax,%rbx // sub addq twoexp8_p0(%rip),%r8 adcq twoexp8_p123(%rip),%r9 adcq twoexp8_p123(%rip),%r10 adcq twoexp8_p123(%rip),%r11 adcq twoexp8_p4(%rip),%rax subq 272(%rsp),%r8 sbbq 280(%rsp),%r9 sbbq 288(%rsp),%r10 sbbq 296(%rsp),%r11 sbbq 304(%rsp),%rax shld $1,%r11,%rax andq mask63(%rip),%r11 imul $19,%rax,%rax addq %rax,%r8 adcq $0,%r9 adcq $0,%r10 adcq $0,%r11 movq %r8,432(%rsp) movq %r9,440(%rsp) movq %r10,448(%rsp) movq %r11,456(%rsp) // add addq 272(%rsp),%r12 adcq 280(%rsp),%r13 adcq 288(%rsp),%r14 adcq 296(%rsp),%r15 adcq 304(%rsp),%rbx shld $1,%r15,%rbx andq mask63(%rip),%r15 imul $19,%rbx,%rbx addq %rbx,%r12 adcq $0,%r13 adcq $0,%r14 adcq $0,%r15 movq %r12,472(%rsp) movq %r13,480(%rsp) movq %r14,488(%rsp) movq %r15,496(%rsp) // mul xorq %r13,%r13 movq 32(%rdi),%rdx mulx 432(%rsp),%r8,%r9 mulx 440(%rsp),%rcx,%r10 adcx %rcx,%r9 mulx 448(%rsp),%rcx,%r11 adcx %rcx,%r10 mulx 456(%rsp),%rcx,%r12 adcx %rcx,%r11 adcx %r13,%r12 xorq %r14,%r14 movq 40(%rdi),%rdx mulx 432(%rsp),%rcx,%rbp adcx %rcx,%r9 adox %rbp,%r10 mulx 440(%rsp),%rcx,%rbp adcx %rcx,%r10 adox %rbp,%r11 mulx 448(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 456(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 adcx %r14,%r13 xorq %r15,%r15 movq 48(%rdi),%rdx mulx 432(%rsp),%rcx,%rbp adcx %rcx,%r10 adox %rbp,%r11 mulx 440(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 448(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 mulx 456(%rsp),%rcx,%rbp adcx %rcx,%r13 adox %rbp,%r14 adcx %r15,%r14 xorq %rax,%rax movq 56(%rdi),%rdx mulx 432(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 440(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 mulx 448(%rsp),%rcx,%rbp adcx %rcx,%r13 adox %rbp,%r14 mulx 456(%rsp),%rcx,%rbp adcx %rcx,%r14 adox %rbp,%r15 adcx %rax,%r15 xorq %rbp,%rbp movq $38,%rdx mulx %r12,%rax,%r12 adcx %rax,%r8 adox %r12,%r9 mulx %r13,%rcx,%r13 adcx %rcx,%r9 adox %r13,%r10 mulx %r14,%rcx,%r14 adcx %rcx,%r10 adox %r14,%r11 mulx %r15,%rcx,%r15 adcx %rcx,%r11 adox %rbp,%r15 adcx %rbp,%r15 movq %r8,432(%rsp) movq %r9,440(%rsp) movq %r10,448(%rsp) movq %r11,456(%rsp) movq %r15,464(%rsp) // mul xorq %r13,%r13 movq 0(%rdi),%rdx mulx 472(%rsp),%r8,%r9 mulx 480(%rsp),%rcx,%r10 adcx %rcx,%r9 mulx 488(%rsp),%rcx,%r11 adcx %rcx,%r10 mulx 496(%rsp),%rcx,%r12 adcx %rcx,%r11 adcx %r13,%r12 xorq %r14,%r14 movq 8(%rdi),%rdx mulx 472(%rsp),%rcx,%rbp adcx %rcx,%r9 adox %rbp,%r10 mulx 480(%rsp),%rcx,%rbp adcx %rcx,%r10 adox %rbp,%r11 mulx 488(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 496(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 adcx %r14,%r13 xorq %r15,%r15 movq 16(%rdi),%rdx mulx 472(%rsp),%rcx,%rbp adcx %rcx,%r10 adox %rbp,%r11 mulx 480(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 488(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 mulx 496(%rsp),%rcx,%rbp adcx %rcx,%r13 adox %rbp,%r14 adcx %r15,%r14 xorq %rax,%rax movq 24(%rdi),%rdx mulx 472(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 480(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 mulx 488(%rsp),%rcx,%rbp adcx %rcx,%r13 adox %rbp,%r14 mulx 496(%rsp),%rcx,%rbp adcx %rcx,%r14 adox %rbp,%r15 adcx %rax,%r15 xorq %rbp,%rbp movq $38,%rdx mulx %r12,%rax,%r12 adcx %rax,%r8 adox %r12,%r9 mulx %r13,%rcx,%r13 adcx %rcx,%r9 adox %r13,%r10 mulx %r14,%rcx,%r14 adcx %rcx,%r10 adox %r14,%r11 mulx %r15,%rcx,%r15 adcx %rcx,%r11 adox %rbp,%r15 adcx %rbp,%r15 // add movq %r8,%r12 movq %r9,%r13 movq %r10,%r14 movq %r11,%rax movq %r15,%rbx addq 432(%rsp),%r8 adcq 440(%rsp),%r9 adcq 448(%rsp),%r10 adcq 456(%rsp),%r11 adcq 464(%rsp),%r15 shld $1,%r11,%r15 andq mask63(%rip),%r11 imul $19,%r15,%r15 addq %r15,%r8 adcq $0,%r9 adcq $0,%r10 adcq $0,%r11 movq %r8,208(%rsp) movq %r9,216(%rsp) movq %r10,224(%rsp) movq %r11,232(%rsp) // sub addq twoexp8_p0(%rip),%r12 adcq twoexp8_p123(%rip),%r13 adcq twoexp8_p123(%rip),%r14 adcq twoexp8_p123(%rip),%rax adcq twoexp8_p4(%rip),%rbx subq 432(%rsp),%r12 sbbq 440(%rsp),%r13 sbbq 448(%rsp),%r14 sbbq 456(%rsp),%rax sbbq 464(%rsp),%rbx shld $1,%rax,%rbx andq mask63(%rip),%rax imul $19,%rbx,%rbx addq %rbx,%r12 adcq $0,%r13 adcq $0,%r14 adcq $0,%rax movq %r12,144(%rsp) movq %r13,152(%rsp) movq %r14,160(%rsp) movq %rax,168(%rsp) // mul xorq %r13,%r13 movq 504(%rsp),%rdx mulx 392(%rsp),%r8,%r9 mulx 400(%rsp),%rcx,%r10 adcx %rcx,%r9 mulx 408(%rsp),%rcx,%r11 adcx %rcx,%r10 mulx 416(%rsp),%rcx,%r12 adcx %rcx,%r11 adcx %r13,%r12 xorq %r14,%r14 movq 512(%rsp),%rdx mulx 392(%rsp),%rcx,%rbp adcx %rcx,%r9 adox %rbp,%r10 mulx 400(%rsp),%rcx,%rbp adcx %rcx,%r10 adox %rbp,%r11 mulx 408(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 416(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 adcx %r14,%r13 xorq %r15,%r15 movq 520(%rsp),%rdx mulx 392(%rsp),%rcx,%rbp adcx %rcx,%r10 adox %rbp,%r11 mulx 400(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 408(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 mulx 416(%rsp),%rcx,%rbp adcx %rcx,%r13 adox %rbp,%r14 adcx %r15,%r14 xorq %rax,%rax movq 528(%rsp),%rdx mulx 392(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 400(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 mulx 408(%rsp),%rcx,%rbp adcx %rcx,%r13 adox %rbp,%r14 mulx 416(%rsp),%rcx,%rbp adcx %rcx,%r14 adox %rbp,%r15 adcx %rax,%r15 xorq %rbp,%rbp movq $38,%rdx mulx %r12,%rax,%r12 adcx %rax,%r8 adox %r12,%r9 mulx %r13,%rcx,%r13 adcx %rcx,%r9 adox %r13,%r10 mulx %r14,%rcx,%r14 adcx %rcx,%r10 adox %r14,%r11 mulx %r15,%rcx,%r15 adcx %rcx,%r11 adox %rbp,%r15 adcx %rbp,%r15 movq %r8,432(%rsp) movq %r9,440(%rsp) movq %r10,448(%rsp) movq %r11,456(%rsp) movq %r15,464(%rsp) // mul xorq %r13,%r13 movq 64(%rdi),%rdx mulx 352(%rsp),%r8,%r9 mulx 360(%rsp),%rcx,%r10 adcx %rcx,%r9 mulx 368(%rsp),%rcx,%r11 adcx %rcx,%r10 mulx 376(%rsp),%rcx,%r12 adcx %rcx,%r11 adcx %r13,%r12 xorq %r14,%r14 movq 72(%rdi),%rdx mulx 352(%rsp),%rcx,%rbp adcx %rcx,%r9 adox %rbp,%r10 mulx 360(%rsp),%rcx,%rbp adcx %rcx,%r10 adox %rbp,%r11 mulx 368(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 376(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 adcx %r14,%r13 xorq %r15,%r15 movq 80(%rdi),%rdx mulx 352(%rsp),%rcx,%rbp adcx %rcx,%r10 adox %rbp,%r11 mulx 360(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 368(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 mulx 376(%rsp),%rcx,%rbp adcx %rcx,%r13 adox %rbp,%r14 adcx %r15,%r14 xorq %rax,%rax movq 88(%rdi),%rdx mulx 352(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 360(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 mulx 368(%rsp),%rcx,%rbp adcx %rcx,%r13 adox %rbp,%r14 mulx 376(%rsp),%rcx,%rbp adcx %rcx,%r14 adox %rbp,%r15 adcx %rax,%r15 xorq %rbp,%rbp movq $38,%rdx mulx %r12,%rax,%r12 adcx %rax,%r8 adox %r12,%r9 mulx %r13,%rcx,%r13 adcx %rcx,%r9 adox %r13,%r10 mulx %r14,%rcx,%r14 adcx %rcx,%r10 adox %r14,%r11 mulx %r15,%rcx,%r15 adcx %rcx,%r11 adox %rbp,%r15 adcx %rbp,%r15 // double addq %r8,%r8 adcq %r9,%r9 adcq %r10,%r10 adcq %r11,%r11 adcq %r15,%r15 // add movq %r8,%r12 movq %r9,%r13 movq %r10,%r14 movq %r11,%rax movq %r15,%rbx addq 432(%rsp),%r8 adcq 440(%rsp),%r9 adcq 448(%rsp),%r10 adcq 456(%rsp),%r11 adcq 464(%rsp),%r15 shld $1,%r11,%r15 andq mask63(%rip),%r11 imul $19,%r15,%r15 addq %r15,%r8 adcq $0,%r9 adcq $0,%r10 adcq $0,%r11 movq %r8,176(%rsp) movq %r9,184(%rsp) movq %r10,192(%rsp) movq %r11,200(%rsp) // sub addq twoexp8_p0(%rip),%r12 adcq twoexp8_p123(%rip),%r13 adcq twoexp8_p123(%rip),%r14 adcq twoexp8_p123(%rip),%rax adcq twoexp8_p4(%rip),%rbx subq 432(%rsp),%r12 sbbq 440(%rsp),%r13 sbbq 448(%rsp),%r14 sbbq 456(%rsp),%rax sbbq 464(%rsp),%rbx shld $1,%rax,%rbx andq mask63(%rip),%rax imul $19,%rbx,%rbx addq %rbx,%r12 adcq $0,%r13 adcq $0,%r14 adcq $0,%rax movq %r12,240(%rsp) movq %r13,248(%rsp) movq %r14,256(%rsp) movq %rax,264(%rsp) .L6: addq $256,%rsi movq %rsi,128(%rsp) movq 120(%rsp),%rcx addq $1,%rcx movq %rcx,120(%rsp) cmpq 80(%rsp),%rcx jl .L3 .L7: movq 112(%rsp),%rsi decq %rsi movq %rsi,112(%rsp) movq 104(%rsp),%rax decq %rax movq %rax,104(%rsp) cmpq $0,%rax jge .L1 .L8: /* p1p1 to p3 */ // mul xorq %r13,%r13 movq 144(%rsp),%rdx mulx 240(%rsp),%r8,%r9 mulx 248(%rsp),%rcx,%r10 adcx %rcx,%r9 mulx 256(%rsp),%rcx,%r11 adcx %rcx,%r10 mulx 264(%rsp),%rcx,%r12 adcx %rcx,%r11 adcx %r13,%r12 xorq %r14,%r14 movq 152(%rsp),%rdx mulx 240(%rsp),%rcx,%rbp adcx %rcx,%r9 adox %rbp,%r10 mulx 248(%rsp),%rcx,%rbp adcx %rcx,%r10 adox %rbp,%r11 mulx 256(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 264(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 adcx %r14,%r13 xorq %r15,%r15 movq 160(%rsp),%rdx mulx 240(%rsp),%rcx,%rbp adcx %rcx,%r10 adox %rbp,%r11 mulx 248(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 256(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 mulx 264(%rsp),%rcx,%rbp adcx %rcx,%r13 adox %rbp,%r14 adcx %r15,%r14 xorq %rax,%rax movq 168(%rsp),%rdx mulx 240(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 248(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 mulx 256(%rsp),%rcx,%rbp adcx %rcx,%r13 adox %rbp,%r14 mulx 264(%rsp),%rcx,%rbp adcx %rcx,%r14 adox %rbp,%r15 adcx %rax,%r15 xorq %rbp,%rbp movq $38,%rdx mulx %r12,%rax,%r12 adcx %rax,%r8 adox %r12,%r9 mulx %r13,%rcx,%r13 adcx %rcx,%r9 adox %r13,%r10 mulx %r14,%rcx,%r14 adcx %rcx,%r10 adox %r14,%r11 mulx %r15,%rcx,%r15 adcx %rcx,%r11 adox %rbp,%r15 adcx %rbp,%r15 movq %r8,272(%rsp) movq %r9,280(%rsp) movq %r10,288(%rsp) movq %r11,296(%rsp) movq %r15,304(%rsp) // mul xorq %r13,%r13 movq 176(%rsp),%rdx mulx 208(%rsp),%r8,%r9 mulx 216(%rsp),%rcx,%r10 adcx %rcx,%r9 mulx 224(%rsp),%rcx,%r11 adcx %rcx,%r10 mulx 232(%rsp),%rcx,%r12 adcx %rcx,%r11 adcx %r13,%r12 xorq %r14,%r14 movq 184(%rsp),%rdx mulx 208(%rsp),%rcx,%rbp adcx %rcx,%r9 adox %rbp,%r10 mulx 216(%rsp),%rcx,%rbp adcx %rcx,%r10 adox %rbp,%r11 mulx 224(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 232(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 adcx %r14,%r13 xorq %r15,%r15 movq 192(%rsp),%rdx mulx 208(%rsp),%rcx,%rbp adcx %rcx,%r10 adox %rbp,%r11 mulx 216(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 224(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 mulx 232(%rsp),%rcx,%rbp adcx %rcx,%r13 adox %rbp,%r14 adcx %r15,%r14 xorq %rax,%rax movq 200(%rsp),%rdx mulx 208(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 216(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 mulx 224(%rsp),%rcx,%rbp adcx %rcx,%r13 adox %rbp,%r14 mulx 232(%rsp),%rcx,%rbp adcx %rcx,%r14 adox %rbp,%r15 adcx %rax,%r15 xorq %rbp,%rbp movq $38,%rdx mulx %r12,%rax,%r12 adcx %rax,%r8 adox %r12,%r9 mulx %r13,%rcx,%r13 adcx %rcx,%r9 adox %r13,%r10 mulx %r14,%rcx,%r14 adcx %rcx,%r10 adox %r14,%r11 mulx %r15,%rcx,%r15 adcx %rcx,%r11 adox %rbp,%r15 adcx %rbp,%r15 movq %r8,312(%rsp) movq %r9,320(%rsp) movq %r10,328(%rsp) movq %r11,336(%rsp) movq %r15,344(%rsp) /* p3 to cached add/sub */ // add movq %r8,%r12 movq %r9,%r13 movq %r10,%r14 movq %r11,%rax movq %r15,%rbx addq 272(%rsp),%r8 adcq 280(%rsp),%r9 adcq 288(%rsp),%r10 adcq 296(%rsp),%r11 adcq 304(%rsp),%r15 shld $1,%r11,%r15 andq mask63(%rip),%r11 imul $19,%r15,%r15 addq %r15,%r8 adcq $0,%r9 adcq $0,%r10 adcq $0,%r11 movq %r8,536(%rsp) movq %r9,544(%rsp) movq %r10,552(%rsp) movq %r11,560(%rsp) // sub addq twoexp8_p0(%rip),%r12 adcq twoexp8_p123(%rip),%r13 adcq twoexp8_p123(%rip),%r14 adcq twoexp8_p123(%rip),%rax adcq twoexp8_p4(%rip),%rbx subq 272(%rsp),%r12 sbbq 280(%rsp),%r13 sbbq 288(%rsp),%r14 sbbq 296(%rsp),%rax sbbq 304(%rsp),%rbx shld $1,%rax,%rbx andq mask63(%rip),%rax imul $19,%rbx,%rbx addq %rbx,%r12 adcq $0,%r13 adcq $0,%r14 adcq $0,%rax movq %r12,504(%rsp) movq %r13,512(%rsp) movq %r14,520(%rsp) movq %rax,528(%rsp) // mul xorq %r13,%r13 movq 176(%rsp),%rdx mulx 240(%rsp),%r8,%r9 mulx 248(%rsp),%rcx,%r10 adcx %rcx,%r9 mulx 256(%rsp),%rcx,%r11 adcx %rcx,%r10 mulx 264(%rsp),%rcx,%r12 adcx %rcx,%r11 adcx %r13,%r12 xorq %r14,%r14 movq 184(%rsp),%rdx mulx 240(%rsp),%rcx,%rbp adcx %rcx,%r9 adox %rbp,%r10 mulx 248(%rsp),%rcx,%rbp adcx %rcx,%r10 adox %rbp,%r11 mulx 256(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 264(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 adcx %r14,%r13 xorq %r15,%r15 movq 192(%rsp),%rdx mulx 240(%rsp),%rcx,%rbp adcx %rcx,%r10 adox %rbp,%r11 mulx 248(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 256(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 mulx 264(%rsp),%rcx,%rbp adcx %rcx,%r13 adox %rbp,%r14 adcx %r15,%r14 xorq %rax,%rax movq 200(%rsp),%rdx mulx 240(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 248(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 mulx 256(%rsp),%rcx,%rbp adcx %rcx,%r13 adox %rbp,%r14 mulx 264(%rsp),%rcx,%rbp adcx %rcx,%r14 adox %rbp,%r15 adcx %rax,%r15 xorq %rbp,%rbp movq $38,%rdx mulx %r12,%rax,%r12 adcx %rax,%r8 adox %r12,%r9 mulx %r13,%rcx,%r13 adcx %rcx,%r9 adox %r13,%r10 mulx %r14,%rcx,%r14 adcx %rcx,%r10 adox %r14,%r11 mulx %r15,%rcx,%r15 adcx %rcx,%r11 adox %rbp,%r15 adcx %rbp,%r15 shld $1,%r11,%r15 andq mask63(%rip),%r11 imul $19,%r15,%r15 addq %r15,%r8 adcq $0,%r9 adcq $0,%r10 adcq $0,%r11 /* p3 to cached: assign to third fe */ movq %r8,568(%rsp) movq %r9,576(%rsp) movq %r10,584(%rsp) movq %r11,592(%rsp) // mul xorq %r13,%r13 movq 144(%rsp),%rdx mulx 208(%rsp),%r8,%r9 mulx 216(%rsp),%rcx,%r10 adcx %rcx,%r9 mulx 224(%rsp),%rcx,%r11 adcx %rcx,%r10 mulx 232(%rsp),%rcx,%r12 adcx %rcx,%r11 adcx %r13,%r12 xorq %r14,%r14 movq 152(%rsp),%rdx mulx 208(%rsp),%rcx,%rbp adcx %rcx,%r9 adox %rbp,%r10 mulx 216(%rsp),%rcx,%rbp adcx %rcx,%r10 adox %rbp,%r11 mulx 224(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 232(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 adcx %r14,%r13 xorq %r15,%r15 movq 160(%rsp),%rdx mulx 208(%rsp),%rcx,%rbp adcx %rcx,%r10 adox %rbp,%r11 mulx 216(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 224(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 mulx 232(%rsp),%rcx,%rbp adcx %rcx,%r13 adox %rbp,%r14 adcx %r15,%r14 xorq %rax,%rax movq 168(%rsp),%rdx mulx 208(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 216(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 mulx 224(%rsp),%rcx,%rbp adcx %rcx,%r13 adox %rbp,%r14 mulx 232(%rsp),%rcx,%rbp adcx %rcx,%r14 adox %rbp,%r15 adcx %rax,%r15 xorq %rbp,%rbp movq $38,%rdx mulx %r12,%rax,%r12 adcx %rax,%r8 adox %r12,%r9 mulx %r13,%rcx,%r13 adcx %rcx,%r9 adox %r13,%r10 mulx %r14,%rcx,%r14 adcx %rcx,%r10 adox %r14,%r11 mulx %r15,%rcx,%r15 adcx %rcx,%r11 adox %rbp,%r15 adcx %rbp,%r15 shld $1,%r11,%r15 andq mask63(%rip),%r11 imul $19,%r15,%r15 addq %r15,%r8 adcq $0,%r9 adcq $0,%r10 adcq $0,%r11 movq %r8,392(%rsp) movq %r9,400(%rsp) movq %r10,408(%rsp) movq %r11,416(%rsp) /* p3 to cached: multiply the fourth fes */ // mul xorq %r13,%r13 movq EC2D0(%rip),%rdx mulx 392(%rsp),%r8,%r9 mulx 400(%rsp),%rcx,%r10 adcx %rcx,%r9 mulx 408(%rsp),%rcx,%r11 adcx %rcx,%r10 mulx 416(%rsp),%rcx,%r12 adcx %rcx,%r11 adcx %r13,%r12 xorq %r14,%r14 movq EC2D1(%rip),%rdx mulx 392(%rsp),%rcx,%rbp adcx %rcx,%r9 adox %rbp,%r10 mulx 400(%rsp),%rcx,%rbp adcx %rcx,%r10 adox %rbp,%r11 mulx 408(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 416(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 adcx %r14,%r13 xorq %r15,%r15 movq EC2D2(%rip),%rdx mulx 392(%rsp),%rcx,%rbp adcx %rcx,%r10 adox %rbp,%r11 mulx 400(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 408(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 mulx 416(%rsp),%rcx,%rbp adcx %rcx,%r13 adox %rbp,%r14 adcx %r15,%r14 xorq %rax,%rax movq EC2D3(%rip),%rdx mulx 392(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 400(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 mulx 408(%rsp),%rcx,%rbp adcx %rcx,%r13 adox %rbp,%r14 mulx 416(%rsp),%rcx,%rbp adcx %rcx,%r14 adox %rbp,%r15 adcx %rax,%r15 xorq %rbp,%rbp movq $38,%rdx mulx %r12,%rax,%r12 adcx %rax,%r8 adox %r12,%r9 mulx %r13,%rcx,%r13 adcx %rcx,%r9 adox %r13,%r10 mulx %r14,%rcx,%r14 adcx %rcx,%r10 adox %r14,%r11 mulx %r15,%rcx,%r15 adcx %rcx,%r11 adox %rbp,%r15 adcx %rbp,%r15 shld $1,%r11,%r15 andq mask63(%rip),%r11 imul $19,%r15,%r15 addq %r15,%r8 adcq $0,%r9 adcq $0,%r10 adcq $0,%r11 movq %r8,600(%rsp) movq %r9,608(%rsp) movq %r10,616(%rsp) movq %r11,624(%rsp) /* p1p1 to p3 */ movq 56(%rsp),%rdi // mul xorq %r13,%r13 movq 0(%rdi),%rdx mulx 96(%rdi),%r8,%r9 mulx 104(%rdi),%rcx,%r10 adcx %rcx,%r9 mulx 112(%rdi),%rcx,%r11 adcx %rcx,%r10 mulx 120(%rdi),%rcx,%r12 adcx %rcx,%r11 adcx %r13,%r12 xorq %r14,%r14 movq 8(%rdi),%rdx mulx 96(%rdi),%rcx,%rbp adcx %rcx,%r9 adox %rbp,%r10 mulx 104(%rdi),%rcx,%rbp adcx %rcx,%r10 adox %rbp,%r11 mulx 112(%rdi),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 120(%rdi),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 adcx %r14,%r13 xorq %r15,%r15 movq 16(%rdi),%rdx mulx 96(%rdi),%rcx,%rbp adcx %rcx,%r10 adox %rbp,%r11 mulx 104(%rdi),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 112(%rdi),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 mulx 120(%rdi),%rcx,%rbp adcx %rcx,%r13 adox %rbp,%r14 adcx %r15,%r14 xorq %rax,%rax movq 24(%rdi),%rdx mulx 96(%rdi),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 104(%rdi),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 mulx 112(%rdi),%rcx,%rbp adcx %rcx,%r13 adox %rbp,%r14 mulx 120(%rdi),%rcx,%rbp adcx %rcx,%r14 adox %rbp,%r15 adcx %rax,%r15 xorq %rbp,%rbp movq $38,%rdx mulx %r12,%rax,%r12 adcx %rax,%r8 adox %r12,%r9 mulx %r13,%rcx,%r13 adcx %rcx,%r9 adox %r13,%r10 mulx %r14,%rcx,%r14 adcx %rcx,%r10 adox %r14,%r11 mulx %r15,%rcx,%r15 adcx %rcx,%r11 adox %rbp,%r15 adcx %rbp,%r15 movq %r8,272(%rsp) movq %r9,280(%rsp) movq %r10,288(%rsp) movq %r11,296(%rsp) movq %r15,304(%rsp) // mul xorq %r13,%r13 movq 32(%rdi),%rdx mulx 64(%rdi),%r8,%r9 mulx 72(%rdi),%rcx,%r10 adcx %rcx,%r9 mulx 80(%rdi),%rcx,%r11 adcx %rcx,%r10 mulx 88(%rdi),%rcx,%r12 adcx %rcx,%r11 adcx %r13,%r12 xorq %r14,%r14 movq 40(%rdi),%rdx mulx 64(%rdi),%rcx,%rbp adcx %rcx,%r9 adox %rbp,%r10 mulx 72(%rdi),%rcx,%rbp adcx %rcx,%r10 adox %rbp,%r11 mulx 80(%rdi),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 88(%rdi),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 adcx %r14,%r13 xorq %r15,%r15 movq 48(%rdi),%rdx mulx 64(%rdi),%rcx,%rbp adcx %rcx,%r10 adox %rbp,%r11 mulx 72(%rdi),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 80(%rdi),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 mulx 88(%rdi),%rcx,%rbp adcx %rcx,%r13 adox %rbp,%r14 adcx %r15,%r14 xorq %rax,%rax movq 56(%rdi),%rdx mulx 64(%rdi),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 72(%rdi),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 mulx 80(%rdi),%rcx,%rbp adcx %rcx,%r13 adox %rbp,%r14 mulx 88(%rdi),%rcx,%rbp adcx %rcx,%r14 adox %rbp,%r15 adcx %rax,%r15 xorq %rbp,%rbp movq $38,%rdx mulx %r12,%rax,%r12 adcx %rax,%r8 adox %r12,%r9 mulx %r13,%rcx,%r13 adcx %rcx,%r9 adox %r13,%r10 mulx %r14,%rcx,%r14 adcx %rcx,%r10 adox %r14,%r11 mulx %r15,%rcx,%r15 adcx %rcx,%r11 adox %rbp,%r15 adcx %rbp,%r15 movq %r8,312(%rsp) movq %r9,320(%rsp) movq %r10,328(%rsp) movq %r11,336(%rsp) movq %r15,344(%rsp) // mul xorq %r13,%r13 movq 32(%rdi),%rdx mulx 96(%rdi),%r8,%r9 mulx 104(%rdi),%rcx,%r10 adcx %rcx,%r9 mulx 112(%rdi),%rcx,%r11 adcx %rcx,%r10 mulx 120(%rdi),%rcx,%r12 adcx %rcx,%r11 adcx %r13,%r12 xorq %r14,%r14 movq 40(%rdi),%rdx mulx 96(%rdi),%rcx,%rbp adcx %rcx,%r9 adox %rbp,%r10 mulx 104(%rdi),%rcx,%rbp adcx %rcx,%r10 adox %rbp,%r11 mulx 112(%rdi),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 120(%rdi),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 adcx %r14,%r13 xorq %r15,%r15 movq 48(%rdi),%rdx mulx 96(%rdi),%rcx,%rbp adcx %rcx,%r10 adox %rbp,%r11 mulx 104(%rdi),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 112(%rdi),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 mulx 120(%rdi),%rcx,%rbp adcx %rcx,%r13 adox %rbp,%r14 adcx %r15,%r14 xorq %rax,%rax movq 56(%rdi),%rdx mulx 96(%rdi),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 104(%rdi),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 mulx 112(%rdi),%rcx,%rbp adcx %rcx,%r13 adox %rbp,%r14 mulx 120(%rdi),%rcx,%rbp adcx %rcx,%r14 adox %rbp,%r15 adcx %rax,%r15 xorq %rbp,%rbp movq $38,%rdx mulx %r12,%rax,%r12 adcx %rax,%r8 adox %r12,%r9 mulx %r13,%rcx,%r13 adcx %rcx,%r9 adox %r13,%r10 mulx %r14,%rcx,%r14 adcx %rcx,%r10 adox %r14,%r11 mulx %r15,%rcx,%r15 adcx %rcx,%r11 adox %rbp,%r15 adcx %rbp,%r15 shld $1,%r11,%r15 andq mask63(%rip),%r11 imul $19,%r15,%r15 addq %r15,%r8 adcq $0,%r9 adcq $0,%r10 adcq $0,%r11 movq %r8,352(%rsp) movq %r9,360(%rsp) movq %r10,368(%rsp) movq %r11,376(%rsp) // mul xorq %r13,%r13 movq 0(%rdi),%rdx mulx 64(%rdi),%r8,%r9 mulx 72(%rdi),%rcx,%r10 adcx %rcx,%r9 mulx 80(%rdi),%rcx,%r11 adcx %rcx,%r10 mulx 88(%rdi),%rcx,%r12 adcx %rcx,%r11 adcx %r13,%r12 xorq %r14,%r14 movq 8(%rdi),%rdx mulx 64(%rdi),%rcx,%rbp adcx %rcx,%r9 adox %rbp,%r10 mulx 72(%rdi),%rcx,%rbp adcx %rcx,%r10 adox %rbp,%r11 mulx 80(%rdi),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 88(%rdi),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 adcx %r14,%r13 xorq %r15,%r15 movq 16(%rdi),%rdx mulx 64(%rdi),%rcx,%rbp adcx %rcx,%r10 adox %rbp,%r11 mulx 72(%rdi),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 80(%rdi),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 mulx 88(%rdi),%rcx,%rbp adcx %rcx,%r13 adox %rbp,%r14 adcx %r15,%r14 xorq %rax,%rax movq 24(%rdi),%rdx mulx 64(%rdi),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 72(%rdi),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 mulx 80(%rdi),%rcx,%rbp adcx %rcx,%r13 adox %rbp,%r14 mulx 88(%rdi),%rcx,%rbp adcx %rcx,%r14 adox %rbp,%r15 adcx %rax,%r15 xorq %rbp,%rbp movq $38,%rdx mulx %r12,%rax,%r12 adcx %rax,%r8 adox %r12,%r9 mulx %r13,%rcx,%r13 adcx %rcx,%r9 adox %r13,%r10 mulx %r14,%rcx,%r14 adcx %rcx,%r10 adox %r14,%r11 mulx %r15,%rcx,%r15 adcx %rcx,%r11 adox %rbp,%r15 adcx %rbp,%r15 shld $1,%r11,%r15 andq mask63(%rip),%r11 imul $19,%r15,%r15 addq %r15,%r8 adcq $0,%r9 adcq $0,%r10 adcq $0,%r11 movq %r8,392(%rsp) movq %r9,400(%rsp) movq %r10,408(%rsp) movq %r11,416(%rsp) /* pnielsadd p1p1 */ movq 56(%rsp),%rdi movq 312(%rsp),%r8 movq 320(%rsp),%r9 movq 328(%rsp),%r10 movq 336(%rsp),%r11 movq 344(%rsp),%rax // copy movq %r8,%r12 movq %r9,%r13 movq %r10,%r14 movq %r11,%r15 movq %rax,%rbx // sub addq twoexp8_p0(%rip),%r8 adcq twoexp8_p123(%rip),%r9 adcq twoexp8_p123(%rip),%r10 adcq twoexp8_p123(%rip),%r11 adcq twoexp8_p4(%rip),%rax subq 272(%rsp),%r8 sbbq 280(%rsp),%r9 sbbq 288(%rsp),%r10 sbbq 296(%rsp),%r11 sbbq 304(%rsp),%rax shld $1,%r11,%rax andq mask63(%rip),%r11 imul $19,%rax,%rax addq %rax,%r8 adcq $0,%r9 adcq $0,%r10 adcq $0,%r11 movq %r8,432(%rsp) movq %r9,440(%rsp) movq %r10,448(%rsp) movq %r11,456(%rsp) // add addq 272(%rsp),%r12 adcq 280(%rsp),%r13 adcq 288(%rsp),%r14 adcq 296(%rsp),%r15 adcq 304(%rsp),%rbx shld $1,%r15,%rbx andq mask63(%rip),%r15 imul $19,%rbx,%rbx addq %rbx,%r12 adcq $0,%r13 adcq $0,%r14 adcq $0,%r15 movq %r12,472(%rsp) movq %r13,480(%rsp) movq %r14,488(%rsp) movq %r15,496(%rsp) // mul xorq %r13,%r13 movq 504(%rsp),%rdx mulx 432(%rsp),%r8,%r9 mulx 440(%rsp),%rcx,%r10 adcx %rcx,%r9 mulx 448(%rsp),%rcx,%r11 adcx %rcx,%r10 mulx 456(%rsp),%rcx,%r12 adcx %rcx,%r11 adcx %r13,%r12 xorq %r14,%r14 movq 512(%rsp),%rdx mulx 432(%rsp),%rcx,%rbp adcx %rcx,%r9 adox %rbp,%r10 mulx 440(%rsp),%rcx,%rbp adcx %rcx,%r10 adox %rbp,%r11 mulx 448(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 456(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 adcx %r14,%r13 xorq %r15,%r15 movq 520(%rsp),%rdx mulx 432(%rsp),%rcx,%rbp adcx %rcx,%r10 adox %rbp,%r11 mulx 440(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 448(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 mulx 456(%rsp),%rcx,%rbp adcx %rcx,%r13 adox %rbp,%r14 adcx %r15,%r14 xorq %rax,%rax movq 528(%rsp),%rdx mulx 432(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 440(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 mulx 448(%rsp),%rcx,%rbp adcx %rcx,%r13 adox %rbp,%r14 mulx 456(%rsp),%rcx,%rbp adcx %rcx,%r14 adox %rbp,%r15 adcx %rax,%r15 xorq %rbp,%rbp movq $38,%rdx mulx %r12,%rax,%r12 adcx %rax,%r8 adox %r12,%r9 mulx %r13,%rcx,%r13 adcx %rcx,%r9 adox %r13,%r10 mulx %r14,%rcx,%r14 adcx %rcx,%r10 adox %r14,%r11 mulx %r15,%rcx,%r15 adcx %rcx,%r11 adox %rbp,%r15 adcx %rbp,%r15 movq %r8,432(%rsp) movq %r9,440(%rsp) movq %r10,448(%rsp) movq %r11,456(%rsp) movq %r15,464(%rsp) // mul xorq %r13,%r13 movq 536(%rsp),%rdx mulx 472(%rsp),%r8,%r9 mulx 480(%rsp),%rcx,%r10 adcx %rcx,%r9 mulx 488(%rsp),%rcx,%r11 adcx %rcx,%r10 mulx 496(%rsp),%rcx,%r12 adcx %rcx,%r11 adcx %r13,%r12 xorq %r14,%r14 movq 544(%rsp),%rdx mulx 472(%rsp),%rcx,%rbp adcx %rcx,%r9 adox %rbp,%r10 mulx 480(%rsp),%rcx,%rbp adcx %rcx,%r10 adox %rbp,%r11 mulx 488(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 496(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 adcx %r14,%r13 xorq %r15,%r15 movq 552(%rsp),%rdx mulx 472(%rsp),%rcx,%rbp adcx %rcx,%r10 adox %rbp,%r11 mulx 480(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 488(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 mulx 496(%rsp),%rcx,%rbp adcx %rcx,%r13 adox %rbp,%r14 adcx %r15,%r14 xorq %rax,%rax movq 560(%rsp),%rdx mulx 472(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 480(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 mulx 488(%rsp),%rcx,%rbp adcx %rcx,%r13 adox %rbp,%r14 mulx 496(%rsp),%rcx,%rbp adcx %rcx,%r14 adox %rbp,%r15 adcx %rax,%r15 xorq %rbp,%rbp movq $38,%rdx mulx %r12,%rax,%r12 adcx %rax,%r8 adox %r12,%r9 mulx %r13,%rcx,%r13 adcx %rcx,%r9 adox %r13,%r10 mulx %r14,%rcx,%r14 adcx %rcx,%r10 adox %r14,%r11 mulx %r15,%rcx,%r15 adcx %rcx,%r11 adox %rbp,%r15 adcx %rbp,%r15 // add movq %r8,%r12 movq %r9,%r13 movq %r10,%r14 movq %r11,%rax movq %r15,%rbx addq 432(%rsp),%r8 adcq 440(%rsp),%r9 adcq 448(%rsp),%r10 adcq 456(%rsp),%r11 adcq 464(%rsp),%r15 shld $1,%r11,%r15 andq mask63(%rip),%r11 imul $19,%r15,%r15 addq %r15,%r8 adcq $0,%r9 adcq $0,%r10 adcq $0,%r11 movq %r8,64(%rdi) movq %r9,72(%rdi) movq %r10,80(%rdi) movq %r11,88(%rdi) // sub addq twoexp8_p0(%rip),%r12 adcq twoexp8_p123(%rip),%r13 adcq twoexp8_p123(%rip),%r14 adcq twoexp8_p123(%rip),%rax adcq twoexp8_p4(%rip),%rbx subq 432(%rsp),%r12 sbbq 440(%rsp),%r13 sbbq 448(%rsp),%r14 sbbq 456(%rsp),%rax sbbq 464(%rsp),%rbx shld $1,%rax,%rbx andq mask63(%rip),%rax imul $19,%rbx,%rbx addq %rbx,%r12 adcq $0,%r13 adcq $0,%r14 adcq $0,%rax movq %r12,0(%rdi) movq %r13,8(%rdi) movq %r14,16(%rdi) movq %rax,24(%rdi) // mul xorq %r13,%r13 movq 600(%rsp),%rdx mulx 392(%rsp),%r8,%r9 mulx 400(%rsp),%rcx,%r10 adcx %rcx,%r9 mulx 408(%rsp),%rcx,%r11 adcx %rcx,%r10 mulx 416(%rsp),%rcx,%r12 adcx %rcx,%r11 adcx %r13,%r12 xorq %r14,%r14 movq 608(%rsp),%rdx mulx 392(%rsp),%rcx,%rbp adcx %rcx,%r9 adox %rbp,%r10 mulx 400(%rsp),%rcx,%rbp adcx %rcx,%r10 adox %rbp,%r11 mulx 408(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 416(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 adcx %r14,%r13 xorq %r15,%r15 movq 616(%rsp),%rdx mulx 392(%rsp),%rcx,%rbp adcx %rcx,%r10 adox %rbp,%r11 mulx 400(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 408(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 mulx 416(%rsp),%rcx,%rbp adcx %rcx,%r13 adox %rbp,%r14 adcx %r15,%r14 xorq %rax,%rax movq 624(%rsp),%rdx mulx 392(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 400(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 mulx 408(%rsp),%rcx,%rbp adcx %rcx,%r13 adox %rbp,%r14 mulx 416(%rsp),%rcx,%rbp adcx %rcx,%r14 adox %rbp,%r15 adcx %rax,%r15 xorq %rbp,%rbp movq $38,%rdx mulx %r12,%rax,%r12 adcx %rax,%r8 adox %r12,%r9 mulx %r13,%rcx,%r13 adcx %rcx,%r9 adox %r13,%r10 mulx %r14,%rcx,%r14 adcx %rcx,%r10 adox %r14,%r11 mulx %r15,%rcx,%r15 adcx %rcx,%r11 adox %rbp,%r15 adcx %rbp,%r15 movq %r8,432(%rsp) movq %r9,440(%rsp) movq %r10,448(%rsp) movq %r11,456(%rsp) movq %r15,464(%rsp) // mul xorq %r13,%r13 movq 568(%rsp),%rdx mulx 352(%rsp),%r8,%r9 mulx 360(%rsp),%rcx,%r10 adcx %rcx,%r9 mulx 368(%rsp),%rcx,%r11 adcx %rcx,%r10 mulx 376(%rsp),%rcx,%r12 adcx %rcx,%r11 adcx %r13,%r12 xorq %r14,%r14 movq 576(%rsp),%rdx mulx 352(%rsp),%rcx,%rbp adcx %rcx,%r9 adox %rbp,%r10 mulx 360(%rsp),%rcx,%rbp adcx %rcx,%r10 adox %rbp,%r11 mulx 368(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 376(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 adcx %r14,%r13 xorq %r15,%r15 movq 584(%rsp),%rdx mulx 352(%rsp),%rcx,%rbp adcx %rcx,%r10 adox %rbp,%r11 mulx 360(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 368(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 mulx 376(%rsp),%rcx,%rbp adcx %rcx,%r13 adox %rbp,%r14 adcx %r15,%r14 xorq %rax,%rax movq 592(%rsp),%rdx mulx 352(%rsp),%rcx,%rbp adcx %rcx,%r11 adox %rbp,%r12 mulx 360(%rsp),%rcx,%rbp adcx %rcx,%r12 adox %rbp,%r13 mulx 368(%rsp),%rcx,%rbp adcx %rcx,%r13 adox %rbp,%r14 mulx 376(%rsp),%rcx,%rbp adcx %rcx,%r14 adox %rbp,%r15 adcx %rax,%r15 xorq %rbp,%rbp movq $38,%rdx mulx %r12,%rax,%r12 adcx %rax,%r8 adox %r12,%r9 mulx %r13,%rcx,%r13 adcx %rcx,%r9 adox %r13,%r10 mulx %r14,%rcx,%r14 adcx %rcx,%r10 adox %r14,%r11 mulx %r15,%rcx,%r15 adcx %rcx,%r11 adox %rbp,%r15 adcx %rbp,%r15 // double addq %r8,%r8 adcq %r9,%r9 adcq %r10,%r10 adcq %r11,%r11 adcq %r15,%r15 // add movq %r8,%r12 movq %r9,%r13 movq %r10,%r14 movq %r11,%rax movq %r15,%rbx addq 432(%rsp),%r8 adcq 440(%rsp),%r9 adcq 448(%rsp),%r10 adcq 456(%rsp),%r11 adcq 464(%rsp),%r15 shld $1,%r11,%r15 andq mask63(%rip),%r11 imul $19,%r15,%r15 addq %r15,%r8 adcq $0,%r9 adcq $0,%r10 adcq $0,%r11 movq %r8,32(%rdi) movq %r9,40(%rdi) movq %r10,48(%rdi) movq %r11,56(%rdi) // sub addq twoexp8_p0(%rip),%r12 adcq twoexp8_p123(%rip),%r13 adcq twoexp8_p123(%rip),%r14 adcq twoexp8_p123(%rip),%rax adcq twoexp8_p4(%rip),%rbx subq 432(%rsp),%r12 sbbq 440(%rsp),%r13 sbbq 448(%rsp),%r14 sbbq 456(%rsp),%rax sbbq 464(%rsp),%rbx shld $1,%rax,%rbx andq mask63(%rip),%rax imul $19,%rbx,%rbx addq %rbx,%r12 adcq $0,%r13 adcq $0,%r14 adcq $0,%rax movq %r12,96(%rdi) movq %r13,104(%rdi) movq %r14,112(%rdi) movq %rax,120(%rdi) movq 0(%rsp),%r11 movq 8(%rsp),%r12 movq 16(%rsp),%r13 movq 24(%rsp),%r14 movq 32(%rsp),%r15 movq 40(%rsp),%rbx movq 48(%rsp),%rbp movq %r11,%rsp ret .section .note.GNU-stack,"",@progbits