#include "crypto_asm_hidden.h" // linker define ge25519_double_scalarmult_process /* Assembly for double base scalar multiplication. * * This assembly has been developed after studying the * amd64-64-24k implementation of the work "High speed * high security signatures" by Bernstein et al. */ .p2align 4 ASM_HIDDEN _CRYPTO_SHARED_NAMESPACE(ge25519_double_scalarmult_process) .globl _CRYPTO_SHARED_NAMESPACE(ge25519_double_scalarmult_process) ASM_HIDDEN CRYPTO_SHARED_NAMESPACE(ge25519_double_scalarmult_process) .globl CRYPTO_SHARED_NAMESPACE(ge25519_double_scalarmult_process) _CRYPTO_SHARED_NAMESPACE(ge25519_double_scalarmult_process): CRYPTO_SHARED_NAMESPACE(ge25519_double_scalarmult_process): sub sp, sp, #800 stp x19, x20, [sp, #0] stp x21, x22, [sp, #16] stp x23, x24, [sp, #32] stp x25, x26, [sp, #48] stp x27, x28, [sp, #64] stp x29, x30, [sp, #80] movz x21, #0xfffe movk x21, #0x3fff, lsl 16 movk x21, #0xfffe, lsl 32 movk x21, #0x3fff, lsl 48 movz x22, #0xfffe movk x22, #0x3fff, lsl 16 movk x22, #0xfffe, lsl 32 movk x22, #0x00ff, lsl 48 movz x23, #0xfffe movk x23, #0x3fff, lsl 16 movk x23, #0xffda, lsl 32 movk x23, #0x3fff, lsl 48 movz x24, #0xfffe movk x24, #0x3fff, lsl 16 stp x21, x22, [sp, #160] stp x23, x24, [sp, #176] mov w30, #1216 mov x27, #0x1<<32 stp xzr, xzr, [sp, #192] stp xzr, xzr, [sp, #208] str xzr, [sp, #224] stp xzr, xzr, [sp, #232] stp x27, xzr, [sp, #248] str xzr, [sp, #264] stp xzr, xzr, [sp, #272] stp x27, xzr, [sp, #288] str xzr, [sp, #304] stp xzr, xzr, [sp, #312] stp xzr, xzr, [sp, #328] str xzr, [sp, #344] mov w25, #255 add x29, x1, x25 add x2, x2, x25 str x0, [sp, #96] str x3, [sp, #104] str x4, [sp, #112] .L1: ldrsb w8, [x29, #0] ldrsb w9, [x2, #0] cmp w8, wzr bgt .L2 cmp w9, wzr bgt .L2 sub x29, x29, #1 sub x2, x2, #1 sub w25, w25, #1 cmp w25, wzr bge .L1 cmp w25, wzr blt .L10 .L2: str x2, [sp, #120] str x29, [sp, #128] str x25, [sp, #136] .L3: /* dbl p1p1 */ // square add x29, sp, #272 ldp w13, w17, [x29, #0] ldp w14, w18, [x29, #8] ldp w15, w10, [x29, #16] ldp w16, w11, [x29, #24] ldr w12, [x29, #32] add w20, w10, w10 add w21, w11, w11 add w22, w12, w12 add w23, w13, w13 add w24, w14, w14 add w25, w15, w15 add w26, w16, w16 add w27, w17, w17 umull x0, w10, w10 umull x1, w20, w11 umull x2, w20, w12 umull x3, w20, w13 umull x4, w20, w14 umull x5, w20, w15 umull x6, w20, w16 umull x7, w20, w17 umull x8, w20, w18 umaddl x2, w11, w11, x2 umaddl x3, w21, w12, x3 umaddl x4, w21, w13, x4 umaddl x5, w21, w14, x5 umaddl x6, w21, w15, x6 umaddl x7, w21, w16, x7 umaddl x8, w21, w17, x8 umull x9, w21, w18 umaddl x4, w12, w12, x4 umaddl x5, w22, w13, x5 umaddl x6, w22, w14, x6 umaddl x7, w22, w15, x7 umaddl x8, w22, w16, x8 umaddl x9, w22, w17, x9 umull x10, w22, w18 umaddl x6, w13, w13, x6 umaddl x7, w23, w14, x7 umaddl x8, w23, w15, x8 umaddl x9, w23, w16, x9 umaddl x10, w23, w17, x10 umull x11, w23, w18 umaddl x8, w14, w14, x8 umaddl x9, w24, w15, x9 umaddl x10, w24, w16, x10 umaddl x11, w24, w17, x11 umull x12, w24, w18 umaddl x10, w15, w15, x10 umaddl x11, w25, w16, x11 umaddl x12, w25, w17, x12 umull x13, w25, w18 add x10, x10, x9, lsr #29 and x9, x9, #0x1fffffff umull x9, w9, w30 add x0, x0, x9 add x11, x11, x10, lsr #29 and x10, x10, #0x1fffffff umull x10, w10, w30 add x1, x1, x10 umaddl x12, w16, w16, x12 umaddl x13, w26, w17, x13 umull x14, w26, w18 add x12, x12, x11, lsr #29 and x11, x11, #0x1fffffff umull x11, w11, w30 add x2, x2, x11 add x13, x13, x12, lsr #29 and x12, x12, #0x1fffffff umull x12, w12, w30 add x3, x3, x12 umaddl x14, w17, w17, x14 umull x15, w27, w18 add x14, x14, x13, lsr #29 and x13, x13, #0x1fffffff umull x13, w13, w30 add x4, x4, x13 add x15, x15, x14, lsr #29 and x14, x14, #0x1fffffff umull x14, w14, w30 add x5, x5, x14 umull x16, w18, w18 add x16, x16, x15, lsr #29 and x15, x15, #0x1fffffff umull x15, w15, w30 add x6, x6, x15 lsr x9, x16, #29 and x16, x16, #0x1fffffff umull x16, w16, w30 add x7, x7, x16 umull x9, w9, w30 add x8, x8, x9 // double and then reduce add x0, x0, x0 add x1, x1, x1 add x2, x2, x2 add x3, x3, x3 add x4, x4, x4 add x5, x5, x5 add x6, x6, x6 add x7, x7, x7 add x8, x8, x8 add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff add x1, x1, x0, lsr #29 and x0, x0, 0x1fffffff add x6, x6, x5, lsr #29 and x5, x5, 0x1fffffff add x2, x2, x1, lsr #29 and x1, x1, 0x1fffffff add x7, x7, x6, lsr #29 and x6, x6, 0x1fffffff add x3, x3, x2, lsr #29 and x2, x2, 0x1fffffff add x8, x8, x7, lsr #29 and x7, x7, 0x1fffffff add x4, x4, x3, lsr #29 and x3, x3, 0x1fffffff bfi x3, x7, #32, #29 bic x10, x8, #0x7fffff add x0, x0, x10, lsr #23 add x0, x0, x10, lsr #22 add x0, x0, x10, lsr #19 and x8, x8, #0x7fffff add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff bfi x4, x8, #32, #23 add x1, x1, x0, lsr #29 bfi x6, x1, #32, #30 and x0, x0, 0x1fffffff bfi x5, x0, #32, #29 stp x3, x4, [sp, #432] stp x5, x6, [sp, #448] str x2, [sp, #464] // square add x29, sp, #232 ldp w13, w17, [x29, #0] ldp w14, w18, [x29, #8] ldp w15, w10, [x29, #16] ldp w16, w11, [x29, #24] ldr w12, [x29, #32] add w20, w10, w10 add w21, w11, w11 add w22, w12, w12 add w23, w13, w13 add w24, w14, w14 add w25, w15, w15 add w26, w16, w16 add w27, w17, w17 umull x0, w10, w10 umull x1, w20, w11 umull x2, w20, w12 umull x3, w20, w13 umull x4, w20, w14 umull x5, w20, w15 umull x6, w20, w16 umull x7, w20, w17 umull x8, w20, w18 umaddl x2, w11, w11, x2 umaddl x3, w21, w12, x3 umaddl x4, w21, w13, x4 umaddl x5, w21, w14, x5 umaddl x6, w21, w15, x6 umaddl x7, w21, w16, x7 umaddl x8, w21, w17, x8 umull x9, w21, w18 umaddl x4, w12, w12, x4 umaddl x5, w22, w13, x5 umaddl x6, w22, w14, x6 umaddl x7, w22, w15, x7 umaddl x8, w22, w16, x8 umaddl x9, w22, w17, x9 umull x10, w22, w18 umaddl x6, w13, w13, x6 umaddl x7, w23, w14, x7 umaddl x8, w23, w15, x8 umaddl x9, w23, w16, x9 umaddl x10, w23, w17, x10 umull x11, w23, w18 umaddl x8, w14, w14, x8 umaddl x9, w24, w15, x9 umaddl x10, w24, w16, x10 umaddl x11, w24, w17, x11 umull x12, w24, w18 umaddl x10, w15, w15, x10 umaddl x11, w25, w16, x11 umaddl x12, w25, w17, x12 umull x13, w25, w18 add x10, x10, x9, lsr #29 and x9, x9, #0x1fffffff umull x9, w9, w30 add x0, x0, x9 add x11, x11, x10, lsr #29 and x10, x10, #0x1fffffff umull x10, w10, w30 add x1, x1, x10 umaddl x12, w16, w16, x12 umaddl x13, w26, w17, x13 umull x14, w26, w18 add x12, x12, x11, lsr #29 and x11, x11, #0x1fffffff umull x11, w11, w30 add x2, x2, x11 add x13, x13, x12, lsr #29 and x12, x12, #0x1fffffff umull x12, w12, w30 add x3, x3, x12 umaddl x14, w17, w17, x14 umull x15, w27, w18 add x14, x14, x13, lsr #29 and x13, x13, #0x1fffffff umull x13, w13, w30 add x4, x4, x13 add x15, x15, x14, lsr #29 and x14, x14, #0x1fffffff umull x14, w14, w30 add x5, x5, x14 umull x16, w18, w18 add x16, x16, x15, lsr #29 and x15, x15, #0x1fffffff umull x15, w15, w30 add x6, x6, x15 lsr x9, x16, #29 and x16, x16, #0x1fffffff umull x16, w16, w30 add x7, x7, x16 umull x9, w9, w30 add x8, x8, x9 add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff add x1, x1, x0, lsr #29 and x0, x0, 0x1fffffff add x6, x6, x5, lsr #29 and x5, x5, 0x1fffffff add x2, x2, x1, lsr #29 and x1, x1, 0x1fffffff add x7, x7, x6, lsr #29 and x6, x6, 0x1fffffff add x3, x3, x2, lsr #29 and x2, x2, 0x1fffffff add x8, x8, x7, lsr #29 and x7, x7, 0x1fffffff add x4, x4, x3, lsr #29 and x3, x3, 0x1fffffff bfi x3, x7, #32, #29 bic x10, x8, #0x7fffff add x0, x0, x10, lsr #23 add x0, x0, x10, lsr #22 add x0, x0, x10, lsr #19 and x8, x8, #0x7fffff add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff bfi x4, x8, #32, #23 add x1, x1, x0, lsr #29 bfi x6, x1, #32, #30 and x0, x0, 0x1fffffff bfi x5, x0, #32, #29 stp x3, x4, [sp, #392] stp x5, x6, [sp, #408] str x2, [sp, #424] // square ldp w13, w17, [sp, #192] ldp w14, w18, [sp, #200] ldp w15, w10, [sp, #208] ldp w16, w11, [sp, #216] ldr w12, [sp, #224] add w20, w10, w10 add w21, w11, w11 add w22, w12, w12 add w23, w13, w13 add w24, w14, w14 add w25, w15, w15 add w26, w16, w16 add w27, w17, w17 umull x0, w10, w10 umull x1, w20, w11 umull x2, w20, w12 umull x3, w20, w13 umull x4, w20, w14 umull x5, w20, w15 umull x6, w20, w16 umull x7, w20, w17 umull x8, w20, w18 umaddl x2, w11, w11, x2 umaddl x3, w21, w12, x3 umaddl x4, w21, w13, x4 umaddl x5, w21, w14, x5 umaddl x6, w21, w15, x6 umaddl x7, w21, w16, x7 umaddl x8, w21, w17, x8 umull x9, w21, w18 umaddl x4, w12, w12, x4 umaddl x5, w22, w13, x5 umaddl x6, w22, w14, x6 umaddl x7, w22, w15, x7 umaddl x8, w22, w16, x8 umaddl x9, w22, w17, x9 umull x10, w22, w18 umaddl x6, w13, w13, x6 umaddl x7, w23, w14, x7 umaddl x8, w23, w15, x8 umaddl x9, w23, w16, x9 umaddl x10, w23, w17, x10 umull x11, w23, w18 umaddl x8, w14, w14, x8 umaddl x9, w24, w15, x9 umaddl x10, w24, w16, x10 umaddl x11, w24, w17, x11 umull x12, w24, w18 umaddl x10, w15, w15, x10 umaddl x11, w25, w16, x11 umaddl x12, w25, w17, x12 umull x13, w25, w18 add x10, x10, x9, lsr #29 and x9, x9, #0x1fffffff umull x9, w9, w30 add x0, x0, x9 add x11, x11, x10, lsr #29 and x10, x10, #0x1fffffff umull x10, w10, w30 add x1, x1, x10 umaddl x12, w16, w16, x12 umaddl x13, w26, w17, x13 umull x14, w26, w18 add x12, x12, x11, lsr #29 and x11, x11, #0x1fffffff umull x11, w11, w30 add x2, x2, x11 add x13, x13, x12, lsr #29 and x12, x12, #0x1fffffff umull x12, w12, w30 add x3, x3, x12 umaddl x14, w17, w17, x14 umull x15, w27, w18 add x14, x14, x13, lsr #29 and x13, x13, #0x1fffffff umull x13, w13, w30 add x4, x4, x13 add x15, x15, x14, lsr #29 and x14, x14, #0x1fffffff umull x14, w14, w30 add x5, x5, x14 umull x16, w18, w18 add x16, x16, x15, lsr #29 and x15, x15, #0x1fffffff umull x15, w15, w30 add x6, x6, x15 lsr x9, x16, #29 and x16, x16, #0x1fffffff umull x16, w16, w30 add x7, x7, x16 umull x9, w9, w30 add x8, x8, x9 add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff add x1, x1, x0, lsr #29 and x0, x0, 0x1fffffff add x6, x6, x5, lsr #29 and x5, x5, 0x1fffffff add x2, x2, x1, lsr #29 and x1, x1, 0x1fffffff add x7, x7, x6, lsr #29 and x6, x6, 0x1fffffff add x3, x3, x2, lsr #29 and x2, x2, 0x1fffffff add x8, x8, x7, lsr #29 and x7, x7, 0x1fffffff add x4, x4, x3, lsr #29 and x3, x3, 0x1fffffff bfi x3, x7, #32, #29 bic x10, x8, #0x7fffff add x0, x0, x10, lsr #23 add x0, x0, x10, lsr #22 add x0, x0, x10, lsr #19 and x8, x8, #0x7fffff add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff bfi x4, x8, #32, #23 add x1, x1, x0, lsr #29 bfi x6, x1, #32, #30 and x0, x0, 0x1fffffff bfi x5, x0, #32, #29 // neg ldp x20, x21, [sp, #160] ldp x27, x28, [sp, #176] sub x10, x20, x3 sub x11, x21, x4 sub x17, x27, x5 sub x18, x20, x6 sub x19, x28, x2 // add ldp x13, x14, [sp, #392] ldp x15, x16, [sp, #408] ldr x12, [sp, #424] add x3, x10, x13 add x4, x11, x14 add x5, x17, x15 add x6, x18, x16 add x2, x19, x12 add x29, sp, #552 stp x3, x4, [x29, #0] stp x5, x6, [x29, #16] str x2, [x29, #32] // sub ldp x13, x14, [sp, #432] ldp x15, x16, [sp, #448] ldr x12, [sp, #464] sub x3, x3, x13 sub x4, x4, x14 sub x5, x5, x15 sub x6, x6, x16 sub x2, x2, x12 stp x3, x4, [x29, #80] stp x5, x6, [x29, #96] str x2, [x29, #112] // sub ldp x13, x14, [sp, #392] ldp x15, x16, [sp, #408] ldr x12, [sp, #424] ldp x20, x21, [sp, #160] ldp x27, x28, [sp, #176] add x10, x10, x20 add x11, x11, x21 add x17, x17, x27 add x18, x18, x20 add x19, x19, x28 sub x3, x10, x13 sub x4, x11, x14 sub x5, x17, x15 sub x6, x18, x16 sub x2, x19, x12 lsr x7, x3, #32 lsr x8, x4, #32 lsr x0, x5, #32 lsr x1, x6, #32 mov w3, w3 mov w4, w4 mov w5, w5 mov w6, w6 add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff add x1, x1, x0, lsr #29 and x0, x0, 0x1fffffff add x6, x6, x5, lsr #29 and x5, x5, 0x1fffffff add x2, x2, x1, lsr #29 and x1, x1, 0x1fffffff add x7, x7, x6, lsr #29 and x6, x6, 0x1fffffff add x3, x3, x2, lsr #29 and x2, x2, 0x1fffffff add x8, x8, x7, lsr #29 and x7, x7, 0x1fffffff add x4, x4, x3, lsr #29 and x3, x3, 0x1fffffff bfi x3, x7, #32, #29 bic x10, x8, #0x7fffff add x0, x0, x10, lsr #23 add x0, x0, x10, lsr #22 add x0, x0, x10, lsr #19 and x8, x8, #0x7fffff add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff bfi x4, x8, #32, #23 add x1, x1, x0, lsr #29 bfi x6, x1, #32, #30 and x0, x0, 0x1fffffff bfi x5, x0, #32, #29 stp x3, x4, [x29, #40] stp x5, x6, [x29, #56] str x2, [x29, #72] // add ldp x13, x14, [sp, #192] ldp x15, x16, [sp, #208] ldr x12, [sp, #224] ldp x23, x24, [sp, #232] ldp x25, x26, [sp, #248] ldr x22, [sp, #264] add x13, x13, x23 add x14, x14, x24 add x15, x15, x25 add x16, x16, x26 add x12, x12, x22 // square lsr x17, x13, #32 lsr x18, x14, #32 lsr x10, x15, #32 lsr x11, x16, #32 add w20, w10, w10 add w21, w11, w11 add w22, w12, w12 add w23, w13, w13 add w24, w14, w14 add w25, w15, w15 add w26, w16, w16 add w27, w17, w17 umull x0, w10, w10 umull x1, w20, w11 umull x2, w20, w12 umull x3, w20, w13 umull x4, w20, w14 umull x5, w20, w15 umull x6, w20, w16 umull x7, w20, w17 umull x8, w20, w18 umaddl x2, w11, w11, x2 umaddl x3, w21, w12, x3 umaddl x4, w21, w13, x4 umaddl x5, w21, w14, x5 umaddl x6, w21, w15, x6 umaddl x7, w21, w16, x7 umaddl x8, w21, w17, x8 umull x9, w21, w18 umaddl x4, w12, w12, x4 umaddl x5, w22, w13, x5 umaddl x6, w22, w14, x6 umaddl x7, w22, w15, x7 umaddl x8, w22, w16, x8 umaddl x9, w22, w17, x9 umull x10, w22, w18 umaddl x6, w13, w13, x6 umaddl x7, w23, w14, x7 umaddl x8, w23, w15, x8 umaddl x9, w23, w16, x9 umaddl x10, w23, w17, x10 umull x11, w23, w18 umaddl x8, w14, w14, x8 umaddl x9, w24, w15, x9 umaddl x10, w24, w16, x10 umaddl x11, w24, w17, x11 umull x12, w24, w18 umaddl x10, w15, w15, x10 umaddl x11, w25, w16, x11 umaddl x12, w25, w17, x12 umull x13, w25, w18 add x10, x10, x9, lsr #29 and x9, x9, #0x1fffffff umull x9, w9, w30 add x0, x0, x9 add x11, x11, x10, lsr #29 and x10, x10, #0x1fffffff umull x10, w10, w30 add x1, x1, x10 umaddl x12, w16, w16, x12 umaddl x13, w26, w17, x13 umull x14, w26, w18 add x12, x12, x11, lsr #29 and x11, x11, #0x1fffffff umull x11, w11, w30 add x2, x2, x11 add x13, x13, x12, lsr #29 and x12, x12, #0x1fffffff umull x12, w12, w30 add x3, x3, x12 umaddl x14, w17, w17, x14 umull x15, w27, w18 add x14, x14, x13, lsr #29 and x13, x13, #0x1fffffff umull x13, w13, w30 add x4, x4, x13 add x15, x15, x14, lsr #29 and x14, x14, #0x1fffffff umull x14, w14, w30 add x5, x5, x14 umull x16, w18, w18 add x16, x16, x15, lsr #29 and x15, x15, #0x1fffffff umull x15, w15, w30 add x6, x6, x15 lsr x9, x16, #29 and x16, x16, #0x1fffffff umull x16, w16, w30 add x7, x7, x16 umull x9, w9, w30 add x8, x8, x9 add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff add x1, x1, x0, lsr #29 and x0, x0, 0x1fffffff add x6, x6, x5, lsr #29 and x5, x5, 0x1fffffff add x2, x2, x1, lsr #29 and x1, x1, 0x1fffffff add x7, x7, x6, lsr #29 and x6, x6, 0x1fffffff add x3, x3, x2, lsr #29 and x2, x2, 0x1fffffff add x8, x8, x7, lsr #29 and x7, x7, 0x1fffffff add x4, x4, x3, lsr #29 and x3, x3, 0x1fffffff bfi x3, x7, #32, #29 bic x10, x8, #0x7fffff add x0, x0, x10, lsr #23 add x0, x0, x10, lsr #22 add x0, x0, x10, lsr #19 and x8, x8, #0x7fffff add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff bfi x4, x8, #32, #23 add x1, x1, x0, lsr #29 bfi x6, x1, #32, #30 and x0, x0, 0x1fffffff bfi x5, x0, #32, #29 // add add x29, sp, #512 ldp x13, x14, [x29, #80] ldp x15, x16, [x29, #96] ldr x12, [x29, #112] add x3, x3, x13 add x4, x4, x14 add x5, x5, x15 add x6, x6, x16 add x2, x2, x12 stp x3, x4, [x29, #0] stp x5, x6, [x29, #16] str x2, [x29, #32] ldr x29, [sp, #128] ldrsb w26, [x29, #0] sub x29, x29, #1 str x29, [sp, #128] str w26, [sp, #144] cmp w26, wzr bgt .L4 blt .L5 beq .L6 .L4: /* p1p1 to p3 */ // mul add x29, sp, #512 ldp w13, w17, [x29, #0] ldp w14, w18, [x29, #8] ldp w15, w10, [x29, #16] ldp w16, w11, [x29, #24] ldr w12, [x29, #32] ldp w23, w27, [x29, #120] ldp w24, w28, [x29, #128] ldp w25, w20, [x29, #136] ldp w26, w21, [x29, #144] ldr w22, [x29, #152] umull x0, w10, w20 umull x1, w10, w21 umull x2, w10, w22 umull x3, w10, w23 umull x4, w10, w24 umull x5, w10, w25 umull x6, w10, w26 umull x7, w10, w27 umull x8, w10, w28 umaddl x1, w11, w20, x1 umaddl x2, w11, w21, x2 umaddl x3, w11, w22, x3 umaddl x4, w11, w23, x4 umaddl x5, w11, w24, x5 umaddl x6, w11, w25, x6 umaddl x7, w11, w26, x7 umaddl x8, w11, w27, x8 umull x9, w11, w28 umaddl x2, w12, w20, x2 umaddl x3, w12, w21, x3 umaddl x4, w12, w22, x4 umaddl x5, w12, w23, x5 umaddl x6, w12, w24, x6 umaddl x7, w12, w25, x7 umaddl x8, w12, w26, x8 umaddl x9, w12, w27, x9 umull x10, w12, w28 umaddl x3, w13, w20, x3 umaddl x4, w13, w21, x4 umaddl x5, w13, w22, x5 umaddl x6, w13, w23, x6 umaddl x7, w13, w24, x7 umaddl x8, w13, w25, x8 umaddl x9, w13, w26, x9 umaddl x10, w13, w27, x10 umull x11, w13, w28 umaddl x4, w14, w20, x4 umaddl x5, w14, w21, x5 umaddl x6, w14, w22, x6 umaddl x7, w14, w23, x7 umaddl x8, w14, w24, x8 umaddl x9, w14, w25, x9 umaddl x10, w14, w26, x10 umaddl x11, w14, w27, x11 umull x12, w14, w28 umaddl x5, w15, w20, x5 umaddl x6, w15, w21, x6 umaddl x7, w15, w22, x7 umaddl x8, w15, w23, x8 umaddl x9, w15, w24, x9 umaddl x10, w15, w25, x10 umaddl x11, w15, w26, x11 umaddl x12, w15, w27, x12 umull x13, w15, w28 umaddl x6, w16, w20, x6 umaddl x7, w16, w21, x7 umaddl x8, w16, w22, x8 umaddl x9, w16, w23, x9 umaddl x10, w16, w24, x10 umaddl x11, w16, w25, x11 umaddl x12, w16, w26, x12 umaddl x13, w16, w27, x13 umull x14, w16, w28 umaddl x7, w17, w20, x7 umaddl x8, w17, w21, x8 umaddl x9, w17, w22, x9 umaddl x10, w17, w23, x10 umaddl x11, w17, w24, x11 umaddl x12, w17, w25, x12 umaddl x13, w17, w26, x13 umaddl x14, w17, w27, x14 umull x15, w17, w28 umaddl x8, w18, w20, x8 umaddl x9, w18, w21, x9 umaddl x10, w18, w22, x10 umaddl x11, w18, w23, x11 umaddl x12, w18, w24, x12 umaddl x13, w18, w25, x13 umaddl x14, w18, w26, x14 umaddl x15, w18, w27, x15 umull x16, w18, w28 add x10, x10, x9, lsr #29 and x9, x9, #0x1fffffff umull x9, w9, w30 add x0, x0, x9 add x11, x11, x10, lsr #29 and x10, x10, #0x1fffffff umull x10, w10, w30 add x1, x1, x10 add x12, x12, x11, lsr #29 and x11, x11, #0x1fffffff umull x11, w11, w30 add x2, x2, x11 add x13, x13, x12, lsr #29 and x12, x12, #0x1fffffff umull x12, w12, w30 add x3, x3, x12 add x14, x14, x13, lsr #29 and x13, x13, #0x1fffffff umull x13, w13, w30 add x4, x4, x13 add x15, x15, x14, lsr #29 and x14, x14, #0x1fffffff umull x14, w14, w30 add x5, x5, x14 add x16, x16, x15, lsr #29 and x15, x15, #0x1fffffff umull x15, w15, w30 add x6, x6, x15 lsr x9, x16, #29 and x16, x16, #0x1fffffff umull x16, w16, w30 add x7, x7, x16 umull x9, w9, w30 add x8, x8, x9 add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff add x1, x1, x0, lsr #29 and x0, x0, 0x1fffffff add x6, x6, x5, lsr #29 and x5, x5, 0x1fffffff add x2, x2, x1, lsr #29 and x1, x1, 0x1fffffff add x7, x7, x6, lsr #29 and x6, x6, 0x1fffffff add x3, x3, x2, lsr #29 and x2, x2, 0x1fffffff add x8, x8, x7, lsr #29 and x7, x7, 0x1fffffff add x4, x4, x3, lsr #29 and x3, x3, 0x1fffffff bfi x3, x7, #32, #29 bic x10, x8, #0x7fffff add x0, x0, x10, lsr #23 add x0, x0, x10, lsr #22 add x0, x0, x10, lsr #19 and x8, x8, #0x7fffff add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff bfi x4, x8, #32, #23 add x1, x1, x0, lsr #29 bfi x6, x1, #32, #30 and x0, x0, 0x1fffffff bfi x5, x0, #32, #29 stp x3, x4, [sp, #352] stp x5, x6, [sp, #368] str x2, [sp, #384] // mul add x29, sp, #552 ldp w13, w17, [x29, #0] ldp w14, w18, [x29, #8] ldp w15, w10, [x29, #16] ldp w16, w11, [x29, #24] ldr w12, [x29, #32] ldp w23, w27, [x29, #40] ldp w24, w28, [x29, #48] ldp w25, w20, [x29, #56] ldp w26, w21, [x29, #64] ldr w22, [x29, #72] umull x0, w10, w20 umull x1, w10, w21 umull x2, w10, w22 umull x3, w10, w23 umull x4, w10, w24 umull x5, w10, w25 umull x6, w10, w26 umull x7, w10, w27 umull x8, w10, w28 umaddl x1, w11, w20, x1 umaddl x2, w11, w21, x2 umaddl x3, w11, w22, x3 umaddl x4, w11, w23, x4 umaddl x5, w11, w24, x5 umaddl x6, w11, w25, x6 umaddl x7, w11, w26, x7 umaddl x8, w11, w27, x8 umull x9, w11, w28 umaddl x2, w12, w20, x2 umaddl x3, w12, w21, x3 umaddl x4, w12, w22, x4 umaddl x5, w12, w23, x5 umaddl x6, w12, w24, x6 umaddl x7, w12, w25, x7 umaddl x8, w12, w26, x8 umaddl x9, w12, w27, x9 umull x10, w12, w28 umaddl x3, w13, w20, x3 umaddl x4, w13, w21, x4 umaddl x5, w13, w22, x5 umaddl x6, w13, w23, x6 umaddl x7, w13, w24, x7 umaddl x8, w13, w25, x8 umaddl x9, w13, w26, x9 umaddl x10, w13, w27, x10 umull x11, w13, w28 umaddl x4, w14, w20, x4 umaddl x5, w14, w21, x5 umaddl x6, w14, w22, x6 umaddl x7, w14, w23, x7 umaddl x8, w14, w24, x8 umaddl x9, w14, w25, x9 umaddl x10, w14, w26, x10 umaddl x11, w14, w27, x11 umull x12, w14, w28 umaddl x5, w15, w20, x5 umaddl x6, w15, w21, x6 umaddl x7, w15, w22, x7 umaddl x8, w15, w23, x8 umaddl x9, w15, w24, x9 umaddl x10, w15, w25, x10 umaddl x11, w15, w26, x11 umaddl x12, w15, w27, x12 umull x13, w15, w28 umaddl x6, w16, w20, x6 umaddl x7, w16, w21, x7 umaddl x8, w16, w22, x8 umaddl x9, w16, w23, x9 umaddl x10, w16, w24, x10 umaddl x11, w16, w25, x11 umaddl x12, w16, w26, x12 umaddl x13, w16, w27, x13 umull x14, w16, w28 umaddl x7, w17, w20, x7 umaddl x8, w17, w21, x8 umaddl x9, w17, w22, x9 umaddl x10, w17, w23, x10 umaddl x11, w17, w24, x11 umaddl x12, w17, w25, x12 umaddl x13, w17, w26, x13 umaddl x14, w17, w27, x14 umull x15, w17, w28 umaddl x8, w18, w20, x8 umaddl x9, w18, w21, x9 umaddl x10, w18, w22, x10 umaddl x11, w18, w23, x11 umaddl x12, w18, w24, x12 umaddl x13, w18, w25, x13 umaddl x14, w18, w26, x14 umaddl x15, w18, w27, x15 umull x16, w18, w28 add x10, x10, x9, lsr #29 and x9, x9, #0x1fffffff umull x9, w9, w30 add x0, x0, x9 add x11, x11, x10, lsr #29 and x10, x10, #0x1fffffff umull x10, w10, w30 add x1, x1, x10 add x12, x12, x11, lsr #29 and x11, x11, #0x1fffffff umull x11, w11, w30 add x2, x2, x11 add x13, x13, x12, lsr #29 and x12, x12, #0x1fffffff umull x12, w12, w30 add x3, x3, x12 add x14, x14, x13, lsr #29 and x13, x13, #0x1fffffff umull x13, w13, w30 add x4, x4, x13 add x15, x15, x14, lsr #29 and x14, x14, #0x1fffffff umull x14, w14, w30 add x5, x5, x14 add x16, x16, x15, lsr #29 and x15, x15, #0x1fffffff umull x15, w15, w30 add x6, x6, x15 lsr x9, x16, #29 and x16, x16, #0x1fffffff umull x16, w16, w30 add x7, x7, x16 umull x9, w9, w30 add x8, x8, x9 add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff add x1, x1, x0, lsr #29 and x0, x0, 0x1fffffff add x6, x6, x5, lsr #29 and x5, x5, 0x1fffffff add x2, x2, x1, lsr #29 and x1, x1, 0x1fffffff add x7, x7, x6, lsr #29 and x6, x6, 0x1fffffff add x3, x3, x2, lsr #29 and x2, x2, 0x1fffffff add x8, x8, x7, lsr #29 and x7, x7, 0x1fffffff add x4, x4, x3, lsr #29 and x3, x3, 0x1fffffff bfi x3, x7, #32, #29 bic x10, x8, #0x7fffff add x0, x0, x10, lsr #23 add x0, x0, x10, lsr #22 add x0, x0, x10, lsr #19 and x8, x8, #0x7fffff add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff bfi x4, x8, #32, #23 add x1, x1, x0, lsr #29 bfi x6, x1, #32, #30 and x0, x0, 0x1fffffff bfi x5, x0, #32, #29 stp x3, x4, [sp, #392] stp x5, x6, [sp, #408] str x2, [sp, #424] // mul add x29, sp, #552 ldp w13, w17, [x29, #0] ldp w14, w18, [x29, #8] ldp w15, w10, [x29, #16] ldp w16, w11, [x29, #24] ldr w12, [x29, #32] ldp w23, w27, [x29, #80] ldp w24, w28, [x29, #88] ldp w25, w20, [x29, #96] ldp w26, w21, [x29, #104] ldr w22, [x29, #112] umull x0, w10, w20 umull x1, w10, w21 umull x2, w10, w22 umull x3, w10, w23 umull x4, w10, w24 umull x5, w10, w25 umull x6, w10, w26 umull x7, w10, w27 umull x8, w10, w28 umaddl x1, w11, w20, x1 umaddl x2, w11, w21, x2 umaddl x3, w11, w22, x3 umaddl x4, w11, w23, x4 umaddl x5, w11, w24, x5 umaddl x6, w11, w25, x6 umaddl x7, w11, w26, x7 umaddl x8, w11, w27, x8 umull x9, w11, w28 umaddl x2, w12, w20, x2 umaddl x3, w12, w21, x3 umaddl x4, w12, w22, x4 umaddl x5, w12, w23, x5 umaddl x6, w12, w24, x6 umaddl x7, w12, w25, x7 umaddl x8, w12, w26, x8 umaddl x9, w12, w27, x9 umull x10, w12, w28 umaddl x3, w13, w20, x3 umaddl x4, w13, w21, x4 umaddl x5, w13, w22, x5 umaddl x6, w13, w23, x6 umaddl x7, w13, w24, x7 umaddl x8, w13, w25, x8 umaddl x9, w13, w26, x9 umaddl x10, w13, w27, x10 umull x11, w13, w28 umaddl x4, w14, w20, x4 umaddl x5, w14, w21, x5 umaddl x6, w14, w22, x6 umaddl x7, w14, w23, x7 umaddl x8, w14, w24, x8 umaddl x9, w14, w25, x9 umaddl x10, w14, w26, x10 umaddl x11, w14, w27, x11 umull x12, w14, w28 umaddl x5, w15, w20, x5 umaddl x6, w15, w21, x6 umaddl x7, w15, w22, x7 umaddl x8, w15, w23, x8 umaddl x9, w15, w24, x9 umaddl x10, w15, w25, x10 umaddl x11, w15, w26, x11 umaddl x12, w15, w27, x12 umull x13, w15, w28 umaddl x6, w16, w20, x6 umaddl x7, w16, w21, x7 umaddl x8, w16, w22, x8 umaddl x9, w16, w23, x9 umaddl x10, w16, w24, x10 umaddl x11, w16, w25, x11 umaddl x12, w16, w26, x12 umaddl x13, w16, w27, x13 umull x14, w16, w28 umaddl x7, w17, w20, x7 umaddl x8, w17, w21, x8 umaddl x9, w17, w22, x9 umaddl x10, w17, w23, x10 umaddl x11, w17, w24, x11 umaddl x12, w17, w25, x12 umaddl x13, w17, w26, x13 umaddl x14, w17, w27, x14 umull x15, w17, w28 umaddl x8, w18, w20, x8 umaddl x9, w18, w21, x9 umaddl x10, w18, w22, x10 umaddl x11, w18, w23, x11 umaddl x12, w18, w24, x12 umaddl x13, w18, w25, x13 umaddl x14, w18, w26, x14 umaddl x15, w18, w27, x15 umull x16, w18, w28 add x10, x10, x9, lsr #29 and x9, x9, #0x1fffffff umull x9, w9, w30 add x0, x0, x9 add x11, x11, x10, lsr #29 and x10, x10, #0x1fffffff umull x10, w10, w30 add x1, x1, x10 add x12, x12, x11, lsr #29 and x11, x11, #0x1fffffff umull x11, w11, w30 add x2, x2, x11 add x13, x13, x12, lsr #29 and x12, x12, #0x1fffffff umull x12, w12, w30 add x3, x3, x12 add x14, x14, x13, lsr #29 and x13, x13, #0x1fffffff umull x13, w13, w30 add x4, x4, x13 add x15, x15, x14, lsr #29 and x14, x14, #0x1fffffff umull x14, w14, w30 add x5, x5, x14 add x16, x16, x15, lsr #29 and x15, x15, #0x1fffffff umull x15, w15, w30 add x6, x6, x15 lsr x9, x16, #29 and x16, x16, #0x1fffffff umull x16, w16, w30 add x7, x7, x16 umull x9, w9, w30 add x8, x8, x9 add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff add x1, x1, x0, lsr #29 and x0, x0, 0x1fffffff add x6, x6, x5, lsr #29 and x5, x5, 0x1fffffff add x2, x2, x1, lsr #29 and x1, x1, 0x1fffffff add x7, x7, x6, lsr #29 and x6, x6, 0x1fffffff add x3, x3, x2, lsr #29 and x2, x2, 0x1fffffff add x8, x8, x7, lsr #29 and x7, x7, 0x1fffffff add x4, x4, x3, lsr #29 and x3, x3, 0x1fffffff bfi x3, x7, #32, #29 bic x10, x8, #0x7fffff add x0, x0, x10, lsr #23 add x0, x0, x10, lsr #22 add x0, x0, x10, lsr #19 and x8, x8, #0x7fffff add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff bfi x4, x8, #32, #23 add x1, x1, x0, lsr #29 bfi x6, x1, #32, #30 and x0, x0, 0x1fffffff bfi x5, x0, #32, #29 stp x3, x4, [sp, #432] stp x5, x6, [sp, #448] str x2, [sp, #464] // mul add x29, sp, #512 ldp w13, w17, [x29, #0] ldp w14, w18, [x29, #8] ldp w15, w10, [x29, #16] ldp w16, w11, [x29, #24] ldr w12, [x29, #32] ldp w23, w27, [x29, #80] ldp w24, w28, [x29, #88] ldp w25, w20, [x29, #96] ldp w26, w21, [x29, #104] ldr w22, [x29, #112] umull x0, w10, w20 umull x1, w10, w21 umull x2, w10, w22 umull x3, w10, w23 umull x4, w10, w24 umull x5, w10, w25 umull x6, w10, w26 umull x7, w10, w27 umull x8, w10, w28 umaddl x1, w11, w20, x1 umaddl x2, w11, w21, x2 umaddl x3, w11, w22, x3 umaddl x4, w11, w23, x4 umaddl x5, w11, w24, x5 umaddl x6, w11, w25, x6 umaddl x7, w11, w26, x7 umaddl x8, w11, w27, x8 umull x9, w11, w28 umaddl x2, w12, w20, x2 umaddl x3, w12, w21, x3 umaddl x4, w12, w22, x4 umaddl x5, w12, w23, x5 umaddl x6, w12, w24, x6 umaddl x7, w12, w25, x7 umaddl x8, w12, w26, x8 umaddl x9, w12, w27, x9 umull x10, w12, w28 umaddl x3, w13, w20, x3 umaddl x4, w13, w21, x4 umaddl x5, w13, w22, x5 umaddl x6, w13, w23, x6 umaddl x7, w13, w24, x7 umaddl x8, w13, w25, x8 umaddl x9, w13, w26, x9 umaddl x10, w13, w27, x10 umull x11, w13, w28 umaddl x4, w14, w20, x4 umaddl x5, w14, w21, x5 umaddl x6, w14, w22, x6 umaddl x7, w14, w23, x7 umaddl x8, w14, w24, x8 umaddl x9, w14, w25, x9 umaddl x10, w14, w26, x10 umaddl x11, w14, w27, x11 umull x12, w14, w28 umaddl x5, w15, w20, x5 umaddl x6, w15, w21, x6 umaddl x7, w15, w22, x7 umaddl x8, w15, w23, x8 umaddl x9, w15, w24, x9 umaddl x10, w15, w25, x10 umaddl x11, w15, w26, x11 umaddl x12, w15, w27, x12 umull x13, w15, w28 umaddl x6, w16, w20, x6 umaddl x7, w16, w21, x7 umaddl x8, w16, w22, x8 umaddl x9, w16, w23, x9 umaddl x10, w16, w24, x10 umaddl x11, w16, w25, x11 umaddl x12, w16, w26, x12 umaddl x13, w16, w27, x13 umull x14, w16, w28 umaddl x7, w17, w20, x7 umaddl x8, w17, w21, x8 umaddl x9, w17, w22, x9 umaddl x10, w17, w23, x10 umaddl x11, w17, w24, x11 umaddl x12, w17, w25, x12 umaddl x13, w17, w26, x13 umaddl x14, w17, w27, x14 umull x15, w17, w28 umaddl x8, w18, w20, x8 umaddl x9, w18, w21, x9 umaddl x10, w18, w22, x10 umaddl x11, w18, w23, x11 umaddl x12, w18, w24, x12 umaddl x13, w18, w25, x13 umaddl x14, w18, w26, x14 umaddl x15, w18, w27, x15 umull x16, w18, w28 add x10, x10, x9, lsr #29 and x9, x9, #0x1fffffff umull x9, w9, w30 add x0, x0, x9 add x11, x11, x10, lsr #29 and x10, x10, #0x1fffffff umull x10, w10, w30 add x1, x1, x10 add x12, x12, x11, lsr #29 and x11, x11, #0x1fffffff umull x11, w11, w30 add x2, x2, x11 add x13, x13, x12, lsr #29 and x12, x12, #0x1fffffff umull x12, w12, w30 add x3, x3, x12 add x14, x14, x13, lsr #29 and x13, x13, #0x1fffffff umull x13, w13, w30 add x4, x4, x13 add x15, x15, x14, lsr #29 and x14, x14, #0x1fffffff umull x14, w14, w30 add x5, x5, x14 add x16, x16, x15, lsr #29 and x15, x15, #0x1fffffff umull x15, w15, w30 add x6, x6, x15 lsr x9, x16, #29 and x16, x16, #0x1fffffff umull x16, w16, w30 add x7, x7, x16 umull x9, w9, w30 add x8, x8, x9 add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff add x1, x1, x0, lsr #29 and x0, x0, 0x1fffffff add x6, x6, x5, lsr #29 and x5, x5, 0x1fffffff add x2, x2, x1, lsr #29 and x1, x1, 0x1fffffff add x7, x7, x6, lsr #29 and x6, x6, 0x1fffffff add x3, x3, x2, lsr #29 and x2, x2, 0x1fffffff add x8, x8, x7, lsr #29 and x7, x7, 0x1fffffff add x4, x4, x3, lsr #29 and x3, x3, 0x1fffffff bfi x3, x7, #32, #29 bic x10, x8, #0x7fffff add x0, x0, x10, lsr #23 add x0, x0, x10, lsr #22 add x0, x0, x10, lsr #19 and x8, x8, #0x7fffff add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff bfi x4, x8, #32, #23 add x1, x1, x0, lsr #29 bfi x6, x1, #32, #30 and x0, x0, 0x1fffffff bfi x5, x0, #32, #29 stp x3, x4, [sp, #472] stp x5, x6, [sp, #488] str x2, [sp, #504] ldrsb w26, [sp, #144] lsr w8, w26, #1 mov w7, w8 mov x9, #160 mul x8, x8, x9 ldr x0, [sp, #104] add x0, x0, x8 str x0, [sp, #152] /* pnielsadd p1p1 */ // add ldp x23, x24, [sp, #392] ldp x25, x26, [sp, #408] ldr x22, [sp, #424] ldp x13, x14, [sp, #352] ldp x15, x16, [sp, #368] ldr x12, [sp, #384] add x3, x23, x13 add x4, x24, x14 add x5, x25, x15 add x6, x26, x16 add x2, x22, x12 add x29, sp, #712 stp x3, x4, [x29, #0] stp x5, x6, [x29, #16] str x2, [x29, #32] // sub ldp x20, x21, [sp, #160] ldp x27, x28, [sp, #176] add x23, x23, x20 add x24, x24, x21 add x25, x25, x27 add x26, x26, x20 add x22, x22, x28 sub x23, x23, x13 sub x24, x24, x14 sub x25, x25, x15 sub x26, x26, x16 sub x22, x22, x12 // mul ldr x0, [sp, #152] ldp w13, w17, [x0, #0] ldp w14, w18, [x0, #8] ldp w15, w10, [x0, #16] ldp w16, w11, [x0, #24] ldr w12, [x0, #32] lsr x27, x23, #32 lsr x28, x24, #32 lsr x20, x25, #32 lsr x21, x26, #32 umull x0, w10, w20 umull x1, w10, w21 umull x2, w10, w22 umull x3, w10, w23 umull x4, w10, w24 umull x5, w10, w25 umull x6, w10, w26 umull x7, w10, w27 umull x8, w10, w28 umaddl x1, w11, w20, x1 umaddl x2, w11, w21, x2 umaddl x3, w11, w22, x3 umaddl x4, w11, w23, x4 umaddl x5, w11, w24, x5 umaddl x6, w11, w25, x6 umaddl x7, w11, w26, x7 umaddl x8, w11, w27, x8 umull x9, w11, w28 umaddl x2, w12, w20, x2 umaddl x3, w12, w21, x3 umaddl x4, w12, w22, x4 umaddl x5, w12, w23, x5 umaddl x6, w12, w24, x6 umaddl x7, w12, w25, x7 umaddl x8, w12, w26, x8 umaddl x9, w12, w27, x9 umull x10, w12, w28 umaddl x3, w13, w20, x3 umaddl x4, w13, w21, x4 umaddl x5, w13, w22, x5 umaddl x6, w13, w23, x6 umaddl x7, w13, w24, x7 umaddl x8, w13, w25, x8 umaddl x9, w13, w26, x9 umaddl x10, w13, w27, x10 umull x11, w13, w28 umaddl x4, w14, w20, x4 umaddl x5, w14, w21, x5 umaddl x6, w14, w22, x6 umaddl x7, w14, w23, x7 umaddl x8, w14, w24, x8 umaddl x9, w14, w25, x9 umaddl x10, w14, w26, x10 umaddl x11, w14, w27, x11 umull x12, w14, w28 umaddl x5, w15, w20, x5 umaddl x6, w15, w21, x6 umaddl x7, w15, w22, x7 umaddl x8, w15, w23, x8 umaddl x9, w15, w24, x9 umaddl x10, w15, w25, x10 umaddl x11, w15, w26, x11 umaddl x12, w15, w27, x12 umull x13, w15, w28 umaddl x6, w16, w20, x6 umaddl x7, w16, w21, x7 umaddl x8, w16, w22, x8 umaddl x9, w16, w23, x9 umaddl x10, w16, w24, x10 umaddl x11, w16, w25, x11 umaddl x12, w16, w26, x12 umaddl x13, w16, w27, x13 umull x14, w16, w28 umaddl x7, w17, w20, x7 umaddl x8, w17, w21, x8 umaddl x9, w17, w22, x9 umaddl x10, w17, w23, x10 umaddl x11, w17, w24, x11 umaddl x12, w17, w25, x12 umaddl x13, w17, w26, x13 umaddl x14, w17, w27, x14 umull x15, w17, w28 umaddl x8, w18, w20, x8 umaddl x9, w18, w21, x9 umaddl x10, w18, w22, x10 umaddl x11, w18, w23, x11 umaddl x12, w18, w24, x12 umaddl x13, w18, w25, x13 umaddl x14, w18, w26, x14 umaddl x15, w18, w27, x15 umull x16, w18, w28 add x10, x10, x9, lsr #29 and x9, x9, #0x1fffffff umull x9, w9, w30 add x0, x0, x9 add x11, x11, x10, lsr #29 and x10, x10, #0x1fffffff umull x10, w10, w30 add x1, x1, x10 add x12, x12, x11, lsr #29 and x11, x11, #0x1fffffff umull x11, w11, w30 add x2, x2, x11 add x13, x13, x12, lsr #29 and x12, x12, #0x1fffffff umull x12, w12, w30 add x3, x3, x12 add x14, x14, x13, lsr #29 and x13, x13, #0x1fffffff umull x13, w13, w30 add x4, x4, x13 add x15, x15, x14, lsr #29 and x14, x14, #0x1fffffff umull x14, w14, w30 add x5, x5, x14 add x16, x16, x15, lsr #29 and x15, x15, #0x1fffffff umull x15, w15, w30 add x6, x6, x15 lsr x9, x16, #29 and x16, x16, #0x1fffffff umull x16, w16, w30 add x7, x7, x16 umull x9, w9, w30 add x8, x8, x9 add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff add x1, x1, x0, lsr #29 and x0, x0, 0x1fffffff add x6, x6, x5, lsr #29 and x5, x5, 0x1fffffff add x2, x2, x1, lsr #29 and x1, x1, 0x1fffffff add x7, x7, x6, lsr #29 and x6, x6, 0x1fffffff add x3, x3, x2, lsr #29 and x2, x2, 0x1fffffff add x8, x8, x7, lsr #29 and x7, x7, 0x1fffffff add x4, x4, x3, lsr #29 and x3, x3, 0x1fffffff bfi x3, x7, #32, #29 bic x10, x8, #0x7fffff add x0, x0, x10, lsr #23 add x0, x0, x10, lsr #22 add x0, x0, x10, lsr #19 and x8, x8, #0x7fffff add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff bfi x4, x8, #32, #23 add x1, x1, x0, lsr #29 bfi x6, x1, #32, #30 and x0, x0, 0x1fffffff bfi x5, x0, #32, #29 add x29, sp, #672 stp x3, x4, [x29, #0] stp x5, x6, [x29, #16] str x2, [x29, #32] // mul ldr x0, [sp, #152] ldp w13, w17, [x0, #40] ldp w14, w18, [x0, #48] ldp w15, w10, [x0, #56] ldp w16, w11, [x0, #64] ldr w12, [x0, #72] ldp w23, w27, [x29, #40] ldp w24, w28, [x29, #48] ldp w25, w20, [x29, #56] ldp w26, w21, [x29, #64] ldr w22, [x29, #72] umull x0, w10, w20 umull x1, w10, w21 umull x2, w10, w22 umull x3, w10, w23 umull x4, w10, w24 umull x5, w10, w25 umull x6, w10, w26 umull x7, w10, w27 umull x8, w10, w28 umaddl x1, w11, w20, x1 umaddl x2, w11, w21, x2 umaddl x3, w11, w22, x3 umaddl x4, w11, w23, x4 umaddl x5, w11, w24, x5 umaddl x6, w11, w25, x6 umaddl x7, w11, w26, x7 umaddl x8, w11, w27, x8 umull x9, w11, w28 umaddl x2, w12, w20, x2 umaddl x3, w12, w21, x3 umaddl x4, w12, w22, x4 umaddl x5, w12, w23, x5 umaddl x6, w12, w24, x6 umaddl x7, w12, w25, x7 umaddl x8, w12, w26, x8 umaddl x9, w12, w27, x9 umull x10, w12, w28 umaddl x3, w13, w20, x3 umaddl x4, w13, w21, x4 umaddl x5, w13, w22, x5 umaddl x6, w13, w23, x6 umaddl x7, w13, w24, x7 umaddl x8, w13, w25, x8 umaddl x9, w13, w26, x9 umaddl x10, w13, w27, x10 umull x11, w13, w28 umaddl x4, w14, w20, x4 umaddl x5, w14, w21, x5 umaddl x6, w14, w22, x6 umaddl x7, w14, w23, x7 umaddl x8, w14, w24, x8 umaddl x9, w14, w25, x9 umaddl x10, w14, w26, x10 umaddl x11, w14, w27, x11 umull x12, w14, w28 umaddl x5, w15, w20, x5 umaddl x6, w15, w21, x6 umaddl x7, w15, w22, x7 umaddl x8, w15, w23, x8 umaddl x9, w15, w24, x9 umaddl x10, w15, w25, x10 umaddl x11, w15, w26, x11 umaddl x12, w15, w27, x12 umull x13, w15, w28 umaddl x6, w16, w20, x6 umaddl x7, w16, w21, x7 umaddl x8, w16, w22, x8 umaddl x9, w16, w23, x9 umaddl x10, w16, w24, x10 umaddl x11, w16, w25, x11 umaddl x12, w16, w26, x12 umaddl x13, w16, w27, x13 umull x14, w16, w28 umaddl x7, w17, w20, x7 umaddl x8, w17, w21, x8 umaddl x9, w17, w22, x9 umaddl x10, w17, w23, x10 umaddl x11, w17, w24, x11 umaddl x12, w17, w25, x12 umaddl x13, w17, w26, x13 umaddl x14, w17, w27, x14 umull x15, w17, w28 umaddl x8, w18, w20, x8 umaddl x9, w18, w21, x9 umaddl x10, w18, w22, x10 umaddl x11, w18, w23, x11 umaddl x12, w18, w24, x12 umaddl x13, w18, w25, x13 umaddl x14, w18, w26, x14 umaddl x15, w18, w27, x15 umull x16, w18, w28 add x10, x10, x9, lsr #29 and x9, x9, #0x1fffffff umull x9, w9, w30 add x0, x0, x9 add x11, x11, x10, lsr #29 and x10, x10, #0x1fffffff umull x10, w10, w30 add x1, x1, x10 add x12, x12, x11, lsr #29 and x11, x11, #0x1fffffff umull x11, w11, w30 add x2, x2, x11 add x13, x13, x12, lsr #29 and x12, x12, #0x1fffffff umull x12, w12, w30 add x3, x3, x12 add x14, x14, x13, lsr #29 and x13, x13, #0x1fffffff umull x13, w13, w30 add x4, x4, x13 add x15, x15, x14, lsr #29 and x14, x14, #0x1fffffff umull x14, w14, w30 add x5, x5, x14 add x16, x16, x15, lsr #29 and x15, x15, #0x1fffffff umull x15, w15, w30 add x6, x6, x15 lsr x9, x16, #29 and x16, x16, #0x1fffffff umull x16, w16, w30 add x7, x7, x16 umull x9, w9, w30 add x8, x8, x9 add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff add x1, x1, x0, lsr #29 and x0, x0, 0x1fffffff add x6, x6, x5, lsr #29 and x5, x5, 0x1fffffff add x2, x2, x1, lsr #29 and x1, x1, 0x1fffffff add x7, x7, x6, lsr #29 and x6, x6, 0x1fffffff add x3, x3, x2, lsr #29 and x2, x2, 0x1fffffff add x8, x8, x7, lsr #29 and x7, x7, 0x1fffffff add x4, x4, x3, lsr #29 and x3, x3, 0x1fffffff bfi x3, x7, #32, #29 bic x10, x8, #0x7fffff add x0, x0, x10, lsr #23 add x0, x0, x10, lsr #22 add x0, x0, x10, lsr #19 and x8, x8, #0x7fffff add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff bfi x4, x8, #32, #23 add x1, x1, x0, lsr #29 bfi x6, x1, #32, #30 and x0, x0, 0x1fffffff bfi x5, x0, #32, #29 // add add x29, sp, #472 ldp x13, x14, [x29, #200] ldp x15, x16, [x29, #216] ldr x12, [x29, #232] add x0, x3, x13 add x1, x4, x14 add x7, x5, x15 add x8, x6, x16 add x9, x2, x12 stp x0, x1, [x29, #120] stp x7, x8, [x29, #136] str x9, [x29, #152] // sub ldp x20, x21, [sp, #160] ldp x27, x28, [sp, #176] add x3, x3, x20 add x4, x4, x21 add x5, x5, x27 add x6, x6, x20 add x2, x2, x28 sub x3, x3, x13 sub x4, x4, x14 sub x5, x5, x15 sub x6, x6, x16 sub x2, x2, x12 stp x3, x4, [x29, #40] stp x5, x6, [x29, #56] str x2, [x29, #72] // mul ldr x0, [sp, #152] ldp w13, w17, [x0, #120] ldp w14, w18, [x0, #128] ldp w15, w10, [x0, #136] ldp w16, w11, [x0, #144] ldr w12, [x0, #152] ldp w23, w27, [x29, #0] ldp w24, w28, [x29, #8] ldp w25, w20, [x29, #16] ldp w26, w21, [x29, #24] ldr w22, [x29, #32] umull x0, w10, w20 umull x1, w10, w21 umull x2, w10, w22 umull x3, w10, w23 umull x4, w10, w24 umull x5, w10, w25 umull x6, w10, w26 umull x7, w10, w27 umull x8, w10, w28 umaddl x1, w11, w20, x1 umaddl x2, w11, w21, x2 umaddl x3, w11, w22, x3 umaddl x4, w11, w23, x4 umaddl x5, w11, w24, x5 umaddl x6, w11, w25, x6 umaddl x7, w11, w26, x7 umaddl x8, w11, w27, x8 umull x9, w11, w28 umaddl x2, w12, w20, x2 umaddl x3, w12, w21, x3 umaddl x4, w12, w22, x4 umaddl x5, w12, w23, x5 umaddl x6, w12, w24, x6 umaddl x7, w12, w25, x7 umaddl x8, w12, w26, x8 umaddl x9, w12, w27, x9 umull x10, w12, w28 umaddl x3, w13, w20, x3 umaddl x4, w13, w21, x4 umaddl x5, w13, w22, x5 umaddl x6, w13, w23, x6 umaddl x7, w13, w24, x7 umaddl x8, w13, w25, x8 umaddl x9, w13, w26, x9 umaddl x10, w13, w27, x10 umull x11, w13, w28 umaddl x4, w14, w20, x4 umaddl x5, w14, w21, x5 umaddl x6, w14, w22, x6 umaddl x7, w14, w23, x7 umaddl x8, w14, w24, x8 umaddl x9, w14, w25, x9 umaddl x10, w14, w26, x10 umaddl x11, w14, w27, x11 umull x12, w14, w28 umaddl x5, w15, w20, x5 umaddl x6, w15, w21, x6 umaddl x7, w15, w22, x7 umaddl x8, w15, w23, x8 umaddl x9, w15, w24, x9 umaddl x10, w15, w25, x10 umaddl x11, w15, w26, x11 umaddl x12, w15, w27, x12 umull x13, w15, w28 umaddl x6, w16, w20, x6 umaddl x7, w16, w21, x7 umaddl x8, w16, w22, x8 umaddl x9, w16, w23, x9 umaddl x10, w16, w24, x10 umaddl x11, w16, w25, x11 umaddl x12, w16, w26, x12 umaddl x13, w16, w27, x13 umull x14, w16, w28 umaddl x7, w17, w20, x7 umaddl x8, w17, w21, x8 umaddl x9, w17, w22, x9 umaddl x10, w17, w23, x10 umaddl x11, w17, w24, x11 umaddl x12, w17, w25, x12 umaddl x13, w17, w26, x13 umaddl x14, w17, w27, x14 umull x15, w17, w28 umaddl x8, w18, w20, x8 umaddl x9, w18, w21, x9 umaddl x10, w18, w22, x10 umaddl x11, w18, w23, x11 umaddl x12, w18, w24, x12 umaddl x13, w18, w25, x13 umaddl x14, w18, w26, x14 umaddl x15, w18, w27, x15 umull x16, w18, w28 add x10, x10, x9, lsr #29 and x9, x9, #0x1fffffff umull x9, w9, w30 add x0, x0, x9 add x11, x11, x10, lsr #29 and x10, x10, #0x1fffffff umull x10, w10, w30 add x1, x1, x10 add x12, x12, x11, lsr #29 and x11, x11, #0x1fffffff umull x11, w11, w30 add x2, x2, x11 add x13, x13, x12, lsr #29 and x12, x12, #0x1fffffff umull x12, w12, w30 add x3, x3, x12 add x14, x14, x13, lsr #29 and x13, x13, #0x1fffffff umull x13, w13, w30 add x4, x4, x13 add x15, x15, x14, lsr #29 and x14, x14, #0x1fffffff umull x14, w14, w30 add x5, x5, x14 add x16, x16, x15, lsr #29 and x15, x15, #0x1fffffff umull x15, w15, w30 add x6, x6, x15 lsr x9, x16, #29 and x16, x16, #0x1fffffff umull x16, w16, w30 add x7, x7, x16 umull x9, w9, w30 add x8, x8, x9 add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff add x1, x1, x0, lsr #29 and x0, x0, 0x1fffffff add x6, x6, x5, lsr #29 and x5, x5, 0x1fffffff add x2, x2, x1, lsr #29 and x1, x1, 0x1fffffff add x7, x7, x6, lsr #29 and x6, x6, 0x1fffffff add x3, x3, x2, lsr #29 and x2, x2, 0x1fffffff add x8, x8, x7, lsr #29 and x7, x7, 0x1fffffff add x4, x4, x3, lsr #29 and x3, x3, 0x1fffffff bfi x3, x7, #32, #29 bic x10, x8, #0x7fffff add x0, x0, x10, lsr #23 add x0, x0, x10, lsr #22 add x0, x0, x10, lsr #19 and x8, x8, #0x7fffff add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff bfi x4, x8, #32, #23 add x1, x1, x0, lsr #29 bfi x6, x1, #32, #30 and x0, x0, 0x1fffffff bfi x5, x0, #32, #29 add x29, sp, #672 stp x3, x4, [x29, #0] stp x5, x6, [x29, #16] str x2, [x29, #32] // mul ldr x0, [sp, #152] ldp w13, w17, [x0, #80] ldp w14, w18, [x0, #88] ldp w15, w10, [x0, #96] ldp w16, w11, [x0, #104] ldr w12, [x0, #112] add x29, sp, #432 ldp w23, w27, [x29, #0] ldp w24, w28, [x29, #8] ldp w25, w20, [x29, #16] ldp w26, w21, [x29, #24] ldr w22, [x29, #32] umull x0, w10, w20 umull x1, w10, w21 umull x2, w10, w22 umull x3, w10, w23 umull x4, w10, w24 umull x5, w10, w25 umull x6, w10, w26 umull x7, w10, w27 umull x8, w10, w28 umaddl x1, w11, w20, x1 umaddl x2, w11, w21, x2 umaddl x3, w11, w22, x3 umaddl x4, w11, w23, x4 umaddl x5, w11, w24, x5 umaddl x6, w11, w25, x6 umaddl x7, w11, w26, x7 umaddl x8, w11, w27, x8 umull x9, w11, w28 umaddl x2, w12, w20, x2 umaddl x3, w12, w21, x3 umaddl x4, w12, w22, x4 umaddl x5, w12, w23, x5 umaddl x6, w12, w24, x6 umaddl x7, w12, w25, x7 umaddl x8, w12, w26, x8 umaddl x9, w12, w27, x9 umull x10, w12, w28 umaddl x3, w13, w20, x3 umaddl x4, w13, w21, x4 umaddl x5, w13, w22, x5 umaddl x6, w13, w23, x6 umaddl x7, w13, w24, x7 umaddl x8, w13, w25, x8 umaddl x9, w13, w26, x9 umaddl x10, w13, w27, x10 umull x11, w13, w28 umaddl x4, w14, w20, x4 umaddl x5, w14, w21, x5 umaddl x6, w14, w22, x6 umaddl x7, w14, w23, x7 umaddl x8, w14, w24, x8 umaddl x9, w14, w25, x9 umaddl x10, w14, w26, x10 umaddl x11, w14, w27, x11 umull x12, w14, w28 umaddl x5, w15, w20, x5 umaddl x6, w15, w21, x6 umaddl x7, w15, w22, x7 umaddl x8, w15, w23, x8 umaddl x9, w15, w24, x9 umaddl x10, w15, w25, x10 umaddl x11, w15, w26, x11 umaddl x12, w15, w27, x12 umull x13, w15, w28 umaddl x6, w16, w20, x6 umaddl x7, w16, w21, x7 umaddl x8, w16, w22, x8 umaddl x9, w16, w23, x9 umaddl x10, w16, w24, x10 umaddl x11, w16, w25, x11 umaddl x12, w16, w26, x12 umaddl x13, w16, w27, x13 umull x14, w16, w28 umaddl x7, w17, w20, x7 umaddl x8, w17, w21, x8 umaddl x9, w17, w22, x9 umaddl x10, w17, w23, x10 umaddl x11, w17, w24, x11 umaddl x12, w17, w25, x12 umaddl x13, w17, w26, x13 umaddl x14, w17, w27, x14 umull x15, w17, w28 umaddl x8, w18, w20, x8 umaddl x9, w18, w21, x9 umaddl x10, w18, w22, x10 umaddl x11, w18, w23, x11 umaddl x12, w18, w24, x12 umaddl x13, w18, w25, x13 umaddl x14, w18, w26, x14 umaddl x15, w18, w27, x15 umull x16, w18, w28 add x10, x10, x9, lsr #29 and x9, x9, #0x1fffffff umull x9, w9, w30 add x0, x0, x9 add x11, x11, x10, lsr #29 and x10, x10, #0x1fffffff umull x10, w10, w30 add x1, x1, x10 add x12, x12, x11, lsr #29 and x11, x11, #0x1fffffff umull x11, w11, w30 add x2, x2, x11 add x13, x13, x12, lsr #29 and x12, x12, #0x1fffffff umull x12, w12, w30 add x3, x3, x12 add x14, x14, x13, lsr #29 and x13, x13, #0x1fffffff umull x13, w13, w30 add x4, x4, x13 add x15, x15, x14, lsr #29 and x14, x14, #0x1fffffff umull x14, w14, w30 add x5, x5, x14 add x16, x16, x15, lsr #29 and x15, x15, #0x1fffffff umull x15, w15, w30 add x6, x6, x15 lsr x9, x16, #29 and x16, x16, #0x1fffffff umull x16, w16, w30 add x7, x7, x16 umull x9, w9, w30 add x8, x8, x9 // double and then reduce add x0, x0, x0 add x1, x1, x1 add x2, x2, x2 add x3, x3, x3 add x4, x4, x4 add x5, x5, x5 add x6, x6, x6 add x7, x7, x7 add x8, x8, x8 add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff add x1, x1, x0, lsr #29 and x0, x0, 0x1fffffff add x6, x6, x5, lsr #29 and x5, x5, 0x1fffffff add x2, x2, x1, lsr #29 and x1, x1, 0x1fffffff add x7, x7, x6, lsr #29 and x6, x6, 0x1fffffff add x3, x3, x2, lsr #29 and x2, x2, 0x1fffffff add x8, x8, x7, lsr #29 and x7, x7, 0x1fffffff add x4, x4, x3, lsr #29 and x3, x3, 0x1fffffff bfi x3, x7, #32, #29 bic x10, x8, #0x7fffff add x0, x0, x10, lsr #23 add x0, x0, x10, lsr #22 add x0, x0, x10, lsr #19 and x8, x8, #0x7fffff add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff bfi x4, x8, #32, #23 add x1, x1, x0, lsr #29 bfi x6, x1, #32, #30 and x0, x0, 0x1fffffff bfi x5, x0, #32, #29 // add add x29, sp, #552 ldp x13, x14, [x29, #120] ldp x15, x16, [x29, #136] ldr x12, [x29, #152] add x0, x3, x13 add x1, x4, x14 add x7, x5, x15 add x8, x6, x16 add x9, x2, x12 stp x0, x1, [x29, #0] stp x7, x8, [x29, #16] str x9, [x29, #32] // sub ldp x20, x21, [sp, #160] ldp x27, x28, [sp, #176] add x3, x3, x20 add x4, x4, x21 add x5, x5, x27 add x6, x6, x20 add x2, x2, x28 sub x3, x3, x13 sub x4, x4, x14 sub x5, x5, x15 sub x6, x6, x16 sub x2, x2, x12 stp x3, x4, [x29, #80] stp x5, x6, [x29, #96] str x2, [x29, #112] b .L6 .L5: /* p1p1 to p3 */ // mul add x29, sp, #512 ldp w13, w17, [x29, #0] ldp w14, w18, [x29, #8] ldp w15, w10, [x29, #16] ldp w16, w11, [x29, #24] ldr w12, [x29, #32] ldp w23, w27, [x29, #120] ldp w24, w28, [x29, #128] ldp w25, w20, [x29, #136] ldp w26, w21, [x29, #144] ldr w22, [x29, #152] umull x0, w10, w20 umull x1, w10, w21 umull x2, w10, w22 umull x3, w10, w23 umull x4, w10, w24 umull x5, w10, w25 umull x6, w10, w26 umull x7, w10, w27 umull x8, w10, w28 umaddl x1, w11, w20, x1 umaddl x2, w11, w21, x2 umaddl x3, w11, w22, x3 umaddl x4, w11, w23, x4 umaddl x5, w11, w24, x5 umaddl x6, w11, w25, x6 umaddl x7, w11, w26, x7 umaddl x8, w11, w27, x8 umull x9, w11, w28 umaddl x2, w12, w20, x2 umaddl x3, w12, w21, x3 umaddl x4, w12, w22, x4 umaddl x5, w12, w23, x5 umaddl x6, w12, w24, x6 umaddl x7, w12, w25, x7 umaddl x8, w12, w26, x8 umaddl x9, w12, w27, x9 umull x10, w12, w28 umaddl x3, w13, w20, x3 umaddl x4, w13, w21, x4 umaddl x5, w13, w22, x5 umaddl x6, w13, w23, x6 umaddl x7, w13, w24, x7 umaddl x8, w13, w25, x8 umaddl x9, w13, w26, x9 umaddl x10, w13, w27, x10 umull x11, w13, w28 umaddl x4, w14, w20, x4 umaddl x5, w14, w21, x5 umaddl x6, w14, w22, x6 umaddl x7, w14, w23, x7 umaddl x8, w14, w24, x8 umaddl x9, w14, w25, x9 umaddl x10, w14, w26, x10 umaddl x11, w14, w27, x11 umull x12, w14, w28 umaddl x5, w15, w20, x5 umaddl x6, w15, w21, x6 umaddl x7, w15, w22, x7 umaddl x8, w15, w23, x8 umaddl x9, w15, w24, x9 umaddl x10, w15, w25, x10 umaddl x11, w15, w26, x11 umaddl x12, w15, w27, x12 umull x13, w15, w28 umaddl x6, w16, w20, x6 umaddl x7, w16, w21, x7 umaddl x8, w16, w22, x8 umaddl x9, w16, w23, x9 umaddl x10, w16, w24, x10 umaddl x11, w16, w25, x11 umaddl x12, w16, w26, x12 umaddl x13, w16, w27, x13 umull x14, w16, w28 umaddl x7, w17, w20, x7 umaddl x8, w17, w21, x8 umaddl x9, w17, w22, x9 umaddl x10, w17, w23, x10 umaddl x11, w17, w24, x11 umaddl x12, w17, w25, x12 umaddl x13, w17, w26, x13 umaddl x14, w17, w27, x14 umull x15, w17, w28 umaddl x8, w18, w20, x8 umaddl x9, w18, w21, x9 umaddl x10, w18, w22, x10 umaddl x11, w18, w23, x11 umaddl x12, w18, w24, x12 umaddl x13, w18, w25, x13 umaddl x14, w18, w26, x14 umaddl x15, w18, w27, x15 umull x16, w18, w28 add x10, x10, x9, lsr #29 and x9, x9, #0x1fffffff umull x9, w9, w30 add x0, x0, x9 add x11, x11, x10, lsr #29 and x10, x10, #0x1fffffff umull x10, w10, w30 add x1, x1, x10 add x12, x12, x11, lsr #29 and x11, x11, #0x1fffffff umull x11, w11, w30 add x2, x2, x11 add x13, x13, x12, lsr #29 and x12, x12, #0x1fffffff umull x12, w12, w30 add x3, x3, x12 add x14, x14, x13, lsr #29 and x13, x13, #0x1fffffff umull x13, w13, w30 add x4, x4, x13 add x15, x15, x14, lsr #29 and x14, x14, #0x1fffffff umull x14, w14, w30 add x5, x5, x14 add x16, x16, x15, lsr #29 and x15, x15, #0x1fffffff umull x15, w15, w30 add x6, x6, x15 lsr x9, x16, #29 and x16, x16, #0x1fffffff umull x16, w16, w30 add x7, x7, x16 umull x9, w9, w30 add x8, x8, x9 add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff add x1, x1, x0, lsr #29 and x0, x0, 0x1fffffff add x6, x6, x5, lsr #29 and x5, x5, 0x1fffffff add x2, x2, x1, lsr #29 and x1, x1, 0x1fffffff add x7, x7, x6, lsr #29 and x6, x6, 0x1fffffff add x3, x3, x2, lsr #29 and x2, x2, 0x1fffffff add x8, x8, x7, lsr #29 and x7, x7, 0x1fffffff add x4, x4, x3, lsr #29 and x3, x3, 0x1fffffff bfi x3, x7, #32, #29 bic x10, x8, #0x7fffff add x0, x0, x10, lsr #23 add x0, x0, x10, lsr #22 add x0, x0, x10, lsr #19 and x8, x8, #0x7fffff add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff bfi x4, x8, #32, #23 add x1, x1, x0, lsr #29 bfi x6, x1, #32, #30 and x0, x0, 0x1fffffff bfi x5, x0, #32, #29 stp x3, x4, [sp, #352] stp x5, x6, [sp, #368] str x2, [sp, #384] // mul add x29, sp, #552 ldp w13, w17, [x29, #0] ldp w14, w18, [x29, #8] ldp w15, w10, [x29, #16] ldp w16, w11, [x29, #24] ldr w12, [x29, #32] ldp w23, w27, [x29, #40] ldp w24, w28, [x29, #48] ldp w25, w20, [x29, #56] ldp w26, w21, [x29, #64] ldr w22, [x29, #72] umull x0, w10, w20 umull x1, w10, w21 umull x2, w10, w22 umull x3, w10, w23 umull x4, w10, w24 umull x5, w10, w25 umull x6, w10, w26 umull x7, w10, w27 umull x8, w10, w28 umaddl x1, w11, w20, x1 umaddl x2, w11, w21, x2 umaddl x3, w11, w22, x3 umaddl x4, w11, w23, x4 umaddl x5, w11, w24, x5 umaddl x6, w11, w25, x6 umaddl x7, w11, w26, x7 umaddl x8, w11, w27, x8 umull x9, w11, w28 umaddl x2, w12, w20, x2 umaddl x3, w12, w21, x3 umaddl x4, w12, w22, x4 umaddl x5, w12, w23, x5 umaddl x6, w12, w24, x6 umaddl x7, w12, w25, x7 umaddl x8, w12, w26, x8 umaddl x9, w12, w27, x9 umull x10, w12, w28 umaddl x3, w13, w20, x3 umaddl x4, w13, w21, x4 umaddl x5, w13, w22, x5 umaddl x6, w13, w23, x6 umaddl x7, w13, w24, x7 umaddl x8, w13, w25, x8 umaddl x9, w13, w26, x9 umaddl x10, w13, w27, x10 umull x11, w13, w28 umaddl x4, w14, w20, x4 umaddl x5, w14, w21, x5 umaddl x6, w14, w22, x6 umaddl x7, w14, w23, x7 umaddl x8, w14, w24, x8 umaddl x9, w14, w25, x9 umaddl x10, w14, w26, x10 umaddl x11, w14, w27, x11 umull x12, w14, w28 umaddl x5, w15, w20, x5 umaddl x6, w15, w21, x6 umaddl x7, w15, w22, x7 umaddl x8, w15, w23, x8 umaddl x9, w15, w24, x9 umaddl x10, w15, w25, x10 umaddl x11, w15, w26, x11 umaddl x12, w15, w27, x12 umull x13, w15, w28 umaddl x6, w16, w20, x6 umaddl x7, w16, w21, x7 umaddl x8, w16, w22, x8 umaddl x9, w16, w23, x9 umaddl x10, w16, w24, x10 umaddl x11, w16, w25, x11 umaddl x12, w16, w26, x12 umaddl x13, w16, w27, x13 umull x14, w16, w28 umaddl x7, w17, w20, x7 umaddl x8, w17, w21, x8 umaddl x9, w17, w22, x9 umaddl x10, w17, w23, x10 umaddl x11, w17, w24, x11 umaddl x12, w17, w25, x12 umaddl x13, w17, w26, x13 umaddl x14, w17, w27, x14 umull x15, w17, w28 umaddl x8, w18, w20, x8 umaddl x9, w18, w21, x9 umaddl x10, w18, w22, x10 umaddl x11, w18, w23, x11 umaddl x12, w18, w24, x12 umaddl x13, w18, w25, x13 umaddl x14, w18, w26, x14 umaddl x15, w18, w27, x15 umull x16, w18, w28 add x10, x10, x9, lsr #29 and x9, x9, #0x1fffffff umull x9, w9, w30 add x0, x0, x9 add x11, x11, x10, lsr #29 and x10, x10, #0x1fffffff umull x10, w10, w30 add x1, x1, x10 add x12, x12, x11, lsr #29 and x11, x11, #0x1fffffff umull x11, w11, w30 add x2, x2, x11 add x13, x13, x12, lsr #29 and x12, x12, #0x1fffffff umull x12, w12, w30 add x3, x3, x12 add x14, x14, x13, lsr #29 and x13, x13, #0x1fffffff umull x13, w13, w30 add x4, x4, x13 add x15, x15, x14, lsr #29 and x14, x14, #0x1fffffff umull x14, w14, w30 add x5, x5, x14 add x16, x16, x15, lsr #29 and x15, x15, #0x1fffffff umull x15, w15, w30 add x6, x6, x15 lsr x9, x16, #29 and x16, x16, #0x1fffffff umull x16, w16, w30 add x7, x7, x16 umull x9, w9, w30 add x8, x8, x9 add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff add x1, x1, x0, lsr #29 and x0, x0, 0x1fffffff add x6, x6, x5, lsr #29 and x5, x5, 0x1fffffff add x2, x2, x1, lsr #29 and x1, x1, 0x1fffffff add x7, x7, x6, lsr #29 and x6, x6, 0x1fffffff add x3, x3, x2, lsr #29 and x2, x2, 0x1fffffff add x8, x8, x7, lsr #29 and x7, x7, 0x1fffffff add x4, x4, x3, lsr #29 and x3, x3, 0x1fffffff bfi x3, x7, #32, #29 bic x10, x8, #0x7fffff add x0, x0, x10, lsr #23 add x0, x0, x10, lsr #22 add x0, x0, x10, lsr #19 and x8, x8, #0x7fffff add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff bfi x4, x8, #32, #23 add x1, x1, x0, lsr #29 bfi x6, x1, #32, #30 and x0, x0, 0x1fffffff bfi x5, x0, #32, #29 stp x3, x4, [sp, #392] stp x5, x6, [sp, #408] str x2, [sp, #424] // mul add x29, sp, #552 ldp w13, w17, [x29, #0] ldp w14, w18, [x29, #8] ldp w15, w10, [x29, #16] ldp w16, w11, [x29, #24] ldr w12, [x29, #32] ldp w23, w27, [x29, #80] ldp w24, w28, [x29, #88] ldp w25, w20, [x29, #96] ldp w26, w21, [x29, #104] ldr w22, [x29, #112] umull x0, w10, w20 umull x1, w10, w21 umull x2, w10, w22 umull x3, w10, w23 umull x4, w10, w24 umull x5, w10, w25 umull x6, w10, w26 umull x7, w10, w27 umull x8, w10, w28 umaddl x1, w11, w20, x1 umaddl x2, w11, w21, x2 umaddl x3, w11, w22, x3 umaddl x4, w11, w23, x4 umaddl x5, w11, w24, x5 umaddl x6, w11, w25, x6 umaddl x7, w11, w26, x7 umaddl x8, w11, w27, x8 umull x9, w11, w28 umaddl x2, w12, w20, x2 umaddl x3, w12, w21, x3 umaddl x4, w12, w22, x4 umaddl x5, w12, w23, x5 umaddl x6, w12, w24, x6 umaddl x7, w12, w25, x7 umaddl x8, w12, w26, x8 umaddl x9, w12, w27, x9 umull x10, w12, w28 umaddl x3, w13, w20, x3 umaddl x4, w13, w21, x4 umaddl x5, w13, w22, x5 umaddl x6, w13, w23, x6 umaddl x7, w13, w24, x7 umaddl x8, w13, w25, x8 umaddl x9, w13, w26, x9 umaddl x10, w13, w27, x10 umull x11, w13, w28 umaddl x4, w14, w20, x4 umaddl x5, w14, w21, x5 umaddl x6, w14, w22, x6 umaddl x7, w14, w23, x7 umaddl x8, w14, w24, x8 umaddl x9, w14, w25, x9 umaddl x10, w14, w26, x10 umaddl x11, w14, w27, x11 umull x12, w14, w28 umaddl x5, w15, w20, x5 umaddl x6, w15, w21, x6 umaddl x7, w15, w22, x7 umaddl x8, w15, w23, x8 umaddl x9, w15, w24, x9 umaddl x10, w15, w25, x10 umaddl x11, w15, w26, x11 umaddl x12, w15, w27, x12 umull x13, w15, w28 umaddl x6, w16, w20, x6 umaddl x7, w16, w21, x7 umaddl x8, w16, w22, x8 umaddl x9, w16, w23, x9 umaddl x10, w16, w24, x10 umaddl x11, w16, w25, x11 umaddl x12, w16, w26, x12 umaddl x13, w16, w27, x13 umull x14, w16, w28 umaddl x7, w17, w20, x7 umaddl x8, w17, w21, x8 umaddl x9, w17, w22, x9 umaddl x10, w17, w23, x10 umaddl x11, w17, w24, x11 umaddl x12, w17, w25, x12 umaddl x13, w17, w26, x13 umaddl x14, w17, w27, x14 umull x15, w17, w28 umaddl x8, w18, w20, x8 umaddl x9, w18, w21, x9 umaddl x10, w18, w22, x10 umaddl x11, w18, w23, x11 umaddl x12, w18, w24, x12 umaddl x13, w18, w25, x13 umaddl x14, w18, w26, x14 umaddl x15, w18, w27, x15 umull x16, w18, w28 add x10, x10, x9, lsr #29 and x9, x9, #0x1fffffff umull x9, w9, w30 add x0, x0, x9 add x11, x11, x10, lsr #29 and x10, x10, #0x1fffffff umull x10, w10, w30 add x1, x1, x10 add x12, x12, x11, lsr #29 and x11, x11, #0x1fffffff umull x11, w11, w30 add x2, x2, x11 add x13, x13, x12, lsr #29 and x12, x12, #0x1fffffff umull x12, w12, w30 add x3, x3, x12 add x14, x14, x13, lsr #29 and x13, x13, #0x1fffffff umull x13, w13, w30 add x4, x4, x13 add x15, x15, x14, lsr #29 and x14, x14, #0x1fffffff umull x14, w14, w30 add x5, x5, x14 add x16, x16, x15, lsr #29 and x15, x15, #0x1fffffff umull x15, w15, w30 add x6, x6, x15 lsr x9, x16, #29 and x16, x16, #0x1fffffff umull x16, w16, w30 add x7, x7, x16 umull x9, w9, w30 add x8, x8, x9 add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff add x1, x1, x0, lsr #29 and x0, x0, 0x1fffffff add x6, x6, x5, lsr #29 and x5, x5, 0x1fffffff add x2, x2, x1, lsr #29 and x1, x1, 0x1fffffff add x7, x7, x6, lsr #29 and x6, x6, 0x1fffffff add x3, x3, x2, lsr #29 and x2, x2, 0x1fffffff add x8, x8, x7, lsr #29 and x7, x7, 0x1fffffff add x4, x4, x3, lsr #29 and x3, x3, 0x1fffffff bfi x3, x7, #32, #29 bic x10, x8, #0x7fffff add x0, x0, x10, lsr #23 add x0, x0, x10, lsr #22 add x0, x0, x10, lsr #19 and x8, x8, #0x7fffff add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff bfi x4, x8, #32, #23 add x1, x1, x0, lsr #29 bfi x6, x1, #32, #30 and x0, x0, 0x1fffffff bfi x5, x0, #32, #29 stp x3, x4, [sp, #432] stp x5, x6, [sp, #448] str x2, [sp, #464] // mul add x29, sp, #512 ldp w13, w17, [x29, #0] ldp w14, w18, [x29, #8] ldp w15, w10, [x29, #16] ldp w16, w11, [x29, #24] ldr w12, [x29, #32] ldp w23, w27, [x29, #80] ldp w24, w28, [x29, #88] ldp w25, w20, [x29, #96] ldp w26, w21, [x29, #104] ldr w22, [x29, #112] umull x0, w10, w20 umull x1, w10, w21 umull x2, w10, w22 umull x3, w10, w23 umull x4, w10, w24 umull x5, w10, w25 umull x6, w10, w26 umull x7, w10, w27 umull x8, w10, w28 umaddl x1, w11, w20, x1 umaddl x2, w11, w21, x2 umaddl x3, w11, w22, x3 umaddl x4, w11, w23, x4 umaddl x5, w11, w24, x5 umaddl x6, w11, w25, x6 umaddl x7, w11, w26, x7 umaddl x8, w11, w27, x8 umull x9, w11, w28 umaddl x2, w12, w20, x2 umaddl x3, w12, w21, x3 umaddl x4, w12, w22, x4 umaddl x5, w12, w23, x5 umaddl x6, w12, w24, x6 umaddl x7, w12, w25, x7 umaddl x8, w12, w26, x8 umaddl x9, w12, w27, x9 umull x10, w12, w28 umaddl x3, w13, w20, x3 umaddl x4, w13, w21, x4 umaddl x5, w13, w22, x5 umaddl x6, w13, w23, x6 umaddl x7, w13, w24, x7 umaddl x8, w13, w25, x8 umaddl x9, w13, w26, x9 umaddl x10, w13, w27, x10 umull x11, w13, w28 umaddl x4, w14, w20, x4 umaddl x5, w14, w21, x5 umaddl x6, w14, w22, x6 umaddl x7, w14, w23, x7 umaddl x8, w14, w24, x8 umaddl x9, w14, w25, x9 umaddl x10, w14, w26, x10 umaddl x11, w14, w27, x11 umull x12, w14, w28 umaddl x5, w15, w20, x5 umaddl x6, w15, w21, x6 umaddl x7, w15, w22, x7 umaddl x8, w15, w23, x8 umaddl x9, w15, w24, x9 umaddl x10, w15, w25, x10 umaddl x11, w15, w26, x11 umaddl x12, w15, w27, x12 umull x13, w15, w28 umaddl x6, w16, w20, x6 umaddl x7, w16, w21, x7 umaddl x8, w16, w22, x8 umaddl x9, w16, w23, x9 umaddl x10, w16, w24, x10 umaddl x11, w16, w25, x11 umaddl x12, w16, w26, x12 umaddl x13, w16, w27, x13 umull x14, w16, w28 umaddl x7, w17, w20, x7 umaddl x8, w17, w21, x8 umaddl x9, w17, w22, x9 umaddl x10, w17, w23, x10 umaddl x11, w17, w24, x11 umaddl x12, w17, w25, x12 umaddl x13, w17, w26, x13 umaddl x14, w17, w27, x14 umull x15, w17, w28 umaddl x8, w18, w20, x8 umaddl x9, w18, w21, x9 umaddl x10, w18, w22, x10 umaddl x11, w18, w23, x11 umaddl x12, w18, w24, x12 umaddl x13, w18, w25, x13 umaddl x14, w18, w26, x14 umaddl x15, w18, w27, x15 umull x16, w18, w28 add x10, x10, x9, lsr #29 and x9, x9, #0x1fffffff umull x9, w9, w30 add x0, x0, x9 add x11, x11, x10, lsr #29 and x10, x10, #0x1fffffff umull x10, w10, w30 add x1, x1, x10 add x12, x12, x11, lsr #29 and x11, x11, #0x1fffffff umull x11, w11, w30 add x2, x2, x11 add x13, x13, x12, lsr #29 and x12, x12, #0x1fffffff umull x12, w12, w30 add x3, x3, x12 add x14, x14, x13, lsr #29 and x13, x13, #0x1fffffff umull x13, w13, w30 add x4, x4, x13 add x15, x15, x14, lsr #29 and x14, x14, #0x1fffffff umull x14, w14, w30 add x5, x5, x14 add x16, x16, x15, lsr #29 and x15, x15, #0x1fffffff umull x15, w15, w30 add x6, x6, x15 lsr x9, x16, #29 and x16, x16, #0x1fffffff umull x16, w16, w30 add x7, x7, x16 umull x9, w9, w30 add x8, x8, x9 add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff add x1, x1, x0, lsr #29 and x0, x0, 0x1fffffff add x6, x6, x5, lsr #29 and x5, x5, 0x1fffffff add x2, x2, x1, lsr #29 and x1, x1, 0x1fffffff add x7, x7, x6, lsr #29 and x6, x6, 0x1fffffff add x3, x3, x2, lsr #29 and x2, x2, 0x1fffffff add x8, x8, x7, lsr #29 and x7, x7, 0x1fffffff add x4, x4, x3, lsr #29 and x3, x3, 0x1fffffff bfi x3, x7, #32, #29 bic x10, x8, #0x7fffff add x0, x0, x10, lsr #23 add x0, x0, x10, lsr #22 add x0, x0, x10, lsr #19 and x8, x8, #0x7fffff add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff bfi x4, x8, #32, #23 add x1, x1, x0, lsr #29 bfi x6, x1, #32, #30 and x0, x0, 0x1fffffff bfi x5, x0, #32, #29 stp x3, x4, [sp, #472] stp x5, x6, [sp, #488] str x2, [sp, #504] mov w9, wzr ldr x26, [sp, #144] sub w9, w9, w26 lsr w9, w9, #1 mov x8, #160 mul x8, x8, x9 ldr x0, [sp, #104] add x0, x0, x8 str x0, [sp, #152] /* pnielssub p1p1 */ // neg ldr x0, [sp, #152] ldp x13, x14, [x0, #120] ldp x15, x16, [x0, #136] ldr x12, [x0, #152] ldp x20, x21, [sp, #160] ldp x27, x28, [sp, #176] sub x13, x20, x13 sub x14, x21, x14 sub x15, x27, x15 sub x16, x20, x16 sub x12, x28, x12 add x29, sp, #712 stp x13, x14, [x29, #40] stp x15, x16, [x29, #56] str x12, [x29, #72] // add ldp x23, x24, [sp, #392] ldp x25, x26, [sp, #408] ldr x22, [sp, #424] ldp x13, x14, [sp, #352] ldp x15, x16, [sp, #368] ldr x12, [sp, #384] add x3, x23, x13 add x4, x24, x14 add x5, x25, x15 add x6, x26, x16 add x2, x22, x12 stp x3, x4, [x29, #0] stp x5, x6, [x29, #16] str x2, [x29, #32] // sub add x23, x23, x20 add x24, x24, x21 add x25, x25, x27 add x26, x26, x20 add x22, x22, x28 sub x23, x23, x13 sub x24, x24, x14 sub x25, x25, x15 sub x26, x26, x16 sub x22, x22, x12 // mul ldr x0, [sp, #152] ldp w13, w17, [x0, #40] ldp w14, w18, [x0, #48] ldp w15, w10, [x0, #56] ldp w16, w11, [x0, #64] ldr w12, [x0, #72] lsr x27, x23, #32 lsr x28, x24, #32 lsr x20, x25, #32 lsr x21, x26, #32 umull x0, w10, w20 umull x1, w10, w21 umull x2, w10, w22 umull x3, w10, w23 umull x4, w10, w24 umull x5, w10, w25 umull x6, w10, w26 umull x7, w10, w27 umull x8, w10, w28 umaddl x1, w11, w20, x1 umaddl x2, w11, w21, x2 umaddl x3, w11, w22, x3 umaddl x4, w11, w23, x4 umaddl x5, w11, w24, x5 umaddl x6, w11, w25, x6 umaddl x7, w11, w26, x7 umaddl x8, w11, w27, x8 umull x9, w11, w28 umaddl x2, w12, w20, x2 umaddl x3, w12, w21, x3 umaddl x4, w12, w22, x4 umaddl x5, w12, w23, x5 umaddl x6, w12, w24, x6 umaddl x7, w12, w25, x7 umaddl x8, w12, w26, x8 umaddl x9, w12, w27, x9 umull x10, w12, w28 umaddl x3, w13, w20, x3 umaddl x4, w13, w21, x4 umaddl x5, w13, w22, x5 umaddl x6, w13, w23, x6 umaddl x7, w13, w24, x7 umaddl x8, w13, w25, x8 umaddl x9, w13, w26, x9 umaddl x10, w13, w27, x10 umull x11, w13, w28 umaddl x4, w14, w20, x4 umaddl x5, w14, w21, x5 umaddl x6, w14, w22, x6 umaddl x7, w14, w23, x7 umaddl x8, w14, w24, x8 umaddl x9, w14, w25, x9 umaddl x10, w14, w26, x10 umaddl x11, w14, w27, x11 umull x12, w14, w28 umaddl x5, w15, w20, x5 umaddl x6, w15, w21, x6 umaddl x7, w15, w22, x7 umaddl x8, w15, w23, x8 umaddl x9, w15, w24, x9 umaddl x10, w15, w25, x10 umaddl x11, w15, w26, x11 umaddl x12, w15, w27, x12 umull x13, w15, w28 umaddl x6, w16, w20, x6 umaddl x7, w16, w21, x7 umaddl x8, w16, w22, x8 umaddl x9, w16, w23, x9 umaddl x10, w16, w24, x10 umaddl x11, w16, w25, x11 umaddl x12, w16, w26, x12 umaddl x13, w16, w27, x13 umull x14, w16, w28 umaddl x7, w17, w20, x7 umaddl x8, w17, w21, x8 umaddl x9, w17, w22, x9 umaddl x10, w17, w23, x10 umaddl x11, w17, w24, x11 umaddl x12, w17, w25, x12 umaddl x13, w17, w26, x13 umaddl x14, w17, w27, x14 umull x15, w17, w28 umaddl x8, w18, w20, x8 umaddl x9, w18, w21, x9 umaddl x10, w18, w22, x10 umaddl x11, w18, w23, x11 umaddl x12, w18, w24, x12 umaddl x13, w18, w25, x13 umaddl x14, w18, w26, x14 umaddl x15, w18, w27, x15 umull x16, w18, w28 add x10, x10, x9, lsr #29 and x9, x9, #0x1fffffff umull x9, w9, w30 add x0, x0, x9 add x11, x11, x10, lsr #29 and x10, x10, #0x1fffffff umull x10, w10, w30 add x1, x1, x10 add x12, x12, x11, lsr #29 and x11, x11, #0x1fffffff umull x11, w11, w30 add x2, x2, x11 add x13, x13, x12, lsr #29 and x12, x12, #0x1fffffff umull x12, w12, w30 add x3, x3, x12 add x14, x14, x13, lsr #29 and x13, x13, #0x1fffffff umull x13, w13, w30 add x4, x4, x13 add x15, x15, x14, lsr #29 and x14, x14, #0x1fffffff umull x14, w14, w30 add x5, x5, x14 add x16, x16, x15, lsr #29 and x15, x15, #0x1fffffff umull x15, w15, w30 add x6, x6, x15 lsr x9, x16, #29 and x16, x16, #0x1fffffff umull x16, w16, w30 add x7, x7, x16 umull x9, w9, w30 add x8, x8, x9 add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff add x1, x1, x0, lsr #29 and x0, x0, 0x1fffffff add x6, x6, x5, lsr #29 and x5, x5, 0x1fffffff add x2, x2, x1, lsr #29 and x1, x1, 0x1fffffff add x7, x7, x6, lsr #29 and x6, x6, 0x1fffffff add x3, x3, x2, lsr #29 and x2, x2, 0x1fffffff add x8, x8, x7, lsr #29 and x7, x7, 0x1fffffff add x4, x4, x3, lsr #29 and x3, x3, 0x1fffffff bfi x3, x7, #32, #29 bic x10, x8, #0x7fffff add x0, x0, x10, lsr #23 add x0, x0, x10, lsr #22 add x0, x0, x10, lsr #19 and x8, x8, #0x7fffff add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff bfi x4, x8, #32, #23 add x1, x1, x0, lsr #29 bfi x6, x1, #32, #30 and x0, x0, 0x1fffffff bfi x5, x0, #32, #29 add x29, sp, #672 stp x3, x4, [x29, #0] stp x5, x6, [x29, #16] str x2, [x29, #32] // mul ldr x0, [sp, #152] ldp w13, w17, [x0, #0] ldp w14, w18, [x0, #8] ldp w15, w10, [x0, #16] ldp w16, w11, [x0, #24] ldr w12, [x0, #32] ldp w23, w27, [x29, #40] ldp w24, w28, [x29, #48] ldp w25, w20, [x29, #56] ldp w26, w21, [x29, #64] ldr w22, [x29, #72] umull x0, w10, w20 umull x1, w10, w21 umull x2, w10, w22 umull x3, w10, w23 umull x4, w10, w24 umull x5, w10, w25 umull x6, w10, w26 umull x7, w10, w27 umull x8, w10, w28 umaddl x1, w11, w20, x1 umaddl x2, w11, w21, x2 umaddl x3, w11, w22, x3 umaddl x4, w11, w23, x4 umaddl x5, w11, w24, x5 umaddl x6, w11, w25, x6 umaddl x7, w11, w26, x7 umaddl x8, w11, w27, x8 umull x9, w11, w28 umaddl x2, w12, w20, x2 umaddl x3, w12, w21, x3 umaddl x4, w12, w22, x4 umaddl x5, w12, w23, x5 umaddl x6, w12, w24, x6 umaddl x7, w12, w25, x7 umaddl x8, w12, w26, x8 umaddl x9, w12, w27, x9 umull x10, w12, w28 umaddl x3, w13, w20, x3 umaddl x4, w13, w21, x4 umaddl x5, w13, w22, x5 umaddl x6, w13, w23, x6 umaddl x7, w13, w24, x7 umaddl x8, w13, w25, x8 umaddl x9, w13, w26, x9 umaddl x10, w13, w27, x10 umull x11, w13, w28 umaddl x4, w14, w20, x4 umaddl x5, w14, w21, x5 umaddl x6, w14, w22, x6 umaddl x7, w14, w23, x7 umaddl x8, w14, w24, x8 umaddl x9, w14, w25, x9 umaddl x10, w14, w26, x10 umaddl x11, w14, w27, x11 umull x12, w14, w28 umaddl x5, w15, w20, x5 umaddl x6, w15, w21, x6 umaddl x7, w15, w22, x7 umaddl x8, w15, w23, x8 umaddl x9, w15, w24, x9 umaddl x10, w15, w25, x10 umaddl x11, w15, w26, x11 umaddl x12, w15, w27, x12 umull x13, w15, w28 umaddl x6, w16, w20, x6 umaddl x7, w16, w21, x7 umaddl x8, w16, w22, x8 umaddl x9, w16, w23, x9 umaddl x10, w16, w24, x10 umaddl x11, w16, w25, x11 umaddl x12, w16, w26, x12 umaddl x13, w16, w27, x13 umull x14, w16, w28 umaddl x7, w17, w20, x7 umaddl x8, w17, w21, x8 umaddl x9, w17, w22, x9 umaddl x10, w17, w23, x10 umaddl x11, w17, w24, x11 umaddl x12, w17, w25, x12 umaddl x13, w17, w26, x13 umaddl x14, w17, w27, x14 umull x15, w17, w28 umaddl x8, w18, w20, x8 umaddl x9, w18, w21, x9 umaddl x10, w18, w22, x10 umaddl x11, w18, w23, x11 umaddl x12, w18, w24, x12 umaddl x13, w18, w25, x13 umaddl x14, w18, w26, x14 umaddl x15, w18, w27, x15 umull x16, w18, w28 add x10, x10, x9, lsr #29 and x9, x9, #0x1fffffff umull x9, w9, w30 add x0, x0, x9 add x11, x11, x10, lsr #29 and x10, x10, #0x1fffffff umull x10, w10, w30 add x1, x1, x10 add x12, x12, x11, lsr #29 and x11, x11, #0x1fffffff umull x11, w11, w30 add x2, x2, x11 add x13, x13, x12, lsr #29 and x12, x12, #0x1fffffff umull x12, w12, w30 add x3, x3, x12 add x14, x14, x13, lsr #29 and x13, x13, #0x1fffffff umull x13, w13, w30 add x4, x4, x13 add x15, x15, x14, lsr #29 and x14, x14, #0x1fffffff umull x14, w14, w30 add x5, x5, x14 add x16, x16, x15, lsr #29 and x15, x15, #0x1fffffff umull x15, w15, w30 add x6, x6, x15 lsr x9, x16, #29 and x16, x16, #0x1fffffff umull x16, w16, w30 add x7, x7, x16 umull x9, w9, w30 add x8, x8, x9 add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff add x1, x1, x0, lsr #29 and x0, x0, 0x1fffffff add x6, x6, x5, lsr #29 and x5, x5, 0x1fffffff add x2, x2, x1, lsr #29 and x1, x1, 0x1fffffff add x7, x7, x6, lsr #29 and x6, x6, 0x1fffffff add x3, x3, x2, lsr #29 and x2, x2, 0x1fffffff add x8, x8, x7, lsr #29 and x7, x7, 0x1fffffff add x4, x4, x3, lsr #29 and x3, x3, 0x1fffffff bfi x3, x7, #32, #29 bic x10, x8, #0x7fffff add x0, x0, x10, lsr #23 add x0, x0, x10, lsr #22 add x0, x0, x10, lsr #19 and x8, x8, #0x7fffff add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff bfi x4, x8, #32, #23 add x1, x1, x0, lsr #29 bfi x6, x1, #32, #30 and x0, x0, 0x1fffffff bfi x5, x0, #32, #29 // add add x29, sp, #472 ldp x13, x14, [x29, #200] ldp x15, x16, [x29, #216] ldr x12, [x29, #232] add x0, x3, x13 add x1, x4, x14 add x7, x5, x15 add x8, x6, x16 add x9, x2, x12 stp x0, x1, [x29, #120] stp x7, x8, [x29, #136] str x9, [x29, #152] // sub ldp x20, x21, [sp, #160] ldp x27, x28, [sp, #176] add x3, x3, x20 add x4, x4, x21 add x5, x5, x27 add x6, x6, x20 add x2, x2, x28 sub x3, x3, x13 sub x4, x4, x14 sub x5, x5, x15 sub x6, x6, x16 sub x2, x2, x12 stp x3, x4, [x29, #40] stp x5, x6, [x29, #56] str x2, [x29, #72] // mul ldp w13, w17, [x29, #0] ldp w14, w18, [x29, #8] ldp w15, w10, [x29, #16] ldp w16, w11, [x29, #24] ldr w12, [x29, #32] add x29, sp, #752 ldp w23, w27, [x29, #0] ldp w24, w28, [x29, #8] ldp w25, w20, [x29, #16] ldp w26, w21, [x29, #24] ldr w22, [x29, #32] umull x0, w10, w20 umull x1, w10, w21 umull x2, w10, w22 umull x3, w10, w23 umull x4, w10, w24 umull x5, w10, w25 umull x6, w10, w26 umull x7, w10, w27 umull x8, w10, w28 umaddl x1, w11, w20, x1 umaddl x2, w11, w21, x2 umaddl x3, w11, w22, x3 umaddl x4, w11, w23, x4 umaddl x5, w11, w24, x5 umaddl x6, w11, w25, x6 umaddl x7, w11, w26, x7 umaddl x8, w11, w27, x8 umull x9, w11, w28 umaddl x2, w12, w20, x2 umaddl x3, w12, w21, x3 umaddl x4, w12, w22, x4 umaddl x5, w12, w23, x5 umaddl x6, w12, w24, x6 umaddl x7, w12, w25, x7 umaddl x8, w12, w26, x8 umaddl x9, w12, w27, x9 umull x10, w12, w28 umaddl x3, w13, w20, x3 umaddl x4, w13, w21, x4 umaddl x5, w13, w22, x5 umaddl x6, w13, w23, x6 umaddl x7, w13, w24, x7 umaddl x8, w13, w25, x8 umaddl x9, w13, w26, x9 umaddl x10, w13, w27, x10 umull x11, w13, w28 umaddl x4, w14, w20, x4 umaddl x5, w14, w21, x5 umaddl x6, w14, w22, x6 umaddl x7, w14, w23, x7 umaddl x8, w14, w24, x8 umaddl x9, w14, w25, x9 umaddl x10, w14, w26, x10 umaddl x11, w14, w27, x11 umull x12, w14, w28 umaddl x5, w15, w20, x5 umaddl x6, w15, w21, x6 umaddl x7, w15, w22, x7 umaddl x8, w15, w23, x8 umaddl x9, w15, w24, x9 umaddl x10, w15, w25, x10 umaddl x11, w15, w26, x11 umaddl x12, w15, w27, x12 umull x13, w15, w28 umaddl x6, w16, w20, x6 umaddl x7, w16, w21, x7 umaddl x8, w16, w22, x8 umaddl x9, w16, w23, x9 umaddl x10, w16, w24, x10 umaddl x11, w16, w25, x11 umaddl x12, w16, w26, x12 umaddl x13, w16, w27, x13 umull x14, w16, w28 umaddl x7, w17, w20, x7 umaddl x8, w17, w21, x8 umaddl x9, w17, w22, x9 umaddl x10, w17, w23, x10 umaddl x11, w17, w24, x11 umaddl x12, w17, w25, x12 umaddl x13, w17, w26, x13 umaddl x14, w17, w27, x14 umull x15, w17, w28 umaddl x8, w18, w20, x8 umaddl x9, w18, w21, x9 umaddl x10, w18, w22, x10 umaddl x11, w18, w23, x11 umaddl x12, w18, w24, x12 umaddl x13, w18, w25, x13 umaddl x14, w18, w26, x14 umaddl x15, w18, w27, x15 umull x16, w18, w28 add x10, x10, x9, lsr #29 and x9, x9, #0x1fffffff umull x9, w9, w30 add x0, x0, x9 add x11, x11, x10, lsr #29 and x10, x10, #0x1fffffff umull x10, w10, w30 add x1, x1, x10 add x12, x12, x11, lsr #29 and x11, x11, #0x1fffffff umull x11, w11, w30 add x2, x2, x11 add x13, x13, x12, lsr #29 and x12, x12, #0x1fffffff umull x12, w12, w30 add x3, x3, x12 add x14, x14, x13, lsr #29 and x13, x13, #0x1fffffff umull x13, w13, w30 add x4, x4, x13 add x15, x15, x14, lsr #29 and x14, x14, #0x1fffffff umull x14, w14, w30 add x5, x5, x14 add x16, x16, x15, lsr #29 and x15, x15, #0x1fffffff umull x15, w15, w30 add x6, x6, x15 lsr x9, x16, #29 and x16, x16, #0x1fffffff umull x16, w16, w30 add x7, x7, x16 umull x9, w9, w30 add x8, x8, x9 add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff add x1, x1, x0, lsr #29 and x0, x0, 0x1fffffff add x6, x6, x5, lsr #29 and x5, x5, 0x1fffffff add x2, x2, x1, lsr #29 and x1, x1, 0x1fffffff add x7, x7, x6, lsr #29 and x6, x6, 0x1fffffff add x3, x3, x2, lsr #29 and x2, x2, 0x1fffffff add x8, x8, x7, lsr #29 and x7, x7, 0x1fffffff add x4, x4, x3, lsr #29 and x3, x3, 0x1fffffff bfi x3, x7, #32, #29 bic x10, x8, #0x7fffff add x0, x0, x10, lsr #23 add x0, x0, x10, lsr #22 add x0, x0, x10, lsr #19 and x8, x8, #0x7fffff add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff bfi x4, x8, #32, #23 add x1, x1, x0, lsr #29 bfi x6, x1, #32, #30 and x0, x0, 0x1fffffff bfi x5, x0, #32, #29 add x29, sp, #672 stp x3, x4, [x29, #0] stp x5, x6, [x29, #16] str x2, [x29, #32] // mul ldr x0, [sp, #152] ldp w13, w17, [x0, #80] ldp w14, w18, [x0, #88] ldp w15, w10, [x0, #96] ldp w16, w11, [x0, #104] ldr w12, [x0, #112] add x29, sp, #432 ldp w23, w27, [x29, #0] ldp w24, w28, [x29, #8] ldp w25, w20, [x29, #16] ldp w26, w21, [x29, #24] ldr w22, [x29, #32] umull x0, w10, w20 umull x1, w10, w21 umull x2, w10, w22 umull x3, w10, w23 umull x4, w10, w24 umull x5, w10, w25 umull x6, w10, w26 umull x7, w10, w27 umull x8, w10, w28 umaddl x1, w11, w20, x1 umaddl x2, w11, w21, x2 umaddl x3, w11, w22, x3 umaddl x4, w11, w23, x4 umaddl x5, w11, w24, x5 umaddl x6, w11, w25, x6 umaddl x7, w11, w26, x7 umaddl x8, w11, w27, x8 umull x9, w11, w28 umaddl x2, w12, w20, x2 umaddl x3, w12, w21, x3 umaddl x4, w12, w22, x4 umaddl x5, w12, w23, x5 umaddl x6, w12, w24, x6 umaddl x7, w12, w25, x7 umaddl x8, w12, w26, x8 umaddl x9, w12, w27, x9 umull x10, w12, w28 umaddl x3, w13, w20, x3 umaddl x4, w13, w21, x4 umaddl x5, w13, w22, x5 umaddl x6, w13, w23, x6 umaddl x7, w13, w24, x7 umaddl x8, w13, w25, x8 umaddl x9, w13, w26, x9 umaddl x10, w13, w27, x10 umull x11, w13, w28 umaddl x4, w14, w20, x4 umaddl x5, w14, w21, x5 umaddl x6, w14, w22, x6 umaddl x7, w14, w23, x7 umaddl x8, w14, w24, x8 umaddl x9, w14, w25, x9 umaddl x10, w14, w26, x10 umaddl x11, w14, w27, x11 umull x12, w14, w28 umaddl x5, w15, w20, x5 umaddl x6, w15, w21, x6 umaddl x7, w15, w22, x7 umaddl x8, w15, w23, x8 umaddl x9, w15, w24, x9 umaddl x10, w15, w25, x10 umaddl x11, w15, w26, x11 umaddl x12, w15, w27, x12 umull x13, w15, w28 umaddl x6, w16, w20, x6 umaddl x7, w16, w21, x7 umaddl x8, w16, w22, x8 umaddl x9, w16, w23, x9 umaddl x10, w16, w24, x10 umaddl x11, w16, w25, x11 umaddl x12, w16, w26, x12 umaddl x13, w16, w27, x13 umull x14, w16, w28 umaddl x7, w17, w20, x7 umaddl x8, w17, w21, x8 umaddl x9, w17, w22, x9 umaddl x10, w17, w23, x10 umaddl x11, w17, w24, x11 umaddl x12, w17, w25, x12 umaddl x13, w17, w26, x13 umaddl x14, w17, w27, x14 umull x15, w17, w28 umaddl x8, w18, w20, x8 umaddl x9, w18, w21, x9 umaddl x10, w18, w22, x10 umaddl x11, w18, w23, x11 umaddl x12, w18, w24, x12 umaddl x13, w18, w25, x13 umaddl x14, w18, w26, x14 umaddl x15, w18, w27, x15 umull x16, w18, w28 add x10, x10, x9, lsr #29 and x9, x9, #0x1fffffff umull x9, w9, w30 add x0, x0, x9 add x11, x11, x10, lsr #29 and x10, x10, #0x1fffffff umull x10, w10, w30 add x1, x1, x10 add x12, x12, x11, lsr #29 and x11, x11, #0x1fffffff umull x11, w11, w30 add x2, x2, x11 add x13, x13, x12, lsr #29 and x12, x12, #0x1fffffff umull x12, w12, w30 add x3, x3, x12 add x14, x14, x13, lsr #29 and x13, x13, #0x1fffffff umull x13, w13, w30 add x4, x4, x13 add x15, x15, x14, lsr #29 and x14, x14, #0x1fffffff umull x14, w14, w30 add x5, x5, x14 add x16, x16, x15, lsr #29 and x15, x15, #0x1fffffff umull x15, w15, w30 add x6, x6, x15 lsr x9, x16, #29 and x16, x16, #0x1fffffff umull x16, w16, w30 add x7, x7, x16 umull x9, w9, w30 add x8, x8, x9 // double and then reduce add x0, x0, x0 add x1, x1, x1 add x2, x2, x2 add x3, x3, x3 add x4, x4, x4 add x5, x5, x5 add x6, x6, x6 add x7, x7, x7 add x8, x8, x8 add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff add x1, x1, x0, lsr #29 and x0, x0, 0x1fffffff add x6, x6, x5, lsr #29 and x5, x5, 0x1fffffff add x2, x2, x1, lsr #29 and x1, x1, 0x1fffffff add x7, x7, x6, lsr #29 and x6, x6, 0x1fffffff add x3, x3, x2, lsr #29 and x2, x2, 0x1fffffff add x8, x8, x7, lsr #29 and x7, x7, 0x1fffffff add x4, x4, x3, lsr #29 and x3, x3, 0x1fffffff bfi x3, x7, #32, #29 bic x10, x8, #0x7fffff add x0, x0, x10, lsr #23 add x0, x0, x10, lsr #22 add x0, x0, x10, lsr #19 and x8, x8, #0x7fffff add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff bfi x4, x8, #32, #23 add x1, x1, x0, lsr #29 bfi x6, x1, #32, #30 and x0, x0, 0x1fffffff bfi x5, x0, #32, #29 // add add x29, sp, #552 ldp x13, x14, [x29, #120] ldp x15, x16, [x29, #136] ldr x12, [x29, #152] add x0, x3, x13 add x1, x4, x14 add x7, x5, x15 add x8, x6, x16 add x9, x2, x12 stp x0, x1, [x29, #0] stp x7, x8, [x29, #16] str x9, [x29, #32] // sub ldp x20, x21, [sp, #160] ldp x27, x28, [sp, #176] add x3, x3, x20 add x4, x4, x21 add x5, x5, x27 add x6, x6, x20 add x2, x2, x28 sub x3, x3, x13 sub x4, x4, x14 sub x5, x5, x15 sub x6, x6, x16 sub x2, x2, x12 stp x3, x4, [x29, #80] stp x5, x6, [x29, #96] str x2, [x29, #112] .L6: ldr x2, [sp, #120] ldrsb w26, [x2, #0] sub x2, x2, #1 str x2, [sp, #120] str x26, [sp, #144] cmp w26, wzr bgt .L7 blt .L8 beq .L9 .L7: /* p1p1 to p3 */ // mul add x29, sp, #512 ldp w13, w17, [x29, #0] ldp w14, w18, [x29, #8] ldp w15, w10, [x29, #16] ldp w16, w11, [x29, #24] ldr w12, [x29, #32] ldp w23, w27, [x29, #120] ldp w24, w28, [x29, #128] ldp w25, w20, [x29, #136] ldp w26, w21, [x29, #144] ldr w22, [x29, #152] umull x0, w10, w20 umull x1, w10, w21 umull x2, w10, w22 umull x3, w10, w23 umull x4, w10, w24 umull x5, w10, w25 umull x6, w10, w26 umull x7, w10, w27 umull x8, w10, w28 umaddl x1, w11, w20, x1 umaddl x2, w11, w21, x2 umaddl x3, w11, w22, x3 umaddl x4, w11, w23, x4 umaddl x5, w11, w24, x5 umaddl x6, w11, w25, x6 umaddl x7, w11, w26, x7 umaddl x8, w11, w27, x8 umull x9, w11, w28 umaddl x2, w12, w20, x2 umaddl x3, w12, w21, x3 umaddl x4, w12, w22, x4 umaddl x5, w12, w23, x5 umaddl x6, w12, w24, x6 umaddl x7, w12, w25, x7 umaddl x8, w12, w26, x8 umaddl x9, w12, w27, x9 umull x10, w12, w28 umaddl x3, w13, w20, x3 umaddl x4, w13, w21, x4 umaddl x5, w13, w22, x5 umaddl x6, w13, w23, x6 umaddl x7, w13, w24, x7 umaddl x8, w13, w25, x8 umaddl x9, w13, w26, x9 umaddl x10, w13, w27, x10 umull x11, w13, w28 umaddl x4, w14, w20, x4 umaddl x5, w14, w21, x5 umaddl x6, w14, w22, x6 umaddl x7, w14, w23, x7 umaddl x8, w14, w24, x8 umaddl x9, w14, w25, x9 umaddl x10, w14, w26, x10 umaddl x11, w14, w27, x11 umull x12, w14, w28 umaddl x5, w15, w20, x5 umaddl x6, w15, w21, x6 umaddl x7, w15, w22, x7 umaddl x8, w15, w23, x8 umaddl x9, w15, w24, x9 umaddl x10, w15, w25, x10 umaddl x11, w15, w26, x11 umaddl x12, w15, w27, x12 umull x13, w15, w28 umaddl x6, w16, w20, x6 umaddl x7, w16, w21, x7 umaddl x8, w16, w22, x8 umaddl x9, w16, w23, x9 umaddl x10, w16, w24, x10 umaddl x11, w16, w25, x11 umaddl x12, w16, w26, x12 umaddl x13, w16, w27, x13 umull x14, w16, w28 umaddl x7, w17, w20, x7 umaddl x8, w17, w21, x8 umaddl x9, w17, w22, x9 umaddl x10, w17, w23, x10 umaddl x11, w17, w24, x11 umaddl x12, w17, w25, x12 umaddl x13, w17, w26, x13 umaddl x14, w17, w27, x14 umull x15, w17, w28 umaddl x8, w18, w20, x8 umaddl x9, w18, w21, x9 umaddl x10, w18, w22, x10 umaddl x11, w18, w23, x11 umaddl x12, w18, w24, x12 umaddl x13, w18, w25, x13 umaddl x14, w18, w26, x14 umaddl x15, w18, w27, x15 umull x16, w18, w28 add x10, x10, x9, lsr #29 and x9, x9, #0x1fffffff umull x9, w9, w30 add x0, x0, x9 add x11, x11, x10, lsr #29 and x10, x10, #0x1fffffff umull x10, w10, w30 add x1, x1, x10 add x12, x12, x11, lsr #29 and x11, x11, #0x1fffffff umull x11, w11, w30 add x2, x2, x11 add x13, x13, x12, lsr #29 and x12, x12, #0x1fffffff umull x12, w12, w30 add x3, x3, x12 add x14, x14, x13, lsr #29 and x13, x13, #0x1fffffff umull x13, w13, w30 add x4, x4, x13 add x15, x15, x14, lsr #29 and x14, x14, #0x1fffffff umull x14, w14, w30 add x5, x5, x14 add x16, x16, x15, lsr #29 and x15, x15, #0x1fffffff umull x15, w15, w30 add x6, x6, x15 lsr x9, x16, #29 and x16, x16, #0x1fffffff umull x16, w16, w30 add x7, x7, x16 umull x9, w9, w30 add x8, x8, x9 add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff add x1, x1, x0, lsr #29 and x0, x0, 0x1fffffff add x6, x6, x5, lsr #29 and x5, x5, 0x1fffffff add x2, x2, x1, lsr #29 and x1, x1, 0x1fffffff add x7, x7, x6, lsr #29 and x6, x6, 0x1fffffff add x3, x3, x2, lsr #29 and x2, x2, 0x1fffffff add x8, x8, x7, lsr #29 and x7, x7, 0x1fffffff add x4, x4, x3, lsr #29 and x3, x3, 0x1fffffff bfi x3, x7, #32, #29 bic x10, x8, #0x7fffff add x0, x0, x10, lsr #23 add x0, x0, x10, lsr #22 add x0, x0, x10, lsr #19 and x8, x8, #0x7fffff add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff bfi x4, x8, #32, #23 add x1, x1, x0, lsr #29 bfi x6, x1, #32, #30 and x0, x0, 0x1fffffff bfi x5, x0, #32, #29 stp x3, x4, [sp, #352] stp x5, x6, [sp, #368] str x2, [sp, #384] // mul add x29, sp, #552 ldp w13, w17, [x29, #0] ldp w14, w18, [x29, #8] ldp w15, w10, [x29, #16] ldp w16, w11, [x29, #24] ldr w12, [x29, #32] ldp w23, w27, [x29, #40] ldp w24, w28, [x29, #48] ldp w25, w20, [x29, #56] ldp w26, w21, [x29, #64] ldr w22, [x29, #72] umull x0, w10, w20 umull x1, w10, w21 umull x2, w10, w22 umull x3, w10, w23 umull x4, w10, w24 umull x5, w10, w25 umull x6, w10, w26 umull x7, w10, w27 umull x8, w10, w28 umaddl x1, w11, w20, x1 umaddl x2, w11, w21, x2 umaddl x3, w11, w22, x3 umaddl x4, w11, w23, x4 umaddl x5, w11, w24, x5 umaddl x6, w11, w25, x6 umaddl x7, w11, w26, x7 umaddl x8, w11, w27, x8 umull x9, w11, w28 umaddl x2, w12, w20, x2 umaddl x3, w12, w21, x3 umaddl x4, w12, w22, x4 umaddl x5, w12, w23, x5 umaddl x6, w12, w24, x6 umaddl x7, w12, w25, x7 umaddl x8, w12, w26, x8 umaddl x9, w12, w27, x9 umull x10, w12, w28 umaddl x3, w13, w20, x3 umaddl x4, w13, w21, x4 umaddl x5, w13, w22, x5 umaddl x6, w13, w23, x6 umaddl x7, w13, w24, x7 umaddl x8, w13, w25, x8 umaddl x9, w13, w26, x9 umaddl x10, w13, w27, x10 umull x11, w13, w28 umaddl x4, w14, w20, x4 umaddl x5, w14, w21, x5 umaddl x6, w14, w22, x6 umaddl x7, w14, w23, x7 umaddl x8, w14, w24, x8 umaddl x9, w14, w25, x9 umaddl x10, w14, w26, x10 umaddl x11, w14, w27, x11 umull x12, w14, w28 umaddl x5, w15, w20, x5 umaddl x6, w15, w21, x6 umaddl x7, w15, w22, x7 umaddl x8, w15, w23, x8 umaddl x9, w15, w24, x9 umaddl x10, w15, w25, x10 umaddl x11, w15, w26, x11 umaddl x12, w15, w27, x12 umull x13, w15, w28 umaddl x6, w16, w20, x6 umaddl x7, w16, w21, x7 umaddl x8, w16, w22, x8 umaddl x9, w16, w23, x9 umaddl x10, w16, w24, x10 umaddl x11, w16, w25, x11 umaddl x12, w16, w26, x12 umaddl x13, w16, w27, x13 umull x14, w16, w28 umaddl x7, w17, w20, x7 umaddl x8, w17, w21, x8 umaddl x9, w17, w22, x9 umaddl x10, w17, w23, x10 umaddl x11, w17, w24, x11 umaddl x12, w17, w25, x12 umaddl x13, w17, w26, x13 umaddl x14, w17, w27, x14 umull x15, w17, w28 umaddl x8, w18, w20, x8 umaddl x9, w18, w21, x9 umaddl x10, w18, w22, x10 umaddl x11, w18, w23, x11 umaddl x12, w18, w24, x12 umaddl x13, w18, w25, x13 umaddl x14, w18, w26, x14 umaddl x15, w18, w27, x15 umull x16, w18, w28 add x10, x10, x9, lsr #29 and x9, x9, #0x1fffffff umull x9, w9, w30 add x0, x0, x9 add x11, x11, x10, lsr #29 and x10, x10, #0x1fffffff umull x10, w10, w30 add x1, x1, x10 add x12, x12, x11, lsr #29 and x11, x11, #0x1fffffff umull x11, w11, w30 add x2, x2, x11 add x13, x13, x12, lsr #29 and x12, x12, #0x1fffffff umull x12, w12, w30 add x3, x3, x12 add x14, x14, x13, lsr #29 and x13, x13, #0x1fffffff umull x13, w13, w30 add x4, x4, x13 add x15, x15, x14, lsr #29 and x14, x14, #0x1fffffff umull x14, w14, w30 add x5, x5, x14 add x16, x16, x15, lsr #29 and x15, x15, #0x1fffffff umull x15, w15, w30 add x6, x6, x15 lsr x9, x16, #29 and x16, x16, #0x1fffffff umull x16, w16, w30 add x7, x7, x16 umull x9, w9, w30 add x8, x8, x9 add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff add x1, x1, x0, lsr #29 and x0, x0, 0x1fffffff add x6, x6, x5, lsr #29 and x5, x5, 0x1fffffff add x2, x2, x1, lsr #29 and x1, x1, 0x1fffffff add x7, x7, x6, lsr #29 and x6, x6, 0x1fffffff add x3, x3, x2, lsr #29 and x2, x2, 0x1fffffff add x8, x8, x7, lsr #29 and x7, x7, 0x1fffffff add x4, x4, x3, lsr #29 and x3, x3, 0x1fffffff bfi x3, x7, #32, #29 bic x10, x8, #0x7fffff add x0, x0, x10, lsr #23 add x0, x0, x10, lsr #22 add x0, x0, x10, lsr #19 and x8, x8, #0x7fffff add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff bfi x4, x8, #32, #23 add x1, x1, x0, lsr #29 bfi x6, x1, #32, #30 and x0, x0, 0x1fffffff bfi x5, x0, #32, #29 stp x3, x4, [sp, #392] stp x5, x6, [sp, #408] str x2, [sp, #424] // mul add x29, sp, #552 ldp w13, w17, [x29, #0] ldp w14, w18, [x29, #8] ldp w15, w10, [x29, #16] ldp w16, w11, [x29, #24] ldr w12, [x29, #32] ldp w23, w27, [x29, #80] ldp w24, w28, [x29, #88] ldp w25, w20, [x29, #96] ldp w26, w21, [x29, #104] ldr w22, [x29, #112] umull x0, w10, w20 umull x1, w10, w21 umull x2, w10, w22 umull x3, w10, w23 umull x4, w10, w24 umull x5, w10, w25 umull x6, w10, w26 umull x7, w10, w27 umull x8, w10, w28 umaddl x1, w11, w20, x1 umaddl x2, w11, w21, x2 umaddl x3, w11, w22, x3 umaddl x4, w11, w23, x4 umaddl x5, w11, w24, x5 umaddl x6, w11, w25, x6 umaddl x7, w11, w26, x7 umaddl x8, w11, w27, x8 umull x9, w11, w28 umaddl x2, w12, w20, x2 umaddl x3, w12, w21, x3 umaddl x4, w12, w22, x4 umaddl x5, w12, w23, x5 umaddl x6, w12, w24, x6 umaddl x7, w12, w25, x7 umaddl x8, w12, w26, x8 umaddl x9, w12, w27, x9 umull x10, w12, w28 umaddl x3, w13, w20, x3 umaddl x4, w13, w21, x4 umaddl x5, w13, w22, x5 umaddl x6, w13, w23, x6 umaddl x7, w13, w24, x7 umaddl x8, w13, w25, x8 umaddl x9, w13, w26, x9 umaddl x10, w13, w27, x10 umull x11, w13, w28 umaddl x4, w14, w20, x4 umaddl x5, w14, w21, x5 umaddl x6, w14, w22, x6 umaddl x7, w14, w23, x7 umaddl x8, w14, w24, x8 umaddl x9, w14, w25, x9 umaddl x10, w14, w26, x10 umaddl x11, w14, w27, x11 umull x12, w14, w28 umaddl x5, w15, w20, x5 umaddl x6, w15, w21, x6 umaddl x7, w15, w22, x7 umaddl x8, w15, w23, x8 umaddl x9, w15, w24, x9 umaddl x10, w15, w25, x10 umaddl x11, w15, w26, x11 umaddl x12, w15, w27, x12 umull x13, w15, w28 umaddl x6, w16, w20, x6 umaddl x7, w16, w21, x7 umaddl x8, w16, w22, x8 umaddl x9, w16, w23, x9 umaddl x10, w16, w24, x10 umaddl x11, w16, w25, x11 umaddl x12, w16, w26, x12 umaddl x13, w16, w27, x13 umull x14, w16, w28 umaddl x7, w17, w20, x7 umaddl x8, w17, w21, x8 umaddl x9, w17, w22, x9 umaddl x10, w17, w23, x10 umaddl x11, w17, w24, x11 umaddl x12, w17, w25, x12 umaddl x13, w17, w26, x13 umaddl x14, w17, w27, x14 umull x15, w17, w28 umaddl x8, w18, w20, x8 umaddl x9, w18, w21, x9 umaddl x10, w18, w22, x10 umaddl x11, w18, w23, x11 umaddl x12, w18, w24, x12 umaddl x13, w18, w25, x13 umaddl x14, w18, w26, x14 umaddl x15, w18, w27, x15 umull x16, w18, w28 add x10, x10, x9, lsr #29 and x9, x9, #0x1fffffff umull x9, w9, w30 add x0, x0, x9 add x11, x11, x10, lsr #29 and x10, x10, #0x1fffffff umull x10, w10, w30 add x1, x1, x10 add x12, x12, x11, lsr #29 and x11, x11, #0x1fffffff umull x11, w11, w30 add x2, x2, x11 add x13, x13, x12, lsr #29 and x12, x12, #0x1fffffff umull x12, w12, w30 add x3, x3, x12 add x14, x14, x13, lsr #29 and x13, x13, #0x1fffffff umull x13, w13, w30 add x4, x4, x13 add x15, x15, x14, lsr #29 and x14, x14, #0x1fffffff umull x14, w14, w30 add x5, x5, x14 add x16, x16, x15, lsr #29 and x15, x15, #0x1fffffff umull x15, w15, w30 add x6, x6, x15 lsr x9, x16, #29 and x16, x16, #0x1fffffff umull x16, w16, w30 add x7, x7, x16 umull x9, w9, w30 add x8, x8, x9 add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff add x1, x1, x0, lsr #29 and x0, x0, 0x1fffffff add x6, x6, x5, lsr #29 and x5, x5, 0x1fffffff add x2, x2, x1, lsr #29 and x1, x1, 0x1fffffff add x7, x7, x6, lsr #29 and x6, x6, 0x1fffffff add x3, x3, x2, lsr #29 and x2, x2, 0x1fffffff add x8, x8, x7, lsr #29 and x7, x7, 0x1fffffff add x4, x4, x3, lsr #29 and x3, x3, 0x1fffffff bfi x3, x7, #32, #29 bic x10, x8, #0x7fffff add x0, x0, x10, lsr #23 add x0, x0, x10, lsr #22 add x0, x0, x10, lsr #19 and x8, x8, #0x7fffff add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff bfi x4, x8, #32, #23 add x1, x1, x0, lsr #29 bfi x6, x1, #32, #30 and x0, x0, 0x1fffffff bfi x5, x0, #32, #29 stp x3, x4, [sp, #432] stp x5, x6, [sp, #448] str x2, [sp, #464] // mul add x29, sp, #512 ldp w13, w17, [x29, #0] ldp w14, w18, [x29, #8] ldp w15, w10, [x29, #16] ldp w16, w11, [x29, #24] ldr w12, [x29, #32] ldp w23, w27, [x29, #80] ldp w24, w28, [x29, #88] ldp w25, w20, [x29, #96] ldp w26, w21, [x29, #104] ldr w22, [x29, #112] umull x0, w10, w20 umull x1, w10, w21 umull x2, w10, w22 umull x3, w10, w23 umull x4, w10, w24 umull x5, w10, w25 umull x6, w10, w26 umull x7, w10, w27 umull x8, w10, w28 umaddl x1, w11, w20, x1 umaddl x2, w11, w21, x2 umaddl x3, w11, w22, x3 umaddl x4, w11, w23, x4 umaddl x5, w11, w24, x5 umaddl x6, w11, w25, x6 umaddl x7, w11, w26, x7 umaddl x8, w11, w27, x8 umull x9, w11, w28 umaddl x2, w12, w20, x2 umaddl x3, w12, w21, x3 umaddl x4, w12, w22, x4 umaddl x5, w12, w23, x5 umaddl x6, w12, w24, x6 umaddl x7, w12, w25, x7 umaddl x8, w12, w26, x8 umaddl x9, w12, w27, x9 umull x10, w12, w28 umaddl x3, w13, w20, x3 umaddl x4, w13, w21, x4 umaddl x5, w13, w22, x5 umaddl x6, w13, w23, x6 umaddl x7, w13, w24, x7 umaddl x8, w13, w25, x8 umaddl x9, w13, w26, x9 umaddl x10, w13, w27, x10 umull x11, w13, w28 umaddl x4, w14, w20, x4 umaddl x5, w14, w21, x5 umaddl x6, w14, w22, x6 umaddl x7, w14, w23, x7 umaddl x8, w14, w24, x8 umaddl x9, w14, w25, x9 umaddl x10, w14, w26, x10 umaddl x11, w14, w27, x11 umull x12, w14, w28 umaddl x5, w15, w20, x5 umaddl x6, w15, w21, x6 umaddl x7, w15, w22, x7 umaddl x8, w15, w23, x8 umaddl x9, w15, w24, x9 umaddl x10, w15, w25, x10 umaddl x11, w15, w26, x11 umaddl x12, w15, w27, x12 umull x13, w15, w28 umaddl x6, w16, w20, x6 umaddl x7, w16, w21, x7 umaddl x8, w16, w22, x8 umaddl x9, w16, w23, x9 umaddl x10, w16, w24, x10 umaddl x11, w16, w25, x11 umaddl x12, w16, w26, x12 umaddl x13, w16, w27, x13 umull x14, w16, w28 umaddl x7, w17, w20, x7 umaddl x8, w17, w21, x8 umaddl x9, w17, w22, x9 umaddl x10, w17, w23, x10 umaddl x11, w17, w24, x11 umaddl x12, w17, w25, x12 umaddl x13, w17, w26, x13 umaddl x14, w17, w27, x14 umull x15, w17, w28 umaddl x8, w18, w20, x8 umaddl x9, w18, w21, x9 umaddl x10, w18, w22, x10 umaddl x11, w18, w23, x11 umaddl x12, w18, w24, x12 umaddl x13, w18, w25, x13 umaddl x14, w18, w26, x14 umaddl x15, w18, w27, x15 umull x16, w18, w28 add x10, x10, x9, lsr #29 and x9, x9, #0x1fffffff umull x9, w9, w30 add x0, x0, x9 add x11, x11, x10, lsr #29 and x10, x10, #0x1fffffff umull x10, w10, w30 add x1, x1, x10 add x12, x12, x11, lsr #29 and x11, x11, #0x1fffffff umull x11, w11, w30 add x2, x2, x11 add x13, x13, x12, lsr #29 and x12, x12, #0x1fffffff umull x12, w12, w30 add x3, x3, x12 add x14, x14, x13, lsr #29 and x13, x13, #0x1fffffff umull x13, w13, w30 add x4, x4, x13 add x15, x15, x14, lsr #29 and x14, x14, #0x1fffffff umull x14, w14, w30 add x5, x5, x14 add x16, x16, x15, lsr #29 and x15, x15, #0x1fffffff umull x15, w15, w30 add x6, x6, x15 lsr x9, x16, #29 and x16, x16, #0x1fffffff umull x16, w16, w30 add x7, x7, x16 umull x9, w9, w30 add x8, x8, x9 add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff add x1, x1, x0, lsr #29 and x0, x0, 0x1fffffff add x6, x6, x5, lsr #29 and x5, x5, 0x1fffffff add x2, x2, x1, lsr #29 and x1, x1, 0x1fffffff add x7, x7, x6, lsr #29 and x6, x6, 0x1fffffff add x3, x3, x2, lsr #29 and x2, x2, 0x1fffffff add x8, x8, x7, lsr #29 and x7, x7, 0x1fffffff add x4, x4, x3, lsr #29 and x3, x3, 0x1fffffff bfi x3, x7, #32, #29 bic x10, x8, #0x7fffff add x0, x0, x10, lsr #23 add x0, x0, x10, lsr #22 add x0, x0, x10, lsr #19 and x8, x8, #0x7fffff add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff bfi x4, x8, #32, #23 add x1, x1, x0, lsr #29 bfi x6, x1, #32, #30 and x0, x0, 0x1fffffff bfi x5, x0, #32, #29 stp x3, x4, [sp, #472] stp x5, x6, [sp, #488] str x2, [sp, #504] ldr x26, [sp, #144] lsr w8, w26, #1 mov w9, #120 mul x8, x8, x9 ldr x0, [sp, #112] add x0, x0, x8 str x0, [sp, #152] /* nielsadd p1p1 */ // add ldp x23, x24, [sp, #392] ldp x25, x26, [sp, #408] ldr x22, [sp, #424] ldp x13, x14, [sp, #352] ldp x15, x16, [sp, #368] ldr x12, [sp, #384] add x3, x23, x13 add x4, x24, x14 add x5, x25, x15 add x6, x26, x16 add x2, x22, x12 add x29, sp, #712 stp x3, x4, [x29, #0] stp x5, x6, [x29, #16] str x2, [x29, #32] // sub ldp x20, x21, [sp, #160] ldp x27, x28, [sp, #176] add x23, x23, x20 add x24, x24, x21 add x25, x25, x27 add x26, x26, x20 add x22, x22, x28 sub x23, x23, x13 sub x24, x24, x14 sub x25, x25, x15 sub x26, x26, x16 sub x22, x22, x12 // mul ldr x0, [sp, #152] ldp w13, w17, [x0, #0] ldp w14, w18, [x0, #8] ldp w15, w10, [x0, #16] ldp w16, w11, [x0, #24] ldr w12, [x0, #32] lsr x27, x23, #32 lsr x28, x24, #32 lsr x20, x25, #32 lsr x21, x26, #32 umull x0, w10, w20 umull x1, w10, w21 umull x2, w10, w22 umull x3, w10, w23 umull x4, w10, w24 umull x5, w10, w25 umull x6, w10, w26 umull x7, w10, w27 umull x8, w10, w28 umaddl x1, w11, w20, x1 umaddl x2, w11, w21, x2 umaddl x3, w11, w22, x3 umaddl x4, w11, w23, x4 umaddl x5, w11, w24, x5 umaddl x6, w11, w25, x6 umaddl x7, w11, w26, x7 umaddl x8, w11, w27, x8 umull x9, w11, w28 umaddl x2, w12, w20, x2 umaddl x3, w12, w21, x3 umaddl x4, w12, w22, x4 umaddl x5, w12, w23, x5 umaddl x6, w12, w24, x6 umaddl x7, w12, w25, x7 umaddl x8, w12, w26, x8 umaddl x9, w12, w27, x9 umull x10, w12, w28 umaddl x3, w13, w20, x3 umaddl x4, w13, w21, x4 umaddl x5, w13, w22, x5 umaddl x6, w13, w23, x6 umaddl x7, w13, w24, x7 umaddl x8, w13, w25, x8 umaddl x9, w13, w26, x9 umaddl x10, w13, w27, x10 umull x11, w13, w28 umaddl x4, w14, w20, x4 umaddl x5, w14, w21, x5 umaddl x6, w14, w22, x6 umaddl x7, w14, w23, x7 umaddl x8, w14, w24, x8 umaddl x9, w14, w25, x9 umaddl x10, w14, w26, x10 umaddl x11, w14, w27, x11 umull x12, w14, w28 umaddl x5, w15, w20, x5 umaddl x6, w15, w21, x6 umaddl x7, w15, w22, x7 umaddl x8, w15, w23, x8 umaddl x9, w15, w24, x9 umaddl x10, w15, w25, x10 umaddl x11, w15, w26, x11 umaddl x12, w15, w27, x12 umull x13, w15, w28 umaddl x6, w16, w20, x6 umaddl x7, w16, w21, x7 umaddl x8, w16, w22, x8 umaddl x9, w16, w23, x9 umaddl x10, w16, w24, x10 umaddl x11, w16, w25, x11 umaddl x12, w16, w26, x12 umaddl x13, w16, w27, x13 umull x14, w16, w28 umaddl x7, w17, w20, x7 umaddl x8, w17, w21, x8 umaddl x9, w17, w22, x9 umaddl x10, w17, w23, x10 umaddl x11, w17, w24, x11 umaddl x12, w17, w25, x12 umaddl x13, w17, w26, x13 umaddl x14, w17, w27, x14 umull x15, w17, w28 umaddl x8, w18, w20, x8 umaddl x9, w18, w21, x9 umaddl x10, w18, w22, x10 umaddl x11, w18, w23, x11 umaddl x12, w18, w24, x12 umaddl x13, w18, w25, x13 umaddl x14, w18, w26, x14 umaddl x15, w18, w27, x15 umull x16, w18, w28 add x10, x10, x9, lsr #29 and x9, x9, #0x1fffffff umull x9, w9, w30 add x0, x0, x9 add x11, x11, x10, lsr #29 and x10, x10, #0x1fffffff umull x10, w10, w30 add x1, x1, x10 add x12, x12, x11, lsr #29 and x11, x11, #0x1fffffff umull x11, w11, w30 add x2, x2, x11 add x13, x13, x12, lsr #29 and x12, x12, #0x1fffffff umull x12, w12, w30 add x3, x3, x12 add x14, x14, x13, lsr #29 and x13, x13, #0x1fffffff umull x13, w13, w30 add x4, x4, x13 add x15, x15, x14, lsr #29 and x14, x14, #0x1fffffff umull x14, w14, w30 add x5, x5, x14 add x16, x16, x15, lsr #29 and x15, x15, #0x1fffffff umull x15, w15, w30 add x6, x6, x15 lsr x9, x16, #29 and x16, x16, #0x1fffffff umull x16, w16, w30 add x7, x7, x16 umull x9, w9, w30 add x8, x8, x9 add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff add x1, x1, x0, lsr #29 and x0, x0, 0x1fffffff add x6, x6, x5, lsr #29 and x5, x5, 0x1fffffff add x2, x2, x1, lsr #29 and x1, x1, 0x1fffffff add x7, x7, x6, lsr #29 and x6, x6, 0x1fffffff add x3, x3, x2, lsr #29 and x2, x2, 0x1fffffff add x8, x8, x7, lsr #29 and x7, x7, 0x1fffffff add x4, x4, x3, lsr #29 and x3, x3, 0x1fffffff bfi x3, x7, #32, #29 bic x10, x8, #0x7fffff add x0, x0, x10, lsr #23 add x0, x0, x10, lsr #22 add x0, x0, x10, lsr #19 and x8, x8, #0x7fffff add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff bfi x4, x8, #32, #23 add x1, x1, x0, lsr #29 bfi x6, x1, #32, #30 and x0, x0, 0x1fffffff bfi x5, x0, #32, #29 add x29, sp, #672 stp x3, x4, [x29, #0] stp x5, x6, [x29, #16] str x2, [x29, #32] // mul ldr x0, [sp, #152] ldp w13, w17, [x0, #40] ldp w14, w18, [x0, #48] ldp w15, w10, [x0, #56] ldp w16, w11, [x0, #64] ldr w12, [x0, #72] ldp w23, w27, [x29, #40] ldp w24, w28, [x29, #48] ldp w25, w20, [x29, #56] ldp w26, w21, [x29, #64] ldr w22, [x29, #72] umull x0, w10, w20 umull x1, w10, w21 umull x2, w10, w22 umull x3, w10, w23 umull x4, w10, w24 umull x5, w10, w25 umull x6, w10, w26 umull x7, w10, w27 umull x8, w10, w28 umaddl x1, w11, w20, x1 umaddl x2, w11, w21, x2 umaddl x3, w11, w22, x3 umaddl x4, w11, w23, x4 umaddl x5, w11, w24, x5 umaddl x6, w11, w25, x6 umaddl x7, w11, w26, x7 umaddl x8, w11, w27, x8 umull x9, w11, w28 umaddl x2, w12, w20, x2 umaddl x3, w12, w21, x3 umaddl x4, w12, w22, x4 umaddl x5, w12, w23, x5 umaddl x6, w12, w24, x6 umaddl x7, w12, w25, x7 umaddl x8, w12, w26, x8 umaddl x9, w12, w27, x9 umull x10, w12, w28 umaddl x3, w13, w20, x3 umaddl x4, w13, w21, x4 umaddl x5, w13, w22, x5 umaddl x6, w13, w23, x6 umaddl x7, w13, w24, x7 umaddl x8, w13, w25, x8 umaddl x9, w13, w26, x9 umaddl x10, w13, w27, x10 umull x11, w13, w28 umaddl x4, w14, w20, x4 umaddl x5, w14, w21, x5 umaddl x6, w14, w22, x6 umaddl x7, w14, w23, x7 umaddl x8, w14, w24, x8 umaddl x9, w14, w25, x9 umaddl x10, w14, w26, x10 umaddl x11, w14, w27, x11 umull x12, w14, w28 umaddl x5, w15, w20, x5 umaddl x6, w15, w21, x6 umaddl x7, w15, w22, x7 umaddl x8, w15, w23, x8 umaddl x9, w15, w24, x9 umaddl x10, w15, w25, x10 umaddl x11, w15, w26, x11 umaddl x12, w15, w27, x12 umull x13, w15, w28 umaddl x6, w16, w20, x6 umaddl x7, w16, w21, x7 umaddl x8, w16, w22, x8 umaddl x9, w16, w23, x9 umaddl x10, w16, w24, x10 umaddl x11, w16, w25, x11 umaddl x12, w16, w26, x12 umaddl x13, w16, w27, x13 umull x14, w16, w28 umaddl x7, w17, w20, x7 umaddl x8, w17, w21, x8 umaddl x9, w17, w22, x9 umaddl x10, w17, w23, x10 umaddl x11, w17, w24, x11 umaddl x12, w17, w25, x12 umaddl x13, w17, w26, x13 umaddl x14, w17, w27, x14 umull x15, w17, w28 umaddl x8, w18, w20, x8 umaddl x9, w18, w21, x9 umaddl x10, w18, w22, x10 umaddl x11, w18, w23, x11 umaddl x12, w18, w24, x12 umaddl x13, w18, w25, x13 umaddl x14, w18, w26, x14 umaddl x15, w18, w27, x15 umull x16, w18, w28 add x10, x10, x9, lsr #29 and x9, x9, #0x1fffffff umull x9, w9, w30 add x0, x0, x9 add x11, x11, x10, lsr #29 and x10, x10, #0x1fffffff umull x10, w10, w30 add x1, x1, x10 add x12, x12, x11, lsr #29 and x11, x11, #0x1fffffff umull x11, w11, w30 add x2, x2, x11 add x13, x13, x12, lsr #29 and x12, x12, #0x1fffffff umull x12, w12, w30 add x3, x3, x12 add x14, x14, x13, lsr #29 and x13, x13, #0x1fffffff umull x13, w13, w30 add x4, x4, x13 add x15, x15, x14, lsr #29 and x14, x14, #0x1fffffff umull x14, w14, w30 add x5, x5, x14 add x16, x16, x15, lsr #29 and x15, x15, #0x1fffffff umull x15, w15, w30 add x6, x6, x15 lsr x9, x16, #29 and x16, x16, #0x1fffffff umull x16, w16, w30 add x7, x7, x16 umull x9, w9, w30 add x8, x8, x9 add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff add x1, x1, x0, lsr #29 and x0, x0, 0x1fffffff add x6, x6, x5, lsr #29 and x5, x5, 0x1fffffff add x2, x2, x1, lsr #29 and x1, x1, 0x1fffffff add x7, x7, x6, lsr #29 and x6, x6, 0x1fffffff add x3, x3, x2, lsr #29 and x2, x2, 0x1fffffff add x8, x8, x7, lsr #29 and x7, x7, 0x1fffffff add x4, x4, x3, lsr #29 and x3, x3, 0x1fffffff bfi x3, x7, #32, #29 bic x10, x8, #0x7fffff add x0, x0, x10, lsr #23 add x0, x0, x10, lsr #22 add x0, x0, x10, lsr #19 and x8, x8, #0x7fffff add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff bfi x4, x8, #32, #23 add x1, x1, x0, lsr #29 bfi x6, x1, #32, #30 and x0, x0, 0x1fffffff bfi x5, x0, #32, #29 // add add x29, sp, #512 ldp x13, x14, [x29, #160] ldp x15, x16, [x29, #176] ldr x12, [x29, #192] add x0, x3, x13 add x1, x4, x14 add x7, x5, x15 add x8, x6, x16 add x9, x2, x12 stp x0, x1, [x29, #80] stp x7, x8, [x29, #96] str x9, [x29, #112] // sub ldp x20, x21, [sp, #160] ldp x27, x28, [sp, #176] add x3, x3, x20 add x4, x4, x21 add x5, x5, x27 add x6, x6, x20 add x2, x2, x28 sub x3, x3, x13 sub x4, x4, x14 sub x5, x5, x15 sub x6, x6, x16 sub x2, x2, x12 stp x3, x4, [x29, #0] stp x5, x6, [x29, #16] str x2, [x29, #32] // mul ldr x0, [sp, #152] ldp w13, w17, [x0, #80] ldp w14, w18, [x0, #88] ldp w15, w10, [x0, #96] ldp w16, w11, [x0, #104] ldr w12, [x0, #112] add x29, sp, #472 ldp w23, w27, [x29, #0] ldp w24, w28, [x29, #8] ldp w25, w20, [x29, #16] ldp w26, w21, [x29, #24] ldr w22, [x29, #32] umull x0, w10, w20 umull x1, w10, w21 umull x2, w10, w22 umull x3, w10, w23 umull x4, w10, w24 umull x5, w10, w25 umull x6, w10, w26 umull x7, w10, w27 umull x8, w10, w28 umaddl x1, w11, w20, x1 umaddl x2, w11, w21, x2 umaddl x3, w11, w22, x3 umaddl x4, w11, w23, x4 umaddl x5, w11, w24, x5 umaddl x6, w11, w25, x6 umaddl x7, w11, w26, x7 umaddl x8, w11, w27, x8 umull x9, w11, w28 umaddl x2, w12, w20, x2 umaddl x3, w12, w21, x3 umaddl x4, w12, w22, x4 umaddl x5, w12, w23, x5 umaddl x6, w12, w24, x6 umaddl x7, w12, w25, x7 umaddl x8, w12, w26, x8 umaddl x9, w12, w27, x9 umull x10, w12, w28 umaddl x3, w13, w20, x3 umaddl x4, w13, w21, x4 umaddl x5, w13, w22, x5 umaddl x6, w13, w23, x6 umaddl x7, w13, w24, x7 umaddl x8, w13, w25, x8 umaddl x9, w13, w26, x9 umaddl x10, w13, w27, x10 umull x11, w13, w28 umaddl x4, w14, w20, x4 umaddl x5, w14, w21, x5 umaddl x6, w14, w22, x6 umaddl x7, w14, w23, x7 umaddl x8, w14, w24, x8 umaddl x9, w14, w25, x9 umaddl x10, w14, w26, x10 umaddl x11, w14, w27, x11 umull x12, w14, w28 umaddl x5, w15, w20, x5 umaddl x6, w15, w21, x6 umaddl x7, w15, w22, x7 umaddl x8, w15, w23, x8 umaddl x9, w15, w24, x9 umaddl x10, w15, w25, x10 umaddl x11, w15, w26, x11 umaddl x12, w15, w27, x12 umull x13, w15, w28 umaddl x6, w16, w20, x6 umaddl x7, w16, w21, x7 umaddl x8, w16, w22, x8 umaddl x9, w16, w23, x9 umaddl x10, w16, w24, x10 umaddl x11, w16, w25, x11 umaddl x12, w16, w26, x12 umaddl x13, w16, w27, x13 umull x14, w16, w28 umaddl x7, w17, w20, x7 umaddl x8, w17, w21, x8 umaddl x9, w17, w22, x9 umaddl x10, w17, w23, x10 umaddl x11, w17, w24, x11 umaddl x12, w17, w25, x12 umaddl x13, w17, w26, x13 umaddl x14, w17, w27, x14 umull x15, w17, w28 umaddl x8, w18, w20, x8 umaddl x9, w18, w21, x9 umaddl x10, w18, w22, x10 umaddl x11, w18, w23, x11 umaddl x12, w18, w24, x12 umaddl x13, w18, w25, x13 umaddl x14, w18, w26, x14 umaddl x15, w18, w27, x15 umull x16, w18, w28 add x10, x10, x9, lsr #29 and x9, x9, #0x1fffffff umull x9, w9, w30 add x0, x0, x9 add x11, x11, x10, lsr #29 and x10, x10, #0x1fffffff umull x10, w10, w30 add x1, x1, x10 add x12, x12, x11, lsr #29 and x11, x11, #0x1fffffff umull x11, w11, w30 add x2, x2, x11 add x13, x13, x12, lsr #29 and x12, x12, #0x1fffffff umull x12, w12, w30 add x3, x3, x12 add x14, x14, x13, lsr #29 and x13, x13, #0x1fffffff umull x13, w13, w30 add x4, x4, x13 add x15, x15, x14, lsr #29 and x14, x14, #0x1fffffff umull x14, w14, w30 add x5, x5, x14 add x16, x16, x15, lsr #29 and x15, x15, #0x1fffffff umull x15, w15, w30 add x6, x6, x15 lsr x9, x16, #29 and x16, x16, #0x1fffffff umull x16, w16, w30 add x7, x7, x16 umull x9, w9, w30 add x8, x8, x9 add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff add x1, x1, x0, lsr #29 and x0, x0, 0x1fffffff add x6, x6, x5, lsr #29 and x5, x5, 0x1fffffff add x2, x2, x1, lsr #29 and x1, x1, 0x1fffffff add x7, x7, x6, lsr #29 and x6, x6, 0x1fffffff add x3, x3, x2, lsr #29 and x2, x2, 0x1fffffff add x8, x8, x7, lsr #29 and x7, x7, 0x1fffffff add x4, x4, x3, lsr #29 and x3, x3, 0x1fffffff bfi x3, x7, #32, #29 bic x10, x8, #0x7fffff add x0, x0, x10, lsr #23 add x0, x0, x10, lsr #22 add x0, x0, x10, lsr #19 and x8, x8, #0x7fffff add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff bfi x4, x8, #32, #23 add x1, x1, x0, lsr #29 bfi x6, x1, #32, #30 and x0, x0, 0x1fffffff bfi x5, x0, #32, #29 // double ldp x13, x14, [sp, #432] ldp x15, x16, [sp, #448] ldr x12, [sp, #464] add x13, x13, x13 add x14, x14, x14 add x15, x15, x15 add x16, x16, x16 add x12, x12, x12 lsr x17, x13, #32 mov w13, w13 lsr x18, x14, #32 mov w14, w14 lsr x10, x15, #32 mov w15, w15 lsr x11, x16, #32 mov w16, w16 add x15, x15, x14, lsr #29 and x14, x14, 0x1fffffff add x11, x11, x10, lsr #29 and x10, x10, 0x1fffffff add x16, x16, x15, lsr #29 and x15, x15, 0x1fffffff add x12, x12, x11, lsr #29 and x11, x11, 0x1fffffff add x17, x17, x16, lsr #29 and x16, x16, 0x1fffffff add x13, x13, x12, lsr #29 and x12, x12, 0x1fffffff add x18, x18, x17, lsr #29 and x17, x17, 0x1fffffff add x14, x14, x13, lsr #29 and x13, x13, 0x1fffffff bfi x13, x17, #32, #29 bic x20, x18, #0x7fffff add x10, x10, x20, lsr #23 add x10, x10, x20, lsr #22 add x10, x10, x20, lsr #19 and x18, x18, #0x7fffff add x15, x15, x14, lsr #29 and x14, x14, 0x1fffffff bfi x14, x18, #32, #23 add x11, x11, x10, lsr #29 bfi x16, x11, #32, #30 and x10, x10, 0x1fffffff bfi x15, x10, #32, #29 // sub ldp x20, x21, [sp, #160] ldp x27, x28, [sp, #176] add x0, x13, x20 add x1, x14, x21 add x7, x15, x27 add x8, x16, x20 add x9, x12, x28 sub x0, x0, x3 sub x1, x1, x4 sub x7, x7, x5 sub x8, x8, x6 sub x9, x9, x2 add x29, sp, #552 stp x0, x1, [x29, #80] stp x7, x8, [x29, #96] str x9, [x29, #112] // add add x3, x3, x13 add x4, x4, x14 add x5, x5, x15 add x6, x6, x16 add x2, x2, x12 stp x3, x4, [x29, #0] stp x5, x6, [x29, #16] str x2, [x29, #32] b .L9 .L8: /* p1p1 to p3 */ // mul add x29, sp, #512 ldp w13, w17, [x29, #0] ldp w14, w18, [x29, #8] ldp w15, w10, [x29, #16] ldp w16, w11, [x29, #24] ldr w12, [x29, #32] ldp w23, w27, [x29, #120] ldp w24, w28, [x29, #128] ldp w25, w20, [x29, #136] ldp w26, w21, [x29, #144] ldr w22, [x29, #152] umull x0, w10, w20 umull x1, w10, w21 umull x2, w10, w22 umull x3, w10, w23 umull x4, w10, w24 umull x5, w10, w25 umull x6, w10, w26 umull x7, w10, w27 umull x8, w10, w28 umaddl x1, w11, w20, x1 umaddl x2, w11, w21, x2 umaddl x3, w11, w22, x3 umaddl x4, w11, w23, x4 umaddl x5, w11, w24, x5 umaddl x6, w11, w25, x6 umaddl x7, w11, w26, x7 umaddl x8, w11, w27, x8 umull x9, w11, w28 umaddl x2, w12, w20, x2 umaddl x3, w12, w21, x3 umaddl x4, w12, w22, x4 umaddl x5, w12, w23, x5 umaddl x6, w12, w24, x6 umaddl x7, w12, w25, x7 umaddl x8, w12, w26, x8 umaddl x9, w12, w27, x9 umull x10, w12, w28 umaddl x3, w13, w20, x3 umaddl x4, w13, w21, x4 umaddl x5, w13, w22, x5 umaddl x6, w13, w23, x6 umaddl x7, w13, w24, x7 umaddl x8, w13, w25, x8 umaddl x9, w13, w26, x9 umaddl x10, w13, w27, x10 umull x11, w13, w28 umaddl x4, w14, w20, x4 umaddl x5, w14, w21, x5 umaddl x6, w14, w22, x6 umaddl x7, w14, w23, x7 umaddl x8, w14, w24, x8 umaddl x9, w14, w25, x9 umaddl x10, w14, w26, x10 umaddl x11, w14, w27, x11 umull x12, w14, w28 umaddl x5, w15, w20, x5 umaddl x6, w15, w21, x6 umaddl x7, w15, w22, x7 umaddl x8, w15, w23, x8 umaddl x9, w15, w24, x9 umaddl x10, w15, w25, x10 umaddl x11, w15, w26, x11 umaddl x12, w15, w27, x12 umull x13, w15, w28 umaddl x6, w16, w20, x6 umaddl x7, w16, w21, x7 umaddl x8, w16, w22, x8 umaddl x9, w16, w23, x9 umaddl x10, w16, w24, x10 umaddl x11, w16, w25, x11 umaddl x12, w16, w26, x12 umaddl x13, w16, w27, x13 umull x14, w16, w28 umaddl x7, w17, w20, x7 umaddl x8, w17, w21, x8 umaddl x9, w17, w22, x9 umaddl x10, w17, w23, x10 umaddl x11, w17, w24, x11 umaddl x12, w17, w25, x12 umaddl x13, w17, w26, x13 umaddl x14, w17, w27, x14 umull x15, w17, w28 umaddl x8, w18, w20, x8 umaddl x9, w18, w21, x9 umaddl x10, w18, w22, x10 umaddl x11, w18, w23, x11 umaddl x12, w18, w24, x12 umaddl x13, w18, w25, x13 umaddl x14, w18, w26, x14 umaddl x15, w18, w27, x15 umull x16, w18, w28 add x10, x10, x9, lsr #29 and x9, x9, #0x1fffffff umull x9, w9, w30 add x0, x0, x9 add x11, x11, x10, lsr #29 and x10, x10, #0x1fffffff umull x10, w10, w30 add x1, x1, x10 add x12, x12, x11, lsr #29 and x11, x11, #0x1fffffff umull x11, w11, w30 add x2, x2, x11 add x13, x13, x12, lsr #29 and x12, x12, #0x1fffffff umull x12, w12, w30 add x3, x3, x12 add x14, x14, x13, lsr #29 and x13, x13, #0x1fffffff umull x13, w13, w30 add x4, x4, x13 add x15, x15, x14, lsr #29 and x14, x14, #0x1fffffff umull x14, w14, w30 add x5, x5, x14 add x16, x16, x15, lsr #29 and x15, x15, #0x1fffffff umull x15, w15, w30 add x6, x6, x15 lsr x9, x16, #29 and x16, x16, #0x1fffffff umull x16, w16, w30 add x7, x7, x16 umull x9, w9, w30 add x8, x8, x9 add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff add x1, x1, x0, lsr #29 and x0, x0, 0x1fffffff add x6, x6, x5, lsr #29 and x5, x5, 0x1fffffff add x2, x2, x1, lsr #29 and x1, x1, 0x1fffffff add x7, x7, x6, lsr #29 and x6, x6, 0x1fffffff add x3, x3, x2, lsr #29 and x2, x2, 0x1fffffff add x8, x8, x7, lsr #29 and x7, x7, 0x1fffffff add x4, x4, x3, lsr #29 and x3, x3, 0x1fffffff bfi x3, x7, #32, #29 bic x10, x8, #0x7fffff add x0, x0, x10, lsr #23 add x0, x0, x10, lsr #22 add x0, x0, x10, lsr #19 and x8, x8, #0x7fffff add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff bfi x4, x8, #32, #23 add x1, x1, x0, lsr #29 bfi x6, x1, #32, #30 and x0, x0, 0x1fffffff bfi x5, x0, #32, #29 stp x3, x4, [sp, #352] stp x5, x6, [sp, #368] str x2, [sp, #384] // mul add x29, sp, #552 ldp w13, w17, [x29, #0] ldp w14, w18, [x29, #8] ldp w15, w10, [x29, #16] ldp w16, w11, [x29, #24] ldr w12, [x29, #32] ldp w23, w27, [x29, #40] ldp w24, w28, [x29, #48] ldp w25, w20, [x29, #56] ldp w26, w21, [x29, #64] ldr w22, [x29, #72] umull x0, w10, w20 umull x1, w10, w21 umull x2, w10, w22 umull x3, w10, w23 umull x4, w10, w24 umull x5, w10, w25 umull x6, w10, w26 umull x7, w10, w27 umull x8, w10, w28 umaddl x1, w11, w20, x1 umaddl x2, w11, w21, x2 umaddl x3, w11, w22, x3 umaddl x4, w11, w23, x4 umaddl x5, w11, w24, x5 umaddl x6, w11, w25, x6 umaddl x7, w11, w26, x7 umaddl x8, w11, w27, x8 umull x9, w11, w28 umaddl x2, w12, w20, x2 umaddl x3, w12, w21, x3 umaddl x4, w12, w22, x4 umaddl x5, w12, w23, x5 umaddl x6, w12, w24, x6 umaddl x7, w12, w25, x7 umaddl x8, w12, w26, x8 umaddl x9, w12, w27, x9 umull x10, w12, w28 umaddl x3, w13, w20, x3 umaddl x4, w13, w21, x4 umaddl x5, w13, w22, x5 umaddl x6, w13, w23, x6 umaddl x7, w13, w24, x7 umaddl x8, w13, w25, x8 umaddl x9, w13, w26, x9 umaddl x10, w13, w27, x10 umull x11, w13, w28 umaddl x4, w14, w20, x4 umaddl x5, w14, w21, x5 umaddl x6, w14, w22, x6 umaddl x7, w14, w23, x7 umaddl x8, w14, w24, x8 umaddl x9, w14, w25, x9 umaddl x10, w14, w26, x10 umaddl x11, w14, w27, x11 umull x12, w14, w28 umaddl x5, w15, w20, x5 umaddl x6, w15, w21, x6 umaddl x7, w15, w22, x7 umaddl x8, w15, w23, x8 umaddl x9, w15, w24, x9 umaddl x10, w15, w25, x10 umaddl x11, w15, w26, x11 umaddl x12, w15, w27, x12 umull x13, w15, w28 umaddl x6, w16, w20, x6 umaddl x7, w16, w21, x7 umaddl x8, w16, w22, x8 umaddl x9, w16, w23, x9 umaddl x10, w16, w24, x10 umaddl x11, w16, w25, x11 umaddl x12, w16, w26, x12 umaddl x13, w16, w27, x13 umull x14, w16, w28 umaddl x7, w17, w20, x7 umaddl x8, w17, w21, x8 umaddl x9, w17, w22, x9 umaddl x10, w17, w23, x10 umaddl x11, w17, w24, x11 umaddl x12, w17, w25, x12 umaddl x13, w17, w26, x13 umaddl x14, w17, w27, x14 umull x15, w17, w28 umaddl x8, w18, w20, x8 umaddl x9, w18, w21, x9 umaddl x10, w18, w22, x10 umaddl x11, w18, w23, x11 umaddl x12, w18, w24, x12 umaddl x13, w18, w25, x13 umaddl x14, w18, w26, x14 umaddl x15, w18, w27, x15 umull x16, w18, w28 add x10, x10, x9, lsr #29 and x9, x9, #0x1fffffff umull x9, w9, w30 add x0, x0, x9 add x11, x11, x10, lsr #29 and x10, x10, #0x1fffffff umull x10, w10, w30 add x1, x1, x10 add x12, x12, x11, lsr #29 and x11, x11, #0x1fffffff umull x11, w11, w30 add x2, x2, x11 add x13, x13, x12, lsr #29 and x12, x12, #0x1fffffff umull x12, w12, w30 add x3, x3, x12 add x14, x14, x13, lsr #29 and x13, x13, #0x1fffffff umull x13, w13, w30 add x4, x4, x13 add x15, x15, x14, lsr #29 and x14, x14, #0x1fffffff umull x14, w14, w30 add x5, x5, x14 add x16, x16, x15, lsr #29 and x15, x15, #0x1fffffff umull x15, w15, w30 add x6, x6, x15 lsr x9, x16, #29 and x16, x16, #0x1fffffff umull x16, w16, w30 add x7, x7, x16 umull x9, w9, w30 add x8, x8, x9 add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff add x1, x1, x0, lsr #29 and x0, x0, 0x1fffffff add x6, x6, x5, lsr #29 and x5, x5, 0x1fffffff add x2, x2, x1, lsr #29 and x1, x1, 0x1fffffff add x7, x7, x6, lsr #29 and x6, x6, 0x1fffffff add x3, x3, x2, lsr #29 and x2, x2, 0x1fffffff add x8, x8, x7, lsr #29 and x7, x7, 0x1fffffff add x4, x4, x3, lsr #29 and x3, x3, 0x1fffffff bfi x3, x7, #32, #29 bic x10, x8, #0x7fffff add x0, x0, x10, lsr #23 add x0, x0, x10, lsr #22 add x0, x0, x10, lsr #19 and x8, x8, #0x7fffff add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff bfi x4, x8, #32, #23 add x1, x1, x0, lsr #29 bfi x6, x1, #32, #30 and x0, x0, 0x1fffffff bfi x5, x0, #32, #29 stp x3, x4, [sp, #392] stp x5, x6, [sp, #408] str x2, [sp, #424] // mul add x29, sp, #552 ldp w13, w17, [x29, #0] ldp w14, w18, [x29, #8] ldp w15, w10, [x29, #16] ldp w16, w11, [x29, #24] ldr w12, [x29, #32] ldp w23, w27, [x29, #80] ldp w24, w28, [x29, #88] ldp w25, w20, [x29, #96] ldp w26, w21, [x29, #104] ldr w22, [x29, #112] umull x0, w10, w20 umull x1, w10, w21 umull x2, w10, w22 umull x3, w10, w23 umull x4, w10, w24 umull x5, w10, w25 umull x6, w10, w26 umull x7, w10, w27 umull x8, w10, w28 umaddl x1, w11, w20, x1 umaddl x2, w11, w21, x2 umaddl x3, w11, w22, x3 umaddl x4, w11, w23, x4 umaddl x5, w11, w24, x5 umaddl x6, w11, w25, x6 umaddl x7, w11, w26, x7 umaddl x8, w11, w27, x8 umull x9, w11, w28 umaddl x2, w12, w20, x2 umaddl x3, w12, w21, x3 umaddl x4, w12, w22, x4 umaddl x5, w12, w23, x5 umaddl x6, w12, w24, x6 umaddl x7, w12, w25, x7 umaddl x8, w12, w26, x8 umaddl x9, w12, w27, x9 umull x10, w12, w28 umaddl x3, w13, w20, x3 umaddl x4, w13, w21, x4 umaddl x5, w13, w22, x5 umaddl x6, w13, w23, x6 umaddl x7, w13, w24, x7 umaddl x8, w13, w25, x8 umaddl x9, w13, w26, x9 umaddl x10, w13, w27, x10 umull x11, w13, w28 umaddl x4, w14, w20, x4 umaddl x5, w14, w21, x5 umaddl x6, w14, w22, x6 umaddl x7, w14, w23, x7 umaddl x8, w14, w24, x8 umaddl x9, w14, w25, x9 umaddl x10, w14, w26, x10 umaddl x11, w14, w27, x11 umull x12, w14, w28 umaddl x5, w15, w20, x5 umaddl x6, w15, w21, x6 umaddl x7, w15, w22, x7 umaddl x8, w15, w23, x8 umaddl x9, w15, w24, x9 umaddl x10, w15, w25, x10 umaddl x11, w15, w26, x11 umaddl x12, w15, w27, x12 umull x13, w15, w28 umaddl x6, w16, w20, x6 umaddl x7, w16, w21, x7 umaddl x8, w16, w22, x8 umaddl x9, w16, w23, x9 umaddl x10, w16, w24, x10 umaddl x11, w16, w25, x11 umaddl x12, w16, w26, x12 umaddl x13, w16, w27, x13 umull x14, w16, w28 umaddl x7, w17, w20, x7 umaddl x8, w17, w21, x8 umaddl x9, w17, w22, x9 umaddl x10, w17, w23, x10 umaddl x11, w17, w24, x11 umaddl x12, w17, w25, x12 umaddl x13, w17, w26, x13 umaddl x14, w17, w27, x14 umull x15, w17, w28 umaddl x8, w18, w20, x8 umaddl x9, w18, w21, x9 umaddl x10, w18, w22, x10 umaddl x11, w18, w23, x11 umaddl x12, w18, w24, x12 umaddl x13, w18, w25, x13 umaddl x14, w18, w26, x14 umaddl x15, w18, w27, x15 umull x16, w18, w28 add x10, x10, x9, lsr #29 and x9, x9, #0x1fffffff umull x9, w9, w30 add x0, x0, x9 add x11, x11, x10, lsr #29 and x10, x10, #0x1fffffff umull x10, w10, w30 add x1, x1, x10 add x12, x12, x11, lsr #29 and x11, x11, #0x1fffffff umull x11, w11, w30 add x2, x2, x11 add x13, x13, x12, lsr #29 and x12, x12, #0x1fffffff umull x12, w12, w30 add x3, x3, x12 add x14, x14, x13, lsr #29 and x13, x13, #0x1fffffff umull x13, w13, w30 add x4, x4, x13 add x15, x15, x14, lsr #29 and x14, x14, #0x1fffffff umull x14, w14, w30 add x5, x5, x14 add x16, x16, x15, lsr #29 and x15, x15, #0x1fffffff umull x15, w15, w30 add x6, x6, x15 lsr x9, x16, #29 and x16, x16, #0x1fffffff umull x16, w16, w30 add x7, x7, x16 umull x9, w9, w30 add x8, x8, x9 add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff add x1, x1, x0, lsr #29 and x0, x0, 0x1fffffff add x6, x6, x5, lsr #29 and x5, x5, 0x1fffffff add x2, x2, x1, lsr #29 and x1, x1, 0x1fffffff add x7, x7, x6, lsr #29 and x6, x6, 0x1fffffff add x3, x3, x2, lsr #29 and x2, x2, 0x1fffffff add x8, x8, x7, lsr #29 and x7, x7, 0x1fffffff add x4, x4, x3, lsr #29 and x3, x3, 0x1fffffff bfi x3, x7, #32, #29 bic x10, x8, #0x7fffff add x0, x0, x10, lsr #23 add x0, x0, x10, lsr #22 add x0, x0, x10, lsr #19 and x8, x8, #0x7fffff add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff bfi x4, x8, #32, #23 add x1, x1, x0, lsr #29 bfi x6, x1, #32, #30 and x0, x0, 0x1fffffff bfi x5, x0, #32, #29 stp x3, x4, [sp, #432] stp x5, x6, [sp, #448] str x2, [sp, #464] // mul add x29, sp, #512 ldp w13, w17, [x29, #0] ldp w14, w18, [x29, #8] ldp w15, w10, [x29, #16] ldp w16, w11, [x29, #24] ldr w12, [x29, #32] ldp w23, w27, [x29, #80] ldp w24, w28, [x29, #88] ldp w25, w20, [x29, #96] ldp w26, w21, [x29, #104] ldr w22, [x29, #112] umull x0, w10, w20 umull x1, w10, w21 umull x2, w10, w22 umull x3, w10, w23 umull x4, w10, w24 umull x5, w10, w25 umull x6, w10, w26 umull x7, w10, w27 umull x8, w10, w28 umaddl x1, w11, w20, x1 umaddl x2, w11, w21, x2 umaddl x3, w11, w22, x3 umaddl x4, w11, w23, x4 umaddl x5, w11, w24, x5 umaddl x6, w11, w25, x6 umaddl x7, w11, w26, x7 umaddl x8, w11, w27, x8 umull x9, w11, w28 umaddl x2, w12, w20, x2 umaddl x3, w12, w21, x3 umaddl x4, w12, w22, x4 umaddl x5, w12, w23, x5 umaddl x6, w12, w24, x6 umaddl x7, w12, w25, x7 umaddl x8, w12, w26, x8 umaddl x9, w12, w27, x9 umull x10, w12, w28 umaddl x3, w13, w20, x3 umaddl x4, w13, w21, x4 umaddl x5, w13, w22, x5 umaddl x6, w13, w23, x6 umaddl x7, w13, w24, x7 umaddl x8, w13, w25, x8 umaddl x9, w13, w26, x9 umaddl x10, w13, w27, x10 umull x11, w13, w28 umaddl x4, w14, w20, x4 umaddl x5, w14, w21, x5 umaddl x6, w14, w22, x6 umaddl x7, w14, w23, x7 umaddl x8, w14, w24, x8 umaddl x9, w14, w25, x9 umaddl x10, w14, w26, x10 umaddl x11, w14, w27, x11 umull x12, w14, w28 umaddl x5, w15, w20, x5 umaddl x6, w15, w21, x6 umaddl x7, w15, w22, x7 umaddl x8, w15, w23, x8 umaddl x9, w15, w24, x9 umaddl x10, w15, w25, x10 umaddl x11, w15, w26, x11 umaddl x12, w15, w27, x12 umull x13, w15, w28 umaddl x6, w16, w20, x6 umaddl x7, w16, w21, x7 umaddl x8, w16, w22, x8 umaddl x9, w16, w23, x9 umaddl x10, w16, w24, x10 umaddl x11, w16, w25, x11 umaddl x12, w16, w26, x12 umaddl x13, w16, w27, x13 umull x14, w16, w28 umaddl x7, w17, w20, x7 umaddl x8, w17, w21, x8 umaddl x9, w17, w22, x9 umaddl x10, w17, w23, x10 umaddl x11, w17, w24, x11 umaddl x12, w17, w25, x12 umaddl x13, w17, w26, x13 umaddl x14, w17, w27, x14 umull x15, w17, w28 umaddl x8, w18, w20, x8 umaddl x9, w18, w21, x9 umaddl x10, w18, w22, x10 umaddl x11, w18, w23, x11 umaddl x12, w18, w24, x12 umaddl x13, w18, w25, x13 umaddl x14, w18, w26, x14 umaddl x15, w18, w27, x15 umull x16, w18, w28 add x10, x10, x9, lsr #29 and x9, x9, #0x1fffffff umull x9, w9, w30 add x0, x0, x9 add x11, x11, x10, lsr #29 and x10, x10, #0x1fffffff umull x10, w10, w30 add x1, x1, x10 add x12, x12, x11, lsr #29 and x11, x11, #0x1fffffff umull x11, w11, w30 add x2, x2, x11 add x13, x13, x12, lsr #29 and x12, x12, #0x1fffffff umull x12, w12, w30 add x3, x3, x12 add x14, x14, x13, lsr #29 and x13, x13, #0x1fffffff umull x13, w13, w30 add x4, x4, x13 add x15, x15, x14, lsr #29 and x14, x14, #0x1fffffff umull x14, w14, w30 add x5, x5, x14 add x16, x16, x15, lsr #29 and x15, x15, #0x1fffffff umull x15, w15, w30 add x6, x6, x15 lsr x9, x16, #29 and x16, x16, #0x1fffffff umull x16, w16, w30 add x7, x7, x16 umull x9, w9, w30 add x8, x8, x9 add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff add x1, x1, x0, lsr #29 and x0, x0, 0x1fffffff add x6, x6, x5, lsr #29 and x5, x5, 0x1fffffff add x2, x2, x1, lsr #29 and x1, x1, 0x1fffffff add x7, x7, x6, lsr #29 and x6, x6, 0x1fffffff add x3, x3, x2, lsr #29 and x2, x2, 0x1fffffff add x8, x8, x7, lsr #29 and x7, x7, 0x1fffffff add x4, x4, x3, lsr #29 and x3, x3, 0x1fffffff bfi x3, x7, #32, #29 bic x10, x8, #0x7fffff add x0, x0, x10, lsr #23 add x0, x0, x10, lsr #22 add x0, x0, x10, lsr #19 and x8, x8, #0x7fffff add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff bfi x4, x8, #32, #23 add x1, x1, x0, lsr #29 bfi x6, x1, #32, #30 and x0, x0, 0x1fffffff bfi x5, x0, #32, #29 stp x3, x4, [sp, #472] stp x5, x6, [sp, #488] str x2, [sp, #504] mov w9, wzr ldr w26, [sp, #144] sub w9, w9, w26 lsr w9, w9, #1 mov w8, #120 mul x8, x8, x9 ldr x0, [sp, #112] add x0, x0, x8 str x0, [sp, #152] /* nielssub p1p1 */ // neg ldr x0, [sp, #152] ldp x13, x14, [x0, #80] ldp x15, x16, [x0, #96] ldr x12, [x0, #112] ldp x20, x21, [sp, #160] ldp x27, x28, [sp, #176] sub x13, x20, x13 sub x14, x21, x14 sub x15, x27, x15 sub x16, x20, x16 sub x12, x28, x12 add x29, sp, #712 stp x13, x14, [x29, #40] stp x15, x16, [x29, #56] str x12, [x29, #72] // add ldp x23, x24, [sp, #392] ldp x25, x26, [sp, #408] ldr x22, [sp, #424] ldp x13, x14, [sp, #352] ldp x15, x16, [sp, #368] ldr x12, [sp, #384] add x3, x23, x13 add x4, x24, x14 add x5, x25, x15 add x6, x26, x16 add x2, x22, x12 stp x3, x4, [x29, #0] stp x5, x6, [x29, #16] str x2, [x29, #32] // sub add x23, x23, x20 add x24, x24, x21 add x25, x25, x27 add x26, x26, x20 add x22, x22, x28 sub x23, x23, x13 sub x24, x24, x14 sub x25, x25, x15 sub x26, x26, x16 sub x22, x22, x12 // mul ldr x0, [sp, #152] ldp w13, w17, [x0, #40] ldp w14, w18, [x0, #48] ldp w15, w10, [x0, #56] ldp w16, w11, [x0, #64] ldr w12, [x0, #72] lsr x27, x23, #32 lsr x28, x24, #32 lsr x20, x25, #32 lsr x21, x26, #32 umull x0, w10, w20 umull x1, w10, w21 umull x2, w10, w22 umull x3, w10, w23 umull x4, w10, w24 umull x5, w10, w25 umull x6, w10, w26 umull x7, w10, w27 umull x8, w10, w28 umaddl x1, w11, w20, x1 umaddl x2, w11, w21, x2 umaddl x3, w11, w22, x3 umaddl x4, w11, w23, x4 umaddl x5, w11, w24, x5 umaddl x6, w11, w25, x6 umaddl x7, w11, w26, x7 umaddl x8, w11, w27, x8 umull x9, w11, w28 umaddl x2, w12, w20, x2 umaddl x3, w12, w21, x3 umaddl x4, w12, w22, x4 umaddl x5, w12, w23, x5 umaddl x6, w12, w24, x6 umaddl x7, w12, w25, x7 umaddl x8, w12, w26, x8 umaddl x9, w12, w27, x9 umull x10, w12, w28 umaddl x3, w13, w20, x3 umaddl x4, w13, w21, x4 umaddl x5, w13, w22, x5 umaddl x6, w13, w23, x6 umaddl x7, w13, w24, x7 umaddl x8, w13, w25, x8 umaddl x9, w13, w26, x9 umaddl x10, w13, w27, x10 umull x11, w13, w28 umaddl x4, w14, w20, x4 umaddl x5, w14, w21, x5 umaddl x6, w14, w22, x6 umaddl x7, w14, w23, x7 umaddl x8, w14, w24, x8 umaddl x9, w14, w25, x9 umaddl x10, w14, w26, x10 umaddl x11, w14, w27, x11 umull x12, w14, w28 umaddl x5, w15, w20, x5 umaddl x6, w15, w21, x6 umaddl x7, w15, w22, x7 umaddl x8, w15, w23, x8 umaddl x9, w15, w24, x9 umaddl x10, w15, w25, x10 umaddl x11, w15, w26, x11 umaddl x12, w15, w27, x12 umull x13, w15, w28 umaddl x6, w16, w20, x6 umaddl x7, w16, w21, x7 umaddl x8, w16, w22, x8 umaddl x9, w16, w23, x9 umaddl x10, w16, w24, x10 umaddl x11, w16, w25, x11 umaddl x12, w16, w26, x12 umaddl x13, w16, w27, x13 umull x14, w16, w28 umaddl x7, w17, w20, x7 umaddl x8, w17, w21, x8 umaddl x9, w17, w22, x9 umaddl x10, w17, w23, x10 umaddl x11, w17, w24, x11 umaddl x12, w17, w25, x12 umaddl x13, w17, w26, x13 umaddl x14, w17, w27, x14 umull x15, w17, w28 umaddl x8, w18, w20, x8 umaddl x9, w18, w21, x9 umaddl x10, w18, w22, x10 umaddl x11, w18, w23, x11 umaddl x12, w18, w24, x12 umaddl x13, w18, w25, x13 umaddl x14, w18, w26, x14 umaddl x15, w18, w27, x15 umull x16, w18, w28 add x10, x10, x9, lsr #29 and x9, x9, #0x1fffffff umull x9, w9, w30 add x0, x0, x9 add x11, x11, x10, lsr #29 and x10, x10, #0x1fffffff umull x10, w10, w30 add x1, x1, x10 add x12, x12, x11, lsr #29 and x11, x11, #0x1fffffff umull x11, w11, w30 add x2, x2, x11 add x13, x13, x12, lsr #29 and x12, x12, #0x1fffffff umull x12, w12, w30 add x3, x3, x12 add x14, x14, x13, lsr #29 and x13, x13, #0x1fffffff umull x13, w13, w30 add x4, x4, x13 add x15, x15, x14, lsr #29 and x14, x14, #0x1fffffff umull x14, w14, w30 add x5, x5, x14 add x16, x16, x15, lsr #29 and x15, x15, #0x1fffffff umull x15, w15, w30 add x6, x6, x15 lsr x9, x16, #29 and x16, x16, #0x1fffffff umull x16, w16, w30 add x7, x7, x16 umull x9, w9, w30 add x8, x8, x9 add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff add x1, x1, x0, lsr #29 and x0, x0, 0x1fffffff add x6, x6, x5, lsr #29 and x5, x5, 0x1fffffff add x2, x2, x1, lsr #29 and x1, x1, 0x1fffffff add x7, x7, x6, lsr #29 and x6, x6, 0x1fffffff add x3, x3, x2, lsr #29 and x2, x2, 0x1fffffff add x8, x8, x7, lsr #29 and x7, x7, 0x1fffffff add x4, x4, x3, lsr #29 and x3, x3, 0x1fffffff bfi x3, x7, #32, #29 bic x10, x8, #0x7fffff add x0, x0, x10, lsr #23 add x0, x0, x10, lsr #22 add x0, x0, x10, lsr #19 and x8, x8, #0x7fffff add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff bfi x4, x8, #32, #23 add x1, x1, x0, lsr #29 bfi x6, x1, #32, #30 and x0, x0, 0x1fffffff bfi x5, x0, #32, #29 add x29, sp, #672 stp x3, x4, [x29, #0] stp x5, x6, [x29, #16] str x2, [x29, #32] // mul ldr x0, [sp, #152] ldp w13, w17, [x0, #0] ldp w14, w18, [x0, #8] ldp w15, w10, [x0, #16] ldp w16, w11, [x0, #24] ldr w12, [x0, #32] ldp w23, w27, [x29, #40] ldp w24, w28, [x29, #48] ldp w25, w20, [x29, #56] ldp w26, w21, [x29, #64] ldr w22, [x29, #72] umull x0, w10, w20 umull x1, w10, w21 umull x2, w10, w22 umull x3, w10, w23 umull x4, w10, w24 umull x5, w10, w25 umull x6, w10, w26 umull x7, w10, w27 umull x8, w10, w28 umaddl x1, w11, w20, x1 umaddl x2, w11, w21, x2 umaddl x3, w11, w22, x3 umaddl x4, w11, w23, x4 umaddl x5, w11, w24, x5 umaddl x6, w11, w25, x6 umaddl x7, w11, w26, x7 umaddl x8, w11, w27, x8 umull x9, w11, w28 umaddl x2, w12, w20, x2 umaddl x3, w12, w21, x3 umaddl x4, w12, w22, x4 umaddl x5, w12, w23, x5 umaddl x6, w12, w24, x6 umaddl x7, w12, w25, x7 umaddl x8, w12, w26, x8 umaddl x9, w12, w27, x9 umull x10, w12, w28 umaddl x3, w13, w20, x3 umaddl x4, w13, w21, x4 umaddl x5, w13, w22, x5 umaddl x6, w13, w23, x6 umaddl x7, w13, w24, x7 umaddl x8, w13, w25, x8 umaddl x9, w13, w26, x9 umaddl x10, w13, w27, x10 umull x11, w13, w28 umaddl x4, w14, w20, x4 umaddl x5, w14, w21, x5 umaddl x6, w14, w22, x6 umaddl x7, w14, w23, x7 umaddl x8, w14, w24, x8 umaddl x9, w14, w25, x9 umaddl x10, w14, w26, x10 umaddl x11, w14, w27, x11 umull x12, w14, w28 umaddl x5, w15, w20, x5 umaddl x6, w15, w21, x6 umaddl x7, w15, w22, x7 umaddl x8, w15, w23, x8 umaddl x9, w15, w24, x9 umaddl x10, w15, w25, x10 umaddl x11, w15, w26, x11 umaddl x12, w15, w27, x12 umull x13, w15, w28 umaddl x6, w16, w20, x6 umaddl x7, w16, w21, x7 umaddl x8, w16, w22, x8 umaddl x9, w16, w23, x9 umaddl x10, w16, w24, x10 umaddl x11, w16, w25, x11 umaddl x12, w16, w26, x12 umaddl x13, w16, w27, x13 umull x14, w16, w28 umaddl x7, w17, w20, x7 umaddl x8, w17, w21, x8 umaddl x9, w17, w22, x9 umaddl x10, w17, w23, x10 umaddl x11, w17, w24, x11 umaddl x12, w17, w25, x12 umaddl x13, w17, w26, x13 umaddl x14, w17, w27, x14 umull x15, w17, w28 umaddl x8, w18, w20, x8 umaddl x9, w18, w21, x9 umaddl x10, w18, w22, x10 umaddl x11, w18, w23, x11 umaddl x12, w18, w24, x12 umaddl x13, w18, w25, x13 umaddl x14, w18, w26, x14 umaddl x15, w18, w27, x15 umull x16, w18, w28 add x10, x10, x9, lsr #29 and x9, x9, #0x1fffffff umull x9, w9, w30 add x0, x0, x9 add x11, x11, x10, lsr #29 and x10, x10, #0x1fffffff umull x10, w10, w30 add x1, x1, x10 add x12, x12, x11, lsr #29 and x11, x11, #0x1fffffff umull x11, w11, w30 add x2, x2, x11 add x13, x13, x12, lsr #29 and x12, x12, #0x1fffffff umull x12, w12, w30 add x3, x3, x12 add x14, x14, x13, lsr #29 and x13, x13, #0x1fffffff umull x13, w13, w30 add x4, x4, x13 add x15, x15, x14, lsr #29 and x14, x14, #0x1fffffff umull x14, w14, w30 add x5, x5, x14 add x16, x16, x15, lsr #29 and x15, x15, #0x1fffffff umull x15, w15, w30 add x6, x6, x15 lsr x9, x16, #29 and x16, x16, #0x1fffffff umull x16, w16, w30 add x7, x7, x16 umull x9, w9, w30 add x8, x8, x9 add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff add x1, x1, x0, lsr #29 and x0, x0, 0x1fffffff add x6, x6, x5, lsr #29 and x5, x5, 0x1fffffff add x2, x2, x1, lsr #29 and x1, x1, 0x1fffffff add x7, x7, x6, lsr #29 and x6, x6, 0x1fffffff add x3, x3, x2, lsr #29 and x2, x2, 0x1fffffff add x8, x8, x7, lsr #29 and x7, x7, 0x1fffffff add x4, x4, x3, lsr #29 and x3, x3, 0x1fffffff bfi x3, x7, #32, #29 bic x10, x8, #0x7fffff add x0, x0, x10, lsr #23 add x0, x0, x10, lsr #22 add x0, x0, x10, lsr #19 and x8, x8, #0x7fffff add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff bfi x4, x8, #32, #23 add x1, x1, x0, lsr #29 bfi x6, x1, #32, #30 and x0, x0, 0x1fffffff bfi x5, x0, #32, #29 // add add x29, sp, #472 ldp x13, x14, [x29, #200] ldp x15, x16, [x29, #216] ldr x12, [x29, #232] add x0, x3, x13 add x1, x4, x14 add x7, x5, x15 add x8, x6, x16 add x9, x2, x12 stp x0, x1, [x29, #120] stp x7, x8, [x29, #136] str x9, [x29, #152] // sub ldp x20, x21, [sp, #160] ldp x27, x28, [sp, #176] add x3, x3, x20 add x4, x4, x21 add x5, x5, x27 add x6, x6, x20 add x2, x2, x28 sub x3, x3, x13 sub x4, x4, x14 sub x5, x5, x15 sub x6, x6, x16 sub x2, x2, x12 stp x3, x4, [x29, #40] stp x5, x6, [x29, #56] str x2, [x29, #72] // mul ldp w23, w27, [x29, #0] ldp w24, w28, [x29, #8] ldp w25, w20, [x29, #16] ldp w26, w21, [x29, #24] ldr w22, [x29, #32] add x29, sp, #752 ldp w13, w17, [x29, #0] ldp w14, w18, [x29, #8] ldp w15, w10, [x29, #16] ldp w16, w11, [x29, #24] ldr w12, [x29, #32] umull x0, w10, w20 umull x1, w10, w21 umull x2, w10, w22 umull x3, w10, w23 umull x4, w10, w24 umull x5, w10, w25 umull x6, w10, w26 umull x7, w10, w27 umull x8, w10, w28 umaddl x1, w11, w20, x1 umaddl x2, w11, w21, x2 umaddl x3, w11, w22, x3 umaddl x4, w11, w23, x4 umaddl x5, w11, w24, x5 umaddl x6, w11, w25, x6 umaddl x7, w11, w26, x7 umaddl x8, w11, w27, x8 umull x9, w11, w28 umaddl x2, w12, w20, x2 umaddl x3, w12, w21, x3 umaddl x4, w12, w22, x4 umaddl x5, w12, w23, x5 umaddl x6, w12, w24, x6 umaddl x7, w12, w25, x7 umaddl x8, w12, w26, x8 umaddl x9, w12, w27, x9 umull x10, w12, w28 umaddl x3, w13, w20, x3 umaddl x4, w13, w21, x4 umaddl x5, w13, w22, x5 umaddl x6, w13, w23, x6 umaddl x7, w13, w24, x7 umaddl x8, w13, w25, x8 umaddl x9, w13, w26, x9 umaddl x10, w13, w27, x10 umull x11, w13, w28 umaddl x4, w14, w20, x4 umaddl x5, w14, w21, x5 umaddl x6, w14, w22, x6 umaddl x7, w14, w23, x7 umaddl x8, w14, w24, x8 umaddl x9, w14, w25, x9 umaddl x10, w14, w26, x10 umaddl x11, w14, w27, x11 umull x12, w14, w28 umaddl x5, w15, w20, x5 umaddl x6, w15, w21, x6 umaddl x7, w15, w22, x7 umaddl x8, w15, w23, x8 umaddl x9, w15, w24, x9 umaddl x10, w15, w25, x10 umaddl x11, w15, w26, x11 umaddl x12, w15, w27, x12 umull x13, w15, w28 umaddl x6, w16, w20, x6 umaddl x7, w16, w21, x7 umaddl x8, w16, w22, x8 umaddl x9, w16, w23, x9 umaddl x10, w16, w24, x10 umaddl x11, w16, w25, x11 umaddl x12, w16, w26, x12 umaddl x13, w16, w27, x13 umull x14, w16, w28 umaddl x7, w17, w20, x7 umaddl x8, w17, w21, x8 umaddl x9, w17, w22, x9 umaddl x10, w17, w23, x10 umaddl x11, w17, w24, x11 umaddl x12, w17, w25, x12 umaddl x13, w17, w26, x13 umaddl x14, w17, w27, x14 umull x15, w17, w28 umaddl x8, w18, w20, x8 umaddl x9, w18, w21, x9 umaddl x10, w18, w22, x10 umaddl x11, w18, w23, x11 umaddl x12, w18, w24, x12 umaddl x13, w18, w25, x13 umaddl x14, w18, w26, x14 umaddl x15, w18, w27, x15 umull x16, w18, w28 add x10, x10, x9, lsr #29 and x9, x9, #0x1fffffff umull x9, w9, w30 add x0, x0, x9 add x11, x11, x10, lsr #29 and x10, x10, #0x1fffffff umull x10, w10, w30 add x1, x1, x10 add x12, x12, x11, lsr #29 and x11, x11, #0x1fffffff umull x11, w11, w30 add x2, x2, x11 add x13, x13, x12, lsr #29 and x12, x12, #0x1fffffff umull x12, w12, w30 add x3, x3, x12 add x14, x14, x13, lsr #29 and x13, x13, #0x1fffffff umull x13, w13, w30 add x4, x4, x13 add x15, x15, x14, lsr #29 and x14, x14, #0x1fffffff umull x14, w14, w30 add x5, x5, x14 add x16, x16, x15, lsr #29 and x15, x15, #0x1fffffff umull x15, w15, w30 add x6, x6, x15 lsr x9, x16, #29 and x16, x16, #0x1fffffff umull x16, w16, w30 add x7, x7, x16 umull x9, w9, w30 add x8, x8, x9 add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff add x1, x1, x0, lsr #29 and x0, x0, 0x1fffffff add x6, x6, x5, lsr #29 and x5, x5, 0x1fffffff add x2, x2, x1, lsr #29 and x1, x1, 0x1fffffff add x7, x7, x6, lsr #29 and x6, x6, 0x1fffffff add x3, x3, x2, lsr #29 and x2, x2, 0x1fffffff add x8, x8, x7, lsr #29 and x7, x7, 0x1fffffff add x4, x4, x3, lsr #29 and x3, x3, 0x1fffffff bfi x3, x7, #32, #29 bic x10, x8, #0x7fffff add x0, x0, x10, lsr #23 add x0, x0, x10, lsr #22 add x0, x0, x10, lsr #19 and x8, x8, #0x7fffff add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff bfi x4, x8, #32, #23 add x1, x1, x0, lsr #29 bfi x6, x1, #32, #30 and x0, x0, 0x1fffffff bfi x5, x0, #32, #29 // double ldp x13, x14, [sp, #432] ldp x15, x16, [sp, #448] ldr x12, [sp, #464] add x13, x13, x13 add x14, x14, x14 add x15, x15, x15 add x16, x16, x16 add x12, x12, x12 lsr x17, x13, #32 mov w13, w13 lsr x18, x14, #32 mov w14, w14 lsr x10, x15, #32 mov w15, w15 lsr x11, x16, #32 mov w16, w16 add x15, x15, x14, lsr #29 and x14, x14, 0x1fffffff add x11, x11, x10, lsr #29 and x10, x10, 0x1fffffff add x16, x16, x15, lsr #29 and x15, x15, 0x1fffffff add x12, x12, x11, lsr #29 and x11, x11, 0x1fffffff add x17, x17, x16, lsr #29 and x16, x16, 0x1fffffff add x13, x13, x12, lsr #29 and x12, x12, 0x1fffffff add x18, x18, x17, lsr #29 and x17, x17, 0x1fffffff add x14, x14, x13, lsr #29 and x13, x13, 0x1fffffff bfi x13, x17, #32, #29 bic x20, x18, #0x7fffff add x10, x10, x20, lsr #23 add x10, x10, x20, lsr #22 add x10, x10, x20, lsr #19 and x18, x18, #0x7fffff add x15, x15, x14, lsr #29 and x14, x14, 0x1fffffff bfi x14, x18, #32, #23 add x11, x11, x10, lsr #29 bfi x16, x11, #32, #30 and x10, x10, 0x1fffffff bfi x15, x10, #32, #29 // sub ldp x20, x21, [sp, #160] ldp x27, x28, [sp, #176] add x0, x13, x20 add x1, x14, x21 add x7, x15, x27 add x8, x16, x20 add x9, x12, x28 sub x0, x0, x3 sub x1, x1, x4 sub x7, x7, x5 sub x8, x8, x6 sub x9, x9, x2 add x29, sp, #552 stp x0, x1, [x29, #80] stp x7, x8, [x29, #96] str x9, [x29, #112] // add add x3, x3, x13 add x4, x4, x14 add x5, x5, x15 add x6, x6, x16 add x2, x2, x12 stp x3, x4, [x29, #0] stp x5, x6, [x29, #16] str x2, [x29, #32] .L9: /* p1p1 to p2 */ // mul add x29, sp, #512 ldp w13, w17, [x29, #0] ldp w14, w18, [x29, #8] ldp w15, w10, [x29, #16] ldp w16, w11, [x29, #24] ldr w12, [x29, #32] ldp w23, w27, [x29, #120] ldp w24, w28, [x29, #128] ldp w25, w20, [x29, #136] ldp w26, w21, [x29, #144] ldr w22, [x29, #152] umull x0, w10, w20 umull x1, w10, w21 umull x2, w10, w22 umull x3, w10, w23 umull x4, w10, w24 umull x5, w10, w25 umull x6, w10, w26 umull x7, w10, w27 umull x8, w10, w28 umaddl x1, w11, w20, x1 umaddl x2, w11, w21, x2 umaddl x3, w11, w22, x3 umaddl x4, w11, w23, x4 umaddl x5, w11, w24, x5 umaddl x6, w11, w25, x6 umaddl x7, w11, w26, x7 umaddl x8, w11, w27, x8 umull x9, w11, w28 umaddl x2, w12, w20, x2 umaddl x3, w12, w21, x3 umaddl x4, w12, w22, x4 umaddl x5, w12, w23, x5 umaddl x6, w12, w24, x6 umaddl x7, w12, w25, x7 umaddl x8, w12, w26, x8 umaddl x9, w12, w27, x9 umull x10, w12, w28 umaddl x3, w13, w20, x3 umaddl x4, w13, w21, x4 umaddl x5, w13, w22, x5 umaddl x6, w13, w23, x6 umaddl x7, w13, w24, x7 umaddl x8, w13, w25, x8 umaddl x9, w13, w26, x9 umaddl x10, w13, w27, x10 umull x11, w13, w28 umaddl x4, w14, w20, x4 umaddl x5, w14, w21, x5 umaddl x6, w14, w22, x6 umaddl x7, w14, w23, x7 umaddl x8, w14, w24, x8 umaddl x9, w14, w25, x9 umaddl x10, w14, w26, x10 umaddl x11, w14, w27, x11 umull x12, w14, w28 umaddl x5, w15, w20, x5 umaddl x6, w15, w21, x6 umaddl x7, w15, w22, x7 umaddl x8, w15, w23, x8 umaddl x9, w15, w24, x9 umaddl x10, w15, w25, x10 umaddl x11, w15, w26, x11 umaddl x12, w15, w27, x12 umull x13, w15, w28 umaddl x6, w16, w20, x6 umaddl x7, w16, w21, x7 umaddl x8, w16, w22, x8 umaddl x9, w16, w23, x9 umaddl x10, w16, w24, x10 umaddl x11, w16, w25, x11 umaddl x12, w16, w26, x12 umaddl x13, w16, w27, x13 umull x14, w16, w28 umaddl x7, w17, w20, x7 umaddl x8, w17, w21, x8 umaddl x9, w17, w22, x9 umaddl x10, w17, w23, x10 umaddl x11, w17, w24, x11 umaddl x12, w17, w25, x12 umaddl x13, w17, w26, x13 umaddl x14, w17, w27, x14 umull x15, w17, w28 umaddl x8, w18, w20, x8 umaddl x9, w18, w21, x9 umaddl x10, w18, w22, x10 umaddl x11, w18, w23, x11 umaddl x12, w18, w24, x12 umaddl x13, w18, w25, x13 umaddl x14, w18, w26, x14 umaddl x15, w18, w27, x15 umull x16, w18, w28 add x10, x10, x9, lsr #29 and x9, x9, #0x1fffffff umull x9, w9, w30 add x0, x0, x9 add x11, x11, x10, lsr #29 and x10, x10, #0x1fffffff umull x10, w10, w30 add x1, x1, x10 add x12, x12, x11, lsr #29 and x11, x11, #0x1fffffff umull x11, w11, w30 add x2, x2, x11 add x13, x13, x12, lsr #29 and x12, x12, #0x1fffffff umull x12, w12, w30 add x3, x3, x12 add x14, x14, x13, lsr #29 and x13, x13, #0x1fffffff umull x13, w13, w30 add x4, x4, x13 add x15, x15, x14, lsr #29 and x14, x14, #0x1fffffff umull x14, w14, w30 add x5, x5, x14 add x16, x16, x15, lsr #29 and x15, x15, #0x1fffffff umull x15, w15, w30 add x6, x6, x15 lsr x9, x16, #29 and x16, x16, #0x1fffffff umull x16, w16, w30 add x7, x7, x16 umull x9, w9, w30 add x8, x8, x9 add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff add x1, x1, x0, lsr #29 and x0, x0, 0x1fffffff add x6, x6, x5, lsr #29 and x5, x5, 0x1fffffff add x2, x2, x1, lsr #29 and x1, x1, 0x1fffffff add x7, x7, x6, lsr #29 and x6, x6, 0x1fffffff add x3, x3, x2, lsr #29 and x2, x2, 0x1fffffff add x8, x8, x7, lsr #29 and x7, x7, 0x1fffffff add x4, x4, x3, lsr #29 and x3, x3, 0x1fffffff bfi x3, x7, #32, #29 bic x10, x8, #0x7fffff add x0, x0, x10, lsr #23 add x0, x0, x10, lsr #22 add x0, x0, x10, lsr #19 and x8, x8, #0x7fffff add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff bfi x4, x8, #32, #23 add x1, x1, x0, lsr #29 bfi x6, x1, #32, #30 and x0, x0, 0x1fffffff bfi x5, x0, #32, #29 stp x3, x4, [sp, #192] stp x5, x6, [sp, #208] str x2, [sp, #224] // mul add x29, sp, #552 ldp w13, w17, [x29, #0] ldp w14, w18, [x29, #8] ldp w15, w10, [x29, #16] ldp w16, w11, [x29, #24] ldr w12, [x29, #32] ldp w23, w27, [x29, #40] ldp w24, w28, [x29, #48] ldp w25, w20, [x29, #56] ldp w26, w21, [x29, #64] ldr w22, [x29, #72] umull x0, w10, w20 umull x1, w10, w21 umull x2, w10, w22 umull x3, w10, w23 umull x4, w10, w24 umull x5, w10, w25 umull x6, w10, w26 umull x7, w10, w27 umull x8, w10, w28 umaddl x1, w11, w20, x1 umaddl x2, w11, w21, x2 umaddl x3, w11, w22, x3 umaddl x4, w11, w23, x4 umaddl x5, w11, w24, x5 umaddl x6, w11, w25, x6 umaddl x7, w11, w26, x7 umaddl x8, w11, w27, x8 umull x9, w11, w28 umaddl x2, w12, w20, x2 umaddl x3, w12, w21, x3 umaddl x4, w12, w22, x4 umaddl x5, w12, w23, x5 umaddl x6, w12, w24, x6 umaddl x7, w12, w25, x7 umaddl x8, w12, w26, x8 umaddl x9, w12, w27, x9 umull x10, w12, w28 umaddl x3, w13, w20, x3 umaddl x4, w13, w21, x4 umaddl x5, w13, w22, x5 umaddl x6, w13, w23, x6 umaddl x7, w13, w24, x7 umaddl x8, w13, w25, x8 umaddl x9, w13, w26, x9 umaddl x10, w13, w27, x10 umull x11, w13, w28 umaddl x4, w14, w20, x4 umaddl x5, w14, w21, x5 umaddl x6, w14, w22, x6 umaddl x7, w14, w23, x7 umaddl x8, w14, w24, x8 umaddl x9, w14, w25, x9 umaddl x10, w14, w26, x10 umaddl x11, w14, w27, x11 umull x12, w14, w28 umaddl x5, w15, w20, x5 umaddl x6, w15, w21, x6 umaddl x7, w15, w22, x7 umaddl x8, w15, w23, x8 umaddl x9, w15, w24, x9 umaddl x10, w15, w25, x10 umaddl x11, w15, w26, x11 umaddl x12, w15, w27, x12 umull x13, w15, w28 umaddl x6, w16, w20, x6 umaddl x7, w16, w21, x7 umaddl x8, w16, w22, x8 umaddl x9, w16, w23, x9 umaddl x10, w16, w24, x10 umaddl x11, w16, w25, x11 umaddl x12, w16, w26, x12 umaddl x13, w16, w27, x13 umull x14, w16, w28 umaddl x7, w17, w20, x7 umaddl x8, w17, w21, x8 umaddl x9, w17, w22, x9 umaddl x10, w17, w23, x10 umaddl x11, w17, w24, x11 umaddl x12, w17, w25, x12 umaddl x13, w17, w26, x13 umaddl x14, w17, w27, x14 umull x15, w17, w28 umaddl x8, w18, w20, x8 umaddl x9, w18, w21, x9 umaddl x10, w18, w22, x10 umaddl x11, w18, w23, x11 umaddl x12, w18, w24, x12 umaddl x13, w18, w25, x13 umaddl x14, w18, w26, x14 umaddl x15, w18, w27, x15 umull x16, w18, w28 add x10, x10, x9, lsr #29 and x9, x9, #0x1fffffff umull x9, w9, w30 add x0, x0, x9 add x11, x11, x10, lsr #29 and x10, x10, #0x1fffffff umull x10, w10, w30 add x1, x1, x10 add x12, x12, x11, lsr #29 and x11, x11, #0x1fffffff umull x11, w11, w30 add x2, x2, x11 add x13, x13, x12, lsr #29 and x12, x12, #0x1fffffff umull x12, w12, w30 add x3, x3, x12 add x14, x14, x13, lsr #29 and x13, x13, #0x1fffffff umull x13, w13, w30 add x4, x4, x13 add x15, x15, x14, lsr #29 and x14, x14, #0x1fffffff umull x14, w14, w30 add x5, x5, x14 add x16, x16, x15, lsr #29 and x15, x15, #0x1fffffff umull x15, w15, w30 add x6, x6, x15 lsr x9, x16, #29 and x16, x16, #0x1fffffff umull x16, w16, w30 add x7, x7, x16 umull x9, w9, w30 add x8, x8, x9 add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff add x1, x1, x0, lsr #29 and x0, x0, 0x1fffffff add x6, x6, x5, lsr #29 and x5, x5, 0x1fffffff add x2, x2, x1, lsr #29 and x1, x1, 0x1fffffff add x7, x7, x6, lsr #29 and x6, x6, 0x1fffffff add x3, x3, x2, lsr #29 and x2, x2, 0x1fffffff add x8, x8, x7, lsr #29 and x7, x7, 0x1fffffff add x4, x4, x3, lsr #29 and x3, x3, 0x1fffffff bfi x3, x7, #32, #29 bic x10, x8, #0x7fffff add x0, x0, x10, lsr #23 add x0, x0, x10, lsr #22 add x0, x0, x10, lsr #19 and x8, x8, #0x7fffff add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff bfi x4, x8, #32, #23 add x1, x1, x0, lsr #29 bfi x6, x1, #32, #30 and x0, x0, 0x1fffffff bfi x5, x0, #32, #29 stp x3, x4, [sp, #232] stp x5, x6, [sp, #248] str x2, [sp, #264] // mul add x29, sp, #552 ldp w13, w17, [x29, #0] ldp w14, w18, [x29, #8] ldp w15, w10, [x29, #16] ldp w16, w11, [x29, #24] ldr w12, [x29, #32] ldp w23, w27, [x29, #80] ldp w24, w28, [x29, #88] ldp w25, w20, [x29, #96] ldp w26, w21, [x29, #104] ldr w22, [x29, #112] umull x0, w10, w20 umull x1, w10, w21 umull x2, w10, w22 umull x3, w10, w23 umull x4, w10, w24 umull x5, w10, w25 umull x6, w10, w26 umull x7, w10, w27 umull x8, w10, w28 umaddl x1, w11, w20, x1 umaddl x2, w11, w21, x2 umaddl x3, w11, w22, x3 umaddl x4, w11, w23, x4 umaddl x5, w11, w24, x5 umaddl x6, w11, w25, x6 umaddl x7, w11, w26, x7 umaddl x8, w11, w27, x8 umull x9, w11, w28 umaddl x2, w12, w20, x2 umaddl x3, w12, w21, x3 umaddl x4, w12, w22, x4 umaddl x5, w12, w23, x5 umaddl x6, w12, w24, x6 umaddl x7, w12, w25, x7 umaddl x8, w12, w26, x8 umaddl x9, w12, w27, x9 umull x10, w12, w28 umaddl x3, w13, w20, x3 umaddl x4, w13, w21, x4 umaddl x5, w13, w22, x5 umaddl x6, w13, w23, x6 umaddl x7, w13, w24, x7 umaddl x8, w13, w25, x8 umaddl x9, w13, w26, x9 umaddl x10, w13, w27, x10 umull x11, w13, w28 umaddl x4, w14, w20, x4 umaddl x5, w14, w21, x5 umaddl x6, w14, w22, x6 umaddl x7, w14, w23, x7 umaddl x8, w14, w24, x8 umaddl x9, w14, w25, x9 umaddl x10, w14, w26, x10 umaddl x11, w14, w27, x11 umull x12, w14, w28 umaddl x5, w15, w20, x5 umaddl x6, w15, w21, x6 umaddl x7, w15, w22, x7 umaddl x8, w15, w23, x8 umaddl x9, w15, w24, x9 umaddl x10, w15, w25, x10 umaddl x11, w15, w26, x11 umaddl x12, w15, w27, x12 umull x13, w15, w28 umaddl x6, w16, w20, x6 umaddl x7, w16, w21, x7 umaddl x8, w16, w22, x8 umaddl x9, w16, w23, x9 umaddl x10, w16, w24, x10 umaddl x11, w16, w25, x11 umaddl x12, w16, w26, x12 umaddl x13, w16, w27, x13 umull x14, w16, w28 umaddl x7, w17, w20, x7 umaddl x8, w17, w21, x8 umaddl x9, w17, w22, x9 umaddl x10, w17, w23, x10 umaddl x11, w17, w24, x11 umaddl x12, w17, w25, x12 umaddl x13, w17, w26, x13 umaddl x14, w17, w27, x14 umull x15, w17, w28 umaddl x8, w18, w20, x8 umaddl x9, w18, w21, x9 umaddl x10, w18, w22, x10 umaddl x11, w18, w23, x11 umaddl x12, w18, w24, x12 umaddl x13, w18, w25, x13 umaddl x14, w18, w26, x14 umaddl x15, w18, w27, x15 umull x16, w18, w28 add x10, x10, x9, lsr #29 and x9, x9, #0x1fffffff umull x9, w9, w30 add x0, x0, x9 add x11, x11, x10, lsr #29 and x10, x10, #0x1fffffff umull x10, w10, w30 add x1, x1, x10 add x12, x12, x11, lsr #29 and x11, x11, #0x1fffffff umull x11, w11, w30 add x2, x2, x11 add x13, x13, x12, lsr #29 and x12, x12, #0x1fffffff umull x12, w12, w30 add x3, x3, x12 add x14, x14, x13, lsr #29 and x13, x13, #0x1fffffff umull x13, w13, w30 add x4, x4, x13 add x15, x15, x14, lsr #29 and x14, x14, #0x1fffffff umull x14, w14, w30 add x5, x5, x14 add x16, x16, x15, lsr #29 and x15, x15, #0x1fffffff umull x15, w15, w30 add x6, x6, x15 lsr x9, x16, #29 and x16, x16, #0x1fffffff umull x16, w16, w30 add x7, x7, x16 umull x9, w9, w30 add x8, x8, x9 add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff add x1, x1, x0, lsr #29 and x0, x0, 0x1fffffff add x6, x6, x5, lsr #29 and x5, x5, 0x1fffffff add x2, x2, x1, lsr #29 and x1, x1, 0x1fffffff add x7, x7, x6, lsr #29 and x6, x6, 0x1fffffff add x3, x3, x2, lsr #29 and x2, x2, 0x1fffffff add x8, x8, x7, lsr #29 and x7, x7, 0x1fffffff add x4, x4, x3, lsr #29 and x3, x3, 0x1fffffff bfi x3, x7, #32, #29 bic x10, x8, #0x7fffff add x0, x0, x10, lsr #23 add x0, x0, x10, lsr #22 add x0, x0, x10, lsr #19 and x8, x8, #0x7fffff add x5, x5, x4, lsr #29 and x4, x4, 0x1fffffff bfi x4, x8, #32, #23 add x1, x1, x0, lsr #29 bfi x6, x1, #32, #30 and x0, x0, 0x1fffffff bfi x5, x0, #32, #29 stp x3, x4, [sp, #272] stp x5, x6, [sp, #288] str x2, [sp, #304] ldr x25, [sp, #136] sub w25, w25, #1 str x25, [sp, #136] cmp w25, wzr bge .L3 .L10: ldr x0, [sp, #96] ldp x3, x4, [sp, #192] ldp x5, x6, [sp, #208] ldr x2, [sp, #224] stp x3, x4, [x0, #0] stp x5, x6, [x0, #16] str x2, [x0, #32] ldp x3, x4, [sp, #232] ldp x5, x6, [sp, #248] ldr x2, [sp, #264] stp x3, x4, [x0, #40] stp x5, x6, [x0, #56] str x2, [x0, #72] ldp x3, x4, [sp, #272] ldp x5, x6, [sp, #288] ldr x2, [sp, #304] stp x3, x4, [x0, #80] stp x5, x6, [x0, #96] str x2, [x0, #112] ldp x29, x30, [sp, #80] ldp x27, x28, [sp, #64] ldp x25, x26, [sp, #48] ldp x23, x24, [sp, #32] ldp x21, x22, [sp, #16] ldp x19, x20, [sp, #0] add sp, sp, #800 ret .section .note.GNU-stack,"",@progbits