// linker define fe25519_nsquare
// linker use REDMASK51

# ----------------------------------------------------------------------
# fe25519_nsquare: square a five-limb field element in place, repeatedly.
#
# Syntax: GAS, AT&T operand order, assembled through the C preprocessor.
# ABI:    System V AMD64.
# In:     %rdi = rp, pointer to five 64-bit limbs at offsets 0, 8, 16, 24, 32
#         %rsi = n, number of squarings. The loop body runs once before n
#                is tested (signed), so any n <= 1 still squares once.
# Out:    the five limbs at rp are overwritten after every squaring
#         %rax = rp, %rdx = final value of n (kept from the generated code)
# Saved:  %r11 (stack adjustment), %r12-%r15, %rbx, %rbp are spilled to the
#         frame on entry and reloaded before returning.
# Clobb:  %rax, %rcx, %rdx, %rsi, %r8-%r11, flags
# Stack:  frame of 64 + (rsp mod 32) bytes, so %rsp is 32-byte aligned
#         inside the function; slots 0..48 hold the saved registers.
#
# Limb products are accumulated as 128-bit lo:hi pairs:
#         r0 = %rcx:%r8    r1 = %r9:%r10    r2 = %r11:%r12
#         r3 = %r13:%r14   r4 = %r15:%rbx
# The shifts by 51 and 13, and the factors 19 and 38, are consistent with
# radix 2^51 arithmetic modulo 2^255 - 19. REDMASK51 is defined elsewhere;
# presumably it equals 2^51 - 1 -- TODO confirm.
# Input limbs must be small enough that limb*38 fits in 64 bits; the exact
# bound is set by the callers -- TODO confirm.
#
# NOTE(review): this file had been collapsed onto four lines and every
# angle-bracketed span had been stripped, which removed most instructions.
# The sequence below was rebuilt from the surviving fragments and the
# squaring formula; diff it against the pristine upstream file.
# ----------------------------------------------------------------------

.text
.p2align 5
.globl _CRYPTO_SHARED_NAMESPACE(fe25519_nsquare)
.globl CRYPTO_SHARED_NAMESPACE(fe25519_nsquare)
_CRYPTO_SHARED_NAMESPACE(fe25519_nsquare):
CRYPTO_SHARED_NAMESPACE(fe25519_nsquare):
        mov     %rsp,%r11
        and     $31,%r11                # r11 = rsp mod 32
        add     $64,%r11                # plus 64 bytes of spill space
        sub     %r11,%rsp               # rsp is now 32-byte aligned

        # Spill the frame size and the callee-saved registers.
        movq    %r11,0(%rsp)
        movq    %r12,8(%rsp)
        movq    %r13,16(%rsp)
        movq    %r14,24(%rsp)
        movq    %r15,32(%rsp)
        movq    %rbx,40(%rsp)
        movq    %rbp,48(%rsp)

._loop:
        # r0 = x0*x0
        movq    0(%rdi),%rax
        mulq    0(%rdi)
        mov     %rax,%rcx
        mov     %rdx,%r8

        # r1 = 2*x0*x1
        movq    0(%rdi),%rax
        shl     $1,%rax
        mulq    8(%rdi)
        mov     %rax,%r9
        mov     %rdx,%r10

        # r2 = 2*x0*x2
        movq    0(%rdi),%rax
        shl     $1,%rax
        mulq    16(%rdi)
        mov     %rax,%r11
        mov     %rdx,%r12

        # r3 = 2*x0*x3
        movq    0(%rdi),%rax
        shl     $1,%rax
        mulq    24(%rdi)
        mov     %rax,%r13
        mov     %rdx,%r14

        # r4 = 2*x0*x4
        movq    0(%rdi),%rax
        shl     $1,%rax
        mulq    32(%rdi)
        mov     %rax,%r15
        mov     %rdx,%rbx

        # r2 += x1*x1
        movq    8(%rdi),%rax
        mulq    8(%rdi)
        add     %rax,%r11
        adc     %rdx,%r12

        # r3 += 2*x1*x2
        movq    8(%rdi),%rax
        shl     $1,%rax
        mulq    16(%rdi)
        add     %rax,%r13
        adc     %rdx,%r14

        # r4 += 2*x1*x3
        movq    8(%rdi),%rax
        shl     $1,%rax
        mulq    24(%rdi)
        add     %rax,%r15
        adc     %rdx,%rbx

        # r0 += 38*x1*x4   (wraps past limb 4, hence the factor 2*19)
        movq    8(%rdi),%rdx
        imulq   $38,%rdx,%rax
        mulq    32(%rdi)
        add     %rax,%rcx
        adc     %rdx,%r8

        # r4 += x2*x2
        movq    16(%rdi),%rax
        mulq    16(%rdi)
        add     %rax,%r15
        adc     %rdx,%rbx

        # r0 += 38*x2*x3
        movq    16(%rdi),%rdx
        imulq   $38,%rdx,%rax
        mulq    24(%rdi)
        add     %rax,%rcx
        adc     %rdx,%r8

        # r1 += 38*x2*x4
        movq    16(%rdi),%rdx
        imulq   $38,%rdx,%rax
        mulq    32(%rdi)
        add     %rax,%r9
        adc     %rdx,%r10

        # r1 += 19*x3*x3
        movq    24(%rdi),%rdx
        imulq   $19,%rdx,%rax
        mulq    24(%rdi)
        add     %rax,%r9
        adc     %rdx,%r10

        # r2 += 38*x3*x4
        movq    24(%rdi),%rdx
        imulq   $38,%rdx,%rax
        mulq    32(%rdi)
        add     %rax,%r11
        adc     %rdx,%r12

        # r3 += 19*x4*x4
        movq    32(%rdi),%rdx
        imulq   $19,%rdx,%rax
        mulq    32(%rdi)
        add     %rax,%r13
        adc     %rdx,%r14

        movq    CRYPTO_SHARED_NAMESPACE(REDMASK51)(%rip),%rdx

        # Split each 128-bit sum at bit 51: the hi register receives
        # everything above bit 51 (shld by 64-51 = 13), the lo register is
        # masked, and the carry is added into the next limb up.
        shld    $13,%rcx,%r8
        and     %rdx,%rcx
        shld    $13,%r9,%r10
        and     %rdx,%r9
        add     %r8,%r9
        shld    $13,%r11,%r12
        and     %rdx,%r11
        add     %r10,%r11
        shld    $13,%r13,%r14
        and     %rdx,%r13
        add     %r12,%r13
        shld    $13,%r15,%rbx
        and     %rdx,%r15
        add     %r14,%r15
        imulq   $19,%rbx,%r8            # carry out of limb 4 re-enters limb 0 times 19
        add     %r8,%rcx

        # One sequential carry pass over the limbs. %r8 carries the running
        # value; the finished limbs end up in %rcx, %r9, %rax, %r10, %r11.
        mov     %rcx,%r8
        shr     $51,%r8
        add     %r9,%r8
        and     %rdx,%rcx
        mov     %r8,%r9
        shr     $51,%r8
        add     %r11,%r8
        and     %rdx,%r9
        mov     %r8,%rax
        shr     $51,%r8
        add     %r13,%r8
        and     %rdx,%rax
        mov     %r8,%r10
        shr     $51,%r8
        add     %r15,%r8
        and     %rdx,%r10
        mov     %r8,%r11
        shr     $51,%r8
        imulq   $19,%r8,%r8             # top carry wraps to limb 0 times 19
        add     %r8,%rcx
        and     %rdx,%r11

        # Write the result back over the input.
        movq    %rcx,0(%rdi)
        movq    %r9,8(%rdi)
        movq    %rax,16(%rdi)
        movq    %r10,24(%rdi)
        movq    %r11,32(%rdi)

        # n -= 1; repeat while n > 0 (signed compare).
        sub     $1,%rsi
        jg      ._loop

        # Reload the saved registers; %r11 gets the frame size back.
        movq    0(%rsp),%r11
        movq    8(%rsp),%r12
        movq    16(%rsp),%r13
        movq    24(%rsp),%r14
        movq    32(%rsp),%r15
        movq    40(%rsp),%rbx
        movq    48(%rsp),%rbp

        add     %r11,%rsp               # undo the entry adjustment
        mov     %rdi,%rax
        mov     %rsi,%rdx
        ret