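# File: pqc/crypto_kem/ntru/ntruhps4096821/avx2/square_1_821_patience.s
#
# Size: 159 lines, 3.1 KiB.
# Labelled "ArmAsm" by the listing this text was copied from; the code below
# is x86-64 assembly in GNU as (AT&T) syntax, not ARM assembly.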

# The .data section is opened only to give it 32-byte (2^5) alignment; no data
# is defined in it in the lines shown here.
.data
.p2align 5
# Everything that follows is code.
.text
# Export the routine under two names: the plain one and one with a leading
# underscore (presumably for object formats whose C symbols carry that
# prefix, e.g. Mach-O -- confirm against the build).
.global PQCLEAN_NTRUHPS4096821_AVX2_square_1_821
.global _PQCLEAN_NTRUHPS4096821_AVX2_square_1_821
# PQCLEAN_NTRUHPS4096821_AVX2_square_1_821
#
# Bit permutation on an 821-bit string stored as little-endian 64-bit words:
# input bit i, for i from 0 to 820, is moved to output bit (2*i) mod 821.
# This is what squaring a polynomial with GF(2) coefficients modulo
# x^821 - 1 does to its coefficient bits.
#
# Syntax/ABI: GNU as, AT&T operand order, x86-64.  The two pointer arguments
#             are taken from rdi and rsi (System V AMD64 argument order).
#             Requires BMI2 (pext/pdep).
#
# Inputs:     rdi = destination buffer; 128 bytes (16 qwords) are written
#             rsi = source buffer; the first 104 bytes (13 qwords) are read,
#                   and source bits 821 and above are ignored
# Output:     destination bits 0..820 hold the permuted input; all remaining
#             destination bits up to byte 127 are zero
# Clobbers:   rcx, rdx, r8, r9, r10, r11, flags
#             (rbx, rbp, r12-r15 are saved on entry and restored on exit)
# Aliasing:   destination words are stored before later source words are
#             loaded, so the two buffers must not overlap.
#
# Since 821 is odd, bits 0..410 land on even output positions 2*i and bits
# 411..820 land on odd output positions 2*i - 821.  pext gathers a run of
# input bits, pdep scatters them onto every second output bit.  pdep only
# consumes as many low source bits as its mask has ones, so the source never
# needs to be masked beforehand.
PQCLEAN_NTRUHPS4096821_AVX2_square_1_821:
_PQCLEAN_NTRUHPS4096821_AVX2_square_1_821:
        # Callee-saved registers used below for mask constants.
        push    %r15
        push    %r14
        push    %r13
        push    %r12
        push    %rbx
        push    %rbp

        # ---- Source bits 0..383 (words 0..5): even positions of output words 0..11.
        mov     $0x5555555555555555, %rbp       # scatter mask: even bits 0..62
        mov     $0xffffffff00000000, %rbx       # gather mask: high 32 bits of a word

        mov     0(%rsi), %r11
        pdep    %rbp, %r11, %r10                # low 32 bits -> even bits
        mov     %r10, 0(%rdi)
        pext    %rbx, %r11, %r10                # high 32 bits
        pdep    %rbp, %r10, %r10
        mov     %r10, 8(%rdi)

        mov     8(%rsi), %r11
        pdep    %rbp, %r11, %r10
        mov     %r10, 16(%rdi)
        pext    %rbx, %r11, %r10
        pdep    %rbp, %r10, %r10
        mov     %r10, 24(%rdi)

        mov     16(%rsi), %r11
        pdep    %rbp, %r11, %r10
        mov     %r10, 32(%rdi)
        pext    %rbx, %r11, %r10
        pdep    %rbp, %r10, %r10
        mov     %r10, 40(%rdi)

        mov     24(%rsi), %r11
        pdep    %rbp, %r11, %r10
        mov     %r10, 48(%rdi)
        pext    %rbx, %r11, %r10
        pdep    %rbp, %r10, %r10
        mov     %r10, 56(%rdi)

        mov     32(%rsi), %r11
        pdep    %rbp, %r11, %r10
        mov     %r10, 64(%rdi)
        pext    %rbx, %r11, %r10
        pdep    %rbp, %r10, %r10
        mov     %r10, 72(%rdi)

        mov     40(%rsi), %r11
        pdep    %rbp, %r11, %r10
        mov     %r10, 80(%rdi)
        pext    %rbx, %r11, %r10
        pdep    %rbp, %r10, %r10
        mov     %r10, 88(%rdi)

        # ---- Masks for the wrapped half (source bits 411..820 -> odd positions).
        # The wrap point is source bit 411, which is bit 27 of word 6, so each
        # source word from here on splits into bit runs 0..26, 27..58 and 59..63.
        mov     $0x7fffffff8000000, %r12        # gather mask: bits 27..58 (32 bits)
        mov     $0xaaaaaaaaaaaaaaaa, %r13       # scatter mask: odd bits 1..63
        mov     $0xf800000000000000, %r14       # gather mask: bits 59..63 (5 bits)
        mov     $0x2aa, %r15                    # scatter mask: odd bits 1..9
        mov     $0x15555555555555, %r9          # scatter mask: even bits 0..52
        mov     $0xaaaaaaaaaaaaa800, %r8        # scatter mask: odd bits 11..63

        # ---- Source word 6 (bits 384..447): straddles the wrap point.
        mov     48(%rsi), %r11
        pext    %r12, %r11, %r10                # source bits 411..442
        pdep    %r13, %r10, %r10
        xor     %r10, 0(%rdi)                   # merge with the even bits already stored
        pext    %r14, %r11, %r10                # source bits 443..447
        pdep    %r15, %r10, %r10
        xor     %r10, 8(%rdi)
        pdep    %r9, %r11, %r10                 # source bits 384..410 -> output bits 768..820
        mov     %r10, 96(%rdi)

        # ---- Source words 7..11: three bit runs each, merged into odd positions.
        mov     56(%rsi), %r11
        pdep    %r8, %r11, %r10                 # low 27 bits -> odd bits 11..63
        xor     %r10, 8(%rdi)
        pext    %r12, %r11, %r10
        pdep    %r13, %r10, %r10
        xor     %r10, 16(%rdi)
        pext    %r14, %r11, %r10
        pdep    %r15, %r10, %r10
        xor     %r10, 24(%rdi)

        mov     64(%rsi), %r11
        pdep    %r8, %r11, %r10
        xor     %r10, 24(%rdi)
        pext    %r12, %r11, %r10
        pdep    %r13, %r10, %r10
        xor     %r10, 32(%rdi)
        pext    %r14, %r11, %r10
        pdep    %r15, %r10, %r10
        xor     %r10, 40(%rdi)

        mov     72(%rsi), %r11
        pdep    %r8, %r11, %r10
        xor     %r10, 40(%rdi)
        pext    %r12, %r11, %r10
        pdep    %r13, %r10, %r10
        xor     %r10, 48(%rdi)
        pext    %r14, %r11, %r10
        pdep    %r15, %r10, %r10
        xor     %r10, 56(%rdi)

        mov     80(%rsi), %r11
        pdep    %r8, %r11, %r10
        xor     %r10, 56(%rdi)
        pext    %r12, %r11, %r10
        pdep    %r13, %r10, %r10
        xor     %r10, 64(%rdi)
        pext    %r14, %r11, %r10
        pdep    %r15, %r10, %r10
        xor     %r10, 72(%rdi)

        mov     88(%rsi), %r11
        pdep    %r8, %r11, %r10
        xor     %r10, 72(%rdi)
        pext    %r12, %r11, %r10
        pdep    %r13, %r10, %r10
        xor     %r10, 80(%rdi)
        pext    %r14, %r11, %r10
        pdep    %r15, %r10, %r10
        xor     %r10, 88(%rdi)

        # ---- Source word 12 (bits 768..820): the last, partial word.
        mov     96(%rsi), %r11
        pdep    %r8, %r11, %r10                 # source bits 768..794
        xor     %r10, 88(%rdi)
        mov     $0x1ffffff8000000, %rdx         # gather mask: bits 27..52 (source bits 795..820)
        pext    %rdx, %r11, %r10
        mov     $0xaaaaaaaaaaaaa, %rcx          # scatter mask: odd bits 1..51
        pdep    %rcx, %r10, %r10
        xor     %r10, 96(%rdi)

        # ---- Destination words 13..15 carry no result bits: clear them.
        # Source words 13..15 are not needed and are therefore not loaded.
        movq    $0x0, 104(%rdi)
        movq    $0x0, 112(%rdi)
        movq    $0x0, 120(%rdi)

        # Restore callee-saved registers in reverse push order.
        pop     %rbp
        pop     %rbx
        pop     %r12
        pop     %r13
        pop     %r14
        pop     %r15
        ret