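/*
 * Vector Permutation AES for x86_64/SSSE3.
 *
 * GNU as source in AT&T syntax, run through the C preprocessor.  This
 * variant targets Win64: symbols are declared with COFF .def/.scl/.type,
 * public entry points take their arguments in the Microsoft x64 argument
 * registers, and SEH unwind data is emitted in .pdata/.xdata.
 */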
#include "x86_arch.h"
|
|
.text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
/*
 * _vpaes_encrypt_core: encrypt the 16-byte block held in %xmm0.
 *
 * In:   %xmm0         input block
 *       %rdx          key schedule (16-byte entries, loop count at offset 240)
 *       %xmm9-%xmm15  constants as loaded by _vpaes_preheat
 * Out:  %xmm0         output block
 * Clobbers: %rax, %r9, %r10, %r11, %xmm1-%xmm5, flags.
 *
 * SSSE3 instructions are emitted as raw .byte sequences; the instruction
 * each one encodes is given next to it.  Memory operands relative to %r10
 * rely on the table order inside _vpaes_consts.
 */
.def _vpaes_encrypt_core; .scl 3; .type 32; .endef
.p2align 4
_vpaes_encrypt_core:
	movq	%rdx,%r9			/* r9 walks the key schedule */
	movq	$16,%r11			/* r11 = table offset, cycles through 0/16/32/48 */
	movl	240(%rdx),%eax			/* eax = loop counter */
	movdqa	%xmm9,%xmm1
	movdqa	.Lk_ipt(%rip),%xmm2
	pandn	%xmm0,%xmm1			/* xmm1 = input & ~mask (mask = .Lk_s0F) */
	movdqu	(%r9),%xmm5			/* xmm5 = first schedule entry */
	psrld	$4,%xmm1			/* xmm1 = high nibble of every byte */
	pand	%xmm9,%xmm0			/* xmm0 = low nibble of every byte */
	.byte	102,15,56,0,208			/* pshufb %xmm0,%xmm2 */
	movdqa	.Lk_ipt+16(%rip),%xmm0
	.byte	102,15,56,0,193			/* pshufb %xmm1,%xmm0 */
	pxor	%xmm5,%xmm2
	pxor	%xmm2,%xmm0			/* xmm0 = ipt[lo] ^ ipt+16[hi] ^ schedule[0] */
	addq	$16,%r9				/* non-zero result: ZF=0 for the first jnz below */
	leaq	.Lk_mc_backward(%rip),%r10
	jmp	.Lenc_entry

.p2align 4
.Lenc_loop:
	/*
	 * Loop body.  On entry xmm2/xmm3 are the index vectors produced at
	 * .Lenc_entry and xmm5 is the current schedule entry.
	 */
	movdqa	%xmm13,%xmm4			/* .Lk_sb1 */
	.byte	102,15,56,0,226			/* pshufb %xmm2,%xmm4 */
	pxor	%xmm5,%xmm4			/* mix in the schedule entry */
	movdqa	%xmm12,%xmm0			/* .Lk_sb1+16 */
	.byte	102,15,56,0,195			/* pshufb %xmm3,%xmm0 */
	pxor	%xmm4,%xmm0
	movdqa	%xmm15,%xmm5			/* .Lk_sb2 */
	.byte	102,15,56,0,234			/* pshufb %xmm2,%xmm5 */
	movdqa	-64(%r11,%r10,1),%xmm1		/* .Lk_mc_forward + r11 */
	movdqa	%xmm14,%xmm2			/* .Lk_sb2+16 */
	.byte	102,15,56,0,211			/* pshufb %xmm3,%xmm2 */
	pxor	%xmm5,%xmm2
	movdqa	(%r11,%r10,1),%xmm4		/* .Lk_mc_backward + r11 */
	movdqa	%xmm0,%xmm3
	.byte	102,15,56,0,193			/* pshufb %xmm1,%xmm0 */
	addq	$16,%r9				/* next schedule entry */
	pxor	%xmm2,%xmm0
	.byte	102,15,56,0,220			/* pshufb %xmm4,%xmm3 */
	addq	$16,%r11
	pxor	%xmm0,%xmm3
	.byte	102,15,56,0,193			/* pshufb %xmm1,%xmm0 */
	andq	$48,%r11			/* r11 = (r11 + 16) mod 64 */
	pxor	%xmm3,%xmm0
	subq	$1,%rax				/* ZF consumed by jnz at the end of .Lenc_entry */

.Lenc_entry:
	/*
	 * Split xmm0 into nibbles and derive the index vectors xmm2/xmm3
	 * through the .Lk_inv tables (xmm10 = .Lk_inv, xmm11 = .Lk_inv+16).
	 * Only SSE instructions follow, so the flags survive until the jnz.
	 */
	movdqa	%xmm9,%xmm1
	pandn	%xmm0,%xmm1
	psrld	$4,%xmm1			/* xmm1 = high nibbles */
	pand	%xmm9,%xmm0			/* xmm0 = low nibbles */
	movdqa	%xmm11,%xmm5
	.byte	102,15,56,0,232			/* pshufb %xmm0,%xmm5 */
	pxor	%xmm1,%xmm0
	movdqa	%xmm10,%xmm3
	.byte	102,15,56,0,217			/* pshufb %xmm1,%xmm3 */
	pxor	%xmm5,%xmm3
	movdqa	%xmm10,%xmm4
	.byte	102,15,56,0,224			/* pshufb %xmm0,%xmm4 */
	pxor	%xmm5,%xmm4
	movdqa	%xmm10,%xmm2
	.byte	102,15,56,0,211			/* pshufb %xmm3,%xmm2 */
	pxor	%xmm0,%xmm2
	movdqa	%xmm10,%xmm3
	movdqu	(%r9),%xmm5			/* xmm5 = schedule entry for the next step */
	.byte	102,15,56,0,220			/* pshufb %xmm4,%xmm3 */
	pxor	%xmm1,%xmm3
	jnz	.Lenc_loop			/* flags from subq above (or addq on first entry) */

	/* Final step: .Lk_sbo tables, then the .Lk_sr permutation picked by r11. */
	movdqa	-96(%r10),%xmm4			/* .Lk_sbo */
	movdqa	-80(%r10),%xmm0			/* .Lk_sbo+16 */
	.byte	102,15,56,0,226			/* pshufb %xmm2,%xmm4 */
	pxor	%xmm5,%xmm4			/* mix in the last schedule entry */
	.byte	102,15,56,0,195			/* pshufb %xmm3,%xmm0 */
	movdqa	64(%r11,%r10,1),%xmm1		/* .Lk_sr + r11 */
	pxor	%xmm4,%xmm0
	.byte	102,15,56,0,193			/* pshufb %xmm1,%xmm0 */
	retq
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
/*
 * _vpaes_decrypt_core: decrypt the 16-byte block held in %xmm0.
 *
 * In:   %xmm0         input block
 *       %rdx          key schedule (16-byte entries, loop count at offset 240)
 *       %xmm9-%xmm11  constants as loaded by _vpaes_preheat
 * Out:  %xmm0         output block
 * Clobbers: %rax, %r9, %r10, %r11, %xmm1-%xmm5, flags.
 *
 * SSSE3 instructions are emitted as raw .byte sequences; the instruction
 * each one encodes is given next to it.  Memory operands relative to %r10
 * and %r11 rely on the table order inside _vpaes_consts.
 */
.def _vpaes_decrypt_core; .scl 3; .type 32; .endef
.p2align 4
_vpaes_decrypt_core:
	movq	%rdx,%r9			/* r9 walks the key schedule */
	movl	240(%rdx),%eax			/* eax = loop counter */
	movdqa	%xmm9,%xmm1
	movdqa	.Lk_dipt(%rip),%xmm2
	pandn	%xmm0,%xmm1
	movq	%rax,%r11
	psrld	$4,%xmm1			/* xmm1 = high nibble of every byte */
	movdqu	(%r9),%xmm5			/* xmm5 = first schedule entry */
	shlq	$4,%r11				/* r11 = counter * 16 */
	pand	%xmm9,%xmm0			/* xmm0 = low nibble of every byte */
	.byte	102,15,56,0,208			/* pshufb %xmm0,%xmm2 */
	movdqa	.Lk_dipt+16(%rip),%xmm0
	xorq	$48,%r11
	leaq	.Lk_dsbd(%rip),%r10
	.byte	102,15,56,0,193			/* pshufb %xmm1,%xmm0 */
	andq	$48,%r11			/* r11 = ((counter * 16) ^ 48) & 48 */
	pxor	%xmm5,%xmm2
	movdqa	.Lk_mc_forward+48(%rip),%xmm5	/* xmm5 = byte permutation applied between table steps */
	pxor	%xmm2,%xmm0			/* xmm0 = dipt[lo] ^ dipt+16[hi] ^ schedule[0] */
	addq	$16,%r9
	addq	%r10,%r11			/* r11 = .Lk_dsbd + offset; non-zero, so ZF=0 for the first jnz */
	jmp	.Ldec_entry

.p2align 4
.Ldec_loop:
	/*
	 * Loop body.  On entry xmm2/xmm3 are the index vectors produced at
	 * .Ldec_entry and xmm0 is the current schedule entry.
	 */
	movdqa	-32(%r10),%xmm4			/* .Lk_dsb9 */
	.byte	102,15,56,0,226			/* pshufb %xmm2,%xmm4 */
	pxor	%xmm0,%xmm4			/* mix in the schedule entry */
	movdqa	-16(%r10),%xmm0			/* .Lk_dsb9+16 */
	.byte	102,15,56,0,195			/* pshufb %xmm3,%xmm0 */
	pxor	%xmm4,%xmm0
	addq	$16,%r9				/* next schedule entry */

	.byte	102,15,56,0,197			/* pshufb %xmm5,%xmm0 */
	movdqa	0(%r10),%xmm4			/* .Lk_dsbd */
	.byte	102,15,56,0,226			/* pshufb %xmm2,%xmm4 */
	pxor	%xmm0,%xmm4
	movdqa	16(%r10),%xmm0			/* .Lk_dsbd+16 */
	.byte	102,15,56,0,195			/* pshufb %xmm3,%xmm0 */
	pxor	%xmm4,%xmm0
	subq	$1,%rax				/* ZF consumed by jnz at the end of .Ldec_entry */

	.byte	102,15,56,0,197			/* pshufb %xmm5,%xmm0 */
	movdqa	32(%r10),%xmm4			/* .Lk_dsbb */
	.byte	102,15,56,0,226			/* pshufb %xmm2,%xmm4 */
	pxor	%xmm0,%xmm4
	movdqa	48(%r10),%xmm0			/* .Lk_dsbb+16 */
	.byte	102,15,56,0,195			/* pshufb %xmm3,%xmm0 */
	pxor	%xmm4,%xmm0

	.byte	102,15,56,0,197			/* pshufb %xmm5,%xmm0 */
	movdqa	64(%r10),%xmm4			/* .Lk_dsbe */
	.byte	102,15,56,0,226			/* pshufb %xmm2,%xmm4 */
	pxor	%xmm0,%xmm4
	movdqa	80(%r10),%xmm0			/* .Lk_dsbe+16 */
	.byte	102,15,56,0,195			/* pshufb %xmm3,%xmm0 */
	pxor	%xmm4,%xmm0

	.byte	102,15,58,15,237,12		/* palignr $12,%xmm5,%xmm5: rotate the permutation in xmm5 */

.Ldec_entry:
	/*
	 * Split xmm0 into nibbles and derive the index vectors xmm2/xmm3
	 * through the .Lk_inv tables (xmm10 = .Lk_inv, xmm11 = .Lk_inv+16).
	 * Only SSE instructions follow, so the flags survive until the jnz.
	 */
	movdqa	%xmm9,%xmm1
	pandn	%xmm0,%xmm1
	psrld	$4,%xmm1			/* xmm1 = high nibbles */
	pand	%xmm9,%xmm0			/* xmm0 = low nibbles */
	movdqa	%xmm11,%xmm2
	.byte	102,15,56,0,208			/* pshufb %xmm0,%xmm2 */
	pxor	%xmm1,%xmm0
	movdqa	%xmm10,%xmm3
	.byte	102,15,56,0,217			/* pshufb %xmm1,%xmm3 */
	pxor	%xmm2,%xmm3
	movdqa	%xmm10,%xmm4
	.byte	102,15,56,0,224			/* pshufb %xmm0,%xmm4 */
	pxor	%xmm2,%xmm4
	movdqa	%xmm10,%xmm2
	.byte	102,15,56,0,211			/* pshufb %xmm3,%xmm2 */
	pxor	%xmm0,%xmm2
	movdqa	%xmm10,%xmm3
	.byte	102,15,56,0,220			/* pshufb %xmm4,%xmm3 */
	pxor	%xmm1,%xmm3
	movdqu	(%r9),%xmm0			/* xmm0 = schedule entry for the next step */
	jnz	.Ldec_loop			/* flags from subq above (or addq on first entry) */

	/* Final step: .Lk_dsbo tables, then the .Lk_sr permutation picked by r11. */
	movdqa	96(%r10),%xmm4			/* .Lk_dsbo */
	.byte	102,15,56,0,226			/* pshufb %xmm2,%xmm4 */
	pxor	%xmm0,%xmm4			/* mix in the last schedule entry */
	movdqa	112(%r10),%xmm0			/* .Lk_dsbo+16 */
	movdqa	-352(%r11),%xmm2		/* .Lk_sr + offset (.Lk_sr lies 352 bytes below .Lk_dsbd) */
	.byte	102,15,56,0,195			/* pshufb %xmm3,%xmm0 */
	pxor	%xmm4,%xmm0
	.byte	102,15,56,0,194			/* pshufb %xmm2,%xmm0 */
	retq
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
/*
 * _vpaes_schedule_core: expand a user key into a key schedule.
 *
 * In:   %rdi  user key bytes
 *       %esi  key length in bits (compared against 192 to pick the path)
 *       %rdx  where the first schedule entry is written
 *       %rcx  zero for an encryption schedule, non-zero for a decryption one
 *       %r8   byte offset (multiple of 16, 0..48) into .Lk_sr
 * Out:  schedule entries stored through %rdx; %xmm0-%xmm7 are zeroed
 *       before returning.
 * Clobbers: %rsi, %rdx, %r8, %r10, %r11, %xmm0-%xmm8, flags, plus the
 *       constant registers written by _vpaes_preheat.
 *
 * Register roles across the helpers called from here:
 *       %xmm7  previous schedule entry (updated by _vpaes_schedule_round)
 *       %xmm6  extra key material for the 192/256-bit paths
 *       %xmm8  rotating constant initialised from .Lk_rcon
 *       %r10   base of .Lk_sr
 */
.def _vpaes_schedule_core; .scl 3; .type 32; .endef
.p2align 4
_vpaes_schedule_core:
	call	_vpaes_preheat			/* load table constants into xmm9-xmm15 */
	movdqa	.Lk_rcon(%rip),%xmm8
	movdqu	(%rdi),%xmm0			/* first 16 key bytes */

	/* Transform the key through .Lk_ipt; xmm3 keeps the raw copy. */
	movdqa	%xmm0,%xmm3
	leaq	.Lk_ipt(%rip),%r11
	call	_vpaes_schedule_transform
	movdqa	%xmm0,%xmm7

	leaq	.Lk_sr(%rip),%r10
	testq	%rcx,%rcx
	jnz	.Lschedule_am_decrypting

	/* Encrypting: store the transformed key as the first entry. */
	movdqu	%xmm0,(%rdx)
	jmp	.Lschedule_go

.Lschedule_am_decrypting:
	/* Decrypting: store the raw key permuted by .Lk_sr + r8. */
	movdqa	(%r8,%r10,1),%xmm1
	.byte	102,15,56,0,217			/* pshufb %xmm1,%xmm3 */
	movdqu	%xmm3,(%rdx)
	xorq	$48,%r8

.Lschedule_go:
	cmpl	$192,%esi
	ja	.Lschedule_256			/* more than 192 bits */
	je	.Lschedule_192			/* exactly 192 bits */
						/* otherwise fall through to the 128-bit path */

.Lschedule_128:
	/* 10 rounds; every round except the last is stored via _vpaes_schedule_mangle. */
	movl	$10,%esi

.Loop_schedule_128:
	call	_vpaes_schedule_round
	decq	%rsi
	jz	.Lschedule_mangle_last
	call	_vpaes_schedule_mangle
	jmp	.Loop_schedule_128

.p2align 4
.Lschedule_192:
	/*
	 * 192-bit key: key bytes 8..23 are transformed and kept in xmm6 with
	 * the low 64 bits cleared.  Each of the 4 iterations stores three
	 * entries (the last iteration hands its third to .Lschedule_mangle_last).
	 */
	movdqu	8(%rdi),%xmm0
	call	_vpaes_schedule_transform
	movdqa	%xmm0,%xmm6
	pxor	%xmm4,%xmm4
	movhlps	%xmm4,%xmm6			/* clear the low 64 bits of xmm6 */
	movl	$4,%esi

.Loop_schedule_192:
	call	_vpaes_schedule_round
	.byte	102,15,58,15,198,8		/* palignr $8,%xmm6,%xmm0 */
	call	_vpaes_schedule_mangle
	call	_vpaes_schedule_192_smear
	call	_vpaes_schedule_mangle
	call	_vpaes_schedule_round
	decq	%rsi
	jz	.Lschedule_mangle_last
	call	_vpaes_schedule_mangle
	call	_vpaes_schedule_192_smear
	jmp	.Loop_schedule_192

.p2align 4
.Lschedule_256:
	/*
	 * 256-bit key: key bytes 16..31 are transformed into xmm0.  Each of
	 * the 7 iterations alternates a full round with a low round that
	 * runs on the other key half (swapped in through xmm6/xmm7).
	 */
	movdqu	16(%rdi),%xmm0
	call	_vpaes_schedule_transform
	movl	$7,%esi

.Loop_schedule_256:
	call	_vpaes_schedule_mangle
	movdqa	%xmm0,%xmm6			/* remember this entry for the low round */

	call	_vpaes_schedule_round
	decq	%rsi
	jz	.Lschedule_mangle_last
	call	_vpaes_schedule_mangle

	pshufd	$255,%xmm0,%xmm0		/* broadcast dword 3 of xmm0 */
	movdqa	%xmm7,%xmm5			/* park xmm7 while the low round uses xmm6 as xmm7 */
	movdqa	%xmm6,%xmm7
	call	_vpaes_schedule_low_round
	movdqa	%xmm5,%xmm7			/* restore xmm7 */

	jmp	.Loop_schedule_256

.p2align 4
.Lschedule_mangle_last:
	/*
	 * Store the final entry.  Decrypting uses the .Lk_deskew transform
	 * and steps rdx back by 16.  Encrypting permutes by .Lk_sr + r8,
	 * uses the .Lk_opt transform and steps rdx forward by 16 (+32-16).
	 */
	leaq	.Lk_deskew(%rip),%r11
	testq	%rcx,%rcx
	jnz	.Lschedule_mangle_last_dec

	movdqa	(%r8,%r10,1),%xmm1
	.byte	102,15,56,0,193			/* pshufb %xmm1,%xmm0 */
	leaq	.Lk_opt(%rip),%r11
	addq	$32,%rdx

.Lschedule_mangle_last_dec:
	addq	$-16,%rdx
	pxor	.Lk_s63(%rip),%xmm0
	call	_vpaes_schedule_transform
	movdqu	%xmm0,(%rdx)

	/* Wipe the registers that held key material. */
	pxor	%xmm0,%xmm0
	pxor	%xmm1,%xmm1
	pxor	%xmm2,%xmm2
	pxor	%xmm3,%xmm3
	pxor	%xmm4,%xmm4
	pxor	%xmm5,%xmm5
	pxor	%xmm6,%xmm6
	pxor	%xmm7,%xmm7
	retq
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
/*
 * _vpaes_schedule_192_smear: fold xmm6 and xmm7 together for the 192-bit
 * key schedule.
 *
 * In:   %xmm6, %xmm7
 * Out:  %xmm0 = xmm6 ^ shuffle(xmm6) ^ shuffle(xmm7) (full 128 bits)
 *       %xmm6 = the same value with its low 64 bits cleared
 * Clobbers: %xmm1 (zeroed).
 *
 * Dword notation below lists lanes from lowest (0) to highest (3).
 */
.def _vpaes_schedule_192_smear; .scl 3; .type 32; .endef
.p2align 4
_vpaes_schedule_192_smear:
	pshufd	$128,%xmm6,%xmm0		/* xmm0 = { x6[0], x6[0], x6[0], x6[2] } */
	pxor	%xmm0,%xmm6
	pshufd	$254,%xmm7,%xmm0		/* xmm0 = { x7[2], x7[3], x7[3], x7[3] } */
	pxor	%xmm0,%xmm6
	movdqa	%xmm6,%xmm0			/* return the full value in xmm0 */
	pxor	%xmm1,%xmm1
	movhlps	%xmm1,%xmm6			/* clear the low 64 bits of xmm6 */
	retq
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
/*
 * _vpaes_schedule_round: one round of the key schedule.
 * _vpaes_schedule_low_round: second entry point that skips the round
 * constant and the rotation of xmm0 (called directly on the 256-bit path).
 *
 * In:   %xmm0         input to the substitution step
 *       %xmm7         previous schedule entry
 *       %xmm8         rotating round constant (full round only)
 *       %xmm9-%xmm13  constants as loaded by _vpaes_preheat
 * Out:  %xmm0 = %xmm7 = new schedule entry
 *       %xmm8 rotated by one byte (full round only)
 * Clobbers: %xmm1-%xmm4.
 *
 * SSSE3 instructions are emitted as raw .byte sequences; the instruction
 * each one encodes is given next to it.
 */
.def _vpaes_schedule_round; .scl 3; .type 32; .endef
.p2align 4
_vpaes_schedule_round:
	/* Take byte 15 of xmm8 as this round's constant and rotate xmm8. */
	pxor	%xmm1,%xmm1
	.byte	102,65,15,58,15,200,15		/* palignr $15,%xmm8,%xmm1: xmm1 byte 0 = xmm8 byte 15, rest zero */
	.byte	102,69,15,58,15,192,15		/* palignr $15,%xmm8,%xmm8: old byte 15 moves to byte 0 */
	pxor	%xmm1,%xmm7

	/* Broadcast dword 3 of xmm0 and rotate it by one byte. */
	pshufd	$255,%xmm0,%xmm0
	.byte	102,15,58,15,192,1		/* palignr $1,%xmm0,%xmm0: old byte 0 moves to byte 15 */

	/* Fall through into the low round. */

_vpaes_schedule_low_round:
	/* Smear xmm7: xmm7 ^= xmm7 << 32; xmm7 ^= xmm7 << 64; then add .Lk_s63. */
	movdqa	%xmm7,%xmm1
	pslldq	$4,%xmm7
	pxor	%xmm1,%xmm7
	movdqa	%xmm7,%xmm1
	pslldq	$8,%xmm7
	pxor	%xmm1,%xmm7
	pxor	.Lk_s63(%rip),%xmm7

	/*
	 * Substitute the bytes of xmm0: split into nibbles, look up through
	 * .Lk_inv (xmm10/xmm11), then through .Lk_sb1 (xmm13/xmm12).
	 */
	movdqa	%xmm9,%xmm1
	pandn	%xmm0,%xmm1
	psrld	$4,%xmm1			/* xmm1 = high nibbles */
	pand	%xmm9,%xmm0			/* xmm0 = low nibbles */
	movdqa	%xmm11,%xmm2
	.byte	102,15,56,0,208			/* pshufb %xmm0,%xmm2 */
	pxor	%xmm1,%xmm0
	movdqa	%xmm10,%xmm3
	.byte	102,15,56,0,217			/* pshufb %xmm1,%xmm3 */
	pxor	%xmm2,%xmm3
	movdqa	%xmm10,%xmm4
	.byte	102,15,56,0,224			/* pshufb %xmm0,%xmm4 */
	pxor	%xmm2,%xmm4
	movdqa	%xmm10,%xmm2
	.byte	102,15,56,0,211			/* pshufb %xmm3,%xmm2 */
	pxor	%xmm0,%xmm2
	movdqa	%xmm10,%xmm3
	.byte	102,15,56,0,220			/* pshufb %xmm4,%xmm3 */
	pxor	%xmm1,%xmm3
	movdqa	%xmm13,%xmm4			/* .Lk_sb1 */
	.byte	102,15,56,0,226			/* pshufb %xmm2,%xmm4 */
	movdqa	%xmm12,%xmm0			/* .Lk_sb1+16 */
	.byte	102,15,56,0,195			/* pshufb %xmm3,%xmm0 */
	pxor	%xmm4,%xmm0

	/* Combine with the smeared previous entry; the result is the new xmm7. */
	pxor	%xmm7,%xmm0
	movdqa	%xmm0,%xmm7
	retq
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
/*
 * _vpaes_schedule_transform: byte-wise table transform of xmm0.
 *
 * In:   %xmm0  value to transform
 *       %r11   pointer to a 32-byte table pair: (r11) is indexed by the
 *              low nibble of each byte, 16(r11) by the high nibble
 *       %xmm9  nibble mask as loaded by _vpaes_preheat
 * Out:  %xmm0 = table_lo[low nibbles] ^ table_hi[high nibbles]
 * Clobbers: %xmm1, %xmm2.
 */
.def _vpaes_schedule_transform; .scl 3; .type 32; .endef
.p2align 4
_vpaes_schedule_transform:
	movdqa	%xmm9,%xmm1
	pandn	%xmm0,%xmm1
	psrld	$4,%xmm1			/* xmm1 = high nibbles */
	pand	%xmm9,%xmm0			/* xmm0 = low nibbles */
	movdqa	(%r11),%xmm2
	.byte	102,15,56,0,208			/* pshufb %xmm0,%xmm2 */
	movdqa	16(%r11),%xmm0
	.byte	102,15,56,0,193			/* pshufb %xmm1,%xmm0 */
	pxor	%xmm2,%xmm0
	retq
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
/*
 * _vpaes_schedule_mangle: convert the schedule entry in xmm0 to its stored
 * form and write it out.
 *
 * In:   %xmm0  schedule entry (left unchanged)
 *       %rcx   zero for encryption, non-zero for decryption
 *       %rdx   address of the previously written entry
 *       %r8    byte offset into .Lk_sr
 *       %r10   base of .Lk_sr
 *       %xmm9  nibble mask as loaded by _vpaes_preheat (decryption path)
 * Out:  %rdx advanced by +16 (encryption) or -16 (decryption), with the
 *       entry stored at the new address
 *       %r8 = (%r8 - 16) & 48
 * Clobbers: %xmm1-%xmm5, %r11 (decryption path), flags.
 */
.def _vpaes_schedule_mangle; .scl 3; .type 32; .endef
.p2align 4
_vpaes_schedule_mangle:
	movdqa	%xmm0,%xmm4			/* work on a copy so xmm0 survives */
	movdqa	.Lk_mc_forward(%rip),%xmm5
	testq	%rcx,%rcx
	jnz	.Lschedule_mangle_dec

	/* Encryption: xor with .Lk_s63, then xor together three successive
	   applications of the .Lk_mc_forward permutation. */
	addq	$16,%rdx
	pxor	.Lk_s63(%rip),%xmm4
	.byte	102,15,56,0,229			/* pshufb %xmm5,%xmm4 */
	movdqa	%xmm4,%xmm3
	.byte	102,15,56,0,229			/* pshufb %xmm5,%xmm4 */
	pxor	%xmm4,%xmm3
	.byte	102,15,56,0,229			/* pshufb %xmm5,%xmm4 */
	pxor	%xmm4,%xmm3

	jmp	.Lschedule_mangle_both
.p2align 4
.Lschedule_mangle_dec:
	/* Decryption: accumulate lookups through the four table pairs
	   .Lk_dksd, .Lk_dksb, .Lk_dkse and .Lk_dks9 (32 bytes apart), applying
	   the xmm5 permutation between pairs. */
	leaq	.Lk_dksd(%rip),%r11
	movdqa	%xmm9,%xmm1
	pandn	%xmm4,%xmm1
	psrld	$4,%xmm1			/* xmm1 = high nibbles */
	pand	%xmm9,%xmm4			/* xmm4 = low nibbles */

	movdqa	0(%r11),%xmm2			/* .Lk_dksd */
	.byte	102,15,56,0,212			/* pshufb %xmm4,%xmm2 */
	movdqa	16(%r11),%xmm3
	.byte	102,15,56,0,217			/* pshufb %xmm1,%xmm3 */
	pxor	%xmm2,%xmm3
	.byte	102,15,56,0,221			/* pshufb %xmm5,%xmm3 */

	movdqa	32(%r11),%xmm2			/* .Lk_dksb */
	.byte	102,15,56,0,212			/* pshufb %xmm4,%xmm2 */
	pxor	%xmm3,%xmm2
	movdqa	48(%r11),%xmm3
	.byte	102,15,56,0,217			/* pshufb %xmm1,%xmm3 */
	pxor	%xmm2,%xmm3
	.byte	102,15,56,0,221			/* pshufb %xmm5,%xmm3 */

	movdqa	64(%r11),%xmm2			/* .Lk_dkse */
	.byte	102,15,56,0,212			/* pshufb %xmm4,%xmm2 */
	pxor	%xmm3,%xmm2
	movdqa	80(%r11),%xmm3
	.byte	102,15,56,0,217			/* pshufb %xmm1,%xmm3 */
	pxor	%xmm2,%xmm3
	.byte	102,15,56,0,221			/* pshufb %xmm5,%xmm3 */

	movdqa	96(%r11),%xmm2			/* .Lk_dks9 */
	.byte	102,15,56,0,212			/* pshufb %xmm4,%xmm2 */
	pxor	%xmm3,%xmm2
	movdqa	112(%r11),%xmm3
	.byte	102,15,56,0,217			/* pshufb %xmm1,%xmm3 */
	pxor	%xmm2,%xmm3

	addq	$-16,%rdx

.Lschedule_mangle_both:
	/* Permute by .Lk_sr + r8, step r8 to the previous 16-byte slot, store. */
	movdqa	(%r8,%r10,1),%xmm1
	.byte	102,15,56,0,217			/* pshufb %xmm1,%xmm3 */
	addq	$-16,%r8
	andq	$48,%r8
	movdqu	%xmm3,(%rdx)
	retq
|
|
|
|
|
|
|
|
|
|
|
|
/*
 * vpaes_set_encrypt_key: build an encryption key schedule (Win64 entry).
 *
 * In:   %rcx  user key bytes
 *       %edx  key length in bits
 *       %r8   key structure to fill; (bits >> 5) + 5 is stored at offset
 *             240 and the schedule entries start at offset 0
 * Out:  %eax = 0
 *
 * The arguments are moved into %rdi/%rsi/%rdx for the internal helpers.
 * %rdi, %rsi and %xmm6-%xmm15 are callee-saved in the Microsoft x64 ABI,
 * so they are saved and restored here.
 */
.globl vpaes_set_encrypt_key
.def vpaes_set_encrypt_key; .scl 2; .type 32; .endef
.p2align 4
vpaes_set_encrypt_key:
	movq	%rdi,8(%rsp)			/* spill rdi/rsi above the return address */
	movq	%rsi,16(%rsp)
	movq	%rsp,%rax			/* se_handler reads the spills through context->Rax when Rip is before the body label */
.LSEH_begin_vpaes_set_encrypt_key:
	movq	%rcx,%rdi			/* rdi = user key */
	movq	%rdx,%rsi			/* rsi = bits */
	movq	%r8,%rdx			/* rdx = key structure */

	leaq	-184(%rsp),%rsp			/* frame; xmm6-xmm15 saved at 16..175 */
	movaps	%xmm6,16(%rsp)
	movaps	%xmm7,32(%rsp)
	movaps	%xmm8,48(%rsp)
	movaps	%xmm9,64(%rsp)
	movaps	%xmm10,80(%rsp)
	movaps	%xmm11,96(%rsp)
	movaps	%xmm12,112(%rsp)
	movaps	%xmm13,128(%rsp)
	movaps	%xmm14,144(%rsp)
	movaps	%xmm15,160(%rsp)
.Lenc_key_body:
	movl	%esi,%eax
	shrl	$5,%eax
	addl	$5,%eax
	movl	%eax,240(%rdx)			/* loop count = bits/32 + 5 (128 -> 9, 192 -> 11, 256 -> 13) */

	movl	$0,%ecx				/* rcx = 0: encryption schedule */
	movl	$48,%r8d			/* initial .Lk_sr offset */
	call	_vpaes_schedule_core
	movaps	16(%rsp),%xmm6
	movaps	32(%rsp),%xmm7
	movaps	48(%rsp),%xmm8
	movaps	64(%rsp),%xmm9
	movaps	80(%rsp),%xmm10
	movaps	96(%rsp),%xmm11
	movaps	112(%rsp),%xmm12
	movaps	128(%rsp),%xmm13
	movaps	144(%rsp),%xmm14
	movaps	160(%rsp),%xmm15
	leaq	184(%rsp),%rsp
.Lenc_key_epilogue:
	xorl	%eax,%eax			/* return 0 */
	movq	8(%rsp),%rdi
	movq	16(%rsp),%rsi
	retq
.LSEH_end_vpaes_set_encrypt_key:
|
|
|
|
/*
 * vpaes_set_decrypt_key: build a decryption key schedule (Win64 entry).
 *
 * In:   %rcx  user key bytes
 *       %edx  key length in bits
 *       %r8   key structure to fill; (bits >> 5) + 5 is stored at offset
 *             240
 * Out:  %eax = 0
 *
 * The schedule is written from the far end backwards: %rdx is advanced to
 * key + 16 + 16 * count before _vpaes_schedule_core runs, and the
 * decryption paths of the schedule helpers step it down by 16 per entry.
 * %rdi, %rsi and %xmm6-%xmm15 are callee-saved in the Microsoft x64 ABI,
 * so they are saved and restored here.
 */
.globl vpaes_set_decrypt_key
.def vpaes_set_decrypt_key; .scl 2; .type 32; .endef
.p2align 4
vpaes_set_decrypt_key:
	movq	%rdi,8(%rsp)			/* spill rdi/rsi above the return address */
	movq	%rsi,16(%rsp)
	movq	%rsp,%rax			/* se_handler reads the spills through context->Rax when Rip is before the body label */
.LSEH_begin_vpaes_set_decrypt_key:
	movq	%rcx,%rdi			/* rdi = user key */
	movq	%rdx,%rsi			/* rsi = bits */
	movq	%r8,%rdx			/* rdx = key structure */

	leaq	-184(%rsp),%rsp			/* frame; xmm6-xmm15 saved at 16..175 */
	movaps	%xmm6,16(%rsp)
	movaps	%xmm7,32(%rsp)
	movaps	%xmm8,48(%rsp)
	movaps	%xmm9,64(%rsp)
	movaps	%xmm10,80(%rsp)
	movaps	%xmm11,96(%rsp)
	movaps	%xmm12,112(%rsp)
	movaps	%xmm13,128(%rsp)
	movaps	%xmm14,144(%rsp)
	movaps	%xmm15,160(%rsp)
.Ldec_key_body:
	movl	%esi,%eax
	shrl	$5,%eax
	addl	$5,%eax
	movl	%eax,240(%rdx)			/* loop count = bits/32 + 5 */
	shll	$4,%eax
	leaq	16(%rdx,%rax,1),%rdx		/* rdx = key + 16 + 16 * count */

	movl	$1,%ecx				/* rcx != 0: decryption schedule */
	movl	%esi,%r8d
	shrl	$1,%r8d
	andl	$32,%r8d
	xorl	$32,%r8d			/* .Lk_sr offset: 32 for 128/256 bits, 0 for 192 bits */
	call	_vpaes_schedule_core
	movaps	16(%rsp),%xmm6
	movaps	32(%rsp),%xmm7
	movaps	48(%rsp),%xmm8
	movaps	64(%rsp),%xmm9
	movaps	80(%rsp),%xmm10
	movaps	96(%rsp),%xmm11
	movaps	112(%rsp),%xmm12
	movaps	128(%rsp),%xmm13
	movaps	144(%rsp),%xmm14
	movaps	160(%rsp),%xmm15
	leaq	184(%rsp),%rsp
.Ldec_key_epilogue:
	xorl	%eax,%eax			/* return 0 */
	movq	8(%rsp),%rdi
	movq	16(%rsp),%rsi
	retq
.LSEH_end_vpaes_set_decrypt_key:
|
|
|
|
/*
 * vpaes_encrypt: encrypt one 16-byte block (Win64 entry).
 *
 * In:   %rcx  input block (16 bytes, may be unaligned)
 *       %rdx  output block (16 bytes, may be unaligned)
 *       %r8   key schedule as consumed by _vpaes_encrypt_core
 * Out:  result stored through the output pointer; %rax is not set to a
 *       meaningful return value.
 *
 * %rdi, %rsi and %xmm6-%xmm15 are callee-saved in the Microsoft x64 ABI,
 * so they are saved and restored here.
 */
.globl vpaes_encrypt
.def vpaes_encrypt; .scl 2; .type 32; .endef
.p2align 4
vpaes_encrypt:
	movq	%rdi,8(%rsp)			/* spill rdi/rsi above the return address */
	movq	%rsi,16(%rsp)
	movq	%rsp,%rax			/* se_handler reads the spills through context->Rax when Rip is before the body label */
.LSEH_begin_vpaes_encrypt:
	movq	%rcx,%rdi			/* rdi = input */
	movq	%rdx,%rsi			/* rsi = output */
	movq	%r8,%rdx			/* rdx = key schedule */

	leaq	-184(%rsp),%rsp			/* frame; xmm6-xmm15 saved at 16..175 */
	movaps	%xmm6,16(%rsp)
	movaps	%xmm7,32(%rsp)
	movaps	%xmm8,48(%rsp)
	movaps	%xmm9,64(%rsp)
	movaps	%xmm10,80(%rsp)
	movaps	%xmm11,96(%rsp)
	movaps	%xmm12,112(%rsp)
	movaps	%xmm13,128(%rsp)
	movaps	%xmm14,144(%rsp)
	movaps	%xmm15,160(%rsp)
.Lenc_body:
	movdqu	(%rdi),%xmm0			/* load the input block */
	call	_vpaes_preheat			/* load table constants into xmm9-xmm15 */
	call	_vpaes_encrypt_core
	movdqu	%xmm0,(%rsi)			/* store the result */
	movaps	16(%rsp),%xmm6
	movaps	32(%rsp),%xmm7
	movaps	48(%rsp),%xmm8
	movaps	64(%rsp),%xmm9
	movaps	80(%rsp),%xmm10
	movaps	96(%rsp),%xmm11
	movaps	112(%rsp),%xmm12
	movaps	128(%rsp),%xmm13
	movaps	144(%rsp),%xmm14
	movaps	160(%rsp),%xmm15
	leaq	184(%rsp),%rsp
.Lenc_epilogue:
	movq	8(%rsp),%rdi
	movq	16(%rsp),%rsi
	retq
.LSEH_end_vpaes_encrypt:
|
|
|
|
/*
 * vpaes_decrypt: decrypt one 16-byte block (Win64 entry).
 *
 * In:   %rcx  input block (16 bytes, may be unaligned)
 *       %rdx  output block (16 bytes, may be unaligned)
 *       %r8   key schedule as consumed by _vpaes_decrypt_core
 * Out:  result stored through the output pointer; %rax is not set to a
 *       meaningful return value.
 *
 * %rdi, %rsi and %xmm6-%xmm15 are callee-saved in the Microsoft x64 ABI,
 * so they are saved and restored here.
 */
.globl vpaes_decrypt
.def vpaes_decrypt; .scl 2; .type 32; .endef
.p2align 4
vpaes_decrypt:
	movq	%rdi,8(%rsp)			/* spill rdi/rsi above the return address */
	movq	%rsi,16(%rsp)
	movq	%rsp,%rax			/* se_handler reads the spills through context->Rax when Rip is before the body label */
.LSEH_begin_vpaes_decrypt:
	movq	%rcx,%rdi			/* rdi = input */
	movq	%rdx,%rsi			/* rsi = output */
	movq	%r8,%rdx			/* rdx = key schedule */

	leaq	-184(%rsp),%rsp			/* frame; xmm6-xmm15 saved at 16..175 */
	movaps	%xmm6,16(%rsp)
	movaps	%xmm7,32(%rsp)
	movaps	%xmm8,48(%rsp)
	movaps	%xmm9,64(%rsp)
	movaps	%xmm10,80(%rsp)
	movaps	%xmm11,96(%rsp)
	movaps	%xmm12,112(%rsp)
	movaps	%xmm13,128(%rsp)
	movaps	%xmm14,144(%rsp)
	movaps	%xmm15,160(%rsp)
.Ldec_body:
	movdqu	(%rdi),%xmm0			/* load the input block */
	call	_vpaes_preheat			/* load table constants into xmm9-xmm15 */
	call	_vpaes_decrypt_core
	movdqu	%xmm0,(%rsi)			/* store the result */
	movaps	16(%rsp),%xmm6
	movaps	32(%rsp),%xmm7
	movaps	48(%rsp),%xmm8
	movaps	64(%rsp),%xmm9
	movaps	80(%rsp),%xmm10
	movaps	96(%rsp),%xmm11
	movaps	112(%rsp),%xmm12
	movaps	128(%rsp),%xmm13
	movaps	144(%rsp),%xmm14
	movaps	160(%rsp),%xmm15
	leaq	184(%rsp),%rsp
.Ldec_epilogue:
	movq	8(%rsp),%rdi
	movq	16(%rsp),%rsi
	retq
.LSEH_end_vpaes_decrypt:
|
|
/*
 * vpaes_cbc_encrypt: CBC-mode encryption or decryption (Win64 entry).
 *
 * In:   %rcx       input buffer
 *       %rdx       output buffer
 *       %r8        length in bytes
 *       %r9        key schedule
 *       40(%rsp)   pointer to the 16-byte chaining value (IV), updated on
 *                  return
 *       48(%rsp)   direction: zero selects decryption, non-zero encryption
 *                  (only the low 32 bits are tested)
 *
 * Whole 16-byte blocks are processed; any trailing partial block is
 * ignored.  If the length is below 16 the function returns at once
 * without touching the buffers or the IV.
 * %rdi, %rsi and %xmm6-%xmm15 are callee-saved in the Microsoft x64 ABI,
 * so they are saved and restored here.
 */
.globl vpaes_cbc_encrypt
.def vpaes_cbc_encrypt; .scl 2; .type 32; .endef
.p2align 4
vpaes_cbc_encrypt:
	movq	%rdi,8(%rsp)			/* spill rdi/rsi above the return address */
	movq	%rsi,16(%rsp)
	movq	%rsp,%rax			/* se_handler reads the spills through context->Rax when Rip is before the body label */
.LSEH_begin_vpaes_cbc_encrypt:
	movq	%rcx,%rdi			/* rdi = input */
	movq	%rdx,%rsi			/* rsi = output */
	movq	%r8,%rdx			/* rdx = length (swapped with the key below) */
	movq	%r9,%rcx			/* rcx = key schedule */
	movq	40(%rsp),%r8			/* r8 = IV pointer (5th argument) */
	movq	48(%rsp),%r9			/* r9 = direction flag (6th argument) */

	xchgq	%rcx,%rdx			/* rcx = length, rdx = key schedule */
	subq	$16,%rcx			/* rcx = bytes left after the current block */
	jc	.Lcbc_abort			/* fewer than 16 bytes: nothing to do */
	leaq	-184(%rsp),%rsp			/* frame; xmm6-xmm15 saved at 16..175 */
	movaps	%xmm6,16(%rsp)
	movaps	%xmm7,32(%rsp)
	movaps	%xmm8,48(%rsp)
	movaps	%xmm9,64(%rsp)
	movaps	%xmm10,80(%rsp)
	movaps	%xmm11,96(%rsp)
	movaps	%xmm12,112(%rsp)
	movaps	%xmm13,128(%rsp)
	movaps	%xmm14,144(%rsp)
	movaps	%xmm15,160(%rsp)
.Lcbc_body:
	movdqu	(%r8),%xmm6			/* xmm6 = chaining value */
	subq	%rdi,%rsi			/* rsi = output - input, so (%rsi,%rdi) addresses the output */
	call	_vpaes_preheat			/* load table constants into xmm9-xmm15 */
	cmpl	$0,%r9d
	je	.Lcbc_dec_loop
	jmp	.Lcbc_enc_loop
.p2align 4
.Lcbc_enc_loop:
	movdqu	(%rdi),%xmm0
	pxor	%xmm6,%xmm0			/* plaintext ^ previous ciphertext (or IV) */
	call	_vpaes_encrypt_core
	movdqa	%xmm0,%xmm6			/* ciphertext becomes the next chaining value */
	movdqu	%xmm0,(%rsi,%rdi,1)
	leaq	16(%rdi),%rdi
	subq	$16,%rcx
	jnc	.Lcbc_enc_loop			/* continue while a full block remains */
	jmp	.Lcbc_done
.p2align 4
.Lcbc_dec_loop:
	movdqu	(%rdi),%xmm0
	movdqa	%xmm0,%xmm7			/* keep the ciphertext for the next chaining value */
	call	_vpaes_decrypt_core
	pxor	%xmm6,%xmm0			/* decrypted block ^ previous ciphertext (or IV) */
	movdqa	%xmm7,%xmm6
	movdqu	%xmm0,(%rsi,%rdi,1)
	leaq	16(%rdi),%rdi
	subq	$16,%rcx
	jnc	.Lcbc_dec_loop			/* continue while a full block remains */
.Lcbc_done:
	movdqu	%xmm6,(%r8)			/* write the final chaining value back */
	movaps	16(%rsp),%xmm6
	movaps	32(%rsp),%xmm7
	movaps	48(%rsp),%xmm8
	movaps	64(%rsp),%xmm9
	movaps	80(%rsp),%xmm10
	movaps	96(%rsp),%xmm11
	movaps	112(%rsp),%xmm12
	movaps	128(%rsp),%xmm13
	movaps	144(%rsp),%xmm14
	movaps	160(%rsp),%xmm15
	leaq	184(%rsp),%rsp
.Lcbc_epilogue:
.Lcbc_abort:
	movq	8(%rsp),%rdi
	movq	16(%rsp),%rsi
	retq
.LSEH_end_vpaes_cbc_encrypt:
|
|
|
|
|
|
|
|
|
|
|
|
|
|
/*
 * _vpaes_preheat: load the table constants shared by the cores and the key
 * schedule into %xmm9-%xmm15.
 *
 * Out:  %xmm9  = .Lk_s0F      %xmm10 = .Lk_inv      %xmm11 = .Lk_inv+16
 *       %xmm13 = .Lk_sb1      %xmm12 = .Lk_sb1+16
 *       %xmm15 = .Lk_sb2      %xmm14 = .Lk_sb2+16
 * Clobbers: %r10.
 *
 * All tables are addressed relative to .Lk_s0F, so the offsets depend on
 * the table order inside _vpaes_consts.
 */
.def _vpaes_preheat; .scl 3; .type 32; .endef
.p2align 4
_vpaes_preheat:
	leaq	.Lk_s0F(%rip),%r10
	movdqa	-32(%r10),%xmm10		/* .Lk_inv */
	movdqa	-16(%r10),%xmm11		/* .Lk_inv+16 */
	movdqa	0(%r10),%xmm9			/* .Lk_s0F */
	movdqa	48(%r10),%xmm13			/* .Lk_sb1 */
	movdqa	64(%r10),%xmm12			/* .Lk_sb1+16 */
	movdqa	80(%r10),%xmm15			/* .Lk_sb2 */
	movdqa	96(%r10),%xmm14			/* .Lk_sb2+16 */
	retq
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
/*
 * _vpaes_consts: lookup and permutation tables.
 *
 * The block is 64-byte aligned and every table is a multiple of 16 bytes,
 * so each 16-byte row can be loaded with movdqa.  Several routines reach
 * tables through fixed offsets from a neighbouring label (for example
 * _vpaes_preheat from .Lk_s0F, _vpaes_encrypt_core from .Lk_mc_backward,
 * _vpaes_decrypt_core from .Lk_dsbd), so the order and size of the tables
 * must not change.
 */
.p2align 6
_vpaes_consts:
.Lk_inv:	/* used by the cores and the schedule round (xmm10/xmm11) */
	.quad	0x0E05060F0D080180, 0x040703090A0B0C02
	.quad	0x01040A060F0B0780, 0x030D0E0C02050809

.Lk_s0F:	/* low-nibble mask (xmm9) */
	.quad	0x0F0F0F0F0F0F0F0F, 0x0F0F0F0F0F0F0F0F

.Lk_ipt:	/* input transform, low-nibble and high-nibble rows */
	.quad	0xC2B2E8985A2A7000, 0xCABAE09052227808
	.quad	0x4C01307D317C4D00, 0xCD80B1FCB0FDCC81

.Lk_sb1:	/* xmm13/xmm12 */
	.quad	0xB19BE18FCB503E00, 0xA5DF7A6E142AF544
	.quad	0x3618D415FAE22300, 0x3BF7CCC10D2ED9EF
.Lk_sb2:	/* xmm15/xmm14 */
	.quad	0xE27A93C60B712400, 0x5EB7E955BC982FCD
	.quad	0x69EB88400AE12900, 0xC2A163C8AB82234A
.Lk_sbo:	/* final step of _vpaes_encrypt_core */
	.quad	0xD0D26D176FBDC700, 0x15AABF7AC502A878
	.quad	0xCFE474A55FBB6A00, 0x8E1E90D1412B35FA

.Lk_mc_forward:	/* four byte permutations, selected in 16-byte steps */
	.quad	0x0407060500030201, 0x0C0F0E0D080B0A09
	.quad	0x080B0A0904070605, 0x000302010C0F0E0D
	.quad	0x0C0F0E0D080B0A09, 0x0407060500030201
	.quad	0x000302010C0F0E0D, 0x080B0A0904070605

.Lk_mc_backward:	/* four byte permutations, selected in 16-byte steps */
	.quad	0x0605040702010003, 0x0E0D0C0F0A09080B
	.quad	0x020100030E0D0C0F, 0x0A09080B06050407
	.quad	0x0E0D0C0F0A09080B, 0x0605040702010003
	.quad	0x0A09080B06050407, 0x020100030E0D0C0F

.Lk_sr:		/* four byte permutations; the first row is the identity */
	.quad	0x0706050403020100, 0x0F0E0D0C0B0A0908
	.quad	0x030E09040F0A0500, 0x0B06010C07020D08
	.quad	0x0F060D040B020900, 0x070E050C030A0108
	.quad	0x0B0E0104070A0D00, 0x0306090C0F020508

.Lk_rcon:	/* initial value of xmm8 in _vpaes_schedule_core */
	.quad	0x1F8391B9AF9DEEB6, 0x702A98084D7C7D81

.Lk_s63:	/* constant xored in by the key schedule helpers */
	.quad	0x5B5B5B5B5B5B5B5B, 0x5B5B5B5B5B5B5B5B

.Lk_opt:	/* output transform for the last encryption schedule entry */
	.quad	0xFF9F4929D6B66000, 0xF7974121DEBE6808
	.quad	0x01EDBD5150BCEC00, 0xE10D5DB1B05C0CE0

.Lk_deskew:	/* transform for the last decryption schedule entry */
	.quad	0x07E4A34047A4E300, 0x1DFEB95A5DBEF91A
	.quad	0x5F36B5DC83EA6900, 0x2841C2ABF49D1E77

/* Decryption key schedule tables, walked in order by _vpaes_schedule_mangle. */
.Lk_dksd:
	.quad	0xFEB91A5DA3E44700, 0x0740E3A45A1DBEF9
	.quad	0x41C277F4B5368300, 0x5FDC69EAAB289D1E
.Lk_dksb:
	.quad	0x9A4FCA1F8550D500, 0x03D653861CC94C99
	.quad	0x115BEDA7B6FC4A00, 0xD993256F7E3482C8
.Lk_dkse:
	.quad	0xD5031CCA1FC9D600, 0x53859A4C994F5086
	.quad	0xA23196054FDC7BE8, 0xCD5EF96A20B31487
.Lk_dks9:
	.quad	0xB6116FC87ED9A700, 0x4AED933482255BFC
	.quad	0x4576516227143300, 0x8BB89FACE9DAFDCE

/* Decryption tables, used by _vpaes_decrypt_core. */
.Lk_dipt:	/* input transform, low-nibble and high-nibble rows */
	.quad	0x0F505B040B545F00, 0x154A411E114E451A
	.quad	0x86E383E660056500, 0x12771772F491F194

.Lk_dsb9:
	.quad	0x851C03539A86D600, 0xCAD51F504F994CC9
	.quad	0xC03B1789ECD74900, 0x725E2C9EB2FBA565
.Lk_dsbd:
	.quad	0x7D57CCDFE6B1A200, 0xF56E9B13882A4439
	.quad	0x3CE2FAF724C6CB00, 0x2931180D15DEEFD3
.Lk_dsbb:
	.quad	0xD022649296B44200, 0x602646F6B0F2D404
	.quad	0xC19498A6CD596700, 0xF3FF0C3E3255AA6B
.Lk_dsbe:
	.quad	0x46F2929626D4D000, 0x2242600464B4F6B0
	.quad	0x0C55A6CDFFAAC100, 0x9467F36B98593E32
.Lk_dsbo:	/* final step of _vpaes_decrypt_core */
	.quad	0x1387EA537EF94000, 0xC7AA6DB9D4943E2D
	.quad	0x12D7560F93441D00, 0xCA4B8159D8C58E9C

/* NUL-terminated ASCII: "Vector Permutation AES for x86_64/SSSE3, Mike Hamburg (Stanford University)" */
	.byte	86,101,99,116,111,114,32,80,101,114,109,117,116,97,116,105,111,110,32,65,69,83,32,102,111,114,32,120,56,54,95,54,52,47,83,83,83,69,51,44,32,77,105,107,101,32,72,97,109,98,117,114,103,32,40,83,116,97,110,102,111,114,100,32,85,110,105,118,101,114,115,105,116,121,41,0
.p2align 6
|
|
|
|
|
|
/*
 * se_handler: Win64 language-specific exception handler shared by all
 * public entry points in this file (referenced from .xdata).
 *
 * In (Microsoft x64 handler convention):
 *       %rcx  exception record (not read here)
 *       %rdx  establisher frame (not read here)
 *       %r8   CONTEXT record
 *       %r9   DISPATCHER_CONTEXT
 * Out:  %eax = 1
 *
 * The handler repairs the CONTEXT so that it describes the state at
 * function entry (Rsp, Rsi, Rdi and, when inside the body, Xmm6-Xmm15),
 * copies it to the dispatcher's context record and calls
 * RtlVirtualUnwind.  HandlerData holds two image-relative addresses: the
 * body label and the epilogue label of the interrupted function.
 *
 * Numeric offsets follow the Win64 CONTEXT and DISPATCHER_CONTEXT
 * layouts: CONTEXT Rax=120, Rsp=152, Rsi=168, Rdi=176, Rip=248, Xmm6=512;
 * DISPATCHER_CONTEXT ControlPc=0, ImageBase=8, FunctionEntry=16,
 * EstablisherFrame=24, ContextRecord=40, HandlerData=56.
 */
.def se_handler; .scl 3; .type 32; .endef
.p2align 4
se_handler:
	pushq	%rsi
	pushq	%rdi
	pushq	%rbx
	pushq	%rbp
	pushq	%r12
	pushq	%r13
	pushq	%r14
	pushq	%r15
	pushfq
	subq	$64,%rsp			/* shadow space plus stack arguments 5..8 */

	movq	120(%r8),%rax			/* context->Rax (entry rsp while still in the prologue) */
	movq	248(%r8),%rbx			/* context->Rip */

	movq	8(%r9),%rsi			/* disp->ImageBase */
	movq	56(%r9),%r11			/* disp->HandlerData */

	movl	0(%r11),%r10d			/* HandlerData[0]: body label (RVA) */
	leaq	(%rsi,%r10,1),%r10
	cmpq	%r10,%rbx			/* Rip before the body: frame not set up yet */
	jb	.Lin_prologue

	movq	152(%r8),%rax			/* context->Rsp */

	movl	4(%r11),%r10d			/* HandlerData[1]: epilogue label (RVA) */
	leaq	(%rsi,%r10,1),%r10
	cmpq	%r10,%rbx			/* Rip at or past the epilogue: frame already released */
	jae	.Lin_prologue

	/* Inside the body: recover xmm6-xmm15 from the frame and pop it. */
	leaq	16(%rax),%rsi			/* xmm save area in the frame */
	leaq	512(%r8),%rdi			/* &context->Xmm6 */
	movl	$20,%ecx			/* 10 registers * 16 bytes / 8 */
	.long	0xa548f3fc			/* cld; rep movsq */
	leaq	184(%rax),%rax			/* undo the 184-byte frame allocation */

.Lin_prologue:
	movq	8(%rax),%rdi			/* rdi/rsi as spilled at function entry */
	movq	16(%rax),%rsi
	movq	%rax,152(%r8)			/* context->Rsp */
	movq	%rsi,168(%r8)			/* context->Rsi */
	movq	%rdi,176(%r8)			/* context->Rdi */

	/* Copy the repaired CONTEXT into disp->ContextRecord. */
	movq	40(%r9),%rdi			/* disp->ContextRecord */
	movq	%r8,%rsi
	movl	$154,%ecx			/* 1232 bytes / 8 */
	.long	0xa548f3fc			/* cld; rep movsq */

	/* RtlVirtualUnwind(0, ImageBase, ControlPc, FunctionEntry,
	   ContextRecord, &HandlerData, &EstablisherFrame, NULL) */
	movq	%r9,%rsi
	xorq	%rcx,%rcx			/* arg1 = 0 */
	movq	8(%rsi),%rdx			/* arg2 = disp->ImageBase */
	movq	0(%rsi),%r8			/* arg3 = disp->ControlPc */
	movq	16(%rsi),%r9			/* arg4 = disp->FunctionEntry */
	movq	40(%rsi),%r10			/* disp->ContextRecord */
	leaq	56(%rsi),%r11			/* &disp->HandlerData */
	leaq	24(%rsi),%r12			/* &disp->EstablisherFrame */
	movq	%r10,32(%rsp)			/* arg5 */
	movq	%r11,40(%rsp)			/* arg6 */
	movq	%r12,48(%rsp)			/* arg7 */
	movq	%rcx,56(%rsp)			/* arg8 = NULL */
	call	*__imp_RtlVirtualUnwind(%rip)

	movl	$1,%eax				/* handler return value */
	addq	$64,%rsp
	popfq
	popq	%r15
	popq	%r14
	popq	%r13
	popq	%r12
	popq	%rbp
	popq	%rbx
	popq	%rdi
	popq	%rsi
	retq
|
|
|
|
|
|
/*
 * Win64 unwind tables.
 *
 * .pdata holds one entry per public function: begin address, end address
 * and the address of its unwind info, all image-relative (.rva).
 *
 * .xdata holds the unwind info blocks.  Each one is the 4-byte header
 * 9,0,0,0 followed by the handler address and the two labels that
 * se_handler reads as HandlerData[0] (start of body) and HandlerData[1]
 * (start of epilogue).  NOTE(review): the first header byte 9 should
 * decode as version 1 with the exception-handler flag set -- confirm
 * against the UNWIND_INFO definition.
 */
.section .pdata
.p2align 2
	.rva	.LSEH_begin_vpaes_set_encrypt_key
	.rva	.LSEH_end_vpaes_set_encrypt_key
	.rva	.LSEH_info_vpaes_set_encrypt_key

	.rva	.LSEH_begin_vpaes_set_decrypt_key
	.rva	.LSEH_end_vpaes_set_decrypt_key
	.rva	.LSEH_info_vpaes_set_decrypt_key

	.rva	.LSEH_begin_vpaes_encrypt
	.rva	.LSEH_end_vpaes_encrypt
	.rva	.LSEH_info_vpaes_encrypt

	.rva	.LSEH_begin_vpaes_decrypt
	.rva	.LSEH_end_vpaes_decrypt
	.rva	.LSEH_info_vpaes_decrypt

	.rva	.LSEH_begin_vpaes_cbc_encrypt
	.rva	.LSEH_end_vpaes_cbc_encrypt
	.rva	.LSEH_info_vpaes_cbc_encrypt

.section .xdata
.p2align 3
.LSEH_info_vpaes_set_encrypt_key:
	.byte	9,0,0,0
	.rva	se_handler
	.rva	.Lenc_key_body,.Lenc_key_epilogue
.LSEH_info_vpaes_set_decrypt_key:
	.byte	9,0,0,0
	.rva	se_handler
	.rva	.Ldec_key_body,.Ldec_key_epilogue
.LSEH_info_vpaes_encrypt:
	.byte	9,0,0,0
	.rva	se_handler
	.rva	.Lenc_body,.Lenc_epilogue
.LSEH_info_vpaes_decrypt:
	.byte	9,0,0,0
	.rva	se_handler
	.rva	.Ldec_body,.Ldec_epilogue
.LSEH_info_vpaes_cbc_encrypt:
	.byte	9,0,0,0
	.rva	se_handler
	.rva	.Lcbc_body,.Lcbc_epilogue
|