ClickHouse/contrib/boringssl-cmake/win-x86_64/crypto/fipsmodule/vpaes-x86_64.asm

Ignoring revisions in .git-blame-ignore-revs. Click here to bypass and see the normal blame view.

1473 lines
25 KiB
NASM
Raw Normal View History

2020-10-14 20:45:32 +00:00
; This file is generated from a similarly-named Perl script in the BoringSSL
; source tree. Do not edit by hand.
default rel
%define XMMWORD
%define YMMWORD
%define ZMMWORD
%ifdef BORINGSSL_PREFIX
%include "boringssl_prefix_symbols_nasm.inc"
%endif
section .text code align=64
ALIGN 16
_vpaes_encrypt_core:
mov r9,rdx
mov r11,16
mov eax,DWORD[240+rdx]
movdqa xmm1,xmm9
movdqa xmm2,XMMWORD[$L$k_ipt]
pandn xmm1,xmm0
movdqu xmm5,XMMWORD[r9]
psrld xmm1,4
pand xmm0,xmm9
DB 102,15,56,0,208
movdqa xmm0,XMMWORD[(($L$k_ipt+16))]
DB 102,15,56,0,193
pxor xmm2,xmm5
add r9,16
pxor xmm0,xmm2
lea r10,[$L$k_mc_backward]
jmp NEAR $L$enc_entry
ALIGN 16
$L$enc_loop:
movdqa xmm4,xmm13
movdqa xmm0,xmm12
DB 102,15,56,0,226
DB 102,15,56,0,195
pxor xmm4,xmm5
movdqa xmm5,xmm15
pxor xmm0,xmm4
movdqa xmm1,XMMWORD[((-64))+r10*1+r11]
DB 102,15,56,0,234
movdqa xmm4,XMMWORD[r10*1+r11]
movdqa xmm2,xmm14
DB 102,15,56,0,211
movdqa xmm3,xmm0
pxor xmm2,xmm5
DB 102,15,56,0,193
add r9,16
pxor xmm0,xmm2
DB 102,15,56,0,220
add r11,16
pxor xmm3,xmm0
DB 102,15,56,0,193
and r11,0x30
sub rax,1
pxor xmm0,xmm3
$L$enc_entry:
movdqa xmm1,xmm9
movdqa xmm5,xmm11
pandn xmm1,xmm0
psrld xmm1,4
pand xmm0,xmm9
DB 102,15,56,0,232
movdqa xmm3,xmm10
pxor xmm0,xmm1
DB 102,15,56,0,217
movdqa xmm4,xmm10
pxor xmm3,xmm5
DB 102,15,56,0,224
movdqa xmm2,xmm10
pxor xmm4,xmm5
DB 102,15,56,0,211
movdqa xmm3,xmm10
pxor xmm2,xmm0
DB 102,15,56,0,220
movdqu xmm5,XMMWORD[r9]
pxor xmm3,xmm1
jnz NEAR $L$enc_loop
movdqa xmm4,XMMWORD[((-96))+r10]
movdqa xmm0,XMMWORD[((-80))+r10]
DB 102,15,56,0,226
pxor xmm4,xmm5
DB 102,15,56,0,195
movdqa xmm1,XMMWORD[64+r10*1+r11]
pxor xmm0,xmm4
DB 102,15,56,0,193
DB 0F3h,0C3h ;repret
ALIGN 16
_vpaes_encrypt_core_2x:
mov r9,rdx
mov r11,16
mov eax,DWORD[240+rdx]
movdqa xmm1,xmm9
movdqa xmm7,xmm9
movdqa xmm2,XMMWORD[$L$k_ipt]
movdqa xmm8,xmm2
pandn xmm1,xmm0
pandn xmm7,xmm6
movdqu xmm5,XMMWORD[r9]
psrld xmm1,4
psrld xmm7,4
pand xmm0,xmm9
pand xmm6,xmm9
DB 102,15,56,0,208
DB 102,68,15,56,0,198
movdqa xmm0,XMMWORD[(($L$k_ipt+16))]
movdqa xmm6,xmm0
DB 102,15,56,0,193
DB 102,15,56,0,247
pxor xmm2,xmm5
pxor xmm8,xmm5
add r9,16
pxor xmm0,xmm2
pxor xmm6,xmm8
lea r10,[$L$k_mc_backward]
jmp NEAR $L$enc2x_entry
ALIGN 16
$L$enc2x_loop:
movdqa xmm4,XMMWORD[$L$k_sb1]
movdqa xmm0,XMMWORD[(($L$k_sb1+16))]
movdqa xmm12,xmm4
movdqa xmm6,xmm0
DB 102,15,56,0,226
DB 102,69,15,56,0,224
DB 102,15,56,0,195
DB 102,65,15,56,0,243
pxor xmm4,xmm5
pxor xmm12,xmm5
movdqa xmm5,XMMWORD[$L$k_sb2]
movdqa xmm13,xmm5
pxor xmm0,xmm4
pxor xmm6,xmm12
movdqa xmm1,XMMWORD[((-64))+r10*1+r11]
DB 102,15,56,0,234
DB 102,69,15,56,0,232
movdqa xmm4,XMMWORD[r10*1+r11]
movdqa xmm2,XMMWORD[(($L$k_sb2+16))]
movdqa xmm8,xmm2
DB 102,15,56,0,211
DB 102,69,15,56,0,195
movdqa xmm3,xmm0
movdqa xmm11,xmm6
pxor xmm2,xmm5
pxor xmm8,xmm13
DB 102,15,56,0,193
DB 102,15,56,0,241
add r9,16
pxor xmm0,xmm2
pxor xmm6,xmm8
DB 102,15,56,0,220
DB 102,68,15,56,0,220
add r11,16
pxor xmm3,xmm0
pxor xmm11,xmm6
DB 102,15,56,0,193
DB 102,15,56,0,241
and r11,0x30
sub rax,1
pxor xmm0,xmm3
pxor xmm6,xmm11
$L$enc2x_entry:
movdqa xmm1,xmm9
movdqa xmm7,xmm9
movdqa xmm5,XMMWORD[(($L$k_inv+16))]
movdqa xmm13,xmm5
pandn xmm1,xmm0
pandn xmm7,xmm6
psrld xmm1,4
psrld xmm7,4
pand xmm0,xmm9
pand xmm6,xmm9
DB 102,15,56,0,232
DB 102,68,15,56,0,238
movdqa xmm3,xmm10
movdqa xmm11,xmm10
pxor xmm0,xmm1
pxor xmm6,xmm7
DB 102,15,56,0,217
DB 102,68,15,56,0,223
movdqa xmm4,xmm10
movdqa xmm12,xmm10
pxor xmm3,xmm5
pxor xmm11,xmm13
DB 102,15,56,0,224
DB 102,68,15,56,0,230
movdqa xmm2,xmm10
movdqa xmm8,xmm10
pxor xmm4,xmm5
pxor xmm12,xmm13
DB 102,15,56,0,211
DB 102,69,15,56,0,195
movdqa xmm3,xmm10
movdqa xmm11,xmm10
pxor xmm2,xmm0
pxor xmm8,xmm6
DB 102,15,56,0,220
DB 102,69,15,56,0,220
movdqu xmm5,XMMWORD[r9]
pxor xmm3,xmm1
pxor xmm11,xmm7
jnz NEAR $L$enc2x_loop
movdqa xmm4,XMMWORD[((-96))+r10]
movdqa xmm0,XMMWORD[((-80))+r10]
movdqa xmm12,xmm4
movdqa xmm6,xmm0
DB 102,15,56,0,226
DB 102,69,15,56,0,224
pxor xmm4,xmm5
pxor xmm12,xmm5
DB 102,15,56,0,195
DB 102,65,15,56,0,243
movdqa xmm1,XMMWORD[64+r10*1+r11]
pxor xmm0,xmm4
pxor xmm6,xmm12
DB 102,15,56,0,193
DB 102,15,56,0,241
DB 0F3h,0C3h ;repret
ALIGN 16
_vpaes_decrypt_core:
mov r9,rdx
mov eax,DWORD[240+rdx]
movdqa xmm1,xmm9
movdqa xmm2,XMMWORD[$L$k_dipt]
pandn xmm1,xmm0
mov r11,rax
psrld xmm1,4
movdqu xmm5,XMMWORD[r9]
shl r11,4
pand xmm0,xmm9
DB 102,15,56,0,208
movdqa xmm0,XMMWORD[(($L$k_dipt+16))]
xor r11,0x30
lea r10,[$L$k_dsbd]
DB 102,15,56,0,193
and r11,0x30
pxor xmm2,xmm5
movdqa xmm5,XMMWORD[(($L$k_mc_forward+48))]
pxor xmm0,xmm2
add r9,16
add r11,r10
jmp NEAR $L$dec_entry
ALIGN 16
$L$dec_loop:
movdqa xmm4,XMMWORD[((-32))+r10]
movdqa xmm1,XMMWORD[((-16))+r10]
DB 102,15,56,0,226
DB 102,15,56,0,203
pxor xmm0,xmm4
movdqa xmm4,XMMWORD[r10]
pxor xmm0,xmm1
movdqa xmm1,XMMWORD[16+r10]
DB 102,15,56,0,226
DB 102,15,56,0,197
DB 102,15,56,0,203
pxor xmm0,xmm4
movdqa xmm4,XMMWORD[32+r10]
pxor xmm0,xmm1
movdqa xmm1,XMMWORD[48+r10]
DB 102,15,56,0,226
DB 102,15,56,0,197
DB 102,15,56,0,203
pxor xmm0,xmm4
movdqa xmm4,XMMWORD[64+r10]
pxor xmm0,xmm1
movdqa xmm1,XMMWORD[80+r10]
DB 102,15,56,0,226
DB 102,15,56,0,197
DB 102,15,56,0,203
pxor xmm0,xmm4
add r9,16
DB 102,15,58,15,237,12
pxor xmm0,xmm1
sub rax,1
$L$dec_entry:
movdqa xmm1,xmm9
pandn xmm1,xmm0
movdqa xmm2,xmm11
psrld xmm1,4
pand xmm0,xmm9
DB 102,15,56,0,208
movdqa xmm3,xmm10
pxor xmm0,xmm1
DB 102,15,56,0,217
movdqa xmm4,xmm10
pxor xmm3,xmm2
DB 102,15,56,0,224
pxor xmm4,xmm2
movdqa xmm2,xmm10
DB 102,15,56,0,211
movdqa xmm3,xmm10
pxor xmm2,xmm0
DB 102,15,56,0,220
movdqu xmm0,XMMWORD[r9]
pxor xmm3,xmm1
jnz NEAR $L$dec_loop
movdqa xmm4,XMMWORD[96+r10]
DB 102,15,56,0,226
pxor xmm4,xmm0
movdqa xmm0,XMMWORD[112+r10]
movdqa xmm2,XMMWORD[((-352))+r11]
DB 102,15,56,0,195
pxor xmm0,xmm4
DB 102,15,56,0,194
DB 0F3h,0C3h ;repret
ALIGN 16
_vpaes_schedule_core:
call _vpaes_preheat
movdqa xmm8,XMMWORD[$L$k_rcon]
movdqu xmm0,XMMWORD[rdi]
movdqa xmm3,xmm0
lea r11,[$L$k_ipt]
call _vpaes_schedule_transform
movdqa xmm7,xmm0
lea r10,[$L$k_sr]
test rcx,rcx
jnz NEAR $L$schedule_am_decrypting
movdqu XMMWORD[rdx],xmm0
jmp NEAR $L$schedule_go
$L$schedule_am_decrypting:
movdqa xmm1,XMMWORD[r10*1+r8]
DB 102,15,56,0,217
movdqu XMMWORD[rdx],xmm3
xor r8,0x30
$L$schedule_go:
cmp esi,192
ja NEAR $L$schedule_256
je NEAR $L$schedule_192
$L$schedule_128:
mov esi,10
$L$oop_schedule_128:
call _vpaes_schedule_round
dec rsi
jz NEAR $L$schedule_mangle_last
call _vpaes_schedule_mangle
jmp NEAR $L$oop_schedule_128
ALIGN 16
$L$schedule_192:
movdqu xmm0,XMMWORD[8+rdi]
call _vpaes_schedule_transform
movdqa xmm6,xmm0
pxor xmm4,xmm4
movhlps xmm6,xmm4
mov esi,4
$L$oop_schedule_192:
call _vpaes_schedule_round
DB 102,15,58,15,198,8
call _vpaes_schedule_mangle
call _vpaes_schedule_192_smear
call _vpaes_schedule_mangle
call _vpaes_schedule_round
dec rsi
jz NEAR $L$schedule_mangle_last
call _vpaes_schedule_mangle
call _vpaes_schedule_192_smear
jmp NEAR $L$oop_schedule_192
ALIGN 16
$L$schedule_256:
movdqu xmm0,XMMWORD[16+rdi]
call _vpaes_schedule_transform
mov esi,7
$L$oop_schedule_256:
call _vpaes_schedule_mangle
movdqa xmm6,xmm0
call _vpaes_schedule_round
dec rsi
jz NEAR $L$schedule_mangle_last
call _vpaes_schedule_mangle
pshufd xmm0,xmm0,0xFF
movdqa xmm5,xmm7
movdqa xmm7,xmm6
call _vpaes_schedule_low_round
movdqa xmm7,xmm5
jmp NEAR $L$oop_schedule_256
ALIGN 16
$L$schedule_mangle_last:
lea r11,[$L$k_deskew]
test rcx,rcx
jnz NEAR $L$schedule_mangle_last_dec
movdqa xmm1,XMMWORD[r10*1+r8]
DB 102,15,56,0,193
lea r11,[$L$k_opt]
add rdx,32
$L$schedule_mangle_last_dec:
add rdx,-16
pxor xmm0,XMMWORD[$L$k_s63]
call _vpaes_schedule_transform
movdqu XMMWORD[rdx],xmm0
pxor xmm0,xmm0
pxor xmm1,xmm1
pxor xmm2,xmm2
pxor xmm3,xmm3
pxor xmm4,xmm4
pxor xmm5,xmm5
pxor xmm6,xmm6
pxor xmm7,xmm7
DB 0F3h,0C3h ;repret
ALIGN 16
_vpaes_schedule_192_smear:
pshufd xmm1,xmm6,0x80
pshufd xmm0,xmm7,0xFE
pxor xmm6,xmm1
pxor xmm1,xmm1
pxor xmm6,xmm0
movdqa xmm0,xmm6
movhlps xmm6,xmm1
DB 0F3h,0C3h ;repret
ALIGN 16
_vpaes_schedule_round:
pxor xmm1,xmm1
DB 102,65,15,58,15,200,15
DB 102,69,15,58,15,192,15
pxor xmm7,xmm1
pshufd xmm0,xmm0,0xFF
DB 102,15,58,15,192,1
_vpaes_schedule_low_round:
movdqa xmm1,xmm7
pslldq xmm7,4
pxor xmm7,xmm1
movdqa xmm1,xmm7
pslldq xmm7,8
pxor xmm7,xmm1
pxor xmm7,XMMWORD[$L$k_s63]
movdqa xmm1,xmm9
pandn xmm1,xmm0
psrld xmm1,4
pand xmm0,xmm9
movdqa xmm2,xmm11
DB 102,15,56,0,208
pxor xmm0,xmm1
movdqa xmm3,xmm10
DB 102,15,56,0,217
pxor xmm3,xmm2
movdqa xmm4,xmm10
DB 102,15,56,0,224
pxor xmm4,xmm2
movdqa xmm2,xmm10
DB 102,15,56,0,211
pxor xmm2,xmm0
movdqa xmm3,xmm10
DB 102,15,56,0,220
pxor xmm3,xmm1
movdqa xmm4,xmm13
DB 102,15,56,0,226
movdqa xmm0,xmm12
DB 102,15,56,0,195
pxor xmm0,xmm4
pxor xmm0,xmm7
movdqa xmm7,xmm0
DB 0F3h,0C3h ;repret
ALIGN 16
_vpaes_schedule_transform:
movdqa xmm1,xmm9
pandn xmm1,xmm0
psrld xmm1,4
pand xmm0,xmm9
movdqa xmm2,XMMWORD[r11]
DB 102,15,56,0,208
movdqa xmm0,XMMWORD[16+r11]
DB 102,15,56,0,193
pxor xmm0,xmm2
DB 0F3h,0C3h ;repret
ALIGN 16
_vpaes_schedule_mangle:
movdqa xmm4,xmm0
movdqa xmm5,XMMWORD[$L$k_mc_forward]
test rcx,rcx
jnz NEAR $L$schedule_mangle_dec
add rdx,16
pxor xmm4,XMMWORD[$L$k_s63]
DB 102,15,56,0,229
movdqa xmm3,xmm4
DB 102,15,56,0,229
pxor xmm3,xmm4
DB 102,15,56,0,229
pxor xmm3,xmm4
jmp NEAR $L$schedule_mangle_both
ALIGN 16
$L$schedule_mangle_dec:
lea r11,[$L$k_dksd]
movdqa xmm1,xmm9
pandn xmm1,xmm4
psrld xmm1,4
pand xmm4,xmm9
movdqa xmm2,XMMWORD[r11]
DB 102,15,56,0,212
movdqa xmm3,XMMWORD[16+r11]
DB 102,15,56,0,217
pxor xmm3,xmm2
DB 102,15,56,0,221
movdqa xmm2,XMMWORD[32+r11]
DB 102,15,56,0,212
pxor xmm2,xmm3
movdqa xmm3,XMMWORD[48+r11]
DB 102,15,56,0,217
pxor xmm3,xmm2
DB 102,15,56,0,221
movdqa xmm2,XMMWORD[64+r11]
DB 102,15,56,0,212
pxor xmm2,xmm3
movdqa xmm3,XMMWORD[80+r11]
DB 102,15,56,0,217
pxor xmm3,xmm2
DB 102,15,56,0,221
movdqa xmm2,XMMWORD[96+r11]
DB 102,15,56,0,212
pxor xmm2,xmm3
movdqa xmm3,XMMWORD[112+r11]
DB 102,15,56,0,217
pxor xmm3,xmm2
add rdx,-16
$L$schedule_mangle_both:
movdqa xmm1,XMMWORD[r10*1+r8]
DB 102,15,56,0,217
add r8,-16
and r8,0x30
movdqu XMMWORD[rdx],xmm3
DB 0F3h,0C3h ;repret
global vpaes_set_encrypt_key
ALIGN 16
vpaes_set_encrypt_key:
mov QWORD[8+rsp],rdi ;WIN64 prologue
mov QWORD[16+rsp],rsi
mov rax,rsp
$L$SEH_begin_vpaes_set_encrypt_key:
mov rdi,rcx
mov rsi,rdx
mov rdx,r8
%ifdef BORINGSSL_DISPATCH_TEST
2020-10-14 20:45:32 +00:00
EXTERN BORINGSSL_function_hit
mov BYTE[((BORINGSSL_function_hit+5))],1
%endif
lea rsp,[((-184))+rsp]
movaps XMMWORD[16+rsp],xmm6
movaps XMMWORD[32+rsp],xmm7
movaps XMMWORD[48+rsp],xmm8
movaps XMMWORD[64+rsp],xmm9
movaps XMMWORD[80+rsp],xmm10
movaps XMMWORD[96+rsp],xmm11
movaps XMMWORD[112+rsp],xmm12
movaps XMMWORD[128+rsp],xmm13
movaps XMMWORD[144+rsp],xmm14
movaps XMMWORD[160+rsp],xmm15
$L$enc_key_body:
mov eax,esi
shr eax,5
add eax,5
mov DWORD[240+rdx],eax
mov ecx,0
mov r8d,0x30
call _vpaes_schedule_core
movaps xmm6,XMMWORD[16+rsp]
movaps xmm7,XMMWORD[32+rsp]
movaps xmm8,XMMWORD[48+rsp]
movaps xmm9,XMMWORD[64+rsp]
movaps xmm10,XMMWORD[80+rsp]
movaps xmm11,XMMWORD[96+rsp]
movaps xmm12,XMMWORD[112+rsp]
movaps xmm13,XMMWORD[128+rsp]
movaps xmm14,XMMWORD[144+rsp]
movaps xmm15,XMMWORD[160+rsp]
lea rsp,[184+rsp]
$L$enc_key_epilogue:
xor eax,eax
mov rdi,QWORD[8+rsp] ;WIN64 epilogue
mov rsi,QWORD[16+rsp]
DB 0F3h,0C3h ;repret
$L$SEH_end_vpaes_set_encrypt_key:
global vpaes_set_decrypt_key
ALIGN 16
vpaes_set_decrypt_key:
mov QWORD[8+rsp],rdi ;WIN64 prologue
mov QWORD[16+rsp],rsi
mov rax,rsp
$L$SEH_begin_vpaes_set_decrypt_key:
mov rdi,rcx
mov rsi,rdx
mov rdx,r8
lea rsp,[((-184))+rsp]
movaps XMMWORD[16+rsp],xmm6
movaps XMMWORD[32+rsp],xmm7
movaps XMMWORD[48+rsp],xmm8
movaps XMMWORD[64+rsp],xmm9
movaps XMMWORD[80+rsp],xmm10
movaps XMMWORD[96+rsp],xmm11
movaps XMMWORD[112+rsp],xmm12
movaps XMMWORD[128+rsp],xmm13
movaps XMMWORD[144+rsp],xmm14
movaps XMMWORD[160+rsp],xmm15
$L$dec_key_body:
mov eax,esi
shr eax,5
add eax,5
mov DWORD[240+rdx],eax
shl eax,4
lea rdx,[16+rax*1+rdx]
mov ecx,1
mov r8d,esi
shr r8d,1
and r8d,32
xor r8d,32
call _vpaes_schedule_core
movaps xmm6,XMMWORD[16+rsp]
movaps xmm7,XMMWORD[32+rsp]
movaps xmm8,XMMWORD[48+rsp]
movaps xmm9,XMMWORD[64+rsp]
movaps xmm10,XMMWORD[80+rsp]
movaps xmm11,XMMWORD[96+rsp]
movaps xmm12,XMMWORD[112+rsp]
movaps xmm13,XMMWORD[128+rsp]
movaps xmm14,XMMWORD[144+rsp]
movaps xmm15,XMMWORD[160+rsp]
lea rsp,[184+rsp]
$L$dec_key_epilogue:
xor eax,eax
mov rdi,QWORD[8+rsp] ;WIN64 epilogue
mov rsi,QWORD[16+rsp]
DB 0F3h,0C3h ;repret
$L$SEH_end_vpaes_set_decrypt_key:
global vpaes_encrypt
ALIGN 16
vpaes_encrypt:
mov QWORD[8+rsp],rdi ;WIN64 prologue
mov QWORD[16+rsp],rsi
mov rax,rsp
$L$SEH_begin_vpaes_encrypt:
mov rdi,rcx
mov rsi,rdx
mov rdx,r8
%ifdef BORINGSSL_DISPATCH_TEST
2020-10-14 20:45:32 +00:00
EXTERN BORINGSSL_function_hit
mov BYTE[((BORINGSSL_function_hit+4))],1
%endif
lea rsp,[((-184))+rsp]
movaps XMMWORD[16+rsp],xmm6
movaps XMMWORD[32+rsp],xmm7
movaps XMMWORD[48+rsp],xmm8
movaps XMMWORD[64+rsp],xmm9
movaps XMMWORD[80+rsp],xmm10
movaps XMMWORD[96+rsp],xmm11
movaps XMMWORD[112+rsp],xmm12
movaps XMMWORD[128+rsp],xmm13
movaps XMMWORD[144+rsp],xmm14
movaps XMMWORD[160+rsp],xmm15
$L$enc_body:
movdqu xmm0,XMMWORD[rdi]
call _vpaes_preheat
call _vpaes_encrypt_core
movdqu XMMWORD[rsi],xmm0
movaps xmm6,XMMWORD[16+rsp]
movaps xmm7,XMMWORD[32+rsp]
movaps xmm8,XMMWORD[48+rsp]
movaps xmm9,XMMWORD[64+rsp]
movaps xmm10,XMMWORD[80+rsp]
movaps xmm11,XMMWORD[96+rsp]
movaps xmm12,XMMWORD[112+rsp]
movaps xmm13,XMMWORD[128+rsp]
movaps xmm14,XMMWORD[144+rsp]
movaps xmm15,XMMWORD[160+rsp]
lea rsp,[184+rsp]
$L$enc_epilogue:
mov rdi,QWORD[8+rsp] ;WIN64 epilogue
mov rsi,QWORD[16+rsp]
DB 0F3h,0C3h ;repret
$L$SEH_end_vpaes_encrypt:
global vpaes_decrypt
ALIGN 16
vpaes_decrypt:
mov QWORD[8+rsp],rdi ;WIN64 prologue
mov QWORD[16+rsp],rsi
mov rax,rsp
$L$SEH_begin_vpaes_decrypt:
mov rdi,rcx
mov rsi,rdx
mov rdx,r8
lea rsp,[((-184))+rsp]
movaps XMMWORD[16+rsp],xmm6
movaps XMMWORD[32+rsp],xmm7
movaps XMMWORD[48+rsp],xmm8
movaps XMMWORD[64+rsp],xmm9
movaps XMMWORD[80+rsp],xmm10
movaps XMMWORD[96+rsp],xmm11
movaps XMMWORD[112+rsp],xmm12
movaps XMMWORD[128+rsp],xmm13
movaps XMMWORD[144+rsp],xmm14
movaps XMMWORD[160+rsp],xmm15
$L$dec_body:
movdqu xmm0,XMMWORD[rdi]
call _vpaes_preheat
call _vpaes_decrypt_core
movdqu XMMWORD[rsi],xmm0
movaps xmm6,XMMWORD[16+rsp]
movaps xmm7,XMMWORD[32+rsp]
movaps xmm8,XMMWORD[48+rsp]
movaps xmm9,XMMWORD[64+rsp]
movaps xmm10,XMMWORD[80+rsp]
movaps xmm11,XMMWORD[96+rsp]
movaps xmm12,XMMWORD[112+rsp]
movaps xmm13,XMMWORD[128+rsp]
movaps xmm14,XMMWORD[144+rsp]
movaps xmm15,XMMWORD[160+rsp]
lea rsp,[184+rsp]
$L$dec_epilogue:
mov rdi,QWORD[8+rsp] ;WIN64 epilogue
mov rsi,QWORD[16+rsp]
DB 0F3h,0C3h ;repret
$L$SEH_end_vpaes_decrypt:
global vpaes_cbc_encrypt
ALIGN 16
vpaes_cbc_encrypt:
mov QWORD[8+rsp],rdi ;WIN64 prologue
mov QWORD[16+rsp],rsi
mov rax,rsp
$L$SEH_begin_vpaes_cbc_encrypt:
mov rdi,rcx
mov rsi,rdx
mov rdx,r8
mov rcx,r9
mov r8,QWORD[40+rsp]
mov r9,QWORD[48+rsp]
xchg rdx,rcx
sub rcx,16
jc NEAR $L$cbc_abort
lea rsp,[((-184))+rsp]
movaps XMMWORD[16+rsp],xmm6
movaps XMMWORD[32+rsp],xmm7
movaps XMMWORD[48+rsp],xmm8
movaps XMMWORD[64+rsp],xmm9
movaps XMMWORD[80+rsp],xmm10
movaps XMMWORD[96+rsp],xmm11
movaps XMMWORD[112+rsp],xmm12
movaps XMMWORD[128+rsp],xmm13
movaps XMMWORD[144+rsp],xmm14
movaps XMMWORD[160+rsp],xmm15
$L$cbc_body:
movdqu xmm6,XMMWORD[r8]
sub rsi,rdi
call _vpaes_preheat
cmp r9d,0
je NEAR $L$cbc_dec_loop
jmp NEAR $L$cbc_enc_loop
ALIGN 16
$L$cbc_enc_loop:
movdqu xmm0,XMMWORD[rdi]
pxor xmm0,xmm6
call _vpaes_encrypt_core
movdqa xmm6,xmm0
movdqu XMMWORD[rdi*1+rsi],xmm0
lea rdi,[16+rdi]
sub rcx,16
jnc NEAR $L$cbc_enc_loop
jmp NEAR $L$cbc_done
ALIGN 16
$L$cbc_dec_loop:
movdqu xmm0,XMMWORD[rdi]
movdqa xmm7,xmm0
call _vpaes_decrypt_core
pxor xmm0,xmm6
movdqa xmm6,xmm7
movdqu XMMWORD[rdi*1+rsi],xmm0
lea rdi,[16+rdi]
sub rcx,16
jnc NEAR $L$cbc_dec_loop
$L$cbc_done:
movdqu XMMWORD[r8],xmm6
movaps xmm6,XMMWORD[16+rsp]
movaps xmm7,XMMWORD[32+rsp]
movaps xmm8,XMMWORD[48+rsp]
movaps xmm9,XMMWORD[64+rsp]
movaps xmm10,XMMWORD[80+rsp]
movaps xmm11,XMMWORD[96+rsp]
movaps xmm12,XMMWORD[112+rsp]
movaps xmm13,XMMWORD[128+rsp]
movaps xmm14,XMMWORD[144+rsp]
movaps xmm15,XMMWORD[160+rsp]
lea rsp,[184+rsp]
$L$cbc_epilogue:
$L$cbc_abort:
mov rdi,QWORD[8+rsp] ;WIN64 epilogue
mov rsi,QWORD[16+rsp]
DB 0F3h,0C3h ;repret
$L$SEH_end_vpaes_cbc_encrypt:
global vpaes_ctr32_encrypt_blocks
ALIGN 16
vpaes_ctr32_encrypt_blocks:
mov QWORD[8+rsp],rdi ;WIN64 prologue
mov QWORD[16+rsp],rsi
mov rax,rsp
$L$SEH_begin_vpaes_ctr32_encrypt_blocks:
mov rdi,rcx
mov rsi,rdx
mov rdx,r8
mov rcx,r9
mov r8,QWORD[40+rsp]
xchg rdx,rcx
test rcx,rcx
jz NEAR $L$ctr32_abort
lea rsp,[((-184))+rsp]
movaps XMMWORD[16+rsp],xmm6
movaps XMMWORD[32+rsp],xmm7
movaps XMMWORD[48+rsp],xmm8
movaps XMMWORD[64+rsp],xmm9
movaps XMMWORD[80+rsp],xmm10
movaps XMMWORD[96+rsp],xmm11
movaps XMMWORD[112+rsp],xmm12
movaps XMMWORD[128+rsp],xmm13
movaps XMMWORD[144+rsp],xmm14
movaps XMMWORD[160+rsp],xmm15
$L$ctr32_body:
movdqu xmm0,XMMWORD[r8]
movdqa xmm8,XMMWORD[$L$ctr_add_one]
sub rsi,rdi
call _vpaes_preheat
movdqa xmm6,xmm0
pshufb xmm6,XMMWORD[$L$rev_ctr]
test rcx,1
jz NEAR $L$ctr32_prep_loop
movdqu xmm7,XMMWORD[rdi]
call _vpaes_encrypt_core
pxor xmm0,xmm7
paddd xmm6,xmm8
movdqu XMMWORD[rdi*1+rsi],xmm0
sub rcx,1
lea rdi,[16+rdi]
jz NEAR $L$ctr32_done
$L$ctr32_prep_loop:
movdqa xmm14,xmm6
movdqa xmm15,xmm6
paddd xmm15,xmm8
$L$ctr32_loop:
movdqa xmm1,XMMWORD[$L$rev_ctr]
movdqa xmm0,xmm14
movdqa xmm6,xmm15
DB 102,15,56,0,193
DB 102,15,56,0,241
call _vpaes_encrypt_core_2x
movdqu xmm1,XMMWORD[rdi]
movdqu xmm2,XMMWORD[16+rdi]
movdqa xmm3,XMMWORD[$L$ctr_add_two]
pxor xmm0,xmm1
pxor xmm6,xmm2
paddd xmm14,xmm3
paddd xmm15,xmm3
movdqu XMMWORD[rdi*1+rsi],xmm0
movdqu XMMWORD[16+rdi*1+rsi],xmm6
sub rcx,2
lea rdi,[32+rdi]
jnz NEAR $L$ctr32_loop
$L$ctr32_done:
movaps xmm6,XMMWORD[16+rsp]
movaps xmm7,XMMWORD[32+rsp]
movaps xmm8,XMMWORD[48+rsp]
movaps xmm9,XMMWORD[64+rsp]
movaps xmm10,XMMWORD[80+rsp]
movaps xmm11,XMMWORD[96+rsp]
movaps xmm12,XMMWORD[112+rsp]
movaps xmm13,XMMWORD[128+rsp]
movaps xmm14,XMMWORD[144+rsp]
movaps xmm15,XMMWORD[160+rsp]
lea rsp,[184+rsp]
$L$ctr32_epilogue:
$L$ctr32_abort:
mov rdi,QWORD[8+rsp] ;WIN64 epilogue
mov rsi,QWORD[16+rsp]
DB 0F3h,0C3h ;repret
$L$SEH_end_vpaes_ctr32_encrypt_blocks:
ALIGN 16
_vpaes_preheat:
lea r10,[$L$k_s0F]
movdqa xmm10,XMMWORD[((-32))+r10]
movdqa xmm11,XMMWORD[((-16))+r10]
movdqa xmm9,XMMWORD[r10]
movdqa xmm13,XMMWORD[48+r10]
movdqa xmm12,XMMWORD[64+r10]
movdqa xmm15,XMMWORD[80+r10]
movdqa xmm14,XMMWORD[96+r10]
DB 0F3h,0C3h ;repret
ALIGN 64
_vpaes_consts:
$L$k_inv:
DQ 0x0E05060F0D080180,0x040703090A0B0C02
DQ 0x01040A060F0B0780,0x030D0E0C02050809
$L$k_s0F:
DQ 0x0F0F0F0F0F0F0F0F,0x0F0F0F0F0F0F0F0F
$L$k_ipt:
DQ 0xC2B2E8985A2A7000,0xCABAE09052227808
DQ 0x4C01307D317C4D00,0xCD80B1FCB0FDCC81
$L$k_sb1:
DQ 0xB19BE18FCB503E00,0xA5DF7A6E142AF544
DQ 0x3618D415FAE22300,0x3BF7CCC10D2ED9EF
$L$k_sb2:
DQ 0xE27A93C60B712400,0x5EB7E955BC982FCD
DQ 0x69EB88400AE12900,0xC2A163C8AB82234A
$L$k_sbo:
DQ 0xD0D26D176FBDC700,0x15AABF7AC502A878
DQ 0xCFE474A55FBB6A00,0x8E1E90D1412B35FA
$L$k_mc_forward:
DQ 0x0407060500030201,0x0C0F0E0D080B0A09
DQ 0x080B0A0904070605,0x000302010C0F0E0D
DQ 0x0C0F0E0D080B0A09,0x0407060500030201
DQ 0x000302010C0F0E0D,0x080B0A0904070605
$L$k_mc_backward:
DQ 0x0605040702010003,0x0E0D0C0F0A09080B
DQ 0x020100030E0D0C0F,0x0A09080B06050407
DQ 0x0E0D0C0F0A09080B,0x0605040702010003
DQ 0x0A09080B06050407,0x020100030E0D0C0F
$L$k_sr:
DQ 0x0706050403020100,0x0F0E0D0C0B0A0908
DQ 0x030E09040F0A0500,0x0B06010C07020D08
DQ 0x0F060D040B020900,0x070E050C030A0108
DQ 0x0B0E0104070A0D00,0x0306090C0F020508
$L$k_rcon:
DQ 0x1F8391B9AF9DEEB6,0x702A98084D7C7D81
$L$k_s63:
DQ 0x5B5B5B5B5B5B5B5B,0x5B5B5B5B5B5B5B5B
$L$k_opt:
DQ 0xFF9F4929D6B66000,0xF7974121DEBE6808
DQ 0x01EDBD5150BCEC00,0xE10D5DB1B05C0CE0
$L$k_deskew:
DQ 0x07E4A34047A4E300,0x1DFEB95A5DBEF91A
DQ 0x5F36B5DC83EA6900,0x2841C2ABF49D1E77
$L$k_dksd:
DQ 0xFEB91A5DA3E44700,0x0740E3A45A1DBEF9
DQ 0x41C277F4B5368300,0x5FDC69EAAB289D1E
$L$k_dksb:
DQ 0x9A4FCA1F8550D500,0x03D653861CC94C99
DQ 0x115BEDA7B6FC4A00,0xD993256F7E3482C8
$L$k_dkse:
DQ 0xD5031CCA1FC9D600,0x53859A4C994F5086
DQ 0xA23196054FDC7BE8,0xCD5EF96A20B31487
$L$k_dks9:
DQ 0xB6116FC87ED9A700,0x4AED933482255BFC
DQ 0x4576516227143300,0x8BB89FACE9DAFDCE
$L$k_dipt:
DQ 0x0F505B040B545F00,0x154A411E114E451A
DQ 0x86E383E660056500,0x12771772F491F194
$L$k_dsb9:
DQ 0x851C03539A86D600,0xCAD51F504F994CC9
DQ 0xC03B1789ECD74900,0x725E2C9EB2FBA565
$L$k_dsbd:
DQ 0x7D57CCDFE6B1A200,0xF56E9B13882A4439
DQ 0x3CE2FAF724C6CB00,0x2931180D15DEEFD3
$L$k_dsbb:
DQ 0xD022649296B44200,0x602646F6B0F2D404
DQ 0xC19498A6CD596700,0xF3FF0C3E3255AA6B
$L$k_dsbe:
DQ 0x46F2929626D4D000,0x2242600464B4F6B0
DQ 0x0C55A6CDFFAAC100,0x9467F36B98593E32
$L$k_dsbo:
DQ 0x1387EA537EF94000,0xC7AA6DB9D4943E2D
DQ 0x12D7560F93441D00,0xCA4B8159D8C58E9C
$L$rev_ctr:
DQ 0x0706050403020100,0x0c0d0e0f0b0a0908
$L$ctr_add_one:
DQ 0x0000000000000000,0x0000000100000000
$L$ctr_add_two:
DQ 0x0000000000000000,0x0000000200000000
DB 86,101,99,116,111,114,32,80,101,114,109,117,116,97,116,105
DB 111,110,32,65,69,83,32,102,111,114,32,120,56,54,95,54
DB 52,47,83,83,83,69,51,44,32,77,105,107,101,32,72,97
DB 109,98,117,114,103,32,40,83,116,97,110,102,111,114,100,32
DB 85,110,105,118,101,114,115,105,116,121,41,0
ALIGN 64
EXTERN __imp_RtlVirtualUnwind
ALIGN 16
se_handler:
push rsi
push rdi
push rbx
push rbp
push r12
push r13
push r14
push r15
pushfq
sub rsp,64
mov rax,QWORD[120+r8]
mov rbx,QWORD[248+r8]
mov rsi,QWORD[8+r9]
mov r11,QWORD[56+r9]
mov r10d,DWORD[r11]
lea r10,[r10*1+rsi]
cmp rbx,r10
jb NEAR $L$in_prologue
mov rax,QWORD[152+r8]
mov r10d,DWORD[4+r11]
lea r10,[r10*1+rsi]
cmp rbx,r10
jae NEAR $L$in_prologue
lea rsi,[16+rax]
lea rdi,[512+r8]
mov ecx,20
DD 0xa548f3fc
lea rax,[184+rax]
$L$in_prologue:
mov rdi,QWORD[8+rax]
mov rsi,QWORD[16+rax]
mov QWORD[152+r8],rax
mov QWORD[168+r8],rsi
mov QWORD[176+r8],rdi
mov rdi,QWORD[40+r9]
mov rsi,r8
mov ecx,154
DD 0xa548f3fc
mov rsi,r9
xor rcx,rcx
mov rdx,QWORD[8+rsi]
mov r8,QWORD[rsi]
mov r9,QWORD[16+rsi]
mov r10,QWORD[40+rsi]
lea r11,[56+rsi]
lea r12,[24+rsi]
mov QWORD[32+rsp],r10
mov QWORD[40+rsp],r11
mov QWORD[48+rsp],r12
mov QWORD[56+rsp],rcx
call QWORD[__imp_RtlVirtualUnwind]
mov eax,1
add rsp,64
popfq
pop r15
pop r14
pop r13
pop r12
pop rbp
pop rbx
pop rdi
pop rsi
DB 0F3h,0C3h ;repret
section .pdata rdata align=4
ALIGN 4
DD $L$SEH_begin_vpaes_set_encrypt_key wrt ..imagebase
DD $L$SEH_end_vpaes_set_encrypt_key wrt ..imagebase
DD $L$SEH_info_vpaes_set_encrypt_key wrt ..imagebase
DD $L$SEH_begin_vpaes_set_decrypt_key wrt ..imagebase
DD $L$SEH_end_vpaes_set_decrypt_key wrt ..imagebase
DD $L$SEH_info_vpaes_set_decrypt_key wrt ..imagebase
DD $L$SEH_begin_vpaes_encrypt wrt ..imagebase
DD $L$SEH_end_vpaes_encrypt wrt ..imagebase
DD $L$SEH_info_vpaes_encrypt wrt ..imagebase
DD $L$SEH_begin_vpaes_decrypt wrt ..imagebase
DD $L$SEH_end_vpaes_decrypt wrt ..imagebase
DD $L$SEH_info_vpaes_decrypt wrt ..imagebase
DD $L$SEH_begin_vpaes_cbc_encrypt wrt ..imagebase
DD $L$SEH_end_vpaes_cbc_encrypt wrt ..imagebase
DD $L$SEH_info_vpaes_cbc_encrypt wrt ..imagebase
DD $L$SEH_begin_vpaes_ctr32_encrypt_blocks wrt ..imagebase
DD $L$SEH_end_vpaes_ctr32_encrypt_blocks wrt ..imagebase
DD $L$SEH_info_vpaes_ctr32_encrypt_blocks wrt ..imagebase
section .xdata rdata align=8
ALIGN 8
$L$SEH_info_vpaes_set_encrypt_key:
DB 9,0,0,0
DD se_handler wrt ..imagebase
DD $L$enc_key_body wrt ..imagebase,$L$enc_key_epilogue wrt ..imagebase
$L$SEH_info_vpaes_set_decrypt_key:
DB 9,0,0,0
DD se_handler wrt ..imagebase
DD $L$dec_key_body wrt ..imagebase,$L$dec_key_epilogue wrt ..imagebase
$L$SEH_info_vpaes_encrypt:
DB 9,0,0,0
DD se_handler wrt ..imagebase
DD $L$enc_body wrt ..imagebase,$L$enc_epilogue wrt ..imagebase
$L$SEH_info_vpaes_decrypt:
DB 9,0,0,0
DD se_handler wrt ..imagebase
DD $L$dec_body wrt ..imagebase,$L$dec_epilogue wrt ..imagebase
$L$SEH_info_vpaes_cbc_encrypt:
DB 9,0,0,0
DD se_handler wrt ..imagebase
DD $L$cbc_body wrt ..imagebase,$L$cbc_epilogue wrt ..imagebase
$L$SEH_info_vpaes_ctr32_encrypt_blocks:
DB 9,0,0,0
DD se_handler wrt ..imagebase
DD $L$ctr32_body wrt ..imagebase,$L$ctr32_epilogue wrt ..imagebase