; blob: 68c74cc1b94d586acd5f7bef430532e58cc97987 [file] [log] [blame] [edit]
; This file is generated from a similarly-named Perl script in the BoringSSL
; source tree. Do not edit by hand.
; Use RIP-relative addressing by default for symbol references such as
; [K256] and [OPENSSL_ia32cap_P].
default rel
; The operand-size keywords emitted by the generator are defined to nothing,
; so an operand written as XMMWORD[...] assembles as a plain [...] operand.
%define XMMWORD
%define YMMWORD
%define ZMMWORD
; Optional symbol-prefixing include, only pulled in when BORINGSSL_PREFIX
; is defined by the build.
%ifdef BORINGSSL_PREFIX
%include "boringssl_prefix_symbols_nasm.inc"
%endif
section .text code align=64
; Capability words defined elsewhere; read by the dispatch code at the top
; of sha256_block_data_order.
EXTERN OPENSSL_ia32cap_P
global sha256_block_data_order
; ----------------------------------------------------------------------
; sha256_block_data_order -- Win64 entry point and scalar code path.
;
; In (Win64 registers, moved to rdi/rsi/rdx right after entry):
;   rcx -> eight 32-bit state words (loaded below, written back per block)
;   rdx -> input data, consumed 64 bytes per outer-loop iteration
;   r8  =  number of 64-byte blocks (turned into an end pointer below)
;
; rdi and rsi are spilled to [rsp+8] / [rsp+16] on entry and reloaded
; from the same slots at $L$epilogue.
;
; Frame after `and rsp,-64` (rsp is 64-byte aligned):
;   [rsp+ 0 .. rsp+63]  16-dword message schedule W[0..15]
;   [rsp+64]            state pointer (rdi)
;   [rsp+72]            input pointer at entry (rsi)
;   [rsp+80]            end-of-input pointer
;   [rsp+88]            rsp value from before the pushes (used to unwind)
; ----------------------------------------------------------------------
ALIGN 16
sha256_block_data_order:
mov QWORD[8+rsp],rdi ;WIN64 prologue
mov QWORD[16+rsp],rsi
mov rax,rsp
$L$SEH_begin_sha256_block_data_order:
; Shuffle the three arguments into rdi, rsi, rdx.
mov rdi,rcx
mov rsi,rdx
mov rdx,r8
; CPU-feature dispatch on the first two dwords of OPENSSL_ia32cap_P:
;   1073741824 = 1<<30            (kept from dword 0)
;   268435968  = (1<<28)|(1<<9)   (kept from dword 1)
;   1342177792 = (1<<30)|(1<<28)|(1<<9)
; All three bits set  -> $L$avx_shortcut.
; Otherwise bit 9 set -> $L$ssse3_shortcut.
; Otherwise fall through to the scalar code below.
; NOTE(review): per the OPENSSL_ia32cap documentation these bits are
; presumably "Intel CPU", AVX and SSSE3 -- confirm against that reference.
; The third dword loaded into r11d is not read on the scalar or SSSE3
; paths visible in this file before r11d is overwritten.
lea r11,[OPENSSL_ia32cap_P]
mov r9d,DWORD[r11]
mov r10d,DWORD[4+r11]
mov r11d,DWORD[8+r11]
and r9d,1073741824
and r10d,268435968
or r10d,r9d
cmp r10d,1342177792
je NEAR $L$avx_shortcut
test r10d,512
jnz NEAR $L$ssse3_shortcut
; Scalar path: remember the incoming rsp in rax, then save the six
; registers restored later from [rax-8] .. [rax-48].
mov rax,rsp
push rbx
push rbp
push r12
push r13
push r14
push r15
; rdx = rsi + rdx*64 (shl by 4, then *4 in the lea): one-past-the-end
; pointer for the input. The lea is interleaved with the frame setup.
shl rdx,4
sub rsp,16*4+4*8
lea rdx,[rdx*4+rsi]
and rsp,-64
mov QWORD[((64+0))+rsp],rdi
mov QWORD[((64+8))+rsp],rsi
mov QWORD[((64+16))+rsp],rdx
mov QWORD[88+rsp],rax
$L$prologue:
; Load the eight state words into the working registers
; (eax,ebx,ecx,edx,r8d,r9d,r10d,r11d = words 0..7).
mov eax,DWORD[rdi]
mov ebx,DWORD[4+rdi]
mov ecx,DWORD[8+rdi]
mov edx,DWORD[12+rdi]
mov r8d,DWORD[16+rdi]
mov r9d,DWORD[20+rdi]
mov r10d,DWORD[24+rdi]
mov r11d,DWORD[28+rdi]
; Jump over the alignment padding emitted before $L$loop.
jmp NEAR $L$loop
; ----------------------------------------------------------------------
; $L$loop -- top of the per-block loop: rounds 0..15, fully unrolled.
;
; On entry eax,ebx,ecx,edx,r8d,r9d,r10d,r11d hold the working variables
; a,b,c,d,e,f,g,h. Values are never moved between rounds; instead the
; register that plays each role shifts by one per round.
;
; Per round i:
;   r12d = input dword i, byte-swapped, stored as W[i] at [4*i+rsp];
;          then accumulates T1 = W[i] + h + Ch(e,f,g) + K[i] + Sigma1(e),
;          with Ch computed as ((f ^ g) & e) ^ g
;   r13d = Sigma1(e), built as ((e ror 14 ^ e) ror 5 ^ e) ror 6
;          (= e ror 6 ^ e ror 11 ^ e ror 25)
;   r14d = Sigma0(a), built as ((a ror 9 ^ a) ror 11 ^ a) ror 2
;          (= a ror 2 ^ a ror 13 ^ a ror 22)
;   edi / r15d alternate: one holds a^b for this round, the other holds
;          b^c (the previous round's a^b); Maj(a,b,c) = b ^ ((a^b)&(b^c))
;   d   += T1;  the old h register becomes the new a = Maj + T1 + Sigma0(a)
;   rbp -> K[i] inside K256; advanced by 4 per round and by 20 after
;          every fourth round because each row of four constants is
;          stored twice in the table.
; ----------------------------------------------------------------------
ALIGN 16
$L$loop:
; round 0: a=eax b=ebx c=ecx d=edx e=r8d f=r9d g=r10d h=r11d
; edi is seeded with b^c for the first Maj computation.
mov edi,ebx
lea rbp,[K256]
xor edi,ecx
mov r12d,DWORD[rsi]
mov r13d,r8d
mov r14d,eax
bswap r12d
ror r13d,14
mov r15d,r9d
xor r13d,r8d
ror r14d,9
xor r15d,r10d
mov DWORD[rsp],r12d
xor r14d,eax
and r15d,r8d
ror r13d,5
add r12d,r11d
xor r15d,r10d
ror r14d,11
xor r13d,r8d
add r12d,r15d
mov r15d,eax
add r12d,DWORD[rbp]
xor r14d,eax
xor r15d,ebx
ror r13d,6
mov r11d,ebx
and edi,r15d
ror r14d,2
add r12d,r13d
xor r11d,edi
add edx,r12d
add r11d,r12d
lea rbp,[4+rbp]
add r11d,r14d
; round 1: a=r11d e=edx, W[1] from [4+rsi]
mov r12d,DWORD[4+rsi]
mov r13d,edx
mov r14d,r11d
bswap r12d
ror r13d,14
mov edi,r8d
xor r13d,edx
ror r14d,9
xor edi,r9d
mov DWORD[4+rsp],r12d
xor r14d,r11d
and edi,edx
ror r13d,5
add r12d,r10d
xor edi,r9d
ror r14d,11
xor r13d,edx
add r12d,edi
mov edi,r11d
add r12d,DWORD[rbp]
xor r14d,r11d
xor edi,eax
ror r13d,6
mov r10d,eax
and r15d,edi
ror r14d,2
add r12d,r13d
xor r10d,r15d
add ecx,r12d
add r10d,r12d
lea rbp,[4+rbp]
add r10d,r14d
; round 2: a=r10d e=ecx, W[2] from [8+rsi]
mov r12d,DWORD[8+rsi]
mov r13d,ecx
mov r14d,r10d
bswap r12d
ror r13d,14
mov r15d,edx
xor r13d,ecx
ror r14d,9
xor r15d,r8d
mov DWORD[8+rsp],r12d
xor r14d,r10d
and r15d,ecx
ror r13d,5
add r12d,r9d
xor r15d,r8d
ror r14d,11
xor r13d,ecx
add r12d,r15d
mov r15d,r10d
add r12d,DWORD[rbp]
xor r14d,r10d
xor r15d,r11d
ror r13d,6
mov r9d,r11d
and edi,r15d
ror r14d,2
add r12d,r13d
xor r9d,edi
add ebx,r12d
add r9d,r12d
lea rbp,[4+rbp]
add r9d,r14d
; round 3: a=r9d e=ebx, W[3] from [12+rsi]
mov r12d,DWORD[12+rsi]
mov r13d,ebx
mov r14d,r9d
bswap r12d
ror r13d,14
mov edi,ecx
xor r13d,ebx
ror r14d,9
xor edi,edx
mov DWORD[12+rsp],r12d
xor r14d,r9d
and edi,ebx
ror r13d,5
add r12d,r8d
xor edi,edx
ror r14d,11
xor r13d,ebx
add r12d,edi
mov edi,r9d
add r12d,DWORD[rbp]
xor r14d,r9d
xor edi,r10d
ror r13d,6
mov r8d,r10d
and r15d,edi
ror r14d,2
add r12d,r13d
xor r8d,r15d
add eax,r12d
add r8d,r12d
; +20 = 4 for this constant plus 16 to skip the duplicated table row.
lea rbp,[20+rbp]
add r8d,r14d
; round 4: a=r8d e=eax, W[4] from [16+rsi]
mov r12d,DWORD[16+rsi]
mov r13d,eax
mov r14d,r8d
bswap r12d
ror r13d,14
mov r15d,ebx
xor r13d,eax
ror r14d,9
xor r15d,ecx
mov DWORD[16+rsp],r12d
xor r14d,r8d
and r15d,eax
ror r13d,5
add r12d,edx
xor r15d,ecx
ror r14d,11
xor r13d,eax
add r12d,r15d
mov r15d,r8d
add r12d,DWORD[rbp]
xor r14d,r8d
xor r15d,r9d
ror r13d,6
mov edx,r9d
and edi,r15d
ror r14d,2
add r12d,r13d
xor edx,edi
add r11d,r12d
add edx,r12d
lea rbp,[4+rbp]
add edx,r14d
; round 5: a=edx e=r11d, W[5] from [20+rsi]
mov r12d,DWORD[20+rsi]
mov r13d,r11d
mov r14d,edx
bswap r12d
ror r13d,14
mov edi,eax
xor r13d,r11d
ror r14d,9
xor edi,ebx
mov DWORD[20+rsp],r12d
xor r14d,edx
and edi,r11d
ror r13d,5
add r12d,ecx
xor edi,ebx
ror r14d,11
xor r13d,r11d
add r12d,edi
mov edi,edx
add r12d,DWORD[rbp]
xor r14d,edx
xor edi,r8d
ror r13d,6
mov ecx,r8d
and r15d,edi
ror r14d,2
add r12d,r13d
xor ecx,r15d
add r10d,r12d
add ecx,r12d
lea rbp,[4+rbp]
add ecx,r14d
; round 6: a=ecx e=r10d, W[6] from [24+rsi]
mov r12d,DWORD[24+rsi]
mov r13d,r10d
mov r14d,ecx
bswap r12d
ror r13d,14
mov r15d,r11d
xor r13d,r10d
ror r14d,9
xor r15d,eax
mov DWORD[24+rsp],r12d
xor r14d,ecx
and r15d,r10d
ror r13d,5
add r12d,ebx
xor r15d,eax
ror r14d,11
xor r13d,r10d
add r12d,r15d
mov r15d,ecx
add r12d,DWORD[rbp]
xor r14d,ecx
xor r15d,edx
ror r13d,6
mov ebx,edx
and edi,r15d
ror r14d,2
add r12d,r13d
xor ebx,edi
add r9d,r12d
add ebx,r12d
lea rbp,[4+rbp]
add ebx,r14d
; round 7: a=ebx e=r9d, W[7] from [28+rsi]
mov r12d,DWORD[28+rsi]
mov r13d,r9d
mov r14d,ebx
bswap r12d
ror r13d,14
mov edi,r10d
xor r13d,r9d
ror r14d,9
xor edi,r11d
mov DWORD[28+rsp],r12d
xor r14d,ebx
and edi,r9d
ror r13d,5
add r12d,eax
xor edi,r11d
ror r14d,11
xor r13d,r9d
add r12d,edi
mov edi,ebx
add r12d,DWORD[rbp]
xor r14d,ebx
xor edi,ecx
ror r13d,6
mov eax,ecx
and r15d,edi
ror r14d,2
add r12d,r13d
xor eax,r15d
add r8d,r12d
add eax,r12d
lea rbp,[20+rbp]
add eax,r14d
; round 8: register roles are back to the round-0 assignment
; (a=eax e=r8d), W[8] from [32+rsi]
mov r12d,DWORD[32+rsi]
mov r13d,r8d
mov r14d,eax
bswap r12d
ror r13d,14
mov r15d,r9d
xor r13d,r8d
ror r14d,9
xor r15d,r10d
mov DWORD[32+rsp],r12d
xor r14d,eax
and r15d,r8d
ror r13d,5
add r12d,r11d
xor r15d,r10d
ror r14d,11
xor r13d,r8d
add r12d,r15d
mov r15d,eax
add r12d,DWORD[rbp]
xor r14d,eax
xor r15d,ebx
ror r13d,6
mov r11d,ebx
and edi,r15d
ror r14d,2
add r12d,r13d
xor r11d,edi
add edx,r12d
add r11d,r12d
lea rbp,[4+rbp]
add r11d,r14d
; round 9: a=r11d e=edx, W[9] from [36+rsi]
mov r12d,DWORD[36+rsi]
mov r13d,edx
mov r14d,r11d
bswap r12d
ror r13d,14
mov edi,r8d
xor r13d,edx
ror r14d,9
xor edi,r9d
mov DWORD[36+rsp],r12d
xor r14d,r11d
and edi,edx
ror r13d,5
add r12d,r10d
xor edi,r9d
ror r14d,11
xor r13d,edx
add r12d,edi
mov edi,r11d
add r12d,DWORD[rbp]
xor r14d,r11d
xor edi,eax
ror r13d,6
mov r10d,eax
and r15d,edi
ror r14d,2
add r12d,r13d
xor r10d,r15d
add ecx,r12d
add r10d,r12d
lea rbp,[4+rbp]
add r10d,r14d
; round 10: a=r10d e=ecx, W[10] from [40+rsi]
mov r12d,DWORD[40+rsi]
mov r13d,ecx
mov r14d,r10d
bswap r12d
ror r13d,14
mov r15d,edx
xor r13d,ecx
ror r14d,9
xor r15d,r8d
mov DWORD[40+rsp],r12d
xor r14d,r10d
and r15d,ecx
ror r13d,5
add r12d,r9d
xor r15d,r8d
ror r14d,11
xor r13d,ecx
add r12d,r15d
mov r15d,r10d
add r12d,DWORD[rbp]
xor r14d,r10d
xor r15d,r11d
ror r13d,6
mov r9d,r11d
and edi,r15d
ror r14d,2
add r12d,r13d
xor r9d,edi
add ebx,r12d
add r9d,r12d
lea rbp,[4+rbp]
add r9d,r14d
; round 11: a=r9d e=ebx, W[11] from [44+rsi]
mov r12d,DWORD[44+rsi]
mov r13d,ebx
mov r14d,r9d
bswap r12d
ror r13d,14
mov edi,ecx
xor r13d,ebx
ror r14d,9
xor edi,edx
mov DWORD[44+rsp],r12d
xor r14d,r9d
and edi,ebx
ror r13d,5
add r12d,r8d
xor edi,edx
ror r14d,11
xor r13d,ebx
add r12d,edi
mov edi,r9d
add r12d,DWORD[rbp]
xor r14d,r9d
xor edi,r10d
ror r13d,6
mov r8d,r10d
and r15d,edi
ror r14d,2
add r12d,r13d
xor r8d,r15d
add eax,r12d
add r8d,r12d
lea rbp,[20+rbp]
add r8d,r14d
; round 12: a=r8d e=eax, W[12] from [48+rsi]
mov r12d,DWORD[48+rsi]
mov r13d,eax
mov r14d,r8d
bswap r12d
ror r13d,14
mov r15d,ebx
xor r13d,eax
ror r14d,9
xor r15d,ecx
mov DWORD[48+rsp],r12d
xor r14d,r8d
and r15d,eax
ror r13d,5
add r12d,edx
xor r15d,ecx
ror r14d,11
xor r13d,eax
add r12d,r15d
mov r15d,r8d
add r12d,DWORD[rbp]
xor r14d,r8d
xor r15d,r9d
ror r13d,6
mov edx,r9d
and edi,r15d
ror r14d,2
add r12d,r13d
xor edx,edi
add r11d,r12d
add edx,r12d
lea rbp,[4+rbp]
add edx,r14d
; round 13: a=edx e=r11d, W[13] from [52+rsi]
mov r12d,DWORD[52+rsi]
mov r13d,r11d
mov r14d,edx
bswap r12d
ror r13d,14
mov edi,eax
xor r13d,r11d
ror r14d,9
xor edi,ebx
mov DWORD[52+rsp],r12d
xor r14d,edx
and edi,r11d
ror r13d,5
add r12d,ecx
xor edi,ebx
ror r14d,11
xor r13d,r11d
add r12d,edi
mov edi,edx
add r12d,DWORD[rbp]
xor r14d,edx
xor edi,r8d
ror r13d,6
mov ecx,r8d
and r15d,edi
ror r14d,2
add r12d,r13d
xor ecx,r15d
add r10d,r12d
add ecx,r12d
lea rbp,[4+rbp]
add ecx,r14d
; round 14: a=ecx e=r10d, W[14] from [56+rsi]
mov r12d,DWORD[56+rsi]
mov r13d,r10d
mov r14d,ecx
bswap r12d
ror r13d,14
mov r15d,r11d
xor r13d,r10d
ror r14d,9
xor r15d,eax
mov DWORD[56+rsp],r12d
xor r14d,ecx
and r15d,r10d
ror r13d,5
add r12d,ebx
xor r15d,eax
ror r14d,11
xor r13d,r10d
add r12d,r15d
mov r15d,ecx
add r12d,DWORD[rbp]
xor r14d,ecx
xor r15d,edx
ror r13d,6
mov ebx,edx
and edi,r15d
ror r14d,2
add r12d,r13d
xor ebx,edi
add r9d,r12d
add ebx,r12d
lea rbp,[4+rbp]
add ebx,r14d
; round 15: a=ebx e=r9d, W[15] from [60+rsi]
mov r12d,DWORD[60+rsi]
mov r13d,r9d
mov r14d,ebx
bswap r12d
ror r13d,14
mov edi,r10d
xor r13d,r9d
ror r14d,9
xor edi,r11d
mov DWORD[60+rsp],r12d
xor r14d,ebx
and edi,r9d
ror r13d,5
add r12d,eax
xor edi,r11d
ror r14d,11
xor r13d,r9d
add r12d,edi
mov edi,ebx
add r12d,DWORD[rbp]
xor r14d,ebx
xor edi,ecx
ror r13d,6
mov eax,ecx
and r15d,edi
ror r14d,2
add r12d,r13d
xor eax,r15d
add r8d,r12d
add eax,r12d
lea rbp,[20+rbp]
; The Sigma0 term of round 15 is still pending in r14d; it is added to
; eax a few instructions into $L$rounds_16_xx.
jmp NEAR $L$rounds_16_xx
; ----------------------------------------------------------------------
; $L$rounds_16_xx -- rounds 16..63, sixteen rounds per pass.
;
; The 16-dword window at [rsp] is updated in place. For slot t (indices
; taken mod 16):
;   W[t] += sigma0(W[t+1]) + sigma1(W[t+14]) + W[t+9]
;   sigma0(x) = x ror 7 ^ x ror 18 ^ x shr 3
;               built as ((x ror 11 ^ x) ror 7) ^ (x shr 3)
;   sigma1(x) = x ror 17 ^ x ror 19 ^ x shr 10
;               built as ((x ror 2 ^ x) ror 17) ^ (x shr 10)
; followed by the same round function as in $L$loop (r12d = T1,
; r13d = Sigma1(e), r14d = Sigma0(a), edi/r15d alternating for Maj).
;
; The `add <new a>,r14d` that finishes each round is deferred into the
; schedule computation of the next round (fifth instruction of each slot).
;
; rbp enters at K256+128 and advances 128 bytes per pass. The loop exits
; when byte 3 of the dword at rbp is zero, which first happens at
; K256+512 (the 0x00010203 entry following the round constants), i.e.
; after three passes.
; ----------------------------------------------------------------------
ALIGN 16
$L$rounds_16_xx:
; slot 0: W[0] += sigma0(W[1]) + sigma1(W[14]) + W[9]   (a=eax e=r8d)
mov r13d,DWORD[4+rsp]
mov r15d,DWORD[56+rsp]
mov r12d,r13d
ror r13d,11
add eax,r14d
mov r14d,r15d
ror r15d,2
xor r13d,r12d
shr r12d,3
ror r13d,7
xor r15d,r14d
shr r14d,10
ror r15d,17
xor r12d,r13d
xor r15d,r14d
add r12d,DWORD[36+rsp]
add r12d,DWORD[rsp]
mov r13d,r8d
add r12d,r15d
mov r14d,eax
ror r13d,14
mov r15d,r9d
xor r13d,r8d
ror r14d,9
xor r15d,r10d
mov DWORD[rsp],r12d
xor r14d,eax
and r15d,r8d
ror r13d,5
add r12d,r11d
xor r15d,r10d
ror r14d,11
xor r13d,r8d
add r12d,r15d
mov r15d,eax
add r12d,DWORD[rbp]
xor r14d,eax
xor r15d,ebx
ror r13d,6
mov r11d,ebx
and edi,r15d
ror r14d,2
add r12d,r13d
xor r11d,edi
add edx,r12d
add r11d,r12d
lea rbp,[4+rbp]
; slot 1: W[1] += sigma0(W[2]) + sigma1(W[15]) + W[10]   (a=r11d e=edx)
mov r13d,DWORD[8+rsp]
mov edi,DWORD[60+rsp]
mov r12d,r13d
ror r13d,11
add r11d,r14d
mov r14d,edi
ror edi,2
xor r13d,r12d
shr r12d,3
ror r13d,7
xor edi,r14d
shr r14d,10
ror edi,17
xor r12d,r13d
xor edi,r14d
add r12d,DWORD[40+rsp]
add r12d,DWORD[4+rsp]
mov r13d,edx
add r12d,edi
mov r14d,r11d
ror r13d,14
mov edi,r8d
xor r13d,edx
ror r14d,9
xor edi,r9d
mov DWORD[4+rsp],r12d
xor r14d,r11d
and edi,edx
ror r13d,5
add r12d,r10d
xor edi,r9d
ror r14d,11
xor r13d,edx
add r12d,edi
mov edi,r11d
add r12d,DWORD[rbp]
xor r14d,r11d
xor edi,eax
ror r13d,6
mov r10d,eax
and r15d,edi
ror r14d,2
add r12d,r13d
xor r10d,r15d
add ecx,r12d
add r10d,r12d
lea rbp,[4+rbp]
; slot 2: W[2] += sigma0(W[3]) + sigma1(W[0]) + W[11]   (a=r10d e=ecx)
mov r13d,DWORD[12+rsp]
mov r15d,DWORD[rsp]
mov r12d,r13d
ror r13d,11
add r10d,r14d
mov r14d,r15d
ror r15d,2
xor r13d,r12d
shr r12d,3
ror r13d,7
xor r15d,r14d
shr r14d,10
ror r15d,17
xor r12d,r13d
xor r15d,r14d
add r12d,DWORD[44+rsp]
add r12d,DWORD[8+rsp]
mov r13d,ecx
add r12d,r15d
mov r14d,r10d
ror r13d,14
mov r15d,edx
xor r13d,ecx
ror r14d,9
xor r15d,r8d
mov DWORD[8+rsp],r12d
xor r14d,r10d
and r15d,ecx
ror r13d,5
add r12d,r9d
xor r15d,r8d
ror r14d,11
xor r13d,ecx
add r12d,r15d
mov r15d,r10d
add r12d,DWORD[rbp]
xor r14d,r10d
xor r15d,r11d
ror r13d,6
mov r9d,r11d
and edi,r15d
ror r14d,2
add r12d,r13d
xor r9d,edi
add ebx,r12d
add r9d,r12d
lea rbp,[4+rbp]
; slot 3: W[3] += sigma0(W[4]) + sigma1(W[1]) + W[12]   (a=r9d e=ebx)
mov r13d,DWORD[16+rsp]
mov edi,DWORD[4+rsp]
mov r12d,r13d
ror r13d,11
add r9d,r14d
mov r14d,edi
ror edi,2
xor r13d,r12d
shr r12d,3
ror r13d,7
xor edi,r14d
shr r14d,10
ror edi,17
xor r12d,r13d
xor edi,r14d
add r12d,DWORD[48+rsp]
add r12d,DWORD[12+rsp]
mov r13d,ebx
add r12d,edi
mov r14d,r9d
ror r13d,14
mov edi,ecx
xor r13d,ebx
ror r14d,9
xor edi,edx
mov DWORD[12+rsp],r12d
xor r14d,r9d
and edi,ebx
ror r13d,5
add r12d,r8d
xor edi,edx
ror r14d,11
xor r13d,ebx
add r12d,edi
mov edi,r9d
add r12d,DWORD[rbp]
xor r14d,r9d
xor edi,r10d
ror r13d,6
mov r8d,r10d
and r15d,edi
ror r14d,2
add r12d,r13d
xor r8d,r15d
add eax,r12d
add r8d,r12d
; +20: skip the duplicated row of constants in K256.
lea rbp,[20+rbp]
; slot 4: W[4] += sigma0(W[5]) + sigma1(W[2]) + W[13]   (a=r8d e=eax)
mov r13d,DWORD[20+rsp]
mov r15d,DWORD[8+rsp]
mov r12d,r13d
ror r13d,11
add r8d,r14d
mov r14d,r15d
ror r15d,2
xor r13d,r12d
shr r12d,3
ror r13d,7
xor r15d,r14d
shr r14d,10
ror r15d,17
xor r12d,r13d
xor r15d,r14d
add r12d,DWORD[52+rsp]
add r12d,DWORD[16+rsp]
mov r13d,eax
add r12d,r15d
mov r14d,r8d
ror r13d,14
mov r15d,ebx
xor r13d,eax
ror r14d,9
xor r15d,ecx
mov DWORD[16+rsp],r12d
xor r14d,r8d
and r15d,eax
ror r13d,5
add r12d,edx
xor r15d,ecx
ror r14d,11
xor r13d,eax
add r12d,r15d
mov r15d,r8d
add r12d,DWORD[rbp]
xor r14d,r8d
xor r15d,r9d
ror r13d,6
mov edx,r9d
and edi,r15d
ror r14d,2
add r12d,r13d
xor edx,edi
add r11d,r12d
add edx,r12d
lea rbp,[4+rbp]
; slot 5: W[5] += sigma0(W[6]) + sigma1(W[3]) + W[14]   (a=edx e=r11d)
mov r13d,DWORD[24+rsp]
mov edi,DWORD[12+rsp]
mov r12d,r13d
ror r13d,11
add edx,r14d
mov r14d,edi
ror edi,2
xor r13d,r12d
shr r12d,3
ror r13d,7
xor edi,r14d
shr r14d,10
ror edi,17
xor r12d,r13d
xor edi,r14d
add r12d,DWORD[56+rsp]
add r12d,DWORD[20+rsp]
mov r13d,r11d
add r12d,edi
mov r14d,edx
ror r13d,14
mov edi,eax
xor r13d,r11d
ror r14d,9
xor edi,ebx
mov DWORD[20+rsp],r12d
xor r14d,edx
and edi,r11d
ror r13d,5
add r12d,ecx
xor edi,ebx
ror r14d,11
xor r13d,r11d
add r12d,edi
mov edi,edx
add r12d,DWORD[rbp]
xor r14d,edx
xor edi,r8d
ror r13d,6
mov ecx,r8d
and r15d,edi
ror r14d,2
add r12d,r13d
xor ecx,r15d
add r10d,r12d
add ecx,r12d
lea rbp,[4+rbp]
; slot 6: W[6] += sigma0(W[7]) + sigma1(W[4]) + W[15]   (a=ecx e=r10d)
mov r13d,DWORD[28+rsp]
mov r15d,DWORD[16+rsp]
mov r12d,r13d
ror r13d,11
add ecx,r14d
mov r14d,r15d
ror r15d,2
xor r13d,r12d
shr r12d,3
ror r13d,7
xor r15d,r14d
shr r14d,10
ror r15d,17
xor r12d,r13d
xor r15d,r14d
add r12d,DWORD[60+rsp]
add r12d,DWORD[24+rsp]
mov r13d,r10d
add r12d,r15d
mov r14d,ecx
ror r13d,14
mov r15d,r11d
xor r13d,r10d
ror r14d,9
xor r15d,eax
mov DWORD[24+rsp],r12d
xor r14d,ecx
and r15d,r10d
ror r13d,5
add r12d,ebx
xor r15d,eax
ror r14d,11
xor r13d,r10d
add r12d,r15d
mov r15d,ecx
add r12d,DWORD[rbp]
xor r14d,ecx
xor r15d,edx
ror r13d,6
mov ebx,edx
and edi,r15d
ror r14d,2
add r12d,r13d
xor ebx,edi
add r9d,r12d
add ebx,r12d
lea rbp,[4+rbp]
; slot 7: W[7] += sigma0(W[8]) + sigma1(W[5]) + W[0]   (a=ebx e=r9d)
mov r13d,DWORD[32+rsp]
mov edi,DWORD[20+rsp]
mov r12d,r13d
ror r13d,11
add ebx,r14d
mov r14d,edi
ror edi,2
xor r13d,r12d
shr r12d,3
ror r13d,7
xor edi,r14d
shr r14d,10
ror edi,17
xor r12d,r13d
xor edi,r14d
add r12d,DWORD[rsp]
add r12d,DWORD[28+rsp]
mov r13d,r9d
add r12d,edi
mov r14d,ebx
ror r13d,14
mov edi,r10d
xor r13d,r9d
ror r14d,9
xor edi,r11d
mov DWORD[28+rsp],r12d
xor r14d,ebx
and edi,r9d
ror r13d,5
add r12d,eax
xor edi,r11d
ror r14d,11
xor r13d,r9d
add r12d,edi
mov edi,ebx
add r12d,DWORD[rbp]
xor r14d,ebx
xor edi,ecx
ror r13d,6
mov eax,ecx
and r15d,edi
ror r14d,2
add r12d,r13d
xor eax,r15d
add r8d,r12d
add eax,r12d
lea rbp,[20+rbp]
; slot 8: W[8] += sigma0(W[9]) + sigma1(W[6]) + W[1]   (a=eax e=r8d)
mov r13d,DWORD[36+rsp]
mov r15d,DWORD[24+rsp]
mov r12d,r13d
ror r13d,11
add eax,r14d
mov r14d,r15d
ror r15d,2
xor r13d,r12d
shr r12d,3
ror r13d,7
xor r15d,r14d
shr r14d,10
ror r15d,17
xor r12d,r13d
xor r15d,r14d
add r12d,DWORD[4+rsp]
add r12d,DWORD[32+rsp]
mov r13d,r8d
add r12d,r15d
mov r14d,eax
ror r13d,14
mov r15d,r9d
xor r13d,r8d
ror r14d,9
xor r15d,r10d
mov DWORD[32+rsp],r12d
xor r14d,eax
and r15d,r8d
ror r13d,5
add r12d,r11d
xor r15d,r10d
ror r14d,11
xor r13d,r8d
add r12d,r15d
mov r15d,eax
add r12d,DWORD[rbp]
xor r14d,eax
xor r15d,ebx
ror r13d,6
mov r11d,ebx
and edi,r15d
ror r14d,2
add r12d,r13d
xor r11d,edi
add edx,r12d
add r11d,r12d
lea rbp,[4+rbp]
; slot 9: W[9] += sigma0(W[10]) + sigma1(W[7]) + W[2]   (a=r11d e=edx)
mov r13d,DWORD[40+rsp]
mov edi,DWORD[28+rsp]
mov r12d,r13d
ror r13d,11
add r11d,r14d
mov r14d,edi
ror edi,2
xor r13d,r12d
shr r12d,3
ror r13d,7
xor edi,r14d
shr r14d,10
ror edi,17
xor r12d,r13d
xor edi,r14d
add r12d,DWORD[8+rsp]
add r12d,DWORD[36+rsp]
mov r13d,edx
add r12d,edi
mov r14d,r11d
ror r13d,14
mov edi,r8d
xor r13d,edx
ror r14d,9
xor edi,r9d
mov DWORD[36+rsp],r12d
xor r14d,r11d
and edi,edx
ror r13d,5
add r12d,r10d
xor edi,r9d
ror r14d,11
xor r13d,edx
add r12d,edi
mov edi,r11d
add r12d,DWORD[rbp]
xor r14d,r11d
xor edi,eax
ror r13d,6
mov r10d,eax
and r15d,edi
ror r14d,2
add r12d,r13d
xor r10d,r15d
add ecx,r12d
add r10d,r12d
lea rbp,[4+rbp]
; slot 10: W[10] += sigma0(W[11]) + sigma1(W[8]) + W[3]   (a=r10d e=ecx)
mov r13d,DWORD[44+rsp]
mov r15d,DWORD[32+rsp]
mov r12d,r13d
ror r13d,11
add r10d,r14d
mov r14d,r15d
ror r15d,2
xor r13d,r12d
shr r12d,3
ror r13d,7
xor r15d,r14d
shr r14d,10
ror r15d,17
xor r12d,r13d
xor r15d,r14d
add r12d,DWORD[12+rsp]
add r12d,DWORD[40+rsp]
mov r13d,ecx
add r12d,r15d
mov r14d,r10d
ror r13d,14
mov r15d,edx
xor r13d,ecx
ror r14d,9
xor r15d,r8d
mov DWORD[40+rsp],r12d
xor r14d,r10d
and r15d,ecx
ror r13d,5
add r12d,r9d
xor r15d,r8d
ror r14d,11
xor r13d,ecx
add r12d,r15d
mov r15d,r10d
add r12d,DWORD[rbp]
xor r14d,r10d
xor r15d,r11d
ror r13d,6
mov r9d,r11d
and edi,r15d
ror r14d,2
add r12d,r13d
xor r9d,edi
add ebx,r12d
add r9d,r12d
lea rbp,[4+rbp]
; slot 11: W[11] += sigma0(W[12]) + sigma1(W[9]) + W[4]   (a=r9d e=ebx)
mov r13d,DWORD[48+rsp]
mov edi,DWORD[36+rsp]
mov r12d,r13d
ror r13d,11
add r9d,r14d
mov r14d,edi
ror edi,2
xor r13d,r12d
shr r12d,3
ror r13d,7
xor edi,r14d
shr r14d,10
ror edi,17
xor r12d,r13d
xor edi,r14d
add r12d,DWORD[16+rsp]
add r12d,DWORD[44+rsp]
mov r13d,ebx
add r12d,edi
mov r14d,r9d
ror r13d,14
mov edi,ecx
xor r13d,ebx
ror r14d,9
xor edi,edx
mov DWORD[44+rsp],r12d
xor r14d,r9d
and edi,ebx
ror r13d,5
add r12d,r8d
xor edi,edx
ror r14d,11
xor r13d,ebx
add r12d,edi
mov edi,r9d
add r12d,DWORD[rbp]
xor r14d,r9d
xor edi,r10d
ror r13d,6
mov r8d,r10d
and r15d,edi
ror r14d,2
add r12d,r13d
xor r8d,r15d
add eax,r12d
add r8d,r12d
lea rbp,[20+rbp]
; slot 12: W[12] += sigma0(W[13]) + sigma1(W[10]) + W[5]   (a=r8d e=eax)
mov r13d,DWORD[52+rsp]
mov r15d,DWORD[40+rsp]
mov r12d,r13d
ror r13d,11
add r8d,r14d
mov r14d,r15d
ror r15d,2
xor r13d,r12d
shr r12d,3
ror r13d,7
xor r15d,r14d
shr r14d,10
ror r15d,17
xor r12d,r13d
xor r15d,r14d
add r12d,DWORD[20+rsp]
add r12d,DWORD[48+rsp]
mov r13d,eax
add r12d,r15d
mov r14d,r8d
ror r13d,14
mov r15d,ebx
xor r13d,eax
ror r14d,9
xor r15d,ecx
mov DWORD[48+rsp],r12d
xor r14d,r8d
and r15d,eax
ror r13d,5
add r12d,edx
xor r15d,ecx
ror r14d,11
xor r13d,eax
add r12d,r15d
mov r15d,r8d
add r12d,DWORD[rbp]
xor r14d,r8d
xor r15d,r9d
ror r13d,6
mov edx,r9d
and edi,r15d
ror r14d,2
add r12d,r13d
xor edx,edi
add r11d,r12d
add edx,r12d
lea rbp,[4+rbp]
; slot 13: W[13] += sigma0(W[14]) + sigma1(W[11]) + W[6]   (a=edx e=r11d)
mov r13d,DWORD[56+rsp]
mov edi,DWORD[44+rsp]
mov r12d,r13d
ror r13d,11
add edx,r14d
mov r14d,edi
ror edi,2
xor r13d,r12d
shr r12d,3
ror r13d,7
xor edi,r14d
shr r14d,10
ror edi,17
xor r12d,r13d
xor edi,r14d
add r12d,DWORD[24+rsp]
add r12d,DWORD[52+rsp]
mov r13d,r11d
add r12d,edi
mov r14d,edx
ror r13d,14
mov edi,eax
xor r13d,r11d
ror r14d,9
xor edi,ebx
mov DWORD[52+rsp],r12d
xor r14d,edx
and edi,r11d
ror r13d,5
add r12d,ecx
xor edi,ebx
ror r14d,11
xor r13d,r11d
add r12d,edi
mov edi,edx
add r12d,DWORD[rbp]
xor r14d,edx
xor edi,r8d
ror r13d,6
mov ecx,r8d
and r15d,edi
ror r14d,2
add r12d,r13d
xor ecx,r15d
add r10d,r12d
add ecx,r12d
lea rbp,[4+rbp]
; slot 14: W[14] += sigma0(W[15]) + sigma1(W[12]) + W[7]   (a=ecx e=r10d)
mov r13d,DWORD[60+rsp]
mov r15d,DWORD[48+rsp]
mov r12d,r13d
ror r13d,11
add ecx,r14d
mov r14d,r15d
ror r15d,2
xor r13d,r12d
shr r12d,3
ror r13d,7
xor r15d,r14d
shr r14d,10
ror r15d,17
xor r12d,r13d
xor r15d,r14d
add r12d,DWORD[28+rsp]
add r12d,DWORD[56+rsp]
mov r13d,r10d
add r12d,r15d
mov r14d,ecx
ror r13d,14
mov r15d,r11d
xor r13d,r10d
ror r14d,9
xor r15d,eax
mov DWORD[56+rsp],r12d
xor r14d,ecx
and r15d,r10d
ror r13d,5
add r12d,ebx
xor r15d,eax
ror r14d,11
xor r13d,r10d
add r12d,r15d
mov r15d,ecx
add r12d,DWORD[rbp]
xor r14d,ecx
xor r15d,edx
ror r13d,6
mov ebx,edx
and edi,r15d
ror r14d,2
add r12d,r13d
xor ebx,edi
add r9d,r12d
add ebx,r12d
lea rbp,[4+rbp]
; slot 15: W[15] += sigma0(W[0]) + sigma1(W[13]) + W[8]   (a=ebx e=r9d)
mov r13d,DWORD[rsp]
mov edi,DWORD[52+rsp]
mov r12d,r13d
ror r13d,11
add ebx,r14d
mov r14d,edi
ror edi,2
xor r13d,r12d
shr r12d,3
ror r13d,7
xor edi,r14d
shr r14d,10
ror edi,17
xor r12d,r13d
xor edi,r14d
add r12d,DWORD[32+rsp]
add r12d,DWORD[60+rsp]
mov r13d,r9d
add r12d,edi
mov r14d,ebx
ror r13d,14
mov edi,r10d
xor r13d,r9d
ror r14d,9
xor edi,r11d
mov DWORD[60+rsp],r12d
xor r14d,ebx
and edi,r9d
ror r13d,5
add r12d,eax
xor edi,r11d
ror r14d,11
xor r13d,r9d
add r12d,edi
mov edi,ebx
add r12d,DWORD[rbp]
xor r14d,ebx
xor edi,ecx
ror r13d,6
mov eax,ecx
and r15d,edi
ror r14d,2
add r12d,r13d
xor eax,r15d
add r8d,r12d
add eax,r12d
lea rbp,[20+rbp]
; Another pass while rbp still points at a round constant: every constant
; that starts a 128-byte group has a non-zero top byte, while the dword
; stored right after the constants (0x00010203) has a zero top byte.
cmp BYTE[3+rbp],0
jnz NEAR $L$rounds_16_xx
; All rounds done for this block. Reload the state pointer (edi was used
; as scratch), apply the Sigma0 term still pending in r14d, advance the
; input pointer by one block, and add the working variables into the
; state.
mov rdi,QWORD[((64+0))+rsp]
add eax,r14d
lea rsi,[64+rsi]
add eax,DWORD[rdi]
add ebx,DWORD[4+rdi]
add ecx,DWORD[8+rdi]
add edx,DWORD[12+rdi]
add r8d,DWORD[16+rdi]
add r9d,DWORD[20+rdi]
add r10d,DWORD[24+rdi]
add r11d,DWORD[28+rdi]
; Compare against the end pointer now; the stores below are plain movs,
; which leave the flags intact for the jb.
; NOTE(review): the test sits at the bottom of the loop, so one block is
; processed even when the incoming block count is 0 -- presumably callers
; never pass 0; confirm.
cmp rsi,QWORD[((64+16))+rsp]
mov DWORD[rdi],eax
mov DWORD[4+rdi],ebx
mov DWORD[8+rdi],ecx
mov DWORD[12+rdi],edx
mov DWORD[16+rdi],r8d
mov DWORD[20+rdi],r9d
mov DWORD[24+rdi],r10d
mov DWORD[28+rdi],r11d
jb NEAR $L$loop
; Unwind the scalar-path frame. [88+rsp] holds the rsp value captured
; before the six pushes, so the saved registers sit just below it in
; reverse push order (rbx at -8 ... r15 at -48).
mov rsi,QWORD[88+rsp]
mov r15,QWORD[((-48))+rsi]
mov r14,QWORD[((-40))+rsi]
mov r13,QWORD[((-32))+rsi]
mov r12,QWORD[((-24))+rsi]
mov rbp,QWORD[((-16))+rsi]
mov rbx,QWORD[((-8))+rsi]
; Put rsp back to its value at function entry.
lea rsp,[rsi]
$L$epilogue:
; Reload rdi/rsi from the slots they were spilled to on entry.
mov rdi,QWORD[8+rsp] ;WIN64 epilogue
mov rsi,QWORD[16+rsp]
DB 0F3h,0C3h ;repret
$L$SEH_end_sha256_block_data_order:
; ----------------------------------------------------------------------
; K256 -- SHA-256 round constants plus auxiliary vector constants.
;
; Offsets 0..511: the 64 round constants, four per row, with every row
; stored twice. The scalar code reads one dword per round and skips the
; duplicate row with `lea rbp,[20+rbp]` after every fourth round.
; NOTE(review): the duplication is presumably for wider-vector code
; paths that are not visible in this part of the file -- confirm.
;
; Offset 512 onward: three more duplicated rows. The row at K256+512 is
; loaded into xmm7 at $L$loop_ssse3; its first dword (0x00010203) has a
; zero top byte, which is the sentinel the `cmp BYTE[3+rbp],0` /
; `cmp BYTE[131+rbp],0` loop tests look for.
; NOTE(review): these rows look like byte-shuffle masks (the first one
; reversing the bytes of each dword) -- confirm against the generator.
; ----------------------------------------------------------------------
ALIGN 64
K256:
DD 0x428a2f98,0x71374491,0xb5c0fbcf,0xe9b5dba5
DD 0x428a2f98,0x71374491,0xb5c0fbcf,0xe9b5dba5
DD 0x3956c25b,0x59f111f1,0x923f82a4,0xab1c5ed5
DD 0x3956c25b,0x59f111f1,0x923f82a4,0xab1c5ed5
DD 0xd807aa98,0x12835b01,0x243185be,0x550c7dc3
DD 0xd807aa98,0x12835b01,0x243185be,0x550c7dc3
DD 0x72be5d74,0x80deb1fe,0x9bdc06a7,0xc19bf174
DD 0x72be5d74,0x80deb1fe,0x9bdc06a7,0xc19bf174
DD 0xe49b69c1,0xefbe4786,0x0fc19dc6,0x240ca1cc
DD 0xe49b69c1,0xefbe4786,0x0fc19dc6,0x240ca1cc
DD 0x2de92c6f,0x4a7484aa,0x5cb0a9dc,0x76f988da
DD 0x2de92c6f,0x4a7484aa,0x5cb0a9dc,0x76f988da
DD 0x983e5152,0xa831c66d,0xb00327c8,0xbf597fc7
DD 0x983e5152,0xa831c66d,0xb00327c8,0xbf597fc7
DD 0xc6e00bf3,0xd5a79147,0x06ca6351,0x14292967
DD 0xc6e00bf3,0xd5a79147,0x06ca6351,0x14292967
DD 0x27b70a85,0x2e1b2138,0x4d2c6dfc,0x53380d13
DD 0x27b70a85,0x2e1b2138,0x4d2c6dfc,0x53380d13
DD 0x650a7354,0x766a0abb,0x81c2c92e,0x92722c85
DD 0x650a7354,0x766a0abb,0x81c2c92e,0x92722c85
DD 0xa2bfe8a1,0xa81a664b,0xc24b8b70,0xc76c51a3
DD 0xa2bfe8a1,0xa81a664b,0xc24b8b70,0xc76c51a3
DD 0xd192e819,0xd6990624,0xf40e3585,0x106aa070
DD 0xd192e819,0xd6990624,0xf40e3585,0x106aa070
DD 0x19a4c116,0x1e376c08,0x2748774c,0x34b0bcb5
DD 0x19a4c116,0x1e376c08,0x2748774c,0x34b0bcb5
DD 0x391c0cb3,0x4ed8aa4a,0x5b9cca4f,0x682e6ff3
DD 0x391c0cb3,0x4ed8aa4a,0x5b9cca4f,0x682e6ff3
DD 0x748f82ee,0x78a5636f,0x84c87814,0x8cc70208
DD 0x748f82ee,0x78a5636f,0x84c87814,0x8cc70208
DD 0x90befffa,0xa4506ceb,0xbef9a3f7,0xc67178f2
DD 0x90befffa,0xa4506ceb,0xbef9a3f7,0xc67178f2
; End of round constants (K256+512). Auxiliary rows follow.
DD 0x00010203,0x04050607,0x08090a0b,0x0c0d0e0f
DD 0x00010203,0x04050607,0x08090a0b,0x0c0d0e0f
DD 0x03020100,0x0b0a0908,0xffffffff,0xffffffff
DD 0x03020100,0x0b0a0908,0xffffffff,0xffffffff
DD 0xffffffff,0xffffffff,0x03020100,0x0b0a0908
DD 0xffffffff,0xffffffff,0x03020100,0x0b0a0908
; NUL-terminated ASCII identification string:
; "SHA256 block transform for x86_64, CRYPTOGAMS by <appro@openssl.org>"
DB 83,72,65,50,53,54,32,98,108,111,99,107,32,116,114,97
DB 110,115,102,111,114,109,32,102,111,114,32,120,56,54,95,54
DB 52,44,32,67,82,89,80,84,79,71,65,77,83,32,98,121
DB 32,60,97,112,112,114,111,64,111,112,101,110,115,115,108,46
DB 111,114,103,62,0
ALIGN 64
sha256_block_data_order_ssse3:
mov QWORD[8+rsp],rdi ;WIN64 prologue
mov QWORD[16+rsp],rsi
mov rax,rsp
$L$SEH_begin_sha256_block_data_order_ssse3:
mov rdi,rcx
mov rsi,rdx
mov rdx,r8
$L$ssse3_shortcut:
mov rax,rsp
push rbx
push rbp
push r12
push r13
push r14
push r15
shl rdx,4
sub rsp,160
lea rdx,[rdx*4+rsi]
and rsp,-64
mov QWORD[((64+0))+rsp],rdi
mov QWORD[((64+8))+rsp],rsi
mov QWORD[((64+16))+rsp],rdx
mov QWORD[88+rsp],rax
movaps XMMWORD[(64+32)+rsp],xmm6
movaps XMMWORD[(64+48)+rsp],xmm7
movaps XMMWORD[(64+64)+rsp],xmm8
movaps XMMWORD[(64+80)+rsp],xmm9
$L$prologue_ssse3:
mov eax,DWORD[rdi]
mov ebx,DWORD[4+rdi]
mov ecx,DWORD[8+rdi]
mov edx,DWORD[12+rdi]
mov r8d,DWORD[16+rdi]
mov r9d,DWORD[20+rdi]
mov r10d,DWORD[24+rdi]
mov r11d,DWORD[28+rdi]
jmp NEAR $L$loop_ssse3
ALIGN 16
$L$loop_ssse3:
movdqa xmm7,XMMWORD[((K256+512))]
movdqu xmm0,XMMWORD[rsi]
movdqu xmm1,XMMWORD[16+rsi]
movdqu xmm2,XMMWORD[32+rsi]
DB 102,15,56,0,199
movdqu xmm3,XMMWORD[48+rsi]
lea rbp,[K256]
DB 102,15,56,0,207
movdqa xmm4,XMMWORD[rbp]
movdqa xmm5,XMMWORD[32+rbp]
DB 102,15,56,0,215
paddd xmm4,xmm0
movdqa xmm6,XMMWORD[64+rbp]
DB 102,15,56,0,223
movdqa xmm7,XMMWORD[96+rbp]
paddd xmm5,xmm1
paddd xmm6,xmm2
paddd xmm7,xmm3
movdqa XMMWORD[rsp],xmm4
mov r14d,eax
movdqa XMMWORD[16+rsp],xmm5
mov edi,ebx
movdqa XMMWORD[32+rsp],xmm6
xor edi,ecx
movdqa XMMWORD[48+rsp],xmm7
mov r13d,r8d
jmp NEAR $L$ssse3_00_47
ALIGN 16
$L$ssse3_00_47:
sub rbp,-128
ror r13d,14
movdqa xmm4,xmm1
mov eax,r14d
mov r12d,r9d
movdqa xmm7,xmm3
ror r14d,9
xor r13d,r8d
xor r12d,r10d
ror r13d,5
xor r14d,eax
DB 102,15,58,15,224,4
and r12d,r8d
xor r13d,r8d
DB 102,15,58,15,250,4
add r11d,DWORD[rsp]
mov r15d,eax
xor r12d,r10d
ror r14d,11
movdqa xmm5,xmm4
xor r15d,ebx
add r11d,r12d
movdqa xmm6,xmm4
ror r13d,6
and edi,r15d
psrld xmm4,3
xor r14d,eax
add r11d,r13d
xor edi,ebx
paddd xmm0,xmm7
ror r14d,2
add edx,r11d
psrld xmm6,7
add r11d,edi
mov r13d,edx
pshufd xmm7,xmm3,250
add r14d,r11d
ror r13d,14
pslld xmm5,14
mov r11d,r14d
mov r12d,r8d
pxor xmm4,xmm6
ror r14d,9
xor r13d,edx
xor r12d,r9d
ror r13d,5
psrld xmm6,11
xor r14d,r11d
pxor xmm4,xmm5
and r12d,edx
xor r13d,edx
pslld xmm5,11
add r10d,DWORD[4+rsp]
mov edi,r11d
pxor xmm4,xmm6
xor r12d,r9d
ror r14d,11
movdqa xmm6,xmm7
xor edi,eax
add r10d,r12d
pxor xmm4,xmm5
ror r13d,6
and r15d,edi
xor r14d,r11d
psrld xmm7,10
add r10d,r13d
xor r15d,eax
paddd xmm0,xmm4
ror r14d,2
add ecx,r10d
psrlq xmm6,17
add r10d,r15d
mov r13d,ecx
add r14d,r10d
pxor xmm7,xmm6
ror r13d,14
mov r10d,r14d
mov r12d,edx
ror r14d,9
psrlq xmm6,2
xor r13d,ecx
xor r12d,r8d
pxor xmm7,xmm6
ror r13d,5
xor r14d,r10d
and r12d,ecx
pshufd xmm7,xmm7,128
xor r13d,ecx
add r9d,DWORD[8+rsp]
mov r15d,r10d
psrldq xmm7,8
xor r12d,r8d
ror r14d,11
xor r15d,r11d
add r9d,r12d
ror r13d,6
paddd xmm0,xmm7
and edi,r15d
xor r14d,r10d
add r9d,r13d
pshufd xmm7,xmm0,80
xor edi,r11d
ror r14d,2
add ebx,r9d
movdqa xmm6,xmm7
add r9d,edi
mov r13d,ebx
psrld xmm7,10
add r14d,r9d
ror r13d,14
psrlq xmm6,17
mov r9d,r14d
mov r12d,ecx
pxor xmm7,xmm6
ror r14d,9
xor r13d,ebx
xor r12d,edx
ror r13d,5
xor r14d,r9d
psrlq xmm6,2
and r12d,ebx
xor r13d,ebx
add r8d,DWORD[12+rsp]
pxor xmm7,xmm6
mov edi,r9d
xor r12d,edx
ror r14d,11
pshufd xmm7,xmm7,8
xor edi,r10d
add r8d,r12d
movdqa xmm6,XMMWORD[rbp]
ror r13d,6
and r15d,edi
pslldq xmm7,8
xor r14d,r9d
add r8d,r13d
xor r15d,r10d
paddd xmm0,xmm7
ror r14d,2
add eax,r8d
add r8d,r15d
paddd xmm6,xmm0
mov r13d,eax
add r14d,r8d
movdqa XMMWORD[rsp],xmm6
ror r13d,14
movdqa xmm4,xmm2
mov r8d,r14d
mov r12d,ebx
movdqa xmm7,xmm0
ror r14d,9
xor r13d,eax
xor r12d,ecx
ror r13d,5
xor r14d,r8d
DB 102,15,58,15,225,4
and r12d,eax
xor r13d,eax
DB 102,15,58,15,251,4
add edx,DWORD[16+rsp]
mov r15d,r8d
xor r12d,ecx
ror r14d,11
movdqa xmm5,xmm4
xor r15d,r9d
add edx,r12d
movdqa xmm6,xmm4
ror r13d,6
and edi,r15d
psrld xmm4,3
xor r14d,r8d
add edx,r13d
xor edi,r9d
paddd xmm1,xmm7
ror r14d,2
add r11d,edx
psrld xmm6,7
add edx,edi
mov r13d,r11d
pshufd xmm7,xmm0,250
add r14d,edx
ror r13d,14
pslld xmm5,14
mov edx,r14d
mov r12d,eax
pxor xmm4,xmm6
ror r14d,9
xor r13d,r11d
xor r12d,ebx
ror r13d,5
psrld xmm6,11
xor r14d,edx
pxor xmm4,xmm5
and r12d,r11d
xor r13d,r11d
pslld xmm5,11
add ecx,DWORD[20+rsp]
mov edi,edx
pxor xmm4,xmm6
xor r12d,ebx
ror r14d,11
movdqa xmm6,xmm7
xor edi,r8d
add ecx,r12d
pxor xmm4,xmm5
ror r13d,6
and r15d,edi
xor r14d,edx
psrld xmm7,10
add ecx,r13d
xor r15d,r8d
paddd xmm1,xmm4
ror r14d,2
add r10d,ecx
psrlq xmm6,17
add ecx,r15d
mov r13d,r10d
add r14d,ecx
pxor xmm7,xmm6
ror r13d,14
mov ecx,r14d
mov r12d,r11d
ror r14d,9
psrlq xmm6,2
xor r13d,r10d
xor r12d,eax
pxor xmm7,xmm6
ror r13d,5
xor r14d,ecx
and r12d,r10d
pshufd xmm7,xmm7,128
xor r13d,r10d
add ebx,DWORD[24+rsp]
mov r15d,ecx
psrldq xmm7,8
xor r12d,eax
ror r14d,11
xor r15d,edx
add ebx,r12d
ror r13d,6
paddd xmm1,xmm7
and edi,r15d
xor r14d,ecx
add ebx,r13d
pshufd xmm7,xmm1,80
xor edi,edx
ror r14d,2
add r9d,ebx
movdqa xmm6,xmm7
add ebx,edi
mov r13d,r9d
psrld xmm7,10
add r14d,ebx
ror r13d,14
psrlq xmm6,17
mov ebx,r14d
mov r12d,r10d
pxor xmm7,xmm6
ror r14d,9
xor r13d,r9d
xor r12d,r11d
ror r13d,5
xor r14d,ebx
psrlq xmm6,2
and r12d,r9d
xor r13d,r9d
add eax,DWORD[28+rsp]
pxor xmm7,xmm6
mov edi,ebx
xor r12d,r11d
ror r14d,11
pshufd xmm7,xmm7,8
xor edi,ecx
add eax,r12d
movdqa xmm6,XMMWORD[32+rbp]
ror r13d,6
and r15d,edi
pslldq xmm7,8
xor r14d,ebx
add eax,r13d
xor r15d,ecx
paddd xmm1,xmm7
ror r14d,2
add r8d,eax
add eax,r15d
paddd xmm6,xmm1
mov r13d,r8d
add r14d,eax
movdqa XMMWORD[16+rsp],xmm6
ror r13d,14
movdqa xmm4,xmm3
mov eax,r14d
mov r12d,r9d
movdqa xmm7,xmm1
ror r14d,9
xor r13d,r8d
xor r12d,r10d
ror r13d,5
xor r14d,eax
DB 102,15,58,15,226,4
and r12d,r8d
xor r13d,r8d
DB 102,15,58,15,248,4
add r11d,DWORD[32+rsp]
mov r15d,eax
xor r12d,r10d
ror r14d,11
movdqa xmm5,xmm4
xor r15d,ebx
add r11d,r12d
movdqa xmm6,xmm4
ror r13d,6
and edi,r15d
psrld xmm4,3
xor r14d,eax
add r11d,r13d
xor edi,ebx
paddd xmm2,xmm7
ror r14d,2
add edx,r11d
psrld xmm6,7
add r11d,edi
mov r13d,edx
pshufd xmm7,xmm1,250
add r14d,r11d
ror r13d,14
pslld xmm5,14
mov r11d,r14d
mov r12d,r8d
pxor xmm4,xmm6
ror r14d,9
xor r13d,edx
xor r12d,r9d
ror r13d,5
psrld xmm6,11
xor r14d,r11d
pxor xmm4,xmm5
and r12d,edx
xor r13d,edx
pslld xmm5,11
add r10d,DWORD[36+rsp]
mov edi,r11d
pxor xmm4,xmm6
xor r12d,r9d
ror r14d,11
movdqa xmm6,xmm7
xor edi,eax
add r10d,r12d
pxor xmm4,xmm5
ror r13d,6
and r15d,edi
xor r14d,r11d
psrld xmm7,10
add r10d,r13d
xor r15d,eax
paddd xmm2,xmm4
ror r14d,2
add ecx,r10d
psrlq xmm6,17
add r10d,r15d
mov r13d,ecx
add r14d,r10d
pxor xmm7,xmm6
ror r13d,14
mov r10d,r14d
mov r12d,edx
ror r14d,9
psrlq xmm6,2
xor r13d,ecx
xor r12d,r8d
pxor xmm7,xmm6
ror r13d,5
xor r14d,r10d
and r12d,ecx
pshufd xmm7,xmm7,128
xor r13d,ecx
add r9d,DWORD[40+rsp]
mov r15d,r10d
psrldq xmm7,8
xor r12d,r8d
ror r14d,11
xor r15d,r11d
add r9d,r12d
ror r13d,6
paddd xmm2,xmm7
and edi,r15d
xor r14d,r10d
add r9d,r13d
pshufd xmm7,xmm2,80
xor edi,r11d
ror r14d,2
add ebx,r9d
movdqa xmm6,xmm7
add r9d,edi
mov r13d,ebx
psrld xmm7,10
add r14d,r9d
ror r13d,14
psrlq xmm6,17
mov r9d,r14d
mov r12d,ecx
pxor xmm7,xmm6
ror r14d,9
xor r13d,ebx
xor r12d,edx
ror r13d,5
xor r14d,r9d
psrlq xmm6,2
and r12d,ebx
xor r13d,ebx
add r8d,DWORD[44+rsp]
pxor xmm7,xmm6
mov edi,r9d
xor r12d,edx
ror r14d,11
pshufd xmm7,xmm7,8
xor edi,r10d
add r8d,r12d
movdqa xmm6,XMMWORD[64+rbp]
ror r13d,6
and r15d,edi
pslldq xmm7,8
xor r14d,r9d
add r8d,r13d
xor r15d,r10d
paddd xmm2,xmm7
ror r14d,2
add eax,r8d
add r8d,r15d
paddd xmm6,xmm2
mov r13d,eax
add r14d,r8d
movdqa XMMWORD[32+rsp],xmm6
ror r13d,14
movdqa xmm4,xmm0
mov r8d,r14d
mov r12d,ebx
movdqa xmm7,xmm2
ror r14d,9
xor r13d,eax
xor r12d,ecx
ror r13d,5
xor r14d,r8d
DB 102,15,58,15,227,4
and r12d,eax
xor r13d,eax
DB 102,15,58,15,249,4
add edx,DWORD[48+rsp]
mov r15d,r8d
xor r12d,ecx
ror r14d,11
movdqa xmm5,xmm4
xor r15d,r9d
add edx,r12d
movdqa xmm6,xmm4
ror r13d,6
and edi,r15d
psrld xmm4,3
xor r14d,r8d
add edx,r13d
xor edi,r9d
paddd xmm3,xmm7
ror r14d,2
add r11d,edx
psrld xmm6,7
add edx,edi
mov r13d,r11d
pshufd xmm7,xmm2,250
add r14d,edx
ror r13d,14
pslld xmm5,14
mov edx,r14d
mov r12d,eax
pxor xmm4,xmm6
ror r14d,9
xor r13d,r11d
xor r12d,ebx
ror r13d,5
psrld xmm6,11
xor r14d,edx
pxor xmm4,xmm5
and r12d,r11d
xor r13d,r11d
pslld xmm5,11
add ecx,DWORD[52+rsp]
mov edi,edx
pxor xmm4,xmm6
xor r12d,ebx
ror r14d,11
movdqa xmm6,xmm7
xor edi,r8d
add ecx,r12d
pxor xmm4,xmm5
ror r13d,6
and r15d,edi
xor r14d,edx
psrld xmm7,10
add ecx,r13d
xor r15d,r8d
paddd xmm3,xmm4
ror r14d,2
add r10d,ecx
psrlq xmm6,17
add ecx,r15d
mov r13d,r10d
add r14d,ecx
pxor xmm7,xmm6
ror r13d,14
mov ecx,r14d
mov r12d,r11d
ror r14d,9
psrlq xmm6,2
xor r13d,r10d
xor r12d,eax
pxor xmm7,xmm6
ror r13d,5
xor r14d,ecx
and r12d,r10d
pshufd xmm7,xmm7,128
xor r13d,r10d
add ebx,DWORD[56+rsp]
mov r15d,ecx
psrldq xmm7,8
xor r12d,eax
ror r14d,11
xor r15d,edx
add ebx,r12d
ror r13d,6
paddd xmm3,xmm7
and edi,r15d
xor r14d,ecx
add ebx,r13d
pshufd xmm7,xmm3,80
xor edi,edx
ror r14d,2
add r9d,ebx
movdqa xmm6,xmm7
add ebx,edi
mov r13d,r9d
psrld xmm7,10
add r14d,ebx
ror r13d,14
psrlq xmm6,17
mov ebx,r14d
mov r12d,r10d
pxor xmm7,xmm6
ror r14d,9
xor r13d,r9d
xor r12d,r11d
ror r13d,5
xor r14d,ebx
psrlq xmm6,2
and r12d,r9d
xor r13d,r9d
add eax,DWORD[60+rsp]
pxor xmm7,xmm6
mov edi,ebx
xor r12d,r11d
ror r14d,11
pshufd xmm7,xmm7,8
xor edi,ecx
add eax,r12d
movdqa xmm6,XMMWORD[96+rbp]
ror r13d,6
and r15d,edi
pslldq xmm7,8
xor r14d,ebx
add eax,r13d
xor r15d,ecx
paddd xmm3,xmm7
ror r14d,2
add r8d,eax
add eax,r15d
paddd xmm6,xmm3
mov r13d,r8d
add r14d,eax
movdqa XMMWORD[48+rsp],xmm6
cmp BYTE[131+rbp],0
jne NEAR $L$ssse3_00_47
ror r13d,14
mov eax,r14d
mov r12d,r9d
ror r14d,9
xor r13d,r8d
xor r12d,r10d
ror r13d,5
xor r14d,eax
and r12d,r8d
xor r13d,r8d
add r11d,DWORD[rsp]
mov r15d,eax
xor r12d,r10d
ror r14d,11
xor r15d,ebx
add r11d,r12d
ror r13d,6
and edi,r15d
xor r14d,eax
add r11d,r13d
xor edi,ebx
ror r14d,2
add edx,r11d
add r11d,edi
mov r13d,edx
add r14d,r11d
ror r13d,14
mov r11d,r14d
mov r12d,r8d
ror r14d,9
xor r13d,edx
xor r12d,r9d
ror r13d,5
xor r14d,r11d
and r12d,edx
xor r13d,edx
add r10d,DWORD[4+rsp]
mov edi,r11d
xor r12d,r9d
ror r14d,11
xor edi,eax
add r10d,r12d
ror r13d,6
and r15d,edi
xor r14d,r11d
add r10d,r13d
xor r15d,eax
ror r14d,2
add ecx,r10d
add r10d,r15d
mov r13d,ecx
add r14d,r10d
ror r13d,14
mov r10d,r14d
mov r12d,edx
ror r14d,9
xor r13d,ecx
xor r12d,r8d
ror r13d,5
xor r14d,r10d
and r12d,ecx
xor r13d,ecx
add r9d,DWORD[8+rsp]
mov r15d,r10d
xor r12d,r8d
ror r14d,11
xor r15d,r11d
add r9d,r12d
ror r13d,6
and edi,r15d
xor r14d,r10d
add r9d,r13d
xor edi,r11d
ror r14d,2
add ebx,r9d
add r9d,edi
mov r13d,ebx
add r14d,r9d
ror r13d,14
mov r9d,r14d
mov r12d,ecx
ror r14d,9
xor r13d,ebx
xor r12d,edx
ror r13d,5
xor r14d,r9d
and r12d,ebx
xor r13d,ebx
add r8d,DWORD[12+rsp]
mov edi,r9d
xor r12d,edx
ror r14d,11
xor edi,r10d
add r8d,r12d
ror r13d,6
and r15d,edi
xor r14d,r9d
add r8d,r13d
xor r15d,r10d
ror r14d,2
add eax,r8d
add r8d,r15d
mov r13d,eax
add r14d,r8d
ror r13d,14
mov r8d,r14d
mov r12d,ebx
ror r14d,9
xor r13d,eax
xor r12d,ecx
ror r13d,5
xor r14d,r8d
and r12d,eax
xor r13d,eax
add edx,DWORD[16+rsp]
mov r15d,r8d
xor r12d,ecx
ror r14d,11
xor r15d,r9d
add edx,r12d
ror r13d,6
and edi,r15d
xor r14d,r8d
add edx,r13d
xor edi,r9d
ror r14d,2
add r11d,edx
add edx,edi
mov r13d,r11d
add r14d,edx
ror r13d,14
mov edx,r14d
mov r12d,eax
ror r14d,9
xor r13d,r11d
xor r12d,ebx
ror r13d,5
xor r14d,edx
and r12d,r11d
xor r13d,r11d
add ecx,DWORD[20+rsp]
mov edi,edx
xor r12d,ebx
ror r14d,11
xor edi,r8d
add ecx,r12d
ror r13d,6
and r15d,edi
xor r14d,edx
add ecx,r13d
xor r15d,r8d
ror r14d,2
add r10d,ecx
add ecx,r15d
mov r13d,r10d
add r14d,ecx
ror r13d,14
mov ecx,r14d
mov r12d,r11d
ror r14d,9
xor r13d,r10d
xor r12d,eax
ror r13d,5
xor r14d,ecx
and r12d,r10d
xor r13d,r10d
add ebx,DWORD[24+rsp]
mov r15d,ecx
xor r12d,eax
ror r14d,11
xor r15d,edx
add ebx,r12d
ror r13d,6
and edi,r15d
xor r14d,ecx
add ebx,r13d
xor edi,edx
ror r14d,2
add r9d,ebx
add ebx,edi
mov r13d,r9d
add r14d,ebx
ror r13d,14
mov ebx,r14d
mov r12d,r10d
ror r14d,9
xor r13d,r9d
xor r12d,r11d
ror r13d,5
xor r14d,ebx
and r12d,r9d
xor r13d,r9d
add eax,DWORD[28+rsp]
mov edi,ebx
xor r12d,r11d
ror r14d,11
xor edi,ecx
add eax,r12d
ror r13d,6
and r15d,edi
xor r14d,ebx
add eax,r13d
xor r15d,ecx
ror r14d,2
add r8d,eax
add eax,r15d
mov r13d,r8d
add r14d,eax
ror r13d,14
mov eax,r14d
mov r12d,r9d
ror r14d,9
xor r13d,r8d
xor r12d,r10d
ror r13d,5
xor r14d,eax
and r12d,r8d
xor r13d,r8d
add r11d,DWORD[32+rsp]
mov r15d,eax
xor r12d,r10d
ror r14d,11
xor r15d,ebx
add r11d,r12d
ror r13d,6
and edi,r15d
xor r14d,eax
add r11d,r13d
xor edi,ebx
ror r14d,2
add edx,r11d
add r11d,edi
mov r13d,edx
add r14d,r11d
ror r13d,14
mov r11d,r14d
mov r12d,r8d
ror r14d,9
xor r13d,edx
xor r12d,r9d
ror r13d,5
xor r14d,r11d
and r12d,edx
xor r13d,edx
add r10d,DWORD[36+rsp]
mov edi,r11d
xor r12d,r9d
ror r14d,11
xor edi,eax
add r10d,r12d
ror r13d,6
and r15d,edi
xor r14d,r11d
add r10d,r13d
xor r15d,eax
ror r14d,2
add ecx,r10d
add r10d,r15d
mov r13d,ecx
add r14d,r10d
ror r13d,14
mov r10d,r14d
mov r12d,edx
ror r14d,9
xor r13d,ecx
xor r12d,r8d
ror r13d,5
xor r14d,r10d
and r12d,ecx
xor r13d,ecx
add r9d,DWORD[40+rsp]
mov r15d,r10d
xor r12d,r8d
ror r14d,11
xor r15d,r11d
add r9d,r12d
ror r13d,6
and edi,r15d
xor r14d,r10d
add r9d,r13d
xor edi,r11d
ror r14d,2
add ebx,r9d
add r9d,edi
mov r13d,ebx
add r14d,r9d
ror r13d,14
mov r9d,r14d
mov r12d,ecx
ror r14d,9
xor r13d,ebx
xor r12d,edx
ror r13d,5
xor r14d,r9d
and r12d,ebx
xor r13d,ebx
add r8d,DWORD[44+rsp]
mov edi,r9d
xor r12d,edx
ror r14d,11
xor edi,r10d
add r8d,r12d
ror r13d,6
and r15d,edi
xor r14d,r9d
add r8d,r13d
xor r15d,r10d
ror r14d,2
add eax,r8d
add r8d,r15d
mov r13d,eax
add r14d,r8d
ror r13d,14
mov r8d,r14d
mov r12d,ebx
ror r14d,9
xor r13d,eax
xor r12d,ecx
ror r13d,5
xor r14d,r8d
and r12d,eax
xor r13d,eax
add edx,DWORD[48+rsp]
mov r15d,r8d
xor r12d,ecx
ror r14d,11
xor r15d,r9d
add edx,r12d
ror r13d,6
and edi,r15d
xor r14d,r8d
add edx,r13d
xor edi,r9d
ror r14d,2
add r11d,edx
add edx,edi
mov r13d,r11d
add r14d,edx
ror r13d,14
mov edx,r14d
mov r12d,eax
ror r14d,9
xor r13d,r11d
xor r12d,ebx
ror r13d,5
xor r14d,edx
and r12d,r11d
xor r13d,r11d
add ecx,DWORD[52+rsp]
mov edi,edx
xor r12d,ebx
ror r14d,11
xor edi,r8d
add ecx,r12d
ror r13d,6
and r15d,edi
xor r14d,edx
add ecx,r13d
xor r15d,r8d
ror r14d,2
add r10d,ecx
add ecx,r15d
mov r13d,r10d
add r14d,ecx
ror r13d,14
mov ecx,r14d
mov r12d,r11d
ror r14d,9
xor r13d,r10d
xor r12d,eax
ror r13d,5
xor r14d,ecx
and r12d,r10d
xor r13d,r10d
add ebx,DWORD[56+rsp]
mov r15d,ecx
xor r12d,eax
ror r14d,11
xor r15d,edx
add ebx,r12d
ror r13d,6
and edi,r15d
xor r14d,ecx
add ebx,r13d
xor edi,edx
ror r14d,2
add r9d,ebx
add ebx,edi
mov r13d,r9d
add r14d,ebx
ror r13d,14
mov ebx,r14d
mov r12d,r10d
ror r14d,9
xor r13d,r9d
xor r12d,r11d
ror r13d,5
xor r14d,ebx
and r12d,r9d
xor r13d,r9d
add eax,DWORD[60+rsp]
mov edi,ebx
xor r12d,r11d
ror r14d,11
xor edi,ecx
add eax,r12d
ror r13d,6
and r15d,edi
xor r14d,ebx
add eax,r13d
xor r15d,ecx
ror r14d,2
add r8d,eax
add eax,r15d
mov r13d,r8d
add r14d,eax
mov rdi,QWORD[((64+0))+rsp]
mov eax,r14d
add eax,DWORD[rdi]
lea rsi,[64+rsi]
add ebx,DWORD[4+rdi]
add ecx,DWORD[8+rdi]
add edx,DWORD[12+rdi]
add r8d,DWORD[16+rdi]
add r9d,DWORD[20+rdi]
add r10d,DWORD[24+rdi]
add r11d,DWORD[28+rdi]
cmp rsi,QWORD[((64+16))+rsp]
mov DWORD[rdi],eax
mov DWORD[4+rdi],ebx
mov DWORD[8+rdi],ecx
mov DWORD[12+rdi],edx
mov DWORD[16+rdi],r8d
mov DWORD[20+rdi],r9d
mov DWORD[24+rdi],r10d
mov DWORD[28+rdi],r11d
jb NEAR $L$loop_ssse3
mov rsi,QWORD[88+rsp]
movaps xmm6,XMMWORD[((64+32))+rsp]
movaps xmm7,XMMWORD[((64+48))+rsp]
movaps xmm8,XMMWORD[((64+64))+rsp]
movaps xmm9,XMMWORD[((64+80))+rsp]
mov r15,QWORD[((-48))+rsi]
mov r14,QWORD[((-40))+rsi]
mov r13,QWORD[((-32))+rsi]
mov r12,QWORD[((-24))+rsi]
mov rbp,QWORD[((-16))+rsi]
mov rbx,QWORD[((-8))+rsi]
lea rsp,[rsi]
; Return path of the SSSE3 routine.
; rdi and rsi are callee-saved under the Microsoft x64 convention, so they are
; reloaded from the slots at [8+rsp] and [16+rsp] before returning.
; NOTE(review): the matching stores for this routine are outside this chunk;
; presumably they are the ";WIN64 prologue" stores to the same offsets, as in
; the other entry points of this file - confirm.
$L$epilogue_ssse3:
mov rdi,QWORD[8+rsp] ;WIN64 epilogue
mov rsi,QWORD[16+rsp]
; Bytes F3 C3 encode "rep ret", emitted as raw data.
DB 0F3h,0C3h ;repret
$L$SEH_end_sha256_block_data_order_ssse3:
ALIGN 64
; sha256_block_data_order_avx - AVX code path, Win64 entry point.
;   In (Win64):  rcx, rdx, r8 - moved to rdi, rsi, rdx below.
;   After setup: rdi -> eight 32-bit words loaded into eax..r11d below,
;                rsi -> input, read 64 bytes at a time by $L$loop_avx,
;                rdx  = number of 64-byte blocks (turned into an end pointer).
;   Stack frame (rsp aligned down to 64 bytes):
;     [rsp+0  .. rsp+63]   scratch written/read by the round code
;     [rsp+64]             saved rdi
;     [rsp+72]             saved rsi
;     [rsp+80]             end-of-input pointer (rsi + blocks*64)
;     [rsp+88]             rsp value from before the pushes
;     [rsp+96 .. rsp+159]  saved xmm6..xmm9
sha256_block_data_order_avx:
; Spill the caller's rdi/rsi (callee-saved on Win64) before they are reused
; as argument registers.
mov QWORD[8+rsp],rdi ;WIN64 prologue
mov QWORD[16+rsp],rsi
mov rax,rsp
$L$SEH_begin_sha256_block_data_order_avx:
; Remap the Win64 argument registers onto rdi/rsi/rdx.
mov rdi,rcx
mov rsi,rdx
mov rdx,r8
; Also reached by a direct jump from the dispatch code in
; sha256_block_data_order, with rdi/rsi/rdx already set up.
$L$avx_shortcut:
; rax keeps the pre-push rsp; it is stored at [88+rsp] below.
mov rax,rsp
push rbx
push rbp
push r12
push r13
push r14
push r15
; rdx = rdx*16 here; the lea below multiplies by 4 more and adds rsi,
; giving rdx = rsi + blocks*64.
shl rdx,4
sub rsp,160
lea rdx,[rdx*4+rsi]
; Align the frame to 64 bytes; the vmovdqa/movaps accesses to the frame
; require 16-byte alignment.
and rsp,-64
mov QWORD[((64+0))+rsp],rdi
mov QWORD[((64+8))+rsp],rsi
mov QWORD[((64+16))+rsp],rdx
mov QWORD[88+rsp],rax
; xmm6..xmm9 are callee-saved on Win64 and are all written by this routine.
movaps XMMWORD[(64+32)+rsp],xmm6
movaps XMMWORD[(64+48)+rsp],xmm7
movaps XMMWORD[(64+64)+rsp],xmm8
movaps XMMWORD[(64+80)+rsp],xmm9
$L$prologue_avx:
vzeroupper
; Load the eight 32-bit words at [rdi] into the working registers.
mov eax,DWORD[rdi]
mov ebx,DWORD[4+rdi]
mov ecx,DWORD[8+rdi]
mov edx,DWORD[12+rdi]
mov r8d,DWORD[16+rdi]
mov r9d,DWORD[20+rdi]
mov r10d,DWORD[24+rdi]
mov r11d,DWORD[28+rdi]
; xmm8 and xmm9 are loaded once here and used as vpshufb masks in the
; $L$avx_00_47 loop.
vmovdqa xmm8,XMMWORD[((K256+512+32))]
vmovdqa xmm9,XMMWORD[((K256+512+64))]
jmp NEAR $L$loop_avx
ALIGN 16
; Per-block setup: load 64 input bytes from [rsi], shuffle them with the mask
; at K256+512, add the first four table rows and stage the sums on the stack
; for the scalar rounds.
; NOTE(review): the mask at K256+512 is presumably a byte-swap mask turning
; big-endian input words into host order - the table is not visible here.
$L$loop_avx:
vmovdqa xmm7,XMMWORD[((K256+512))]
; Unaligned loads: no alignment is assumed for the input pointer.
vmovdqu xmm0,XMMWORD[rsi]
vmovdqu xmm1,XMMWORD[16+rsi]
vmovdqu xmm2,XMMWORD[32+rsi]
vmovdqu xmm3,XMMWORD[48+rsi]
vpshufb xmm0,xmm0,xmm7
; rbp walks the K256 table; rows are read at a 32-byte stride.
lea rbp,[K256]
vpshufb xmm1,xmm1,xmm7
vpshufb xmm2,xmm2,xmm7
vpaddd xmm4,xmm0,XMMWORD[rbp]
vpshufb xmm3,xmm3,xmm7
vpaddd xmm5,xmm1,XMMWORD[32+rbp]
vpaddd xmm6,xmm2,XMMWORD[64+rbp]
vpaddd xmm7,xmm3,XMMWORD[96+rbp]
; Stage the sums at [rsp]..[63+rsp]. The interleaved scalar moves seed the
; temporaries the first round expects: r14d = eax, edi = ebx ^ ecx,
; r13d = r8d.
vmovdqa XMMWORD[rsp],xmm4
mov r14d,eax
vmovdqa XMMWORD[16+rsp],xmm5
mov edi,ebx
vmovdqa XMMWORD[32+rsp],xmm6
xor edi,ecx
vmovdqa XMMWORD[48+rsp],xmm7
mov r13d,r8d
jmp NEAR $L$avx_00_47
ALIGN 16
; $L$avx_00_47 - main interleaved loop of the AVX path.
; Each pass:
;   * advances rbp by 128 bytes through the K256 table;
;   * runs 16 scalar rounds that consume the 16 DWORDs staged at
;     [rsp]..[60+rsp];
;   * between the scalar instructions, recomputes xmm0..xmm3 (four DWORDs
;     each), adds the table rows at [rbp], [32+rbp], [64+rbp], [96+rbp] and
;     writes the sums back to the same stack slots for the next 16 rounds.
; The eight working values live in eax, ebx, ecx, edx, r8d..r11d; their roles
; rotate by one register per round instead of the values being moved.
; r12d..r15d and edi are round temporaries; xmm4..xmm7 are vector temporaries;
; xmm8/xmm9 are the vpshufb masks loaded in the prologue.
; "shrd r,r,n" with both operands the same register is a 32-bit rotate right
; by n.
$L$avx_00_47:
; rbp += 128; written as "sub -128" because -128 fits a sign-extended 8-bit
; immediate and +128 does not.
sub rbp,-128
; --- rounds reading [0..12+rsp]; vector code updates xmm0 ---
vpalignr xmm4,xmm1,xmm0,4
shrd r13d,r13d,14
mov eax,r14d
mov r12d,r9d
vpalignr xmm7,xmm3,xmm2,4
shrd r14d,r14d,9
xor r13d,r8d
xor r12d,r10d
vpsrld xmm6,xmm4,7
shrd r13d,r13d,5
xor r14d,eax
and r12d,r8d
vpaddd xmm0,xmm0,xmm7
xor r13d,r8d
add r11d,DWORD[rsp]
mov r15d,eax
vpsrld xmm7,xmm4,3
xor r12d,r10d
shrd r14d,r14d,11
xor r15d,ebx
vpslld xmm5,xmm4,14
add r11d,r12d
shrd r13d,r13d,6
and edi,r15d
vpxor xmm4,xmm7,xmm6
xor r14d,eax
add r11d,r13d
xor edi,ebx
vpshufd xmm7,xmm3,250
shrd r14d,r14d,2
add edx,r11d
add r11d,edi
vpsrld xmm6,xmm6,11
mov r13d,edx
add r14d,r11d
shrd r13d,r13d,14
vpxor xmm4,xmm4,xmm5
mov r11d,r14d
mov r12d,r8d
shrd r14d,r14d,9
vpslld xmm5,xmm5,11
xor r13d,edx
xor r12d,r9d
shrd r13d,r13d,5
vpxor xmm4,xmm4,xmm6
xor r14d,r11d
and r12d,edx
xor r13d,edx
vpsrld xmm6,xmm7,10
add r10d,DWORD[4+rsp]
mov edi,r11d
xor r12d,r9d
vpxor xmm4,xmm4,xmm5
shrd r14d,r14d,11
xor edi,eax
add r10d,r12d
vpsrlq xmm7,xmm7,17
shrd r13d,r13d,6
and r15d,edi
xor r14d,r11d
vpaddd xmm0,xmm0,xmm4
add r10d,r13d
xor r15d,eax
shrd r14d,r14d,2
vpxor xmm6,xmm6,xmm7
add ecx,r10d
add r10d,r15d
mov r13d,ecx
vpsrlq xmm7,xmm7,2
add r14d,r10d
shrd r13d,r13d,14
mov r10d,r14d
vpxor xmm6,xmm6,xmm7
mov r12d,edx
shrd r14d,r14d,9
xor r13d,ecx
vpshufb xmm6,xmm6,xmm8
xor r12d,r8d
shrd r13d,r13d,5
xor r14d,r10d
vpaddd xmm0,xmm0,xmm6
and r12d,ecx
xor r13d,ecx
add r9d,DWORD[8+rsp]
vpshufd xmm7,xmm0,80
mov r15d,r10d
xor r12d,r8d
shrd r14d,r14d,11
vpsrld xmm6,xmm7,10
xor r15d,r11d
add r9d,r12d
shrd r13d,r13d,6
vpsrlq xmm7,xmm7,17
and edi,r15d
xor r14d,r10d
add r9d,r13d
vpxor xmm6,xmm6,xmm7
xor edi,r11d
shrd r14d,r14d,2
add ebx,r9d
vpsrlq xmm7,xmm7,2
add r9d,edi
mov r13d,ebx
add r14d,r9d
vpxor xmm6,xmm6,xmm7
shrd r13d,r13d,14
mov r9d,r14d
mov r12d,ecx
vpshufb xmm6,xmm6,xmm9
shrd r14d,r14d,9
xor r13d,ebx
xor r12d,edx
vpaddd xmm0,xmm0,xmm6
shrd r13d,r13d,5
xor r14d,r9d
and r12d,ebx
vpaddd xmm6,xmm0,XMMWORD[rbp]
xor r13d,ebx
add r8d,DWORD[12+rsp]
mov edi,r9d
xor r12d,edx
shrd r14d,r14d,11
xor edi,r10d
add r8d,r12d
shrd r13d,r13d,6
and r15d,edi
xor r14d,r9d
add r8d,r13d
xor r15d,r10d
shrd r14d,r14d,2
add eax,r8d
add r8d,r15d
mov r13d,eax
add r14d,r8d
; Slot [0..15+rsp] has been fully consumed above; refill it with
; xmm0 + [rbp] for the next pass.
vmovdqa XMMWORD[rsp],xmm6
; --- rounds reading [16..28+rsp]; vector code updates xmm1 ---
vpalignr xmm4,xmm2,xmm1,4
shrd r13d,r13d,14
mov r8d,r14d
mov r12d,ebx
vpalignr xmm7,xmm0,xmm3,4
shrd r14d,r14d,9
xor r13d,eax
xor r12d,ecx
vpsrld xmm6,xmm4,7
shrd r13d,r13d,5
xor r14d,r8d
and r12d,eax
vpaddd xmm1,xmm1,xmm7
xor r13d,eax
add edx,DWORD[16+rsp]
mov r15d,r8d
vpsrld xmm7,xmm4,3
xor r12d,ecx
shrd r14d,r14d,11
xor r15d,r9d
vpslld xmm5,xmm4,14
add edx,r12d
shrd r13d,r13d,6
and edi,r15d
vpxor xmm4,xmm7,xmm6
xor r14d,r8d
add edx,r13d
xor edi,r9d
vpshufd xmm7,xmm0,250
shrd r14d,r14d,2
add r11d,edx
add edx,edi
vpsrld xmm6,xmm6,11
mov r13d,r11d
add r14d,edx
shrd r13d,r13d,14
vpxor xmm4,xmm4,xmm5
mov edx,r14d
mov r12d,eax
shrd r14d,r14d,9
vpslld xmm5,xmm5,11
xor r13d,r11d
xor r12d,ebx
shrd r13d,r13d,5
vpxor xmm4,xmm4,xmm6
xor r14d,edx
and r12d,r11d
xor r13d,r11d
vpsrld xmm6,xmm7,10
add ecx,DWORD[20+rsp]
mov edi,edx
xor r12d,ebx
vpxor xmm4,xmm4,xmm5
shrd r14d,r14d,11
xor edi,r8d
add ecx,r12d
vpsrlq xmm7,xmm7,17
shrd r13d,r13d,6
and r15d,edi
xor r14d,edx
vpaddd xmm1,xmm1,xmm4
add ecx,r13d
xor r15d,r8d
shrd r14d,r14d,2
vpxor xmm6,xmm6,xmm7
add r10d,ecx
add ecx,r15d
mov r13d,r10d
vpsrlq xmm7,xmm7,2
add r14d,ecx
shrd r13d,r13d,14
mov ecx,r14d
vpxor xmm6,xmm6,xmm7
mov r12d,r11d
shrd r14d,r14d,9
xor r13d,r10d
vpshufb xmm6,xmm6,xmm8
xor r12d,eax
shrd r13d,r13d,5
xor r14d,ecx
vpaddd xmm1,xmm1,xmm6
and r12d,r10d
xor r13d,r10d
add ebx,DWORD[24+rsp]
vpshufd xmm7,xmm1,80
mov r15d,ecx
xor r12d,eax
shrd r14d,r14d,11
vpsrld xmm6,xmm7,10
xor r15d,edx
add ebx,r12d
shrd r13d,r13d,6
vpsrlq xmm7,xmm7,17
and edi,r15d
xor r14d,ecx
add ebx,r13d
vpxor xmm6,xmm6,xmm7
xor edi,edx
shrd r14d,r14d,2
add r9d,ebx
vpsrlq xmm7,xmm7,2
add ebx,edi
mov r13d,r9d
add r14d,ebx
vpxor xmm6,xmm6,xmm7
shrd r13d,r13d,14
mov ebx,r14d
mov r12d,r10d
vpshufb xmm6,xmm6,xmm9
shrd r14d,r14d,9
xor r13d,r9d
xor r12d,r11d
vpaddd xmm1,xmm1,xmm6
shrd r13d,r13d,5
xor r14d,ebx
and r12d,r9d
vpaddd xmm6,xmm1,XMMWORD[32+rbp]
xor r13d,r9d
add eax,DWORD[28+rsp]
mov edi,ebx
xor r12d,r11d
shrd r14d,r14d,11
xor edi,ecx
add eax,r12d
shrd r13d,r13d,6
and r15d,edi
xor r14d,ebx
add eax,r13d
xor r15d,ecx
shrd r14d,r14d,2
add r8d,eax
add eax,r15d
mov r13d,r8d
add r14d,eax
; Refill slot [16..31+rsp] with xmm1 + [32+rbp].
vmovdqa XMMWORD[16+rsp],xmm6
; --- rounds reading [32..44+rsp]; vector code updates xmm2 ---
vpalignr xmm4,xmm3,xmm2,4
shrd r13d,r13d,14
mov eax,r14d
mov r12d,r9d
vpalignr xmm7,xmm1,xmm0,4
shrd r14d,r14d,9
xor r13d,r8d
xor r12d,r10d
vpsrld xmm6,xmm4,7
shrd r13d,r13d,5
xor r14d,eax
and r12d,r8d
vpaddd xmm2,xmm2,xmm7
xor r13d,r8d
add r11d,DWORD[32+rsp]
mov r15d,eax
vpsrld xmm7,xmm4,3
xor r12d,r10d
shrd r14d,r14d,11
xor r15d,ebx
vpslld xmm5,xmm4,14
add r11d,r12d
shrd r13d,r13d,6
and edi,r15d
vpxor xmm4,xmm7,xmm6
xor r14d,eax
add r11d,r13d
xor edi,ebx
vpshufd xmm7,xmm1,250
shrd r14d,r14d,2
add edx,r11d
add r11d,edi
vpsrld xmm6,xmm6,11
mov r13d,edx
add r14d,r11d
shrd r13d,r13d,14
vpxor xmm4,xmm4,xmm5
mov r11d,r14d
mov r12d,r8d
shrd r14d,r14d,9
vpslld xmm5,xmm5,11
xor r13d,edx
xor r12d,r9d
shrd r13d,r13d,5
vpxor xmm4,xmm4,xmm6
xor r14d,r11d
and r12d,edx
xor r13d,edx
vpsrld xmm6,xmm7,10
add r10d,DWORD[36+rsp]
mov edi,r11d
xor r12d,r9d
vpxor xmm4,xmm4,xmm5
shrd r14d,r14d,11
xor edi,eax
add r10d,r12d
vpsrlq xmm7,xmm7,17
shrd r13d,r13d,6
and r15d,edi
xor r14d,r11d
vpaddd xmm2,xmm2,xmm4
add r10d,r13d
xor r15d,eax
shrd r14d,r14d,2
vpxor xmm6,xmm6,xmm7
add ecx,r10d
add r10d,r15d
mov r13d,ecx
vpsrlq xmm7,xmm7,2
add r14d,r10d
shrd r13d,r13d,14
mov r10d,r14d
vpxor xmm6,xmm6,xmm7
mov r12d,edx
shrd r14d,r14d,9
xor r13d,ecx
vpshufb xmm6,xmm6,xmm8
xor r12d,r8d
shrd r13d,r13d,5
xor r14d,r10d
vpaddd xmm2,xmm2,xmm6
and r12d,ecx
xor r13d,ecx
add r9d,DWORD[40+rsp]
vpshufd xmm7,xmm2,80
mov r15d,r10d
xor r12d,r8d
shrd r14d,r14d,11
vpsrld xmm6,xmm7,10
xor r15d,r11d
add r9d,r12d
shrd r13d,r13d,6
vpsrlq xmm7,xmm7,17
and edi,r15d
xor r14d,r10d
add r9d,r13d
vpxor xmm6,xmm6,xmm7
xor edi,r11d
shrd r14d,r14d,2
add ebx,r9d
vpsrlq xmm7,xmm7,2
add r9d,edi
mov r13d,ebx
add r14d,r9d
vpxor xmm6,xmm6,xmm7
shrd r13d,r13d,14
mov r9d,r14d
mov r12d,ecx
vpshufb xmm6,xmm6,xmm9
shrd r14d,r14d,9
xor r13d,ebx
xor r12d,edx
vpaddd xmm2,xmm2,xmm6
shrd r13d,r13d,5
xor r14d,r9d
and r12d,ebx
vpaddd xmm6,xmm2,XMMWORD[64+rbp]
xor r13d,ebx
add r8d,DWORD[44+rsp]
mov edi,r9d
xor r12d,edx
shrd r14d,r14d,11
xor edi,r10d
add r8d,r12d
shrd r13d,r13d,6
and r15d,edi
xor r14d,r9d
add r8d,r13d
xor r15d,r10d
shrd r14d,r14d,2
add eax,r8d
add r8d,r15d
mov r13d,eax
add r14d,r8d
; Refill slot [32..47+rsp] with xmm2 + [64+rbp].
vmovdqa XMMWORD[32+rsp],xmm6
; --- rounds reading [48..60+rsp]; vector code updates xmm3 ---
vpalignr xmm4,xmm0,xmm3,4
shrd r13d,r13d,14
mov r8d,r14d
mov r12d,ebx
vpalignr xmm7,xmm2,xmm1,4
shrd r14d,r14d,9
xor r13d,eax
xor r12d,ecx
vpsrld xmm6,xmm4,7
shrd r13d,r13d,5
xor r14d,r8d
and r12d,eax
vpaddd xmm3,xmm3,xmm7
xor r13d,eax
add edx,DWORD[48+rsp]
mov r15d,r8d
vpsrld xmm7,xmm4,3
xor r12d,ecx
shrd r14d,r14d,11
xor r15d,r9d
vpslld xmm5,xmm4,14
add edx,r12d
shrd r13d,r13d,6
and edi,r15d
vpxor xmm4,xmm7,xmm6
xor r14d,r8d
add edx,r13d
xor edi,r9d
vpshufd xmm7,xmm2,250
shrd r14d,r14d,2
add r11d,edx
add edx,edi
vpsrld xmm6,xmm6,11
mov r13d,r11d
add r14d,edx
shrd r13d,r13d,14
vpxor xmm4,xmm4,xmm5
mov edx,r14d
mov r12d,eax
shrd r14d,r14d,9
vpslld xmm5,xmm5,11
xor r13d,r11d
xor r12d,ebx
shrd r13d,r13d,5
vpxor xmm4,xmm4,xmm6
xor r14d,edx
and r12d,r11d
xor r13d,r11d
vpsrld xmm6,xmm7,10
add ecx,DWORD[52+rsp]
mov edi,edx
xor r12d,ebx
vpxor xmm4,xmm4,xmm5
shrd r14d,r14d,11
xor edi,r8d
add ecx,r12d
vpsrlq xmm7,xmm7,17
shrd r13d,r13d,6
and r15d,edi
xor r14d,edx
vpaddd xmm3,xmm3,xmm4
add ecx,r13d
xor r15d,r8d
shrd r14d,r14d,2
vpxor xmm6,xmm6,xmm7
add r10d,ecx
add ecx,r15d
mov r13d,r10d
vpsrlq xmm7,xmm7,2
add r14d,ecx
shrd r13d,r13d,14
mov ecx,r14d
vpxor xmm6,xmm6,xmm7
mov r12d,r11d
shrd r14d,r14d,9
xor r13d,r10d
vpshufb xmm6,xmm6,xmm8
xor r12d,eax
shrd r13d,r13d,5
xor r14d,ecx
vpaddd xmm3,xmm3,xmm6
and r12d,r10d
xor r13d,r10d
add ebx,DWORD[56+rsp]
vpshufd xmm7,xmm3,80
mov r15d,ecx
xor r12d,eax
shrd r14d,r14d,11
vpsrld xmm6,xmm7,10
xor r15d,edx
add ebx,r12d
shrd r13d,r13d,6
vpsrlq xmm7,xmm7,17
and edi,r15d
xor r14d,ecx
add ebx,r13d
vpxor xmm6,xmm6,xmm7
xor edi,edx
shrd r14d,r14d,2
add r9d,ebx
vpsrlq xmm7,xmm7,2
add ebx,edi
mov r13d,r9d
add r14d,ebx
vpxor xmm6,xmm6,xmm7
shrd r13d,r13d,14
mov ebx,r14d
mov r12d,r10d
vpshufb xmm6,xmm6,xmm9
shrd r14d,r14d,9
xor r13d,r9d
xor r12d,r11d
vpaddd xmm3,xmm3,xmm6
shrd r13d,r13d,5
xor r14d,ebx
and r12d,r9d
vpaddd xmm6,xmm3,XMMWORD[96+rbp]
xor r13d,r9d
add eax,DWORD[60+rsp]
mov edi,ebx
xor r12d,r11d
shrd r14d,r14d,11
xor edi,ecx
add eax,r12d
shrd r13d,r13d,6
and r15d,edi
xor r14d,ebx
add eax,r13d
xor r15d,ecx
shrd r14d,r14d,2
add r8d,eax
add eax,r15d
mov r13d,r8d
add r14d,eax
; Refill slot [48..63+rsp] with xmm3 + [96+rbp].
vmovdqa XMMWORD[48+rsp],xmm6
; Repeat while the byte at [131+rbp] is non-zero.
; NOTE(review): presumably the data following the round constants has a zero
; byte at this offset and acts as the end marker - the table is not visible
; in this chunk; confirm against the K256 definition.
cmp BYTE[131+rbp],0
jne NEAR $L$avx_00_47
shrd r13d,r13d,14
mov eax,r14d
mov r12d,r9d
shrd r14d,r14d,9
xor r13d,r8d
xor r12d,r10d
shrd r13d,r13d,5
xor r14d,eax
and r12d,r8d
xor r13d,r8d
add r11d,DWORD[rsp]
mov r15d,eax
xor r12d,r10d
shrd r14d,r14d,11
xor r15d,ebx
add r11d,r12d
shrd r13d,r13d,6
and edi,r15d
xor r14d,eax
add r11d,r13d
xor edi,ebx
shrd r14d,r14d,2
add edx,r11d
add r11d,edi
mov r13d,edx
add r14d,r11d
shrd r13d,r13d,14
mov r11d,r14d
mov r12d,r8d
shrd r14d,r14d,9
xor r13d,edx
xor r12d,r9d
shrd r13d,r13d,5
xor r14d,r11d
and r12d,edx
xor r13d,edx
add r10d,DWORD[4+rsp]
mov edi,r11d
xor r12d,r9d
shrd r14d,r14d,11
xor edi,eax
add r10d,r12d
shrd r13d,r13d,6
and r15d,edi
xor r14d,r11d
add r10d,r13d
xor r15d,eax
shrd r14d,r14d,2
add ecx,r10d
add r10d,r15d
mov r13d,ecx
add r14d,r10d
shrd r13d,r13d,14
mov r10d,r14d
mov r12d,edx
shrd r14d,r14d,9
xor r13d,ecx
xor r12d,r8d
shrd r13d,r13d,5
xor r14d,r10d
and r12d,ecx
xor r13d,ecx
add r9d,DWORD[8+rsp]
mov r15d,r10d
xor r12d,r8d
shrd r14d,r14d,11
xor r15d,r11d
add r9d,r12d
shrd r13d,r13d,6
and edi,r15d
xor r14d,r10d
add r9d,r13d
xor edi,r11d
shrd r14d,r14d,2
add ebx,r9d
add r9d