; This file is generated from a similarly-named Perl script in the BoringSSL ; source tree. Do not edit by hand. %ifidn __OUTPUT_FORMAT__, win64 default rel %define XMMWORD %define YMMWORD %define ZMMWORD %ifdef BORINGSSL_PREFIX %include "boringssl_prefix_symbols_nasm.inc" %endif section .text code align=64 EXTERN OPENSSL_ia32cap_P global sha512_block_data_order ALIGN 16 sha512_block_data_order: mov QWORD[8+rsp],rdi ;WIN64 prologue mov QWORD[16+rsp],rsi mov rax,rsp $L$SEH_begin_sha512_block_data_order: mov rdi,rcx mov rsi,rdx mov rdx,r8 lea r11,[OPENSSL_ia32cap_P] mov r9d,DWORD[r11] mov r10d,DWORD[4+r11] mov r11d,DWORD[8+r11] and r9d,1073741824 and r10d,268435968 or r10d,r9d cmp r10d,1342177792 je NEAR $L$avx_shortcut mov rax,rsp push rbx push rbp push r12 push r13 push r14 push r15 shl rdx,4 sub rsp,16*8+4*8 lea rdx,[rdx*8+rsi] and rsp,-64 mov QWORD[((128+0))+rsp],rdi mov QWORD[((128+8))+rsp],rsi mov QWORD[((128+16))+rsp],rdx mov QWORD[152+rsp],rax $L$prologue: mov rax,QWORD[rdi] mov rbx,QWORD[8+rdi] mov rcx,QWORD[16+rdi] mov rdx,QWORD[24+rdi] mov r8,QWORD[32+rdi] mov r9,QWORD[40+rdi] mov r10,QWORD[48+rdi] mov r11,QWORD[56+rdi] jmp NEAR $L$loop ALIGN 16 $L$loop: mov rdi,rbx lea rbp,[K512] xor rdi,rcx mov r12,QWORD[rsi] mov r13,r8 mov r14,rax bswap r12 ror r13,23 mov r15,r9 xor r13,r8 ror r14,5 xor r15,r10 mov QWORD[rsp],r12 xor r14,rax and r15,r8 ror r13,4 add r12,r11 xor r15,r10 ror r14,6 xor r13,r8 add r12,r15 mov r15,rax add r12,QWORD[rbp] xor r14,rax xor r15,rbx ror r13,14 mov r11,rbx and rdi,r15 ror r14,28 add r12,r13 xor r11,rdi add rdx,r12 add r11,r12 lea rbp,[8+rbp] add r11,r14 mov r12,QWORD[8+rsi] mov r13,rdx mov r14,r11 bswap r12 ror r13,23 mov rdi,r8 xor r13,rdx ror r14,5 xor rdi,r9 mov QWORD[8+rsp],r12 xor r14,r11 and rdi,rdx ror r13,4 add r12,r10 xor rdi,r9 ror r14,6 xor r13,rdx add r12,rdi mov rdi,r11 add r12,QWORD[rbp] xor r14,r11 xor rdi,rax ror r13,14 mov r10,rax and r15,rdi ror r14,28 add r12,r13 xor r10,r15 add rcx,r12 add r10,r12 lea rbp,[24+rbp] add r10,r14 mov r12,QWORD[16+rsi] mov r13,rcx mov r14,r10 bswap r12 ror r13,23 mov r15,rdx xor r13,rcx ror r14,5 xor r15,r8 mov QWORD[16+rsp],r12 xor r14,r10 and r15,rcx ror r13,4 add r12,r9 xor r15,r8 ror r14,6 xor r13,rcx add r12,r15 mov r15,r10 add r12,QWORD[rbp] xor r14,r10 xor r15,r11 ror r13,14 mov r9,r11 and rdi,r15 ror r14,28 add r12,r13 xor r9,rdi add rbx,r12 add r9,r12 lea rbp,[8+rbp] add r9,r14 mov r12,QWORD[24+rsi] mov r13,rbx mov r14,r9 bswap r12 ror r13,23 mov rdi,rcx xor r13,rbx ror r14,5 xor rdi,rdx mov QWORD[24+rsp],r12 xor r14,r9 and rdi,rbx ror r13,4 add r12,r8 xor rdi,rdx ror r14,6 xor r13,rbx add r12,rdi mov rdi,r9 add r12,QWORD[rbp] xor r14,r9 xor rdi,r10 ror r13,14 mov r8,r10 and r15,rdi ror r14,28 add r12,r13 xor r8,r15 add rax,r12 add r8,r12 lea rbp,[24+rbp] add r8,r14 mov r12,QWORD[32+rsi] mov r13,rax mov r14,r8 bswap r12 ror r13,23 mov r15,rbx xor r13,rax ror r14,5 xor r15,rcx mov QWORD[32+rsp],r12 xor r14,r8 and r15,rax ror r13,4 add r12,rdx xor r15,rcx ror r14,6 xor r13,rax add r12,r15 mov r15,r8 add r12,QWORD[rbp] xor r14,r8 xor r15,r9 ror r13,14 mov rdx,r9 and rdi,r15 ror r14,28 add r12,r13 xor rdx,rdi add r11,r12 add rdx,r12 lea rbp,[8+rbp] add rdx,r14 mov r12,QWORD[40+rsi] mov r13,r11 mov r14,rdx bswap r12 ror r13,23 mov rdi,rax xor r13,r11 ror r14,5 xor rdi,rbx mov QWORD[40+rsp],r12 xor r14,rdx and rdi,r11 ror r13,4 add r12,rcx xor rdi,rbx ror r14,6 xor r13,r11 add r12,rdi mov rdi,rdx add r12,QWORD[rbp] xor r14,rdx xor rdi,r8 ror r13,14 mov rcx,r8 and r15,rdi ror r14,28 add r12,r13 xor rcx,r15 add r10,r12 add rcx,r12 lea rbp,[24+rbp] add rcx,r14 mov r12,QWORD[48+rsi] mov r13,r10 mov r14,rcx bswap r12 ror r13,23 mov r15,r11 xor r13,r10 ror r14,5 xor r15,rax mov QWORD[48+rsp],r12 xor r14,rcx and r15,r10 ror r13,4 add r12,rbx xor r15,rax ror r14,6 xor r13,r10 add r12,r15 mov r15,rcx add r12,QWORD[rbp] xor r14,rcx xor r15,rdx ror r13,14 mov rbx,rdx and rdi,r15 ror r14,28 add r12,r13 xor rbx,rdi add r9,r12 add rbx,r12 lea rbp,[8+rbp] add rbx,r14 mov r12,QWORD[56+rsi] mov r13,r9 mov r14,rbx bswap r12 ror r13,23 mov rdi,r10 xor r13,r9 ror r14,5 xor rdi,r11 mov QWORD[56+rsp],r12 xor r14,rbx and rdi,r9 ror r13,4 add r12,rax xor rdi,r11 ror r14,6 xor r13,r9 add r12,rdi mov rdi,rbx add r12,QWORD[rbp] xor r14,rbx xor rdi,rcx ror r13,14 mov rax,rcx and r15,rdi ror r14,28 add r12,r13 xor rax,r15 add r8,r12 add rax,r12 lea rbp,[24+rbp] add rax,r14 mov r12,QWORD[64+rsi] mov r13,r8 mov r14,rax bswap r12 ror r13,23 mov r15,r9 xor r13,r8 ror r14,5 xor r15,r10 mov QWORD[64+rsp],r12 xor r14,rax and r15,r8 ror r13,4 add r12,r11 xor r15,r10 ror r14,6 xor r13,r8 add r12,r15 mov r15,rax add r12,QWORD[rbp] xor r14,rax xor r15,rbx ror r13,14 mov r11,rbx and rdi,r15 ror r14,28 add r12,r13 xor r11,rdi add rdx,r12 add r11,r12 lea rbp,[8+rbp] add r11,r14 mov r12,QWORD[72+rsi] mov r13,rdx mov r14,r11 bswap r12 ror r13,23 mov rdi,r8 xor r13,rdx ror r14,5 xor rdi,r9 mov QWORD[72+rsp],r12 xor r14,r11 and rdi,rdx ror r13,4 add r12,r10 xor rdi,r9 ror r14,6 xor r13,rdx add r12,rdi mov rdi,r11 add r12,QWORD[rbp] xor r14,r11 xor rdi,rax ror r13,14 mov r10,rax and r15,rdi ror r14,28 add r12,r13 xor r10,r15 add rcx,r12 add r10,r12 lea rbp,[24+rbp] add r10,r14 mov r12,QWORD[80+rsi] mov r13,rcx mov r14,r10 bswap r12 ror r13,23 mov r15,rdx xor r13,rcx ror r14,5 xor r15,r8 mov QWORD[80+rsp],r12 xor r14,r10 and r15,rcx ror r13,4 add r12,r9 xor r15,r8 ror r14,6 xor r13,rcx add r12,r15 mov r15,r10 add r12,QWORD[rbp] xor r14,r10 xor r15,r11 ror r13,14 mov r9,r11 and rdi,r15 ror r14,28 add r12,r13 xor r9,rdi add rbx,r12 add r9,r12 lea rbp,[8+rbp] add r9,r14 mov r12,QWORD[88+rsi] mov r13,rbx mov r14,r9 bswap r12 ror r13,23 mov rdi,rcx xor r13,rbx ror r14,5 xor rdi,rdx mov QWORD[88+rsp],r12 xor r14,r9 and rdi,rbx ror r13,4 add r12,r8 xor rdi,rdx ror r14,6 xor r13,rbx add r12,rdi mov rdi,r9 add r12,QWORD[rbp] xor r14,r9 xor rdi,r10 ror r13,14 mov r8,r10 and r15,rdi ror r14,28 add r12,r13 xor r8,r15 add rax,r12 add r8,r12 lea rbp,[24+rbp] add r8,r14 mov r12,QWORD[96+rsi] mov r13,rax mov r14,r8 bswap r12 ror r13,23 mov r15,rbx xor r13,rax ror r14,5 xor r15,rcx mov QWORD[96+rsp],r12 xor r14,r8 and r15,rax ror r13,4 add r12,rdx xor r15,rcx ror r14,6 xor r13,rax add r12,r15 mov r15,r8 add r12,QWORD[rbp] xor r14,r8 xor r15,r9 ror r13,14 mov rdx,r9 and rdi,r15 ror r14,28 add r12,r13 xor rdx,rdi add r11,r12 add rdx,r12 lea rbp,[8+rbp] add rdx,r14 mov r12,QWORD[104+rsi] mov r13,r11 mov r14,rdx bswap r12 ror r13,23 mov rdi,rax xor r13,r11 ror r14,5 xor rdi,rbx mov QWORD[104+rsp],r12 xor r14,rdx and rdi,r11 ror r13,4 add r12,rcx xor rdi,rbx ror r14,6 xor r13,r11 add r12,rdi mov rdi,rdx add r12,QWORD[rbp] xor r14,rdx xor rdi,r8 ror r13,14 mov rcx,r8 and r15,rdi ror r14,28 add r12,r13 xor rcx,r15 add r10,r12 add rcx,r12 lea rbp,[24+rbp] add rcx,r14 mov r12,QWORD[112+rsi] mov r13,r10 mov r14,rcx bswap r12 ror r13,23 mov r15,r11 xor r13,r10 ror r14,5 xor r15,rax mov QWORD[112+rsp],r12 xor r14,rcx and r15,r10 ror r13,4 add r12,rbx xor r15,rax ror r14,6 xor r13,r10 add r12,r15 mov r15,rcx add r12,QWORD[rbp] xor r14,rcx xor r15,rdx ror r13,14 mov rbx,rdx and rdi,r15 ror r14,28 add r12,r13 xor rbx,rdi add r9,r12 add rbx,r12 lea rbp,[8+rbp] add rbx,r14 mov r12,QWORD[120+rsi] mov r13,r9 mov r14,rbx bswap r12 ror r13,23 mov rdi,r10 xor r13,r9 ror r14,5 xor rdi,r11 mov QWORD[120+rsp],r12 xor r14,rbx and rdi,r9 ror r13,4 add r12,rax xor rdi,r11 ror r14,6 xor r13,r9 add r12,rdi mov rdi,rbx add r12,QWORD[rbp] xor r14,rbx xor rdi,rcx ror r13,14 mov rax,rcx and r15,rdi ror r14,28 add r12,r13 xor rax,r15 add r8,r12 add rax,r12 lea rbp,[24+rbp] jmp NEAR $L$rounds_16_xx ALIGN 16 $L$rounds_16_xx: mov r13,QWORD[8+rsp] mov r15,QWORD[112+rsp] mov r12,r13 ror r13,7 add rax,r14 mov r14,r15 ror r15,42 xor r13,r12 shr r12,7 ror r13,1 xor r15,r14 shr r14,6 ror r15,19 xor r12,r13 xor r15,r14 add r12,QWORD[72+rsp] add r12,QWORD[rsp] mov r13,r8 add r12,r15 mov r14,rax ror r13,23 mov r15,r9 xor r13,r8 ror r14,5 xor r15,r10 mov QWORD[rsp],r12 xor r14,rax and r15,r8 ror r13,4 add r12,r11 xor r15,r10 ror r14,6 xor r13,r8 add r12,r15 mov r15,rax add r12,QWORD[rbp] xor r14,rax xor r15,rbx ror r13,14 mov r11,rbx and rdi,r15 ror r14,28 add r12,r13 xor r11,rdi add rdx,r12 add r11,r12 lea rbp,[8+rbp] mov r13,QWORD[16+rsp] mov rdi,QWORD[120+rsp] mov r12,r13 ror r13,7 add r11,r14 mov r14,rdi ror rdi,42 xor r13,r12 shr r12,7 ror r13,1 xor rdi,r14 shr r14,6 ror rdi,19 xor r12,r13 xor rdi,r14 add r12,QWORD[80+rsp] add r12,QWORD[8+rsp] mov r13,rdx add r12,rdi mov r14,r11 ror r13,23 mov rdi,r8 xor r13,rdx ror r14,5 xor rdi,r9 mov QWORD[8+rsp],r12 xor r14,r11 and rdi,rdx ror r13,4 add r12,r10 xor rdi,r9 ror r14,6 xor r13,rdx add r12,rdi mov rdi,r11 add r12,QWORD[rbp] xor r14,r11 xor rdi,rax ror r13,14 mov r10,rax and r15,rdi ror r14,28 add r12,r13 xor r10,r15 add rcx,r12 add r10,r12 lea rbp,[24+rbp] mov r13,QWORD[24+rsp] mov r15,QWORD[rsp] mov r12,r13 ror r13,7 add r10,r14 mov r14,r15 ror r15,42 xor r13,r12 shr r12,7 ror r13,1 xor r15,r14 shr r14,6 ror r15,19 xor r12,r13 xor r15,r14 add r12,QWORD[88+rsp] add r12,QWORD[16+rsp] mov r13,rcx add r12,r15 mov r14,r10 ror r13,23 mov r15,rdx xor r13,rcx ror r14,5 xor r15,r8 mov QWORD[16+rsp],r12 xor r14,r10 and r15,rcx ror r13,4 add r12,r9 xor r15,r8 ror r14,6 xor r13,rcx add r12,r15 mov r15,r10 add r12,QWORD[rbp] xor r14,r10 xor r15,r11 ror r13,14 mov r9,r11 and rdi,r15 ror r14,28 add r12,r13 xor r9,rdi add rbx,r12 add r9,r12 lea rbp,[8+rbp] mov r13,QWORD[32+rsp] mov rdi,QWORD[8+rsp] mov r12,r13 ror r13,7 add r9,r14 mov r14,rdi ror rdi,42 xor r13,r12 shr r12,7 ror r13,1 xor rdi,r14 shr r14,6 ror rdi,19 xor r12,r13 xor rdi,r14 add r12,QWORD[96+rsp] add r12,QWORD[24+rsp] mov r13,rbx add r12,rdi mov r14,r9 ror r13,23 mov rdi,rcx xor r13,rbx ror r14,5 xor rdi,rdx mov QWORD[24+rsp],r12 xor r14,r9 and rdi,rbx ror r13,4 add r12,r8 xor rdi,rdx ror r14,6 xor r13,rbx add r12,rdi mov rdi,r9 add r12,QWORD[rbp] xor r14,r9 xor rdi,r10 ror r13,14 mov r8,r10 and r15,rdi ror r14,28 add r12,r13 xor r8,r15 add rax,r12 add r8,r12 lea rbp,[24+rbp] mov r13,QWORD[40+rsp] mov r15,QWORD[16+rsp] mov r12,r13 ror r13,7 add r8,r14 mov r14,r15 ror r15,42 xor r13,r12 shr r12,7 ror r13,1 xor r15,r14 shr r14,6 ror r15,19 xor r12,r13 xor r15,r14 add r12,QWORD[104+rsp] add r12,QWORD[32+rsp] mov r13,rax add r12,r15 mov r14,r8 ror r13,23 mov r15,rbx xor r13,rax ror r14,5 xor r15,rcx mov QWORD[32+rsp],r12 xor r14,r8 and r15,rax ror r13,4 add r12,rdx xor r15,rcx ror r14,6 xor r13,rax add r12,r15 mov r15,r8 add r12,QWORD[rbp] xor r14,r8 xor r15,r9 ror r13,14 mov rdx,r9 and rdi,r15 ror r14,28 add r12,r13 xor rdx,rdi add r11,r12 add rdx,r12 lea rbp,[8+rbp] mov r13,QWORD[48+rsp] mov rdi,QWORD[24+rsp] mov r12,r13 ror r13,7 add rdx,r14 mov r14,rdi ror rdi,42 xor r13,r12 shr r12,7 ror r13,1 xor rdi,r14 shr r14,6 ror rdi,19 xor r12,r13 xor rdi,r14 add r12,QWORD[112+rsp] add r12,QWORD[40+rsp] mov r13,r11 add r12,rdi mov r14,rdx ror r13,23 mov rdi,rax xor r13,r11 ror r14,5 xor rdi,rbx mov QWORD[40+rsp],r12 xor r14,rdx and rdi,r11 ror r13,4 add r12,rcx xor rdi,rbx ror r14,6 xor r13,r11 add r12,rdi mov rdi,rdx add r12,QWORD[rbp] xor r14,rdx xor rdi,r8 ror r13,14 mov rcx,r8 and r15,rdi ror r14,28 add r12,r13 xor rcx,r15 add r10,r12 add rcx,r12 lea rbp,[24+rbp] mov r13,QWORD[56+rsp] mov r15,QWORD[32+rsp] mov r12,r13 ror r13,7 add rcx,r14 mov r14,r15 ror r15,42 xor r13,r12 shr r12,7 ror r13,1 xor r15,r14 shr r14,6 ror r15,19 xor r12,r13 xor r15,r14 add r12,QWORD[120+rsp] add r12,QWORD[48+rsp] mov r13,r10 add r12,r15 mov r14,rcx ror r13,23 mov r15,r11 xor r13,r10 ror r14,5 xor r15,rax mov QWORD[48+rsp],r12 xor r14,rcx and r15,r10 ror r13,4 add r12,rbx xor r15,rax ror r14,6 xor r13,r10 add r12,r15 mov r15,rcx add r12,QWORD[rbp] xor r14,rcx xor r15,rdx ror r13,14 mov rbx,rdx and rdi,r15 ror r14,28 add r12,r13 xor rbx,rdi add r9,r12 add rbx,r12 lea rbp,[8+rbp] mov r13,QWORD[64+rsp] mov rdi,QWORD[40+rsp] mov r12,r13 ror r13,7 add rbx,r14 mov r14,rdi ror rdi,42 xor r13,r12 shr r12,7 ror r13,1 xor rdi,r14 shr r14,6 ror rdi,19 xor r12,r13 xor rdi,r14 add r12,QWORD[rsp] add r12,QWORD[56+rsp] mov r13,r9 add r12,rdi mov r14,rbx ror r13,23 mov rdi,r10 xor r13,r9 ror r14,5 xor rdi,r11 mov QWORD[56+rsp],r12 xor r14,rbx and rdi,r9 ror r13,4 add r12,rax xor rdi,r11 ror r14,6 xor r13,r9 add r12,rdi mov rdi,rbx add r12,QWORD[rbp] xor r14,rbx xor rdi,rcx ror r13,14 mov rax,rcx and r15,rdi ror r14,28 add r12,r13 xor rax,r15 add r8,r12 add rax,r12 lea rbp,[24+rbp] mov r13,QWORD[72+rsp] mov r15,QWORD[48+rsp] mov r12,r13 ror r13,7 add rax,r14 mov r14,r15 ror r15,42 xor r13,r12 shr r12,7 ror r13,1 xor r15,r14 shr r14,6 ror r15,19 xor r12,r13 xor r15,r14 add r12,QWORD[8+rsp] add r12,QWORD[64+rsp] mov r13,r8 add r12,r15 mov r14,rax ror r13,23 mov r15,r9 xor r13,r8 ror r14,5 xor r15,r10 mov QWORD[64+rsp],r12 xor r14,rax and r15,r8 ror r13,4 add r12,r11 xor r15,r10 ror r14,6 xor r13,r8 add r12,r15 mov r15,rax add r12,QWORD[rbp] xor r14,rax xor r15,rbx ror r13,14 mov r11,rbx and rdi,r15 ror r14,28 add r12,r13 xor r11,rdi add rdx,r12 add r11,r12 lea rbp,[8+rbp] mov r13,QWORD[80+rsp] mov rdi,QWORD[56+rsp] mov r12,r13 ror r13,7 add r11,r14 mov r14,rdi ror rdi,42 xor r13,r12 shr r12,7 ror r13,1 xor rdi,r14 shr r14,6 ror rdi,19 xor r12,r13 xor rdi,r14 add r12,QWORD[16+rsp] add r12,QWORD[72+rsp] mov r13,rdx add r12,rdi mov r14,r11 ror r13,23 mov rdi,r8 xor r13,rdx ror r14,5 xor rdi,r9 mov QWORD[72+rsp],r12 xor r14,r11 and rdi,rdx ror r13,4 add r12,r10 xor rdi,r9 ror r14,6 xor r13,rdx add r12,rdi mov rdi,r11 add r12,QWORD[rbp] xor r14,r11 xor rdi,rax ror r13,14 mov r10,rax and r15,rdi ror r14,28 add r12,r13 xor r10,r15 add rcx,r12 add r10,r12 lea rbp,[24+rbp] mov r13,QWORD[88+rsp] mov r15,QWORD[64+rsp] mov r12,r13 ror r13,7 add r10,r14 mov r14,r15 ror r15,42 xor r13,r12 shr r12,7 ror r13,1 xor r15,r14 shr r14,6 ror r15,19 xor r12,r13 xor r15,r14 add r12,QWORD[24+rsp] add r12,QWORD[80+rsp] mov r13,rcx add r12,r15 mov r14,r10 ror r13,23 mov r15,rdx xor r13,rcx ror r14,5 xor r15,r8 mov QWORD[80+rsp],r12 xor r14,r10 and r15,rcx ror r13,4 add r12,r9 xor r15,r8 ror r14,6 xor r13,rcx add r12,r15 mov r15,r10 add r12,QWORD[rbp] xor r14,r10 xor r15,r11 ror r13,14 mov r9,r11 and rdi,r15 ror r14,28 add r12,r13 xor r9,rdi add rbx,r12 add r9,r12 lea rbp,[8+rbp] mov r13,QWORD[96+rsp] mov rdi,QWORD[72+rsp] mov r12,r13 ror r13,7 add r9,r14 mov r14,rdi ror rdi,42 xor r13,r12 shr r12,7 ror r13,1 xor rdi,r14 shr r14,6 ror rdi,19 xor r12,r13 xor rdi,r14 add r12,QWORD[32+rsp] add r12,QWORD[88+rsp] mov r13,rbx add r12,rdi mov r14,r9 ror r13,23 mov rdi,rcx xor r13,rbx ror r14,5 xor rdi,rdx mov QWORD[88+rsp],r12 xor r14,r9 and rdi,rbx ror r13,4 add r12,r8 xor rdi,rdx ror r14,6 xor r13,rbx add r12,rdi mov rdi,r9 add r12,QWORD[rbp] xor r14,r9 xor rdi,r10 ror r13,14 mov r8,r10 and r15,rdi ror r14,28 add r12,r13 xor r8,r15 add rax,r12 add r8,r12 lea rbp,[24+rbp] mov r13,QWORD[104+rsp] mov r15,QWORD[80+rsp] mov r12,r13 ror r13,7 add r8,r14 mov r14,r15 ror r15,42 xor r13,r12 shr r12,7 ror r13,1 xor r15,r14 shr r14,6 ror r15,19 xor r12,r13 xor r15,r14 add r12,QWORD[40+rsp] add r12,QWORD[96+rsp] mov r13,rax add r12,r15 mov r14,r8 ror r13,23 mov r15,rbx xor r13,rax ror r14,5 xor r15,rcx mov QWORD[96+rsp],r12 xor r14,r8 and r15,rax ror r13,4 add r12,rdx xor r15,rcx ror r14,6 xor r13,rax add r12,r15 mov r15,r8 add r12,QWORD[rbp] xor r14,r8 xor r15,r9 ror r13,14 mov rdx,r9 and rdi,r15 ror r14,28 add r12,r13 xor rdx,rdi add r11,r12 add rdx,r12 lea rbp,[8+rbp] mov r13,QWORD[112+rsp] mov rdi,QWORD[88+rsp] mov r12,r13 ror r13,7 add rdx,r14 mov r14,rdi ror rdi,42 xor r13,r12 shr r12,7 ror r13,1 xor rdi,r14 shr r14,6 ror rdi,19 xor r12,r13 xor rdi,r14 add r12,QWORD[48+rsp] add r12,QWORD[104+rsp] mov r13,r11 add r12,rdi mov r14,rdx ror r13,23 mov rdi,rax xor r13,r11 ror r14,5 xor rdi,rbx mov QWORD[104+rsp],r12 xor r14,rdx and rdi,r11 ror r13,4 add r12,rcx xor rdi,rbx ror r14,6 xor r13,r11 add r12,rdi mov rdi,rdx add r12,QWORD[rbp] xor r14,rdx xor rdi,r8 ror r13,14 mov rcx,r8 and r15,rdi ror r14,28 add r12,r13 xor rcx,r15 add r10,r12 add rcx,r12 lea rbp,[24+rbp] mov r13,QWORD[120+rsp] mov r15,QWORD[96+rsp] mov r12,r13 ror r13,7 add rcx,r14 mov r14,r15 ror r15,42 xor r13,r12 shr r12,7 ror r13,1 xor r15,r14 shr r14,6 ror r15,19 xor r12,r13 xor r15,r14 add r12,QWORD[56+rsp] add r12,QWORD[112+rsp] mov r13,r10 add r12,r15 mov r14,rcx ror r13,23 mov r15,r11 xor r13,r10 ror r14,5 xor r15,rax mov QWORD[112+rsp],r12 xor r14,rcx and r15,r10 ror r13,4 add r12,rbx xor r15,rax ror r14,6 xor r13,r10 add r12,r15 mov r15,rcx add r12,QWORD[rbp] xor r14,rcx xor r15,rdx ror r13,14 mov rbx,rdx and rdi,r15 ror r14,28 add r12,r13 xor rbx,rdi add r9,r12 add rbx,r12 lea rbp,[8+rbp] mov r13,QWORD[rsp] mov rdi,QWORD[104+rsp] mov r12,r13 ror r13,7 add rbx,r14 mov r14,rdi ror rdi,42 xor r13,r12 shr r12,7 ror r13,1 xor rdi,r14 shr r14,6 ror rdi,19 xor r12,r13 xor rdi,r14 add r12,QWORD[64+rsp] add r12,QWORD[120+rsp] mov r13,r9 add r12,rdi mov r14,rbx ror r13,23 mov rdi,r10 xor r13,r9 ror r14,5 xor rdi,r11 mov QWORD[120+rsp],r12 xor r14,rbx and rdi,r9 ror r13,4 add r12,rax xor rdi,r11 ror r14,6 xor r13,r9 add r12,rdi mov rdi,rbx add r12,QWORD[rbp] xor r14,rbx xor rdi,rcx ror r13,14 mov rax,rcx and r15,rdi ror r14,28 add r12,r13 xor rax,r15 add r8,r12 add rax,r12 lea rbp,[24+rbp] cmp BYTE[7+rbp],0 jnz NEAR $L$rounds_16_xx mov rdi,QWORD[((128+0))+rsp] add rax,r14 lea rsi,[128+rsi] add rax,QWORD[rdi] add rbx,QWORD[8+rdi] add rcx,QWORD[16+rdi] add rdx,QWORD[24+rdi] add r8,QWORD[32+rdi] add r9,QWORD[40+rdi] add r10,QWORD[48+rdi] add r11,QWORD[56+rdi] cmp rsi,QWORD[((128+16))+rsp] mov QWORD[rdi],rax mov QWORD[8+rdi],rbx mov QWORD[16+rdi],rcx mov QWORD[24+rdi],rdx mov QWORD[32+rdi],r8 mov QWORD[40+rdi],r9 mov QWORD[48+rdi],r10 mov QWORD[56+rdi],r11 jb NEAR $L$loop mov rsi,QWORD[152+rsp] mov r15,QWORD[((-48))+rsi] mov r14,QWORD[((-40))+rsi] mov r13,QWORD[((-32))+rsi] mov r12,QWORD[((-24))+rsi] mov rbp,QWORD[((-16))+rsi] mov rbx,QWORD[((-8))+rsi] lea rsp,[rsi] $L$epilogue: mov rdi,QWORD[8+rsp] ;WIN64 epilogue mov rsi,QWORD[16+rsp] DB 0F3h,0C3h ;repret $L$SEH_end_sha512_block_data_order: section .rdata rdata align=8 ALIGN 64 K512: DQ 0x428a2f98d728ae22,0x7137449123ef65cd DQ 0x428a2f98d728ae22,0x7137449123ef65cd DQ 0xb5c0fbcfec4d3b2f,0xe9b5dba58189dbbc DQ 0xb5c0fbcfec4d3b2f,0xe9b5dba58189dbbc DQ 0x3956c25bf348b538,0x59f111f1b605d019 DQ 0x3956c25bf348b538,0x59f111f1b605d019 DQ 0x923f82a4af194f9b,0xab1c5ed5da6d8118 DQ 0x923f82a4af194f9b,0xab1c5ed5da6d8118 DQ 0xd807aa98a3030242,0x12835b0145706fbe DQ 0xd807aa98a3030242,0x12835b0145706fbe DQ 0x243185be4ee4b28c,0x550c7dc3d5ffb4e2 DQ 0x243185be4ee4b28c,0x550c7dc3d5ffb4e2 DQ 0x72be5d74f27b896f,0x80deb1fe3b1696b1 DQ 0x72be5d74f27b896f,0x80deb1fe3b1696b1 DQ 0x9bdc06a725c71235,0xc19bf174cf692694 DQ 0x9bdc06a725c71235,0xc19bf174cf692694 DQ 0xe49b69c19ef14ad2,0xefbe4786384f25e3 DQ 0xe49b69c19ef14ad2,0xefbe4786384f25e3 DQ 0x0fc19dc68b8cd5b5,0x240ca1cc77ac9c65 DQ 0x0fc19dc68b8cd5b5,0x240ca1cc77ac9c65 DQ 0x2de92c6f592b0275,0x4a7484aa6ea6e483 DQ 0x2de92c6f592b0275,0x4a7484aa6ea6e483 DQ 0x5cb0a9dcbd41fbd4,0x76f988da831153b5 DQ 0x5cb0a9dcbd41fbd4,0x76f988da831153b5 DQ 0x983e5152ee66dfab,0xa831c66d2db43210 DQ 0x983e5152ee66dfab,0xa831c66d2db43210 DQ 0xb00327c898fb213f,0xbf597fc7beef0ee4 DQ 0xb00327c898fb213f,0xbf597fc7beef0ee4 DQ 0xc6e00bf33da88fc2,0xd5a79147930aa725 DQ 0xc6e00bf33da88fc2,0xd5a79147930aa725 DQ 0x06ca6351e003826f,0x142929670a0e6e70 DQ 0x06ca6351e003826f,0x142929670a0e6e70 DQ 0x27b70a8546d22ffc,0x2e1b21385c26c926 DQ 0x27b70a8546d22ffc,0x2e1b21385c26c926 DQ 0x4d2c6dfc5ac42aed,0x53380d139d95b3df DQ 0x4d2c6dfc5ac42aed,0x53380d139d95b3df DQ 0x650a73548baf63de,0x766a0abb3c77b2a8 DQ 0x650a73548baf63de,0x766a0abb3c77b2a8 DQ 0x81c2c92e47edaee6,0x92722c851482353b DQ 0x81c2c92e47edaee6,0x92722c851482353b DQ 0xa2bfe8a14cf10364,0xa81a664bbc423001 DQ 0xa2bfe8a14cf10364,0xa81a664bbc423001 DQ 0xc24b8b70d0f89791,0xc76c51a30654be30 DQ 0xc24b8b70d0f89791,0xc76c51a30654be30 DQ 0xd192e819d6ef5218,0xd69906245565a910 DQ 0xd192e819d6ef5218,0xd69906245565a910 DQ 0xf40e35855771202a,0x106aa07032bbd1b8 DQ 0xf40e35855771202a,0x106aa07032bbd1b8 DQ 0x19a4c116b8d2d0c8,0x1e376c085141ab53 DQ 0x19a4c116b8d2d0c8,0x1e376c085141ab53 DQ 0x2748774cdf8eeb99,0x34b0bcb5e19b48a8 DQ 0x2748774cdf8eeb99,0x34b0bcb5e19b48a8 DQ 0x391c0cb3c5c95a63,0x4ed8aa4ae3418acb DQ 0x391c0cb3c5c95a63,0x4ed8aa4ae3418acb DQ 0x5b9cca4f7763e373,0x682e6ff3d6b2b8a3 DQ 0x5b9cca4f7763e373,0x682e6ff3d6b2b8a3 DQ 0x748f82ee5defb2fc,0x78a5636f43172f60 DQ 0x748f82ee5defb2fc,0x78a5636f43172f60 DQ 0x84c87814a1f0ab72,0x8cc702081a6439ec DQ 0x84c87814a1f0ab72,0x8cc702081a6439ec DQ 0x90befffa23631e28,0xa4506cebde82bde9 DQ 0x90befffa23631e28,0xa4506cebde82bde9 DQ 0xbef9a3f7b2c67915,0xc67178f2e372532b DQ 0xbef9a3f7b2c67915,0xc67178f2e372532b DQ 0xca273eceea26619c,0xd186b8c721c0c207 DQ 0xca273eceea26619c,0xd186b8c721c0c207 DQ 0xeada7dd6cde0eb1e,0xf57d4f7fee6ed178 DQ 0xeada7dd6cde0eb1e,0xf57d4f7fee6ed178 DQ 0x06f067aa72176fba,0x0a637dc5a2c898a6 DQ 0x06f067aa72176fba,0x0a637dc5a2c898a6 DQ 0x113f9804bef90dae,0x1b710b35131c471b DQ 0x113f9804bef90dae,0x1b710b35131c471b DQ 0x28db77f523047d84,0x32caab7b40c72493 DQ 0x28db77f523047d84,0x32caab7b40c72493 DQ 0x3c9ebe0a15c9bebc,0x431d67c49c100d4c DQ 0x3c9ebe0a15c9bebc,0x431d67c49c100d4c DQ 0x4cc5d4becb3e42b6,0x597f299cfc657e2a DQ 0x4cc5d4becb3e42b6,0x597f299cfc657e2a DQ 0x5fcb6fab3ad6faec,0x6c44198c4a475817 DQ 0x5fcb6fab3ad6faec,0x6c44198c4a475817 DQ 0x0001020304050607,0x08090a0b0c0d0e0f DQ 0x0001020304050607,0x08090a0b0c0d0e0f DB 83,72,65,53,49,50,32,98,108,111,99,107,32,116,114,97 DB 110,115,102,111,114,109,32,102,111,114,32,120,56,54,95,54 DB 52,44,32,67,82,89,80,84,79,71,65,77,83,32,98,121 DB 32,60,97,112,112,114,111,64,111,112,101,110,115,115,108,46 DB 111,114,103,62,0 section .text ALIGN 64 sha512_block_data_order_avx: mov QWORD[8+rsp],rdi ;WIN64 prologue mov QWORD[16+rsp],rsi mov rax,rsp $L$SEH_begin_sha512_block_data_order_avx: mov rdi,rcx mov rsi,rdx mov rdx,r8 $L$avx_shortcut: mov rax,rsp push rbx push rbp push r12 push r13 push r14 push r15 shl rdx,4 sub rsp,256 lea rdx,[rdx*8+rsi] and rsp,-64 mov QWORD[((128+0))+rsp],rdi mov QWORD[((128+8))+rsp],rsi mov QWORD[((128+16))+rsp],rdx mov QWORD[152+rsp],rax movaps XMMWORD[(128+32)+rsp],xmm6 movaps XMMWORD[(128+48)+rsp],xmm7 movaps XMMWORD[(128+64)+rsp],xmm8 movaps XMMWORD[(128+80)+rsp],xmm9 movaps XMMWORD[(128+96)+rsp],xmm10 movaps XMMWORD[(128+112)+rsp],xmm11 $L$prologue_avx: vzeroupper mov rax,QWORD[rdi] mov rbx,QWORD[8+rdi] mov rcx,QWORD[16+rdi] mov rdx,QWORD[24+rdi] mov r8,QWORD[32+rdi] mov r9,QWORD[40+rdi] mov r10,QWORD[48+rdi] mov r11,QWORD[56+rdi] jmp NEAR $L$loop_avx ALIGN 16 $L$loop_avx: vmovdqa xmm11,XMMWORD[((K512+1280))] vmovdqu xmm0,XMMWORD[rsi] lea rbp,[((K512+128))] vmovdqu xmm1,XMMWORD[16+rsi] vmovdqu xmm2,XMMWORD[32+rsi] vpshufb xmm0,xmm0,xmm11 vmovdqu xmm3,XMMWORD[48+rsi] vpshufb xmm1,xmm1,xmm11 vmovdqu xmm4,XMMWORD[64+rsi] vpshufb xmm2,xmm2,xmm11 vmovdqu xmm5,XMMWORD[80+rsi] vpshufb xmm3,xmm3,xmm11 vmovdqu xmm6,XMMWORD[96+rsi] vpshufb xmm4,xmm4,xmm11 vmovdqu xmm7,XMMWORD[112+rsi] vpshufb xmm5,xmm5,xmm11 vpaddq xmm8,xmm0,XMMWORD[((-128))+rbp] vpshufb xmm6,xmm6,xmm11 vpaddq xmm9,xmm1,XMMWORD[((-96))+rbp] vpshufb xmm7,xmm7,xmm11 vpaddq xmm10,xmm2,XMMWORD[((-64))+rbp] vpaddq xmm11,xmm3,XMMWORD[((-32))+rbp] vmovdqa XMMWORD[rsp],xmm8 vpaddq xmm8,xmm4,XMMWORD[rbp] vmovdqa XMMWORD[16+rsp],xmm9 vpaddq xmm9,xmm5,XMMWORD[32+rbp] vmovdqa XMMWORD[32+rsp],xmm10 vpaddq xmm10,xmm6,XMMWORD[64+rbp] vmovdqa XMMWORD[48+rsp],xmm11 vpaddq xmm11,xmm7,XMMWORD[96+rbp] vmovdqa XMMWORD[64+rsp],xmm8 mov r14,rax vmovdqa XMMWORD[80+rsp],xmm9 mov rdi,rbx vmovdqa XMMWORD[96+rsp],xmm10 xor rdi,rcx vmovdqa XMMWORD[112+rsp],xmm11 mov r13,r8 jmp NEAR $L$avx_00_47 ALIGN 16 $L$avx_00_47: add rbp,256 vpalignr xmm8,xmm1,xmm0,8 shrd r13,r13,23 mov rax,r14 vpalignr xmm11,xmm5,xmm4,8 mov r12,r9 shrd r14,r14,5 vpsrlq xmm10,xmm8,1 xor r13,r8 xor r12,r10 vpaddq xmm0,xmm0,xmm11 shrd r13,r13,4 xor r14,rax vpsrlq xmm11,xmm8,7 and r12,r8 xor r13,r8 vpsllq xmm9,xmm8,56 add r11,QWORD[rsp] mov r15,rax vpxor xmm8,xmm11,xmm10 xor r12,r10 shrd r14,r14,6 vpsrlq xmm10,xmm10,7 xor r15,rbx add r11,r12 vpxor xmm8,xmm8,xmm9 shrd r13,r13,14 and rdi,r15 vpsllq xmm9,xmm9,7 xor r14,rax add r11,r13 vpxor xmm8,xmm8,xmm10 xor rdi,rbx shrd r14,r14,28 vpsrlq xmm11,xmm7,6 add rdx,r11 add r11,rdi vpxor xmm8,xmm8,xmm9 mov r13,rdx add r14,r11 vpsllq xmm10,xmm7,3 shrd r13,r13,23 mov r11,r14 vpaddq xmm0,xmm0,xmm8 mov r12,r8 shrd r14,r14,5 vpsrlq xmm9,xmm7,19 xor r13,rdx xor r12,r9 vpxor xmm11,xmm11,xmm10 shrd r13,r13,4 xor r14,r11 vpsllq xmm10,xmm10,42 and r12,rdx xor r13,rdx vpxor xmm11,xmm11,xmm9 add r10,QWORD[8+rsp] mov rdi,r11 vpsrlq xmm9,xmm9,42 xor r12,r9 shrd r14,r14,6 vpxor xmm11,xmm11,xmm10 xor rdi,rax add r10,r12 vpxor xmm11,xmm11,xmm9 shrd r13,r13,14 and r15,rdi vpaddq xmm0,xmm0,xmm11 xor r14,r11 add r10,r13 vpaddq xmm10,xmm0,XMMWORD[((-128))+rbp] xor r15,rax shrd r14,r14,28 add rcx,r10 add r10,r15 mov r13,rcx add r14,r10 vmovdqa XMMWORD[rsp],xmm10 vpalignr xmm8,xmm2,xmm1,8 shrd r13,r13,23 mov r10,r14 vpalignr xmm11,xmm6,xmm5,8 mov r12,rdx shrd r14,r14,5 vpsrlq xmm10,xmm8,1 xor r13,rcx xor r12,r8 vpaddq xmm1,xmm1,xmm11 shrd r13,r13,4 xor r14,r10 vpsrlq xmm11,xmm8,7 and r12,rcx xor r13,rcx vpsllq xmm9,xmm8,56 add r9,QWORD[16+rsp] mov r15,r10 vpxor xmm8,xmm11,xmm10 xor r12,r8 shrd r14,r14,6 vpsrlq xmm10,xmm10,7 xor r15,r11 add r9,r12 vpxor xmm8,xmm8,xmm9 shrd r13,r13,14 and rdi,r15 vpsllq xmm9,xmm9,7 xor r14,r10 add r9,r13 vpxor xmm8,xmm8,xmm10 xor rdi,r11 shrd r14,r14,28 vpsrlq xmm11,xmm0,6 add rbx,r9 add r9,rdi vpxor xmm8,xmm8,xmm9 mov r13,rbx add r14,r9 vpsllq xmm10,xmm0,3 shrd r13,r13,23 mov r9,r14 vpaddq xmm1,xmm1,xmm8 mov r12,rcx shrd r14,r14,5 vpsrlq xmm9,xmm0,19 xor r13,rbx xor r12,rdx vpxor xmm11,xmm11,xmm10 shrd r13,r13,4 xor r14,r9 vpsllq xmm10,xmm10,42 and r12,rbx xor r13,rbx vpxor xmm11,xmm11,xmm9 add r8,QWORD[24+rsp] mov rdi,r9 vpsrlq xmm9,xmm9,42 xor r12,rdx shrd r14,r14,6 vpxor xmm11,xmm11,xmm10 xor rdi,r10 add r8,r12 vpxor xmm11,xmm11,xmm9 shrd r13,r13,14 and r15,rdi vpaddq xmm1,xmm1,xmm11 xor r14,r9 add r8,r13 vpaddq xmm10,xmm1,XMMWORD[((-96))+rbp] xor r15,r10 shrd r14,r14,28 add rax,r8 add r8,r15 mov r13,rax add r14,r8 vmovdqa XMMWORD[16+rsp],xmm10 vpalignr xmm8,xmm3,xmm2,8 shrd r13,r13,23 mov r8,r14 vpalignr xmm11,xmm7,xmm6,8 mov r12,rbx shrd r14,r14,5 vpsrlq xmm10,xmm8,1 xor r13,rax xor r12,rcx vpaddq xmm2,xmm2,xmm11 shrd r13,r13,4 xor r14,r8 vpsrlq xmm11,xmm8,7 and r12,rax xor r13,rax vpsllq xmm9,xmm8,56 add rdx,QWORD[32+rsp] mov r15,r8 vpxor xmm8,xmm11,xmm10 xor r12,rcx shrd r14,r14,6 vpsrlq xmm10,xmm10,7 xor r15,r9 add rdx,r12 vpxor xmm8,xmm8,xmm9 shrd r13,r13,14 and rdi,r15 vpsllq xmm9,xmm9,7 xor r14,r8 add rdx,r13 vpxor xmm8,xmm8,xmm10 xor rdi,r9 shrd r14,r14,28 vpsrlq xmm11,xmm1,6 add r11,rdx add rdx,rdi vpxor xmm8,xmm8,xmm9 mov r13,r11 add r14,rdx vpsllq xmm10,xmm1,3 shrd r13,r13,23 mov rdx,r14 vpaddq xmm2,xmm2,xmm8 mov r12,rax shrd r14,r14,5 vpsrlq xmm9,xmm1,19 xor r13,r11 xor r12,rbx vpxor xmm11,xmm11,xmm10 shrd r13,r13,4 xor r14,rdx vpsllq xmm10,xmm10,42 and r12,r11 xor r13,r11 vpxor xmm11,xmm11,xmm9 add rcx,QWORD[40+rsp] mov rdi,rdx vpsrlq xmm9,xmm9,42 xor r12,rbx shrd r14,r14,6 vpxor xmm11,xmm11,xmm10 xor rdi,r8 add rcx,r12 vpxor xmm11,xmm11,xmm9 shrd r13,r13,14 and r15,rdi vpaddq xmm2,xmm2,xmm11 xor r14,rdx add rcx,r13 vpaddq xmm10,xmm2,XMMWORD[((-64))+rbp] xor r15,r8 shrd r14,r14,28 add r10,rcx add rcx,r15 mov r13,r10 add r14,rcx vmovdqa XMMWORD[32+rsp],xmm10 vpalignr xmm8,xmm4,xmm3,8 shrd r13,r13,23 mov rcx,r14 vpalignr xmm11,xmm0,xmm7,8 mov r12,r11 shrd r14,r14,5 vpsrlq xmm10,xmm8,1 xor r13,r10 xor r12,rax vpaddq xmm3,xmm3,xmm11 shrd r13,r13,4 xor r14,rcx vpsrlq xmm11,xmm8,7 and r12,r10 xor r13,r10 vpsllq xmm9,xmm8,56 add rbx,QWORD[48+rsp] mov r15,rcx vpxor xmm8,xmm11,xmm10 xor r12,rax shrd r14,r14,6 vpsrlq xmm10,xmm10,7 xor r15,rdx add rbx,r12 vpxor xmm8,xmm8,xmm9 shrd r13,r13,14 and rdi,r15 vpsllq xmm9,xmm9,7 xor r14,rcx add rbx,r13 vpxor xmm8,xmm8,xmm10 xor rdi,rdx shrd r14,r14,28 vpsrlq xmm11,xmm2,6 add r9,rbx add rbx,rdi vpxor xmm8,xmm8,xmm9 mov r13,r9 add r14,rbx vpsllq xmm10,xmm2,3 shrd r13,r13,23 mov rbx,r14 vpaddq xmm3,xmm3,xmm8 mov r12,r10 shrd r14,r14,5 vpsrlq xmm9,xmm2,19 xor r13,r9 xor r12,r11 vpxor xmm11,xmm11,xmm10 shrd r13,r13,4 xor r14,rbx vpsllq xmm10,xmm10,42 and r12,r9 xor r13,r9 vpxor xmm11,xmm11,xmm9 add rax,QWORD[56+rsp] mov rdi,rbx vpsrlq xmm9,xmm9,42 xor r12,r11 shrd r14,r14,6 vpxor xmm11,xmm11,xmm10 xor rdi,rcx add rax,r12 vpxor xmm11,xmm11,xmm9 shrd r13,r13,14 and r15,rdi vpaddq xmm3,xmm3,xmm11 xor r14,rbx add rax,r13 vpaddq xmm10,xmm3,XMMWORD[((-32))+rbp] xor r15,rcx shrd r14,r14,28 add r8,rax add rax,r15 mov r13,r8 add r14,rax vmovdqa XMMWORD[48+rsp],xmm10 vpalignr xmm8,xmm5,xmm4,8 shrd r13,r13,23 mov rax,r14 vpalignr xmm11,xmm1,xmm0,8 mov r12,r9 shrd r14,r14,5 vpsrlq xmm10,xmm8,1 xor r13,r8 xor r12,r10 vpaddq xmm4,xmm4,xmm11 shrd r13,r13,4 xor r14,rax vpsrlq xmm11,xmm8,7 and r12,r8 xor r13,r8 vpsllq xmm9,xmm8,56 add r11,QWORD[64+rsp] mov r15,rax vpxor xmm8,xmm11,xmm10 xor r12,r10 shrd r14,r14,6 vpsrlq xmm10,xmm10,7 xor r15,rbx add r11,r12 vpxor xmm8,xmm8,xmm9 shrd r13,r13,14 and rdi,r15 vpsllq xmm9,xmm9,7 xor r14,rax add r11,r13 vpxor xmm8,xmm8,xmm10 xor rdi,rbx shrd r14,r14,28 vpsrlq xmm11,xmm3,6 add rdx,r11 add r11,rdi vpxor xmm8,xmm8,xmm9 mov r13,rdx add r14,r11 vpsllq xmm10,xmm3,3 shrd r13,r13,23 mov r11,r14 vpaddq xmm4,xmm4,xmm8 mov r12,r8 shrd r14,r14,5 vpsrlq xmm9,xmm3,19 xor r13,rdx xor r12,r9 vpxor xmm11,xmm11,xmm10 shrd r13,r13,4 xor r14,r11 vpsllq xmm10,xmm10,42 and r12,rdx xor r13,rdx vpxor xmm11,xmm11,xmm9 add r10,QWORD[72+rsp] mov rdi,r11 vpsrlq xmm9,xmm9,42 xor r12,r9 shrd r14,r14,6 vpxor xmm11,xmm11,xmm10 xor rdi,rax add r10,r12 vpxor xmm11,xmm11,xmm9 shrd r13,r13,14 and r15,rdi vpaddq xmm4,xmm4,xmm11 xor r14,r11 add r10,r13 vpaddq xmm10,xmm4,XMMWORD[rbp] xor r15,rax shrd r14,r14,28 add rcx,r10 add r10,r15 mov r13,rcx add r14,r10 vmovdqa XMMWORD[64+rsp],xmm10 vpalignr xmm8,xmm6,xmm5,8 shrd r13,r13,23 mov r10,r14 vpalignr xmm11,xmm2,xmm1,8 mov r12,rdx shrd r14,r14,5 vpsrlq xmm10,xmm8,1 xor r13,rcx xor r12,r8 vpaddq xmm5,xmm5,xmm11 shrd r13,r13,4 xor r14,r10 vpsrlq xmm11,xmm8,7 and r12,rcx xor r13,rcx vpsllq xmm9,xmm8,56 add r9,QWORD[80+rsp] mov r15,r10 vpxor xmm8,xmm11,xmm10 xor r12,r8 shrd r14,r14,6 vpsrlq xmm10,xmm10,7 xor r15,r11 add r9,r12 vpxor xmm8,xmm8,xmm9 shrd r13,r13,14 and rdi,r15 vpsllq xmm9,xmm9,7 xor r14,r10 add r9,r13 vpxor xmm8,xmm8,xmm10 xor rdi,r11 shrd r14,r14,28 vpsrlq xmm11,xmm4,6 add rbx,r9 add r9,rdi vpxor xmm8,xmm8,xmm9 mov r13,rbx add r14,r9 vpsllq xmm10,xmm4,3 shrd r13,r13,23 mov r9,r14 vpaddq xmm5,xmm5,xmm8 mov r12,rcx shrd r14,r14,5 vpsrlq xmm9,xmm4,19 xor r13,rbx xor r12,rdx vpxor xmm11,xmm11,xmm10 shrd r13,r13,4 xor r14,r9 vpsllq xmm10,xmm10,42 and r12,rbx xor r13,rbx vpxor xmm11,xmm11,xmm9 add r8,QWORD[88+rsp] mov rdi,r9 vpsrlq xmm9,xmm9,42 xor r12,rdx shrd r14,r14,6 vpxor xmm11,xmm11,xmm10 xor rdi,r10 add r8,r12 vpxor xmm11,xmm11,xmm9 shrd r13,r13,14 and r15,rdi vpaddq xmm5,xmm5,xmm11 xor r14,r9 add r8,r13 vpaddq xmm10,xmm5,XMMWORD[32+rbp] xor r15,r10 shrd r14,r14,28 add rax,r8 add r8,r15 mov r13,rax add r14,r8 vmovdqa XMMWORD[80+rsp],xmm10 vpalignr xmm8,xmm7,xmm6,8 shrd r13,r13,23 mov r8,r14 vpalignr xmm11,xmm3,xmm2,8 mov r12,rbx shrd r14,r14,5 vpsrlq xmm10,xmm8,1 xor r13,rax xor r12,rcx vpaddq xmm6,xmm6,xmm11 shrd r13,r13,4 xor r14,r8 vpsrlq xmm11,xmm8,7 and r12,rax xor r13,rax vpsllq xmm9,xmm8,56 add rdx,QWORD[96+rsp] mov r15,r8 vpxor xmm8,xmm11,xmm10 xor r12,rcx shrd r14,r14,6 vpsrlq xmm10,xmm10,7 xor r15,r9 add rdx,r12 vpxor xmm8,xmm8,xmm9 shrd r13,r13,14 and rdi,r15 vpsllq xmm9,xmm9,7 xor r14,r8 add rdx,r13 vpxor xmm8,xmm8,xmm10 xor rdi,r9 shrd r14,r14,28 vpsrlq xmm11,xmm5,6 add r11,rdx add rdx,rdi vpxor xmm8,xmm8,xmm9 mov r13,r11 add r14,rdx vpsllq xmm10,xmm5,3 shrd r13,r13,23 mov rdx,r14 vpaddq xmm6,xmm6,xmm8 mov r12,rax shrd r14,r14,5 vpsrlq xmm9,xmm5,19 xor r13,r11 xor r12,rbx vpxor xmm11,xmm11,xmm10 shrd r13,r13,4 xor r14,rdx vpsllq xmm10,xmm10,42 and r12,r11 xor r13,r11 vpxor xmm11,xmm11,xmm9 add rcx,QWORD[104+rsp] mov rdi,rdx vpsrlq xmm9,xmm9,42 xor r12,rbx shrd r14,r14,6 vpxor xmm11,xmm11,xmm10 xor rdi,r8 add rcx,r12 vpxor xmm11,xmm11,xmm9 shrd r13,r13,14 and r15,rdi vpaddq xmm6,xmm6,xmm11 xor r14,rdx add rcx,r13 vpaddq xmm10,xmm6,XMMWORD[64+rbp] xor r15,r8 shrd r14,r14,28 add r10,rcx add rcx,r15 mov r13,r10 add r14,rcx vmovdqa XMMWORD[96+rsp],xmm10 vpalignr xmm8,xmm0,xmm7,8 shrd r13,r13,23 mov rcx,r14 vpalignr xmm11,xmm4,xmm3,8 mov r12,r11 shrd r14,r14,5 vpsrlq xmm10,xmm8,1 xor r13,r10 xor r12,rax vpaddq xmm7,xmm7,xmm11 shrd r13,r13,4 xor r14,rcx vpsrlq xmm11,xmm8,7 and r12,r10 xor r13,r10 vpsllq xmm9,xmm8,56 add rbx,QWORD[112+rsp] mov r15,rcx vpxor xmm8,xmm11,xmm10 xor r12,rax shrd r14,r14,6 vpsrlq xmm10,xmm10,7 xor r15,rdx add rbx,r12 vpxor xmm8,xmm8,xmm9 shrd r13,r13,14 and rdi,r15 vpsllq xmm9,xmm9,7 xor r14,rcx add rbx,r13 vpxor xmm8,xmm8,xmm10 xor rdi,rdx shrd r14,r14,28 vpsrlq xmm11,xmm6,6 add r9,rbx add rbx,rdi vpxor xmm8,xmm8,xmm9 mov r13,r9 add r14,rbx vpsllq xmm10,xmm6,3 shrd r13,r13,23 mov rbx,r14 vpaddq xmm7,xmm7,xmm8 mov r12,r10 shrd r14,r14,5 vpsrlq xmm9,xmm6,19 xor r13,r9 xor r12,r11 vpxor xmm11,xmm11,xmm10 shrd r13,r13,4 xor r14,rbx vpsllq xmm10,xmm10,42 and r12,r9 xor r13,r9 vpxor xmm11,xmm11,xmm9 add rax,QWORD[120+rsp] mov rdi,rbx vpsrlq xmm9,xmm9,42 xor r12,r11 shrd r14,r14,6 vpxor xmm11,xmm11,xmm10 xor rdi,rcx add rax,r12 vpxor xmm11,xmm11,xmm9 shrd r13,r13,14 and r15,rdi vpaddq xmm7,xmm7,xmm11 xor r14,rbx add rax,r13 vpaddq xmm10,xmm7,XMMWORD[96+rbp] xor r15,rcx shrd r14,r14,28 add r8,rax add rax,r15 mov r13,r8 add r14,rax vmovdqa XMMWORD[112+rsp],xmm10 cmp BYTE[135+rbp],0 jne NEAR $L$avx_00_47 shrd r13,r13,23 mov rax,r14 mov r12,r9 shrd r14,r14,5 xor r13,r8 xor r12,r10 shrd r13,r13,4 xor r14,rax and r12,r8 xor r13,r8 add r11,QWORD[rsp] mov r15,rax xor r12,r10 shrd r14,r14,6 xor r15,rbx add r11,r12 shrd r13,r13,14 and rdi,r15 xor r14,rax add r11,r13 xor rdi,rbx shrd r14,r14,28 add rdx,r11 add r11,rdi mov r13,rdx add r14,r11 shrd r13,r13,23 mov r11,r14 mov r12,r8 shrd r14,r14,5 xor r13,rdx xor r12,r9 shrd r13,r13,4 xor r14,r11 and r12,rdx xor r13,rdx add r10,QWORD[8+rsp] mov rdi,r11 xor r12,r9 shrd r14,r14,6 xor rdi,rax add r10,r12 shrd r13,r13,14 and r15,rdi xor r14,r11 add r10,r13 xor r15,rax shrd r14,r14,28 add rcx,r10 add r10,r15 mov r13,rcx add r14,r10 shrd r13,r13,23 mov r10,r14 mov r12,rdx shrd r14,r14,5 xor r13,rcx xor r12,r8 shrd r13,r13,4 xor r14,r10 and r12,rcx xor r13,rcx add r9,QWORD[16+rsp] mov r15,r10 xor r12,r8 shrd r14,r14,6 xor r15,r11 add r9,r12 shrd r13,r13,14 and rdi,r15 xor r14,r10 add r9,r13 xor rdi,r11 shrd r14,r14,28 add rbx,r9 add r9,rdi mov r13,rbx add r14,r9 shrd r13,r13,23 mov r9,r14 mov r12,rcx shrd r14,r14,5 xor r13,rbx xor r12,rdx shrd r13,r13,4 xor r14,r9 and r12,rbx xor r13,rbx add r8,QWORD[24+rsp] mov rdi,r9 xor r12,rdx shrd r14,r14,6 xor rdi,r10 add r8,r12 shrd r13,r13,14 and r15,rdi xor r14,r9 add r8,r13 xor r15,r10 shrd r14,r14,28 add rax,r8 add r8,r15 mov r13,rax add r14,r8 shrd r13,r13,23 mov r8,r14 mov r12,rbx shrd r14,r14,5 xor r13,rax xor r12,rcx shrd r13,r13,4 xor r14,r8 and r12,rax xor r13,rax add rdx,QWORD[32+rsp] mov r15,r8 xor r12,rcx shrd r14,r14,6 xor r15,r9 add rdx,r12 shrd r13,r13,14 and rdi,r15 xor r14,r8 add rdx,r13 xor rdi,r9 shrd r14,r14,28 add r11,rdx add rdx,rdi mov r13,r11 add r14,rdx shrd r13,r13,23 mov rdx,r14 mov r12,rax shrd r14,r14,5 xor r13,r11 xor r12,rbx shrd r13,r13,4 xor r14,rdx and r12,r11 xor r13,r11 add rcx,QWORD[40+rsp] mov rdi,rdx xor r12,rbx shrd r14,r14,6 xor rdi,r8 add rcx,r12 shrd r13,r13,14 and r15,rdi xor r14,rdx add rcx,r13 xor r15,r8 shrd r14,r14,28 add r10,rcx add rcx,r15 mov r13,r10 add r14,rcx shrd r13,r13,23 mov rcx,r14 mov r12,r11 shrd r14,r14,5 xor r13,r10 xor r12,rax shrd r13,r13,4 xor r14,rcx and r12,r10 xor r13,r10 add rbx,QWORD[48+rsp] mov r15,rcx xor r12,rax shrd r14,r14,6 xor r15,rdx add rbx,r12 shrd r13,r13,14 and rdi,r15 xor r14,rcx add rbx,r13 xor rdi,rdx shrd r14,r14,28 add r9,rbx add rbx,rdi mov r13,r9 add r14,rbx shrd r13,r13,23 mov rbx,r14 mov r12,r10 shrd r14,r14,5 xor r13,r9 xor r12,r11 shrd r13,r13,4 xor r14,rbx and r12,r9 xor r13,r9 add rax,QWORD[56+rsp] mov rdi,rbx xor r12,r11 shrd r14,r14,6 xor rdi,rcx add rax,r12 shrd r13,r13,14 and r15,rdi xor r14,rbx add rax,r13 xor r15,rcx shrd r14,r14,28 add r8,rax add rax,r15 mov r13,r8 add r14,rax shrd r13,r13,23 mov rax,r14 mov r12,r9 shrd r14,r14,5 xor r13,r8 xor r12,r10 shrd r13,r13,4 xor r14,rax and r12,r8 xor r13,r8 add r11,QWORD[64+rsp] mov r15,rax xor r12,r10 shrd r14,r14,6 xor r15,rbx add r11,r12 shrd r13,r13,14 and rdi,r15 xor r14,rax add r11,r13 xor rdi,rbx shrd r14,r14,28 add rdx,r11 add r11,rdi mov r13,rdx add r14,r11 shrd r13,r13,23 mov r11,r14 mov r12,r8 shrd r14,r14,5 xor r13,rdx xor r12,r9 shrd r13,r13,4 xor r14,r11 and r12,rdx xor r13,rdx add r10,QWORD[72+rsp] mov rdi,r11 xor r12,r9 shrd r14,r14,6 xor rdi,rax add r10,r12 shrd r13,r13,14 and r15,rdi xor r14,r11 add r10,r13 xor r15,rax shrd r14,r14,28 add rcx,r10 add r10,r15 mov r13,rcx add r14,r10 shrd r13,r13,23 mov r10,r14 mov r12,rdx shrd r14,r14,5 xor r13,rcx xor r12,r8 shrd r13,r13,4 xor r14,r10 and r12,rcx xor r13,rcx add r9,QWORD[80+rsp] mov r15,r10 xor r12,r8 shrd r14,r14,6 xor r15,r11 add r9,r12 shrd r13,r13,14 and rdi,r15 xor r14,r10 add r9,r13 xor rdi,r11 shrd r14,r14,28 add rbx,r9 add r9,rdi mov r13,rbx add r14,r9 shrd r13,r13,23 mov r9,r14 mov r12,rcx shrd r14,r14,5 xor r13,rbx xor r12,rdx shrd r13,r13,4 xor r14,r9 and r12,rbx xor r13,rbx add r8,QWORD[88+rsp] mov rdi,r9 xor r12,rdx shrd r14,r14,6 xor rdi,r10 add r8,r12 shrd r13,r13,14 and r15,rdi xor r14,r9 add r8,r13 xor r15,r10 shrd r14,r14,28 add rax,r8 add r8,r15 mov r13,rax add r14,r8 shrd r13,r13,23 mov r8,r14 mov r12,rbx shrd r14,r14,5 xor r13,rax xor r12,rcx shrd r13,r13,4 xor r14,r8 and r12,rax xor r13,rax add rdx,QWORD[96+rsp] mov r15,r8 xor r12,rcx shrd r14,r14,6 xor r15,r9 add rdx,r12 shrd r13,r13,14 and rdi,r15 xor r14,r8 add rdx,r13 xor rdi,r9 shrd r14,r14,28 add r11,rdx add rdx,rdi mov r13,r11 add r14,rdx shrd r13,r13,23 mov rdx,r14 mov r12,rax shrd r14,r14,5 xor r13,r11 xor r12,rbx shrd r13,r13,4 xor r14,rdx and r12,r11 xor r13,r11 add rcx,QWORD[104+rsp] mov rdi,rdx xor r12,rbx shrd r14,r14,6 xor rdi,r8 add rcx,r12 shrd r13,r13,14 and r15,rdi xor r14,rdx add rcx,r13 xor r15,r8 shrd r14,r14,28 add r10,rcx add rcx,r15 mov r13,r10 add r14,rcx shrd r13,r13,23 mov rcx,r14 mov r12,r11 shrd r14,r14,5 xor r13,r10 xor r12,rax shrd r13,r13,4 xor r14,rcx and r12,r10 xor r13,r10 add rbx,QWORD[112+rsp] mov r15,rcx xor r12,rax shrd r14,r14,6 xor r15,rdx add rbx,r12 shrd r13,r13,14 and rdi,r15 xor r14,rcx add rbx,r13 xor rdi,rdx shrd r14,r14,28 add r9,rbx add rbx,rdi mov r13,r9 add r14,rbx shrd r13,r13,23 mov rbx,r14 mov r12,r10 shrd r14,r14,5 xor r13,r9 xor r12,r11 shrd r13,r13,4 xor r14,rbx and r12,r9 xor r13,r9 add rax,QWORD[120+rsp] mov rdi,rbx xor r12,r11 shrd r14,r14,6 xor rdi,rcx add rax,r12 shrd r13,r13,14 and r15,rdi xor r14,rbx add rax,r13 xor r15,rcx shrd r14,r14,28 add r8,rax add rax,r15 mov r13,r8 add r14,rax mov rdi,QWORD[((128+0))+rsp] mov rax,r14 add rax,QWORD[rdi] lea rsi,[128+rsi] add rbx,QWORD[8+rdi] add rcx,QWORD[16+rdi] add rdx,QWORD[24+rdi] add r8,QWORD[32+rdi] add r9,QWORD[40+rdi] add r10,QWORD[48+rdi] add r11,QWORD[56+rdi] cmp rsi,QWORD[((128+16))+rsp] mov QWORD[rdi],rax mov QWORD[8+rdi],rbx mov QWORD[16+rdi],rcx mov QWORD[24+rdi],rdx mov QWORD[32+rdi],r8 mov QWORD[40+rdi],r9 mov QWORD[48+rdi],r10 mov QWORD[56+rdi],r11 jb NEAR $L$loop_avx mov rsi,QWORD[152+rsp] vzeroupper movaps xmm6,XMMWORD[((128+32))+rsp] movaps xmm7,XMMWORD[((128+48))+rsp] movaps xmm8,XMMWORD[((128+64))+rsp] movaps xmm9,XMMWORD[((128+80))+rsp] movaps xmm10,XMMWORD[((128+96))+rsp] movaps xmm11,XMMWORD[((128+112))+rsp] mov r15,QWORD[((-48))+rsi] mov r14,QWORD[((-40))+rsi] mov r13,QWORD[((-32))+rsi] mov r12,QWORD[((-24))+rsi] mov rbp,QWORD[((-16))+rsi] mov rbx,QWORD[((-8))+rsi] lea rsp,[rsi] $L$epilogue_avx: mov rdi,QWORD[8+rsp] ;WIN64 epilogue mov rsi,QWORD[16+rsp] DB 0F3h,0C3h ;repret $L$SEH_end_sha512_block_data_order_avx: EXTERN __imp_RtlVirtualUnwind ALIGN 16 se_handler: push rsi push rdi push rbx push rbp push r12 push r13 push r14 push r15 pushfq sub rsp,64 mov rax,QWORD[120+r8] mov rbx,QWORD[248+r8] mov rsi,QWORD[8+r9] mov r11,QWORD[56+r9] mov r10d,DWORD[r11] lea r10,[r10*1+rsi] cmp rbx,r10 jb NEAR $L$in_prologue mov rax,QWORD[152+r8] mov r10d,DWORD[4+r11] lea r10,[r10*1+rsi] cmp rbx,r10 jae NEAR $L$in_prologue mov rsi,rax mov rax,QWORD[((128+24))+rax] mov rbx,QWORD[((-8))+rax] mov rbp,QWORD[((-16))+rax] mov r12,QWORD[((-24))+rax] mov r13,QWORD[((-32))+rax] mov r14,QWORD[((-40))+rax] mov r15,QWORD[((-48))+rax] mov QWORD[144+r8],rbx mov QWORD[160+r8],rbp mov QWORD[216+r8],r12 mov QWORD[224+r8],r13 mov QWORD[232+r8],r14 mov QWORD[240+r8],r15 lea r10,[$L$epilogue] cmp rbx,r10 jb NEAR $L$in_prologue lea rsi,[((128+32))+rsi] lea rdi,[512+r8] mov ecx,12 DD 0xa548f3fc $L$in_prologue: mov rdi,QWORD[8+rax] mov rsi,QWORD[16+rax] mov QWORD[152+r8],rax mov QWORD[168+r8],rsi mov QWORD[176+r8],rdi mov rdi,QWORD[40+r9] mov rsi,r8 mov ecx,154 DD 0xa548f3fc mov rsi,r9 xor rcx,rcx mov rdx,QWORD[8+rsi] mov r8,QWORD[rsi] mov r9,QWORD[16+rsi] mov r10,QWORD[40+rsi] lea r11,[56+rsi] lea r12,[24+rsi] mov QWORD[32+rsp],r10 mov QWORD[40+rsp],r11 mov QWORD[48+rsp],r12 mov QWORD[56+rsp],rcx call QWORD[__imp_RtlVirtualUnwind] mov eax,1 add rsp,64 popfq pop r15 pop r14 pop r13 pop r12 pop rbp pop rbx pop rdi pop rsi DB 0F3h,0C3h ;repret section .pdata rdata align=4 ALIGN 4 DD $L$SEH_begin_sha512_block_data_order wrt ..imagebase DD $L$SEH_end_sha512_block_data_order wrt ..imagebase DD $L$SEH_info_sha512_block_data_order wrt ..imagebase DD $L$SEH_begin_sha512_block_data_order_avx wrt ..imagebase DD $L$SEH_end_sha512_block_data_order_avx wrt ..imagebase DD $L$SEH_info_sha512_block_data_order_avx wrt ..imagebase section .xdata rdata align=8 ALIGN 8 $L$SEH_info_sha512_block_data_order: DB 9,0,0,0 DD se_handler wrt ..imagebase DD $L$prologue wrt ..imagebase,$L$epilogue wrt ..imagebase $L$SEH_info_sha512_block_data_order_avx: DB 9,0,0,0 DD se_handler wrt ..imagebase DD $L$prologue_avx wrt ..imagebase,$L$epilogue_avx wrt ..imagebase %else ; Work around https://bugzilla.nasm.us/show_bug.cgi?id=3392738 ret %endif