ref: 94f2907dc40a6415a10c252cb9ba3971f1f7e838
dir: /third_party/boringssl/src/gen/bcm/aesni-x86-win.asm/
; This file is generated from a similarly-named Perl script in the BoringSSL ; source tree. Do not edit by hand. %ifdef BORINGSSL_PREFIX %include "boringssl_prefix_symbols_nasm.inc" %endif %ifidn __OUTPUT_FORMAT__, win32 %ifidn __OUTPUT_FORMAT__,obj section code use32 class=code align=64 %elifidn __OUTPUT_FORMAT__,win32 [email protected] equ 1 section .text code align=64 %else section .text code %endif %ifdef BORINGSSL_DISPATCH_TEST extern _BORINGSSL_function_hit %endif global _aes_hw_encrypt align 16 _aes_hw_encrypt: L$_aes_hw_encrypt_begin: %ifdef BORINGSSL_DISPATCH_TEST push ebx push edx call L$000pic_for_function_hit L$000pic_for_function_hit: pop ebx lea ebx,[(_BORINGSSL_function_hit+1-L$000pic_for_function_hit)+ebx] mov edx,1 mov BYTE [ebx],dl pop edx pop ebx %endif mov eax,DWORD [4+esp] mov edx,DWORD [12+esp] movups xmm2,[eax] mov ecx,DWORD [240+edx] mov eax,DWORD [8+esp] movups xmm0,[edx] movups xmm1,[16+edx] lea edx,[32+edx] xorps xmm2,xmm0 L$001enc1_loop_1: db 102,15,56,220,209 dec ecx movups xmm1,[edx] lea edx,[16+edx] jnz NEAR L$001enc1_loop_1 db 102,15,56,221,209 pxor xmm0,xmm0 pxor xmm1,xmm1 movups [eax],xmm2 pxor xmm2,xmm2 ret global _aes_hw_decrypt align 16 _aes_hw_decrypt: L$_aes_hw_decrypt_begin: mov eax,DWORD [4+esp] mov edx,DWORD [12+esp] movups xmm2,[eax] mov ecx,DWORD [240+edx] mov eax,DWORD [8+esp] movups xmm0,[edx] movups xmm1,[16+edx] lea edx,[32+edx] xorps xmm2,xmm0 L$002dec1_loop_2: db 102,15,56,222,209 dec ecx movups xmm1,[edx] lea edx,[16+edx] jnz NEAR L$002dec1_loop_2 db 102,15,56,223,209 pxor xmm0,xmm0 pxor xmm1,xmm1 movups [eax],xmm2 pxor xmm2,xmm2 ret align 16 __aesni_encrypt2: movups xmm0,[edx] shl ecx,4 movups xmm1,[16+edx] xorps xmm2,xmm0 pxor xmm3,xmm0 movups xmm0,[32+edx] lea edx,[32+ecx*1+edx] neg ecx add ecx,16 L$003enc2_loop: db 102,15,56,220,209 db 102,15,56,220,217 movups xmm1,[ecx*1+edx] add ecx,32 db 102,15,56,220,208 db 102,15,56,220,216 movups xmm0,[ecx*1+edx-16] jnz NEAR L$003enc2_loop db 102,15,56,220,209 db 102,15,56,220,217 db 102,15,56,221,208 db 102,15,56,221,216 ret align 16 __aesni_decrypt2: movups xmm0,[edx] shl ecx,4 movups xmm1,[16+edx] xorps xmm2,xmm0 pxor xmm3,xmm0 movups xmm0,[32+edx] lea edx,[32+ecx*1+edx] neg ecx add ecx,16 L$004dec2_loop: db 102,15,56,222,209 db 102,15,56,222,217 movups xmm1,[ecx*1+edx] add ecx,32 db 102,15,56,222,208 db 102,15,56,222,216 movups xmm0,[ecx*1+edx-16] jnz NEAR L$004dec2_loop db 102,15,56,222,209 db 102,15,56,222,217 db 102,15,56,223,208 db 102,15,56,223,216 ret align 16 __aesni_encrypt3: movups xmm0,[edx] shl ecx,4 movups xmm1,[16+edx] xorps xmm2,xmm0 pxor xmm3,xmm0 pxor xmm4,xmm0 movups xmm0,[32+edx] lea edx,[32+ecx*1+edx] neg ecx add ecx,16 L$005enc3_loop: db 102,15,56,220,209 db 102,15,56,220,217 db 102,15,56,220,225 movups xmm1,[ecx*1+edx] add ecx,32 db 102,15,56,220,208 db 102,15,56,220,216 db 102,15,56,220,224 movups xmm0,[ecx*1+edx-16] jnz NEAR L$005enc3_loop db 102,15,56,220,209 db 102,15,56,220,217 db 102,15,56,220,225 db 102,15,56,221,208 db 102,15,56,221,216 db 102,15,56,221,224 ret align 16 __aesni_decrypt3: movups xmm0,[edx] shl ecx,4 movups xmm1,[16+edx] xorps xmm2,xmm0 pxor xmm3,xmm0 pxor xmm4,xmm0 movups xmm0,[32+edx] lea edx,[32+ecx*1+edx] neg ecx add ecx,16 L$006dec3_loop: db 102,15,56,222,209 db 102,15,56,222,217 db 102,15,56,222,225 movups xmm1,[ecx*1+edx] add ecx,32 db 102,15,56,222,208 db 102,15,56,222,216 db 102,15,56,222,224 movups xmm0,[ecx*1+edx-16] jnz NEAR L$006dec3_loop db 102,15,56,222,209 db 102,15,56,222,217 db 102,15,56,222,225 db 102,15,56,223,208 db 102,15,56,223,216 db 102,15,56,223,224 ret align 16 __aesni_encrypt4: movups xmm0,[edx] movups xmm1,[16+edx] shl ecx,4 xorps xmm2,xmm0 pxor xmm3,xmm0 pxor xmm4,xmm0 pxor xmm5,xmm0 movups xmm0,[32+edx] lea edx,[32+ecx*1+edx] neg ecx db 15,31,64,0 add ecx,16 L$007enc4_loop: db 102,15,56,220,209 db 102,15,56,220,217 db 102,15,56,220,225 db 102,15,56,220,233 movups xmm1,[ecx*1+edx] add ecx,32 db 102,15,56,220,208 db 102,15,56,220,216 db 102,15,56,220,224 db 102,15,56,220,232 movups xmm0,[ecx*1+edx-16] jnz NEAR L$007enc4_loop db 102,15,56,220,209 db 102,15,56,220,217 db 102,15,56,220,225 db 102,15,56,220,233 db 102,15,56,221,208 db 102,15,56,221,216 db 102,15,56,221,224 db 102,15,56,221,232 ret align 16 __aesni_decrypt4: movups xmm0,[edx] movups xmm1,[16+edx] shl ecx,4 xorps xmm2,xmm0 pxor xmm3,xmm0 pxor xmm4,xmm0 pxor xmm5,xmm0 movups xmm0,[32+edx] lea edx,[32+ecx*1+edx] neg ecx db 15,31,64,0 add ecx,16 L$008dec4_loop: db 102,15,56,222,209 db 102,15,56,222,217 db 102,15,56,222,225 db 102,15,56,222,233 movups xmm1,[ecx*1+edx] add ecx,32 db 102,15,56,222,208 db 102,15,56,222,216 db 102,15,56,222,224 db 102,15,56,222,232 movups xmm0,[ecx*1+edx-16] jnz NEAR L$008dec4_loop db 102,15,56,222,209 db 102,15,56,222,217 db 102,15,56,222,225 db 102,15,56,222,233 db 102,15,56,223,208 db 102,15,56,223,216 db 102,15,56,223,224 db 102,15,56,223,232 ret align 16 __aesni_encrypt6: movups xmm0,[edx] shl ecx,4 movups xmm1,[16+edx] xorps xmm2,xmm0 pxor xmm3,xmm0 pxor xmm4,xmm0 db 102,15,56,220,209 pxor xmm5,xmm0 pxor xmm6,xmm0 db 102,15,56,220,217 lea edx,[32+ecx*1+edx] neg ecx db 102,15,56,220,225 pxor xmm7,xmm0 movups xmm0,[ecx*1+edx] add ecx,16 jmp NEAR L$009_aesni_encrypt6_inner align 16 L$010enc6_loop: db 102,15,56,220,209 db 102,15,56,220,217 db 102,15,56,220,225 L$009_aesni_encrypt6_inner: db 102,15,56,220,233 db 102,15,56,220,241 db 102,15,56,220,249 L$_aesni_encrypt6_enter: movups xmm1,[ecx*1+edx] add ecx,32 db 102,15,56,220,208 db 102,15,56,220,216 db 102,15,56,220,224 db 102,15,56,220,232 db 102,15,56,220,240 db 102,15,56,220,248 movups xmm0,[ecx*1+edx-16] jnz NEAR L$010enc6_loop db 102,15,56,220,209 db 102,15,56,220,217 db 102,15,56,220,225 db 102,15,56,220,233 db 102,15,56,220,241 db 102,15,56,220,249 db 102,15,56,221,208 db 102,15,56,221,216 db 102,15,56,221,224 db 102,15,56,221,232 db 102,15,56,221,240 db 102,15,56,221,248 ret align 16 __aesni_decrypt6: movups xmm0,[edx] shl ecx,4 movups xmm1,[16+edx] xorps xmm2,xmm0 pxor xmm3,xmm0 pxor xmm4,xmm0 db 102,15,56,222,209 pxor xmm5,xmm0 pxor xmm6,xmm0 db 102,15,56,222,217 lea edx,[32+ecx*1+edx] neg ecx db 102,15,56,222,225 pxor xmm7,xmm0 movups xmm0,[ecx*1+edx] add ecx,16 jmp NEAR L$011_aesni_decrypt6_inner align 16 L$012dec6_loop: db 102,15,56,222,209 db 102,15,56,222,217 db 102,15,56,222,225 L$011_aesni_decrypt6_inner: db 102,15,56,222,233 db 102,15,56,222,241 db 102,15,56,222,249 L$_aesni_decrypt6_enter: movups xmm1,[ecx*1+edx] add ecx,32 db 102,15,56,222,208 db 102,15,56,222,216 db 102,15,56,222,224 db 102,15,56,222,232 db 102,15,56,222,240 db 102,15,56,222,248 movups xmm0,[ecx*1+edx-16] jnz NEAR L$012dec6_loop db 102,15,56,222,209 db 102,15,56,222,217 db 102,15,56,222,225 db 102,15,56,222,233 db 102,15,56,222,241 db 102,15,56,222,249 db 102,15,56,223,208 db 102,15,56,223,216 db 102,15,56,223,224 db 102,15,56,223,232 db 102,15,56,223,240 db 102,15,56,223,248 ret global _aes_hw_ecb_encrypt align 16 _aes_hw_ecb_encrypt: L$_aes_hw_ecb_encrypt_begin: push ebp push ebx push esi push edi mov esi,DWORD [20+esp] mov edi,DWORD [24+esp] mov eax,DWORD [28+esp] mov edx,DWORD [32+esp] mov ebx,DWORD [36+esp] and eax,-16 jz NEAR L$013ecb_ret mov ecx,DWORD [240+edx] test ebx,ebx jz NEAR L$014ecb_decrypt mov ebp,edx mov ebx,ecx cmp eax,96 jb NEAR L$015ecb_enc_tail movdqu xmm2,[esi] movdqu xmm3,[16+esi] movdqu xmm4,[32+esi] movdqu xmm5,[48+esi] movdqu xmm6,[64+esi] movdqu xmm7,[80+esi] lea esi,[96+esi] sub eax,96 jmp NEAR L$016ecb_enc_loop6_enter align 16 L$017ecb_enc_loop6: movups [edi],xmm2 movdqu xmm2,[esi] movups [16+edi],xmm3 movdqu xmm3,[16+esi] movups [32+edi],xmm4 movdqu xmm4,[32+esi] movups [48+edi],xmm5 movdqu xmm5,[48+esi] movups [64+edi],xmm6 movdqu xmm6,[64+esi] movups [80+edi],xmm7 lea edi,[96+edi] movdqu xmm7,[80+esi] lea esi,[96+esi] L$016ecb_enc_loop6_enter: call __aesni_encrypt6 mov edx,ebp mov ecx,ebx sub eax,96 jnc NEAR L$017ecb_enc_loop6 movups [edi],xmm2 movups [16+edi],xmm3 movups [32+edi],xmm4 movups [48+edi],xmm5 movups [64+edi],xmm6 movups [80+edi],xmm7 lea edi,[96+edi] add eax,96 jz NEAR L$013ecb_ret L$015ecb_enc_tail: movups xmm2,[esi] cmp eax,32 jb NEAR L$018ecb_enc_one movups xmm3,[16+esi] je NEAR L$019ecb_enc_two movups xmm4,[32+esi] cmp eax,64 jb NEAR L$020ecb_enc_three movups xmm5,[48+esi] je NEAR L$021ecb_enc_four movups xmm6,[64+esi] xorps xmm7,xmm7 call __aesni_encrypt6 movups [edi],xmm2 movups [16+edi],xmm3 movups [32+edi],xmm4 movups [48+edi],xmm5 movups [64+edi],xmm6 jmp NEAR L$013ecb_ret align 16 L$018ecb_enc_one: movups xmm0,[edx] movups xmm1,[16+edx] lea edx,[32+edx] xorps xmm2,xmm0 L$022enc1_loop_3: db 102,15,56,220,209 dec ecx movups xmm1,[edx] lea edx,[16+edx] jnz NEAR L$022enc1_loop_3 db 102,15,56,221,209 movups [edi],xmm2 jmp NEAR L$013ecb_ret align 16 L$019ecb_enc_two: call __aesni_encrypt2 movups [edi],xmm2 movups [16+edi],xmm3 jmp NEAR L$013ecb_ret align 16 L$020ecb_enc_three: call __aesni_encrypt3 movups [edi],xmm2 movups [16+edi],xmm3 movups [32+edi],xmm4 jmp NEAR L$013ecb_ret align 16 L$021ecb_enc_four: call __aesni_encrypt4 movups [edi],xmm2 movups [16+edi],xmm3 movups [32+edi],xmm4 movups [48+edi],xmm5 jmp NEAR L$013ecb_ret align 16 L$014ecb_decrypt: mov ebp,edx mov ebx,ecx cmp eax,96 jb NEAR L$023ecb_dec_tail movdqu xmm2,[esi] movdqu xmm3,[16+esi] movdqu xmm4,[32+esi] movdqu xmm5,[48+esi] movdqu xmm6,[64+esi] movdqu xmm7,[80+esi] lea esi,[96+esi] sub eax,96 jmp NEAR L$024ecb_dec_loop6_enter align 16 L$025ecb_dec_loop6: movups [edi],xmm2 movdqu xmm2,[esi] movups [16+edi],xmm3 movdqu xmm3,[16+esi] movups [32+edi],xmm4 movdqu xmm4,[32+esi] movups [48+edi],xmm5 movdqu xmm5,[48+esi] movups [64+edi],xmm6 movdqu xmm6,[64+esi] movups [80+edi],xmm7 lea edi,[96+edi] movdqu xmm7,[80+esi] lea esi,[96+esi] L$024ecb_dec_loop6_enter: call __aesni_decrypt6 mov edx,ebp mov ecx,ebx sub eax,96 jnc NEAR L$025ecb_dec_loop6 movups [edi],xmm2 movups [16+edi],xmm3 movups [32+edi],xmm4 movups [48+edi],xmm5 movups [64+edi],xmm6 movups [80+edi],xmm7 lea edi,[96+edi] add eax,96 jz NEAR L$013ecb_ret L$023ecb_dec_tail: movups xmm2,[esi] cmp eax,32 jb NEAR L$026ecb_dec_one movups xmm3,[16+esi] je NEAR L$027ecb_dec_two movups xmm4,[32+esi] cmp eax,64 jb NEAR L$028ecb_dec_three movups xmm5,[48+esi] je NEAR L$029ecb_dec_four movups xmm6,[64+esi] xorps xmm7,xmm7 call __aesni_decrypt6 movups [edi],xmm2 movups [16+edi],xmm3 movups [32+edi],xmm4 movups [48+edi],xmm5 movups [64+edi],xmm6 jmp NEAR L$013ecb_ret align 16 L$026ecb_dec_one: movups xmm0,[edx] movups xmm1,[16+edx] lea edx,[32+edx] xorps xmm2,xmm0 L$030dec1_loop_4: db 102,15,56,222,209 dec ecx movups xmm1,[edx] lea edx,[16+edx] jnz NEAR L$030dec1_loop_4 db 102,15,56,223,209 movups [edi],xmm2 jmp NEAR L$013ecb_ret align 16 L$027ecb_dec_two: call __aesni_decrypt2 movups [edi],xmm2 movups [16+edi],xmm3 jmp NEAR L$013ecb_ret align 16 L$028ecb_dec_three: call __aesni_decrypt3 movups [edi],xmm2 movups [16+edi],xmm3 movups [32+edi],xmm4 jmp NEAR L$013ecb_ret align 16 L$029ecb_dec_four: call __aesni_decrypt4 movups [edi],xmm2 movups [16+edi],xmm3 movups [32+edi],xmm4 movups [48+edi],xmm5 L$013ecb_ret: pxor xmm0,xmm0 pxor xmm1,xmm1 pxor xmm2,xmm2 pxor xmm3,xmm3 pxor xmm4,xmm4 pxor xmm5,xmm5 pxor xmm6,xmm6 pxor xmm7,xmm7 pop edi pop esi pop ebx pop ebp ret global _aes_hw_ccm64_encrypt_blocks align 16 _aes_hw_ccm64_encrypt_blocks: L$_aes_hw_ccm64_encrypt_blocks_begin: push ebp push ebx push esi push edi mov esi,DWORD [20+esp] mov edi,DWORD [24+esp] mov eax,DWORD [28+esp] mov edx,DWORD [32+esp] mov ebx,DWORD [36+esp] mov ecx,DWORD [40+esp] mov ebp,esp sub esp,60 and esp,-16 mov DWORD [48+esp],ebp movdqu xmm7,[ebx] movdqu xmm3,[ecx] mov ecx,DWORD [240+edx] mov DWORD [esp],202182159 mov DWORD [4+esp],134810123 mov DWORD [8+esp],67438087 mov DWORD [12+esp],66051 mov ebx,1 xor ebp,ebp mov DWORD [16+esp],ebx mov DWORD [20+esp],ebp mov DWORD [24+esp],ebp mov DWORD [28+esp],ebp shl ecx,4 mov ebx,16 lea ebp,[edx] movdqa xmm5,[esp] movdqa xmm2,xmm7 lea edx,[32+ecx*1+edx] sub ebx,ecx db 102,15,56,0,253 L$031ccm64_enc_outer: movups xmm0,[ebp] mov ecx,ebx movups xmm6,[esi] xorps xmm2,xmm0 movups xmm1,[16+ebp] xorps xmm0,xmm6 xorps xmm3,xmm0 movups xmm0,[32+ebp] L$032ccm64_enc2_loop: db 102,15,56,220,209 db 102,15,56,220,217 movups xmm1,[ecx*1+edx] add ecx,32 db 102,15,56,220,208 db 102,15,56,220,216 movups xmm0,[ecx*1+edx-16] jnz NEAR L$032ccm64_enc2_loop db 102,15,56,220,209 db 102,15,56,220,217 paddq xmm7,[16+esp] dec eax db 102,15,56,221,208 db 102,15,56,221,216 lea esi,[16+esi] xorps xmm6,xmm2 movdqa xmm2,xmm7 movups [edi],xmm6 db 102,15,56,0,213 lea edi,[16+edi] jnz NEAR L$031ccm64_enc_outer mov esp,DWORD [48+esp] mov edi,DWORD [40+esp] movups [edi],xmm3 pxor xmm0,xmm0 pxor xmm1,xmm1 pxor xmm2,xmm2 pxor xmm3,xmm3 pxor xmm4,xmm4 pxor xmm5,xmm5 pxor xmm6,xmm6 pxor xmm7,xmm7 pop edi pop esi pop ebx pop ebp ret global _aes_hw_ccm64_decrypt_blocks align 16 _aes_hw_ccm64_decrypt_blocks: L$_aes_hw_ccm64_decrypt_blocks_begin: push ebp push ebx push esi push edi mov esi,DWORD [20+esp] mov edi,DWORD [24+esp] mov eax,DWORD [28+esp] mov edx,DWORD [32+esp] mov ebx,DWORD [36+esp] mov ecx,DWORD [40+esp] mov ebp,esp sub esp,60 and esp,-16 mov DWORD [48+esp],ebp movdqu xmm7,[ebx] movdqu xmm3,[ecx] mov ecx,DWORD [240+edx] mov DWORD [esp],202182159 mov DWORD [4+esp],134810123 mov DWORD [8+esp],67438087 mov DWORD [12+esp],66051 mov ebx,1 xor ebp,ebp mov DWORD [16+esp],ebx mov DWORD [20+esp],ebp mov DWORD [24+esp],ebp mov DWORD [28+esp],ebp movdqa xmm5,[esp] movdqa xmm2,xmm7 mov ebp,edx mov ebx,ecx db 102,15,56,0,253 movups xmm0,[edx] movups xmm1,[16+edx] lea edx,[32+edx] xorps xmm2,xmm0 L$033enc1_loop_5: db 102,15,56,220,209 dec ecx movups xmm1,[edx] lea edx,[16+edx] jnz NEAR L$033enc1_loop_5 db 102,15,56,221,209 shl ebx,4 mov ecx,16 movups xmm6,[esi] paddq xmm7,[16+esp] lea esi,[16+esi] sub ecx,ebx lea edx,[32+ebx*1+ebp] mov ebx,ecx jmp NEAR L$034ccm64_dec_outer align 16 L$034ccm64_dec_outer: xorps xmm6,xmm2 movdqa xmm2,xmm7 movups [edi],xmm6 lea edi,[16+edi] db 102,15,56,0,213 sub eax,1 jz NEAR L$035ccm64_dec_break movups xmm0,[ebp] mov ecx,ebx movups xmm1,[16+ebp] xorps xmm6,xmm0 xorps xmm2,xmm0 xorps xmm3,xmm6 movups xmm0,[32+ebp] L$036ccm64_dec2_loop: db 102,15,56,220,209 db 102,15,56,220,217 movups xmm1,[ecx*1+edx] add ecx,32 db 102,15,56,220,208 db 102,15,56,220,216 movups xmm0,[ecx*1+edx-16] jnz NEAR L$036ccm64_dec2_loop movups xmm6,[esi] paddq xmm7,[16+esp] db 102,15,56,220,209 db 102,15,56,220,217 db 102,15,56,221,208 db 102,15,56,221,216 lea esi,[16+esi] jmp NEAR L$034ccm64_dec_outer align 16 L$035ccm64_dec_break: mov ecx,DWORD [240+ebp] mov edx,ebp movups xmm0,[edx] movups xmm1,[16+edx] xorps xmm6,xmm0 lea edx,[32+edx] xorps xmm3,xmm6 L$037enc1_loop_6: db 102,15,56,220,217 dec ecx movups xmm1,[edx] lea edx,[16+edx] jnz NEAR L$037enc1_loop_6 db 102,15,56,221,217 mov esp,DWORD [48+esp] mov edi,DWORD [40+esp] movups [edi],xmm3 pxor xmm0,xmm0 pxor xmm1,xmm1 pxor xmm2,xmm2 pxor xmm3,xmm3 pxor xmm4,xmm4 pxor xmm5,xmm5 pxor xmm6,xmm6 pxor xmm7,xmm7 pop edi pop esi pop ebx pop ebp ret global _aes_hw_ctr32_encrypt_blocks align 16 _aes_hw_ctr32_encrypt_blocks: L$_aes_hw_ctr32_encrypt_blocks_begin: push ebp push ebx push esi push edi %ifdef BORINGSSL_DISPATCH_TEST push ebx push edx call L$038pic_for_function_hit L$038pic_for_function_hit: pop ebx lea ebx,[(_BORINGSSL_function_hit+0-L$038pic_for_function_hit)+ebx] mov edx,1 mov BYTE [ebx],dl pop edx pop ebx %endif mov esi,DWORD [20+esp] mov edi,DWORD [24+esp] mov eax,DWORD [28+esp] mov edx,DWORD [32+esp] mov ebx,DWORD [36+esp] mov ebp,esp sub esp,88 and esp,-16 mov DWORD [80+esp],ebp cmp eax,1 je NEAR L$039ctr32_one_shortcut movdqu xmm7,[ebx] mov DWORD [esp],202182159 mov DWORD [4+esp],134810123 mov DWORD [8+esp],67438087 mov DWORD [12+esp],66051 mov ecx,6 xor ebp,ebp mov DWORD [16+esp],ecx mov DWORD [20+esp],ecx mov DWORD [24+esp],ecx mov DWORD [28+esp],ebp db 102,15,58,22,251,3 db 102,15,58,34,253,3 mov ecx,DWORD [240+edx] bswap ebx pxor xmm0,xmm0 pxor xmm1,xmm1 movdqa xmm2,[esp] db 102,15,58,34,195,0 lea ebp,[3+ebx] db 102,15,58,34,205,0 inc ebx db 102,15,58,34,195,1 inc ebp db 102,15,58,34,205,1 inc ebx db 102,15,58,34,195,2 inc ebp db 102,15,58,34,205,2 movdqa [48+esp],xmm0 db 102,15,56,0,194 movdqu xmm6,[edx] movdqa [64+esp],xmm1 db 102,15,56,0,202 pshufd xmm2,xmm0,192 pshufd xmm3,xmm0,128 cmp eax,6 jb NEAR L$040ctr32_tail pxor xmm7,xmm6 shl ecx,4 mov ebx,16 movdqa [32+esp],xmm7 mov ebp,edx sub ebx,ecx lea edx,[32+ecx*1+edx] sub eax,6 jmp NEAR L$041ctr32_loop6 align 16 L$041ctr32_loop6: pshufd xmm4,xmm0,64 movdqa xmm0,[32+esp] pshufd xmm5,xmm1,192 pxor xmm2,xmm0 pshufd xmm6,xmm1,128 pxor xmm3,xmm0 pshufd xmm7,xmm1,64 movups xmm1,[16+ebp] pxor xmm4,xmm0 pxor xmm5,xmm0 db 102,15,56,220,209 pxor xmm6,xmm0 pxor xmm7,xmm0 db 102,15,56,220,217 movups xmm0,[32+ebp] mov ecx,ebx db 102,15,56,220,225 db 102,15,56,220,233 db 102,15,56,220,241 db 102,15,56,220,249 call L$_aesni_encrypt6_enter movups xmm1,[esi] movups xmm0,[16+esi] xorps xmm2,xmm1 movups xmm1,[32+esi] xorps xmm3,xmm0 movups [edi],xmm2 movdqa xmm0,[16+esp] xorps xmm4,xmm1 movdqa xmm1,[64+esp] movups [16+edi],xmm3 movups [32+edi],xmm4 paddd xmm1,xmm0 paddd xmm0,[48+esp] movdqa xmm2,[esp] movups xmm3,[48+esi] movups xmm4,[64+esi] xorps xmm5,xmm3 movups xmm3,[80+esi] lea esi,[96+esi] movdqa [48+esp],xmm0 db 102,15,56,0,194 xorps xmm6,xmm4 movups [48+edi],xmm5 xorps xmm7,xmm3 movdqa [64+esp],xmm1 db 102,15,56,0,202 movups [64+edi],xmm6 pshufd xmm2,xmm0,192 movups [80+edi],xmm7 lea edi,[96+edi] pshufd xmm3,xmm0,128 sub eax,6 jnc NEAR L$041ctr32_loop6 add eax,6 jz NEAR L$042ctr32_ret movdqu xmm7,[ebp] mov edx,ebp pxor xmm7,[32+esp] mov ecx,DWORD [240+ebp] L$040ctr32_tail: por xmm2,xmm7 cmp eax,2 jb NEAR L$043ctr32_one pshufd xmm4,xmm0,64 por xmm3,xmm7 je NEAR L$044ctr32_two pshufd xmm5,xmm1,192 por xmm4,xmm7 cmp eax,4 jb NEAR L$045ctr32_three pshufd xmm6,xmm1,128 por xmm5,xmm7 je NEAR L$046ctr32_four por xmm6,xmm7 call __aesni_encrypt6 movups xmm1,[esi] movups xmm0,[16+esi] xorps xmm2,xmm1 movups xmm1,[32+esi] xorps xmm3,xmm0 movups xmm0,[48+esi] xorps xmm4,xmm1 movups xmm1,[64+esi] xorps xmm5,xmm0 movups [edi],xmm2 xorps xmm6,xmm1 movups [16+edi],xmm3 movups [32+edi],xmm4 movups [48+edi],xmm5 movups [64+edi],xmm6 jmp NEAR L$042ctr32_ret align 16 L$039ctr32_one_shortcut: movups xmm2,[ebx] mov ecx,DWORD [240+edx] L$043ctr32_one: movups xmm0,[edx] movups xmm1,[16+edx] lea edx,[32+edx] xorps xmm2,xmm0 L$047enc1_loop_7: db 102,15,56,220,209 dec ecx movups xmm1,[edx] lea edx,[16+edx] jnz NEAR L$047enc1_loop_7 db 102,15,56,221,209 movups xmm6,[esi] xorps xmm6,xmm2 movups [edi],xmm6 jmp NEAR L$042ctr32_ret align 16 L$044ctr32_two: call __aesni_encrypt2 movups xmm5,[esi] movups xmm6,[16+esi] xorps xmm2,xmm5 xorps xmm3,xmm6 movups [edi],xmm2 movups [16+edi],xmm3 jmp NEAR L$042ctr32_ret align 16 L$045ctr32_three: call __aesni_encrypt3 movups xmm5,[esi] movups xmm6,[16+esi] xorps xmm2,xmm5 movups xmm7,[32+esi] xorps xmm3,xmm6 movups [edi],xmm2 xorps xmm4,xmm7 movups [16+edi],xmm3 movups [32+edi],xmm4 jmp NEAR L$042ctr32_ret align 16 L$046ctr32_four: call __aesni_encrypt4 movups xmm6,[esi] movups xmm7,[16+esi] movups xmm1,[32+esi] xorps xmm2,xmm6 movups xmm0,[48+esi] xorps xmm3,xmm7 movups [edi],xmm2 xorps xmm4,xmm1 movups [16+edi],xmm3 xorps xmm5,xmm0 movups [32+edi],xmm4 movups [48+edi],xmm5 L$042ctr32_ret: pxor xmm0,xmm0 pxor xmm1,xmm1 pxor xmm2,xmm2 pxor xmm3,xmm3 pxor xmm4,xmm4 movdqa [32+esp],xmm0 pxor xmm5,xmm5 movdqa [48+esp],xmm0 pxor xmm6,xmm6 movdqa [64+esp],xmm0 pxor xmm7,xmm7 mov esp,DWORD [80+esp] pop edi pop esi pop ebx pop ebp ret global _aes_hw_xts_encrypt align 16 _aes_hw_xts_encrypt: L$_aes_hw_xts_encrypt_begin: push ebp push ebx push esi push edi mov edx,DWORD [36+esp] mov esi,DWORD [40+esp] mov ecx,DWORD [240+edx] movups xmm2,[esi] movups xmm0,[edx] movups xmm1,[16+edx] lea edx,[32+edx] xorps xmm2,xmm0 L$048enc1_loop_8: db 102,15,56,220,209 dec ecx movups xmm1,[edx] lea edx,[16+edx] jnz NEAR L$048enc1_loop_8 db 102,15,56,221,209 mov esi,DWORD [20+esp] mov edi,DWORD [24+esp] mov eax,DWORD [28+esp] mov edx,DWORD [32+esp] mov ebp,esp sub esp,120 mov ecx,DWORD [240+edx] and esp,-16 mov DWORD [96+esp],135 mov DWORD [100+esp],0 mov DWORD [104+esp],1 mov DWORD [108+esp],0 mov DWORD [112+esp],eax mov DWORD [116+esp],ebp movdqa xmm1,xmm2 pxor xmm0,xmm0 movdqa xmm3,[96+esp] pcmpgtd xmm0,xmm1 and eax,-16 mov ebp,edx mov ebx,ecx sub eax,96 jc NEAR L$049xts_enc_short shl ecx,4 mov ebx,16 sub ebx,ecx lea edx,[32+ecx*1+edx] jmp NEAR L$050xts_enc_loop6 align 16 L$050xts_enc_loop6: pshufd xmm2,xmm0,19 pxor xmm0,xmm0 movdqa [esp],xmm1 paddq xmm1,xmm1 pand xmm2,xmm3 pcmpgtd xmm0,xmm1 pxor xmm1,xmm2 pshufd xmm2,xmm0,19 pxor xmm0,xmm0 movdqa [16+esp],xmm1 paddq xmm1,xmm1 pand xmm2,xmm3 pcmpgtd xmm0,xmm1 pxor xmm1,xmm2 pshufd xmm2,xmm0,19 pxor xmm0,xmm0 movdqa [32+esp],xmm1 paddq xmm1,xmm1 pand xmm2,xmm3 pcmpgtd xmm0,xmm1 pxor xmm1,xmm2 pshufd xmm2,xmm0,19 pxor xmm0,xmm0 movdqa [48+esp],xmm1 paddq xmm1,xmm1 pand xmm2,xmm3 pcmpgtd xmm0,xmm1 pxor xmm1,xmm2 pshufd xmm7,xmm0,19 movdqa [64+esp],xmm1 paddq xmm1,xmm1 movups xmm0,[ebp] pand xmm7,xmm3 movups xmm2,[esi] pxor xmm7,xmm1 mov ecx,ebx movdqu xmm3,[16+esi] xorps xmm2,xmm0 movdqu xmm4,[32+esi] pxor xmm3,xmm0 movdqu xmm5,[48+esi] pxor xmm4,xmm0 movdqu xmm6,[64+esi] pxor xmm5,xmm0 movdqu xmm1,[80+esi] pxor xmm6,xmm0 lea esi,[96+esi] pxor xmm2,[esp] movdqa [80+esp],xmm7 pxor xmm7,xmm1 movups xmm1,[16+ebp] pxor xmm3,[16+esp] pxor xmm4,[32+esp] db 102,15,56,220,209 pxor xmm5,[48+esp] pxor xmm6,[64+esp] db 102,15,56,220,217 pxor xmm7,xmm0 movups xmm0,[32+ebp] db 102,15,56,220,225 db 102,15,56,220,233 db 102,15,56,220,241 db 102,15,56,220,249 call L$_aesni_encrypt6_enter movdqa xmm1,[80+esp] pxor xmm0,xmm0 xorps xmm2,[esp] pcmpgtd xmm0,xmm1 xorps xmm3,[16+esp] movups [edi],xmm2 xorps xmm4,[32+esp] movups [16+edi],xmm3 xorps xmm5,[48+esp] movups [32+edi],xmm4 xorps xmm6,[64+esp] movups [48+edi],xmm5 xorps xmm7,xmm1 movups [64+edi],xmm6 pshufd xmm2,xmm0,19 movups [80+edi],xmm7 lea edi,[96+edi] movdqa xmm3,[96+esp] pxor xmm0,xmm0 paddq xmm1,xmm1 pand xmm2,xmm3 pcmpgtd xmm0,xmm1 pxor xmm1,xmm2 sub eax,96 jnc NEAR L$050xts_enc_loop6 mov ecx,DWORD [240+ebp] mov edx,ebp mov ebx,ecx L$049xts_enc_short: add eax,96 jz NEAR L$051xts_enc_done6x movdqa xmm5,xmm1 cmp eax,32 jb NEAR L$052xts_enc_one pshufd xmm2,xmm0,19 pxor xmm0,xmm0 paddq xmm1,xmm1 pand xmm2,xmm3 pcmpgtd xmm0,xmm1 pxor xmm1,xmm2 je NEAR L$053xts_enc_two pshufd xmm2,xmm0,19 pxor xmm0,xmm0 movdqa xmm6,xmm1 paddq xmm1,xmm1 pand xmm2,xmm3 pcmpgtd xmm0,xmm1 pxor xmm1,xmm2 cmp eax,64 jb NEAR L$054xts_enc_three pshufd xmm2,xmm0,19 pxor xmm0,xmm0 movdqa xmm7,xmm1 paddq xmm1,xmm1 pand xmm2,xmm3 pcmpgtd xmm0,xmm1 pxor xmm1,xmm2 movdqa [esp],xmm5 movdqa [16+esp],xmm6 je NEAR L$055xts_enc_four movdqa [32+esp],xmm7 pshufd xmm7,xmm0,19 movdqa [48+esp],xmm1 paddq xmm1,xmm1 pand xmm7,xmm3 pxor xmm7,xmm1 movdqu xmm2,[esi] movdqu xmm3,[16+esi] movdqu xmm4,[32+esi] pxor xmm2,[esp] movdqu xmm5,[48+esi] pxor xmm3,[16+esp] movdqu xmm6,[64+esi] pxor xmm4,[32+esp] lea esi,[80+esi] pxor xmm5,[48+esp] movdqa [64+esp],xmm7 pxor xmm6,xmm7 call __aesni_encrypt6 movaps xmm1,[64+esp] xorps xmm2,[esp] xorps xmm3,[16+esp] xorps xmm4,[32+esp] movups [edi],xmm2 xorps xmm5,[48+esp] movups [16+edi],xmm3 xorps xmm6,xmm1 movups [32+edi],xmm4 movups [48+edi],xmm5 movups [64+edi],xmm6 lea edi,[80+edi] jmp NEAR L$056xts_enc_done align 16 L$052xts_enc_one: movups xmm2,[esi] lea esi,[16+esi] xorps xmm2,xmm5 movups xmm0,[edx] movups xmm1,[16+edx] lea edx,[32+edx] xorps xmm2,xmm0 L$057enc1_loop_9: db 102,15,56,220,209 dec ecx movups xmm1,[edx] lea edx,[16+edx] jnz NEAR L$057enc1_loop_9 db 102,15,56,221,209 xorps xmm2,xmm5 movups [edi],xmm2 lea edi,[16+edi] movdqa xmm1,xmm5 jmp NEAR L$056xts_enc_done align 16 L$053xts_enc_two: movaps xmm6,xmm1 movups xmm2,[esi] movups xmm3,[16+esi] lea esi,[32+esi] xorps xmm2,xmm5 xorps xmm3,xmm6 call __aesni_encrypt2 xorps xmm2,xmm5 xorps xmm3,xmm6 movups [edi],xmm2 movups [16+edi],xmm3 lea edi,[32+edi] movdqa xmm1,xmm6 jmp NEAR L$056xts_enc_done align 16 L$054xts_enc_three: movaps xmm7,xmm1 movups xmm2,[esi] movups xmm3,[16+esi] movups xmm4,[32+esi] lea esi,[48+esi] xorps xmm2,xmm5 xorps xmm3,xmm6 xorps xmm4,xmm7 call __aesni_encrypt3 xorps xmm2,xmm5 xorps xmm3,xmm6 xorps xmm4,xmm7 movups [edi],xmm2 movups [16+edi],xmm3 movups [32+edi],xmm4 lea edi,[48+edi] movdqa xmm1,xmm7 jmp NEAR L$056xts_enc_done align 16 L$055xts_enc_four: movaps xmm6,xmm1 movups xmm2,[esi] movups xmm3,[16+esi] movups xmm4,[32+esi] xorps xmm2,[esp] movups xmm5,[48+esi] lea esi,[64+esi] xorps xmm3,[16+esp] xorps xmm4,xmm7 xorps xmm5,xmm6 call __aesni_encrypt4 xorps xmm2,[esp] xorps xmm3,[16+esp] xorps xmm4,xmm7 movups [edi],xmm2 xorps xmm5,xmm6 movups [16+edi],xmm3 movups [32+edi],xmm4 movups [48+edi],xmm5 lea edi,[64+edi] movdqa xmm1,xmm6 jmp NEAR L$056xts_enc_done align 16 L$051xts_enc_done6x: mov eax,DWORD [112+esp] and eax,15 jz NEAR L$058xts_enc_ret movdqa xmm5,xmm1 mov DWORD [112+esp],eax jmp NEAR L$059xts_enc_steal align 16 L$056xts_enc_done: mov eax,DWORD [112+esp] pxor xmm0,xmm0 and eax,15 jz NEAR L$058xts_enc_ret pcmpgtd xmm0,xmm1 mov DWORD [112+esp],eax pshufd xmm5,xmm0,19 paddq xmm1,xmm1 pand xmm5,[96+esp] pxor xmm5,xmm1 L$059xts_enc_steal: movzx ecx,BYTE [esi] movzx edx,BYTE [edi-16] lea esi,[1+esi] mov BYTE [edi-16],cl mov BYTE [edi],dl lea edi,[1+edi] sub eax,1 jnz NEAR L$059xts_enc_steal sub edi,DWORD [112+esp] mov edx,ebp mov ecx,ebx movups xmm2,[edi-16] xorps xmm2,xmm5 movups xmm0,[edx] movups xmm1,[16+edx] lea edx,[32+edx] xorps xmm2,xmm0 L$060enc1_loop_10: db 102,15,56,220,209 dec ecx movups xmm1,[edx] lea edx,[16+edx] jnz NEAR L$060enc1_loop_10 db 102,15,56,221,209 xorps xmm2,xmm5 movups [edi-16],xmm2 L$058xts_enc_ret: pxor xmm0,xmm0 pxor xmm1,xmm1 pxor xmm2,xmm2 movdqa [esp],xmm0 pxor xmm3,xmm3 movdqa [16+esp],xmm0 pxor xmm4,xmm4 movdqa [32+esp],xmm0 pxor xmm5,xmm5 movdqa [48+esp],xmm0 pxor xmm6,xmm6 movdqa [64+esp],xmm0 pxor xmm7,xmm7 movdqa [80+esp],xmm0 mov esp,DWORD [116+esp] pop edi pop esi pop ebx pop ebp ret global _aes_hw_xts_decrypt align 16 _aes_hw_xts_decrypt: L$_aes_hw_xts_decrypt_begin: push ebp push ebx push esi push edi mov edx,DWORD [36+esp] mov esi,DWORD [40+esp] mov ecx,DWORD [240+edx] movups xmm2,[esi] movups xmm0,[edx] movups xmm1,[16+edx] lea edx,[32+edx] xorps xmm2,xmm0 L$061enc1_loop_11: db 102,15,56,220,209 dec ecx movups xmm1,[edx] lea edx,[16+edx] jnz NEAR L$061enc1_loop_11 db 102,15,56,221,209 mov esi,DWORD [20+esp] mov edi,DWORD [24+esp] mov eax,DWORD [28+esp] mov edx,DWORD [32+esp] mov ebp,esp sub esp,120 and esp,-16 xor ebx,ebx test eax,15 setnz bl shl ebx,4 sub eax,ebx mov DWORD [96+esp],135 mov DWORD [100+esp],0 mov DWORD [104+esp],1 mov DWORD [108+esp],0 mov DWORD [112+esp],eax mov DWORD [116+esp],ebp mov ecx,DWORD [240+edx] mov ebp,edx mov ebx,ecx movdqa xmm1,xmm2 pxor xmm0,xmm0 movdqa xmm3,[96+esp] pcmpgtd xmm0,xmm1 and eax,-16 sub eax,96 jc NEAR L$062xts_dec_short shl ecx,4 mov ebx,16 sub ebx,ecx lea edx,[32+ecx*1+edx] jmp NEAR L$063xts_dec_loop6 align 16 L$063xts_dec_loop6: pshufd xmm2,xmm0,19 pxor xmm0,xmm0 movdqa [esp],xmm1 paddq xmm1,xmm1 pand xmm2,xmm3 pcmpgtd xmm0,xmm1 pxor xmm1,xmm2 pshufd xmm2,xmm0,19 pxor xmm0,xmm0 movdqa [16+esp],xmm1 paddq xmm1,xmm1 pand xmm2,xmm3 pcmpgtd xmm0,xmm1 pxor xmm1,xmm2 pshufd xmm2,xmm0,19 pxor xmm0,xmm0 movdqa [32+esp],xmm1 paddq xmm1,xmm1 pand xmm2,xmm3 pcmpgtd xmm0,xmm1 pxor xmm1,xmm2 pshufd xmm2,xmm0,19 pxor xmm0,xmm0 movdqa [48+esp],xmm1 paddq xmm1,xmm1 pand xmm2,xmm3 pcmpgtd xmm0,xmm1 pxor xmm1,xmm2 pshufd xmm7,xmm0,19 movdqa [64+esp],xmm1 paddq xmm1,xmm1 movups xmm0,[ebp] pand xmm7,xmm3 movups xmm2,[esi] pxor xmm7,xmm1 mov ecx,ebx movdqu xmm3,[16+esi] xorps xmm2,xmm0 movdqu xmm4,[32+esi] pxor xmm3,xmm0 movdqu xmm5,[48+esi] pxor xmm4,xmm0 movdqu xmm6,[64+esi] pxor xmm5,xmm0 movdqu xmm1,[80+esi] pxor xmm6,xmm0 lea esi,[96+esi] pxor xmm2,[esp] movdqa [80+esp],xmm7 pxor xmm7,xmm1 movups xmm1,[16+ebp] pxor xmm3,[16+esp] pxor xmm4,[32+esp] db 102,15,56,222,209 pxor xmm5,[48+esp] pxor xmm6,[64+esp] db 102,15,56,222,217 pxor xmm7,xmm0 movups xmm0,[32+ebp] db 102,15,56,222,225 db 102,15,56,222,233 db 102,15,56,222,241 db 102,15,56,222,249 call L$_aesni_decrypt6_enter movdqa xmm1,[80+esp] pxor xmm0,xmm0 xorps xmm2,[esp] pcmpgtd xmm0,xmm1 xorps xmm3,[16+esp] movups [edi],xmm2 xorps xmm4,[32+esp] movups [16+edi],xmm3 xorps xmm5,[48+esp] movups [32+edi],xmm4 xorps xmm6,[64+esp] movups [48+edi],xmm5 xorps xmm7,xmm1 movups [64+edi],xmm6 pshufd xmm2,xmm0,19 movups [80+edi],xmm7 lea edi,[96+edi] movdqa xmm3,[96+esp] pxor xmm0,xmm0 paddq xmm1,xmm1 pand xmm2,xmm3 pcmpgtd xmm0,xmm1 pxor xmm1,xmm2 sub eax,96 jnc NEAR L$063xts_dec_loop6 mov ecx,DWORD [240+ebp] mov edx,ebp mov ebx,ecx L$062xts_dec_short: add eax,96 jz NEAR L$064xts_dec_done6x movdqa xmm5,xmm1 cmp eax,32 jb NEAR L$065xts_dec_one pshufd xmm2,xmm0,19 pxor xmm0,xmm0 paddq xmm1,xmm1 pand xmm2,xmm3 pcmpgtd xmm0,xmm1 pxor xmm1,xmm2 je NEAR L$066xts_dec_two pshufd xmm2,xmm0,19 pxor xmm0,xmm0 movdqa xmm6,xmm1 paddq xmm1,xmm1 pand xmm2,xmm3 pcmpgtd xmm0,xmm1 pxor xmm1,xmm2 cmp eax,64 jb NEAR L$067xts_dec_three pshufd xmm2,xmm0,19 pxor xmm0,xmm0 movdqa xmm7,xmm1 paddq xmm1,xmm1 pand xmm2,xmm3 pcmpgtd xmm0,xmm1 pxor xmm1,xmm2 movdqa [esp],xmm5 movdqa [16+esp],xmm6 je NEAR L$068xts_dec_four movdqa [32+esp],xmm7 pshufd xmm7,xmm0,19 movdqa [48+esp],xmm1 paddq xmm1,xmm1 pand xmm7,xmm3 pxor xmm7,xmm1 movdqu xmm2,[esi] movdqu xmm3,[16+esi] movdqu xmm4,[32+esi] pxor xmm2,[esp] movdqu xmm5,[48+esi] pxor xmm3,[16+esp] movdqu xmm6,[64+esi] pxor xmm4,[32+esp] lea esi,[80+esi] pxor xmm5,[48+esp] movdqa [64+esp],xmm7 pxor xmm6,xmm7 call __aesni_decrypt6 movaps xmm1,[64+esp] xorps xmm2,[esp] xorps xmm3,[16+esp] xorps xmm4,[32+esp] movups [edi],xmm2 xorps xmm5,[48+esp] movups [16+edi],xmm3 xorps xmm6,xmm1 movups [32+edi],xmm4 movups [48+edi],xmm5 movups [64+edi],xmm6 lea edi,[80+edi] jmp NEAR L$069xts_dec_done align 16 L$065xts_dec_one: movups xmm2,[esi] lea esi,[16+esi] xorps xmm2,xmm5 movups xmm0,[edx] movups xmm1,[16+edx] lea edx,[32+edx] xorps xmm2,xmm0 L$070dec1_loop_12: db 102,15,56,222,209 dec ecx movups xmm1,[edx] lea edx,[16+edx] jnz NEAR L$070dec1_loop_12 db 102,15,56,223,209 xorps xmm2,xmm5 movups [edi],xmm2 lea edi,[16+edi] movdqa xmm1,xmm5 jmp NEAR L$069xts_dec_done align 16 L$066xts_dec_two: movaps xmm6,xmm1 movups xmm2,[esi] movups xmm3,[16+esi] lea esi,[32+esi] xorps xmm2,xmm5 xorps xmm3,xmm6 call __aesni_decrypt2 xorps xmm2,xmm5 xorps xmm3,xmm6 movups [edi],xmm2 movups [16+edi],xmm3 lea edi,[32+edi] movdqa xmm1,xmm6 jmp NEAR L$069xts_dec_done align 16 L$067xts_dec_three: movaps xmm7,xmm1 movups xmm2,[esi] movups xmm3,[16+esi] movups xmm4,[32+esi] lea esi,[48+esi] xorps xmm2,xmm5 xorps xmm3,xmm6 xorps xmm4,xmm7 call __aesni_decrypt3 xorps xmm2,xmm5 xorps xmm3,xmm6 xorps xmm4,xmm7 movups [edi],xmm2 movups [16+edi],xmm3 movups [32+edi],xmm4 lea edi,[48+edi] movdqa xmm1,xmm7 jmp NEAR L$069xts_dec_done align 16 L$068xts_dec_four: movaps xmm6,xmm1 movups xmm2,[esi] movups xmm3,[16+esi] movups xmm4,[32+esi] xorps xmm2,[esp] movups xmm5,[48+esi] lea esi,[64+esi] xorps xmm3,[16+esp] xorps xmm4,xmm7 xorps xmm5,xmm6 call __aesni_decrypt4 xorps xmm2,[esp] xorps xmm3,[16+esp] xorps xmm4,xmm7 movups [edi],xmm2 xorps xmm5,xmm6 movups [16+edi],xmm3 movups [32+edi],xmm4 movups [48+edi],xmm5 lea edi,[64+edi] movdqa xmm1,xmm6 jmp NEAR L$069xts_dec_done align 16 L$064xts_dec_done6x: mov eax,DWORD [112+esp] and eax,15 jz NEAR L$071xts_dec_ret mov DWORD [112+esp],eax jmp NEAR L$072xts_dec_only_one_more align 16 L$069xts_dec_done: mov eax,DWORD [112+esp] pxor xmm0,xmm0 and eax,15 jz NEAR L$071xts_dec_ret pcmpgtd xmm0,xmm1 mov DWORD [112+esp],eax pshufd xmm2,xmm0,19 pxor xmm0,xmm0 movdqa xmm3,[96+esp] paddq xmm1,xmm1 pand xmm2,xmm3 pcmpgtd xmm0,xmm1 pxor xmm1,xmm2 L$072xts_dec_only_one_more: pshufd xmm5,xmm0,19 movdqa xmm6,xmm1 paddq xmm1,xmm1 pand xmm5,xmm3 pxor xmm5,xmm1 mov edx,ebp mov ecx,ebx movups xmm2,[esi] xorps xmm2,xmm5 movups xmm0,[edx] movups xmm1,[16+edx] lea edx,[32+edx] xorps xmm2,xmm0 L$073dec1_loop_13: db 102,15,56,222,209 dec ecx movups xmm1,[edx] lea edx,[16+edx] jnz NEAR L$073dec1_loop_13 db 102,15,56,223,209 xorps xmm2,xmm5 movups [edi],xmm2 L$074xts_dec_steal: movzx ecx,BYTE [16+esi] movzx edx,BYTE [edi] lea esi,[1+esi] mov BYTE [edi],cl mov BYTE [16+edi],dl lea edi,[1+edi] sub eax,1 jnz NEAR L$074xts_dec_steal sub edi,DWORD [112+esp] mov edx,ebp mov ecx,ebx movups xmm2,[edi] xorps xmm2,xmm6 movups xmm0,[edx] movups xmm1,[16+edx] lea edx,[32+edx] xorps xmm2,xmm0 L$075dec1_loop_14: db 102,15,56,222,209 dec ecx movups xmm1,[edx] lea edx,[16+edx] jnz NEAR L$075dec1_loop_14 db 102,15,56,223,209 xorps xmm2,xmm6 movups [edi],xmm2 L$071xts_dec_ret: pxor xmm0,xmm0 pxor xmm1,xmm1 pxor xmm2,xmm2 movdqa [esp],xmm0 pxor xmm3,xmm3 movdqa [16+esp],xmm0 pxor xmm4,xmm4 movdqa [32+esp],xmm0 pxor xmm5,xmm5 movdqa [48+esp],xmm0 pxor xmm6,xmm6 movdqa [64+esp],xmm0 pxor xmm7,xmm7 movdqa [80+esp],xmm0 mov esp,DWORD [116+esp] pop edi pop esi pop ebx pop ebp ret global _aes_hw_cbc_encrypt align 16 _aes_hw_cbc_encrypt: L$_aes_hw_cbc_encrypt_begin: push ebp push ebx push esi push edi mov esi,DWORD [20+esp] mov ebx,esp mov edi,DWORD [24+esp] sub ebx,24 mov eax,DWORD [28+esp] and ebx,-16 mov edx,DWORD [32+esp] mov ebp,DWORD [36+esp] test eax,eax jz NEAR L$076cbc_abort cmp DWORD [40+esp],0 xchg ebx,esp movups xmm7,[ebp] mov ecx,DWORD [240+edx] mov ebp,edx mov DWORD [16+esp],ebx mov ebx,ecx je NEAR L$077cbc_decrypt movaps xmm2,xmm7 cmp eax,16 jb NEAR L$078cbc_enc_tail sub eax,16 jmp NEAR L$079cbc_enc_loop align 16 L$079cbc_enc_loop: movups xmm7,[esi] lea esi,[16+esi] movups xmm0,[edx] movups xmm1,[16+edx] xorps xmm7,xmm0 lea edx,[32+edx] xorps xmm2,xmm7 L$080enc1_loop_15: db 102,15,56,220,209 dec ecx movups xmm1,[edx] lea edx,[16+edx] jnz NEAR L$080enc1_loop_15 db 102,15,56,221,209 mov ecx,ebx mov edx,ebp movups [edi],xmm2 lea edi,[16+edi] sub eax,16 jnc NEAR L$079cbc_enc_loop add eax,16 jnz NEAR L$078cbc_enc_tail movaps xmm7,xmm2 pxor xmm2,xmm2 jmp NEAR L$081cbc_ret L$078cbc_enc_tail: mov ecx,eax dd 2767451785 mov ecx,16 sub ecx,eax xor eax,eax dd 2868115081 lea edi,[edi-16] mov ecx,ebx mov esi,edi mov edx,ebp jmp NEAR L$079cbc_enc_loop align 16 L$077cbc_decrypt: cmp eax,80 jbe NEAR L$082cbc_dec_tail movaps [esp],xmm7 sub eax,80 jmp NEAR L$083cbc_dec_loop6_enter align 16 L$084cbc_dec_loop6: movaps [esp],xmm0 movups [edi],xmm7 lea edi,[16+edi] L$083cbc_dec_loop6_enter: movdqu xmm2,[esi] movdqu xmm3,[16+esi] movdqu xmm4,[32+esi] movdqu xmm5,[48+esi] movdqu xmm6,[64+esi] movdqu xmm7,[80+esi] call __aesni_decrypt6 movups xmm1,[esi] movups xmm0,[16+esi] xorps xmm2,[esp] xorps xmm3,xmm1 movups xmm1,[32+esi] xorps xmm4,xmm0 movups xmm0,[48+esi] xorps xmm5,xmm1 movups xmm1,[64+esi] xorps xmm6,xmm0 movups xmm0,[80+esi] xorps xmm7,xmm1 movups [edi],xmm2 movups [16+edi],xmm3 lea esi,[96+esi] movups [32+edi],xmm4 mov ecx,ebx movups [48+edi],xmm5 mov edx,ebp movups [64+edi],xmm6 lea edi,[80+edi] sub eax,96 ja NEAR L$084cbc_dec_loop6 movaps xmm2,xmm7 movaps xmm7,xmm0 add eax,80 jle NEAR L$085cbc_dec_clear_tail_collected movups [edi],xmm2 lea edi,[16+edi] L$082cbc_dec_tail: movups xmm2,[esi] movaps xmm6,xmm2 cmp eax,16 jbe NEAR L$086cbc_dec_one movups xmm3,[16+esi] movaps xmm5,xmm3 cmp eax,32 jbe NEAR L$087cbc_dec_two movups xmm4,[32+esi] cmp eax,48 jbe NEAR L$088cbc_dec_three movups xmm5,[48+esi] cmp eax,64 jbe NEAR L$089cbc_dec_four movups xmm6,[64+esi] movaps [esp],xmm7 movups xmm2,[esi] xorps xmm7,xmm7 call __aesni_decrypt6 movups xmm1,[esi] movups xmm0,[16+esi] xorps xmm2,[esp] xorps xmm3,xmm1 movups xmm1,[32+esi] xorps xmm4,xmm0 movups xmm0,[48+esi] xorps xmm5,xmm1 movups xmm7,[64+esi] xorps xmm6,xmm0 movups [edi],xmm2 movups [16+edi],xmm3 pxor xmm3,xmm3 movups [32+edi],xmm4 pxor xmm4,xmm4 movups [48+edi],xmm5 pxor xmm5,xmm5 lea edi,[64+edi] movaps xmm2,xmm6 pxor xmm6,xmm6 sub eax,80 jmp NEAR L$090cbc_dec_tail_collected align 16 L$086cbc_dec_one: movups xmm0,[edx] movups xmm1,[16+edx] lea edx,[32+edx] xorps xmm2,xmm0 L$091dec1_loop_16: db 102,15,56,222,209 dec ecx movups xmm1,[edx] lea edx,[16+edx] jnz NEAR L$091dec1_loop_16 db 102,15,56,223,209 xorps xmm2,xmm7 movaps xmm7,xmm6 sub eax,16 jmp NEAR L$090cbc_dec_tail_collected align 16 L$087cbc_dec_two: call __aesni_decrypt2 xorps xmm2,xmm7 xorps xmm3,xmm6 movups [edi],xmm2 movaps xmm2,xmm3 pxor xmm3,xmm3 lea edi,[16+edi] movaps xmm7,xmm5 sub eax,32 jmp NEAR L$090cbc_dec_tail_collected align 16 L$088cbc_dec_three: call __aesni_decrypt3 xorps xmm2,xmm7 xorps xmm3,xmm6 xorps xmm4,xmm5 movups [edi],xmm2 movaps xmm2,xmm4 pxor xmm4,xmm4 movups [16+edi],xmm3 pxor xmm3,xmm3 lea edi,[32+edi] movups xmm7,[32+esi] sub eax,48 jmp NEAR L$090cbc_dec_tail_collected align 16 L$089cbc_dec_four: call __aesni_decrypt4 movups xmm1,[16+esi] movups xmm0,[32+esi] xorps xmm2,xmm7 movups xmm7,[48+esi] xorps xmm3,xmm6 movups [edi],xmm2 xorps xmm4,xmm1 movups [16+edi],xmm3 pxor xmm3,xmm3 xorps xmm5,xmm0 movups [32+edi],xmm4 pxor xmm4,xmm4 lea edi,[48+edi] movaps xmm2,xmm5 pxor xmm5,xmm5 sub eax,64 jmp NEAR L$090cbc_dec_tail_collected align 16 L$085cbc_dec_clear_tail_collected: pxor xmm3,xmm3 pxor xmm4,xmm4 pxor xmm5,xmm5 pxor xmm6,xmm6 L$090cbc_dec_tail_collected: and eax,15 jnz NEAR L$092cbc_dec_tail_partial movups [edi],xmm2 pxor xmm0,xmm0 jmp NEAR L$081cbc_ret align 16 L$092cbc_dec_tail_partial: movaps [esp],xmm2 pxor xmm0,xmm0 mov ecx,16 mov esi,esp sub ecx,eax dd 2767451785 movdqa [esp],xmm2 L$081cbc_ret: mov esp,DWORD [16+esp] mov ebp,DWORD [36+esp] pxor xmm2,xmm2 pxor xmm1,xmm1 movups [ebp],xmm7 pxor xmm7,xmm7 L$076cbc_abort: pop edi pop esi pop ebx pop ebp ret global _aes_hw_set_encrypt_key_base align 16 _aes_hw_set_encrypt_key_base: L$_aes_hw_set_encrypt_key_base_begin: %ifdef BORINGSSL_DISPATCH_TEST push ebx push edx call L$093pic_for_function_hit L$093pic_for_function_hit: pop ebx lea ebx,[(_BORINGSSL_function_hit+3-L$093pic_for_function_hit)+ebx] mov edx,1 mov BYTE [ebx],dl pop edx pop ebx %endif mov eax,DWORD [4+esp] mov ecx,DWORD [8+esp] mov edx,DWORD [12+esp] push ebx call L$094pic L$094pic: pop ebx lea ebx,[(L$key_const-L$094pic)+ebx] movups xmm0,[eax] xorps xmm4,xmm4 lea edx,[16+edx] cmp ecx,256 je NEAR L$09514rounds cmp ecx,192 je NEAR L$09612rounds cmp ecx,128 jne NEAR L$097bad_keybits align 16 L$09810rounds: mov ecx,9 movups [edx-16],xmm0 db 102,15,58,223,200,1 call L$099key_128_cold db 102,15,58,223,200,2 call L$100key_128 db 102,15,58,223,200,4 call L$100key_128 db 102,15,58,223,200,8 call L$100key_128 db 102,15,58,223,200,16 call L$100key_128 db 102,15,58,223,200,32 call L$100key_128 db 102,15,58,223,200,64 call L$100key_128 db 102,15,58,223,200,128 call L$100key_128 db 102,15,58,223,200,27 call L$100key_128 db 102,15,58,223,200,54 call L$100key_128 movups [edx],xmm0 mov DWORD [80+edx],ecx jmp NEAR L$101good_key align 16 L$100key_128: movups [edx],xmm0 lea edx,[16+edx] L$099key_128_cold: shufps xmm4,xmm0,16 xorps xmm0,xmm4 shufps xmm4,xmm0,140 xorps xmm0,xmm4 shufps xmm1,xmm1,255 xorps xmm0,xmm1 ret align 16 L$09612rounds: movq xmm2,[16+eax] mov ecx,11 movups [edx-16],xmm0 db 102,15,58,223,202,1 call L$102key_192a_cold db 102,15,58,223,202,2 call L$103key_192b db 102,15,58,223,202,4 call L$104key_192a db 102,15,58,223,202,8 call L$103key_192b db 102,15,58,223,202,16 call L$104key_192a db 102,15,58,223,202,32 call L$103key_192b db 102,15,58,223,202,64 call L$104key_192a db 102,15,58,223,202,128 call L$103key_192b movups [edx],xmm0 mov DWORD [48+edx],ecx jmp NEAR L$101good_key align 16 L$104key_192a: movups [edx],xmm0 lea edx,[16+edx] align 16 L$102key_192a_cold: movaps xmm5,xmm2 L$105key_192b_warm: shufps xmm4,xmm0,16 movdqa xmm3,xmm2 xorps xmm0,xmm4 shufps xmm4,xmm0,140 pslldq xmm3,4 xorps xmm0,xmm4 pshufd xmm1,xmm1,85 pxor xmm2,xmm3 pxor xmm0,xmm1 pshufd xmm3,xmm0,255 pxor xmm2,xmm3 ret align 16 L$103key_192b: movaps xmm3,xmm0 shufps xmm5,xmm0,68 movups [edx],xmm5 shufps xmm3,xmm2,78 movups [16+edx],xmm3 lea edx,[32+edx] jmp NEAR L$105key_192b_warm align 16 L$09514rounds: movups xmm2,[16+eax] lea edx,[16+edx] mov ecx,13 movups [edx-32],xmm0 movups [edx-16],xmm2 db 102,15,58,223,202,1 call L$106key_256a_cold db 102,15,58,223,200,1 call L$107key_256b db 102,15,58,223,202,2 call L$108key_256a db 102,15,58,223,200,2 call L$107key_256b db 102,15,58,223,202,4 call L$108key_256a db 102,15,58,223,200,4 call L$107key_256b db 102,15,58,223,202,8 call L$108key_256a db 102,15,58,223,200,8 call L$107key_256b db 102,15,58,223,202,16 call L$108key_256a db 102,15,58,223,200,16 call L$107key_256b db 102,15,58,223,202,32 call L$108key_256a db 102,15,58,223,200,32 call L$107key_256b db 102,15,58,223,202,64 call L$108key_256a movups [edx],xmm0 mov DWORD [16+edx],ecx xor eax,eax jmp NEAR L$101good_key align 16 L$108key_256a: movups [edx],xmm2 lea edx,[16+edx] L$106key_256a_cold: shufps xmm4,xmm0,16 xorps xmm0,xmm4 shufps xmm4,xmm0,140 xorps xmm0,xmm4 shufps xmm1,xmm1,255 xorps xmm0,xmm1 ret align 16 L$107key_256b: movups [edx],xmm0 lea edx,[16+edx] shufps xmm4,xmm2,16 xorps xmm2,xmm4 shufps xmm4,xmm2,140 xorps xmm2,xmm4 shufps xmm1,xmm1,170 xorps xmm2,xmm1 ret L$101good_key: pxor xmm0,xmm0 pxor xmm1,xmm1 pxor xmm2,xmm2 pxor xmm3,xmm3 pxor xmm4,xmm4 pxor xmm5,xmm5 xor eax,eax pop ebx ret align 4 L$097bad_keybits: pxor xmm0,xmm0 mov eax,-2 pop ebx ret global _aes_hw_set_encrypt_key_alt align 16 _aes_hw_set_encrypt_key_alt: L$_aes_hw_set_encrypt_key_alt_begin: %ifdef BORINGSSL_DISPATCH_TEST push ebx push edx call L$109pic_for_function_hit L$109pic_for_function_hit: pop ebx lea ebx,[(_BORINGSSL_function_hit+3-L$109pic_for_function_hit)+ebx] mov edx,1 mov BYTE [ebx],dl pop edx pop ebx %endif mov eax,DWORD [4+esp] mov ecx,DWORD [8+esp] mov edx,DWORD [12+esp] push ebx call L$110pic L$110pic: pop ebx lea ebx,[(L$key_const-L$110pic)+ebx] movups xmm0,[eax] xorps xmm4,xmm4 lea edx,[16+edx] cmp ecx,256 je NEAR L$11114rounds_alt cmp ecx,192 je NEAR L$11212rounds_alt cmp ecx,128 jne NEAR L$113bad_keybits align 16 L$11410rounds_alt: movdqa xmm5,[ebx] mov ecx,8 movdqa xmm4,[32+ebx] movdqa xmm2,xmm0 movdqu [edx-16],xmm0 L$115loop_key128: db 102,15,56,0,197 db 102,15,56,221,196 pslld xmm4,1 lea edx,[16+edx] movdqa xmm3,xmm2 pslldq xmm2,4 pxor xmm3,xmm2 pslldq xmm2,4 pxor xmm3,xmm2 pslldq xmm2,4 pxor xmm2,xmm3 pxor xmm0,xmm2 movdqu [edx-16],xmm0 movdqa xmm2,xmm0 dec ecx jnz NEAR L$115loop_key128 movdqa xmm4,[48+ebx] db 102,15,56,0,197 db 102,15,56,221,196 pslld xmm4,1 movdqa xmm3,xmm2 pslldq xmm2,4 pxor xmm3,xmm2 pslldq xmm2,4 pxor xmm3,xmm2 pslldq xmm2,4 pxor xmm2,xmm3 pxor xmm0,xmm2 movdqu [edx],xmm0 movdqa xmm2,xmm0 db 102,15,56,0,197 db 102,15,56,221,196 movdqa xmm3,xmm2 pslldq xmm2,4 pxor xmm3,xmm2 pslldq xmm2,4 pxor xmm3,xmm2 pslldq xmm2,4 pxor xmm2,xmm3 pxor xmm0,xmm2 movdqu [16+edx],xmm0 mov ecx,9 mov DWORD [96+edx],ecx jmp NEAR L$116good_key align 16 L$11212rounds_alt: movq xmm2,[16+eax] movdqa xmm5,[16+ebx] movdqa xmm4,[32+ebx] mov ecx,8 movdqu [edx-16],xmm0 L$117loop_key192: movq [edx],xmm2 movdqa xmm1,xmm2 db 102,15,56,0,213 db 102,15,56,221,212 pslld xmm4,1 lea edx,[24+edx] movdqa xmm3,xmm0 pslldq xmm0,4 pxor xmm3,xmm0 pslldq xmm0,4 pxor xmm3,xmm0 pslldq xmm0,4 pxor xmm0,xmm3 pshufd xmm3,xmm0,255 pxor xmm3,xmm1 pslldq xmm1,4 pxor xmm3,xmm1 pxor xmm0,xmm2 pxor xmm2,xmm3 movdqu [edx-16],xmm0 dec ecx jnz NEAR L$117loop_key192 mov ecx,11 mov DWORD [32+edx],ecx jmp NEAR L$116good_key align 16 L$11114rounds_alt: movups xmm2,[16+eax] lea edx,[16+edx] movdqa xmm5,[ebx] movdqa xmm4,[32+ebx] mov ecx,7 movdqu [edx-32],xmm0 movdqa xmm1,xmm2 movdqu [edx-16],xmm2 L$118loop_key256: db 102,15,56,0,213 db 102,15,56,221,212 movdqa xmm3,xmm0 pslldq xmm0,4 pxor xmm3,xmm0 pslldq xmm0,4 pxor xmm3,xmm0 pslldq xmm0,4 pxor xmm0,xmm3 pslld xmm4,1 pxor xmm0,xmm2 movdqu [edx],xmm0 dec ecx jz NEAR L$119done_key256 pshufd xmm2,xmm0,255 pxor xmm3,xmm3 db 102,15,56,221,211 movdqa xmm3,xmm1 pslldq xmm1,4 pxor xmm3,xmm1 pslldq xmm1,4 pxor xmm3,xmm1 pslldq xmm1,4 pxor xmm1,xmm3 pxor xmm2,xmm1 movdqu [16+edx],xmm2 lea edx,[32+edx] movdqa xmm1,xmm2 jmp NEAR L$118loop_key256 L$119done_key256: mov ecx,13 mov DWORD [16+edx],ecx L$116good_key: pxor xmm0,xmm0 pxor xmm1,xmm1 pxor xmm2,xmm2 pxor xmm3,xmm3 pxor xmm4,xmm4 pxor xmm5,xmm5 xor eax,eax pop ebx ret align 4 L$113bad_keybits: pxor xmm0,xmm0 mov eax,-2 pop ebx ret global _aes_hw_encrypt_key_to_decrypt_key align 16 _aes_hw_encrypt_key_to_decrypt_key: L$_aes_hw_encrypt_key_to_decrypt_key_begin: mov edx,DWORD [4+esp] mov ecx,DWORD [240+edx] shl ecx,4 lea eax,[16+ecx*1+edx] movups xmm0,[edx] movups xmm1,[eax] movups [eax],xmm0 movups [edx],xmm1 lea edx,[16+edx] lea eax,[eax-16] L$120dec_key_inverse: movups xmm0,[edx] movups xmm1,[eax] db 102,15,56,219,192 db 102,15,56,219,201 lea edx,[16+edx] lea eax,[eax-16] movups [16+eax],xmm0 movups [edx-16],xmm1 cmp eax,edx ja NEAR L$120dec_key_inverse movups xmm0,[edx] db 102,15,56,219,192 movups [edx],xmm0 pxor xmm0,xmm0 pxor xmm1,xmm1 ret align 64 L$key_const: dd 202313229,202313229,202313229,202313229 dd 67569157,67569157,67569157,67569157 dd 1,1,1,1 dd 27,27,27,27 db 65,69,83,32,102,111,114,32,73,110,116,101,108,32,65,69 db 83,45,78,73,44,32,67,82,89,80,84,79,71,65,77,83 db 32,98,121,32,60,97,112,112,114,111,64,111,112,101,110,115 db 115,108,46,111,114,103,62,0 %else ; Work around https://bugzilla.nasm.us/show_bug.cgi?id=3392738 ret %endif