mirror of
https://github.com/pineappleEA/pineapple-src.git
synced 2024-11-29 18:08:25 -05:00
2804 lines
54 KiB
ArmAsm
2804 lines
54 KiB
ArmAsm
|
; 1 "crypto/aes/bsaes-masm-x86_64.S.tmp"
|
||
|
; 1 "<built-in>" 1
|
||
|
; 1 "<built-in>" 3
|
||
|
; 340 "<built-in>" 3
|
||
|
; 1 "<command line>" 1
|
||
|
; 1 "<built-in>" 2
|
||
|
; 1 "crypto/aes/bsaes-masm-x86_64.S.tmp" 2
|
||
|
OPTION DOTNAME
|
||
|
|
||
|
; 1 "./crypto/x86_arch.h" 1
|
||
|
|
||
|
|
||
|
; 16 "./crypto/x86_arch.h"
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
; 40 "./crypto/x86_arch.h"
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
; 3 "crypto/aes/bsaes-masm-x86_64.S.tmp" 2
|
||
|
.text$ SEGMENT ALIGN(64) 'CODE'
|
||
|
|
||
|
EXTERN asm_AES_encrypt:NEAR
|
||
|
EXTERN asm_AES_decrypt:NEAR
|
||
|
|
||
|
|
||
|
ALIGN 64
|
||
|
_bsaes_encrypt8 PROC PRIVATE
|
||
|
lea r11,QWORD PTR[$L$BS0]
|
||
|
|
||
|
movdqa xmm8,XMMWORD PTR[rax]
|
||
|
lea rax,QWORD PTR[16+rax]
|
||
|
movdqa xmm7,XMMWORD PTR[80+r11]
|
||
|
pxor xmm15,xmm8
|
||
|
pxor xmm0,xmm8
|
||
|
DB 102,68,15,56,0,255
|
||
|
pxor xmm1,xmm8
|
||
|
DB 102,15,56,0,199
|
||
|
pxor xmm2,xmm8
|
||
|
DB 102,15,56,0,207
|
||
|
pxor xmm3,xmm8
|
||
|
DB 102,15,56,0,215
|
||
|
pxor xmm4,xmm8
|
||
|
DB 102,15,56,0,223
|
||
|
pxor xmm5,xmm8
|
||
|
DB 102,15,56,0,231
|
||
|
pxor xmm6,xmm8
|
||
|
DB 102,15,56,0,239
|
||
|
DB 102,15,56,0,247
|
||
|
_bsaes_encrypt8_bitslice::
|
||
|
movdqa xmm7,XMMWORD PTR[r11]
|
||
|
movdqa xmm8,XMMWORD PTR[16+r11]
|
||
|
movdqa xmm9,xmm5
|
||
|
psrlq xmm5,1
|
||
|
movdqa xmm10,xmm3
|
||
|
psrlq xmm3,1
|
||
|
pxor xmm5,xmm6
|
||
|
pxor xmm3,xmm4
|
||
|
pand xmm5,xmm7
|
||
|
pand xmm3,xmm7
|
||
|
pxor xmm6,xmm5
|
||
|
psllq xmm5,1
|
||
|
pxor xmm4,xmm3
|
||
|
psllq xmm3,1
|
||
|
pxor xmm5,xmm9
|
||
|
pxor xmm3,xmm10
|
||
|
movdqa xmm9,xmm1
|
||
|
psrlq xmm1,1
|
||
|
movdqa xmm10,xmm15
|
||
|
psrlq xmm15,1
|
||
|
pxor xmm1,xmm2
|
||
|
pxor xmm15,xmm0
|
||
|
pand xmm1,xmm7
|
||
|
pand xmm15,xmm7
|
||
|
pxor xmm2,xmm1
|
||
|
psllq xmm1,1
|
||
|
pxor xmm0,xmm15
|
||
|
psllq xmm15,1
|
||
|
pxor xmm1,xmm9
|
||
|
pxor xmm15,xmm10
|
||
|
movdqa xmm7,XMMWORD PTR[32+r11]
|
||
|
movdqa xmm9,xmm4
|
||
|
psrlq xmm4,2
|
||
|
movdqa xmm10,xmm3
|
||
|
psrlq xmm3,2
|
||
|
pxor xmm4,xmm6
|
||
|
pxor xmm3,xmm5
|
||
|
pand xmm4,xmm8
|
||
|
pand xmm3,xmm8
|
||
|
pxor xmm6,xmm4
|
||
|
psllq xmm4,2
|
||
|
pxor xmm5,xmm3
|
||
|
psllq xmm3,2
|
||
|
pxor xmm4,xmm9
|
||
|
pxor xmm3,xmm10
|
||
|
movdqa xmm9,xmm0
|
||
|
psrlq xmm0,2
|
||
|
movdqa xmm10,xmm15
|
||
|
psrlq xmm15,2
|
||
|
pxor xmm0,xmm2
|
||
|
pxor xmm15,xmm1
|
||
|
pand xmm0,xmm8
|
||
|
pand xmm15,xmm8
|
||
|
pxor xmm2,xmm0
|
||
|
psllq xmm0,2
|
||
|
pxor xmm1,xmm15
|
||
|
psllq xmm15,2
|
||
|
pxor xmm0,xmm9
|
||
|
pxor xmm15,xmm10
|
||
|
movdqa xmm9,xmm2
|
||
|
psrlq xmm2,4
|
||
|
movdqa xmm10,xmm1
|
||
|
psrlq xmm1,4
|
||
|
pxor xmm2,xmm6
|
||
|
pxor xmm1,xmm5
|
||
|
pand xmm2,xmm7
|
||
|
pand xmm1,xmm7
|
||
|
pxor xmm6,xmm2
|
||
|
psllq xmm2,4
|
||
|
pxor xmm5,xmm1
|
||
|
psllq xmm1,4
|
||
|
pxor xmm2,xmm9
|
||
|
pxor xmm1,xmm10
|
||
|
movdqa xmm9,xmm0
|
||
|
psrlq xmm0,4
|
||
|
movdqa xmm10,xmm15
|
||
|
psrlq xmm15,4
|
||
|
pxor xmm0,xmm4
|
||
|
pxor xmm15,xmm3
|
||
|
pand xmm0,xmm7
|
||
|
pand xmm15,xmm7
|
||
|
pxor xmm4,xmm0
|
||
|
psllq xmm0,4
|
||
|
pxor xmm3,xmm15
|
||
|
psllq xmm15,4
|
||
|
pxor xmm0,xmm9
|
||
|
pxor xmm15,xmm10
|
||
|
dec r10d
|
||
|
jmp $L$enc_sbox
|
||
|
ALIGN 16
|
||
|
$L$enc_loop::
|
||
|
pxor xmm15,XMMWORD PTR[rax]
|
||
|
pxor xmm0,XMMWORD PTR[16+rax]
|
||
|
DB 102,68,15,56,0,255
|
||
|
pxor xmm1,XMMWORD PTR[32+rax]
|
||
|
DB 102,15,56,0,199
|
||
|
pxor xmm2,XMMWORD PTR[48+rax]
|
||
|
DB 102,15,56,0,207
|
||
|
pxor xmm3,XMMWORD PTR[64+rax]
|
||
|
DB 102,15,56,0,215
|
||
|
pxor xmm4,XMMWORD PTR[80+rax]
|
||
|
DB 102,15,56,0,223
|
||
|
pxor xmm5,XMMWORD PTR[96+rax]
|
||
|
DB 102,15,56,0,231
|
||
|
pxor xmm6,XMMWORD PTR[112+rax]
|
||
|
DB 102,15,56,0,239
|
||
|
lea rax,QWORD PTR[128+rax]
|
||
|
DB 102,15,56,0,247
|
||
|
$L$enc_sbox::
|
||
|
pxor xmm4,xmm5
|
||
|
pxor xmm1,xmm0
|
||
|
pxor xmm2,xmm15
|
||
|
pxor xmm5,xmm1
|
||
|
pxor xmm4,xmm15
|
||
|
|
||
|
pxor xmm5,xmm2
|
||
|
pxor xmm2,xmm6
|
||
|
pxor xmm6,xmm4
|
||
|
pxor xmm2,xmm3
|
||
|
pxor xmm3,xmm4
|
||
|
pxor xmm2,xmm0
|
||
|
|
||
|
pxor xmm1,xmm6
|
||
|
pxor xmm0,xmm4
|
||
|
movdqa xmm10,xmm6
|
||
|
movdqa xmm9,xmm0
|
||
|
movdqa xmm8,xmm4
|
||
|
movdqa xmm12,xmm1
|
||
|
movdqa xmm11,xmm5
|
||
|
|
||
|
pxor xmm10,xmm3
|
||
|
pxor xmm9,xmm1
|
||
|
pxor xmm8,xmm2
|
||
|
movdqa xmm13,xmm10
|
||
|
pxor xmm12,xmm3
|
||
|
movdqa xmm7,xmm9
|
||
|
pxor xmm11,xmm15
|
||
|
movdqa xmm14,xmm10
|
||
|
|
||
|
por xmm9,xmm8
|
||
|
por xmm10,xmm11
|
||
|
pxor xmm14,xmm7
|
||
|
pand xmm13,xmm11
|
||
|
pxor xmm11,xmm8
|
||
|
pand xmm7,xmm8
|
||
|
pand xmm14,xmm11
|
||
|
movdqa xmm11,xmm2
|
||
|
pxor xmm11,xmm15
|
||
|
pand xmm12,xmm11
|
||
|
pxor xmm10,xmm12
|
||
|
pxor xmm9,xmm12
|
||
|
movdqa xmm12,xmm6
|
||
|
movdqa xmm11,xmm4
|
||
|
pxor xmm12,xmm0
|
||
|
pxor xmm11,xmm5
|
||
|
movdqa xmm8,xmm12
|
||
|
pand xmm12,xmm11
|
||
|
por xmm8,xmm11
|
||
|
pxor xmm7,xmm12
|
||
|
pxor xmm10,xmm14
|
||
|
pxor xmm9,xmm13
|
||
|
pxor xmm8,xmm14
|
||
|
movdqa xmm11,xmm1
|
||
|
pxor xmm7,xmm13
|
||
|
movdqa xmm12,xmm3
|
||
|
pxor xmm8,xmm13
|
||
|
movdqa xmm13,xmm0
|
||
|
pand xmm11,xmm2
|
||
|
movdqa xmm14,xmm6
|
||
|
pand xmm12,xmm15
|
||
|
pand xmm13,xmm4
|
||
|
por xmm14,xmm5
|
||
|
pxor xmm10,xmm11
|
||
|
pxor xmm9,xmm12
|
||
|
pxor xmm8,xmm13
|
||
|
pxor xmm7,xmm14
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
movdqa xmm11,xmm10
|
||
|
pand xmm10,xmm8
|
||
|
pxor xmm11,xmm9
|
||
|
|
||
|
movdqa xmm13,xmm7
|
||
|
movdqa xmm14,xmm11
|
||
|
pxor xmm13,xmm10
|
||
|
pand xmm14,xmm13
|
||
|
|
||
|
movdqa xmm12,xmm8
|
||
|
pxor xmm14,xmm9
|
||
|
pxor xmm12,xmm7
|
||
|
|
||
|
pxor xmm10,xmm9
|
||
|
|
||
|
pand xmm12,xmm10
|
||
|
|
||
|
movdqa xmm9,xmm13
|
||
|
pxor xmm12,xmm7
|
||
|
|
||
|
pxor xmm9,xmm12
|
||
|
pxor xmm8,xmm12
|
||
|
|
||
|
pand xmm9,xmm7
|
||
|
|
||
|
pxor xmm13,xmm9
|
||
|
pxor xmm8,xmm9
|
||
|
|
||
|
pand xmm13,xmm14
|
||
|
|
||
|
pxor xmm13,xmm11
|
||
|
movdqa xmm11,xmm5
|
||
|
movdqa xmm7,xmm4
|
||
|
movdqa xmm9,xmm14
|
||
|
pxor xmm9,xmm13
|
||
|
pand xmm9,xmm5
|
||
|
pxor xmm5,xmm4
|
||
|
pand xmm4,xmm14
|
||
|
pand xmm5,xmm13
|
||
|
pxor xmm5,xmm4
|
||
|
pxor xmm4,xmm9
|
||
|
pxor xmm11,xmm15
|
||
|
pxor xmm7,xmm2
|
||
|
pxor xmm14,xmm12
|
||
|
pxor xmm13,xmm8
|
||
|
movdqa xmm10,xmm14
|
||
|
movdqa xmm9,xmm12
|
||
|
pxor xmm10,xmm13
|
||
|
pxor xmm9,xmm8
|
||
|
pand xmm10,xmm11
|
||
|
pand xmm9,xmm15
|
||
|
pxor xmm11,xmm7
|
||
|
pxor xmm15,xmm2
|
||
|
pand xmm7,xmm14
|
||
|
pand xmm2,xmm12
|
||
|
pand xmm11,xmm13
|
||
|
pand xmm15,xmm8
|
||
|
pxor xmm7,xmm11
|
||
|
pxor xmm15,xmm2
|
||
|
pxor xmm11,xmm10
|
||
|
pxor xmm2,xmm9
|
||
|
pxor xmm5,xmm11
|
||
|
pxor xmm15,xmm11
|
||
|
pxor xmm4,xmm7
|
||
|
pxor xmm2,xmm7
|
||
|
|
||
|
movdqa xmm11,xmm6
|
||
|
movdqa xmm7,xmm0
|
||
|
pxor xmm11,xmm3
|
||
|
pxor xmm7,xmm1
|
||
|
movdqa xmm10,xmm14
|
||
|
movdqa xmm9,xmm12
|
||
|
pxor xmm10,xmm13
|
||
|
pxor xmm9,xmm8
|
||
|
pand xmm10,xmm11
|
||
|
pand xmm9,xmm3
|
||
|
pxor xmm11,xmm7
|
||
|
pxor xmm3,xmm1
|
||
|
pand xmm7,xmm14
|
||
|
pand xmm1,xmm12
|
||
|
pand xmm11,xmm13
|
||
|
pand xmm3,xmm8
|
||
|
pxor xmm7,xmm11
|
||
|
pxor xmm3,xmm1
|
||
|
pxor xmm11,xmm10
|
||
|
pxor xmm1,xmm9
|
||
|
pxor xmm14,xmm12
|
||
|
pxor xmm13,xmm8
|
||
|
movdqa xmm10,xmm14
|
||
|
pxor xmm10,xmm13
|
||
|
pand xmm10,xmm6
|
||
|
pxor xmm6,xmm0
|
||
|
pand xmm0,xmm14
|
||
|
pand xmm6,xmm13
|
||
|
pxor xmm6,xmm0
|
||
|
pxor xmm0,xmm10
|
||
|
pxor xmm6,xmm11
|
||
|
pxor xmm3,xmm11
|
||
|
pxor xmm0,xmm7
|
||
|
pxor xmm1,xmm7
|
||
|
pxor xmm6,xmm15
|
||
|
pxor xmm0,xmm5
|
||
|
pxor xmm3,xmm6
|
||
|
pxor xmm5,xmm15
|
||
|
pxor xmm15,xmm0
|
||
|
|
||
|
pxor xmm0,xmm4
|
||
|
pxor xmm4,xmm1
|
||
|
pxor xmm1,xmm2
|
||
|
pxor xmm2,xmm4
|
||
|
pxor xmm3,xmm4
|
||
|
|
||
|
pxor xmm5,xmm2
|
||
|
dec r10d
|
||
|
jl $L$enc_done
|
||
|
pshufd xmm7,xmm15,093h
|
||
|
pshufd xmm8,xmm0,093h
|
||
|
pxor xmm15,xmm7
|
||
|
pshufd xmm9,xmm3,093h
|
||
|
pxor xmm0,xmm8
|
||
|
pshufd xmm10,xmm5,093h
|
||
|
pxor xmm3,xmm9
|
||
|
pshufd xmm11,xmm2,093h
|
||
|
pxor xmm5,xmm10
|
||
|
pshufd xmm12,xmm6,093h
|
||
|
pxor xmm2,xmm11
|
||
|
pshufd xmm13,xmm1,093h
|
||
|
pxor xmm6,xmm12
|
||
|
pshufd xmm14,xmm4,093h
|
||
|
pxor xmm1,xmm13
|
||
|
pxor xmm4,xmm14
|
||
|
|
||
|
pxor xmm8,xmm15
|
||
|
pxor xmm7,xmm4
|
||
|
pxor xmm8,xmm4
|
||
|
pshufd xmm15,xmm15,04Eh
|
||
|
pxor xmm9,xmm0
|
||
|
pshufd xmm0,xmm0,04Eh
|
||
|
pxor xmm12,xmm2
|
||
|
pxor xmm15,xmm7
|
||
|
pxor xmm13,xmm6
|
||
|
pxor xmm0,xmm8
|
||
|
pxor xmm11,xmm5
|
||
|
pshufd xmm7,xmm2,04Eh
|
||
|
pxor xmm14,xmm1
|
||
|
pshufd xmm8,xmm6,04Eh
|
||
|
pxor xmm10,xmm3
|
||
|
pshufd xmm2,xmm5,04Eh
|
||
|
pxor xmm10,xmm4
|
||
|
pshufd xmm6,xmm4,04Eh
|
||
|
pxor xmm11,xmm4
|
||
|
pshufd xmm5,xmm1,04Eh
|
||
|
pxor xmm7,xmm11
|
||
|
pshufd xmm1,xmm3,04Eh
|
||
|
pxor xmm8,xmm12
|
||
|
pxor xmm2,xmm10
|
||
|
pxor xmm6,xmm14
|
||
|
pxor xmm5,xmm13
|
||
|
movdqa xmm3,xmm7
|
||
|
pxor xmm1,xmm9
|
||
|
movdqa xmm4,xmm8
|
||
|
movdqa xmm7,XMMWORD PTR[48+r11]
|
||
|
jnz $L$enc_loop
|
||
|
movdqa xmm7,XMMWORD PTR[64+r11]
|
||
|
jmp $L$enc_loop
|
||
|
ALIGN 16
|
||
|
$L$enc_done::
|
||
|
movdqa xmm7,XMMWORD PTR[r11]
|
||
|
movdqa xmm8,XMMWORD PTR[16+r11]
|
||
|
movdqa xmm9,xmm1
|
||
|
psrlq xmm1,1
|
||
|
movdqa xmm10,xmm2
|
||
|
psrlq xmm2,1
|
||
|
pxor xmm1,xmm4
|
||
|
pxor xmm2,xmm6
|
||
|
pand xmm1,xmm7
|
||
|
pand xmm2,xmm7
|
||
|
pxor xmm4,xmm1
|
||
|
psllq xmm1,1
|
||
|
pxor xmm6,xmm2
|
||
|
psllq xmm2,1
|
||
|
pxor xmm1,xmm9
|
||
|
pxor xmm2,xmm10
|
||
|
movdqa xmm9,xmm3
|
||
|
psrlq xmm3,1
|
||
|
movdqa xmm10,xmm15
|
||
|
psrlq xmm15,1
|
||
|
pxor xmm3,xmm5
|
||
|
pxor xmm15,xmm0
|
||
|
pand xmm3,xmm7
|
||
|
pand xmm15,xmm7
|
||
|
pxor xmm5,xmm3
|
||
|
psllq xmm3,1
|
||
|
pxor xmm0,xmm15
|
||
|
psllq xmm15,1
|
||
|
pxor xmm3,xmm9
|
||
|
pxor xmm15,xmm10
|
||
|
movdqa xmm7,XMMWORD PTR[32+r11]
|
||
|
movdqa xmm9,xmm6
|
||
|
psrlq xmm6,2
|
||
|
movdqa xmm10,xmm2
|
||
|
psrlq xmm2,2
|
||
|
pxor xmm6,xmm4
|
||
|
pxor xmm2,xmm1
|
||
|
pand xmm6,xmm8
|
||
|
pand xmm2,xmm8
|
||
|
pxor xmm4,xmm6
|
||
|
psllq xmm6,2
|
||
|
pxor xmm1,xmm2
|
||
|
psllq xmm2,2
|
||
|
pxor xmm6,xmm9
|
||
|
pxor xmm2,xmm10
|
||
|
movdqa xmm9,xmm0
|
||
|
psrlq xmm0,2
|
||
|
movdqa xmm10,xmm15
|
||
|
psrlq xmm15,2
|
||
|
pxor xmm0,xmm5
|
||
|
pxor xmm15,xmm3
|
||
|
pand xmm0,xmm8
|
||
|
pand xmm15,xmm8
|
||
|
pxor xmm5,xmm0
|
||
|
psllq xmm0,2
|
||
|
pxor xmm3,xmm15
|
||
|
psllq xmm15,2
|
||
|
pxor xmm0,xmm9
|
||
|
pxor xmm15,xmm10
|
||
|
movdqa xmm9,xmm5
|
||
|
psrlq xmm5,4
|
||
|
movdqa xmm10,xmm3
|
||
|
psrlq xmm3,4
|
||
|
pxor xmm5,xmm4
|
||
|
pxor xmm3,xmm1
|
||
|
pand xmm5,xmm7
|
||
|
pand xmm3,xmm7
|
||
|
pxor xmm4,xmm5
|
||
|
psllq xmm5,4
|
||
|
pxor xmm1,xmm3
|
||
|
psllq xmm3,4
|
||
|
pxor xmm5,xmm9
|
||
|
pxor xmm3,xmm10
|
||
|
movdqa xmm9,xmm0
|
||
|
psrlq xmm0,4
|
||
|
movdqa xmm10,xmm15
|
||
|
psrlq xmm15,4
|
||
|
pxor xmm0,xmm6
|
||
|
pxor xmm15,xmm2
|
||
|
pand xmm0,xmm7
|
||
|
pand xmm15,xmm7
|
||
|
pxor xmm6,xmm0
|
||
|
psllq xmm0,4
|
||
|
pxor xmm2,xmm15
|
||
|
psllq xmm15,4
|
||
|
pxor xmm0,xmm9
|
||
|
pxor xmm15,xmm10
|
||
|
movdqa xmm7,XMMWORD PTR[rax]
|
||
|
pxor xmm3,xmm7
|
||
|
pxor xmm5,xmm7
|
||
|
pxor xmm2,xmm7
|
||
|
pxor xmm6,xmm7
|
||
|
pxor xmm1,xmm7
|
||
|
pxor xmm4,xmm7
|
||
|
pxor xmm15,xmm7
|
||
|
pxor xmm0,xmm7
|
||
|
DB 0F3h,0C3h ;repret
|
||
|
_bsaes_encrypt8 ENDP
|
||
|
|
||
|
|
||
|
ALIGN 64
|
||
|
_bsaes_decrypt8 PROC PRIVATE
|
||
|
lea r11,QWORD PTR[$L$BS0]
|
||
|
|
||
|
movdqa xmm8,XMMWORD PTR[rax]
|
||
|
lea rax,QWORD PTR[16+rax]
|
||
|
movdqa xmm7,XMMWORD PTR[((-48))+r11]
|
||
|
pxor xmm15,xmm8
|
||
|
pxor xmm0,xmm8
|
||
|
DB 102,68,15,56,0,255
|
||
|
pxor xmm1,xmm8
|
||
|
DB 102,15,56,0,199
|
||
|
pxor xmm2,xmm8
|
||
|
DB 102,15,56,0,207
|
||
|
pxor xmm3,xmm8
|
||
|
DB 102,15,56,0,215
|
||
|
pxor xmm4,xmm8
|
||
|
DB 102,15,56,0,223
|
||
|
pxor xmm5,xmm8
|
||
|
DB 102,15,56,0,231
|
||
|
pxor xmm6,xmm8
|
||
|
DB 102,15,56,0,239
|
||
|
DB 102,15,56,0,247
|
||
|
movdqa xmm7,XMMWORD PTR[r11]
|
||
|
movdqa xmm8,XMMWORD PTR[16+r11]
|
||
|
movdqa xmm9,xmm5
|
||
|
psrlq xmm5,1
|
||
|
movdqa xmm10,xmm3
|
||
|
psrlq xmm3,1
|
||
|
pxor xmm5,xmm6
|
||
|
pxor xmm3,xmm4
|
||
|
pand xmm5,xmm7
|
||
|
pand xmm3,xmm7
|
||
|
pxor xmm6,xmm5
|
||
|
psllq xmm5,1
|
||
|
pxor xmm4,xmm3
|
||
|
psllq xmm3,1
|
||
|
pxor xmm5,xmm9
|
||
|
pxor xmm3,xmm10
|
||
|
movdqa xmm9,xmm1
|
||
|
psrlq xmm1,1
|
||
|
movdqa xmm10,xmm15
|
||
|
psrlq xmm15,1
|
||
|
pxor xmm1,xmm2
|
||
|
pxor xmm15,xmm0
|
||
|
pand xmm1,xmm7
|
||
|
pand xmm15,xmm7
|
||
|
pxor xmm2,xmm1
|
||
|
psllq xmm1,1
|
||
|
pxor xmm0,xmm15
|
||
|
psllq xmm15,1
|
||
|
pxor xmm1,xmm9
|
||
|
pxor xmm15,xmm10
|
||
|
movdqa xmm7,XMMWORD PTR[32+r11]
|
||
|
movdqa xmm9,xmm4
|
||
|
psrlq xmm4,2
|
||
|
movdqa xmm10,xmm3
|
||
|
psrlq xmm3,2
|
||
|
pxor xmm4,xmm6
|
||
|
pxor xmm3,xmm5
|
||
|
pand xmm4,xmm8
|
||
|
pand xmm3,xmm8
|
||
|
pxor xmm6,xmm4
|
||
|
psllq xmm4,2
|
||
|
pxor xmm5,xmm3
|
||
|
psllq xmm3,2
|
||
|
pxor xmm4,xmm9
|
||
|
pxor xmm3,xmm10
|
||
|
movdqa xmm9,xmm0
|
||
|
psrlq xmm0,2
|
||
|
movdqa xmm10,xmm15
|
||
|
psrlq xmm15,2
|
||
|
pxor xmm0,xmm2
|
||
|
pxor xmm15,xmm1
|
||
|
pand xmm0,xmm8
|
||
|
pand xmm15,xmm8
|
||
|
pxor xmm2,xmm0
|
||
|
psllq xmm0,2
|
||
|
pxor xmm1,xmm15
|
||
|
psllq xmm15,2
|
||
|
pxor xmm0,xmm9
|
||
|
pxor xmm15,xmm10
|
||
|
movdqa xmm9,xmm2
|
||
|
psrlq xmm2,4
|
||
|
movdqa xmm10,xmm1
|
||
|
psrlq xmm1,4
|
||
|
pxor xmm2,xmm6
|
||
|
pxor xmm1,xmm5
|
||
|
pand xmm2,xmm7
|
||
|
pand xmm1,xmm7
|
||
|
pxor xmm6,xmm2
|
||
|
psllq xmm2,4
|
||
|
pxor xmm5,xmm1
|
||
|
psllq xmm1,4
|
||
|
pxor xmm2,xmm9
|
||
|
pxor xmm1,xmm10
|
||
|
movdqa xmm9,xmm0
|
||
|
psrlq xmm0,4
|
||
|
movdqa xmm10,xmm15
|
||
|
psrlq xmm15,4
|
||
|
pxor xmm0,xmm4
|
||
|
pxor xmm15,xmm3
|
||
|
pand xmm0,xmm7
|
||
|
pand xmm15,xmm7
|
||
|
pxor xmm4,xmm0
|
||
|
psllq xmm0,4
|
||
|
pxor xmm3,xmm15
|
||
|
psllq xmm15,4
|
||
|
pxor xmm0,xmm9
|
||
|
pxor xmm15,xmm10
|
||
|
dec r10d
|
||
|
jmp $L$dec_sbox
|
||
|
ALIGN 16
|
||
|
$L$dec_loop::
|
||
|
pxor xmm15,XMMWORD PTR[rax]
|
||
|
pxor xmm0,XMMWORD PTR[16+rax]
|
||
|
DB 102,68,15,56,0,255
|
||
|
pxor xmm1,XMMWORD PTR[32+rax]
|
||
|
DB 102,15,56,0,199
|
||
|
pxor xmm2,XMMWORD PTR[48+rax]
|
||
|
DB 102,15,56,0,207
|
||
|
pxor xmm3,XMMWORD PTR[64+rax]
|
||
|
DB 102,15,56,0,215
|
||
|
pxor xmm4,XMMWORD PTR[80+rax]
|
||
|
DB 102,15,56,0,223
|
||
|
pxor xmm5,XMMWORD PTR[96+rax]
|
||
|
DB 102,15,56,0,231
|
||
|
pxor xmm6,XMMWORD PTR[112+rax]
|
||
|
DB 102,15,56,0,239
|
||
|
lea rax,QWORD PTR[128+rax]
|
||
|
DB 102,15,56,0,247
|
||
|
$L$dec_sbox::
|
||
|
pxor xmm2,xmm3
|
||
|
|
||
|
pxor xmm3,xmm6
|
||
|
pxor xmm1,xmm6
|
||
|
pxor xmm5,xmm3
|
||
|
pxor xmm6,xmm5
|
||
|
pxor xmm0,xmm6
|
||
|
|
||
|
pxor xmm15,xmm0
|
||
|
pxor xmm1,xmm4
|
||
|
pxor xmm2,xmm15
|
||
|
pxor xmm4,xmm15
|
||
|
pxor xmm0,xmm2
|
||
|
movdqa xmm10,xmm2
|
||
|
movdqa xmm9,xmm6
|
||
|
movdqa xmm8,xmm0
|
||
|
movdqa xmm12,xmm3
|
||
|
movdqa xmm11,xmm4
|
||
|
|
||
|
pxor xmm10,xmm15
|
||
|
pxor xmm9,xmm3
|
||
|
pxor xmm8,xmm5
|
||
|
movdqa xmm13,xmm10
|
||
|
pxor xmm12,xmm15
|
||
|
movdqa xmm7,xmm9
|
||
|
pxor xmm11,xmm1
|
||
|
movdqa xmm14,xmm10
|
||
|
|
||
|
por xmm9,xmm8
|
||
|
por xmm10,xmm11
|
||
|
pxor xmm14,xmm7
|
||
|
pand xmm13,xmm11
|
||
|
pxor xmm11,xmm8
|
||
|
pand xmm7,xmm8
|
||
|
pand xmm14,xmm11
|
||
|
movdqa xmm11,xmm5
|
||
|
pxor xmm11,xmm1
|
||
|
pand xmm12,xmm11
|
||
|
pxor xmm10,xmm12
|
||
|
pxor xmm9,xmm12
|
||
|
movdqa xmm12,xmm2
|
||
|
movdqa xmm11,xmm0
|
||
|
pxor xmm12,xmm6
|
||
|
pxor xmm11,xmm4
|
||
|
movdqa xmm8,xmm12
|
||
|
pand xmm12,xmm11
|
||
|
por xmm8,xmm11
|
||
|
pxor xmm7,xmm12
|
||
|
pxor xmm10,xmm14
|
||
|
pxor xmm9,xmm13
|
||
|
pxor xmm8,xmm14
|
||
|
movdqa xmm11,xmm3
|
||
|
pxor xmm7,xmm13
|
||
|
movdqa xmm12,xmm15
|
||
|
pxor xmm8,xmm13
|
||
|
movdqa xmm13,xmm6
|
||
|
pand xmm11,xmm5
|
||
|
movdqa xmm14,xmm2
|
||
|
pand xmm12,xmm1
|
||
|
pand xmm13,xmm0
|
||
|
por xmm14,xmm4
|
||
|
pxor xmm10,xmm11
|
||
|
pxor xmm9,xmm12
|
||
|
pxor xmm8,xmm13
|
||
|
pxor xmm7,xmm14
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
movdqa xmm11,xmm10
|
||
|
pand xmm10,xmm8
|
||
|
pxor xmm11,xmm9
|
||
|
|
||
|
movdqa xmm13,xmm7
|
||
|
movdqa xmm14,xmm11
|
||
|
pxor xmm13,xmm10
|
||
|
pand xmm14,xmm13
|
||
|
|
||
|
movdqa xmm12,xmm8
|
||
|
pxor xmm14,xmm9
|
||
|
pxor xmm12,xmm7
|
||
|
|
||
|
pxor xmm10,xmm9
|
||
|
|
||
|
pand xmm12,xmm10
|
||
|
|
||
|
movdqa xmm9,xmm13
|
||
|
pxor xmm12,xmm7
|
||
|
|
||
|
pxor xmm9,xmm12
|
||
|
pxor xmm8,xmm12
|
||
|
|
||
|
pand xmm9,xmm7
|
||
|
|
||
|
pxor xmm13,xmm9
|
||
|
pxor xmm8,xmm9
|
||
|
|
||
|
pand xmm13,xmm14
|
||
|
|
||
|
pxor xmm13,xmm11
|
||
|
movdqa xmm11,xmm4
|
||
|
movdqa xmm7,xmm0
|
||
|
movdqa xmm9,xmm14
|
||
|
pxor xmm9,xmm13
|
||
|
pand xmm9,xmm4
|
||
|
pxor xmm4,xmm0
|
||
|
pand xmm0,xmm14
|
||
|
pand xmm4,xmm13
|
||
|
pxor xmm4,xmm0
|
||
|
pxor xmm0,xmm9
|
||
|
pxor xmm11,xmm1
|
||
|
pxor xmm7,xmm5
|
||
|
pxor xmm14,xmm12
|
||
|
pxor xmm13,xmm8
|
||
|
movdqa xmm10,xmm14
|
||
|
movdqa xmm9,xmm12
|
||
|
pxor xmm10,xmm13
|
||
|
pxor xmm9,xmm8
|
||
|
pand xmm10,xmm11
|
||
|
pand xmm9,xmm1
|
||
|
pxor xmm11,xmm7
|
||
|
pxor xmm1,xmm5
|
||
|
pand xmm7,xmm14
|
||
|
pand xmm5,xmm12
|
||
|
pand xmm11,xmm13
|
||
|
pand xmm1,xmm8
|
||
|
pxor xmm7,xmm11
|
||
|
pxor xmm1,xmm5
|
||
|
pxor xmm11,xmm10
|
||
|
pxor xmm5,xmm9
|
||
|
pxor xmm4,xmm11
|
||
|
pxor xmm1,xmm11
|
||
|
pxor xmm0,xmm7
|
||
|
pxor xmm5,xmm7
|
||
|
|
||
|
movdqa xmm11,xmm2
|
||
|
movdqa xmm7,xmm6
|
||
|
pxor xmm11,xmm15
|
||
|
pxor xmm7,xmm3
|
||
|
movdqa xmm10,xmm14
|
||
|
movdqa xmm9,xmm12
|
||
|
pxor xmm10,xmm13
|
||
|
pxor xmm9,xmm8
|
||
|
pand xmm10,xmm11
|
||
|
pand xmm9,xmm15
|
||
|
pxor xmm11,xmm7
|
||
|
pxor xmm15,xmm3
|
||
|
pand xmm7,xmm14
|
||
|
pand xmm3,xmm12
|
||
|
pand xmm11,xmm13
|
||
|
pand xmm15,xmm8
|
||
|
pxor xmm7,xmm11
|
||
|
pxor xmm15,xmm3
|
||
|
pxor xmm11,xmm10
|
||
|
pxor xmm3,xmm9
|
||
|
pxor xmm14,xmm12
|
||
|
pxor xmm13,xmm8
|
||
|
movdqa xmm10,xmm14
|
||
|
pxor xmm10,xmm13
|
||
|
pand xmm10,xmm2
|
||
|
pxor xmm2,xmm6
|
||
|
pand xmm6,xmm14
|
||
|
pand xmm2,xmm13
|
||
|
pxor xmm2,xmm6
|
||
|
pxor xmm6,xmm10
|
||
|
pxor xmm2,xmm11
|
||
|
pxor xmm15,xmm11
|
||
|
pxor xmm6,xmm7
|
||
|
pxor xmm3,xmm7
|
||
|
pxor xmm0,xmm6
|
||
|
pxor xmm5,xmm4
|
||
|
|
||
|
pxor xmm3,xmm0
|
||
|
pxor xmm1,xmm6
|
||
|
pxor xmm4,xmm6
|
||
|
pxor xmm3,xmm1
|
||
|
pxor xmm6,xmm15
|
||
|
pxor xmm3,xmm4
|
||
|
pxor xmm2,xmm5
|
||
|
pxor xmm5,xmm0
|
||
|
pxor xmm2,xmm3
|
||
|
|
||
|
pxor xmm3,xmm15
|
||
|
pxor xmm6,xmm2
|
||
|
dec r10d
|
||
|
jl $L$dec_done
|
||
|
|
||
|
pshufd xmm7,xmm15,04Eh
|
||
|
pshufd xmm13,xmm2,04Eh
|
||
|
pxor xmm7,xmm15
|
||
|
pshufd xmm14,xmm4,04Eh
|
||
|
pxor xmm13,xmm2
|
||
|
pshufd xmm8,xmm0,04Eh
|
||
|
pxor xmm14,xmm4
|
||
|
pshufd xmm9,xmm5,04Eh
|
||
|
pxor xmm8,xmm0
|
||
|
pshufd xmm10,xmm3,04Eh
|
||
|
pxor xmm9,xmm5
|
||
|
pxor xmm15,xmm13
|
||
|
pxor xmm0,xmm13
|
||
|
pshufd xmm11,xmm1,04Eh
|
||
|
pxor xmm10,xmm3
|
||
|
pxor xmm5,xmm7
|
||
|
pxor xmm3,xmm8
|
||
|
pshufd xmm12,xmm6,04Eh
|
||
|
pxor xmm11,xmm1
|
||
|
pxor xmm0,xmm14
|
||
|
pxor xmm1,xmm9
|
||
|
pxor xmm12,xmm6
|
||
|
|
||
|
pxor xmm5,xmm14
|
||
|
pxor xmm3,xmm13
|
||
|
pxor xmm1,xmm13
|
||
|
pxor xmm6,xmm10
|
||
|
pxor xmm2,xmm11
|
||
|
pxor xmm1,xmm14
|
||
|
pxor xmm6,xmm14
|
||
|
pxor xmm4,xmm12
|
||
|
pshufd xmm7,xmm15,093h
|
||
|
pshufd xmm8,xmm0,093h
|
||
|
pxor xmm15,xmm7
|
||
|
pshufd xmm9,xmm5,093h
|
||
|
pxor xmm0,xmm8
|
||
|
pshufd xmm10,xmm3,093h
|
||
|
pxor xmm5,xmm9
|
||
|
pshufd xmm11,xmm1,093h
|
||
|
pxor xmm3,xmm10
|
||
|
pshufd xmm12,xmm6,093h
|
||
|
pxor xmm1,xmm11
|
||
|
pshufd xmm13,xmm2,093h
|
||
|
pxor xmm6,xmm12
|
||
|
pshufd xmm14,xmm4,093h
|
||
|
pxor xmm2,xmm13
|
||
|
pxor xmm4,xmm14
|
||
|
|
||
|
pxor xmm8,xmm15
|
||
|
pxor xmm7,xmm4
|
||
|
pxor xmm8,xmm4
|
||
|
pshufd xmm15,xmm15,04Eh
|
||
|
pxor xmm9,xmm0
|
||
|
pshufd xmm0,xmm0,04Eh
|
||
|
pxor xmm12,xmm1
|
||
|
pxor xmm15,xmm7
|
||
|
pxor xmm13,xmm6
|
||
|
pxor xmm0,xmm8
|
||
|
pxor xmm11,xmm3
|
||
|
pshufd xmm7,xmm1,04Eh
|
||
|
pxor xmm14,xmm2
|
||
|
pshufd xmm8,xmm6,04Eh
|
||
|
pxor xmm10,xmm5
|
||
|
pshufd xmm1,xmm3,04Eh
|
||
|
pxor xmm10,xmm4
|
||
|
pshufd xmm6,xmm4,04Eh
|
||
|
pxor xmm11,xmm4
|
||
|
pshufd xmm3,xmm2,04Eh
|
||
|
pxor xmm7,xmm11
|
||
|
pshufd xmm2,xmm5,04Eh
|
||
|
pxor xmm8,xmm12
|
||
|
pxor xmm10,xmm1
|
||
|
pxor xmm6,xmm14
|
||
|
pxor xmm13,xmm3
|
||
|
movdqa xmm3,xmm7
|
||
|
pxor xmm2,xmm9
|
||
|
movdqa xmm5,xmm13
|
||
|
movdqa xmm4,xmm8
|
||
|
movdqa xmm1,xmm2
|
||
|
movdqa xmm2,xmm10
|
||
|
movdqa xmm7,XMMWORD PTR[((-16))+r11]
|
||
|
jnz $L$dec_loop
|
||
|
movdqa xmm7,XMMWORD PTR[((-32))+r11]
|
||
|
jmp $L$dec_loop
|
||
|
ALIGN 16
|
||
|
$L$dec_done::
|
||
|
movdqa xmm7,XMMWORD PTR[r11]
|
||
|
movdqa xmm8,XMMWORD PTR[16+r11]
|
||
|
movdqa xmm9,xmm2
|
||
|
psrlq xmm2,1
|
||
|
movdqa xmm10,xmm1
|
||
|
psrlq xmm1,1
|
||
|
pxor xmm2,xmm4
|
||
|
pxor xmm1,xmm6
|
||
|
pand xmm2,xmm7
|
||
|
pand xmm1,xmm7
|
||
|
pxor xmm4,xmm2
|
||
|
psllq xmm2,1
|
||
|
pxor xmm6,xmm1
|
||
|
psllq xmm1,1
|
||
|
pxor xmm2,xmm9
|
||
|
pxor xmm1,xmm10
|
||
|
movdqa xmm9,xmm5
|
||
|
psrlq xmm5,1
|
||
|
movdqa xmm10,xmm15
|
||
|
psrlq xmm15,1
|
||
|
pxor xmm5,xmm3
|
||
|
pxor xmm15,xmm0
|
||
|
pand xmm5,xmm7
|
||
|
pand xmm15,xmm7
|
||
|
pxor xmm3,xmm5
|
||
|
psllq xmm5,1
|
||
|
pxor xmm0,xmm15
|
||
|
psllq xmm15,1
|
||
|
pxor xmm5,xmm9
|
||
|
pxor xmm15,xmm10
|
||
|
movdqa xmm7,XMMWORD PTR[32+r11]
|
||
|
movdqa xmm9,xmm6
|
||
|
psrlq xmm6,2
|
||
|
movdqa xmm10,xmm1
|
||
|
psrlq xmm1,2
|
||
|
pxor xmm6,xmm4
|
||
|
pxor xmm1,xmm2
|
||
|
pand xmm6,xmm8
|
||
|
pand xmm1,xmm8
|
||
|
pxor xmm4,xmm6
|
||
|
psllq xmm6,2
|
||
|
pxor xmm2,xmm1
|
||
|
psllq xmm1,2
|
||
|
pxor xmm6,xmm9
|
||
|
pxor xmm1,xmm10
|
||
|
movdqa xmm9,xmm0
|
||
|
psrlq xmm0,2
|
||
|
movdqa xmm10,xmm15
|
||
|
psrlq xmm15,2
|
||
|
pxor xmm0,xmm3
|
||
|
pxor xmm15,xmm5
|
||
|
pand xmm0,xmm8
|
||
|
pand xmm15,xmm8
|
||
|
pxor xmm3,xmm0
|
||
|
psllq xmm0,2
|
||
|
pxor xmm5,xmm15
|
||
|
psllq xmm15,2
|
||
|
pxor xmm0,xmm9
|
||
|
pxor xmm15,xmm10
|
||
|
movdqa xmm9,xmm3
|
||
|
psrlq xmm3,4
|
||
|
movdqa xmm10,xmm5
|
||
|
psrlq xmm5,4
|
||
|
pxor xmm3,xmm4
|
||
|
pxor xmm5,xmm2
|
||
|
pand xmm3,xmm7
|
||
|
pand xmm5,xmm7
|
||
|
pxor xmm4,xmm3
|
||
|
psllq xmm3,4
|
||
|
pxor xmm2,xmm5
|
||
|
psllq xmm5,4
|
||
|
pxor xmm3,xmm9
|
||
|
pxor xmm5,xmm10
|
||
|
movdqa xmm9,xmm0
|
||
|
psrlq xmm0,4
|
||
|
movdqa xmm10,xmm15
|
||
|
psrlq xmm15,4
|
||
|
pxor xmm0,xmm6
|
||
|
pxor xmm15,xmm1
|
||
|
pand xmm0,xmm7
|
||
|
pand xmm15,xmm7
|
||
|
pxor xmm6,xmm0
|
||
|
psllq xmm0,4
|
||
|
pxor xmm1,xmm15
|
||
|
psllq xmm15,4
|
||
|
pxor xmm0,xmm9
|
||
|
pxor xmm15,xmm10
|
||
|
movdqa xmm7,XMMWORD PTR[rax]
|
||
|
pxor xmm5,xmm7
|
||
|
pxor xmm3,xmm7
|
||
|
pxor xmm1,xmm7
|
||
|
pxor xmm6,xmm7
|
||
|
pxor xmm2,xmm7
|
||
|
pxor xmm4,xmm7
|
||
|
pxor xmm15,xmm7
|
||
|
pxor xmm0,xmm7
|
||
|
DB 0F3h,0C3h ;repret
|
||
|
_bsaes_decrypt8 ENDP
|
||
|
|
||
|
ALIGN 16
|
||
|
_bsaes_key_convert PROC PRIVATE
|
||
|
lea r11,QWORD PTR[$L$masks]
|
||
|
movdqu xmm7,XMMWORD PTR[rcx]
|
||
|
lea rcx,QWORD PTR[16+rcx]
|
||
|
movdqa xmm0,XMMWORD PTR[r11]
|
||
|
movdqa xmm1,XMMWORD PTR[16+r11]
|
||
|
movdqa xmm2,XMMWORD PTR[32+r11]
|
||
|
movdqa xmm3,XMMWORD PTR[48+r11]
|
||
|
movdqa xmm4,XMMWORD PTR[64+r11]
|
||
|
pcmpeqd xmm5,xmm5
|
||
|
|
||
|
movdqu xmm6,XMMWORD PTR[rcx]
|
||
|
movdqa XMMWORD PTR[rax],xmm7
|
||
|
lea rax,QWORD PTR[16+rax]
|
||
|
dec r10d
|
||
|
jmp $L$key_loop
|
||
|
ALIGN 16
|
||
|
$L$key_loop::
|
||
|
DB 102,15,56,0,244
|
||
|
|
||
|
movdqa xmm8,xmm0
|
||
|
movdqa xmm9,xmm1
|
||
|
|
||
|
pand xmm8,xmm6
|
||
|
pand xmm9,xmm6
|
||
|
movdqa xmm10,xmm2
|
||
|
pcmpeqb xmm8,xmm0
|
||
|
psllq xmm0,4
|
||
|
movdqa xmm11,xmm3
|
||
|
pcmpeqb xmm9,xmm1
|
||
|
psllq xmm1,4
|
||
|
|
||
|
pand xmm10,xmm6
|
||
|
pand xmm11,xmm6
|
||
|
movdqa xmm12,xmm0
|
||
|
pcmpeqb xmm10,xmm2
|
||
|
psllq xmm2,4
|
||
|
movdqa xmm13,xmm1
|
||
|
pcmpeqb xmm11,xmm3
|
||
|
psllq xmm3,4
|
||
|
|
||
|
movdqa xmm14,xmm2
|
||
|
movdqa xmm15,xmm3
|
||
|
pxor xmm8,xmm5
|
||
|
pxor xmm9,xmm5
|
||
|
|
||
|
pand xmm12,xmm6
|
||
|
pand xmm13,xmm6
|
||
|
movdqa XMMWORD PTR[rax],xmm8
|
||
|
pcmpeqb xmm12,xmm0
|
||
|
psrlq xmm0,4
|
||
|
movdqa XMMWORD PTR[16+rax],xmm9
|
||
|
pcmpeqb xmm13,xmm1
|
||
|
psrlq xmm1,4
|
||
|
lea rcx,QWORD PTR[16+rcx]
|
||
|
|
||
|
pand xmm14,xmm6
|
||
|
pand xmm15,xmm6
|
||
|
movdqa XMMWORD PTR[32+rax],xmm10
|
||
|
pcmpeqb xmm14,xmm2
|
||
|
psrlq xmm2,4
|
||
|
movdqa XMMWORD PTR[48+rax],xmm11
|
||
|
pcmpeqb xmm15,xmm3
|
||
|
psrlq xmm3,4
|
||
|
movdqu xmm6,XMMWORD PTR[rcx]
|
||
|
|
||
|
pxor xmm13,xmm5
|
||
|
pxor xmm14,xmm5
|
||
|
movdqa XMMWORD PTR[64+rax],xmm12
|
||
|
movdqa XMMWORD PTR[80+rax],xmm13
|
||
|
movdqa XMMWORD PTR[96+rax],xmm14
|
||
|
movdqa XMMWORD PTR[112+rax],xmm15
|
||
|
lea rax,QWORD PTR[128+rax]
|
||
|
dec r10d
|
||
|
jnz $L$key_loop
|
||
|
|
||
|
movdqa xmm7,XMMWORD PTR[80+r11]
|
||
|
|
||
|
DB 0F3h,0C3h ;repret
|
||
|
_bsaes_key_convert ENDP
|
||
|
EXTERN asm_AES_cbc_encrypt:NEAR
|
||
|
PUBLIC bsaes_cbc_encrypt
|
||
|
|
||
|
ALIGN 16
|
||
|
bsaes_cbc_encrypt PROC PUBLIC
|
||
|
mov r11d,DWORD PTR[48+rsp]
|
||
|
cmp r11d,0
|
||
|
jne asm_AES_cbc_encrypt
|
||
|
cmp r8,128
|
||
|
jb asm_AES_cbc_encrypt
|
||
|
|
||
|
mov rax,rsp
|
||
|
$L$cbc_dec_prologue::
|
||
|
push rbp
|
||
|
push rbx
|
||
|
push r12
|
||
|
push r13
|
||
|
push r14
|
||
|
push r15
|
||
|
lea rsp,QWORD PTR[((-72))+rsp]
|
||
|
mov r10,QWORD PTR[160+rsp]
|
||
|
lea rsp,QWORD PTR[((-160))+rsp]
|
||
|
movaps XMMWORD PTR[64+rsp],xmm6
|
||
|
movaps XMMWORD PTR[80+rsp],xmm7
|
||
|
movaps XMMWORD PTR[96+rsp],xmm8
|
||
|
movaps XMMWORD PTR[112+rsp],xmm9
|
||
|
movaps XMMWORD PTR[128+rsp],xmm10
|
||
|
movaps XMMWORD PTR[144+rsp],xmm11
|
||
|
movaps XMMWORD PTR[160+rsp],xmm12
|
||
|
movaps XMMWORD PTR[176+rsp],xmm13
|
||
|
movaps XMMWORD PTR[192+rsp],xmm14
|
||
|
movaps XMMWORD PTR[208+rsp],xmm15
|
||
|
$L$cbc_dec_body::
|
||
|
mov rbp,rsp
|
||
|
mov eax,DWORD PTR[240+r9]
|
||
|
mov r12,rcx
|
||
|
mov r13,rdx
|
||
|
mov r14,r8
|
||
|
mov r15,r9
|
||
|
mov rbx,r10
|
||
|
shr r14,4
|
||
|
|
||
|
mov edx,eax
|
||
|
shl rax,7
|
||
|
sub rax,96
|
||
|
sub rsp,rax
|
||
|
|
||
|
mov rax,rsp
|
||
|
mov rcx,r15
|
||
|
mov r10d,edx
|
||
|
call _bsaes_key_convert
|
||
|
pxor xmm7,XMMWORD PTR[rsp]
|
||
|
movdqa XMMWORD PTR[rax],xmm6
|
||
|
movdqa XMMWORD PTR[rsp],xmm7
|
||
|
|
||
|
movdqu xmm14,XMMWORD PTR[rbx]
|
||
|
sub r14,8
|
||
|
$L$cbc_dec_loop::
|
||
|
movdqu xmm15,XMMWORD PTR[r12]
|
||
|
movdqu xmm0,XMMWORD PTR[16+r12]
|
||
|
movdqu xmm1,XMMWORD PTR[32+r12]
|
||
|
movdqu xmm2,XMMWORD PTR[48+r12]
|
||
|
movdqu xmm3,XMMWORD PTR[64+r12]
|
||
|
movdqu xmm4,XMMWORD PTR[80+r12]
|
||
|
mov rax,rsp
|
||
|
movdqu xmm5,XMMWORD PTR[96+r12]
|
||
|
mov r10d,edx
|
||
|
movdqu xmm6,XMMWORD PTR[112+r12]
|
||
|
movdqa XMMWORD PTR[32+rbp],xmm14
|
||
|
|
||
|
call _bsaes_decrypt8
|
||
|
|
||
|
pxor xmm15,XMMWORD PTR[32+rbp]
|
||
|
movdqu xmm7,XMMWORD PTR[r12]
|
||
|
movdqu xmm8,XMMWORD PTR[16+r12]
|
||
|
pxor xmm0,xmm7
|
||
|
movdqu xmm9,XMMWORD PTR[32+r12]
|
||
|
pxor xmm5,xmm8
|
||
|
movdqu xmm10,XMMWORD PTR[48+r12]
|
||
|
pxor xmm3,xmm9
|
||
|
movdqu xmm11,XMMWORD PTR[64+r12]
|
||
|
pxor xmm1,xmm10
|
||
|
movdqu xmm12,XMMWORD PTR[80+r12]
|
||
|
pxor xmm6,xmm11
|
||
|
movdqu xmm13,XMMWORD PTR[96+r12]
|
||
|
pxor xmm2,xmm12
|
||
|
movdqu xmm14,XMMWORD PTR[112+r12]
|
||
|
pxor xmm4,xmm13
|
||
|
movdqu XMMWORD PTR[r13],xmm15
|
||
|
lea r12,QWORD PTR[128+r12]
|
||
|
movdqu XMMWORD PTR[16+r13],xmm0
|
||
|
movdqu XMMWORD PTR[32+r13],xmm5
|
||
|
movdqu XMMWORD PTR[48+r13],xmm3
|
||
|
movdqu XMMWORD PTR[64+r13],xmm1
|
||
|
movdqu XMMWORD PTR[80+r13],xmm6
|
||
|
movdqu XMMWORD PTR[96+r13],xmm2
|
||
|
movdqu XMMWORD PTR[112+r13],xmm4
|
||
|
lea r13,QWORD PTR[128+r13]
|
||
|
sub r14,8
|
||
|
jnc $L$cbc_dec_loop
|
||
|
|
||
|
add r14,8
|
||
|
jz $L$cbc_dec_done
|
||
|
|
||
|
movdqu xmm15,XMMWORD PTR[r12]
|
||
|
mov rax,rsp
|
||
|
mov r10d,edx
|
||
|
cmp r14,2
|
||
|
jb $L$cbc_dec_one
|
||
|
movdqu xmm0,XMMWORD PTR[16+r12]
|
||
|
je $L$cbc_dec_two
|
||
|
movdqu xmm1,XMMWORD PTR[32+r12]
|
||
|
cmp r14,4
|
||
|
jb $L$cbc_dec_three
|
||
|
movdqu xmm2,XMMWORD PTR[48+r12]
|
||
|
je $L$cbc_dec_four
|
||
|
movdqu xmm3,XMMWORD PTR[64+r12]
|
||
|
cmp r14,6
|
||
|
jb $L$cbc_dec_five
|
||
|
movdqu xmm4,XMMWORD PTR[80+r12]
|
||
|
je $L$cbc_dec_six
|
||
|
movdqu xmm5,XMMWORD PTR[96+r12]
|
||
|
movdqa XMMWORD PTR[32+rbp],xmm14
|
||
|
call _bsaes_decrypt8
|
||
|
pxor xmm15,XMMWORD PTR[32+rbp]
|
||
|
movdqu xmm7,XMMWORD PTR[r12]
|
||
|
movdqu xmm8,XMMWORD PTR[16+r12]
|
||
|
pxor xmm0,xmm7
|
||
|
movdqu xmm9,XMMWORD PTR[32+r12]
|
||
|
pxor xmm5,xmm8
|
||
|
movdqu xmm10,XMMWORD PTR[48+r12]
|
||
|
pxor xmm3,xmm9
|
||
|
movdqu xmm11,XMMWORD PTR[64+r12]
|
||
|
pxor xmm1,xmm10
|
||
|
movdqu xmm12,XMMWORD PTR[80+r12]
|
||
|
pxor xmm6,xmm11
|
||
|
movdqu xmm14,XMMWORD PTR[96+r12]
|
||
|
pxor xmm2,xmm12
|
||
|
movdqu XMMWORD PTR[r13],xmm15
|
||
|
movdqu XMMWORD PTR[16+r13],xmm0
|
||
|
movdqu XMMWORD PTR[32+r13],xmm5
|
||
|
movdqu XMMWORD PTR[48+r13],xmm3
|
||
|
movdqu XMMWORD PTR[64+r13],xmm1
|
||
|
movdqu XMMWORD PTR[80+r13],xmm6
|
||
|
movdqu XMMWORD PTR[96+r13],xmm2
|
||
|
jmp $L$cbc_dec_done
|
||
|
ALIGN 16
|
||
|
$L$cbc_dec_six::
|
||
|
movdqa XMMWORD PTR[32+rbp],xmm14
|
||
|
call _bsaes_decrypt8
|
||
|
pxor xmm15,XMMWORD PTR[32+rbp]
|
||
|
movdqu xmm7,XMMWORD PTR[r12]
|
||
|
movdqu xmm8,XMMWORD PTR[16+r12]
|
||
|
pxor xmm0,xmm7
|
||
|
movdqu xmm9,XMMWORD PTR[32+r12]
|
||
|
pxor xmm5,xmm8
|
||
|
movdqu xmm10,XMMWORD PTR[48+r12]
|
||
|
pxor xmm3,xmm9
|
||
|
movdqu xmm11,XMMWORD PTR[64+r12]
|
||
|
pxor xmm1,xmm10
|
||
|
movdqu xmm14,XMMWORD PTR[80+r12]
|
||
|
pxor xmm6,xmm11
|
||
|
movdqu XMMWORD PTR[r13],xmm15
|
||
|
movdqu XMMWORD PTR[16+r13],xmm0
|
||
|
movdqu XMMWORD PTR[32+r13],xmm5
|
||
|
movdqu XMMWORD PTR[48+r13],xmm3
|
||
|
movdqu XMMWORD PTR[64+r13],xmm1
|
||
|
movdqu XMMWORD PTR[80+r13],xmm6
|
||
|
jmp $L$cbc_dec_done
|
||
|
ALIGN 16
|
||
|
$L$cbc_dec_five::
|
||
|
movdqa XMMWORD PTR[32+rbp],xmm14
|
||
|
call _bsaes_decrypt8
|
||
|
pxor xmm15,XMMWORD PTR[32+rbp]
|
||
|
movdqu xmm7,XMMWORD PTR[r12]
|
||
|
movdqu xmm8,XMMWORD PTR[16+r12]
|
||
|
pxor xmm0,xmm7
|
||
|
movdqu xmm9,XMMWORD PTR[32+r12]
|
||
|
pxor xmm5,xmm8
|
||
|
movdqu xmm10,XMMWORD PTR[48+r12]
|
||
|
pxor xmm3,xmm9
|
||
|
movdqu xmm14,XMMWORD PTR[64+r12]
|
||
|
pxor xmm1,xmm10
|
||
|
movdqu XMMWORD PTR[r13],xmm15
|
||
|
movdqu XMMWORD PTR[16+r13],xmm0
|
||
|
movdqu XMMWORD PTR[32+r13],xmm5
|
||
|
movdqu XMMWORD PTR[48+r13],xmm3
|
||
|
movdqu XMMWORD PTR[64+r13],xmm1
|
||
|
jmp $L$cbc_dec_done
|
||
|
ALIGN 16
|
||
|
$L$cbc_dec_four::
|
||
|
movdqa XMMWORD PTR[32+rbp],xmm14
|
||
|
call _bsaes_decrypt8
|
||
|
pxor xmm15,XMMWORD PTR[32+rbp]
|
||
|
movdqu xmm7,XMMWORD PTR[r12]
|
||
|
movdqu xmm8,XMMWORD PTR[16+r12]
|
||
|
pxor xmm0,xmm7
|
||
|
movdqu xmm9,XMMWORD PTR[32+r12]
|
||
|
pxor xmm5,xmm8
|
||
|
movdqu xmm14,XMMWORD PTR[48+r12]
|
||
|
pxor xmm3,xmm9
|
||
|
movdqu XMMWORD PTR[r13],xmm15
|
||
|
movdqu XMMWORD PTR[16+r13],xmm0
|
||
|
movdqu XMMWORD PTR[32+r13],xmm5
|
||
|
movdqu XMMWORD PTR[48+r13],xmm3
|
||
|
jmp $L$cbc_dec_done
|
||
|
ALIGN 16
|
||
|
$L$cbc_dec_three::
|
||
|
movdqa XMMWORD PTR[32+rbp],xmm14
|
||
|
call _bsaes_decrypt8
|
||
|
pxor xmm15,XMMWORD PTR[32+rbp]
|
||
|
movdqu xmm7,XMMWORD PTR[r12]
|
||
|
movdqu xmm8,XMMWORD PTR[16+r12]
|
||
|
pxor xmm0,xmm7
|
||
|
movdqu xmm14,XMMWORD PTR[32+r12]
|
||
|
pxor xmm5,xmm8
|
||
|
movdqu XMMWORD PTR[r13],xmm15
|
||
|
movdqu XMMWORD PTR[16+r13],xmm0
|
||
|
movdqu XMMWORD PTR[32+r13],xmm5
|
||
|
jmp $L$cbc_dec_done
|
||
|
ALIGN 16
|
||
|
$L$cbc_dec_two::
|
||
|
movdqa XMMWORD PTR[32+rbp],xmm14
|
||
|
call _bsaes_decrypt8
|
||
|
pxor xmm15,XMMWORD PTR[32+rbp]
|
||
|
movdqu xmm7,XMMWORD PTR[r12]
|
||
|
movdqu xmm14,XMMWORD PTR[16+r12]
|
||
|
pxor xmm0,xmm7
|
||
|
movdqu XMMWORD PTR[r13],xmm15
|
||
|
movdqu XMMWORD PTR[16+r13],xmm0
|
||
|
jmp $L$cbc_dec_done
|
||
|
ALIGN 16
|
||
|
$L$cbc_dec_one::
|
||
|
lea rcx,QWORD PTR[r12]
|
||
|
lea rdx,QWORD PTR[32+rbp]
|
||
|
lea r8,QWORD PTR[r15]
|
||
|
call asm_AES_decrypt
|
||
|
pxor xmm14,XMMWORD PTR[32+rbp]
|
||
|
movdqu XMMWORD PTR[r13],xmm14
|
||
|
movdqa xmm14,xmm15
|
||
|
|
||
|
$L$cbc_dec_done::
|
||
|
movdqu XMMWORD PTR[rbx],xmm14
|
||
|
lea rax,QWORD PTR[rsp]
|
||
|
pxor xmm0,xmm0
|
||
|
$L$cbc_dec_bzero::
|
||
|
movdqa XMMWORD PTR[rax],xmm0
|
||
|
movdqa XMMWORD PTR[16+rax],xmm0
|
||
|
lea rax,QWORD PTR[32+rax]
|
||
|
cmp rbp,rax
|
||
|
ja $L$cbc_dec_bzero
|
||
|
|
||
|
lea rsp,QWORD PTR[rbp]
|
||
|
movaps xmm6,XMMWORD PTR[64+rbp]
|
||
|
movaps xmm7,XMMWORD PTR[80+rbp]
|
||
|
movaps xmm8,XMMWORD PTR[96+rbp]
|
||
|
movaps xmm9,XMMWORD PTR[112+rbp]
|
||
|
movaps xmm10,XMMWORD PTR[128+rbp]
|
||
|
movaps xmm11,XMMWORD PTR[144+rbp]
|
||
|
movaps xmm12,XMMWORD PTR[160+rbp]
|
||
|
movaps xmm13,XMMWORD PTR[176+rbp]
|
||
|
movaps xmm14,XMMWORD PTR[192+rbp]
|
||
|
movaps xmm15,XMMWORD PTR[208+rbp]
|
||
|
lea rsp,QWORD PTR[160+rbp]
|
||
|
mov r15,QWORD PTR[72+rsp]
|
||
|
mov r14,QWORD PTR[80+rsp]
|
||
|
mov r13,QWORD PTR[88+rsp]
|
||
|
mov r12,QWORD PTR[96+rsp]
|
||
|
mov rbx,QWORD PTR[104+rsp]
|
||
|
mov rax,QWORD PTR[112+rsp]
|
||
|
lea rsp,QWORD PTR[120+rsp]
|
||
|
mov rbp,rax
|
||
|
$L$cbc_dec_epilogue::
|
||
|
DB 0F3h,0C3h ;repret
|
||
|
bsaes_cbc_encrypt ENDP
|
||
|
|
||
|
PUBLIC bsaes_ctr32_encrypt_blocks
|
||
|
|
||
|
ALIGN 16
|
||
|
bsaes_ctr32_encrypt_blocks PROC PUBLIC
|
||
|
mov rax,rsp
|
||
|
$L$ctr_enc_prologue::
|
||
|
push rbp
|
||
|
push rbx
|
||
|
push r12
|
||
|
push r13
|
||
|
push r14
|
||
|
push r15
|
||
|
lea rsp,QWORD PTR[((-72))+rsp]
|
||
|
mov r10,QWORD PTR[160+rsp]
|
||
|
lea rsp,QWORD PTR[((-160))+rsp]
|
||
|
movaps XMMWORD PTR[64+rsp],xmm6
|
||
|
movaps XMMWORD PTR[80+rsp],xmm7
|
||
|
movaps XMMWORD PTR[96+rsp],xmm8
|
||
|
movaps XMMWORD PTR[112+rsp],xmm9
|
||
|
movaps XMMWORD PTR[128+rsp],xmm10
|
||
|
movaps XMMWORD PTR[144+rsp],xmm11
|
||
|
movaps XMMWORD PTR[160+rsp],xmm12
|
||
|
movaps XMMWORD PTR[176+rsp],xmm13
|
||
|
movaps XMMWORD PTR[192+rsp],xmm14
|
||
|
movaps XMMWORD PTR[208+rsp],xmm15
|
||
|
$L$ctr_enc_body::
|
||
|
mov rbp,rsp
|
||
|
movdqu xmm0,XMMWORD PTR[r10]
|
||
|
mov eax,DWORD PTR[240+r9]
|
||
|
mov r12,rcx
|
||
|
mov r13,rdx
|
||
|
mov r14,r8
|
||
|
mov r15,r9
|
||
|
movdqa XMMWORD PTR[32+rbp],xmm0
|
||
|
cmp r8,8
|
||
|
jb $L$ctr_enc_short
|
||
|
|
||
|
mov ebx,eax
|
||
|
shl rax,7
|
||
|
sub rax,96
|
||
|
sub rsp,rax
|
||
|
|
||
|
mov rax,rsp
|
||
|
mov rcx,r15
|
||
|
mov r10d,ebx
|
||
|
call _bsaes_key_convert
|
||
|
pxor xmm7,xmm6
|
||
|
movdqa XMMWORD PTR[rax],xmm7
|
||
|
|
||
|
movdqa xmm8,XMMWORD PTR[rsp]
|
||
|
lea r11,QWORD PTR[$L$ADD1]
|
||
|
movdqa xmm15,XMMWORD PTR[32+rbp]
|
||
|
movdqa xmm7,XMMWORD PTR[((-32))+r11]
|
||
|
DB 102,68,15,56,0,199
|
||
|
DB 102,68,15,56,0,255
|
||
|
movdqa XMMWORD PTR[rsp],xmm8
|
||
|
jmp $L$ctr_enc_loop
|
||
|
ALIGN 16
|
||
|
$L$ctr_enc_loop::
|
||
|
movdqa XMMWORD PTR[32+rbp],xmm15
|
||
|
movdqa xmm0,xmm15
|
||
|
movdqa xmm1,xmm15
|
||
|
paddd xmm0,XMMWORD PTR[r11]
|
||
|
movdqa xmm2,xmm15
|
||
|
paddd xmm1,XMMWORD PTR[16+r11]
|
||
|
movdqa xmm3,xmm15
|
||
|
paddd xmm2,XMMWORD PTR[32+r11]
|
||
|
movdqa xmm4,xmm15
|
||
|
paddd xmm3,XMMWORD PTR[48+r11]
|
||
|
movdqa xmm5,xmm15
|
||
|
paddd xmm4,XMMWORD PTR[64+r11]
|
||
|
movdqa xmm6,xmm15
|
||
|
paddd xmm5,XMMWORD PTR[80+r11]
|
||
|
paddd xmm6,XMMWORD PTR[96+r11]
|
||
|
|
||
|
|
||
|
|
||
|
movdqa xmm8,XMMWORD PTR[rsp]
|
||
|
lea rax,QWORD PTR[16+rsp]
|
||
|
movdqa xmm7,XMMWORD PTR[((-16))+r11]
|
||
|
pxor xmm15,xmm8
|
||
|
pxor xmm0,xmm8
|
||
|
DB 102,68,15,56,0,255
|
||
|
pxor xmm1,xmm8
|
||
|
DB 102,15,56,0,199
|
||
|
pxor xmm2,xmm8
|
||
|
DB 102,15,56,0,207
|
||
|
pxor xmm3,xmm8
|
||
|
DB 102,15,56,0,215
|
||
|
pxor xmm4,xmm8
|
||
|
DB 102,15,56,0,223
|
||
|
pxor xmm5,xmm8
|
||
|
DB 102,15,56,0,231
|
||
|
pxor xmm6,xmm8
|
||
|
DB 102,15,56,0,239
|
||
|
lea r11,QWORD PTR[$L$BS0]
|
||
|
DB 102,15,56,0,247
|
||
|
mov r10d,ebx
|
||
|
|
||
|
call _bsaes_encrypt8_bitslice
|
||
|
|
||
|
sub r14,8
|
||
|
jc $L$ctr_enc_loop_done
|
||
|
|
||
|
movdqu xmm7,XMMWORD PTR[r12]
|
||
|
movdqu xmm8,XMMWORD PTR[16+r12]
|
||
|
movdqu xmm9,XMMWORD PTR[32+r12]
|
||
|
movdqu xmm10,XMMWORD PTR[48+r12]
|
||
|
movdqu xmm11,XMMWORD PTR[64+r12]
|
||
|
movdqu xmm12,XMMWORD PTR[80+r12]
|
||
|
movdqu xmm13,XMMWORD PTR[96+r12]
|
||
|
movdqu xmm14,XMMWORD PTR[112+r12]
|
||
|
lea r12,QWORD PTR[128+r12]
|
||
|
pxor xmm7,xmm15
|
||
|
movdqa xmm15,XMMWORD PTR[32+rbp]
|
||
|
pxor xmm0,xmm8
|
||
|
movdqu XMMWORD PTR[r13],xmm7
|
||
|
pxor xmm3,xmm9
|
||
|
movdqu XMMWORD PTR[16+r13],xmm0
|
||
|
pxor xmm5,xmm10
|
||
|
movdqu XMMWORD PTR[32+r13],xmm3
|
||
|
pxor xmm2,xmm11
|
||
|
movdqu XMMWORD PTR[48+r13],xmm5
|
||
|
pxor xmm6,xmm12
|
||
|
movdqu XMMWORD PTR[64+r13],xmm2
|
||
|
pxor xmm1,xmm13
|
||
|
movdqu XMMWORD PTR[80+r13],xmm6
|
||
|
pxor xmm4,xmm14
|
||
|
movdqu XMMWORD PTR[96+r13],xmm1
|
||
|
lea r11,QWORD PTR[$L$ADD1]
|
||
|
movdqu XMMWORD PTR[112+r13],xmm4
|
||
|
lea r13,QWORD PTR[128+r13]
|
||
|
paddd xmm15,XMMWORD PTR[112+r11]
|
||
|
jnz $L$ctr_enc_loop
|
||
|
|
||
|
jmp $L$ctr_enc_done
|
||
|
ALIGN 16
|
||
|
$L$ctr_enc_loop_done::
|
||
|
add r14,8
|
||
|
movdqu xmm7,XMMWORD PTR[r12]
|
||
|
pxor xmm15,xmm7
|
||
|
movdqu XMMWORD PTR[r13],xmm15
|
||
|
cmp r14,2
|
||
|
jb $L$ctr_enc_done
|
||
|
movdqu xmm8,XMMWORD PTR[16+r12]
|
||
|
pxor xmm0,xmm8
|
||
|
movdqu XMMWORD PTR[16+r13],xmm0
|
||
|
je $L$ctr_enc_done
|
||
|
movdqu xmm9,XMMWORD PTR[32+r12]
|
||
|
pxor xmm3,xmm9
|
||
|
movdqu XMMWORD PTR[32+r13],xmm3
|
||
|
cmp r14,4
|
||
|
jb $L$ctr_enc_done
|
||
|
movdqu xmm10,XMMWORD PTR[48+r12]
|
||
|
pxor xmm5,xmm10
|
||
|
movdqu XMMWORD PTR[48+r13],xmm5
|
||
|
je $L$ctr_enc_done
|
||
|
movdqu xmm11,XMMWORD PTR[64+r12]
|
||
|
pxor xmm2,xmm11
|
||
|
movdqu XMMWORD PTR[64+r13],xmm2
|
||
|
cmp r14,6
|
||
|
jb $L$ctr_enc_done
|
||
|
movdqu xmm12,XMMWORD PTR[80+r12]
|
||
|
pxor xmm6,xmm12
|
||
|
movdqu XMMWORD PTR[80+r13],xmm6
|
||
|
je $L$ctr_enc_done
|
||
|
movdqu xmm13,XMMWORD PTR[96+r12]
|
||
|
pxor xmm1,xmm13
|
||
|
movdqu XMMWORD PTR[96+r13],xmm1
|
||
|
jmp $L$ctr_enc_done
|
||
|
|
||
|
ALIGN 16
|
||
|
$L$ctr_enc_short::
|
||
|
lea rcx,QWORD PTR[32+rbp]
|
||
|
lea rdx,QWORD PTR[48+rbp]
|
||
|
lea r8,QWORD PTR[r15]
|
||
|
call asm_AES_encrypt
|
||
|
movdqu xmm0,XMMWORD PTR[r12]
|
||
|
lea r12,QWORD PTR[16+r12]
|
||
|
mov eax,DWORD PTR[44+rbp]
|
||
|
bswap eax
|
||
|
pxor xmm0,XMMWORD PTR[48+rbp]
|
||
|
inc eax
|
||
|
movdqu XMMWORD PTR[r13],xmm0
|
||
|
bswap eax
|
||
|
lea r13,QWORD PTR[16+r13]
|
||
|
mov DWORD PTR[44+rsp],eax
|
||
|
dec r14
|
||
|
jnz $L$ctr_enc_short
|
||
|
|
||
|
$L$ctr_enc_done::
|
||
|
lea rax,QWORD PTR[rsp]
|
||
|
pxor xmm0,xmm0
|
||
|
$L$ctr_enc_bzero::
|
||
|
movdqa XMMWORD PTR[rax],xmm0
|
||
|
movdqa XMMWORD PTR[16+rax],xmm0
|
||
|
lea rax,QWORD PTR[32+rax]
|
||
|
cmp rbp,rax
|
||
|
ja $L$ctr_enc_bzero
|
||
|
|
||
|
lea rsp,QWORD PTR[rbp]
|
||
|
movaps xmm6,XMMWORD PTR[64+rbp]
|
||
|
movaps xmm7,XMMWORD PTR[80+rbp]
|
||
|
movaps xmm8,XMMWORD PTR[96+rbp]
|
||
|
movaps xmm9,XMMWORD PTR[112+rbp]
|
||
|
movaps xmm10,XMMWORD PTR[128+rbp]
|
||
|
movaps xmm11,XMMWORD PTR[144+rbp]
|
||
|
movaps xmm12,XMMWORD PTR[160+rbp]
|
||
|
movaps xmm13,XMMWORD PTR[176+rbp]
|
||
|
movaps xmm14,XMMWORD PTR[192+rbp]
|
||
|
movaps xmm15,XMMWORD PTR[208+rbp]
|
||
|
lea rsp,QWORD PTR[160+rbp]
|
||
|
mov r15,QWORD PTR[72+rsp]
|
||
|
mov r14,QWORD PTR[80+rsp]
|
||
|
mov r13,QWORD PTR[88+rsp]
|
||
|
mov r12,QWORD PTR[96+rsp]
|
||
|
mov rbx,QWORD PTR[104+rsp]
|
||
|
mov rax,QWORD PTR[112+rsp]
|
||
|
lea rsp,QWORD PTR[120+rsp]
|
||
|
mov rbp,rax
|
||
|
$L$ctr_enc_epilogue::
|
||
|
DB 0F3h,0C3h ;repret
|
||
|
bsaes_ctr32_encrypt_blocks ENDP
|
||
|
PUBLIC bsaes_xts_encrypt
|
||
|
|
||
|
ALIGN 16
|
||
|
bsaes_xts_encrypt PROC PUBLIC
|
||
|
mov rax,rsp
|
||
|
$L$xts_enc_prologue::
|
||
|
push rbp
|
||
|
push rbx
|
||
|
push r12
|
||
|
push r13
|
||
|
push r14
|
||
|
push r15
|
||
|
lea rsp,QWORD PTR[((-72))+rsp]
|
||
|
mov r10,QWORD PTR[160+rsp]
|
||
|
mov r11,QWORD PTR[168+rsp]
|
||
|
lea rsp,QWORD PTR[((-160))+rsp]
|
||
|
movaps XMMWORD PTR[64+rsp],xmm6
|
||
|
movaps XMMWORD PTR[80+rsp],xmm7
|
||
|
movaps XMMWORD PTR[96+rsp],xmm8
|
||
|
movaps XMMWORD PTR[112+rsp],xmm9
|
||
|
movaps XMMWORD PTR[128+rsp],xmm10
|
||
|
movaps XMMWORD PTR[144+rsp],xmm11
|
||
|
movaps XMMWORD PTR[160+rsp],xmm12
|
||
|
movaps XMMWORD PTR[176+rsp],xmm13
|
||
|
movaps XMMWORD PTR[192+rsp],xmm14
|
||
|
movaps XMMWORD PTR[208+rsp],xmm15
|
||
|
$L$xts_enc_body::
|
||
|
mov rbp,rsp
|
||
|
mov r12,rcx
|
||
|
mov r13,rdx
|
||
|
mov r14,r8
|
||
|
mov r15,r9
|
||
|
|
||
|
lea rcx,QWORD PTR[r11]
|
||
|
lea rdx,QWORD PTR[32+rbp]
|
||
|
lea r8,QWORD PTR[r10]
|
||
|
call asm_AES_encrypt
|
||
|
|
||
|
mov eax,DWORD PTR[240+r15]
|
||
|
mov rbx,r14
|
||
|
|
||
|
mov edx,eax
|
||
|
shl rax,7
|
||
|
sub rax,96
|
||
|
sub rsp,rax
|
||
|
|
||
|
mov rax,rsp
|
||
|
mov rcx,r15
|
||
|
mov r10d,edx
|
||
|
call _bsaes_key_convert
|
||
|
pxor xmm7,xmm6
|
||
|
movdqa XMMWORD PTR[rax],xmm7
|
||
|
|
||
|
and r14,-16
|
||
|
sub rsp,080h
|
||
|
movdqa xmm6,XMMWORD PTR[32+rbp]
|
||
|
|
||
|
pxor xmm14,xmm14
|
||
|
movdqa xmm12,XMMWORD PTR[$L$xts_magic]
|
||
|
pcmpgtd xmm14,xmm6
|
||
|
|
||
|
sub r14,080h
|
||
|
jc $L$xts_enc_short
|
||
|
jmp $L$xts_enc_loop
|
||
|
|
||
|
ALIGN 16
|
||
|
$L$xts_enc_loop::
|
||
|
pshufd xmm13,xmm14,013h
|
||
|
pxor xmm14,xmm14
|
||
|
movdqa xmm15,xmm6
|
||
|
movdqa XMMWORD PTR[rsp],xmm6
|
||
|
paddq xmm6,xmm6
|
||
|
pand xmm13,xmm12
|
||
|
pcmpgtd xmm14,xmm6
|
||
|
pxor xmm6,xmm13
|
||
|
pshufd xmm13,xmm14,013h
|
||
|
pxor xmm14,xmm14
|
||
|
movdqa xmm0,xmm6
|
||
|
movdqa XMMWORD PTR[16+rsp],xmm6
|
||
|
paddq xmm6,xmm6
|
||
|
pand xmm13,xmm12
|
||
|
pcmpgtd xmm14,xmm6
|
||
|
pxor xmm6,xmm13
|
||
|
movdqu xmm7,XMMWORD PTR[r12]
|
||
|
pshufd xmm13,xmm14,013h
|
||
|
pxor xmm14,xmm14
|
||
|
movdqa xmm1,xmm6
|
||
|
movdqa XMMWORD PTR[32+rsp],xmm6
|
||
|
paddq xmm6,xmm6
|
||
|
pand xmm13,xmm12
|
||
|
pcmpgtd xmm14,xmm6
|
||
|
pxor xmm6,xmm13
|
||
|
movdqu xmm8,XMMWORD PTR[16+r12]
|
||
|
pxor xmm15,xmm7
|
||
|
pshufd xmm13,xmm14,013h
|
||
|
pxor xmm14,xmm14
|
||
|
movdqa xmm2,xmm6
|
||
|
movdqa XMMWORD PTR[48+rsp],xmm6
|
||
|
paddq xmm6,xmm6
|
||
|
pand xmm13,xmm12
|
||
|
pcmpgtd xmm14,xmm6
|
||
|
pxor xmm6,xmm13
|
||
|
movdqu xmm9,XMMWORD PTR[32+r12]
|
||
|
pxor xmm0,xmm8
|
||
|
pshufd xmm13,xmm14,013h
|
||
|
pxor xmm14,xmm14
|
||
|
movdqa xmm3,xmm6
|
||
|
movdqa XMMWORD PTR[64+rsp],xmm6
|
||
|
paddq xmm6,xmm6
|
||
|
pand xmm13,xmm12
|
||
|
pcmpgtd xmm14,xmm6
|
||
|
pxor xmm6,xmm13
|
||
|
movdqu xmm10,XMMWORD PTR[48+r12]
|
||
|
pxor xmm1,xmm9
|
||
|
pshufd xmm13,xmm14,013h
|
||
|
pxor xmm14,xmm14
|
||
|
movdqa xmm4,xmm6
|
||
|
movdqa XMMWORD PTR[80+rsp],xmm6
|
||
|
paddq xmm6,xmm6
|
||
|
pand xmm13,xmm12
|
||
|
pcmpgtd xmm14,xmm6
|
||
|
pxor xmm6,xmm13
|
||
|
movdqu xmm11,XMMWORD PTR[64+r12]
|
||
|
pxor xmm2,xmm10
|
||
|
pshufd xmm13,xmm14,013h
|
||
|
pxor xmm14,xmm14
|
||
|
movdqa xmm5,xmm6
|
||
|
movdqa XMMWORD PTR[96+rsp],xmm6
|
||
|
paddq xmm6,xmm6
|
||
|
pand xmm13,xmm12
|
||
|
pcmpgtd xmm14,xmm6
|
||
|
pxor xmm6,xmm13
|
||
|
movdqu xmm12,XMMWORD PTR[80+r12]
|
||
|
pxor xmm3,xmm11
|
||
|
movdqu xmm13,XMMWORD PTR[96+r12]
|
||
|
pxor xmm4,xmm12
|
||
|
movdqu xmm14,XMMWORD PTR[112+r12]
|
||
|
lea r12,QWORD PTR[128+r12]
|
||
|
movdqa XMMWORD PTR[112+rsp],xmm6
|
||
|
pxor xmm5,xmm13
|
||
|
lea rax,QWORD PTR[128+rsp]
|
||
|
pxor xmm6,xmm14
|
||
|
mov r10d,edx
|
||
|
|
||
|
call _bsaes_encrypt8
|
||
|
|
||
|
pxor xmm15,XMMWORD PTR[rsp]
|
||
|
pxor xmm0,XMMWORD PTR[16+rsp]
|
||
|
movdqu XMMWORD PTR[r13],xmm15
|
||
|
pxor xmm3,XMMWORD PTR[32+rsp]
|
||
|
movdqu XMMWORD PTR[16+r13],xmm0
|
||
|
pxor xmm5,XMMWORD PTR[48+rsp]
|
||
|
movdqu XMMWORD PTR[32+r13],xmm3
|
||
|
pxor xmm2,XMMWORD PTR[64+rsp]
|
||
|
movdqu XMMWORD PTR[48+r13],xmm5
|
||
|
pxor xmm6,XMMWORD PTR[80+rsp]
|
||
|
movdqu XMMWORD PTR[64+r13],xmm2
|
||
|
pxor xmm1,XMMWORD PTR[96+rsp]
|
||
|
movdqu XMMWORD PTR[80+r13],xmm6
|
||
|
pxor xmm4,XMMWORD PTR[112+rsp]
|
||
|
movdqu XMMWORD PTR[96+r13],xmm1
|
||
|
movdqu XMMWORD PTR[112+r13],xmm4
|
||
|
lea r13,QWORD PTR[128+r13]
|
||
|
|
||
|
movdqa xmm6,XMMWORD PTR[112+rsp]
|
||
|
pxor xmm14,xmm14
|
||
|
movdqa xmm12,XMMWORD PTR[$L$xts_magic]
|
||
|
pcmpgtd xmm14,xmm6
|
||
|
pshufd xmm13,xmm14,013h
|
||
|
pxor xmm14,xmm14
|
||
|
paddq xmm6,xmm6
|
||
|
pand xmm13,xmm12
|
||
|
pcmpgtd xmm14,xmm6
|
||
|
pxor xmm6,xmm13
|
||
|
|
||
|
sub r14,080h
|
||
|
jnc $L$xts_enc_loop
|
||
|
|
||
|
$L$xts_enc_short::
|
||
|
add r14,080h
|
||
|
jz $L$xts_enc_done
|
||
|
pshufd xmm13,xmm14,013h
|
||
|
pxor xmm14,xmm14
|
||
|
movdqa xmm15,xmm6
|
||
|
movdqa XMMWORD PTR[rsp],xmm6
|
||
|
paddq xmm6,xmm6
|
||
|
pand xmm13,xmm12
|
||
|
pcmpgtd xmm14,xmm6
|
||
|
pxor xmm6,xmm13
|
||
|
pshufd xmm13,xmm14,013h
|
||
|
pxor xmm14,xmm14
|
||
|
movdqa xmm0,xmm6
|
||
|
movdqa XMMWORD PTR[16+rsp],xmm6
|
||
|
paddq xmm6,xmm6
|
||
|
pand xmm13,xmm12
|
||
|
pcmpgtd xmm14,xmm6
|
||
|
pxor xmm6,xmm13
|
||
|
movdqu xmm7,XMMWORD PTR[r12]
|
||
|
cmp r14,16
|
||
|
je $L$xts_enc_1
|
||
|
pshufd xmm13,xmm14,013h
|
||
|
pxor xmm14,xmm14
|
||
|
movdqa xmm1,xmm6
|
||
|
movdqa XMMWORD PTR[32+rsp],xmm6
|
||
|
paddq xmm6,xmm6
|
||
|
pand xmm13,xmm12
|
||
|
pcmpgtd xmm14,xmm6
|
||
|
pxor xmm6,xmm13
|
||
|
movdqu xmm8,XMMWORD PTR[16+r12]
|
||
|
cmp r14,32
|
||
|
je $L$xts_enc_2
|
||
|
pxor xmm15,xmm7
|
||
|
pshufd xmm13,xmm14,013h
|
||
|
pxor xmm14,xmm14
|
||
|
movdqa xmm2,xmm6
|
||
|
movdqa XMMWORD PTR[48+rsp],xmm6
|
||
|
paddq xmm6,xmm6
|
||
|
pand xmm13,xmm12
|
||
|
pcmpgtd xmm14,xmm6
|
||
|
pxor xmm6,xmm13
|
||
|
movdqu xmm9,XMMWORD PTR[32+r12]
|
||
|
cmp r14,48
|
||
|
je $L$xts_enc_3
|
||
|
pxor xmm0,xmm8
|
||
|
pshufd xmm13,xmm14,013h
|
||
|
pxor xmm14,xmm14
|
||
|
movdqa xmm3,xmm6
|
||
|
movdqa XMMWORD PTR[64+rsp],xmm6
|
||
|
paddq xmm6,xmm6
|
||
|
pand xmm13,xmm12
|
||
|
pcmpgtd xmm14,xmm6
|
||
|
pxor xmm6,xmm13
|
||
|
movdqu xmm10,XMMWORD PTR[48+r12]
|
||
|
cmp r14,64
|
||
|
je $L$xts_enc_4
|
||
|
pxor xmm1,xmm9
|
||
|
pshufd xmm13,xmm14,013h
|
||
|
pxor xmm14,xmm14
|
||
|
movdqa xmm4,xmm6
|
||
|
movdqa XMMWORD PTR[80+rsp],xmm6
|
||
|
paddq xmm6,xmm6
|
||
|
pand xmm13,xmm12
|
||
|
pcmpgtd xmm14,xmm6
|
||
|
pxor xmm6,xmm13
|
||
|
movdqu xmm11,XMMWORD PTR[64+r12]
|
||
|
cmp r14,80
|
||
|
je $L$xts_enc_5
|
||
|
pxor xmm2,xmm10
|
||
|
pshufd xmm13,xmm14,013h
|
||
|
pxor xmm14,xmm14
|
||
|
movdqa xmm5,xmm6
|
||
|
movdqa XMMWORD PTR[96+rsp],xmm6
|
||
|
paddq xmm6,xmm6
|
||
|
pand xmm13,xmm12
|
||
|
pcmpgtd xmm14,xmm6
|
||
|
pxor xmm6,xmm13
|
||
|
movdqu xmm12,XMMWORD PTR[80+r12]
|
||
|
cmp r14,96
|
||
|
je $L$xts_enc_6
|
||
|
pxor xmm3,xmm11
|
||
|
movdqu xmm13,XMMWORD PTR[96+r12]
|
||
|
pxor xmm4,xmm12
|
||
|
movdqa XMMWORD PTR[112+rsp],xmm6
|
||
|
lea r12,QWORD PTR[112+r12]
|
||
|
pxor xmm5,xmm13
|
||
|
lea rax,QWORD PTR[128+rsp]
|
||
|
mov r10d,edx
|
||
|
|
||
|
call _bsaes_encrypt8
|
||
|
|
||
|
pxor xmm15,XMMWORD PTR[rsp]
|
||
|
pxor xmm0,XMMWORD PTR[16+rsp]
|
||
|
movdqu XMMWORD PTR[r13],xmm15
|
||
|
pxor xmm3,XMMWORD PTR[32+rsp]
|
||
|
movdqu XMMWORD PTR[16+r13],xmm0
|
||
|
pxor xmm5,XMMWORD PTR[48+rsp]
|
||
|
movdqu XMMWORD PTR[32+r13],xmm3
|
||
|
pxor xmm2,XMMWORD PTR[64+rsp]
|
||
|
movdqu XMMWORD PTR[48+r13],xmm5
|
||
|
pxor xmm6,XMMWORD PTR[80+rsp]
|
||
|
movdqu XMMWORD PTR[64+r13],xmm2
|
||
|
pxor xmm1,XMMWORD PTR[96+rsp]
|
||
|
movdqu XMMWORD PTR[80+r13],xmm6
|
||
|
movdqu XMMWORD PTR[96+r13],xmm1
|
||
|
lea r13,QWORD PTR[112+r13]
|
||
|
|
||
|
movdqa xmm6,XMMWORD PTR[112+rsp]
|
||
|
jmp $L$xts_enc_done
|
||
|
ALIGN 16
|
||
|
$L$xts_enc_6::
|
||
|
pxor xmm3,xmm11
|
||
|
lea r12,QWORD PTR[96+r12]
|
||
|
pxor xmm4,xmm12
|
||
|
lea rax,QWORD PTR[128+rsp]
|
||
|
mov r10d,edx
|
||
|
|
||
|
call _bsaes_encrypt8
|
||
|
|
||
|
pxor xmm15,XMMWORD PTR[rsp]
|
||
|
pxor xmm0,XMMWORD PTR[16+rsp]
|
||
|
movdqu XMMWORD PTR[r13],xmm15
|
||
|
pxor xmm3,XMMWORD PTR[32+rsp]
|
||
|
movdqu XMMWORD PTR[16+r13],xmm0
|
||
|
pxor xmm5,XMMWORD PTR[48+rsp]
|
||
|
movdqu XMMWORD PTR[32+r13],xmm3
|
||
|
pxor xmm2,XMMWORD PTR[64+rsp]
|
||
|
movdqu XMMWORD PTR[48+r13],xmm5
|
||
|
pxor xmm6,XMMWORD PTR[80+rsp]
|
||
|
movdqu XMMWORD PTR[64+r13],xmm2
|
||
|
movdqu XMMWORD PTR[80+r13],xmm6
|
||
|
lea r13,QWORD PTR[96+r13]
|
||
|
|
||
|
movdqa xmm6,XMMWORD PTR[96+rsp]
|
||
|
jmp $L$xts_enc_done
|
||
|
ALIGN 16
|
||
|
$L$xts_enc_5::
|
||
|
pxor xmm2,xmm10
|
||
|
lea r12,QWORD PTR[80+r12]
|
||
|
pxor xmm3,xmm11
|
||
|
lea rax,QWORD PTR[128+rsp]
|
||
|
mov r10d,edx
|
||
|
|
||
|
call _bsaes_encrypt8
|
||
|
|
||
|
pxor xmm15,XMMWORD PTR[rsp]
|
||
|
pxor xmm0,XMMWORD PTR[16+rsp]
|
||
|
movdqu XMMWORD PTR[r13],xmm15
|
||
|
pxor xmm3,XMMWORD PTR[32+rsp]
|
||
|
movdqu XMMWORD PTR[16+r13],xmm0
|
||
|
pxor xmm5,XMMWORD PTR[48+rsp]
|
||
|
movdqu XMMWORD PTR[32+r13],xmm3
|
||
|
pxor xmm2,XMMWORD PTR[64+rsp]
|
||
|
movdqu XMMWORD PTR[48+r13],xmm5
|
||
|
movdqu XMMWORD PTR[64+r13],xmm2
|
||
|
lea r13,QWORD PTR[80+r13]
|
||
|
|
||
|
movdqa xmm6,XMMWORD PTR[80+rsp]
|
||
|
jmp $L$xts_enc_done
|
||
|
ALIGN 16
|
||
|
$L$xts_enc_4::
|
||
|
pxor xmm1,xmm9
|
||
|
lea r12,QWORD PTR[64+r12]
|
||
|
pxor xmm2,xmm10
|
||
|
lea rax,QWORD PTR[128+rsp]
|
||
|
mov r10d,edx
|
||
|
|
||
|
call _bsaes_encrypt8
|
||
|
|
||
|
pxor xmm15,XMMWORD PTR[rsp]
|
||
|
pxor xmm0,XMMWORD PTR[16+rsp]
|
||
|
movdqu XMMWORD PTR[r13],xmm15
|
||
|
pxor xmm3,XMMWORD PTR[32+rsp]
|
||
|
movdqu XMMWORD PTR[16+r13],xmm0
|
||
|
pxor xmm5,XMMWORD PTR[48+rsp]
|
||
|
movdqu XMMWORD PTR[32+r13],xmm3
|
||
|
movdqu XMMWORD PTR[48+r13],xmm5
|
||
|
lea r13,QWORD PTR[64+r13]
|
||
|
|
||
|
movdqa xmm6,XMMWORD PTR[64+rsp]
|
||
|
jmp $L$xts_enc_done
|
||
|
ALIGN 16
|
||
|
$L$xts_enc_3::
|
||
|
pxor xmm0,xmm8
|
||
|
lea r12,QWORD PTR[48+r12]
|
||
|
pxor xmm1,xmm9
|
||
|
lea rax,QWORD PTR[128+rsp]
|
||
|
mov r10d,edx
|
||
|
|
||
|
call _bsaes_encrypt8
|
||
|
|
||
|
pxor xmm15,XMMWORD PTR[rsp]
|
||
|
pxor xmm0,XMMWORD PTR[16+rsp]
|
||
|
movdqu XMMWORD PTR[r13],xmm15
|
||
|
pxor xmm3,XMMWORD PTR[32+rsp]
|
||
|
movdqu XMMWORD PTR[16+r13],xmm0
|
||
|
movdqu XMMWORD PTR[32+r13],xmm3
|
||
|
lea r13,QWORD PTR[48+r13]
|
||
|
|
||
|
movdqa xmm6,XMMWORD PTR[48+rsp]
|
||
|
jmp $L$xts_enc_done
|
||
|
ALIGN 16
|
||
|
$L$xts_enc_2::
|
||
|
pxor xmm15,xmm7
|
||
|
lea r12,QWORD PTR[32+r12]
|
||
|
pxor xmm0,xmm8
|
||
|
lea rax,QWORD PTR[128+rsp]
|
||
|
mov r10d,edx
|
||
|
|
||
|
call _bsaes_encrypt8
|
||
|
|
||
|
pxor xmm15,XMMWORD PTR[rsp]
|
||
|
pxor xmm0,XMMWORD PTR[16+rsp]
|
||
|
movdqu XMMWORD PTR[r13],xmm15
|
||
|
movdqu XMMWORD PTR[16+r13],xmm0
|
||
|
lea r13,QWORD PTR[32+r13]
|
||
|
|
||
|
movdqa xmm6,XMMWORD PTR[32+rsp]
|
||
|
jmp $L$xts_enc_done
|
||
|
ALIGN 16
|
||
|
$L$xts_enc_1::
|
||
|
pxor xmm7,xmm15
|
||
|
lea r12,QWORD PTR[16+r12]
|
||
|
movdqa XMMWORD PTR[32+rbp],xmm7
|
||
|
lea rcx,QWORD PTR[32+rbp]
|
||
|
lea rdx,QWORD PTR[32+rbp]
|
||
|
lea r8,QWORD PTR[r15]
|
||
|
call asm_AES_encrypt
|
||
|
pxor xmm15,XMMWORD PTR[32+rbp]
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
movdqu XMMWORD PTR[r13],xmm15
|
||
|
lea r13,QWORD PTR[16+r13]
|
||
|
|
||
|
movdqa xmm6,XMMWORD PTR[16+rsp]
|
||
|
|
||
|
$L$xts_enc_done::
|
||
|
and ebx,15
|
||
|
jz $L$xts_enc_ret
|
||
|
mov rdx,r13
|
||
|
|
||
|
$L$xts_enc_steal::
|
||
|
movzx eax,BYTE PTR[r12]
|
||
|
movzx ecx,BYTE PTR[((-16))+rdx]
|
||
|
lea r12,QWORD PTR[1+r12]
|
||
|
mov BYTE PTR[((-16))+rdx],al
|
||
|
mov BYTE PTR[rdx],cl
|
||
|
lea rdx,QWORD PTR[1+rdx]
|
||
|
sub ebx,1
|
||
|
jnz $L$xts_enc_steal
|
||
|
|
||
|
movdqu xmm15,XMMWORD PTR[((-16))+r13]
|
||
|
lea rcx,QWORD PTR[32+rbp]
|
||
|
pxor xmm15,xmm6
|
||
|
lea rdx,QWORD PTR[32+rbp]
|
||
|
movdqa XMMWORD PTR[32+rbp],xmm15
|
||
|
lea r8,QWORD PTR[r15]
|
||
|
call asm_AES_encrypt
|
||
|
pxor xmm6,XMMWORD PTR[32+rbp]
|
||
|
movdqu XMMWORD PTR[(-16)+r13],xmm6
|
||
|
|
||
|
$L$xts_enc_ret::
|
||
|
lea rax,QWORD PTR[rsp]
|
||
|
pxor xmm0,xmm0
|
||
|
$L$xts_enc_bzero::
|
||
|
movdqa XMMWORD PTR[rax],xmm0
|
||
|
movdqa XMMWORD PTR[16+rax],xmm0
|
||
|
lea rax,QWORD PTR[32+rax]
|
||
|
cmp rbp,rax
|
||
|
ja $L$xts_enc_bzero
|
||
|
|
||
|
lea rsp,QWORD PTR[rbp]
|
||
|
movaps xmm6,XMMWORD PTR[64+rbp]
|
||
|
movaps xmm7,XMMWORD PTR[80+rbp]
|
||
|
movaps xmm8,XMMWORD PTR[96+rbp]
|
||
|
movaps xmm9,XMMWORD PTR[112+rbp]
|
||
|
movaps xmm10,XMMWORD PTR[128+rbp]
|
||
|
movaps xmm11,XMMWORD PTR[144+rbp]
|
||
|
movaps xmm12,XMMWORD PTR[160+rbp]
|
||
|
movaps xmm13,XMMWORD PTR[176+rbp]
|
||
|
movaps xmm14,XMMWORD PTR[192+rbp]
|
||
|
movaps xmm15,XMMWORD PTR[208+rbp]
|
||
|
lea rsp,QWORD PTR[160+rbp]
|
||
|
mov r15,QWORD PTR[72+rsp]
|
||
|
mov r14,QWORD PTR[80+rsp]
|
||
|
mov r13,QWORD PTR[88+rsp]
|
||
|
mov r12,QWORD PTR[96+rsp]
|
||
|
mov rbx,QWORD PTR[104+rsp]
|
||
|
mov rax,QWORD PTR[112+rsp]
|
||
|
lea rsp,QWORD PTR[120+rsp]
|
||
|
mov rbp,rax
|
||
|
$L$xts_enc_epilogue::
|
||
|
DB 0F3h,0C3h ;repret
|
||
|
bsaes_xts_encrypt ENDP
|
||
|
|
||
|
PUBLIC bsaes_xts_decrypt
|
||
|
|
||
|
ALIGN 16
|
||
|
bsaes_xts_decrypt PROC PUBLIC
|
||
|
mov rax,rsp
|
||
|
$L$xts_dec_prologue::
|
||
|
push rbp
|
||
|
push rbx
|
||
|
push r12
|
||
|
push r13
|
||
|
push r14
|
||
|
push r15
|
||
|
lea rsp,QWORD PTR[((-72))+rsp]
|
||
|
mov r10,QWORD PTR[160+rsp]
|
||
|
mov r11,QWORD PTR[168+rsp]
|
||
|
lea rsp,QWORD PTR[((-160))+rsp]
|
||
|
movaps XMMWORD PTR[64+rsp],xmm6
|
||
|
movaps XMMWORD PTR[80+rsp],xmm7
|
||
|
movaps XMMWORD PTR[96+rsp],xmm8
|
||
|
movaps XMMWORD PTR[112+rsp],xmm9
|
||
|
movaps XMMWORD PTR[128+rsp],xmm10
|
||
|
movaps XMMWORD PTR[144+rsp],xmm11
|
||
|
movaps XMMWORD PTR[160+rsp],xmm12
|
||
|
movaps XMMWORD PTR[176+rsp],xmm13
|
||
|
movaps XMMWORD PTR[192+rsp],xmm14
|
||
|
movaps XMMWORD PTR[208+rsp],xmm15
|
||
|
$L$xts_dec_body::
|
||
|
mov rbp,rsp
|
||
|
mov r12,rcx
|
||
|
mov r13,rdx
|
||
|
mov r14,r8
|
||
|
mov r15,r9
|
||
|
|
||
|
lea rcx,QWORD PTR[r11]
|
||
|
lea rdx,QWORD PTR[32+rbp]
|
||
|
lea r8,QWORD PTR[r10]
|
||
|
call asm_AES_encrypt
|
||
|
|
||
|
mov eax,DWORD PTR[240+r15]
|
||
|
mov rbx,r14
|
||
|
|
||
|
mov edx,eax
|
||
|
shl rax,7
|
||
|
sub rax,96
|
||
|
sub rsp,rax
|
||
|
|
||
|
mov rax,rsp
|
||
|
mov rcx,r15
|
||
|
mov r10d,edx
|
||
|
call _bsaes_key_convert
|
||
|
pxor xmm7,XMMWORD PTR[rsp]
|
||
|
movdqa XMMWORD PTR[rax],xmm6
|
||
|
movdqa XMMWORD PTR[rsp],xmm7
|
||
|
|
||
|
xor eax,eax
|
||
|
and r14,-16
|
||
|
test ebx,15
|
||
|
setnz al
|
||
|
shl rax,4
|
||
|
sub r14,rax
|
||
|
|
||
|
sub rsp,080h
|
||
|
movdqa xmm6,XMMWORD PTR[32+rbp]
|
||
|
|
||
|
pxor xmm14,xmm14
|
||
|
movdqa xmm12,XMMWORD PTR[$L$xts_magic]
|
||
|
pcmpgtd xmm14,xmm6
|
||
|
|
||
|
sub r14,080h
|
||
|
jc $L$xts_dec_short
|
||
|
jmp $L$xts_dec_loop
|
||
|
|
||
|
ALIGN 16
|
||
|
$L$xts_dec_loop::
|
||
|
pshufd xmm13,xmm14,013h
|
||
|
pxor xmm14,xmm14
|
||
|
movdqa xmm15,xmm6
|
||
|
movdqa XMMWORD PTR[rsp],xmm6
|
||
|
paddq xmm6,xmm6
|
||
|
pand xmm13,xmm12
|
||
|
pcmpgtd xmm14,xmm6
|
||
|
pxor xmm6,xmm13
|
||
|
pshufd xmm13,xmm14,013h
|
||
|
pxor xmm14,xmm14
|
||
|
movdqa xmm0,xmm6
|
||
|
movdqa XMMWORD PTR[16+rsp],xmm6
|
||
|
paddq xmm6,xmm6
|
||
|
pand xmm13,xmm12
|
||
|
pcmpgtd xmm14,xmm6
|
||
|
pxor xmm6,xmm13
|
||
|
movdqu xmm7,XMMWORD PTR[r12]
|
||
|
pshufd xmm13,xmm14,013h
|
||
|
pxor xmm14,xmm14
|
||
|
movdqa xmm1,xmm6
|
||
|
movdqa XMMWORD PTR[32+rsp],xmm6
|
||
|
paddq xmm6,xmm6
|
||
|
pand xmm13,xmm12
|
||
|
pcmpgtd xmm14,xmm6
|
||
|
pxor xmm6,xmm13
|
||
|
movdqu xmm8,XMMWORD PTR[16+r12]
|
||
|
pxor xmm15,xmm7
|
||
|
pshufd xmm13,xmm14,013h
|
||
|
pxor xmm14,xmm14
|
||
|
movdqa xmm2,xmm6
|
||
|
movdqa XMMWORD PTR[48+rsp],xmm6
|
||
|
paddq xmm6,xmm6
|
||
|
pand xmm13,xmm12
|
||
|
pcmpgtd xmm14,xmm6
|
||
|
pxor xmm6,xmm13
|
||
|
movdqu xmm9,XMMWORD PTR[32+r12]
|
||
|
pxor xmm0,xmm8
|
||
|
pshufd xmm13,xmm14,013h
|
||
|
pxor xmm14,xmm14
|
||
|
movdqa xmm3,xmm6
|
||
|
movdqa XMMWORD PTR[64+rsp],xmm6
|
||
|
paddq xmm6,xmm6
|
||
|
pand xmm13,xmm12
|
||
|
pcmpgtd xmm14,xmm6
|
||
|
pxor xmm6,xmm13
|
||
|
movdqu xmm10,XMMWORD PTR[48+r12]
|
||
|
pxor xmm1,xmm9
|
||
|
pshufd xmm13,xmm14,013h
|
||
|
pxor xmm14,xmm14
|
||
|
movdqa xmm4,xmm6
|
||
|
movdqa XMMWORD PTR[80+rsp],xmm6
|
||
|
paddq xmm6,xmm6
|
||
|
pand xmm13,xmm12
|
||
|
pcmpgtd xmm14,xmm6
|
||
|
pxor xmm6,xmm13
|
||
|
movdqu xmm11,XMMWORD PTR[64+r12]
|
||
|
pxor xmm2,xmm10
|
||
|
pshufd xmm13,xmm14,013h
|
||
|
pxor xmm14,xmm14
|
||
|
movdqa xmm5,xmm6
|
||
|
movdqa XMMWORD PTR[96+rsp],xmm6
|
||
|
paddq xmm6,xmm6
|
||
|
pand xmm13,xmm12
|
||
|
pcmpgtd xmm14,xmm6
|
||
|
pxor xmm6,xmm13
|
||
|
movdqu xmm12,XMMWORD PTR[80+r12]
|
||
|
pxor xmm3,xmm11
|
||
|
movdqu xmm13,XMMWORD PTR[96+r12]
|
||
|
pxor xmm4,xmm12
|
||
|
movdqu xmm14,XMMWORD PTR[112+r12]
|
||
|
lea r12,QWORD PTR[128+r12]
|
||
|
movdqa XMMWORD PTR[112+rsp],xmm6
|
||
|
pxor xmm5,xmm13
|
||
|
lea rax,QWORD PTR[128+rsp]
|
||
|
pxor xmm6,xmm14
|
||
|
mov r10d,edx
|
||
|
|
||
|
call _bsaes_decrypt8
|
||
|
|
||
|
pxor xmm15,XMMWORD PTR[rsp]
|
||
|
pxor xmm0,XMMWORD PTR[16+rsp]
|
||
|
movdqu XMMWORD PTR[r13],xmm15
|
||
|
pxor xmm5,XMMWORD PTR[32+rsp]
|
||
|
movdqu XMMWORD PTR[16+r13],xmm0
|
||
|
pxor xmm3,XMMWORD PTR[48+rsp]
|
||
|
movdqu XMMWORD PTR[32+r13],xmm5
|
||
|
pxor xmm1,XMMWORD PTR[64+rsp]
|
||
|
movdqu XMMWORD PTR[48+r13],xmm3
|
||
|
pxor xmm6,XMMWORD PTR[80+rsp]
|
||
|
movdqu XMMWORD PTR[64+r13],xmm1
|
||
|
pxor xmm2,XMMWORD PTR[96+rsp]
|
||
|
movdqu XMMWORD PTR[80+r13],xmm6
|
||
|
pxor xmm4,XMMWORD PTR[112+rsp]
|
||
|
movdqu XMMWORD PTR[96+r13],xmm2
|
||
|
movdqu XMMWORD PTR[112+r13],xmm4
|
||
|
lea r13,QWORD PTR[128+r13]
|
||
|
|
||
|
movdqa xmm6,XMMWORD PTR[112+rsp]
|
||
|
pxor xmm14,xmm14
|
||
|
movdqa xmm12,XMMWORD PTR[$L$xts_magic]
|
||
|
pcmpgtd xmm14,xmm6
|
||
|
pshufd xmm13,xmm14,013h
|
||
|
pxor xmm14,xmm14
|
||
|
paddq xmm6,xmm6
|
||
|
pand xmm13,xmm12
|
||
|
pcmpgtd xmm14,xmm6
|
||
|
pxor xmm6,xmm13
|
||
|
|
||
|
sub r14,080h
|
||
|
jnc $L$xts_dec_loop
|
||
|
|
||
|
$L$xts_dec_short::
|
||
|
add r14,080h
|
||
|
jz $L$xts_dec_done
|
||
|
pshufd xmm13,xmm14,013h
|
||
|
pxor xmm14,xmm14
|
||
|
movdqa xmm15,xmm6
|
||
|
movdqa XMMWORD PTR[rsp],xmm6
|
||
|
paddq xmm6,xmm6
|
||
|
pand xmm13,xmm12
|
||
|
pcmpgtd xmm14,xmm6
|
||
|
pxor xmm6,xmm13
|
||
|
pshufd xmm13,xmm14,013h
|
||
|
pxor xmm14,xmm14
|
||
|
movdqa xmm0,xmm6
|
||
|
movdqa XMMWORD PTR[16+rsp],xmm6
|
||
|
paddq xmm6,xmm6
|
||
|
pand xmm13,xmm12
|
||
|
pcmpgtd xmm14,xmm6
|
||
|
pxor xmm6,xmm13
|
||
|
movdqu xmm7,XMMWORD PTR[r12]
|
||
|
cmp r14,16
|
||
|
je $L$xts_dec_1
|
||
|
pshufd xmm13,xmm14,013h
|
||
|
pxor xmm14,xmm14
|
||
|
movdqa xmm1,xmm6
|
||
|
movdqa XMMWORD PTR[32+rsp],xmm6
|
||
|
paddq xmm6,xmm6
|
||
|
pand xmm13,xmm12
|
||
|
pcmpgtd xmm14,xmm6
|
||
|
pxor xmm6,xmm13
|
||
|
movdqu xmm8,XMMWORD PTR[16+r12]
|
||
|
cmp r14,32
|
||
|
je $L$xts_dec_2
|
||
|
pxor xmm15,xmm7
|
||
|
pshufd xmm13,xmm14,013h
|
||
|
pxor xmm14,xmm14
|
||
|
movdqa xmm2,xmm6
|
||
|
movdqa XMMWORD PTR[48+rsp],xmm6
|
||
|
paddq xmm6,xmm6
|
||
|
pand xmm13,xmm12
|
||
|
pcmpgtd xmm14,xmm6
|
||
|
pxor xmm6,xmm13
|
||
|
movdqu xmm9,XMMWORD PTR[32+r12]
|
||
|
cmp r14,48
|
||
|
je $L$xts_dec_3
|
||
|
pxor xmm0,xmm8
|
||
|
pshufd xmm13,xmm14,013h
|
||
|
pxor xmm14,xmm14
|
||
|
movdqa xmm3,xmm6
|
||
|
movdqa XMMWORD PTR[64+rsp],xmm6
|
||
|
paddq xmm6,xmm6
|
||
|
pand xmm13,xmm12
|
||
|
pcmpgtd xmm14,xmm6
|
||
|
pxor xmm6,xmm13
|
||
|
movdqu xmm10,XMMWORD PTR[48+r12]
|
||
|
cmp r14,64
|
||
|
je $L$xts_dec_4
|
||
|
pxor xmm1,xmm9
|
||
|
pshufd xmm13,xmm14,013h
|
||
|
pxor xmm14,xmm14
|
||
|
movdqa xmm4,xmm6
|
||
|
movdqa XMMWORD PTR[80+rsp],xmm6
|
||
|
paddq xmm6,xmm6
|
||
|
pand xmm13,xmm12
|
||
|
pcmpgtd xmm14,xmm6
|
||
|
pxor xmm6,xmm13
|
||
|
movdqu xmm11,XMMWORD PTR[64+r12]
|
||
|
cmp r14,80
|
||
|
je $L$xts_dec_5
|
||
|
pxor xmm2,xmm10
|
||
|
pshufd xmm13,xmm14,013h
|
||
|
pxor xmm14,xmm14
|
||
|
movdqa xmm5,xmm6
|
||
|
movdqa XMMWORD PTR[96+rsp],xmm6
|
||
|
paddq xmm6,xmm6
|
||
|
pand xmm13,xmm12
|
||
|
pcmpgtd xmm14,xmm6
|
||
|
pxor xmm6,xmm13
|
||
|
movdqu xmm12,XMMWORD PTR[80+r12]
|
||
|
cmp r14,96
|
||
|
je $L$xts_dec_6
|
||
|
pxor xmm3,xmm11
|
||
|
movdqu xmm13,XMMWORD PTR[96+r12]
|
||
|
pxor xmm4,xmm12
|
||
|
movdqa XMMWORD PTR[112+rsp],xmm6
|
||
|
lea r12,QWORD PTR[112+r12]
|
||
|
pxor xmm5,xmm13
|
||
|
lea rax,QWORD PTR[128+rsp]
|
||
|
mov r10d,edx
|
||
|
|
||
|
call _bsaes_decrypt8
|
||
|
|
||
|
pxor xmm15,XMMWORD PTR[rsp]
|
||
|
pxor xmm0,XMMWORD PTR[16+rsp]
|
||
|
movdqu XMMWORD PTR[r13],xmm15
|
||
|
pxor xmm5,XMMWORD PTR[32+rsp]
|
||
|
movdqu XMMWORD PTR[16+r13],xmm0
|
||
|
pxor xmm3,XMMWORD PTR[48+rsp]
|
||
|
movdqu XMMWORD PTR[32+r13],xmm5
|
||
|
pxor xmm1,XMMWORD PTR[64+rsp]
|
||
|
movdqu XMMWORD PTR[48+r13],xmm3
|
||
|
pxor xmm6,XMMWORD PTR[80+rsp]
|
||
|
movdqu XMMWORD PTR[64+r13],xmm1
|
||
|
pxor xmm2,XMMWORD PTR[96+rsp]
|
||
|
movdqu XMMWORD PTR[80+r13],xmm6
|
||
|
movdqu XMMWORD PTR[96+r13],xmm2
|
||
|
lea r13,QWORD PTR[112+r13]
|
||
|
|
||
|
movdqa xmm6,XMMWORD PTR[112+rsp]
|
||
|
jmp $L$xts_dec_done
|
||
|
ALIGN 16
|
||
|
$L$xts_dec_6::
|
||
|
pxor xmm3,xmm11
|
||
|
lea r12,QWORD PTR[96+r12]
|
||
|
pxor xmm4,xmm12
|
||
|
lea rax,QWORD PTR[128+rsp]
|
||
|
mov r10d,edx
|
||
|
|
||
|
call _bsaes_decrypt8
|
||
|
|
||
|
pxor xmm15,XMMWORD PTR[rsp]
|
||
|
pxor xmm0,XMMWORD PTR[16+rsp]
|
||
|
movdqu XMMWORD PTR[r13],xmm15
|
||
|
pxor xmm5,XMMWORD PTR[32+rsp]
|
||
|
movdqu XMMWORD PTR[16+r13],xmm0
|
||
|
pxor xmm3,XMMWORD PTR[48+rsp]
|
||
|
movdqu XMMWORD PTR[32+r13],xmm5
|
||
|
pxor xmm1,XMMWORD PTR[64+rsp]
|
||
|
movdqu XMMWORD PTR[48+r13],xmm3
|
||
|
pxor xmm6,XMMWORD PTR[80+rsp]
|
||
|
movdqu XMMWORD PTR[64+r13],xmm1
|
||
|
movdqu XMMWORD PTR[80+r13],xmm6
|
||
|
lea r13,QWORD PTR[96+r13]
|
||
|
|
||
|
movdqa xmm6,XMMWORD PTR[96+rsp]
|
||
|
jmp $L$xts_dec_done
|
||
|
ALIGN 16
|
||
|
$L$xts_dec_5::
|
||
|
pxor xmm2,xmm10
|
||
|
lea r12,QWORD PTR[80+r12]
|
||
|
pxor xmm3,xmm11
|
||
|
lea rax,QWORD PTR[128+rsp]
|
||
|
mov r10d,edx
|
||
|
|
||
|
call _bsaes_decrypt8
|
||
|
|
||
|
pxor xmm15,XMMWORD PTR[rsp]
|
||
|
pxor xmm0,XMMWORD PTR[16+rsp]
|
||
|
movdqu XMMWORD PTR[r13],xmm15
|
||
|
pxor xmm5,XMMWORD PTR[32+rsp]
|
||
|
movdqu XMMWORD PTR[16+r13],xmm0
|
||
|
pxor xmm3,XMMWORD PTR[48+rsp]
|
||
|
movdqu XMMWORD PTR[32+r13],xmm5
|
||
|
pxor xmm1,XMMWORD PTR[64+rsp]
|
||
|
movdqu XMMWORD PTR[48+r13],xmm3
|
||
|
movdqu XMMWORD PTR[64+r13],xmm1
|
||
|
lea r13,QWORD PTR[80+r13]
|
||
|
|
||
|
movdqa xmm6,XMMWORD PTR[80+rsp]
|
||
|
jmp $L$xts_dec_done
|
||
|
ALIGN 16
|
||
|
$L$xts_dec_4::
|
||
|
pxor xmm1,xmm9
|
||
|
lea r12,QWORD PTR[64+r12]
|
||
|
pxor xmm2,xmm10
|
||
|
lea rax,QWORD PTR[128+rsp]
|
||
|
mov r10d,edx
|
||
|
|
||
|
call _bsaes_decrypt8
|
||
|
|
||
|
pxor xmm15,XMMWORD PTR[rsp]
|
||
|
pxor xmm0,XMMWORD PTR[16+rsp]
|
||
|
movdqu XMMWORD PTR[r13],xmm15
|
||
|
pxor xmm5,XMMWORD PTR[32+rsp]
|
||
|
movdqu XMMWORD PTR[16+r13],xmm0
|
||
|
pxor xmm3,XMMWORD PTR[48+rsp]
|
||
|
movdqu XMMWORD PTR[32+r13],xmm5
|
||
|
movdqu XMMWORD PTR[48+r13],xmm3
|
||
|
lea r13,QWORD PTR[64+r13]
|
||
|
|
||
|
movdqa xmm6,XMMWORD PTR[64+rsp]
|
||
|
jmp $L$xts_dec_done
|
||
|
ALIGN 16
|
||
|
$L$xts_dec_3::
|
||
|
pxor xmm0,xmm8
|
||
|
lea r12,QWORD PTR[48+r12]
|
||
|
pxor xmm1,xmm9
|
||
|
lea rax,QWORD PTR[128+rsp]
|
||
|
mov r10d,edx
|
||
|
|
||
|
call _bsaes_decrypt8
|
||
|
|
||
|
pxor xmm15,XMMWORD PTR[rsp]
|
||
|
pxor xmm0,XMMWORD PTR[16+rsp]
|
||
|
movdqu XMMWORD PTR[r13],xmm15
|
||
|
pxor xmm5,XMMWORD PTR[32+rsp]
|
||
|
movdqu XMMWORD PTR[16+r13],xmm0
|
||
|
movdqu XMMWORD PTR[32+r13],xmm5
|
||
|
lea r13,QWORD PTR[48+r13]
|
||
|
|
||
|
movdqa xmm6,XMMWORD PTR[48+rsp]
|
||
|
jmp $L$xts_dec_done
|
||
|
ALIGN 16
|
||
|
$L$xts_dec_2::
|
||
|
pxor xmm15,xmm7
|
||
|
lea r12,QWORD PTR[32+r12]
|
||
|
pxor xmm0,xmm8
|
||
|
lea rax,QWORD PTR[128+rsp]
|
||
|
mov r10d,edx
|
||
|
|
||
|
call _bsaes_decrypt8
|
||
|
|
||
|
pxor xmm15,XMMWORD PTR[rsp]
|
||
|
pxor xmm0,XMMWORD PTR[16+rsp]
|
||
|
movdqu XMMWORD PTR[r13],xmm15
|
||
|
movdqu XMMWORD PTR[16+r13],xmm0
|
||
|
lea r13,QWORD PTR[32+r13]
|
||
|
|
||
|
movdqa xmm6,XMMWORD PTR[32+rsp]
|
||
|
jmp $L$xts_dec_done
|
||
|
ALIGN 16
|
||
|
$L$xts_dec_1::
|
||
|
pxor xmm7,xmm15
|
||
|
lea r12,QWORD PTR[16+r12]
|
||
|
movdqa XMMWORD PTR[32+rbp],xmm7
|
||
|
lea rcx,QWORD PTR[32+rbp]
|
||
|
lea rdx,QWORD PTR[32+rbp]
|
||
|
lea r8,QWORD PTR[r15]
|
||
|
call asm_AES_decrypt
|
||
|
pxor xmm15,XMMWORD PTR[32+rbp]
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
movdqu XMMWORD PTR[r13],xmm15
|
||
|
lea r13,QWORD PTR[16+r13]
|
||
|
|
||
|
movdqa xmm6,XMMWORD PTR[16+rsp]
|
||
|
|
||
|
$L$xts_dec_done::
|
||
|
and ebx,15
|
||
|
jz $L$xts_dec_ret
|
||
|
|
||
|
pxor xmm14,xmm14
|
||
|
movdqa xmm12,XMMWORD PTR[$L$xts_magic]
|
||
|
pcmpgtd xmm14,xmm6
|
||
|
pshufd xmm13,xmm14,013h
|
||
|
movdqa xmm5,xmm6
|
||
|
paddq xmm6,xmm6
|
||
|
pand xmm13,xmm12
|
||
|
movdqu xmm15,XMMWORD PTR[r12]
|
||
|
pxor xmm6,xmm13
|
||
|
|
||
|
lea rcx,QWORD PTR[32+rbp]
|
||
|
pxor xmm15,xmm6
|
||
|
lea rdx,QWORD PTR[32+rbp]
|
||
|
movdqa XMMWORD PTR[32+rbp],xmm15
|
||
|
lea r8,QWORD PTR[r15]
|
||
|
call asm_AES_decrypt
|
||
|
pxor xmm6,XMMWORD PTR[32+rbp]
|
||
|
mov rdx,r13
|
||
|
movdqu XMMWORD PTR[r13],xmm6
|
||
|
|
||
|
$L$xts_dec_steal::
|
||
|
movzx eax,BYTE PTR[16+r12]
|
||
|
movzx ecx,BYTE PTR[rdx]
|
||
|
lea r12,QWORD PTR[1+r12]
|
||
|
mov BYTE PTR[rdx],al
|
||
|
mov BYTE PTR[16+rdx],cl
|
||
|
lea rdx,QWORD PTR[1+rdx]
|
||
|
sub ebx,1
|
||
|
jnz $L$xts_dec_steal
|
||
|
|
||
|
movdqu xmm15,XMMWORD PTR[r13]
|
||
|
lea rcx,QWORD PTR[32+rbp]
|
||
|
pxor xmm15,xmm5
|
||
|
lea rdx,QWORD PTR[32+rbp]
|
||
|
movdqa XMMWORD PTR[32+rbp],xmm15
|
||
|
lea r8,QWORD PTR[r15]
|
||
|
call asm_AES_decrypt
|
||
|
pxor xmm5,XMMWORD PTR[32+rbp]
|
||
|
movdqu XMMWORD PTR[r13],xmm5
|
||
|
|
||
|
$L$xts_dec_ret::
|
||
|
lea rax,QWORD PTR[rsp]
|
||
|
pxor xmm0,xmm0
|
||
|
$L$xts_dec_bzero::
|
||
|
movdqa XMMWORD PTR[rax],xmm0
|
||
|
movdqa XMMWORD PTR[16+rax],xmm0
|
||
|
lea rax,QWORD PTR[32+rax]
|
||
|
cmp rbp,rax
|
||
|
ja $L$xts_dec_bzero
|
||
|
|
||
|
lea rsp,QWORD PTR[rbp]
|
||
|
movaps xmm6,XMMWORD PTR[64+rbp]
|
||
|
movaps xmm7,XMMWORD PTR[80+rbp]
|
||
|
movaps xmm8,XMMWORD PTR[96+rbp]
|
||
|
movaps xmm9,XMMWORD PTR[112+rbp]
|
||
|
movaps xmm10,XMMWORD PTR[128+rbp]
|
||
|
movaps xmm11,XMMWORD PTR[144+rbp]
|
||
|
movaps xmm12,XMMWORD PTR[160+rbp]
|
||
|
movaps xmm13,XMMWORD PTR[176+rbp]
|
||
|
movaps xmm14,XMMWORD PTR[192+rbp]
|
||
|
movaps xmm15,XMMWORD PTR[208+rbp]
|
||
|
lea rsp,QWORD PTR[160+rbp]
|
||
|
mov r15,QWORD PTR[72+rsp]
|
||
|
mov r14,QWORD PTR[80+rsp]
|
||
|
mov r13,QWORD PTR[88+rsp]
|
||
|
mov r12,QWORD PTR[96+rsp]
|
||
|
mov rbx,QWORD PTR[104+rsp]
|
||
|
mov rax,QWORD PTR[112+rsp]
|
||
|
lea rsp,QWORD PTR[120+rsp]
|
||
|
mov rbp,rax
|
||
|
$L$xts_dec_epilogue::
|
||
|
DB 0F3h,0C3h ;repret
|
||
|
bsaes_xts_decrypt ENDP
|
||
|
|
||
|
ALIGN 64
|
||
|
_bsaes_const::
|
||
|
$L$M0ISR::
|
||
|
DQ 00a0e0206070b0f03h,00004080c0d010509h
|
||
|
$L$ISRM0::
|
||
|
DQ 001040b0e0205080fh,00306090c00070a0dh
|
||
|
$L$ISR::
|
||
|
DQ 00504070602010003h,00f0e0d0c080b0a09h
|
||
|
$L$BS0::
|
||
|
DQ 05555555555555555h,05555555555555555h
|
||
|
$L$BS1::
|
||
|
DQ 03333333333333333h,03333333333333333h
|
||
|
$L$BS2::
|
||
|
DQ 00f0f0f0f0f0f0f0fh,00f0f0f0f0f0f0f0fh
|
||
|
$L$SR::
|
||
|
DQ 00504070600030201h,00f0e0d0c0a09080bh
|
||
|
$L$SRM0::
|
||
|
DQ 00304090e00050a0fh,001060b0c0207080dh
|
||
|
$L$M0SR::
|
||
|
DQ 00a0e02060f03070bh,00004080c05090d01h
|
||
|
$L$SWPUP::
|
||
|
DQ 00706050403020100h,00c0d0e0f0b0a0908h
|
||
|
$L$SWPUPM0SR::
|
||
|
DQ 00a0d02060c03070bh,00004080f05090e01h
|
||
|
$L$ADD1::
|
||
|
DQ 00000000000000000h,00000000100000000h
|
||
|
$L$ADD2::
|
||
|
DQ 00000000000000000h,00000000200000000h
|
||
|
$L$ADD3::
|
||
|
DQ 00000000000000000h,00000000300000000h
|
||
|
$L$ADD4::
|
||
|
DQ 00000000000000000h,00000000400000000h
|
||
|
$L$ADD5::
|
||
|
DQ 00000000000000000h,00000000500000000h
|
||
|
$L$ADD6::
|
||
|
DQ 00000000000000000h,00000000600000000h
|
||
|
$L$ADD7::
|
||
|
DQ 00000000000000000h,00000000700000000h
|
||
|
$L$ADD8::
|
||
|
DQ 00000000000000000h,00000000800000000h
|
||
|
$L$xts_magic::
|
||
|
DD 087h,0,1,0
|
||
|
$L$masks::
|
||
|
DQ 00101010101010101h,00101010101010101h
|
||
|
DQ 00202020202020202h,00202020202020202h
|
||
|
DQ 00404040404040404h,00404040404040404h
|
||
|
DQ 00808080808080808h,00808080808080808h
|
||
|
$L$M0::
|
||
|
DQ 002060a0e03070b0fh,00004080c0105090dh
|
||
|
$L$63::
|
||
|
DQ 06363636363636363h,06363636363636363h
|
||
|
DB 66,105,116,45,115,108,105,99,101,100,32,65,69,83,32,102
|
||
|
DB 111,114,32,120,56,54,95,54,52,47,83,83,83,69,51,44
|
||
|
DB 32,69,109,105,108,105,97,32,75,195,164,115,112,101,114,44
|
||
|
DB 32,80,101,116,101,114,32,83,99,104,119,97,98,101,44,32
|
||
|
DB 65,110,100,121,32,80,111,108,121,97,107,111,118,0
|
||
|
ALIGN 64
|
||
|
|
||
|
EXTERN __imp_RtlVirtualUnwind:NEAR
|
||
|
|
||
|
ALIGN 16
|
||
|
se_handler PROC PRIVATE
|
||
|
push rsi
|
||
|
push rdi
|
||
|
push rbx
|
||
|
push rbp
|
||
|
push r12
|
||
|
push r13
|
||
|
push r14
|
||
|
push r15
|
||
|
pushfq
|
||
|
sub rsp,64
|
||
|
|
||
|
mov rax,QWORD PTR[120+r8]
|
||
|
mov rbx,QWORD PTR[248+r8]
|
||
|
|
||
|
mov rsi,QWORD PTR[8+r9]
|
||
|
mov r11,QWORD PTR[56+r9]
|
||
|
|
||
|
mov r10d,DWORD PTR[r11]
|
||
|
lea r10,QWORD PTR[r10*1+rsi]
|
||
|
cmp rbx,r10
|
||
|
jb $L$in_prologue
|
||
|
|
||
|
mov rax,QWORD PTR[152+r8]
|
||
|
|
||
|
mov r10d,DWORD PTR[4+r11]
|
||
|
lea r10,QWORD PTR[r10*1+rsi]
|
||
|
cmp rbx,r10
|
||
|
jae $L$in_prologue
|
||
|
|
||
|
mov rax,QWORD PTR[160+r8]
|
||
|
|
||
|
lea rsi,QWORD PTR[64+rax]
|
||
|
lea rdi,QWORD PTR[512+r8]
|
||
|
mov ecx,20
|
||
|
DD 0a548f3fch
|
||
|
lea rax,QWORD PTR[160+rax]
|
||
|
|
||
|
mov rbp,QWORD PTR[112+rax]
|
||
|
mov rbx,QWORD PTR[104+rax]
|
||
|
mov r12,QWORD PTR[96+rax]
|
||
|
mov r13,QWORD PTR[88+rax]
|
||
|
mov r14,QWORD PTR[80+rax]
|
||
|
mov r15,QWORD PTR[72+rax]
|
||
|
lea rax,QWORD PTR[120+rax]
|
||
|
mov QWORD PTR[144+r8],rbx
|
||
|
mov QWORD PTR[160+r8],rbp
|
||
|
mov QWORD PTR[216+r8],r12
|
||
|
mov QWORD PTR[224+r8],r13
|
||
|
mov QWORD PTR[232+r8],r14
|
||
|
mov QWORD PTR[240+r8],r15
|
||
|
|
||
|
$L$in_prologue::
|
||
|
mov QWORD PTR[152+r8],rax
|
||
|
|
||
|
mov rdi,QWORD PTR[40+r9]
|
||
|
mov rsi,r8
|
||
|
mov ecx,154
|
||
|
DD 0a548f3fch
|
||
|
|
||
|
mov rsi,r9
|
||
|
xor rcx,rcx
|
||
|
mov rdx,QWORD PTR[8+rsi]
|
||
|
mov r8,QWORD PTR[rsi]
|
||
|
mov r9,QWORD PTR[16+rsi]
|
||
|
mov r10,QWORD PTR[40+rsi]
|
||
|
lea r11,QWORD PTR[56+rsi]
|
||
|
lea r12,QWORD PTR[24+rsi]
|
||
|
mov QWORD PTR[32+rsp],r10
|
||
|
mov QWORD PTR[40+rsp],r11
|
||
|
mov QWORD PTR[48+rsp],r12
|
||
|
mov QWORD PTR[56+rsp],rcx
|
||
|
call QWORD PTR[__imp_RtlVirtualUnwind]
|
||
|
|
||
|
mov eax,1
|
||
|
add rsp,64
|
||
|
popfq
|
||
|
pop r15
|
||
|
pop r14
|
||
|
pop r13
|
||
|
pop r12
|
||
|
pop rbp
|
||
|
pop rbx
|
||
|
pop rdi
|
||
|
pop rsi
|
||
|
DB 0F3h,0C3h ;repret
|
||
|
se_handler ENDP
|
||
|
|
||
|
.text$ ENDS
|
||
|
.pdata SEGMENT READONLY ALIGN(4)
|
||
|
ALIGN 4
|
||
|
DD imagerel $L$cbc_dec_prologue
|
||
|
DD imagerel $L$cbc_dec_epilogue
|
||
|
DD imagerel $L$cbc_dec_info
|
||
|
|
||
|
DD imagerel $L$ctr_enc_prologue
|
||
|
DD imagerel $L$ctr_enc_epilogue
|
||
|
DD imagerel $L$ctr_enc_info
|
||
|
|
||
|
DD imagerel $L$xts_enc_prologue
|
||
|
DD imagerel $L$xts_enc_epilogue
|
||
|
DD imagerel $L$xts_enc_info
|
||
|
|
||
|
DD imagerel $L$xts_dec_prologue
|
||
|
DD imagerel $L$xts_dec_epilogue
|
||
|
DD imagerel $L$xts_dec_info
|
||
|
|
||
|
.pdata ENDS
|
||
|
.xdata SEGMENT READONLY ALIGN(8)
|
||
|
ALIGN 8
|
||
|
$L$cbc_dec_info::
|
||
|
DB 9,0,0,0
|
||
|
DD imagerel se_handler
|
||
|
DD imagerel $L$cbc_dec_body,imagerel $L$cbc_dec_epilogue
|
||
|
$L$ctr_enc_info::
|
||
|
DB 9,0,0,0
|
||
|
DD imagerel se_handler
|
||
|
DD imagerel $L$ctr_enc_body,imagerel $L$ctr_enc_epilogue
|
||
|
$L$xts_enc_info::
|
||
|
DB 9,0,0,0
|
||
|
DD imagerel se_handler
|
||
|
DD imagerel $L$xts_enc_body,imagerel $L$xts_enc_epilogue
|
||
|
$L$xts_dec_info::
|
||
|
DB 9,0,0,0
|
||
|
DD imagerel se_handler
|
||
|
DD imagerel $L$xts_dec_body,imagerel $L$xts_dec_epilogue
|
||
|
|
||
|
.xdata ENDS
|
||
|
END
|
||
|
|