mirror of
https://github.com/ClickHouse/ClickHouse.git
synced 2024-12-15 10:52:30 +00:00
427 lines
5.2 KiB
ArmAsm
427 lines
5.2 KiB
ArmAsm
|
# This file is generated from a similarly-named Perl script in the BoringSSL
|
||
|
# source tree. Do not edit by hand.
|
||
|
|
||
|
#if defined(__has_feature)
|
||
|
#if __has_feature(memory_sanitizer) && !defined(OPENSSL_NO_ASM)
|
||
|
#define OPENSSL_NO_ASM
|
||
|
#endif
|
||
|
#endif
|
||
|
|
||
|
#if defined(__x86_64__) && !defined(OPENSSL_NO_ASM)
|
||
|
#if defined(BORINGSSL_PREFIX)
|
||
|
#include <boringssl_prefix_symbols_asm.h>
|
||
|
#endif
|
||
|
.text
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
.globl _gcm_gmult_ssse3
|
||
|
.private_extern _gcm_gmult_ssse3
|
||
|
.p2align 4
|
||
|
_gcm_gmult_ssse3:
|
||
|
|
||
|
L$gmult_seh_begin:
|
||
|
movdqu (%rdi),%xmm0
|
||
|
movdqa L$reverse_bytes(%rip),%xmm10
|
||
|
movdqa L$low4_mask(%rip),%xmm2
|
||
|
|
||
|
|
||
|
.byte 102,65,15,56,0,194
|
||
|
|
||
|
|
||
|
movdqa %xmm2,%xmm1
|
||
|
pandn %xmm0,%xmm1
|
||
|
psrld $4,%xmm1
|
||
|
pand %xmm2,%xmm0
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
pxor %xmm2,%xmm2
|
||
|
pxor %xmm3,%xmm3
|
||
|
movq $5,%rax
|
||
|
L$oop_row_1:
|
||
|
movdqa (%rsi),%xmm4
|
||
|
leaq 16(%rsi),%rsi
|
||
|
|
||
|
|
||
|
movdqa %xmm2,%xmm6
|
||
|
.byte 102,15,58,15,243,1
|
||
|
movdqa %xmm6,%xmm3
|
||
|
psrldq $1,%xmm2
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
movdqa %xmm4,%xmm5
|
||
|
.byte 102,15,56,0,224
|
||
|
.byte 102,15,56,0,233
|
||
|
|
||
|
|
||
|
pxor %xmm5,%xmm2
|
||
|
|
||
|
|
||
|
|
||
|
movdqa %xmm4,%xmm5
|
||
|
psllq $60,%xmm5
|
||
|
movdqa %xmm5,%xmm6
|
||
|
pslldq $8,%xmm6
|
||
|
pxor %xmm6,%xmm3
|
||
|
|
||
|
|
||
|
psrldq $8,%xmm5
|
||
|
pxor %xmm5,%xmm2
|
||
|
psrlq $4,%xmm4
|
||
|
pxor %xmm4,%xmm2
|
||
|
|
||
|
subq $1,%rax
|
||
|
jnz L$oop_row_1
|
||
|
|
||
|
|
||
|
|
||
|
pxor %xmm3,%xmm2
|
||
|
psrlq $1,%xmm3
|
||
|
pxor %xmm3,%xmm2
|
||
|
psrlq $1,%xmm3
|
||
|
pxor %xmm3,%xmm2
|
||
|
psrlq $5,%xmm3
|
||
|
pxor %xmm3,%xmm2
|
||
|
pxor %xmm3,%xmm3
|
||
|
movq $5,%rax
|
||
|
L$oop_row_2:
|
||
|
movdqa (%rsi),%xmm4
|
||
|
leaq 16(%rsi),%rsi
|
||
|
|
||
|
|
||
|
movdqa %xmm2,%xmm6
|
||
|
.byte 102,15,58,15,243,1
|
||
|
movdqa %xmm6,%xmm3
|
||
|
psrldq $1,%xmm2
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
movdqa %xmm4,%xmm5
|
||
|
.byte 102,15,56,0,224
|
||
|
.byte 102,15,56,0,233
|
||
|
|
||
|
|
||
|
pxor %xmm5,%xmm2
|
||
|
|
||
|
|
||
|
|
||
|
movdqa %xmm4,%xmm5
|
||
|
psllq $60,%xmm5
|
||
|
movdqa %xmm5,%xmm6
|
||
|
pslldq $8,%xmm6
|
||
|
pxor %xmm6,%xmm3
|
||
|
|
||
|
|
||
|
psrldq $8,%xmm5
|
||
|
pxor %xmm5,%xmm2
|
||
|
psrlq $4,%xmm4
|
||
|
pxor %xmm4,%xmm2
|
||
|
|
||
|
subq $1,%rax
|
||
|
jnz L$oop_row_2
|
||
|
|
||
|
|
||
|
|
||
|
pxor %xmm3,%xmm2
|
||
|
psrlq $1,%xmm3
|
||
|
pxor %xmm3,%xmm2
|
||
|
psrlq $1,%xmm3
|
||
|
pxor %xmm3,%xmm2
|
||
|
psrlq $5,%xmm3
|
||
|
pxor %xmm3,%xmm2
|
||
|
pxor %xmm3,%xmm3
|
||
|
movq $6,%rax
|
||
|
L$oop_row_3:
|
||
|
movdqa (%rsi),%xmm4
|
||
|
leaq 16(%rsi),%rsi
|
||
|
|
||
|
|
||
|
movdqa %xmm2,%xmm6
|
||
|
.byte 102,15,58,15,243,1
|
||
|
movdqa %xmm6,%xmm3
|
||
|
psrldq $1,%xmm2
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
movdqa %xmm4,%xmm5
|
||
|
.byte 102,15,56,0,224
|
||
|
.byte 102,15,56,0,233
|
||
|
|
||
|
|
||
|
pxor %xmm5,%xmm2
|
||
|
|
||
|
|
||
|
|
||
|
movdqa %xmm4,%xmm5
|
||
|
psllq $60,%xmm5
|
||
|
movdqa %xmm5,%xmm6
|
||
|
pslldq $8,%xmm6
|
||
|
pxor %xmm6,%xmm3
|
||
|
|
||
|
|
||
|
psrldq $8,%xmm5
|
||
|
pxor %xmm5,%xmm2
|
||
|
psrlq $4,%xmm4
|
||
|
pxor %xmm4,%xmm2
|
||
|
|
||
|
subq $1,%rax
|
||
|
jnz L$oop_row_3
|
||
|
|
||
|
|
||
|
|
||
|
pxor %xmm3,%xmm2
|
||
|
psrlq $1,%xmm3
|
||
|
pxor %xmm3,%xmm2
|
||
|
psrlq $1,%xmm3
|
||
|
pxor %xmm3,%xmm2
|
||
|
psrlq $5,%xmm3
|
||
|
pxor %xmm3,%xmm2
|
||
|
pxor %xmm3,%xmm3
|
||
|
|
||
|
.byte 102,65,15,56,0,210
|
||
|
movdqu %xmm2,(%rdi)
|
||
|
|
||
|
|
||
|
pxor %xmm0,%xmm0
|
||
|
pxor %xmm1,%xmm1
|
||
|
pxor %xmm2,%xmm2
|
||
|
pxor %xmm3,%xmm3
|
||
|
pxor %xmm4,%xmm4
|
||
|
pxor %xmm5,%xmm5
|
||
|
pxor %xmm6,%xmm6
|
||
|
.byte 0xf3,0xc3
|
||
|
L$gmult_seh_end:
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
.globl _gcm_ghash_ssse3
|
||
|
.private_extern _gcm_ghash_ssse3
|
||
|
.p2align 4
|
||
|
_gcm_ghash_ssse3:
|
||
|
L$ghash_seh_begin:
|
||
|
|
||
|
movdqu (%rdi),%xmm0
|
||
|
movdqa L$reverse_bytes(%rip),%xmm10
|
||
|
movdqa L$low4_mask(%rip),%xmm11
|
||
|
|
||
|
|
||
|
andq $-16,%rcx
|
||
|
|
||
|
|
||
|
|
||
|
.byte 102,65,15,56,0,194
|
||
|
|
||
|
|
||
|
pxor %xmm3,%xmm3
|
||
|
L$oop_ghash:
|
||
|
|
||
|
movdqu (%rdx),%xmm1
|
||
|
.byte 102,65,15,56,0,202
|
||
|
pxor %xmm1,%xmm0
|
||
|
|
||
|
|
||
|
movdqa %xmm11,%xmm1
|
||
|
pandn %xmm0,%xmm1
|
||
|
psrld $4,%xmm1
|
||
|
pand %xmm11,%xmm0
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
pxor %xmm2,%xmm2
|
||
|
|
||
|
movq $5,%rax
|
||
|
L$oop_row_4:
|
||
|
movdqa (%rsi),%xmm4
|
||
|
leaq 16(%rsi),%rsi
|
||
|
|
||
|
|
||
|
movdqa %xmm2,%xmm6
|
||
|
.byte 102,15,58,15,243,1
|
||
|
movdqa %xmm6,%xmm3
|
||
|
psrldq $1,%xmm2
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
movdqa %xmm4,%xmm5
|
||
|
.byte 102,15,56,0,224
|
||
|
.byte 102,15,56,0,233
|
||
|
|
||
|
|
||
|
pxor %xmm5,%xmm2
|
||
|
|
||
|
|
||
|
|
||
|
movdqa %xmm4,%xmm5
|
||
|
psllq $60,%xmm5
|
||
|
movdqa %xmm5,%xmm6
|
||
|
pslldq $8,%xmm6
|
||
|
pxor %xmm6,%xmm3
|
||
|
|
||
|
|
||
|
psrldq $8,%xmm5
|
||
|
pxor %xmm5,%xmm2
|
||
|
psrlq $4,%xmm4
|
||
|
pxor %xmm4,%xmm2
|
||
|
|
||
|
subq $1,%rax
|
||
|
jnz L$oop_row_4
|
||
|
|
||
|
|
||
|
|
||
|
pxor %xmm3,%xmm2
|
||
|
psrlq $1,%xmm3
|
||
|
pxor %xmm3,%xmm2
|
||
|
psrlq $1,%xmm3
|
||
|
pxor %xmm3,%xmm2
|
||
|
psrlq $5,%xmm3
|
||
|
pxor %xmm3,%xmm2
|
||
|
pxor %xmm3,%xmm3
|
||
|
movq $5,%rax
|
||
|
L$oop_row_5:
|
||
|
movdqa (%rsi),%xmm4
|
||
|
leaq 16(%rsi),%rsi
|
||
|
|
||
|
|
||
|
movdqa %xmm2,%xmm6
|
||
|
.byte 102,15,58,15,243,1
|
||
|
movdqa %xmm6,%xmm3
|
||
|
psrldq $1,%xmm2
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
movdqa %xmm4,%xmm5
|
||
|
.byte 102,15,56,0,224
|
||
|
.byte 102,15,56,0,233
|
||
|
|
||
|
|
||
|
pxor %xmm5,%xmm2
|
||
|
|
||
|
|
||
|
|
||
|
movdqa %xmm4,%xmm5
|
||
|
psllq $60,%xmm5
|
||
|
movdqa %xmm5,%xmm6
|
||
|
pslldq $8,%xmm6
|
||
|
pxor %xmm6,%xmm3
|
||
|
|
||
|
|
||
|
psrldq $8,%xmm5
|
||
|
pxor %xmm5,%xmm2
|
||
|
psrlq $4,%xmm4
|
||
|
pxor %xmm4,%xmm2
|
||
|
|
||
|
subq $1,%rax
|
||
|
jnz L$oop_row_5
|
||
|
|
||
|
|
||
|
|
||
|
pxor %xmm3,%xmm2
|
||
|
psrlq $1,%xmm3
|
||
|
pxor %xmm3,%xmm2
|
||
|
psrlq $1,%xmm3
|
||
|
pxor %xmm3,%xmm2
|
||
|
psrlq $5,%xmm3
|
||
|
pxor %xmm3,%xmm2
|
||
|
pxor %xmm3,%xmm3
|
||
|
movq $6,%rax
|
||
|
L$oop_row_6:
|
||
|
movdqa (%rsi),%xmm4
|
||
|
leaq 16(%rsi),%rsi
|
||
|
|
||
|
|
||
|
movdqa %xmm2,%xmm6
|
||
|
.byte 102,15,58,15,243,1
|
||
|
movdqa %xmm6,%xmm3
|
||
|
psrldq $1,%xmm2
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
movdqa %xmm4,%xmm5
|
||
|
.byte 102,15,56,0,224
|
||
|
.byte 102,15,56,0,233
|
||
|
|
||
|
|
||
|
pxor %xmm5,%xmm2
|
||
|
|
||
|
|
||
|
|
||
|
movdqa %xmm4,%xmm5
|
||
|
psllq $60,%xmm5
|
||
|
movdqa %xmm5,%xmm6
|
||
|
pslldq $8,%xmm6
|
||
|
pxor %xmm6,%xmm3
|
||
|
|
||
|
|
||
|
psrldq $8,%xmm5
|
||
|
pxor %xmm5,%xmm2
|
||
|
psrlq $4,%xmm4
|
||
|
pxor %xmm4,%xmm2
|
||
|
|
||
|
subq $1,%rax
|
||
|
jnz L$oop_row_6
|
||
|
|
||
|
|
||
|
|
||
|
pxor %xmm3,%xmm2
|
||
|
psrlq $1,%xmm3
|
||
|
pxor %xmm3,%xmm2
|
||
|
psrlq $1,%xmm3
|
||
|
pxor %xmm3,%xmm2
|
||
|
psrlq $5,%xmm3
|
||
|
pxor %xmm3,%xmm2
|
||
|
pxor %xmm3,%xmm3
|
||
|
movdqa %xmm2,%xmm0
|
||
|
|
||
|
|
||
|
leaq -256(%rsi),%rsi
|
||
|
|
||
|
|
||
|
leaq 16(%rdx),%rdx
|
||
|
subq $16,%rcx
|
||
|
jnz L$oop_ghash
|
||
|
|
||
|
|
||
|
.byte 102,65,15,56,0,194
|
||
|
movdqu %xmm0,(%rdi)
|
||
|
|
||
|
|
||
|
pxor %xmm0,%xmm0
|
||
|
pxor %xmm1,%xmm1
|
||
|
pxor %xmm2,%xmm2
|
||
|
pxor %xmm3,%xmm3
|
||
|
pxor %xmm4,%xmm4
|
||
|
pxor %xmm5,%xmm5
|
||
|
pxor %xmm6,%xmm6
|
||
|
.byte 0xf3,0xc3
|
||
|
L$ghash_seh_end:
|
||
|
|
||
|
|
||
|
|
||
|
.p2align 4
|
||
|
|
||
|
|
||
|
L$reverse_bytes:
|
||
|
.byte 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0
|
||
|
|
||
|
L$low4_mask:
|
||
|
.quad 0x0f0f0f0f0f0f0f0f, 0x0f0f0f0f0f0f0f0f
|
||
|
#endif
|