mirror of
https://git.proxmox.com/git/mirror_zfs.git
synced 2026-05-22 02:27:36 +03:00
Restore ASMABI and other Unify work
Make sure all SHA2 transform functions have wrappers. For ASMABI to work, the calling convention must be consistent. Reviewed-by: Tino Reichardt <milky-zfs@mcmilk.de> Reviewed-by: Richard Yao <richard.yao@alumni.stonybrook.edu> Signed-off-by: Joergen Lundman <lundman@lundman.net> Closes #14569
This commit is contained in:
@@ -26,8 +26,8 @@
|
||||
|
||||
SECTION_STATIC
|
||||
|
||||
.align 64
|
||||
.type K256,@object
|
||||
.balign 64
|
||||
SET_OBJ(K256)
|
||||
K256:
|
||||
.long 0x428a2f98,0x71374491,0xb5c0fbcf,0xe9b5dba5
|
||||
.long 0x428a2f98,0x71374491,0xb5c0fbcf,0xe9b5dba5
|
||||
@@ -105,7 +105,7 @@ ENTRY_ALIGN(zfs_sha256_transform_x64, 16)
|
||||
movl 24(%rdi),%r10d
|
||||
movl 28(%rdi),%r11d
|
||||
jmp .Lloop
|
||||
.align 16
|
||||
.balign 16
|
||||
.Lloop:
|
||||
movl %ebx,%edi
|
||||
leaq K256(%rip),%rbp
|
||||
@@ -622,7 +622,7 @@ ENTRY_ALIGN(zfs_sha256_transform_x64, 16)
|
||||
addl %r12d,%eax
|
||||
leaq 20(%rbp),%rbp
|
||||
jmp .Lrounds_16_xx
|
||||
.align 16
|
||||
.balign 16
|
||||
.Lrounds_16_xx:
|
||||
movl 4(%rsp),%r13d
|
||||
movl 56(%rsp),%r15d
|
||||
@@ -1436,7 +1436,7 @@ ENTRY_ALIGN(zfs_sha256_transform_shani, 64)
|
||||
punpcklqdq %xmm0,%xmm2
|
||||
jmp .Loop_shani
|
||||
|
||||
.align 16
|
||||
.balign 16
|
||||
.Loop_shani:
|
||||
movdqu (%rsi),%xmm3
|
||||
movdqu 16(%rsi),%xmm4
|
||||
@@ -1666,7 +1666,7 @@ ENTRY_ALIGN(zfs_sha256_transform_ssse3, 64)
|
||||
movl 28(%rdi),%r11d
|
||||
|
||||
jmp .Lloop_ssse3
|
||||
.align 16
|
||||
.balign 16
|
||||
.Lloop_ssse3:
|
||||
movdqa K256+512(%rip),%xmm7
|
||||
movdqu 0(%rsi),%xmm0
|
||||
@@ -1696,7 +1696,7 @@ ENTRY_ALIGN(zfs_sha256_transform_ssse3, 64)
|
||||
movl %r8d,%r13d
|
||||
jmp .Lssse3_00_47
|
||||
|
||||
.align 16
|
||||
.balign 16
|
||||
.Lssse3_00_47:
|
||||
subq $-128,%rbp
|
||||
rorl $14,%r13d
|
||||
@@ -2779,7 +2779,7 @@ ENTRY_ALIGN(zfs_sha256_transform_avx, 64)
|
||||
vmovdqa K256+512+32(%rip),%xmm8
|
||||
vmovdqa K256+512+64(%rip),%xmm9
|
||||
jmp .Lloop_avx
|
||||
.align 16
|
||||
.balign 16
|
||||
.Lloop_avx:
|
||||
vmovdqa K256+512(%rip),%xmm7
|
||||
vmovdqu 0(%rsi),%xmm0
|
||||
@@ -2805,7 +2805,7 @@ ENTRY_ALIGN(zfs_sha256_transform_avx, 64)
|
||||
movl %r8d,%r13d
|
||||
jmp .Lavx_00_47
|
||||
|
||||
.align 16
|
||||
.balign 16
|
||||
.Lavx_00_47:
|
||||
subq $-128,%rbp
|
||||
vpalignr $4,%xmm0,%xmm1,%xmm4
|
||||
@@ -3858,7 +3858,7 @@ ENTRY_ALIGN(zfs_sha256_transform_avx2, 64)
|
||||
vmovdqa K256+512+32(%rip),%ymm8
|
||||
vmovdqa K256+512+64(%rip),%ymm9
|
||||
jmp .Loop_avx2
|
||||
.align 16
|
||||
.balign 16
|
||||
.Loop_avx2:
|
||||
vmovdqa K256+512(%rip),%ymm7
|
||||
vmovdqu -64+0(%rsi),%xmm0
|
||||
@@ -3900,7 +3900,7 @@ ENTRY_ALIGN(zfs_sha256_transform_avx2, 64)
|
||||
subq $-32*4,%rbp
|
||||
jmp .Lavx2_00_47
|
||||
|
||||
.align 16
|
||||
.balign 16
|
||||
.Lavx2_00_47:
|
||||
leaq -64(%rsp),%rsp
|
||||
.cfi_escape 0x0f,0x05,0x77,0x38,0x06,0x23,0x08
|
||||
@@ -4842,7 +4842,7 @@ ENTRY_ALIGN(zfs_sha256_transform_avx2, 64)
|
||||
xorl %ecx,%edi
|
||||
movl %r9d,%r12d
|
||||
jmp .Lower_avx2
|
||||
.align 16
|
||||
.balign 16
|
||||
.Lower_avx2:
|
||||
addl 0+16(%rbp),%r11d
|
||||
andl %r8d,%r12d
|
||||
|
||||
@@ -26,8 +26,8 @@
|
||||
|
||||
SECTION_STATIC
|
||||
|
||||
.align 64
|
||||
.type K512,@object
|
||||
.balign 64
|
||||
SET_OBJ(K512)
|
||||
K512:
|
||||
.quad 0x428a2f98d728ae22,0x7137449123ef65cd
|
||||
.quad 0x428a2f98d728ae22,0x7137449123ef65cd
|
||||
@@ -148,7 +148,7 @@ ENTRY_ALIGN(zfs_sha512_transform_x64, 16)
|
||||
movq 48(%rdi),%r10
|
||||
movq 56(%rdi),%r11
|
||||
jmp .Lloop
|
||||
.align 16
|
||||
.balign 16
|
||||
.Lloop:
|
||||
movq %rbx,%rdi
|
||||
leaq K512(%rip),%rbp
|
||||
@@ -665,7 +665,7 @@ ENTRY_ALIGN(zfs_sha512_transform_x64, 16)
|
||||
addq %r12,%rax
|
||||
leaq 24(%rbp),%rbp
|
||||
jmp .Lrounds_16_xx
|
||||
.align 16
|
||||
.balign 16
|
||||
.Lrounds_16_xx:
|
||||
movq 8(%rsp),%r13
|
||||
movq 112(%rsp),%r15
|
||||
@@ -1501,7 +1501,7 @@ ENTRY_ALIGN(zfs_sha512_transform_avx, 64)
|
||||
movq 48(%rdi),%r10
|
||||
movq 56(%rdi),%r11
|
||||
jmp .Lloop_avx
|
||||
.align 16
|
||||
.balign 16
|
||||
.Lloop_avx:
|
||||
vmovdqa K512+1280(%rip),%xmm11
|
||||
vmovdqu 0(%rsi),%xmm0
|
||||
@@ -1543,7 +1543,7 @@ ENTRY_ALIGN(zfs_sha512_transform_avx, 64)
|
||||
movq %r8,%r13
|
||||
jmp .Lavx_00_47
|
||||
|
||||
.align 16
|
||||
.balign 16
|
||||
.Lavx_00_47:
|
||||
addq $256,%rbp
|
||||
vpalignr $8,%xmm0,%xmm1,%xmm8
|
||||
@@ -2670,7 +2670,7 @@ ENTRY_ALIGN(zfs_sha512_transform_avx2, 64)
|
||||
movq 48(%rdi),%r10
|
||||
movq 56(%rdi),%r11
|
||||
jmp .Loop_avx2
|
||||
.align 16
|
||||
.balign 16
|
||||
.Loop_avx2:
|
||||
vmovdqu -128(%rsi),%xmm0
|
||||
vmovdqu -128+16(%rsi),%xmm1
|
||||
@@ -2732,7 +2732,7 @@ ENTRY_ALIGN(zfs_sha512_transform_avx2, 64)
|
||||
addq $32*8,%rbp
|
||||
jmp .Lavx2_00_47
|
||||
|
||||
.align 16
|
||||
.balign 16
|
||||
.Lavx2_00_47:
|
||||
leaq -128(%rsp),%rsp
|
||||
.cfi_escape 0x0f,0x06,0x77,0xf8,0x00,0x06,0x23,0x08
|
||||
@@ -3750,7 +3750,7 @@ ENTRY_ALIGN(zfs_sha512_transform_avx2, 64)
|
||||
xorq %rcx,%rdi
|
||||
movq %r9,%r12
|
||||
jmp .Lower_avx2
|
||||
.align 16
|
||||
.balign 16
|
||||
.Lower_avx2:
|
||||
addq 0+16(%rbp),%r11
|
||||
andq %r8,%r12
|
||||
|
||||
Reference in New Issue
Block a user