mirror of
https://github.com/AuxXxilium/linux_dsm_epyc7002.git
synced 2024-11-26 00:40:55 +07:00
ce6889515d
Things works better when you increment the source buffer pointer properly. Signed-off-by: David S. Miller <davem@davemloft.net>
420 lines
9.4 KiB
ArmAsm
420 lines
9.4 KiB
ArmAsm
#include <linux/linkage.h>
|
|
#include <asm/visasm.h>
|
|
|
|
#include "opcodes.h"
|
|
|
|
.align 32
|
|
ENTRY(des_sparc64_key_expand)
|
|
/* %o0=input_key, %o1=output_key */
|
|
VISEntryHalf
|
|
ld [%o0 + 0x00], %f0
|
|
ld [%o0 + 0x04], %f1
|
|
DES_KEXPAND(0, 0, 0)
|
|
DES_KEXPAND(0, 1, 2)
|
|
DES_KEXPAND(2, 3, 6)
|
|
DES_KEXPAND(2, 2, 4)
|
|
DES_KEXPAND(6, 3, 10)
|
|
DES_KEXPAND(6, 2, 8)
|
|
DES_KEXPAND(10, 3, 14)
|
|
DES_KEXPAND(10, 2, 12)
|
|
DES_KEXPAND(14, 1, 16)
|
|
DES_KEXPAND(16, 3, 20)
|
|
DES_KEXPAND(16, 2, 18)
|
|
DES_KEXPAND(20, 3, 24)
|
|
DES_KEXPAND(20, 2, 22)
|
|
DES_KEXPAND(24, 3, 28)
|
|
DES_KEXPAND(24, 2, 26)
|
|
DES_KEXPAND(28, 1, 30)
|
|
std %f0, [%o1 + 0x00]
|
|
std %f2, [%o1 + 0x08]
|
|
std %f4, [%o1 + 0x10]
|
|
std %f6, [%o1 + 0x18]
|
|
std %f8, [%o1 + 0x20]
|
|
std %f10, [%o1 + 0x28]
|
|
std %f12, [%o1 + 0x30]
|
|
std %f14, [%o1 + 0x38]
|
|
std %f16, [%o1 + 0x40]
|
|
std %f18, [%o1 + 0x48]
|
|
std %f20, [%o1 + 0x50]
|
|
std %f22, [%o1 + 0x58]
|
|
std %f24, [%o1 + 0x60]
|
|
std %f26, [%o1 + 0x68]
|
|
std %f28, [%o1 + 0x70]
|
|
std %f30, [%o1 + 0x78]
|
|
retl
|
|
VISExitHalf
|
|
ENDPROC(des_sparc64_key_expand)
|
|
|
|
.align 32
|
|
ENTRY(des_sparc64_crypt)
|
|
/* %o0=key, %o1=input, %o2=output */
|
|
VISEntry
|
|
ldd [%o1 + 0x00], %f32
|
|
ldd [%o0 + 0x00], %f0
|
|
ldd [%o0 + 0x08], %f2
|
|
ldd [%o0 + 0x10], %f4
|
|
ldd [%o0 + 0x18], %f6
|
|
ldd [%o0 + 0x20], %f8
|
|
ldd [%o0 + 0x28], %f10
|
|
ldd [%o0 + 0x30], %f12
|
|
ldd [%o0 + 0x38], %f14
|
|
ldd [%o0 + 0x40], %f16
|
|
ldd [%o0 + 0x48], %f18
|
|
ldd [%o0 + 0x50], %f20
|
|
ldd [%o0 + 0x58], %f22
|
|
ldd [%o0 + 0x60], %f24
|
|
ldd [%o0 + 0x68], %f26
|
|
ldd [%o0 + 0x70], %f28
|
|
ldd [%o0 + 0x78], %f30
|
|
DES_IP(32, 32)
|
|
DES_ROUND(0, 2, 32, 32)
|
|
DES_ROUND(4, 6, 32, 32)
|
|
DES_ROUND(8, 10, 32, 32)
|
|
DES_ROUND(12, 14, 32, 32)
|
|
DES_ROUND(16, 18, 32, 32)
|
|
DES_ROUND(20, 22, 32, 32)
|
|
DES_ROUND(24, 26, 32, 32)
|
|
DES_ROUND(28, 30, 32, 32)
|
|
DES_IIP(32, 32)
|
|
std %f32, [%o2 + 0x00]
|
|
retl
|
|
VISExit
|
|
ENDPROC(des_sparc64_crypt)
|
|
|
|
.align 32
|
|
ENTRY(des_sparc64_load_keys)
|
|
/* %o0=key */
|
|
VISEntry
|
|
ldd [%o0 + 0x00], %f0
|
|
ldd [%o0 + 0x08], %f2
|
|
ldd [%o0 + 0x10], %f4
|
|
ldd [%o0 + 0x18], %f6
|
|
ldd [%o0 + 0x20], %f8
|
|
ldd [%o0 + 0x28], %f10
|
|
ldd [%o0 + 0x30], %f12
|
|
ldd [%o0 + 0x38], %f14
|
|
ldd [%o0 + 0x40], %f16
|
|
ldd [%o0 + 0x48], %f18
|
|
ldd [%o0 + 0x50], %f20
|
|
ldd [%o0 + 0x58], %f22
|
|
ldd [%o0 + 0x60], %f24
|
|
ldd [%o0 + 0x68], %f26
|
|
ldd [%o0 + 0x70], %f28
|
|
retl
|
|
ldd [%o0 + 0x78], %f30
|
|
ENDPROC(des_sparc64_load_keys)
|
|
|
|
.align 32
|
|
ENTRY(des_sparc64_ecb_crypt)
|
|
/* %o0=input, %o1=output, %o2=len */
|
|
1: ldd [%o0 + 0x00], %f32
|
|
add %o0, 0x08, %o0
|
|
DES_IP(32, 32)
|
|
DES_ROUND(0, 2, 32, 32)
|
|
DES_ROUND(4, 6, 32, 32)
|
|
DES_ROUND(8, 10, 32, 32)
|
|
DES_ROUND(12, 14, 32, 32)
|
|
DES_ROUND(16, 18, 32, 32)
|
|
DES_ROUND(20, 22, 32, 32)
|
|
DES_ROUND(24, 26, 32, 32)
|
|
DES_ROUND(28, 30, 32, 32)
|
|
DES_IIP(32, 32)
|
|
std %f32, [%o1 + 0x00]
|
|
subcc %o2, 0x08, %o2
|
|
bne,pt %icc, 1b
|
|
add %o1, 0x08, %o1
|
|
retl
|
|
nop
|
|
ENDPROC(des_sparc64_ecb_crypt)
|
|
|
|
.align 32
|
|
ENTRY(des_sparc64_cbc_encrypt)
|
|
/* %o0=input, %o1=output, %o2=len, %o3=IV */
|
|
ldd [%o3 + 0x00], %f32
|
|
1: ldd [%o0 + 0x00], %f34
|
|
fxor %f32, %f34, %f32
|
|
DES_IP(32, 32)
|
|
DES_ROUND(0, 2, 32, 32)
|
|
DES_ROUND(4, 6, 32, 32)
|
|
DES_ROUND(8, 10, 32, 32)
|
|
DES_ROUND(12, 14, 32, 32)
|
|
DES_ROUND(16, 18, 32, 32)
|
|
DES_ROUND(20, 22, 32, 32)
|
|
DES_ROUND(24, 26, 32, 32)
|
|
DES_ROUND(28, 30, 32, 32)
|
|
DES_IIP(32, 32)
|
|
std %f32, [%o1 + 0x00]
|
|
add %o0, 0x08, %o0
|
|
subcc %o2, 0x08, %o2
|
|
bne,pt %icc, 1b
|
|
add %o1, 0x08, %o1
|
|
retl
|
|
std %f32, [%o3 + 0x00]
|
|
ENDPROC(des_sparc64_cbc_encrypt)
|
|
|
|
.align 32
|
|
ENTRY(des_sparc64_cbc_decrypt)
|
|
/* %o0=input, %o1=output, %o2=len, %o3=IV */
|
|
ldd [%o3 + 0x00], %f34
|
|
1: ldd [%o0 + 0x00], %f36
|
|
DES_IP(36, 32)
|
|
DES_ROUND(0, 2, 32, 32)
|
|
DES_ROUND(4, 6, 32, 32)
|
|
DES_ROUND(8, 10, 32, 32)
|
|
DES_ROUND(12, 14, 32, 32)
|
|
DES_ROUND(16, 18, 32, 32)
|
|
DES_ROUND(20, 22, 32, 32)
|
|
DES_ROUND(24, 26, 32, 32)
|
|
DES_ROUND(28, 30, 32, 32)
|
|
DES_IIP(32, 32)
|
|
fxor %f32, %f34, %f32
|
|
fsrc2 %f36, %f34
|
|
std %f32, [%o1 + 0x00]
|
|
add %o0, 0x08, %o0
|
|
subcc %o2, 0x08, %o2
|
|
bne,pt %icc, 1b
|
|
add %o1, 0x08, %o1
|
|
retl
|
|
std %f36, [%o3 + 0x00]
|
|
ENDPROC(des_sparc64_cbc_decrypt)
|
|
|
|
.align 32
|
|
ENTRY(des3_ede_sparc64_crypt)
|
|
/* %o0=key, %o1=input, %o2=output */
|
|
VISEntry
|
|
ldd [%o1 + 0x00], %f32
|
|
ldd [%o0 + 0x00], %f0
|
|
ldd [%o0 + 0x08], %f2
|
|
ldd [%o0 + 0x10], %f4
|
|
ldd [%o0 + 0x18], %f6
|
|
ldd [%o0 + 0x20], %f8
|
|
ldd [%o0 + 0x28], %f10
|
|
ldd [%o0 + 0x30], %f12
|
|
ldd [%o0 + 0x38], %f14
|
|
ldd [%o0 + 0x40], %f16
|
|
ldd [%o0 + 0x48], %f18
|
|
ldd [%o0 + 0x50], %f20
|
|
ldd [%o0 + 0x58], %f22
|
|
ldd [%o0 + 0x60], %f24
|
|
ldd [%o0 + 0x68], %f26
|
|
ldd [%o0 + 0x70], %f28
|
|
ldd [%o0 + 0x78], %f30
|
|
DES_IP(32, 32)
|
|
DES_ROUND(0, 2, 32, 32)
|
|
ldd [%o0 + 0x80], %f0
|
|
ldd [%o0 + 0x88], %f2
|
|
DES_ROUND(4, 6, 32, 32)
|
|
ldd [%o0 + 0x90], %f4
|
|
ldd [%o0 + 0x98], %f6
|
|
DES_ROUND(8, 10, 32, 32)
|
|
ldd [%o0 + 0xa0], %f8
|
|
ldd [%o0 + 0xa8], %f10
|
|
DES_ROUND(12, 14, 32, 32)
|
|
ldd [%o0 + 0xb0], %f12
|
|
ldd [%o0 + 0xb8], %f14
|
|
DES_ROUND(16, 18, 32, 32)
|
|
ldd [%o0 + 0xc0], %f16
|
|
ldd [%o0 + 0xc8], %f18
|
|
DES_ROUND(20, 22, 32, 32)
|
|
ldd [%o0 + 0xd0], %f20
|
|
ldd [%o0 + 0xd8], %f22
|
|
DES_ROUND(24, 26, 32, 32)
|
|
ldd [%o0 + 0xe0], %f24
|
|
ldd [%o0 + 0xe8], %f26
|
|
DES_ROUND(28, 30, 32, 32)
|
|
ldd [%o0 + 0xf0], %f28
|
|
ldd [%o0 + 0xf8], %f30
|
|
DES_IIP(32, 32)
|
|
DES_IP(32, 32)
|
|
DES_ROUND(0, 2, 32, 32)
|
|
ldd [%o0 + 0x100], %f0
|
|
ldd [%o0 + 0x108], %f2
|
|
DES_ROUND(4, 6, 32, 32)
|
|
ldd [%o0 + 0x110], %f4
|
|
ldd [%o0 + 0x118], %f6
|
|
DES_ROUND(8, 10, 32, 32)
|
|
ldd [%o0 + 0x120], %f8
|
|
ldd [%o0 + 0x128], %f10
|
|
DES_ROUND(12, 14, 32, 32)
|
|
ldd [%o0 + 0x130], %f12
|
|
ldd [%o0 + 0x138], %f14
|
|
DES_ROUND(16, 18, 32, 32)
|
|
ldd [%o0 + 0x140], %f16
|
|
ldd [%o0 + 0x148], %f18
|
|
DES_ROUND(20, 22, 32, 32)
|
|
ldd [%o0 + 0x150], %f20
|
|
ldd [%o0 + 0x158], %f22
|
|
DES_ROUND(24, 26, 32, 32)
|
|
ldd [%o0 + 0x160], %f24
|
|
ldd [%o0 + 0x168], %f26
|
|
DES_ROUND(28, 30, 32, 32)
|
|
ldd [%o0 + 0x170], %f28
|
|
ldd [%o0 + 0x178], %f30
|
|
DES_IIP(32, 32)
|
|
DES_IP(32, 32)
|
|
DES_ROUND(0, 2, 32, 32)
|
|
DES_ROUND(4, 6, 32, 32)
|
|
DES_ROUND(8, 10, 32, 32)
|
|
DES_ROUND(12, 14, 32, 32)
|
|
DES_ROUND(16, 18, 32, 32)
|
|
DES_ROUND(20, 22, 32, 32)
|
|
DES_ROUND(24, 26, 32, 32)
|
|
DES_ROUND(28, 30, 32, 32)
|
|
DES_IIP(32, 32)
|
|
|
|
std %f32, [%o2 + 0x00]
|
|
retl
|
|
VISExit
|
|
ENDPROC(des3_ede_sparc64_crypt)
|
|
|
|
.align 32
|
|
ENTRY(des3_ede_sparc64_load_keys)
|
|
/* %o0=key */
|
|
VISEntry
|
|
ldd [%o0 + 0x00], %f0
|
|
ldd [%o0 + 0x08], %f2
|
|
ldd [%o0 + 0x10], %f4
|
|
ldd [%o0 + 0x18], %f6
|
|
ldd [%o0 + 0x20], %f8
|
|
ldd [%o0 + 0x28], %f10
|
|
ldd [%o0 + 0x30], %f12
|
|
ldd [%o0 + 0x38], %f14
|
|
ldd [%o0 + 0x40], %f16
|
|
ldd [%o0 + 0x48], %f18
|
|
ldd [%o0 + 0x50], %f20
|
|
ldd [%o0 + 0x58], %f22
|
|
ldd [%o0 + 0x60], %f24
|
|
ldd [%o0 + 0x68], %f26
|
|
ldd [%o0 + 0x70], %f28
|
|
ldd [%o0 + 0x78], %f30
|
|
ldd [%o0 + 0x80], %f32
|
|
ldd [%o0 + 0x88], %f34
|
|
ldd [%o0 + 0x90], %f36
|
|
ldd [%o0 + 0x98], %f38
|
|
ldd [%o0 + 0xa0], %f40
|
|
ldd [%o0 + 0xa8], %f42
|
|
ldd [%o0 + 0xb0], %f44
|
|
ldd [%o0 + 0xb8], %f46
|
|
ldd [%o0 + 0xc0], %f48
|
|
ldd [%o0 + 0xc8], %f50
|
|
ldd [%o0 + 0xd0], %f52
|
|
ldd [%o0 + 0xd8], %f54
|
|
ldd [%o0 + 0xe0], %f56
|
|
retl
|
|
ldd [%o0 + 0xe8], %f58
|
|
ENDPROC(des3_ede_sparc64_load_keys)
|
|
|
|
#define DES3_LOOP_BODY(X) \
|
|
DES_IP(X, X) \
|
|
DES_ROUND(0, 2, X, X) \
|
|
DES_ROUND(4, 6, X, X) \
|
|
DES_ROUND(8, 10, X, X) \
|
|
DES_ROUND(12, 14, X, X) \
|
|
DES_ROUND(16, 18, X, X) \
|
|
ldd [%o0 + 0xf0], %f16; \
|
|
ldd [%o0 + 0xf8], %f18; \
|
|
DES_ROUND(20, 22, X, X) \
|
|
ldd [%o0 + 0x100], %f20; \
|
|
ldd [%o0 + 0x108], %f22; \
|
|
DES_ROUND(24, 26, X, X) \
|
|
ldd [%o0 + 0x110], %f24; \
|
|
ldd [%o0 + 0x118], %f26; \
|
|
DES_ROUND(28, 30, X, X) \
|
|
ldd [%o0 + 0x120], %f28; \
|
|
ldd [%o0 + 0x128], %f30; \
|
|
DES_IIP(X, X) \
|
|
DES_IP(X, X) \
|
|
DES_ROUND(32, 34, X, X) \
|
|
ldd [%o0 + 0x130], %f0; \
|
|
ldd [%o0 + 0x138], %f2; \
|
|
DES_ROUND(36, 38, X, X) \
|
|
ldd [%o0 + 0x140], %f4; \
|
|
ldd [%o0 + 0x148], %f6; \
|
|
DES_ROUND(40, 42, X, X) \
|
|
ldd [%o0 + 0x150], %f8; \
|
|
ldd [%o0 + 0x158], %f10; \
|
|
DES_ROUND(44, 46, X, X) \
|
|
ldd [%o0 + 0x160], %f12; \
|
|
ldd [%o0 + 0x168], %f14; \
|
|
DES_ROUND(48, 50, X, X) \
|
|
DES_ROUND(52, 54, X, X) \
|
|
DES_ROUND(56, 58, X, X) \
|
|
DES_ROUND(16, 18, X, X) \
|
|
ldd [%o0 + 0x170], %f16; \
|
|
ldd [%o0 + 0x178], %f18; \
|
|
DES_IIP(X, X) \
|
|
DES_IP(X, X) \
|
|
DES_ROUND(20, 22, X, X) \
|
|
ldd [%o0 + 0x50], %f20; \
|
|
ldd [%o0 + 0x58], %f22; \
|
|
DES_ROUND(24, 26, X, X) \
|
|
ldd [%o0 + 0x60], %f24; \
|
|
ldd [%o0 + 0x68], %f26; \
|
|
DES_ROUND(28, 30, X, X) \
|
|
ldd [%o0 + 0x70], %f28; \
|
|
ldd [%o0 + 0x78], %f30; \
|
|
DES_ROUND(0, 2, X, X) \
|
|
ldd [%o0 + 0x00], %f0; \
|
|
ldd [%o0 + 0x08], %f2; \
|
|
DES_ROUND(4, 6, X, X) \
|
|
ldd [%o0 + 0x10], %f4; \
|
|
ldd [%o0 + 0x18], %f6; \
|
|
DES_ROUND(8, 10, X, X) \
|
|
ldd [%o0 + 0x20], %f8; \
|
|
ldd [%o0 + 0x28], %f10; \
|
|
DES_ROUND(12, 14, X, X) \
|
|
ldd [%o0 + 0x30], %f12; \
|
|
ldd [%o0 + 0x38], %f14; \
|
|
DES_ROUND(16, 18, X, X) \
|
|
ldd [%o0 + 0x40], %f16; \
|
|
ldd [%o0 + 0x48], %f18; \
|
|
DES_IIP(X, X)
|
|
|
|
.align 32
|
|
ENTRY(des3_ede_sparc64_ecb_crypt)
|
|
/* %o0=key, %o1=input, %o2=output, %o3=len */
|
|
1: ldd [%o1 + 0x00], %f60
|
|
DES3_LOOP_BODY(60)
|
|
std %f60, [%o2 + 0x00]
|
|
add %o1, 0x08, %o1
|
|
subcc %o3, 0x08, %o3
|
|
bne,pt %icc, 1b
|
|
add %o2, 0x08, %o2
|
|
retl
|
|
nop
|
|
ENDPROC(des3_ede_sparc64_ecb_crypt)
|
|
|
|
.align 32
|
|
ENTRY(des3_ede_sparc64_cbc_encrypt)
|
|
/* %o0=key, %o1=input, %o2=output, %o3=len, %o4=IV */
|
|
ldd [%o4 + 0x00], %f60
|
|
1: ldd [%o1 + 0x00], %f62
|
|
fxor %f60, %f62, %f60
|
|
DES3_LOOP_BODY(60)
|
|
std %f60, [%o2 + 0x00]
|
|
add %o1, 0x08, %o1
|
|
subcc %o3, 0x08, %o3
|
|
bne,pt %icc, 1b
|
|
add %o2, 0x08, %o2
|
|
retl
|
|
std %f60, [%o4 + 0x00]
|
|
ENDPROC(des3_ede_sparc64_cbc_encrypt)
|
|
|
|
.align 32
|
|
ENTRY(des3_ede_sparc64_cbc_decrypt)
|
|
/* %o0=key, %o1=input, %o2=output, %o3=len, %o4=IV */
|
|
ldd [%o4 + 0x00], %f62
|
|
1: ldx [%o1 + 0x00], %g1
|
|
MOVXTOD_G1_F60
|
|
DES3_LOOP_BODY(60)
|
|
fxor %f62, %f60, %f60
|
|
MOVXTOD_G1_F62
|
|
std %f60, [%o2 + 0x00]
|
|
add %o1, 0x08, %o1
|
|
subcc %o3, 0x08, %o3
|
|
bne,pt %icc, 1b
|
|
add %o2, 0x08, %o2
|
|
retl
|
|
stx %g1, [%o4 + 0x00]
|
|
ENDPROC(des3_ede_sparc64_cbc_decrypt)
|