123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563 |
- #include <linux/linkage.h>
- #include <asm/visasm.h>
- #include "opcodes.h"
- #define CAMELLIA_6ROUNDS(KEY_BASE, I0, I1) \
- CAMELLIA_F(KEY_BASE + 0, I1, I0, I1) \
- CAMELLIA_F(KEY_BASE + 2, I0, I1, I0) \
- CAMELLIA_F(KEY_BASE + 4, I1, I0, I1) \
- CAMELLIA_F(KEY_BASE + 6, I0, I1, I0) \
- CAMELLIA_F(KEY_BASE + 8, I1, I0, I1) \
- CAMELLIA_F(KEY_BASE + 10, I0, I1, I0)
- #define CAMELLIA_6ROUNDS_FL_FLI(KEY_BASE, I0, I1) \
- CAMELLIA_6ROUNDS(KEY_BASE, I0, I1) \
- CAMELLIA_FL(KEY_BASE + 12, I0, I0) \
- CAMELLIA_FLI(KEY_BASE + 14, I1, I1)
- .data
- .align 8
- SIGMA: .xword 0xA09E667F3BCC908B
- .xword 0xB67AE8584CAA73B2
- .xword 0xC6EF372FE94F82BE
- .xword 0x54FF53A5F1D36F1C
- .xword 0x10E527FADE682D1D
- .xword 0xB05688C2B3E6C1FD
- .text
- .align 32
- ENTRY(camellia_sparc64_key_expand)
- /* %o0=in_key, %o1=encrypt_key, %o2=key_len, %o3=decrypt_key */
- VISEntry
- ld [%o0 + 0x00], %f0 ! i0, k[0]
- ld [%o0 + 0x04], %f1 ! i1, k[1]
- ld [%o0 + 0x08], %f2 ! i2, k[2]
- ld [%o0 + 0x0c], %f3 ! i3, k[3]
- std %f0, [%o1 + 0x00] ! k[0, 1]
- fsrc2 %f0, %f28
- std %f2, [%o1 + 0x08] ! k[2, 3]
- cmp %o2, 16
- be 10f
- fsrc2 %f2, %f30
- ld [%o0 + 0x10], %f0
- ld [%o0 + 0x14], %f1
- std %f0, [%o1 + 0x20] ! k[8, 9]
- cmp %o2, 24
- fone %f10
- be,a 1f
- fxor %f10, %f0, %f2
- ld [%o0 + 0x18], %f2
- ld [%o0 + 0x1c], %f3
- 1:
- std %f2, [%o1 + 0x28] ! k[10, 11]
- fxor %f28, %f0, %f0
- fxor %f30, %f2, %f2
- 10:
- sethi %hi(SIGMA), %g3
- or %g3, %lo(SIGMA), %g3
- ldd [%g3 + 0x00], %f16
- ldd [%g3 + 0x08], %f18
- ldd [%g3 + 0x10], %f20
- ldd [%g3 + 0x18], %f22
- ldd [%g3 + 0x20], %f24
- ldd [%g3 + 0x28], %f26
- CAMELLIA_F(16, 2, 0, 2)
- CAMELLIA_F(18, 0, 2, 0)
- fxor %f28, %f0, %f0
- fxor %f30, %f2, %f2
- CAMELLIA_F(20, 2, 0, 2)
- CAMELLIA_F(22, 0, 2, 0)
- #define ROTL128(S01, S23, TMP1, TMP2, N) \
- srlx S01, (64 - N), TMP1; \
- sllx S01, N, S01; \
- srlx S23, (64 - N), TMP2; \
- sllx S23, N, S23; \
- or S01, TMP2, S01; \
- or S23, TMP1, S23
- cmp %o2, 16
- bne 1f
- nop
- /* 128-bit key */
- std %f0, [%o1 + 0x10] ! k[ 4, 5]
- std %f2, [%o1 + 0x18] ! k[ 6, 7]
- MOVDTOX_F0_O4
- MOVDTOX_F2_O5
- ROTL128(%o4, %o5, %g2, %g3, 15)
- stx %o4, [%o1 + 0x30] ! k[12, 13]
- stx %o5, [%o1 + 0x38] ! k[14, 15]
- ROTL128(%o4, %o5, %g2, %g3, 15)
- stx %o4, [%o1 + 0x40] ! k[16, 17]
- stx %o5, [%o1 + 0x48] ! k[18, 19]
- ROTL128(%o4, %o5, %g2, %g3, 15)
- stx %o4, [%o1 + 0x60] ! k[24, 25]
- ROTL128(%o4, %o5, %g2, %g3, 15)
- stx %o4, [%o1 + 0x70] ! k[28, 29]
- stx %o5, [%o1 + 0x78] ! k[30, 31]
- ROTL128(%o4, %o5, %g2, %g3, 34)
- stx %o4, [%o1 + 0xa0] ! k[40, 41]
- stx %o5, [%o1 + 0xa8] ! k[42, 43]
- ROTL128(%o4, %o5, %g2, %g3, 17)
- stx %o4, [%o1 + 0xc0] ! k[48, 49]
- stx %o5, [%o1 + 0xc8] ! k[50, 51]
- ldx [%o1 + 0x00], %o4 ! k[ 0, 1]
- ldx [%o1 + 0x08], %o5 ! k[ 2, 3]
- ROTL128(%o4, %o5, %g2, %g3, 15)
- stx %o4, [%o1 + 0x20] ! k[ 8, 9]
- stx %o5, [%o1 + 0x28] ! k[10, 11]
- ROTL128(%o4, %o5, %g2, %g3, 30)
- stx %o4, [%o1 + 0x50] ! k[20, 21]
- stx %o5, [%o1 + 0x58] ! k[22, 23]
- ROTL128(%o4, %o5, %g2, %g3, 15)
- stx %o5, [%o1 + 0x68] ! k[26, 27]
- ROTL128(%o4, %o5, %g2, %g3, 17)
- stx %o4, [%o1 + 0x80] ! k[32, 33]
- stx %o5, [%o1 + 0x88] ! k[34, 35]
- ROTL128(%o4, %o5, %g2, %g3, 17)
- stx %o4, [%o1 + 0x90] ! k[36, 37]
- stx %o5, [%o1 + 0x98] ! k[38, 39]
- ROTL128(%o4, %o5, %g2, %g3, 17)
- stx %o4, [%o1 + 0xb0] ! k[44, 45]
- stx %o5, [%o1 + 0xb8] ! k[46, 47]
- ba,pt %xcc, 2f
- mov (3 * 16 * 4), %o0
- 1:
- /* 192-bit or 256-bit key */
- std %f0, [%o1 + 0x30] ! k[12, 13]
- std %f2, [%o1 + 0x38] ! k[14, 15]
- ldd [%o1 + 0x20], %f4 ! k[ 8, 9]
- ldd [%o1 + 0x28], %f6 ! k[10, 11]
- fxor %f0, %f4, %f0
- fxor %f2, %f6, %f2
- CAMELLIA_F(24, 2, 0, 2)
- CAMELLIA_F(26, 0, 2, 0)
- std %f0, [%o1 + 0x10] ! k[ 4, 5]
- std %f2, [%o1 + 0x18] ! k[ 6, 7]
- MOVDTOX_F0_O4
- MOVDTOX_F2_O5
- ROTL128(%o4, %o5, %g2, %g3, 30)
- stx %o4, [%o1 + 0x50] ! k[20, 21]
- stx %o5, [%o1 + 0x58] ! k[22, 23]
- ROTL128(%o4, %o5, %g2, %g3, 30)
- stx %o4, [%o1 + 0xa0] ! k[40, 41]
- stx %o5, [%o1 + 0xa8] ! k[42, 43]
- ROTL128(%o4, %o5, %g2, %g3, 51)
- stx %o4, [%o1 + 0x100] ! k[64, 65]
- stx %o5, [%o1 + 0x108] ! k[66, 67]
- ldx [%o1 + 0x20], %o4 ! k[ 8, 9]
- ldx [%o1 + 0x28], %o5 ! k[10, 11]
- ROTL128(%o4, %o5, %g2, %g3, 15)
- stx %o4, [%o1 + 0x20] ! k[ 8, 9]
- stx %o5, [%o1 + 0x28] ! k[10, 11]
- ROTL128(%o4, %o5, %g2, %g3, 15)
- stx %o4, [%o1 + 0x40] ! k[16, 17]
- stx %o5, [%o1 + 0x48] ! k[18, 19]
- ROTL128(%o4, %o5, %g2, %g3, 30)
- stx %o4, [%o1 + 0x90] ! k[36, 37]
- stx %o5, [%o1 + 0x98] ! k[38, 39]
- ROTL128(%o4, %o5, %g2, %g3, 34)
- stx %o4, [%o1 + 0xd0] ! k[52, 53]
- stx %o5, [%o1 + 0xd8] ! k[54, 55]
- ldx [%o1 + 0x30], %o4 ! k[12, 13]
- ldx [%o1 + 0x38], %o5 ! k[14, 15]
- ROTL128(%o4, %o5, %g2, %g3, 15)
- stx %o4, [%o1 + 0x30] ! k[12, 13]
- stx %o5, [%o1 + 0x38] ! k[14, 15]
- ROTL128(%o4, %o5, %g2, %g3, 30)
- stx %o4, [%o1 + 0x70] ! k[28, 29]
- stx %o5, [%o1 + 0x78] ! k[30, 31]
- srlx %o4, 32, %g2
- srlx %o5, 32, %g3
- stw %o4, [%o1 + 0xc0] ! k[48]
- stw %g3, [%o1 + 0xc4] ! k[49]
- stw %o5, [%o1 + 0xc8] ! k[50]
- stw %g2, [%o1 + 0xcc] ! k[51]
- ROTL128(%o4, %o5, %g2, %g3, 49)
- stx %o4, [%o1 + 0xe0] ! k[56, 57]
- stx %o5, [%o1 + 0xe8] ! k[58, 59]
- ldx [%o1 + 0x00], %o4 ! k[ 0, 1]
- ldx [%o1 + 0x08], %o5 ! k[ 2, 3]
- ROTL128(%o4, %o5, %g2, %g3, 45)
- stx %o4, [%o1 + 0x60] ! k[24, 25]
- stx %o5, [%o1 + 0x68] ! k[26, 27]
- ROTL128(%o4, %o5, %g2, %g3, 15)
- stx %o4, [%o1 + 0x80] ! k[32, 33]
- stx %o5, [%o1 + 0x88] ! k[34, 35]
- ROTL128(%o4, %o5, %g2, %g3, 17)
- stx %o4, [%o1 + 0xb0] ! k[44, 45]
- stx %o5, [%o1 + 0xb8] ! k[46, 47]
- ROTL128(%o4, %o5, %g2, %g3, 34)
- stx %o4, [%o1 + 0xf0] ! k[60, 61]
- stx %o5, [%o1 + 0xf8] ! k[62, 63]
- mov (4 * 16 * 4), %o0
- 2:
- add %o1, %o0, %o1
- ldd [%o1 + 0x00], %f0
- ldd [%o1 + 0x08], %f2
- std %f0, [%o3 + 0x00]
- std %f2, [%o3 + 0x08]
- add %o3, 0x10, %o3
- 1:
- sub %o1, (16 * 4), %o1
- ldd [%o1 + 0x38], %f0
- ldd [%o1 + 0x30], %f2
- ldd [%o1 + 0x28], %f4
- ldd [%o1 + 0x20], %f6
- ldd [%o1 + 0x18], %f8
- ldd [%o1 + 0x10], %f10
- std %f0, [%o3 + 0x00]
- std %f2, [%o3 + 0x08]
- std %f4, [%o3 + 0x10]
- std %f6, [%o3 + 0x18]
- std %f8, [%o3 + 0x20]
- std %f10, [%o3 + 0x28]
- ldd [%o1 + 0x08], %f0
- ldd [%o1 + 0x00], %f2
- std %f0, [%o3 + 0x30]
- std %f2, [%o3 + 0x38]
- subcc %o0, (16 * 4), %o0
- bne,pt %icc, 1b
- add %o3, (16 * 4), %o3
- std %f2, [%o3 - 0x10]
- std %f0, [%o3 - 0x08]
- retl
- VISExit
- ENDPROC(camellia_sparc64_key_expand)
- .align 32
- ENTRY(camellia_sparc64_crypt)
- /* %o0=key, %o1=input, %o2=output, %o3=key_len */
- VISEntry
- ld [%o1 + 0x00], %f0
- ld [%o1 + 0x04], %f1
- ld [%o1 + 0x08], %f2
- ld [%o1 + 0x0c], %f3
- ldd [%o0 + 0x00], %f4
- ldd [%o0 + 0x08], %f6
- cmp %o3, 16
- fxor %f4, %f0, %f0
- be 1f
- fxor %f6, %f2, %f2
- ldd [%o0 + 0x10], %f8
- ldd [%o0 + 0x18], %f10
- ldd [%o0 + 0x20], %f12
- ldd [%o0 + 0x28], %f14
- ldd [%o0 + 0x30], %f16
- ldd [%o0 + 0x38], %f18
- ldd [%o0 + 0x40], %f20
- ldd [%o0 + 0x48], %f22
- add %o0, 0x40, %o0
- CAMELLIA_6ROUNDS_FL_FLI( 8, 0, 2)
- 1:
- ldd [%o0 + 0x10], %f8
- ldd [%o0 + 0x18], %f10
- ldd [%o0 + 0x20], %f12
- ldd [%o0 + 0x28], %f14
- ldd [%o0 + 0x30], %f16
- ldd [%o0 + 0x38], %f18
- ldd [%o0 + 0x40], %f20
- ldd [%o0 + 0x48], %f22
- ldd [%o0 + 0x50], %f24
- ldd [%o0 + 0x58], %f26
- ldd [%o0 + 0x60], %f28
- ldd [%o0 + 0x68], %f30
- ldd [%o0 + 0x70], %f32
- ldd [%o0 + 0x78], %f34
- ldd [%o0 + 0x80], %f36
- ldd [%o0 + 0x88], %f38
- ldd [%o0 + 0x90], %f40
- ldd [%o0 + 0x98], %f42
- ldd [%o0 + 0xa0], %f44
- ldd [%o0 + 0xa8], %f46
- ldd [%o0 + 0xb0], %f48
- ldd [%o0 + 0xb8], %f50
- ldd [%o0 + 0xc0], %f52
- ldd [%o0 + 0xc8], %f54
- CAMELLIA_6ROUNDS_FL_FLI( 8, 0, 2)
- CAMELLIA_6ROUNDS_FL_FLI(24, 0, 2)
- CAMELLIA_6ROUNDS(40, 0, 2)
- fxor %f52, %f2, %f2
- fxor %f54, %f0, %f0
- st %f2, [%o2 + 0x00]
- st %f3, [%o2 + 0x04]
- st %f0, [%o2 + 0x08]
- st %f1, [%o2 + 0x0c]
- retl
- VISExit
- ENDPROC(camellia_sparc64_crypt)
- .align 32
- ENTRY(camellia_sparc64_load_keys)
- /* %o0=key, %o1=key_len */
- VISEntry
- ldd [%o0 + 0x00], %f4
- ldd [%o0 + 0x08], %f6
- ldd [%o0 + 0x10], %f8
- ldd [%o0 + 0x18], %f10
- ldd [%o0 + 0x20], %f12
- ldd [%o0 + 0x28], %f14
- ldd [%o0 + 0x30], %f16
- ldd [%o0 + 0x38], %f18
- ldd [%o0 + 0x40], %f20
- ldd [%o0 + 0x48], %f22
- ldd [%o0 + 0x50], %f24
- ldd [%o0 + 0x58], %f26
- ldd [%o0 + 0x60], %f28
- ldd [%o0 + 0x68], %f30
- ldd [%o0 + 0x70], %f32
- ldd [%o0 + 0x78], %f34
- ldd [%o0 + 0x80], %f36
- ldd [%o0 + 0x88], %f38
- ldd [%o0 + 0x90], %f40
- ldd [%o0 + 0x98], %f42
- ldd [%o0 + 0xa0], %f44
- ldd [%o0 + 0xa8], %f46
- ldd [%o0 + 0xb0], %f48
- ldd [%o0 + 0xb8], %f50
- ldd [%o0 + 0xc0], %f52
- retl
- ldd [%o0 + 0xc8], %f54
- ENDPROC(camellia_sparc64_load_keys)
- .align 32
- ENTRY(camellia_sparc64_ecb_crypt_3_grand_rounds)
- /* %o0=input, %o1=output, %o2=len, %o3=key */
- 1: ldd [%o0 + 0x00], %f0
- ldd [%o0 + 0x08], %f2
- add %o0, 0x10, %o0
- fxor %f4, %f0, %f0
- fxor %f6, %f2, %f2
- CAMELLIA_6ROUNDS_FL_FLI( 8, 0, 2)
- CAMELLIA_6ROUNDS_FL_FLI(24, 0, 2)
- CAMELLIA_6ROUNDS(40, 0, 2)
- fxor %f52, %f2, %f2
- fxor %f54, %f0, %f0
- std %f2, [%o1 + 0x00]
- std %f0, [%o1 + 0x08]
- subcc %o2, 0x10, %o2
- bne,pt %icc, 1b
- add %o1, 0x10, %o1
- retl
- nop
- ENDPROC(camellia_sparc64_ecb_crypt_3_grand_rounds)
- .align 32
- ENTRY(camellia_sparc64_ecb_crypt_4_grand_rounds)
- /* %o0=input, %o1=output, %o2=len, %o3=key */
- 1: ldd [%o0 + 0x00], %f0
- ldd [%o0 + 0x08], %f2
- add %o0, 0x10, %o0
- fxor %f4, %f0, %f0
- fxor %f6, %f2, %f2
- CAMELLIA_6ROUNDS_FL_FLI( 8, 0, 2)
- ldd [%o3 + 0xd0], %f8
- ldd [%o3 + 0xd8], %f10
- ldd [%o3 + 0xe0], %f12
- ldd [%o3 + 0xe8], %f14
- ldd [%o3 + 0xf0], %f16
- ldd [%o3 + 0xf8], %f18
- ldd [%o3 + 0x100], %f20
- ldd [%o3 + 0x108], %f22
- CAMELLIA_6ROUNDS_FL_FLI(24, 0, 2)
- CAMELLIA_6ROUNDS_FL_FLI(40, 0, 2)
- CAMELLIA_F(8, 2, 0, 2)
- CAMELLIA_F(10, 0, 2, 0)
- ldd [%o3 + 0x10], %f8
- ldd [%o3 + 0x18], %f10
- CAMELLIA_F(12, 2, 0, 2)
- CAMELLIA_F(14, 0, 2, 0)
- ldd [%o3 + 0x20], %f12
- ldd [%o3 + 0x28], %f14
- CAMELLIA_F(16, 2, 0, 2)
- CAMELLIA_F(18, 0, 2, 0)
- ldd [%o3 + 0x30], %f16
- ldd [%o3 + 0x38], %f18
- fxor %f20, %f2, %f2
- fxor %f22, %f0, %f0
- ldd [%o3 + 0x40], %f20
- ldd [%o3 + 0x48], %f22
- std %f2, [%o1 + 0x00]
- std %f0, [%o1 + 0x08]
- subcc %o2, 0x10, %o2
- bne,pt %icc, 1b
- add %o1, 0x10, %o1
- retl
- nop
- ENDPROC(camellia_sparc64_ecb_crypt_4_grand_rounds)
- .align 32
- ENTRY(camellia_sparc64_cbc_encrypt_3_grand_rounds)
- /* %o0=input, %o1=output, %o2=len, %o3=key, %o4=IV */
- ldd [%o4 + 0x00], %f60
- ldd [%o4 + 0x08], %f62
- 1: ldd [%o0 + 0x00], %f0
- ldd [%o0 + 0x08], %f2
- add %o0, 0x10, %o0
- fxor %f60, %f0, %f0
- fxor %f62, %f2, %f2
- fxor %f4, %f0, %f0
- fxor %f6, %f2, %f2
- CAMELLIA_6ROUNDS_FL_FLI( 8, 0, 2)
- CAMELLIA_6ROUNDS_FL_FLI(24, 0, 2)
- CAMELLIA_6ROUNDS(40, 0, 2)
- fxor %f52, %f2, %f60
- fxor %f54, %f0, %f62
- std %f60, [%o1 + 0x00]
- std %f62, [%o1 + 0x08]
- subcc %o2, 0x10, %o2
- bne,pt %icc, 1b
- add %o1, 0x10, %o1
- std %f60, [%o4 + 0x00]
- retl
- std %f62, [%o4 + 0x08]
- ENDPROC(camellia_sparc64_cbc_encrypt_3_grand_rounds)
- .align 32
- ENTRY(camellia_sparc64_cbc_encrypt_4_grand_rounds)
- /* %o0=input, %o1=output, %o2=len, %o3=key, %o4=IV */
- ldd [%o4 + 0x00], %f60
- ldd [%o4 + 0x08], %f62
- 1: ldd [%o0 + 0x00], %f0
- ldd [%o0 + 0x08], %f2
- add %o0, 0x10, %o0
- fxor %f60, %f0, %f0
- fxor %f62, %f2, %f2
- fxor %f4, %f0, %f0
- fxor %f6, %f2, %f2
- CAMELLIA_6ROUNDS_FL_FLI( 8, 0, 2)
- ldd [%o3 + 0xd0], %f8
- ldd [%o3 + 0xd8], %f10
- ldd [%o3 + 0xe0], %f12
- ldd [%o3 + 0xe8], %f14
- ldd [%o3 + 0xf0], %f16
- ldd [%o3 + 0xf8], %f18
- ldd [%o3 + 0x100], %f20
- ldd [%o3 + 0x108], %f22
- CAMELLIA_6ROUNDS_FL_FLI(24, 0, 2)
- CAMELLIA_6ROUNDS_FL_FLI(40, 0, 2)
- CAMELLIA_F(8, 2, 0, 2)
- CAMELLIA_F(10, 0, 2, 0)
- ldd [%o3 + 0x10], %f8
- ldd [%o3 + 0x18], %f10
- CAMELLIA_F(12, 2, 0, 2)
- CAMELLIA_F(14, 0, 2, 0)
- ldd [%o3 + 0x20], %f12
- ldd [%o3 + 0x28], %f14
- CAMELLIA_F(16, 2, 0, 2)
- CAMELLIA_F(18, 0, 2, 0)
- ldd [%o3 + 0x30], %f16
- ldd [%o3 + 0x38], %f18
- fxor %f20, %f2, %f60
- fxor %f22, %f0, %f62
- ldd [%o3 + 0x40], %f20
- ldd [%o3 + 0x48], %f22
- std %f60, [%o1 + 0x00]
- std %f62, [%o1 + 0x08]
- subcc %o2, 0x10, %o2
- bne,pt %icc, 1b
- add %o1, 0x10, %o1
- std %f60, [%o4 + 0x00]
- retl
- std %f62, [%o4 + 0x08]
- ENDPROC(camellia_sparc64_cbc_encrypt_4_grand_rounds)
- .align 32
- ENTRY(camellia_sparc64_cbc_decrypt_3_grand_rounds)
- /* %o0=input, %o1=output, %o2=len, %o3=key, %o4=IV */
- ldd [%o4 + 0x00], %f60
- ldd [%o4 + 0x08], %f62
- 1: ldd [%o0 + 0x00], %f56
- ldd [%o0 + 0x08], %f58
- add %o0, 0x10, %o0
- fxor %f4, %f56, %f0
- fxor %f6, %f58, %f2
- CAMELLIA_6ROUNDS_FL_FLI( 8, 0, 2)
- CAMELLIA_6ROUNDS_FL_FLI(24, 0, 2)
- CAMELLIA_6ROUNDS(40, 0, 2)
- fxor %f52, %f2, %f2
- fxor %f54, %f0, %f0
- fxor %f60, %f2, %f2
- fxor %f62, %f0, %f0
- fsrc2 %f56, %f60
- fsrc2 %f58, %f62
- std %f2, [%o1 + 0x00]
- std %f0, [%o1 + 0x08]
- subcc %o2, 0x10, %o2
- bne,pt %icc, 1b
- add %o1, 0x10, %o1
- std %f60, [%o4 + 0x00]
- retl
- std %f62, [%o4 + 0x08]
- ENDPROC(camellia_sparc64_cbc_decrypt_3_grand_rounds)
- .align 32
- ENTRY(camellia_sparc64_cbc_decrypt_4_grand_rounds)
- /* %o0=input, %o1=output, %o2=len, %o3=key, %o4=IV */
- ldd [%o4 + 0x00], %f60
- ldd [%o4 + 0x08], %f62
- 1: ldd [%o0 + 0x00], %f56
- ldd [%o0 + 0x08], %f58
- add %o0, 0x10, %o0
- fxor %f4, %f56, %f0
- fxor %f6, %f58, %f2
- CAMELLIA_6ROUNDS_FL_FLI( 8, 0, 2)
- ldd [%o3 + 0xd0], %f8
- ldd [%o3 + 0xd8], %f10
- ldd [%o3 + 0xe0], %f12
- ldd [%o3 + 0xe8], %f14
- ldd [%o3 + 0xf0], %f16
- ldd [%o3 + 0xf8], %f18
- ldd [%o3 + 0x100], %f20
- ldd [%o3 + 0x108], %f22
- CAMELLIA_6ROUNDS_FL_FLI(24, 0, 2)
- CAMELLIA_6ROUNDS_FL_FLI(40, 0, 2)
- CAMELLIA_F(8, 2, 0, 2)
- CAMELLIA_F(10, 0, 2, 0)
- ldd [%o3 + 0x10], %f8
- ldd [%o3 + 0x18], %f10
- CAMELLIA_F(12, 2, 0, 2)
- CAMELLIA_F(14, 0, 2, 0)
- ldd [%o3 + 0x20], %f12
- ldd [%o3 + 0x28], %f14
- CAMELLIA_F(16, 2, 0, 2)
- CAMELLIA_F(18, 0, 2, 0)
- ldd [%o3 + 0x30], %f16
- ldd [%o3 + 0x38], %f18
- fxor %f20, %f2, %f2
- fxor %f22, %f0, %f0
- ldd [%o3 + 0x40], %f20
- ldd [%o3 + 0x48], %f22
- fxor %f60, %f2, %f2
- fxor %f62, %f0, %f0
- fsrc2 %f56, %f60
- fsrc2 %f58, %f62
- std %f2, [%o1 + 0x00]
- std %f0, [%o1 + 0x08]
- subcc %o2, 0x10, %o2
- bne,pt %icc, 1b
- add %o1, 0x10, %o1
- std %f60, [%o4 + 0x00]
- retl
- std %f62, [%o4 + 0x08]
- ENDPROC(camellia_sparc64_cbc_decrypt_4_grand_rounds)
|