Commit | Line | Data |
---|---|---|
b2441318 | 1 | /* SPDX-License-Identifier: GPL-2.0 */ |
81658ad0 DM |
2 | #include <linux/linkage.h> |
3 | #include <asm/visasm.h> | |
4 | ||
7cff82f5 | 5 | #include "opcodes.h" |
81658ad0 DM |
6 | |
7 | #define CAMELLIA_6ROUNDS(KEY_BASE, I0, I1) /* six CAMELLIA_F steps: the first argument walks KEY_BASE+0 .. KEY_BASE+10 in steps of 2 while I0 and I1 swap roles on every step. CAMELLIA_F is not defined in this file (presumably opcodes.h). */ \ | |
8 | CAMELLIA_F(KEY_BASE + 0, I1, I0, I1) \ | |
9 | CAMELLIA_F(KEY_BASE + 2, I0, I1, I0) \ | |
10 | CAMELLIA_F(KEY_BASE + 4, I1, I0, I1) \ | |
11 | CAMELLIA_F(KEY_BASE + 6, I0, I1, I0) \ | |
12 | CAMELLIA_F(KEY_BASE + 8, I1, I0, I1) \ | |
13 | CAMELLIA_F(KEY_BASE + 10, I0, I1, I0) | |
14 | ||
15 | #define CAMELLIA_6ROUNDS_FL_FLI(KEY_BASE, I0, I1) /* CAMELLIA_6ROUNDS, then CAMELLIA_FL applied to I0 with KEY_BASE+12 and CAMELLIA_FLI applied to I1 with KEY_BASE+14. CAMELLIA_FL and CAMELLIA_FLI are not defined in this file (presumably opcodes.h). */ \ | |
16 | CAMELLIA_6ROUNDS(KEY_BASE, I0, I1) \ | |
17 | CAMELLIA_FL(KEY_BASE + 12, I0, I0) \ | |
18 | CAMELLIA_FLI(KEY_BASE + 14, I1, I1) | |
19 | ||
20 | .data | |
21 | ||
22 | .align 8 | |
23 | SIGMA: .xword 0xA09E667F3BCC908B /* six 64-bit constants, loaded into %f16-%f26 by camellia_sparc64_key_expand; the values match Sigma1..Sigma6 of the Camellia key schedule (RFC 3713) */ | |
24 | .xword 0xB67AE8584CAA73B2 | |
25 | .xword 0xC6EF372FE94F82BE | |
26 | .xword 0x54FF53A5F1D36F1C | |
27 | .xword 0x10E527FADE682D1D | |
28 | .xword 0xB05688C2B3E6C1FD | |
29 | ||
30 | .text | |
31 | ||
32 | .align 32 | |
33 | ENTRY(camellia_sparc64_key_expand) /* Fills the encryption key table at %o1 from the raw key at %o0, then writes a reordered copy of that table to %o3. key_len (%o2) is compared with 16 and 24; any other value takes the 32-byte load path. */ | |
274504f5 | 34 | /* %o0=in_key, %o1=encrypt_key, %o2=key_len, %o3=decrypt_key */ |
81658ad0 DM |
35 | VISEntry /* macro defined outside this file; NOTE(review): presumably makes the FPU/VIS registers usable here - confirm in asm/visasm.h */ |
36 | ld [%o0 + 0x00], %f0 ! i0, k[0] | |
37 | ld [%o0 + 0x04], %f1 ! i1, k[1] | |
38 | ld [%o0 + 0x08], %f2 ! i2, k[2] | |
39 | ld [%o0 + 0x0c], %f3 ! i3, k[3] | |
40 | std %f0, [%o1 + 0x00] ! k[0, 1] | |
41 | fsrc2 %f0, %f28 /* keep key bytes 0-7 in %f28 */ | |
42 | std %f2, [%o1 + 0x08] ! k[2, 3] | |
43 | cmp %o2, 16 | |
44 | be 10f /* 16-byte key: no further key bytes to load */ | |
45 | fsrc2 %f2, %f30 /* delay slot, executed on both paths: keep key bytes 8-15 in %f30 */ | |
46 | ||
47 | ld [%o0 + 0x10], %f0 /* key bytes 16-23 */ | |
48 | ld [%o0 + 0x14], %f1 | |
49 | std %f0, [%o1 + 0x20] ! k[8, 9] | |
50 | cmp %o2, 24 | |
51 | fone %f10 /* %f10 = all ones, used for the complement below */ | |
52 | be,a 1f | |
53 | fxor %f10, %f0, %f2 /* annulled delay slot, executed only when key_len == 24: %f2 = bitwise complement of %f0 */ | |
54 | ld [%o0 + 0x18], %f2 /* key_len != 24: load key bytes 24-31 instead */ | |
55 | ld [%o0 + 0x1c], %f3 | |
56 | 1: | |
57 | std %f2, [%o1 + 0x28] ! k[10, 11] | |
58 | fxor %f28, %f0, %f0 /* %f0:%f2 = key bytes 0-15 XOR the second 16-byte half */ | |
59 | fxor %f30, %f2, %f2 | |
60 | ||
61 | 10: /* common path for all key sizes; for a 16-byte key %f0:%f2 still holds key bytes 0-15 */ | |
62 | sethi %hi(SIGMA), %g3 /* %g3 = address of SIGMA, built from its %hi and %lo parts */ | |
63 | or %g3, %lo(SIGMA), %g3 | |
64 | ldd [%g3 + 0x00], %f16 | |
65 | ldd [%g3 + 0x08], %f18 | |
66 | ldd [%g3 + 0x10], %f20 | |
67 | ldd [%g3 + 0x18], %f22 | |
68 | ldd [%g3 + 0x20], %f24 | |
69 | ldd [%g3 + 0x28], %f26 | |
70 | CAMELLIA_F(16, 2, 0, 2) /* NOTE(review): the first argument appears to name the %f register holding the SIGMA constant just loaded - confirm in opcodes.h */ | |
71 | CAMELLIA_F(18, 0, 2, 0) | |
72 | fxor %f28, %f0, %f0 /* XOR key bytes 0-15 (saved in %f28/%f30) into the running value */ | |
73 | fxor %f30, %f2, %f2 | |
74 | CAMELLIA_F(20, 2, 0, 2) | |
75 | CAMELLIA_F(22, 0, 2, 0) | |
76 | ||
77 | #define ROTL128(S01, S23, TMP1, TMP2, N) /* rotate the 128-bit value S01:S23 (S01 = upper 64 bits) left by N bits in place; only meaningful for 0 < N < 64; overwrites TMP1 and TMP2 */ \ | |
78 | srlx S01, (64 - N), TMP1; \ | |
79 | sllx S01, N, S01; \ | |
80 | srlx S23, (64 - N), TMP2; \ | |
81 | sllx S23, N, S23; \ | |
82 | or S01, TMP2, S01; \ | |
83 | or S23, TMP1, S23 | |
84 | ||
85 | cmp %o2, 16 | |
86 | bne 1f /* not a 16-byte key: use the 192/256-bit layout at 1: */ | |
87 | nop | |
88 | /* 128-bit key */ | |
89 | std %f0, [%o1 + 0x10] ! k[ 4, 5] | |
90 | std %f2, [%o1 + 0x18] ! k[ 6, 7] | |
91 | MOVDTOX_F0_O4 /* macro defined outside this file; NOTE(review): the name suggests a %f0 to %o4 move - confirm in opcodes.h */ | |
92 | MOVDTOX_F2_O5 /* NOTE(review): likewise presumably %f2 to %o5 */ | |
93 | ROTL128(%o4, %o5, %g2, %g3, 15) /* rotations accumulate: each ROTL128 rotates the value left by the previous one */ | |
94 | stx %o4, [%o1 + 0x30] ! k[12, 13] | |
95 | stx %o5, [%o1 + 0x38] ! k[14, 15] | |
96 | ROTL128(%o4, %o5, %g2, %g3, 15) | |
97 | stx %o4, [%o1 + 0x40] ! k[16, 17] | |
98 | stx %o5, [%o1 + 0x48] ! k[18, 19] | |
99 | ROTL128(%o4, %o5, %g2, %g3, 15) | |
100 | stx %o4, [%o1 + 0x60] ! k[24, 25] /* only the %o4 half is stored for this rotation */ | |
101 | ROTL128(%o4, %o5, %g2, %g3, 15) | |
102 | stx %o4, [%o1 + 0x70] ! k[28, 29] | |
103 | stx %o5, [%o1 + 0x78] ! k[30, 31] | |
104 | ROTL128(%o4, %o5, %g2, %g3, 34) | |
105 | stx %o4, [%o1 + 0xa0] ! k[40, 41] | |
106 | stx %o5, [%o1 + 0xa8] ! k[42, 43] | |
107 | ROTL128(%o4, %o5, %g2, %g3, 17) | |
108 | stx %o4, [%o1 + 0xc0] ! k[48, 49] | |
109 | stx %o5, [%o1 + 0xc8] ! k[50, 51] | |
110 | ||
111 | ldx [%o1 + 0x00], %o4 ! k[ 0, 1] | |
112 | ldx [%o1 + 0x08], %o5 ! k[ 2, 3] | |
113 | ROTL128(%o4, %o5, %g2, %g3, 15) | |
114 | stx %o4, [%o1 + 0x20] ! k[ 8, 9] | |
115 | stx %o5, [%o1 + 0x28] ! k[10, 11] | |
116 | ROTL128(%o4, %o5, %g2, %g3, 30) | |
117 | stx %o4, [%o1 + 0x50] ! k[20, 21] | |
118 | stx %o5, [%o1 + 0x58] ! k[22, 23] | |
119 | ROTL128(%o4, %o5, %g2, %g3, 15) | |
120 | stx %o5, [%o1 + 0x68] ! k[26, 27] /* only the %o5 half is stored for this rotation */ | |
121 | ROTL128(%o4, %o5, %g2, %g3, 17) | |
122 | stx %o4, [%o1 + 0x80] ! k[32, 33] | |
123 | stx %o5, [%o1 + 0x88] ! k[34, 35] | |
124 | ROTL128(%o4, %o5, %g2, %g3, 17) | |
125 | stx %o4, [%o1 + 0x90] ! k[36, 37] | |
126 | stx %o5, [%o1 + 0x98] ! k[38, 39] | |
127 | ROTL128(%o4, %o5, %g2, %g3, 17) | |
128 | stx %o4, [%o1 + 0xb0] ! k[44, 45] | |
129 | stx %o5, [%o1 + 0xb8] ! k[46, 47] | |
130 | ||
131 | ba,pt %xcc, 2f | |
132 | mov (3 * 16 * 4), %o0 /* delay slot: %o0 = 192, byte offset of the last 16 bytes of the table written on this path */ | |
133 | ||
134 | 1: | |
135 | /* 192-bit or 256-bit key */ | |
136 | std %f0, [%o1 + 0x30] ! k[12, 13] | |
137 | std %f2, [%o1 + 0x38] ! k[14, 15] | |
138 | ldd [%o1 + 0x20], %f4 ! k[ 8, 9] | |
139 | ldd [%o1 + 0x28], %f6 ! k[10, 11] | |
140 | fxor %f0, %f4, %f0 /* XOR in the second key half stored at 0x20/0x28 earlier */ | |
141 | fxor %f2, %f6, %f2 | |
142 | CAMELLIA_F(24, 2, 0, 2) /* uses the last two SIGMA constants, loaded into %f24/%f26 above */ | |
143 | CAMELLIA_F(26, 0, 2, 0) | |
144 | std %f0, [%o1 + 0x10] ! k[ 4, 5] | |
145 | std %f2, [%o1 + 0x18] ! k[ 6, 7] | |
146 | MOVDTOX_F0_O4 /* macro defined outside this file; NOTE(review): the name suggests a %f0 to %o4 move - confirm in opcodes.h */ | |
147 | MOVDTOX_F2_O5 | |
148 | ROTL128(%o4, %o5, %g2, %g3, 30) | |
149 | stx %o4, [%o1 + 0x50] ! k[20, 21] | |
150 | stx %o5, [%o1 + 0x58] ! k[22, 23] | |
151 | ROTL128(%o4, %o5, %g2, %g3, 30) | |
152 | stx %o4, [%o1 + 0xa0] ! k[40, 41] | |
153 | stx %o5, [%o1 + 0xa8] ! k[42, 43] | |
154 | ROTL128(%o4, %o5, %g2, %g3, 51) | |
155 | stx %o4, [%o1 + 0x100] ! k[64, 65] | |
156 | stx %o5, [%o1 + 0x108] ! k[66, 67] | |
157 | ldx [%o1 + 0x20], %o4 ! k[ 8, 9] | |
158 | ldx [%o1 + 0x28], %o5 ! k[10, 11] | |
159 | ROTL128(%o4, %o5, %g2, %g3, 15) | |
160 | stx %o4, [%o1 + 0x20] ! k[ 8, 9] /* the slot that held the unrotated value is overwritten with its rotation */ | |
161 | stx %o5, [%o1 + 0x28] ! k[10, 11] | |
162 | ROTL128(%o4, %o5, %g2, %g3, 15) | |
163 | stx %o4, [%o1 + 0x40] ! k[16, 17] | |
164 | stx %o5, [%o1 + 0x48] ! k[18, 19] | |
165 | ROTL128(%o4, %o5, %g2, %g3, 30) | |
166 | stx %o4, [%o1 + 0x90] ! k[36, 37] | |
167 | stx %o5, [%o1 + 0x98] ! k[38, 39] | |
168 | ROTL128(%o4, %o5, %g2, %g3, 34) | |
169 | stx %o4, [%o1 + 0xd0] ! k[52, 53] | |
170 | stx %o5, [%o1 + 0xd8] ! k[54, 55] | |
171 | ldx [%o1 + 0x30], %o4 ! k[12, 13] | |
172 | ldx [%o1 + 0x38], %o5 ! k[14, 15] | |
173 | ROTL128(%o4, %o5, %g2, %g3, 15) | |
174 | stx %o4, [%o1 + 0x30] ! k[12, 13] | |
175 | stx %o5, [%o1 + 0x38] ! k[14, 15] | |
176 | ROTL128(%o4, %o5, %g2, %g3, 30) | |
177 | stx %o4, [%o1 + 0x70] ! k[28, 29] | |
178 | stx %o5, [%o1 + 0x78] ! k[30, 31] | |
179 | srlx %o4, 32, %g2 /* the four stw below write %o4:%o5 rotated left by 32 bits to k[48..51]; %o4 and %o5 themselves are left unchanged */ | |
180 | srlx %o5, 32, %g3 | |
181 | stw %o4, [%o1 + 0xc0] ! k[48] | |
182 | stw %g3, [%o1 + 0xc4] ! k[49] | |
183 | stw %o5, [%o1 + 0xc8] ! k[50] | |
184 | stw %g2, [%o1 + 0xcc] ! k[51] | |
185 | ROTL128(%o4, %o5, %g2, %g3, 49) | |
186 | stx %o4, [%o1 + 0xe0] ! k[56, 57] | |
187 | stx %o5, [%o1 + 0xe8] ! k[58, 59] | |
188 | ldx [%o1 + 0x00], %o4 ! k[ 0, 1] | |
189 | ldx [%o1 + 0x08], %o5 ! k[ 2, 3] | |
190 | ROTL128(%o4, %o5, %g2, %g3, 45) | |
191 | stx %o4, [%o1 + 0x60] ! k[24, 25] | |
192 | stx %o5, [%o1 + 0x68] ! k[26, 27] | |
193 | ROTL128(%o4, %o5, %g2, %g3, 15) | |
194 | stx %o4, [%o1 + 0x80] ! k[32, 33] | |
195 | stx %o5, [%o1 + 0x88] ! k[34, 35] | |
196 | ROTL128(%o4, %o5, %g2, %g3, 17) | |
197 | stx %o4, [%o1 + 0xb0] ! k[44, 45] | |
198 | stx %o5, [%o1 + 0xb8] ! k[46, 47] | |
199 | ROTL128(%o4, %o5, %g2, %g3, 34) | |
200 | stx %o4, [%o1 + 0xf0] ! k[60, 61] | |
201 | stx %o5, [%o1 + 0xf8] ! k[62, 63] | |
202 | mov (4 * 16 * 4), %o0 /* %o0 = 256, byte offset of the last 16 bytes of the table written on this path */ | |
203 | 2: /* from here on: build the table at %o3 from the finished table at %o1 */ | |
204 | add %o1, %o0, %o1 /* %o1 now points at the last 16 bytes of the encrypt table */ | |
205 | ldd [%o1 + 0x00], %f0 | |
206 | ldd [%o1 + 0x08], %f2 | |
207 | std %f0, [%o3 + 0x00] /* those 16 bytes become the first 16 bytes at %o3, in the same order */ | |
208 | std %f2, [%o3 + 0x08] | |
209 | add %o3, 0x10, %o3 | |
210 | 1: /* loop: step %o1 back 64 bytes per pass and write its eight doublewords to %o3 in reverse order */ | |
211 | sub %o1, (16 * 4), %o1 | |
212 | ldd [%o1 + 0x38], %f0 | |
213 | ldd [%o1 + 0x30], %f2 | |
214 | ldd [%o1 + 0x28], %f4 | |
215 | ldd [%o1 + 0x20], %f6 | |
216 | ldd [%o1 + 0x18], %f8 | |
217 | ldd [%o1 + 0x10], %f10 | |
218 | std %f0, [%o3 + 0x00] | |
219 | std %f2, [%o3 + 0x08] | |
220 | std %f4, [%o3 + 0x10] | |
221 | std %f6, [%o3 + 0x18] | |
222 | std %f8, [%o3 + 0x20] | |
223 | std %f10, [%o3 + 0x28] | |
224 | ||
225 | ldd [%o1 + 0x08], %f0 | |
226 | ldd [%o1 + 0x00], %f2 | |
227 | std %f0, [%o3 + 0x30] | |
228 | std %f2, [%o3 + 0x38] | |
229 | subcc %o0, (16 * 4), %o0 /* %o0 counts the bytes still to copy; the loop ends when it reaches zero */ | |
230 | bne,pt %icc, 1b | |
231 | add %o3, (16 * 4), %o3 /* delay slot: advance the output pointer by 64 bytes */ | |
232 | ||
233 | std %f2, [%o3 - 0x10] /* rewrite the final 16 output bytes so they hold encrypt-table bytes 0-15 in their original order */ | |
234 | std %f0, [%o3 - 0x08] | |
235 | ||
236 | retl | |
237 | VISExit /* placed in the retl delay slot; macro defined outside this file */ | |
238 | ENDPROC(camellia_sparc64_key_expand) | |
239 | ||
240 | .align 32 | |
241 | ENTRY(camellia_sparc64_crypt) /* Transforms one 16-byte block from %o1 into %o2 using the key table at %o0. key_len (%o3) is only compared with 16: any other value runs one extra CAMELLIA_6ROUNDS_FL_FLI group before the common tail. */ | |
242 | /* %o0=key, %o1=input, %o2=output, %o3=key_len */ | |
243 | VISEntry /* macro defined outside this file; NOTE(review): presumably makes the FPU/VIS registers usable here - confirm in asm/visasm.h */ | |
244 | ||
245 | ld [%o1 + 0x00], %f0 | |
246 | ld [%o1 + 0x04], %f1 | |
247 | ld [%o1 + 0x08], %f2 | |
248 | ld [%o1 + 0x0c], %f3 | |
249 | ||
250 | ldd [%o0 + 0x00], %f4 | |
251 | ldd [%o0 + 0x08], %f6 | |
252 | ||
253 | cmp %o3, 16 | |
254 | fxor %f4, %f0, %f0 /* XOR the input block with key bytes 0-15 */ | |
255 | be 1f | |
256 | fxor %f6, %f2, %f2 /* delay slot, executed on both paths */ | |
257 | ||
258 | ldd [%o0 + 0x10], %f8 | |
259 | ldd [%o0 + 0x18], %f10 | |
260 | ldd [%o0 + 0x20], %f12 | |
261 | ldd [%o0 + 0x28], %f14 | |
262 | ldd [%o0 + 0x30], %f16 | |
263 | ldd [%o0 + 0x38], %f18 | |
264 | ldd [%o0 + 0x40], %f20 | |
265 | ldd [%o0 + 0x48], %f22 | |
266 | add %o0, 0x40, %o0 /* shift the key base by 64 bytes so the shared code at 1: reads the following part of the table */ | |
267 | ||
268 | CAMELLIA_6ROUNDS_FL_FLI( 8, 0, 2) /* extra group for key_len != 16, using the %f8-%f22 values loaded just above */ | |
269 | ||
270 | 1: /* common tail: load the next 0xc0 key bytes into %f8-%f54 */ | |
271 | ldd [%o0 + 0x10], %f8 | |
272 | ldd [%o0 + 0x18], %f10 | |
273 | ldd [%o0 + 0x20], %f12 | |
274 | ldd [%o0 + 0x28], %f14 | |
275 | ldd [%o0 + 0x30], %f16 | |
276 | ldd [%o0 + 0x38], %f18 | |
277 | ldd [%o0 + 0x40], %f20 | |
278 | ldd [%o0 + 0x48], %f22 | |
279 | ldd [%o0 + 0x50], %f24 | |
280 | ldd [%o0 + 0x58], %f26 | |
281 | ldd [%o0 + 0x60], %f28 | |
282 | ldd [%o0 + 0x68], %f30 | |
283 | ldd [%o0 + 0x70], %f32 | |
284 | ldd [%o0 + 0x78], %f34 | |
285 | ldd [%o0 + 0x80], %f36 | |
286 | ldd [%o0 + 0x88], %f38 | |
287 | ldd [%o0 + 0x90], %f40 | |
288 | ldd [%o0 + 0x98], %f42 | |
289 | ldd [%o0 + 0xa0], %f44 | |
290 | ldd [%o0 + 0xa8], %f46 | |
291 | ldd [%o0 + 0xb0], %f48 | |
292 | ldd [%o0 + 0xb8], %f50 | |
293 | ldd [%o0 + 0xc0], %f52 | |
294 | ldd [%o0 + 0xc8], %f54 | |
295 | ||
296 | CAMELLIA_6ROUNDS_FL_FLI( 8, 0, 2) | |
297 | CAMELLIA_6ROUNDS_FL_FLI(24, 0, 2) | |
298 | CAMELLIA_6ROUNDS(40, 0, 2) /* last group has no FL/FLI step */ | |
299 | fxor %f52, %f2, %f2 /* final key XOR; the halves are swapped on output: %f2 is written first, %f0 second */ | |
300 | fxor %f54, %f0, %f0 | |
301 | ||
302 | st %f2, [%o2 + 0x00] | |
303 | st %f3, [%o2 + 0x04] | |
304 | st %f0, [%o2 + 0x08] | |
305 | st %f1, [%o2 + 0x0c] | |
306 | ||
307 | retl | |
308 | VISExit /* placed in the retl delay slot; macro defined outside this file */ | |
309 | ENDPROC(camellia_sparc64_crypt) | |
310 | ||
311 | .align 32 | |
312 | ENTRY(camellia_sparc64_load_keys) /* Loads key-table bytes 0x00-0xcf from %o0 into %f4-%f54. %o1 (key_len) is not read. The *_grand_rounds routines in this file use %f4-%f54 without loading them, so they presumably rely on this routine having run first. */ | |
313 | /* %o0=key, %o1=key_len */ | |
314 | VISEntry /* there is no matching VISExit in this routine; NOTE(review): presumably issued by the caller once the bulk routines are done - confirm */ | |
315 | ldd [%o0 + 0x00], %f4 | |
316 | ldd [%o0 + 0x08], %f6 | |
317 | ldd [%o0 + 0x10], %f8 | |
318 | ldd [%o0 + 0x18], %f10 | |
319 | ldd [%o0 + 0x20], %f12 | |
320 | ldd [%o0 + 0x28], %f14 | |
321 | ldd [%o0 + 0x30], %f16 | |
322 | ldd [%o0 + 0x38], %f18 | |
323 | ldd [%o0 + 0x40], %f20 | |
324 | ldd [%o0 + 0x48], %f22 | |
325 | ldd [%o0 + 0x50], %f24 | |
326 | ldd [%o0 + 0x58], %f26 | |
327 | ldd [%o0 + 0x60], %f28 | |
328 | ldd [%o0 + 0x68], %f30 | |
329 | ldd [%o0 + 0x70], %f32 | |
330 | ldd [%o0 + 0x78], %f34 | |
331 | ldd [%o0 + 0x80], %f36 | |
332 | ldd [%o0 + 0x88], %f38 | |
333 | ldd [%o0 + 0x90], %f40 | |
334 | ldd [%o0 + 0x98], %f42 | |
335 | ldd [%o0 + 0xa0], %f44 | |
336 | ldd [%o0 + 0xa8], %f46 | |
337 | ldd [%o0 + 0xb0], %f48 | |
338 | ldd [%o0 + 0xb8], %f50 | |
339 | ldd [%o0 + 0xc0], %f52 | |
340 | retl | |
341 | ldd [%o0 + 0xc8], %f54 /* final load sits in the retl delay slot */ | |
342 | ENDPROC(camellia_sparc64_load_keys) | |
343 | ||
344 | .align 32 | |
345 | ENTRY(camellia_sparc64_ecb_crypt_3_grand_rounds) /* Transforms len bytes from %o0 to %o1, 16 bytes per pass, each block independently. Key material is taken from %f4-%f54, which this routine never loads; %o3 is not read here. */ | |
346 | /* %o0=input, %o1=output, %o2=len, %o3=key */ | |
347 | 1: ldd [%o0 + 0x00], %f0 | |
348 | ldd [%o0 + 0x08], %f2 | |
349 | add %o0, 0x10, %o0 | |
350 | fxor %f4, %f0, %f0 /* XOR the input block with the values held in %f4/%f6 */ | |
351 | fxor %f6, %f2, %f2 | |
352 | CAMELLIA_6ROUNDS_FL_FLI( 8, 0, 2) | |
353 | CAMELLIA_6ROUNDS_FL_FLI(24, 0, 2) | |
354 | CAMELLIA_6ROUNDS(40, 0, 2) | |
355 | fxor %f52, %f2, %f2 /* final XOR; the halves are swapped on output: %f2 is stored first */ | |
356 | fxor %f54, %f0, %f0 | |
357 | std %f2, [%o1 + 0x00] | |
358 | std %f0, [%o1 + 0x08] | |
359 | subcc %o2, 0x10, %o2 /* the loop exits only when %o2 reaches exactly zero, so len must be a non-zero multiple of 16 */ | |
360 | bne,pt %icc, 1b | |
361 | add %o1, 0x10, %o1 /* delay slot: advance the output pointer */ | |
362 | retl | |
363 | nop | |
364 | ENDPROC(camellia_sparc64_ecb_crypt_3_grand_rounds) | |
365 | ||
366 | .align 32 | |
367 | ENTRY(camellia_sparc64_ecb_crypt_4_grand_rounds) /* Same loop shape as the 3_grand_rounds variant with one more six-round group. %f8-%f22 are reused for key bytes 0xd0-0x10f within each block and reloaded from key bytes 0x10-0x4f before the next block; all other key registers are used without being loaded here. */ | |
368 | /* %o0=input, %o1=output, %o2=len, %o3=key */ | |
369 | 1: ldd [%o0 + 0x00], %f0 | |
370 | ldd [%o0 + 0x08], %f2 | |
371 | add %o0, 0x10, %o0 | |
372 | fxor %f4, %f0, %f0 | |
373 | fxor %f6, %f2, %f2 | |
374 | CAMELLIA_6ROUNDS_FL_FLI( 8, 0, 2) | |
375 | ldd [%o3 + 0xd0], %f8 /* %f8-%f22 were consumed by the group above; reuse them for key bytes 0xd0-0x10f */ | |
376 | ldd [%o3 + 0xd8], %f10 | |
377 | ldd [%o3 + 0xe0], %f12 | |
378 | ldd [%o3 + 0xe8], %f14 | |
379 | ldd [%o3 + 0xf0], %f16 | |
380 | ldd [%o3 + 0xf8], %f18 | |
381 | ldd [%o3 + 0x100], %f20 | |
382 | ldd [%o3 + 0x108], %f22 | |
383 | CAMELLIA_6ROUNDS_FL_FLI(24, 0, 2) | |
384 | CAMELLIA_6ROUNDS_FL_FLI(40, 0, 2) | |
385 | CAMELLIA_F(8, 2, 0, 2) /* last six rounds written out in pairs so each register pair can be reloaded as soon as it has been used */ | |
386 | CAMELLIA_F(10, 0, 2, 0) | |
387 | ldd [%o3 + 0x10], %f8 | |
388 | ldd [%o3 + 0x18], %f10 | |
389 | CAMELLIA_F(12, 2, 0, 2) | |
390 | CAMELLIA_F(14, 0, 2, 0) | |
391 | ldd [%o3 + 0x20], %f12 | |
392 | ldd [%o3 + 0x28], %f14 | |
393 | CAMELLIA_F(16, 2, 0, 2) | |
394 | CAMELLIA_F(18, 0, 2, 0) | |
395 | ldd [%o3 + 0x30], %f16 | |
396 | ldd [%o3 + 0x38], %f18 | |
397 | fxor %f20, %f2, %f2 /* final XOR with key bytes 0x100-0x10f, done before %f20/%f22 are reloaded; halves are swapped on output */ | |
398 | fxor %f22, %f0, %f0 | |
399 | ldd [%o3 + 0x40], %f20 | |
400 | ldd [%o3 + 0x48], %f22 | |
401 | std %f2, [%o1 + 0x00] | |
402 | std %f0, [%o1 + 0x08] | |
403 | subcc %o2, 0x10, %o2 /* the loop exits only when %o2 reaches exactly zero, so len must be a non-zero multiple of 16 */ | |
404 | bne,pt %icc, 1b | |
405 | add %o1, 0x10, %o1 /* delay slot: advance the output pointer */ | |
406 | retl | |
407 | nop | |
408 | ENDPROC(camellia_sparc64_ecb_crypt_4_grand_rounds) | |
409 | ||
410 | .align 32 | |
411 | ENTRY(camellia_sparc64_cbc_encrypt_3_grand_rounds) /* Chained variant of the 3_grand_rounds loop. The chaining value lives in %f60/%f62: it is loaded from %o4, XORed into each input block, replaced by each output block, and written back to %o4 on exit. Key material is taken from %f4-%f54, which this routine never loads; %o3 is not read here. */ | |
412 | /* %o0=input, %o1=output, %o2=len, %o3=key, %o4=IV */ | |
413 | ldd [%o4 + 0x00], %f60 | |
414 | ldd [%o4 + 0x08], %f62 | |
415 | 1: ldd [%o0 + 0x00], %f0 | |
416 | ldd [%o0 + 0x08], %f2 | |
417 | add %o0, 0x10, %o0 | |
418 | fxor %f60, %f0, %f0 /* XOR the chaining value into the input block */ | |
419 | fxor %f62, %f2, %f2 | |
420 | fxor %f4, %f0, %f0 | |
421 | fxor %f6, %f2, %f2 | |
422 | CAMELLIA_6ROUNDS_FL_FLI( 8, 0, 2) | |
423 | CAMELLIA_6ROUNDS_FL_FLI(24, 0, 2) | |
424 | CAMELLIA_6ROUNDS(40, 0, 2) | |
425 | fxor %f52, %f2, %f60 /* the output block is written straight into %f60/%f62, so it is also the next chaining value */ | |
426 | fxor %f54, %f0, %f62 | |
427 | std %f60, [%o1 + 0x00] | |
428 | std %f62, [%o1 + 0x08] | |
429 | subcc %o2, 0x10, %o2 /* the loop exits only when %o2 reaches exactly zero, so len must be a non-zero multiple of 16 */ | |
430 | bne,pt %icc, 1b | |
431 | add %o1, 0x10, %o1 /* delay slot: advance the output pointer */ | |
432 | std %f60, [%o4 + 0x00] /* store the last output block back as the new IV */ | |
433 | retl | |
434 | std %f62, [%o4 + 0x08] /* second half of the IV store, in the retl delay slot */ | |
435 | ENDPROC(camellia_sparc64_cbc_encrypt_3_grand_rounds) | |
436 | ||
437 | .align 32 | |
438 | ENTRY(camellia_sparc64_cbc_encrypt_4_grand_rounds) /* Chained variant of the 4_grand_rounds loop. The chaining value lives in %f60/%f62: loaded from %o4, XORed into each input block, replaced by each output block, written back to %o4 on exit. %f8-%f22 are reused for key bytes 0xd0-0x10f within each block and reloaded from key bytes 0x10-0x4f afterwards. */ | |
439 | /* %o0=input, %o1=output, %o2=len, %o3=key, %o4=IV */ | |
440 | ldd [%o4 + 0x00], %f60 | |
441 | ldd [%o4 + 0x08], %f62 | |
442 | 1: ldd [%o0 + 0x00], %f0 | |
443 | ldd [%o0 + 0x08], %f2 | |
444 | add %o0, 0x10, %o0 | |
445 | fxor %f60, %f0, %f0 /* XOR the chaining value into the input block */ | |
446 | fxor %f62, %f2, %f2 | |
447 | fxor %f4, %f0, %f0 | |
448 | fxor %f6, %f2, %f2 | |
449 | CAMELLIA_6ROUNDS_FL_FLI( 8, 0, 2) | |
450 | ldd [%o3 + 0xd0], %f8 /* %f8-%f22 were consumed by the group above; reuse them for key bytes 0xd0-0x10f */ | |
451 | ldd [%o3 + 0xd8], %f10 | |
452 | ldd [%o3 + 0xe0], %f12 | |
453 | ldd [%o3 + 0xe8], %f14 | |
454 | ldd [%o3 + 0xf0], %f16 | |
455 | ldd [%o3 + 0xf8], %f18 | |
456 | ldd [%o3 + 0x100], %f20 | |
457 | ldd [%o3 + 0x108], %f22 | |
458 | CAMELLIA_6ROUNDS_FL_FLI(24, 0, 2) | |
459 | CAMELLIA_6ROUNDS_FL_FLI(40, 0, 2) | |
460 | CAMELLIA_F(8, 2, 0, 2) /* last six rounds written out in pairs so each register pair can be reloaded as soon as it has been used */ | |
461 | CAMELLIA_F(10, 0, 2, 0) | |
462 | ldd [%o3 + 0x10], %f8 | |
463 | ldd [%o3 + 0x18], %f10 | |
464 | CAMELLIA_F(12, 2, 0, 2) | |
465 | CAMELLIA_F(14, 0, 2, 0) | |
466 | ldd [%o3 + 0x20], %f12 | |
467 | ldd [%o3 + 0x28], %f14 | |
468 | CAMELLIA_F(16, 2, 0, 2) | |
469 | CAMELLIA_F(18, 0, 2, 0) | |
470 | ldd [%o3 + 0x30], %f16 | |
471 | ldd [%o3 + 0x38], %f18 | |
472 | fxor %f20, %f2, %f60 /* the output block is written straight into %f60/%f62, so it is also the next chaining value */ | |
473 | fxor %f22, %f0, %f62 | |
474 | ldd [%o3 + 0x40], %f20 | |
475 | ldd [%o3 + 0x48], %f22 | |
476 | std %f60, [%o1 + 0x00] | |
477 | std %f62, [%o1 + 0x08] | |
478 | subcc %o2, 0x10, %o2 /* the loop exits only when %o2 reaches exactly zero, so len must be a non-zero multiple of 16 */ | |
479 | bne,pt %icc, 1b | |
480 | add %o1, 0x10, %o1 /* delay slot: advance the output pointer */ | |
481 | std %f60, [%o4 + 0x00] /* store the last output block back as the new IV */ | |
482 | retl | |
483 | std %f62, [%o4 + 0x08] /* second half of the IV store, in the retl delay slot */ | |
484 | ENDPROC(camellia_sparc64_cbc_encrypt_4_grand_rounds) | |
485 | ||
486 | .align 32 | |
487 | ENTRY(camellia_sparc64_cbc_decrypt_3_grand_rounds) /* Chained variant of the 3_grand_rounds loop in which the chaining value (%f60/%f62, initially loaded from %o4) is XORed into the result after the rounds, and the raw input block then becomes the next chaining value. Key material is taken from %f4-%f54, which this routine never loads; %o3 is not read here. */ | |
488 | /* %o0=input, %o1=output, %o2=len, %o3=key, %o4=IV */ | |
489 | ldd [%o4 + 0x00], %f60 | |
490 | ldd [%o4 + 0x08], %f62 | |
491 | 1: ldd [%o0 + 0x00], %f56 /* the input block is kept untouched in %f56/%f58 for use as the next chaining value */ | |
492 | ldd [%o0 + 0x08], %f58 | |
493 | add %o0, 0x10, %o0 | |
494 | fxor %f4, %f56, %f0 | |
495 | fxor %f6, %f58, %f2 | |
496 | CAMELLIA_6ROUNDS_FL_FLI( 8, 0, 2) | |
497 | CAMELLIA_6ROUNDS_FL_FLI(24, 0, 2) | |
498 | CAMELLIA_6ROUNDS(40, 0, 2) | |
499 | fxor %f52, %f2, %f2 | |
500 | fxor %f54, %f0, %f0 | |
501 | fxor %f60, %f2, %f2 /* XOR the current chaining value into the result */ | |
502 | fxor %f62, %f0, %f0 | |
503 | fsrc2 %f56, %f60 /* the saved input block becomes the chaining value for the next pass */ | |
504 | fsrc2 %f58, %f62 | |
505 | std %f2, [%o1 + 0x00] | |
506 | std %f0, [%o1 + 0x08] | |
507 | subcc %o2, 0x10, %o2 /* the loop exits only when %o2 reaches exactly zero, so len must be a non-zero multiple of 16 */ | |
508 | bne,pt %icc, 1b | |
509 | add %o1, 0x10, %o1 /* delay slot: advance the output pointer */ | |
510 | std %f60, [%o4 + 0x00] /* store the last input block back as the new IV */ | |
511 | retl | |
512 | std %f62, [%o4 + 0x08] /* second half of the IV store, in the retl delay slot */ | |
513 | ENDPROC(camellia_sparc64_cbc_decrypt_3_grand_rounds) | |
514 | ||
515 | .align 32 | |
516 | ENTRY(camellia_sparc64_cbc_decrypt_4_grand_rounds) /* Chained variant of the 4_grand_rounds loop in which the chaining value (%f60/%f62, initially loaded from %o4) is XORed into the result after the rounds, and the raw input block then becomes the next chaining value. %f8-%f22 are reused for key bytes 0xd0-0x10f within each block and reloaded from key bytes 0x10-0x4f afterwards. */ | |
517 | /* %o0=input, %o1=output, %o2=len, %o3=key, %o4=IV */ | |
518 | ldd [%o4 + 0x00], %f60 | |
519 | ldd [%o4 + 0x08], %f62 | |
520 | 1: ldd [%o0 + 0x00], %f56 /* the input block is kept untouched in %f56/%f58 for use as the next chaining value */ | |
521 | ldd [%o0 + 0x08], %f58 | |
522 | add %o0, 0x10, %o0 | |
523 | fxor %f4, %f56, %f0 | |
524 | fxor %f6, %f58, %f2 | |
525 | CAMELLIA_6ROUNDS_FL_FLI( 8, 0, 2) | |
526 | ldd [%o3 + 0xd0], %f8 /* %f8-%f22 were consumed by the group above; reuse them for key bytes 0xd0-0x10f */ | |
527 | ldd [%o3 + 0xd8], %f10 | |
528 | ldd [%o3 + 0xe0], %f12 | |
529 | ldd [%o3 + 0xe8], %f14 | |
530 | ldd [%o3 + 0xf0], %f16 | |
531 | ldd [%o3 + 0xf8], %f18 | |
532 | ldd [%o3 + 0x100], %f20 | |
533 | ldd [%o3 + 0x108], %f22 | |
534 | CAMELLIA_6ROUNDS_FL_FLI(24, 0, 2) | |
535 | CAMELLIA_6ROUNDS_FL_FLI(40, 0, 2) | |
536 | CAMELLIA_F(8, 2, 0, 2) /* last six rounds written out in pairs so each register pair can be reloaded as soon as it has been used */ | |
537 | CAMELLIA_F(10, 0, 2, 0) | |
538 | ldd [%o3 + 0x10], %f8 | |
539 | ldd [%o3 + 0x18], %f10 | |
540 | CAMELLIA_F(12, 2, 0, 2) | |
541 | CAMELLIA_F(14, 0, 2, 0) | |
542 | ldd [%o3 + 0x20], %f12 | |
543 | ldd [%o3 + 0x28], %f14 | |
544 | CAMELLIA_F(16, 2, 0, 2) | |
545 | CAMELLIA_F(18, 0, 2, 0) | |
546 | ldd [%o3 + 0x30], %f16 | |
547 | ldd [%o3 + 0x38], %f18 | |
548 | fxor %f20, %f2, %f2 /* final XOR with key bytes 0x100-0x10f, done before %f20/%f22 are reloaded */ | |
549 | fxor %f22, %f0, %f0 | |
550 | ldd [%o3 + 0x40], %f20 | |
551 | ldd [%o3 + 0x48], %f22 | |
552 | fxor %f60, %f2, %f2 /* XOR the current chaining value into the result */ | |
553 | fxor %f62, %f0, %f0 | |
554 | fsrc2 %f56, %f60 /* the saved input block becomes the chaining value for the next pass */ | |
555 | fsrc2 %f58, %f62 | |
556 | std %f2, [%o1 + 0x00] | |
557 | std %f0, [%o1 + 0x08] | |
558 | subcc %o2, 0x10, %o2 /* the loop exits only when %o2 reaches exactly zero, so len must be a non-zero multiple of 16 */ | |
559 | bne,pt %icc, 1b | |
560 | add %o1, 0x10, %o1 /* delay slot: advance the output pointer */ | |
561 | std %f60, [%o4 + 0x00] /* store the last input block back as the new IV */ | |
562 | retl | |
563 | std %f62, [%o4 + 0x08] /* second half of the IV store, in the retl delay slot */ | |
564 | ENDPROC(camellia_sparc64_cbc_decrypt_4_grand_rounds) | |