// SPDX-License-Identifier: GPL-2.0-or-later
/*
 * Support for Intel AES-NI instructions. This file contains glue
 * code; the real AES implementation is in intel-aes_asm.S.
 *
 * Copyright (C) 2008, Intel Corp.
 *    Author: Huang Ying <ying.huang@intel.com>
 *
 * Added RFC4106 AES-GCM support for 128-bit keys under the AEAD
 * interface for 64-bit kernels.
 *    Authors: Adrian Hoban <adrian.hoban@intel.com>
 *             Gabriele Paoloni <gabriele.paoloni@intel.com>
 *             Tadeusz Struk (tadeusz.struk@intel.com)
 *             Aidan O'Mahony (aidan.o.mahony@intel.com)
 *    Copyright (c) 2010, Intel Corporation.
 */

#include <linux/hardirq.h>
#include <linux/types.h>
#include <linux/module.h>
#include <linux/err.h>
#include <crypto/algapi.h>
#include <crypto/aes.h>
#include <crypto/ctr.h>
#include <crypto/b128ops.h>
#include <crypto/gcm.h>
#include <crypto/xts.h>
#include <asm/cpu_device_id.h>
#include <asm/crypto/aes.h>
#include <crypto/scatterwalk.h>
#include <crypto/internal/aead.h>
#include <crypto/internal/simd.h>
#include <crypto/internal/skcipher.h>
#include <linux/workqueue.h>
#include <linux/spinlock.h>
#ifdef CONFIG_X86_64
#include <asm/crypto/glue_helper.h>
#endif

#define AESNI_ALIGN	16
#define AESNI_ALIGN_ATTR __attribute__ ((__aligned__(AESNI_ALIGN)))
#define AES_BLOCK_MASK	(~(AES_BLOCK_SIZE - 1))
#define RFC4106_HASH_SUBKEY_SIZE 16
#define AESNI_ALIGN_EXTRA ((AESNI_ALIGN - 1) & ~(CRYPTO_MINALIGN - 1))
#define CRYPTO_AES_CTX_SIZE (sizeof(struct crypto_aes_ctx) + AESNI_ALIGN_EXTRA)
#define XTS_AES_CTX_SIZE (sizeof(struct aesni_xts_ctx) + AESNI_ALIGN_EXTRA)

/* This data is stored at the end of the crypto_tfm struct.
 * It's a kind of per-"session" data storage location.
 * This needs to be 16-byte aligned.
 */
struct aesni_rfc4106_gcm_ctx {
	u8 hash_subkey[16] AESNI_ALIGN_ATTR;
	struct crypto_aes_ctx aes_key_expanded AESNI_ALIGN_ATTR;
	u8 nonce[4];
};

struct generic_gcmaes_ctx {
	u8 hash_subkey[16] AESNI_ALIGN_ATTR;
	struct crypto_aes_ctx aes_key_expanded AESNI_ALIGN_ATTR;
};

struct aesni_xts_ctx {
	u8 raw_tweak_ctx[sizeof(struct crypto_aes_ctx)] AESNI_ALIGN_ATTR;
	u8 raw_crypt_ctx[sizeof(struct crypto_aes_ctx)] AESNI_ALIGN_ATTR;
};

#define GCM_BLOCK_LEN 16

struct gcm_context_data {
	/* init, update and finalize context data */
	u8 aad_hash[GCM_BLOCK_LEN];
	u64 aad_length;
	u64 in_length;
	u8 partial_block_enc_key[GCM_BLOCK_LEN];
	u8 orig_IV[GCM_BLOCK_LEN];
	u8 current_counter[GCM_BLOCK_LEN];
	u64 partial_block_len;
	u64 unused;
	u8 hash_keys[GCM_BLOCK_LEN * 16];
};

asmlinkage int aesni_set_key(struct crypto_aes_ctx *ctx, const u8 *in_key,
			     unsigned int key_len);
asmlinkage void aesni_enc(struct crypto_aes_ctx *ctx, u8 *out,
			  const u8 *in);
asmlinkage void aesni_dec(struct crypto_aes_ctx *ctx, u8 *out,
			  const u8 *in);
asmlinkage void aesni_ecb_enc(struct crypto_aes_ctx *ctx, u8 *out,
			      const u8 *in, unsigned int len);
asmlinkage void aesni_ecb_dec(struct crypto_aes_ctx *ctx, u8 *out,
			      const u8 *in, unsigned int len);
asmlinkage void aesni_cbc_enc(struct crypto_aes_ctx *ctx, u8 *out,
			      const u8 *in, unsigned int len, u8 *iv);
asmlinkage void aesni_cbc_dec(struct crypto_aes_ctx *ctx, u8 *out,
			      const u8 *in, unsigned int len, u8 *iv);

#define AVX_GEN2_OPTSIZE 640
#define AVX_GEN4_OPTSIZE 4096

#ifdef CONFIG_X86_64

static void (*aesni_ctr_enc_tfm)(struct crypto_aes_ctx *ctx, u8 *out,
			      const u8 *in, unsigned int len, u8 *iv);
asmlinkage void aesni_ctr_enc(struct crypto_aes_ctx *ctx, u8 *out,
			      const u8 *in, unsigned int len, u8 *iv);

asmlinkage void aesni_xts_crypt8(struct crypto_aes_ctx *ctx, u8 *out,
				 const u8 *in, bool enc, u8 *iv);

/* asmlinkage void aesni_gcm_enc()
 * void *ctx, AES Key schedule. Starts on a 16 byte boundary.
 * struct gcm_context_data. May be uninitialized.
 * u8 *out, Ciphertext output. Encrypt in-place is allowed.
 * const u8 *in, Plaintext input
 * unsigned long plaintext_len, Length of data in bytes for encryption.
 * u8 *iv, Pre-counter block j0: 12 byte IV concatenated with 0x00000001.
 *         16-byte aligned pointer.
 * u8 *hash_subkey, the Hash sub key input. Data starts on a 16-byte boundary.
 * const u8 *aad, Additional Authentication Data (AAD)
 * unsigned long aad_len, Length of AAD in bytes.
 * u8 *auth_tag, Authenticated Tag output.
 * unsigned long auth_tag_len), Authenticated Tag Length in bytes.
 *         Valid values are 16 (most likely), 12 or 8.
 */
asmlinkage void aesni_gcm_enc(void *ctx,
			struct gcm_context_data *gdata, u8 *out,
			const u8 *in, unsigned long plaintext_len, u8 *iv,
			u8 *hash_subkey, const u8 *aad, unsigned long aad_len,
			u8 *auth_tag, unsigned long auth_tag_len);

/* asmlinkage void aesni_gcm_dec()
 * void *ctx, AES Key schedule. Starts on a 16 byte boundary.
 * struct gcm_context_data. May be uninitialized.
 * u8 *out, Plaintext output. Decrypt in-place is allowed.
 * const u8 *in, Ciphertext input
 * unsigned long ciphertext_len, Length of data in bytes for decryption.
 * u8 *iv, Pre-counter block j0: 12 byte IV concatenated with 0x00000001.
 *         16-byte aligned pointer.
 * u8 *hash_subkey, the Hash sub key input. Data starts on a 16-byte boundary.
 * const u8 *aad, Additional Authentication Data (AAD)
 * unsigned long aad_len, Length of AAD in bytes. With RFC4106 this is going
 *         to be 8 or 12 bytes.
 * u8 *auth_tag, Authenticated Tag output.
 * unsigned long auth_tag_len) Authenticated Tag Length in bytes.
 *         Valid values are 16 (most likely), 12 or 8.
 */
asmlinkage void aesni_gcm_dec(void *ctx,
			struct gcm_context_data *gdata, u8 *out,
			const u8 *in, unsigned long ciphertext_len, u8 *iv,
			u8 *hash_subkey, const u8 *aad, unsigned long aad_len,
			u8 *auth_tag, unsigned long auth_tag_len);

/* Scatter / Gather routines, with args similar to above */
asmlinkage void aesni_gcm_init(void *ctx,
			       struct gcm_context_data *gdata,
			       u8 *iv,
			       u8 *hash_subkey, const u8 *aad,
			       unsigned long aad_len);
asmlinkage void aesni_gcm_enc_update(void *ctx,
				     struct gcm_context_data *gdata, u8 *out,
				     const u8 *in, unsigned long plaintext_len);
asmlinkage void aesni_gcm_dec_update(void *ctx,
				     struct gcm_context_data *gdata, u8 *out,
				     const u8 *in,
				     unsigned long ciphertext_len);
asmlinkage void aesni_gcm_finalize(void *ctx,
				   struct gcm_context_data *gdata,
				   u8 *auth_tag, unsigned long auth_tag_len);

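/*
 * A typical streaming call sequence for the scatter/gather routines,
 * sketched here for reference (the actual chunking and FPU handling
 * live in gcmaes_crypt_by_sg() below):
 *
 *	aesni_gcm_init(ctx, &data, iv, hash_subkey, aad, aad_len);
 *	aesni_gcm_enc_update(ctx, &data, out, in, chunk_len);  // per chunk
 *	aesni_gcm_finalize(ctx, &data, auth_tag, auth_tag_len);
 */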
static const struct aesni_gcm_tfm_s {
	void (*init)(void *ctx, struct gcm_context_data *gdata, u8 *iv,
		     u8 *hash_subkey, const u8 *aad, unsigned long aad_len);
	void (*enc_update)(void *ctx, struct gcm_context_data *gdata, u8 *out,
			   const u8 *in, unsigned long plaintext_len);
	void (*dec_update)(void *ctx, struct gcm_context_data *gdata, u8 *out,
			   const u8 *in, unsigned long ciphertext_len);
	void (*finalize)(void *ctx, struct gcm_context_data *gdata,
			 u8 *auth_tag, unsigned long auth_tag_len);
} *aesni_gcm_tfm;

static const struct aesni_gcm_tfm_s aesni_gcm_tfm_sse = {
	.init = &aesni_gcm_init,
	.enc_update = &aesni_gcm_enc_update,
	.dec_update = &aesni_gcm_dec_update,
	.finalize = &aesni_gcm_finalize,
};

#ifdef CONFIG_AS_AVX
asmlinkage void aes_ctr_enc_128_avx_by8(const u8 *in, u8 *iv,
		void *keys, u8 *out, unsigned int num_bytes);
asmlinkage void aes_ctr_enc_192_avx_by8(const u8 *in, u8 *iv,
		void *keys, u8 *out, unsigned int num_bytes);
asmlinkage void aes_ctr_enc_256_avx_by8(const u8 *in, u8 *iv,
		void *keys, u8 *out, unsigned int num_bytes);

/*
 * asmlinkage void aesni_gcm_init_avx_gen2()
 * gcm_data *my_ctx_data, context data
 * u8 *hash_subkey, the Hash sub key input. Data starts on a 16-byte boundary.
 */
asmlinkage void aesni_gcm_init_avx_gen2(void *my_ctx_data,
					struct gcm_context_data *gdata,
					u8 *iv,
					u8 *hash_subkey,
					const u8 *aad,
					unsigned long aad_len);

asmlinkage void aesni_gcm_enc_update_avx_gen2(void *ctx,
				struct gcm_context_data *gdata, u8 *out,
				const u8 *in, unsigned long plaintext_len);
asmlinkage void aesni_gcm_dec_update_avx_gen2(void *ctx,
				struct gcm_context_data *gdata, u8 *out,
				const u8 *in,
				unsigned long ciphertext_len);
asmlinkage void aesni_gcm_finalize_avx_gen2(void *ctx,
				struct gcm_context_data *gdata,
				u8 *auth_tag, unsigned long auth_tag_len);

asmlinkage void aesni_gcm_enc_avx_gen2(void *ctx,
				struct gcm_context_data *gdata, u8 *out,
				const u8 *in, unsigned long plaintext_len, u8 *iv,
				const u8 *aad, unsigned long aad_len,
				u8 *auth_tag, unsigned long auth_tag_len);

asmlinkage void aesni_gcm_dec_avx_gen2(void *ctx,
				struct gcm_context_data *gdata, u8 *out,
				const u8 *in, unsigned long ciphertext_len, u8 *iv,
				const u8 *aad, unsigned long aad_len,
				u8 *auth_tag, unsigned long auth_tag_len);

static const struct aesni_gcm_tfm_s aesni_gcm_tfm_avx_gen2 = {
	.init = &aesni_gcm_init_avx_gen2,
	.enc_update = &aesni_gcm_enc_update_avx_gen2,
	.dec_update = &aesni_gcm_dec_update_avx_gen2,
	.finalize = &aesni_gcm_finalize_avx_gen2,
};
#endif

#ifdef CONFIG_AS_AVX2
/*
 * asmlinkage void aesni_gcm_init_avx_gen4()
 * gcm_data *my_ctx_data, context data
 * u8 *hash_subkey, the Hash sub key input. Data starts on a 16-byte boundary.
 */
asmlinkage void aesni_gcm_init_avx_gen4(void *my_ctx_data,
					struct gcm_context_data *gdata,
					u8 *iv,
					u8 *hash_subkey,
					const u8 *aad,
					unsigned long aad_len);

asmlinkage void aesni_gcm_enc_update_avx_gen4(void *ctx,
				struct gcm_context_data *gdata, u8 *out,
				const u8 *in, unsigned long plaintext_len);
asmlinkage void aesni_gcm_dec_update_avx_gen4(void *ctx,
				struct gcm_context_data *gdata, u8 *out,
				const u8 *in,
				unsigned long ciphertext_len);
asmlinkage void aesni_gcm_finalize_avx_gen4(void *ctx,
				struct gcm_context_data *gdata,
				u8 *auth_tag, unsigned long auth_tag_len);

asmlinkage void aesni_gcm_enc_avx_gen4(void *ctx,
				struct gcm_context_data *gdata, u8 *out,
				const u8 *in, unsigned long plaintext_len, u8 *iv,
				const u8 *aad, unsigned long aad_len,
				u8 *auth_tag, unsigned long auth_tag_len);

asmlinkage void aesni_gcm_dec_avx_gen4(void *ctx,
				struct gcm_context_data *gdata, u8 *out,
				const u8 *in, unsigned long ciphertext_len, u8 *iv,
				const u8 *aad, unsigned long aad_len,
				u8 *auth_tag, unsigned long auth_tag_len);

static const struct aesni_gcm_tfm_s aesni_gcm_tfm_avx_gen4 = {
	.init = &aesni_gcm_init_avx_gen4,
	.enc_update = &aesni_gcm_enc_update_avx_gen4,
	.dec_update = &aesni_gcm_dec_update_avx_gen4,
	.finalize = &aesni_gcm_finalize_avx_gen4,
};
#endif

static inline struct
aesni_rfc4106_gcm_ctx *aesni_rfc4106_gcm_ctx_get(struct crypto_aead *tfm)
{
	unsigned long align = AESNI_ALIGN;

	if (align <= crypto_tfm_ctx_alignment())
		align = 1;
	return PTR_ALIGN(crypto_aead_ctx(tfm), align);
}

static inline struct
generic_gcmaes_ctx *generic_gcmaes_ctx_get(struct crypto_aead *tfm)
{
	unsigned long align = AESNI_ALIGN;

	if (align <= crypto_tfm_ctx_alignment())
		align = 1;
	return PTR_ALIGN(crypto_aead_ctx(tfm), align);
}
#endif

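/*
 * The crypto layer only guarantees CRYPTO_MINALIGN alignment for the tfm
 * context; the AESNI_ALIGN_EXTRA slack reserved in CRYPTO_AES_CTX_SIZE
 * lets aes_ctx() bump the pointer up to the 16-byte boundary that the
 * AES-NI assembler routines expect.
 */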
static inline struct crypto_aes_ctx *aes_ctx(void *raw_ctx)
{
	unsigned long addr = (unsigned long)raw_ctx;
	unsigned long align = AESNI_ALIGN;

	if (align <= crypto_tfm_ctx_alignment())
		align = 1;
	return (struct crypto_aes_ctx *)ALIGN(addr, align);
}

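/*
 * Expand the user-supplied key. When SIMD is not usable (e.g. in hard
 * interrupt context), fall back to the generic C key expansion instead
 * of the AES-NI instruction based one.
 */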
static int aes_set_key_common(struct crypto_tfm *tfm, void *raw_ctx,
			      const u8 *in_key, unsigned int key_len)
{
	struct crypto_aes_ctx *ctx = aes_ctx(raw_ctx);
	u32 *flags = &tfm->crt_flags;
	int err;

	if (key_len != AES_KEYSIZE_128 && key_len != AES_KEYSIZE_192 &&
	    key_len != AES_KEYSIZE_256) {
		*flags |= CRYPTO_TFM_RES_BAD_KEY_LEN;
		return -EINVAL;
	}

	if (!crypto_simd_usable())
		err = crypto_aes_expand_key(ctx, in_key, key_len);
	else {
		kernel_fpu_begin();
		err = aesni_set_key(ctx, in_key, key_len);
		kernel_fpu_end();
	}

	return err;
}

static int aes_set_key(struct crypto_tfm *tfm, const u8 *in_key,
		       unsigned int key_len)
{
	return aes_set_key_common(tfm, crypto_tfm_ctx(tfm), in_key, key_len);
}

static void aesni_encrypt(struct crypto_tfm *tfm, u8 *dst, const u8 *src)
{
	struct crypto_aes_ctx *ctx = aes_ctx(crypto_tfm_ctx(tfm));

	if (!crypto_simd_usable())
		crypto_aes_encrypt_x86(ctx, dst, src);
	else {
		kernel_fpu_begin();
		aesni_enc(ctx, dst, src);
		kernel_fpu_end();
	}
}

static void aesni_decrypt(struct crypto_tfm *tfm, u8 *dst, const u8 *src)
{
	struct crypto_aes_ctx *ctx = aes_ctx(crypto_tfm_ctx(tfm));

	if (!crypto_simd_usable())
		crypto_aes_decrypt_x86(ctx, dst, src);
	else {
		kernel_fpu_begin();
		aesni_dec(ctx, dst, src);
		kernel_fpu_end();
	}
}

static int aesni_skcipher_setkey(struct crypto_skcipher *tfm, const u8 *key,
				 unsigned int len)
{
	return aes_set_key_common(crypto_skcipher_tfm(tfm),
				  crypto_skcipher_ctx(tfm), key, len);
}

static int ecb_encrypt(struct skcipher_request *req)
{
	struct crypto_skcipher *tfm = crypto_skcipher_reqtfm(req);
	struct crypto_aes_ctx *ctx = aes_ctx(crypto_skcipher_ctx(tfm));
	struct skcipher_walk walk;
	unsigned int nbytes;
	int err;

	err = skcipher_walk_virt(&walk, req, true);

	kernel_fpu_begin();
	while ((nbytes = walk.nbytes)) {
		aesni_ecb_enc(ctx, walk.dst.virt.addr, walk.src.virt.addr,
			      nbytes & AES_BLOCK_MASK);
		nbytes &= AES_BLOCK_SIZE - 1;
		err = skcipher_walk_done(&walk, nbytes);
	}
	kernel_fpu_end();

	return err;
}

static int ecb_decrypt(struct skcipher_request *req)
{
	struct crypto_skcipher *tfm = crypto_skcipher_reqtfm(req);
	struct crypto_aes_ctx *ctx = aes_ctx(crypto_skcipher_ctx(tfm));
	struct skcipher_walk walk;
	unsigned int nbytes;
	int err;

	err = skcipher_walk_virt(&walk, req, true);

	kernel_fpu_begin();
	while ((nbytes = walk.nbytes)) {
		aesni_ecb_dec(ctx, walk.dst.virt.addr, walk.src.virt.addr,
			      nbytes & AES_BLOCK_MASK);
		nbytes &= AES_BLOCK_SIZE - 1;
		err = skcipher_walk_done(&walk, nbytes);
	}
	kernel_fpu_end();

	return err;
}

static int cbc_encrypt(struct skcipher_request *req)
{
	struct crypto_skcipher *tfm = crypto_skcipher_reqtfm(req);
	struct crypto_aes_ctx *ctx = aes_ctx(crypto_skcipher_ctx(tfm));
	struct skcipher_walk walk;
	unsigned int nbytes;
	int err;

	err = skcipher_walk_virt(&walk, req, true);

	kernel_fpu_begin();
	while ((nbytes = walk.nbytes)) {
		aesni_cbc_enc(ctx, walk.dst.virt.addr, walk.src.virt.addr,
			      nbytes & AES_BLOCK_MASK, walk.iv);
		nbytes &= AES_BLOCK_SIZE - 1;
		err = skcipher_walk_done(&walk, nbytes);
	}
	kernel_fpu_end();

	return err;
}

static int cbc_decrypt(struct skcipher_request *req)
{
	struct crypto_skcipher *tfm = crypto_skcipher_reqtfm(req);
	struct crypto_aes_ctx *ctx = aes_ctx(crypto_skcipher_ctx(tfm));
	struct skcipher_walk walk;
	unsigned int nbytes;
	int err;

	err = skcipher_walk_virt(&walk, req, true);

	kernel_fpu_begin();
	while ((nbytes = walk.nbytes)) {
		aesni_cbc_dec(ctx, walk.dst.virt.addr, walk.src.virt.addr,
			      nbytes & AES_BLOCK_MASK, walk.iv);
		nbytes &= AES_BLOCK_SIZE - 1;
		err = skcipher_walk_done(&walk, nbytes);
	}
	kernel_fpu_end();

	return err;
}

#ifdef CONFIG_X86_64

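/*
 * CTR tail handling: encrypt the current counter block once and XOR
 * only the remaining nbytes of keystream into the output.
 */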
static void ctr_crypt_final(struct crypto_aes_ctx *ctx,
			    struct skcipher_walk *walk)
{
	u8 *ctrblk = walk->iv;
	u8 keystream[AES_BLOCK_SIZE];
	u8 *src = walk->src.virt.addr;
	u8 *dst = walk->dst.virt.addr;
	unsigned int nbytes = walk->nbytes;

	aesni_enc(ctx, keystream, ctrblk);
	crypto_xor_cpy(dst, keystream, src, nbytes);

	crypto_inc(ctrblk, AES_BLOCK_SIZE);
}

#ifdef CONFIG_AS_AVX
static void aesni_ctr_enc_avx_tfm(struct crypto_aes_ctx *ctx, u8 *out,
			      const u8 *in, unsigned int len, u8 *iv)
{
	/*
	 * based on key length, override with the by8 version
	 * of ctr mode encryption/decryption for improved performance;
	 * aes_set_key_common() ensures that key length is one of
	 * {128, 192, 256} bits
	 */
	if (ctx->key_length == AES_KEYSIZE_128)
		aes_ctr_enc_128_avx_by8(in, iv, (void *)ctx, out, len);
	else if (ctx->key_length == AES_KEYSIZE_192)
		aes_ctr_enc_192_avx_by8(in, iv, (void *)ctx, out, len);
	else
		aes_ctr_enc_256_avx_by8(in, iv, (void *)ctx, out, len);
}
#endif

static int ctr_crypt(struct skcipher_request *req)
{
	struct crypto_skcipher *tfm = crypto_skcipher_reqtfm(req);
	struct crypto_aes_ctx *ctx = aes_ctx(crypto_skcipher_ctx(tfm));
	struct skcipher_walk walk;
	unsigned int nbytes;
	int err;

	err = skcipher_walk_virt(&walk, req, true);

	kernel_fpu_begin();
	while ((nbytes = walk.nbytes) >= AES_BLOCK_SIZE) {
		aesni_ctr_enc_tfm(ctx, walk.dst.virt.addr, walk.src.virt.addr,
				  nbytes & AES_BLOCK_MASK, walk.iv);
		nbytes &= AES_BLOCK_SIZE - 1;
		err = skcipher_walk_done(&walk, nbytes);
	}
	if (walk.nbytes) {
		ctr_crypt_final(ctx, &walk);
		err = skcipher_walk_done(&walk, 0);
	}
	kernel_fpu_end();

	return err;
}
#endif

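/*
 * An XTS key is two AES keys back to back: the first half keys the
 * data cipher, the second half keys the tweak cipher.
 */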
static int xts_aesni_setkey(struct crypto_skcipher *tfm, const u8 *key,
			    unsigned int keylen)
{
	struct aesni_xts_ctx *ctx = crypto_skcipher_ctx(tfm);
	int err;

	err = xts_verify_key(tfm, key, keylen);
	if (err)
		return err;

	keylen /= 2;

	/* first half of xts-key is for crypt */
	err = aes_set_key_common(crypto_skcipher_tfm(tfm), ctx->raw_crypt_ctx,
				 key, keylen);
	if (err)
		return err;

	/* second half of xts-key is for tweak */
	return aes_set_key_common(crypto_skcipher_tfm(tfm), ctx->raw_tweak_ctx,
				  key + keylen, keylen);
}

#ifdef CONFIG_X86_64

static void aesni_xts_tweak(void *ctx, u8 *out, const u8 *in)
{
	aesni_enc(ctx, out, in);
}

static void aesni_xts_enc(void *ctx, u128 *dst, const u128 *src, le128 *iv)
{
	glue_xts_crypt_128bit_one(ctx, dst, src, iv, GLUE_FUNC_CAST(aesni_enc));
}

static void aesni_xts_dec(void *ctx, u128 *dst, const u128 *src, le128 *iv)
{
	glue_xts_crypt_128bit_one(ctx, dst, src, iv, GLUE_FUNC_CAST(aesni_dec));
}

static void aesni_xts_enc8(void *ctx, u128 *dst, const u128 *src, le128 *iv)
{
	aesni_xts_crypt8(ctx, (u8 *)dst, (const u8 *)src, true, (u8 *)iv);
}

static void aesni_xts_dec8(void *ctx, u128 *dst, const u128 *src, le128 *iv)
{
	aesni_xts_crypt8(ctx, (u8 *)dst, (const u8 *)src, false, (u8 *)iv);
}

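/*
 * glue_helper dispatch tables: process eight blocks at a time through
 * the asm routine where possible, falling back to one block at a time
 * for the tail.
 */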
static const struct common_glue_ctx aesni_enc_xts = {
	.num_funcs = 2,
	.fpu_blocks_limit = 1,

	.funcs = { {
		.num_blocks = 8,
		.fn_u = { .xts = GLUE_XTS_FUNC_CAST(aesni_xts_enc8) }
	}, {
		.num_blocks = 1,
		.fn_u = { .xts = GLUE_XTS_FUNC_CAST(aesni_xts_enc) }
	} }
};

static const struct common_glue_ctx aesni_dec_xts = {
	.num_funcs = 2,
	.fpu_blocks_limit = 1,

	.funcs = { {
		.num_blocks = 8,
		.fn_u = { .xts = GLUE_XTS_FUNC_CAST(aesni_xts_dec8) }
	}, {
		.num_blocks = 1,
		.fn_u = { .xts = GLUE_XTS_FUNC_CAST(aesni_xts_dec) }
	} }
};

static int xts_encrypt(struct skcipher_request *req)
{
	struct crypto_skcipher *tfm = crypto_skcipher_reqtfm(req);
	struct aesni_xts_ctx *ctx = crypto_skcipher_ctx(tfm);

	return glue_xts_req_128bit(&aesni_enc_xts, req,
				   XTS_TWEAK_CAST(aesni_xts_tweak),
				   aes_ctx(ctx->raw_tweak_ctx),
				   aes_ctx(ctx->raw_crypt_ctx));
}

static int xts_decrypt(struct skcipher_request *req)
{
	struct crypto_skcipher *tfm = crypto_skcipher_reqtfm(req);
	struct aesni_xts_ctx *ctx = crypto_skcipher_ctx(tfm);

	return glue_xts_req_128bit(&aesni_dec_xts, req,
				   XTS_TWEAK_CAST(aesni_xts_tweak),
				   aes_ctx(ctx->raw_tweak_ctx),
				   aes_ctx(ctx->raw_crypt_ctx));
}

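/*
 * Derive the GHASH subkey H = E_K(0^128) required by GCM: encrypt an
 * all-zero block with a temporary "aes" cipher handle keyed with the
 * session key.
 */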
static int
rfc4106_set_hash_subkey(u8 *hash_subkey, const u8 *key, unsigned int key_len)
{
	struct crypto_cipher *tfm;
	int ret;

	tfm = crypto_alloc_cipher("aes", 0, 0);
	if (IS_ERR(tfm))
		return PTR_ERR(tfm);

	ret = crypto_cipher_setkey(tfm, key, key_len);
	if (ret)
		goto out_free_cipher;

	/* Clear the data in the hash sub key container to zero.
	 * We want to cipher all zeros to create the hash sub key.
	 */
	memset(hash_subkey, 0, RFC4106_HASH_SUBKEY_SIZE);

	crypto_cipher_encrypt_one(tfm, hash_subkey, hash_subkey);

out_free_cipher:
	crypto_free_cipher(tfm);
	return ret;
}

static int common_rfc4106_set_key(struct crypto_aead *aead, const u8 *key,
				  unsigned int key_len)
{
	struct aesni_rfc4106_gcm_ctx *ctx = aesni_rfc4106_gcm_ctx_get(aead);

	if (key_len < 4) {
		crypto_aead_set_flags(aead, CRYPTO_TFM_RES_BAD_KEY_LEN);
		return -EINVAL;
	}
	/* Account for the 4-byte nonce at the end of the key. */
	key_len -= 4;

	memcpy(ctx->nonce, key + key_len, sizeof(ctx->nonce));

	return aes_set_key_common(crypto_aead_tfm(aead),
				  &ctx->aes_key_expanded, key, key_len) ?:
	       rfc4106_set_hash_subkey(ctx->hash_subkey, key, key_len);
}

/* This is the Integrity Check Value (aka the authentication tag) length and can
 * be 8, 12 or 16 bytes long. */
static int common_rfc4106_set_authsize(struct crypto_aead *aead,
				       unsigned int authsize)
{
	switch (authsize) {
	case 8:
	case 12:
	case 16:
		break;
	default:
		return -EINVAL;
	}

	return 0;
}

static int generic_gcmaes_set_authsize(struct crypto_aead *tfm,
				       unsigned int authsize)
{
	switch (authsize) {
	case 4:
	case 8:
	case 12:
	case 13:
	case 14:
	case 15:
	case 16:
		break;
	default:
		return -EINVAL;
	}

	return 0;
}

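/*
 * One-shot scatter/gather GCM: select the widest asm implementation
 * worth using for this request size, linearize the AAD, then walk the
 * src/dst scatterlists one mappable chunk at a time between init and
 * finalize, all inside a single kernel_fpu_begin()/end() section.
 */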
static int gcmaes_crypt_by_sg(bool enc, struct aead_request *req,
			      unsigned int assoclen, u8 *hash_subkey,
			      u8 *iv, void *aes_ctx)
{
	struct crypto_aead *tfm = crypto_aead_reqtfm(req);
	unsigned long auth_tag_len = crypto_aead_authsize(tfm);
	const struct aesni_gcm_tfm_s *gcm_tfm = aesni_gcm_tfm;
	struct gcm_context_data data AESNI_ALIGN_ATTR;
	struct scatter_walk dst_sg_walk = {};
	unsigned long left = req->cryptlen;
	unsigned long len, srclen, dstlen;
	struct scatter_walk assoc_sg_walk;
	struct scatter_walk src_sg_walk;
	struct scatterlist src_start[2];
	struct scatterlist dst_start[2];
	struct scatterlist *src_sg;
	struct scatterlist *dst_sg;
	u8 *src, *dst, *assoc;
	u8 *assocmem = NULL;
	u8 authTag[16];

	if (!enc)
		left -= auth_tag_len;

#ifdef CONFIG_AS_AVX2
	if (left < AVX_GEN4_OPTSIZE && gcm_tfm == &aesni_gcm_tfm_avx_gen4)
		gcm_tfm = &aesni_gcm_tfm_avx_gen2;
#endif
#ifdef CONFIG_AS_AVX
	if (left < AVX_GEN2_OPTSIZE && gcm_tfm == &aesni_gcm_tfm_avx_gen2)
		gcm_tfm = &aesni_gcm_tfm_sse;
#endif

	/* Linearize assoc, if not already linear */
	if (req->src->length >= assoclen && req->src->length &&
	    (!PageHighMem(sg_page(req->src)) ||
	     req->src->offset + req->src->length <= PAGE_SIZE)) {
		scatterwalk_start(&assoc_sg_walk, req->src);
		assoc = scatterwalk_map(&assoc_sg_walk);
	} else {
		/* assoc can be any length, so must be on heap */
		assocmem = kmalloc(assoclen, GFP_ATOMIC);
		if (unlikely(!assocmem))
			return -ENOMEM;
		assoc = assocmem;

		scatterwalk_map_and_copy(assoc, req->src, 0, assoclen, 0);
	}

	if (left) {
		src_sg = scatterwalk_ffwd(src_start, req->src, req->assoclen);
		scatterwalk_start(&src_sg_walk, src_sg);
		if (req->src != req->dst) {
			dst_sg = scatterwalk_ffwd(dst_start, req->dst,
						  req->assoclen);
			scatterwalk_start(&dst_sg_walk, dst_sg);
		}
	}

	kernel_fpu_begin();
	gcm_tfm->init(aes_ctx, &data, iv,
		      hash_subkey, assoc, assoclen);
	if (req->src != req->dst) {
		while (left) {
			src = scatterwalk_map(&src_sg_walk);
			dst = scatterwalk_map(&dst_sg_walk);
			srclen = scatterwalk_clamp(&src_sg_walk, left);
			dstlen = scatterwalk_clamp(&dst_sg_walk, left);
			len = min(srclen, dstlen);
			if (len) {
				if (enc)
					gcm_tfm->enc_update(aes_ctx, &data,
							    dst, src, len);
				else
					gcm_tfm->dec_update(aes_ctx, &data,
							    dst, src, len);
			}
			left -= len;

			scatterwalk_unmap(src);
			scatterwalk_unmap(dst);
			scatterwalk_advance(&src_sg_walk, len);
			scatterwalk_advance(&dst_sg_walk, len);
			scatterwalk_done(&src_sg_walk, 0, left);
			scatterwalk_done(&dst_sg_walk, 1, left);
		}
	} else {
		while (left) {
			dst = src = scatterwalk_map(&src_sg_walk);
			len = scatterwalk_clamp(&src_sg_walk, left);
			if (len) {
				if (enc)
					gcm_tfm->enc_update(aes_ctx, &data,
							    src, src, len);
				else
					gcm_tfm->dec_update(aes_ctx, &data,
							    src, src, len);
			}
			left -= len;
			scatterwalk_unmap(src);
			scatterwalk_advance(&src_sg_walk, len);
			scatterwalk_done(&src_sg_walk, 1, left);
		}
	}
	gcm_tfm->finalize(aes_ctx, &data, authTag, auth_tag_len);
	kernel_fpu_end();

	if (!assocmem)
		scatterwalk_unmap(assoc);
	else
		kfree(assocmem);

	if (!enc) {
		u8 authTagMsg[16];

		/* Copy out original authTag */
		scatterwalk_map_and_copy(authTagMsg, req->src,
					 req->assoclen + req->cryptlen -
					 auth_tag_len,
					 auth_tag_len, 0);

		/* Compare generated tag with passed in tag. */
		return crypto_memneq(authTagMsg, authTag, auth_tag_len) ?
			-EBADMSG : 0;
	}

	/* Copy in the authTag */
	scatterwalk_map_and_copy(authTag, req->dst,
				 req->assoclen + req->cryptlen,
				 auth_tag_len, 1);

	return 0;
}

static int gcmaes_encrypt(struct aead_request *req, unsigned int assoclen,
			  u8 *hash_subkey, u8 *iv, void *aes_ctx)
{
	return gcmaes_crypt_by_sg(true, req, assoclen, hash_subkey, iv,
				  aes_ctx);
}

static int gcmaes_decrypt(struct aead_request *req, unsigned int assoclen,
			  u8 *hash_subkey, u8 *iv, void *aes_ctx)
{
	return gcmaes_crypt_by_sg(false, req, assoclen, hash_subkey, iv,
				  aes_ctx);
}

static int helper_rfc4106_encrypt(struct aead_request *req)
{
	struct crypto_aead *tfm = crypto_aead_reqtfm(req);
	struct aesni_rfc4106_gcm_ctx *ctx = aesni_rfc4106_gcm_ctx_get(tfm);
	void *aes_ctx = &(ctx->aes_key_expanded);
	u8 iv[16] __attribute__ ((__aligned__(AESNI_ALIGN)));
	unsigned int i;
	__be32 counter = cpu_to_be32(1);

	/* Assuming we are supporting rfc4106 64-bit extended
	 * sequence numbers, the AAD length must be
	 * 16 or 20 bytes.
	 */
	if (unlikely(req->assoclen != 16 && req->assoclen != 20))
		return -EINVAL;

	for (i = 0; i < 4; i++)
		*(iv+i) = ctx->nonce[i];
	for (i = 0; i < 8; i++)
		*(iv+4+i) = req->iv[i];
	*((__be32 *)(iv+12)) = counter;

	return gcmaes_encrypt(req, req->assoclen - 8, ctx->hash_subkey, iv,
			      aes_ctx);
}

static int helper_rfc4106_decrypt(struct aead_request *req)
{
	__be32 counter = cpu_to_be32(1);
	struct crypto_aead *tfm = crypto_aead_reqtfm(req);
	struct aesni_rfc4106_gcm_ctx *ctx = aesni_rfc4106_gcm_ctx_get(tfm);
	void *aes_ctx = &(ctx->aes_key_expanded);
	u8 iv[16] __attribute__ ((__aligned__(AESNI_ALIGN)));
	unsigned int i;

	/* Assuming we are supporting rfc4106 64-bit extended
	 * sequence numbers, the AAD length must be
	 * 16 or 20 bytes.
	 */
	if (unlikely(req->assoclen != 16 && req->assoclen != 20))
		return -EINVAL;

	for (i = 0; i < 4; i++)
		*(iv+i) = ctx->nonce[i];
	for (i = 0; i < 8; i++)
		*(iv+4+i) = req->iv[i];
	*((__be32 *)(iv+12)) = counter;

	return gcmaes_decrypt(req, req->assoclen - 8, ctx->hash_subkey, iv,
			      aes_ctx);
}
#endif

static struct crypto_alg aesni_cipher_alg = {
	.cra_name		= "aes",
	.cra_driver_name	= "aes-aesni",
	.cra_priority		= 300,
	.cra_flags		= CRYPTO_ALG_TYPE_CIPHER,
	.cra_blocksize		= AES_BLOCK_SIZE,
	.cra_ctxsize		= CRYPTO_AES_CTX_SIZE,
	.cra_module		= THIS_MODULE,
	.cra_u	= {
		.cipher	= {
			.cia_min_keysize	= AES_MIN_KEY_SIZE,
			.cia_max_keysize	= AES_MAX_KEY_SIZE,
			.cia_setkey		= aes_set_key,
			.cia_encrypt		= aesni_encrypt,
			.cia_decrypt		= aesni_decrypt
		}
	}
};

static struct skcipher_alg aesni_skciphers[] = {
	{
		.base = {
			.cra_name		= "__ecb(aes)",
			.cra_driver_name	= "__ecb-aes-aesni",
			.cra_priority		= 400,
			.cra_flags		= CRYPTO_ALG_INTERNAL,
			.cra_blocksize		= AES_BLOCK_SIZE,
			.cra_ctxsize		= CRYPTO_AES_CTX_SIZE,
			.cra_module		= THIS_MODULE,
		},
		.min_keysize	= AES_MIN_KEY_SIZE,
		.max_keysize	= AES_MAX_KEY_SIZE,
		.setkey		= aesni_skcipher_setkey,
		.encrypt	= ecb_encrypt,
		.decrypt	= ecb_decrypt,
	}, {
		.base = {
			.cra_name		= "__cbc(aes)",
			.cra_driver_name	= "__cbc-aes-aesni",
			.cra_priority		= 400,
			.cra_flags		= CRYPTO_ALG_INTERNAL,
			.cra_blocksize		= AES_BLOCK_SIZE,
			.cra_ctxsize		= CRYPTO_AES_CTX_SIZE,
			.cra_module		= THIS_MODULE,
		},
		.min_keysize	= AES_MIN_KEY_SIZE,
		.max_keysize	= AES_MAX_KEY_SIZE,
		.ivsize		= AES_BLOCK_SIZE,
		.setkey		= aesni_skcipher_setkey,
		.encrypt	= cbc_encrypt,
		.decrypt	= cbc_decrypt,
#ifdef CONFIG_X86_64
	}, {
		.base = {
			.cra_name		= "__ctr(aes)",
			.cra_driver_name	= "__ctr-aes-aesni",
			.cra_priority		= 400,
			.cra_flags		= CRYPTO_ALG_INTERNAL,
			.cra_blocksize		= 1,
			.cra_ctxsize		= CRYPTO_AES_CTX_SIZE,
			.cra_module		= THIS_MODULE,
		},
		.min_keysize	= AES_MIN_KEY_SIZE,
		.max_keysize	= AES_MAX_KEY_SIZE,
		.ivsize		= AES_BLOCK_SIZE,
		.chunksize	= AES_BLOCK_SIZE,
		.setkey		= aesni_skcipher_setkey,
		.encrypt	= ctr_crypt,
		.decrypt	= ctr_crypt,
	}, {
		.base = {
			.cra_name		= "__xts(aes)",
			.cra_driver_name	= "__xts-aes-aesni",
			.cra_priority		= 400,
			.cra_flags		= CRYPTO_ALG_INTERNAL,
			.cra_blocksize		= AES_BLOCK_SIZE,
			.cra_ctxsize		= XTS_AES_CTX_SIZE,
			.cra_module		= THIS_MODULE,
		},
		.min_keysize	= 2 * AES_MIN_KEY_SIZE,
		.max_keysize	= 2 * AES_MAX_KEY_SIZE,
		.ivsize		= AES_BLOCK_SIZE,
		.setkey		= xts_aesni_setkey,
		.encrypt	= xts_encrypt,
		.decrypt	= xts_decrypt,
#endif
	}
};

static
struct simd_skcipher_alg *aesni_simd_skciphers[ARRAY_SIZE(aesni_skciphers)];

#ifdef CONFIG_X86_64
static int generic_gcmaes_set_key(struct crypto_aead *aead, const u8 *key,
				  unsigned int key_len)
{
	struct generic_gcmaes_ctx *ctx = generic_gcmaes_ctx_get(aead);

	return aes_set_key_common(crypto_aead_tfm(aead),
				  &ctx->aes_key_expanded, key, key_len) ?:
	       rfc4106_set_hash_subkey(ctx->hash_subkey, key, key_len);
}

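/*
 * For a 12-byte IV, GCM's pre-counter block j0 is the IV followed by a
 * 32-bit big-endian block counter initialized to 1 (see the j0 comment
 * above aesni_gcm_enc()).
 */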
static int generic_gcmaes_encrypt(struct aead_request *req)
{
	struct crypto_aead *tfm = crypto_aead_reqtfm(req);
	struct generic_gcmaes_ctx *ctx = generic_gcmaes_ctx_get(tfm);
	void *aes_ctx = &(ctx->aes_key_expanded);
	u8 iv[16] __attribute__ ((__aligned__(AESNI_ALIGN)));
	__be32 counter = cpu_to_be32(1);

	memcpy(iv, req->iv, 12);
	*((__be32 *)(iv+12)) = counter;

	return gcmaes_encrypt(req, req->assoclen, ctx->hash_subkey, iv,
			      aes_ctx);
}

static int generic_gcmaes_decrypt(struct aead_request *req)
{
	__be32 counter = cpu_to_be32(1);
	struct crypto_aead *tfm = crypto_aead_reqtfm(req);
	struct generic_gcmaes_ctx *ctx = generic_gcmaes_ctx_get(tfm);
	void *aes_ctx = &(ctx->aes_key_expanded);
	u8 iv[16] __attribute__ ((__aligned__(AESNI_ALIGN)));

	memcpy(iv, req->iv, 12);
	*((__be32 *)(iv+12)) = counter;

	return gcmaes_decrypt(req, req->assoclen, ctx->hash_subkey, iv,
			      aes_ctx);
}

static struct aead_alg aesni_aeads[] = { {
	.setkey			= common_rfc4106_set_key,
	.setauthsize		= common_rfc4106_set_authsize,
	.encrypt		= helper_rfc4106_encrypt,
	.decrypt		= helper_rfc4106_decrypt,
	.ivsize			= GCM_RFC4106_IV_SIZE,
	.maxauthsize		= 16,
	.base = {
		.cra_name		= "__rfc4106(gcm(aes))",
		.cra_driver_name	= "__rfc4106-gcm-aesni",
		.cra_priority		= 400,
		.cra_flags		= CRYPTO_ALG_INTERNAL,
		.cra_blocksize		= 1,
		.cra_ctxsize		= sizeof(struct aesni_rfc4106_gcm_ctx),
		.cra_alignmask		= AESNI_ALIGN - 1,
		.cra_module		= THIS_MODULE,
	},
}, {
	.setkey			= generic_gcmaes_set_key,
	.setauthsize		= generic_gcmaes_set_authsize,
	.encrypt		= generic_gcmaes_encrypt,
	.decrypt		= generic_gcmaes_decrypt,
	.ivsize			= GCM_AES_IV_SIZE,
	.maxauthsize		= 16,
	.base = {
		.cra_name		= "__gcm(aes)",
		.cra_driver_name	= "__generic-gcm-aesni",
		.cra_priority		= 400,
		.cra_flags		= CRYPTO_ALG_INTERNAL,
		.cra_blocksize		= 1,
		.cra_ctxsize		= sizeof(struct generic_gcmaes_ctx),
		.cra_alignmask		= AESNI_ALIGN - 1,
		.cra_module		= THIS_MODULE,
	},
} };
#else
static struct aead_alg aesni_aeads[0];
#endif

static struct simd_aead_alg *aesni_simd_aeads[ARRAY_SIZE(aesni_aeads)];

static const struct x86_cpu_id aesni_cpu_id[] = {
	X86_FEATURE_MATCH(X86_FEATURE_AES),
	{}
};
MODULE_DEVICE_TABLE(x86cpu, aesni_cpu_id);

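/*
 * Module init: probe for AES-NI, pick the fastest usable GCM and CTR
 * implementations for this CPU, then register the bare cipher plus the
 * internal SIMD-wrapped skcipher and AEAD algorithms.
 */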
static int __init aesni_init(void)
{
	int err;

	if (!x86_match_cpu(aesni_cpu_id))
		return -ENODEV;
#ifdef CONFIG_X86_64
#ifdef CONFIG_AS_AVX2
	if (boot_cpu_has(X86_FEATURE_AVX2)) {
		pr_info("AVX2 version of gcm_enc/dec engaged.\n");
		aesni_gcm_tfm = &aesni_gcm_tfm_avx_gen4;
	} else
#endif
#ifdef CONFIG_AS_AVX
	if (boot_cpu_has(X86_FEATURE_AVX)) {
		pr_info("AVX version of gcm_enc/dec engaged.\n");
		aesni_gcm_tfm = &aesni_gcm_tfm_avx_gen2;
	} else
#endif
	{
		pr_info("SSE version of gcm_enc/dec engaged.\n");
		aesni_gcm_tfm = &aesni_gcm_tfm_sse;
	}
	aesni_ctr_enc_tfm = aesni_ctr_enc;
#ifdef CONFIG_AS_AVX
	if (boot_cpu_has(X86_FEATURE_AVX)) {
		/* optimize performance of ctr mode encryption transform */
		aesni_ctr_enc_tfm = aesni_ctr_enc_avx_tfm;
		pr_info("AES CTR mode by8 optimization enabled\n");
	}
#endif
#endif

	err = crypto_register_alg(&aesni_cipher_alg);
	if (err)
		return err;

	err = simd_register_skciphers_compat(aesni_skciphers,
					     ARRAY_SIZE(aesni_skciphers),
					     aesni_simd_skciphers);
	if (err)
		goto unregister_cipher;

	err = simd_register_aeads_compat(aesni_aeads, ARRAY_SIZE(aesni_aeads),
					 aesni_simd_aeads);
	if (err)
		goto unregister_skciphers;

	return 0;

unregister_skciphers:
	simd_unregister_skciphers(aesni_skciphers, ARRAY_SIZE(aesni_skciphers),
				  aesni_simd_skciphers);
unregister_cipher:
	crypto_unregister_alg(&aesni_cipher_alg);
	return err;
}

static void __exit aesni_exit(void)
{
	simd_unregister_aeads(aesni_aeads, ARRAY_SIZE(aesni_aeads),
			      aesni_simd_aeads);
	simd_unregister_skciphers(aesni_skciphers, ARRAY_SIZE(aesni_skciphers),
				  aesni_simd_skciphers);
	crypto_unregister_alg(&aesni_cipher_alg);
}

late_initcall(aesni_init);
module_exit(aesni_exit);

MODULE_DESCRIPTION("Rijndael (AES) Cipher Algorithm, Intel AES-NI instructions optimized");
MODULE_LICENSE("GPL");
MODULE_ALIAS_CRYPTO("aes");