1 // SPDX-License-Identifier: GPL-2.0-or-later
3 * Support for Intel AES-NI instructions. This file contains glue
4 * code, the real AES implementation is in intel-aes_asm.S.
6 * Copyright (C) 2008, Intel Corp.
7 * Author: Huang Ying <ying.huang@intel.com>
9 * Added RFC4106 AES-GCM support for 128-bit keys under the AEAD
10 * interface for 64-bit kernels.
11 * Authors: Adrian Hoban <adrian.hoban@intel.com>
12 * Gabriele Paoloni <gabriele.paoloni@intel.com>
13 * Tadeusz Struk (tadeusz.struk@intel.com)
14 * Aidan O'Mahony (aidan.o.mahony@intel.com)
15 * Copyright (c) 2010, Intel Corporation.
18 #include <linux/hardirq.h>
19 #include <linux/types.h>
20 #include <linux/module.h>
21 #include <linux/err.h>
22 #include <crypto/algapi.h>
23 #include <crypto/aes.h>
24 #include <crypto/ctr.h>
25 #include <crypto/b128ops.h>
26 #include <crypto/gcm.h>
27 #include <crypto/xts.h>
28 #include <asm/cpu_device_id.h>
30 #include <crypto/scatterwalk.h>
31 #include <crypto/internal/aead.h>
32 #include <crypto/internal/simd.h>
33 #include <crypto/internal/skcipher.h>
34 #include <linux/jump_label.h>
35 #include <linux/workqueue.h>
36 #include <linux/spinlock.h>
37 #include <linux/static_call.h>
/*
 * Alignment that aes_ctx() and the *_ctx_get() helpers in this file round
 * context pointers up to, and the matching member/variable attribute.
 */
40 #define AESNI_ALIGN 16
41 #define AESNI_ALIGN_ATTR __attribute__ ((__aligned__(AESNI_ALIGN)))
/*
 * ANDing a byte count with this mask clears the bits set in
 * (AES_BLOCK_SIZE - 1), i.e. rounds down to whole blocks when
 * AES_BLOCK_SIZE is a power of two.
 */
42 #define AES_BLOCK_MASK (~(AES_BLOCK_SIZE - 1))
/* Number of bytes zeroed and then encrypted by rfc4106_set_hash_subkey(). */
43 #define RFC4106_HASH_SUBKEY_SIZE 16
/*
 * Extra bytes added to the context sizes below, derived from AESNI_ALIGN and
 * CRYPTO_MINALIGN (presumably headroom for realigning the context - TODO
 * confirm against aes_ctx()).
 */
44 #define AESNI_ALIGN_EXTRA ((AESNI_ALIGN - 1) & ~(CRYPTO_MINALIGN - 1))
/* Values used as .cra_ctxsize by the algorithm tables in this file. */
45 #define CRYPTO_AES_CTX_SIZE (sizeof(struct crypto_aes_ctx) + AESNI_ALIGN_EXTRA)
46 #define XTS_AES_CTX_SIZE (sizeof(struct aesni_xts_ctx) + AESNI_ALIGN_EXTRA)
48 /* This data is stored at the end of the crypto_tfm struct.
49 * It is a per-"session" data storage location.
50 * This needs to be 16-byte aligned. */
/*
 * Context used by the rfc4106 setkey/encrypt/decrypt helpers in this file:
 * a 16-byte hash subkey followed by the expanded AES key, each carrying
 * AESNI_ALIGN_ATTR.
 * NOTE(review): common_rfc4106_set_key() and the rfc4106 helpers access
 * ctx->nonce, but no such member (nor the closing brace) is visible in this
 * excerpt; the embedded numbering skips here, so lines are missing from view.
 */
52 struct aesni_rfc4106_gcm_ctx {
53 u8 hash_subkey[16] AESNI_ALIGN_ATTR;
54 struct crypto_aes_ctx aes_key_expanded AESNI_ALIGN_ATTR;
/*
 * Context used by the generic_gcmaes_* functions in this file: a 16-byte
 * hash subkey followed by the expanded AES key, each carrying
 * AESNI_ALIGN_ATTR.  (The closing brace is not visible in this excerpt.)
 */
58 struct generic_gcmaes_ctx {
59 u8 hash_subkey[16] AESNI_ALIGN_ATTR;
60 struct crypto_aes_ctx aes_key_expanded AESNI_ALIGN_ATTR;
/*
 * XTS context: two raw byte buffers, each the size of a struct
 * crypto_aes_ctx.  xts_aesni_setkey() fills raw_crypt_ctx from the first half
 * of the key and raw_tweak_ctx from the second half; users convert the raw
 * buffers to a struct crypto_aes_ctx pointer with aes_ctx().
 * (The closing brace is not visible in this excerpt.)
 */
63 struct aesni_xts_ctx {
64 u8 raw_tweak_ctx[sizeof(struct crypto_aes_ctx)] AESNI_ALIGN_ATTR;
65 u8 raw_crypt_ctx[sizeof(struct crypto_aes_ctx)] AESNI_ALIGN_ATTR;
68 #define GCM_BLOCK_LEN 16
/*
 * Scratch state handed to the aesni_gcm_* assembly routines as `gdata`.
 * gcmaes_crypt_by_sg() allocates it on the stack and aligns it to
 * AESNI_ALIGN.  The C code in this file never reads or writes the individual
 * members.
 * NOTE(review): the embedded numbering skips inside this struct, so some
 * members and the closing brace are presumably missing from this excerpt.
 */
70 struct gcm_context_data {
71 /* init, update and finalize context data */
72 u8 aad_hash[GCM_BLOCK_LEN];
75 u8 partial_block_enc_key[GCM_BLOCK_LEN];
76 u8 orig_IV[GCM_BLOCK_LEN];
77 u8 current_counter[GCM_BLOCK_LEN];
78 u64 partial_block_len;
80 u8 hash_keys[GCM_BLOCK_LEN * 16];
/*
 * Prototypes of routines declared asmlinkage; their bodies are not in this
 * file.
 *
 * aesni_set_key() is what aes_set_key_common() calls as the alternative to
 * the generic aes_expandkey().
 */
83 asmlinkage int aesni_set_key(struct crypto_aes_ctx *ctx, const u8 *in_key,
84 unsigned int key_len);
/* Single in/out pointer pair, no length argument. */
85 asmlinkage void aesni_enc(const void *ctx, u8 *out, const u8 *in);
86 asmlinkage void aesni_dec(const void *ctx, u8 *out, const u8 *in);
/* ECB: @len is a byte count; callers here pass a whole number of blocks. */
87 asmlinkage void aesni_ecb_enc(struct crypto_aes_ctx *ctx, u8 *out,
88 const u8 *in, unsigned int len);
89 asmlinkage void aesni_ecb_dec(struct crypto_aes_ctx *ctx, u8 *out,
90 const u8 *in, unsigned int len);
/* CBC: as above plus an @iv buffer (callers pass walk.iv). */
91 asmlinkage void aesni_cbc_enc(struct crypto_aes_ctx *ctx, u8 *out,
92 const u8 *in, unsigned int len, u8 *iv);
93 asmlinkage void aesni_cbc_dec(struct crypto_aes_ctx *ctx, u8 *out,
94 const u8 *in, unsigned int len, u8 *iv);
/* CTS-CBC tail handling; called with walk.nbytes as @len. */
95 asmlinkage void aesni_cts_cbc_enc(struct crypto_aes_ctx *ctx, u8 *out,
96 const u8 *in, unsigned int len, u8 *iv);
97 asmlinkage void aesni_cts_cbc_dec(struct crypto_aes_ctx *ctx, u8 *out,
98 const u8 *in, unsigned int len, u8 *iv);
/*
 * Payload-size thresholds (bytes) that gcmaes_crypt_by_sg() compares the
 * request length against before choosing the avx_gen2 / avx_gen4 GCM
 * routines.
 */
100 #define AVX_GEN2_OPTSIZE 640
101 #define AVX_GEN4_OPTSIZE 4096
/*
 * XTS assembly routines.  xts_crypt() passes walk.iv as @iv after encrypting
 * it with the tweak key.
 */
103 asmlinkage void aesni_xts_encrypt(const struct crypto_aes_ctx *ctx, u8 *out,
104 const u8 *in, unsigned int len, u8 *iv);
106 asmlinkage void aesni_xts_decrypt(const struct crypto_aes_ctx *ctx, u8 *out,
107 const u8 *in, unsigned int len, u8 *iv);
/*
 * CTR assembly routine and the static call ctr_crypt() dispatches through.
 * The call initially targets aesni_ctr_enc; aesni_init() retargets it to
 * aesni_ctr_enc_avx_tfm() when the CPU has AVX.
 */
111 asmlinkage void aesni_ctr_enc(struct crypto_aes_ctx *ctx, u8 *out,
112 const u8 *in, unsigned int len, u8 *iv);
113 DEFINE_STATIC_CALL(aesni_ctr_enc_tfm, aesni_ctr_enc);
/*
 * Baseline GCM assembly routines, used by gcmaes_crypt_by_sg() when neither
 * AVX variant is selected: one init call, one enc/dec update per walk chunk,
 * one finalize call that produces the tag.
 * NOTE(review): gcmaes_crypt_by_sg() passes an iv to aesni_gcm_init() and an
 * input pointer to aesni_gcm_dec_update(); the corresponding parameter lines
 * are not visible in this excerpt (the embedded numbering skips there).
 */
115 /* Scatter / Gather routines, with args similar to above */
116 asmlinkage void aesni_gcm_init(void *ctx,
117 struct gcm_context_data *gdata,
119 u8 *hash_subkey, const u8 *aad,
120 unsigned long aad_len);
121 asmlinkage void aesni_gcm_enc_update(void *ctx,
122 struct gcm_context_data *gdata, u8 *out,
123 const u8 *in, unsigned long plaintext_len);
124 asmlinkage void aesni_gcm_dec_update(void *ctx,
125 struct gcm_context_data *gdata, u8 *out,
127 unsigned long ciphertext_len);
128 asmlinkage void aesni_gcm_finalize(void *ctx,
129 struct gcm_context_data *gdata,
130 u8 *auth_tag, unsigned long auth_tag_len);
/*
 * "by8" AVX CTR routines, one per AES key size; aesni_ctr_enc_avx_tfm()
 * picks one based on ctx->key_length.  Note the argument order differs from
 * aesni_ctr_enc(): in, iv, keys, out, num_bytes.
 */
132 asmlinkage void aes_ctr_enc_128_avx_by8(const u8 *in, u8 *iv,
133 void *keys, u8 *out, unsigned int num_bytes);
134 asmlinkage void aes_ctr_enc_192_avx_by8(const u8 *in, u8 *iv,
135 void *keys, u8 *out, unsigned int num_bytes);
136 asmlinkage void aes_ctr_enc_256_avx_by8(const u8 *in, u8 *iv,
137 void *keys, u8 *out, unsigned int num_bytes);
139 /* asmlinkage void aesni_gcm_init_avx_gen2()
140 * gcm_data *my_ctx_data, context data
141 * u8 *hash_subkey, the hash subkey input. Data starts on a 16-byte boundary. */
/*
 * avx_gen2 flavour of the GCM init/update/finalize routines; selected in
 * gcmaes_crypt_by_sg() when the gcm_use_avx static key is enabled and the
 * payload is at least AVX_GEN2_OPTSIZE bytes.
 * NOTE(review): several parameter lines of these prototypes are not visible
 * in this excerpt (the embedded numbering skips); the call sites pass the
 * same argument lists as for the baseline aesni_gcm_* routines.
 */
143 asmlinkage void aesni_gcm_init_avx_gen2(void *my_ctx_data,
144 struct gcm_context_data *gdata,
148 unsigned long aad_len);
150 asmlinkage void aesni_gcm_enc_update_avx_gen2(void *ctx,
151 struct gcm_context_data *gdata, u8 *out,
152 const u8 *in, unsigned long plaintext_len);
153 asmlinkage void aesni_gcm_dec_update_avx_gen2(void *ctx,
154 struct gcm_context_data *gdata, u8 *out,
156 unsigned long ciphertext_len);
157 asmlinkage void aesni_gcm_finalize_avx_gen2(void *ctx,
158 struct gcm_context_data *gdata,
159 u8 *auth_tag, unsigned long auth_tag_len);
162 /* asmlinkage void aesni_gcm_init_avx_gen4()
163 * gcm_data *my_ctx_data, context data
164 * u8 *hash_subkey, the hash subkey input. Data starts on a 16-byte boundary. */
/*
 * avx_gen4 flavour of the GCM init/update/finalize routines; selected in
 * gcmaes_crypt_by_sg() when the gcm_use_avx2 static key is enabled and the
 * payload is at least AVX_GEN4_OPTSIZE bytes.
 * NOTE(review): several parameter lines of these prototypes are not visible
 * in this excerpt (the embedded numbering skips); the call sites pass the
 * same argument lists as for the baseline aesni_gcm_* routines.
 */
166 asmlinkage void aesni_gcm_init_avx_gen4(void *my_ctx_data,
167 struct gcm_context_data *gdata,
171 unsigned long aad_len);
173 asmlinkage void aesni_gcm_enc_update_avx_gen4(void *ctx,
174 struct gcm_context_data *gdata, u8 *out,
175 const u8 *in, unsigned long plaintext_len);
176 asmlinkage void aesni_gcm_dec_update_avx_gen4(void *ctx,
177 struct gcm_context_data *gdata, u8 *out,
179 unsigned long ciphertext_len);
180 asmlinkage void aesni_gcm_finalize_avx_gen4(void *ctx,
181 struct gcm_context_data *gdata,
182 u8 *auth_tag, unsigned long auth_tag_len);
/*
 * Static keys, defined false.  aesni_init() enables gcm_use_avx when the CPU
 * has AVX or AVX2, and gcm_use_avx2 when it has AVX2; gcmaes_crypt_by_sg()
 * tests them to choose the GCM implementation.
 */
184 static __ro_after_init DEFINE_STATIC_KEY_FALSE(gcm_use_avx);
185 static __ro_after_init DEFINE_STATIC_KEY_FALSE(gcm_use_avx2);
/*
 * Return the rfc4106 GCM context of @tfm: the pointer from crypto_aead_ctx()
 * rounded up with PTR_ALIGN() to `align` (initially AESNI_ALIGN).
 * NOTE(review): the start of the declaration (the line before this one) and
 * the statement guarded by the `if` are not visible in this excerpt.
 * Presumably the guarded statement lowers `align` when the crypto API
 * already guarantees AESNI_ALIGN, making PTR_ALIGN a no-op - confirm.
 */
188 aesni_rfc4106_gcm_ctx *aesni_rfc4106_gcm_ctx_get(struct crypto_aead *tfm)
190 unsigned long align = AESNI_ALIGN;
192 if (align <= crypto_tfm_ctx_alignment())
194 return PTR_ALIGN(crypto_aead_ctx(tfm), align);
/*
 * Return the generic GCM context of @tfm: the pointer from crypto_aead_ctx()
 * rounded up with PTR_ALIGN() to `align` (initially AESNI_ALIGN).
 * NOTE(review): the start of the declaration (the line before this one) and
 * the statement guarded by the `if` are not visible in this excerpt.
 * Presumably the guarded statement lowers `align` when the crypto API
 * already guarantees AESNI_ALIGN - confirm.
 */
198 generic_gcmaes_ctx *generic_gcmaes_ctx_get(struct crypto_aead *tfm)
200 unsigned long align = AESNI_ALIGN;
202 if (align <= crypto_tfm_ctx_alignment())
204 return PTR_ALIGN(crypto_aead_ctx(tfm), align);
/*
 * Convert a raw context buffer into a struct crypto_aes_ctx pointer by
 * rounding its address up with ALIGN() to `align` (initially AESNI_ALIGN).
 * @raw_ctx: start of the (possibly unaligned) context storage.
 * NOTE(review): the statement guarded by the `if` is not visible in this
 * excerpt; presumably it lowers `align` when crypto_tfm_ctx_alignment()
 * already provides AESNI_ALIGN - confirm.
 */
208 static inline struct crypto_aes_ctx *aes_ctx(void *raw_ctx)
210 unsigned long addr = (unsigned long)raw_ctx;
211 unsigned long align = AESNI_ALIGN;
213 if (align <= crypto_tfm_ctx_alignment())
215 return (struct crypto_aes_ctx *)ALIGN(addr, align);
/*
 * Expand @in_key into the AES context located inside @raw_ctx.
 * @tfm:     transform handle (not referenced by the lines visible here)
 * @raw_ctx: raw context storage; converted with aes_ctx()
 * @in_key:  key bytes
 * @key_len: key length; checked against AES_KEYSIZE_128/192/256
 *
 * Uses the generic aes_expandkey() when crypto_simd_usable() is false and
 * the aesni_set_key() assembly routine on the other path.
 * NOTE(review): the declaration of err, the action taken for an invalid key
 * length, the `else`, any FPU bracketing and the return are on lines not
 * visible in this excerpt.
 */
218 static int aes_set_key_common(struct crypto_tfm *tfm, void *raw_ctx,
219 const u8 *in_key, unsigned int key_len)
221 struct crypto_aes_ctx *ctx = aes_ctx(raw_ctx);
224 if (key_len != AES_KEYSIZE_128 && key_len != AES_KEYSIZE_192 &&
225 key_len != AES_KEYSIZE_256)
228 if (!crypto_simd_usable())
229 err = aes_expandkey(ctx, in_key, key_len);
232 err = aesni_set_key(ctx, in_key, key_len);
/*
 * .cia_setkey handler of aesni_cipher_alg: forwards to aes_set_key_common()
 * using the transform's own context from crypto_tfm_ctx().
 */
239 static int aes_set_key(struct crypto_tfm *tfm, const u8 *in_key,
240 unsigned int key_len)
242 return aes_set_key_common(tfm, crypto_tfm_ctx(tfm), in_key, key_len);
/*
 * .cia_encrypt handler of aesni_cipher_alg: encrypt one block from @src
 * into @dst.  Calls the generic aes_encrypt() when crypto_simd_usable() is
 * false and the aesni_enc() assembly routine on the other path.
 * NOTE(review): the `else` and any FPU bracketing around aesni_enc() are on
 * lines not visible in this excerpt.
 */
245 static void aesni_encrypt(struct crypto_tfm *tfm, u8 *dst, const u8 *src)
247 struct crypto_aes_ctx *ctx = aes_ctx(crypto_tfm_ctx(tfm));
249 if (!crypto_simd_usable()) {
250 aes_encrypt(ctx, dst, src);
253 aesni_enc(ctx, dst, src);
/*
 * .cia_decrypt handler of aesni_cipher_alg: decrypt one block from @src
 * into @dst.  Calls the generic aes_decrypt() when crypto_simd_usable() is
 * false and the aesni_dec() assembly routine on the other path.
 * NOTE(review): the `else` and any FPU bracketing around aesni_dec() are on
 * lines not visible in this excerpt.
 */
258 static void aesni_decrypt(struct crypto_tfm *tfm, u8 *dst, const u8 *src)
260 struct crypto_aes_ctx *ctx = aes_ctx(crypto_tfm_ctx(tfm));
262 if (!crypto_simd_usable()) {
263 aes_decrypt(ctx, dst, src);
266 aesni_dec(ctx, dst, src);
/*
 * .setkey handler shared by the ECB/CBC/CTS/CTR entries of aesni_skciphers:
 * forwards to aes_set_key_common() with the skcipher's context.
 * NOTE(review): the line declaring the length parameter (`len`) is not
 * visible in this excerpt.
 */
271 static int aesni_skcipher_setkey(struct crypto_skcipher *tfm, const u8 *key,
274 return aes_set_key_common(crypto_skcipher_tfm(tfm),
275 crypto_skcipher_ctx(tfm), key, len);
/*
 * ECB-encrypt an skcipher request.
 * Each walk step hands the whole-block part of the chunk to aesni_ecb_enc()
 * and reports the sub-block remainder to skcipher_walk_done().
 * NOTE(review): the declarations of nbytes/err, any FPU bracketing and the
 * return are on lines not visible in this excerpt.
 */
278 static int ecb_encrypt(struct skcipher_request *req)
280 struct crypto_skcipher *tfm = crypto_skcipher_reqtfm(req);
281 struct crypto_aes_ctx *ctx = aes_ctx(crypto_skcipher_ctx(tfm));
282 struct skcipher_walk walk;
286 err = skcipher_walk_virt(&walk, req, false);
/* Loop until the walk has no more bytes mapped. */
288 while ((nbytes = walk.nbytes)) {
290 aesni_ecb_enc(ctx, walk.dst.virt.addr, walk.src.virt.addr,
291 nbytes & AES_BLOCK_MASK);
/* Keep only the bytes that did not fill a whole block. */
293 nbytes &= AES_BLOCK_SIZE - 1;
294 err = skcipher_walk_done(&walk, nbytes);
/*
 * ECB-decrypt an skcipher request.
 * Each walk step hands the whole-block part of the chunk to aesni_ecb_dec()
 * and reports the sub-block remainder to skcipher_walk_done().
 * NOTE(review): the declarations of nbytes/err, any FPU bracketing and the
 * return are on lines not visible in this excerpt.
 */
300 static int ecb_decrypt(struct skcipher_request *req)
302 struct crypto_skcipher *tfm = crypto_skcipher_reqtfm(req);
303 struct crypto_aes_ctx *ctx = aes_ctx(crypto_skcipher_ctx(tfm));
304 struct skcipher_walk walk;
308 err = skcipher_walk_virt(&walk, req, false);
/* Loop until the walk has no more bytes mapped. */
310 while ((nbytes = walk.nbytes)) {
312 aesni_ecb_dec(ctx, walk.dst.virt.addr, walk.src.virt.addr,
313 nbytes & AES_BLOCK_MASK);
/* Keep only the bytes that did not fill a whole block. */
315 nbytes &= AES_BLOCK_SIZE - 1;
316 err = skcipher_walk_done(&walk, nbytes);
/*
 * CBC-encrypt an skcipher request.
 * Each walk step hands the whole-block part of the chunk, together with
 * walk.iv, to aesni_cbc_enc() and reports the sub-block remainder to
 * skcipher_walk_done().  Also called by cts_cbc_encrypt() on a sub-request.
 * NOTE(review): the declarations of nbytes/err, any FPU bracketing and the
 * return are on lines not visible in this excerpt.
 */
322 static int cbc_encrypt(struct skcipher_request *req)
324 struct crypto_skcipher *tfm = crypto_skcipher_reqtfm(req);
325 struct crypto_aes_ctx *ctx = aes_ctx(crypto_skcipher_ctx(tfm));
326 struct skcipher_walk walk;
330 err = skcipher_walk_virt(&walk, req, false);
/* Loop until the walk has no more bytes mapped. */
332 while ((nbytes = walk.nbytes)) {
334 aesni_cbc_enc(ctx, walk.dst.virt.addr, walk.src.virt.addr,
335 nbytes & AES_BLOCK_MASK, walk.iv);
/* Keep only the bytes that did not fill a whole block. */
337 nbytes &= AES_BLOCK_SIZE - 1;
338 err = skcipher_walk_done(&walk, nbytes);
/*
 * CBC-decrypt an skcipher request.
 * Each walk step hands the whole-block part of the chunk, together with
 * walk.iv, to aesni_cbc_dec() and reports the sub-block remainder to
 * skcipher_walk_done().  Also called by cts_cbc_decrypt() on a sub-request.
 * NOTE(review): the declarations of nbytes/err, any FPU bracketing and the
 * return are on lines not visible in this excerpt.
 */
344 static int cbc_decrypt(struct skcipher_request *req)
346 struct crypto_skcipher *tfm = crypto_skcipher_reqtfm(req);
347 struct crypto_aes_ctx *ctx = aes_ctx(crypto_skcipher_ctx(tfm));
348 struct skcipher_walk walk;
352 err = skcipher_walk_virt(&walk, req, false);
/* Loop until the walk has no more bytes mapped. */
354 while ((nbytes = walk.nbytes)) {
356 aesni_cbc_dec(ctx, walk.dst.virt.addr, walk.src.virt.addr,
357 nbytes & AES_BLOCK_MASK, walk.iv);
/* Keep only the bytes that did not fill a whole block. */
359 nbytes &= AES_BLOCK_SIZE - 1;
360 err = skcipher_walk_done(&walk, nbytes);
/*
 * CBC with ciphertext stealing, encrypt direction.
 *
 * The request is split in two: the leading cbc_blocks blocks go through
 * cbc_encrypt() on a stack sub-request, and the remaining bytes
 * (cryptlen - cbc_blocks * AES_BLOCK_SIZE) are handed to
 * aesni_cts_cbc_enc() in a single walk step.
 * NOTE(review): many short lines (returns, the err declaration, trailing
 * call arguments, braces, any FPU bracketing) are not visible in this
 * excerpt, so the handling of requests of at most one block and of errors
 * cannot be read off from here.
 */
366 static int cts_cbc_encrypt(struct skcipher_request *req)
368 struct crypto_skcipher *tfm = crypto_skcipher_reqtfm(req);
369 struct crypto_aes_ctx *ctx = aes_ctx(crypto_skcipher_ctx(tfm));
/* All blocks except the last two (rounded up) are plain CBC. */
370 int cbc_blocks = DIV_ROUND_UP(req->cryptlen, AES_BLOCK_SIZE) - 2;
371 struct scatterlist *src = req->src, *dst = req->dst;
372 struct scatterlist sg_src[2], sg_dst[2];
373 struct skcipher_request subreq;
374 struct skcipher_walk walk;
/* The sub-request inherits the transform and flags of the caller's request. */
377 skcipher_request_set_tfm(&subreq, tfm);
378 skcipher_request_set_callback(&subreq, skcipher_request_flags(req),
/* Special-casing for requests of at most one block (bodies not visible). */
381 if (req->cryptlen <= AES_BLOCK_SIZE) {
382 if (req->cryptlen < AES_BLOCK_SIZE)
387 if (cbc_blocks > 0) {
388 skcipher_request_set_crypt(&subreq, req->src, req->dst,
389 cbc_blocks * AES_BLOCK_SIZE,
392 err = cbc_encrypt(&subreq);
396 if (req->cryptlen == AES_BLOCK_SIZE)
/* Skip past the bytes the CBC sub-request was set up to cover. */
399 dst = src = scatterwalk_ffwd(sg_src, req->src, subreq.cryptlen);
400 if (req->dst != req->src)
401 dst = scatterwalk_ffwd(sg_dst, req->dst,
405 /* handle ciphertext stealing */
406 skcipher_request_set_crypt(&subreq, src, dst,
407 req->cryptlen - cbc_blocks * AES_BLOCK_SIZE,
410 err = skcipher_walk_virt(&walk, &subreq, false);
415 aesni_cts_cbc_enc(ctx, walk.dst.virt.addr, walk.src.virt.addr,
416 walk.nbytes, walk.iv);
419 return skcipher_walk_done(&walk, 0);
/*
 * CBC with ciphertext stealing, decrypt direction.
 *
 * The request is split in two: the leading cbc_blocks blocks go through
 * cbc_decrypt() on a stack sub-request, and the remaining bytes
 * (cryptlen - cbc_blocks * AES_BLOCK_SIZE) are handed to
 * aesni_cts_cbc_dec() in a single walk step.
 * NOTE(review): many short lines (returns, the err declaration, trailing
 * call arguments, braces, any FPU bracketing) are not visible in this
 * excerpt, so the handling of requests of at most one block and of errors
 * cannot be read off from here.
 */
422 static int cts_cbc_decrypt(struct skcipher_request *req)
424 struct crypto_skcipher *tfm = crypto_skcipher_reqtfm(req);
425 struct crypto_aes_ctx *ctx = aes_ctx(crypto_skcipher_ctx(tfm));
/* All blocks except the last two (rounded up) are plain CBC. */
426 int cbc_blocks = DIV_ROUND_UP(req->cryptlen, AES_BLOCK_SIZE) - 2;
427 struct scatterlist *src = req->src, *dst = req->dst;
428 struct scatterlist sg_src[2], sg_dst[2];
429 struct skcipher_request subreq;
430 struct skcipher_walk walk;
/* The sub-request inherits the transform and flags of the caller's request. */
433 skcipher_request_set_tfm(&subreq, tfm);
434 skcipher_request_set_callback(&subreq, skcipher_request_flags(req),
/* Special-casing for requests of at most one block (bodies not visible). */
437 if (req->cryptlen <= AES_BLOCK_SIZE) {
438 if (req->cryptlen < AES_BLOCK_SIZE)
443 if (cbc_blocks > 0) {
444 skcipher_request_set_crypt(&subreq, req->src, req->dst,
445 cbc_blocks * AES_BLOCK_SIZE,
448 err = cbc_decrypt(&subreq);
452 if (req->cryptlen == AES_BLOCK_SIZE)
/* Skip past the bytes the CBC sub-request was set up to cover. */
455 dst = src = scatterwalk_ffwd(sg_src, req->src, subreq.cryptlen);
456 if (req->dst != req->src)
457 dst = scatterwalk_ffwd(sg_dst, req->dst,
461 /* handle ciphertext stealing */
462 skcipher_request_set_crypt(&subreq, src, dst,
463 req->cryptlen - cbc_blocks * AES_BLOCK_SIZE,
466 err = skcipher_walk_virt(&walk, &subreq, false);
471 aesni_cts_cbc_dec(ctx, walk.dst.virt.addr, walk.src.virt.addr,
472 walk.nbytes, walk.iv);
475 return skcipher_walk_done(&walk, 0);
/*
 * AVX replacement target for the aesni_ctr_enc_tfm static call (installed by
 * aesni_init()).  Takes the same arguments as aesni_ctr_enc() and forwards
 * them, reordered, to the by8 routine matching ctx->key_length: 128-bit,
 * 192-bit, or otherwise the 256-bit routine.
 * NOTE(review): the three lines following the signature are the body of a
 * block comment whose delimiters and last line are not visible in this
 * excerpt; the `else` before the 256-bit call is likewise not visible.
 */
479 static void aesni_ctr_enc_avx_tfm(struct crypto_aes_ctx *ctx, u8 *out,
480 const u8 *in, unsigned int len, u8 *iv)
483 * based on key length, override with the by8 version
484 * of ctr mode encryption/decryption for improved performance
485 * aes_set_key_common() ensures that key length is one of
488 if (ctx->key_length == AES_KEYSIZE_128)
489 aes_ctr_enc_128_avx_by8(in, iv, (void *)ctx, out, len);
490 else if (ctx->key_length == AES_KEYSIZE_192)
491 aes_ctr_enc_192_avx_by8(in, iv, (void *)ctx, out, len);
493 aes_ctr_enc_256_avx_by8(in, iv, (void *)ctx, out, len);
/*
 * CTR mode; registered as both .encrypt and .decrypt of the "__ctr(aes)"
 * entry in aesni_skciphers.
 *
 * For each walk chunk, whole blocks go through the aesni_ctr_enc_tfm static
 * call.  A trailing partial block is handled only on the final chunk
 * (walk.nbytes == walk.total): the counter in walk.iv is encrypted into a
 * stack keystream block, XORed over the remaining bytes, and the counter is
 * incremented.
 * NOTE(review): the declarations of nbytes/err, some call arguments, any
 * FPU bracketing, the statement following crypto_inc() and the return are on
 * lines not visible in this excerpt.
 */
496 static int ctr_crypt(struct skcipher_request *req)
498 struct crypto_skcipher *tfm = crypto_skcipher_reqtfm(req);
499 struct crypto_aes_ctx *ctx = aes_ctx(crypto_skcipher_ctx(tfm));
500 u8 keystream[AES_BLOCK_SIZE];
501 struct skcipher_walk walk;
505 err = skcipher_walk_virt(&walk, req, false);
507 while ((nbytes = walk.nbytes) > 0) {
/* Bulk part: only if the chunk holds at least one whole block. */
509 if (nbytes & AES_BLOCK_MASK)
510 static_call(aesni_ctr_enc_tfm)(ctx, walk.dst.virt.addr,
512 nbytes & AES_BLOCK_MASK,
/* From here on nbytes is the sub-block remainder of this chunk. */
514 nbytes &= ~AES_BLOCK_MASK;
516 if (walk.nbytes == walk.total && nbytes > 0) {
517 aesni_enc(ctx, keystream, walk.iv);
/* The partial block starts walk.nbytes - nbytes bytes into the chunk. */
518 crypto_xor_cpy(walk.dst.virt.addr + walk.nbytes - nbytes,
519 walk.src.virt.addr + walk.nbytes - nbytes,
521 crypto_inc(walk.iv, AES_BLOCK_SIZE);
525 err = skcipher_walk_done(&walk, nbytes);
/*
 * Derive the GCM hash subkey for @key: expand the key with the generic
 * aes_expandkey() into a stack context, encrypt an all-zero block of
 * RFC4106_HASH_SUBKEY_SIZE bytes in place in @hash_subkey, then wipe the
 * stack context with memzero_explicit().
 * NOTE(review): the return type line, the declaration of ret, the check of
 * the aes_expandkey() result and the return are not visible in this excerpt.
 */
531 rfc4106_set_hash_subkey(u8 *hash_subkey, const u8 *key, unsigned int key_len)
533 struct crypto_aes_ctx ctx;
536 ret = aes_expandkey(&ctx, key, key_len);
540 /* Clear the data in the hash sub key container to zero.*/
541 /* We want to cipher all zeros to create the hash sub key. */
542 memset(hash_subkey, 0, RFC4106_HASH_SUBKEY_SIZE);
544 aes_encrypt(&ctx, hash_subkey, hash_subkey);
/* The expanded key is secret material; do not leave it on the stack. */
546 memzero_explicit(&ctx, sizeof(ctx));
/*
 * .setkey handler of the "__rfc4106(gcm(aes))" AEAD.
 *
 * Copies sizeof(ctx->nonce) bytes found at key + key_len into ctx->nonce,
 * expands the AES key via aes_set_key_common() and, if that returned 0,
 * derives the hash subkey with rfc4106_set_hash_subkey().
 * NOTE(review): lines between the declaration and the memcpy are not visible
 * in this excerpt; judging by the surviving comment they presumably validate
 * key_len and subtract the 4 nonce bytes from it, so that key + key_len
 * points at the nonce - confirm.
 */
550 static int common_rfc4106_set_key(struct crypto_aead *aead, const u8 *key,
551 unsigned int key_len)
553 struct aesni_rfc4106_gcm_ctx *ctx = aesni_rfc4106_gcm_ctx_get(aead);
558 /*Account for 4 byte nonce at the end.*/
561 memcpy(ctx->nonce, key + key_len, sizeof(ctx->nonce));
/* `a ?: b` yields a when it is non-zero (an error), otherwise evaluates b. */
563 return aes_set_key_common(crypto_aead_tfm(aead),
564 &ctx->aes_key_expanded, key, key_len) ?:
565 rfc4106_set_hash_subkey(ctx->hash_subkey, key, key_len);
568 /* This is the Integrity Check Value (aka the authentication tag) length and can
569 * be 8, 12 or 16 bytes long. */
/*
 * .setauthsize handler of the "__rfc4106(gcm(aes))" AEAD.
 * NOTE(review): only the signature is visible in this excerpt; the body
 * (presumably a check of @authsize against the sizes listed above) is on
 * lines that are missing from view.
 */
570 static int common_rfc4106_set_authsize(struct crypto_aead *aead,
571 unsigned int authsize)
/*
 * .setauthsize handler of the "__gcm(aes)" AEAD.
 * NOTE(review): only the signature is visible in this excerpt; the body is
 * on lines that are missing from view, so the accepted tag sizes cannot be
 * stated from here.
 */
585 static int generic_gcmaes_set_authsize(struct crypto_aead *tfm,
586 unsigned int authsize)
/*
 * Core GCM routine shared by gcmaes_encrypt() and gcmaes_decrypt().
 * @enc:          true to encrypt, false to decrypt
 * @req:          AEAD request (src/dst scatterlists, cryptlen, flags)
 * @assoclen:     number of associated-data bytes to authenticate
 * @hash_subkey:  hash subkey from the transform context
 * @iv:           IV block prepared by the caller
 * @aes_ctx:      expanded AES key
 * @auth_tag:     buffer that receives the computed tag
 * @auth_tag_len: tag length in bytes
 *
 * Steps visible here: pick an implementation (baseline / avx_gen2 /
 * avx_gen4) from the static keys and the payload size, make the associated
 * data available as one linear buffer, run the matching init routine, feed
 * every walk chunk to the matching enc/dec update routine, then run the
 * matching finalize routine to produce the tag.
 * NOTE(review): many short lines (declarations of assoc/assocmem/err,
 * `else`/brace lines, inner `if (enc)` tests, call continuation arguments,
 * error returns, freeing of assocmem, any FPU bracketing) are not visible in
 * this excerpt.
 */
604 static int gcmaes_crypt_by_sg(bool enc, struct aead_request *req,
605 unsigned int assoclen, u8 *hash_subkey,
606 u8 *iv, void *aes_ctx, u8 *auth_tag,
607 unsigned long auth_tag_len)
/* Over-sized by AESNI_ALIGN - 8 so `data` can be aligned inside it. */
609 u8 databuf[sizeof(struct gcm_context_data) + (AESNI_ALIGN - 8)] __aligned(8);
610 struct gcm_context_data *data = PTR_ALIGN((void *)databuf, AESNI_ALIGN);
611 unsigned long left = req->cryptlen;
612 struct scatter_walk assoc_sg_walk;
613 struct skcipher_walk walk;
614 bool do_avx, do_avx2;
/*
 * NOTE(review): the condition guarding this subtraction is not visible;
 * presumably the tag length is only removed when decrypting - confirm.
 */
620 left -= auth_tag_len;
/* The AVX variants are only used from a minimum payload size upwards. */
622 do_avx = (left >= AVX_GEN2_OPTSIZE);
623 do_avx2 = (left >= AVX_GEN4_OPTSIZE);
625 /* Linearize assoc, if not already linear */
/* Fast path: the first src entry already holds all of the assoc data. */
626 if (req->src->length >= assoclen && req->src->length) {
627 scatterwalk_start(&assoc_sg_walk, req->src);
628 assoc = scatterwalk_map(&assoc_sg_walk);
/* Otherwise copy the assoc data into a heap buffer. */
630 gfp_t flags = (req->base.flags & CRYPTO_TFM_REQ_MAY_SLEEP) ?
631 GFP_KERNEL : GFP_ATOMIC;
633 /* assoc can be any length, so must be on heap */
634 assocmem = kmalloc(assoclen, flags);
635 if (unlikely(!assocmem))
639 scatterwalk_map_and_copy(assoc, req->src, 0, assoclen, 0);
/* Init with the selected implementation. */
643 if (static_branch_likely(&gcm_use_avx2) && do_avx2)
644 aesni_gcm_init_avx_gen4(aes_ctx, data, iv, hash_subkey, assoc,
646 else if (static_branch_likely(&gcm_use_avx) && do_avx)
647 aesni_gcm_init_avx_gen2(aes_ctx, data, iv, hash_subkey, assoc,
650 aesni_gcm_init(aes_ctx, data, iv, hash_subkey, assoc, assoclen);
654 scatterwalk_unmap(assoc);
/* Walk the payload; the direction selects the AEAD walk helper. */
658 err = enc ? skcipher_walk_aead_encrypt(&walk, req, false)
659 : skcipher_walk_aead_decrypt(&walk, req, false);
661 while (walk.nbytes > 0) {
663 if (static_branch_likely(&gcm_use_avx2) && do_avx2) {
665 aesni_gcm_enc_update_avx_gen4(aes_ctx, data,
670 aesni_gcm_dec_update_avx_gen4(aes_ctx, data,
674 } else if (static_branch_likely(&gcm_use_avx) && do_avx) {
676 aesni_gcm_enc_update_avx_gen2(aes_ctx, data,
681 aesni_gcm_dec_update_avx_gen2(aes_ctx, data,
686 aesni_gcm_enc_update(aes_ctx, data, walk.dst.virt.addr,
687 walk.src.virt.addr, walk.nbytes);
689 aesni_gcm_dec_update(aes_ctx, data, walk.dst.virt.addr,
690 walk.src.virt.addr, walk.nbytes);
/* Whole chunk consumed: 0 bytes left over. */
694 err = skcipher_walk_done(&walk, 0);
/* Produce the tag with the same implementation that did init/update. */
701 if (static_branch_likely(&gcm_use_avx2) && do_avx2)
702 aesni_gcm_finalize_avx_gen4(aes_ctx, data, auth_tag,
704 else if (static_branch_likely(&gcm_use_avx) && do_avx)
705 aesni_gcm_finalize_avx_gen2(aes_ctx, data, auth_tag,
708 aesni_gcm_finalize(aes_ctx, data, auth_tag, auth_tag_len);
/*
 * GCM encrypt: run gcmaes_crypt_by_sg() in encrypt direction with the
 * transform's tag size, then copy auth_tag into req->dst at offset
 * req->assoclen + req->cryptlen.
 * NOTE(review): the declarations of auth_tag/err, the error check after
 * gcmaes_crypt_by_sg(), the trailing arguments of the copy and the return
 * are on lines not visible in this excerpt.
 */
714 static int gcmaes_encrypt(struct aead_request *req, unsigned int assoclen,
715 u8 *hash_subkey, u8 *iv, void *aes_ctx)
717 struct crypto_aead *tfm = crypto_aead_reqtfm(req);
718 unsigned long auth_tag_len = crypto_aead_authsize(tfm);
722 err = gcmaes_crypt_by_sg(true, req, assoclen, hash_subkey, iv, aes_ctx,
723 auth_tag, auth_tag_len);
727 scatterwalk_map_and_copy(auth_tag, req->dst,
728 req->assoclen + req->cryptlen,
/*
 * GCM decrypt: run gcmaes_crypt_by_sg() in decrypt direction to compute the
 * tag, fetch the received tag from req->src at offset
 * req->assoclen + req->cryptlen - auth_tag_len, and compare the two with
 * crypto_memneq().  On mismatch the computed tag is wiped with
 * memzero_explicit().
 * NOTE(review): the declarations of auth_tag/auth_tag_msg/err, the error
 * check, the trailing arguments of the copy and all return statements are on
 * lines not visible in this excerpt.  sizeof(auth_tag) is only the buffer
 * size if auth_tag is declared as an array - confirm against the missing
 * declaration.
 */
733 static int gcmaes_decrypt(struct aead_request *req, unsigned int assoclen,
734 u8 *hash_subkey, u8 *iv, void *aes_ctx)
736 struct crypto_aead *tfm = crypto_aead_reqtfm(req);
737 unsigned long auth_tag_len = crypto_aead_authsize(tfm);
742 err = gcmaes_crypt_by_sg(false, req, assoclen, hash_subkey, iv, aes_ctx,
743 auth_tag, auth_tag_len);
747 /* Copy out original auth_tag */
748 scatterwalk_map_and_copy(auth_tag_msg, req->src,
749 req->assoclen + req->cryptlen - auth_tag_len,
752 /* Compare generated tag with passed in tag. */
753 if (crypto_memneq(auth_tag_msg, auth_tag, auth_tag_len)) {
754 memzero_explicit(auth_tag, sizeof(auth_tag));
/*
 * .encrypt handler of the "__rfc4106(gcm(aes))" AEAD.
 *
 * Builds the 16-byte IV block as: 4 bytes of ctx->nonce, 8 bytes of
 * req->iv, then the 32-bit big-endian value 1, and calls gcmaes_encrypt()
 * with req->assoclen - 8 as the associated-data length.
 * NOTE(review): the declaration of i, the statement taken when the assoclen
 * check fails, and the last argument line of the gcmaes_encrypt() call are
 * not visible in this excerpt.
 */
760 static int helper_rfc4106_encrypt(struct aead_request *req)
762 struct crypto_aead *tfm = crypto_aead_reqtfm(req);
763 struct aesni_rfc4106_gcm_ctx *ctx = aesni_rfc4106_gcm_ctx_get(tfm);
764 void *aes_ctx = &(ctx->aes_key_expanded);
/* Over-sized by AESNI_ALIGN - 8 so `iv` can be aligned inside it. */
765 u8 ivbuf[16 + (AESNI_ALIGN - 8)] __aligned(8);
766 u8 *iv = PTR_ALIGN(&ivbuf[0], AESNI_ALIGN);
768 __be32 counter = cpu_to_be32(1);
770 /* Assuming we are supporting rfc4106 64-bit extended */
771 /* sequence numbers We need to have the AAD length equal */
772 /* to 16 or 20 bytes */
773 if (unlikely(req->assoclen != 16 && req->assoclen != 20))
/* IV layout: nonce[0..3] | req->iv[0..7] | be32 counter. */
777 for (i = 0; i < 4; i++)
778 *(iv+i) = ctx->nonce[i];
779 for (i = 0; i < 8; i++)
780 *(iv+4+i) = req->iv[i];
781 *((__be32 *)(iv+12)) = counter;
783 return gcmaes_encrypt(req, req->assoclen - 8, ctx->hash_subkey, iv,
/*
 * .decrypt handler of the "__rfc4106(gcm(aes))" AEAD.
 *
 * Builds the 16-byte IV block as: 4 bytes of ctx->nonce, 8 bytes of
 * req->iv, then the 32-bit big-endian value 1, and calls gcmaes_decrypt()
 * with req->assoclen - 8 as the associated-data length.
 * NOTE(review): the declaration of i, the statement taken when the assoclen
 * check fails, and the last argument line of the gcmaes_decrypt() call are
 * not visible in this excerpt.
 */
787 static int helper_rfc4106_decrypt(struct aead_request *req)
789 __be32 counter = cpu_to_be32(1);
790 struct crypto_aead *tfm = crypto_aead_reqtfm(req);
791 struct aesni_rfc4106_gcm_ctx *ctx = aesni_rfc4106_gcm_ctx_get(tfm);
792 void *aes_ctx = &(ctx->aes_key_expanded);
/* Over-sized by AESNI_ALIGN - 8 so `iv` can be aligned inside it. */
793 u8 ivbuf[16 + (AESNI_ALIGN - 8)] __aligned(8);
794 u8 *iv = PTR_ALIGN(&ivbuf[0], AESNI_ALIGN);
797 if (unlikely(req->assoclen != 16 && req->assoclen != 20))
800 /* Assuming we are supporting rfc4106 64-bit extended */
801 /* sequence numbers We need to have the AAD length */
802 /* equal to 16 or 20 bytes */
/* IV layout: nonce[0..3] | req->iv[0..7] | be32 counter. */
805 for (i = 0; i < 4; i++)
806 *(iv+i) = ctx->nonce[i];
807 for (i = 0; i < 8; i++)
808 *(iv+4+i) = req->iv[i];
809 *((__be32 *)(iv+12)) = counter;
811 return gcmaes_decrypt(req, req->assoclen - 8, ctx->hash_subkey, iv,
/*
 * .setkey handler of the "__xts(aes)" skcipher.
 *
 * Validates the key with xts_verify_key(), then expands the first part of
 * @key into ctx->raw_crypt_ctx and the part starting at key + keylen into
 * ctx->raw_tweak_ctx, both via aes_set_key_common().
 * NOTE(review): the keylen parameter line, the err declaration, the error
 * checks and the lines between xts_verify_key() and the first
 * aes_set_key_common() are not visible in this excerpt; presumably keylen is
 * halved there, which is what makes key + keylen the second half - confirm.
 */
816 static int xts_aesni_setkey(struct crypto_skcipher *tfm, const u8 *key,
819 struct aesni_xts_ctx *ctx = crypto_skcipher_ctx(tfm);
822 err = xts_verify_key(tfm, key, keylen);
828 /* first half of xts-key is for crypt */
829 err = aes_set_key_common(crypto_skcipher_tfm(tfm), ctx->raw_crypt_ctx,
834 /* second half of xts-key is for tweak */
835 return aes_set_key_common(crypto_skcipher_tfm(tfm), ctx->raw_tweak_ctx,
836 key + keylen, keylen);
/*
 * XTS encryption/decryption shared by xts_encrypt() and xts_decrypt().
 * @req:     skcipher request
 * @encrypt: direction selector passed by the two wrappers
 *
 * Outline of the visible code:
 *  - `tail` is the number of bytes beyond the last whole block.
 *  - If there is a tail and the first walk step does not cover the whole
 *    request, the walk is aborted and a sub-request covering all but the
 *    last two blocks (rounded up) is set up and walked instead.
 *  - The IV is encrypted once with the tweak key to obtain the first tweak.
 *  - Each walk chunk is processed by aesni_xts_encrypt()/aesni_xts_decrypt();
 *    on all chunks but the last, only whole blocks are consumed.
 *  - If a tail remains and no error occurred, the last full block plus the
 *    tail (AES_BLOCK_SIZE + tail bytes) are processed in a second pass.
 * NOTE(review): many short lines are not visible in this excerpt: the err
 * declaration, early returns, `else` branches, the `if (encrypt)` tests, the
 * statement that presumably points req at subreq before the second
 * skcipher_walk_virt(), call continuation arguments and any FPU bracketing.
 */
839 static int xts_crypt(struct skcipher_request *req, bool encrypt)
841 struct crypto_skcipher *tfm = crypto_skcipher_reqtfm(req);
842 struct aesni_xts_ctx *ctx = crypto_skcipher_ctx(tfm);
843 int tail = req->cryptlen % AES_BLOCK_SIZE;
844 struct skcipher_request subreq;
845 struct skcipher_walk walk;
/* Requests shorter than one block are special-cased (statement not visible). */
848 if (req->cryptlen < AES_BLOCK_SIZE)
851 err = skcipher_walk_virt(&walk, req, false);
/* Tail present and the data is not available in a single walk step. */
855 if (unlikely(tail > 0 && walk.nbytes < walk.total)) {
856 int blocks = DIV_ROUND_UP(req->cryptlen, AES_BLOCK_SIZE) - 2;
858 skcipher_walk_abort(&walk);
860 skcipher_request_set_tfm(&subreq, tfm);
861 skcipher_request_set_callback(&subreq,
862 skcipher_request_flags(req),
864 skcipher_request_set_crypt(&subreq, req->src, req->dst,
865 blocks * AES_BLOCK_SIZE, req->iv);
868 err = skcipher_walk_virt(&walk, req, false);
877 /* calculate first value of T */
878 aesni_enc(aes_ctx(ctx->raw_tweak_ctx), walk.iv, walk.iv);
880 while (walk.nbytes > 0) {
881 int nbytes = walk.nbytes;
/* Not the final chunk: round down to whole blocks. */
883 if (nbytes < walk.total)
884 nbytes &= ~(AES_BLOCK_SIZE - 1);
887 aesni_xts_encrypt(aes_ctx(ctx->raw_crypt_ctx),
888 walk.dst.virt.addr, walk.src.virt.addr,
891 aesni_xts_decrypt(aes_ctx(ctx->raw_crypt_ctx),
892 walk.dst.virt.addr, walk.src.virt.addr,
/* Report the bytes of this chunk that were not processed. */
896 err = skcipher_walk_done(&walk, walk.nbytes - nbytes);
/* Second pass: last full block together with the partial tail. */
902 if (unlikely(tail > 0 && !err)) {
903 struct scatterlist sg_src[2], sg_dst[2];
904 struct scatterlist *src, *dst;
/* Skip the req->cryptlen bytes covered by the first pass. */
906 dst = src = scatterwalk_ffwd(sg_src, req->src, req->cryptlen);
907 if (req->dst != req->src)
908 dst = scatterwalk_ffwd(sg_dst, req->dst, req->cryptlen);
910 skcipher_request_set_crypt(req, src, dst, AES_BLOCK_SIZE + tail,
913 err = skcipher_walk_virt(&walk, &subreq, false);
919 aesni_xts_encrypt(aes_ctx(ctx->raw_crypt_ctx),
920 walk.dst.virt.addr, walk.src.virt.addr,
921 walk.nbytes, walk.iv);
923 aesni_xts_decrypt(aes_ctx(ctx->raw_crypt_ctx),
924 walk.dst.virt.addr, walk.src.virt.addr,
925 walk.nbytes, walk.iv);
928 err = skcipher_walk_done(&walk, 0);
/* .encrypt handler of the "__xts(aes)" skcipher: xts_crypt() with encrypt = true. */
933 static int xts_encrypt(struct skcipher_request *req)
935 return xts_crypt(req, true);
/* .decrypt handler of the "__xts(aes)" skcipher: xts_crypt() with encrypt = false. */
938 static int xts_decrypt(struct skcipher_request *req)
940 return xts_crypt(req, false);
/*
 * Single-block cipher algorithm "aes-aesni", registered by aesni_init() with
 * crypto_register_alg().  Its handlers are aes_set_key(), aesni_encrypt()
 * and aesni_decrypt(); the context is sized with CRYPTO_AES_CTX_SIZE.
 * NOTE(review): the .cra_name and .cra_priority initialisers and the nested
 * initialiser braces are on lines not visible in this excerpt.
 */
943 static struct crypto_alg aesni_cipher_alg = {
945 .cra_driver_name = "aes-aesni",
947 .cra_flags = CRYPTO_ALG_TYPE_CIPHER,
948 .cra_blocksize = AES_BLOCK_SIZE,
949 .cra_ctxsize = CRYPTO_AES_CTX_SIZE,
950 .cra_module = THIS_MODULE,
953 .cia_min_keysize = AES_MIN_KEY_SIZE,
954 .cia_max_keysize = AES_MAX_KEY_SIZE,
955 .cia_setkey = aes_set_key,
956 .cia_encrypt = aesni_encrypt,
957 .cia_decrypt = aesni_decrypt
/*
 * Table of skcipher algorithms, all flagged CRYPTO_ALG_INTERNAL.
 * aesni_init() registers the table with simd_register_skciphers_compat()
 * and aesni_exit() unregisters it.
 * NOTE(review): the braces separating the entries, several .cra_priority
 * lines, the #endif matching the #ifdef below and the closing of the array
 * are on lines not visible in this excerpt.
 */
962 static struct skcipher_alg aesni_skciphers[] = {
/* ECB: no .ivsize initialiser is visible for this entry. */
965 .cra_name = "__ecb(aes)",
966 .cra_driver_name = "__ecb-aes-aesni",
968 .cra_flags = CRYPTO_ALG_INTERNAL,
969 .cra_blocksize = AES_BLOCK_SIZE,
970 .cra_ctxsize = CRYPTO_AES_CTX_SIZE,
971 .cra_module = THIS_MODULE,
973 .min_keysize = AES_MIN_KEY_SIZE,
974 .max_keysize = AES_MAX_KEY_SIZE,
975 .setkey = aesni_skcipher_setkey,
976 .encrypt = ecb_encrypt,
977 .decrypt = ecb_decrypt,
/* CBC */
980 .cra_name = "__cbc(aes)",
981 .cra_driver_name = "__cbc-aes-aesni",
983 .cra_flags = CRYPTO_ALG_INTERNAL,
984 .cra_blocksize = AES_BLOCK_SIZE,
985 .cra_ctxsize = CRYPTO_AES_CTX_SIZE,
986 .cra_module = THIS_MODULE,
988 .min_keysize = AES_MIN_KEY_SIZE,
989 .max_keysize = AES_MAX_KEY_SIZE,
990 .ivsize = AES_BLOCK_SIZE,
991 .setkey = aesni_skcipher_setkey,
992 .encrypt = cbc_encrypt,
993 .decrypt = cbc_decrypt,
/* CBC with ciphertext stealing; walksize covers two blocks. */
996 .cra_name = "__cts(cbc(aes))",
997 .cra_driver_name = "__cts-cbc-aes-aesni",
999 .cra_flags = CRYPTO_ALG_INTERNAL,
1000 .cra_blocksize = AES_BLOCK_SIZE,
1001 .cra_ctxsize = CRYPTO_AES_CTX_SIZE,
1002 .cra_module = THIS_MODULE,
1004 .min_keysize = AES_MIN_KEY_SIZE,
1005 .max_keysize = AES_MAX_KEY_SIZE,
1006 .ivsize = AES_BLOCK_SIZE,
1007 .walksize = 2 * AES_BLOCK_SIZE,
1008 .setkey = aesni_skcipher_setkey,
1009 .encrypt = cts_cbc_encrypt,
1010 .decrypt = cts_cbc_decrypt,
/* The entries from here on are only compiled for CONFIG_X86_64. */
1011 #ifdef CONFIG_X86_64
/* CTR: the same function serves both directions. */
1014 .cra_name = "__ctr(aes)",
1015 .cra_driver_name = "__ctr-aes-aesni",
1016 .cra_priority = 400,
1017 .cra_flags = CRYPTO_ALG_INTERNAL,
1019 .cra_ctxsize = CRYPTO_AES_CTX_SIZE,
1020 .cra_module = THIS_MODULE,
1022 .min_keysize = AES_MIN_KEY_SIZE,
1023 .max_keysize = AES_MAX_KEY_SIZE,
1024 .ivsize = AES_BLOCK_SIZE,
1025 .chunksize = AES_BLOCK_SIZE,
1026 .setkey = aesni_skcipher_setkey,
1027 .encrypt = ctr_crypt,
1028 .decrypt = ctr_crypt,
/* XTS: key sizes are doubled (crypt key + tweak key), own context size. */
1032 .cra_name = "__xts(aes)",
1033 .cra_driver_name = "__xts-aes-aesni",
1034 .cra_priority = 401,
1035 .cra_flags = CRYPTO_ALG_INTERNAL,
1036 .cra_blocksize = AES_BLOCK_SIZE,
1037 .cra_ctxsize = XTS_AES_CTX_SIZE,
1038 .cra_module = THIS_MODULE,
1040 .min_keysize = 2 * AES_MIN_KEY_SIZE,
1041 .max_keysize = 2 * AES_MAX_KEY_SIZE,
1042 .ivsize = AES_BLOCK_SIZE,
1043 .walksize = 2 * AES_BLOCK_SIZE,
1044 .setkey = xts_aesni_setkey,
1045 .encrypt = xts_encrypt,
1046 .decrypt = xts_decrypt,
/*
 * One slot per aesni_skciphers entry; passed to
 * simd_register_skciphers_compat() / simd_unregister_skciphers() alongside
 * the table.  NOTE(review): the line preceding this declaration is not
 * visible in this excerpt (presumably a storage-class specifier).
 */
1051 struct simd_skcipher_alg *aesni_simd_skciphers[ARRAY_SIZE(aesni_skciphers)];
1053 #ifdef CONFIG_X86_64
/*
 * .setkey handler of the "__gcm(aes)" AEAD: expand the AES key via
 * aes_set_key_common() and, if that returned 0, derive the hash subkey with
 * rfc4106_set_hash_subkey().  Unlike common_rfc4106_set_key(), no nonce is
 * taken from the key material.
 */
1054 static int generic_gcmaes_set_key(struct crypto_aead *aead, const u8 *key,
1055 unsigned int key_len)
1057 struct generic_gcmaes_ctx *ctx = generic_gcmaes_ctx_get(aead);
/* `a ?: b` yields a when it is non-zero (an error), otherwise evaluates b. */
1059 return aes_set_key_common(crypto_aead_tfm(aead),
1060 &ctx->aes_key_expanded, key, key_len) ?:
1061 rfc4106_set_hash_subkey(ctx->hash_subkey, key, key_len);
/*
 * .encrypt handler of the "__gcm(aes)" AEAD.
 * Builds the 16-byte IV block from the 12 bytes of req->iv followed by the
 * 32-bit big-endian value 1, then calls gcmaes_encrypt() with the full
 * req->assoclen.
 * NOTE(review): the last argument line of the gcmaes_encrypt() call is not
 * visible in this excerpt.
 */
1064 static int generic_gcmaes_encrypt(struct aead_request *req)
1066 struct crypto_aead *tfm = crypto_aead_reqtfm(req);
1067 struct generic_gcmaes_ctx *ctx = generic_gcmaes_ctx_get(tfm);
1068 void *aes_ctx = &(ctx->aes_key_expanded);
/* Over-sized by AESNI_ALIGN - 8 so `iv` can be aligned inside it. */
1069 u8 ivbuf[16 + (AESNI_ALIGN - 8)] __aligned(8);
1070 u8 *iv = PTR_ALIGN(&ivbuf[0], AESNI_ALIGN);
1071 __be32 counter = cpu_to_be32(1);
1073 memcpy(iv, req->iv, 12);
1074 *((__be32 *)(iv+12)) = counter;
1076 return gcmaes_encrypt(req, req->assoclen, ctx->hash_subkey, iv,
/*
 * .decrypt handler of the "__gcm(aes)" AEAD.
 * Builds the 16-byte IV block from the 12 bytes of req->iv followed by the
 * 32-bit big-endian value 1, then calls gcmaes_decrypt() with the full
 * req->assoclen.
 * NOTE(review): the last argument line of the gcmaes_decrypt() call is not
 * visible in this excerpt.
 */
1080 static int generic_gcmaes_decrypt(struct aead_request *req)
1082 __be32 counter = cpu_to_be32(1);
1083 struct crypto_aead *tfm = crypto_aead_reqtfm(req);
1084 struct generic_gcmaes_ctx *ctx = generic_gcmaes_ctx_get(tfm);
1085 void *aes_ctx = &(ctx->aes_key_expanded);
/* Over-sized by AESNI_ALIGN - 8 so `iv` can be aligned inside it. */
1086 u8 ivbuf[16 + (AESNI_ALIGN - 8)] __aligned(8);
1087 u8 *iv = PTR_ALIGN(&ivbuf[0], AESNI_ALIGN);
1089 memcpy(iv, req->iv, 12);
1090 *((__be32 *)(iv+12)) = counter;
1092 return gcmaes_decrypt(req, req->assoclen, ctx->hash_subkey, iv,
/*
 * Table of the two AEAD algorithms, both flagged CRYPTO_ALG_INTERNAL with
 * priority 400; aesni_init() registers it with
 * simd_register_aeads_compat().  This definition sits inside an
 * #ifdef CONFIG_X86_64 section.
 * NOTE(review): .maxauthsize, .cra_blocksize, .cra_alignmask, the nested
 * .base braces, the separator between the two entries and the closing of the
 * array are on lines not visible in this excerpt.
 */
1096 static struct aead_alg aesni_aeads[] = { {
/* Entry 0: rfc4106 GCM (nonce taken from the key, see common_rfc4106_set_key()). */
1097 .setkey = common_rfc4106_set_key,
1098 .setauthsize = common_rfc4106_set_authsize,
1099 .encrypt = helper_rfc4106_encrypt,
1100 .decrypt = helper_rfc4106_decrypt,
1101 .ivsize = GCM_RFC4106_IV_SIZE,
1104 .cra_name = "__rfc4106(gcm(aes))",
1105 .cra_driver_name = "__rfc4106-gcm-aesni",
1106 .cra_priority = 400,
1107 .cra_flags = CRYPTO_ALG_INTERNAL,
1109 .cra_ctxsize = sizeof(struct aesni_rfc4106_gcm_ctx),
1111 .cra_module = THIS_MODULE,
/* Entry 1: plain GCM. */
1114 .setkey = generic_gcmaes_set_key,
1115 .setauthsize = generic_gcmaes_set_authsize,
1116 .encrypt = generic_gcmaes_encrypt,
1117 .decrypt = generic_gcmaes_decrypt,
1118 .ivsize = GCM_AES_IV_SIZE,
1121 .cra_name = "__gcm(aes)",
1122 .cra_driver_name = "__generic-gcm-aesni",
1123 .cra_priority = 400,
1124 .cra_flags = CRYPTO_ALG_INTERNAL,
1126 .cra_ctxsize = sizeof(struct generic_gcmaes_ctx),
1128 .cra_module = THIS_MODULE,
/*
 * Zero-length stand-in for the AEAD table.
 * NOTE(review): presumably this is the #else branch of the CONFIG_X86_64
 * section, so that the ARRAY_SIZE() uses below still compile when the real
 * table is absent; the #else/#endif lines are not visible in this excerpt.
 */
1132 static struct aead_alg aesni_aeads[0];
/* One slot per aesni_aeads entry, filled in by simd_register_aeads_compat(). */
1135 static struct simd_aead_alg *aesni_simd_aeads[ARRAY_SIZE(aesni_aeads)];
/*
 * CPU match table: matches CPUs with X86_FEATURE_AES.  aesni_init() checks
 * it with x86_match_cpu(), and it is exported via MODULE_DEVICE_TABLE().
 * (The terminating entry and closing brace are not visible in this excerpt.)
 */
1137 static const struct x86_cpu_id aesni_cpu_id[] = {
1138 X86_MATCH_FEATURE(X86_FEATURE_AES, NULL),
1141 MODULE_DEVICE_TABLE(x86cpu, aesni_cpu_id);
/*
 * Module init.
 *
 * 1. Check the CPU against aesni_cpu_id (the statement executed on a
 *    mismatch is not visible here).
 * 2. On CONFIG_X86_64: enable the GCM static keys according to AVX2/AVX
 *    support and, with AVX, retarget the CTR static call to the by8
 *    implementation.
 * 3. Register the single-block cipher, the skcipher table and the AEAD
 *    table, unwinding earlier registrations through the labels at the end
 *    when a later one fails.
 * NOTE(review): the err declaration, `else` lines, the #endif, error checks,
 * the success return, the unregister_cipher label and the final return are
 * on lines not visible in this excerpt.
 */
1143 static int __init aesni_init(void)
1147 if (!x86_match_cpu(aesni_cpu_id))
1149 #ifdef CONFIG_X86_64
/* AVX2 enables both keys, so the avx_gen2 path stays available as well. */
1150 if (boot_cpu_has(X86_FEATURE_AVX2)) {
1151 pr_info("AVX2 version of gcm_enc/dec engaged.\n");
1152 static_branch_enable(&gcm_use_avx);
1153 static_branch_enable(&gcm_use_avx2);
1155 if (boot_cpu_has(X86_FEATURE_AVX)) {
1156 pr_info("AVX version of gcm_enc/dec engaged.\n");
1157 static_branch_enable(&gcm_use_avx);
1159 pr_info("SSE version of gcm_enc/dec engaged.\n");
1161 if (boot_cpu_has(X86_FEATURE_AVX)) {
1162 /* optimize performance of ctr mode encryption transform */
1163 static_call_update(aesni_ctr_enc_tfm, aesni_ctr_enc_avx_tfm);
1164 pr_info("AES CTR mode by8 optimization enabled\n");
1168 err = crypto_register_alg(&aesni_cipher_alg);
1172 err = simd_register_skciphers_compat(aesni_skciphers,
1173 ARRAY_SIZE(aesni_skciphers),
1174 aesni_simd_skciphers);
1176 goto unregister_cipher;
1178 err = simd_register_aeads_compat(aesni_aeads, ARRAY_SIZE(aesni_aeads),
1181 goto unregister_skciphers;
/* Error unwinding: undo registrations in reverse order. */
1185 unregister_skciphers:
1186 simd_unregister_skciphers(aesni_skciphers, ARRAY_SIZE(aesni_skciphers),
1187 aesni_simd_skciphers);
1189 crypto_unregister_alg(&aesni_cipher_alg);
/*
 * Module exit: unregister everything aesni_init() registered, in reverse
 * order (AEADs, skciphers, single-block cipher).
 * NOTE(review): the last argument line of simd_unregister_aeads() is not
 * visible in this excerpt.
 */
1193 static void __exit aesni_exit(void)
1195 simd_unregister_aeads(aesni_aeads, ARRAY_SIZE(aesni_aeads),
1197 simd_unregister_skciphers(aesni_skciphers, ARRAY_SIZE(aesni_skciphers),
1198 aesni_simd_skciphers);
1199 crypto_unregister_alg(&aesni_cipher_alg);
1202 late_initcall(aesni_init);
1203 module_exit(aesni_exit);
1205 MODULE_DESCRIPTION("Rijndael (AES) Cipher Algorithm, Intel AES-NI instructions optimized");
1206 MODULE_LICENSE("GPL");
1207 MODULE_ALIAS_CRYPTO("aes");