Loading...
1// SPDX-License-Identifier: GPL-2.0-or-later
2/*
3 * Support for AES-NI and VAES instructions. This file contains glue code.
4 * The real AES implementations are in aesni-intel_asm.S and other .S files.
5 *
6 * Copyright (C) 2008, Intel Corp.
7 * Author: Huang Ying <ying.huang@intel.com>
8 *
9 * Added RFC4106 AES-GCM support for 128-bit keys under the AEAD
10 * interface for 64-bit kernels.
11 * Authors: Adrian Hoban <adrian.hoban@intel.com>
12 * Gabriele Paoloni <gabriele.paoloni@intel.com>
13 * Tadeusz Struk (tadeusz.struk@intel.com)
14 * Aidan O'Mahony (aidan.o.mahony@intel.com)
15 * Copyright (c) 2010, Intel Corporation.
16 *
17 * Copyright 2024 Google LLC
18 */
19
20#include <linux/hardirq.h>
21#include <linux/types.h>
22#include <linux/module.h>
23#include <linux/err.h>
24#include <crypto/algapi.h>
25#include <crypto/aes.h>
26#include <crypto/ctr.h>
27#include <crypto/b128ops.h>
28#include <crypto/gcm.h>
29#include <crypto/xts.h>
30#include <asm/cpu_device_id.h>
31#include <asm/simd.h>
32#include <crypto/scatterwalk.h>
33#include <crypto/internal/aead.h>
34#include <crypto/internal/simd.h>
35#include <crypto/internal/skcipher.h>
36#include <linux/jump_label.h>
37#include <linux/workqueue.h>
38#include <linux/spinlock.h>
39#include <linux/static_call.h>
40
41
42#define AESNI_ALIGN 16
43#define AESNI_ALIGN_ATTR __attribute__ ((__aligned__(AESNI_ALIGN)))
44#define AES_BLOCK_MASK (~(AES_BLOCK_SIZE - 1))
45#define AESNI_ALIGN_EXTRA ((AESNI_ALIGN - 1) & ~(CRYPTO_MINALIGN - 1))
46#define CRYPTO_AES_CTX_SIZE (sizeof(struct crypto_aes_ctx) + AESNI_ALIGN_EXTRA)
47#define XTS_AES_CTX_SIZE (sizeof(struct aesni_xts_ctx) + AESNI_ALIGN_EXTRA)
48
49struct aesni_xts_ctx {
50 struct crypto_aes_ctx tweak_ctx AESNI_ALIGN_ATTR;
51 struct crypto_aes_ctx crypt_ctx AESNI_ALIGN_ATTR;
52};
53
54static inline void *aes_align_addr(void *addr)
55{
56 if (crypto_tfm_ctx_alignment() >= AESNI_ALIGN)
57 return addr;
58 return PTR_ALIGN(addr, AESNI_ALIGN);
59}
60
61asmlinkage void aesni_set_key(struct crypto_aes_ctx *ctx, const u8 *in_key,
62 unsigned int key_len);
63asmlinkage void aesni_enc(const void *ctx, u8 *out, const u8 *in);
64asmlinkage void aesni_dec(const void *ctx, u8 *out, const u8 *in);
65asmlinkage void aesni_ecb_enc(struct crypto_aes_ctx *ctx, u8 *out,
66 const u8 *in, unsigned int len);
67asmlinkage void aesni_ecb_dec(struct crypto_aes_ctx *ctx, u8 *out,
68 const u8 *in, unsigned int len);
69asmlinkage void aesni_cbc_enc(struct crypto_aes_ctx *ctx, u8 *out,
70 const u8 *in, unsigned int len, u8 *iv);
71asmlinkage void aesni_cbc_dec(struct crypto_aes_ctx *ctx, u8 *out,
72 const u8 *in, unsigned int len, u8 *iv);
73asmlinkage void aesni_cts_cbc_enc(struct crypto_aes_ctx *ctx, u8 *out,
74 const u8 *in, unsigned int len, u8 *iv);
75asmlinkage void aesni_cts_cbc_dec(struct crypto_aes_ctx *ctx, u8 *out,
76 const u8 *in, unsigned int len, u8 *iv);
77
78asmlinkage void aesni_xts_enc(const struct crypto_aes_ctx *ctx, u8 *out,
79 const u8 *in, unsigned int len, u8 *iv);
80
81asmlinkage void aesni_xts_dec(const struct crypto_aes_ctx *ctx, u8 *out,
82 const u8 *in, unsigned int len, u8 *iv);
83
84#ifdef CONFIG_X86_64
85
86asmlinkage void aesni_ctr_enc(struct crypto_aes_ctx *ctx, u8 *out,
87 const u8 *in, unsigned int len, u8 *iv);
88DEFINE_STATIC_CALL(aesni_ctr_enc_tfm, aesni_ctr_enc);
89
90asmlinkage void aes_ctr_enc_128_avx_by8(const u8 *in, u8 *iv,
91 void *keys, u8 *out, unsigned int num_bytes);
92asmlinkage void aes_ctr_enc_192_avx_by8(const u8 *in, u8 *iv,
93 void *keys, u8 *out, unsigned int num_bytes);
94asmlinkage void aes_ctr_enc_256_avx_by8(const u8 *in, u8 *iv,
95 void *keys, u8 *out, unsigned int num_bytes);
96
97
98asmlinkage void aes_xctr_enc_128_avx_by8(const u8 *in, const u8 *iv,
99 const void *keys, u8 *out, unsigned int num_bytes,
100 unsigned int byte_ctr);
101
102asmlinkage void aes_xctr_enc_192_avx_by8(const u8 *in, const u8 *iv,
103 const void *keys, u8 *out, unsigned int num_bytes,
104 unsigned int byte_ctr);
105
106asmlinkage void aes_xctr_enc_256_avx_by8(const u8 *in, const u8 *iv,
107 const void *keys, u8 *out, unsigned int num_bytes,
108 unsigned int byte_ctr);
109#endif
110
111static inline struct crypto_aes_ctx *aes_ctx(void *raw_ctx)
112{
113 return aes_align_addr(raw_ctx);
114}
115
116static inline struct aesni_xts_ctx *aes_xts_ctx(struct crypto_skcipher *tfm)
117{
118 return aes_align_addr(crypto_skcipher_ctx(tfm));
119}
120
121static int aes_set_key_common(struct crypto_aes_ctx *ctx,
122 const u8 *in_key, unsigned int key_len)
123{
124 int err;
125
126 if (!crypto_simd_usable())
127 return aes_expandkey(ctx, in_key, key_len);
128
129 err = aes_check_keylen(key_len);
130 if (err)
131 return err;
132
133 kernel_fpu_begin();
134 aesni_set_key(ctx, in_key, key_len);
135 kernel_fpu_end();
136 return 0;
137}
138
139static int aes_set_key(struct crypto_tfm *tfm, const u8 *in_key,
140 unsigned int key_len)
141{
142 return aes_set_key_common(aes_ctx(crypto_tfm_ctx(tfm)), in_key,
143 key_len);
144}
145
146static void aesni_encrypt(struct crypto_tfm *tfm, u8 *dst, const u8 *src)
147{
148 struct crypto_aes_ctx *ctx = aes_ctx(crypto_tfm_ctx(tfm));
149
150 if (!crypto_simd_usable()) {
151 aes_encrypt(ctx, dst, src);
152 } else {
153 kernel_fpu_begin();
154 aesni_enc(ctx, dst, src);
155 kernel_fpu_end();
156 }
157}
158
159static void aesni_decrypt(struct crypto_tfm *tfm, u8 *dst, const u8 *src)
160{
161 struct crypto_aes_ctx *ctx = aes_ctx(crypto_tfm_ctx(tfm));
162
163 if (!crypto_simd_usable()) {
164 aes_decrypt(ctx, dst, src);
165 } else {
166 kernel_fpu_begin();
167 aesni_dec(ctx, dst, src);
168 kernel_fpu_end();
169 }
170}
171
172static int aesni_skcipher_setkey(struct crypto_skcipher *tfm, const u8 *key,
173 unsigned int len)
174{
175 return aes_set_key_common(aes_ctx(crypto_skcipher_ctx(tfm)), key, len);
176}
177
178static int ecb_encrypt(struct skcipher_request *req)
179{
180 struct crypto_skcipher *tfm = crypto_skcipher_reqtfm(req);
181 struct crypto_aes_ctx *ctx = aes_ctx(crypto_skcipher_ctx(tfm));
182 struct skcipher_walk walk;
183 unsigned int nbytes;
184 int err;
185
186 err = skcipher_walk_virt(&walk, req, false);
187
188 while ((nbytes = walk.nbytes)) {
189 kernel_fpu_begin();
190 aesni_ecb_enc(ctx, walk.dst.virt.addr, walk.src.virt.addr,
191 nbytes & AES_BLOCK_MASK);
192 kernel_fpu_end();
193 nbytes &= AES_BLOCK_SIZE - 1;
194 err = skcipher_walk_done(&walk, nbytes);
195 }
196
197 return err;
198}
199
200static int ecb_decrypt(struct skcipher_request *req)
201{
202 struct crypto_skcipher *tfm = crypto_skcipher_reqtfm(req);
203 struct crypto_aes_ctx *ctx = aes_ctx(crypto_skcipher_ctx(tfm));
204 struct skcipher_walk walk;
205 unsigned int nbytes;
206 int err;
207
208 err = skcipher_walk_virt(&walk, req, false);
209
210 while ((nbytes = walk.nbytes)) {
211 kernel_fpu_begin();
212 aesni_ecb_dec(ctx, walk.dst.virt.addr, walk.src.virt.addr,
213 nbytes & AES_BLOCK_MASK);
214 kernel_fpu_end();
215 nbytes &= AES_BLOCK_SIZE - 1;
216 err = skcipher_walk_done(&walk, nbytes);
217 }
218
219 return err;
220}
221
222static int cbc_encrypt(struct skcipher_request *req)
223{
224 struct crypto_skcipher *tfm = crypto_skcipher_reqtfm(req);
225 struct crypto_aes_ctx *ctx = aes_ctx(crypto_skcipher_ctx(tfm));
226 struct skcipher_walk walk;
227 unsigned int nbytes;
228 int err;
229
230 err = skcipher_walk_virt(&walk, req, false);
231
232 while ((nbytes = walk.nbytes)) {
233 kernel_fpu_begin();
234 aesni_cbc_enc(ctx, walk.dst.virt.addr, walk.src.virt.addr,
235 nbytes & AES_BLOCK_MASK, walk.iv);
236 kernel_fpu_end();
237 nbytes &= AES_BLOCK_SIZE - 1;
238 err = skcipher_walk_done(&walk, nbytes);
239 }
240
241 return err;
242}
243
244static int cbc_decrypt(struct skcipher_request *req)
245{
246 struct crypto_skcipher *tfm = crypto_skcipher_reqtfm(req);
247 struct crypto_aes_ctx *ctx = aes_ctx(crypto_skcipher_ctx(tfm));
248 struct skcipher_walk walk;
249 unsigned int nbytes;
250 int err;
251
252 err = skcipher_walk_virt(&walk, req, false);
253
254 while ((nbytes = walk.nbytes)) {
255 kernel_fpu_begin();
256 aesni_cbc_dec(ctx, walk.dst.virt.addr, walk.src.virt.addr,
257 nbytes & AES_BLOCK_MASK, walk.iv);
258 kernel_fpu_end();
259 nbytes &= AES_BLOCK_SIZE - 1;
260 err = skcipher_walk_done(&walk, nbytes);
261 }
262
263 return err;
264}
265
266static int cts_cbc_encrypt(struct skcipher_request *req)
267{
268 struct crypto_skcipher *tfm = crypto_skcipher_reqtfm(req);
269 struct crypto_aes_ctx *ctx = aes_ctx(crypto_skcipher_ctx(tfm));
270 int cbc_blocks = DIV_ROUND_UP(req->cryptlen, AES_BLOCK_SIZE) - 2;
271 struct scatterlist *src = req->src, *dst = req->dst;
272 struct scatterlist sg_src[2], sg_dst[2];
273 struct skcipher_request subreq;
274 struct skcipher_walk walk;
275 int err;
276
277 skcipher_request_set_tfm(&subreq, tfm);
278 skcipher_request_set_callback(&subreq, skcipher_request_flags(req),
279 NULL, NULL);
280
281 if (req->cryptlen <= AES_BLOCK_SIZE) {
282 if (req->cryptlen < AES_BLOCK_SIZE)
283 return -EINVAL;
284 cbc_blocks = 1;
285 }
286
287 if (cbc_blocks > 0) {
288 skcipher_request_set_crypt(&subreq, req->src, req->dst,
289 cbc_blocks * AES_BLOCK_SIZE,
290 req->iv);
291
292 err = cbc_encrypt(&subreq);
293 if (err)
294 return err;
295
296 if (req->cryptlen == AES_BLOCK_SIZE)
297 return 0;
298
299 dst = src = scatterwalk_ffwd(sg_src, req->src, subreq.cryptlen);
300 if (req->dst != req->src)
301 dst = scatterwalk_ffwd(sg_dst, req->dst,
302 subreq.cryptlen);
303 }
304
305 /* handle ciphertext stealing */
306 skcipher_request_set_crypt(&subreq, src, dst,
307 req->cryptlen - cbc_blocks * AES_BLOCK_SIZE,
308 req->iv);
309
310 err = skcipher_walk_virt(&walk, &subreq, false);
311 if (err)
312 return err;
313
314 kernel_fpu_begin();
315 aesni_cts_cbc_enc(ctx, walk.dst.virt.addr, walk.src.virt.addr,
316 walk.nbytes, walk.iv);
317 kernel_fpu_end();
318
319 return skcipher_walk_done(&walk, 0);
320}
321
322static int cts_cbc_decrypt(struct skcipher_request *req)
323{
324 struct crypto_skcipher *tfm = crypto_skcipher_reqtfm(req);
325 struct crypto_aes_ctx *ctx = aes_ctx(crypto_skcipher_ctx(tfm));
326 int cbc_blocks = DIV_ROUND_UP(req->cryptlen, AES_BLOCK_SIZE) - 2;
327 struct scatterlist *src = req->src, *dst = req->dst;
328 struct scatterlist sg_src[2], sg_dst[2];
329 struct skcipher_request subreq;
330 struct skcipher_walk walk;
331 int err;
332
333 skcipher_request_set_tfm(&subreq, tfm);
334 skcipher_request_set_callback(&subreq, skcipher_request_flags(req),
335 NULL, NULL);
336
337 if (req->cryptlen <= AES_BLOCK_SIZE) {
338 if (req->cryptlen < AES_BLOCK_SIZE)
339 return -EINVAL;
340 cbc_blocks = 1;
341 }
342
343 if (cbc_blocks > 0) {
344 skcipher_request_set_crypt(&subreq, req->src, req->dst,
345 cbc_blocks * AES_BLOCK_SIZE,
346 req->iv);
347
348 err = cbc_decrypt(&subreq);
349 if (err)
350 return err;
351
352 if (req->cryptlen == AES_BLOCK_SIZE)
353 return 0;
354
355 dst = src = scatterwalk_ffwd(sg_src, req->src, subreq.cryptlen);
356 if (req->dst != req->src)
357 dst = scatterwalk_ffwd(sg_dst, req->dst,
358 subreq.cryptlen);
359 }
360
361 /* handle ciphertext stealing */
362 skcipher_request_set_crypt(&subreq, src, dst,
363 req->cryptlen - cbc_blocks * AES_BLOCK_SIZE,
364 req->iv);
365
366 err = skcipher_walk_virt(&walk, &subreq, false);
367 if (err)
368 return err;
369
370 kernel_fpu_begin();
371 aesni_cts_cbc_dec(ctx, walk.dst.virt.addr, walk.src.virt.addr,
372 walk.nbytes, walk.iv);
373 kernel_fpu_end();
374
375 return skcipher_walk_done(&walk, 0);
376}
377
378#ifdef CONFIG_X86_64
379static void aesni_ctr_enc_avx_tfm(struct crypto_aes_ctx *ctx, u8 *out,
380 const u8 *in, unsigned int len, u8 *iv)
381{
382 /*
383 * based on key length, override with the by8 version
384 * of ctr mode encryption/decryption for improved performance
385 * aes_set_key_common() ensures that key length is one of
386 * {128,192,256}
387 */
388 if (ctx->key_length == AES_KEYSIZE_128)
389 aes_ctr_enc_128_avx_by8(in, iv, (void *)ctx, out, len);
390 else if (ctx->key_length == AES_KEYSIZE_192)
391 aes_ctr_enc_192_avx_by8(in, iv, (void *)ctx, out, len);
392 else
393 aes_ctr_enc_256_avx_by8(in, iv, (void *)ctx, out, len);
394}
395
396static int ctr_crypt(struct skcipher_request *req)
397{
398 struct crypto_skcipher *tfm = crypto_skcipher_reqtfm(req);
399 struct crypto_aes_ctx *ctx = aes_ctx(crypto_skcipher_ctx(tfm));
400 u8 keystream[AES_BLOCK_SIZE];
401 struct skcipher_walk walk;
402 unsigned int nbytes;
403 int err;
404
405 err = skcipher_walk_virt(&walk, req, false);
406
407 while ((nbytes = walk.nbytes) > 0) {
408 kernel_fpu_begin();
409 if (nbytes & AES_BLOCK_MASK)
410 static_call(aesni_ctr_enc_tfm)(ctx, walk.dst.virt.addr,
411 walk.src.virt.addr,
412 nbytes & AES_BLOCK_MASK,
413 walk.iv);
414 nbytes &= ~AES_BLOCK_MASK;
415
416 if (walk.nbytes == walk.total && nbytes > 0) {
417 aesni_enc(ctx, keystream, walk.iv);
418 crypto_xor_cpy(walk.dst.virt.addr + walk.nbytes - nbytes,
419 walk.src.virt.addr + walk.nbytes - nbytes,
420 keystream, nbytes);
421 crypto_inc(walk.iv, AES_BLOCK_SIZE);
422 nbytes = 0;
423 }
424 kernel_fpu_end();
425 err = skcipher_walk_done(&walk, nbytes);
426 }
427 return err;
428}
429
430static void aesni_xctr_enc_avx_tfm(struct crypto_aes_ctx *ctx, u8 *out,
431 const u8 *in, unsigned int len, u8 *iv,
432 unsigned int byte_ctr)
433{
434 if (ctx->key_length == AES_KEYSIZE_128)
435 aes_xctr_enc_128_avx_by8(in, iv, (void *)ctx, out, len,
436 byte_ctr);
437 else if (ctx->key_length == AES_KEYSIZE_192)
438 aes_xctr_enc_192_avx_by8(in, iv, (void *)ctx, out, len,
439 byte_ctr);
440 else
441 aes_xctr_enc_256_avx_by8(in, iv, (void *)ctx, out, len,
442 byte_ctr);
443}
444
445static int xctr_crypt(struct skcipher_request *req)
446{
447 struct crypto_skcipher *tfm = crypto_skcipher_reqtfm(req);
448 struct crypto_aes_ctx *ctx = aes_ctx(crypto_skcipher_ctx(tfm));
449 u8 keystream[AES_BLOCK_SIZE];
450 struct skcipher_walk walk;
451 unsigned int nbytes;
452 unsigned int byte_ctr = 0;
453 int err;
454 __le32 block[AES_BLOCK_SIZE / sizeof(__le32)];
455
456 err = skcipher_walk_virt(&walk, req, false);
457
458 while ((nbytes = walk.nbytes) > 0) {
459 kernel_fpu_begin();
460 if (nbytes & AES_BLOCK_MASK)
461 aesni_xctr_enc_avx_tfm(ctx, walk.dst.virt.addr,
462 walk.src.virt.addr, nbytes & AES_BLOCK_MASK,
463 walk.iv, byte_ctr);
464 nbytes &= ~AES_BLOCK_MASK;
465 byte_ctr += walk.nbytes - nbytes;
466
467 if (walk.nbytes == walk.total && nbytes > 0) {
468 memcpy(block, walk.iv, AES_BLOCK_SIZE);
469 block[0] ^= cpu_to_le32(1 + byte_ctr / AES_BLOCK_SIZE);
470 aesni_enc(ctx, keystream, (u8 *)block);
471 crypto_xor_cpy(walk.dst.virt.addr + walk.nbytes -
472 nbytes, walk.src.virt.addr + walk.nbytes
473 - nbytes, keystream, nbytes);
474 byte_ctr += nbytes;
475 nbytes = 0;
476 }
477 kernel_fpu_end();
478 err = skcipher_walk_done(&walk, nbytes);
479 }
480 return err;
481}
482#endif
483
484static int xts_setkey_aesni(struct crypto_skcipher *tfm, const u8 *key,
485 unsigned int keylen)
486{
487 struct aesni_xts_ctx *ctx = aes_xts_ctx(tfm);
488 int err;
489
490 err = xts_verify_key(tfm, key, keylen);
491 if (err)
492 return err;
493
494 keylen /= 2;
495
496 /* first half of xts-key is for crypt */
497 err = aes_set_key_common(&ctx->crypt_ctx, key, keylen);
498 if (err)
499 return err;
500
501 /* second half of xts-key is for tweak */
502 return aes_set_key_common(&ctx->tweak_ctx, key + keylen, keylen);
503}
504
505typedef void (*xts_encrypt_iv_func)(const struct crypto_aes_ctx *tweak_key,
506 u8 iv[AES_BLOCK_SIZE]);
507typedef void (*xts_crypt_func)(const struct crypto_aes_ctx *key,
508 const u8 *src, u8 *dst, unsigned int len,
509 u8 tweak[AES_BLOCK_SIZE]);
510
511/* This handles cases where the source and/or destination span pages. */
512static noinline int
513xts_crypt_slowpath(struct skcipher_request *req, xts_crypt_func crypt_func)
514{
515 struct crypto_skcipher *tfm = crypto_skcipher_reqtfm(req);
516 const struct aesni_xts_ctx *ctx = aes_xts_ctx(tfm);
517 int tail = req->cryptlen % AES_BLOCK_SIZE;
518 struct scatterlist sg_src[2], sg_dst[2];
519 struct skcipher_request subreq;
520 struct skcipher_walk walk;
521 struct scatterlist *src, *dst;
522 int err;
523
524 /*
525 * If the message length isn't divisible by the AES block size, then
526 * separate off the last full block and the partial block. This ensures
527 * that they are processed in the same call to the assembly function,
528 * which is required for ciphertext stealing.
529 */
530 if (tail) {
531 skcipher_request_set_tfm(&subreq, tfm);
532 skcipher_request_set_callback(&subreq,
533 skcipher_request_flags(req),
534 NULL, NULL);
535 skcipher_request_set_crypt(&subreq, req->src, req->dst,
536 req->cryptlen - tail - AES_BLOCK_SIZE,
537 req->iv);
538 req = &subreq;
539 }
540
541 err = skcipher_walk_virt(&walk, req, false);
542
543 while (walk.nbytes) {
544 kernel_fpu_begin();
545 (*crypt_func)(&ctx->crypt_ctx,
546 walk.src.virt.addr, walk.dst.virt.addr,
547 walk.nbytes & ~(AES_BLOCK_SIZE - 1), req->iv);
548 kernel_fpu_end();
549 err = skcipher_walk_done(&walk,
550 walk.nbytes & (AES_BLOCK_SIZE - 1));
551 }
552
553 if (err || !tail)
554 return err;
555
556 /* Do ciphertext stealing with the last full block and partial block. */
557
558 dst = src = scatterwalk_ffwd(sg_src, req->src, req->cryptlen);
559 if (req->dst != req->src)
560 dst = scatterwalk_ffwd(sg_dst, req->dst, req->cryptlen);
561
562 skcipher_request_set_crypt(req, src, dst, AES_BLOCK_SIZE + tail,
563 req->iv);
564
565 err = skcipher_walk_virt(&walk, req, false);
566 if (err)
567 return err;
568
569 kernel_fpu_begin();
570 (*crypt_func)(&ctx->crypt_ctx, walk.src.virt.addr, walk.dst.virt.addr,
571 walk.nbytes, req->iv);
572 kernel_fpu_end();
573
574 return skcipher_walk_done(&walk, 0);
575}
576
577/* __always_inline to avoid indirect call in fastpath */
578static __always_inline int
579xts_crypt(struct skcipher_request *req, xts_encrypt_iv_func encrypt_iv,
580 xts_crypt_func crypt_func)
581{
582 struct crypto_skcipher *tfm = crypto_skcipher_reqtfm(req);
583 const struct aesni_xts_ctx *ctx = aes_xts_ctx(tfm);
584 const unsigned int cryptlen = req->cryptlen;
585 struct scatterlist *src = req->src;
586 struct scatterlist *dst = req->dst;
587
588 if (unlikely(cryptlen < AES_BLOCK_SIZE))
589 return -EINVAL;
590
591 kernel_fpu_begin();
592 (*encrypt_iv)(&ctx->tweak_ctx, req->iv);
593
594 /*
595 * In practice, virtually all XTS plaintexts and ciphertexts are either
596 * 512 or 4096 bytes, aligned such that they don't span page boundaries.
597 * To optimize the performance of these cases, and also any other case
598 * where no page boundary is spanned, the below fast-path handles
599 * single-page sources and destinations as efficiently as possible.
600 */
601 if (likely(src->length >= cryptlen && dst->length >= cryptlen &&
602 src->offset + cryptlen <= PAGE_SIZE &&
603 dst->offset + cryptlen <= PAGE_SIZE)) {
604 struct page *src_page = sg_page(src);
605 struct page *dst_page = sg_page(dst);
606 void *src_virt = kmap_local_page(src_page) + src->offset;
607 void *dst_virt = kmap_local_page(dst_page) + dst->offset;
608
609 (*crypt_func)(&ctx->crypt_ctx, src_virt, dst_virt, cryptlen,
610 req->iv);
611 kunmap_local(dst_virt);
612 kunmap_local(src_virt);
613 kernel_fpu_end();
614 return 0;
615 }
616 kernel_fpu_end();
617 return xts_crypt_slowpath(req, crypt_func);
618}
619
620static void aesni_xts_encrypt_iv(const struct crypto_aes_ctx *tweak_key,
621 u8 iv[AES_BLOCK_SIZE])
622{
623 aesni_enc(tweak_key, iv, iv);
624}
625
626static void aesni_xts_encrypt(const struct crypto_aes_ctx *key,
627 const u8 *src, u8 *dst, unsigned int len,
628 u8 tweak[AES_BLOCK_SIZE])
629{
630 aesni_xts_enc(key, dst, src, len, tweak);
631}
632
633static void aesni_xts_decrypt(const struct crypto_aes_ctx *key,
634 const u8 *src, u8 *dst, unsigned int len,
635 u8 tweak[AES_BLOCK_SIZE])
636{
637 aesni_xts_dec(key, dst, src, len, tweak);
638}
639
640static int xts_encrypt_aesni(struct skcipher_request *req)
641{
642 return xts_crypt(req, aesni_xts_encrypt_iv, aesni_xts_encrypt);
643}
644
645static int xts_decrypt_aesni(struct skcipher_request *req)
646{
647 return xts_crypt(req, aesni_xts_encrypt_iv, aesni_xts_decrypt);
648}
649
650static struct crypto_alg aesni_cipher_alg = {
651 .cra_name = "aes",
652 .cra_driver_name = "aes-aesni",
653 .cra_priority = 300,
654 .cra_flags = CRYPTO_ALG_TYPE_CIPHER,
655 .cra_blocksize = AES_BLOCK_SIZE,
656 .cra_ctxsize = CRYPTO_AES_CTX_SIZE,
657 .cra_module = THIS_MODULE,
658 .cra_u = {
659 .cipher = {
660 .cia_min_keysize = AES_MIN_KEY_SIZE,
661 .cia_max_keysize = AES_MAX_KEY_SIZE,
662 .cia_setkey = aes_set_key,
663 .cia_encrypt = aesni_encrypt,
664 .cia_decrypt = aesni_decrypt
665 }
666 }
667};
668
669static struct skcipher_alg aesni_skciphers[] = {
670 {
671 .base = {
672 .cra_name = "__ecb(aes)",
673 .cra_driver_name = "__ecb-aes-aesni",
674 .cra_priority = 400,
675 .cra_flags = CRYPTO_ALG_INTERNAL,
676 .cra_blocksize = AES_BLOCK_SIZE,
677 .cra_ctxsize = CRYPTO_AES_CTX_SIZE,
678 .cra_module = THIS_MODULE,
679 },
680 .min_keysize = AES_MIN_KEY_SIZE,
681 .max_keysize = AES_MAX_KEY_SIZE,
682 .setkey = aesni_skcipher_setkey,
683 .encrypt = ecb_encrypt,
684 .decrypt = ecb_decrypt,
685 }, {
686 .base = {
687 .cra_name = "__cbc(aes)",
688 .cra_driver_name = "__cbc-aes-aesni",
689 .cra_priority = 400,
690 .cra_flags = CRYPTO_ALG_INTERNAL,
691 .cra_blocksize = AES_BLOCK_SIZE,
692 .cra_ctxsize = CRYPTO_AES_CTX_SIZE,
693 .cra_module = THIS_MODULE,
694 },
695 .min_keysize = AES_MIN_KEY_SIZE,
696 .max_keysize = AES_MAX_KEY_SIZE,
697 .ivsize = AES_BLOCK_SIZE,
698 .setkey = aesni_skcipher_setkey,
699 .encrypt = cbc_encrypt,
700 .decrypt = cbc_decrypt,
701 }, {
702 .base = {
703 .cra_name = "__cts(cbc(aes))",
704 .cra_driver_name = "__cts-cbc-aes-aesni",
705 .cra_priority = 400,
706 .cra_flags = CRYPTO_ALG_INTERNAL,
707 .cra_blocksize = AES_BLOCK_SIZE,
708 .cra_ctxsize = CRYPTO_AES_CTX_SIZE,
709 .cra_module = THIS_MODULE,
710 },
711 .min_keysize = AES_MIN_KEY_SIZE,
712 .max_keysize = AES_MAX_KEY_SIZE,
713 .ivsize = AES_BLOCK_SIZE,
714 .walksize = 2 * AES_BLOCK_SIZE,
715 .setkey = aesni_skcipher_setkey,
716 .encrypt = cts_cbc_encrypt,
717 .decrypt = cts_cbc_decrypt,
718#ifdef CONFIG_X86_64
719 }, {
720 .base = {
721 .cra_name = "__ctr(aes)",
722 .cra_driver_name = "__ctr-aes-aesni",
723 .cra_priority = 400,
724 .cra_flags = CRYPTO_ALG_INTERNAL,
725 .cra_blocksize = 1,
726 .cra_ctxsize = CRYPTO_AES_CTX_SIZE,
727 .cra_module = THIS_MODULE,
728 },
729 .min_keysize = AES_MIN_KEY_SIZE,
730 .max_keysize = AES_MAX_KEY_SIZE,
731 .ivsize = AES_BLOCK_SIZE,
732 .chunksize = AES_BLOCK_SIZE,
733 .setkey = aesni_skcipher_setkey,
734 .encrypt = ctr_crypt,
735 .decrypt = ctr_crypt,
736#endif
737 }, {
738 .base = {
739 .cra_name = "__xts(aes)",
740 .cra_driver_name = "__xts-aes-aesni",
741 .cra_priority = 401,
742 .cra_flags = CRYPTO_ALG_INTERNAL,
743 .cra_blocksize = AES_BLOCK_SIZE,
744 .cra_ctxsize = XTS_AES_CTX_SIZE,
745 .cra_module = THIS_MODULE,
746 },
747 .min_keysize = 2 * AES_MIN_KEY_SIZE,
748 .max_keysize = 2 * AES_MAX_KEY_SIZE,
749 .ivsize = AES_BLOCK_SIZE,
750 .walksize = 2 * AES_BLOCK_SIZE,
751 .setkey = xts_setkey_aesni,
752 .encrypt = xts_encrypt_aesni,
753 .decrypt = xts_decrypt_aesni,
754 }
755};
756
757static
758struct simd_skcipher_alg *aesni_simd_skciphers[ARRAY_SIZE(aesni_skciphers)];
759
760#ifdef CONFIG_X86_64
761/*
762 * XCTR does not have a non-AVX implementation, so it must be enabled
763 * conditionally.
764 */
765static struct skcipher_alg aesni_xctr = {
766 .base = {
767 .cra_name = "__xctr(aes)",
768 .cra_driver_name = "__xctr-aes-aesni",
769 .cra_priority = 400,
770 .cra_flags = CRYPTO_ALG_INTERNAL,
771 .cra_blocksize = 1,
772 .cra_ctxsize = CRYPTO_AES_CTX_SIZE,
773 .cra_module = THIS_MODULE,
774 },
775 .min_keysize = AES_MIN_KEY_SIZE,
776 .max_keysize = AES_MAX_KEY_SIZE,
777 .ivsize = AES_BLOCK_SIZE,
778 .chunksize = AES_BLOCK_SIZE,
779 .setkey = aesni_skcipher_setkey,
780 .encrypt = xctr_crypt,
781 .decrypt = xctr_crypt,
782};
783
784static struct simd_skcipher_alg *aesni_simd_xctr;
785
786asmlinkage void aes_xts_encrypt_iv(const struct crypto_aes_ctx *tweak_key,
787 u8 iv[AES_BLOCK_SIZE]);
788
789#define DEFINE_XTS_ALG(suffix, driver_name, priority) \
790 \
791asmlinkage void \
792aes_xts_encrypt_##suffix(const struct crypto_aes_ctx *key, const u8 *src, \
793 u8 *dst, unsigned int len, u8 tweak[AES_BLOCK_SIZE]); \
794asmlinkage void \
795aes_xts_decrypt_##suffix(const struct crypto_aes_ctx *key, const u8 *src, \
796 u8 *dst, unsigned int len, u8 tweak[AES_BLOCK_SIZE]); \
797 \
798static int xts_encrypt_##suffix(struct skcipher_request *req) \
799{ \
800 return xts_crypt(req, aes_xts_encrypt_iv, aes_xts_encrypt_##suffix); \
801} \
802 \
803static int xts_decrypt_##suffix(struct skcipher_request *req) \
804{ \
805 return xts_crypt(req, aes_xts_encrypt_iv, aes_xts_decrypt_##suffix); \
806} \
807 \
808static struct skcipher_alg aes_xts_alg_##suffix = { \
809 .base = { \
810 .cra_name = "__xts(aes)", \
811 .cra_driver_name = "__" driver_name, \
812 .cra_priority = priority, \
813 .cra_flags = CRYPTO_ALG_INTERNAL, \
814 .cra_blocksize = AES_BLOCK_SIZE, \
815 .cra_ctxsize = XTS_AES_CTX_SIZE, \
816 .cra_module = THIS_MODULE, \
817 }, \
818 .min_keysize = 2 * AES_MIN_KEY_SIZE, \
819 .max_keysize = 2 * AES_MAX_KEY_SIZE, \
820 .ivsize = AES_BLOCK_SIZE, \
821 .walksize = 2 * AES_BLOCK_SIZE, \
822 .setkey = xts_setkey_aesni, \
823 .encrypt = xts_encrypt_##suffix, \
824 .decrypt = xts_decrypt_##suffix, \
825}; \
826 \
827static struct simd_skcipher_alg *aes_xts_simdalg_##suffix
828
829DEFINE_XTS_ALG(aesni_avx, "xts-aes-aesni-avx", 500);
830#if defined(CONFIG_AS_VAES) && defined(CONFIG_AS_VPCLMULQDQ)
831DEFINE_XTS_ALG(vaes_avx2, "xts-aes-vaes-avx2", 600);
832DEFINE_XTS_ALG(vaes_avx10_256, "xts-aes-vaes-avx10_256", 700);
833DEFINE_XTS_ALG(vaes_avx10_512, "xts-aes-vaes-avx10_512", 800);
834#endif
835
836/* The common part of the x86_64 AES-GCM key struct */
837struct aes_gcm_key {
838 /* Expanded AES key and the AES key length in bytes */
839 struct crypto_aes_ctx aes_key;
840
841 /* RFC4106 nonce (used only by the rfc4106 algorithms) */
842 u32 rfc4106_nonce;
843};
844
845/* Key struct used by the AES-NI implementations of AES-GCM */
846struct aes_gcm_key_aesni {
847 /*
848 * Common part of the key. The assembly code requires 16-byte alignment
849 * for the round keys; we get this by them being located at the start of
850 * the struct and the whole struct being 16-byte aligned.
851 */
852 struct aes_gcm_key base;
853
854 /*
855 * Powers of the hash key H^8 through H^1. These are 128-bit values.
856 * They all have an extra factor of x^-1 and are byte-reversed. 16-byte
857 * alignment is required by the assembly code.
858 */
859 u64 h_powers[8][2] __aligned(16);
860
861 /*
862 * h_powers_xored[i] contains the two 64-bit halves of h_powers[i] XOR'd
863 * together. It's used for Karatsuba multiplication. 16-byte alignment
864 * is required by the assembly code.
865 */
866 u64 h_powers_xored[8] __aligned(16);
867
868 /*
869 * H^1 times x^64 (and also the usual extra factor of x^-1). 16-byte
870 * alignment is required by the assembly code.
871 */
872 u64 h_times_x64[2] __aligned(16);
873};
874#define AES_GCM_KEY_AESNI(key) \
875 container_of((key), struct aes_gcm_key_aesni, base)
876#define AES_GCM_KEY_AESNI_SIZE \
877 (sizeof(struct aes_gcm_key_aesni) + (15 & ~(CRYPTO_MINALIGN - 1)))
878
879/* Key struct used by the VAES + AVX10 implementations of AES-GCM */
880struct aes_gcm_key_avx10 {
881 /*
882 * Common part of the key. The assembly code prefers 16-byte alignment
883 * for the round keys; we get this by them being located at the start of
884 * the struct and the whole struct being 64-byte aligned.
885 */
886 struct aes_gcm_key base;
887
888 /*
889 * Powers of the hash key H^16 through H^1. These are 128-bit values.
890 * They all have an extra factor of x^-1 and are byte-reversed. This
891 * array is aligned to a 64-byte boundary to make it naturally aligned
892 * for 512-bit loads, which can improve performance. (The assembly code
893 * doesn't *need* the alignment; this is just an optimization.)
894 */
895 u64 h_powers[16][2] __aligned(64);
896
897 /* Three padding blocks required by the assembly code */
898 u64 padding[3][2];
899};
900#define AES_GCM_KEY_AVX10(key) \
901 container_of((key), struct aes_gcm_key_avx10, base)
902#define AES_GCM_KEY_AVX10_SIZE \
903 (sizeof(struct aes_gcm_key_avx10) + (63 & ~(CRYPTO_MINALIGN - 1)))
904
905/*
906 * These flags are passed to the AES-GCM helper functions to specify the
907 * specific version of AES-GCM (RFC4106 or not), whether it's encryption or
908 * decryption, and which assembly functions should be called. Assembly
909 * functions are selected using flags instead of function pointers to avoid
910 * indirect calls (which are very expensive on x86) regardless of inlining.
911 */
912#define FLAG_RFC4106 BIT(0)
913#define FLAG_ENC BIT(1)
914#define FLAG_AVX BIT(2)
915#if defined(CONFIG_AS_VAES) && defined(CONFIG_AS_VPCLMULQDQ)
916# define FLAG_AVX10_256 BIT(3)
917# define FLAG_AVX10_512 BIT(4)
918#else
919 /*
920 * This should cause all calls to the AVX10 assembly functions to be
921 * optimized out, avoiding the need to ifdef each call individually.
922 */
923# define FLAG_AVX10_256 0
924# define FLAG_AVX10_512 0
925#endif
926
927static inline struct aes_gcm_key *
928aes_gcm_key_get(struct crypto_aead *tfm, int flags)
929{
930 if (flags & (FLAG_AVX10_256 | FLAG_AVX10_512))
931 return PTR_ALIGN(crypto_aead_ctx(tfm), 64);
932 else
933 return PTR_ALIGN(crypto_aead_ctx(tfm), 16);
934}
935
936asmlinkage void
937aes_gcm_precompute_aesni(struct aes_gcm_key_aesni *key);
938asmlinkage void
939aes_gcm_precompute_aesni_avx(struct aes_gcm_key_aesni *key);
940asmlinkage void
941aes_gcm_precompute_vaes_avx10_256(struct aes_gcm_key_avx10 *key);
942asmlinkage void
943aes_gcm_precompute_vaes_avx10_512(struct aes_gcm_key_avx10 *key);
944
945static void aes_gcm_precompute(struct aes_gcm_key *key, int flags)
946{
947 /*
948 * To make things a bit easier on the assembly side, the AVX10
949 * implementations use the same key format. Therefore, a single
950 * function using 256-bit vectors would suffice here. However, it's
951 * straightforward to provide a 512-bit one because of how the assembly
952 * code is structured, and it works nicely because the total size of the
953 * key powers is a multiple of 512 bits. So we take advantage of that.
954 *
955 * A similar situation applies to the AES-NI implementations.
956 */
957 if (flags & FLAG_AVX10_512)
958 aes_gcm_precompute_vaes_avx10_512(AES_GCM_KEY_AVX10(key));
959 else if (flags & FLAG_AVX10_256)
960 aes_gcm_precompute_vaes_avx10_256(AES_GCM_KEY_AVX10(key));
961 else if (flags & FLAG_AVX)
962 aes_gcm_precompute_aesni_avx(AES_GCM_KEY_AESNI(key));
963 else
964 aes_gcm_precompute_aesni(AES_GCM_KEY_AESNI(key));
965}
966
967asmlinkage void
968aes_gcm_aad_update_aesni(const struct aes_gcm_key_aesni *key,
969 u8 ghash_acc[16], const u8 *aad, int aadlen);
970asmlinkage void
971aes_gcm_aad_update_aesni_avx(const struct aes_gcm_key_aesni *key,
972 u8 ghash_acc[16], const u8 *aad, int aadlen);
973asmlinkage void
974aes_gcm_aad_update_vaes_avx10(const struct aes_gcm_key_avx10 *key,
975 u8 ghash_acc[16], const u8 *aad, int aadlen);
976
977static void aes_gcm_aad_update(const struct aes_gcm_key *key, u8 ghash_acc[16],
978 const u8 *aad, int aadlen, int flags)
979{
980 if (flags & (FLAG_AVX10_256 | FLAG_AVX10_512))
981 aes_gcm_aad_update_vaes_avx10(AES_GCM_KEY_AVX10(key), ghash_acc,
982 aad, aadlen);
983 else if (flags & FLAG_AVX)
984 aes_gcm_aad_update_aesni_avx(AES_GCM_KEY_AESNI(key), ghash_acc,
985 aad, aadlen);
986 else
987 aes_gcm_aad_update_aesni(AES_GCM_KEY_AESNI(key), ghash_acc,
988 aad, aadlen);
989}
990
991asmlinkage void
992aes_gcm_enc_update_aesni(const struct aes_gcm_key_aesni *key,
993 const u32 le_ctr[4], u8 ghash_acc[16],
994 const u8 *src, u8 *dst, int datalen);
995asmlinkage void
996aes_gcm_enc_update_aesni_avx(const struct aes_gcm_key_aesni *key,
997 const u32 le_ctr[4], u8 ghash_acc[16],
998 const u8 *src, u8 *dst, int datalen);
999asmlinkage void
1000aes_gcm_enc_update_vaes_avx10_256(const struct aes_gcm_key_avx10 *key,
1001 const u32 le_ctr[4], u8 ghash_acc[16],
1002 const u8 *src, u8 *dst, int datalen);
1003asmlinkage void
1004aes_gcm_enc_update_vaes_avx10_512(const struct aes_gcm_key_avx10 *key,
1005 const u32 le_ctr[4], u8 ghash_acc[16],
1006 const u8 *src, u8 *dst, int datalen);
1007
1008asmlinkage void
1009aes_gcm_dec_update_aesni(const struct aes_gcm_key_aesni *key,
1010 const u32 le_ctr[4], u8 ghash_acc[16],
1011 const u8 *src, u8 *dst, int datalen);
1012asmlinkage void
1013aes_gcm_dec_update_aesni_avx(const struct aes_gcm_key_aesni *key,
1014 const u32 le_ctr[4], u8 ghash_acc[16],
1015 const u8 *src, u8 *dst, int datalen);
1016asmlinkage void
1017aes_gcm_dec_update_vaes_avx10_256(const struct aes_gcm_key_avx10 *key,
1018 const u32 le_ctr[4], u8 ghash_acc[16],
1019 const u8 *src, u8 *dst, int datalen);
1020asmlinkage void
1021aes_gcm_dec_update_vaes_avx10_512(const struct aes_gcm_key_avx10 *key,
1022 const u32 le_ctr[4], u8 ghash_acc[16],
1023 const u8 *src, u8 *dst, int datalen);
1024
1025/* __always_inline to optimize out the branches based on @flags */
1026static __always_inline void
1027aes_gcm_update(const struct aes_gcm_key *key,
1028 const u32 le_ctr[4], u8 ghash_acc[16],
1029 const u8 *src, u8 *dst, int datalen, int flags)
1030{
1031 if (flags & FLAG_ENC) {
1032 if (flags & FLAG_AVX10_512)
1033 aes_gcm_enc_update_vaes_avx10_512(AES_GCM_KEY_AVX10(key),
1034 le_ctr, ghash_acc,
1035 src, dst, datalen);
1036 else if (flags & FLAG_AVX10_256)
1037 aes_gcm_enc_update_vaes_avx10_256(AES_GCM_KEY_AVX10(key),
1038 le_ctr, ghash_acc,
1039 src, dst, datalen);
1040 else if (flags & FLAG_AVX)
1041 aes_gcm_enc_update_aesni_avx(AES_GCM_KEY_AESNI(key),
1042 le_ctr, ghash_acc,
1043 src, dst, datalen);
1044 else
1045 aes_gcm_enc_update_aesni(AES_GCM_KEY_AESNI(key), le_ctr,
1046 ghash_acc, src, dst, datalen);
1047 } else {
1048 if (flags & FLAG_AVX10_512)
1049 aes_gcm_dec_update_vaes_avx10_512(AES_GCM_KEY_AVX10(key),
1050 le_ctr, ghash_acc,
1051 src, dst, datalen);
1052 else if (flags & FLAG_AVX10_256)
1053 aes_gcm_dec_update_vaes_avx10_256(AES_GCM_KEY_AVX10(key),
1054 le_ctr, ghash_acc,
1055 src, dst, datalen);
1056 else if (flags & FLAG_AVX)
1057 aes_gcm_dec_update_aesni_avx(AES_GCM_KEY_AESNI(key),
1058 le_ctr, ghash_acc,
1059 src, dst, datalen);
1060 else
1061 aes_gcm_dec_update_aesni(AES_GCM_KEY_AESNI(key),
1062 le_ctr, ghash_acc,
1063 src, dst, datalen);
1064 }
1065}
1066
1067asmlinkage void
1068aes_gcm_enc_final_aesni(const struct aes_gcm_key_aesni *key,
1069 const u32 le_ctr[4], u8 ghash_acc[16],
1070 u64 total_aadlen, u64 total_datalen);
1071asmlinkage void
1072aes_gcm_enc_final_aesni_avx(const struct aes_gcm_key_aesni *key,
1073 const u32 le_ctr[4], u8 ghash_acc[16],
1074 u64 total_aadlen, u64 total_datalen);
1075asmlinkage void
1076aes_gcm_enc_final_vaes_avx10(const struct aes_gcm_key_avx10 *key,
1077 const u32 le_ctr[4], u8 ghash_acc[16],
1078 u64 total_aadlen, u64 total_datalen);
1079
1080/* __always_inline to optimize out the branches based on @flags */
1081static __always_inline void
1082aes_gcm_enc_final(const struct aes_gcm_key *key,
1083 const u32 le_ctr[4], u8 ghash_acc[16],
1084 u64 total_aadlen, u64 total_datalen, int flags)
1085{
1086 if (flags & (FLAG_AVX10_256 | FLAG_AVX10_512))
1087 aes_gcm_enc_final_vaes_avx10(AES_GCM_KEY_AVX10(key),
1088 le_ctr, ghash_acc,
1089 total_aadlen, total_datalen);
1090 else if (flags & FLAG_AVX)
1091 aes_gcm_enc_final_aesni_avx(AES_GCM_KEY_AESNI(key),
1092 le_ctr, ghash_acc,
1093 total_aadlen, total_datalen);
1094 else
1095 aes_gcm_enc_final_aesni(AES_GCM_KEY_AESNI(key),
1096 le_ctr, ghash_acc,
1097 total_aadlen, total_datalen);
1098}
1099
1100asmlinkage bool __must_check
1101aes_gcm_dec_final_aesni(const struct aes_gcm_key_aesni *key,
1102 const u32 le_ctr[4], const u8 ghash_acc[16],
1103 u64 total_aadlen, u64 total_datalen,
1104 const u8 tag[16], int taglen);
1105asmlinkage bool __must_check
1106aes_gcm_dec_final_aesni_avx(const struct aes_gcm_key_aesni *key,
1107 const u32 le_ctr[4], const u8 ghash_acc[16],
1108 u64 total_aadlen, u64 total_datalen,
1109 const u8 tag[16], int taglen);
1110asmlinkage bool __must_check
1111aes_gcm_dec_final_vaes_avx10(const struct aes_gcm_key_avx10 *key,
1112 const u32 le_ctr[4], const u8 ghash_acc[16],
1113 u64 total_aadlen, u64 total_datalen,
1114 const u8 tag[16], int taglen);
1115
1116/* __always_inline to optimize out the branches based on @flags */
1117static __always_inline bool __must_check
1118aes_gcm_dec_final(const struct aes_gcm_key *key, const u32 le_ctr[4],
1119 u8 ghash_acc[16], u64 total_aadlen, u64 total_datalen,
1120 u8 tag[16], int taglen, int flags)
1121{
1122 if (flags & (FLAG_AVX10_256 | FLAG_AVX10_512))
1123 return aes_gcm_dec_final_vaes_avx10(AES_GCM_KEY_AVX10(key),
1124 le_ctr, ghash_acc,
1125 total_aadlen, total_datalen,
1126 tag, taglen);
1127 else if (flags & FLAG_AVX)
1128 return aes_gcm_dec_final_aesni_avx(AES_GCM_KEY_AESNI(key),
1129 le_ctr, ghash_acc,
1130 total_aadlen, total_datalen,
1131 tag, taglen);
1132 else
1133 return aes_gcm_dec_final_aesni(AES_GCM_KEY_AESNI(key),
1134 le_ctr, ghash_acc,
1135 total_aadlen, total_datalen,
1136 tag, taglen);
1137}
1138
1139/*
1140 * This is the Integrity Check Value (aka the authentication tag) length and can
1141 * be 8, 12 or 16 bytes long.
1142 */
1143static int common_rfc4106_set_authsize(struct crypto_aead *aead,
1144 unsigned int authsize)
1145{
1146 switch (authsize) {
1147 case 8:
1148 case 12:
1149 case 16:
1150 break;
1151 default:
1152 return -EINVAL;
1153 }
1154
1155 return 0;
1156}
1157
1158static int generic_gcmaes_set_authsize(struct crypto_aead *tfm,
1159 unsigned int authsize)
1160{
1161 switch (authsize) {
1162 case 4:
1163 case 8:
1164 case 12:
1165 case 13:
1166 case 14:
1167 case 15:
1168 case 16:
1169 break;
1170 default:
1171 return -EINVAL;
1172 }
1173
1174 return 0;
1175}
1176
1177/*
1178 * This is the setkey function for the x86_64 implementations of AES-GCM. It
1179 * saves the RFC4106 nonce if applicable, expands the AES key, and precomputes
1180 * powers of the hash key.
1181 *
1182 * To comply with the crypto_aead API, this has to be usable in no-SIMD context.
1183 * For that reason, this function includes a portable C implementation of the
1184 * needed logic. However, the portable C implementation is very slow, taking
1185 * about the same time as encrypting 37 KB of data. To be ready for users that
1186 * may set a key even somewhat frequently, we therefore also include a SIMD
1187 * assembly implementation, expanding the AES key using AES-NI and precomputing
1188 * the hash key powers using PCLMULQDQ or VPCLMULQDQ.
1189 */
1190static int gcm_setkey(struct crypto_aead *tfm, const u8 *raw_key,
1191 unsigned int keylen, int flags)
1192{
1193 struct aes_gcm_key *key = aes_gcm_key_get(tfm, flags);
1194 int err;
1195
1196 if (flags & FLAG_RFC4106) {
1197 if (keylen < 4)
1198 return -EINVAL;
1199 keylen -= 4;
1200 key->rfc4106_nonce = get_unaligned_be32(raw_key + keylen);
1201 }
1202
1203 /* The assembly code assumes the following offsets. */
1204 BUILD_BUG_ON(offsetof(struct aes_gcm_key_aesni, base.aes_key.key_enc) != 0);
1205 BUILD_BUG_ON(offsetof(struct aes_gcm_key_aesni, base.aes_key.key_length) != 480);
1206 BUILD_BUG_ON(offsetof(struct aes_gcm_key_aesni, h_powers) != 496);
1207 BUILD_BUG_ON(offsetof(struct aes_gcm_key_aesni, h_powers_xored) != 624);
1208 BUILD_BUG_ON(offsetof(struct aes_gcm_key_aesni, h_times_x64) != 688);
1209 BUILD_BUG_ON(offsetof(struct aes_gcm_key_avx10, base.aes_key.key_enc) != 0);
1210 BUILD_BUG_ON(offsetof(struct aes_gcm_key_avx10, base.aes_key.key_length) != 480);
1211 BUILD_BUG_ON(offsetof(struct aes_gcm_key_avx10, h_powers) != 512);
1212 BUILD_BUG_ON(offsetof(struct aes_gcm_key_avx10, padding) != 768);
1213
1214 if (likely(crypto_simd_usable())) {
1215 err = aes_check_keylen(keylen);
1216 if (err)
1217 return err;
1218 kernel_fpu_begin();
1219 aesni_set_key(&key->aes_key, raw_key, keylen);
1220 aes_gcm_precompute(key, flags);
1221 kernel_fpu_end();
1222 } else {
1223 static const u8 x_to_the_minus1[16] __aligned(__alignof__(be128)) = {
1224 [0] = 0xc2, [15] = 1
1225 };
1226 static const u8 x_to_the_63[16] __aligned(__alignof__(be128)) = {
1227 [7] = 1,
1228 };
1229 be128 h1 = {};
1230 be128 h;
1231 int i;
1232
1233 err = aes_expandkey(&key->aes_key, raw_key, keylen);
1234 if (err)
1235 return err;
1236
1237 /* Encrypt the all-zeroes block to get the hash key H^1 */
1238 aes_encrypt(&key->aes_key, (u8 *)&h1, (u8 *)&h1);
1239
1240 /* Compute H^1 * x^-1 */
1241 h = h1;
1242 gf128mul_lle(&h, (const be128 *)x_to_the_minus1);
1243
1244 /* Compute the needed key powers */
1245 if (flags & (FLAG_AVX10_256 | FLAG_AVX10_512)) {
1246 struct aes_gcm_key_avx10 *k = AES_GCM_KEY_AVX10(key);
1247
1248 for (i = ARRAY_SIZE(k->h_powers) - 1; i >= 0; i--) {
1249 k->h_powers[i][0] = be64_to_cpu(h.b);
1250 k->h_powers[i][1] = be64_to_cpu(h.a);
1251 gf128mul_lle(&h, &h1);
1252 }
1253 memset(k->padding, 0, sizeof(k->padding));
1254 } else {
1255 struct aes_gcm_key_aesni *k = AES_GCM_KEY_AESNI(key);
1256
1257 for (i = ARRAY_SIZE(k->h_powers) - 1; i >= 0; i--) {
1258 k->h_powers[i][0] = be64_to_cpu(h.b);
1259 k->h_powers[i][1] = be64_to_cpu(h.a);
1260 k->h_powers_xored[i] = k->h_powers[i][0] ^
1261 k->h_powers[i][1];
1262 gf128mul_lle(&h, &h1);
1263 }
1264 gf128mul_lle(&h1, (const be128 *)x_to_the_63);
1265 k->h_times_x64[0] = be64_to_cpu(h1.b);
1266 k->h_times_x64[1] = be64_to_cpu(h1.a);
1267 }
1268 }
1269 return 0;
1270}
1271
1272/*
1273 * Initialize @ghash_acc, then pass all @assoclen bytes of associated data
1274 * (a.k.a. additional authenticated data) from @sg_src through the GHASH update
1275 * assembly function. kernel_fpu_begin() must have already been called.
1276 */
1277static void gcm_process_assoc(const struct aes_gcm_key *key, u8 ghash_acc[16],
1278 struct scatterlist *sg_src, unsigned int assoclen,
1279 int flags)
1280{
1281 struct scatter_walk walk;
1282 /*
1283 * The assembly function requires that the length of any non-last
1284 * segment of associated data be a multiple of 16 bytes, so this
1285 * function does the buffering needed to achieve that.
1286 */
1287 unsigned int pos = 0;
1288 u8 buf[16];
1289
1290 memset(ghash_acc, 0, 16);
1291 scatterwalk_start(&walk, sg_src);
1292
1293 while (assoclen) {
1294 unsigned int len_this_page = scatterwalk_clamp(&walk, assoclen);
1295 void *mapped = scatterwalk_map(&walk);
1296 const void *src = mapped;
1297 unsigned int len;
1298
1299 assoclen -= len_this_page;
1300 scatterwalk_advance(&walk, len_this_page);
1301 if (unlikely(pos)) {
1302 len = min(len_this_page, 16 - pos);
1303 memcpy(&buf[pos], src, len);
1304 pos += len;
1305 src += len;
1306 len_this_page -= len;
1307 if (pos < 16)
1308 goto next;
1309 aes_gcm_aad_update(key, ghash_acc, buf, 16, flags);
1310 pos = 0;
1311 }
1312 len = len_this_page;
1313 if (unlikely(assoclen)) /* Not the last segment yet? */
1314 len = round_down(len, 16);
1315 aes_gcm_aad_update(key, ghash_acc, src, len, flags);
1316 src += len;
1317 len_this_page -= len;
1318 if (unlikely(len_this_page)) {
1319 memcpy(buf, src, len_this_page);
1320 pos = len_this_page;
1321 }
1322next:
1323 scatterwalk_unmap(mapped);
1324 scatterwalk_pagedone(&walk, 0, assoclen);
1325 if (need_resched()) {
1326 kernel_fpu_end();
1327 kernel_fpu_begin();
1328 }
1329 }
1330 if (unlikely(pos))
1331 aes_gcm_aad_update(key, ghash_acc, buf, pos, flags);
1332}
1333
1334
1335/* __always_inline to optimize out the branches based on @flags */
1336static __always_inline int
1337gcm_crypt(struct aead_request *req, int flags)
1338{
1339 struct crypto_aead *tfm = crypto_aead_reqtfm(req);
1340 const struct aes_gcm_key *key = aes_gcm_key_get(tfm, flags);
1341 unsigned int assoclen = req->assoclen;
1342 struct skcipher_walk walk;
1343 unsigned int nbytes;
1344 u8 ghash_acc[16]; /* GHASH accumulator */
1345 u32 le_ctr[4]; /* Counter in little-endian format */
1346 int taglen;
1347 int err;
1348
1349 /* Initialize the counter and determine the associated data length. */
1350 le_ctr[0] = 2;
1351 if (flags & FLAG_RFC4106) {
1352 if (unlikely(assoclen != 16 && assoclen != 20))
1353 return -EINVAL;
1354 assoclen -= 8;
1355 le_ctr[1] = get_unaligned_be32(req->iv + 4);
1356 le_ctr[2] = get_unaligned_be32(req->iv + 0);
1357 le_ctr[3] = key->rfc4106_nonce; /* already byte-swapped */
1358 } else {
1359 le_ctr[1] = get_unaligned_be32(req->iv + 8);
1360 le_ctr[2] = get_unaligned_be32(req->iv + 4);
1361 le_ctr[3] = get_unaligned_be32(req->iv + 0);
1362 }
1363
1364 /* Begin walking through the plaintext or ciphertext. */
1365 if (flags & FLAG_ENC)
1366 err = skcipher_walk_aead_encrypt(&walk, req, false);
1367 else
1368 err = skcipher_walk_aead_decrypt(&walk, req, false);
1369 if (err)
1370 return err;
1371
1372 /*
1373 * Since the AES-GCM assembly code requires that at least three assembly
1374 * functions be called to process any message (this is needed to support
1375 * incremental updates cleanly), to reduce overhead we try to do all
1376 * three calls in the same kernel FPU section if possible. We close the
1377 * section and start a new one if there are multiple data segments or if
1378 * rescheduling is needed while processing the associated data.
1379 */
1380 kernel_fpu_begin();
1381
1382 /* Pass the associated data through GHASH. */
1383 gcm_process_assoc(key, ghash_acc, req->src, assoclen, flags);
1384
1385 /* En/decrypt the data and pass the ciphertext through GHASH. */
1386 while (unlikely((nbytes = walk.nbytes) < walk.total)) {
1387 /*
1388 * Non-last segment. In this case, the assembly function
1389 * requires that the length be a multiple of 16 (AES_BLOCK_SIZE)
1390 * bytes. The needed buffering of up to 16 bytes is handled by
1391 * the skcipher_walk. Here we just need to round down to a
1392 * multiple of 16.
1393 */
1394 nbytes = round_down(nbytes, AES_BLOCK_SIZE);
1395 aes_gcm_update(key, le_ctr, ghash_acc, walk.src.virt.addr,
1396 walk.dst.virt.addr, nbytes, flags);
1397 le_ctr[0] += nbytes / AES_BLOCK_SIZE;
1398 kernel_fpu_end();
1399 err = skcipher_walk_done(&walk, walk.nbytes - nbytes);
1400 if (err)
1401 return err;
1402 kernel_fpu_begin();
1403 }
1404 /* Last segment: process all remaining data. */
1405 aes_gcm_update(key, le_ctr, ghash_acc, walk.src.virt.addr,
1406 walk.dst.virt.addr, nbytes, flags);
1407 /*
1408 * The low word of the counter isn't used by the finalize, so there's no
1409 * need to increment it here.
1410 */
1411
1412 /* Finalize */
1413 taglen = crypto_aead_authsize(tfm);
1414 if (flags & FLAG_ENC) {
1415 /* Finish computing the auth tag. */
1416 aes_gcm_enc_final(key, le_ctr, ghash_acc, assoclen,
1417 req->cryptlen, flags);
1418
1419 /* Store the computed auth tag in the dst scatterlist. */
1420 scatterwalk_map_and_copy(ghash_acc, req->dst, req->assoclen +
1421 req->cryptlen, taglen, 1);
1422 } else {
1423 unsigned int datalen = req->cryptlen - taglen;
1424 u8 tag[16];
1425
1426 /* Get the transmitted auth tag from the src scatterlist. */
1427 scatterwalk_map_and_copy(tag, req->src, req->assoclen + datalen,
1428 taglen, 0);
1429 /*
1430 * Finish computing the auth tag and compare it to the
1431 * transmitted one. The assembly function does the actual tag
1432 * comparison. Here, just check the boolean result.
1433 */
1434 if (!aes_gcm_dec_final(key, le_ctr, ghash_acc, assoclen,
1435 datalen, tag, taglen, flags))
1436 err = -EBADMSG;
1437 }
1438 kernel_fpu_end();
1439 if (nbytes)
1440 skcipher_walk_done(&walk, 0);
1441 return err;
1442}
1443
1444#define DEFINE_GCM_ALGS(suffix, flags, generic_driver_name, rfc_driver_name, \
1445 ctxsize, priority) \
1446 \
1447static int gcm_setkey_##suffix(struct crypto_aead *tfm, const u8 *raw_key, \
1448 unsigned int keylen) \
1449{ \
1450 return gcm_setkey(tfm, raw_key, keylen, (flags)); \
1451} \
1452 \
1453static int gcm_encrypt_##suffix(struct aead_request *req) \
1454{ \
1455 return gcm_crypt(req, (flags) | FLAG_ENC); \
1456} \
1457 \
1458static int gcm_decrypt_##suffix(struct aead_request *req) \
1459{ \
1460 return gcm_crypt(req, (flags)); \
1461} \
1462 \
1463static int rfc4106_setkey_##suffix(struct crypto_aead *tfm, const u8 *raw_key, \
1464 unsigned int keylen) \
1465{ \
1466 return gcm_setkey(tfm, raw_key, keylen, (flags) | FLAG_RFC4106); \
1467} \
1468 \
1469static int rfc4106_encrypt_##suffix(struct aead_request *req) \
1470{ \
1471 return gcm_crypt(req, (flags) | FLAG_RFC4106 | FLAG_ENC); \
1472} \
1473 \
1474static int rfc4106_decrypt_##suffix(struct aead_request *req) \
1475{ \
1476 return gcm_crypt(req, (flags) | FLAG_RFC4106); \
1477} \
1478 \
1479static struct aead_alg aes_gcm_algs_##suffix[] = { { \
1480 .setkey = gcm_setkey_##suffix, \
1481 .setauthsize = generic_gcmaes_set_authsize, \
1482 .encrypt = gcm_encrypt_##suffix, \
1483 .decrypt = gcm_decrypt_##suffix, \
1484 .ivsize = GCM_AES_IV_SIZE, \
1485 .chunksize = AES_BLOCK_SIZE, \
1486 .maxauthsize = 16, \
1487 .base = { \
1488 .cra_name = "__gcm(aes)", \
1489 .cra_driver_name = "__" generic_driver_name, \
1490 .cra_priority = (priority), \
1491 .cra_flags = CRYPTO_ALG_INTERNAL, \
1492 .cra_blocksize = 1, \
1493 .cra_ctxsize = (ctxsize), \
1494 .cra_module = THIS_MODULE, \
1495 }, \
1496}, { \
1497 .setkey = rfc4106_setkey_##suffix, \
1498 .setauthsize = common_rfc4106_set_authsize, \
1499 .encrypt = rfc4106_encrypt_##suffix, \
1500 .decrypt = rfc4106_decrypt_##suffix, \
1501 .ivsize = GCM_RFC4106_IV_SIZE, \
1502 .chunksize = AES_BLOCK_SIZE, \
1503 .maxauthsize = 16, \
1504 .base = { \
1505 .cra_name = "__rfc4106(gcm(aes))", \
1506 .cra_driver_name = "__" rfc_driver_name, \
1507 .cra_priority = (priority), \
1508 .cra_flags = CRYPTO_ALG_INTERNAL, \
1509 .cra_blocksize = 1, \
1510 .cra_ctxsize = (ctxsize), \
1511 .cra_module = THIS_MODULE, \
1512 }, \
1513} }; \
1514 \
1515static struct simd_aead_alg *aes_gcm_simdalgs_##suffix[2] \
1516
1517/* aes_gcm_algs_aesni */
1518DEFINE_GCM_ALGS(aesni, /* no flags */ 0,
1519 "generic-gcm-aesni", "rfc4106-gcm-aesni",
1520 AES_GCM_KEY_AESNI_SIZE, 400);
1521
1522/* aes_gcm_algs_aesni_avx */
1523DEFINE_GCM_ALGS(aesni_avx, FLAG_AVX,
1524 "generic-gcm-aesni-avx", "rfc4106-gcm-aesni-avx",
1525 AES_GCM_KEY_AESNI_SIZE, 500);
1526
1527#if defined(CONFIG_AS_VAES) && defined(CONFIG_AS_VPCLMULQDQ)
1528/* aes_gcm_algs_vaes_avx10_256 */
1529DEFINE_GCM_ALGS(vaes_avx10_256, FLAG_AVX10_256,
1530 "generic-gcm-vaes-avx10_256", "rfc4106-gcm-vaes-avx10_256",
1531 AES_GCM_KEY_AVX10_SIZE, 700);
1532
1533/* aes_gcm_algs_vaes_avx10_512 */
1534DEFINE_GCM_ALGS(vaes_avx10_512, FLAG_AVX10_512,
1535 "generic-gcm-vaes-avx10_512", "rfc4106-gcm-vaes-avx10_512",
1536 AES_GCM_KEY_AVX10_SIZE, 800);
1537#endif /* CONFIG_AS_VAES && CONFIG_AS_VPCLMULQDQ */
1538
1539/*
1540 * This is a list of CPU models that are known to suffer from downclocking when
1541 * zmm registers (512-bit vectors) are used. On these CPUs, the AES mode
1542 * implementations with zmm registers won't be used by default. Implementations
1543 * with ymm registers (256-bit vectors) will be used by default instead.
1544 */
1545static const struct x86_cpu_id zmm_exclusion_list[] = {
1546 X86_MATCH_VFM(INTEL_SKYLAKE_X, 0),
1547 X86_MATCH_VFM(INTEL_ICELAKE_X, 0),
1548 X86_MATCH_VFM(INTEL_ICELAKE_D, 0),
1549 X86_MATCH_VFM(INTEL_ICELAKE, 0),
1550 X86_MATCH_VFM(INTEL_ICELAKE_L, 0),
1551 X86_MATCH_VFM(INTEL_ICELAKE_NNPI, 0),
1552 X86_MATCH_VFM(INTEL_TIGERLAKE_L, 0),
1553 X86_MATCH_VFM(INTEL_TIGERLAKE, 0),
1554 /* Allow Rocket Lake and later, and Sapphire Rapids and later. */
1555 /* Also allow AMD CPUs (starting with Zen 4, the first with AVX-512). */
1556 {},
1557};
1558
1559static int __init register_avx_algs(void)
1560{
1561 int err;
1562
1563 if (!boot_cpu_has(X86_FEATURE_AVX))
1564 return 0;
1565 err = simd_register_skciphers_compat(&aes_xts_alg_aesni_avx, 1,
1566 &aes_xts_simdalg_aesni_avx);
1567 if (err)
1568 return err;
1569 err = simd_register_aeads_compat(aes_gcm_algs_aesni_avx,
1570 ARRAY_SIZE(aes_gcm_algs_aesni_avx),
1571 aes_gcm_simdalgs_aesni_avx);
1572 if (err)
1573 return err;
1574#if defined(CONFIG_AS_VAES) && defined(CONFIG_AS_VPCLMULQDQ)
1575 if (!boot_cpu_has(X86_FEATURE_AVX2) ||
1576 !boot_cpu_has(X86_FEATURE_VAES) ||
1577 !boot_cpu_has(X86_FEATURE_VPCLMULQDQ) ||
1578 !boot_cpu_has(X86_FEATURE_PCLMULQDQ) ||
1579 !cpu_has_xfeatures(XFEATURE_MASK_SSE | XFEATURE_MASK_YMM, NULL))
1580 return 0;
1581 err = simd_register_skciphers_compat(&aes_xts_alg_vaes_avx2, 1,
1582 &aes_xts_simdalg_vaes_avx2);
1583 if (err)
1584 return err;
1585
1586 if (!boot_cpu_has(X86_FEATURE_AVX512BW) ||
1587 !boot_cpu_has(X86_FEATURE_AVX512VL) ||
1588 !boot_cpu_has(X86_FEATURE_BMI2) ||
1589 !cpu_has_xfeatures(XFEATURE_MASK_SSE | XFEATURE_MASK_YMM |
1590 XFEATURE_MASK_AVX512, NULL))
1591 return 0;
1592
1593 err = simd_register_skciphers_compat(&aes_xts_alg_vaes_avx10_256, 1,
1594 &aes_xts_simdalg_vaes_avx10_256);
1595 if (err)
1596 return err;
1597 err = simd_register_aeads_compat(aes_gcm_algs_vaes_avx10_256,
1598 ARRAY_SIZE(aes_gcm_algs_vaes_avx10_256),
1599 aes_gcm_simdalgs_vaes_avx10_256);
1600 if (err)
1601 return err;
1602
1603 if (x86_match_cpu(zmm_exclusion_list)) {
1604 int i;
1605
1606 aes_xts_alg_vaes_avx10_512.base.cra_priority = 1;
1607 for (i = 0; i < ARRAY_SIZE(aes_gcm_algs_vaes_avx10_512); i++)
1608 aes_gcm_algs_vaes_avx10_512[i].base.cra_priority = 1;
1609 }
1610
1611 err = simd_register_skciphers_compat(&aes_xts_alg_vaes_avx10_512, 1,
1612 &aes_xts_simdalg_vaes_avx10_512);
1613 if (err)
1614 return err;
1615 err = simd_register_aeads_compat(aes_gcm_algs_vaes_avx10_512,
1616 ARRAY_SIZE(aes_gcm_algs_vaes_avx10_512),
1617 aes_gcm_simdalgs_vaes_avx10_512);
1618 if (err)
1619 return err;
1620#endif /* CONFIG_AS_VAES && CONFIG_AS_VPCLMULQDQ */
1621 return 0;
1622}
1623
1624static void unregister_avx_algs(void)
1625{
1626 if (aes_xts_simdalg_aesni_avx)
1627 simd_unregister_skciphers(&aes_xts_alg_aesni_avx, 1,
1628 &aes_xts_simdalg_aesni_avx);
1629 if (aes_gcm_simdalgs_aesni_avx[0])
1630 simd_unregister_aeads(aes_gcm_algs_aesni_avx,
1631 ARRAY_SIZE(aes_gcm_algs_aesni_avx),
1632 aes_gcm_simdalgs_aesni_avx);
1633#if defined(CONFIG_AS_VAES) && defined(CONFIG_AS_VPCLMULQDQ)
1634 if (aes_xts_simdalg_vaes_avx2)
1635 simd_unregister_skciphers(&aes_xts_alg_vaes_avx2, 1,
1636 &aes_xts_simdalg_vaes_avx2);
1637 if (aes_xts_simdalg_vaes_avx10_256)
1638 simd_unregister_skciphers(&aes_xts_alg_vaes_avx10_256, 1,
1639 &aes_xts_simdalg_vaes_avx10_256);
1640 if (aes_gcm_simdalgs_vaes_avx10_256[0])
1641 simd_unregister_aeads(aes_gcm_algs_vaes_avx10_256,
1642 ARRAY_SIZE(aes_gcm_algs_vaes_avx10_256),
1643 aes_gcm_simdalgs_vaes_avx10_256);
1644 if (aes_xts_simdalg_vaes_avx10_512)
1645 simd_unregister_skciphers(&aes_xts_alg_vaes_avx10_512, 1,
1646 &aes_xts_simdalg_vaes_avx10_512);
1647 if (aes_gcm_simdalgs_vaes_avx10_512[0])
1648 simd_unregister_aeads(aes_gcm_algs_vaes_avx10_512,
1649 ARRAY_SIZE(aes_gcm_algs_vaes_avx10_512),
1650 aes_gcm_simdalgs_vaes_avx10_512);
1651#endif
1652}
1653#else /* CONFIG_X86_64 */
1654static struct aead_alg aes_gcm_algs_aesni[0];
1655static struct simd_aead_alg *aes_gcm_simdalgs_aesni[0];
1656
1657static int __init register_avx_algs(void)
1658{
1659 return 0;
1660}
1661
1662static void unregister_avx_algs(void)
1663{
1664}
1665#endif /* !CONFIG_X86_64 */
1666
1667static const struct x86_cpu_id aesni_cpu_id[] = {
1668 X86_MATCH_FEATURE(X86_FEATURE_AES, NULL),
1669 {}
1670};
1671MODULE_DEVICE_TABLE(x86cpu, aesni_cpu_id);
1672
1673static int __init aesni_init(void)
1674{
1675 int err;
1676
1677 if (!x86_match_cpu(aesni_cpu_id))
1678 return -ENODEV;
1679#ifdef CONFIG_X86_64
1680 if (boot_cpu_has(X86_FEATURE_AVX)) {
1681 /* optimize performance of ctr mode encryption transform */
1682 static_call_update(aesni_ctr_enc_tfm, aesni_ctr_enc_avx_tfm);
1683 pr_info("AES CTR mode by8 optimization enabled\n");
1684 }
1685#endif /* CONFIG_X86_64 */
1686
1687 err = crypto_register_alg(&aesni_cipher_alg);
1688 if (err)
1689 return err;
1690
1691 err = simd_register_skciphers_compat(aesni_skciphers,
1692 ARRAY_SIZE(aesni_skciphers),
1693 aesni_simd_skciphers);
1694 if (err)
1695 goto unregister_cipher;
1696
1697 err = simd_register_aeads_compat(aes_gcm_algs_aesni,
1698 ARRAY_SIZE(aes_gcm_algs_aesni),
1699 aes_gcm_simdalgs_aesni);
1700 if (err)
1701 goto unregister_skciphers;
1702
1703#ifdef CONFIG_X86_64
1704 if (boot_cpu_has(X86_FEATURE_AVX))
1705 err = simd_register_skciphers_compat(&aesni_xctr, 1,
1706 &aesni_simd_xctr);
1707 if (err)
1708 goto unregister_aeads;
1709#endif /* CONFIG_X86_64 */
1710
1711 err = register_avx_algs();
1712 if (err)
1713 goto unregister_avx;
1714
1715 return 0;
1716
1717unregister_avx:
1718 unregister_avx_algs();
1719#ifdef CONFIG_X86_64
1720 if (aesni_simd_xctr)
1721 simd_unregister_skciphers(&aesni_xctr, 1, &aesni_simd_xctr);
1722unregister_aeads:
1723#endif /* CONFIG_X86_64 */
1724 simd_unregister_aeads(aes_gcm_algs_aesni,
1725 ARRAY_SIZE(aes_gcm_algs_aesni),
1726 aes_gcm_simdalgs_aesni);
1727unregister_skciphers:
1728 simd_unregister_skciphers(aesni_skciphers, ARRAY_SIZE(aesni_skciphers),
1729 aesni_simd_skciphers);
1730unregister_cipher:
1731 crypto_unregister_alg(&aesni_cipher_alg);
1732 return err;
1733}
1734
1735static void __exit aesni_exit(void)
1736{
1737 simd_unregister_aeads(aes_gcm_algs_aesni,
1738 ARRAY_SIZE(aes_gcm_algs_aesni),
1739 aes_gcm_simdalgs_aesni);
1740 simd_unregister_skciphers(aesni_skciphers, ARRAY_SIZE(aesni_skciphers),
1741 aesni_simd_skciphers);
1742 crypto_unregister_alg(&aesni_cipher_alg);
1743#ifdef CONFIG_X86_64
1744 if (boot_cpu_has(X86_FEATURE_AVX))
1745 simd_unregister_skciphers(&aesni_xctr, 1, &aesni_simd_xctr);
1746#endif /* CONFIG_X86_64 */
1747 unregister_avx_algs();
1748}
1749
1750module_init(aesni_init);
1751module_exit(aesni_exit);
1752
1753MODULE_DESCRIPTION("AES cipher and modes, optimized with AES-NI or VAES instructions");
1754MODULE_LICENSE("GPL");
1755MODULE_ALIAS_CRYPTO("aes");
1/*
2 * Support for Intel AES-NI instructions. This file contains glue
3 * code, the real AES implementation is in intel-aes_asm.S.
4 *
5 * Copyright (C) 2008, Intel Corp.
6 * Author: Huang Ying <ying.huang@intel.com>
7 *
8 * Added RFC4106 AES-GCM support for 128-bit keys under the AEAD
9 * interface for 64-bit kernels.
10 * Authors: Adrian Hoban <adrian.hoban@intel.com>
11 * Gabriele Paoloni <gabriele.paoloni@intel.com>
12 * Tadeusz Struk (tadeusz.struk@intel.com)
13 * Aidan O'Mahony (aidan.o.mahony@intel.com)
14 * Copyright (c) 2010, Intel Corporation.
15 *
16 * This program is free software; you can redistribute it and/or modify
17 * it under the terms of the GNU General Public License as published by
18 * the Free Software Foundation; either version 2 of the License, or
19 * (at your option) any later version.
20 */
21
22#include <linux/hardirq.h>
23#include <linux/types.h>
24#include <linux/crypto.h>
25#include <linux/module.h>
26#include <linux/err.h>
27#include <crypto/algapi.h>
28#include <crypto/aes.h>
29#include <crypto/cryptd.h>
30#include <crypto/ctr.h>
31#include <crypto/b128ops.h>
32#include <crypto/lrw.h>
33#include <crypto/xts.h>
34#include <asm/cpu_device_id.h>
35#include <asm/i387.h>
36#include <asm/crypto/aes.h>
37#include <crypto/ablk_helper.h>
38#include <crypto/scatterwalk.h>
39#include <crypto/internal/aead.h>
40#include <linux/workqueue.h>
41#include <linux/spinlock.h>
42#ifdef CONFIG_X86_64
43#include <asm/crypto/glue_helper.h>
44#endif
45
46#if defined(CONFIG_CRYPTO_PCBC) || defined(CONFIG_CRYPTO_PCBC_MODULE)
47#define HAS_PCBC
48#endif
49
50/* This data is stored at the end of the crypto_tfm struct.
51 * It's a type of per "session" data storage location.
52 * This needs to be 16 byte aligned.
53 */
54struct aesni_rfc4106_gcm_ctx {
55 u8 hash_subkey[16];
56 struct crypto_aes_ctx aes_key_expanded;
57 u8 nonce[4];
58 struct cryptd_aead *cryptd_tfm;
59};
60
61struct aesni_gcm_set_hash_subkey_result {
62 int err;
63 struct completion completion;
64};
65
66struct aesni_hash_subkey_req_data {
67 u8 iv[16];
68 struct aesni_gcm_set_hash_subkey_result result;
69 struct scatterlist sg;
70};
71
72#define AESNI_ALIGN (16)
73#define AES_BLOCK_MASK (~(AES_BLOCK_SIZE-1))
74#define RFC4106_HASH_SUBKEY_SIZE 16
75
76struct aesni_lrw_ctx {
77 struct lrw_table_ctx lrw_table;
78 u8 raw_aes_ctx[sizeof(struct crypto_aes_ctx) + AESNI_ALIGN - 1];
79};
80
81struct aesni_xts_ctx {
82 u8 raw_tweak_ctx[sizeof(struct crypto_aes_ctx) + AESNI_ALIGN - 1];
83 u8 raw_crypt_ctx[sizeof(struct crypto_aes_ctx) + AESNI_ALIGN - 1];
84};
85
86asmlinkage int aesni_set_key(struct crypto_aes_ctx *ctx, const u8 *in_key,
87 unsigned int key_len);
88asmlinkage void aesni_enc(struct crypto_aes_ctx *ctx, u8 *out,
89 const u8 *in);
90asmlinkage void aesni_dec(struct crypto_aes_ctx *ctx, u8 *out,
91 const u8 *in);
92asmlinkage void aesni_ecb_enc(struct crypto_aes_ctx *ctx, u8 *out,
93 const u8 *in, unsigned int len);
94asmlinkage void aesni_ecb_dec(struct crypto_aes_ctx *ctx, u8 *out,
95 const u8 *in, unsigned int len);
96asmlinkage void aesni_cbc_enc(struct crypto_aes_ctx *ctx, u8 *out,
97 const u8 *in, unsigned int len, u8 *iv);
98asmlinkage void aesni_cbc_dec(struct crypto_aes_ctx *ctx, u8 *out,
99 const u8 *in, unsigned int len, u8 *iv);
100
101int crypto_fpu_init(void);
102void crypto_fpu_exit(void);
103
104#define AVX_GEN2_OPTSIZE 640
105#define AVX_GEN4_OPTSIZE 4096
106
107#ifdef CONFIG_X86_64
108asmlinkage void aesni_ctr_enc(struct crypto_aes_ctx *ctx, u8 *out,
109 const u8 *in, unsigned int len, u8 *iv);
110
111asmlinkage void aesni_xts_crypt8(struct crypto_aes_ctx *ctx, u8 *out,
112 const u8 *in, bool enc, u8 *iv);
113
114/* asmlinkage void aesni_gcm_enc()
115 * void *ctx, AES Key schedule. Starts on a 16 byte boundary.
116 * u8 *out, Ciphertext output. Encrypt in-place is allowed.
117 * const u8 *in, Plaintext input
118 * unsigned long plaintext_len, Length of data in bytes for encryption.
119 * u8 *iv, Pre-counter block j0: 4 byte salt (from Security Association)
120 * concatenated with 8 byte Initialisation Vector (from IPSec ESP
121 * Payload) concatenated with 0x00000001. 16-byte aligned pointer.
122 * u8 *hash_subkey, the Hash sub key input. Data starts on a 16-byte boundary.
123 * const u8 *aad, Additional Authentication Data (AAD)
124 * unsigned long aad_len, Length of AAD in bytes. With RFC4106 this
125 * is going to be 8 or 12 bytes
126 * u8 *auth_tag, Authenticated Tag output.
127 * unsigned long auth_tag_len), Authenticated Tag Length in bytes.
128 * Valid values are 16 (most likely), 12 or 8.
129 */
130asmlinkage void aesni_gcm_enc(void *ctx, u8 *out,
131 const u8 *in, unsigned long plaintext_len, u8 *iv,
132 u8 *hash_subkey, const u8 *aad, unsigned long aad_len,
133 u8 *auth_tag, unsigned long auth_tag_len);
134
135/* asmlinkage void aesni_gcm_dec()
136 * void *ctx, AES Key schedule. Starts on a 16 byte boundary.
137 * u8 *out, Plaintext output. Decrypt in-place is allowed.
138 * const u8 *in, Ciphertext input
139 * unsigned long ciphertext_len, Length of data in bytes for decryption.
140 * u8 *iv, Pre-counter block j0: 4 byte salt (from Security Association)
141 * concatenated with 8 byte Initialisation Vector (from IPSec ESP
142 * Payload) concatenated with 0x00000001. 16-byte aligned pointer.
143 * u8 *hash_subkey, the Hash sub key input. Data starts on a 16-byte boundary.
144 * const u8 *aad, Additional Authentication Data (AAD)
145 * unsigned long aad_len, Length of AAD in bytes. With RFC4106 this is going
146 * to be 8 or 12 bytes
147 * u8 *auth_tag, Authenticated Tag output.
148 * unsigned long auth_tag_len) Authenticated Tag Length in bytes.
149 * Valid values are 16 (most likely), 12 or 8.
150 */
151asmlinkage void aesni_gcm_dec(void *ctx, u8 *out,
152 const u8 *in, unsigned long ciphertext_len, u8 *iv,
153 u8 *hash_subkey, const u8 *aad, unsigned long aad_len,
154 u8 *auth_tag, unsigned long auth_tag_len);
155
156
157#ifdef CONFIG_AS_AVX
158/*
159 * asmlinkage void aesni_gcm_precomp_avx_gen2()
160 * gcm_data *my_ctx_data, context data
161 * u8 *hash_subkey, the Hash sub key input. Data starts on a 16-byte boundary.
162 */
163asmlinkage void aesni_gcm_precomp_avx_gen2(void *my_ctx_data, u8 *hash_subkey);
164
165asmlinkage void aesni_gcm_enc_avx_gen2(void *ctx, u8 *out,
166 const u8 *in, unsigned long plaintext_len, u8 *iv,
167 const u8 *aad, unsigned long aad_len,
168 u8 *auth_tag, unsigned long auth_tag_len);
169
170asmlinkage void aesni_gcm_dec_avx_gen2(void *ctx, u8 *out,
171 const u8 *in, unsigned long ciphertext_len, u8 *iv,
172 const u8 *aad, unsigned long aad_len,
173 u8 *auth_tag, unsigned long auth_tag_len);
174
175static void aesni_gcm_enc_avx(void *ctx, u8 *out,
176 const u8 *in, unsigned long plaintext_len, u8 *iv,
177 u8 *hash_subkey, const u8 *aad, unsigned long aad_len,
178 u8 *auth_tag, unsigned long auth_tag_len)
179{
180 if (plaintext_len < AVX_GEN2_OPTSIZE) {
181 aesni_gcm_enc(ctx, out, in, plaintext_len, iv, hash_subkey, aad,
182 aad_len, auth_tag, auth_tag_len);
183 } else {
184 aesni_gcm_precomp_avx_gen2(ctx, hash_subkey);
185 aesni_gcm_enc_avx_gen2(ctx, out, in, plaintext_len, iv, aad,
186 aad_len, auth_tag, auth_tag_len);
187 }
188}
189
190static void aesni_gcm_dec_avx(void *ctx, u8 *out,
191 const u8 *in, unsigned long ciphertext_len, u8 *iv,
192 u8 *hash_subkey, const u8 *aad, unsigned long aad_len,
193 u8 *auth_tag, unsigned long auth_tag_len)
194{
195 if (ciphertext_len < AVX_GEN2_OPTSIZE) {
196 aesni_gcm_dec(ctx, out, in, ciphertext_len, iv, hash_subkey, aad,
197 aad_len, auth_tag, auth_tag_len);
198 } else {
199 aesni_gcm_precomp_avx_gen2(ctx, hash_subkey);
200 aesni_gcm_dec_avx_gen2(ctx, out, in, ciphertext_len, iv, aad,
201 aad_len, auth_tag, auth_tag_len);
202 }
203}
204#endif
205
206#ifdef CONFIG_AS_AVX2
207/*
208 * asmlinkage void aesni_gcm_precomp_avx_gen4()
209 * gcm_data *my_ctx_data, context data
210 * u8 *hash_subkey, the Hash sub key input. Data starts on a 16-byte boundary.
211 */
212asmlinkage void aesni_gcm_precomp_avx_gen4(void *my_ctx_data, u8 *hash_subkey);
213
214asmlinkage void aesni_gcm_enc_avx_gen4(void *ctx, u8 *out,
215 const u8 *in, unsigned long plaintext_len, u8 *iv,
216 const u8 *aad, unsigned long aad_len,
217 u8 *auth_tag, unsigned long auth_tag_len);
218
219asmlinkage void aesni_gcm_dec_avx_gen4(void *ctx, u8 *out,
220 const u8 *in, unsigned long ciphertext_len, u8 *iv,
221 const u8 *aad, unsigned long aad_len,
222 u8 *auth_tag, unsigned long auth_tag_len);
223
224static void aesni_gcm_enc_avx2(void *ctx, u8 *out,
225 const u8 *in, unsigned long plaintext_len, u8 *iv,
226 u8 *hash_subkey, const u8 *aad, unsigned long aad_len,
227 u8 *auth_tag, unsigned long auth_tag_len)
228{
229 if (plaintext_len < AVX_GEN2_OPTSIZE) {
230 aesni_gcm_enc(ctx, out, in, plaintext_len, iv, hash_subkey, aad,
231 aad_len, auth_tag, auth_tag_len);
232 } else if (plaintext_len < AVX_GEN4_OPTSIZE) {
233 aesni_gcm_precomp_avx_gen2(ctx, hash_subkey);
234 aesni_gcm_enc_avx_gen2(ctx, out, in, plaintext_len, iv, aad,
235 aad_len, auth_tag, auth_tag_len);
236 } else {
237 aesni_gcm_precomp_avx_gen4(ctx, hash_subkey);
238 aesni_gcm_enc_avx_gen4(ctx, out, in, plaintext_len, iv, aad,
239 aad_len, auth_tag, auth_tag_len);
240 }
241}
242
243static void aesni_gcm_dec_avx2(void *ctx, u8 *out,
244 const u8 *in, unsigned long ciphertext_len, u8 *iv,
245 u8 *hash_subkey, const u8 *aad, unsigned long aad_len,
246 u8 *auth_tag, unsigned long auth_tag_len)
247{
248 if (ciphertext_len < AVX_GEN2_OPTSIZE) {
249 aesni_gcm_dec(ctx, out, in, ciphertext_len, iv, hash_subkey,
250 aad, aad_len, auth_tag, auth_tag_len);
251 } else if (ciphertext_len < AVX_GEN4_OPTSIZE) {
252 aesni_gcm_precomp_avx_gen2(ctx, hash_subkey);
253 aesni_gcm_dec_avx_gen2(ctx, out, in, ciphertext_len, iv, aad,
254 aad_len, auth_tag, auth_tag_len);
255 } else {
256 aesni_gcm_precomp_avx_gen4(ctx, hash_subkey);
257 aesni_gcm_dec_avx_gen4(ctx, out, in, ciphertext_len, iv, aad,
258 aad_len, auth_tag, auth_tag_len);
259 }
260}
261#endif
262
263static void (*aesni_gcm_enc_tfm)(void *ctx, u8 *out,
264 const u8 *in, unsigned long plaintext_len, u8 *iv,
265 u8 *hash_subkey, const u8 *aad, unsigned long aad_len,
266 u8 *auth_tag, unsigned long auth_tag_len);
267
268static void (*aesni_gcm_dec_tfm)(void *ctx, u8 *out,
269 const u8 *in, unsigned long ciphertext_len, u8 *iv,
270 u8 *hash_subkey, const u8 *aad, unsigned long aad_len,
271 u8 *auth_tag, unsigned long auth_tag_len);
272
273static inline struct
274aesni_rfc4106_gcm_ctx *aesni_rfc4106_gcm_ctx_get(struct crypto_aead *tfm)
275{
276 return
277 (struct aesni_rfc4106_gcm_ctx *)
278 PTR_ALIGN((u8 *)
279 crypto_tfm_ctx(crypto_aead_tfm(tfm)), AESNI_ALIGN);
280}
281#endif
282
283static inline struct crypto_aes_ctx *aes_ctx(void *raw_ctx)
284{
285 unsigned long addr = (unsigned long)raw_ctx;
286 unsigned long align = AESNI_ALIGN;
287
288 if (align <= crypto_tfm_ctx_alignment())
289 align = 1;
290 return (struct crypto_aes_ctx *)ALIGN(addr, align);
291}
292
293static int aes_set_key_common(struct crypto_tfm *tfm, void *raw_ctx,
294 const u8 *in_key, unsigned int key_len)
295{
296 struct crypto_aes_ctx *ctx = aes_ctx(raw_ctx);
297 u32 *flags = &tfm->crt_flags;
298 int err;
299
300 if (key_len != AES_KEYSIZE_128 && key_len != AES_KEYSIZE_192 &&
301 key_len != AES_KEYSIZE_256) {
302 *flags |= CRYPTO_TFM_RES_BAD_KEY_LEN;
303 return -EINVAL;
304 }
305
306 if (!irq_fpu_usable())
307 err = crypto_aes_expand_key(ctx, in_key, key_len);
308 else {
309 kernel_fpu_begin();
310 err = aesni_set_key(ctx, in_key, key_len);
311 kernel_fpu_end();
312 }
313
314 return err;
315}
316
317static int aes_set_key(struct crypto_tfm *tfm, const u8 *in_key,
318 unsigned int key_len)
319{
320 return aes_set_key_common(tfm, crypto_tfm_ctx(tfm), in_key, key_len);
321}
322
323static void aes_encrypt(struct crypto_tfm *tfm, u8 *dst, const u8 *src)
324{
325 struct crypto_aes_ctx *ctx = aes_ctx(crypto_tfm_ctx(tfm));
326
327 if (!irq_fpu_usable())
328 crypto_aes_encrypt_x86(ctx, dst, src);
329 else {
330 kernel_fpu_begin();
331 aesni_enc(ctx, dst, src);
332 kernel_fpu_end();
333 }
334}
335
336static void aes_decrypt(struct crypto_tfm *tfm, u8 *dst, const u8 *src)
337{
338 struct crypto_aes_ctx *ctx = aes_ctx(crypto_tfm_ctx(tfm));
339
340 if (!irq_fpu_usable())
341 crypto_aes_decrypt_x86(ctx, dst, src);
342 else {
343 kernel_fpu_begin();
344 aesni_dec(ctx, dst, src);
345 kernel_fpu_end();
346 }
347}
348
349static void __aes_encrypt(struct crypto_tfm *tfm, u8 *dst, const u8 *src)
350{
351 struct crypto_aes_ctx *ctx = aes_ctx(crypto_tfm_ctx(tfm));
352
353 aesni_enc(ctx, dst, src);
354}
355
356static void __aes_decrypt(struct crypto_tfm *tfm, u8 *dst, const u8 *src)
357{
358 struct crypto_aes_ctx *ctx = aes_ctx(crypto_tfm_ctx(tfm));
359
360 aesni_dec(ctx, dst, src);
361}
362
363static int ecb_encrypt(struct blkcipher_desc *desc,
364 struct scatterlist *dst, struct scatterlist *src,
365 unsigned int nbytes)
366{
367 struct crypto_aes_ctx *ctx = aes_ctx(crypto_blkcipher_ctx(desc->tfm));
368 struct blkcipher_walk walk;
369 int err;
370
371 blkcipher_walk_init(&walk, dst, src, nbytes);
372 err = blkcipher_walk_virt(desc, &walk);
373 desc->flags &= ~CRYPTO_TFM_REQ_MAY_SLEEP;
374
375 kernel_fpu_begin();
376 while ((nbytes = walk.nbytes)) {
377 aesni_ecb_enc(ctx, walk.dst.virt.addr, walk.src.virt.addr,
378 nbytes & AES_BLOCK_MASK);
379 nbytes &= AES_BLOCK_SIZE - 1;
380 err = blkcipher_walk_done(desc, &walk, nbytes);
381 }
382 kernel_fpu_end();
383
384 return err;
385}
386
387static int ecb_decrypt(struct blkcipher_desc *desc,
388 struct scatterlist *dst, struct scatterlist *src,
389 unsigned int nbytes)
390{
391 struct crypto_aes_ctx *ctx = aes_ctx(crypto_blkcipher_ctx(desc->tfm));
392 struct blkcipher_walk walk;
393 int err;
394
395 blkcipher_walk_init(&walk, dst, src, nbytes);
396 err = blkcipher_walk_virt(desc, &walk);
397 desc->flags &= ~CRYPTO_TFM_REQ_MAY_SLEEP;
398
399 kernel_fpu_begin();
400 while ((nbytes = walk.nbytes)) {
401 aesni_ecb_dec(ctx, walk.dst.virt.addr, walk.src.virt.addr,
402 nbytes & AES_BLOCK_MASK);
403 nbytes &= AES_BLOCK_SIZE - 1;
404 err = blkcipher_walk_done(desc, &walk, nbytes);
405 }
406 kernel_fpu_end();
407
408 return err;
409}
410
411static int cbc_encrypt(struct blkcipher_desc *desc,
412 struct scatterlist *dst, struct scatterlist *src,
413 unsigned int nbytes)
414{
415 struct crypto_aes_ctx *ctx = aes_ctx(crypto_blkcipher_ctx(desc->tfm));
416 struct blkcipher_walk walk;
417 int err;
418
419 blkcipher_walk_init(&walk, dst, src, nbytes);
420 err = blkcipher_walk_virt(desc, &walk);
421 desc->flags &= ~CRYPTO_TFM_REQ_MAY_SLEEP;
422
423 kernel_fpu_begin();
424 while ((nbytes = walk.nbytes)) {
425 aesni_cbc_enc(ctx, walk.dst.virt.addr, walk.src.virt.addr,
426 nbytes & AES_BLOCK_MASK, walk.iv);
427 nbytes &= AES_BLOCK_SIZE - 1;
428 err = blkcipher_walk_done(desc, &walk, nbytes);
429 }
430 kernel_fpu_end();
431
432 return err;
433}
434
435static int cbc_decrypt(struct blkcipher_desc *desc,
436 struct scatterlist *dst, struct scatterlist *src,
437 unsigned int nbytes)
438{
439 struct crypto_aes_ctx *ctx = aes_ctx(crypto_blkcipher_ctx(desc->tfm));
440 struct blkcipher_walk walk;
441 int err;
442
443 blkcipher_walk_init(&walk, dst, src, nbytes);
444 err = blkcipher_walk_virt(desc, &walk);
445 desc->flags &= ~CRYPTO_TFM_REQ_MAY_SLEEP;
446
447 kernel_fpu_begin();
448 while ((nbytes = walk.nbytes)) {
449 aesni_cbc_dec(ctx, walk.dst.virt.addr, walk.src.virt.addr,
450 nbytes & AES_BLOCK_MASK, walk.iv);
451 nbytes &= AES_BLOCK_SIZE - 1;
452 err = blkcipher_walk_done(desc, &walk, nbytes);
453 }
454 kernel_fpu_end();
455
456 return err;
457}
458
459#ifdef CONFIG_X86_64
460static void ctr_crypt_final(struct crypto_aes_ctx *ctx,
461 struct blkcipher_walk *walk)
462{
463 u8 *ctrblk = walk->iv;
464 u8 keystream[AES_BLOCK_SIZE];
465 u8 *src = walk->src.virt.addr;
466 u8 *dst = walk->dst.virt.addr;
467 unsigned int nbytes = walk->nbytes;
468
469 aesni_enc(ctx, keystream, ctrblk);
470 crypto_xor(keystream, src, nbytes);
471 memcpy(dst, keystream, nbytes);
472 crypto_inc(ctrblk, AES_BLOCK_SIZE);
473}
474
475static int ctr_crypt(struct blkcipher_desc *desc,
476 struct scatterlist *dst, struct scatterlist *src,
477 unsigned int nbytes)
478{
479 struct crypto_aes_ctx *ctx = aes_ctx(crypto_blkcipher_ctx(desc->tfm));
480 struct blkcipher_walk walk;
481 int err;
482
483 blkcipher_walk_init(&walk, dst, src, nbytes);
484 err = blkcipher_walk_virt_block(desc, &walk, AES_BLOCK_SIZE);
485 desc->flags &= ~CRYPTO_TFM_REQ_MAY_SLEEP;
486
487 kernel_fpu_begin();
488 while ((nbytes = walk.nbytes) >= AES_BLOCK_SIZE) {
489 aesni_ctr_enc(ctx, walk.dst.virt.addr, walk.src.virt.addr,
490 nbytes & AES_BLOCK_MASK, walk.iv);
491 nbytes &= AES_BLOCK_SIZE - 1;
492 err = blkcipher_walk_done(desc, &walk, nbytes);
493 }
494 if (walk.nbytes) {
495 ctr_crypt_final(ctx, &walk);
496 err = blkcipher_walk_done(desc, &walk, 0);
497 }
498 kernel_fpu_end();
499
500 return err;
501}
502#endif
503
504static int ablk_ecb_init(struct crypto_tfm *tfm)
505{
506 return ablk_init_common(tfm, "__driver-ecb-aes-aesni");
507}
508
509static int ablk_cbc_init(struct crypto_tfm *tfm)
510{
511 return ablk_init_common(tfm, "__driver-cbc-aes-aesni");
512}
513
514#ifdef CONFIG_X86_64
515static int ablk_ctr_init(struct crypto_tfm *tfm)
516{
517 return ablk_init_common(tfm, "__driver-ctr-aes-aesni");
518}
519
520#endif
521
522#ifdef HAS_PCBC
523static int ablk_pcbc_init(struct crypto_tfm *tfm)
524{
525 return ablk_init_common(tfm, "fpu(pcbc(__driver-aes-aesni))");
526}
527#endif
528
529static void lrw_xts_encrypt_callback(void *ctx, u8 *blks, unsigned int nbytes)
530{
531 aesni_ecb_enc(ctx, blks, blks, nbytes);
532}
533
534static void lrw_xts_decrypt_callback(void *ctx, u8 *blks, unsigned int nbytes)
535{
536 aesni_ecb_dec(ctx, blks, blks, nbytes);
537}
538
539static int lrw_aesni_setkey(struct crypto_tfm *tfm, const u8 *key,
540 unsigned int keylen)
541{
542 struct aesni_lrw_ctx *ctx = crypto_tfm_ctx(tfm);
543 int err;
544
545 err = aes_set_key_common(tfm, ctx->raw_aes_ctx, key,
546 keylen - AES_BLOCK_SIZE);
547 if (err)
548 return err;
549
550 return lrw_init_table(&ctx->lrw_table, key + keylen - AES_BLOCK_SIZE);
551}
552
553static void lrw_aesni_exit_tfm(struct crypto_tfm *tfm)
554{
555 struct aesni_lrw_ctx *ctx = crypto_tfm_ctx(tfm);
556
557 lrw_free_table(&ctx->lrw_table);
558}
559
560static int lrw_encrypt(struct blkcipher_desc *desc, struct scatterlist *dst,
561 struct scatterlist *src, unsigned int nbytes)
562{
563 struct aesni_lrw_ctx *ctx = crypto_blkcipher_ctx(desc->tfm);
564 be128 buf[8];
565 struct lrw_crypt_req req = {
566 .tbuf = buf,
567 .tbuflen = sizeof(buf),
568
569 .table_ctx = &ctx->lrw_table,
570 .crypt_ctx = aes_ctx(ctx->raw_aes_ctx),
571 .crypt_fn = lrw_xts_encrypt_callback,
572 };
573 int ret;
574
575 desc->flags &= ~CRYPTO_TFM_REQ_MAY_SLEEP;
576
577 kernel_fpu_begin();
578 ret = lrw_crypt(desc, dst, src, nbytes, &req);
579 kernel_fpu_end();
580
581 return ret;
582}
583
584static int lrw_decrypt(struct blkcipher_desc *desc, struct scatterlist *dst,
585 struct scatterlist *src, unsigned int nbytes)
586{
587 struct aesni_lrw_ctx *ctx = crypto_blkcipher_ctx(desc->tfm);
588 be128 buf[8];
589 struct lrw_crypt_req req = {
590 .tbuf = buf,
591 .tbuflen = sizeof(buf),
592
593 .table_ctx = &ctx->lrw_table,
594 .crypt_ctx = aes_ctx(ctx->raw_aes_ctx),
595 .crypt_fn = lrw_xts_decrypt_callback,
596 };
597 int ret;
598
599 desc->flags &= ~CRYPTO_TFM_REQ_MAY_SLEEP;
600
601 kernel_fpu_begin();
602 ret = lrw_crypt(desc, dst, src, nbytes, &req);
603 kernel_fpu_end();
604
605 return ret;
606}
607
608static int xts_aesni_setkey(struct crypto_tfm *tfm, const u8 *key,
609 unsigned int keylen)
610{
611 struct aesni_xts_ctx *ctx = crypto_tfm_ctx(tfm);
612 u32 *flags = &tfm->crt_flags;
613 int err;
614
615 /* key consists of keys of equal size concatenated, therefore
616 * the length must be even
617 */
618 if (keylen % 2) {
619 *flags |= CRYPTO_TFM_RES_BAD_KEY_LEN;
620 return -EINVAL;
621 }
622
623 /* first half of xts-key is for crypt */
624 err = aes_set_key_common(tfm, ctx->raw_crypt_ctx, key, keylen / 2);
625 if (err)
626 return err;
627
628 /* second half of xts-key is for tweak */
629 return aes_set_key_common(tfm, ctx->raw_tweak_ctx, key + keylen / 2,
630 keylen / 2);
631}
632
633
634static void aesni_xts_tweak(void *ctx, u8 *out, const u8 *in)
635{
636 aesni_enc(ctx, out, in);
637}
638
639#ifdef CONFIG_X86_64
640
641static void aesni_xts_enc(void *ctx, u128 *dst, const u128 *src, le128 *iv)
642{
643 glue_xts_crypt_128bit_one(ctx, dst, src, iv, GLUE_FUNC_CAST(aesni_enc));
644}
645
646static void aesni_xts_dec(void *ctx, u128 *dst, const u128 *src, le128 *iv)
647{
648 glue_xts_crypt_128bit_one(ctx, dst, src, iv, GLUE_FUNC_CAST(aesni_dec));
649}
650
651static void aesni_xts_enc8(void *ctx, u128 *dst, const u128 *src, le128 *iv)
652{
653 aesni_xts_crypt8(ctx, (u8 *)dst, (const u8 *)src, true, (u8 *)iv);
654}
655
656static void aesni_xts_dec8(void *ctx, u128 *dst, const u128 *src, le128 *iv)
657{
658 aesni_xts_crypt8(ctx, (u8 *)dst, (const u8 *)src, false, (u8 *)iv);
659}
660
661static const struct common_glue_ctx aesni_enc_xts = {
662 .num_funcs = 2,
663 .fpu_blocks_limit = 1,
664
665 .funcs = { {
666 .num_blocks = 8,
667 .fn_u = { .xts = GLUE_XTS_FUNC_CAST(aesni_xts_enc8) }
668 }, {
669 .num_blocks = 1,
670 .fn_u = { .xts = GLUE_XTS_FUNC_CAST(aesni_xts_enc) }
671 } }
672};
673
674static const struct common_glue_ctx aesni_dec_xts = {
675 .num_funcs = 2,
676 .fpu_blocks_limit = 1,
677
678 .funcs = { {
679 .num_blocks = 8,
680 .fn_u = { .xts = GLUE_XTS_FUNC_CAST(aesni_xts_dec8) }
681 }, {
682 .num_blocks = 1,
683 .fn_u = { .xts = GLUE_XTS_FUNC_CAST(aesni_xts_dec) }
684 } }
685};
686
687static int xts_encrypt(struct blkcipher_desc *desc, struct scatterlist *dst,
688 struct scatterlist *src, unsigned int nbytes)
689{
690 struct aesni_xts_ctx *ctx = crypto_blkcipher_ctx(desc->tfm);
691
692 return glue_xts_crypt_128bit(&aesni_enc_xts, desc, dst, src, nbytes,
693 XTS_TWEAK_CAST(aesni_xts_tweak),
694 aes_ctx(ctx->raw_tweak_ctx),
695 aes_ctx(ctx->raw_crypt_ctx));
696}
697
698static int xts_decrypt(struct blkcipher_desc *desc, struct scatterlist *dst,
699 struct scatterlist *src, unsigned int nbytes)
700{
701 struct aesni_xts_ctx *ctx = crypto_blkcipher_ctx(desc->tfm);
702
703 return glue_xts_crypt_128bit(&aesni_dec_xts, desc, dst, src, nbytes,
704 XTS_TWEAK_CAST(aesni_xts_tweak),
705 aes_ctx(ctx->raw_tweak_ctx),
706 aes_ctx(ctx->raw_crypt_ctx));
707}
708
709#else
710
711static int xts_encrypt(struct blkcipher_desc *desc, struct scatterlist *dst,
712 struct scatterlist *src, unsigned int nbytes)
713{
714 struct aesni_xts_ctx *ctx = crypto_blkcipher_ctx(desc->tfm);
715 be128 buf[8];
716 struct xts_crypt_req req = {
717 .tbuf = buf,
718 .tbuflen = sizeof(buf),
719
720 .tweak_ctx = aes_ctx(ctx->raw_tweak_ctx),
721 .tweak_fn = aesni_xts_tweak,
722 .crypt_ctx = aes_ctx(ctx->raw_crypt_ctx),
723 .crypt_fn = lrw_xts_encrypt_callback,
724 };
725 int ret;
726
727 desc->flags &= ~CRYPTO_TFM_REQ_MAY_SLEEP;
728
729 kernel_fpu_begin();
730 ret = xts_crypt(desc, dst, src, nbytes, &req);
731 kernel_fpu_end();
732
733 return ret;
734}
735
736static int xts_decrypt(struct blkcipher_desc *desc, struct scatterlist *dst,
737 struct scatterlist *src, unsigned int nbytes)
738{
739 struct aesni_xts_ctx *ctx = crypto_blkcipher_ctx(desc->tfm);
740 be128 buf[8];
741 struct xts_crypt_req req = {
742 .tbuf = buf,
743 .tbuflen = sizeof(buf),
744
745 .tweak_ctx = aes_ctx(ctx->raw_tweak_ctx),
746 .tweak_fn = aesni_xts_tweak,
747 .crypt_ctx = aes_ctx(ctx->raw_crypt_ctx),
748 .crypt_fn = lrw_xts_decrypt_callback,
749 };
750 int ret;
751
752 desc->flags &= ~CRYPTO_TFM_REQ_MAY_SLEEP;
753
754 kernel_fpu_begin();
755 ret = xts_crypt(desc, dst, src, nbytes, &req);
756 kernel_fpu_end();
757
758 return ret;
759}
760
761#endif
762
763#ifdef CONFIG_X86_64
764static int rfc4106_init(struct crypto_tfm *tfm)
765{
766 struct cryptd_aead *cryptd_tfm;
767 struct aesni_rfc4106_gcm_ctx *ctx = (struct aesni_rfc4106_gcm_ctx *)
768 PTR_ALIGN((u8 *)crypto_tfm_ctx(tfm), AESNI_ALIGN);
769 struct crypto_aead *cryptd_child;
770 struct aesni_rfc4106_gcm_ctx *child_ctx;
771 cryptd_tfm = cryptd_alloc_aead("__driver-gcm-aes-aesni", 0, 0);
772 if (IS_ERR(cryptd_tfm))
773 return PTR_ERR(cryptd_tfm);
774
775 cryptd_child = cryptd_aead_child(cryptd_tfm);
776 child_ctx = aesni_rfc4106_gcm_ctx_get(cryptd_child);
777 memcpy(child_ctx, ctx, sizeof(*ctx));
778 ctx->cryptd_tfm = cryptd_tfm;
779 tfm->crt_aead.reqsize = sizeof(struct aead_request)
780 + crypto_aead_reqsize(&cryptd_tfm->base);
781 return 0;
782}
783
784static void rfc4106_exit(struct crypto_tfm *tfm)
785{
786 struct aesni_rfc4106_gcm_ctx *ctx =
787 (struct aesni_rfc4106_gcm_ctx *)
788 PTR_ALIGN((u8 *)crypto_tfm_ctx(tfm), AESNI_ALIGN);
789 if (!IS_ERR(ctx->cryptd_tfm))
790 cryptd_free_aead(ctx->cryptd_tfm);
791 return;
792}
793
794static void
795rfc4106_set_hash_subkey_done(struct crypto_async_request *req, int err)
796{
797 struct aesni_gcm_set_hash_subkey_result *result = req->data;
798
799 if (err == -EINPROGRESS)
800 return;
801 result->err = err;
802 complete(&result->completion);
803}
804
805static int
806rfc4106_set_hash_subkey(u8 *hash_subkey, const u8 *key, unsigned int key_len)
807{
808 struct crypto_ablkcipher *ctr_tfm;
809 struct ablkcipher_request *req;
810 int ret = -EINVAL;
811 struct aesni_hash_subkey_req_data *req_data;
812
813 ctr_tfm = crypto_alloc_ablkcipher("ctr(aes)", 0, 0);
814 if (IS_ERR(ctr_tfm))
815 return PTR_ERR(ctr_tfm);
816
817 crypto_ablkcipher_clear_flags(ctr_tfm, ~0);
818
819 ret = crypto_ablkcipher_setkey(ctr_tfm, key, key_len);
820 if (ret)
821 goto out_free_ablkcipher;
822
823 ret = -ENOMEM;
824 req = ablkcipher_request_alloc(ctr_tfm, GFP_KERNEL);
825 if (!req)
826 goto out_free_ablkcipher;
827
828 req_data = kmalloc(sizeof(*req_data), GFP_KERNEL);
829 if (!req_data)
830 goto out_free_request;
831
832 memset(req_data->iv, 0, sizeof(req_data->iv));
833
834 /* Clear the data in the hash sub key container to zero.*/
835 /* We want to cipher all zeros to create the hash sub key. */
836 memset(hash_subkey, 0, RFC4106_HASH_SUBKEY_SIZE);
837
838 init_completion(&req_data->result.completion);
839 sg_init_one(&req_data->sg, hash_subkey, RFC4106_HASH_SUBKEY_SIZE);
840 ablkcipher_request_set_tfm(req, ctr_tfm);
841 ablkcipher_request_set_callback(req, CRYPTO_TFM_REQ_MAY_SLEEP |
842 CRYPTO_TFM_REQ_MAY_BACKLOG,
843 rfc4106_set_hash_subkey_done,
844 &req_data->result);
845
846 ablkcipher_request_set_crypt(req, &req_data->sg,
847 &req_data->sg, RFC4106_HASH_SUBKEY_SIZE, req_data->iv);
848
849 ret = crypto_ablkcipher_encrypt(req);
850 if (ret == -EINPROGRESS || ret == -EBUSY) {
851 ret = wait_for_completion_interruptible
852 (&req_data->result.completion);
853 if (!ret)
854 ret = req_data->result.err;
855 }
856 kfree(req_data);
857out_free_request:
858 ablkcipher_request_free(req);
859out_free_ablkcipher:
860 crypto_free_ablkcipher(ctr_tfm);
861 return ret;
862}
863
864static int rfc4106_set_key(struct crypto_aead *parent, const u8 *key,
865 unsigned int key_len)
866{
867 int ret = 0;
868 struct crypto_tfm *tfm = crypto_aead_tfm(parent);
869 struct aesni_rfc4106_gcm_ctx *ctx = aesni_rfc4106_gcm_ctx_get(parent);
870 struct crypto_aead *cryptd_child = cryptd_aead_child(ctx->cryptd_tfm);
871 struct aesni_rfc4106_gcm_ctx *child_ctx =
872 aesni_rfc4106_gcm_ctx_get(cryptd_child);
873 u8 *new_key_align, *new_key_mem = NULL;
874
875 if (key_len < 4) {
876 crypto_tfm_set_flags(tfm, CRYPTO_TFM_RES_BAD_KEY_LEN);
877 return -EINVAL;
878 }
879 /*Account for 4 byte nonce at the end.*/
880 key_len -= 4;
881 if (key_len != AES_KEYSIZE_128) {
882 crypto_tfm_set_flags(tfm, CRYPTO_TFM_RES_BAD_KEY_LEN);
883 return -EINVAL;
884 }
885
886 memcpy(ctx->nonce, key + key_len, sizeof(ctx->nonce));
887 /*This must be on a 16 byte boundary!*/
888 if ((unsigned long)(&(ctx->aes_key_expanded.key_enc[0])) % AESNI_ALIGN)
889 return -EINVAL;
890
891 if ((unsigned long)key % AESNI_ALIGN) {
892 /*key is not aligned: use an auxuliar aligned pointer*/
893 new_key_mem = kmalloc(key_len+AESNI_ALIGN, GFP_KERNEL);
894 if (!new_key_mem)
895 return -ENOMEM;
896
897 new_key_align = PTR_ALIGN(new_key_mem, AESNI_ALIGN);
898 memcpy(new_key_align, key, key_len);
899 key = new_key_align;
900 }
901
902 if (!irq_fpu_usable())
903 ret = crypto_aes_expand_key(&(ctx->aes_key_expanded),
904 key, key_len);
905 else {
906 kernel_fpu_begin();
907 ret = aesni_set_key(&(ctx->aes_key_expanded), key, key_len);
908 kernel_fpu_end();
909 }
910 /*This must be on a 16 byte boundary!*/
911 if ((unsigned long)(&(ctx->hash_subkey[0])) % AESNI_ALIGN) {
912 ret = -EINVAL;
913 goto exit;
914 }
915 ret = rfc4106_set_hash_subkey(ctx->hash_subkey, key, key_len);
916 memcpy(child_ctx, ctx, sizeof(*ctx));
917exit:
918 kfree(new_key_mem);
919 return ret;
920}
921
922/* This is the Integrity Check Value (aka the authentication tag length and can
923 * be 8, 12 or 16 bytes long. */
924static int rfc4106_set_authsize(struct crypto_aead *parent,
925 unsigned int authsize)
926{
927 struct aesni_rfc4106_gcm_ctx *ctx = aesni_rfc4106_gcm_ctx_get(parent);
928 struct crypto_aead *cryptd_child = cryptd_aead_child(ctx->cryptd_tfm);
929
930 switch (authsize) {
931 case 8:
932 case 12:
933 case 16:
934 break;
935 default:
936 return -EINVAL;
937 }
938 crypto_aead_crt(parent)->authsize = authsize;
939 crypto_aead_crt(cryptd_child)->authsize = authsize;
940 return 0;
941}
942
943static int rfc4106_encrypt(struct aead_request *req)
944{
945 int ret;
946 struct crypto_aead *tfm = crypto_aead_reqtfm(req);
947 struct aesni_rfc4106_gcm_ctx *ctx = aesni_rfc4106_gcm_ctx_get(tfm);
948
949 if (!irq_fpu_usable()) {
950 struct aead_request *cryptd_req =
951 (struct aead_request *) aead_request_ctx(req);
952 memcpy(cryptd_req, req, sizeof(*req));
953 aead_request_set_tfm(cryptd_req, &ctx->cryptd_tfm->base);
954 return crypto_aead_encrypt(cryptd_req);
955 } else {
956 struct crypto_aead *cryptd_child = cryptd_aead_child(ctx->cryptd_tfm);
957 kernel_fpu_begin();
958 ret = cryptd_child->base.crt_aead.encrypt(req);
959 kernel_fpu_end();
960 return ret;
961 }
962}
963
964static int rfc4106_decrypt(struct aead_request *req)
965{
966 int ret;
967 struct crypto_aead *tfm = crypto_aead_reqtfm(req);
968 struct aesni_rfc4106_gcm_ctx *ctx = aesni_rfc4106_gcm_ctx_get(tfm);
969
970 if (!irq_fpu_usable()) {
971 struct aead_request *cryptd_req =
972 (struct aead_request *) aead_request_ctx(req);
973 memcpy(cryptd_req, req, sizeof(*req));
974 aead_request_set_tfm(cryptd_req, &ctx->cryptd_tfm->base);
975 return crypto_aead_decrypt(cryptd_req);
976 } else {
977 struct crypto_aead *cryptd_child = cryptd_aead_child(ctx->cryptd_tfm);
978 kernel_fpu_begin();
979 ret = cryptd_child->base.crt_aead.decrypt(req);
980 kernel_fpu_end();
981 return ret;
982 }
983}
984
985static int __driver_rfc4106_encrypt(struct aead_request *req)
986{
987 u8 one_entry_in_sg = 0;
988 u8 *src, *dst, *assoc;
989 __be32 counter = cpu_to_be32(1);
990 struct crypto_aead *tfm = crypto_aead_reqtfm(req);
991 struct aesni_rfc4106_gcm_ctx *ctx = aesni_rfc4106_gcm_ctx_get(tfm);
992 void *aes_ctx = &(ctx->aes_key_expanded);
993 unsigned long auth_tag_len = crypto_aead_authsize(tfm);
994 u8 iv_tab[16+AESNI_ALIGN];
995 u8* iv = (u8 *) PTR_ALIGN((u8 *)iv_tab, AESNI_ALIGN);
996 struct scatter_walk src_sg_walk;
997 struct scatter_walk assoc_sg_walk;
998 struct scatter_walk dst_sg_walk;
999 unsigned int i;
1000
1001 /* Assuming we are supporting rfc4106 64-bit extended */
1002 /* sequence numbers We need to have the AAD length equal */
1003 /* to 8 or 12 bytes */
1004 if (unlikely(req->assoclen != 8 && req->assoclen != 12))
1005 return -EINVAL;
1006 /* IV below built */
1007 for (i = 0; i < 4; i++)
1008 *(iv+i) = ctx->nonce[i];
1009 for (i = 0; i < 8; i++)
1010 *(iv+4+i) = req->iv[i];
1011 *((__be32 *)(iv+12)) = counter;
1012
1013 if ((sg_is_last(req->src)) && (sg_is_last(req->assoc))) {
1014 one_entry_in_sg = 1;
1015 scatterwalk_start(&src_sg_walk, req->src);
1016 scatterwalk_start(&assoc_sg_walk, req->assoc);
1017 src = scatterwalk_map(&src_sg_walk);
1018 assoc = scatterwalk_map(&assoc_sg_walk);
1019 dst = src;
1020 if (unlikely(req->src != req->dst)) {
1021 scatterwalk_start(&dst_sg_walk, req->dst);
1022 dst = scatterwalk_map(&dst_sg_walk);
1023 }
1024
1025 } else {
1026 /* Allocate memory for src, dst, assoc */
1027 src = kmalloc(req->cryptlen + auth_tag_len + req->assoclen,
1028 GFP_ATOMIC);
1029 if (unlikely(!src))
1030 return -ENOMEM;
1031 assoc = (src + req->cryptlen + auth_tag_len);
1032 scatterwalk_map_and_copy(src, req->src, 0, req->cryptlen, 0);
1033 scatterwalk_map_and_copy(assoc, req->assoc, 0,
1034 req->assoclen, 0);
1035 dst = src;
1036 }
1037
1038 aesni_gcm_enc_tfm(aes_ctx, dst, src, (unsigned long)req->cryptlen, iv,
1039 ctx->hash_subkey, assoc, (unsigned long)req->assoclen, dst
1040 + ((unsigned long)req->cryptlen), auth_tag_len);
1041
1042 /* The authTag (aka the Integrity Check Value) needs to be written
1043 * back to the packet. */
1044 if (one_entry_in_sg) {
1045 if (unlikely(req->src != req->dst)) {
1046 scatterwalk_unmap(dst);
1047 scatterwalk_done(&dst_sg_walk, 0, 0);
1048 }
1049 scatterwalk_unmap(src);
1050 scatterwalk_unmap(assoc);
1051 scatterwalk_done(&src_sg_walk, 0, 0);
1052 scatterwalk_done(&assoc_sg_walk, 0, 0);
1053 } else {
1054 scatterwalk_map_and_copy(dst, req->dst, 0,
1055 req->cryptlen + auth_tag_len, 1);
1056 kfree(src);
1057 }
1058 return 0;
1059}
1060
1061static int __driver_rfc4106_decrypt(struct aead_request *req)
1062{
1063 u8 one_entry_in_sg = 0;
1064 u8 *src, *dst, *assoc;
1065 unsigned long tempCipherLen = 0;
1066 __be32 counter = cpu_to_be32(1);
1067 int retval = 0;
1068 struct crypto_aead *tfm = crypto_aead_reqtfm(req);
1069 struct aesni_rfc4106_gcm_ctx *ctx = aesni_rfc4106_gcm_ctx_get(tfm);
1070 void *aes_ctx = &(ctx->aes_key_expanded);
1071 unsigned long auth_tag_len = crypto_aead_authsize(tfm);
1072 u8 iv_and_authTag[32+AESNI_ALIGN];
1073 u8 *iv = (u8 *) PTR_ALIGN((u8 *)iv_and_authTag, AESNI_ALIGN);
1074 u8 *authTag = iv + 16;
1075 struct scatter_walk src_sg_walk;
1076 struct scatter_walk assoc_sg_walk;
1077 struct scatter_walk dst_sg_walk;
1078 unsigned int i;
1079
1080 if (unlikely((req->cryptlen < auth_tag_len) ||
1081 (req->assoclen != 8 && req->assoclen != 12)))
1082 return -EINVAL;
1083 /* Assuming we are supporting rfc4106 64-bit extended */
1084 /* sequence numbers We need to have the AAD length */
1085 /* equal to 8 or 12 bytes */
1086
1087 tempCipherLen = (unsigned long)(req->cryptlen - auth_tag_len);
1088 /* IV below built */
1089 for (i = 0; i < 4; i++)
1090 *(iv+i) = ctx->nonce[i];
1091 for (i = 0; i < 8; i++)
1092 *(iv+4+i) = req->iv[i];
1093 *((__be32 *)(iv+12)) = counter;
1094
1095 if ((sg_is_last(req->src)) && (sg_is_last(req->assoc))) {
1096 one_entry_in_sg = 1;
1097 scatterwalk_start(&src_sg_walk, req->src);
1098 scatterwalk_start(&assoc_sg_walk, req->assoc);
1099 src = scatterwalk_map(&src_sg_walk);
1100 assoc = scatterwalk_map(&assoc_sg_walk);
1101 dst = src;
1102 if (unlikely(req->src != req->dst)) {
1103 scatterwalk_start(&dst_sg_walk, req->dst);
1104 dst = scatterwalk_map(&dst_sg_walk);
1105 }
1106
1107 } else {
1108 /* Allocate memory for src, dst, assoc */
1109 src = kmalloc(req->cryptlen + req->assoclen, GFP_ATOMIC);
1110 if (!src)
1111 return -ENOMEM;
1112 assoc = (src + req->cryptlen + auth_tag_len);
1113 scatterwalk_map_and_copy(src, req->src, 0, req->cryptlen, 0);
1114 scatterwalk_map_and_copy(assoc, req->assoc, 0,
1115 req->assoclen, 0);
1116 dst = src;
1117 }
1118
1119 aesni_gcm_dec_tfm(aes_ctx, dst, src, tempCipherLen, iv,
1120 ctx->hash_subkey, assoc, (unsigned long)req->assoclen,
1121 authTag, auth_tag_len);
1122
1123 /* Compare generated tag with passed in tag. */
1124 retval = crypto_memneq(src + tempCipherLen, authTag, auth_tag_len) ?
1125 -EBADMSG : 0;
1126
1127 if (one_entry_in_sg) {
1128 if (unlikely(req->src != req->dst)) {
1129 scatterwalk_unmap(dst);
1130 scatterwalk_done(&dst_sg_walk, 0, 0);
1131 }
1132 scatterwalk_unmap(src);
1133 scatterwalk_unmap(assoc);
1134 scatterwalk_done(&src_sg_walk, 0, 0);
1135 scatterwalk_done(&assoc_sg_walk, 0, 0);
1136 } else {
1137 scatterwalk_map_and_copy(dst, req->dst, 0, req->cryptlen, 1);
1138 kfree(src);
1139 }
1140 return retval;
1141}
1142#endif
1143
1144static struct crypto_alg aesni_algs[] = { {
1145 .cra_name = "aes",
1146 .cra_driver_name = "aes-aesni",
1147 .cra_priority = 300,
1148 .cra_flags = CRYPTO_ALG_TYPE_CIPHER,
1149 .cra_blocksize = AES_BLOCK_SIZE,
1150 .cra_ctxsize = sizeof(struct crypto_aes_ctx) +
1151 AESNI_ALIGN - 1,
1152 .cra_alignmask = 0,
1153 .cra_module = THIS_MODULE,
1154 .cra_u = {
1155 .cipher = {
1156 .cia_min_keysize = AES_MIN_KEY_SIZE,
1157 .cia_max_keysize = AES_MAX_KEY_SIZE,
1158 .cia_setkey = aes_set_key,
1159 .cia_encrypt = aes_encrypt,
1160 .cia_decrypt = aes_decrypt
1161 }
1162 }
1163}, {
1164 .cra_name = "__aes-aesni",
1165 .cra_driver_name = "__driver-aes-aesni",
1166 .cra_priority = 0,
1167 .cra_flags = CRYPTO_ALG_TYPE_CIPHER,
1168 .cra_blocksize = AES_BLOCK_SIZE,
1169 .cra_ctxsize = sizeof(struct crypto_aes_ctx) +
1170 AESNI_ALIGN - 1,
1171 .cra_alignmask = 0,
1172 .cra_module = THIS_MODULE,
1173 .cra_u = {
1174 .cipher = {
1175 .cia_min_keysize = AES_MIN_KEY_SIZE,
1176 .cia_max_keysize = AES_MAX_KEY_SIZE,
1177 .cia_setkey = aes_set_key,
1178 .cia_encrypt = __aes_encrypt,
1179 .cia_decrypt = __aes_decrypt
1180 }
1181 }
1182}, {
1183 .cra_name = "__ecb-aes-aesni",
1184 .cra_driver_name = "__driver-ecb-aes-aesni",
1185 .cra_priority = 0,
1186 .cra_flags = CRYPTO_ALG_TYPE_BLKCIPHER,
1187 .cra_blocksize = AES_BLOCK_SIZE,
1188 .cra_ctxsize = sizeof(struct crypto_aes_ctx) +
1189 AESNI_ALIGN - 1,
1190 .cra_alignmask = 0,
1191 .cra_type = &crypto_blkcipher_type,
1192 .cra_module = THIS_MODULE,
1193 .cra_u = {
1194 .blkcipher = {
1195 .min_keysize = AES_MIN_KEY_SIZE,
1196 .max_keysize = AES_MAX_KEY_SIZE,
1197 .setkey = aes_set_key,
1198 .encrypt = ecb_encrypt,
1199 .decrypt = ecb_decrypt,
1200 },
1201 },
1202}, {
1203 .cra_name = "__cbc-aes-aesni",
1204 .cra_driver_name = "__driver-cbc-aes-aesni",
1205 .cra_priority = 0,
1206 .cra_flags = CRYPTO_ALG_TYPE_BLKCIPHER,
1207 .cra_blocksize = AES_BLOCK_SIZE,
1208 .cra_ctxsize = sizeof(struct crypto_aes_ctx) +
1209 AESNI_ALIGN - 1,
1210 .cra_alignmask = 0,
1211 .cra_type = &crypto_blkcipher_type,
1212 .cra_module = THIS_MODULE,
1213 .cra_u = {
1214 .blkcipher = {
1215 .min_keysize = AES_MIN_KEY_SIZE,
1216 .max_keysize = AES_MAX_KEY_SIZE,
1217 .setkey = aes_set_key,
1218 .encrypt = cbc_encrypt,
1219 .decrypt = cbc_decrypt,
1220 },
1221 },
1222}, {
1223 .cra_name = "ecb(aes)",
1224 .cra_driver_name = "ecb-aes-aesni",
1225 .cra_priority = 400,
1226 .cra_flags = CRYPTO_ALG_TYPE_ABLKCIPHER | CRYPTO_ALG_ASYNC,
1227 .cra_blocksize = AES_BLOCK_SIZE,
1228 .cra_ctxsize = sizeof(struct async_helper_ctx),
1229 .cra_alignmask = 0,
1230 .cra_type = &crypto_ablkcipher_type,
1231 .cra_module = THIS_MODULE,
1232 .cra_init = ablk_ecb_init,
1233 .cra_exit = ablk_exit,
1234 .cra_u = {
1235 .ablkcipher = {
1236 .min_keysize = AES_MIN_KEY_SIZE,
1237 .max_keysize = AES_MAX_KEY_SIZE,
1238 .setkey = ablk_set_key,
1239 .encrypt = ablk_encrypt,
1240 .decrypt = ablk_decrypt,
1241 },
1242 },
1243}, {
1244 .cra_name = "cbc(aes)",
1245 .cra_driver_name = "cbc-aes-aesni",
1246 .cra_priority = 400,
1247 .cra_flags = CRYPTO_ALG_TYPE_ABLKCIPHER | CRYPTO_ALG_ASYNC,
1248 .cra_blocksize = AES_BLOCK_SIZE,
1249 .cra_ctxsize = sizeof(struct async_helper_ctx),
1250 .cra_alignmask = 0,
1251 .cra_type = &crypto_ablkcipher_type,
1252 .cra_module = THIS_MODULE,
1253 .cra_init = ablk_cbc_init,
1254 .cra_exit = ablk_exit,
1255 .cra_u = {
1256 .ablkcipher = {
1257 .min_keysize = AES_MIN_KEY_SIZE,
1258 .max_keysize = AES_MAX_KEY_SIZE,
1259 .ivsize = AES_BLOCK_SIZE,
1260 .setkey = ablk_set_key,
1261 .encrypt = ablk_encrypt,
1262 .decrypt = ablk_decrypt,
1263 },
1264 },
1265#ifdef CONFIG_X86_64
1266}, {
1267 .cra_name = "__ctr-aes-aesni",
1268 .cra_driver_name = "__driver-ctr-aes-aesni",
1269 .cra_priority = 0,
1270 .cra_flags = CRYPTO_ALG_TYPE_BLKCIPHER,
1271 .cra_blocksize = 1,
1272 .cra_ctxsize = sizeof(struct crypto_aes_ctx) +
1273 AESNI_ALIGN - 1,
1274 .cra_alignmask = 0,
1275 .cra_type = &crypto_blkcipher_type,
1276 .cra_module = THIS_MODULE,
1277 .cra_u = {
1278 .blkcipher = {
1279 .min_keysize = AES_MIN_KEY_SIZE,
1280 .max_keysize = AES_MAX_KEY_SIZE,
1281 .ivsize = AES_BLOCK_SIZE,
1282 .setkey = aes_set_key,
1283 .encrypt = ctr_crypt,
1284 .decrypt = ctr_crypt,
1285 },
1286 },
1287}, {
1288 .cra_name = "ctr(aes)",
1289 .cra_driver_name = "ctr-aes-aesni",
1290 .cra_priority = 400,
1291 .cra_flags = CRYPTO_ALG_TYPE_ABLKCIPHER | CRYPTO_ALG_ASYNC,
1292 .cra_blocksize = 1,
1293 .cra_ctxsize = sizeof(struct async_helper_ctx),
1294 .cra_alignmask = 0,
1295 .cra_type = &crypto_ablkcipher_type,
1296 .cra_module = THIS_MODULE,
1297 .cra_init = ablk_ctr_init,
1298 .cra_exit = ablk_exit,
1299 .cra_u = {
1300 .ablkcipher = {
1301 .min_keysize = AES_MIN_KEY_SIZE,
1302 .max_keysize = AES_MAX_KEY_SIZE,
1303 .ivsize = AES_BLOCK_SIZE,
1304 .setkey = ablk_set_key,
1305 .encrypt = ablk_encrypt,
1306 .decrypt = ablk_encrypt,
1307 .geniv = "chainiv",
1308 },
1309 },
1310}, {
1311 .cra_name = "__gcm-aes-aesni",
1312 .cra_driver_name = "__driver-gcm-aes-aesni",
1313 .cra_priority = 0,
1314 .cra_flags = CRYPTO_ALG_TYPE_AEAD,
1315 .cra_blocksize = 1,
1316 .cra_ctxsize = sizeof(struct aesni_rfc4106_gcm_ctx) +
1317 AESNI_ALIGN,
1318 .cra_alignmask = 0,
1319 .cra_type = &crypto_aead_type,
1320 .cra_module = THIS_MODULE,
1321 .cra_u = {
1322 .aead = {
1323 .encrypt = __driver_rfc4106_encrypt,
1324 .decrypt = __driver_rfc4106_decrypt,
1325 },
1326 },
1327}, {
1328 .cra_name = "rfc4106(gcm(aes))",
1329 .cra_driver_name = "rfc4106-gcm-aesni",
1330 .cra_priority = 400,
1331 .cra_flags = CRYPTO_ALG_TYPE_AEAD | CRYPTO_ALG_ASYNC,
1332 .cra_blocksize = 1,
1333 .cra_ctxsize = sizeof(struct aesni_rfc4106_gcm_ctx) +
1334 AESNI_ALIGN,
1335 .cra_alignmask = 0,
1336 .cra_type = &crypto_nivaead_type,
1337 .cra_module = THIS_MODULE,
1338 .cra_init = rfc4106_init,
1339 .cra_exit = rfc4106_exit,
1340 .cra_u = {
1341 .aead = {
1342 .setkey = rfc4106_set_key,
1343 .setauthsize = rfc4106_set_authsize,
1344 .encrypt = rfc4106_encrypt,
1345 .decrypt = rfc4106_decrypt,
1346 .geniv = "seqiv",
1347 .ivsize = 8,
1348 .maxauthsize = 16,
1349 },
1350 },
1351#endif
1352#ifdef HAS_PCBC
1353}, {
1354 .cra_name = "pcbc(aes)",
1355 .cra_driver_name = "pcbc-aes-aesni",
1356 .cra_priority = 400,
1357 .cra_flags = CRYPTO_ALG_TYPE_ABLKCIPHER | CRYPTO_ALG_ASYNC,
1358 .cra_blocksize = AES_BLOCK_SIZE,
1359 .cra_ctxsize = sizeof(struct async_helper_ctx),
1360 .cra_alignmask = 0,
1361 .cra_type = &crypto_ablkcipher_type,
1362 .cra_module = THIS_MODULE,
1363 .cra_init = ablk_pcbc_init,
1364 .cra_exit = ablk_exit,
1365 .cra_u = {
1366 .ablkcipher = {
1367 .min_keysize = AES_MIN_KEY_SIZE,
1368 .max_keysize = AES_MAX_KEY_SIZE,
1369 .ivsize = AES_BLOCK_SIZE,
1370 .setkey = ablk_set_key,
1371 .encrypt = ablk_encrypt,
1372 .decrypt = ablk_decrypt,
1373 },
1374 },
1375#endif
1376}, {
1377 .cra_name = "__lrw-aes-aesni",
1378 .cra_driver_name = "__driver-lrw-aes-aesni",
1379 .cra_priority = 0,
1380 .cra_flags = CRYPTO_ALG_TYPE_BLKCIPHER,
1381 .cra_blocksize = AES_BLOCK_SIZE,
1382 .cra_ctxsize = sizeof(struct aesni_lrw_ctx),
1383 .cra_alignmask = 0,
1384 .cra_type = &crypto_blkcipher_type,
1385 .cra_module = THIS_MODULE,
1386 .cra_exit = lrw_aesni_exit_tfm,
1387 .cra_u = {
1388 .blkcipher = {
1389 .min_keysize = AES_MIN_KEY_SIZE + AES_BLOCK_SIZE,
1390 .max_keysize = AES_MAX_KEY_SIZE + AES_BLOCK_SIZE,
1391 .ivsize = AES_BLOCK_SIZE,
1392 .setkey = lrw_aesni_setkey,
1393 .encrypt = lrw_encrypt,
1394 .decrypt = lrw_decrypt,
1395 },
1396 },
1397}, {
1398 .cra_name = "__xts-aes-aesni",
1399 .cra_driver_name = "__driver-xts-aes-aesni",
1400 .cra_priority = 0,
1401 .cra_flags = CRYPTO_ALG_TYPE_BLKCIPHER,
1402 .cra_blocksize = AES_BLOCK_SIZE,
1403 .cra_ctxsize = sizeof(struct aesni_xts_ctx),
1404 .cra_alignmask = 0,
1405 .cra_type = &crypto_blkcipher_type,
1406 .cra_module = THIS_MODULE,
1407 .cra_u = {
1408 .blkcipher = {
1409 .min_keysize = 2 * AES_MIN_KEY_SIZE,
1410 .max_keysize = 2 * AES_MAX_KEY_SIZE,
1411 .ivsize = AES_BLOCK_SIZE,
1412 .setkey = xts_aesni_setkey,
1413 .encrypt = xts_encrypt,
1414 .decrypt = xts_decrypt,
1415 },
1416 },
1417}, {
1418 .cra_name = "lrw(aes)",
1419 .cra_driver_name = "lrw-aes-aesni",
1420 .cra_priority = 400,
1421 .cra_flags = CRYPTO_ALG_TYPE_ABLKCIPHER | CRYPTO_ALG_ASYNC,
1422 .cra_blocksize = AES_BLOCK_SIZE,
1423 .cra_ctxsize = sizeof(struct async_helper_ctx),
1424 .cra_alignmask = 0,
1425 .cra_type = &crypto_ablkcipher_type,
1426 .cra_module = THIS_MODULE,
1427 .cra_init = ablk_init,
1428 .cra_exit = ablk_exit,
1429 .cra_u = {
1430 .ablkcipher = {
1431 .min_keysize = AES_MIN_KEY_SIZE + AES_BLOCK_SIZE,
1432 .max_keysize = AES_MAX_KEY_SIZE + AES_BLOCK_SIZE,
1433 .ivsize = AES_BLOCK_SIZE,
1434 .setkey = ablk_set_key,
1435 .encrypt = ablk_encrypt,
1436 .decrypt = ablk_decrypt,
1437 },
1438 },
1439}, {
1440 .cra_name = "xts(aes)",
1441 .cra_driver_name = "xts-aes-aesni",
1442 .cra_priority = 400,
1443 .cra_flags = CRYPTO_ALG_TYPE_ABLKCIPHER | CRYPTO_ALG_ASYNC,
1444 .cra_blocksize = AES_BLOCK_SIZE,
1445 .cra_ctxsize = sizeof(struct async_helper_ctx),
1446 .cra_alignmask = 0,
1447 .cra_type = &crypto_ablkcipher_type,
1448 .cra_module = THIS_MODULE,
1449 .cra_init = ablk_init,
1450 .cra_exit = ablk_exit,
1451 .cra_u = {
1452 .ablkcipher = {
1453 .min_keysize = 2 * AES_MIN_KEY_SIZE,
1454 .max_keysize = 2 * AES_MAX_KEY_SIZE,
1455 .ivsize = AES_BLOCK_SIZE,
1456 .setkey = ablk_set_key,
1457 .encrypt = ablk_encrypt,
1458 .decrypt = ablk_decrypt,
1459 },
1460 },
1461} };
1462
1463
1464static const struct x86_cpu_id aesni_cpu_id[] = {
1465 X86_FEATURE_MATCH(X86_FEATURE_AES),
1466 {}
1467};
1468MODULE_DEVICE_TABLE(x86cpu, aesni_cpu_id);
1469
1470static int __init aesni_init(void)
1471{
1472 int err;
1473
1474 if (!x86_match_cpu(aesni_cpu_id))
1475 return -ENODEV;
1476#ifdef CONFIG_X86_64
1477#ifdef CONFIG_AS_AVX2
1478 if (boot_cpu_has(X86_FEATURE_AVX2)) {
1479 pr_info("AVX2 version of gcm_enc/dec engaged.\n");
1480 aesni_gcm_enc_tfm = aesni_gcm_enc_avx2;
1481 aesni_gcm_dec_tfm = aesni_gcm_dec_avx2;
1482 } else
1483#endif
1484#ifdef CONFIG_AS_AVX
1485 if (boot_cpu_has(X86_FEATURE_AVX)) {
1486 pr_info("AVX version of gcm_enc/dec engaged.\n");
1487 aesni_gcm_enc_tfm = aesni_gcm_enc_avx;
1488 aesni_gcm_dec_tfm = aesni_gcm_dec_avx;
1489 } else
1490#endif
1491 {
1492 pr_info("SSE version of gcm_enc/dec engaged.\n");
1493 aesni_gcm_enc_tfm = aesni_gcm_enc;
1494 aesni_gcm_dec_tfm = aesni_gcm_dec;
1495 }
1496#endif
1497
1498 err = crypto_fpu_init();
1499 if (err)
1500 return err;
1501
1502 return crypto_register_algs(aesni_algs, ARRAY_SIZE(aesni_algs));
1503}
1504
1505static void __exit aesni_exit(void)
1506{
1507 crypto_unregister_algs(aesni_algs, ARRAY_SIZE(aesni_algs));
1508
1509 crypto_fpu_exit();
1510}
1511
1512module_init(aesni_init);
1513module_exit(aesni_exit);
1514
1515MODULE_DESCRIPTION("Rijndael (AES) Cipher Algorithm, Intel AES-NI instructions optimized");
1516MODULE_LICENSE("GPL");
1517MODULE_ALIAS("aes");