xref: /openbmc/linux/arch/arm/crypto/aes-ce-glue.c (revision c61b1607ed4fbbf2ba7c86f29768cff44a1a88f8)
// SPDX-License-Identifier: GPL-2.0-only
/*
 * aes-ce-glue.c - wrapper code for ARMv8 AES
 *
 * Copyright (C) 2015 Linaro Ltd <ard.biesheuvel@linaro.org>
 */
786464859SArd Biesheuvel 
886464859SArd Biesheuvel #include <asm/hwcap.h>
986464859SArd Biesheuvel #include <asm/neon.h>
105eedf315SArd Biesheuvel #include <asm/simd.h>
11fafb1dcaSArd Biesheuvel #include <asm/unaligned.h>
1286464859SArd Biesheuvel #include <crypto/aes.h>
135eedf315SArd Biesheuvel #include <crypto/ctr.h>
14da40e7a4SHerbert Xu #include <crypto/internal/simd.h>
15da40e7a4SHerbert Xu #include <crypto/internal/skcipher.h>
16*c61b1607SArd Biesheuvel #include <crypto/scatterwalk.h>
174d8061a5SArd Biesheuvel #include <linux/cpufeature.h>
1886464859SArd Biesheuvel #include <linux/module.h>
1949abc0d2SStephan Mueller #include <crypto/xts.h>
2086464859SArd Biesheuvel 
2186464859SArd Biesheuvel MODULE_DESCRIPTION("AES-ECB/CBC/CTR/XTS using ARMv8 Crypto Extensions");
2286464859SArd Biesheuvel MODULE_AUTHOR("Ard Biesheuvel <ard.biesheuvel@linaro.org>");
2386464859SArd Biesheuvel MODULE_LICENSE("GPL v2");
2486464859SArd Biesheuvel 
2586464859SArd Biesheuvel /* defined in aes-ce-core.S */
2686464859SArd Biesheuvel asmlinkage u32 ce_aes_sub(u32 input);
2786464859SArd Biesheuvel asmlinkage void ce_aes_invert(void *dst, void *src);
2886464859SArd Biesheuvel 
29fcb0e30dSArd Biesheuvel asmlinkage void ce_aes_ecb_encrypt(u8 out[], u8 const in[], u32 const rk[],
3086464859SArd Biesheuvel 				   int rounds, int blocks);
31fcb0e30dSArd Biesheuvel asmlinkage void ce_aes_ecb_decrypt(u8 out[], u8 const in[], u32 const rk[],
3286464859SArd Biesheuvel 				   int rounds, int blocks);
3386464859SArd Biesheuvel 
34fcb0e30dSArd Biesheuvel asmlinkage void ce_aes_cbc_encrypt(u8 out[], u8 const in[], u32 const rk[],
3586464859SArd Biesheuvel 				   int rounds, int blocks, u8 iv[]);
36fcb0e30dSArd Biesheuvel asmlinkage void ce_aes_cbc_decrypt(u8 out[], u8 const in[], u32 const rk[],
3786464859SArd Biesheuvel 				   int rounds, int blocks, u8 iv[]);
3886464859SArd Biesheuvel 
39fcb0e30dSArd Biesheuvel asmlinkage void ce_aes_ctr_encrypt(u8 out[], u8 const in[], u32 const rk[],
4086464859SArd Biesheuvel 				   int rounds, int blocks, u8 ctr[]);
4186464859SArd Biesheuvel 
42fcb0e30dSArd Biesheuvel asmlinkage void ce_aes_xts_encrypt(u8 out[], u8 const in[], u32 const rk1[],
43*c61b1607SArd Biesheuvel 				   int rounds, int bytes, u8 iv[],
44fcb0e30dSArd Biesheuvel 				   u32 const rk2[], int first);
45fcb0e30dSArd Biesheuvel asmlinkage void ce_aes_xts_decrypt(u8 out[], u8 const in[], u32 const rk1[],
46*c61b1607SArd Biesheuvel 				   int rounds, int bytes, u8 iv[],
47fcb0e30dSArd Biesheuvel 				   u32 const rk2[], int first);
4886464859SArd Biesheuvel 
4986464859SArd Biesheuvel struct aes_block {
5086464859SArd Biesheuvel 	u8 b[AES_BLOCK_SIZE];
5186464859SArd Biesheuvel };
5286464859SArd Biesheuvel 
5386464859SArd Biesheuvel static int num_rounds(struct crypto_aes_ctx *ctx)
5486464859SArd Biesheuvel {
5586464859SArd Biesheuvel 	/*
5686464859SArd Biesheuvel 	 * # of rounds specified by AES:
5786464859SArd Biesheuvel 	 * 128 bit key		10 rounds
5886464859SArd Biesheuvel 	 * 192 bit key		12 rounds
5986464859SArd Biesheuvel 	 * 256 bit key		14 rounds
6086464859SArd Biesheuvel 	 * => n byte key	=> 6 + (n/4) rounds
6186464859SArd Biesheuvel 	 */
6286464859SArd Biesheuvel 	return 6 + ctx->key_length / 4;
6386464859SArd Biesheuvel }
6486464859SArd Biesheuvel 
6586464859SArd Biesheuvel static int ce_aes_expandkey(struct crypto_aes_ctx *ctx, const u8 *in_key,
6686464859SArd Biesheuvel 			    unsigned int key_len)
6786464859SArd Biesheuvel {
6886464859SArd Biesheuvel 	/*
6986464859SArd Biesheuvel 	 * The AES key schedule round constants
7086464859SArd Biesheuvel 	 */
7186464859SArd Biesheuvel 	static u8 const rcon[] = {
7286464859SArd Biesheuvel 		0x01, 0x02, 0x04, 0x08, 0x10, 0x20, 0x40, 0x80, 0x1b, 0x36,
7386464859SArd Biesheuvel 	};
7486464859SArd Biesheuvel 
7586464859SArd Biesheuvel 	u32 kwords = key_len / sizeof(u32);
7686464859SArd Biesheuvel 	struct aes_block *key_enc, *key_dec;
7786464859SArd Biesheuvel 	int i, j;
7886464859SArd Biesheuvel 
7986464859SArd Biesheuvel 	if (key_len != AES_KEYSIZE_128 &&
8086464859SArd Biesheuvel 	    key_len != AES_KEYSIZE_192 &&
8186464859SArd Biesheuvel 	    key_len != AES_KEYSIZE_256)
8286464859SArd Biesheuvel 		return -EINVAL;
8386464859SArd Biesheuvel 
8486464859SArd Biesheuvel 	ctx->key_length = key_len;
85fafb1dcaSArd Biesheuvel 	for (i = 0; i < kwords; i++)
86fafb1dcaSArd Biesheuvel 		ctx->key_enc[i] = get_unaligned_le32(in_key + i * sizeof(u32));
8786464859SArd Biesheuvel 
8886464859SArd Biesheuvel 	kernel_neon_begin();
8986464859SArd Biesheuvel 	for (i = 0; i < sizeof(rcon); i++) {
9086464859SArd Biesheuvel 		u32 *rki = ctx->key_enc + (i * kwords);
9186464859SArd Biesheuvel 		u32 *rko = rki + kwords;
9286464859SArd Biesheuvel 
9386464859SArd Biesheuvel 		rko[0] = ror32(ce_aes_sub(rki[kwords - 1]), 8);
9486464859SArd Biesheuvel 		rko[0] = rko[0] ^ rki[0] ^ rcon[i];
9586464859SArd Biesheuvel 		rko[1] = rko[0] ^ rki[1];
9686464859SArd Biesheuvel 		rko[2] = rko[1] ^ rki[2];
9786464859SArd Biesheuvel 		rko[3] = rko[2] ^ rki[3];
9886464859SArd Biesheuvel 
9986464859SArd Biesheuvel 		if (key_len == AES_KEYSIZE_192) {
10086464859SArd Biesheuvel 			if (i >= 7)
10186464859SArd Biesheuvel 				break;
10286464859SArd Biesheuvel 			rko[4] = rko[3] ^ rki[4];
10386464859SArd Biesheuvel 			rko[5] = rko[4] ^ rki[5];
10486464859SArd Biesheuvel 		} else if (key_len == AES_KEYSIZE_256) {
10586464859SArd Biesheuvel 			if (i >= 6)
10686464859SArd Biesheuvel 				break;
10786464859SArd Biesheuvel 			rko[4] = ce_aes_sub(rko[3]) ^ rki[4];
10886464859SArd Biesheuvel 			rko[5] = rko[4] ^ rki[5];
10986464859SArd Biesheuvel 			rko[6] = rko[5] ^ rki[6];
11086464859SArd Biesheuvel 			rko[7] = rko[6] ^ rki[7];
11186464859SArd Biesheuvel 		}
11286464859SArd Biesheuvel 	}
11386464859SArd Biesheuvel 
11486464859SArd Biesheuvel 	/*
11586464859SArd Biesheuvel 	 * Generate the decryption keys for the Equivalent Inverse Cipher.
11686464859SArd Biesheuvel 	 * This involves reversing the order of the round keys, and applying
11786464859SArd Biesheuvel 	 * the Inverse Mix Columns transformation on all but the first and
11886464859SArd Biesheuvel 	 * the last one.
11986464859SArd Biesheuvel 	 */
12086464859SArd Biesheuvel 	key_enc = (struct aes_block *)ctx->key_enc;
12186464859SArd Biesheuvel 	key_dec = (struct aes_block *)ctx->key_dec;
12286464859SArd Biesheuvel 	j = num_rounds(ctx);
12386464859SArd Biesheuvel 
12486464859SArd Biesheuvel 	key_dec[0] = key_enc[j];
12586464859SArd Biesheuvel 	for (i = 1, j--; j > 0; i++, j--)
12686464859SArd Biesheuvel 		ce_aes_invert(key_dec + i, key_enc + j);
12786464859SArd Biesheuvel 	key_dec[i] = key_enc[0];
12886464859SArd Biesheuvel 
12986464859SArd Biesheuvel 	kernel_neon_end();
13086464859SArd Biesheuvel 	return 0;
13186464859SArd Biesheuvel }
13286464859SArd Biesheuvel 
133da40e7a4SHerbert Xu static int ce_aes_setkey(struct crypto_skcipher *tfm, const u8 *in_key,
13486464859SArd Biesheuvel 			 unsigned int key_len)
13586464859SArd Biesheuvel {
136da40e7a4SHerbert Xu 	struct crypto_aes_ctx *ctx = crypto_skcipher_ctx(tfm);
13786464859SArd Biesheuvel 	int ret;
13886464859SArd Biesheuvel 
13986464859SArd Biesheuvel 	ret = ce_aes_expandkey(ctx, in_key, key_len);
14086464859SArd Biesheuvel 	if (!ret)
14186464859SArd Biesheuvel 		return 0;
14286464859SArd Biesheuvel 
143da40e7a4SHerbert Xu 	crypto_skcipher_set_flags(tfm, CRYPTO_TFM_RES_BAD_KEY_LEN);
14486464859SArd Biesheuvel 	return -EINVAL;
14586464859SArd Biesheuvel }
14686464859SArd Biesheuvel 
14786464859SArd Biesheuvel struct crypto_aes_xts_ctx {
14886464859SArd Biesheuvel 	struct crypto_aes_ctx key1;
14986464859SArd Biesheuvel 	struct crypto_aes_ctx __aligned(8) key2;
15086464859SArd Biesheuvel };
15186464859SArd Biesheuvel 
152da40e7a4SHerbert Xu static int xts_set_key(struct crypto_skcipher *tfm, const u8 *in_key,
15386464859SArd Biesheuvel 		       unsigned int key_len)
15486464859SArd Biesheuvel {
155da40e7a4SHerbert Xu 	struct crypto_aes_xts_ctx *ctx = crypto_skcipher_ctx(tfm);
15686464859SArd Biesheuvel 	int ret;
15786464859SArd Biesheuvel 
158da40e7a4SHerbert Xu 	ret = xts_verify_key(tfm, in_key, key_len);
15928856a9eSStephan Mueller 	if (ret)
16028856a9eSStephan Mueller 		return ret;
16128856a9eSStephan Mueller 
16286464859SArd Biesheuvel 	ret = ce_aes_expandkey(&ctx->key1, in_key, key_len / 2);
16386464859SArd Biesheuvel 	if (!ret)
16486464859SArd Biesheuvel 		ret = ce_aes_expandkey(&ctx->key2, &in_key[key_len / 2],
16586464859SArd Biesheuvel 				       key_len / 2);
16686464859SArd Biesheuvel 	if (!ret)
16786464859SArd Biesheuvel 		return 0;
16886464859SArd Biesheuvel 
169da40e7a4SHerbert Xu 	crypto_skcipher_set_flags(tfm, CRYPTO_TFM_RES_BAD_KEY_LEN);
17086464859SArd Biesheuvel 	return -EINVAL;
17186464859SArd Biesheuvel }
17286464859SArd Biesheuvel 
173da40e7a4SHerbert Xu static int ecb_encrypt(struct skcipher_request *req)
17486464859SArd Biesheuvel {
175da40e7a4SHerbert Xu 	struct crypto_skcipher *tfm = crypto_skcipher_reqtfm(req);
176da40e7a4SHerbert Xu 	struct crypto_aes_ctx *ctx = crypto_skcipher_ctx(tfm);
177da40e7a4SHerbert Xu 	struct skcipher_walk walk;
17886464859SArd Biesheuvel 	unsigned int blocks;
17986464859SArd Biesheuvel 	int err;
18086464859SArd Biesheuvel 
18146a22776SArd Biesheuvel 	err = skcipher_walk_virt(&walk, req, false);
18286464859SArd Biesheuvel 
18386464859SArd Biesheuvel 	while ((blocks = (walk.nbytes / AES_BLOCK_SIZE))) {
18446a22776SArd Biesheuvel 		kernel_neon_begin();
18586464859SArd Biesheuvel 		ce_aes_ecb_encrypt(walk.dst.virt.addr, walk.src.virt.addr,
186fcb0e30dSArd Biesheuvel 				   ctx->key_enc, num_rounds(ctx), blocks);
18746a22776SArd Biesheuvel 		kernel_neon_end();
188da40e7a4SHerbert Xu 		err = skcipher_walk_done(&walk, walk.nbytes % AES_BLOCK_SIZE);
18986464859SArd Biesheuvel 	}
19086464859SArd Biesheuvel 	return err;
19186464859SArd Biesheuvel }
19286464859SArd Biesheuvel 
193da40e7a4SHerbert Xu static int ecb_decrypt(struct skcipher_request *req)
19486464859SArd Biesheuvel {
195da40e7a4SHerbert Xu 	struct crypto_skcipher *tfm = crypto_skcipher_reqtfm(req);
196da40e7a4SHerbert Xu 	struct crypto_aes_ctx *ctx = crypto_skcipher_ctx(tfm);
197da40e7a4SHerbert Xu 	struct skcipher_walk walk;
19886464859SArd Biesheuvel 	unsigned int blocks;
19986464859SArd Biesheuvel 	int err;
20086464859SArd Biesheuvel 
20146a22776SArd Biesheuvel 	err = skcipher_walk_virt(&walk, req, false);
20286464859SArd Biesheuvel 
20386464859SArd Biesheuvel 	while ((blocks = (walk.nbytes / AES_BLOCK_SIZE))) {
20446a22776SArd Biesheuvel 		kernel_neon_begin();
20586464859SArd Biesheuvel 		ce_aes_ecb_decrypt(walk.dst.virt.addr, walk.src.virt.addr,
206fcb0e30dSArd Biesheuvel 				   ctx->key_dec, num_rounds(ctx), blocks);
20746a22776SArd Biesheuvel 		kernel_neon_end();
208da40e7a4SHerbert Xu 		err = skcipher_walk_done(&walk, walk.nbytes % AES_BLOCK_SIZE);
20986464859SArd Biesheuvel 	}
21086464859SArd Biesheuvel 	return err;
21186464859SArd Biesheuvel }
21286464859SArd Biesheuvel 
213da40e7a4SHerbert Xu static int cbc_encrypt(struct skcipher_request *req)
21486464859SArd Biesheuvel {
215da40e7a4SHerbert Xu 	struct crypto_skcipher *tfm = crypto_skcipher_reqtfm(req);
216da40e7a4SHerbert Xu 	struct crypto_aes_ctx *ctx = crypto_skcipher_ctx(tfm);
217da40e7a4SHerbert Xu 	struct skcipher_walk walk;
21886464859SArd Biesheuvel 	unsigned int blocks;
21986464859SArd Biesheuvel 	int err;
22086464859SArd Biesheuvel 
22146a22776SArd Biesheuvel 	err = skcipher_walk_virt(&walk, req, false);
22286464859SArd Biesheuvel 
22386464859SArd Biesheuvel 	while ((blocks = (walk.nbytes / AES_BLOCK_SIZE))) {
22446a22776SArd Biesheuvel 		kernel_neon_begin();
22586464859SArd Biesheuvel 		ce_aes_cbc_encrypt(walk.dst.virt.addr, walk.src.virt.addr,
226fcb0e30dSArd Biesheuvel 				   ctx->key_enc, num_rounds(ctx), blocks,
22786464859SArd Biesheuvel 				   walk.iv);
22846a22776SArd Biesheuvel 		kernel_neon_end();
229da40e7a4SHerbert Xu 		err = skcipher_walk_done(&walk, walk.nbytes % AES_BLOCK_SIZE);
23086464859SArd Biesheuvel 	}
23186464859SArd Biesheuvel 	return err;
23286464859SArd Biesheuvel }
23386464859SArd Biesheuvel 
234da40e7a4SHerbert Xu static int cbc_decrypt(struct skcipher_request *req)
23586464859SArd Biesheuvel {
236da40e7a4SHerbert Xu 	struct crypto_skcipher *tfm = crypto_skcipher_reqtfm(req);
237da40e7a4SHerbert Xu 	struct crypto_aes_ctx *ctx = crypto_skcipher_ctx(tfm);
238da40e7a4SHerbert Xu 	struct skcipher_walk walk;
23986464859SArd Biesheuvel 	unsigned int blocks;
24086464859SArd Biesheuvel 	int err;
24186464859SArd Biesheuvel 
24246a22776SArd Biesheuvel 	err = skcipher_walk_virt(&walk, req, false);
24386464859SArd Biesheuvel 
24486464859SArd Biesheuvel 	while ((blocks = (walk.nbytes / AES_BLOCK_SIZE))) {
24546a22776SArd Biesheuvel 		kernel_neon_begin();
24686464859SArd Biesheuvel 		ce_aes_cbc_decrypt(walk.dst.virt.addr, walk.src.virt.addr,
247fcb0e30dSArd Biesheuvel 				   ctx->key_dec, num_rounds(ctx), blocks,
24886464859SArd Biesheuvel 				   walk.iv);
24946a22776SArd Biesheuvel 		kernel_neon_end();
250da40e7a4SHerbert Xu 		err = skcipher_walk_done(&walk, walk.nbytes % AES_BLOCK_SIZE);
25186464859SArd Biesheuvel 	}
25286464859SArd Biesheuvel 	return err;
25386464859SArd Biesheuvel }
25486464859SArd Biesheuvel 
255da40e7a4SHerbert Xu static int ctr_encrypt(struct skcipher_request *req)
25686464859SArd Biesheuvel {
257da40e7a4SHerbert Xu 	struct crypto_skcipher *tfm = crypto_skcipher_reqtfm(req);
258da40e7a4SHerbert Xu 	struct crypto_aes_ctx *ctx = crypto_skcipher_ctx(tfm);
259da40e7a4SHerbert Xu 	struct skcipher_walk walk;
26086464859SArd Biesheuvel 	int err, blocks;
26186464859SArd Biesheuvel 
26246a22776SArd Biesheuvel 	err = skcipher_walk_virt(&walk, req, false);
26386464859SArd Biesheuvel 
26486464859SArd Biesheuvel 	while ((blocks = (walk.nbytes / AES_BLOCK_SIZE))) {
26546a22776SArd Biesheuvel 		kernel_neon_begin();
26686464859SArd Biesheuvel 		ce_aes_ctr_encrypt(walk.dst.virt.addr, walk.src.virt.addr,
267fcb0e30dSArd Biesheuvel 				   ctx->key_enc, num_rounds(ctx), blocks,
26886464859SArd Biesheuvel 				   walk.iv);
26946a22776SArd Biesheuvel 		kernel_neon_end();
270da40e7a4SHerbert Xu 		err = skcipher_walk_done(&walk, walk.nbytes % AES_BLOCK_SIZE);
27186464859SArd Biesheuvel 	}
272da40e7a4SHerbert Xu 	if (walk.nbytes) {
27386464859SArd Biesheuvel 		u8 __aligned(8) tail[AES_BLOCK_SIZE];
274da40e7a4SHerbert Xu 		unsigned int nbytes = walk.nbytes;
275da40e7a4SHerbert Xu 		u8 *tdst = walk.dst.virt.addr;
276da40e7a4SHerbert Xu 		u8 *tsrc = walk.src.virt.addr;
27786464859SArd Biesheuvel 
27886464859SArd Biesheuvel 		/*
2791465fb13SArd Biesheuvel 		 * Tell aes_ctr_encrypt() to process a tail block.
28086464859SArd Biesheuvel 		 */
2811465fb13SArd Biesheuvel 		blocks = -1;
28286464859SArd Biesheuvel 
28346a22776SArd Biesheuvel 		kernel_neon_begin();
284fcb0e30dSArd Biesheuvel 		ce_aes_ctr_encrypt(tail, NULL, ctx->key_enc, num_rounds(ctx),
285fcb0e30dSArd Biesheuvel 				   blocks, walk.iv);
28646a22776SArd Biesheuvel 		kernel_neon_end();
28745fe93dfSArd Biesheuvel 		crypto_xor_cpy(tdst, tsrc, tail, nbytes);
288da40e7a4SHerbert Xu 		err = skcipher_walk_done(&walk, 0);
28986464859SArd Biesheuvel 	}
29086464859SArd Biesheuvel 	return err;
29186464859SArd Biesheuvel }
29286464859SArd Biesheuvel 
2935eedf315SArd Biesheuvel static void ctr_encrypt_one(struct crypto_skcipher *tfm, const u8 *src, u8 *dst)
2945eedf315SArd Biesheuvel {
2955eedf315SArd Biesheuvel 	struct crypto_aes_ctx *ctx = crypto_skcipher_ctx(tfm);
2965eedf315SArd Biesheuvel 	unsigned long flags;
2975eedf315SArd Biesheuvel 
2985eedf315SArd Biesheuvel 	/*
2995eedf315SArd Biesheuvel 	 * Temporarily disable interrupts to avoid races where
3005eedf315SArd Biesheuvel 	 * cachelines are evicted when the CPU is interrupted
3015eedf315SArd Biesheuvel 	 * to do something else.
3025eedf315SArd Biesheuvel 	 */
3035eedf315SArd Biesheuvel 	local_irq_save(flags);
3045eedf315SArd Biesheuvel 	aes_encrypt(ctx, dst, src);
3055eedf315SArd Biesheuvel 	local_irq_restore(flags);
3065eedf315SArd Biesheuvel }
3075eedf315SArd Biesheuvel 
3085eedf315SArd Biesheuvel static int ctr_encrypt_sync(struct skcipher_request *req)
3095eedf315SArd Biesheuvel {
3105eedf315SArd Biesheuvel 	if (!crypto_simd_usable())
3115eedf315SArd Biesheuvel 		return crypto_ctr_encrypt_walk(req, ctr_encrypt_one);
3125eedf315SArd Biesheuvel 
3135eedf315SArd Biesheuvel 	return ctr_encrypt(req);
3145eedf315SArd Biesheuvel }
3155eedf315SArd Biesheuvel 
316da40e7a4SHerbert Xu static int xts_encrypt(struct skcipher_request *req)
31786464859SArd Biesheuvel {
318da40e7a4SHerbert Xu 	struct crypto_skcipher *tfm = crypto_skcipher_reqtfm(req);
319da40e7a4SHerbert Xu 	struct crypto_aes_xts_ctx *ctx = crypto_skcipher_ctx(tfm);
32086464859SArd Biesheuvel 	int err, first, rounds = num_rounds(&ctx->key1);
321*c61b1607SArd Biesheuvel 	int tail = req->cryptlen % AES_BLOCK_SIZE;
322*c61b1607SArd Biesheuvel 	struct scatterlist sg_src[2], sg_dst[2];
323*c61b1607SArd Biesheuvel 	struct skcipher_request subreq;
324*c61b1607SArd Biesheuvel 	struct scatterlist *src, *dst;
325da40e7a4SHerbert Xu 	struct skcipher_walk walk;
326*c61b1607SArd Biesheuvel 
327*c61b1607SArd Biesheuvel 	if (req->cryptlen < AES_BLOCK_SIZE)
328*c61b1607SArd Biesheuvel 		return -EINVAL;
32986464859SArd Biesheuvel 
33046a22776SArd Biesheuvel 	err = skcipher_walk_virt(&walk, req, false);
33186464859SArd Biesheuvel 
332*c61b1607SArd Biesheuvel 	if (unlikely(tail > 0 && walk.nbytes < walk.total)) {
333*c61b1607SArd Biesheuvel 		int xts_blocks = DIV_ROUND_UP(req->cryptlen,
334*c61b1607SArd Biesheuvel 					      AES_BLOCK_SIZE) - 2;
335*c61b1607SArd Biesheuvel 
336*c61b1607SArd Biesheuvel 		skcipher_walk_abort(&walk);
337*c61b1607SArd Biesheuvel 
338*c61b1607SArd Biesheuvel 		skcipher_request_set_tfm(&subreq, tfm);
339*c61b1607SArd Biesheuvel 		skcipher_request_set_callback(&subreq,
340*c61b1607SArd Biesheuvel 					      skcipher_request_flags(req),
341*c61b1607SArd Biesheuvel 					      NULL, NULL);
342*c61b1607SArd Biesheuvel 		skcipher_request_set_crypt(&subreq, req->src, req->dst,
343*c61b1607SArd Biesheuvel 					   xts_blocks * AES_BLOCK_SIZE,
344*c61b1607SArd Biesheuvel 					   req->iv);
345*c61b1607SArd Biesheuvel 		req = &subreq;
346*c61b1607SArd Biesheuvel 		err = skcipher_walk_virt(&walk, req, false);
347*c61b1607SArd Biesheuvel 	} else {
348*c61b1607SArd Biesheuvel 		tail = 0;
349*c61b1607SArd Biesheuvel 	}
350*c61b1607SArd Biesheuvel 
351*c61b1607SArd Biesheuvel 	for (first = 1; walk.nbytes >= AES_BLOCK_SIZE; first = 0) {
352*c61b1607SArd Biesheuvel 		int nbytes = walk.nbytes;
353*c61b1607SArd Biesheuvel 
354*c61b1607SArd Biesheuvel 		if (walk.nbytes < walk.total)
355*c61b1607SArd Biesheuvel 			nbytes &= ~(AES_BLOCK_SIZE - 1);
356*c61b1607SArd Biesheuvel 
35746a22776SArd Biesheuvel 		kernel_neon_begin();
35886464859SArd Biesheuvel 		ce_aes_xts_encrypt(walk.dst.virt.addr, walk.src.virt.addr,
359*c61b1607SArd Biesheuvel 				   ctx->key1.key_enc, rounds, nbytes, walk.iv,
360fcb0e30dSArd Biesheuvel 				   ctx->key2.key_enc, first);
36146a22776SArd Biesheuvel 		kernel_neon_end();
362*c61b1607SArd Biesheuvel 		err = skcipher_walk_done(&walk, walk.nbytes - nbytes);
36386464859SArd Biesheuvel 	}
364*c61b1607SArd Biesheuvel 
365*c61b1607SArd Biesheuvel 	if (err || likely(!tail))
36686464859SArd Biesheuvel 		return err;
367*c61b1607SArd Biesheuvel 
368*c61b1607SArd Biesheuvel 	dst = src = scatterwalk_ffwd(sg_src, req->src, req->cryptlen);
369*c61b1607SArd Biesheuvel 	if (req->dst != req->src)
370*c61b1607SArd Biesheuvel 		dst = scatterwalk_ffwd(sg_dst, req->dst, req->cryptlen);
371*c61b1607SArd Biesheuvel 
372*c61b1607SArd Biesheuvel 	skcipher_request_set_crypt(req, src, dst, AES_BLOCK_SIZE + tail,
373*c61b1607SArd Biesheuvel 				   req->iv);
374*c61b1607SArd Biesheuvel 
375*c61b1607SArd Biesheuvel 	err = skcipher_walk_virt(&walk, req, false);
376*c61b1607SArd Biesheuvel 	if (err)
377*c61b1607SArd Biesheuvel 		return err;
378*c61b1607SArd Biesheuvel 
379*c61b1607SArd Biesheuvel 	kernel_neon_begin();
380*c61b1607SArd Biesheuvel 	ce_aes_xts_encrypt(walk.dst.virt.addr, walk.src.virt.addr,
381*c61b1607SArd Biesheuvel 			   ctx->key1.key_enc, rounds, walk.nbytes, walk.iv,
382*c61b1607SArd Biesheuvel 			   ctx->key2.key_enc, first);
383*c61b1607SArd Biesheuvel 	kernel_neon_end();
384*c61b1607SArd Biesheuvel 
385*c61b1607SArd Biesheuvel 	return skcipher_walk_done(&walk, 0);
38686464859SArd Biesheuvel }
38786464859SArd Biesheuvel 
388da40e7a4SHerbert Xu static int xts_decrypt(struct skcipher_request *req)
38986464859SArd Biesheuvel {
390da40e7a4SHerbert Xu 	struct crypto_skcipher *tfm = crypto_skcipher_reqtfm(req);
391da40e7a4SHerbert Xu 	struct crypto_aes_xts_ctx *ctx = crypto_skcipher_ctx(tfm);
39286464859SArd Biesheuvel 	int err, first, rounds = num_rounds(&ctx->key1);
393*c61b1607SArd Biesheuvel 	int tail = req->cryptlen % AES_BLOCK_SIZE;
394*c61b1607SArd Biesheuvel 	struct scatterlist sg_src[2], sg_dst[2];
395*c61b1607SArd Biesheuvel 	struct skcipher_request subreq;
396*c61b1607SArd Biesheuvel 	struct scatterlist *src, *dst;
397da40e7a4SHerbert Xu 	struct skcipher_walk walk;
398*c61b1607SArd Biesheuvel 
399*c61b1607SArd Biesheuvel 	if (req->cryptlen < AES_BLOCK_SIZE)
400*c61b1607SArd Biesheuvel 		return -EINVAL;
40186464859SArd Biesheuvel 
40246a22776SArd Biesheuvel 	err = skcipher_walk_virt(&walk, req, false);
40386464859SArd Biesheuvel 
404*c61b1607SArd Biesheuvel 	if (unlikely(tail > 0 && walk.nbytes < walk.total)) {
405*c61b1607SArd Biesheuvel 		int xts_blocks = DIV_ROUND_UP(req->cryptlen,
406*c61b1607SArd Biesheuvel 					      AES_BLOCK_SIZE) - 2;
407*c61b1607SArd Biesheuvel 
408*c61b1607SArd Biesheuvel 		skcipher_walk_abort(&walk);
409*c61b1607SArd Biesheuvel 
410*c61b1607SArd Biesheuvel 		skcipher_request_set_tfm(&subreq, tfm);
411*c61b1607SArd Biesheuvel 		skcipher_request_set_callback(&subreq,
412*c61b1607SArd Biesheuvel 					      skcipher_request_flags(req),
413*c61b1607SArd Biesheuvel 					      NULL, NULL);
414*c61b1607SArd Biesheuvel 		skcipher_request_set_crypt(&subreq, req->src, req->dst,
415*c61b1607SArd Biesheuvel 					   xts_blocks * AES_BLOCK_SIZE,
416*c61b1607SArd Biesheuvel 					   req->iv);
417*c61b1607SArd Biesheuvel 		req = &subreq;
418*c61b1607SArd Biesheuvel 		err = skcipher_walk_virt(&walk, req, false);
419*c61b1607SArd Biesheuvel 	} else {
420*c61b1607SArd Biesheuvel 		tail = 0;
421*c61b1607SArd Biesheuvel 	}
422*c61b1607SArd Biesheuvel 
423*c61b1607SArd Biesheuvel 	for (first = 1; walk.nbytes >= AES_BLOCK_SIZE; first = 0) {
424*c61b1607SArd Biesheuvel 		int nbytes = walk.nbytes;
425*c61b1607SArd Biesheuvel 
426*c61b1607SArd Biesheuvel 		if (walk.nbytes < walk.total)
427*c61b1607SArd Biesheuvel 			nbytes &= ~(AES_BLOCK_SIZE - 1);
428*c61b1607SArd Biesheuvel 
42946a22776SArd Biesheuvel 		kernel_neon_begin();
43086464859SArd Biesheuvel 		ce_aes_xts_decrypt(walk.dst.virt.addr, walk.src.virt.addr,
431*c61b1607SArd Biesheuvel 				   ctx->key1.key_dec, rounds, nbytes, walk.iv,
432fcb0e30dSArd Biesheuvel 				   ctx->key2.key_enc, first);
43346a22776SArd Biesheuvel 		kernel_neon_end();
434*c61b1607SArd Biesheuvel 		err = skcipher_walk_done(&walk, walk.nbytes - nbytes);
43586464859SArd Biesheuvel 	}
436*c61b1607SArd Biesheuvel 
437*c61b1607SArd Biesheuvel 	if (err || likely(!tail))
43886464859SArd Biesheuvel 		return err;
439*c61b1607SArd Biesheuvel 
440*c61b1607SArd Biesheuvel 	dst = src = scatterwalk_ffwd(sg_src, req->src, req->cryptlen);
441*c61b1607SArd Biesheuvel 	if (req->dst != req->src)
442*c61b1607SArd Biesheuvel 		dst = scatterwalk_ffwd(sg_dst, req->dst, req->cryptlen);
443*c61b1607SArd Biesheuvel 
444*c61b1607SArd Biesheuvel 	skcipher_request_set_crypt(req, src, dst, AES_BLOCK_SIZE + tail,
445*c61b1607SArd Biesheuvel 				   req->iv);
446*c61b1607SArd Biesheuvel 
447*c61b1607SArd Biesheuvel 	err = skcipher_walk_virt(&walk, req, false);
448*c61b1607SArd Biesheuvel 	if (err)
449*c61b1607SArd Biesheuvel 		return err;
450*c61b1607SArd Biesheuvel 
451*c61b1607SArd Biesheuvel 	kernel_neon_begin();
452*c61b1607SArd Biesheuvel 	ce_aes_xts_decrypt(walk.dst.virt.addr, walk.src.virt.addr,
453*c61b1607SArd Biesheuvel 			   ctx->key1.key_dec, rounds, walk.nbytes, walk.iv,
454*c61b1607SArd Biesheuvel 			   ctx->key2.key_enc, first);
455*c61b1607SArd Biesheuvel 	kernel_neon_end();
456*c61b1607SArd Biesheuvel 
457*c61b1607SArd Biesheuvel 	return skcipher_walk_done(&walk, 0);
45886464859SArd Biesheuvel }
45986464859SArd Biesheuvel 
460da40e7a4SHerbert Xu static struct skcipher_alg aes_algs[] = { {
46120bb4ef0SArd Biesheuvel 	.base.cra_name		= "__ecb(aes)",
46220bb4ef0SArd Biesheuvel 	.base.cra_driver_name	= "__ecb-aes-ce",
46320bb4ef0SArd Biesheuvel 	.base.cra_priority	= 300,
46420bb4ef0SArd Biesheuvel 	.base.cra_flags		= CRYPTO_ALG_INTERNAL,
46520bb4ef0SArd Biesheuvel 	.base.cra_blocksize	= AES_BLOCK_SIZE,
46620bb4ef0SArd Biesheuvel 	.base.cra_ctxsize	= sizeof(struct crypto_aes_ctx),
46720bb4ef0SArd Biesheuvel 	.base.cra_module	= THIS_MODULE,
46820bb4ef0SArd Biesheuvel 
46986464859SArd Biesheuvel 	.min_keysize		= AES_MIN_KEY_SIZE,
47086464859SArd Biesheuvel 	.max_keysize		= AES_MAX_KEY_SIZE,
47186464859SArd Biesheuvel 	.setkey			= ce_aes_setkey,
47286464859SArd Biesheuvel 	.encrypt		= ecb_encrypt,
47386464859SArd Biesheuvel 	.decrypt		= ecb_decrypt,
47486464859SArd Biesheuvel }, {
47520bb4ef0SArd Biesheuvel 	.base.cra_name		= "__cbc(aes)",
47620bb4ef0SArd Biesheuvel 	.base.cra_driver_name	= "__cbc-aes-ce",
47720bb4ef0SArd Biesheuvel 	.base.cra_priority	= 300,
47820bb4ef0SArd Biesheuvel 	.base.cra_flags		= CRYPTO_ALG_INTERNAL,
47920bb4ef0SArd Biesheuvel 	.base.cra_blocksize	= AES_BLOCK_SIZE,
48020bb4ef0SArd Biesheuvel 	.base.cra_ctxsize	= sizeof(struct crypto_aes_ctx),
48120bb4ef0SArd Biesheuvel 	.base.cra_module	= THIS_MODULE,
48220bb4ef0SArd Biesheuvel 
48386464859SArd Biesheuvel 	.min_keysize		= AES_MIN_KEY_SIZE,
48486464859SArd Biesheuvel 	.max_keysize		= AES_MAX_KEY_SIZE,
48586464859SArd Biesheuvel 	.ivsize			= AES_BLOCK_SIZE,
48686464859SArd Biesheuvel 	.setkey			= ce_aes_setkey,
48786464859SArd Biesheuvel 	.encrypt		= cbc_encrypt,
48886464859SArd Biesheuvel 	.decrypt		= cbc_decrypt,
48986464859SArd Biesheuvel }, {
49020bb4ef0SArd Biesheuvel 	.base.cra_name		= "__ctr(aes)",
49120bb4ef0SArd Biesheuvel 	.base.cra_driver_name	= "__ctr-aes-ce",
49220bb4ef0SArd Biesheuvel 	.base.cra_priority	= 300,
49320bb4ef0SArd Biesheuvel 	.base.cra_flags		= CRYPTO_ALG_INTERNAL,
49420bb4ef0SArd Biesheuvel 	.base.cra_blocksize	= 1,
49520bb4ef0SArd Biesheuvel 	.base.cra_ctxsize	= sizeof(struct crypto_aes_ctx),
49620bb4ef0SArd Biesheuvel 	.base.cra_module	= THIS_MODULE,
49720bb4ef0SArd Biesheuvel 
49886464859SArd Biesheuvel 	.min_keysize		= AES_MIN_KEY_SIZE,
49986464859SArd Biesheuvel 	.max_keysize		= AES_MAX_KEY_SIZE,
50086464859SArd Biesheuvel 	.ivsize			= AES_BLOCK_SIZE,
501da40e7a4SHerbert Xu 	.chunksize		= AES_BLOCK_SIZE,
50286464859SArd Biesheuvel 	.setkey			= ce_aes_setkey,
50386464859SArd Biesheuvel 	.encrypt		= ctr_encrypt,
50486464859SArd Biesheuvel 	.decrypt		= ctr_encrypt,
50586464859SArd Biesheuvel }, {
5065eedf315SArd Biesheuvel 	.base.cra_name		= "ctr(aes)",
5075eedf315SArd Biesheuvel 	.base.cra_driver_name	= "ctr-aes-ce-sync",
5085eedf315SArd Biesheuvel 	.base.cra_priority	= 300 - 1,
5095eedf315SArd Biesheuvel 	.base.cra_blocksize	= 1,
5105eedf315SArd Biesheuvel 	.base.cra_ctxsize	= sizeof(struct crypto_aes_ctx),
5115eedf315SArd Biesheuvel 	.base.cra_module	= THIS_MODULE,
5125eedf315SArd Biesheuvel 
5135eedf315SArd Biesheuvel 	.min_keysize		= AES_MIN_KEY_SIZE,
5145eedf315SArd Biesheuvel 	.max_keysize		= AES_MAX_KEY_SIZE,
5155eedf315SArd Biesheuvel 	.ivsize			= AES_BLOCK_SIZE,
5165eedf315SArd Biesheuvel 	.chunksize		= AES_BLOCK_SIZE,
5175eedf315SArd Biesheuvel 	.setkey			= ce_aes_setkey,
5185eedf315SArd Biesheuvel 	.encrypt		= ctr_encrypt_sync,
5195eedf315SArd Biesheuvel 	.decrypt		= ctr_encrypt_sync,
5205eedf315SArd Biesheuvel }, {
52120bb4ef0SArd Biesheuvel 	.base.cra_name		= "__xts(aes)",
52220bb4ef0SArd Biesheuvel 	.base.cra_driver_name	= "__xts-aes-ce",
52320bb4ef0SArd Biesheuvel 	.base.cra_priority	= 300,
52420bb4ef0SArd Biesheuvel 	.base.cra_flags		= CRYPTO_ALG_INTERNAL,
52520bb4ef0SArd Biesheuvel 	.base.cra_blocksize	= AES_BLOCK_SIZE,
52620bb4ef0SArd Biesheuvel 	.base.cra_ctxsize	= sizeof(struct crypto_aes_xts_ctx),
52720bb4ef0SArd Biesheuvel 	.base.cra_module	= THIS_MODULE,
52820bb4ef0SArd Biesheuvel 
52986464859SArd Biesheuvel 	.min_keysize		= 2 * AES_MIN_KEY_SIZE,
53086464859SArd Biesheuvel 	.max_keysize		= 2 * AES_MAX_KEY_SIZE,
53186464859SArd Biesheuvel 	.ivsize			= AES_BLOCK_SIZE,
532*c61b1607SArd Biesheuvel 	.walksize		= 2 * AES_BLOCK_SIZE,
53386464859SArd Biesheuvel 	.setkey			= xts_set_key,
53486464859SArd Biesheuvel 	.encrypt		= xts_encrypt,
53586464859SArd Biesheuvel 	.decrypt		= xts_decrypt,
53686464859SArd Biesheuvel } };
53786464859SArd Biesheuvel 
538efad2b61SHerbert Xu static struct simd_skcipher_alg *aes_simd_algs[ARRAY_SIZE(aes_algs)];
539da40e7a4SHerbert Xu 
540da40e7a4SHerbert Xu static void aes_exit(void)
541da40e7a4SHerbert Xu {
542da40e7a4SHerbert Xu 	int i;
543da40e7a4SHerbert Xu 
544da40e7a4SHerbert Xu 	for (i = 0; i < ARRAY_SIZE(aes_simd_algs) && aes_simd_algs[i]; i++)
545da40e7a4SHerbert Xu 		simd_skcipher_free(aes_simd_algs[i]);
546da40e7a4SHerbert Xu 
547da40e7a4SHerbert Xu 	crypto_unregister_skciphers(aes_algs, ARRAY_SIZE(aes_algs));
548da40e7a4SHerbert Xu }
549da40e7a4SHerbert Xu 
55086464859SArd Biesheuvel static int __init aes_init(void)
55186464859SArd Biesheuvel {
552da40e7a4SHerbert Xu 	struct simd_skcipher_alg *simd;
553da40e7a4SHerbert Xu 	const char *basename;
554da40e7a4SHerbert Xu 	const char *algname;
555da40e7a4SHerbert Xu 	const char *drvname;
556da40e7a4SHerbert Xu 	int err;
557da40e7a4SHerbert Xu 	int i;
558da40e7a4SHerbert Xu 
559da40e7a4SHerbert Xu 	err = crypto_register_skciphers(aes_algs, ARRAY_SIZE(aes_algs));
560da40e7a4SHerbert Xu 	if (err)
561da40e7a4SHerbert Xu 		return err;
562da40e7a4SHerbert Xu 
563da40e7a4SHerbert Xu 	for (i = 0; i < ARRAY_SIZE(aes_algs); i++) {
5645eedf315SArd Biesheuvel 		if (!(aes_algs[i].base.cra_flags & CRYPTO_ALG_INTERNAL))
5655eedf315SArd Biesheuvel 			continue;
5665eedf315SArd Biesheuvel 
567da40e7a4SHerbert Xu 		algname = aes_algs[i].base.cra_name + 2;
568da40e7a4SHerbert Xu 		drvname = aes_algs[i].base.cra_driver_name + 2;
569da40e7a4SHerbert Xu 		basename = aes_algs[i].base.cra_driver_name;
570da40e7a4SHerbert Xu 		simd = simd_skcipher_create_compat(algname, drvname, basename);
571da40e7a4SHerbert Xu 		err = PTR_ERR(simd);
572da40e7a4SHerbert Xu 		if (IS_ERR(simd))
573da40e7a4SHerbert Xu 			goto unregister_simds;
574da40e7a4SHerbert Xu 
575da40e7a4SHerbert Xu 		aes_simd_algs[i] = simd;
57686464859SArd Biesheuvel 	}
57786464859SArd Biesheuvel 
578da40e7a4SHerbert Xu 	return 0;
579da40e7a4SHerbert Xu 
580da40e7a4SHerbert Xu unregister_simds:
581da40e7a4SHerbert Xu 	aes_exit();
582da40e7a4SHerbert Xu 	return err;
58386464859SArd Biesheuvel }
58486464859SArd Biesheuvel 
/* Init is tied to the AES CPU feature; aes_exit() runs on module unload. */
module_cpu_feature_match(AES, aes_init);
module_exit(aes_exit);
587