// SPDX-License-Identifier: GPL-2.0-only
/*
 * Bit sliced AES using NEON instructions
 *
 * Copyright (C) 2017 Linaro Ltd <ard.biesheuvel@linaro.org>
 */
7cc477bf6SArd Biesheuvel 
8cc477bf6SArd Biesheuvel #include <asm/neon.h>
9e5f05040SArd Biesheuvel #include <asm/simd.h>
10cc477bf6SArd Biesheuvel #include <crypto/aes.h>
11e5f05040SArd Biesheuvel #include <crypto/ctr.h>
120eb76ba2SArd Biesheuvel #include <crypto/internal/cipher.h>
13cc477bf6SArd Biesheuvel #include <crypto/internal/simd.h>
14cc477bf6SArd Biesheuvel #include <crypto/internal/skcipher.h>
152ed8b790SArd Biesheuvel #include <crypto/scatterwalk.h>
16cc477bf6SArd Biesheuvel #include <crypto/xts.h>
17cc477bf6SArd Biesheuvel #include <linux/module.h>
18cc477bf6SArd Biesheuvel 
19cc477bf6SArd Biesheuvel MODULE_AUTHOR("Ard Biesheuvel <ard.biesheuvel@linaro.org>");
20cc477bf6SArd Biesheuvel MODULE_LICENSE("GPL v2");
21cc477bf6SArd Biesheuvel 
22cc477bf6SArd Biesheuvel MODULE_ALIAS_CRYPTO("ecb(aes)");
23a2715fbdSHoria Geantă MODULE_ALIAS_CRYPTO("cbc(aes)-all");
24cc477bf6SArd Biesheuvel MODULE_ALIAS_CRYPTO("ctr(aes)");
25cc477bf6SArd Biesheuvel MODULE_ALIAS_CRYPTO("xts(aes)");
26cc477bf6SArd Biesheuvel 
270eb76ba2SArd Biesheuvel MODULE_IMPORT_NS(CRYPTO_INTERNAL);
280eb76ba2SArd Biesheuvel 
29cc477bf6SArd Biesheuvel asmlinkage void aesbs_convert_key(u8 out[], u32 const rk[], int rounds);
30cc477bf6SArd Biesheuvel 
31cc477bf6SArd Biesheuvel asmlinkage void aesbs_ecb_encrypt(u8 out[], u8 const in[], u8 const rk[],
32cc477bf6SArd Biesheuvel 				  int rounds, int blocks);
33cc477bf6SArd Biesheuvel asmlinkage void aesbs_ecb_decrypt(u8 out[], u8 const in[], u8 const rk[],
34cc477bf6SArd Biesheuvel 				  int rounds, int blocks);
35cc477bf6SArd Biesheuvel 
36cc477bf6SArd Biesheuvel asmlinkage void aesbs_cbc_decrypt(u8 out[], u8 const in[], u8 const rk[],
37cc477bf6SArd Biesheuvel 				  int rounds, int blocks, u8 iv[]);
38cc477bf6SArd Biesheuvel 
39cc477bf6SArd Biesheuvel asmlinkage void aesbs_ctr_encrypt(u8 out[], u8 const in[], u8 const rk[],
40*c8bf850eSArd Biesheuvel 				  int rounds, int blocks, u8 ctr[]);
41cc477bf6SArd Biesheuvel 
42cc477bf6SArd Biesheuvel asmlinkage void aesbs_xts_encrypt(u8 out[], u8 const in[], u8 const rk[],
432ed8b790SArd Biesheuvel 				  int rounds, int blocks, u8 iv[], int);
44cc477bf6SArd Biesheuvel asmlinkage void aesbs_xts_decrypt(u8 out[], u8 const in[], u8 const rk[],
452ed8b790SArd Biesheuvel 				  int rounds, int blocks, u8 iv[], int);
46cc477bf6SArd Biesheuvel 
47cc477bf6SArd Biesheuvel struct aesbs_ctx {
48cc477bf6SArd Biesheuvel 	int	rounds;
49cc477bf6SArd Biesheuvel 	u8	rk[13 * (8 * AES_BLOCK_SIZE) + 32] __aligned(AES_BLOCK_SIZE);
50cc477bf6SArd Biesheuvel };
51cc477bf6SArd Biesheuvel 
52cc477bf6SArd Biesheuvel struct aesbs_cbc_ctx {
53cc477bf6SArd Biesheuvel 	struct aesbs_ctx	key;
5400b99ad2SHerbert Xu 	struct crypto_skcipher	*enc_tfm;
55cc477bf6SArd Biesheuvel };
56cc477bf6SArd Biesheuvel 
57cc477bf6SArd Biesheuvel struct aesbs_xts_ctx {
58cc477bf6SArd Biesheuvel 	struct aesbs_ctx	key;
592ed8b790SArd Biesheuvel 	struct crypto_cipher	*cts_tfm;
60b56f5cbcSArd Biesheuvel 	struct crypto_cipher	*tweak_tfm;
61cc477bf6SArd Biesheuvel };
62cc477bf6SArd Biesheuvel 
63e5f05040SArd Biesheuvel struct aesbs_ctr_ctx {
64e5f05040SArd Biesheuvel 	struct aesbs_ctx	key;		/* must be first member */
65e5f05040SArd Biesheuvel 	struct crypto_aes_ctx	fallback;
66e5f05040SArd Biesheuvel };
67e5f05040SArd Biesheuvel 
aesbs_setkey(struct crypto_skcipher * tfm,const u8 * in_key,unsigned int key_len)68cc477bf6SArd Biesheuvel static int aesbs_setkey(struct crypto_skcipher *tfm, const u8 *in_key,
69cc477bf6SArd Biesheuvel 			unsigned int key_len)
70cc477bf6SArd Biesheuvel {
71cc477bf6SArd Biesheuvel 	struct aesbs_ctx *ctx = crypto_skcipher_ctx(tfm);
72cc477bf6SArd Biesheuvel 	struct crypto_aes_ctx rk;
73cc477bf6SArd Biesheuvel 	int err;
74cc477bf6SArd Biesheuvel 
75aa6e2d2bSArd Biesheuvel 	err = aes_expandkey(&rk, in_key, key_len);
76cc477bf6SArd Biesheuvel 	if (err)
77cc477bf6SArd Biesheuvel 		return err;
78cc477bf6SArd Biesheuvel 
79cc477bf6SArd Biesheuvel 	ctx->rounds = 6 + key_len / 4;
80cc477bf6SArd Biesheuvel 
81cc477bf6SArd Biesheuvel 	kernel_neon_begin();
82cc477bf6SArd Biesheuvel 	aesbs_convert_key(ctx->rk, rk.key_enc, ctx->rounds);
83cc477bf6SArd Biesheuvel 	kernel_neon_end();
84cc477bf6SArd Biesheuvel 
85cc477bf6SArd Biesheuvel 	return 0;
86cc477bf6SArd Biesheuvel }
87cc477bf6SArd Biesheuvel 
/*
 * Common ECB walker: feed the request through @fn in runs of whole blocks.
 *
 * @req: skcipher request to process
 * @fn:  bit-sliced ECB routine (encrypt or decrypt)
 *
 * Returns the status of the last skcipher walk call.
 */
static int __ecb_crypt(struct skcipher_request *req,
		       void (*fn)(u8 out[], u8 const in[], u8 const rk[],
				  int rounds, int blocks))
{
	struct crypto_skcipher *tfm = crypto_skcipher_reqtfm(req);
	struct aesbs_ctx *ctx = crypto_skcipher_ctx(tfm);
	struct skcipher_walk walk;
	int ret;

	ret = skcipher_walk_virt(&walk, req, false);

	while (walk.nbytes >= AES_BLOCK_SIZE) {
		unsigned int nblocks = walk.nbytes / AES_BLOCK_SIZE;
		unsigned int leftover;

		/* Only the final chunk may be a partial stride. */
		if (walk.nbytes < walk.total)
			nblocks = round_down(nblocks,
					     walk.stride / AES_BLOCK_SIZE);

		kernel_neon_begin();
		fn(walk.dst.virt.addr, walk.src.virt.addr, ctx->rk,
		   ctx->rounds, nblocks);
		kernel_neon_end();

		leftover = walk.nbytes - nblocks * AES_BLOCK_SIZE;
		ret = skcipher_walk_done(&walk, leftover);
	}

	return ret;
}
116cc477bf6SArd Biesheuvel 
ecb_encrypt(struct skcipher_request * req)117cc477bf6SArd Biesheuvel static int ecb_encrypt(struct skcipher_request *req)
118cc477bf6SArd Biesheuvel {
119cc477bf6SArd Biesheuvel 	return __ecb_crypt(req, aesbs_ecb_encrypt);
120cc477bf6SArd Biesheuvel }
121cc477bf6SArd Biesheuvel 
ecb_decrypt(struct skcipher_request * req)122cc477bf6SArd Biesheuvel static int ecb_decrypt(struct skcipher_request *req)
123cc477bf6SArd Biesheuvel {
124cc477bf6SArd Biesheuvel 	return __ecb_crypt(req, aesbs_ecb_decrypt);
125cc477bf6SArd Biesheuvel }
126cc477bf6SArd Biesheuvel 
aesbs_cbc_setkey(struct crypto_skcipher * tfm,const u8 * in_key,unsigned int key_len)127cc477bf6SArd Biesheuvel static int aesbs_cbc_setkey(struct crypto_skcipher *tfm, const u8 *in_key,
128cc477bf6SArd Biesheuvel 			    unsigned int key_len)
129cc477bf6SArd Biesheuvel {
130cc477bf6SArd Biesheuvel 	struct aesbs_cbc_ctx *ctx = crypto_skcipher_ctx(tfm);
131cc477bf6SArd Biesheuvel 	struct crypto_aes_ctx rk;
132cc477bf6SArd Biesheuvel 	int err;
133cc477bf6SArd Biesheuvel 
134aa6e2d2bSArd Biesheuvel 	err = aes_expandkey(&rk, in_key, key_len);
135cc477bf6SArd Biesheuvel 	if (err)
136cc477bf6SArd Biesheuvel 		return err;
137cc477bf6SArd Biesheuvel 
138cc477bf6SArd Biesheuvel 	ctx->key.rounds = 6 + key_len / 4;
139cc477bf6SArd Biesheuvel 
140cc477bf6SArd Biesheuvel 	kernel_neon_begin();
141cc477bf6SArd Biesheuvel 	aesbs_convert_key(ctx->key.rk, rk.key_enc, ctx->key.rounds);
142cc477bf6SArd Biesheuvel 	kernel_neon_end();
14382ff493eSTorsten Duwe 	memzero_explicit(&rk, sizeof(rk));
144cc477bf6SArd Biesheuvel 
14500b99ad2SHerbert Xu 	return crypto_skcipher_setkey(ctx->enc_tfm, in_key, key_len);
146cc477bf6SArd Biesheuvel }
147cc477bf6SArd Biesheuvel 
cbc_encrypt(struct skcipher_request * req)148cc477bf6SArd Biesheuvel static int cbc_encrypt(struct skcipher_request *req)
149cc477bf6SArd Biesheuvel {
15000b99ad2SHerbert Xu 	struct skcipher_request *subreq = skcipher_request_ctx(req);
15100b99ad2SHerbert Xu 	struct crypto_skcipher *tfm = crypto_skcipher_reqtfm(req);
15200b99ad2SHerbert Xu 	struct aesbs_cbc_ctx *ctx = crypto_skcipher_ctx(tfm);
15300b99ad2SHerbert Xu 
15400b99ad2SHerbert Xu 	skcipher_request_set_tfm(subreq, ctx->enc_tfm);
15500b99ad2SHerbert Xu 	skcipher_request_set_callback(subreq,
15600b99ad2SHerbert Xu 				      skcipher_request_flags(req),
15700b99ad2SHerbert Xu 				      NULL, NULL);
15800b99ad2SHerbert Xu 	skcipher_request_set_crypt(subreq, req->src, req->dst,
15900b99ad2SHerbert Xu 				   req->cryptlen, req->iv);
16000b99ad2SHerbert Xu 
16100b99ad2SHerbert Xu 	return crypto_skcipher_encrypt(subreq);
162cc477bf6SArd Biesheuvel }
163cc477bf6SArd Biesheuvel 
cbc_decrypt(struct skcipher_request * req)164cc477bf6SArd Biesheuvel static int cbc_decrypt(struct skcipher_request *req)
165cc477bf6SArd Biesheuvel {
166cc477bf6SArd Biesheuvel 	struct crypto_skcipher *tfm = crypto_skcipher_reqtfm(req);
167cc477bf6SArd Biesheuvel 	struct aesbs_cbc_ctx *ctx = crypto_skcipher_ctx(tfm);
168cc477bf6SArd Biesheuvel 	struct skcipher_walk walk;
169cc477bf6SArd Biesheuvel 	int err;
170cc477bf6SArd Biesheuvel 
17146a22776SArd Biesheuvel 	err = skcipher_walk_virt(&walk, req, false);
172cc477bf6SArd Biesheuvel 
173cc477bf6SArd Biesheuvel 	while (walk.nbytes >= AES_BLOCK_SIZE) {
174cc477bf6SArd Biesheuvel 		unsigned int blocks = walk.nbytes / AES_BLOCK_SIZE;
175cc477bf6SArd Biesheuvel 
176cc477bf6SArd Biesheuvel 		if (walk.nbytes < walk.total)
177cc477bf6SArd Biesheuvel 			blocks = round_down(blocks,
178cc477bf6SArd Biesheuvel 					    walk.stride / AES_BLOCK_SIZE);
179cc477bf6SArd Biesheuvel 
18046a22776SArd Biesheuvel 		kernel_neon_begin();
181cc477bf6SArd Biesheuvel 		aesbs_cbc_decrypt(walk.dst.virt.addr, walk.src.virt.addr,
182cc477bf6SArd Biesheuvel 				  ctx->key.rk, ctx->key.rounds, blocks,
183cc477bf6SArd Biesheuvel 				  walk.iv);
18446a22776SArd Biesheuvel 		kernel_neon_end();
185cc477bf6SArd Biesheuvel 		err = skcipher_walk_done(&walk,
186cc477bf6SArd Biesheuvel 					 walk.nbytes - blocks * AES_BLOCK_SIZE);
187cc477bf6SArd Biesheuvel 	}
188cc477bf6SArd Biesheuvel 
189cc477bf6SArd Biesheuvel 	return err;
190cc477bf6SArd Biesheuvel }
191cc477bf6SArd Biesheuvel 
cbc_init(struct crypto_skcipher * tfm)19200b99ad2SHerbert Xu static int cbc_init(struct crypto_skcipher *tfm)
193b56f5cbcSArd Biesheuvel {
19400b99ad2SHerbert Xu 	struct aesbs_cbc_ctx *ctx = crypto_skcipher_ctx(tfm);
19500b99ad2SHerbert Xu 	unsigned int reqsize;
196b56f5cbcSArd Biesheuvel 
197a2715fbdSHoria Geantă 	ctx->enc_tfm = crypto_alloc_skcipher("cbc(aes)", 0, CRYPTO_ALG_ASYNC |
198a2715fbdSHoria Geantă 					     CRYPTO_ALG_NEED_FALLBACK);
19900b99ad2SHerbert Xu 	if (IS_ERR(ctx->enc_tfm))
20000b99ad2SHerbert Xu 		return PTR_ERR(ctx->enc_tfm);
20126d85e5fSGomonovych, Vasyl 
20200b99ad2SHerbert Xu 	reqsize = sizeof(struct skcipher_request);
20300b99ad2SHerbert Xu 	reqsize += crypto_skcipher_reqsize(ctx->enc_tfm);
20400b99ad2SHerbert Xu 	crypto_skcipher_set_reqsize(tfm, reqsize);
20500b99ad2SHerbert Xu 
20600b99ad2SHerbert Xu 	return 0;
207b56f5cbcSArd Biesheuvel }
208b56f5cbcSArd Biesheuvel 
cbc_exit(struct crypto_skcipher * tfm)20900b99ad2SHerbert Xu static void cbc_exit(struct crypto_skcipher *tfm)
210b56f5cbcSArd Biesheuvel {
21100b99ad2SHerbert Xu 	struct aesbs_cbc_ctx *ctx = crypto_skcipher_ctx(tfm);
212b56f5cbcSArd Biesheuvel 
21300b99ad2SHerbert Xu 	crypto_free_skcipher(ctx->enc_tfm);
214b56f5cbcSArd Biesheuvel }
215b56f5cbcSArd Biesheuvel 
aesbs_ctr_setkey_sync(struct crypto_skcipher * tfm,const u8 * in_key,unsigned int key_len)216e5f05040SArd Biesheuvel static int aesbs_ctr_setkey_sync(struct crypto_skcipher *tfm, const u8 *in_key,
217e5f05040SArd Biesheuvel 				 unsigned int key_len)
218e5f05040SArd Biesheuvel {
219e5f05040SArd Biesheuvel 	struct aesbs_ctr_ctx *ctx = crypto_skcipher_ctx(tfm);
220e5f05040SArd Biesheuvel 	int err;
221e5f05040SArd Biesheuvel 
222e5f05040SArd Biesheuvel 	err = aes_expandkey(&ctx->fallback, in_key, key_len);
223e5f05040SArd Biesheuvel 	if (err)
224e5f05040SArd Biesheuvel 		return err;
225e5f05040SArd Biesheuvel 
226e5f05040SArd Biesheuvel 	ctx->key.rounds = 6 + key_len / 4;
227e5f05040SArd Biesheuvel 
228e5f05040SArd Biesheuvel 	kernel_neon_begin();
229e5f05040SArd Biesheuvel 	aesbs_convert_key(ctx->key.rk, ctx->fallback.key_enc, ctx->key.rounds);
230e5f05040SArd Biesheuvel 	kernel_neon_end();
231e5f05040SArd Biesheuvel 
232e5f05040SArd Biesheuvel 	return 0;
233e5f05040SArd Biesheuvel }
234e5f05040SArd Biesheuvel 
ctr_encrypt(struct skcipher_request * req)235cc477bf6SArd Biesheuvel static int ctr_encrypt(struct skcipher_request *req)
236cc477bf6SArd Biesheuvel {
237cc477bf6SArd Biesheuvel 	struct crypto_skcipher *tfm = crypto_skcipher_reqtfm(req);
238cc477bf6SArd Biesheuvel 	struct aesbs_ctx *ctx = crypto_skcipher_ctx(tfm);
239cc477bf6SArd Biesheuvel 	struct skcipher_walk walk;
2401a20b966SArd Biesheuvel 	u8 buf[AES_BLOCK_SIZE];
241cc477bf6SArd Biesheuvel 	int err;
242cc477bf6SArd Biesheuvel 
24346a22776SArd Biesheuvel 	err = skcipher_walk_virt(&walk, req, false);
244cc477bf6SArd Biesheuvel 
245cc477bf6SArd Biesheuvel 	while (walk.nbytes > 0) {
246*c8bf850eSArd Biesheuvel 		const u8 *src = walk.src.virt.addr;
247*c8bf850eSArd Biesheuvel 		u8 *dst = walk.dst.virt.addr;
248*c8bf850eSArd Biesheuvel 		int bytes = walk.nbytes;
249cc477bf6SArd Biesheuvel 
250*c8bf850eSArd Biesheuvel 		if (unlikely(bytes < AES_BLOCK_SIZE))
251*c8bf850eSArd Biesheuvel 			src = dst = memcpy(buf + sizeof(buf) - bytes,
252*c8bf850eSArd Biesheuvel 					   src, bytes);
253*c8bf850eSArd Biesheuvel 		else if (walk.nbytes < walk.total)
254*c8bf850eSArd Biesheuvel 			bytes &= ~(8 * AES_BLOCK_SIZE - 1);
255cc477bf6SArd Biesheuvel 
25646a22776SArd Biesheuvel 		kernel_neon_begin();
257*c8bf850eSArd Biesheuvel 		aesbs_ctr_encrypt(dst, src, ctx->rk, ctx->rounds, bytes, walk.iv);
25846a22776SArd Biesheuvel 		kernel_neon_end();
259cc477bf6SArd Biesheuvel 
260*c8bf850eSArd Biesheuvel 		if (unlikely(bytes < AES_BLOCK_SIZE))
261*c8bf850eSArd Biesheuvel 			memcpy(walk.dst.virt.addr,
262*c8bf850eSArd Biesheuvel 			       buf + sizeof(buf) - bytes, bytes);
263cc477bf6SArd Biesheuvel 
264*c8bf850eSArd Biesheuvel 		err = skcipher_walk_done(&walk, walk.nbytes - bytes);
265cc477bf6SArd Biesheuvel 	}
266cc477bf6SArd Biesheuvel 
267cc477bf6SArd Biesheuvel 	return err;
268cc477bf6SArd Biesheuvel }
269cc477bf6SArd Biesheuvel 
/*
 * Encrypt a single block with the generic AES library using the fallback
 * key; passed as the per-block callback to crypto_ctr_encrypt_walk().
 */
static void ctr_encrypt_one(struct crypto_skcipher *tfm, const u8 *src, u8 *dst)
{
	struct aesbs_ctr_ctx *ctr = crypto_skcipher_ctx(tfm);
	unsigned long irqflags;

	/*
	 * Interrupts are kept off for the duration of the block operation so
	 * that an interrupt cannot evict cachelines while it is in progress.
	 */
	local_irq_save(irqflags);
	aes_encrypt(&ctr->fallback, dst, src);
	local_irq_restore(irqflags);
}
284e5f05040SArd Biesheuvel 
ctr_encrypt_sync(struct skcipher_request * req)285e5f05040SArd Biesheuvel static int ctr_encrypt_sync(struct skcipher_request *req)
286e5f05040SArd Biesheuvel {
287e5f05040SArd Biesheuvel 	if (!crypto_simd_usable())
288e5f05040SArd Biesheuvel 		return crypto_ctr_encrypt_walk(req, ctr_encrypt_one);
289e5f05040SArd Biesheuvel 
290e5f05040SArd Biesheuvel 	return ctr_encrypt(req);
291e5f05040SArd Biesheuvel }
292e5f05040SArd Biesheuvel 
aesbs_xts_setkey(struct crypto_skcipher * tfm,const u8 * in_key,unsigned int key_len)293cc477bf6SArd Biesheuvel static int aesbs_xts_setkey(struct crypto_skcipher *tfm, const u8 *in_key,
294cc477bf6SArd Biesheuvel 			    unsigned int key_len)
295cc477bf6SArd Biesheuvel {
296cc477bf6SArd Biesheuvel 	struct aesbs_xts_ctx *ctx = crypto_skcipher_ctx(tfm);
297cc477bf6SArd Biesheuvel 	int err;
298cc477bf6SArd Biesheuvel 
299cc477bf6SArd Biesheuvel 	err = xts_verify_key(tfm, in_key, key_len);
300cc477bf6SArd Biesheuvel 	if (err)
301cc477bf6SArd Biesheuvel 		return err;
302cc477bf6SArd Biesheuvel 
303cc477bf6SArd Biesheuvel 	key_len /= 2;
3042ed8b790SArd Biesheuvel 	err = crypto_cipher_setkey(ctx->cts_tfm, in_key, key_len);
3052ed8b790SArd Biesheuvel 	if (err)
3062ed8b790SArd Biesheuvel 		return err;
307b56f5cbcSArd Biesheuvel 	err = crypto_cipher_setkey(ctx->tweak_tfm, in_key + key_len, key_len);
308cc477bf6SArd Biesheuvel 	if (err)
309cc477bf6SArd Biesheuvel 		return err;
310cc477bf6SArd Biesheuvel 
311cc477bf6SArd Biesheuvel 	return aesbs_setkey(tfm, in_key, key_len);
312cc477bf6SArd Biesheuvel }
313cc477bf6SArd Biesheuvel 
xts_init(struct crypto_skcipher * tfm)3143ebbc035SArd Biesheuvel static int xts_init(struct crypto_skcipher *tfm)
315b56f5cbcSArd Biesheuvel {
3163ebbc035SArd Biesheuvel 	struct aesbs_xts_ctx *ctx = crypto_skcipher_ctx(tfm);
317b56f5cbcSArd Biesheuvel 
3182ed8b790SArd Biesheuvel 	ctx->cts_tfm = crypto_alloc_cipher("aes", 0, 0);
3192ed8b790SArd Biesheuvel 	if (IS_ERR(ctx->cts_tfm))
3202ed8b790SArd Biesheuvel 		return PTR_ERR(ctx->cts_tfm);
3212ed8b790SArd Biesheuvel 
322b56f5cbcSArd Biesheuvel 	ctx->tweak_tfm = crypto_alloc_cipher("aes", 0, 0);
3232ed8b790SArd Biesheuvel 	if (IS_ERR(ctx->tweak_tfm))
3242ed8b790SArd Biesheuvel 		crypto_free_cipher(ctx->cts_tfm);
32526d85e5fSGomonovych, Vasyl 
32626d85e5fSGomonovych, Vasyl 	return PTR_ERR_OR_ZERO(ctx->tweak_tfm);
327b56f5cbcSArd Biesheuvel }
328b56f5cbcSArd Biesheuvel 
xts_exit(struct crypto_skcipher * tfm)3293ebbc035SArd Biesheuvel static void xts_exit(struct crypto_skcipher *tfm)
330b56f5cbcSArd Biesheuvel {
3313ebbc035SArd Biesheuvel 	struct aesbs_xts_ctx *ctx = crypto_skcipher_ctx(tfm);
332b56f5cbcSArd Biesheuvel 
333b56f5cbcSArd Biesheuvel 	crypto_free_cipher(ctx->tweak_tfm);
3342ed8b790SArd Biesheuvel 	crypto_free_cipher(ctx->cts_tfm);
335b56f5cbcSArd Biesheuvel }
336b56f5cbcSArd Biesheuvel 
/*
 * Common XTS implementation.
 *
 * @req:     skcipher request; must cover at least one AES block
 * @encrypt: true for encryption, false for decryption
 * @fn:      bit-sliced XTS routine matching @encrypt
 *
 * Whole blocks are handled by @fn. If the length is not a multiple of the
 * block size, the bulk pass runs on a shortened sub-request and the final
 * full block plus the trailing bytes are handled by ciphertext stealing
 * with ctx->cts_tfm.
 *
 * Returns 0 on success, -EINVAL for requests shorter than one block, or an
 * error from the skcipher walk.
 */
static int __xts_crypt(struct skcipher_request *req, bool encrypt,
		       void (*fn)(u8 out[], u8 const in[], u8 const rk[],
				  int rounds, int blocks, u8 iv[], int))
{
	struct crypto_skcipher *tfm = crypto_skcipher_reqtfm(req);
	struct aesbs_xts_ctx *ctx = crypto_skcipher_ctx(tfm);
	const int tail = req->cryptlen % AES_BLOCK_SIZE;
	struct skcipher_request subreq;
	u8 buf[2 * AES_BLOCK_SIZE];
	struct skcipher_walk walk;
	unsigned int last_off;
	int err;

	if (req->cryptlen < AES_BLOCK_SIZE)
		return -EINVAL;

	if (unlikely(tail)) {
		/* Bulk pass covers only the block-aligned prefix. */
		skcipher_request_set_tfm(&subreq, tfm);
		skcipher_request_set_callback(&subreq,
					      skcipher_request_flags(req),
					      NULL, NULL);
		skcipher_request_set_crypt(&subreq, req->src, req->dst,
					   req->cryptlen - tail, req->iv);
		req = &subreq;
	}

	err = skcipher_walk_virt(&walk, req, true);
	if (err)
		return err;

	/* Turn the IV into the initial tweak. */
	crypto_cipher_encrypt_one(ctx->tweak_tfm, walk.iv, walk.iv);

	while (walk.nbytes >= AES_BLOCK_SIZE) {
		unsigned int nblocks = walk.nbytes / AES_BLOCK_SIZE;
		int reorder_last_tweak = 0;

		if (walk.nbytes < walk.total)
			nblocks = round_down(nblocks,
					     walk.stride / AES_BLOCK_SIZE);
		else
			/* Final chunk of a decryption that steals ciphertext. */
			reorder_last_tweak = !encrypt && tail > 0;

		kernel_neon_begin();
		fn(walk.dst.virt.addr, walk.src.virt.addr, ctx->key.rk,
		   ctx->key.rounds, nblocks, walk.iv, reorder_last_tweak);
		kernel_neon_end();

		err = skcipher_walk_done(&walk,
					 walk.nbytes - nblocks * AES_BLOCK_SIZE);
	}

	if (err)
		return err;
	if (likely(!tail))
		return 0;

	/*
	 * Ciphertext stealing. From here on req is the shortened sub-request,
	 * so req->cryptlen is the block-aligned length.
	 */
	last_off = req->cryptlen - AES_BLOCK_SIZE;

	/* Fetch the last full output block and keep its head as the new tail. */
	scatterwalk_map_and_copy(buf, req->dst, last_off, AES_BLOCK_SIZE, 0);
	memcpy(buf + AES_BLOCK_SIZE, buf, tail);
	/* Overlay the trailing input bytes onto the start of that block. */
	scatterwalk_map_and_copy(buf, req->src, req->cryptlen, tail, 0);

	crypto_xor(buf, req->iv, AES_BLOCK_SIZE);

	if (encrypt)
		crypto_cipher_encrypt_one(ctx->cts_tfm, buf, buf);
	else
		crypto_cipher_decrypt_one(ctx->cts_tfm, buf, buf);

	crypto_xor(buf, req->iv, AES_BLOCK_SIZE);

	/* Write back the final block followed by the stolen tail. */
	scatterwalk_map_and_copy(buf, req->dst, last_off,
				 AES_BLOCK_SIZE + tail, 1);
	return 0;
}
408cc477bf6SArd Biesheuvel 
xts_encrypt(struct skcipher_request * req)409cc477bf6SArd Biesheuvel static int xts_encrypt(struct skcipher_request *req)
410cc477bf6SArd Biesheuvel {
4112ed8b790SArd Biesheuvel 	return __xts_crypt(req, true, aesbs_xts_encrypt);
412cc477bf6SArd Biesheuvel }
413cc477bf6SArd Biesheuvel 
xts_decrypt(struct skcipher_request * req)414cc477bf6SArd Biesheuvel static int xts_decrypt(struct skcipher_request *req)
415cc477bf6SArd Biesheuvel {
4162ed8b790SArd Biesheuvel 	return __xts_crypt(req, false, aesbs_xts_decrypt);
417cc477bf6SArd Biesheuvel }
418cc477bf6SArd Biesheuvel 
419cc477bf6SArd Biesheuvel static struct skcipher_alg aes_algs[] = { {
420cc477bf6SArd Biesheuvel 	.base.cra_name		= "__ecb(aes)",
421cc477bf6SArd Biesheuvel 	.base.cra_driver_name	= "__ecb-aes-neonbs",
422cc477bf6SArd Biesheuvel 	.base.cra_priority	= 250,
423cc477bf6SArd Biesheuvel 	.base.cra_blocksize	= AES_BLOCK_SIZE,
424cc477bf6SArd Biesheuvel 	.base.cra_ctxsize	= sizeof(struct aesbs_ctx),
425cc477bf6SArd Biesheuvel 	.base.cra_module	= THIS_MODULE,
426cc477bf6SArd Biesheuvel 	.base.cra_flags		= CRYPTO_ALG_INTERNAL,
427cc477bf6SArd Biesheuvel 
428cc477bf6SArd Biesheuvel 	.min_keysize		= AES_MIN_KEY_SIZE,
429cc477bf6SArd Biesheuvel 	.max_keysize		= AES_MAX_KEY_SIZE,
430cc477bf6SArd Biesheuvel 	.walksize		= 8 * AES_BLOCK_SIZE,
431cc477bf6SArd Biesheuvel 	.setkey			= aesbs_setkey,
432cc477bf6SArd Biesheuvel 	.encrypt		= ecb_encrypt,
433cc477bf6SArd Biesheuvel 	.decrypt		= ecb_decrypt,
434cc477bf6SArd Biesheuvel }, {
435cc477bf6SArd Biesheuvel 	.base.cra_name		= "__cbc(aes)",
436cc477bf6SArd Biesheuvel 	.base.cra_driver_name	= "__cbc-aes-neonbs",
437cc477bf6SArd Biesheuvel 	.base.cra_priority	= 250,
438cc477bf6SArd Biesheuvel 	.base.cra_blocksize	= AES_BLOCK_SIZE,
439cc477bf6SArd Biesheuvel 	.base.cra_ctxsize	= sizeof(struct aesbs_cbc_ctx),
440cc477bf6SArd Biesheuvel 	.base.cra_module	= THIS_MODULE,
441a2715fbdSHoria Geantă 	.base.cra_flags		= CRYPTO_ALG_INTERNAL |
442a2715fbdSHoria Geantă 				  CRYPTO_ALG_NEED_FALLBACK,
443cc477bf6SArd Biesheuvel 
444cc477bf6SArd Biesheuvel 	.min_keysize		= AES_MIN_KEY_SIZE,
445cc477bf6SArd Biesheuvel 	.max_keysize		= AES_MAX_KEY_SIZE,
446cc477bf6SArd Biesheuvel 	.walksize		= 8 * AES_BLOCK_SIZE,
447cc477bf6SArd Biesheuvel 	.ivsize			= AES_BLOCK_SIZE,
448cc477bf6SArd Biesheuvel 	.setkey			= aesbs_cbc_setkey,
449cc477bf6SArd Biesheuvel 	.encrypt		= cbc_encrypt,
450cc477bf6SArd Biesheuvel 	.decrypt		= cbc_decrypt,
45100b99ad2SHerbert Xu 	.init			= cbc_init,
45200b99ad2SHerbert Xu 	.exit			= cbc_exit,
453cc477bf6SArd Biesheuvel }, {
454cc477bf6SArd Biesheuvel 	.base.cra_name		= "__ctr(aes)",
455cc477bf6SArd Biesheuvel 	.base.cra_driver_name	= "__ctr-aes-neonbs",
456cc477bf6SArd Biesheuvel 	.base.cra_priority	= 250,
457cc477bf6SArd Biesheuvel 	.base.cra_blocksize	= 1,
458cc477bf6SArd Biesheuvel 	.base.cra_ctxsize	= sizeof(struct aesbs_ctx),
459cc477bf6SArd Biesheuvel 	.base.cra_module	= THIS_MODULE,
460cc477bf6SArd Biesheuvel 	.base.cra_flags		= CRYPTO_ALG_INTERNAL,
461cc477bf6SArd Biesheuvel 
462cc477bf6SArd Biesheuvel 	.min_keysize		= AES_MIN_KEY_SIZE,
463cc477bf6SArd Biesheuvel 	.max_keysize		= AES_MAX_KEY_SIZE,
464cc477bf6SArd Biesheuvel 	.chunksize		= AES_BLOCK_SIZE,
465cc477bf6SArd Biesheuvel 	.walksize		= 8 * AES_BLOCK_SIZE,
466cc477bf6SArd Biesheuvel 	.ivsize			= AES_BLOCK_SIZE,
467cc477bf6SArd Biesheuvel 	.setkey			= aesbs_setkey,
468cc477bf6SArd Biesheuvel 	.encrypt		= ctr_encrypt,
469cc477bf6SArd Biesheuvel 	.decrypt		= ctr_encrypt,
470cc477bf6SArd Biesheuvel }, {
471e5f05040SArd Biesheuvel 	.base.cra_name		= "ctr(aes)",
472e5f05040SArd Biesheuvel 	.base.cra_driver_name	= "ctr-aes-neonbs-sync",
473e5f05040SArd Biesheuvel 	.base.cra_priority	= 250 - 1,
474e5f05040SArd Biesheuvel 	.base.cra_blocksize	= 1,
475e5f05040SArd Biesheuvel 	.base.cra_ctxsize	= sizeof(struct aesbs_ctr_ctx),
476e5f05040SArd Biesheuvel 	.base.cra_module	= THIS_MODULE,
477e5f05040SArd Biesheuvel 
478e5f05040SArd Biesheuvel 	.min_keysize		= AES_MIN_KEY_SIZE,
479e5f05040SArd Biesheuvel 	.max_keysize		= AES_MAX_KEY_SIZE,
480e5f05040SArd Biesheuvel 	.chunksize		= AES_BLOCK_SIZE,
481e5f05040SArd Biesheuvel 	.walksize		= 8 * AES_BLOCK_SIZE,
482e5f05040SArd Biesheuvel 	.ivsize			= AES_BLOCK_SIZE,
483e5f05040SArd Biesheuvel 	.setkey			= aesbs_ctr_setkey_sync,
484e5f05040SArd Biesheuvel 	.encrypt		= ctr_encrypt_sync,
485e5f05040SArd Biesheuvel 	.decrypt		= ctr_encrypt_sync,
486e5f05040SArd Biesheuvel }, {
487cc477bf6SArd Biesheuvel 	.base.cra_name		= "__xts(aes)",
488cc477bf6SArd Biesheuvel 	.base.cra_driver_name	= "__xts-aes-neonbs",
489cc477bf6SArd Biesheuvel 	.base.cra_priority	= 250,
490cc477bf6SArd Biesheuvel 	.base.cra_blocksize	= AES_BLOCK_SIZE,
491cc477bf6SArd Biesheuvel 	.base.cra_ctxsize	= sizeof(struct aesbs_xts_ctx),
492cc477bf6SArd Biesheuvel 	.base.cra_module	= THIS_MODULE,
493cc477bf6SArd Biesheuvel 	.base.cra_flags		= CRYPTO_ALG_INTERNAL,
494cc477bf6SArd Biesheuvel 
495cc477bf6SArd Biesheuvel 	.min_keysize		= 2 * AES_MIN_KEY_SIZE,
496cc477bf6SArd Biesheuvel 	.max_keysize		= 2 * AES_MAX_KEY_SIZE,
497cc477bf6SArd Biesheuvel 	.walksize		= 8 * AES_BLOCK_SIZE,
498cc477bf6SArd Biesheuvel 	.ivsize			= AES_BLOCK_SIZE,
499cc477bf6SArd Biesheuvel 	.setkey			= aesbs_xts_setkey,
500cc477bf6SArd Biesheuvel 	.encrypt		= xts_encrypt,
501cc477bf6SArd Biesheuvel 	.decrypt		= xts_decrypt,
5023ebbc035SArd Biesheuvel 	.init			= xts_init,
5033ebbc035SArd Biesheuvel 	.exit			= xts_exit,
504cc477bf6SArd Biesheuvel } };
505cc477bf6SArd Biesheuvel 
506cc477bf6SArd Biesheuvel static struct simd_skcipher_alg *aes_simd_algs[ARRAY_SIZE(aes_algs)];
507cc477bf6SArd Biesheuvel 
aes_exit(void)508cc477bf6SArd Biesheuvel static void aes_exit(void)
509cc477bf6SArd Biesheuvel {
510cc477bf6SArd Biesheuvel 	int i;
511cc477bf6SArd Biesheuvel 
512cc477bf6SArd Biesheuvel 	for (i = 0; i < ARRAY_SIZE(aes_simd_algs); i++)
513cc477bf6SArd Biesheuvel 		if (aes_simd_algs[i])
514cc477bf6SArd Biesheuvel 			simd_skcipher_free(aes_simd_algs[i]);
515cc477bf6SArd Biesheuvel 
516cc477bf6SArd Biesheuvel 	crypto_unregister_skciphers(aes_algs, ARRAY_SIZE(aes_algs));
517cc477bf6SArd Biesheuvel }
518cc477bf6SArd Biesheuvel 
aes_init(void)519cc477bf6SArd Biesheuvel static int __init aes_init(void)
520cc477bf6SArd Biesheuvel {
521cc477bf6SArd Biesheuvel 	struct simd_skcipher_alg *simd;
522cc477bf6SArd Biesheuvel 	const char *basename;
523cc477bf6SArd Biesheuvel 	const char *algname;
524cc477bf6SArd Biesheuvel 	const char *drvname;
525cc477bf6SArd Biesheuvel 	int err;
526cc477bf6SArd Biesheuvel 	int i;
527cc477bf6SArd Biesheuvel 
528cc477bf6SArd Biesheuvel 	if (!(elf_hwcap & HWCAP_NEON))
529cc477bf6SArd Biesheuvel 		return -ENODEV;
530cc477bf6SArd Biesheuvel 
531cc477bf6SArd Biesheuvel 	err = crypto_register_skciphers(aes_algs, ARRAY_SIZE(aes_algs));
532cc477bf6SArd Biesheuvel 	if (err)
533cc477bf6SArd Biesheuvel 		return err;
534cc477bf6SArd Biesheuvel 
535cc477bf6SArd Biesheuvel 	for (i = 0; i < ARRAY_SIZE(aes_algs); i++) {
536cc477bf6SArd Biesheuvel 		if (!(aes_algs[i].base.cra_flags & CRYPTO_ALG_INTERNAL))
537cc477bf6SArd Biesheuvel 			continue;
538cc477bf6SArd Biesheuvel 
539cc477bf6SArd Biesheuvel 		algname = aes_algs[i].base.cra_name + 2;
540cc477bf6SArd Biesheuvel 		drvname = aes_algs[i].base.cra_driver_name + 2;
541cc477bf6SArd Biesheuvel 		basename = aes_algs[i].base.cra_driver_name;
542cc477bf6SArd Biesheuvel 		simd = simd_skcipher_create_compat(algname, drvname, basename);
543cc477bf6SArd Biesheuvel 		err = PTR_ERR(simd);
544cc477bf6SArd Biesheuvel 		if (IS_ERR(simd))
545cc477bf6SArd Biesheuvel 			goto unregister_simds;
546cc477bf6SArd Biesheuvel 
547cc477bf6SArd Biesheuvel 		aes_simd_algs[i] = simd;
548cc477bf6SArd Biesheuvel 	}
549cc477bf6SArd Biesheuvel 	return 0;
550cc477bf6SArd Biesheuvel 
551cc477bf6SArd Biesheuvel unregister_simds:
552cc477bf6SArd Biesheuvel 	aes_exit();
553cc477bf6SArd Biesheuvel 	return err;
554cc477bf6SArd Biesheuvel }
555cc477bf6SArd Biesheuvel 
556b56f5cbcSArd Biesheuvel late_initcall(aes_init);
557cc477bf6SArd Biesheuvel module_exit(aes_exit);
558