1d2912cb1SThomas Gleixner // SPDX-License-Identifier: GPL-2.0-only 286464859SArd Biesheuvel /* 386464859SArd Biesheuvel * aes-ce-glue.c - wrapper code for ARMv8 AES 486464859SArd Biesheuvel * 586464859SArd Biesheuvel * Copyright (C) 2015 Linaro Ltd <ard.biesheuvel@linaro.org> 686464859SArd Biesheuvel */ 786464859SArd Biesheuvel 886464859SArd Biesheuvel #include <asm/hwcap.h> 986464859SArd Biesheuvel #include <asm/neon.h> 105eedf315SArd Biesheuvel #include <asm/simd.h> 11fafb1dcaSArd Biesheuvel #include <asm/unaligned.h> 1286464859SArd Biesheuvel #include <crypto/aes.h> 135eedf315SArd Biesheuvel #include <crypto/ctr.h> 14da40e7a4SHerbert Xu #include <crypto/internal/simd.h> 15da40e7a4SHerbert Xu #include <crypto/internal/skcipher.h> 16*c61b1607SArd Biesheuvel #include <crypto/scatterwalk.h> 174d8061a5SArd Biesheuvel #include <linux/cpufeature.h> 1886464859SArd Biesheuvel #include <linux/module.h> 1949abc0d2SStephan Mueller #include <crypto/xts.h> 2086464859SArd Biesheuvel 2186464859SArd Biesheuvel MODULE_DESCRIPTION("AES-ECB/CBC/CTR/XTS using ARMv8 Crypto Extensions"); 2286464859SArd Biesheuvel MODULE_AUTHOR("Ard Biesheuvel <ard.biesheuvel@linaro.org>"); 2386464859SArd Biesheuvel MODULE_LICENSE("GPL v2"); 2486464859SArd Biesheuvel 2586464859SArd Biesheuvel /* defined in aes-ce-core.S */ 2686464859SArd Biesheuvel asmlinkage u32 ce_aes_sub(u32 input); 2786464859SArd Biesheuvel asmlinkage void ce_aes_invert(void *dst, void *src); 2886464859SArd Biesheuvel 29fcb0e30dSArd Biesheuvel asmlinkage void ce_aes_ecb_encrypt(u8 out[], u8 const in[], u32 const rk[], 3086464859SArd Biesheuvel int rounds, int blocks); 31fcb0e30dSArd Biesheuvel asmlinkage void ce_aes_ecb_decrypt(u8 out[], u8 const in[], u32 const rk[], 3286464859SArd Biesheuvel int rounds, int blocks); 3386464859SArd Biesheuvel 34fcb0e30dSArd Biesheuvel asmlinkage void ce_aes_cbc_encrypt(u8 out[], u8 const in[], u32 const rk[], 3586464859SArd Biesheuvel int rounds, int blocks, u8 iv[]); 36fcb0e30dSArd Biesheuvel asmlinkage void ce_aes_cbc_decrypt(u8 out[], u8 const in[], u32 const rk[], 3786464859SArd Biesheuvel int rounds, int blocks, u8 iv[]); 3886464859SArd Biesheuvel 39fcb0e30dSArd Biesheuvel asmlinkage void ce_aes_ctr_encrypt(u8 out[], u8 const in[], u32 const rk[], 4086464859SArd Biesheuvel int rounds, int blocks, u8 ctr[]); 4186464859SArd Biesheuvel 42fcb0e30dSArd Biesheuvel asmlinkage void ce_aes_xts_encrypt(u8 out[], u8 const in[], u32 const rk1[], 43*c61b1607SArd Biesheuvel int rounds, int bytes, u8 iv[], 44fcb0e30dSArd Biesheuvel u32 const rk2[], int first); 45fcb0e30dSArd Biesheuvel asmlinkage void ce_aes_xts_decrypt(u8 out[], u8 const in[], u32 const rk1[], 46*c61b1607SArd Biesheuvel int rounds, int bytes, u8 iv[], 47fcb0e30dSArd Biesheuvel u32 const rk2[], int first); 4886464859SArd Biesheuvel 4986464859SArd Biesheuvel struct aes_block { 5086464859SArd Biesheuvel u8 b[AES_BLOCK_SIZE]; 5186464859SArd Biesheuvel }; 5286464859SArd Biesheuvel 5386464859SArd Biesheuvel static int num_rounds(struct crypto_aes_ctx *ctx) 5486464859SArd Biesheuvel { 5586464859SArd Biesheuvel /* 5686464859SArd Biesheuvel * # of rounds specified by AES: 5786464859SArd Biesheuvel * 128 bit key 10 rounds 5886464859SArd Biesheuvel * 192 bit key 12 rounds 5986464859SArd Biesheuvel * 256 bit key 14 rounds 6086464859SArd Biesheuvel * => n byte key => 6 + (n/4) rounds 6186464859SArd Biesheuvel */ 6286464859SArd Biesheuvel return 6 + ctx->key_length / 4; 6386464859SArd Biesheuvel } 6486464859SArd Biesheuvel 6586464859SArd Biesheuvel static int ce_aes_expandkey(struct crypto_aes_ctx *ctx, const u8 *in_key, 6686464859SArd Biesheuvel unsigned int key_len) 6786464859SArd Biesheuvel { 6886464859SArd Biesheuvel /* 6986464859SArd Biesheuvel * The AES key schedule round constants 7086464859SArd Biesheuvel */ 7186464859SArd Biesheuvel static u8 const rcon[] = { 7286464859SArd Biesheuvel 0x01, 0x02, 0x04, 0x08, 0x10, 0x20, 0x40, 0x80, 0x1b, 0x36, 7386464859SArd Biesheuvel }; 7486464859SArd Biesheuvel 7586464859SArd Biesheuvel u32 kwords = key_len / sizeof(u32); 7686464859SArd Biesheuvel struct aes_block *key_enc, *key_dec; 7786464859SArd Biesheuvel int i, j; 7886464859SArd Biesheuvel 7986464859SArd Biesheuvel if (key_len != AES_KEYSIZE_128 && 8086464859SArd Biesheuvel key_len != AES_KEYSIZE_192 && 8186464859SArd Biesheuvel key_len != AES_KEYSIZE_256) 8286464859SArd Biesheuvel return -EINVAL; 8386464859SArd Biesheuvel 8486464859SArd Biesheuvel ctx->key_length = key_len; 85fafb1dcaSArd Biesheuvel for (i = 0; i < kwords; i++) 86fafb1dcaSArd Biesheuvel ctx->key_enc[i] = get_unaligned_le32(in_key + i * sizeof(u32)); 8786464859SArd Biesheuvel 8886464859SArd Biesheuvel kernel_neon_begin(); 8986464859SArd Biesheuvel for (i = 0; i < sizeof(rcon); i++) { 9086464859SArd Biesheuvel u32 *rki = ctx->key_enc + (i * kwords); 9186464859SArd Biesheuvel u32 *rko = rki + kwords; 9286464859SArd Biesheuvel 9386464859SArd Biesheuvel rko[0] = ror32(ce_aes_sub(rki[kwords - 1]), 8); 9486464859SArd Biesheuvel rko[0] = rko[0] ^ rki[0] ^ rcon[i]; 9586464859SArd Biesheuvel rko[1] = rko[0] ^ rki[1]; 9686464859SArd Biesheuvel rko[2] = rko[1] ^ rki[2]; 9786464859SArd Biesheuvel rko[3] = rko[2] ^ rki[3]; 9886464859SArd Biesheuvel 9986464859SArd Biesheuvel if (key_len == AES_KEYSIZE_192) { 10086464859SArd Biesheuvel if (i >= 7) 10186464859SArd Biesheuvel break; 10286464859SArd Biesheuvel rko[4] = rko[3] ^ rki[4]; 10386464859SArd Biesheuvel rko[5] = rko[4] ^ rki[5]; 10486464859SArd Biesheuvel } else if (key_len == AES_KEYSIZE_256) { 10586464859SArd Biesheuvel if (i >= 6) 10686464859SArd Biesheuvel break; 10786464859SArd Biesheuvel rko[4] = ce_aes_sub(rko[3]) ^ rki[4]; 10886464859SArd Biesheuvel rko[5] = rko[4] ^ rki[5]; 10986464859SArd Biesheuvel rko[6] = rko[5] ^ rki[6]; 11086464859SArd Biesheuvel rko[7] = rko[6] ^ rki[7]; 11186464859SArd Biesheuvel } 11286464859SArd Biesheuvel } 11386464859SArd Biesheuvel 11486464859SArd Biesheuvel /* 11586464859SArd Biesheuvel * Generate the decryption keys for the Equivalent Inverse Cipher. 11686464859SArd Biesheuvel * This involves reversing the order of the round keys, and applying 11786464859SArd Biesheuvel * the Inverse Mix Columns transformation on all but the first and 11886464859SArd Biesheuvel * the last one. 11986464859SArd Biesheuvel */ 12086464859SArd Biesheuvel key_enc = (struct aes_block *)ctx->key_enc; 12186464859SArd Biesheuvel key_dec = (struct aes_block *)ctx->key_dec; 12286464859SArd Biesheuvel j = num_rounds(ctx); 12386464859SArd Biesheuvel 12486464859SArd Biesheuvel key_dec[0] = key_enc[j]; 12586464859SArd Biesheuvel for (i = 1, j--; j > 0; i++, j--) 12686464859SArd Biesheuvel ce_aes_invert(key_dec + i, key_enc + j); 12786464859SArd Biesheuvel key_dec[i] = key_enc[0]; 12886464859SArd Biesheuvel 12986464859SArd Biesheuvel kernel_neon_end(); 13086464859SArd Biesheuvel return 0; 13186464859SArd Biesheuvel } 13286464859SArd Biesheuvel 133da40e7a4SHerbert Xu static int ce_aes_setkey(struct crypto_skcipher *tfm, const u8 *in_key, 13486464859SArd Biesheuvel unsigned int key_len) 13586464859SArd Biesheuvel { 136da40e7a4SHerbert Xu struct crypto_aes_ctx *ctx = crypto_skcipher_ctx(tfm); 13786464859SArd Biesheuvel int ret; 13886464859SArd Biesheuvel 13986464859SArd Biesheuvel ret = ce_aes_expandkey(ctx, in_key, key_len); 14086464859SArd Biesheuvel if (!ret) 14186464859SArd Biesheuvel return 0; 14286464859SArd Biesheuvel 143da40e7a4SHerbert Xu crypto_skcipher_set_flags(tfm, CRYPTO_TFM_RES_BAD_KEY_LEN); 14486464859SArd Biesheuvel return -EINVAL; 14586464859SArd Biesheuvel } 14686464859SArd Biesheuvel 14786464859SArd Biesheuvel struct crypto_aes_xts_ctx { 14886464859SArd Biesheuvel struct crypto_aes_ctx key1; 14986464859SArd Biesheuvel struct crypto_aes_ctx __aligned(8) key2; 15086464859SArd Biesheuvel }; 15186464859SArd Biesheuvel 152da40e7a4SHerbert Xu static int xts_set_key(struct crypto_skcipher *tfm, const u8 *in_key, 15386464859SArd Biesheuvel unsigned int key_len) 15486464859SArd Biesheuvel { 155da40e7a4SHerbert Xu struct crypto_aes_xts_ctx *ctx = crypto_skcipher_ctx(tfm); 15686464859SArd Biesheuvel int ret; 15786464859SArd Biesheuvel 158da40e7a4SHerbert Xu ret = xts_verify_key(tfm, in_key, key_len); 15928856a9eSStephan Mueller if (ret) 16028856a9eSStephan Mueller return ret; 16128856a9eSStephan Mueller 16286464859SArd Biesheuvel ret = ce_aes_expandkey(&ctx->key1, in_key, key_len / 2); 16386464859SArd Biesheuvel if (!ret) 16486464859SArd Biesheuvel ret = ce_aes_expandkey(&ctx->key2, &in_key[key_len / 2], 16586464859SArd Biesheuvel key_len / 2); 16686464859SArd Biesheuvel if (!ret) 16786464859SArd Biesheuvel return 0; 16886464859SArd Biesheuvel 169da40e7a4SHerbert Xu crypto_skcipher_set_flags(tfm, CRYPTO_TFM_RES_BAD_KEY_LEN); 17086464859SArd Biesheuvel return -EINVAL; 17186464859SArd Biesheuvel } 17286464859SArd Biesheuvel 173da40e7a4SHerbert Xu static int ecb_encrypt(struct skcipher_request *req) 17486464859SArd Biesheuvel { 175da40e7a4SHerbert Xu struct crypto_skcipher *tfm = crypto_skcipher_reqtfm(req); 176da40e7a4SHerbert Xu struct crypto_aes_ctx *ctx = crypto_skcipher_ctx(tfm); 177da40e7a4SHerbert Xu struct skcipher_walk walk; 17886464859SArd Biesheuvel unsigned int blocks; 17986464859SArd Biesheuvel int err; 18086464859SArd Biesheuvel 18146a22776SArd Biesheuvel err = skcipher_walk_virt(&walk, req, false); 18286464859SArd Biesheuvel 18386464859SArd Biesheuvel while ((blocks = (walk.nbytes / AES_BLOCK_SIZE))) { 18446a22776SArd Biesheuvel kernel_neon_begin(); 18586464859SArd Biesheuvel ce_aes_ecb_encrypt(walk.dst.virt.addr, walk.src.virt.addr, 186fcb0e30dSArd Biesheuvel ctx->key_enc, num_rounds(ctx), blocks); 18746a22776SArd Biesheuvel kernel_neon_end(); 188da40e7a4SHerbert Xu err = skcipher_walk_done(&walk, walk.nbytes % AES_BLOCK_SIZE); 18986464859SArd Biesheuvel } 19086464859SArd Biesheuvel return err; 19186464859SArd Biesheuvel } 19286464859SArd Biesheuvel 193da40e7a4SHerbert Xu static int ecb_decrypt(struct skcipher_request *req) 19486464859SArd Biesheuvel { 195da40e7a4SHerbert Xu struct crypto_skcipher *tfm = crypto_skcipher_reqtfm(req); 196da40e7a4SHerbert Xu struct crypto_aes_ctx *ctx = crypto_skcipher_ctx(tfm); 197da40e7a4SHerbert Xu struct skcipher_walk walk; 19886464859SArd Biesheuvel unsigned int blocks; 19986464859SArd Biesheuvel int err; 20086464859SArd Biesheuvel 20146a22776SArd Biesheuvel err = skcipher_walk_virt(&walk, req, false); 20286464859SArd Biesheuvel 20386464859SArd Biesheuvel while ((blocks = (walk.nbytes / AES_BLOCK_SIZE))) { 20446a22776SArd Biesheuvel kernel_neon_begin(); 20586464859SArd Biesheuvel ce_aes_ecb_decrypt(walk.dst.virt.addr, walk.src.virt.addr, 206fcb0e30dSArd Biesheuvel ctx->key_dec, num_rounds(ctx), blocks); 20746a22776SArd Biesheuvel kernel_neon_end(); 208da40e7a4SHerbert Xu err = skcipher_walk_done(&walk, walk.nbytes % AES_BLOCK_SIZE); 20986464859SArd Biesheuvel } 21086464859SArd Biesheuvel return err; 21186464859SArd Biesheuvel } 21286464859SArd Biesheuvel 213da40e7a4SHerbert Xu static int cbc_encrypt(struct skcipher_request *req) 21486464859SArd Biesheuvel { 215da40e7a4SHerbert Xu struct crypto_skcipher *tfm = crypto_skcipher_reqtfm(req); 216da40e7a4SHerbert Xu struct crypto_aes_ctx *ctx = crypto_skcipher_ctx(tfm); 217da40e7a4SHerbert Xu struct skcipher_walk walk; 21886464859SArd Biesheuvel unsigned int blocks; 21986464859SArd Biesheuvel int err; 22086464859SArd Biesheuvel 22146a22776SArd Biesheuvel err = skcipher_walk_virt(&walk, req, false); 22286464859SArd Biesheuvel 22386464859SArd Biesheuvel while ((blocks = (walk.nbytes / AES_BLOCK_SIZE))) { 22446a22776SArd Biesheuvel kernel_neon_begin(); 22586464859SArd Biesheuvel ce_aes_cbc_encrypt(walk.dst.virt.addr, walk.src.virt.addr, 226fcb0e30dSArd Biesheuvel ctx->key_enc, num_rounds(ctx), blocks, 22786464859SArd Biesheuvel walk.iv); 22846a22776SArd Biesheuvel kernel_neon_end(); 229da40e7a4SHerbert Xu err = skcipher_walk_done(&walk, walk.nbytes % AES_BLOCK_SIZE); 23086464859SArd Biesheuvel } 23186464859SArd Biesheuvel return err; 23286464859SArd Biesheuvel } 23386464859SArd Biesheuvel 234da40e7a4SHerbert Xu static int cbc_decrypt(struct skcipher_request *req) 23586464859SArd Biesheuvel { 236da40e7a4SHerbert Xu struct crypto_skcipher *tfm = crypto_skcipher_reqtfm(req); 237da40e7a4SHerbert Xu struct crypto_aes_ctx *ctx = crypto_skcipher_ctx(tfm); 238da40e7a4SHerbert Xu struct skcipher_walk walk; 23986464859SArd Biesheuvel unsigned int blocks; 24086464859SArd Biesheuvel int err; 24186464859SArd Biesheuvel 24246a22776SArd Biesheuvel err = skcipher_walk_virt(&walk, req, false); 24386464859SArd Biesheuvel 24486464859SArd Biesheuvel while ((blocks = (walk.nbytes / AES_BLOCK_SIZE))) { 24546a22776SArd Biesheuvel kernel_neon_begin(); 24686464859SArd Biesheuvel ce_aes_cbc_decrypt(walk.dst.virt.addr, walk.src.virt.addr, 247fcb0e30dSArd Biesheuvel ctx->key_dec, num_rounds(ctx), blocks, 24886464859SArd Biesheuvel walk.iv); 24946a22776SArd Biesheuvel kernel_neon_end(); 250da40e7a4SHerbert Xu err = skcipher_walk_done(&walk, walk.nbytes % AES_BLOCK_SIZE); 25186464859SArd Biesheuvel } 25286464859SArd Biesheuvel return err; 25386464859SArd Biesheuvel } 25486464859SArd Biesheuvel 255da40e7a4SHerbert Xu static int ctr_encrypt(struct skcipher_request *req) 25686464859SArd Biesheuvel { 257da40e7a4SHerbert Xu struct crypto_skcipher *tfm = crypto_skcipher_reqtfm(req); 258da40e7a4SHerbert Xu struct crypto_aes_ctx *ctx = crypto_skcipher_ctx(tfm); 259da40e7a4SHerbert Xu struct skcipher_walk walk; 26086464859SArd Biesheuvel int err, blocks; 26186464859SArd Biesheuvel 26246a22776SArd Biesheuvel err = skcipher_walk_virt(&walk, req, false); 26386464859SArd Biesheuvel 26486464859SArd Biesheuvel while ((blocks = (walk.nbytes / AES_BLOCK_SIZE))) { 26546a22776SArd Biesheuvel kernel_neon_begin(); 26686464859SArd Biesheuvel ce_aes_ctr_encrypt(walk.dst.virt.addr, walk.src.virt.addr, 267fcb0e30dSArd Biesheuvel ctx->key_enc, num_rounds(ctx), blocks, 26886464859SArd Biesheuvel walk.iv); 26946a22776SArd Biesheuvel kernel_neon_end(); 270da40e7a4SHerbert Xu err = skcipher_walk_done(&walk, walk.nbytes % AES_BLOCK_SIZE); 27186464859SArd Biesheuvel } 272da40e7a4SHerbert Xu if (walk.nbytes) { 27386464859SArd Biesheuvel u8 __aligned(8) tail[AES_BLOCK_SIZE]; 274da40e7a4SHerbert Xu unsigned int nbytes = walk.nbytes; 275da40e7a4SHerbert Xu u8 *tdst = walk.dst.virt.addr; 276da40e7a4SHerbert Xu u8 *tsrc = walk.src.virt.addr; 27786464859SArd Biesheuvel 27886464859SArd Biesheuvel /* 2791465fb13SArd Biesheuvel * Tell aes_ctr_encrypt() to process a tail block. 28086464859SArd Biesheuvel */ 2811465fb13SArd Biesheuvel blocks = -1; 28286464859SArd Biesheuvel 28346a22776SArd Biesheuvel kernel_neon_begin(); 284fcb0e30dSArd Biesheuvel ce_aes_ctr_encrypt(tail, NULL, ctx->key_enc, num_rounds(ctx), 285fcb0e30dSArd Biesheuvel blocks, walk.iv); 28646a22776SArd Biesheuvel kernel_neon_end(); 28745fe93dfSArd Biesheuvel crypto_xor_cpy(tdst, tsrc, tail, nbytes); 288da40e7a4SHerbert Xu err = skcipher_walk_done(&walk, 0); 28986464859SArd Biesheuvel } 29086464859SArd Biesheuvel return err; 29186464859SArd Biesheuvel } 29286464859SArd Biesheuvel 2935eedf315SArd Biesheuvel static void ctr_encrypt_one(struct crypto_skcipher *tfm, const u8 *src, u8 *dst) 2945eedf315SArd Biesheuvel { 2955eedf315SArd Biesheuvel struct crypto_aes_ctx *ctx = crypto_skcipher_ctx(tfm); 2965eedf315SArd Biesheuvel unsigned long flags; 2975eedf315SArd Biesheuvel 2985eedf315SArd Biesheuvel /* 2995eedf315SArd Biesheuvel * Temporarily disable interrupts to avoid races where 3005eedf315SArd Biesheuvel * cachelines are evicted when the CPU is interrupted 3015eedf315SArd Biesheuvel * to do something else. 3025eedf315SArd Biesheuvel */ 3035eedf315SArd Biesheuvel local_irq_save(flags); 3045eedf315SArd Biesheuvel aes_encrypt(ctx, dst, src); 3055eedf315SArd Biesheuvel local_irq_restore(flags); 3065eedf315SArd Biesheuvel } 3075eedf315SArd Biesheuvel 3085eedf315SArd Biesheuvel static int ctr_encrypt_sync(struct skcipher_request *req) 3095eedf315SArd Biesheuvel { 3105eedf315SArd Biesheuvel if (!crypto_simd_usable()) 3115eedf315SArd Biesheuvel return crypto_ctr_encrypt_walk(req, ctr_encrypt_one); 3125eedf315SArd Biesheuvel 3135eedf315SArd Biesheuvel return ctr_encrypt(req); 3145eedf315SArd Biesheuvel } 3155eedf315SArd Biesheuvel 316da40e7a4SHerbert Xu static int xts_encrypt(struct skcipher_request *req) 31786464859SArd Biesheuvel { 318da40e7a4SHerbert Xu struct crypto_skcipher *tfm = crypto_skcipher_reqtfm(req); 319da40e7a4SHerbert Xu struct crypto_aes_xts_ctx *ctx = crypto_skcipher_ctx(tfm); 32086464859SArd Biesheuvel int err, first, rounds = num_rounds(&ctx->key1); 321*c61b1607SArd Biesheuvel int tail = req->cryptlen % AES_BLOCK_SIZE; 322*c61b1607SArd Biesheuvel struct scatterlist sg_src[2], sg_dst[2]; 323*c61b1607SArd Biesheuvel struct skcipher_request subreq; 324*c61b1607SArd Biesheuvel struct scatterlist *src, *dst; 325da40e7a4SHerbert Xu struct skcipher_walk walk; 326*c61b1607SArd Biesheuvel 327*c61b1607SArd Biesheuvel if (req->cryptlen < AES_BLOCK_SIZE) 328*c61b1607SArd Biesheuvel return -EINVAL; 32986464859SArd Biesheuvel 33046a22776SArd Biesheuvel err = skcipher_walk_virt(&walk, req, false); 33186464859SArd Biesheuvel 332*c61b1607SArd Biesheuvel if (unlikely(tail > 0 && walk.nbytes < walk.total)) { 333*c61b1607SArd Biesheuvel int xts_blocks = DIV_ROUND_UP(req->cryptlen, 334*c61b1607SArd Biesheuvel AES_BLOCK_SIZE) - 2; 335*c61b1607SArd Biesheuvel 336*c61b1607SArd Biesheuvel skcipher_walk_abort(&walk); 337*c61b1607SArd Biesheuvel 338*c61b1607SArd Biesheuvel skcipher_request_set_tfm(&subreq, tfm); 339*c61b1607SArd Biesheuvel skcipher_request_set_callback(&subreq, 340*c61b1607SArd Biesheuvel skcipher_request_flags(req), 341*c61b1607SArd Biesheuvel NULL, NULL); 342*c61b1607SArd Biesheuvel skcipher_request_set_crypt(&subreq, req->src, req->dst, 343*c61b1607SArd Biesheuvel xts_blocks * AES_BLOCK_SIZE, 344*c61b1607SArd Biesheuvel req->iv); 345*c61b1607SArd Biesheuvel req = &subreq; 346*c61b1607SArd Biesheuvel err = skcipher_walk_virt(&walk, req, false); 347*c61b1607SArd Biesheuvel } else { 348*c61b1607SArd Biesheuvel tail = 0; 349*c61b1607SArd Biesheuvel } 350*c61b1607SArd Biesheuvel 351*c61b1607SArd Biesheuvel for (first = 1; walk.nbytes >= AES_BLOCK_SIZE; first = 0) { 352*c61b1607SArd Biesheuvel int nbytes = walk.nbytes; 353*c61b1607SArd Biesheuvel 354*c61b1607SArd Biesheuvel if (walk.nbytes < walk.total) 355*c61b1607SArd Biesheuvel nbytes &= ~(AES_BLOCK_SIZE - 1); 356*c61b1607SArd Biesheuvel 35746a22776SArd Biesheuvel kernel_neon_begin(); 35886464859SArd Biesheuvel ce_aes_xts_encrypt(walk.dst.virt.addr, walk.src.virt.addr, 359*c61b1607SArd Biesheuvel ctx->key1.key_enc, rounds, nbytes, walk.iv, 360fcb0e30dSArd Biesheuvel ctx->key2.key_enc, first); 36146a22776SArd Biesheuvel kernel_neon_end(); 362*c61b1607SArd Biesheuvel err = skcipher_walk_done(&walk, walk.nbytes - nbytes); 36386464859SArd Biesheuvel } 364*c61b1607SArd Biesheuvel 365*c61b1607SArd Biesheuvel if (err || likely(!tail)) 36686464859SArd Biesheuvel return err; 367*c61b1607SArd Biesheuvel 368*c61b1607SArd Biesheuvel dst = src = scatterwalk_ffwd(sg_src, req->src, req->cryptlen); 369*c61b1607SArd Biesheuvel if (req->dst != req->src) 370*c61b1607SArd Biesheuvel dst = scatterwalk_ffwd(sg_dst, req->dst, req->cryptlen); 371*c61b1607SArd Biesheuvel 372*c61b1607SArd Biesheuvel skcipher_request_set_crypt(req, src, dst, AES_BLOCK_SIZE + tail, 373*c61b1607SArd Biesheuvel req->iv); 374*c61b1607SArd Biesheuvel 375*c61b1607SArd Biesheuvel err = skcipher_walk_virt(&walk, req, false); 376*c61b1607SArd Biesheuvel if (err) 377*c61b1607SArd Biesheuvel return err; 378*c61b1607SArd Biesheuvel 379*c61b1607SArd Biesheuvel kernel_neon_begin(); 380*c61b1607SArd Biesheuvel ce_aes_xts_encrypt(walk.dst.virt.addr, walk.src.virt.addr, 381*c61b1607SArd Biesheuvel ctx->key1.key_enc, rounds, walk.nbytes, walk.iv, 382*c61b1607SArd Biesheuvel ctx->key2.key_enc, first); 383*c61b1607SArd Biesheuvel kernel_neon_end(); 384*c61b1607SArd Biesheuvel 385*c61b1607SArd Biesheuvel return skcipher_walk_done(&walk, 0); 38686464859SArd Biesheuvel } 38786464859SArd Biesheuvel 388da40e7a4SHerbert Xu static int xts_decrypt(struct skcipher_request *req) 38986464859SArd Biesheuvel { 390da40e7a4SHerbert Xu struct crypto_skcipher *tfm = crypto_skcipher_reqtfm(req); 391da40e7a4SHerbert Xu struct crypto_aes_xts_ctx *ctx = crypto_skcipher_ctx(tfm); 39286464859SArd Biesheuvel int err, first, rounds = num_rounds(&ctx->key1); 393*c61b1607SArd Biesheuvel int tail = req->cryptlen % AES_BLOCK_SIZE; 394*c61b1607SArd Biesheuvel struct scatterlist sg_src[2], sg_dst[2]; 395*c61b1607SArd Biesheuvel struct skcipher_request subreq; 396*c61b1607SArd Biesheuvel struct scatterlist *src, *dst; 397da40e7a4SHerbert Xu struct skcipher_walk walk; 398*c61b1607SArd Biesheuvel 399*c61b1607SArd Biesheuvel if (req->cryptlen < AES_BLOCK_SIZE) 400*c61b1607SArd Biesheuvel return -EINVAL; 40186464859SArd Biesheuvel 40246a22776SArd Biesheuvel err = skcipher_walk_virt(&walk, req, false); 40386464859SArd Biesheuvel 404*c61b1607SArd Biesheuvel if (unlikely(tail > 0 && walk.nbytes < walk.total)) { 405*c61b1607SArd Biesheuvel int xts_blocks = DIV_ROUND_UP(req->cryptlen, 406*c61b1607SArd Biesheuvel AES_BLOCK_SIZE) - 2; 407*c61b1607SArd Biesheuvel 408*c61b1607SArd Biesheuvel skcipher_walk_abort(&walk); 409*c61b1607SArd Biesheuvel 410*c61b1607SArd Biesheuvel skcipher_request_set_tfm(&subreq, tfm); 411*c61b1607SArd Biesheuvel skcipher_request_set_callback(&subreq, 412*c61b1607SArd Biesheuvel skcipher_request_flags(req), 413*c61b1607SArd Biesheuvel NULL, NULL); 414*c61b1607SArd Biesheuvel skcipher_request_set_crypt(&subreq, req->src, req->dst, 415*c61b1607SArd Biesheuvel xts_blocks * AES_BLOCK_SIZE, 416*c61b1607SArd Biesheuvel req->iv); 417*c61b1607SArd Biesheuvel req = &subreq; 418*c61b1607SArd Biesheuvel err = skcipher_walk_virt(&walk, req, false); 419*c61b1607SArd Biesheuvel } else { 420*c61b1607SArd Biesheuvel tail = 0; 421*c61b1607SArd Biesheuvel } 422*c61b1607SArd Biesheuvel 423*c61b1607SArd Biesheuvel for (first = 1; walk.nbytes >= AES_BLOCK_SIZE; first = 0) { 424*c61b1607SArd Biesheuvel int nbytes = walk.nbytes; 425*c61b1607SArd Biesheuvel 426*c61b1607SArd Biesheuvel if (walk.nbytes < walk.total) 427*c61b1607SArd Biesheuvel nbytes &= ~(AES_BLOCK_SIZE - 1); 428*c61b1607SArd Biesheuvel 42946a22776SArd Biesheuvel kernel_neon_begin(); 43086464859SArd Biesheuvel ce_aes_xts_decrypt(walk.dst.virt.addr, walk.src.virt.addr, 431*c61b1607SArd Biesheuvel ctx->key1.key_dec, rounds, nbytes, walk.iv, 432fcb0e30dSArd Biesheuvel ctx->key2.key_enc, first); 43346a22776SArd Biesheuvel kernel_neon_end(); 434*c61b1607SArd Biesheuvel err = skcipher_walk_done(&walk, walk.nbytes - nbytes); 43586464859SArd Biesheuvel } 436*c61b1607SArd Biesheuvel 437*c61b1607SArd Biesheuvel if (err || likely(!tail)) 43886464859SArd Biesheuvel return err; 439*c61b1607SArd Biesheuvel 440*c61b1607SArd Biesheuvel dst = src = scatterwalk_ffwd(sg_src, req->src, req->cryptlen); 441*c61b1607SArd Biesheuvel if (req->dst != req->src) 442*c61b1607SArd Biesheuvel dst = scatterwalk_ffwd(sg_dst, req->dst, req->cryptlen); 443*c61b1607SArd Biesheuvel 444*c61b1607SArd Biesheuvel skcipher_request_set_crypt(req, src, dst, AES_BLOCK_SIZE + tail, 445*c61b1607SArd Biesheuvel req->iv); 446*c61b1607SArd Biesheuvel 447*c61b1607SArd Biesheuvel err = skcipher_walk_virt(&walk, req, false); 448*c61b1607SArd Biesheuvel if (err) 449*c61b1607SArd Biesheuvel return err; 450*c61b1607SArd Biesheuvel 451*c61b1607SArd Biesheuvel kernel_neon_begin(); 452*c61b1607SArd Biesheuvel ce_aes_xts_decrypt(walk.dst.virt.addr, walk.src.virt.addr, 453*c61b1607SArd Biesheuvel ctx->key1.key_dec, rounds, walk.nbytes, walk.iv, 454*c61b1607SArd Biesheuvel ctx->key2.key_enc, first); 455*c61b1607SArd Biesheuvel kernel_neon_end(); 456*c61b1607SArd Biesheuvel 457*c61b1607SArd Biesheuvel return skcipher_walk_done(&walk, 0); 45886464859SArd Biesheuvel } 45986464859SArd Biesheuvel 460da40e7a4SHerbert Xu static struct skcipher_alg aes_algs[] = { { 46120bb4ef0SArd Biesheuvel .base.cra_name = "__ecb(aes)", 46220bb4ef0SArd Biesheuvel .base.cra_driver_name = "__ecb-aes-ce", 46320bb4ef0SArd Biesheuvel .base.cra_priority = 300, 46420bb4ef0SArd Biesheuvel .base.cra_flags = CRYPTO_ALG_INTERNAL, 46520bb4ef0SArd Biesheuvel .base.cra_blocksize = AES_BLOCK_SIZE, 46620bb4ef0SArd Biesheuvel .base.cra_ctxsize = sizeof(struct crypto_aes_ctx), 46720bb4ef0SArd Biesheuvel .base.cra_module = THIS_MODULE, 46820bb4ef0SArd Biesheuvel 46986464859SArd Biesheuvel .min_keysize = AES_MIN_KEY_SIZE, 47086464859SArd Biesheuvel .max_keysize = AES_MAX_KEY_SIZE, 47186464859SArd Biesheuvel .setkey = ce_aes_setkey, 47286464859SArd Biesheuvel .encrypt = ecb_encrypt, 47386464859SArd Biesheuvel .decrypt = ecb_decrypt, 47486464859SArd Biesheuvel }, { 47520bb4ef0SArd Biesheuvel .base.cra_name = "__cbc(aes)", 47620bb4ef0SArd Biesheuvel .base.cra_driver_name = "__cbc-aes-ce", 47720bb4ef0SArd Biesheuvel .base.cra_priority = 300, 47820bb4ef0SArd Biesheuvel .base.cra_flags = CRYPTO_ALG_INTERNAL, 47920bb4ef0SArd Biesheuvel .base.cra_blocksize = AES_BLOCK_SIZE, 48020bb4ef0SArd Biesheuvel .base.cra_ctxsize = sizeof(struct crypto_aes_ctx), 48120bb4ef0SArd Biesheuvel .base.cra_module = THIS_MODULE, 48220bb4ef0SArd Biesheuvel 48386464859SArd Biesheuvel .min_keysize = AES_MIN_KEY_SIZE, 48486464859SArd Biesheuvel .max_keysize = AES_MAX_KEY_SIZE, 48586464859SArd Biesheuvel .ivsize = AES_BLOCK_SIZE, 48686464859SArd Biesheuvel .setkey = ce_aes_setkey, 48786464859SArd Biesheuvel .encrypt = cbc_encrypt, 48886464859SArd Biesheuvel .decrypt = cbc_decrypt, 48986464859SArd Biesheuvel }, { 49020bb4ef0SArd Biesheuvel .base.cra_name = "__ctr(aes)", 49120bb4ef0SArd Biesheuvel .base.cra_driver_name = "__ctr-aes-ce", 49220bb4ef0SArd Biesheuvel .base.cra_priority = 300, 49320bb4ef0SArd Biesheuvel .base.cra_flags = CRYPTO_ALG_INTERNAL, 49420bb4ef0SArd Biesheuvel .base.cra_blocksize = 1, 49520bb4ef0SArd Biesheuvel .base.cra_ctxsize = sizeof(struct crypto_aes_ctx), 49620bb4ef0SArd Biesheuvel .base.cra_module = THIS_MODULE, 49720bb4ef0SArd Biesheuvel 49886464859SArd Biesheuvel .min_keysize = AES_MIN_KEY_SIZE, 49986464859SArd Biesheuvel .max_keysize = AES_MAX_KEY_SIZE, 50086464859SArd Biesheuvel .ivsize = AES_BLOCK_SIZE, 501da40e7a4SHerbert Xu .chunksize = AES_BLOCK_SIZE, 50286464859SArd Biesheuvel .setkey = ce_aes_setkey, 50386464859SArd Biesheuvel .encrypt = ctr_encrypt, 50486464859SArd Biesheuvel .decrypt = ctr_encrypt, 50586464859SArd Biesheuvel }, { 5065eedf315SArd Biesheuvel .base.cra_name = "ctr(aes)", 5075eedf315SArd Biesheuvel .base.cra_driver_name = "ctr-aes-ce-sync", 5085eedf315SArd Biesheuvel .base.cra_priority = 300 - 1, 5095eedf315SArd Biesheuvel .base.cra_blocksize = 1, 5105eedf315SArd Biesheuvel .base.cra_ctxsize = sizeof(struct crypto_aes_ctx), 5115eedf315SArd Biesheuvel .base.cra_module = THIS_MODULE, 5125eedf315SArd Biesheuvel 5135eedf315SArd Biesheuvel .min_keysize = AES_MIN_KEY_SIZE, 5145eedf315SArd Biesheuvel .max_keysize = AES_MAX_KEY_SIZE, 5155eedf315SArd Biesheuvel .ivsize = AES_BLOCK_SIZE, 5165eedf315SArd Biesheuvel .chunksize = AES_BLOCK_SIZE, 5175eedf315SArd Biesheuvel .setkey = ce_aes_setkey, 5185eedf315SArd Biesheuvel .encrypt = ctr_encrypt_sync, 5195eedf315SArd Biesheuvel .decrypt = ctr_encrypt_sync, 5205eedf315SArd Biesheuvel }, { 52120bb4ef0SArd Biesheuvel .base.cra_name = "__xts(aes)", 52220bb4ef0SArd Biesheuvel .base.cra_driver_name = "__xts-aes-ce", 52320bb4ef0SArd Biesheuvel .base.cra_priority = 300, 52420bb4ef0SArd Biesheuvel .base.cra_flags = CRYPTO_ALG_INTERNAL, 52520bb4ef0SArd Biesheuvel .base.cra_blocksize = AES_BLOCK_SIZE, 52620bb4ef0SArd Biesheuvel .base.cra_ctxsize = sizeof(struct crypto_aes_xts_ctx), 52720bb4ef0SArd Biesheuvel .base.cra_module = THIS_MODULE, 52820bb4ef0SArd Biesheuvel 52986464859SArd Biesheuvel .min_keysize = 2 * AES_MIN_KEY_SIZE, 53086464859SArd Biesheuvel .max_keysize = 2 * AES_MAX_KEY_SIZE, 53186464859SArd Biesheuvel .ivsize = AES_BLOCK_SIZE, 532*c61b1607SArd Biesheuvel .walksize = 2 * AES_BLOCK_SIZE, 53386464859SArd Biesheuvel .setkey = xts_set_key, 53486464859SArd Biesheuvel .encrypt = xts_encrypt, 53586464859SArd Biesheuvel .decrypt = xts_decrypt, 53686464859SArd Biesheuvel } }; 53786464859SArd Biesheuvel 538efad2b61SHerbert Xu static struct simd_skcipher_alg *aes_simd_algs[ARRAY_SIZE(aes_algs)]; 539da40e7a4SHerbert Xu 540da40e7a4SHerbert Xu static void aes_exit(void) 541da40e7a4SHerbert Xu { 542da40e7a4SHerbert Xu int i; 543da40e7a4SHerbert Xu 544da40e7a4SHerbert Xu for (i = 0; i < ARRAY_SIZE(aes_simd_algs) && aes_simd_algs[i]; i++) 545da40e7a4SHerbert Xu simd_skcipher_free(aes_simd_algs[i]); 546da40e7a4SHerbert Xu 547da40e7a4SHerbert Xu crypto_unregister_skciphers(aes_algs, ARRAY_SIZE(aes_algs)); 548da40e7a4SHerbert Xu } 549da40e7a4SHerbert Xu 55086464859SArd Biesheuvel static int __init aes_init(void) 55186464859SArd Biesheuvel { 552da40e7a4SHerbert Xu struct simd_skcipher_alg *simd; 553da40e7a4SHerbert Xu const char *basename; 554da40e7a4SHerbert Xu const char *algname; 555da40e7a4SHerbert Xu const char *drvname; 556da40e7a4SHerbert Xu int err; 557da40e7a4SHerbert Xu int i; 558da40e7a4SHerbert Xu 559da40e7a4SHerbert Xu err = crypto_register_skciphers(aes_algs, ARRAY_SIZE(aes_algs)); 560da40e7a4SHerbert Xu if (err) 561da40e7a4SHerbert Xu return err; 562da40e7a4SHerbert Xu 563da40e7a4SHerbert Xu for (i = 0; i < ARRAY_SIZE(aes_algs); i++) { 5645eedf315SArd Biesheuvel if (!(aes_algs[i].base.cra_flags & CRYPTO_ALG_INTERNAL)) 5655eedf315SArd Biesheuvel continue; 5665eedf315SArd Biesheuvel 567da40e7a4SHerbert Xu algname = aes_algs[i].base.cra_name + 2; 568da40e7a4SHerbert Xu drvname = aes_algs[i].base.cra_driver_name + 2; 569da40e7a4SHerbert Xu basename = aes_algs[i].base.cra_driver_name; 570da40e7a4SHerbert Xu simd = simd_skcipher_create_compat(algname, drvname, basename); 571da40e7a4SHerbert Xu err = PTR_ERR(simd); 572da40e7a4SHerbert Xu if (IS_ERR(simd)) 573da40e7a4SHerbert Xu goto unregister_simds; 574da40e7a4SHerbert Xu 575da40e7a4SHerbert Xu aes_simd_algs[i] = simd; 57686464859SArd Biesheuvel } 57786464859SArd Biesheuvel 578da40e7a4SHerbert Xu return 0; 579da40e7a4SHerbert Xu 580da40e7a4SHerbert Xu unregister_simds: 581da40e7a4SHerbert Xu aes_exit(); 582da40e7a4SHerbert Xu return err; 58386464859SArd Biesheuvel } 58486464859SArd Biesheuvel 5854d8061a5SArd Biesheuvel module_cpu_feature_match(AES, aes_init); 58686464859SArd Biesheuvel module_exit(aes_exit); 587