/* SPDX-License-Identifier: GPL-2.0-or-later */
/*
 * SM4-CCM AEAD Algorithm using ARMv8 Crypto Extensions
 * as specified in RFC 8998
 * https://datatracker.ietf.org/doc/html/rfc8998
 *
 * Copyright (C) 2022 Tianjia Zhang <tianjia.zhang@linux.alibaba.com>
 */
967fa3a7fSTianjia Zhang
1067fa3a7fSTianjia Zhang #include <linux/module.h>
1167fa3a7fSTianjia Zhang #include <linux/crypto.h>
1267fa3a7fSTianjia Zhang #include <linux/kernel.h>
1367fa3a7fSTianjia Zhang #include <linux/cpufeature.h>
1467fa3a7fSTianjia Zhang #include <asm/neon.h>
1567fa3a7fSTianjia Zhang #include <crypto/scatterwalk.h>
1667fa3a7fSTianjia Zhang #include <crypto/internal/aead.h>
1767fa3a7fSTianjia Zhang #include <crypto/internal/skcipher.h>
1867fa3a7fSTianjia Zhang #include <crypto/sm4.h>
1967fa3a7fSTianjia Zhang #include "sm4-ce.h"
2067fa3a7fSTianjia Zhang
2167fa3a7fSTianjia Zhang asmlinkage void sm4_ce_cbcmac_update(const u32 *rkey_enc, u8 *mac,
2267fa3a7fSTianjia Zhang const u8 *src, unsigned int nblocks);
2367fa3a7fSTianjia Zhang asmlinkage void sm4_ce_ccm_enc(const u32 *rkey_enc, u8 *dst, const u8 *src,
2467fa3a7fSTianjia Zhang u8 *iv, unsigned int nbytes, u8 *mac);
2567fa3a7fSTianjia Zhang asmlinkage void sm4_ce_ccm_dec(const u32 *rkey_enc, u8 *dst, const u8 *src,
2667fa3a7fSTianjia Zhang u8 *iv, unsigned int nbytes, u8 *mac);
2767fa3a7fSTianjia Zhang asmlinkage void sm4_ce_ccm_final(const u32 *rkey_enc, u8 *iv, u8 *mac);
2867fa3a7fSTianjia Zhang
2967fa3a7fSTianjia Zhang
ccm_setkey(struct crypto_aead * tfm,const u8 * key,unsigned int key_len)3067fa3a7fSTianjia Zhang static int ccm_setkey(struct crypto_aead *tfm, const u8 *key,
3167fa3a7fSTianjia Zhang unsigned int key_len)
3267fa3a7fSTianjia Zhang {
3367fa3a7fSTianjia Zhang struct sm4_ctx *ctx = crypto_aead_ctx(tfm);
3467fa3a7fSTianjia Zhang
3567fa3a7fSTianjia Zhang if (key_len != SM4_KEY_SIZE)
3667fa3a7fSTianjia Zhang return -EINVAL;
3767fa3a7fSTianjia Zhang
3867fa3a7fSTianjia Zhang kernel_neon_begin();
3967fa3a7fSTianjia Zhang sm4_ce_expand_key(key, ctx->rkey_enc, ctx->rkey_dec,
4067fa3a7fSTianjia Zhang crypto_sm4_fk, crypto_sm4_ck);
4167fa3a7fSTianjia Zhang kernel_neon_end();
4267fa3a7fSTianjia Zhang
4367fa3a7fSTianjia Zhang return 0;
4467fa3a7fSTianjia Zhang }
4567fa3a7fSTianjia Zhang
/*
 * ccm_setauthsize - validate a requested authentication tag length.
 * @tfm:      AEAD transform (not consulted by this check)
 * @authsize: requested tag length in bytes
 *
 * Accepts only even tag lengths of at least 4 bytes. No upper bound is
 * checked here.
 *
 * Return: 0 if @authsize is acceptable, -EINVAL otherwise.
 */
static int ccm_setauthsize(struct crypto_aead *tfm, unsigned int authsize)
{
	if ((authsize & 1) || authsize < 4)
		return -EINVAL;
	return 0;
}
5267fa3a7fSTianjia Zhang
ccm_format_input(u8 info[],struct aead_request * req,unsigned int msglen)5367fa3a7fSTianjia Zhang static int ccm_format_input(u8 info[], struct aead_request *req,
5467fa3a7fSTianjia Zhang unsigned int msglen)
5567fa3a7fSTianjia Zhang {
5667fa3a7fSTianjia Zhang struct crypto_aead *aead = crypto_aead_reqtfm(req);
5767fa3a7fSTianjia Zhang unsigned int l = req->iv[0] + 1;
5867fa3a7fSTianjia Zhang unsigned int m;
5967fa3a7fSTianjia Zhang __be32 len;
6067fa3a7fSTianjia Zhang
6167fa3a7fSTianjia Zhang /* verify that CCM dimension 'L': 2 <= L <= 8 */
6267fa3a7fSTianjia Zhang if (l < 2 || l > 8)
6367fa3a7fSTianjia Zhang return -EINVAL;
6467fa3a7fSTianjia Zhang if (l < 4 && msglen >> (8 * l))
6567fa3a7fSTianjia Zhang return -EOVERFLOW;
6667fa3a7fSTianjia Zhang
6767fa3a7fSTianjia Zhang memset(&req->iv[SM4_BLOCK_SIZE - l], 0, l);
6867fa3a7fSTianjia Zhang
6967fa3a7fSTianjia Zhang memcpy(info, req->iv, SM4_BLOCK_SIZE);
7067fa3a7fSTianjia Zhang
7167fa3a7fSTianjia Zhang m = crypto_aead_authsize(aead);
7267fa3a7fSTianjia Zhang
7367fa3a7fSTianjia Zhang /* format flags field per RFC 3610/NIST 800-38C */
7467fa3a7fSTianjia Zhang *info |= ((m - 2) / 2) << 3;
7567fa3a7fSTianjia Zhang if (req->assoclen)
7667fa3a7fSTianjia Zhang *info |= (1 << 6);
7767fa3a7fSTianjia Zhang
7867fa3a7fSTianjia Zhang /*
7967fa3a7fSTianjia Zhang * format message length field,
8067fa3a7fSTianjia Zhang * Linux uses a u32 type to represent msglen
8167fa3a7fSTianjia Zhang */
8267fa3a7fSTianjia Zhang if (l >= 4)
8367fa3a7fSTianjia Zhang l = 4;
8467fa3a7fSTianjia Zhang
8567fa3a7fSTianjia Zhang len = cpu_to_be32(msglen);
8667fa3a7fSTianjia Zhang memcpy(&info[SM4_BLOCK_SIZE - l], (u8 *)&len + 4 - l, l);
8767fa3a7fSTianjia Zhang
8867fa3a7fSTianjia Zhang return 0;
8967fa3a7fSTianjia Zhang }
9067fa3a7fSTianjia Zhang
/*
 * ccm_calculate_auth_mac - fold the associated data into the CBC-MAC.
 * @req: AEAD request; the associated data is the first req->assoclen bytes
 *       of req->src
 * @mac: running MAC block, updated in place
 *
 * The MAC block is first encrypted, then the encoded associated-data length
 * (2 bytes when assoclen < 0xff00, otherwise the 0xfffe marker followed by a
 * 32-bit big-endian length) is XORed in, followed by the associated data
 * itself, gathered from the source scatterlist.
 *
 * On return the most recently XORed data has not been run through the cipher
 * yet. NOTE(review): presumably the next sm4_ce_ccm_*() call performs that
 * encryption -- confirm against the assembly.
 *
 * The only caller in this file invokes this between kernel_neon_begin() and
 * kernel_neon_end().
 */
static void ccm_calculate_auth_mac(struct aead_request *req, u8 mac[])
{
	struct crypto_aead *aead = crypto_aead_reqtfm(req);
	struct sm4_ctx *ctx = crypto_aead_ctx(aead);
	struct __packed { __be16 l; __be32 h; } aadlen;
	u32 assoclen = req->assoclen;
	struct scatter_walk walk;
	unsigned int len;	/* bytes already XORed into the current block */

	if (assoclen < 0xff00) {
		aadlen.l = cpu_to_be16(assoclen);
		len = 2;
	} else {
		aadlen.l = cpu_to_be16(0xfffe);
		put_unaligned_be32(assoclen, &aadlen.h);
		len = 6;
	}

	sm4_ce_crypt_block(ctx->rkey_enc, mac, mac);
	crypto_xor(mac, (const u8 *)&aadlen, len);

	scatterwalk_start(&walk, req->src);

	do {
		u32 n = scatterwalk_clamp(&walk, assoclen);
		u8 *p, *ptr;

		/* current scatterlist entry exhausted: move on to the next */
		if (!n) {
			scatterwalk_start(&walk, sg_next(walk.sg));
			n = scatterwalk_clamp(&walk, assoclen);
		}

		/* keep 'p' for the unmap below; 'ptr' is the read cursor */
		p = ptr = scatterwalk_map(&walk);
		assoclen -= n;
		scatterwalk_advance(&walk, n);

		while (n > 0) {
			unsigned int l, nblocks;

			if (len == SM4_BLOCK_SIZE) {
				if (n < SM4_BLOCK_SIZE) {
					/*
					 * Pending block is full but less than
					 * a block of input is mapped: encrypt
					 * it and start a fresh block.
					 */
					sm4_ce_crypt_block(ctx->rkey_enc,
							   mac, mac);

					len = 0;
				} else {
					/*
					 * Hand all whole blocks to the bulk
					 * helper; 'len' stays at a full block.
					 */
					nblocks = n / SM4_BLOCK_SIZE;
					sm4_ce_cbcmac_update(ctx->rkey_enc,
							     mac, ptr, nblocks);

					ptr += nblocks * SM4_BLOCK_SIZE;
					n %= SM4_BLOCK_SIZE;

					continue;
				}
			}

			/* top up the current block with what is available */
			l = min(n, SM4_BLOCK_SIZE - len);
			if (l) {
				crypto_xor(mac + len, ptr, l);
				len += l;
				ptr += l;
				n -= l;
			}
		}

		scatterwalk_unmap(p);
		scatterwalk_done(&walk, 0, assoclen);
	} while (assoclen);
}
16167fa3a7fSTianjia Zhang
/*
 * ccm_crypt - common encrypt/decrypt body for SM4-CCM.
 * @req:              AEAD request being processed
 * @walk:             skcipher walk already started by the caller
 * @rkey_enc:         expanded encryption round keys
 * @mac:              MAC block prepared by the caller; holds the computed
 *                    tag when the function returns
 * @sm4_ce_ccm_crypt: direction-specific bulk routine (encrypt or decrypt)
 *
 * The initial counter block is saved for the final tag computation and the
 * walk IV is incremented once before any payload is processed. Every walk
 * step except the last passes only whole blocks to the bulk routine and
 * returns the remainder to the walker; the last step is processed in full.
 *
 * Return: 0 if there was no payload, otherwise the result of the last
 * skcipher_walk_done() call.
 */
static int ccm_crypt(struct aead_request *req, struct skcipher_walk *walk,
		     u32 *rkey_enc, u8 mac[],
		     void (*sm4_ce_ccm_crypt)(const u32 *rkey_enc, u8 *dst,
					      const u8 *src, u8 *iv,
					      unsigned int nbytes, u8 *mac))
{
	u8 __aligned(8) ctr0[SM4_BLOCK_SIZE];
	int err = 0;

	/* preserve the initial ctr0 for the TAG */
	memcpy(ctr0, walk->iv, SM4_BLOCK_SIZE);
	crypto_inc(walk->iv, SM4_BLOCK_SIZE);

	kernel_neon_begin();

	if (req->assoclen)
		ccm_calculate_auth_mac(req, mac);

	/* all steps but the final one: whole blocks only */
	while (walk->nbytes && walk->nbytes != walk->total) {
		unsigned int tail = walk->nbytes % SM4_BLOCK_SIZE;

		sm4_ce_ccm_crypt(rkey_enc, walk->dst.virt.addr,
				 walk->src.virt.addr, walk->iv,
				 walk->nbytes - tail, mac);

		/*
		 * The NEON section is closed around skcipher_walk_done().
		 * NOTE(review): presumably because the walker must not be
		 * called from inside it -- confirm.
		 */
		kernel_neon_end();

		err = skcipher_walk_done(walk, tail);

		kernel_neon_begin();
	}

	if (walk->nbytes) {
		/* final step: process everything, including a partial block */
		sm4_ce_ccm_crypt(rkey_enc, walk->dst.virt.addr,
				 walk->src.virt.addr, walk->iv,
				 walk->nbytes, mac);

		sm4_ce_ccm_final(rkey_enc, ctr0, mac);

		kernel_neon_end();

		err = skcipher_walk_done(walk, 0);
	} else {
		/* no payload left (or the walk stopped): still finish the tag */
		sm4_ce_ccm_final(rkey_enc, ctr0, mac);

		kernel_neon_end();
	}

	return err;
}
21267fa3a7fSTianjia Zhang
ccm_encrypt(struct aead_request * req)21367fa3a7fSTianjia Zhang static int ccm_encrypt(struct aead_request *req)
21467fa3a7fSTianjia Zhang {
21567fa3a7fSTianjia Zhang struct crypto_aead *aead = crypto_aead_reqtfm(req);
21667fa3a7fSTianjia Zhang struct sm4_ctx *ctx = crypto_aead_ctx(aead);
21767fa3a7fSTianjia Zhang u8 __aligned(8) mac[SM4_BLOCK_SIZE];
21867fa3a7fSTianjia Zhang struct skcipher_walk walk;
21967fa3a7fSTianjia Zhang int err;
22067fa3a7fSTianjia Zhang
22167fa3a7fSTianjia Zhang err = ccm_format_input(mac, req, req->cryptlen);
22267fa3a7fSTianjia Zhang if (err)
22367fa3a7fSTianjia Zhang return err;
22467fa3a7fSTianjia Zhang
22567fa3a7fSTianjia Zhang err = skcipher_walk_aead_encrypt(&walk, req, false);
22667fa3a7fSTianjia Zhang if (err)
22767fa3a7fSTianjia Zhang return err;
22867fa3a7fSTianjia Zhang
22967fa3a7fSTianjia Zhang err = ccm_crypt(req, &walk, ctx->rkey_enc, mac, sm4_ce_ccm_enc);
23067fa3a7fSTianjia Zhang if (err)
23167fa3a7fSTianjia Zhang return err;
23267fa3a7fSTianjia Zhang
23367fa3a7fSTianjia Zhang /* copy authtag to end of dst */
23467fa3a7fSTianjia Zhang scatterwalk_map_and_copy(mac, req->dst, req->assoclen + req->cryptlen,
23567fa3a7fSTianjia Zhang crypto_aead_authsize(aead), 1);
23667fa3a7fSTianjia Zhang
23767fa3a7fSTianjia Zhang return 0;
23867fa3a7fSTianjia Zhang }
23967fa3a7fSTianjia Zhang
ccm_decrypt(struct aead_request * req)24067fa3a7fSTianjia Zhang static int ccm_decrypt(struct aead_request *req)
24167fa3a7fSTianjia Zhang {
24267fa3a7fSTianjia Zhang struct crypto_aead *aead = crypto_aead_reqtfm(req);
24367fa3a7fSTianjia Zhang unsigned int authsize = crypto_aead_authsize(aead);
24467fa3a7fSTianjia Zhang struct sm4_ctx *ctx = crypto_aead_ctx(aead);
24567fa3a7fSTianjia Zhang u8 __aligned(8) mac[SM4_BLOCK_SIZE];
24667fa3a7fSTianjia Zhang u8 authtag[SM4_BLOCK_SIZE];
24767fa3a7fSTianjia Zhang struct skcipher_walk walk;
24867fa3a7fSTianjia Zhang int err;
24967fa3a7fSTianjia Zhang
25067fa3a7fSTianjia Zhang err = ccm_format_input(mac, req, req->cryptlen - authsize);
25167fa3a7fSTianjia Zhang if (err)
25267fa3a7fSTianjia Zhang return err;
25367fa3a7fSTianjia Zhang
25467fa3a7fSTianjia Zhang err = skcipher_walk_aead_decrypt(&walk, req, false);
25567fa3a7fSTianjia Zhang if (err)
25667fa3a7fSTianjia Zhang return err;
25767fa3a7fSTianjia Zhang
25867fa3a7fSTianjia Zhang err = ccm_crypt(req, &walk, ctx->rkey_enc, mac, sm4_ce_ccm_dec);
25967fa3a7fSTianjia Zhang if (err)
26067fa3a7fSTianjia Zhang return err;
26167fa3a7fSTianjia Zhang
26267fa3a7fSTianjia Zhang /* compare calculated auth tag with the stored one */
26367fa3a7fSTianjia Zhang scatterwalk_map_and_copy(authtag, req->src,
26467fa3a7fSTianjia Zhang req->assoclen + req->cryptlen - authsize,
26567fa3a7fSTianjia Zhang authsize, 0);
26667fa3a7fSTianjia Zhang
26767fa3a7fSTianjia Zhang if (crypto_memneq(authtag, mac, authsize))
26867fa3a7fSTianjia Zhang return -EBADMSG;
26967fa3a7fSTianjia Zhang
27067fa3a7fSTianjia Zhang return 0;
27167fa3a7fSTianjia Zhang }
27267fa3a7fSTianjia Zhang
27367fa3a7fSTianjia Zhang static struct aead_alg sm4_ccm_alg = {
27467fa3a7fSTianjia Zhang .base = {
27567fa3a7fSTianjia Zhang .cra_name = "ccm(sm4)",
27667fa3a7fSTianjia Zhang .cra_driver_name = "ccm-sm4-ce",
27767fa3a7fSTianjia Zhang .cra_priority = 400,
27867fa3a7fSTianjia Zhang .cra_blocksize = 1,
27967fa3a7fSTianjia Zhang .cra_ctxsize = sizeof(struct sm4_ctx),
28067fa3a7fSTianjia Zhang .cra_module = THIS_MODULE,
28167fa3a7fSTianjia Zhang },
28267fa3a7fSTianjia Zhang .ivsize = SM4_BLOCK_SIZE,
28367fa3a7fSTianjia Zhang .chunksize = SM4_BLOCK_SIZE,
28467fa3a7fSTianjia Zhang .maxauthsize = SM4_BLOCK_SIZE,
28567fa3a7fSTianjia Zhang .setkey = ccm_setkey,
28667fa3a7fSTianjia Zhang .setauthsize = ccm_setauthsize,
28767fa3a7fSTianjia Zhang .encrypt = ccm_encrypt,
28867fa3a7fSTianjia Zhang .decrypt = ccm_decrypt,
28967fa3a7fSTianjia Zhang };
29067fa3a7fSTianjia Zhang
sm4_ce_ccm_init(void)29167fa3a7fSTianjia Zhang static int __init sm4_ce_ccm_init(void)
29267fa3a7fSTianjia Zhang {
29367fa3a7fSTianjia Zhang return crypto_register_aead(&sm4_ccm_alg);
29467fa3a7fSTianjia Zhang }
29567fa3a7fSTianjia Zhang
sm4_ce_ccm_exit(void)29667fa3a7fSTianjia Zhang static void __exit sm4_ce_ccm_exit(void)
29767fa3a7fSTianjia Zhang {
29867fa3a7fSTianjia Zhang crypto_unregister_aead(&sm4_ccm_alg);
29967fa3a7fSTianjia Zhang }
30067fa3a7fSTianjia Zhang
30167fa3a7fSTianjia Zhang module_cpu_feature_match(SM4, sm4_ce_ccm_init);
30267fa3a7fSTianjia Zhang module_exit(sm4_ce_ccm_exit);
30367fa3a7fSTianjia Zhang
30467fa3a7fSTianjia Zhang MODULE_DESCRIPTION("Synchronous SM4 in CCM mode using ARMv8 Crypto Extensions");
30567fa3a7fSTianjia Zhang MODULE_ALIAS_CRYPTO("ccm(sm4)");
30667fa3a7fSTianjia Zhang MODULE_AUTHOR("Tianjia Zhang <tianjia.zhang@linux.alibaba.com>");
30767fa3a7fSTianjia Zhang MODULE_LICENSE("GPL v2");
308