xref: /openbmc/linux/crypto/vmac.c (revision f1939f7c56456d22a559d2c75156e91912a2e97e)
1*f1939f7cSShane Wang /*
2*f1939f7cSShane Wang  * Modified to interface to the Linux kernel
3*f1939f7cSShane Wang  * Copyright (c) 2009, Intel Corporation.
4*f1939f7cSShane Wang  *
5*f1939f7cSShane Wang  * This program is free software; you can redistribute it and/or modify it
6*f1939f7cSShane Wang  * under the terms and conditions of the GNU General Public License,
7*f1939f7cSShane Wang  * version 2, as published by the Free Software Foundation.
8*f1939f7cSShane Wang  *
9*f1939f7cSShane Wang  * This program is distributed in the hope it will be useful, but WITHOUT
10*f1939f7cSShane Wang  * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
11*f1939f7cSShane Wang  * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License for
12*f1939f7cSShane Wang  * more details.
13*f1939f7cSShane Wang  *
14*f1939f7cSShane Wang  * You should have received a copy of the GNU General Public License along with
15*f1939f7cSShane Wang  * this program; if not, write to the Free Software Foundation, Inc., 59 Temple
16*f1939f7cSShane Wang  * Place - Suite 330, Boston, MA 02111-1307 USA.
17*f1939f7cSShane Wang  */
18*f1939f7cSShane Wang 
19*f1939f7cSShane Wang /* --------------------------------------------------------------------------
20*f1939f7cSShane Wang  * VMAC and VHASH Implementation by Ted Krovetz (tdk@acm.org) and Wei Dai.
 * This implementation is hereby placed in the public domain.
 * The authors offer no warranty. Use at your own risk.
23*f1939f7cSShane Wang  * Please send bug reports to the authors.
24*f1939f7cSShane Wang  * Last modified: 17 APR 08, 1700 PDT
25*f1939f7cSShane Wang  * ----------------------------------------------------------------------- */
26*f1939f7cSShane Wang 
#include <linux/init.h>
#include <linux/types.h>
#include <linux/crypto.h>
#include <linux/scatterlist.h>
#include <linux/string.h>
#include <asm/byteorder.h>
#include <crypto/scatterwalk.h>
#include <crypto/vmac.h>
#include <crypto/internal/hash.h>
35*f1939f7cSShane Wang 
36*f1939f7cSShane Wang /*
37*f1939f7cSShane Wang  * Constants and masks
38*f1939f7cSShane Wang  */
39*f1939f7cSShane Wang #define UINT64_C(x) x##ULL
40*f1939f7cSShane Wang const u64 p64   = UINT64_C(0xfffffffffffffeff);  /* 2^64 - 257 prime  */
41*f1939f7cSShane Wang const u64 m62   = UINT64_C(0x3fffffffffffffff);  /* 62-bit mask       */
42*f1939f7cSShane Wang const u64 m63   = UINT64_C(0x7fffffffffffffff);  /* 63-bit mask       */
43*f1939f7cSShane Wang const u64 m64   = UINT64_C(0xffffffffffffffff);  /* 64-bit mask       */
44*f1939f7cSShane Wang const u64 mpoly = UINT64_C(0x1fffffff1fffffff);  /* Poly key mask     */
45*f1939f7cSShane Wang 
/*
 * Position of the low and high 32-bit half when a u64 is viewed as an
 * array of two u32 words.
 */
#if defined(__LITTLE_ENDIAN)
#define INDEX_LOW 0
#define INDEX_HIGH 1
#else
#define INDEX_LOW 1
#define INDEX_HIGH 0
#endif
53*f1939f7cSShane Wang 
54*f1939f7cSShane Wang /*
55*f1939f7cSShane Wang  * The following routines are used in this implementation. They are
56*f1939f7cSShane Wang  * written via macros to simulate zero-overhead call-by-reference.
57*f1939f7cSShane Wang  *
58*f1939f7cSShane Wang  * MUL64: 64x64->128-bit multiplication
59*f1939f7cSShane Wang  * PMUL64: assumes top bits cleared on inputs
60*f1939f7cSShane Wang  * ADD128: 128x128->128-bit addition
61*f1939f7cSShane Wang  */
62*f1939f7cSShane Wang 
/*
 * ADD128: (rh:rl) += (ih:il), each pair being a 128-bit value held as two
 * u64 halves.  rh and rl must be lvalues and are evaluated more than once;
 * il is evaluated exactly once.
 */
#define ADD128(rh, rl, ih, il)						\
	do {								\
		u64 _add_lo = (il);					\
		(rl) += _add_lo;					\
		/* wrap-around of the low half is the carry */		\
		(rh) += ((rl) < _add_lo);				\
		(rh) += (ih);						\
	} while (0)

/* MUL32: 64-bit product of the low 32 bits of each argument */
#define MUL32(i1, i2)	((u64)(u32)(i1) * (u64)(u32)(i2))

/*
 * PMUL64: (rh:rl) = i1 * i2.  The two cross products are summed in a single
 * u64 before being folded in, so the inputs must have their top bits clear
 * for that sum not to overflow.  Inputs are captured before rh/rl are
 * written, so an output may alias an input.
 */
#define PMUL64(rh, rl, i1, i2)	/* Assumes the cross sum doesn't overflow */ \
	do {								\
		const u64 _pm_a = (i1), _pm_b = (i2);			\
		const u64 _pm_x = MUL32(_pm_a, _pm_b >> 32)		\
				+ MUL32(_pm_a >> 32, _pm_b);		\
		rl = MUL32(_pm_a, _pm_b);				\
		rh = MUL32(_pm_a >> 32, _pm_b >> 32);			\
		ADD128(rh, rl, (_pm_x >> 32), (_pm_x << 32));		\
	} while (0)

/*
 * MUL64: full (rh:rl) = i1 * i2 for arbitrary 64-bit inputs.  Each cross
 * product is folded in separately so no intermediate sum can overflow.
 * Inputs are captured before rh/rl are written.
 */
#define MUL64(rh, rl, i1, i2)						\
	do {								\
		const u64 _mul_a = (i1), _mul_b = (i2);			\
		const u64 _mul_x1 = MUL32(_mul_a, _mul_b >> 32);	\
		const u64 _mul_x2 = MUL32(_mul_a >> 32, _mul_b);	\
		rl = MUL32(_mul_a, _mul_b);				\
		rh = MUL32(_mul_a >> 32, _mul_b >> 32);			\
		ADD128(rh, rl, (_mul_x1 >> 32), (_mul_x1 << 32));	\
		ADD128(rh, rl, (_mul_x2 >> 32), (_mul_x2 << 32));	\
	} while (0)
93*f1939f7cSShane Wang 
94*f1939f7cSShane Wang /*
95*f1939f7cSShane Wang  * For highest performance the L1 NH and L2 polynomial hashes should be
 * carefully implemented to take advantage of one's target architecture.
 * Here these two hash functions are defined multiple times; once for
98*f1939f7cSShane Wang  * 64-bit architectures, once for 32-bit SSE2 architectures, and once
99*f1939f7cSShane Wang  * for the rest (32-bit) architectures.
100*f1939f7cSShane Wang  * For each, nh_16 *must* be defined (works on multiples of 16 bytes).
101*f1939f7cSShane Wang  * Optionally, nh_vmac_nhbytes can be defined (for multiples of
102*f1939f7cSShane Wang  * VMAC_NHBYTES), and nh_16_2 and nh_vmac_nhbytes_2 (versions that do two
103*f1939f7cSShane Wang  * NH computations at once).
104*f1939f7cSShane Wang  */
105*f1939f7cSShane Wang 
106*f1939f7cSShane Wang #ifdef CONFIG_64BIT
107*f1939f7cSShane Wang 
/*
 * nh_16 (64-bit build): NH hash over nw 64-bit message words at mp using
 * the key words at kp; the 128-bit sum is stored in (rh:rl).
 * Words are consumed in pairs, so nw is expected to be even.
 * nw is parenthesized so that a compound expression (e.g. a ?: expression)
 * cannot re-associate with the loop comparison.
 */
#define nh_16(mp, kp, nw, rh, rl)					\
	do {								\
		int i; u64 th, tl;					\
		rh = rl = 0;						\
		for (i = 0; i < (nw); i += 2) {				\
			MUL64(th, tl, le64_to_cpup((mp)+i)+(kp)[i],	\
				le64_to_cpup((mp)+i+1)+(kp)[i+1]);	\
			ADD128(rh, rl, th, tl);				\
		}							\
	} while (0)
118*f1939f7cSShane Wang 
/*
 * nh_16_2 (64-bit build): two NH hashes over the same nw message words in
 * one pass.  (rh:rl) uses the key starting at kp[0]; (rh1:rl1) uses the key
 * shifted by two words, so kp must provide at least nw + 2 words.
 * nw is parenthesized so a compound argument cannot change the loop test.
 */
#define nh_16_2(mp, kp, nw, rh, rl, rh1, rl1)				\
	do {								\
		int i; u64 th, tl;					\
		rh1 = rl1 = rh = rl = 0;				\
		for (i = 0; i < (nw); i += 2) {				\
			MUL64(th, tl, le64_to_cpup((mp)+i)+(kp)[i],	\
				le64_to_cpup((mp)+i+1)+(kp)[i+1]);	\
			ADD128(rh, rl, th, tl);				\
			MUL64(th, tl, le64_to_cpup((mp)+i)+(kp)[i+2],	\
				le64_to_cpup((mp)+i+1)+(kp)[i+3]);	\
			ADD128(rh1, rl1, th, tl);			\
		}							\
	} while (0)
132*f1939f7cSShane Wang 
133*f1939f7cSShane Wang #if (VMAC_NHBYTES >= 64) /* These versions do 64-bytes of message at a time */
/*
 * nh_vmac_nhbytes (64-bit build): NH hash unrolled to consume eight 64-bit
 * message words (64 bytes) per loop iteration; nw is expected to be a
 * multiple of 8.  The 128-bit sum is stored in (rh:rl).
 * nw is parenthesized so a compound argument cannot change the loop test.
 */
#define nh_vmac_nhbytes(mp, kp, nw, rh, rl)				\
	do {								\
		int i; u64 th, tl;					\
		rh = rl = 0;						\
		for (i = 0; i < (nw); i += 8) {				\
			MUL64(th, tl, le64_to_cpup((mp)+i)+(kp)[i],	\
				le64_to_cpup((mp)+i+1)+(kp)[i+1]);	\
			ADD128(rh, rl, th, tl);				\
			MUL64(th, tl, le64_to_cpup((mp)+i+2)+(kp)[i+2],	\
				le64_to_cpup((mp)+i+3)+(kp)[i+3]);	\
			ADD128(rh, rl, th, tl);				\
			MUL64(th, tl, le64_to_cpup((mp)+i+4)+(kp)[i+4],	\
				le64_to_cpup((mp)+i+5)+(kp)[i+5]);	\
			ADD128(rh, rl, th, tl);				\
			MUL64(th, tl, le64_to_cpup((mp)+i+6)+(kp)[i+6],	\
				le64_to_cpup((mp)+i+7)+(kp)[i+7]);	\
			ADD128(rh, rl, th, tl);				\
		}							\
	} while (0)
153*f1939f7cSShane Wang 
/*
 * nh_vmac_nhbytes_2 (64-bit build): two NH hashes over the same message in
 * one pass, unrolled to eight message words per iteration.  (rh:rl) uses
 * the key from kp[0]; (rh1:rl1) uses the key shifted by two words, so the
 * last iteration reads up to kp[nw + 1].
 * nw is parenthesized so a compound argument cannot change the loop test.
 */
#define nh_vmac_nhbytes_2(mp, kp, nw, rh, rl, rh1, rl1)			\
	do {								\
		int i; u64 th, tl;					\
		rh1 = rl1 = rh = rl = 0;				\
		for (i = 0; i < (nw); i += 8) {				\
			MUL64(th, tl, le64_to_cpup((mp)+i)+(kp)[i],	\
				le64_to_cpup((mp)+i+1)+(kp)[i+1]);	\
			ADD128(rh, rl, th, tl);				\
			MUL64(th, tl, le64_to_cpup((mp)+i)+(kp)[i+2],	\
				le64_to_cpup((mp)+i+1)+(kp)[i+3]);	\
			ADD128(rh1, rl1, th, tl);			\
			MUL64(th, tl, le64_to_cpup((mp)+i+2)+(kp)[i+2],	\
				le64_to_cpup((mp)+i+3)+(kp)[i+3]);	\
			ADD128(rh, rl, th, tl);				\
			MUL64(th, tl, le64_to_cpup((mp)+i+2)+(kp)[i+4],	\
				le64_to_cpup((mp)+i+3)+(kp)[i+5]);	\
			ADD128(rh1, rl1, th, tl);			\
			MUL64(th, tl, le64_to_cpup((mp)+i+4)+(kp)[i+4],	\
				le64_to_cpup((mp)+i+5)+(kp)[i+5]);	\
			ADD128(rh, rl, th, tl);				\
			MUL64(th, tl, le64_to_cpup((mp)+i+4)+(kp)[i+6],	\
				le64_to_cpup((mp)+i+5)+(kp)[i+7]);	\
			ADD128(rh1, rl1, th, tl);			\
			MUL64(th, tl, le64_to_cpup((mp)+i+6)+(kp)[i+6],	\
				le64_to_cpup((mp)+i+7)+(kp)[i+7]);	\
			ADD128(rh, rl, th, tl);				\
			MUL64(th, tl, le64_to_cpup((mp)+i+6)+(kp)[i+8],	\
				le64_to_cpup((mp)+i+7)+(kp)[i+9]);	\
			ADD128(rh1, rl1, th, tl);			\
		}							\
	} while (0)
185*f1939f7cSShane Wang #endif
186*f1939f7cSShane Wang 
/*
 * poly_step (64-bit build): one step of the L2 polynomial hash.
 * The accumulator (ah:al) is multiplied by the key (kh:kl), the message
 * value (mh:ml) is added, and the partially reduced result is written back
 * to (ah:al).  ah and al must be lvalues.
 */
#define poly_step(ah, al, kh, kl, mh, ml)				\
	do {								\
		u64 _ps_hh_h, _ps_hh_l;	/* ah * 2kh             */	\
		u64 _ps_x_h, _ps_x_l;	/* ah * kl, then + al*kh */	\
		u64 _ps_lh_h, _ps_lh_l;	/* al * kh              */	\
		/* partial products that must see the old (ah,al) */	\
		PMUL64(_ps_hh_h, _ps_hh_l, ah, 2*kh);			\
		PMUL64(_ps_x_h, _ps_x_l, ah, kl);			\
		PMUL64(_ps_lh_h, _ps_lh_l, al, kh);			\
		/* al * kl lands directly in the result registers */	\
		PMUL64(ah, al, al, kl);					\
		/* add 2 * ah * kh to the result */			\
		ADD128(ah, al, _ps_hh_h, _ps_hh_l);			\
		/* sum of the two cross products */			\
		ADD128(_ps_x_h, _ps_x_l, _ps_lh_h, _ps_lh_l);		\
		/* add its low word to ah, carrying into its high word */ \
		ADD128(_ps_x_h, ah, 0, _ps_x_l);			\
		/* double the high word and pull in the top bit of ah */ \
		_ps_x_h = (_ps_x_h << 1) + (ah >> 63);			\
		ah &= m63;						\
		/* finally add the message and the folded high part */	\
		ADD128(ah, al, mh, ml);					\
		ADD128(ah, al, 0, _ps_x_h);				\
	} while (0)
209*f1939f7cSShane Wang 
210*f1939f7cSShane Wang #else /* ! CONFIG_64BIT */
211*f1939f7cSShane Wang 
#ifndef nh_16
/*
 * nh_16 (32-bit build): NH hash over nw 64-bit message words at mp using
 * the key words at kp, built from 32x32->64 multiplies.  The low halves of
 * the cross products are accumulated in t and folded in once after the
 * loop.  The 128-bit sum is stored in (rh:rl).
 * mp, kp and nw are parenthesized (as in the 64-bit variant) so compound
 * arguments such as "key + 2" expand correctly.
 */
#define nh_16(mp, kp, nw, rh, rl)					\
	do {								\
		u64 t1, t2, m1, m2, t;					\
		int i;							\
		rh = rl = t = 0;					\
		for (i = 0; i < (nw); i += 2)  {			\
			t1 = le64_to_cpup((mp)+i) + (kp)[i];		\
			t2 = le64_to_cpup((mp)+i+1) + (kp)[i+1];	\
			m2 = MUL32(t1 >> 32, t2);			\
			m1 = MUL32(t1, t2 >> 32);			\
			ADD128(rh, rl, MUL32(t1 >> 32, t2 >> 32),	\
				MUL32(t1, t2));				\
			rh += (u64)(u32)(m1 >> 32)			\
				+ (u32)(m2 >> 32);			\
			t += (u64)(u32)m1 + (u32)m2;			\
		}							\
		ADD128(rh, rl, (t >> 32), (t << 32));			\
	} while (0)
#endif
232*f1939f7cSShane Wang 
233*f1939f7cSShane Wang static void poly_step_func(u64 *ahi, u64 *alo,
234*f1939f7cSShane Wang 			const u64 *kh, const u64 *kl,
235*f1939f7cSShane Wang 			const u64 *mh, const u64 *ml)
236*f1939f7cSShane Wang {
237*f1939f7cSShane Wang #define a0 (*(((u32 *)alo)+INDEX_LOW))
238*f1939f7cSShane Wang #define a1 (*(((u32 *)alo)+INDEX_HIGH))
239*f1939f7cSShane Wang #define a2 (*(((u32 *)ahi)+INDEX_LOW))
240*f1939f7cSShane Wang #define a3 (*(((u32 *)ahi)+INDEX_HIGH))
241*f1939f7cSShane Wang #define k0 (*(((u32 *)kl)+INDEX_LOW))
242*f1939f7cSShane Wang #define k1 (*(((u32 *)kl)+INDEX_HIGH))
243*f1939f7cSShane Wang #define k2 (*(((u32 *)kh)+INDEX_LOW))
244*f1939f7cSShane Wang #define k3 (*(((u32 *)kh)+INDEX_HIGH))
245*f1939f7cSShane Wang 
246*f1939f7cSShane Wang 	u64 p, q, t;
247*f1939f7cSShane Wang 	u32 t2;
248*f1939f7cSShane Wang 
249*f1939f7cSShane Wang 	p = MUL32(a3, k3);
250*f1939f7cSShane Wang 	p += p;
251*f1939f7cSShane Wang 	p += *(u64 *)mh;
252*f1939f7cSShane Wang 	p += MUL32(a0, k2);
253*f1939f7cSShane Wang 	p += MUL32(a1, k1);
254*f1939f7cSShane Wang 	p += MUL32(a2, k0);
255*f1939f7cSShane Wang 	t = (u32)(p);
256*f1939f7cSShane Wang 	p >>= 32;
257*f1939f7cSShane Wang 	p += MUL32(a0, k3);
258*f1939f7cSShane Wang 	p += MUL32(a1, k2);
259*f1939f7cSShane Wang 	p += MUL32(a2, k1);
260*f1939f7cSShane Wang 	p += MUL32(a3, k0);
261*f1939f7cSShane Wang 	t |= ((u64)((u32)p & 0x7fffffff)) << 32;
262*f1939f7cSShane Wang 	p >>= 31;
263*f1939f7cSShane Wang 	p += (u64)(((u32 *)ml)[INDEX_LOW]);
264*f1939f7cSShane Wang 	p += MUL32(a0, k0);
265*f1939f7cSShane Wang 	q =  MUL32(a1, k3);
266*f1939f7cSShane Wang 	q += MUL32(a2, k2);
267*f1939f7cSShane Wang 	q += MUL32(a3, k1);
268*f1939f7cSShane Wang 	q += q;
269*f1939f7cSShane Wang 	p += q;
270*f1939f7cSShane Wang 	t2 = (u32)(p);
271*f1939f7cSShane Wang 	p >>= 32;
272*f1939f7cSShane Wang 	p += (u64)(((u32 *)ml)[INDEX_HIGH]);
273*f1939f7cSShane Wang 	p += MUL32(a0, k1);
274*f1939f7cSShane Wang 	p += MUL32(a1, k0);
275*f1939f7cSShane Wang 	q =  MUL32(a2, k3);
276*f1939f7cSShane Wang 	q += MUL32(a3, k2);
277*f1939f7cSShane Wang 	q += q;
278*f1939f7cSShane Wang 	p += q;
279*f1939f7cSShane Wang 	*(u64 *)(alo) = (p << 32) | t2;
280*f1939f7cSShane Wang 	p >>= 32;
281*f1939f7cSShane Wang 	*(u64 *)(ahi) = p + t;
282*f1939f7cSShane Wang 
283*f1939f7cSShane Wang #undef a0
284*f1939f7cSShane Wang #undef a1
285*f1939f7cSShane Wang #undef a2
286*f1939f7cSShane Wang #undef a3
287*f1939f7cSShane Wang #undef k0
288*f1939f7cSShane Wang #undef k1
289*f1939f7cSShane Wang #undef k2
290*f1939f7cSShane Wang #undef k3
291*f1939f7cSShane Wang }
292*f1939f7cSShane Wang 
293*f1939f7cSShane Wang #define poly_step(ah, al, kh, kl, mh, ml)				\
294*f1939f7cSShane Wang 	poly_step_func(&(ah), &(al), &(kh), &(kl), &(mh), &(ml))
295*f1939f7cSShane Wang 
296*f1939f7cSShane Wang #endif  /* end of specialized NH and poly definitions */
297*f1939f7cSShane Wang 
/* At least nh_16 is defined. Define the others as needed here */
#ifndef nh_16_2
/*
 * Generic nh_16_2: two independent nh_16 passes over the same message, the
 * second one with the key advanced by two words.
 */
#define nh_16_2(mp, kp, nw, rh, rl, rh1, rl1)				\
	do {								\
		nh_16(mp, kp, nw, rh, rl);				\
		nh_16(mp, (&(kp)[2]), nw, rh1, rl1);			\
	} while (0)
#endif
#ifndef nh_vmac_nhbytes
/* Generic nh_vmac_nhbytes: no unrolled variant available, use nh_16 */
#define nh_vmac_nhbytes(mp, kp, nw, rh, rl)				\
	do {								\
		nh_16(mp, kp, nw, rh, rl);				\
	} while (0)
#endif
#ifndef nh_vmac_nhbytes_2
/*
 * Generic nh_vmac_nhbytes_2: two nh_vmac_nhbytes passes over the same
 * message, the second one with the key advanced by two words.
 */
#define nh_vmac_nhbytes_2(mp, kp, nw, rh, rl, rh1, rl1)			\
	do {								\
		nh_vmac_nhbytes(mp, kp, nw, rh, rl);			\
		nh_vmac_nhbytes(mp, (&(kp)[2]), nw, rh1, rl1);		\
	} while (0)
#endif
317*f1939f7cSShane Wang 
318*f1939f7cSShane Wang static void vhash_abort(struct vmac_ctx *ctx)
319*f1939f7cSShane Wang {
320*f1939f7cSShane Wang 	ctx->polytmp[0] = ctx->polykey[0] ;
321*f1939f7cSShane Wang 	ctx->polytmp[1] = ctx->polykey[1] ;
322*f1939f7cSShane Wang 	ctx->first_block_processed = 0;
323*f1939f7cSShane Wang }
324*f1939f7cSShane Wang 
325*f1939f7cSShane Wang static u64 l3hash(u64 p1, u64 p2,
326*f1939f7cSShane Wang 			u64 k1, u64 k2, u64 len)
327*f1939f7cSShane Wang {
328*f1939f7cSShane Wang 	u64 rh, rl, t, z = 0;
329*f1939f7cSShane Wang 
330*f1939f7cSShane Wang 	/* fully reduce (p1,p2)+(len,0) mod p127 */
331*f1939f7cSShane Wang 	t = p1 >> 63;
332*f1939f7cSShane Wang 	p1 &= m63;
333*f1939f7cSShane Wang 	ADD128(p1, p2, len, t);
334*f1939f7cSShane Wang 	/* At this point, (p1,p2) is at most 2^127+(len<<64) */
335*f1939f7cSShane Wang 	t = (p1 > m63) + ((p1 == m63) && (p2 == m64));
336*f1939f7cSShane Wang 	ADD128(p1, p2, z, t);
337*f1939f7cSShane Wang 	p1 &= m63;
338*f1939f7cSShane Wang 
339*f1939f7cSShane Wang 	/* compute (p1,p2)/(2^64-2^32) and (p1,p2)%(2^64-2^32) */
340*f1939f7cSShane Wang 	t = p1 + (p2 >> 32);
341*f1939f7cSShane Wang 	t += (t >> 32);
342*f1939f7cSShane Wang 	t += (u32)t > 0xfffffffeu;
343*f1939f7cSShane Wang 	p1 += (t >> 32);
344*f1939f7cSShane Wang 	p2 += (p1 << 32);
345*f1939f7cSShane Wang 
346*f1939f7cSShane Wang 	/* compute (p1+k1)%p64 and (p2+k2)%p64 */
347*f1939f7cSShane Wang 	p1 += k1;
348*f1939f7cSShane Wang 	p1 += (0 - (p1 < k1)) & 257;
349*f1939f7cSShane Wang 	p2 += k2;
350*f1939f7cSShane Wang 	p2 += (0 - (p2 < k2)) & 257;
351*f1939f7cSShane Wang 
352*f1939f7cSShane Wang 	/* compute (p1+k1)*(p2+k2)%p64 */
353*f1939f7cSShane Wang 	MUL64(rh, rl, p1, p2);
354*f1939f7cSShane Wang 	t = rh >> 56;
355*f1939f7cSShane Wang 	ADD128(t, rl, z, rh);
356*f1939f7cSShane Wang 	rh <<= 8;
357*f1939f7cSShane Wang 	ADD128(t, rl, z, rh);
358*f1939f7cSShane Wang 	t += t << 8;
359*f1939f7cSShane Wang 	rl += t;
360*f1939f7cSShane Wang 	rl += (0 - (rl < t)) & 257;
361*f1939f7cSShane Wang 	rl += (0 - (rl > p64-1)) & 257;
362*f1939f7cSShane Wang 	return rl;
363*f1939f7cSShane Wang }
364*f1939f7cSShane Wang 
365*f1939f7cSShane Wang static void vhash_update(const unsigned char *m,
366*f1939f7cSShane Wang 			unsigned int mbytes, /* Pos multiple of VMAC_NHBYTES */
367*f1939f7cSShane Wang 			struct vmac_ctx *ctx)
368*f1939f7cSShane Wang {
369*f1939f7cSShane Wang 	u64 rh, rl, *mptr;
370*f1939f7cSShane Wang 	const u64 *kptr = (u64 *)ctx->nhkey;
371*f1939f7cSShane Wang 	int i;
372*f1939f7cSShane Wang 	u64 ch, cl;
373*f1939f7cSShane Wang 	u64 pkh = ctx->polykey[0];
374*f1939f7cSShane Wang 	u64 pkl = ctx->polykey[1];
375*f1939f7cSShane Wang 
376*f1939f7cSShane Wang 	mptr = (u64 *)m;
377*f1939f7cSShane Wang 	i = mbytes / VMAC_NHBYTES;  /* Must be non-zero */
378*f1939f7cSShane Wang 
379*f1939f7cSShane Wang 	ch = ctx->polytmp[0];
380*f1939f7cSShane Wang 	cl = ctx->polytmp[1];
381*f1939f7cSShane Wang 
382*f1939f7cSShane Wang 	if (!ctx->first_block_processed) {
383*f1939f7cSShane Wang 		ctx->first_block_processed = 1;
384*f1939f7cSShane Wang 		nh_vmac_nhbytes(mptr, kptr, VMAC_NHBYTES/8, rh, rl);
385*f1939f7cSShane Wang 		rh &= m62;
386*f1939f7cSShane Wang 		ADD128(ch, cl, rh, rl);
387*f1939f7cSShane Wang 		mptr += (VMAC_NHBYTES/sizeof(u64));
388*f1939f7cSShane Wang 		i--;
389*f1939f7cSShane Wang 	}
390*f1939f7cSShane Wang 
391*f1939f7cSShane Wang 	while (i--) {
392*f1939f7cSShane Wang 		nh_vmac_nhbytes(mptr, kptr, VMAC_NHBYTES/8, rh, rl);
393*f1939f7cSShane Wang 		rh &= m62;
394*f1939f7cSShane Wang 		poly_step(ch, cl, pkh, pkl, rh, rl);
395*f1939f7cSShane Wang 		mptr += (VMAC_NHBYTES/sizeof(u64));
396*f1939f7cSShane Wang 	}
397*f1939f7cSShane Wang 
398*f1939f7cSShane Wang 	ctx->polytmp[0] = ch;
399*f1939f7cSShane Wang 	ctx->polytmp[1] = cl;
400*f1939f7cSShane Wang }
401*f1939f7cSShane Wang 
402*f1939f7cSShane Wang static u64 vhash(unsigned char m[], unsigned int mbytes,
403*f1939f7cSShane Wang 			u64 *tagl, struct vmac_ctx *ctx)
404*f1939f7cSShane Wang {
405*f1939f7cSShane Wang 	u64 rh, rl, *mptr;
406*f1939f7cSShane Wang 	const u64 *kptr = (u64 *)ctx->nhkey;
407*f1939f7cSShane Wang 	int i, remaining;
408*f1939f7cSShane Wang 	u64 ch, cl;
409*f1939f7cSShane Wang 	u64 pkh = ctx->polykey[0];
410*f1939f7cSShane Wang 	u64 pkl = ctx->polykey[1];
411*f1939f7cSShane Wang 
412*f1939f7cSShane Wang 	mptr = (u64 *)m;
413*f1939f7cSShane Wang 	i = mbytes / VMAC_NHBYTES;
414*f1939f7cSShane Wang 	remaining = mbytes % VMAC_NHBYTES;
415*f1939f7cSShane Wang 
416*f1939f7cSShane Wang 	if (ctx->first_block_processed) {
417*f1939f7cSShane Wang 		ch = ctx->polytmp[0];
418*f1939f7cSShane Wang 		cl = ctx->polytmp[1];
419*f1939f7cSShane Wang 	} else if (i) {
420*f1939f7cSShane Wang 		nh_vmac_nhbytes(mptr, kptr, VMAC_NHBYTES/8, ch, cl);
421*f1939f7cSShane Wang 		ch &= m62;
422*f1939f7cSShane Wang 		ADD128(ch, cl, pkh, pkl);
423*f1939f7cSShane Wang 		mptr += (VMAC_NHBYTES/sizeof(u64));
424*f1939f7cSShane Wang 		i--;
425*f1939f7cSShane Wang 	} else if (remaining) {
426*f1939f7cSShane Wang 		nh_16(mptr, kptr, 2*((remaining+15)/16), ch, cl);
427*f1939f7cSShane Wang 		ch &= m62;
428*f1939f7cSShane Wang 		ADD128(ch, cl, pkh, pkl);
429*f1939f7cSShane Wang 		mptr += (VMAC_NHBYTES/sizeof(u64));
430*f1939f7cSShane Wang 		goto do_l3;
431*f1939f7cSShane Wang 	} else {/* Empty String */
432*f1939f7cSShane Wang 		ch = pkh; cl = pkl;
433*f1939f7cSShane Wang 		goto do_l3;
434*f1939f7cSShane Wang 	}
435*f1939f7cSShane Wang 
436*f1939f7cSShane Wang 	while (i--) {
437*f1939f7cSShane Wang 		nh_vmac_nhbytes(mptr, kptr, VMAC_NHBYTES/8, rh, rl);
438*f1939f7cSShane Wang 		rh &= m62;
439*f1939f7cSShane Wang 		poly_step(ch, cl, pkh, pkl, rh, rl);
440*f1939f7cSShane Wang 		mptr += (VMAC_NHBYTES/sizeof(u64));
441*f1939f7cSShane Wang 	}
442*f1939f7cSShane Wang 	if (remaining) {
443*f1939f7cSShane Wang 		nh_16(mptr, kptr, 2*((remaining+15)/16), rh, rl);
444*f1939f7cSShane Wang 		rh &= m62;
445*f1939f7cSShane Wang 		poly_step(ch, cl, pkh, pkl, rh, rl);
446*f1939f7cSShane Wang 	}
447*f1939f7cSShane Wang 
448*f1939f7cSShane Wang do_l3:
449*f1939f7cSShane Wang 	vhash_abort(ctx);
450*f1939f7cSShane Wang 	remaining *= 8;
451*f1939f7cSShane Wang 	return l3hash(ch, cl, ctx->l3key[0], ctx->l3key[1], remaining);
452*f1939f7cSShane Wang }
453*f1939f7cSShane Wang 
454*f1939f7cSShane Wang static u64 vmac(unsigned char m[], unsigned int mbytes,
455*f1939f7cSShane Wang 			unsigned char n[16], u64 *tagl,
456*f1939f7cSShane Wang 			struct vmac_ctx_t *ctx)
457*f1939f7cSShane Wang {
458*f1939f7cSShane Wang 	u64 *in_n, *out_p;
459*f1939f7cSShane Wang 	u64 p, h;
460*f1939f7cSShane Wang 	int i;
461*f1939f7cSShane Wang 
462*f1939f7cSShane Wang 	in_n = ctx->__vmac_ctx.cached_nonce;
463*f1939f7cSShane Wang 	out_p = ctx->__vmac_ctx.cached_aes;
464*f1939f7cSShane Wang 
465*f1939f7cSShane Wang 	i = n[15] & 1;
466*f1939f7cSShane Wang 	if ((*(u64 *)(n+8) != in_n[1]) || (*(u64 *)(n) != in_n[0])) {
467*f1939f7cSShane Wang 		in_n[0] = *(u64 *)(n);
468*f1939f7cSShane Wang 		in_n[1] = *(u64 *)(n+8);
469*f1939f7cSShane Wang 		((unsigned char *)in_n)[15] &= 0xFE;
470*f1939f7cSShane Wang 		crypto_cipher_encrypt_one(ctx->child,
471*f1939f7cSShane Wang 			(unsigned char *)out_p, (unsigned char *)in_n);
472*f1939f7cSShane Wang 
473*f1939f7cSShane Wang 		((unsigned char *)in_n)[15] |= (unsigned char)(1-i);
474*f1939f7cSShane Wang 	}
475*f1939f7cSShane Wang 	p = be64_to_cpup(out_p + i);
476*f1939f7cSShane Wang 	h = vhash(m, mbytes, (u64 *)0, &ctx->__vmac_ctx);
477*f1939f7cSShane Wang 	return p + h;
478*f1939f7cSShane Wang }
479*f1939f7cSShane Wang 
480*f1939f7cSShane Wang static int vmac_set_key(unsigned char user_key[], struct vmac_ctx_t *ctx)
481*f1939f7cSShane Wang {
482*f1939f7cSShane Wang 	u64 in[2] = {0}, out[2];
483*f1939f7cSShane Wang 	unsigned i;
484*f1939f7cSShane Wang 	int err = 0;
485*f1939f7cSShane Wang 
486*f1939f7cSShane Wang 	err = crypto_cipher_setkey(ctx->child, user_key, VMAC_KEY_LEN);
487*f1939f7cSShane Wang 	if (err)
488*f1939f7cSShane Wang 		return err;
489*f1939f7cSShane Wang 
490*f1939f7cSShane Wang 	/* Fill nh key */
491*f1939f7cSShane Wang 	((unsigned char *)in)[0] = 0x80;
492*f1939f7cSShane Wang 	for (i = 0; i < sizeof(ctx->__vmac_ctx.nhkey)/8; i += 2) {
493*f1939f7cSShane Wang 		crypto_cipher_encrypt_one(ctx->child,
494*f1939f7cSShane Wang 			(unsigned char *)out, (unsigned char *)in);
495*f1939f7cSShane Wang 		ctx->__vmac_ctx.nhkey[i] = be64_to_cpup(out);
496*f1939f7cSShane Wang 		ctx->__vmac_ctx.nhkey[i+1] = be64_to_cpup(out+1);
497*f1939f7cSShane Wang 		((unsigned char *)in)[15] += 1;
498*f1939f7cSShane Wang 	}
499*f1939f7cSShane Wang 
500*f1939f7cSShane Wang 	/* Fill poly key */
501*f1939f7cSShane Wang 	((unsigned char *)in)[0] = 0xC0;
502*f1939f7cSShane Wang 	in[1] = 0;
503*f1939f7cSShane Wang 	for (i = 0; i < sizeof(ctx->__vmac_ctx.polykey)/8; i += 2) {
504*f1939f7cSShane Wang 		crypto_cipher_encrypt_one(ctx->child,
505*f1939f7cSShane Wang 			(unsigned char *)out, (unsigned char *)in);
506*f1939f7cSShane Wang 		ctx->__vmac_ctx.polytmp[i] =
507*f1939f7cSShane Wang 			ctx->__vmac_ctx.polykey[i] =
508*f1939f7cSShane Wang 				be64_to_cpup(out) & mpoly;
509*f1939f7cSShane Wang 		ctx->__vmac_ctx.polytmp[i+1] =
510*f1939f7cSShane Wang 			ctx->__vmac_ctx.polykey[i+1] =
511*f1939f7cSShane Wang 				be64_to_cpup(out+1) & mpoly;
512*f1939f7cSShane Wang 		((unsigned char *)in)[15] += 1;
513*f1939f7cSShane Wang 	}
514*f1939f7cSShane Wang 
515*f1939f7cSShane Wang 	/* Fill ip key */
516*f1939f7cSShane Wang 	((unsigned char *)in)[0] = 0xE0;
517*f1939f7cSShane Wang 	in[1] = 0;
518*f1939f7cSShane Wang 	for (i = 0; i < sizeof(ctx->__vmac_ctx.l3key)/8; i += 2) {
519*f1939f7cSShane Wang 		do {
520*f1939f7cSShane Wang 			crypto_cipher_encrypt_one(ctx->child,
521*f1939f7cSShane Wang 				(unsigned char *)out, (unsigned char *)in);
522*f1939f7cSShane Wang 			ctx->__vmac_ctx.l3key[i] = be64_to_cpup(out);
523*f1939f7cSShane Wang 			ctx->__vmac_ctx.l3key[i+1] = be64_to_cpup(out+1);
524*f1939f7cSShane Wang 			((unsigned char *)in)[15] += 1;
525*f1939f7cSShane Wang 		} while (ctx->__vmac_ctx.l3key[i] >= p64
526*f1939f7cSShane Wang 			|| ctx->__vmac_ctx.l3key[i+1] >= p64);
527*f1939f7cSShane Wang 	}
528*f1939f7cSShane Wang 
529*f1939f7cSShane Wang 	/* Invalidate nonce/aes cache and reset other elements */
530*f1939f7cSShane Wang 	ctx->__vmac_ctx.cached_nonce[0] = (u64)-1; /* Ensure illegal nonce */
531*f1939f7cSShane Wang 	ctx->__vmac_ctx.cached_nonce[1] = (u64)0;  /* Ensure illegal nonce */
532*f1939f7cSShane Wang 	ctx->__vmac_ctx.first_block_processed = 0;
533*f1939f7cSShane Wang 
534*f1939f7cSShane Wang 	return err;
535*f1939f7cSShane Wang }
536*f1939f7cSShane Wang 
537*f1939f7cSShane Wang static int vmac_setkey(struct crypto_shash *parent,
538*f1939f7cSShane Wang 		const u8 *key, unsigned int keylen)
539*f1939f7cSShane Wang {
540*f1939f7cSShane Wang 	struct vmac_ctx_t *ctx = crypto_shash_ctx(parent);
541*f1939f7cSShane Wang 
542*f1939f7cSShane Wang 	if (keylen != VMAC_KEY_LEN) {
543*f1939f7cSShane Wang 		crypto_shash_set_flags(parent, CRYPTO_TFM_RES_BAD_KEY_LEN);
544*f1939f7cSShane Wang 		return -EINVAL;
545*f1939f7cSShane Wang 	}
546*f1939f7cSShane Wang 
547*f1939f7cSShane Wang 	return vmac_set_key((u8 *)key, ctx);
548*f1939f7cSShane Wang }
549*f1939f7cSShane Wang 
550*f1939f7cSShane Wang static int vmac_init(struct shash_desc *pdesc)
551*f1939f7cSShane Wang {
552*f1939f7cSShane Wang 	struct crypto_shash *parent = pdesc->tfm;
553*f1939f7cSShane Wang 	struct vmac_ctx_t *ctx = crypto_shash_ctx(parent);
554*f1939f7cSShane Wang 
555*f1939f7cSShane Wang 	memset(&ctx->__vmac_ctx, 0, sizeof(struct vmac_ctx));
556*f1939f7cSShane Wang 	return 0;
557*f1939f7cSShane Wang }
558*f1939f7cSShane Wang 
559*f1939f7cSShane Wang static int vmac_update(struct shash_desc *pdesc, const u8 *p,
560*f1939f7cSShane Wang 		unsigned int len)
561*f1939f7cSShane Wang {
562*f1939f7cSShane Wang 	struct crypto_shash *parent = pdesc->tfm;
563*f1939f7cSShane Wang 	struct vmac_ctx_t *ctx = crypto_shash_ctx(parent);
564*f1939f7cSShane Wang 
565*f1939f7cSShane Wang 	vhash_update(p, len, &ctx->__vmac_ctx);
566*f1939f7cSShane Wang 
567*f1939f7cSShane Wang 	return 0;
568*f1939f7cSShane Wang }
569*f1939f7cSShane Wang 
570*f1939f7cSShane Wang static int vmac_final(struct shash_desc *pdesc, u8 *out)
571*f1939f7cSShane Wang {
572*f1939f7cSShane Wang 	struct crypto_shash *parent = pdesc->tfm;
573*f1939f7cSShane Wang 	struct vmac_ctx_t *ctx = crypto_shash_ctx(parent);
574*f1939f7cSShane Wang 	vmac_t mac;
575*f1939f7cSShane Wang 	u8 nonce[16] = {};
576*f1939f7cSShane Wang 
577*f1939f7cSShane Wang 	mac = vmac(NULL, 0, nonce, NULL, ctx);
578*f1939f7cSShane Wang 	memcpy(out, &mac, sizeof(vmac_t));
579*f1939f7cSShane Wang 	memset(&mac, 0, sizeof(vmac_t));
580*f1939f7cSShane Wang 	memset(&ctx->__vmac_ctx, 0, sizeof(struct vmac_ctx));
581*f1939f7cSShane Wang 	return 0;
582*f1939f7cSShane Wang }
583*f1939f7cSShane Wang 
584*f1939f7cSShane Wang static int vmac_init_tfm(struct crypto_tfm *tfm)
585*f1939f7cSShane Wang {
586*f1939f7cSShane Wang 	struct crypto_cipher *cipher;
587*f1939f7cSShane Wang 	struct crypto_instance *inst = (void *)tfm->__crt_alg;
588*f1939f7cSShane Wang 	struct crypto_spawn *spawn = crypto_instance_ctx(inst);
589*f1939f7cSShane Wang 	struct vmac_ctx_t *ctx = crypto_tfm_ctx(tfm);
590*f1939f7cSShane Wang 
591*f1939f7cSShane Wang 	cipher = crypto_spawn_cipher(spawn);
592*f1939f7cSShane Wang 	if (IS_ERR(cipher))
593*f1939f7cSShane Wang 		return PTR_ERR(cipher);
594*f1939f7cSShane Wang 
595*f1939f7cSShane Wang 	ctx->child = cipher;
596*f1939f7cSShane Wang 	return 0;
597*f1939f7cSShane Wang }
598*f1939f7cSShane Wang 
599*f1939f7cSShane Wang static void vmac_exit_tfm(struct crypto_tfm *tfm)
600*f1939f7cSShane Wang {
601*f1939f7cSShane Wang 	struct vmac_ctx_t *ctx = crypto_tfm_ctx(tfm);
602*f1939f7cSShane Wang 	crypto_free_cipher(ctx->child);
603*f1939f7cSShane Wang }
604*f1939f7cSShane Wang 
605*f1939f7cSShane Wang static int vmac_create(struct crypto_template *tmpl, struct rtattr **tb)
606*f1939f7cSShane Wang {
607*f1939f7cSShane Wang 	struct shash_instance *inst;
608*f1939f7cSShane Wang 	struct crypto_alg *alg;
609*f1939f7cSShane Wang 	int err;
610*f1939f7cSShane Wang 
611*f1939f7cSShane Wang 	err = crypto_check_attr_type(tb, CRYPTO_ALG_TYPE_SHASH);
612*f1939f7cSShane Wang 	if (err)
613*f1939f7cSShane Wang 		return err;
614*f1939f7cSShane Wang 
615*f1939f7cSShane Wang 	alg = crypto_get_attr_alg(tb, CRYPTO_ALG_TYPE_CIPHER,
616*f1939f7cSShane Wang 			CRYPTO_ALG_TYPE_MASK);
617*f1939f7cSShane Wang 	if (IS_ERR(alg))
618*f1939f7cSShane Wang 		return PTR_ERR(alg);
619*f1939f7cSShane Wang 
620*f1939f7cSShane Wang 	inst = shash_alloc_instance("vmac", alg);
621*f1939f7cSShane Wang 	err = PTR_ERR(inst);
622*f1939f7cSShane Wang 	if (IS_ERR(inst))
623*f1939f7cSShane Wang 		goto out_put_alg;
624*f1939f7cSShane Wang 
625*f1939f7cSShane Wang 	err = crypto_init_spawn(shash_instance_ctx(inst), alg,
626*f1939f7cSShane Wang 			shash_crypto_instance(inst),
627*f1939f7cSShane Wang 			CRYPTO_ALG_TYPE_MASK);
628*f1939f7cSShane Wang 	if (err)
629*f1939f7cSShane Wang 		goto out_free_inst;
630*f1939f7cSShane Wang 
631*f1939f7cSShane Wang 	inst->alg.base.cra_priority = alg->cra_priority;
632*f1939f7cSShane Wang 	inst->alg.base.cra_blocksize = alg->cra_blocksize;
633*f1939f7cSShane Wang 	inst->alg.base.cra_alignmask = alg->cra_alignmask;
634*f1939f7cSShane Wang 
635*f1939f7cSShane Wang 	inst->alg.digestsize = sizeof(vmac_t);
636*f1939f7cSShane Wang 	inst->alg.base.cra_ctxsize = sizeof(struct vmac_ctx_t);
637*f1939f7cSShane Wang 	inst->alg.base.cra_init = vmac_init_tfm;
638*f1939f7cSShane Wang 	inst->alg.base.cra_exit = vmac_exit_tfm;
639*f1939f7cSShane Wang 
640*f1939f7cSShane Wang 	inst->alg.init = vmac_init;
641*f1939f7cSShane Wang 	inst->alg.update = vmac_update;
642*f1939f7cSShane Wang 	inst->alg.final = vmac_final;
643*f1939f7cSShane Wang 	inst->alg.setkey = vmac_setkey;
644*f1939f7cSShane Wang 
645*f1939f7cSShane Wang 	err = shash_register_instance(tmpl, inst);
646*f1939f7cSShane Wang 	if (err) {
647*f1939f7cSShane Wang out_free_inst:
648*f1939f7cSShane Wang 		shash_free_instance(shash_crypto_instance(inst));
649*f1939f7cSShane Wang 	}
650*f1939f7cSShane Wang 
651*f1939f7cSShane Wang out_put_alg:
652*f1939f7cSShane Wang 	crypto_mod_put(alg);
653*f1939f7cSShane Wang 	return err;
654*f1939f7cSShane Wang }
655*f1939f7cSShane Wang 
656*f1939f7cSShane Wang static struct crypto_template vmac_tmpl = {
657*f1939f7cSShane Wang 	.name = "vmac",
658*f1939f7cSShane Wang 	.create = vmac_create,
659*f1939f7cSShane Wang 	.free = shash_free_instance,
660*f1939f7cSShane Wang 	.module = THIS_MODULE,
661*f1939f7cSShane Wang };
662*f1939f7cSShane Wang 
663*f1939f7cSShane Wang static int __init vmac_module_init(void)
664*f1939f7cSShane Wang {
665*f1939f7cSShane Wang 	return crypto_register_template(&vmac_tmpl);
666*f1939f7cSShane Wang }
667*f1939f7cSShane Wang 
668*f1939f7cSShane Wang static void __exit vmac_module_exit(void)
669*f1939f7cSShane Wang {
670*f1939f7cSShane Wang 	crypto_unregister_template(&vmac_tmpl);
671*f1939f7cSShane Wang }
672*f1939f7cSShane Wang 
673*f1939f7cSShane Wang module_init(vmac_module_init);
674*f1939f7cSShane Wang module_exit(vmac_module_exit);
675*f1939f7cSShane Wang 
676*f1939f7cSShane Wang MODULE_LICENSE("GPL");
677*f1939f7cSShane Wang MODULE_DESCRIPTION("VMAC hash algorithm");
678*f1939f7cSShane Wang 
679