cast.c revision 104476
1104476Ssam/*	$FreeBSD: head/sys/opencrypto/cast.c 104476 2002-10-04 20:31:23Z sam $	*/
2104476Ssam/*      $OpenBSD: cast.c,v 1.2 2000/06/06 06:49:47 deraadt Exp $       */
3104476Ssam
4104476Ssam/*
5104476Ssam *	CAST-128 in C
6104476Ssam *	Written by Steve Reid <sreid@sea-to-sky.net>
7104476Ssam *	100% Public Domain - no warranty
8104476Ssam *	Released 1997.10.11
9104476Ssam */
10104476Ssam
11104476Ssam#include <sys/types.h>
12104476Ssam#include <opencrypto/cast.h>
13104476Ssam#include <opencrypto/castsb.h>
14104476Ssam
/*
 * Macros to access 8-bit bytes out of a 32-bit word: "a" is the most
 * significant byte, "d" the least significant.  The argument is fully
 * parenthesized so that an expression may be passed safely.
 */
#define U_INT8_Ta(x) ( (u_int8_t) ((x)>>24) )
#define U_INT8_Tb(x) ( (u_int8_t) (((x)>>16)&255) )
#define U_INT8_Tc(x) ( (u_int8_t) (((x)>>8)&255) )
#define U_INT8_Td(x) ( (u_int8_t) ((x)&255) )

/*
 * Circular left shift of a 32-bit value by n bits, 0 <= n <= 31.
 * The right-shift count is reduced modulo 32 so that n == 0 yields x
 * unchanged instead of shifting by the full width of the operand,
 * which is undefined.  Both x and n are evaluated twice.
 */
#define ROL(x, n) ( ((x)<<(n)) | ((x)>>((32-(n))&31)) )

/*
 * CAST-128 uses three different round functions.
 *
 * Each macro mixes half-block r with subkey key->xkey[i], rotates the
 * result left by key->xkey[i+16], runs the four bytes of that word
 * through cast_sbox1..cast_sbox4 and XORs the combination into l.
 * The three variants differ only in which of +, ^ and - is used at each
 * position.
 *
 * They rely on two names from the expansion site: a "key" pointer whose
 * target has an xkey[] array, and a 32-bit scratch variable "t".  Each
 * expands to a single statement, so it is safe under an unbraced if/else.
 */
#define F1(l, r, i) do { \
	t = ROL(key->xkey[(i)] + (r), key->xkey[(i)+16]); \
	(l) ^= ((cast_sbox1[U_INT8_Ta(t)] ^ cast_sbox2[U_INT8_Tb(t)]) - \
	 cast_sbox3[U_INT8_Tc(t)]) + cast_sbox4[U_INT8_Td(t)]; \
} while (0)
#define F2(l, r, i) do { \
	t = ROL(key->xkey[(i)] ^ (r), key->xkey[(i)+16]); \
	(l) ^= ((cast_sbox1[U_INT8_Ta(t)] - cast_sbox2[U_INT8_Tb(t)]) + \
	 cast_sbox3[U_INT8_Tc(t)]) ^ cast_sbox4[U_INT8_Td(t)]; \
} while (0)
#define F3(l, r, i) do { \
	t = ROL(key->xkey[(i)] - (r), key->xkey[(i)+16]); \
	(l) ^= ((cast_sbox1[U_INT8_Ta(t)] + cast_sbox2[U_INT8_Tb(t)]) ^ \
	 cast_sbox3[U_INT8_Tc(t)]) - cast_sbox4[U_INT8_Td(t)]; \
} while (0)
37104476Ssam
38104476Ssam
39104476Ssam/***** Encryption Function *****/
40104476Ssam
41104476Ssamvoid cast_encrypt(cast_key* key, u_int8_t* inblock, u_int8_t* outblock)
42104476Ssam{
43104476Ssamu_int32_t t, l, r;
44104476Ssam
45104476Ssam	/* Get inblock into l,r */
46104476Ssam	l = ((u_int32_t)inblock[0] << 24) | ((u_int32_t)inblock[1] << 16) |
47104476Ssam	 ((u_int32_t)inblock[2] << 8) | (u_int32_t)inblock[3];
48104476Ssam	r = ((u_int32_t)inblock[4] << 24) | ((u_int32_t)inblock[5] << 16) |
49104476Ssam	 ((u_int32_t)inblock[6] << 8) | (u_int32_t)inblock[7];
50104476Ssam	/* Do the work */
51104476Ssam	F1(l, r,  0);
52104476Ssam	F2(r, l,  1);
53104476Ssam	F3(l, r,  2);
54104476Ssam	F1(r, l,  3);
55104476Ssam	F2(l, r,  4);
56104476Ssam	F3(r, l,  5);
57104476Ssam	F1(l, r,  6);
58104476Ssam	F2(r, l,  7);
59104476Ssam	F3(l, r,  8);
60104476Ssam	F1(r, l,  9);
61104476Ssam	F2(l, r, 10);
62104476Ssam	F3(r, l, 11);
63104476Ssam	/* Only do full 16 rounds if key length > 80 bits */
64104476Ssam	if (key->rounds > 12) {
65104476Ssam		F1(l, r, 12);
66104476Ssam		F2(r, l, 13);
67104476Ssam		F3(l, r, 14);
68104476Ssam		F1(r, l, 15);
69104476Ssam	}
70104476Ssam	/* Put l,r into outblock */
71104476Ssam	outblock[0] = U_INT8_Ta(r);
72104476Ssam	outblock[1] = U_INT8_Tb(r);
73104476Ssam	outblock[2] = U_INT8_Tc(r);
74104476Ssam	outblock[3] = U_INT8_Td(r);
75104476Ssam	outblock[4] = U_INT8_Ta(l);
76104476Ssam	outblock[5] = U_INT8_Tb(l);
77104476Ssam	outblock[6] = U_INT8_Tc(l);
78104476Ssam	outblock[7] = U_INT8_Td(l);
79104476Ssam	/* Wipe clean */
80104476Ssam	t = l = r = 0;
81104476Ssam}
82104476Ssam
83104476Ssam
84104476Ssam/***** Decryption Function *****/
85104476Ssam
86104476Ssamvoid cast_decrypt(cast_key* key, u_int8_t* inblock, u_int8_t* outblock)
87104476Ssam{
88104476Ssamu_int32_t t, l, r;
89104476Ssam
90104476Ssam	/* Get inblock into l,r */
91104476Ssam	r = ((u_int32_t)inblock[0] << 24) | ((u_int32_t)inblock[1] << 16) |
92104476Ssam	 ((u_int32_t)inblock[2] << 8) | (u_int32_t)inblock[3];
93104476Ssam	l = ((u_int32_t)inblock[4] << 24) | ((u_int32_t)inblock[5] << 16) |
94104476Ssam	 ((u_int32_t)inblock[6] << 8) | (u_int32_t)inblock[7];
95104476Ssam	/* Do the work */
96104476Ssam	/* Only do full 16 rounds if key length > 80 bits */
97104476Ssam	if (key->rounds > 12) {
98104476Ssam		F1(r, l, 15);
99104476Ssam		F3(l, r, 14);
100104476Ssam		F2(r, l, 13);
101104476Ssam		F1(l, r, 12);
102104476Ssam	}
103104476Ssam	F3(r, l, 11);
104104476Ssam	F2(l, r, 10);
105104476Ssam	F1(r, l,  9);
106104476Ssam	F3(l, r,  8);
107104476Ssam	F2(r, l,  7);
108104476Ssam	F1(l, r,  6);
109104476Ssam	F3(r, l,  5);
110104476Ssam	F2(l, r,  4);
111104476Ssam	F1(r, l,  3);
112104476Ssam	F3(l, r,  2);
113104476Ssam	F2(r, l,  1);
114104476Ssam	F1(l, r,  0);
115104476Ssam	/* Put l,r into outblock */
116104476Ssam	outblock[0] = U_INT8_Ta(l);
117104476Ssam	outblock[1] = U_INT8_Tb(l);
118104476Ssam	outblock[2] = U_INT8_Tc(l);
119104476Ssam	outblock[3] = U_INT8_Td(l);
120104476Ssam	outblock[4] = U_INT8_Ta(r);
121104476Ssam	outblock[5] = U_INT8_Tb(r);
122104476Ssam	outblock[6] = U_INT8_Tc(r);
123104476Ssam	outblock[7] = U_INT8_Td(r);
124104476Ssam	/* Wipe clean */
125104476Ssam	t = l = r = 0;
126104476Ssam}
127104476Ssam
128104476Ssam
/***** Key Schedule *****/
130104476Ssam
131104476Ssamvoid cast_setkey(cast_key* key, u_int8_t* rawkey, int keybytes)
132104476Ssam{
133104476Ssamu_int32_t t[4], z[4], x[4];
134104476Ssamint i;
135104476Ssam
136104476Ssam	/* Set number of rounds to 12 or 16, depending on key length */
137104476Ssam	key->rounds = (keybytes <= 10 ? 12 : 16);
138104476Ssam
139104476Ssam	/* Copy key to workspace x */
140104476Ssam	for (i = 0; i < 4; i++) {
141104476Ssam		x[i] = 0;
142104476Ssam		if ((i*4+0) < keybytes) x[i] = (u_int32_t)rawkey[i*4+0] << 24;
143104476Ssam		if ((i*4+1) < keybytes) x[i] |= (u_int32_t)rawkey[i*4+1] << 16;
144104476Ssam		if ((i*4+2) < keybytes) x[i] |= (u_int32_t)rawkey[i*4+2] << 8;
145104476Ssam		if ((i*4+3) < keybytes) x[i] |= (u_int32_t)rawkey[i*4+3];
146104476Ssam	}
147104476Ssam	/* Generate 32 subkeys, four at a time */
148104476Ssam	for (i = 0; i < 32; i+=4) {
149104476Ssam		switch (i & 4) {
150104476Ssam		 case 0:
151104476Ssam			t[0] = z[0] = x[0] ^ cast_sbox5[U_INT8_Tb(x[3])] ^
152104476Ssam			 cast_sbox6[U_INT8_Td(x[3])] ^ cast_sbox7[U_INT8_Ta(x[3])] ^
153104476Ssam			 cast_sbox8[U_INT8_Tc(x[3])] ^ cast_sbox7[U_INT8_Ta(x[2])];
154104476Ssam			t[1] = z[1] = x[2] ^ cast_sbox5[U_INT8_Ta(z[0])] ^
155104476Ssam			 cast_sbox6[U_INT8_Tc(z[0])] ^ cast_sbox7[U_INT8_Tb(z[0])] ^
156104476Ssam			 cast_sbox8[U_INT8_Td(z[0])] ^ cast_sbox8[U_INT8_Tc(x[2])];
157104476Ssam			t[2] = z[2] = x[3] ^ cast_sbox5[U_INT8_Td(z[1])] ^
158104476Ssam			 cast_sbox6[U_INT8_Tc(z[1])] ^ cast_sbox7[U_INT8_Tb(z[1])] ^
159104476Ssam			 cast_sbox8[U_INT8_Ta(z[1])] ^ cast_sbox5[U_INT8_Tb(x[2])];
160104476Ssam			t[3] = z[3] = x[1] ^ cast_sbox5[U_INT8_Tc(z[2])] ^
161104476Ssam			 cast_sbox6[U_INT8_Tb(z[2])] ^ cast_sbox7[U_INT8_Td(z[2])] ^
162104476Ssam			 cast_sbox8[U_INT8_Ta(z[2])] ^ cast_sbox6[U_INT8_Td(x[2])];
163104476Ssam			break;
164104476Ssam		 case 4:
165104476Ssam			t[0] = x[0] = z[2] ^ cast_sbox5[U_INT8_Tb(z[1])] ^
166104476Ssam			 cast_sbox6[U_INT8_Td(z[1])] ^ cast_sbox7[U_INT8_Ta(z[1])] ^
167104476Ssam			 cast_sbox8[U_INT8_Tc(z[1])] ^ cast_sbox7[U_INT8_Ta(z[0])];
168104476Ssam			t[1] = x[1] = z[0] ^ cast_sbox5[U_INT8_Ta(x[0])] ^
169104476Ssam			 cast_sbox6[U_INT8_Tc(x[0])] ^ cast_sbox7[U_INT8_Tb(x[0])] ^
170104476Ssam			 cast_sbox8[U_INT8_Td(x[0])] ^ cast_sbox8[U_INT8_Tc(z[0])];
171104476Ssam			t[2] = x[2] = z[1] ^ cast_sbox5[U_INT8_Td(x[1])] ^
172104476Ssam			 cast_sbox6[U_INT8_Tc(x[1])] ^ cast_sbox7[U_INT8_Tb(x[1])] ^
173104476Ssam			 cast_sbox8[U_INT8_Ta(x[1])] ^ cast_sbox5[U_INT8_Tb(z[0])];
174104476Ssam			t[3] = x[3] = z[3] ^ cast_sbox5[U_INT8_Tc(x[2])] ^
175104476Ssam			 cast_sbox6[U_INT8_Tb(x[2])] ^ cast_sbox7[U_INT8_Td(x[2])] ^
176104476Ssam			 cast_sbox8[U_INT8_Ta(x[2])] ^ cast_sbox6[U_INT8_Td(z[0])];
177104476Ssam			break;
178104476Ssam		}
179104476Ssam		switch (i & 12) {
180104476Ssam		 case 0:
181104476Ssam		 case 12:
182104476Ssam			key->xkey[i+0] = cast_sbox5[U_INT8_Ta(t[2])] ^ cast_sbox6[U_INT8_Tb(t[2])] ^
183104476Ssam			 cast_sbox7[U_INT8_Td(t[1])] ^ cast_sbox8[U_INT8_Tc(t[1])];
184104476Ssam			key->xkey[i+1] = cast_sbox5[U_INT8_Tc(t[2])] ^ cast_sbox6[U_INT8_Td(t[2])] ^
185104476Ssam			 cast_sbox7[U_INT8_Tb(t[1])] ^ cast_sbox8[U_INT8_Ta(t[1])];
186104476Ssam			key->xkey[i+2] = cast_sbox5[U_INT8_Ta(t[3])] ^ cast_sbox6[U_INT8_Tb(t[3])] ^
187104476Ssam			 cast_sbox7[U_INT8_Td(t[0])] ^ cast_sbox8[U_INT8_Tc(t[0])];
188104476Ssam			key->xkey[i+3] = cast_sbox5[U_INT8_Tc(t[3])] ^ cast_sbox6[U_INT8_Td(t[3])] ^
189104476Ssam			 cast_sbox7[U_INT8_Tb(t[0])] ^ cast_sbox8[U_INT8_Ta(t[0])];
190104476Ssam			break;
191104476Ssam		 case 4:
192104476Ssam		 case 8:
193104476Ssam			key->xkey[i+0] = cast_sbox5[U_INT8_Td(t[0])] ^ cast_sbox6[U_INT8_Tc(t[0])] ^
194104476Ssam			 cast_sbox7[U_INT8_Ta(t[3])] ^ cast_sbox8[U_INT8_Tb(t[3])];
195104476Ssam			key->xkey[i+1] = cast_sbox5[U_INT8_Tb(t[0])] ^ cast_sbox6[U_INT8_Ta(t[0])] ^
196104476Ssam			 cast_sbox7[U_INT8_Tc(t[3])] ^ cast_sbox8[U_INT8_Td(t[3])];
197104476Ssam			key->xkey[i+2] = cast_sbox5[U_INT8_Td(t[1])] ^ cast_sbox6[U_INT8_Tc(t[1])] ^
198104476Ssam			 cast_sbox7[U_INT8_Ta(t[2])] ^ cast_sbox8[U_INT8_Tb(t[2])];
199104476Ssam			key->xkey[i+3] = cast_sbox5[U_INT8_Tb(t[1])] ^ cast_sbox6[U_INT8_Ta(t[1])] ^
200104476Ssam			 cast_sbox7[U_INT8_Tc(t[2])] ^ cast_sbox8[U_INT8_Td(t[2])];
201104476Ssam			break;
202104476Ssam		}
203104476Ssam		switch (i & 12) {
204104476Ssam		 case 0:
205104476Ssam			key->xkey[i+0] ^= cast_sbox5[U_INT8_Tc(z[0])];
206104476Ssam			key->xkey[i+1] ^= cast_sbox6[U_INT8_Tc(z[1])];
207104476Ssam			key->xkey[i+2] ^= cast_sbox7[U_INT8_Tb(z[2])];
208104476Ssam			key->xkey[i+3] ^= cast_sbox8[U_INT8_Ta(z[3])];
209104476Ssam			break;
210104476Ssam		 case 4:
211104476Ssam			key->xkey[i+0] ^= cast_sbox5[U_INT8_Ta(x[2])];
212104476Ssam			key->xkey[i+1] ^= cast_sbox6[U_INT8_Tb(x[3])];
213104476Ssam			key->xkey[i+2] ^= cast_sbox7[U_INT8_Td(x[0])];
214104476Ssam			key->xkey[i+3] ^= cast_sbox8[U_INT8_Td(x[1])];
215104476Ssam			break;
216104476Ssam		 case 8:
217104476Ssam			key->xkey[i+0] ^= cast_sbox5[U_INT8_Tb(z[2])];
218104476Ssam			key->xkey[i+1] ^= cast_sbox6[U_INT8_Ta(z[3])];
219104476Ssam			key->xkey[i+2] ^= cast_sbox7[U_INT8_Tc(z[0])];
220104476Ssam			key->xkey[i+3] ^= cast_sbox8[U_INT8_Tc(z[1])];
221104476Ssam			break;
222104476Ssam		 case 12:
223104476Ssam			key->xkey[i+0] ^= cast_sbox5[U_INT8_Td(x[0])];
224104476Ssam			key->xkey[i+1] ^= cast_sbox6[U_INT8_Td(x[1])];
225104476Ssam			key->xkey[i+2] ^= cast_sbox7[U_INT8_Ta(x[2])];
226104476Ssam			key->xkey[i+3] ^= cast_sbox8[U_INT8_Tb(x[3])];
227104476Ssam			break;
228104476Ssam		}
229104476Ssam		if (i >= 16) {
230104476Ssam			key->xkey[i+0] &= 31;
231104476Ssam			key->xkey[i+1] &= 31;
232104476Ssam			key->xkey[i+2] &= 31;
233104476Ssam			key->xkey[i+3] &= 31;
234104476Ssam		}
235104476Ssam	}
236104476Ssam	/* Wipe clean */
237104476Ssam	for (i = 0; i < 4; i++) {
238104476Ssam		t[i] = x[i] = z[i] = 0;
239104476Ssam	}
240104476Ssam}
241104476Ssam
242104476Ssam/* Made in Canada */
243104476Ssam
244