]> git.cryptolib.org Git - arm-crypto-lib.git/blob - serpent/serpent-sboxes-bitslice.c
switching to dedicated endian switching function
[arm-crypto-lib.git] / serpent / serpent-sboxes-bitslice.c
1 /* serpent-sboxes-bitslice.c */
2 /*
3     This file is part of the ARM-Crypto-Lib.
4     Copyright (C) 2006-2010  Daniel Otte (daniel.otte@rub.de)
5
6     This program is free software: you can redistribute it and/or modify
7     it under the terms of the GNU General Public License as published by
8     the Free Software Foundation, either version 3 of the License, or
9     (at your option) any later version.
10
11     This program is distributed in the hope that it will be useful,
12     but WITHOUT ANY WARRANTY; without even the implied warranty of
13     MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
14     GNU General Public License for more details.
15
16     You should have received a copy of the GNU General Public License
17     along with this program.  If not, see <http://www.gnu.org/licenses/>.
18 */
19 /* serpent-sboxes.c
20  * a bitsliced implementation of the serpent sboxes
21  * author: Daniel Otte 
22  * email:  daniel.otte@rub.de
23  * license: GPLv3
24  */
25
26 #include <stdint.h>
27 #include <string.h>
28 #include "serpent-sboxes.h"
29
30
31 /* S0:   3  8 15  1 10  6  5 11 14 13  4  2  7  0  9 12 */
32
33 /* depth = 5,7,4,2, Total gates=18 */
34 static
35 void sb0(uint8_t* out, const uint8_t* in){
36 // (a,b,c,d,w,x,y,z) 
37         uint8_t t01, t02, t03, t05, t06, t07, t08, t09, t11, t12, t13, t14, t15, t17;
38         t01          = in[4*1]  ^ in[4*2]; 
39         t02          = in[4*0]  | in[4*3]; 
40         t03          = in[4*0]  ^ in[4*1]; 
41         out[4*3]   = t02        ^ t01; 
42         t05          = in[4*2]  | out[4*3]; 
43         t06          = in[4*0]  ^ in[4*3]; 
44         t07          = in[4*1]  | in[4*2]; 
45         t08          = in[4*3]  & t05; 
46         t09          = t03        & t07; 
47         out[4*2]   = t09        ^ t08; 
48         t11          = t09        & out[4*2]; 
49         t12          = in[4*2]  ^ in[4*3]; 
50         t13          = t07        ^ t11; 
51         t14          = in[4*1]  & t06; 
52         t15          = t06        ^ t13; 
53         out[4*0]   =     ~ t15; 
54         t17          = out[4*0] ^ t14; 
55         out[4*1]   = t12        ^ t17; 
56 }
57
58 /* InvS0:  13  3 11  0 10  6  5 12  1 14  4  7 15  9  8  2 */
59
60 /* depth = 8,4,3,6, Total gates=19 */
61 static
62 void sb0_inv(uint8_t* out, const uint8_t* in){
63         uint8_t t02, t03, t04, t05, t06, t08, t09, t10, t12, t13, t14, t15, t17, t18, t01;
64         t01          = in[4*2] ^ in[4*3];
65         t02          = in[4*0] | in[4*1];
66         t03          = in[4*1] | in[4*2];
67         t04          = in[4*2] & t01;
68         t05          = t02       ^ t01;
69         t06          = in[4*0] | t04;
70         out[4*2]   =     ~ t05;
71         t08          = in[4*1]   ^ in[4*3];
72         t09          = t03       & t08;
73         t10          = in[4*3]   | out[4*2];
74         out[4*1]   = t09       ^ t06;
75         t12          = in[4*0]   | t05;
76         t13          = out[4*1]   ^ t12;
77         t14          = t03       ^ t10;
78         t15          = in[4*0]   ^ in[4*2];
79         out[4*3]   = t14       ^ t13;
80         t17          = t05       & t13;
81         t18          = t14       | t17;
82         out[4*0]   = t15       ^ t18; 
83 }
84
85 /* S1:  15 12  2  7  9  0  5 10  1 11 14  8  6 13  3  4 */
86
87 /* depth = 10,7,3,5, Total gates=18 */
88 static 
89 void sb1(uint8_t* out, const uint8_t* in){
90         uint8_t t02, t03, t04, t05, t06, t07, t08, t10, t11, t12, t13, t16, t17, t01;
91         t01          = in[4*0]   | in[4*3];
92         t02          = in[4*2]   ^ in[4*3];
93         t03          =     ~ in[4*1];
94         t04          = in[4*0]   ^ in[4*2];
95         t05          = in[4*0]   | t03;
96         t06          = in[4*3]   & t04;
97         t07          = t01       & t02;
98         t08          = in[4*1]   | t06;
99         out[4*2]   = t02       ^ t05;
100         t10          = t07       ^ t08;
101         t11          = t01       ^ t10;
102         t12          = out[4*2]   ^ t11;
103         t13          = in[4*1]   & in[4*3];
104         out[4*3]   =     ~ t10;
105         out[4*1]   = t13       ^ t12;
106         t16          = t10       | out[4*1];
107         t17          = t05       & t16;
108         out[4*0]   = in[4*2]   ^ t17; 
109 }
110
111 /* InvS1:   5  8  2 14 15  6 12  3 11  4  7  9  1 13 10  0 */
112
113 /* depth = 7,4,5,3, Total gates=18 */
114 static void sb1_inv(uint8_t* out, const uint8_t* in){
115         uint8_t t02, t03, t04, t05, t06, t07, t08, t09, t10, t11, t14, t15, t17, t01;
116         t01          = in[4*0]   ^ in[4*1];
117         t02          = in[4*1]   | in[4*3];
118         t03          = in[4*0]   & in[4*2];
119         t04          = in[4*2]   ^ t02;
120         t05          = in[4*0]   | t04;
121         t06          = t01       & t05;
122         t07          = in[4*3]   | t03;
123         t08          = in[4*1]   ^ t06;
124         t09          = t07       ^ t06;
125         t10          = t04       | t03;
126         t11          = in[4*3]   & t08;
127         out[4*2]   =     ~ t09;
128         out[4*1]   = t10       ^ t11;
129         t14          = in[4*0]   | out[4*2];
130         t15          = t06       ^ out[4*1];
131         out[4*3]   = t01       ^ t04;
132         t17          = in[4*2]   ^ t15;
133         out[4*0]   = t14       ^ t17; 
134 }
135
136 /* S2:   8  6  7  9  3 12 10 15 13  1 14  4  0 11  5  2 */
137
138 /* depth = 3,8,11,7, Total gates=16 */
139 static void sb2(uint8_t* out, const uint8_t* in){
140         uint8_t t02, t03, t05, t06, t07, t08, t09, t10, t12, t13, t14, t01;
141         t01          = in[4*0]   | in[4*2];
142         t02          = in[4*0]   ^ in[4*1];
143         t03          = in[4*3]   ^ t01;
144         out[4*0]   = t02       ^ t03;
145         t05          = in[4*2]   ^ out[4*0];
146         t06          = in[4*1]   ^ t05;
147         t07          = in[4*1]   | t05;
148         t08          = t01       & t06;
149         t09          = t03       ^ t07;
150         t10          = t02       | t09;
151         out[4*1]   = t10       ^ t08;
152         t12          = in[4*0]   | in[4*3];
153         t13          = t09       ^ out[4*1];
154         t14          = in[4*1]   ^ t13;
155         out[4*3]   =     ~ t09;
156         out[4*2]   = t12       ^ t14; 
157 }
158
159 /* InvS2:  12  9 15  4 11 14  1  2  0  3  6 13  5  8 10  7 */
160
161 /* depth = 3,6,8,3, Total gates=18 */
162 static void sb2_inv(uint8_t* out, const uint8_t* in){
163         uint8_t t02, t03, t04, t06, t07, t08, t09, t10, t11, t12, t15, t16, t17, t01;
164         t01          = in[4*0]   ^ in[4*3];
165         t02          = in[4*2]   ^ in[4*3];
166         t03          = in[4*0]   & in[4*2];
167         t04          = in[4*1]   | t02;
168         out[4*0]   = t01       ^ t04;
169         t06          = in[4*0]   | in[4*2];
170         t07          = in[4*3]   | out[4*0];
171         t08          =     ~ in[4*3];
172         t09          = in[4*1]   & t06;
173         t10          = t08       | t03;
174         t11          = in[4*1]   & t07;
175         t12          = t06       & t02;
176         out[4*3]   = t09       ^ t10;
177         out[4*1]   = t12       ^ t11;
178         t15          = in[4*2]   & out[4*3];
179         t16          = out[4*0]   ^ out[4*1];
180         t17          = t10       ^ t15;
181         out[4*2]   = t16       ^ t17; 
182 }
183
184 /* S3:   0 15 11  8 12  9  6  3 13  1  2  4 10  7  5 14 */
185
186 /* depth = 8,3,5,5, Total gates=18 */
187 static void sb3(uint8_t* out, const uint8_t* in){
188         uint8_t t02, t03, t04, t05, t06, t07, t08, t09, t10, t11, t13, t14, t15, t01;
189         t01          = in[4*0]   ^ in[4*2];
190         t02          = in[4*0]   | in[4*3];
191         t03          = in[4*0]   & in[4*3];
192         t04          = t01       & t02;
193         t05          = in[4*1]   | t03;
194         t06          = in[4*0]   & in[4*1];
195         t07          = in[4*3]   ^ t04;
196         t08          = in[4*2]   | t06;
197         t09          = in[4*1]   ^ t07;
198         t10          = in[4*3]   & t05;
199         t11          = t02       ^ t10;
200         out[4*3]   = t08       ^ t09;
201         t13          = in[4*3]   | out[4*3];
202         t14          = in[4*0]   | t07;
203         t15          = in[4*1]   & t13;
204         out[4*2]   = t08       ^ t11;
205         out[4*0]   = t14       ^ t15;
206         out[4*1]   = t05       ^ t04; 
207 }
208
209 /* InvS3:   0  9 10  7 11 14  6 13  3  5 12  2  4  8 15  1 */
210
211 /* depth = 3,6,4,4, Total gates=17 */
212 static void sb3_inv(uint8_t* out, const uint8_t* in){
213         uint8_t t02, t03, t04, t05, t06, t07, t09, t11, t12, t13, t14, t16, t01;
214         t01          = in[4*2]   | in[4*3];
215         t02          = in[4*0]   | in[4*3];
216         t03          = in[4*2]   ^ t02;
217         t04          = in[4*1]   ^ t02;
218         t05          = in[4*0]   ^ in[4*3];
219         t06          = t04       & t03;
220         t07          = in[4*1]   & t01;
221         out[4*2]   = t05       ^ t06;
222         t09          = in[4*0]   ^ t03;
223         out[4*0]   = t07       ^ t03;
224         t11          = out[4*0]   | t05;
225         t12          = t09       & t11;
226         t13          = in[4*0]   & out[4*2];
227         t14          = t01       ^ t05;
228         out[4*1]   = in[4*1]   ^ t12;
229         t16          = in[4*1]   | t13;
230         out[4*3]   = t14       ^ t16; 
231 }
232
233 /* S4:   1 15  8  3 12  0 11  6  2  5  4 10  9 14  7 13 */
234
235 /* depth = 6,7,5,3, Total gates=19 */
236 static void sb4(uint8_t* out, const uint8_t* in){
237         uint8_t t02, t03, t04, t05, t06, t08, t09, t10, t11, t12, t13, t14, t15, t16, t01;
238         t01          = in[4*0]   | in[4*1];
239         t02          = in[4*1]   | in[4*2];
240         t03          = in[4*0]   ^ t02;
241         t04          = in[4*1]   ^ in[4*3];
242         t05          = in[4*3]   | t03;
243         t06          = in[4*3]   & t01;
244         out[4*3]   = t03       ^ t06;
245         t08          = out[4*3]   & t04;
246         t09          = t04       & t05;
247         t10          = in[4*2]   ^ t06;
248         t11          = in[4*1]   & in[4*2];
249         t12          = t04       ^ t08;
250         t13          = t11       | t03;
251         t14          = t10       ^ t09;
252         t15          = in[4*0]   & t05;
253         t16          = t11       | t12;
254         out[4*2]   = t13       ^ t08;
255         out[4*1]   = t15       ^ t16;
256         out[4*0]   =     ~ t14; 
257 }
258
259 /* InvS4:   5  0  8  3 10  9  7 14  2 12 11  6  4 15 13  1 */
260
261 /* depth = 6,4,7,3, Total gates=17 */
262 static void sb4_inv(uint8_t* out, const uint8_t* in){
263         uint8_t t02, t03, t04, t05, t06, t07, t09, t10, t11, t12, t13, t15, t01;
264         t01          = in[4*1]   | in[4*3];
265         t02          = in[4*2]   | in[4*3];
266         t03          = in[4*0]   & t01;
267         t04          = in[4*1]   ^ t02;
268         t05          = in[4*2]   ^ in[4*3];
269         t06          =     ~ t03;
270         t07          = in[4*0]   & t04;
271         out[4*1]   = t05       ^ t07;
272         t09          = out[4*1]   | t06;
273         t10          = in[4*0]   ^ t07;
274         t11          = t01       ^ t09;
275         t12          = in[4*3]   ^ t04;
276         t13          = in[4*2]   | t10;
277         out[4*3]   = t03       ^ t12;
278         t15          = in[4*0]   ^ t04;
279         out[4*2]   = t11       ^ t13;
280         out[4*0]   = t15       ^ t09; 
281 }
282
283 /* S5:  15  5  2 11  4 10  9 12  0  3 14  8 13  6  7  1 */
284
285 /* depth = 4,6,8,6, Total gates=17 */
286 static void sb5(uint8_t* out, const uint8_t* in){
287         uint8_t t02, t03, t04, t05, t07, t08, t09, t10, t11, t12, t13, t14, t01;
288         t01          = in[4*1]   ^ in[4*3];
289         t02          = in[4*1]   | in[4*3];
290         t03          = in[4*0]   & t01;
291         t04          = in[4*2]   ^ t02;
292         t05          = t03       ^ t04;
293         out[4*0]   =     ~ t05;
294         t07          = in[4*0]   ^ t01;
295         t08          = in[4*3]   | out[4*0];
296         t09          = in[4*1]   | t05;
297         t10          = in[4*3]   ^ t08;
298         t11          = in[4*1]   | t07;
299         t12          = t03       | out[4*0];
300         t13          = t07       | t10;
301         t14          = t01       ^ t11;
302         out[4*2]   = t09       ^ t13;
303         out[4*1]   = t07       ^ t08;
304         out[4*3]   = t12       ^ t14; 
305 }
306
307 /* InvS5:   8 15  2  9  4  1 13 14 11  6  5  3  7 12 10  0 */
308
309 /* depth = 4,6,9,7, Total gates=17 */
310 static void sb5_inv(uint8_t* out, const uint8_t* in){
311         uint8_t t02, t03, t04, t05, t07, t08, t09, t10, t12, t13, t15, t16, t01;
312         t01          = in[4*0]   & in[4*3];
313         t02          = in[4*2]   ^ t01;
314         t03          = in[4*0]   ^ in[4*3];
315         t04          = in[4*1]   & t02;
316         t05          = in[4*0]   & in[4*2];
317         out[4*0]   = t03       ^ t04;
318         t07          = in[4*0]   & out[4*0];
319         t08          = t01       ^ out[4*0];
320         t09          = in[4*1]   | t05;
321         t10          =     ~ in[4*1];
322         out[4*1]   = t08       ^ t09;
323         t12          = t10       | t07;
324         t13          = out[4*0]   | out[4*1];
325         out[4*3]   = t02       ^ t12;
326         t15          = t02       ^ t13;
327         t16          = in[4*1]   ^ in[4*3];
328         out[4*2]   = t16       ^ t15; 
329 }
330
331 /* S6:   7  2 12  5  8  4  6 11 14  9  1 15 13  3 10  0 */
332
333 /* depth = 8,3,6,3, Total gates=19 */
334 static void sb6(uint8_t* out, const uint8_t* in){
335         uint8_t t02, t03, t04, t05, t07, t08, t09, t10, t11, t12, t13, t15, t17, t18, t01;
336         t01          = in[4*0]   & in[4*3];
337         t02          = in[4*1]   ^ in[4*2];
338         t03          = in[4*0]   ^ in[4*3];
339         t04          = t01       ^ t02;
340         t05          = in[4*1]   | in[4*2];
341         out[4*1]   =     ~ t04;
342         t07          = t03       & t05;
343         t08          = in[4*1]   & out[4*1];
344         t09          = in[4*0]   | in[4*2];
345         t10          = t07       ^ t08;
346         t11          = in[4*1]   | in[4*3];
347         t12          = in[4*2]   ^ t11;
348         t13          = t09       ^ t10;
349         out[4*2]   =     ~ t13;
350         t15          = out[4*1]   & t03;
351         out[4*3]   = t12       ^ t07;
352         t17          = in[4*0]   ^ in[4*1];
353         t18          = out[4*2]   ^ t15;
354         out[4*0]   = t17       ^ t18; 
355 }
356
357 /* InvS6:  15 10  1 13  5  3  6  0  4  9 14  7  2 12  8 11 */
358
359 /* depth = 5,3,8,6, Total gates=19 */
360 static void sb6_inv(uint8_t* out, const uint8_t* in){
361         uint8_t t02, t03, t04, t05, t06, t07, t08, t09, t12, t13, t14, t15, t16, t17, t01;
362         t01          = in[4*0]   ^ in[4*2];
363         t02          =     ~ in[4*2];
364         t03          = in[4*1]   & t01;
365         t04          = in[4*1]   | t02;
366         t05          = in[4*3]   | t03;
367         t06          = in[4*1]   ^ in[4*3];
368         t07          = in[4*0]   & t04;
369         t08          = in[4*0]   | t02;
370         t09          = t07       ^ t05;
371         out[4*1]   = t06       ^ t08;
372         out[4*0]   =     ~ t09;
373         t12          = in[4*1]   & out[4*0];
374         t13          = t01       & t05;
375         t14          = t01       ^ t12;
376         t15          = t07       ^ t13;
377         t16          = in[4*3]   | t02;
378         t17          = in[4*0]   ^ out[4*1];
379         out[4*3]   = t17       ^ t15;
380         out[4*2]   = t16       ^ t14; 
381 }
382
383 /* S7:   1 13 15  0 14  8  2 11  7  4 12 10  9  3  5  6 */
384
385 /* depth = 10,7,10,4, Total gates=19 */
386 static void sb7(uint8_t* out, const uint8_t* in){
387         uint8_t t02, t03, t04, t05, t06, t08, t09, t10, t11, t13, t14, t15, t16, t17, t01;
388         t01          = in[4*0]   & in[4*2];
389         t02          =     ~ in[4*3];
390         t03          = in[4*0]   & t02;
391         t04          = in[4*1]   | t01;
392         t05          = in[4*0]   & in[4*1];
393         t06          = in[4*2]   ^ t04;
394         out[4*3]   = t03       ^ t06;
395         t08          = in[4*2]   | out[4*3];
396         t09          = in[4*3]   | t05;
397         t10          = in[4*0]   ^ t08;
398         t11          = t04       & out[4*3];
399         out[4*1]   = t09       ^ t10;
400         t13          = in[4*1]   ^ out[4*1];
401         t14          = t01       ^ out[4*1];
402         t15          = in[4*2]   ^ t05;
403         t16          = t11       | t13;
404         t17          = t02       | t14;
405         out[4*0]   = t15       ^ t17;
406         out[4*2]   = in[4*0]   ^ t16; 
407 }
408
409 /* InvS7:   3  0  6 13  9 14 15  8  5 12 11  7 10  1  4  2 */
410
411 /* depth = 9,7,3,3, Total gates=18 */
412 static void sb7_inv(uint8_t* out, const uint8_t* in){
413         uint8_t t02, t03, t04, t06, t07, t08, t09, t10, t11, t13, t14, t15, t16, t01;
414         t01          = in[4*0]   & in[4*1];
415         t02          = in[4*0]   | in[4*1];
416         t03          = in[4*2]   | t01;
417         t04          = in[4*3]   & t02;
418         out[4*3]   = t03       ^ t04;
419         t06          = in[4*1]   ^ t04;
420         t07          = in[4*3]   ^ out[4*3];
421         t08          =     ~ t07;
422         t09          = t06       | t08;
423         t10          = in[4*1]   ^ in[4*3];
424         t11          = in[4*0]   | in[4*3];
425         out[4*1]   = in[4*0]   ^ t09;
426         t13          = in[4*2]   ^ t06;
427         t14          = in[4*2]   & t11;
428         t15          = in[4*3]   | out[4*1];
429         t16          = t01       | t10;
430         out[4*0]   = t13       ^ t15;
431         out[4*2]   = t14       ^ t16; 
432 }
433
434 typedef void(*sb_fpt)(uint8_t*, const uint8_t*);
435
436 const sb_fpt sf_tab[]= {
437         sb0, sb1, sb2, sb3, 
438         sb4, sb5, sb6, sb7
439 };
440
441 const sb_fpt sinvf_tab[] = {
442         sb0_inv, sb1_inv, sb2_inv, sb3_inv, 
443         sb4_inv, sb5_inv, sb6_inv, sb7_inv
444 };
445
446 void sbox128(void * w, uint8_t box){
447         uint8_t i, buffer[16];
448         box &= 0x7;
449         
450         sb_fpt fp;
451         fp = (sb_fpt)(sf_tab[box]);
452         for(i=0; i<4; ++i){
453                 fp(buffer+i, (uint8_t*)w+i);
454         }
455         memcpy(w, buffer, 16);
456 }
457
458 void inv_sbox128(void * w, uint8_t box){
459         uint8_t i, buffer[16];
460         box &= 0x7;
461         
462         sb_fpt fp;
463         fp = (sb_fpt)(sinvf_tab[box]);
464         for(i=0; i<4; ++i){
465                 fp(buffer+i, (uint8_t*)w+i);
466         }
467         memcpy(w, buffer, 16);
468 }
469
470
471
472
473
474
475
476