1 /* serpent-sboxes-bitslice.c */
3 This file is part of the ARM-Crypto-Lib.
4 Copyright (C) 2006-2010 Daniel Otte (daniel.otte@rub.de)
6 This program is free software: you can redistribute it and/or modify
7 it under the terms of the GNU General Public License as published by
8 the Free Software Foundation, either version 3 of the License, or
9 (at your option) any later version.
11 This program is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 GNU General Public License for more details.
16 You should have received a copy of the GNU General Public License
17 along with this program. If not, see <http://www.gnu.org/licenses/>.
20 * a bitsliced implementation of the serpent sboxes
22 * email: daniel.otte@rub.de
28 #include "serpent-sboxes.h"
31 /* S0: 3 8 15 1 10 6 5 11 14 13 4 2 7 0 9 12 */
33 /* depth = 5,7,4,2, Total gates=18 */
35 void sb0(uint8_t* out, const uint8_t* in){
37 uint8_t t01, t02, t03, t05, t06, t07, t08, t09, t11, t12, t13, t14, t15, t17;
38 t01 = in[4*1] ^ in[4*2];
39 t02 = in[4*0] | in[4*3];
40 t03 = in[4*0] ^ in[4*1];
42 t05 = in[4*2] | out[4*3];
43 t06 = in[4*0] ^ in[4*3];
44 t07 = in[4*1] | in[4*2];
49 t12 = in[4*2] ^ in[4*3];
58 /* InvS0: 13 3 11 0 10 6 5 12 1 14 4 7 15 9 8 2 */
60 /* depth = 8,4,3,6, Total gates=19 */
62 void sb0_inv(uint8_t* out, const uint8_t* in){
63 uint8_t t02, t03, t04, t05, t06, t08, t09, t10, t12, t13, t14, t15, t17, t18, t01;
64 t01 = in[4*2] ^ in[4*3];
65 t02 = in[4*0] | in[4*1];
66 t03 = in[4*1] | in[4*2];
71 t08 = in[4*1] ^ in[4*3];
73 t10 = in[4*3] | out[4*2];
78 t15 = in[4*0] ^ in[4*2];
85 /* S1: 15 12 2 7 9 0 5 10 1 11 14 8 6 13 3 4 */
87 /* depth = 10,7,3,5, Total gates=18 */
89 void sb1(uint8_t* out, const uint8_t* in){
90 uint8_t t02, t03, t04, t05, t06, t07, t08, t10, t11, t12, t13, t16, t17, t01;
91 t01 = in[4*0] | in[4*3];
92 t02 = in[4*2] ^ in[4*3];
94 t04 = in[4*0] ^ in[4*2];
102 t12 = out[4*2] ^ t11;
103 t13 = in[4*1] & in[4*3];
105 out[4*1] = t13 ^ t12;
106 t16 = t10 | out[4*1];
108 out[4*0] = in[4*2] ^ t17;
111 /* InvS1: 5 8 2 14 15 6 12 3 11 4 7 9 1 13 10 0 */
113 /* depth = 7,4,5,3, Total gates=18 */
114 static void sb1_inv(uint8_t* out, const uint8_t* in){
115 uint8_t t02, t03, t04, t05, t06, t07, t08, t09, t10, t11, t14, t15, t17, t01;
116 t01 = in[4*0] ^ in[4*1];
117 t02 = in[4*1] | in[4*3];
118 t03 = in[4*0] & in[4*2];
128 out[4*1] = t10 ^ t11;
129 t14 = in[4*0] | out[4*2];
130 t15 = t06 ^ out[4*1];
131 out[4*3] = t01 ^ t04;
133 out[4*0] = t14 ^ t17;
136 /* S2: 8 6 7 9 3 12 10 15 13 1 14 4 0 11 5 2 */
138 /* depth = 3,8,11,7, Total gates=16 */
139 static void sb2(uint8_t* out, const uint8_t* in){
140 uint8_t t02, t03, t05, t06, t07, t08, t09, t10, t12, t13, t14, t01;
141 t01 = in[4*0] | in[4*2];
142 t02 = in[4*0] ^ in[4*1];
144 out[4*0] = t02 ^ t03;
145 t05 = in[4*2] ^ out[4*0];
151 out[4*1] = t10 ^ t08;
152 t12 = in[4*0] | in[4*3];
153 t13 = t09 ^ out[4*1];
156 out[4*2] = t12 ^ t14;
159 /* InvS2: 12 9 15 4 11 14 1 2 0 3 6 13 5 8 10 7 */
161 /* depth = 3,6,8,3, Total gates=18 */
162 static void sb2_inv(uint8_t* out, const uint8_t* in){
163 uint8_t t02, t03, t04, t06, t07, t08, t09, t10, t11, t12, t15, t16, t17, t01;
164 t01 = in[4*0] ^ in[4*3];
165 t02 = in[4*2] ^ in[4*3];
166 t03 = in[4*0] & in[4*2];
168 out[4*0] = t01 ^ t04;
169 t06 = in[4*0] | in[4*2];
170 t07 = in[4*3] | out[4*0];
176 out[4*3] = t09 ^ t10;
177 out[4*1] = t12 ^ t11;
178 t15 = in[4*2] & out[4*3];
179 t16 = out[4*0] ^ out[4*1];
181 out[4*2] = t16 ^ t17;
184 /* S3: 0 15 11 8 12 9 6 3 13 1 2 4 10 7 5 14 */
186 /* depth = 8,3,5,5, Total gates=18 */
187 static void sb3(uint8_t* out, const uint8_t* in){
188 uint8_t t02, t03, t04, t05, t06, t07, t08, t09, t10, t11, t13, t14, t15, t01;
189 t01 = in[4*0] ^ in[4*2];
190 t02 = in[4*0] | in[4*3];
191 t03 = in[4*0] & in[4*3];
194 t06 = in[4*0] & in[4*1];
200 out[4*3] = t08 ^ t09;
201 t13 = in[4*3] | out[4*3];
204 out[4*2] = t08 ^ t11;
205 out[4*0] = t14 ^ t15;
206 out[4*1] = t05 ^ t04;
209 /* InvS3: 0 9 10 7 11 14 6 13 3 5 12 2 4 8 15 1 */
211 /* depth = 3,6,4,4, Total gates=17 */
212 static void sb3_inv(uint8_t* out, const uint8_t* in){
213 uint8_t t02, t03, t04, t05, t06, t07, t09, t11, t12, t13, t14, t16, t01;
214 t01 = in[4*2] | in[4*3];
215 t02 = in[4*0] | in[4*3];
218 t05 = in[4*0] ^ in[4*3];
221 out[4*2] = t05 ^ t06;
223 out[4*0] = t07 ^ t03;
224 t11 = out[4*0] | t05;
226 t13 = in[4*0] & out[4*2];
228 out[4*1] = in[4*1] ^ t12;
230 out[4*3] = t14 ^ t16;
233 /* S4: 1 15 8 3 12 0 11 6 2 5 4 10 9 14 7 13 */
235 /* depth = 6,7,5,3, Total gates=19 */
236 static void sb4(uint8_t* out, const uint8_t* in){
237 uint8_t t02, t03, t04, t05, t06, t08, t09, t10, t11, t12, t13, t14, t15, t16, t01;
238 t01 = in[4*0] | in[4*1];
239 t02 = in[4*1] | in[4*2];
241 t04 = in[4*1] ^ in[4*3];
244 out[4*3] = t03 ^ t06;
245 t08 = out[4*3] & t04;
248 t11 = in[4*1] & in[4*2];
254 out[4*2] = t13 ^ t08;
255 out[4*1] = t15 ^ t16;
259 /* InvS4: 5 0 8 3 10 9 7 14 2 12 11 6 4 15 13 1 */
261 /* depth = 6,4,7,3, Total gates=17 */
262 static void sb4_inv(uint8_t* out, const uint8_t* in){
263 uint8_t t02, t03, t04, t05, t06, t07, t09, t10, t11, t12, t13, t15, t01;
264 t01 = in[4*1] | in[4*3];
265 t02 = in[4*2] | in[4*3];
268 t05 = in[4*2] ^ in[4*3];
271 out[4*1] = t05 ^ t07;
272 t09 = out[4*1] | t06;
277 out[4*3] = t03 ^ t12;
279 out[4*2] = t11 ^ t13;
280 out[4*0] = t15 ^ t09;
283 /* S5: 15 5 2 11 4 10 9 12 0 3 14 8 13 6 7 1 */
285 /* depth = 4,6,8,6, Total gates=17 */
286 static void sb5(uint8_t* out, const uint8_t* in){
287 uint8_t t02, t03, t04, t05, t07, t08, t09, t10, t11, t12, t13, t14, t01;
288 t01 = in[4*1] ^ in[4*3];
289 t02 = in[4*1] | in[4*3];
295 t08 = in[4*3] | out[4*0];
299 t12 = t03 | out[4*0];
302 out[4*2] = t09 ^ t13;
303 out[4*1] = t07 ^ t08;
304 out[4*3] = t12 ^ t14;
307 /* InvS5: 8 15 2 9 4 1 13 14 11 6 5 3 7 12 10 0 */
309 /* depth = 4,6,9,7, Total gates=17 */
310 static void sb5_inv(uint8_t* out, const uint8_t* in){
311 uint8_t t02, t03, t04, t05, t07, t08, t09, t10, t12, t13, t15, t16, t01;
312 t01 = in[4*0] & in[4*3];
314 t03 = in[4*0] ^ in[4*3];
316 t05 = in[4*0] & in[4*2];
317 out[4*0] = t03 ^ t04;
318 t07 = in[4*0] & out[4*0];
319 t08 = t01 ^ out[4*0];
322 out[4*1] = t08 ^ t09;
324 t13 = out[4*0] | out[4*1];
325 out[4*3] = t02 ^ t12;
327 t16 = in[4*1] ^ in[4*3];
328 out[4*2] = t16 ^ t15;
331 /* S6: 7 2 12 5 8 4 6 11 14 9 1 15 13 3 10 0 */
333 /* depth = 8,3,6,3, Total gates=19 */
334 static void sb6(uint8_t* out, const uint8_t* in){
335 uint8_t t02, t03, t04, t05, t07, t08, t09, t10, t11, t12, t13, t15, t17, t18, t01;
336 t01 = in[4*0] & in[4*3];
337 t02 = in[4*1] ^ in[4*2];
338 t03 = in[4*0] ^ in[4*3];
340 t05 = in[4*1] | in[4*2];
343 t08 = in[4*1] & out[4*1];
344 t09 = in[4*0] | in[4*2];
346 t11 = in[4*1] | in[4*3];
350 t15 = out[4*1] & t03;
351 out[4*3] = t12 ^ t07;
352 t17 = in[4*0] ^ in[4*1];
353 t18 = out[4*2] ^ t15;
354 out[4*0] = t17 ^ t18;
357 /* InvS6: 15 10 1 13 5 3 6 0 4 9 14 7 2 12 8 11 */
359 /* depth = 5,3,8,6, Total gates=19 */
360 static void sb6_inv(uint8_t* out, const uint8_t* in){
361 uint8_t t02, t03, t04, t05, t06, t07, t08, t09, t12, t13, t14, t15, t16, t17, t01;
362 t01 = in[4*0] ^ in[4*2];
367 t06 = in[4*1] ^ in[4*3];
371 out[4*1] = t06 ^ t08;
373 t12 = in[4*1] & out[4*0];
378 t17 = in[4*0] ^ out[4*1];
379 out[4*3] = t17 ^ t15;
380 out[4*2] = t16 ^ t14;
383 /* S7: 1 13 15 0 14 8 2 11 7 4 12 10 9 3 5 6 */
385 /* depth = 10,7,10,4, Total gates=19 */
386 static void sb7(uint8_t* out, const uint8_t* in){
387 uint8_t t02, t03, t04, t05, t06, t08, t09, t10, t11, t13, t14, t15, t16, t17, t01;
388 t01 = in[4*0] & in[4*2];
392 t05 = in[4*0] & in[4*1];
394 out[4*3] = t03 ^ t06;
395 t08 = in[4*2] | out[4*3];
398 t11 = t04 & out[4*3];
399 out[4*1] = t09 ^ t10;
400 t13 = in[4*1] ^ out[4*1];
401 t14 = t01 ^ out[4*1];
405 out[4*0] = t15 ^ t17;
406 out[4*2] = in[4*0] ^ t16;
409 /* InvS7: 3 0 6 13 9 14 15 8 5 12 11 7 10 1 4 2 */
411 /* depth = 9,7,3,3, Total gates=18 */
412 static void sb7_inv(uint8_t* out, const uint8_t* in){
413 uint8_t t02, t03, t04, t06, t07, t08, t09, t10, t11, t13, t14, t15, t16, t01;
414 t01 = in[4*0] & in[4*1];
415 t02 = in[4*0] | in[4*1];
418 out[4*3] = t03 ^ t04;
420 t07 = in[4*3] ^ out[4*3];
423 t10 = in[4*1] ^ in[4*3];
424 t11 = in[4*0] | in[4*3];
425 out[4*1] = in[4*0] ^ t09;
428 t15 = in[4*3] | out[4*1];
430 out[4*0] = t13 ^ t15;
431 out[4*2] = t14 ^ t16;
434 typedef void(*sb_fpt)(uint8_t*, const uint8_t*);
436 const sb_fpt sf_tab[]= {
441 const sb_fpt sinvf_tab[] = {
442 sb0_inv, sb1_inv, sb2_inv, sb3_inv,
443 sb4_inv, sb5_inv, sb6_inv, sb7_inv
446 void sbox128(void * w, uint8_t box){
447 uint8_t i, buffer[16];
451 fp = (sb_fpt)(sf_tab[box]);
453 fp(buffer+i, (uint8_t*)w+i);
455 memcpy(w, buffer, 16);
458 void inv_sbox128(void * w, uint8_t box){
459 uint8_t i, buffer[16];
463 fp = (sb_fpt)(sinvf_tab[box]);
465 fp(buffer+i, (uint8_t*)w+i);
467 memcpy(w, buffer, 16);