3 This file is part of the ARM-Crypto-Lib.
4 Copyright (C) 2006-2010 Daniel Otte (daniel.otte@rub.de)
6 This program is free software: you can redistribute it and/or modify
7 it under the terms of the GNU General Public License as published by
8 the Free Software Foundation, either version 3 of the License, or
9 (at your option) any later version.
11 This program is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 GNU General Public License for more details.
16 You should have received a copy of the GNU General Public License
17 along with this program. If not, see <http://www.gnu.org/licenses/>.
20 tmp = +t[ 5] +t[10] +t[13] +(tr1=-t[ 7]+t[14]) ;
21 q[ 0] = S32_0(tmp) + h[ 1];
22 tmp = +t[ 8] +t[13] +t[ 0] -(tr2=+t[ 1]+t[10]) ;
23 q[ 3] = S32_3(tmp) + h[ 4];
24 tmp = -t[11] +t[13] -t[ 0] -t[ 3] +t[ 4] ;
25 q[ 6] = S32_1(tmp) + h[ 7];
26 tmp = +t[ 0] +(tr0=-t[ 3]+t[ 6]) +(tr1) ;
27 q[ 9] = S32_4(tmp) + h[10];
28 tmp = -t[ 9] -(tr0) +(tr2) ;
29 q[12] = S32_2(tmp) + h[13];
30 tmp = -t[ 4] +(tr0=-t[ 9]+t[12]) +(tr1=-t[ 6]+t[13]) ;
31 q[15] = S32_0(tmp) + h[ 0];
32 tmp = +t[ 7] +t[15] +t[ 0] -(tr0) ;
33 q[ 2] = S32_2(tmp) + h[ 3];
34 tmp = +t[10] +(tr0=-t[ 2]+t[15]) +(tr2=+t[ 3]-t[12]) ;
35 q[ 5] = S32_0(tmp) + h[ 6];
36 tmp = -t[ 5] -(tr0) +(tr1) ;
37 q[ 8] = S32_3(tmp) + h[ 9];
38 tmp = -t[ 0] -t[ 2] +t[ 9] +(tr0=-t[ 5]+t[ 8]) ;
39 q[11] = S32_1(tmp) + h[12];
40 tmp = -t[11] +(tr0) +(tr2) ;
41 q[14] = S32_4(tmp) + h[15];
42 tmp = +t[ 6] +(tr0=+t[11]+t[14]) -(tr1=+t[ 8]+t[15]) ;
43 q[ 1] = S32_1(tmp) + h[ 2];
44 tmp = +t[ 9] +t[ 1] +t[ 2] -(tr0) ;
45 q[ 4] = S32_4(tmp) + h[ 5];
46 tmp = -t[12] -t[14] +t[ 1] -t[ 4] -t[ 5] ;
47 q[ 7] = S32_2(tmp) + h[ 8];
48 tmp = -t[ 1] -(tr0=+t[ 4]+t[ 7]) +(tr1) ;
49 q[10] = S32_0(tmp) + h[11];
50 tmp = +t[ 2] +t[10] +t[11] +(tr0) ;
51 q[13] = S32_3(tmp) + h[14];
54 tmp = +t[ 5] +t[10] +t[13] +(tr1=-t[ 7]+t[14]) ;
55 q[ 0] = S32_0(tmp) + h[ 1];
56 tmp = +t[ 8] +t[13] +t[ 0] -(tr2=+t[ 1]+t[10]) ;
57 q[ 3] = S32_3(tmp) + h[ 4];
58 tmp = -t[11] +t[13] -t[ 0] -t[ 3] +t[ 4] ;
59 q[ 6] = S32_1(tmp) + h[ 7];
60 tmp = +t[ 0] +(tr0=-t[ 3]+t[ 6]) +(tr1) ;
61 q[ 9] = S32_4(tmp) + h[10];
62 tmp = -t[ 9] -(tr0) +(tr2) ;
63 q[12] = S32_2(tmp) + h[13];
64 tmp = -t[ 4] +(tr0=-t[ 9]+t[12]) +(tr1=-t[ 6]+t[13]) ;
65 q[15] = S32_0(tmp) + h[ 0];
66 tmp = +t[ 7] +t[15] +t[ 0] -(tr0) ;
67 q[ 2] = S32_2(tmp) + h[ 3];
68 tmp = +t[10] +(tr0=-t[ 2]+t[15]) +(tr2=+t[ 3]-t[12]) ;
69 q[ 5] = S32_0(tmp) + h[ 6];
70 tmp = -t[ 5] -(tr0) +(tr1) ;
71 q[ 8] = S32_3(tmp) + h[ 9];
72 tmp = -t[ 0] -t[ 2] +t[ 9] +(tr0=-t[ 5]+t[ 8]) ;
73 q[11] = S32_1(tmp) + h[12];
74 tmp = -t[11] +(tr0) +(tr2) ;
75 q[14] = S32_4(tmp) + h[15];
76 tmp = +t[ 6] +(tr0=+t[11]+t[14]) -(tr1=+t[ 8]+t[15]) ;
77 q[ 1] = S32_1(tmp) + h[ 2];
78 tmp = +t[ 9] +t[ 1] +t[ 2] -(tr0) ;
79 q[ 4] = S32_4(tmp) + h[ 5];
80 tmp = -t[12] -t[14] +t[ 1] -t[ 4] -t[ 5] ;
81 q[ 7] = S32_2(tmp) + h[ 8];
82 tmp = -t[ 1] -(tr0=+t[ 4]+t[ 7]) +(tr1) ;
83 q[10] = S32_0(tmp) + h[11];
84 tmp = +t[ 2] +t[10] +t[11] +(tr0) ;
85 q[13] = S32_3(tmp) + h[14];
# Names of the ARM registers the generator hands out. The literal list is
# reversed, so index 0 is "r14" and the last index (-1) is "r3".
# The last entry is used separately by the generator: as the accumulator
# (accu = $registers.length-1) and as the scratch register of the eor sequence
# in load_registers; the register map itself only has length-1 slots.
88 $registers = ["r3", "r4", "r5", "r6", "r7", "r8", "r9", "r10", "r11", "r12", "r14"].reverse
# Predicate taking an optional argument b (default 10).
# NOTE(review): the enclosing class header and the line that computes `s` are
# not part of this excerpt; presumably this extends String and `s` is the
# receiver round-tripped through an integer conversion in base b -- confirm.
101 def is_numeric?(b=10)
# True when the receiver equals s, or equals s with an explicit leading '+'.
104 (self==s) or (self==('+'+s))
# Belongs to a different method whose `def` line is not shown (presumably
# `xtr`, which gen_simple_assembler calls on operand names -- confirm):
# a numeric receiver is returned as its integer value.
108 return self.to_i if self.is_numeric?
# Fragment of the class instantiated below as Operation.new (the class header,
# the method headers and several body lines are not part of this excerpt).
# Read-only accessors for the per-temporary write lists and the parsed
# q index, S32 variant number and h index.
117 attr_reader :write_tr0, :write_tr1, :write_tr2
118 attr_reader :index, :s, :h
# Each write list starts out empty.
123 @write_tr0 = Array.new
124 @write_tr1 = Array.new
125 @write_tr2 = Array.new
# Matches one signed term "+t[ n]" / "-t[ n]" in s.
# Captures: sign, index digits, rest of the string.
# NOTE(review): the loop body is not shown; presumably it records the term and
# continues with the captured remainder -- confirm.
133 while m = /([+-])t\[[\s]*([\d]*)\](.*)/.match(s)
# Matches a signed reference to a temporary, "+(tr0" .. "-(tr2".
# This also matches terms that assign the temporary, e.g. "+(tr1=...".
138 while m = /([+-])\(tr([012])(.*)/.match(s)
# Stored as sign followed by the temporary's number, e.g. "+1".
139 @read_tr << m[1]+m[2]
# "tr0=" followed by exactly two signed t[..] terms: record both operands as
# sign+index strings (e.g. "-3" and "+6").
143 while m = /tr0=([+-])t\[[\s]*([\d]*)\][\s]*([+-])t\[[\s]*([\d]*)\](.*)/.match(s)
144 @write_tr0 << m[1]+m[2]
145 @write_tr0 << m[3]+m[4]
# Same for "tr1=".
149 while m = /tr1=([+-])t\[[\s]*([\d]*)\][\s]*([+-])t\[[\s]*([\d]*)\](.*)/.match(s)
150 @write_tr1 << m[1]+m[2]
151 @write_tr1 << m[3]+m[4]
# Same for "tr2=".
155 while m = /tr2=([+-])t\[[\s]*([\d]*)\][\s]*([+-])t\[[\s]*([\d]*)\](.*)/.match(s)
156 @write_tr2 << m[1]+m[2]
157 @write_tr2 << m[3]+m[4]
# Extract the destination index from "q[ n]".
# NOTE(review): the assignments following these three matches are not shown;
# presumably they fill @index, @s and @h respectively -- confirm.
160 if m=/q\[[\s]*([\d]*)\]/m.match(line)
# Extract the variant digit (0-4) from "S32_k(tmp)".
163 if m=/S32_([0-4])\(tmp\)/m.match(line)
# Extract the index from "h[ n]".
166 if m=/h\[[\s]*([\d]*)\]/m.match(line)
# Global list of parsed Operation objects, filled by the loop below.
174 $operations = Array.new
# Walk $c_code line by line ($c_code is defined outside this excerpt).
179 $c_code.each_line do |line|
180 # puts "DBG: line=", line
# Line begins (after optional whitespace) with "tmp".
# NOTE(review): the handling is not shown; presumably the line is kept in `s`
# so it can be parsed together with the following "q[..]" line -- confirm.
181 if /^[\s]*tmp/.match(line)
# Line begins (after optional whitespace) with "q[" followed by whitespace,
# a digit or "]".
184 if /^[\s]*q\[[\s\d\]]/.match(line)
# Create the Operation for slot i and let it parse s
# (the definitions of i and s are not visible in this excerpt).
186 $operations[i] = Operation.new
188 $operations[i].parse(s)
# Fragments of two helper methods whose `def` lines are not part of this
# excerpt (presumably the Array extensions called elsewhere as
# getsmallest(i) and getlargestindex -- confirm).
# Return the first element of tmp that is greater than i.
# NOTE(review): how tmp is built is not shown; presumably a sorted copy of the
# receiver, which would make this the smallest element above i -- confirm.
197 tmp.each {|x| return x if x>i}
# If the receiver contains nil, return the index of its first nil entry.
202 return self.index(nil) if self.index(nil)
# Otherwise return the receiver's index of the last element of tmp.
204 return self.index(tmp[-1])
# Picks a slot index of registermap that may be (re)used at the given step.
# registermap: array of slot contents (nil, Integer, or marker strings)
# regusemap:   array indexed by an integer; entries respond to getsmallest
# step:        passed through to getsmallest
# Several body lines are not part of this excerpt.
208 def find_register_to_free(registermap, regusemap, step)
# A nil slot exists; i is its index (the handling is not shown, presumably i
# is returned right away -- confirm).
209 if i=registermap.index(nil)
213 registermap.each do |x|
# Only integer slot contents that have a use-map entry are considered.
# NOTE(review): Fixnum was merged into Integer in Ruby 2.4 and the constant
# was removed in Ruby 3.2, where this comparison raises NameError.
214 if x.class==Fixnum and regusemap[x.abs]
# First value above `step` in this entry's use list
# (see the getsmallest helper).
215 t = regusemap[x.abs].getsmallest(step)
# tmp is filled on lines not shown (presumably with one t per slot, so that
# the slot whose next use is furthest away is chosen -- confirm).
221 return tmp.getlargestindex
# Emits the assembler that brings the t[] values needed by `op` into
# registers and reserves slots for the temporaries op writes.
# regmap: register-slot array (updated), stack: list queried with index()
# for values already stored on the stack, op: the operation,
# step: forwarded to find_register_to_free.
# Returns the triple [regmap, stack, asm_out].
# Several body lines are not part of this excerpt.
225 def load_registers(regmap, stack, op, step)
# Only referenced by the commented-out stmdb code below (in the visible lines).
228 push_list = Array.new
229 # set to_load2 to all registers which are not already loaded
230 # puts "DBG(a): "+regmap.inspect
231 op.read_t.each do |x|
# NOTE(review): a line between these two is not shown; x may be converted
# (e.g. to an integer index) before this test -- confirm.
233 to_load2 << x if regmap.index(x)==nil
# Claim a slot and mark it with the placeholder 'x'
# (presumably once per value that has to be loaded -- loop not shown).
236 regmap[find_register_to_free(regmap, $regusemap, step)] = 'x'
# Reserve one slot for each temporary that this operation assigns.
238 if op.write_tr0.length!=0
239 regmap[find_register_to_free(regmap, $regusemap, step)] = 'tr0'
241 if op.write_tr1.length!=0
242 regmap[find_register_to_free(regmap, $regusemap, step)] = 'tr1'
244 if op.write_tr2.length!=0
245 regmap[find_register_to_free(regmap, $regusemap, step)] = 'tr2'
249 to_load2.length.times do |i|
# Two consecutive indices that are both already on the stack are fetched with
# a single ldrd (x and y are assigned on lines not shown).
252 if x and y and (to_load2[i]+1 == to_load2[i+1]) and stack.index(x) and stack.index(y)
253 rx = regmap.index('x')
# NOTE(review): the line between the two lookups is not shown; presumably it
# replaces the first placeholder so that ry finds a different slot -- confirm.
255 ry = regmap.index('x')
257 asm_out += sprintf(" ldrd %s, %s, [SP, #%d*4]\n", $registers[rx], $registers[ry], x)
# Single load: take the next placeholder slot.
266 y = regmap.index('x')
267 puts "Strange error!\n" if not y
# Reload from the stack copy (the selecting condition is not shown;
# presumably taken when x is already in `stack` -- confirm).
270 asm_out += sprintf(" ldr %s, [SP, #%d*4]\n", $registers[y], x)
# Otherwise: load word x via r1 and via r2, XOR them (using the last entry of
# $registers as scratch) and store the result to stack slot x.
272 asm_out += sprintf(" ldr %s, [r1, #%d*4]\n", $registers[y], x)
273 asm_out += sprintf(" ldr %s, [r2, #%d*4]\n", $registers[-1], x)
274 asm_out += sprintf(" eor %s, %s\n", $registers[y], $registers[-1])
275 asm_out += sprintf(" str %s, [SP, #%d*4]\n", $registers[y], x)
277 # push_list << [$registers[y], x]
280 # if push_list.length!=0
281 # push_list.sort!{ |x,y| x[0].chopf.to_i <=> y[0].chopf.to_i}
282 # push_regs = push_list.collect {|x| x[0]}
283 # push_list.reverse.each {|x| stack << x[1]}
284 # asm_out += sprintf(" stmdb SP, {%s}\n", push_regs.join(', '))
287 # puts "DBG(0): "+regmap.inspect
288 # puts "DBG(1): "+to_load.inspect
289 # puts "DBG(2): "+to_load2.inspect
291 #puts 'DBG('+__LINE__.to_s+'): regmap = '+regmap.inspect
292 return regmap, stack, asm_out
# Generates assembler text for a list of Operation objects: per operation it
# loads the inputs, computes the tr temporaries, sums the signed terms into an
# accumulator, applies the S32_n step, adds a word loaded via r1 and stores
# the result via r0.
# Several body lines (case/when/else/end, initialisation of asm_out, stack,
# step and reg_hash) are not part of this excerpt.
295 def gen_simple_assembler(operations)
# The accumulator is the last entry of $registers.
298 accu = $registers.length-1
299 # outr = $registers.length-4
300 # tr0 = $registers.length-3
301 # tr1 = $registers.length-2
302 # tr2 = $registers.length-4
# All registers except the accumulator are managed through regmap,
# which starts with every slot nil.
304 reg_cnt = $registers.length-1
305 regmap = Array.new(reg_cnt)
# Reserve 16 words on the stack.
308 asm_out += sprintf(" sub SP, #%d*4\n", 16)
309 operations.each do |op|
310 asm_out += sprintf("/*=== W[%2d] ===*/\n", op.index)
311 regmap, stack, tstr = load_registers(regmap, stack, op, step-1)
# Map every t index read by this operation to its slot in regmap.
# chopf is a helper defined outside this excerpt (presumably it drops the
# leading sign character -- confirm).
315 op.read_t.each do |t|
316 if regmap.index(t.chopf.to_i)==nil
317 printf("ERROR: too few registers!\n")
319 reg_hash[t.chopf.to_i]=regmap.index(t.chopf.to_i)
# --- tr0: computed from its two operands; the instruction depends on the two
# operand signs (the case labels are not shown). Visible forms:
# add dst,a,b / sub dst,a,b / sub dst,b,a, otherwise an error is printed.
321 if op.write_tr0.length==2
322 signs_code=op.write_tr0[0][0..0]+op.write_tr0[1][0..0]
325 asm_out += sprintf(" add %s, %s, %s\n", $registers[regmap.index('tr0')], \
326 $registers[reg_hash[op.write_tr0[0].chopf.to_i]], \
327 $registers[reg_hash[op.write_tr0[1].chopf.to_i]])
329 asm_out += sprintf(" sub %s, %s, %s\n", $registers[regmap.index('tr0')], \
330 $registers[reg_hash[op.write_tr0[0].chopf.to_i]], \
331 $registers[reg_hash[op.write_tr0[1].chopf.to_i]])
333 asm_out += sprintf(" sub %s, %s, %s\n", $registers[regmap.index('tr0')], \
334 $registers[reg_hash[op.write_tr0[1].chopf.to_i]], \
335 $registers[reg_hash[op.write_tr0[0].chopf.to_i]])
337 printf("ERROR: invalid signs_code (%d): %s\n", __LINE__, signs_code)
# --- tr1: same scheme as tr0.
341 if op.write_tr1.length==2
342 signs_code=op.write_tr1[0][0..0]+op.write_tr1[1][0..0]
345 asm_out += sprintf(" add %s, %s, %s\n", $registers[regmap.index('tr1')], \
346 $registers[reg_hash[op.write_tr1[0].chopf.to_i]], \
347 $registers[reg_hash[op.write_tr1[1].chopf.to_i]])
349 asm_out += sprintf(" sub %s, %s, %s\n", $registers[regmap.index('tr1')], \
350 $registers[reg_hash[op.write_tr1[0].chopf.to_i]], \
351 $registers[reg_hash[op.write_tr1[1].chopf.to_i]])
353 # puts 'DBG: '+reg_hash.inspect
354 asm_out += sprintf(" sub %s, %s, %s\n", $registers[regmap.index('tr1')], \
355 $registers[reg_hash[op.write_tr1[1].chopf.to_i]], \
356 $registers[reg_hash[op.write_tr1[0].chopf.to_i]])
358 printf("ERROR: invalid signs_code (%d): %s\n", __LINE__, signs_code)
# --- tr2: same scheme as tr0.
362 if op.write_tr2.length==2
363 signs_code=op.write_tr2[0][0..0]+op.write_tr2[1][0..0]
366 asm_out += sprintf(" add %s, %s, %s\n", $registers[regmap.index('tr2')], \
367 $registers[reg_hash[op.write_tr2[0].chopf.to_i]], \
368 $registers[reg_hash[op.write_tr2[1].chopf.to_i]])
370 asm_out += sprintf(" sub %s, %s, %s\n", $registers[regmap.index('tr2')], \
371 $registers[reg_hash[op.write_tr2[0].chopf.to_i]], \
372 $registers[reg_hash[op.write_tr2[1].chopf.to_i]])
374 asm_out += sprintf(" sub %s, %s, %s\n", $registers[regmap.index('tr2')], \
375 $registers[reg_hash[op.write_tr2[1].chopf.to_i]], \
376 $registers[reg_hash[op.write_tr2[0].chopf.to_i]])
378 printf("ERROR: invalid signs_code (%d): %s\n", __LINE__, signs_code)
# Make the temporaries addressable through reg_hash under the keys
# '0tr', '1tr', '2tr' (the operand names built below end in 'tr').
382 reg_hash['0tr'] = regmap.index('tr0')
383 reg_hash['1tr'] = regmap.index('tr1')
384 reg_hash['2tr'] = regmap.index('tr2')
# Temporaries that are read here but not assigned here are collected in
# tr_to_delete (what happens to their slot is on a line not shown; presumably
# the slot is released -- confirm).
385 tr_to_delete = op.read_tr.collect { |x| x.chopf}
386 tr_to_delete.delete('0') if op.write_tr0.length!=0
387 tr_to_delete.delete('1') if op.write_tr1.length!=0
388 tr_to_delete.delete('2') if op.write_tr2.length!=0
389 tr_to_delete.each do |x|
390 y = regmap.index('tr'+x)
392 # puts 'DBG('+__LINE__.to_s+') deleted tr'+x+' @ '+y.to_s
# Build the list of signed terms to sum: all t terms plus the tr references,
# minus the t terms that only feed a temporary.
# NOTE(review): this assignment does not copy; the << and delete calls below
# act on the very array object op.read_t returns.
394 operations_to_do = op.read_t
395 op.read_tr.each {|x| operations_to_do << x+'tr'}
396 op.write_tr0.each {|x| operations_to_do.delete(x)}
397 op.write_tr1.each {|x| operations_to_do.delete(x)}
398 op.write_tr2.each {|x| operations_to_do.delete(x)}
# String sort: terms starting with '+' order before terms starting with '-'.
399 operations_to_do = operations_to_do.sort
400 asm_out += sprintf("/*(-- should do %s --)*/\n", operations_to_do.join(', '));
# Sign of the second term (the branch that uses it is not shown; presumably it
# selects between the add and sub forms below -- confirm).
401 sign_code=operations_to_do[1][0..0]
404 # puts 'DBG('+__LINE__.to_s+'): x='+operations_to_do[0]+' reg_hash='+reg_hash.inspect
# First two terms: accu = first + second ...
405 asm_out += sprintf(" add %s, %s, %s\n", $registers[accu], \
406 $registers[reg_hash[operations_to_do[0].chopf.xtr]], \
407 $registers[reg_hash[operations_to_do[1].chopf.xtr]])
409 # puts 'DBG('+__LINE__.to_s+'): x='+x+' reg_hash='+reg_hash.inspect
# ... or accu = first - second.
410 asm_out += sprintf(" sub %s, %s, %s\n", $registers[accu], \
411 $registers[reg_hash[operations_to_do[0].chopf.xtr]], \
412 $registers[reg_hash[operations_to_do[1].chopf.xtr]])
# Remaining terms are added to or subtracted from the accumulator one by one.
414 operations_to_do = operations_to_do[2..-1]
415 operations_to_do.each do |x|
419 # puts 'DBG('+__LINE__.to_s+'): x='+x+' reg_hash='+reg_hash.inspect
420 asm_out += sprintf(" add %s, %s\n", $registers[accu], \
421 $registers[reg_hash[x.chopf.xtr]])
423 asm_out += sprintf(" sub %s, %s\n", $registers[accu], \
424 $registers[reg_hash[x.chopf.xtr]])
# Pick a slot to use as output/scratch register for the final step.
427 outr = find_register_to_free(regmap, $regusemap, step)
# Variant emitted with a single operand: S32_4 on the accumulator, then add
# word op.h loaded via r1 and store to word op.index via r0
# (the selecting condition is not shown; presumably op.s==4 -- confirm).
430 asm_out += sprintf(" S32_4 %s\n", $registers[accu])
431 asm_out += sprintf(" ldr %s, [r1, #%d*4]\n", $registers[outr], op.h)
432 asm_out += sprintf(" add %s, %s\n", $registers[accu], $registers[outr])
433 asm_out += sprintf(" str %s, [r0, #%d*4]\n", $registers[accu], op.index)
# General variant: S32_<op.s> with outr and accu as operands; accu is then
# reused for the word loaded via r1, and outr holds the value that is stored.
435 asm_out += sprintf(" S32_%d %s %s\n", op.s, $registers[outr], $registers[accu])
436 asm_out += sprintf(" ldr %s, [r1, #%d*4]\n", $registers[accu], op.h)
437 asm_out += sprintf(" add %s, %s\n", $registers[outr], $registers[accu])
438 asm_out += sprintf(" str %s, [r0, #%d*4]\n", $registers[outr], op.index)
441 # asm_out += sprintf(" str %s, [r0, #%d*4]\n", $registers[accu], op.index)
# Release the 16 words reserved at the start.
443 asm_out += sprintf(" add SP, #%d*4", 16)
# Accessors of a class whose header is not part of this excerpt.
448 attr_accessor :usemap
449 attr_accessor :nextusemap
# Body not part of this excerpt.
458 def gen_regmap_simple
# Global use map consulted by find_register_to_free; filled by
# build_regusemap below.
462 $regusemap = Array.new
# Fills $regusemap from the t terms read by each operation.
464 def build_regusemap(operations)
466 operations.each do |op|
467 op.read_t.each do |t|
# x is derived on a line not shown (presumably the integer index of t).
# Each entry is created lazily as an empty array.
# NOTE(review): what gets appended is not shown; presumably the number of the
# step that reads t[x], since find_register_to_free calls getsmallest(step)
# on these entries -- confirm.
469 if $regusemap[x]==nil
470 $regusemap[x]=Array.new
478 #-------------------------------------------------------------------------------
480 #-------------------------------------------------------------------------------
# Script entry: runs after $operations has been filled by the parsing loop.
483 #puts $operations.inspect
# Build the global use map first; gen_simple_assembler and load_registers
# pass $regusemap to find_register_to_free.
484 build_regusemap($operations)
485 #puts $regusemap.inspect
# Print whatever gen_simple_assembler returns to standard output
# (presumably the accumulated assembler text -- its return line is not shown).
486 puts gen_simple_assembler($operations)