diff options
Diffstat (limited to 'src/lib/libcrypto/aes/asm/aes-mips.pl')
| -rw-r--r-- | src/lib/libcrypto/aes/asm/aes-mips.pl | 1611 |
1 files changed, 1611 insertions, 0 deletions
diff --git a/src/lib/libcrypto/aes/asm/aes-mips.pl b/src/lib/libcrypto/aes/asm/aes-mips.pl new file mode 100644 index 0000000000..2ce6deffc8 --- /dev/null +++ b/src/lib/libcrypto/aes/asm/aes-mips.pl | |||
| @@ -0,0 +1,1611 @@ | |||
| 1 | #!/usr/bin/env perl | ||
| 2 | |||
| 3 | # ==================================================================== | ||
| 4 | # Written by Andy Polyakov <appro@openssl.org> for the OpenSSL | ||
| 5 | # project. The module is, however, dual licensed under OpenSSL and | ||
| 6 | # CRYPTOGAMS licenses depending on where you obtain it. For further | ||
| 7 | # details see http://www.openssl.org/~appro/cryptogams/. | ||
| 8 | # ==================================================================== | ||
| 9 | |||
| 10 | # AES for MIPS | ||
| 11 | |||
| 12 | # October 2010 | ||
| 13 | # | ||
| 14 | # Code uses 1K[+256B] S-box and on single-issue core [such as R5000] | ||
| 15 | # spends ~68 cycles per byte processed with 128-bit key. This is ~16% | ||
| 16 | # faster than gcc-generated code, which is not very impressive. But | ||
| 17 | # recall that compressed S-box requires extra processing, namely | ||
| 18 | # additional rotations. Rotations are implemented with lwl/lwr pairs, | ||
| 19 | # which are normally used for loading unaligned data. Another cool | ||
| 20 | # thing about this module is its endian neutrality, which means that | ||
| 21 | # it processes data without ever changing byte order... | ||
| 22 | |||
| 23 | ###################################################################### | ||
| 24 | # There are a number of MIPS ABIs in use; O32 and N32/64 are the most | ||
| 25 | # widely used. Then there is a new contender: NUBI. It appears that if | ||
| 26 | # one picks the latter, it's possible to arrange code in ABI neutral | ||
| 27 | # manner. Therefore let's stick to NUBI register layout: | ||
| 28 | # | ||
| 29 | ($zero,$at,$t0,$t1,$t2)=map("\$$_",(0..2,24,25)); | ||
| 30 | ($a0,$a1,$a2,$a3,$a4,$a5,$a6,$a7)=map("\$$_",(4..11)); | ||
| 31 | ($s0,$s1,$s2,$s3,$s4,$s5,$s6,$s7,$s8,$s9,$s10,$s11)=map("\$$_",(12..23)); | ||
| 32 | ($gp,$tp,$sp,$fp,$ra)=map("\$$_",(3,28..31)); | ||
| 33 | # | ||
| 34 | # The return value is placed in $a0. Following coding rules facilitate | ||
| 35 | # interoperability: | ||
| 36 | # | ||
| 37 | # - never ever touch $tp, "thread pointer", former $gp; | ||
| 38 | # - copy return value to $t0, former $v0 [or to $a0 if you're adapting | ||
| 39 | # old code]; | ||
| 40 | # - on O32 populate $a4-$a7 with 'lw $aN,4*N($sp)' if necessary; | ||
| 41 | # | ||
| 42 | # For reference here is register layout for N32/64 MIPS ABIs: | ||
| 43 | # | ||
| 44 | # ($zero,$at,$v0,$v1)=map("\$$_",(0..3)); | ||
| 45 | # ($a0,$a1,$a2,$a3,$a4,$a5,$a6,$a7)=map("\$$_",(4..11)); | ||
| 46 | # ($t0,$t1,$t2,$t3,$t8,$t9)=map("\$$_",(12..15,24,25)); | ||
| 47 | # ($s0,$s1,$s2,$s3,$s4,$s5,$s6,$s7)=map("\$$_",(16..23)); | ||
| 48 | # ($gp,$sp,$fp,$ra)=map("\$$_",(28..31)); | ||
| 49 | # | ||
| 50 | $flavour = shift; # supported flavours are o32,n32,64,nubi32,nubi64 | ||
| 51 | |||
| 52 | if ($flavour =~ /64|n32/i) { | ||
| 53 | $PTR_ADD="dadd"; # incidentally works even on n32 | ||
| 54 | $PTR_SUB="dsub"; # incidentally works even on n32 | ||
| 55 | $REG_S="sd"; # store mnemonic used to save registers in the function prologues | ||
| 56 | $REG_L="ld"; # load mnemonic used to restore registers in the function epilogues | ||
| 57 | $PTR_SLL="dsll"; # incidentally works even on n32 | ||
| 58 | $SZREG=8; # bytes per saved register; frame sizes and save-slot offsets are multiples of it | ||
| 59 | } else { | ||
| 60 | $PTR_ADD="add"; | ||
| 61 | $PTR_SUB="sub"; | ||
| 62 | $REG_S="sw"; | ||
| 63 | $REG_L="lw"; | ||
| 64 | $PTR_SLL="sll"; | ||
| 65 | $SZREG=4; | ||
| 66 | } | ||
| 67 | $pf = ($flavour =~ /nubi/i) ? $t0 : $t2; # register operand handed to the .cpload/.cpsetup PIC directives | ||
| 68 | # | ||
| 69 | # <appro@openssl.org> | ||
| 70 | # | ||
| 71 | ###################################################################### | ||
| 72 | |||
| 73 | $big_endian=(`echo MIPSEL | $ENV{CC} -E -P -`=~/MIPSEL/)?1:0 if ($ENV{CC}); # probe the target compiler: MIPSEL surviving preprocessing means big-endian; stays undef when CC is unset | ||
| 74 | |||
| 75 | for (@ARGV) { $output=$_ if (/^\w[\w\-]*\.\w+$/); } | ||
| 76 | open STDOUT,">$output"; | ||
| 77 | |||
| 78 | if (!defined($big_endian)) # no compiler to ask: fall back to the byte order of the machine running this script | ||
| 79 | { $big_endian=(unpack('L',pack('N',1))==1); } | ||
| 80 | |||
| 81 | while (($output=shift) && ($output!~/^\w[\w\-]*\.\w+$/)) {} # consume arguments up to the first one that looks like a file name | ||
| 82 | open STDOUT,">$output"; | ||
| 83 | |||
| 84 | my ($MSB,$LSB)=(0,3); # automatically converted to little-endian | ||
| 85 | |||
| 86 | $code.=<<___; | ||
| 87 | .text | ||
| 88 | #ifdef OPENSSL_FIPSCANISTER | ||
| 89 | # include <openssl/fipssyms.h> | ||
| 90 | #endif | ||
| 91 | |||
| 92 | #if !defined(__vxworks) || defined(__pic__) | ||
| 93 | .option pic2 | ||
| 94 | #endif | ||
| 95 | .set noat | ||
| 96 | ___ | ||
| 97 | |||
| 98 | {{{ | ||
| 99 | my $FRAMESIZE=16*$SZREG; # stack frame of the AES_encrypt/AES_decrypt wrappers: 16 register-sized slots | ||
| 100 | my $SAVED_REGS_MASK = ($flavour =~ /nubi/i) ? 0xc0fff008 : 0xc0ff0000; # operand of the .mask directive emitted for the wrappers | ||
| 101 | |||
| 102 | my ($inp,$out,$key,$Tbl,$s0,$s1,$s2,$s3)=($a0,$a1,$a2,$a3,$a4,$a5,$a6,$a7); # lexical $s0-$s3 hold the four state words and shadow the global $s0-$s3; they live in $a4-$a7 | ||
| 103 | my ($i0,$i1,$i2,$i3)=($at,$t0,$t1,$t2); # table-index temporaries; this reads the GLOBAL $t0-$t2, which are only shadowed by the next line | ||
| 104 | my ($t0,$t1,$t2,$t3,$t4,$t5,$t6,$t7,$t8,$t9,$t10,$t11) = map("\$$_",(12..23)); # lexical temporaries mapped to registers $12-$23 | ||
| 105 | my ($key0,$cnt)=($gp,$fp); # round-key pointer and loop counter (the counter is loaded from offset 240 of the key) | ||
| 106 | |||
| 107 | # instruction ordering is "stolen" from the output of the MIPSpro assembler | ||
| 108 | # invoked with -mips3 -O3 arguments... | ||
| 109 | $code.=<<___; | ||
| 110 | .align 5 | ||
| 111 | .ent _mips_AES_encrypt | ||
| 112 | _mips_AES_encrypt: | ||
| 113 | .frame $sp,0,$ra | ||
| 114 | .set reorder | ||
| 115 | lw $t0,0($key) | ||
| 116 | lw $t1,4($key) | ||
| 117 | lw $t2,8($key) | ||
| 118 | lw $t3,12($key) | ||
| 119 | lw $cnt,240($key) | ||
| 120 | $PTR_ADD $key0,$key,16 | ||
| 121 | |||
| 122 | xor $s0,$t0 | ||
| 123 | xor $s1,$t1 | ||
| 124 | xor $s2,$t2 | ||
| 125 | xor $s3,$t3 | ||
| 126 | |||
| 127 | sub $cnt,1 | ||
| 128 | _xtr $i0,$s1,16-2 | ||
| 129 | .Loop_enc: | ||
| 130 | _xtr $i1,$s2,16-2 | ||
| 131 | _xtr $i2,$s3,16-2 | ||
| 132 | _xtr $i3,$s0,16-2 | ||
| 133 | and $i0,0x3fc | ||
| 134 | and $i1,0x3fc | ||
| 135 | and $i2,0x3fc | ||
| 136 | and $i3,0x3fc | ||
| 137 | $PTR_ADD $i0,$Tbl | ||
| 138 | $PTR_ADD $i1,$Tbl | ||
| 139 | $PTR_ADD $i2,$Tbl | ||
| 140 | $PTR_ADD $i3,$Tbl | ||
| 141 | lwl $t0,3($i0) # Te1[s1>>16] | ||
| 142 | lwl $t1,3($i1) # Te1[s2>>16] | ||
| 143 | lwl $t2,3($i2) # Te1[s3>>16] | ||
| 144 | lwl $t3,3($i3) # Te1[s0>>16] | ||
| 145 | lwr $t0,2($i0) # Te1[s1>>16] | ||
| 146 | lwr $t1,2($i1) # Te1[s2>>16] | ||
| 147 | lwr $t2,2($i2) # Te1[s3>>16] | ||
| 148 | lwr $t3,2($i3) # Te1[s0>>16] | ||
| 149 | |||
| 150 | _xtr $i0,$s2,8-2 | ||
| 151 | _xtr $i1,$s3,8-2 | ||
| 152 | _xtr $i2,$s0,8-2 | ||
| 153 | _xtr $i3,$s1,8-2 | ||
| 154 | and $i0,0x3fc | ||
| 155 | and $i1,0x3fc | ||
| 156 | and $i2,0x3fc | ||
| 157 | and $i3,0x3fc | ||
| 158 | $PTR_ADD $i0,$Tbl | ||
| 159 | $PTR_ADD $i1,$Tbl | ||
| 160 | $PTR_ADD $i2,$Tbl | ||
| 161 | $PTR_ADD $i3,$Tbl | ||
| 162 | lwl $t4,2($i0) # Te2[s2>>8] | ||
| 163 | lwl $t5,2($i1) # Te2[s3>>8] | ||
| 164 | lwl $t6,2($i2) # Te2[s0>>8] | ||
| 165 | lwl $t7,2($i3) # Te2[s1>>8] | ||
| 166 | lwr $t4,1($i0) # Te2[s2>>8] | ||
| 167 | lwr $t5,1($i1) # Te2[s3>>8] | ||
| 168 | lwr $t6,1($i2) # Te2[s0>>8] | ||
| 169 | lwr $t7,1($i3) # Te2[s1>>8] | ||
| 170 | |||
| 171 | _xtr $i0,$s3,0-2 | ||
| 172 | _xtr $i1,$s0,0-2 | ||
| 173 | _xtr $i2,$s1,0-2 | ||
| 174 | _xtr $i3,$s2,0-2 | ||
| 175 | and $i0,0x3fc | ||
| 176 | and $i1,0x3fc | ||
| 177 | and $i2,0x3fc | ||
| 178 | and $i3,0x3fc | ||
| 179 | $PTR_ADD $i0,$Tbl | ||
| 180 | $PTR_ADD $i1,$Tbl | ||
| 181 | $PTR_ADD $i2,$Tbl | ||
| 182 | $PTR_ADD $i3,$Tbl | ||
| 183 | lwl $t8,1($i0) # Te3[s3] | ||
| 184 | lwl $t9,1($i1) # Te3[s0] | ||
| 185 | lwl $t10,1($i2) # Te3[s1] | ||
| 186 | lwl $t11,1($i3) # Te3[s2] | ||
| 187 | lwr $t8,0($i0) # Te3[s3] | ||
| 188 | lwr $t9,0($i1) # Te3[s0] | ||
| 189 | lwr $t10,0($i2) # Te3[s1] | ||
| 190 | lwr $t11,0($i3) # Te3[s2] | ||
| 191 | |||
| 192 | _xtr $i0,$s0,24-2 | ||
| 193 | _xtr $i1,$s1,24-2 | ||
| 194 | _xtr $i2,$s2,24-2 | ||
| 195 | _xtr $i3,$s3,24-2 | ||
| 196 | and $i0,0x3fc | ||
| 197 | and $i1,0x3fc | ||
| 198 | and $i2,0x3fc | ||
| 199 | and $i3,0x3fc | ||
| 200 | $PTR_ADD $i0,$Tbl | ||
| 201 | $PTR_ADD $i1,$Tbl | ||
| 202 | $PTR_ADD $i2,$Tbl | ||
| 203 | $PTR_ADD $i3,$Tbl | ||
| 204 | xor $t0,$t4 | ||
| 205 | xor $t1,$t5 | ||
| 206 | xor $t2,$t6 | ||
| 207 | xor $t3,$t7 | ||
| 208 | lw $t4,0($i0) # Te0[s0>>24] | ||
| 209 | lw $t5,0($i1) # Te0[s1>>24] | ||
| 210 | lw $t6,0($i2) # Te0[s2>>24] | ||
| 211 | lw $t7,0($i3) # Te0[s3>>24] | ||
| 212 | |||
| 213 | lw $s0,0($key0) | ||
| 214 | lw $s1,4($key0) | ||
| 215 | lw $s2,8($key0) | ||
| 216 | lw $s3,12($key0) | ||
| 217 | |||
| 218 | xor $t0,$t8 | ||
| 219 | xor $t1,$t9 | ||
| 220 | xor $t2,$t10 | ||
| 221 | xor $t3,$t11 | ||
| 222 | |||
| 223 | xor $t0,$t4 | ||
| 224 | xor $t1,$t5 | ||
| 225 | xor $t2,$t6 | ||
| 226 | xor $t3,$t7 | ||
| 227 | |||
| 228 | sub $cnt,1 | ||
| 229 | $PTR_ADD $key0,16 | ||
| 230 | xor $s0,$t0 | ||
| 231 | xor $s1,$t1 | ||
| 232 | xor $s2,$t2 | ||
| 233 | xor $s3,$t3 | ||
| 234 | .set noreorder | ||
| 235 | bnez $cnt,.Loop_enc | ||
| 236 | _xtr $i0,$s1,16-2 | ||
| 237 | |||
| 238 | .set reorder | ||
| 239 | _xtr $i1,$s2,16-2 | ||
| 240 | _xtr $i2,$s3,16-2 | ||
| 241 | _xtr $i3,$s0,16-2 | ||
| 242 | and $i0,0x3fc | ||
| 243 | and $i1,0x3fc | ||
| 244 | and $i2,0x3fc | ||
| 245 | and $i3,0x3fc | ||
| 246 | $PTR_ADD $i0,$Tbl | ||
| 247 | $PTR_ADD $i1,$Tbl | ||
| 248 | $PTR_ADD $i2,$Tbl | ||
| 249 | $PTR_ADD $i3,$Tbl | ||
| 250 | lbu $t0,2($i0) # Te4[s1>>16] | ||
| 251 | lbu $t1,2($i1) # Te4[s2>>16] | ||
| 252 | lbu $t2,2($i2) # Te4[s3>>16] | ||
| 253 | lbu $t3,2($i3) # Te4[s0>>16] | ||
| 254 | |||
| 255 | _xtr $i0,$s2,8-2 | ||
| 256 | _xtr $i1,$s3,8-2 | ||
| 257 | _xtr $i2,$s0,8-2 | ||
| 258 | _xtr $i3,$s1,8-2 | ||
| 259 | and $i0,0x3fc | ||
| 260 | and $i1,0x3fc | ||
| 261 | and $i2,0x3fc | ||
| 262 | and $i3,0x3fc | ||
| 263 | $PTR_ADD $i0,$Tbl | ||
| 264 | $PTR_ADD $i1,$Tbl | ||
| 265 | $PTR_ADD $i2,$Tbl | ||
| 266 | $PTR_ADD $i3,$Tbl | ||
| 267 | lbu $t4,2($i0) # Te4[s2>>8] | ||
| 268 | lbu $t5,2($i1) # Te4[s3>>8] | ||
| 269 | lbu $t6,2($i2) # Te4[s0>>8] | ||
| 270 | lbu $t7,2($i3) # Te4[s1>>8] | ||
| 271 | |||
| 272 | _xtr $i0,$s0,24-2 | ||
| 273 | _xtr $i1,$s1,24-2 | ||
| 274 | _xtr $i2,$s2,24-2 | ||
| 275 | _xtr $i3,$s3,24-2 | ||
| 276 | and $i0,0x3fc | ||
| 277 | and $i1,0x3fc | ||
| 278 | and $i2,0x3fc | ||
| 279 | and $i3,0x3fc | ||
| 280 | $PTR_ADD $i0,$Tbl | ||
| 281 | $PTR_ADD $i1,$Tbl | ||
| 282 | $PTR_ADD $i2,$Tbl | ||
| 283 | $PTR_ADD $i3,$Tbl | ||
| 284 | lbu $t8,2($i0) # Te4[s0>>24] | ||
| 285 | lbu $t9,2($i1) # Te4[s1>>24] | ||
| 286 | lbu $t10,2($i2) # Te4[s2>>24] | ||
| 287 | lbu $t11,2($i3) # Te4[s3>>24] | ||
| 288 | |||
| 289 | _xtr $i0,$s3,0-2 | ||
| 290 | _xtr $i1,$s0,0-2 | ||
| 291 | _xtr $i2,$s1,0-2 | ||
| 292 | _xtr $i3,$s2,0-2 | ||
| 293 | and $i0,0x3fc | ||
| 294 | and $i1,0x3fc | ||
| 295 | and $i2,0x3fc | ||
| 296 | and $i3,0x3fc | ||
| 297 | |||
| 298 | _ins $t0,16 | ||
| 299 | _ins $t1,16 | ||
| 300 | _ins $t2,16 | ||
| 301 | _ins $t3,16 | ||
| 302 | |||
| 303 | _ins $t4,8 | ||
| 304 | _ins $t5,8 | ||
| 305 | _ins $t6,8 | ||
| 306 | _ins $t7,8 | ||
| 307 | |||
| 308 | xor $t0,$t4 | ||
| 309 | xor $t1,$t5 | ||
| 310 | xor $t2,$t6 | ||
| 311 | xor $t3,$t7 | ||
| 312 | |||
| 313 | $PTR_ADD $i0,$Tbl | ||
| 314 | $PTR_ADD $i1,$Tbl | ||
| 315 | $PTR_ADD $i2,$Tbl | ||
| 316 | $PTR_ADD $i3,$Tbl | ||
| 317 | lbu $t4,2($i0) # Te4[s3] | ||
| 318 | lbu $t5,2($i1) # Te4[s0] | ||
| 319 | lbu $t6,2($i2) # Te4[s1] | ||
| 320 | lbu $t7,2($i3) # Te4[s2] | ||
| 321 | |||
| 322 | _ins $t8,24 | ||
| 323 | _ins $t9,24 | ||
| 324 | _ins $t10,24 | ||
| 325 | _ins $t11,24 | ||
| 326 | |||
| 327 | lw $s0,0($key0) | ||
| 328 | lw $s1,4($key0) | ||
| 329 | lw $s2,8($key0) | ||
| 330 | lw $s3,12($key0) | ||
| 331 | |||
| 332 | xor $t0,$t8 | ||
| 333 | xor $t1,$t9 | ||
| 334 | xor $t2,$t10 | ||
| 335 | xor $t3,$t11 | ||
| 336 | |||
| 337 | _ins $t4,0 | ||
| 338 | _ins $t5,0 | ||
| 339 | _ins $t6,0 | ||
| 340 | _ins $t7,0 | ||
| 341 | |||
| 342 | xor $t0,$t4 | ||
| 343 | xor $t1,$t5 | ||
| 344 | xor $t2,$t6 | ||
| 345 | xor $t3,$t7 | ||
| 346 | |||
| 347 | xor $s0,$t0 | ||
| 348 | xor $s1,$t1 | ||
| 349 | xor $s2,$t2 | ||
| 350 | xor $s3,$t3 | ||
| 351 | |||
| 352 | jr $ra | ||
| 353 | .end _mips_AES_encrypt | ||
| 354 | |||
| 355 | .align 5 | ||
| 356 | .globl AES_encrypt | ||
| 357 | .ent AES_encrypt | ||
| 358 | AES_encrypt: | ||
| 359 | .frame $sp,$FRAMESIZE,$ra | ||
| 360 | .mask $SAVED_REGS_MASK,-$SZREG | ||
| 361 | .set noreorder | ||
| 362 | ___ | ||
| 363 | $code.=<<___ if ($flavour =~ /o32/i); # o32 PIC-ification | ||
| 364 | .cpload $pf | ||
| 365 | ___ | ||
| 366 | $code.=<<___; | ||
| 367 | $PTR_SUB $sp,$FRAMESIZE | ||
| 368 | $REG_S $ra,$FRAMESIZE-1*$SZREG($sp) | ||
| 369 | $REG_S $fp,$FRAMESIZE-2*$SZREG($sp) | ||
| 370 | $REG_S $s11,$FRAMESIZE-3*$SZREG($sp) | ||
| 371 | $REG_S $s10,$FRAMESIZE-4*$SZREG($sp) | ||
| 372 | $REG_S $s9,$FRAMESIZE-5*$SZREG($sp) | ||
| 373 | $REG_S $s8,$FRAMESIZE-6*$SZREG($sp) | ||
| 374 | $REG_S $s7,$FRAMESIZE-7*$SZREG($sp) | ||
| 375 | $REG_S $s6,$FRAMESIZE-8*$SZREG($sp) | ||
| 376 | $REG_S $s5,$FRAMESIZE-9*$SZREG($sp) | ||
| 377 | $REG_S $s4,$FRAMESIZE-10*$SZREG($sp) | ||
| 378 | ___ | ||
| 379 | $code.=<<___ if ($flavour =~ /nubi/i); # optimize non-nubi prologue | ||
| 380 | $REG_S \$15,$FRAMESIZE-11*$SZREG($sp) | ||
| 381 | $REG_S \$14,$FRAMESIZE-12*$SZREG($sp) | ||
| 382 | $REG_S \$13,$FRAMESIZE-13*$SZREG($sp) | ||
| 383 | $REG_S \$12,$FRAMESIZE-14*$SZREG($sp) | ||
| 384 | $REG_S $gp,$FRAMESIZE-15*$SZREG($sp) | ||
| 385 | ___ | ||
| 386 | $code.=<<___ if ($flavour !~ /o32/i); # non-o32 PIC-ification | ||
| 387 | .cplocal $Tbl | ||
| 388 | .cpsetup $pf,$zero,AES_encrypt | ||
| 389 | ___ | ||
| 390 | $code.=<<___; | ||
| 391 | .set reorder | ||
| 392 | la $Tbl,AES_Te # PIC-ified 'load address' | ||
| 393 | |||
| 394 | lwl $s0,0+$MSB($inp) | ||
| 395 | lwl $s1,4+$MSB($inp) | ||
| 396 | lwl $s2,8+$MSB($inp) | ||
| 397 | lwl $s3,12+$MSB($inp) | ||
| 398 | lwr $s0,0+$LSB($inp) | ||
| 399 | lwr $s1,4+$LSB($inp) | ||
| 400 | lwr $s2,8+$LSB($inp) | ||
| 401 | lwr $s3,12+$LSB($inp) | ||
| 402 | |||
| 403 | bal _mips_AES_encrypt | ||
| 404 | |||
| 405 | swr $s0,0+$LSB($out) | ||
| 406 | swr $s1,4+$LSB($out) | ||
| 407 | swr $s2,8+$LSB($out) | ||
| 408 | swr $s3,12+$LSB($out) | ||
| 409 | swl $s0,0+$MSB($out) | ||
| 410 | swl $s1,4+$MSB($out) | ||
| 411 | swl $s2,8+$MSB($out) | ||
| 412 | swl $s3,12+$MSB($out) | ||
| 413 | |||
| 414 | .set noreorder | ||
| 415 | $REG_L $ra,$FRAMESIZE-1*$SZREG($sp) | ||
| 416 | $REG_L $fp,$FRAMESIZE-2*$SZREG($sp) | ||
| 417 | $REG_L $s11,$FRAMESIZE-3*$SZREG($sp) | ||
| 418 | $REG_L $s10,$FRAMESIZE-4*$SZREG($sp) | ||
| 419 | $REG_L $s9,$FRAMESIZE-5*$SZREG($sp) | ||
| 420 | $REG_L $s8,$FRAMESIZE-6*$SZREG($sp) | ||
| 421 | $REG_L $s7,$FRAMESIZE-7*$SZREG($sp) | ||
| 422 | $REG_L $s6,$FRAMESIZE-8*$SZREG($sp) | ||
| 423 | $REG_L $s5,$FRAMESIZE-9*$SZREG($sp) | ||
| 424 | $REG_L $s4,$FRAMESIZE-10*$SZREG($sp) | ||
| 425 | ___ | ||
| 426 | $code.=<<___ if ($flavour =~ /nubi/i); | ||
| 427 | $REG_L \$15,$FRAMESIZE-11*$SZREG($sp) | ||
| 428 | $REG_L \$14,$FRAMESIZE-12*$SZREG($sp) | ||
| 429 | $REG_L \$13,$FRAMESIZE-13*$SZREG($sp) | ||
| 430 | $REG_L \$12,$FRAMESIZE-14*$SZREG($sp) | ||
| 431 | $REG_L $gp,$FRAMESIZE-15*$SZREG($sp) | ||
| 432 | ___ | ||
| 433 | $code.=<<___; | ||
| 434 | jr $ra | ||
| 435 | $PTR_ADD $sp,$FRAMESIZE | ||
| 436 | .end AES_encrypt | ||
| 437 | ___ | ||
| 438 | |||
| 439 | $code.=<<___; | ||
| 440 | .align 5 | ||
| 441 | .ent _mips_AES_decrypt | ||
| 442 | _mips_AES_decrypt: | ||
| 443 | .frame $sp,0,$ra | ||
| 444 | .set reorder | ||
| 445 | lw $t0,0($key) | ||
| 446 | lw $t1,4($key) | ||
| 447 | lw $t2,8($key) | ||
| 448 | lw $t3,12($key) | ||
| 449 | lw $cnt,240($key) | ||
| 450 | $PTR_ADD $key0,$key,16 | ||
| 451 | |||
| 452 | xor $s0,$t0 | ||
| 453 | xor $s1,$t1 | ||
| 454 | xor $s2,$t2 | ||
| 455 | xor $s3,$t3 | ||
| 456 | |||
| 457 | sub $cnt,1 | ||
| 458 | _xtr $i0,$s3,16-2 | ||
| 459 | .Loop_dec: | ||
| 460 | _xtr $i1,$s0,16-2 | ||
| 461 | _xtr $i2,$s1,16-2 | ||
| 462 | _xtr $i3,$s2,16-2 | ||
| 463 | and $i0,0x3fc | ||
| 464 | and $i1,0x3fc | ||
| 465 | and $i2,0x3fc | ||
| 466 | and $i3,0x3fc | ||
| 467 | $PTR_ADD $i0,$Tbl | ||
| 468 | $PTR_ADD $i1,$Tbl | ||
| 469 | $PTR_ADD $i2,$Tbl | ||
| 470 | $PTR_ADD $i3,$Tbl | ||
| 471 | lwl $t0,3($i0) # Td1[s3>>16] | ||
| 472 | lwl $t1,3($i1) # Td1[s0>>16] | ||
| 473 | lwl $t2,3($i2) # Td1[s1>>16] | ||
| 474 | lwl $t3,3($i3) # Td1[s2>>16] | ||
| 475 | lwr $t0,2($i0) # Td1[s3>>16] | ||
| 476 | lwr $t1,2($i1) # Td1[s0>>16] | ||
| 477 | lwr $t2,2($i2) # Td1[s1>>16] | ||
| 478 | lwr $t3,2($i3) # Td1[s2>>16] | ||
| 479 | |||
| 480 | _xtr $i0,$s2,8-2 | ||
| 481 | _xtr $i1,$s3,8-2 | ||
| 482 | _xtr $i2,$s0,8-2 | ||
| 483 | _xtr $i3,$s1,8-2 | ||
| 484 | and $i0,0x3fc | ||
| 485 | and $i1,0x3fc | ||
| 486 | and $i2,0x3fc | ||
| 487 | and $i3,0x3fc | ||
| 488 | $PTR_ADD $i0,$Tbl | ||
| 489 | $PTR_ADD $i1,$Tbl | ||
| 490 | $PTR_ADD $i2,$Tbl | ||
| 491 | $PTR_ADD $i3,$Tbl | ||
| 492 | lwl $t4,2($i0) # Td2[s2>>8] | ||
| 493 | lwl $t5,2($i1) # Td2[s3>>8] | ||
| 494 | lwl $t6,2($i2) # Td2[s0>>8] | ||
| 495 | lwl $t7,2($i3) # Td2[s1>>8] | ||
| 496 | lwr $t4,1($i0) # Td2[s2>>8] | ||
| 497 | lwr $t5,1($i1) # Td2[s3>>8] | ||
| 498 | lwr $t6,1($i2) # Td2[s0>>8] | ||
| 499 | lwr $t7,1($i3) # Td2[s1>>8] | ||
| 500 | |||
| 501 | _xtr $i0,$s1,0-2 | ||
| 502 | _xtr $i1,$s2,0-2 | ||
| 503 | _xtr $i2,$s3,0-2 | ||
| 504 | _xtr $i3,$s0,0-2 | ||
| 505 | and $i0,0x3fc | ||
| 506 | and $i1,0x3fc | ||
| 507 | and $i2,0x3fc | ||
| 508 | and $i3,0x3fc | ||
| 509 | $PTR_ADD $i0,$Tbl | ||
| 510 | $PTR_ADD $i1,$Tbl | ||
| 511 | $PTR_ADD $i2,$Tbl | ||
| 512 | $PTR_ADD $i3,$Tbl | ||
| 513 | lwl $t8,1($i0) # Td3[s1] | ||
| 514 | lwl $t9,1($i1) # Td3[s2] | ||
| 515 | lwl $t10,1($i2) # Td3[s3] | ||
| 516 | lwl $t11,1($i3) # Td3[s0] | ||
| 517 | lwr $t8,0($i0) # Td3[s1] | ||
| 518 | lwr $t9,0($i1) # Td3[s2] | ||
| 519 | lwr $t10,0($i2) # Td3[s3] | ||
| 520 | lwr $t11,0($i3) # Td3[s0] | ||
| 521 | |||
| 522 | _xtr $i0,$s0,24-2 | ||
| 523 | _xtr $i1,$s1,24-2 | ||
| 524 | _xtr $i2,$s2,24-2 | ||
| 525 | _xtr $i3,$s3,24-2 | ||
| 526 | and $i0,0x3fc | ||
| 527 | and $i1,0x3fc | ||
| 528 | and $i2,0x3fc | ||
| 529 | and $i3,0x3fc | ||
| 530 | $PTR_ADD $i0,$Tbl | ||
| 531 | $PTR_ADD $i1,$Tbl | ||
| 532 | $PTR_ADD $i2,$Tbl | ||
| 533 | $PTR_ADD $i3,$Tbl | ||
| 534 | |||
| 535 | xor $t0,$t4 | ||
| 536 | xor $t1,$t5 | ||
| 537 | xor $t2,$t6 | ||
| 538 | xor $t3,$t7 | ||
| 539 | |||
| 540 | |||
| 541 | lw $t4,0($i0) # Td0[s0>>24] | ||
| 542 | lw $t5,0($i1) # Td0[s1>>24] | ||
| 543 | lw $t6,0($i2) # Td0[s2>>24] | ||
| 544 | lw $t7,0($i3) # Td0[s3>>24] | ||
| 545 | |||
| 546 | lw $s0,0($key0) | ||
| 547 | lw $s1,4($key0) | ||
| 548 | lw $s2,8($key0) | ||
| 549 | lw $s3,12($key0) | ||
| 550 | |||
| 551 | xor $t0,$t8 | ||
| 552 | xor $t1,$t9 | ||
| 553 | xor $t2,$t10 | ||
| 554 | xor $t3,$t11 | ||
| 555 | |||
| 556 | xor $t0,$t4 | ||
| 557 | xor $t1,$t5 | ||
| 558 | xor $t2,$t6 | ||
| 559 | xor $t3,$t7 | ||
| 560 | |||
| 561 | sub $cnt,1 | ||
| 562 | $PTR_ADD $key0,16 | ||
| 563 | xor $s0,$t0 | ||
| 564 | xor $s1,$t1 | ||
| 565 | xor $s2,$t2 | ||
| 566 | xor $s3,$t3 | ||
| 567 | .set noreorder | ||
| 568 | bnez $cnt,.Loop_dec | ||
| 569 | _xtr $i0,$s3,16-2 | ||
| 570 | |||
| 571 | .set reorder | ||
| 572 | lw $t4,1024($Tbl) # prefetch Td4 | ||
| 573 | lw $t5,1024+32($Tbl) | ||
| 574 | lw $t6,1024+64($Tbl) | ||
| 575 | lw $t7,1024+96($Tbl) | ||
| 576 | lw $t8,1024+128($Tbl) | ||
| 577 | lw $t9,1024+160($Tbl) | ||
| 578 | lw $t10,1024+192($Tbl) | ||
| 579 | lw $t11,1024+224($Tbl) | ||
| 580 | |||
| 581 | _xtr $i0,$s3,16 | ||
| 582 | _xtr $i1,$s0,16 | ||
| 583 | _xtr $i2,$s1,16 | ||
| 584 | _xtr $i3,$s2,16 | ||
| 585 | and $i0,0xff | ||
| 586 | and $i1,0xff | ||
| 587 | and $i2,0xff | ||
| 588 | and $i3,0xff | ||
| 589 | $PTR_ADD $i0,$Tbl | ||
| 590 | $PTR_ADD $i1,$Tbl | ||
| 591 | $PTR_ADD $i2,$Tbl | ||
| 592 | $PTR_ADD $i3,$Tbl | ||
| 593 | lbu $t0,1024($i0) # Td4[s3>>16] | ||
| 594 | lbu $t1,1024($i1) # Td4[s0>>16] | ||
| 595 | lbu $t2,1024($i2) # Td4[s1>>16] | ||
| 596 | lbu $t3,1024($i3) # Td4[s2>>16] | ||
| 597 | |||
| 598 | _xtr $i0,$s2,8 | ||
| 599 | _xtr $i1,$s3,8 | ||
| 600 | _xtr $i2,$s0,8 | ||
| 601 | _xtr $i3,$s1,8 | ||
| 602 | and $i0,0xff | ||
| 603 | and $i1,0xff | ||
| 604 | and $i2,0xff | ||
| 605 | and $i3,0xff | ||
| 606 | $PTR_ADD $i0,$Tbl | ||
| 607 | $PTR_ADD $i1,$Tbl | ||
| 608 | $PTR_ADD $i2,$Tbl | ||
| 609 | $PTR_ADD $i3,$Tbl | ||
| 610 | lbu $t4,1024($i0) # Td4[s2>>8] | ||
| 611 | lbu $t5,1024($i1) # Td4[s3>>8] | ||
| 612 | lbu $t6,1024($i2) # Td4[s0>>8] | ||
| 613 | lbu $t7,1024($i3) # Td4[s1>>8] | ||
| 614 | |||
| 615 | _xtr $i0,$s0,24 | ||
| 616 | _xtr $i1,$s1,24 | ||
| 617 | _xtr $i2,$s2,24 | ||
| 618 | _xtr $i3,$s3,24 | ||
| 619 | $PTR_ADD $i0,$Tbl | ||
| 620 | $PTR_ADD $i1,$Tbl | ||
| 621 | $PTR_ADD $i2,$Tbl | ||
| 622 | $PTR_ADD $i3,$Tbl | ||
| 623 | lbu $t8,1024($i0) # Td4[s0>>24] | ||
| 624 | lbu $t9,1024($i1) # Td4[s1>>24] | ||
| 625 | lbu $t10,1024($i2) # Td4[s2>>24] | ||
| 626 | lbu $t11,1024($i3) # Td4[s3>>24] | ||
| 627 | |||
| 628 | _xtr $i0,$s1,0 | ||
| 629 | _xtr $i1,$s2,0 | ||
| 630 | _xtr $i2,$s3,0 | ||
| 631 | _xtr $i3,$s0,0 | ||
| 632 | |||
| 633 | _ins $t0,16 | ||
| 634 | _ins $t1,16 | ||
| 635 | _ins $t2,16 | ||
| 636 | _ins $t3,16 | ||
| 637 | |||
| 638 | _ins $t4,8 | ||
| 639 | _ins $t5,8 | ||
| 640 | _ins $t6,8 | ||
| 641 | _ins $t7,8 | ||
| 642 | |||
| 643 | xor $t0,$t4 | ||
| 644 | xor $t1,$t5 | ||
| 645 | xor $t2,$t6 | ||
| 646 | xor $t3,$t7 | ||
| 647 | |||
| 648 | $PTR_ADD $i0,$Tbl | ||
| 649 | $PTR_ADD $i1,$Tbl | ||
| 650 | $PTR_ADD $i2,$Tbl | ||
| 651 | $PTR_ADD $i3,$Tbl | ||
| 652 | lbu $t4,1024($i0) # Td4[s1] | ||
| 653 | lbu $t5,1024($i1) # Td4[s2] | ||
| 654 | lbu $t6,1024($i2) # Td4[s3] | ||
| 655 | lbu $t7,1024($i3) # Td4[s0] | ||
| 656 | |||
| 657 | _ins $t8,24 | ||
| 658 | _ins $t9,24 | ||
| 659 | _ins $t10,24 | ||
| 660 | _ins $t11,24 | ||
| 661 | |||
| 662 | lw $s0,0($key0) | ||
| 663 | lw $s1,4($key0) | ||
| 664 | lw $s2,8($key0) | ||
| 665 | lw $s3,12($key0) | ||
| 666 | |||
| 667 | _ins $t4,0 | ||
| 668 | _ins $t5,0 | ||
| 669 | _ins $t6,0 | ||
| 670 | _ins $t7,0 | ||
| 671 | |||
| 672 | |||
| 673 | xor $t0,$t8 | ||
| 674 | xor $t1,$t9 | ||
| 675 | xor $t2,$t10 | ||
| 676 | xor $t3,$t11 | ||
| 677 | |||
| 678 | xor $t0,$t4 | ||
| 679 | xor $t1,$t5 | ||
| 680 | xor $t2,$t6 | ||
| 681 | xor $t3,$t7 | ||
| 682 | |||
| 683 | xor $s0,$t0 | ||
| 684 | xor $s1,$t1 | ||
| 685 | xor $s2,$t2 | ||
| 686 | xor $s3,$t3 | ||
| 687 | |||
| 688 | jr $ra | ||
| 689 | .end _mips_AES_decrypt | ||
| 690 | |||
| 691 | .align 5 | ||
| 692 | .globl AES_decrypt | ||
| 693 | .ent AES_decrypt | ||
| 694 | AES_decrypt: | ||
| 695 | .frame $sp,$FRAMESIZE,$ra | ||
| 696 | .mask $SAVED_REGS_MASK,-$SZREG | ||
| 697 | .set noreorder | ||
| 698 | ___ | ||
| 699 | $code.=<<___ if ($flavour =~ /o32/i); # o32 PIC-ification | ||
| 700 | .cpload $pf | ||
| 701 | ___ | ||
| 702 | $code.=<<___; | ||
| 703 | $PTR_SUB $sp,$FRAMESIZE | ||
| 704 | $REG_S $ra,$FRAMESIZE-1*$SZREG($sp) | ||
| 705 | $REG_S $fp,$FRAMESIZE-2*$SZREG($sp) | ||
| 706 | $REG_S $s11,$FRAMESIZE-3*$SZREG($sp) | ||
| 707 | $REG_S $s10,$FRAMESIZE-4*$SZREG($sp) | ||
| 708 | $REG_S $s9,$FRAMESIZE-5*$SZREG($sp) | ||
| 709 | $REG_S $s8,$FRAMESIZE-6*$SZREG($sp) | ||
| 710 | $REG_S $s7,$FRAMESIZE-7*$SZREG($sp) | ||
| 711 | $REG_S $s6,$FRAMESIZE-8*$SZREG($sp) | ||
| 712 | $REG_S $s5,$FRAMESIZE-9*$SZREG($sp) | ||
| 713 | $REG_S $s4,$FRAMESIZE-10*$SZREG($sp) | ||
| 714 | ___ | ||
| 715 | $code.=<<___ if ($flavour =~ /nubi/i); # optimize non-nubi prologue | ||
| 716 | $REG_S \$15,$FRAMESIZE-11*$SZREG($sp) | ||
| 717 | $REG_S \$14,$FRAMESIZE-12*$SZREG($sp) | ||
| 718 | $REG_S \$13,$FRAMESIZE-13*$SZREG($sp) | ||
| 719 | $REG_S \$12,$FRAMESIZE-14*$SZREG($sp) | ||
| 720 | $REG_S $gp,$FRAMESIZE-15*$SZREG($sp) | ||
| 721 | ___ | ||
| 722 | $code.=<<___ if ($flavour !~ /o32/i); # non-o32 PIC-ification | ||
| 723 | .cplocal $Tbl | ||
| 724 | .cpsetup $pf,$zero,AES_decrypt | ||
| 725 | ___ | ||
| 726 | $code.=<<___; | ||
| 727 | .set reorder | ||
| 728 | la $Tbl,AES_Td # PIC-ified 'load address' | ||
| 729 | |||
| 730 | lwl $s0,0+$MSB($inp) | ||
| 731 | lwl $s1,4+$MSB($inp) | ||
| 732 | lwl $s2,8+$MSB($inp) | ||
| 733 | lwl $s3,12+$MSB($inp) | ||
| 734 | lwr $s0,0+$LSB($inp) | ||
| 735 | lwr $s1,4+$LSB($inp) | ||
| 736 | lwr $s2,8+$LSB($inp) | ||
| 737 | lwr $s3,12+$LSB($inp) | ||
| 738 | |||
| 739 | bal _mips_AES_decrypt | ||
| 740 | |||
| 741 | swr $s0,0+$LSB($out) | ||
| 742 | swr $s1,4+$LSB($out) | ||
| 743 | swr $s2,8+$LSB($out) | ||
| 744 | swr $s3,12+$LSB($out) | ||
| 745 | swl $s0,0+$MSB($out) | ||
| 746 | swl $s1,4+$MSB($out) | ||
| 747 | swl $s2,8+$MSB($out) | ||
| 748 | swl $s3,12+$MSB($out) | ||
| 749 | |||
| 750 | .set noreorder | ||
| 751 | $REG_L $ra,$FRAMESIZE-1*$SZREG($sp) | ||
| 752 | $REG_L $fp,$FRAMESIZE-2*$SZREG($sp) | ||
| 753 | $REG_L $s11,$FRAMESIZE-3*$SZREG($sp) | ||
| 754 | $REG_L $s10,$FRAMESIZE-4*$SZREG($sp) | ||
| 755 | $REG_L $s9,$FRAMESIZE-5*$SZREG($sp) | ||
| 756 | $REG_L $s8,$FRAMESIZE-6*$SZREG($sp) | ||
| 757 | $REG_L $s7,$FRAMESIZE-7*$SZREG($sp) | ||
| 758 | $REG_L $s6,$FRAMESIZE-8*$SZREG($sp) | ||
| 759 | $REG_L $s5,$FRAMESIZE-9*$SZREG($sp) | ||
| 760 | $REG_L $s4,$FRAMESIZE-10*$SZREG($sp) | ||
| 761 | ___ | ||
| 762 | $code.=<<___ if ($flavour =~ /nubi/i); | ||
| 763 | $REG_L \$15,$FRAMESIZE-11*$SZREG($sp) | ||
| 764 | $REG_L \$14,$FRAMESIZE-12*$SZREG($sp) | ||
| 765 | $REG_L \$13,$FRAMESIZE-13*$SZREG($sp) | ||
| 766 | $REG_L \$12,$FRAMESIZE-14*$SZREG($sp) | ||
| 767 | $REG_L $gp,$FRAMESIZE-15*$SZREG($sp) | ||
| 768 | ___ | ||
| 769 | $code.=<<___; | ||
| 770 | jr $ra | ||
| 771 | $PTR_ADD $sp,$FRAMESIZE | ||
| 772 | .end AES_decrypt | ||
| 773 | ___ | ||
| 774 | }}} | ||
| 775 | |||
| 776 | {{{ | ||
| 777 | my $FRAMESIZE=8*$SZREG; | ||
| 778 | my $SAVED_REGS_MASK = ($flavour =~ /nubi/i) ? 0xc000f008 : 0xc0000000; | ||
| 779 | |||
| 780 | my ($inp,$bits,$key,$Tbl)=($a0,$a1,$a2,$a3); | ||
| 781 | my ($rk0,$rk1,$rk2,$rk3,$rk4,$rk5,$rk6,$rk7)=($a4,$a5,$a6,$a7,$s0,$s1,$s2,$s3); | ||
| 782 | my ($i0,$i1,$i2,$i3)=($at,$t0,$t1,$t2); | ||
| 783 | my ($rcon,$cnt)=($gp,$fp); | ||
| 784 | |||
| 785 | $code.=<<___; | ||
| 786 | .align 5 | ||
| 787 | .ent _mips_AES_set_encrypt_key | ||
| 788 | _mips_AES_set_encrypt_key: | ||
| 789 | .frame $sp,0,$ra | ||
| 790 | .set noreorder | ||
| 791 | beqz $inp,.Lekey_done | ||
| 792 | li $t0,-1 | ||
| 793 | beqz $key,.Lekey_done | ||
| 794 | $PTR_ADD $rcon,$Tbl,1024+256 | ||
| 795 | |||
| 796 | .set reorder | ||
| 797 | lwl $rk0,0+$MSB($inp) # load 128 bits | ||
| 798 | lwl $rk1,4+$MSB($inp) | ||
| 799 | lwl $rk2,8+$MSB($inp) | ||
| 800 | lwl $rk3,12+$MSB($inp) | ||
| 801 | li $at,128 | ||
| 802 | lwr $rk0,0+$LSB($inp) | ||
| 803 | lwr $rk1,4+$LSB($inp) | ||
| 804 | lwr $rk2,8+$LSB($inp) | ||
| 805 | lwr $rk3,12+$LSB($inp) | ||
| 806 | .set noreorder | ||
| 807 | beq $bits,$at,.L128bits | ||
| 808 | li $cnt,10 | ||
| 809 | |||
| 810 | .set reorder | ||
| 811 | lwl $rk4,16+$MSB($inp) # load 192 bits | ||
| 812 | lwl $rk5,20+$MSB($inp) | ||
| 813 | li $at,192 | ||
| 814 | lwr $rk4,16+$LSB($inp) | ||
| 815 | lwr $rk5,20+$LSB($inp) | ||
| 816 | .set noreorder | ||
| 817 | beq $bits,$at,.L192bits | ||
| 818 | li $cnt,8 | ||
| 819 | |||
| 820 | .set reorder | ||
| 821 | lwl $rk6,24+$MSB($inp) # load 256 bits | ||
| 822 | lwl $rk7,28+$MSB($inp) | ||
| 823 | li $at,256 | ||
| 824 | lwr $rk6,24+$LSB($inp) | ||
| 825 | lwr $rk7,28+$LSB($inp) | ||
| 826 | .set noreorder | ||
| 827 | beq $bits,$at,.L256bits | ||
| 828 | li $cnt,7 | ||
| 829 | |||
| 830 | b .Lekey_done | ||
| 831 | li $t0,-2 | ||
| 832 | |||
| 833 | .align 4 | ||
| 834 | .L128bits: | ||
| 835 | .set reorder | ||
| 836 | srl $i0,$rk3,16 | ||
| 837 | srl $i1,$rk3,8 | ||
| 838 | and $i0,0xff | ||
| 839 | and $i1,0xff | ||
| 840 | and $i2,$rk3,0xff | ||
| 841 | srl $i3,$rk3,24 | ||
| 842 | $PTR_ADD $i0,$Tbl | ||
| 843 | $PTR_ADD $i1,$Tbl | ||
| 844 | $PTR_ADD $i2,$Tbl | ||
| 845 | $PTR_ADD $i3,$Tbl | ||
| 846 | lbu $i0,1024($i0) | ||
| 847 | lbu $i1,1024($i1) | ||
| 848 | lbu $i2,1024($i2) | ||
| 849 | lbu $i3,1024($i3) | ||
| 850 | |||
| 851 | sw $rk0,0($key) | ||
| 852 | sw $rk1,4($key) | ||
| 853 | sw $rk2,8($key) | ||
| 854 | sw $rk3,12($key) | ||
| 855 | sub $cnt,1 | ||
| 856 | $PTR_ADD $key,16 | ||
| 857 | |||
| 858 | _bias $i0,24 | ||
| 859 | _bias $i1,16 | ||
| 860 | _bias $i2,8 | ||
| 861 | _bias $i3,0 | ||
| 862 | |||
| 863 | xor $rk0,$i0 | ||
| 864 | lw $i0,0($rcon) | ||
| 865 | xor $rk0,$i1 | ||
| 866 | xor $rk0,$i2 | ||
| 867 | xor $rk0,$i3 | ||
| 868 | xor $rk0,$i0 | ||
| 869 | |||
| 870 | xor $rk1,$rk0 | ||
| 871 | xor $rk2,$rk1 | ||
| 872 | xor $rk3,$rk2 | ||
| 873 | |||
| 874 | .set noreorder | ||
| 875 | bnez $cnt,.L128bits | ||
| 876 | $PTR_ADD $rcon,4 | ||
| 877 | |||
| 878 | sw $rk0,0($key) | ||
| 879 | sw $rk1,4($key) | ||
| 880 | sw $rk2,8($key) | ||
| 881 | li $cnt,10 | ||
| 882 | sw $rk3,12($key) | ||
| 883 | li $t0,0 | ||
| 884 | sw $cnt,80($key) | ||
| 885 | b .Lekey_done | ||
| 886 | $PTR_SUB $key,10*16 | ||
| 887 | |||
| 888 | .align 4 | ||
| 889 | .L192bits: | ||
| 890 | .set reorder | ||
| 891 | srl $i0,$rk5,16 | ||
| 892 | srl $i1,$rk5,8 | ||
| 893 | and $i0,0xff | ||
| 894 | and $i1,0xff | ||
| 895 | and $i2,$rk5,0xff | ||
| 896 | srl $i3,$rk5,24 | ||
| 897 | $PTR_ADD $i0,$Tbl | ||
| 898 | $PTR_ADD $i1,$Tbl | ||
| 899 | $PTR_ADD $i2,$Tbl | ||
| 900 | $PTR_ADD $i3,$Tbl | ||
| 901 | lbu $i0,1024($i0) | ||
| 902 | lbu $i1,1024($i1) | ||
| 903 | lbu $i2,1024($i2) | ||
| 904 | lbu $i3,1024($i3) | ||
| 905 | |||
| 906 | sw $rk0,0($key) | ||
| 907 | sw $rk1,4($key) | ||
| 908 | sw $rk2,8($key) | ||
| 909 | sw $rk3,12($key) | ||
| 910 | sw $rk4,16($key) | ||
| 911 | sw $rk5,20($key) | ||
| 912 | sub $cnt,1 | ||
| 913 | $PTR_ADD $key,24 | ||
| 914 | |||
| 915 | _bias $i0,24 | ||
| 916 | _bias $i1,16 | ||
| 917 | _bias $i2,8 | ||
| 918 | _bias $i3,0 | ||
| 919 | |||
| 920 | xor $rk0,$i0 | ||
| 921 | lw $i0,0($rcon) | ||
| 922 | xor $rk0,$i1 | ||
| 923 | xor $rk0,$i2 | ||
| 924 | xor $rk0,$i3 | ||
| 925 | xor $rk0,$i0 | ||
| 926 | |||
| 927 | xor $rk1,$rk0 | ||
| 928 | xor $rk2,$rk1 | ||
| 929 | xor $rk3,$rk2 | ||
| 930 | xor $rk4,$rk3 | ||
| 931 | xor $rk5,$rk4 | ||
| 932 | |||
| 933 | .set noreorder | ||
| 934 | bnez $cnt,.L192bits | ||
| 935 | $PTR_ADD $rcon,4 | ||
| 936 | |||
| 937 | sw $rk0,0($key) | ||
| 938 | sw $rk1,4($key) | ||
| 939 | sw $rk2,8($key) | ||
| 940 | li $cnt,12 | ||
| 941 | sw $rk3,12($key) | ||
| 942 | li $t0,0 | ||
| 943 | sw $cnt,48($key) | ||
| 944 | b .Lekey_done | ||
| 945 | $PTR_SUB $key,12*16 | ||
| 946 | |||
| 947 | .align 4 | ||
| 948 | .L256bits: | ||
| 949 | .set reorder | ||
| 950 | srl $i0,$rk7,16 | ||
| 951 | srl $i1,$rk7,8 | ||
| 952 | and $i0,0xff | ||
| 953 | and $i1,0xff | ||
| 954 | and $i2,$rk7,0xff | ||
| 955 | srl $i3,$rk7,24 | ||
| 956 | $PTR_ADD $i0,$Tbl | ||
| 957 | $PTR_ADD $i1,$Tbl | ||
| 958 | $PTR_ADD $i2,$Tbl | ||
| 959 | $PTR_ADD $i3,$Tbl | ||
| 960 | lbu $i0,1024($i0) | ||
| 961 | lbu $i1,1024($i1) | ||
| 962 | lbu $i2,1024($i2) | ||
| 963 | lbu $i3,1024($i3) | ||
| 964 | |||
| 965 | sw $rk0,0($key) | ||
| 966 | sw $rk1,4($key) | ||
| 967 | sw $rk2,8($key) | ||
| 968 | sw $rk3,12($key) | ||
| 969 | sw $rk4,16($key) | ||
| 970 | sw $rk5,20($key) | ||
| 971 | sw $rk6,24($key) | ||
| 972 | sw $rk7,28($key) | ||
| 973 | sub $cnt,1 | ||
| 974 | |||
| 975 | _bias $i0,24 | ||
| 976 | _bias $i1,16 | ||
| 977 | _bias $i2,8 | ||
| 978 | _bias $i3,0 | ||
| 979 | |||
| 980 | xor $rk0,$i0 | ||
| 981 | lw $i0,0($rcon) | ||
| 982 | xor $rk0,$i1 | ||
| 983 | xor $rk0,$i2 | ||
| 984 | xor $rk0,$i3 | ||
| 985 | xor $rk0,$i0 | ||
| 986 | |||
| 987 | xor $rk1,$rk0 | ||
| 988 | xor $rk2,$rk1 | ||
| 989 | xor $rk3,$rk2 | ||
| 990 | beqz $cnt,.L256bits_done | ||
| 991 | |||
| 992 | srl $i0,$rk3,24 | ||
| 993 | srl $i1,$rk3,16 | ||
| 994 | srl $i2,$rk3,8 | ||
| 995 | and $i3,$rk3,0xff | ||
| 996 | and $i1,0xff | ||
| 997 | and $i2,0xff | ||
| 998 | $PTR_ADD $i0,$Tbl | ||
| 999 | $PTR_ADD $i1,$Tbl | ||
| 1000 | $PTR_ADD $i2,$Tbl | ||
| 1001 | $PTR_ADD $i3,$Tbl | ||
| 1002 | lbu $i0,1024($i0) | ||
| 1003 | lbu $i1,1024($i1) | ||
| 1004 | lbu $i2,1024($i2) | ||
| 1005 | lbu $i3,1024($i3) | ||
| 1006 | sll $i0,24 | ||
| 1007 | sll $i1,16 | ||
| 1008 | sll $i2,8 | ||
| 1009 | |||
| 1010 | xor $rk4,$i0 | ||
| 1011 | xor $rk4,$i1 | ||
| 1012 | xor $rk4,$i2 | ||
| 1013 | xor $rk4,$i3 | ||
| 1014 | |||
| 1015 | xor $rk5,$rk4 | ||
| 1016 | xor $rk6,$rk5 | ||
| 1017 | xor $rk7,$rk6 | ||
| 1018 | |||
| 1019 | $PTR_ADD $key,32 | ||
| 1020 | .set noreorder | ||
| 1021 | b .L256bits | ||
| 1022 | $PTR_ADD $rcon,4 | ||
| 1023 | |||
| 1024 | .L256bits_done: | ||
| 1025 | sw $rk0,32($key) | ||
| 1026 | sw $rk1,36($key) | ||
| 1027 | sw $rk2,40($key) | ||
| 1028 | li $cnt,14 | ||
| 1029 | sw $rk3,44($key) | ||
| 1030 | li $t0,0 | ||
| 1031 | sw $cnt,48($key) | ||
| 1032 | $PTR_SUB $key,12*16 | ||
| 1033 | |||
| 1034 | .Lekey_done: | ||
| 1035 | jr $ra | ||
| 1036 | nop | ||
| 1037 | .end _mips_AES_set_encrypt_key | ||
| 1038 | |||
| 1039 | .globl AES_set_encrypt_key | ||
| 1040 | .ent AES_set_encrypt_key | ||
| 1041 | AES_set_encrypt_key: | ||
| 1042 | .frame $sp,$FRAMESIZE,$ra | ||
| 1043 | .mask $SAVED_REGS_MASK,-$SZREG | ||
| 1044 | .set noreorder | ||
| 1045 | ___ | ||
| 1046 | $code.=<<___ if ($flavour =~ /o32/i); # o32 PIC-ification | ||
| 1047 | .cpload $pf | ||
| 1048 | ___ | ||
| 1049 | $code.=<<___; | ||
| 1050 | $PTR_SUB $sp,$FRAMESIZE | ||
| 1051 | $REG_S $ra,$FRAMESIZE-1*$SZREG($sp) | ||
| 1052 | $REG_S $fp,$FRAMESIZE-2*$SZREG($sp) | ||
| 1053 | ___ | ||
| 1054 | $code.=<<___ if ($flavour =~ /nubi/i); # optimize non-nubi prologue | ||
| 1055 | $REG_S $s3,$FRAMESIZE-3*$SZREG($sp) | ||
| 1056 | $REG_S $s2,$FRAMESIZE-4*$SZREG($sp) | ||
| 1057 | $REG_S $s1,$FRAMESIZE-5*$SZREG($sp) | ||
| 1058 | $REG_S $s0,$FRAMESIZE-6*$SZREG($sp) | ||
| 1059 | $REG_S $gp,$FRAMESIZE-7*$SZREG($sp) | ||
| 1060 | ___ | ||
| 1061 | $code.=<<___ if ($flavour !~ /o32/i); # non-o32 PIC-ification | ||
| 1062 | .cplocal $Tbl | ||
| 1063 | .cpsetup $pf,$zero,AES_set_encrypt_key | ||
| 1064 | ___ | ||
| 1065 | $code.=<<___; | ||
| 1066 | .set reorder | ||
| 1067 | la $Tbl,AES_Te # PIC-ified 'load address' | ||
| 1068 | |||
| 1069 | bal _mips_AES_set_encrypt_key | ||
| 1070 | |||
| 1071 | .set noreorder | ||
| 1072 | move $a0,$t0 | ||
| 1073 | $REG_L $ra,$FRAMESIZE-1*$SZREG($sp) | ||
| 1074 | $REG_L $fp,$FRAMESIZE-2*$SZREG($sp) | ||
| 1075 | ___ | ||
| 1076 | $code.=<<___ if ($flavour =~ /nubi/i); # nubi epilogue: reload from the same frame slots (3..7) the nubi prologue stored to | ||
| 1077 | $REG_L $s3,$FRAMESIZE-3*$SZREG($sp) | ||
| 1078 | $REG_L $s2,$FRAMESIZE-4*$SZREG($sp) | ||
| 1079 | $REG_L $s1,$FRAMESIZE-5*$SZREG($sp) | ||
| 1080 | $REG_L $s0,$FRAMESIZE-6*$SZREG($sp) | ||
| 1081 | $REG_L $gp,$FRAMESIZE-7*$SZREG($sp) | ||
| 1082 | ___ | ||
| 1083 | $code.=<<___; | ||
| 1084 | jr $ra | ||
| 1085 | $PTR_ADD $sp,$FRAMESIZE | ||
| 1086 | .end AES_set_encrypt_key | ||
| 1087 | ___ | ||
| 1088 | |||
| 1089 | my ($head,$tail)=($inp,$bits); | ||
| 1090 | my ($tp1,$tp2,$tp4,$tp8,$tp9,$tpb,$tpd,$tpe)=($a4,$a5,$a6,$a7,$s0,$s1,$s2,$s3); | ||
| 1091 | my ($m,$x80808080,$x7f7f7f7f,$x1b1b1b1b)=($at,$t0,$t1,$t2); | ||
| 1092 | $code.=<<___; | ||
| 1093 | .align 5 | ||
| 1094 | .globl AES_set_decrypt_key | ||
| 1095 | .ent AES_set_decrypt_key | ||
| 1096 | AES_set_decrypt_key: | ||
| 1097 | .frame $sp,$FRAMESIZE,$ra | ||
| 1098 | .mask $SAVED_REGS_MASK,-$SZREG | ||
| 1099 | .set noreorder | ||
| 1100 | ___ | ||
| 1101 | $code.=<<___ if ($flavour =~ /o32/i); # o32 PIC-ification | ||
| 1102 | .cpload $pf | ||
| 1103 | ___ | ||
| 1104 | $code.=<<___; | ||
| 1105 | $PTR_SUB $sp,$FRAMESIZE | ||
| 1106 | $REG_S $ra,$FRAMESIZE-1*$SZREG($sp) | ||
| 1107 | $REG_S $fp,$FRAMESIZE-2*$SZREG($sp) | ||
| 1108 | ___ | ||
| 1109 | $code.=<<___ if ($flavour =~ /nubi/i); # optimize non-nubi prologue | ||
| 1110 | $REG_S $s3,$FRAMESIZE-3*$SZREG($sp) | ||
| 1111 | $REG_S $s2,$FRAMESIZE-4*$SZREG($sp) | ||
| 1112 | $REG_S $s1,$FRAMESIZE-5*$SZREG($sp) | ||
| 1113 | $REG_S $s0,$FRAMESIZE-6*$SZREG($sp) | ||
| 1114 | $REG_S $gp,$FRAMESIZE-7*$SZREG($sp) | ||
| 1115 | ___ | ||
| 1116 | $code.=<<___ if ($flavour !~ /o32/i); # non-o32 PIC-ification | ||
| 1117 | .cplocal $Tbl | ||
| 1118 | .cpsetup $pf,$zero,AES_set_decrypt_key | ||
| 1119 | ___ | ||
| 1120 | $code.=<<___; | ||
| 1121 | .set reorder | ||
| 1122 | la $Tbl,AES_Te # PIC-ified 'load address' | ||
| 1123 | |||
| 1124 | bal _mips_AES_set_encrypt_key | ||
| 1125 | |||
| 1126 | bltz $t0,.Ldkey_done | ||
| 1127 | |||
| 1128 | sll $at,$cnt,4 | ||
| 1129 | $PTR_ADD $head,$key,0 | ||
| 1130 | $PTR_ADD $tail,$key,$at | ||
| 1131 | .align 4 | ||
| 1132 | .Lswap: | ||
| 1133 | lw $rk0,0($head) | ||
| 1134 | lw $rk1,4($head) | ||
| 1135 | lw $rk2,8($head) | ||
| 1136 | lw $rk3,12($head) | ||
| 1137 | lw $rk4,0($tail) | ||
| 1138 | lw $rk5,4($tail) | ||
| 1139 | lw $rk6,8($tail) | ||
| 1140 | lw $rk7,12($tail) | ||
| 1141 | sw $rk0,0($tail) | ||
| 1142 | sw $rk1,4($tail) | ||
| 1143 | sw $rk2,8($tail) | ||
| 1144 | sw $rk3,12($tail) | ||
| 1145 | $PTR_ADD $head,16 | ||
| 1146 | $PTR_SUB $tail,16 | ||
| 1147 | sw $rk4,-16($head) | ||
| 1148 | sw $rk5,-12($head) | ||
| 1149 | sw $rk6,-8($head) | ||
| 1150 | sw $rk7,-4($head) | ||
| 1151 | bne $head,$tail,.Lswap | ||
| 1152 | |||
| 1153 | lw $tp1,16($key) # modulo-scheduled | ||
| 1154 | lui $x80808080,0x8080 | ||
| 1155 | sub $cnt,1 | ||
| 1156 | or $x80808080,0x8080 | ||
| 1157 | sll $cnt,2 | ||
| 1158 | $PTR_ADD $key,16 | ||
| 1159 | lui $x1b1b1b1b,0x1b1b | ||
| 1160 | nor $x7f7f7f7f,$zero,$x80808080 | ||
| 1161 | or $x1b1b1b1b,0x1b1b | ||
| 1162 | .align 4 | ||
| 1163 | .Lmix: | ||
| 1164 | and $m,$tp1,$x80808080 | ||
| 1165 | and $tp2,$tp1,$x7f7f7f7f | ||
| 1166 | srl $tp4,$m,7 | ||
| 1167 | addu $tp2,$tp2 # tp2<<1 | ||
| 1168 | subu $m,$tp4 | ||
| 1169 | and $m,$x1b1b1b1b | ||
| 1170 | xor $tp2,$m | ||
| 1171 | |||
| 1172 | and $m,$tp2,$x80808080 | ||
| 1173 | and $tp4,$tp2,$x7f7f7f7f | ||
| 1174 | srl $tp8,$m,7 | ||
| 1175 | addu $tp4,$tp4 # tp4<<1 | ||
| 1176 | subu $m,$tp8 | ||
| 1177 | and $m,$x1b1b1b1b | ||
| 1178 | xor $tp4,$m | ||
| 1179 | |||
| 1180 | and $m,$tp4,$x80808080 | ||
| 1181 | and $tp8,$tp4,$x7f7f7f7f | ||
| 1182 | srl $tp9,$m,7 | ||
| 1183 | addu $tp8,$tp8 # tp8<<1 | ||
| 1184 | subu $m,$tp9 | ||
| 1185 | and $m,$x1b1b1b1b | ||
| 1186 | xor $tp8,$m | ||
| 1187 | |||
| 1188 | xor $tp9,$tp8,$tp1 | ||
| 1189 | xor $tpe,$tp8,$tp4 | ||
| 1190 | xor $tpb,$tp9,$tp2 | ||
| 1191 | xor $tpd,$tp9,$tp4 | ||
| 1192 | |||
| 1193 | _ror $tp1,$tpd,16 | ||
| 1194 | xor $tpe,$tp2 | ||
| 1195 | _ror $tp2,$tpd,-16 | ||
| 1196 | xor $tpe,$tp1 | ||
| 1197 | _ror $tp1,$tp9,8 | ||
| 1198 | xor $tpe,$tp2 | ||
| 1199 | _ror $tp2,$tp9,-24 | ||
| 1200 | xor $tpe,$tp1 | ||
| 1201 | _ror $tp1,$tpb,24 | ||
| 1202 | xor $tpe,$tp2 | ||
| 1203 | _ror $tp2,$tpb,-8 | ||
| 1204 | xor $tpe,$tp1 | ||
| 1205 | lw $tp1,4($key) # modulo-scheduled | ||
| 1206 | xor $tpe,$tp2 | ||
| 1207 | sub $cnt,1 | ||
| 1208 | sw $tpe,0($key) | ||
| 1209 | $PTR_ADD $key,4 | ||
| 1210 | bnez $cnt,.Lmix | ||
| 1211 | |||
| 1212 | li $t0,0 | ||
| 1213 | .Ldkey_done: | ||
| 1214 | .set noreorder | ||
| 1215 | move $a0,$t0 | ||
| 1216 | $REG_L $ra,$FRAMESIZE-1*$SZREG($sp) | ||
| 1217 | $REG_L $fp,$FRAMESIZE-2*$SZREG($sp) | ||
| 1218 | ___ | ||
| 1219 | $code.=<<___ if ($flavour =~ /nubi/i); # nubi epilogue: reload from the same frame slots (3..7) the nubi prologue stored to | ||
| 1220 | $REG_L $s3,$FRAMESIZE-3*$SZREG($sp) | ||
| 1221 | $REG_L $s2,$FRAMESIZE-4*$SZREG($sp) | ||
| 1222 | $REG_L $s1,$FRAMESIZE-5*$SZREG($sp) | ||
| 1223 | $REG_L $s0,$FRAMESIZE-6*$SZREG($sp) | ||
| 1224 | $REG_L $gp,$FRAMESIZE-7*$SZREG($sp) | ||
| 1225 | ___ | ||
| 1226 | $code.=<<___; | ||
| 1227 | jr $ra | ||
| 1228 | $PTR_ADD $sp,$FRAMESIZE | ||
| 1229 | .end AES_set_decrypt_key | ||
| 1230 | ___ | ||
| 1231 | }}} | ||
| 1232 | |||
| 1233 | ###################################################################### | ||
| 1234 | # Tables are kept in endian-neutral manner | ||
| 1235 | $code.=<<___; | ||
| 1236 | .rdata | ||
| 1237 | .align 6 | ||
| 1238 | AES_Te: | ||
| 1239 | .byte 0xc6,0x63,0x63,0xa5, 0xf8,0x7c,0x7c,0x84 # Te0 | ||
| 1240 | .byte 0xee,0x77,0x77,0x99, 0xf6,0x7b,0x7b,0x8d | ||
| 1241 | .byte 0xff,0xf2,0xf2,0x0d, 0xd6,0x6b,0x6b,0xbd | ||
| 1242 | .byte 0xde,0x6f,0x6f,0xb1, 0x91,0xc5,0xc5,0x54 | ||
| 1243 | .byte 0x60,0x30,0x30,0x50, 0x02,0x01,0x01,0x03 | ||
| 1244 | .byte 0xce,0x67,0x67,0xa9, 0x56,0x2b,0x2b,0x7d | ||
| 1245 | .byte 0xe7,0xfe,0xfe,0x19, 0xb5,0xd7,0xd7,0x62 | ||
| 1246 | .byte 0x4d,0xab,0xab,0xe6, 0xec,0x76,0x76,0x9a | ||
| 1247 | .byte 0x8f,0xca,0xca,0x45, 0x1f,0x82,0x82,0x9d | ||
| 1248 | .byte 0x89,0xc9,0xc9,0x40, 0xfa,0x7d,0x7d,0x87 | ||
| 1249 | .byte 0xef,0xfa,0xfa,0x15, 0xb2,0x59,0x59,0xeb | ||
| 1250 | .byte 0x8e,0x47,0x47,0xc9, 0xfb,0xf0,0xf0,0x0b | ||
| 1251 | .byte 0x41,0xad,0xad,0xec, 0xb3,0xd4,0xd4,0x67 | ||
| 1252 | .byte 0x5f,0xa2,0xa2,0xfd, 0x45,0xaf,0xaf,0xea | ||
| 1253 | .byte 0x23,0x9c,0x9c,0xbf, 0x53,0xa4,0xa4,0xf7 | ||
| 1254 | .byte 0xe4,0x72,0x72,0x96, 0x9b,0xc0,0xc0,0x5b | ||
| 1255 | .byte 0x75,0xb7,0xb7,0xc2, 0xe1,0xfd,0xfd,0x1c | ||
| 1256 | .byte 0x3d,0x93,0x93,0xae, 0x4c,0x26,0x26,0x6a | ||
| 1257 | .byte 0x6c,0x36,0x36,0x5a, 0x7e,0x3f,0x3f,0x41 | ||
| 1258 | .byte 0xf5,0xf7,0xf7,0x02, 0x83,0xcc,0xcc,0x4f | ||
| 1259 | .byte 0x68,0x34,0x34,0x5c, 0x51,0xa5,0xa5,0xf4 | ||
| 1260 | .byte 0xd1,0xe5,0xe5,0x34, 0xf9,0xf1,0xf1,0x08 | ||
| 1261 | .byte 0xe2,0x71,0x71,0x93, 0xab,0xd8,0xd8,0x73 | ||
| 1262 | .byte 0x62,0x31,0x31,0x53, 0x2a,0x15,0x15,0x3f | ||
| 1263 | .byte 0x08,0x04,0x04,0x0c, 0x95,0xc7,0xc7,0x52 | ||
| 1264 | .byte 0x46,0x23,0x23,0x65, 0x9d,0xc3,0xc3,0x5e | ||
| 1265 | .byte 0x30,0x18,0x18,0x28, 0x37,0x96,0x96,0xa1 | ||
| 1266 | .byte 0x0a,0x05,0x05,0x0f, 0x2f,0x9a,0x9a,0xb5 | ||
| 1267 | .byte 0x0e,0x07,0x07,0x09, 0x24,0x12,0x12,0x36 | ||
| 1268 | .byte 0x1b,0x80,0x80,0x9b, 0xdf,0xe2,0xe2,0x3d | ||
| 1269 | .byte 0xcd,0xeb,0xeb,0x26, 0x4e,0x27,0x27,0x69 | ||
| 1270 | .byte 0x7f,0xb2,0xb2,0xcd, 0xea,0x75,0x75,0x9f | ||
| 1271 | .byte 0x12,0x09,0x09,0x1b, 0x1d,0x83,0x83,0x9e | ||
| 1272 | .byte 0x58,0x2c,0x2c,0x74, 0x34,0x1a,0x1a,0x2e | ||
| 1273 | .byte 0x36,0x1b,0x1b,0x2d, 0xdc,0x6e,0x6e,0xb2 | ||
| 1274 | .byte 0xb4,0x5a,0x5a,0xee, 0x5b,0xa0,0xa0,0xfb | ||
| 1275 | .byte 0xa4,0x52,0x52,0xf6, 0x76,0x3b,0x3b,0x4d | ||
| 1276 | .byte 0xb7,0xd6,0xd6,0x61, 0x7d,0xb3,0xb3,0xce | ||
| 1277 | .byte 0x52,0x29,0x29,0x7b, 0xdd,0xe3,0xe3,0x3e | ||
| 1278 | .byte 0x5e,0x2f,0x2f,0x71, 0x13,0x84,0x84,0x97 | ||
| 1279 | .byte 0xa6,0x53,0x53,0xf5, 0xb9,0xd1,0xd1,0x68 | ||
| 1280 | .byte 0x00,0x00,0x00,0x00, 0xc1,0xed,0xed,0x2c | ||
| 1281 | .byte 0x40,0x20,0x20,0x60, 0xe3,0xfc,0xfc,0x1f | ||
| 1282 | .byte 0x79,0xb1,0xb1,0xc8, 0xb6,0x5b,0x5b,0xed | ||
| 1283 | .byte 0xd4,0x6a,0x6a,0xbe, 0x8d,0xcb,0xcb,0x46 | ||
| 1284 | .byte 0x67,0xbe,0xbe,0xd9, 0x72,0x39,0x39,0x4b | ||
| 1285 | .byte 0x94,0x4a,0x4a,0xde, 0x98,0x4c,0x4c,0xd4 | ||
| 1286 | .byte 0xb0,0x58,0x58,0xe8, 0x85,0xcf,0xcf,0x4a | ||
| 1287 | .byte 0xbb,0xd0,0xd0,0x6b, 0xc5,0xef,0xef,0x2a | ||
| 1288 | .byte 0x4f,0xaa,0xaa,0xe5, 0xed,0xfb,0xfb,0x16 | ||
| 1289 | .byte 0x86,0x43,0x43,0xc5, 0x9a,0x4d,0x4d,0xd7 | ||
| 1290 | .byte 0x66,0x33,0x33,0x55, 0x11,0x85,0x85,0x94 | ||
| 1291 | .byte 0x8a,0x45,0x45,0xcf, 0xe9,0xf9,0xf9,0x10 | ||
| 1292 | .byte 0x04,0x02,0x02,0x06, 0xfe,0x7f,0x7f,0x81 | ||
| 1293 | .byte 0xa0,0x50,0x50,0xf0, 0x78,0x3c,0x3c,0x44 | ||
| 1294 | .byte 0x25,0x9f,0x9f,0xba, 0x4b,0xa8,0xa8,0xe3 | ||
| 1295 | .byte 0xa2,0x51,0x51,0xf3, 0x5d,0xa3,0xa3,0xfe | ||
| 1296 | .byte 0x80,0x40,0x40,0xc0, 0x05,0x8f,0x8f,0x8a | ||
| 1297 | .byte 0x3f,0x92,0x92,0xad, 0x21,0x9d,0x9d,0xbc | ||
| 1298 | .byte 0x70,0x38,0x38,0x48, 0xf1,0xf5,0xf5,0x04 | ||
| 1299 | .byte 0x63,0xbc,0xbc,0xdf, 0x77,0xb6,0xb6,0xc1 | ||
| 1300 | .byte 0xaf,0xda,0xda,0x75, 0x42,0x21,0x21,0x63 | ||
| 1301 | .byte 0x20,0x10,0x10,0x30, 0xe5,0xff,0xff,0x1a | ||
| 1302 | .byte 0xfd,0xf3,0xf3,0x0e, 0xbf,0xd2,0xd2,0x6d | ||
| 1303 | .byte 0x81,0xcd,0xcd,0x4c, 0x18,0x0c,0x0c,0x14 | ||
| 1304 | .byte 0x26,0x13,0x13,0x35, 0xc3,0xec,0xec,0x2f | ||
| 1305 | .byte 0xbe,0x5f,0x5f,0xe1, 0x35,0x97,0x97,0xa2 | ||
| 1306 | .byte 0x88,0x44,0x44,0xcc, 0x2e,0x17,0x17,0x39 | ||
| 1307 | .byte 0x93,0xc4,0xc4,0x57, 0x55,0xa7,0xa7,0xf2 | ||
| 1308 | .byte 0xfc,0x7e,0x7e,0x82, 0x7a,0x3d,0x3d,0x47 | ||
| 1309 | .byte 0xc8,0x64,0x64,0xac, 0xba,0x5d,0x5d,0xe7 | ||
| 1310 | .byte 0x32,0x19,0x19,0x2b, 0xe6,0x73,0x73,0x95 | ||
| 1311 | .byte 0xc0,0x60,0x60,0xa0, 0x19,0x81,0x81,0x98 | ||
| 1312 | .byte 0x9e,0x4f,0x4f,0xd1, 0xa3,0xdc,0xdc,0x7f | ||
| 1313 | .byte 0x44,0x22,0x22,0x66, 0x54,0x2a,0x2a,0x7e | ||
| 1314 | .byte 0x3b,0x90,0x90,0xab, 0x0b,0x88,0x88,0x83 | ||
| 1315 | .byte 0x8c,0x46,0x46,0xca, 0xc7,0xee,0xee,0x29 | ||
| 1316 | .byte 0x6b,0xb8,0xb8,0xd3, 0x28,0x14,0x14,0x3c | ||
| 1317 | .byte 0xa7,0xde,0xde,0x79, 0xbc,0x5e,0x5e,0xe2 | ||
| 1318 | .byte 0x16,0x0b,0x0b,0x1d, 0xad,0xdb,0xdb,0x76 | ||
| 1319 | .byte 0xdb,0xe0,0xe0,0x3b, 0x64,0x32,0x32,0x56 | ||
| 1320 | .byte 0x74,0x3a,0x3a,0x4e, 0x14,0x0a,0x0a,0x1e | ||
| 1321 | .byte 0x92,0x49,0x49,0xdb, 0x0c,0x06,0x06,0x0a | ||
| 1322 | .byte 0x48,0x24,0x24,0x6c, 0xb8,0x5c,0x5c,0xe4 | ||
| 1323 | .byte 0x9f,0xc2,0xc2,0x5d, 0xbd,0xd3,0xd3,0x6e | ||
| 1324 | .byte 0x43,0xac,0xac,0xef, 0xc4,0x62,0x62,0xa6 | ||
| 1325 | .byte 0x39,0x91,0x91,0xa8, 0x31,0x95,0x95,0xa4 | ||
| 1326 | .byte 0xd3,0xe4,0xe4,0x37, 0xf2,0x79,0x79,0x8b | ||
| 1327 | .byte 0xd5,0xe7,0xe7,0x32, 0x8b,0xc8,0xc8,0x43 | ||
| 1328 | .byte 0x6e,0x37,0x37,0x59, 0xda,0x6d,0x6d,0xb7 | ||
| 1329 | .byte 0x01,0x8d,0x8d,0x8c, 0xb1,0xd5,0xd5,0x64 | ||
| 1330 | .byte 0x9c,0x4e,0x4e,0xd2, 0x49,0xa9,0xa9,0xe0 | ||
| 1331 | .byte 0xd8,0x6c,0x6c,0xb4, 0xac,0x56,0x56,0xfa | ||
| 1332 | .byte 0xf3,0xf4,0xf4,0x07, 0xcf,0xea,0xea,0x25 | ||
| 1333 | .byte 0xca,0x65,0x65,0xaf, 0xf4,0x7a,0x7a,0x8e | ||
| 1334 | .byte 0x47,0xae,0xae,0xe9, 0x10,0x08,0x08,0x18 | ||
| 1335 | .byte 0x6f,0xba,0xba,0xd5, 0xf0,0x78,0x78,0x88 | ||
| 1336 | .byte 0x4a,0x25,0x25,0x6f, 0x5c,0x2e,0x2e,0x72 | ||
| 1337 | .byte 0x38,0x1c,0x1c,0x24, 0x57,0xa6,0xa6,0xf1 | ||
| 1338 | .byte 0x73,0xb4,0xb4,0xc7, 0x97,0xc6,0xc6,0x51 | ||
| 1339 | .byte 0xcb,0xe8,0xe8,0x23, 0xa1,0xdd,0xdd,0x7c | ||
| 1340 | .byte 0xe8,0x74,0x74,0x9c, 0x3e,0x1f,0x1f,0x21 | ||
| 1341 | .byte 0x96,0x4b,0x4b,0xdd, 0x61,0xbd,0xbd,0xdc | ||
| 1342 | .byte 0x0d,0x8b,0x8b,0x86, 0x0f,0x8a,0x8a,0x85 | ||
| 1343 | .byte 0xe0,0x70,0x70,0x90, 0x7c,0x3e,0x3e,0x42 | ||
| 1344 | .byte 0x71,0xb5,0xb5,0xc4, 0xcc,0x66,0x66,0xaa | ||
| 1345 | .byte 0x90,0x48,0x48,0xd8, 0x06,0x03,0x03,0x05 | ||
| 1346 | .byte 0xf7,0xf6,0xf6,0x01, 0x1c,0x0e,0x0e,0x12 | ||
| 1347 | .byte 0xc2,0x61,0x61,0xa3, 0x6a,0x35,0x35,0x5f | ||
| 1348 | .byte 0xae,0x57,0x57,0xf9, 0x69,0xb9,0xb9,0xd0 | ||
| 1349 | .byte 0x17,0x86,0x86,0x91, 0x99,0xc1,0xc1,0x58 | ||
| 1350 | .byte 0x3a,0x1d,0x1d,0x27, 0x27,0x9e,0x9e,0xb9 | ||
| 1351 | .byte 0xd9,0xe1,0xe1,0x38, 0xeb,0xf8,0xf8,0x13 | ||
| 1352 | .byte 0x2b,0x98,0x98,0xb3, 0x22,0x11,0x11,0x33 | ||
| 1353 | .byte 0xd2,0x69,0x69,0xbb, 0xa9,0xd9,0xd9,0x70 | ||
| 1354 | .byte 0x07,0x8e,0x8e,0x89, 0x33,0x94,0x94,0xa7 | ||
| 1355 | .byte 0x2d,0x9b,0x9b,0xb6, 0x3c,0x1e,0x1e,0x22 | ||
| 1356 | .byte 0x15,0x87,0x87,0x92, 0xc9,0xe9,0xe9,0x20 | ||
| 1357 | .byte 0x87,0xce,0xce,0x49, 0xaa,0x55,0x55,0xff | ||
| 1358 | .byte 0x50,0x28,0x28,0x78, 0xa5,0xdf,0xdf,0x7a | ||
| 1359 | .byte 0x03,0x8c,0x8c,0x8f, 0x59,0xa1,0xa1,0xf8 | ||
| 1360 | .byte 0x09,0x89,0x89,0x80, 0x1a,0x0d,0x0d,0x17 | ||
| 1361 | .byte 0x65,0xbf,0xbf,0xda, 0xd7,0xe6,0xe6,0x31 | ||
| 1362 | .byte 0x84,0x42,0x42,0xc6, 0xd0,0x68,0x68,0xb8 | ||
| 1363 | .byte 0x82,0x41,0x41,0xc3, 0x29,0x99,0x99,0xb0 | ||
| 1364 | .byte 0x5a,0x2d,0x2d,0x77, 0x1e,0x0f,0x0f,0x11 | ||
| 1365 | .byte 0x7b,0xb0,0xb0,0xcb, 0xa8,0x54,0x54,0xfc | ||
| 1366 | .byte 0x6d,0xbb,0xbb,0xd6, 0x2c,0x16,0x16,0x3a | ||
| 1367 | |||
| 1368 | .byte 0x63, 0x7c, 0x77, 0x7b, 0xf2, 0x6b, 0x6f, 0xc5 # Te4 | ||
| 1369 | .byte 0x30, 0x01, 0x67, 0x2b, 0xfe, 0xd7, 0xab, 0x76 | ||
| 1370 | .byte 0xca, 0x82, 0xc9, 0x7d, 0xfa, 0x59, 0x47, 0xf0 | ||
| 1371 | .byte 0xad, 0xd4, 0xa2, 0xaf, 0x9c, 0xa4, 0x72, 0xc0 | ||
| 1372 | .byte 0xb7, 0xfd, 0x93, 0x26, 0x36, 0x3f, 0xf7, 0xcc | ||
| 1373 | .byte 0x34, 0xa5, 0xe5, 0xf1, 0x71, 0xd8, 0x31, 0x15 | ||
| 1374 | .byte 0x04, 0xc7, 0x23, 0xc3, 0x18, 0x96, 0x05, 0x9a | ||
| 1375 | .byte 0x07, 0x12, 0x80, 0xe2, 0xeb, 0x27, 0xb2, 0x75 | ||
| 1376 | .byte 0x09, 0x83, 0x2c, 0x1a, 0x1b, 0x6e, 0x5a, 0xa0 | ||
| 1377 | .byte 0x52, 0x3b, 0xd6, 0xb3, 0x29, 0xe3, 0x2f, 0x84 | ||
| 1378 | .byte 0x53, 0xd1, 0x00, 0xed, 0x20, 0xfc, 0xb1, 0x5b | ||
| 1379 | .byte 0x6a, 0xcb, 0xbe, 0x39, 0x4a, 0x4c, 0x58, 0xcf | ||
| 1380 | .byte 0xd0, 0xef, 0xaa, 0xfb, 0x43, 0x4d, 0x33, 0x85 | ||
| 1381 | .byte 0x45, 0xf9, 0x02, 0x7f, 0x50, 0x3c, 0x9f, 0xa8 | ||
| 1382 | .byte 0x51, 0xa3, 0x40, 0x8f, 0x92, 0x9d, 0x38, 0xf5 | ||
| 1383 | .byte 0xbc, 0xb6, 0xda, 0x21, 0x10, 0xff, 0xf3, 0xd2 | ||
| 1384 | .byte 0xcd, 0x0c, 0x13, 0xec, 0x5f, 0x97, 0x44, 0x17 | ||
| 1385 | .byte 0xc4, 0xa7, 0x7e, 0x3d, 0x64, 0x5d, 0x19, 0x73 | ||
| 1386 | .byte 0x60, 0x81, 0x4f, 0xdc, 0x22, 0x2a, 0x90, 0x88 | ||
| 1387 | .byte 0x46, 0xee, 0xb8, 0x14, 0xde, 0x5e, 0x0b, 0xdb | ||
| 1388 | .byte 0xe0, 0x32, 0x3a, 0x0a, 0x49, 0x06, 0x24, 0x5c | ||
| 1389 | .byte 0xc2, 0xd3, 0xac, 0x62, 0x91, 0x95, 0xe4, 0x79 | ||
| 1390 | .byte 0xe7, 0xc8, 0x37, 0x6d, 0x8d, 0xd5, 0x4e, 0xa9 | ||
| 1391 | .byte 0x6c, 0x56, 0xf4, 0xea, 0x65, 0x7a, 0xae, 0x08 | ||
| 1392 | .byte 0xba, 0x78, 0x25, 0x2e, 0x1c, 0xa6, 0xb4, 0xc6 | ||
| 1393 | .byte 0xe8, 0xdd, 0x74, 0x1f, 0x4b, 0xbd, 0x8b, 0x8a | ||
| 1394 | .byte 0x70, 0x3e, 0xb5, 0x66, 0x48, 0x03, 0xf6, 0x0e | ||
| 1395 | .byte 0x61, 0x35, 0x57, 0xb9, 0x86, 0xc1, 0x1d, 0x9e | ||
| 1396 | .byte 0xe1, 0xf8, 0x98, 0x11, 0x69, 0xd9, 0x8e, 0x94 | ||
| 1397 | .byte 0x9b, 0x1e, 0x87, 0xe9, 0xce, 0x55, 0x28, 0xdf | ||
| 1398 | .byte 0x8c, 0xa1, 0x89, 0x0d, 0xbf, 0xe6, 0x42, 0x68 | ||
| 1399 | .byte 0x41, 0x99, 0x2d, 0x0f, 0xb0, 0x54, 0xbb, 0x16 | ||
| 1400 | |||
| 1401 | .byte 0x01,0x00,0x00,0x00, 0x02,0x00,0x00,0x00 # rcon | ||
| 1402 | .byte 0x04,0x00,0x00,0x00, 0x08,0x00,0x00,0x00 | ||
| 1403 | .byte 0x10,0x00,0x00,0x00, 0x20,0x00,0x00,0x00 | ||
| 1404 | .byte 0x40,0x00,0x00,0x00, 0x80,0x00,0x00,0x00 | ||
| 1405 | .byte 0x1B,0x00,0x00,0x00, 0x36,0x00,0x00,0x00 | ||
| 1406 | |||
| 1407 | .align 6 | ||
| 1408 | AES_Td: | ||
| 1409 | .byte 0x51,0xf4,0xa7,0x50, 0x7e,0x41,0x65,0x53 # Td0 | ||
| 1410 | .byte 0x1a,0x17,0xa4,0xc3, 0x3a,0x27,0x5e,0x96 | ||
| 1411 | .byte 0x3b,0xab,0x6b,0xcb, 0x1f,0x9d,0x45,0xf1 | ||
| 1412 | .byte 0xac,0xfa,0x58,0xab, 0x4b,0xe3,0x03,0x93 | ||
| 1413 | .byte 0x20,0x30,0xfa,0x55, 0xad,0x76,0x6d,0xf6 | ||
| 1414 | .byte 0x88,0xcc,0x76,0x91, 0xf5,0x02,0x4c,0x25 | ||
| 1415 | .byte 0x4f,0xe5,0xd7,0xfc, 0xc5,0x2a,0xcb,0xd7 | ||
| 1416 | .byte 0x26,0x35,0x44,0x80, 0xb5,0x62,0xa3,0x8f | ||
| 1417 | .byte 0xde,0xb1,0x5a,0x49, 0x25,0xba,0x1b,0x67 | ||
| 1418 | .byte 0x45,0xea,0x0e,0x98, 0x5d,0xfe,0xc0,0xe1 | ||
| 1419 | .byte 0xc3,0x2f,0x75,0x02, 0x81,0x4c,0xf0,0x12 | ||
| 1420 | .byte 0x8d,0x46,0x97,0xa3, 0x6b,0xd3,0xf9,0xc6 | ||
| 1421 | .byte 0x03,0x8f,0x5f,0xe7, 0x15,0x92,0x9c,0x95 | ||
| 1422 | .byte 0xbf,0x6d,0x7a,0xeb, 0x95,0x52,0x59,0xda | ||
| 1423 | .byte 0xd4,0xbe,0x83,0x2d, 0x58,0x74,0x21,0xd3 | ||
| 1424 | .byte 0x49,0xe0,0x69,0x29, 0x8e,0xc9,0xc8,0x44 | ||
| 1425 | .byte 0x75,0xc2,0x89,0x6a, 0xf4,0x8e,0x79,0x78 | ||
| 1426 | .byte 0x99,0x58,0x3e,0x6b, 0x27,0xb9,0x71,0xdd | ||
| 1427 | .byte 0xbe,0xe1,0x4f,0xb6, 0xf0,0x88,0xad,0x17 | ||
| 1428 | .byte 0xc9,0x20,0xac,0x66, 0x7d,0xce,0x3a,0xb4 | ||
| 1429 | .byte 0x63,0xdf,0x4a,0x18, 0xe5,0x1a,0x31,0x82 | ||
| 1430 | .byte 0x97,0x51,0x33,0x60, 0x62,0x53,0x7f,0x45 | ||
| 1431 | .byte 0xb1,0x64,0x77,0xe0, 0xbb,0x6b,0xae,0x84 | ||
| 1432 | .byte 0xfe,0x81,0xa0,0x1c, 0xf9,0x08,0x2b,0x94 | ||
| 1433 | .byte 0x70,0x48,0x68,0x58, 0x8f,0x45,0xfd,0x19 | ||
| 1434 | .byte 0x94,0xde,0x6c,0x87, 0x52,0x7b,0xf8,0xb7 | ||
| 1435 | .byte 0xab,0x73,0xd3,0x23, 0x72,0x4b,0x02,0xe2 | ||
| 1436 | .byte 0xe3,0x1f,0x8f,0x57, 0x66,0x55,0xab,0x2a | ||
| 1437 | .byte 0xb2,0xeb,0x28,0x07, 0x2f,0xb5,0xc2,0x03 | ||
| 1438 | .byte 0x86,0xc5,0x7b,0x9a, 0xd3,0x37,0x08,0xa5 | ||
| 1439 | .byte 0x30,0x28,0x87,0xf2, 0x23,0xbf,0xa5,0xb2 | ||
| 1440 | .byte 0x02,0x03,0x6a,0xba, 0xed,0x16,0x82,0x5c | ||
| 1441 | .byte 0x8a,0xcf,0x1c,0x2b, 0xa7,0x79,0xb4,0x92 | ||
| 1442 | .byte 0xf3,0x07,0xf2,0xf0, 0x4e,0x69,0xe2,0xa1 | ||
| 1443 | .byte 0x65,0xda,0xf4,0xcd, 0x06,0x05,0xbe,0xd5 | ||
| 1444 | .byte 0xd1,0x34,0x62,0x1f, 0xc4,0xa6,0xfe,0x8a | ||
| 1445 | .byte 0x34,0x2e,0x53,0x9d, 0xa2,0xf3,0x55,0xa0 | ||
| 1446 | .byte 0x05,0x8a,0xe1,0x32, 0xa4,0xf6,0xeb,0x75 | ||
| 1447 | .byte 0x0b,0x83,0xec,0x39, 0x40,0x60,0xef,0xaa | ||
| 1448 | .byte 0x5e,0x71,0x9f,0x06, 0xbd,0x6e,0x10,0x51 | ||
| 1449 | .byte 0x3e,0x21,0x8a,0xf9, 0x96,0xdd,0x06,0x3d | ||
| 1450 | .byte 0xdd,0x3e,0x05,0xae, 0x4d,0xe6,0xbd,0x46 | ||
| 1451 | .byte 0x91,0x54,0x8d,0xb5, 0x71,0xc4,0x5d,0x05 | ||
| 1452 | .byte 0x04,0x06,0xd4,0x6f, 0x60,0x50,0x15,0xff | ||
| 1453 | .byte 0x19,0x98,0xfb,0x24, 0xd6,0xbd,0xe9,0x97 | ||
| 1454 | .byte 0x89,0x40,0x43,0xcc, 0x67,0xd9,0x9e,0x77 | ||
| 1455 | .byte 0xb0,0xe8,0x42,0xbd, 0x07,0x89,0x8b,0x88 | ||
| 1456 | .byte 0xe7,0x19,0x5b,0x38, 0x79,0xc8,0xee,0xdb | ||
| 1457 | .byte 0xa1,0x7c,0x0a,0x47, 0x7c,0x42,0x0f,0xe9 | ||
| 1458 | .byte 0xf8,0x84,0x1e,0xc9, 0x00,0x00,0x00,0x00 | ||
| 1459 | .byte 0x09,0x80,0x86,0x83, 0x32,0x2b,0xed,0x48 | ||
| 1460 | .byte 0x1e,0x11,0x70,0xac, 0x6c,0x5a,0x72,0x4e | ||
| 1461 | .byte 0xfd,0x0e,0xff,0xfb, 0x0f,0x85,0x38,0x56 | ||
| 1462 | .byte 0x3d,0xae,0xd5,0x1e, 0x36,0x2d,0x39,0x27 | ||
| 1463 | .byte 0x0a,0x0f,0xd9,0x64, 0x68,0x5c,0xa6,0x21 | ||
| 1464 | .byte 0x9b,0x5b,0x54,0xd1, 0x24,0x36,0x2e,0x3a | ||
| 1465 | .byte 0x0c,0x0a,0x67,0xb1, 0x93,0x57,0xe7,0x0f | ||
| 1466 | .byte 0xb4,0xee,0x96,0xd2, 0x1b,0x9b,0x91,0x9e | ||
| 1467 | .byte 0x80,0xc0,0xc5,0x4f, 0x61,0xdc,0x20,0xa2 | ||
| 1468 | .byte 0x5a,0x77,0x4b,0x69, 0x1c,0x12,0x1a,0x16 | ||
| 1469 | .byte 0xe2,0x93,0xba,0x0a, 0xc0,0xa0,0x2a,0xe5 | ||
| 1470 | .byte 0x3c,0x22,0xe0,0x43, 0x12,0x1b,0x17,0x1d | ||
| 1471 | .byte 0x0e,0x09,0x0d,0x0b, 0xf2,0x8b,0xc7,0xad | ||
| 1472 | .byte 0x2d,0xb6,0xa8,0xb9, 0x14,0x1e,0xa9,0xc8 | ||
| 1473 | .byte 0x57,0xf1,0x19,0x85, 0xaf,0x75,0x07,0x4c | ||
| 1474 | .byte 0xee,0x99,0xdd,0xbb, 0xa3,0x7f,0x60,0xfd | ||
| 1475 | .byte 0xf7,0x01,0x26,0x9f, 0x5c,0x72,0xf5,0xbc | ||
| 1476 | .byte 0x44,0x66,0x3b,0xc5, 0x5b,0xfb,0x7e,0x34 | ||
| 1477 | .byte 0x8b,0x43,0x29,0x76, 0xcb,0x23,0xc6,0xdc | ||
| 1478 | .byte 0xb6,0xed,0xfc,0x68, 0xb8,0xe4,0xf1,0x63 | ||
| 1479 | .byte 0xd7,0x31,0xdc,0xca, 0x42,0x63,0x85,0x10 | ||
| 1480 | .byte 0x13,0x97,0x22,0x40, 0x84,0xc6,0x11,0x20 | ||
| 1481 | .byte 0x85,0x4a,0x24,0x7d, 0xd2,0xbb,0x3d,0xf8 | ||
| 1482 | .byte 0xae,0xf9,0x32,0x11, 0xc7,0x29,0xa1,0x6d | ||
| 1483 | .byte 0x1d,0x9e,0x2f,0x4b, 0xdc,0xb2,0x30,0xf3 | ||
| 1484 | .byte 0x0d,0x86,0x52,0xec, 0x77,0xc1,0xe3,0xd0 | ||
| 1485 | .byte 0x2b,0xb3,0x16,0x6c, 0xa9,0x70,0xb9,0x99 | ||
| 1486 | .byte 0x11,0x94,0x48,0xfa, 0x47,0xe9,0x64,0x22 | ||
| 1487 | .byte 0xa8,0xfc,0x8c,0xc4, 0xa0,0xf0,0x3f,0x1a | ||
| 1488 | .byte 0x56,0x7d,0x2c,0xd8, 0x22,0x33,0x90,0xef | ||
| 1489 | .byte 0x87,0x49,0x4e,0xc7, 0xd9,0x38,0xd1,0xc1 | ||
| 1490 | .byte 0x8c,0xca,0xa2,0xfe, 0x98,0xd4,0x0b,0x36 | ||
| 1491 | .byte 0xa6,0xf5,0x81,0xcf, 0xa5,0x7a,0xde,0x28 | ||
| 1492 | .byte 0xda,0xb7,0x8e,0x26, 0x3f,0xad,0xbf,0xa4 | ||
| 1493 | .byte 0x2c,0x3a,0x9d,0xe4, 0x50,0x78,0x92,0x0d | ||
| 1494 | .byte 0x6a,0x5f,0xcc,0x9b, 0x54,0x7e,0x46,0x62 | ||
| 1495 | .byte 0xf6,0x8d,0x13,0xc2, 0x90,0xd8,0xb8,0xe8 | ||
| 1496 | .byte 0x2e,0x39,0xf7,0x5e, 0x82,0xc3,0xaf,0xf5 | ||
| 1497 | .byte 0x9f,0x5d,0x80,0xbe, 0x69,0xd0,0x93,0x7c | ||
| 1498 | .byte 0x6f,0xd5,0x2d,0xa9, 0xcf,0x25,0x12,0xb3 | ||
| 1499 | .byte 0xc8,0xac,0x99,0x3b, 0x10,0x18,0x7d,0xa7 | ||
| 1500 | .byte 0xe8,0x9c,0x63,0x6e, 0xdb,0x3b,0xbb,0x7b | ||
| 1501 | .byte 0xcd,0x26,0x78,0x09, 0x6e,0x59,0x18,0xf4 | ||
| 1502 | .byte 0xec,0x9a,0xb7,0x01, 0x83,0x4f,0x9a,0xa8 | ||
| 1503 | .byte 0xe6,0x95,0x6e,0x65, 0xaa,0xff,0xe6,0x7e | ||
| 1504 | .byte 0x21,0xbc,0xcf,0x08, 0xef,0x15,0xe8,0xe6 | ||
| 1505 | .byte 0xba,0xe7,0x9b,0xd9, 0x4a,0x6f,0x36,0xce | ||
| 1506 | .byte 0xea,0x9f,0x09,0xd4, 0x29,0xb0,0x7c,0xd6 | ||
| 1507 | .byte 0x31,0xa4,0xb2,0xaf, 0x2a,0x3f,0x23,0x31 | ||
| 1508 | .byte 0xc6,0xa5,0x94,0x30, 0x35,0xa2,0x66,0xc0 | ||
| 1509 | .byte 0x74,0x4e,0xbc,0x37, 0xfc,0x82,0xca,0xa6 | ||
| 1510 | .byte 0xe0,0x90,0xd0,0xb0, 0x33,0xa7,0xd8,0x15 | ||
| 1511 | .byte 0xf1,0x04,0x98,0x4a, 0x41,0xec,0xda,0xf7 | ||
| 1512 | .byte 0x7f,0xcd,0x50,0x0e, 0x17,0x91,0xf6,0x2f | ||
| 1513 | .byte 0x76,0x4d,0xd6,0x8d, 0x43,0xef,0xb0,0x4d | ||
| 1514 | .byte 0xcc,0xaa,0x4d,0x54, 0xe4,0x96,0x04,0xdf | ||
| 1515 | .byte 0x9e,0xd1,0xb5,0xe3, 0x4c,0x6a,0x88,0x1b | ||
| 1516 | .byte 0xc1,0x2c,0x1f,0xb8, 0x46,0x65,0x51,0x7f | ||
| 1517 | .byte 0x9d,0x5e,0xea,0x04, 0x01,0x8c,0x35,0x5d | ||
| 1518 | .byte 0xfa,0x87,0x74,0x73, 0xfb,0x0b,0x41,0x2e | ||
| 1519 | .byte 0xb3,0x67,0x1d,0x5a, 0x92,0xdb,0xd2,0x52 | ||
| 1520 | .byte 0xe9,0x10,0x56,0x33, 0x6d,0xd6,0x47,0x13 | ||
| 1521 | .byte 0x9a,0xd7,0x61,0x8c, 0x37,0xa1,0x0c,0x7a | ||
| 1522 | .byte 0x59,0xf8,0x14,0x8e, 0xeb,0x13,0x3c,0x89 | ||
| 1523 | .byte 0xce,0xa9,0x27,0xee, 0xb7,0x61,0xc9,0x35 | ||
| 1524 | .byte 0xe1,0x1c,0xe5,0xed, 0x7a,0x47,0xb1,0x3c | ||
| 1525 | .byte 0x9c,0xd2,0xdf,0x59, 0x55,0xf2,0x73,0x3f | ||
| 1526 | .byte 0x18,0x14,0xce,0x79, 0x73,0xc7,0x37,0xbf | ||
| 1527 | .byte 0x53,0xf7,0xcd,0xea, 0x5f,0xfd,0xaa,0x5b | ||
| 1528 | .byte 0xdf,0x3d,0x6f,0x14, 0x78,0x44,0xdb,0x86 | ||
| 1529 | .byte 0xca,0xaf,0xf3,0x81, 0xb9,0x68,0xc4,0x3e | ||
| 1530 | .byte 0x38,0x24,0x34,0x2c, 0xc2,0xa3,0x40,0x5f | ||
| 1531 | .byte 0x16,0x1d,0xc3,0x72, 0xbc,0xe2,0x25,0x0c | ||
| 1532 | .byte 0x28,0x3c,0x49,0x8b, 0xff,0x0d,0x95,0x41 | ||
| 1533 | .byte 0x39,0xa8,0x01,0x71, 0x08,0x0c,0xb3,0xde | ||
| 1534 | .byte 0xd8,0xb4,0xe4,0x9c, 0x64,0x56,0xc1,0x90 | ||
| 1535 | .byte 0x7b,0xcb,0x84,0x61, 0xd5,0x32,0xb6,0x70 | ||
| 1536 | .byte 0x48,0x6c,0x5c,0x74, 0xd0,0xb8,0x57,0x42 | ||
| 1537 | |||
| 1538 | .byte 0x52, 0x09, 0x6a, 0xd5, 0x30, 0x36, 0xa5, 0x38 # Td4 | ||
| 1539 | .byte 0xbf, 0x40, 0xa3, 0x9e, 0x81, 0xf3, 0xd7, 0xfb | ||
| 1540 | .byte 0x7c, 0xe3, 0x39, 0x82, 0x9b, 0x2f, 0xff, 0x87 | ||
| 1541 | .byte 0x34, 0x8e, 0x43, 0x44, 0xc4, 0xde, 0xe9, 0xcb | ||
| 1542 | .byte 0x54, 0x7b, 0x94, 0x32, 0xa6, 0xc2, 0x23, 0x3d | ||
| 1543 | .byte 0xee, 0x4c, 0x95, 0x0b, 0x42, 0xfa, 0xc3, 0x4e | ||
| 1544 | .byte 0x08, 0x2e, 0xa1, 0x66, 0x28, 0xd9, 0x24, 0xb2 | ||
| 1545 | .byte 0x76, 0x5b, 0xa2, 0x49, 0x6d, 0x8b, 0xd1, 0x25 | ||
| 1546 | .byte 0x72, 0xf8, 0xf6, 0x64, 0x86, 0x68, 0x98, 0x16 | ||
| 1547 | .byte 0xd4, 0xa4, 0x5c, 0xcc, 0x5d, 0x65, 0xb6, 0x92 | ||
| 1548 | .byte 0x6c, 0x70, 0x48, 0x50, 0xfd, 0xed, 0xb9, 0xda | ||
| 1549 | .byte 0x5e, 0x15, 0x46, 0x57, 0xa7, 0x8d, 0x9d, 0x84 | ||
| 1550 | .byte 0x90, 0xd8, 0xab, 0x00, 0x8c, 0xbc, 0xd3, 0x0a | ||
| 1551 | .byte 0xf7, 0xe4, 0x58, 0x05, 0xb8, 0xb3, 0x45, 0x06 | ||
| 1552 | .byte 0xd0, 0x2c, 0x1e, 0x8f, 0xca, 0x3f, 0x0f, 0x02 | ||
| 1553 | .byte 0xc1, 0xaf, 0xbd, 0x03, 0x01, 0x13, 0x8a, 0x6b | ||
| 1554 | .byte 0x3a, 0x91, 0x11, 0x41, 0x4f, 0x67, 0xdc, 0xea | ||
| 1555 | .byte 0x97, 0xf2, 0xcf, 0xce, 0xf0, 0xb4, 0xe6, 0x73 | ||
| 1556 | .byte 0x96, 0xac, 0x74, 0x22, 0xe7, 0xad, 0x35, 0x85 | ||
| 1557 | .byte 0xe2, 0xf9, 0x37, 0xe8, 0x1c, 0x75, 0xdf, 0x6e | ||
| 1558 | .byte 0x47, 0xf1, 0x1a, 0x71, 0x1d, 0x29, 0xc5, 0x89 | ||
| 1559 | .byte 0x6f, 0xb7, 0x62, 0x0e, 0xaa, 0x18, 0xbe, 0x1b | ||
| 1560 | .byte 0xfc, 0x56, 0x3e, 0x4b, 0xc6, 0xd2, 0x79, 0x20 | ||
| 1561 | .byte 0x9a, 0xdb, 0xc0, 0xfe, 0x78, 0xcd, 0x5a, 0xf4 | ||
| 1562 | .byte 0x1f, 0xdd, 0xa8, 0x33, 0x88, 0x07, 0xc7, 0x31 | ||
| 1563 | .byte 0xb1, 0x12, 0x10, 0x59, 0x27, 0x80, 0xec, 0x5f | ||
| 1564 | .byte 0x60, 0x51, 0x7f, 0xa9, 0x19, 0xb5, 0x4a, 0x0d | ||
| 1565 | .byte 0x2d, 0xe5, 0x7a, 0x9f, 0x93, 0xc9, 0x9c, 0xef | ||
| 1566 | .byte 0xa0, 0xe0, 0x3b, 0x4d, 0xae, 0x2a, 0xf5, 0xb0 | ||
| 1567 | .byte 0xc8, 0xeb, 0xbb, 0x3c, 0x83, 0x53, 0x99, 0x61 | ||
| 1568 | .byte 0x17, 0x2b, 0x04, 0x7e, 0xba, 0x77, 0xd6, 0x26 | ||
| 1569 | .byte 0xe1, 0x69, 0x14, 0x63, 0x55, 0x21, 0x0c, 0x7d | ||
| 1570 | ___ | ||
| 1571 | |||
| 1572 | foreach (split("\n",$code)) { | ||
| 1573 | s/\`([^\`]*)\`/eval $1/ge; | ||
| 1574 | |||
| 1575 | # Made-up instructions _xtr, _ins, _ror and _bias cope with byte order dependencies: each is rewritten to a real srl or sll whose shift count is chosen by $big_endian. | ||
| 1576 | # A two-operand "_op reg,n" is first widened to "_op reg,reg,n"; afterwards a negative-count srl becomes sll, "srl ...,0" becomes "and ...,0xff" and "sll ...,0" is commented out. | ||
| 1577 | if (/^\s+_/) { | ||
| 1578 | s/(_[a-z]+\s+)(\$[0-9]+),([^,]+)(#.*)*$/$1$2,$2,$3/; | ||
| 1579 | |||
| 1580 | s/_xtr\s+(\$[0-9]+),(\$[0-9]+),([0-9]+(\-2)*)/ | ||
| 1581 | sprintf("srl\t$1,$2,%d",$big_endian ? eval($3) | ||
| 1582 | : eval("24-$3"))/e or | ||
| 1583 | s/_ins\s+(\$[0-9]+),(\$[0-9]+),([0-9]+)/ | ||
| 1584 | sprintf("sll\t$1,$2,%d",$big_endian ? eval($3) | ||
| 1585 | : eval("24-$3"))/e or | ||
| 1586 | s/_ror\s+(\$[0-9]+),(\$[0-9]+),(\-?[0-9]+)/ | ||
| 1587 | sprintf("srl\t$1,$2,%d",$big_endian ? eval($3) | ||
| 1588 | : eval("$3*-1"))/e or | ||
| 1589 | s/_bias\s+(\$[0-9]+),(\$[0-9]+),([0-9]+)/ | ||
| 1590 | sprintf("sll\t$1,$2,%d",$big_endian ? eval($3) | ||
| 1591 | : eval("($3-16)&31"))/e; | ||
| 1592 | |||
| 1593 | s/srl\s+(\$[0-9]+),(\$[0-9]+),\-([0-9]+)/ | ||
| 1594 | sprintf("sll\t$1,$2,$3")/e or | ||
| 1595 | s/srl\s+(\$[0-9]+),(\$[0-9]+),0/ | ||
| 1596 | sprintf("and\t$1,$2,0xff")/e or | ||
| 1597 | s/(sll\s+\$[0-9]+,\$[0-9]+,0)/#$1/; | ||
| 1598 | } | ||
| 1599 | |||
| 1600 | # convert lwl/lwr and swr/swl to little-endian order (only when !$big_endian); NOTE(review): the greedy .* leaves just the final offset digit in $2, and & binds looser than + and -, so the whole sum is masked with 3 - confirm every offset used keeps that digit in 0..3 | ||
| 1601 | if (!$big_endian && /^\s+[sl]w[lr]\s+/) { | ||
| 1602 | s/([sl]wl.*)([0-9]+)\((\$[0-9]+)\)/ | ||
| 1603 | sprintf("$1%d($3)",eval("$2-$2%4+($2%4-1)&3"))/e or | ||
| 1604 | s/([sl]wr.*)([0-9]+)\((\$[0-9]+)\)/ | ||
| 1605 | sprintf("$1%d($3)",eval("$2-$2%4+($2%4+1)&3"))/e; | ||
| 1606 | } | ||
| 1607 | |||
| 1608 | print $_,"\n"; | ||
| 1609 | } | ||
| 1610 | |||
| 1611 | close STDOUT or die "error closing STDOUT: $!"; # write errors on buffered output are only reported when the handle is flushed at close | ||
