Home | History | Annotate | Download | only in asm
      1 #!/usr/bin/env perl
      2 
      3 # ====================================================================
      4 # Written by Andy Polyakov <appro (at] fy.chalmers.se> for the OpenSSL
      5 # project. The module is, however, dual licensed under OpenSSL and
      6 # CRYPTOGAMS licenses depending on where you obtain it. For further
      7 # details see http://www.openssl.org/~appro/cryptogams/.
      8 # ====================================================================
      9 
     10 # AES for PA-RISC.
     11 #
     12 # June 2009.
     13 #
     14 # The module is mechanical transliteration of aes-sparcv9.pl, but with
     15 # a twist: S-boxes are compressed even further down to 1K+256B. On
     16 # PA-7100LC performance is ~40% better than gcc 3.2 generated code and
     17 # is about 33 cycles per byte processed with 128-bit key. Newer CPUs
     18 # perform at 16 cycles per byte. It's not faster than code generated
     19 # by vendor compiler, but recall that it has compressed S-boxes, which
     20 # requires extra processing.
     21 #
     22 # Special thanks to polarhome.com for providing HP-UX account.
     23 
     24 $flavour = shift;
     25 $output = shift;
     26 open STDOUT,">$output";
     27 
     28 if ($flavour =~ /64/) {
     29 	$LEVEL		="2.0W";
     30 	$SIZE_T		=8;
     31 	$FRAME_MARKER	=80;
     32 	$SAVED_RP	=16;
     33 	$PUSH		="std";
     34 	$PUSHMA		="std,ma";
     35 	$POP		="ldd";
     36 	$POPMB		="ldd,mb";
     37 } else {
     38 	$LEVEL		="1.0";
     39 	$SIZE_T		=4;
     40 	$FRAME_MARKER	=48;
     41 	$SAVED_RP	=20;
     42 	$PUSH		="stw";
     43 	$PUSHMA		="stwm";
     44 	$POP		="ldw";
     45 	$POPMB		="ldwm";
     46 }
     47 
     48 $FRAME=16*$SIZE_T+$FRAME_MARKER;# 16 saved regs + frame marker
     49 				#                 [+ argument transfer]
     50 $inp="%r26";	# arg0
     51 $out="%r25";	# arg1
     52 $key="%r24";	# arg2
     53 
     54 ($s0,$s1,$s2,$s3) = ("%r1","%r2","%r3","%r4");
     55 ($t0,$t1,$t2,$t3) = ("%r5","%r6","%r7","%r8");
     56 
     57 ($acc0, $acc1, $acc2, $acc3, $acc4, $acc5, $acc6, $acc7,
     58  $acc8, $acc9,$acc10,$acc11,$acc12,$acc13,$acc14,$acc15) =
     59 ("%r9","%r10","%r11","%r12","%r13","%r14","%r15","%r16",
     60 "%r17","%r18","%r19","%r20","%r21","%r22","%r23","%r26");
     61 
     62 $tbl="%r28";
     63 $rounds="%r29";
     64 
     65 $code=<<___;
     66 	.LEVEL	$LEVEL
     67 	.SPACE	\$TEXT\$
     68 	.SUBSPA	\$CODE\$,QUAD=0,ALIGN=8,ACCESS=0x2C,CODE_ONLY
     69 
     70 	.EXPORT	AES_encrypt,ENTRY,ARGW0=GR,ARGW1=GR,ARGW2=GR
     71 	.ALIGN	64
     72 AES_encrypt
     73 	.PROC
     74 	.CALLINFO	FRAME=`$FRAME-16*$SIZE_T`,NO_CALLS,SAVE_RP,ENTRY_GR=18
     75 	.ENTRY
     76 	$PUSH	%r2,-$SAVED_RP(%sp)	; standard prologue
     77 	$PUSHMA	%r3,$FRAME(%sp)
     78 	$PUSH	%r4,`-$FRAME+1*$SIZE_T`(%sp)
     79 	$PUSH	%r5,`-$FRAME+2*$SIZE_T`(%sp)
     80 	$PUSH	%r6,`-$FRAME+3*$SIZE_T`(%sp)
     81 	$PUSH	%r7,`-$FRAME+4*$SIZE_T`(%sp)
     82 	$PUSH	%r8,`-$FRAME+5*$SIZE_T`(%sp)
     83 	$PUSH	%r9,`-$FRAME+6*$SIZE_T`(%sp)
     84 	$PUSH	%r10,`-$FRAME+7*$SIZE_T`(%sp)
     85 	$PUSH	%r11,`-$FRAME+8*$SIZE_T`(%sp)
     86 	$PUSH	%r12,`-$FRAME+9*$SIZE_T`(%sp)
     87 	$PUSH	%r13,`-$FRAME+10*$SIZE_T`(%sp)
     88 	$PUSH	%r14,`-$FRAME+11*$SIZE_T`(%sp)
     89 	$PUSH	%r15,`-$FRAME+12*$SIZE_T`(%sp)
     90 	$PUSH	%r16,`-$FRAME+13*$SIZE_T`(%sp)
     91 	$PUSH	%r17,`-$FRAME+14*$SIZE_T`(%sp)
     92 	$PUSH	%r18,`-$FRAME+15*$SIZE_T`(%sp)
     93 
     94 	blr	%r0,$tbl
     95 	ldi	3,$t0
     96 L\$enc_pic
     97 	andcm	$tbl,$t0,$tbl
     98 	ldo	L\$AES_Te-L\$enc_pic($tbl),$tbl
     99 
    100 	and	$inp,$t0,$t0
    101 	sub	$inp,$t0,$inp
    102 	ldw	0($inp),$s0
    103 	ldw	4($inp),$s1
    104 	ldw	8($inp),$s2
    105 	comib,=	0,$t0,L\$enc_inp_aligned
    106 	ldw	12($inp),$s3
    107 
    108 	sh3addl	$t0,%r0,$t0
    109 	subi	32,$t0,$t0
    110 	mtctl	$t0,%cr11
    111 	ldw	16($inp),$t1
    112 	vshd	$s0,$s1,$s0
    113 	vshd	$s1,$s2,$s1
    114 	vshd	$s2,$s3,$s2
    115 	vshd	$s3,$t1,$s3
    116 
    117 L\$enc_inp_aligned
    118 	bl	_parisc_AES_encrypt,%r31
    119 	nop
    120 
    121 	extru,<> $out,31,2,%r0
    122 	b	L\$enc_out_aligned
    123 	nop
    124 
    125 	_srm	$s0,24,$acc0
    126 	_srm	$s0,16,$acc1
    127 	stb	$acc0,0($out)
    128 	_srm	$s0,8,$acc2
    129 	stb	$acc1,1($out)
    130 	_srm	$s1,24,$acc4
    131 	stb	$acc2,2($out)
    132 	_srm	$s1,16,$acc5
    133 	stb	$s0,3($out)
    134 	_srm	$s1,8,$acc6
    135 	stb	$acc4,4($out)
    136 	_srm	$s2,24,$acc0
    137 	stb	$acc5,5($out)
    138 	_srm	$s2,16,$acc1
    139 	stb	$acc6,6($out)
    140 	_srm	$s2,8,$acc2
    141 	stb	$s1,7($out)
    142 	_srm	$s3,24,$acc4
    143 	stb	$acc0,8($out)
    144 	_srm	$s3,16,$acc5
    145 	stb	$acc1,9($out)
    146 	_srm	$s3,8,$acc6
    147 	stb	$acc2,10($out)
    148 	stb	$s2,11($out)
    149 	stb	$acc4,12($out)
    150 	stb	$acc5,13($out)
    151 	stb	$acc6,14($out)
    152 	b	L\$enc_done
    153 	stb	$s3,15($out)
    154 
    155 L\$enc_out_aligned
    156 	stw	$s0,0($out)
    157 	stw	$s1,4($out)
    158 	stw	$s2,8($out)
    159 	stw	$s3,12($out)
    160 
    161 L\$enc_done
    162 	$POP	`-$FRAME-$SAVED_RP`(%sp),%r2	; standard epilogue
    163 	$POP	`-$FRAME+1*$SIZE_T`(%sp),%r4
    164 	$POP	`-$FRAME+2*$SIZE_T`(%sp),%r5
    165 	$POP	`-$FRAME+3*$SIZE_T`(%sp),%r6
    166 	$POP	`-$FRAME+4*$SIZE_T`(%sp),%r7
    167 	$POP	`-$FRAME+5*$SIZE_T`(%sp),%r8
    168 	$POP	`-$FRAME+6*$SIZE_T`(%sp),%r9
    169 	$POP	`-$FRAME+7*$SIZE_T`(%sp),%r10
    170 	$POP	`-$FRAME+8*$SIZE_T`(%sp),%r11
    171 	$POP	`-$FRAME+9*$SIZE_T`(%sp),%r12
    172 	$POP	`-$FRAME+10*$SIZE_T`(%sp),%r13
    173 	$POP	`-$FRAME+11*$SIZE_T`(%sp),%r14
    174 	$POP	`-$FRAME+12*$SIZE_T`(%sp),%r15
    175 	$POP	`-$FRAME+13*$SIZE_T`(%sp),%r16
    176 	$POP	`-$FRAME+14*$SIZE_T`(%sp),%r17
    177 	$POP	`-$FRAME+15*$SIZE_T`(%sp),%r18
    178 	bv	(%r2)
    179 	.EXIT
    180 	$POPMB	-$FRAME(%sp),%r3
    181 	.PROCEND
    182 
    183 	.ALIGN	16
    184 _parisc_AES_encrypt
    185 	.PROC
    186 	.CALLINFO	MILLICODE
    187 	.ENTRY
    188 	ldw	240($key),$rounds
    189 	ldw	0($key),$t0
    190 	ldw	4($key),$t1
    191 	ldw	8($key),$t2
    192 	_srm	$rounds,1,$rounds
    193 	xor	$t0,$s0,$s0
    194 	ldw	12($key),$t3
    195 	_srm	$s0,24,$acc0
    196 	xor	$t1,$s1,$s1
    197 	ldw	16($key),$t0
    198 	_srm	$s1,16,$acc1
    199 	xor	$t2,$s2,$s2
    200 	ldw	20($key),$t1
    201 	xor	$t3,$s3,$s3
    202 	ldw	24($key),$t2
    203 	ldw	28($key),$t3
    204 L\$enc_loop
    205 	_srm	$s2,8,$acc2
    206 	ldwx,s	$acc0($tbl),$acc0
    207 	_srm	$s3,0,$acc3
    208 	ldwx,s	$acc1($tbl),$acc1
    209 	_srm	$s1,24,$acc4
    210 	ldwx,s	$acc2($tbl),$acc2
    211 	_srm	$s2,16,$acc5
    212 	ldwx,s	$acc3($tbl),$acc3
    213 	_srm	$s3,8,$acc6
    214 	ldwx,s	$acc4($tbl),$acc4
    215 	_srm	$s0,0,$acc7
    216 	ldwx,s	$acc5($tbl),$acc5
    217 	_srm	$s2,24,$acc8
    218 	ldwx,s	$acc6($tbl),$acc6
    219 	_srm	$s3,16,$acc9
    220 	ldwx,s	$acc7($tbl),$acc7
    221 	_srm	$s0,8,$acc10
    222 	ldwx,s	$acc8($tbl),$acc8
    223 	_srm	$s1,0,$acc11
    224 	ldwx,s	$acc9($tbl),$acc9
    225 	_srm	$s3,24,$acc12
    226 	ldwx,s	$acc10($tbl),$acc10
    227 	_srm	$s0,16,$acc13
    228 	ldwx,s	$acc11($tbl),$acc11
    229 	_srm	$s1,8,$acc14
    230 	ldwx,s	$acc12($tbl),$acc12
    231 	_srm	$s2,0,$acc15
    232 	ldwx,s	$acc13($tbl),$acc13
    233 	ldwx,s	$acc14($tbl),$acc14
    234 	ldwx,s	$acc15($tbl),$acc15
    235 	addib,= -1,$rounds,L\$enc_last
    236 	ldo	32($key),$key
    237 
    238 		_ror	$acc1,8,$acc1
    239 		xor	$acc0,$t0,$t0
    240 	ldw	0($key),$s0
    241 		_ror	$acc2,16,$acc2
    242 		xor	$acc1,$t0,$t0
    243 	ldw	4($key),$s1
    244 		_ror	$acc3,24,$acc3
    245 		xor	$acc2,$t0,$t0
    246 	ldw	8($key),$s2
    247 		_ror	$acc5,8,$acc5
    248 		xor	$acc3,$t0,$t0
    249 	ldw	12($key),$s3
    250 		_ror	$acc6,16,$acc6
    251 		xor	$acc4,$t1,$t1
    252 		_ror	$acc7,24,$acc7
    253 		xor	$acc5,$t1,$t1
    254 		_ror	$acc9,8,$acc9
    255 		xor	$acc6,$t1,$t1
    256 		_ror	$acc10,16,$acc10
    257 		xor	$acc7,$t1,$t1
    258 		_ror	$acc11,24,$acc11
    259 		xor	$acc8,$t2,$t2
    260 		_ror	$acc13,8,$acc13
    261 		xor	$acc9,$t2,$t2
    262 		_ror	$acc14,16,$acc14
    263 		xor	$acc10,$t2,$t2
    264 		_ror	$acc15,24,$acc15
    265 		xor	$acc11,$t2,$t2
    266 		xor	$acc12,$acc14,$acc14
    267 		xor	$acc13,$t3,$t3
    268 	_srm	$t0,24,$acc0
    269 		xor	$acc14,$t3,$t3
    270 	_srm	$t1,16,$acc1
    271 		xor	$acc15,$t3,$t3
    272 
    273 	_srm	$t2,8,$acc2
    274 	ldwx,s	$acc0($tbl),$acc0
    275 	_srm	$t3,0,$acc3
    276 	ldwx,s	$acc1($tbl),$acc1
    277 	_srm	$t1,24,$acc4
    278 	ldwx,s	$acc2($tbl),$acc2
    279 	_srm	$t2,16,$acc5
    280 	ldwx,s	$acc3($tbl),$acc3
    281 	_srm	$t3,8,$acc6
    282 	ldwx,s	$acc4($tbl),$acc4
    283 	_srm	$t0,0,$acc7
    284 	ldwx,s	$acc5($tbl),$acc5
    285 	_srm	$t2,24,$acc8
    286 	ldwx,s	$acc6($tbl),$acc6
    287 	_srm	$t3,16,$acc9
    288 	ldwx,s	$acc7($tbl),$acc7
    289 	_srm	$t0,8,$acc10
    290 	ldwx,s	$acc8($tbl),$acc8
    291 	_srm	$t1,0,$acc11
    292 	ldwx,s	$acc9($tbl),$acc9
    293 	_srm	$t3,24,$acc12
    294 	ldwx,s	$acc10($tbl),$acc10
    295 	_srm	$t0,16,$acc13
    296 	ldwx,s	$acc11($tbl),$acc11
    297 	_srm	$t1,8,$acc14
    298 	ldwx,s	$acc12($tbl),$acc12
    299 	_srm	$t2,0,$acc15
    300 	ldwx,s	$acc13($tbl),$acc13
    301 		_ror	$acc1,8,$acc1
    302 	ldwx,s	$acc14($tbl),$acc14
    303 
    304 		_ror	$acc2,16,$acc2
    305 		xor	$acc0,$s0,$s0
    306 	ldwx,s	$acc15($tbl),$acc15
    307 		_ror	$acc3,24,$acc3
    308 		xor	$acc1,$s0,$s0
    309 	ldw	16($key),$t0
    310 		_ror	$acc5,8,$acc5
    311 		xor	$acc2,$s0,$s0
    312 	ldw	20($key),$t1
    313 		_ror	$acc6,16,$acc6
    314 		xor	$acc3,$s0,$s0
    315 	ldw	24($key),$t2
    316 		_ror	$acc7,24,$acc7
    317 		xor	$acc4,$s1,$s1
    318 	ldw	28($key),$t3
    319 		_ror	$acc9,8,$acc9
    320 		xor	$acc5,$s1,$s1
    321 	ldw	1024+0($tbl),%r0		; prefetch te4
    322 		_ror	$acc10,16,$acc10
    323 		xor	$acc6,$s1,$s1
    324 	ldw	1024+32($tbl),%r0		; prefetch te4
    325 		_ror	$acc11,24,$acc11
    326 		xor	$acc7,$s1,$s1
    327 	ldw	1024+64($tbl),%r0		; prefetch te4
    328 		_ror	$acc13,8,$acc13
    329 		xor	$acc8,$s2,$s2
    330 	ldw	1024+96($tbl),%r0		; prefetch te4
    331 		_ror	$acc14,16,$acc14
    332 		xor	$acc9,$s2,$s2
    333 	ldw	1024+128($tbl),%r0		; prefetch te4
    334 		_ror	$acc15,24,$acc15
    335 		xor	$acc10,$s2,$s2
    336 	ldw	1024+160($tbl),%r0		; prefetch te4
    337 	_srm	$s0,24,$acc0
    338 		xor	$acc11,$s2,$s2
    339 	ldw	1024+192($tbl),%r0		; prefetch te4
    340 		xor	$acc12,$acc14,$acc14
    341 		xor	$acc13,$s3,$s3
    342 	ldw	1024+224($tbl),%r0		; prefetch te4
    343 	_srm	$s1,16,$acc1
    344 		xor	$acc14,$s3,$s3
    345 	b	L\$enc_loop
    346 		xor	$acc15,$s3,$s3
    347 
    348 	.ALIGN	16
    349 L\$enc_last
    350 	ldo	1024($tbl),$rounds
    351 		_ror	$acc1,8,$acc1
    352 		xor	$acc0,$t0,$t0
    353 	ldw	0($key),$s0
    354 		_ror	$acc2,16,$acc2
    355 		xor	$acc1,$t0,$t0
    356 	ldw	4($key),$s1
    357 		_ror	$acc3,24,$acc3
    358 		xor	$acc2,$t0,$t0
    359 	ldw	8($key),$s2
    360 		_ror	$acc5,8,$acc5
    361 		xor	$acc3,$t0,$t0
    362 	ldw	12($key),$s3
    363 		_ror	$acc6,16,$acc6
    364 		xor	$acc4,$t1,$t1
    365 		_ror	$acc7,24,$acc7
    366 		xor	$acc5,$t1,$t1
    367 		_ror	$acc9,8,$acc9
    368 		xor	$acc6,$t1,$t1
    369 		_ror	$acc10,16,$acc10
    370 		xor	$acc7,$t1,$t1
    371 		_ror	$acc11,24,$acc11
    372 		xor	$acc8,$t2,$t2
    373 		_ror	$acc13,8,$acc13
    374 		xor	$acc9,$t2,$t2
    375 		_ror	$acc14,16,$acc14
    376 		xor	$acc10,$t2,$t2
    377 		_ror	$acc15,24,$acc15
    378 		xor	$acc11,$t2,$t2
    379 		xor	$acc12,$acc14,$acc14
    380 		xor	$acc13,$t3,$t3
    381 	_srm	$t0,24,$acc0
    382 		xor	$acc14,$t3,$t3
    383 	_srm	$t1,16,$acc1
    384 		xor	$acc15,$t3,$t3
    385 
    386 	_srm	$t2,8,$acc2
    387 	ldbx	$acc0($rounds),$acc0
    388 	_srm	$t1,24,$acc4
    389 	ldbx	$acc1($rounds),$acc1
    390 	_srm	$t2,16,$acc5
    391 	_srm	$t3,0,$acc3
    392 	ldbx	$acc2($rounds),$acc2
    393 	ldbx	$acc3($rounds),$acc3
    394 	_srm	$t3,8,$acc6
    395 	ldbx	$acc4($rounds),$acc4
    396 	_srm	$t2,24,$acc8
    397 	ldbx	$acc5($rounds),$acc5
    398 	_srm	$t3,16,$acc9
    399 	_srm	$t0,0,$acc7
    400 	ldbx	$acc6($rounds),$acc6
    401 	ldbx	$acc7($rounds),$acc7
    402 	_srm	$t0,8,$acc10
    403 	ldbx	$acc8($rounds),$acc8
    404 	_srm	$t3,24,$acc12
    405 	ldbx	$acc9($rounds),$acc9
    406 	_srm	$t0,16,$acc13
    407 	_srm	$t1,0,$acc11
    408 	ldbx	$acc10($rounds),$acc10
    409 	_srm	$t1,8,$acc14
    410 	ldbx	$acc11($rounds),$acc11
    411 	ldbx	$acc12($rounds),$acc12
    412 	ldbx	$acc13($rounds),$acc13
    413 	_srm	$t2,0,$acc15
    414 	ldbx	$acc14($rounds),$acc14
    415 
    416 		dep	$acc0,7,8,$acc3
    417 	ldbx	$acc15($rounds),$acc15
    418 		dep	$acc4,7,8,$acc7
    419 		dep	$acc1,15,8,$acc3
    420 		dep	$acc5,15,8,$acc7
    421 		dep	$acc2,23,8,$acc3
    422 		dep	$acc6,23,8,$acc7
    423 		xor	$acc3,$s0,$s0
    424 		xor	$acc7,$s1,$s1
    425 		dep	$acc8,7,8,$acc11
    426 		dep	$acc12,7,8,$acc15
    427 		dep	$acc9,15,8,$acc11
    428 		dep	$acc13,15,8,$acc15
    429 		dep	$acc10,23,8,$acc11
    430 		dep	$acc14,23,8,$acc15
    431 		xor	$acc11,$s2,$s2
    432 
    433 	bv	(%r31)
    434 	.EXIT
    435 		xor	$acc15,$s3,$s3
    436 	.PROCEND
    437 
    438 	.ALIGN	64
    439 L\$AES_Te
    440 	.WORD	0xc66363a5, 0xf87c7c84, 0xee777799, 0xf67b7b8d
    441 	.WORD	0xfff2f20d, 0xd66b6bbd, 0xde6f6fb1, 0x91c5c554
    442 	.WORD	0x60303050, 0x02010103, 0xce6767a9, 0x562b2b7d
    443 	.WORD	0xe7fefe19, 0xb5d7d762, 0x4dababe6, 0xec76769a
    444 	.WORD	0x8fcaca45, 0x1f82829d, 0x89c9c940, 0xfa7d7d87
    445 	.WORD	0xeffafa15, 0xb25959eb, 0x8e4747c9, 0xfbf0f00b
    446 	.WORD	0x41adadec, 0xb3d4d467, 0x5fa2a2fd, 0x45afafea
    447 	.WORD	0x239c9cbf, 0x53a4a4f7, 0xe4727296, 0x9bc0c05b
    448 	.WORD	0x75b7b7c2, 0xe1fdfd1c, 0x3d9393ae, 0x4c26266a
    449 	.WORD	0x6c36365a, 0x7e3f3f41, 0xf5f7f702, 0x83cccc4f
    450 	.WORD	0x6834345c, 0x51a5a5f4, 0xd1e5e534, 0xf9f1f108
    451 	.WORD	0xe2717193, 0xabd8d873, 0x62313153, 0x2a15153f
    452 	.WORD	0x0804040c, 0x95c7c752, 0x46232365, 0x9dc3c35e
    453 	.WORD	0x30181828, 0x379696a1, 0x0a05050f, 0x2f9a9ab5
    454 	.WORD	0x0e070709, 0x24121236, 0x1b80809b, 0xdfe2e23d
    455 	.WORD	0xcdebeb26, 0x4e272769, 0x7fb2b2cd, 0xea75759f
    456 	.WORD	0x1209091b, 0x1d83839e, 0x582c2c74, 0x341a1a2e
    457 	.WORD	0x361b1b2d, 0xdc6e6eb2, 0xb45a5aee, 0x5ba0a0fb
    458 	.WORD	0xa45252f6, 0x763b3b4d, 0xb7d6d661, 0x7db3b3ce
    459 	.WORD	0x5229297b, 0xdde3e33e, 0x5e2f2f71, 0x13848497
    460 	.WORD	0xa65353f5, 0xb9d1d168, 0x00000000, 0xc1eded2c
    461 	.WORD	0x40202060, 0xe3fcfc1f, 0x79b1b1c8, 0xb65b5bed
    462 	.WORD	0xd46a6abe, 0x8dcbcb46, 0x67bebed9, 0x7239394b
    463 	.WORD	0x944a4ade, 0x984c4cd4, 0xb05858e8, 0x85cfcf4a
    464 	.WORD	0xbbd0d06b, 0xc5efef2a, 0x4faaaae5, 0xedfbfb16
    465 	.WORD	0x864343c5, 0x9a4d4dd7, 0x66333355, 0x11858594
    466 	.WORD	0x8a4545cf, 0xe9f9f910, 0x04020206, 0xfe7f7f81
    467 	.WORD	0xa05050f0, 0x783c3c44, 0x259f9fba, 0x4ba8a8e3
    468 	.WORD	0xa25151f3, 0x5da3a3fe, 0x804040c0, 0x058f8f8a
    469 	.WORD	0x3f9292ad, 0x219d9dbc, 0x70383848, 0xf1f5f504
    470 	.WORD	0x63bcbcdf, 0x77b6b6c1, 0xafdada75, 0x42212163
    471 	.WORD	0x20101030, 0xe5ffff1a, 0xfdf3f30e, 0xbfd2d26d
    472 	.WORD	0x81cdcd4c, 0x180c0c14, 0x26131335, 0xc3ecec2f
    473 	.WORD	0xbe5f5fe1, 0x359797a2, 0x884444cc, 0x2e171739
    474 	.WORD	0x93c4c457, 0x55a7a7f2, 0xfc7e7e82, 0x7a3d3d47
    475 	.WORD	0xc86464ac, 0xba5d5de7, 0x3219192b, 0xe6737395
    476 	.WORD	0xc06060a0, 0x19818198, 0x9e4f4fd1, 0xa3dcdc7f
    477 	.WORD	0x44222266, 0x542a2a7e, 0x3b9090ab, 0x0b888883
    478 	.WORD	0x8c4646ca, 0xc7eeee29, 0x6bb8b8d3, 0x2814143c
    479 	.WORD	0xa7dede79, 0xbc5e5ee2, 0x160b0b1d, 0xaddbdb76
    480 	.WORD	0xdbe0e03b, 0x64323256, 0x743a3a4e, 0x140a0a1e
    481 	.WORD	0x924949db, 0x0c06060a, 0x4824246c, 0xb85c5ce4
    482 	.WORD	0x9fc2c25d, 0xbdd3d36e, 0x43acacef, 0xc46262a6
    483 	.WORD	0x399191a8, 0x319595a4, 0xd3e4e437, 0xf279798b
    484 	.WORD	0xd5e7e732, 0x8bc8c843, 0x6e373759, 0xda6d6db7
    485 	.WORD	0x018d8d8c, 0xb1d5d564, 0x9c4e4ed2, 0x49a9a9e0
    486 	.WORD	0xd86c6cb4, 0xac5656fa, 0xf3f4f407, 0xcfeaea25
    487 	.WORD	0xca6565af, 0xf47a7a8e, 0x47aeaee9, 0x10080818
    488 	.WORD	0x6fbabad5, 0xf0787888, 0x4a25256f, 0x5c2e2e72
    489 	.WORD	0x381c1c24, 0x57a6a6f1, 0x73b4b4c7, 0x97c6c651
    490 	.WORD	0xcbe8e823, 0xa1dddd7c, 0xe874749c, 0x3e1f1f21
    491 	.WORD	0x964b4bdd, 0x61bdbddc, 0x0d8b8b86, 0x0f8a8a85
    492 	.WORD	0xe0707090, 0x7c3e3e42, 0x71b5b5c4, 0xcc6666aa
    493 	.WORD	0x904848d8, 0x06030305, 0xf7f6f601, 0x1c0e0e12
    494 	.WORD	0xc26161a3, 0x6a35355f, 0xae5757f9, 0x69b9b9d0
    495 	.WORD	0x17868691, 0x99c1c158, 0x3a1d1d27, 0x279e9eb9
    496 	.WORD	0xd9e1e138, 0xebf8f813, 0x2b9898b3, 0x22111133
    497 	.WORD	0xd26969bb, 0xa9d9d970, 0x078e8e89, 0x339494a7
    498 	.WORD	0x2d9b9bb6, 0x3c1e1e22, 0x15878792, 0xc9e9e920
    499 	.WORD	0x87cece49, 0xaa5555ff, 0x50282878, 0xa5dfdf7a
    500 	.WORD	0x038c8c8f, 0x59a1a1f8, 0x09898980, 0x1a0d0d17
    501 	.WORD	0x65bfbfda, 0xd7e6e631, 0x844242c6, 0xd06868b8
    502 	.WORD	0x824141c3, 0x299999b0, 0x5a2d2d77, 0x1e0f0f11
    503 	.WORD	0x7bb0b0cb, 0xa85454fc, 0x6dbbbbd6, 0x2c16163a
    504 	.BYTE	0x63, 0x7c, 0x77, 0x7b, 0xf2, 0x6b, 0x6f, 0xc5
    505 	.BYTE	0x30, 0x01, 0x67, 0x2b, 0xfe, 0xd7, 0xab, 0x76
    506 	.BYTE	0xca, 0x82, 0xc9, 0x7d, 0xfa, 0x59, 0x47, 0xf0
    507 	.BYTE	0xad, 0xd4, 0xa2, 0xaf, 0x9c, 0xa4, 0x72, 0xc0
    508 	.BYTE	0xb7, 0xfd, 0x93, 0x26, 0x36, 0x3f, 0xf7, 0xcc
    509 	.BYTE	0x34, 0xa5, 0xe5, 0xf1, 0x71, 0xd8, 0x31, 0x15
    510 	.BYTE	0x04, 0xc7, 0x23, 0xc3, 0x18, 0x96, 0x05, 0x9a
    511 	.BYTE	0x07, 0x12, 0x80, 0xe2, 0xeb, 0x27, 0xb2, 0x75
    512 	.BYTE	0x09, 0x83, 0x2c, 0x1a, 0x1b, 0x6e, 0x5a, 0xa0
    513 	.BYTE	0x52, 0x3b, 0xd6, 0xb3, 0x29, 0xe3, 0x2f, 0x84
    514 	.BYTE	0x53, 0xd1, 0x00, 0xed, 0x20, 0xfc, 0xb1, 0x5b
    515 	.BYTE	0x6a, 0xcb, 0xbe, 0x39, 0x4a, 0x4c, 0x58, 0xcf
    516 	.BYTE	0xd0, 0xef, 0xaa, 0xfb, 0x43, 0x4d, 0x33, 0x85
    517 	.BYTE	0x45, 0xf9, 0x02, 0x7f, 0x50, 0x3c, 0x9f, 0xa8
    518 	.BYTE	0x51, 0xa3, 0x40, 0x8f, 0x92, 0x9d, 0x38, 0xf5
    519 	.BYTE	0xbc, 0xb6, 0xda, 0x21, 0x10, 0xff, 0xf3, 0xd2
    520 	.BYTE	0xcd, 0x0c, 0x13, 0xec, 0x5f, 0x97, 0x44, 0x17
    521 	.BYTE	0xc4, 0xa7, 0x7e, 0x3d, 0x64, 0x5d, 0x19, 0x73
    522 	.BYTE	0x60, 0x81, 0x4f, 0xdc, 0x22, 0x2a, 0x90, 0x88
    523 	.BYTE	0x46, 0xee, 0xb8, 0x14, 0xde, 0x5e, 0x0b, 0xdb
    524 	.BYTE	0xe0, 0x32, 0x3a, 0x0a, 0x49, 0x06, 0x24, 0x5c
    525 	.BYTE	0xc2, 0xd3, 0xac, 0x62, 0x91, 0x95, 0xe4, 0x79
    526 	.BYTE	0xe7, 0xc8, 0x37, 0x6d, 0x8d, 0xd5, 0x4e, 0xa9
    527 	.BYTE	0x6c, 0x56, 0xf4, 0xea, 0x65, 0x7a, 0xae, 0x08
    528 	.BYTE	0xba, 0x78, 0x25, 0x2e, 0x1c, 0xa6, 0xb4, 0xc6
    529 	.BYTE	0xe8, 0xdd, 0x74, 0x1f, 0x4b, 0xbd, 0x8b, 0x8a
    530 	.BYTE	0x70, 0x3e, 0xb5, 0x66, 0x48, 0x03, 0xf6, 0x0e
    531 	.BYTE	0x61, 0x35, 0x57, 0xb9, 0x86, 0xc1, 0x1d, 0x9e
    532 	.BYTE	0xe1, 0xf8, 0x98, 0x11, 0x69, 0xd9, 0x8e, 0x94
    533 	.BYTE	0x9b, 0x1e, 0x87, 0xe9, 0xce, 0x55, 0x28, 0xdf
    534 	.BYTE	0x8c, 0xa1, 0x89, 0x0d, 0xbf, 0xe6, 0x42, 0x68
    535 	.BYTE	0x41, 0x99, 0x2d, 0x0f, 0xb0, 0x54, 0xbb, 0x16
    536 ___
    537 
    538 $code.=<<___;
    539 	.EXPORT	AES_decrypt,ENTRY,ARGW0=GR,ARGW1=GR,ARGW2=GR
    540 	.ALIGN	16
    541 AES_decrypt
    542 	.PROC
    543 	.CALLINFO	FRAME=`$FRAME-16*$SIZE_T`,NO_CALLS,SAVE_RP,ENTRY_GR=18
    544 	.ENTRY
    545 	$PUSH	%r2,-$SAVED_RP(%sp)	; standard prologue
    546 	$PUSHMA	%r3,$FRAME(%sp)
    547 	$PUSH	%r4,`-$FRAME+1*$SIZE_T`(%sp)
    548 	$PUSH	%r5,`-$FRAME+2*$SIZE_T`(%sp)
    549 	$PUSH	%r6,`-$FRAME+3*$SIZE_T`(%sp)
    550 	$PUSH	%r7,`-$FRAME+4*$SIZE_T`(%sp)
    551 	$PUSH	%r8,`-$FRAME+5*$SIZE_T`(%sp)
    552 	$PUSH	%r9,`-$FRAME+6*$SIZE_T`(%sp)
    553 	$PUSH	%r10,`-$FRAME+7*$SIZE_T`(%sp)
    554 	$PUSH	%r11,`-$FRAME+8*$SIZE_T`(%sp)
    555 	$PUSH	%r12,`-$FRAME+9*$SIZE_T`(%sp)
    556 	$PUSH	%r13,`-$FRAME+10*$SIZE_T`(%sp)
    557 	$PUSH	%r14,`-$FRAME+11*$SIZE_T`(%sp)
    558 	$PUSH	%r15,`-$FRAME+12*$SIZE_T`(%sp)
    559 	$PUSH	%r16,`-$FRAME+13*$SIZE_T`(%sp)
    560 	$PUSH	%r17,`-$FRAME+14*$SIZE_T`(%sp)
    561 	$PUSH	%r18,`-$FRAME+15*$SIZE_T`(%sp)
    562 
    563 	blr	%r0,$tbl
    564 	ldi	3,$t0
    565 L\$dec_pic
    566 	andcm	$tbl,$t0,$tbl
    567 	ldo	L\$AES_Td-L\$dec_pic($tbl),$tbl
    568 
    569 	and	$inp,$t0,$t0
    570 	sub	$inp,$t0,$inp
    571 	ldw	0($inp),$s0
    572 	ldw	4($inp),$s1
    573 	ldw	8($inp),$s2
    574 	comib,=	0,$t0,L\$dec_inp_aligned
    575 	ldw	12($inp),$s3
    576 
    577 	sh3addl	$t0,%r0,$t0
    578 	subi	32,$t0,$t0
    579 	mtctl	$t0,%cr11
    580 	ldw	16($inp),$t1
    581 	vshd	$s0,$s1,$s0
    582 	vshd	$s1,$s2,$s1
    583 	vshd	$s2,$s3,$s2
    584 	vshd	$s3,$t1,$s3
    585 
    586 L\$dec_inp_aligned
    587 	bl	_parisc_AES_decrypt,%r31
    588 	nop
    589 
    590 	extru,<> $out,31,2,%r0
    591 	b	L\$dec_out_aligned
    592 	nop
    593 
    594 	_srm	$s0,24,$acc0
    595 	_srm	$s0,16,$acc1
    596 	stb	$acc0,0($out)
    597 	_srm	$s0,8,$acc2
    598 	stb	$acc1,1($out)
    599 	_srm	$s1,24,$acc4
    600 	stb	$acc2,2($out)
    601 	_srm	$s1,16,$acc5
    602 	stb	$s0,3($out)
    603 	_srm	$s1,8,$acc6
    604 	stb	$acc4,4($out)
    605 	_srm	$s2,24,$acc0
    606 	stb	$acc5,5($out)
    607 	_srm	$s2,16,$acc1
    608 	stb	$acc6,6($out)
    609 	_srm	$s2,8,$acc2
    610 	stb	$s1,7($out)
    611 	_srm	$s3,24,$acc4
    612 	stb	$acc0,8($out)
    613 	_srm	$s3,16,$acc5
    614 	stb	$acc1,9($out)
    615 	_srm	$s3,8,$acc6
    616 	stb	$acc2,10($out)
    617 	stb	$s2,11($out)
    618 	stb	$acc4,12($out)
    619 	stb	$acc5,13($out)
    620 	stb	$acc6,14($out)
    621 	b	L\$dec_done
    622 	stb	$s3,15($out)
    623 
    624 L\$dec_out_aligned
    625 	stw	$s0,0($out)
    626 	stw	$s1,4($out)
    627 	stw	$s2,8($out)
    628 	stw	$s3,12($out)
    629 
    630 L\$dec_done
    631 	$POP	`-$FRAME-$SAVED_RP`(%sp),%r2	; standard epilogue
    632 	$POP	`-$FRAME+1*$SIZE_T`(%sp),%r4
    633 	$POP	`-$FRAME+2*$SIZE_T`(%sp),%r5
    634 	$POP	`-$FRAME+3*$SIZE_T`(%sp),%r6
    635 	$POP	`-$FRAME+4*$SIZE_T`(%sp),%r7
    636 	$POP	`-$FRAME+5*$SIZE_T`(%sp),%r8
    637 	$POP	`-$FRAME+6*$SIZE_T`(%sp),%r9
    638 	$POP	`-$FRAME+7*$SIZE_T`(%sp),%r10
    639 	$POP	`-$FRAME+8*$SIZE_T`(%sp),%r11
    640 	$POP	`-$FRAME+9*$SIZE_T`(%sp),%r12
    641 	$POP	`-$FRAME+10*$SIZE_T`(%sp),%r13
    642 	$POP	`-$FRAME+11*$SIZE_T`(%sp),%r14
    643 	$POP	`-$FRAME+12*$SIZE_T`(%sp),%r15
    644 	$POP	`-$FRAME+13*$SIZE_T`(%sp),%r16
    645 	$POP	`-$FRAME+14*$SIZE_T`(%sp),%r17
    646 	$POP	`-$FRAME+15*$SIZE_T`(%sp),%r18
    647 	bv	(%r2)
    648 	.EXIT
    649 	$POPMB	-$FRAME(%sp),%r3
    650 	.PROCEND
    651 
    652 	.ALIGN	16
    653 _parisc_AES_decrypt
    654 	.PROC
    655 	.CALLINFO	MILLICODE
    656 	.ENTRY
    657 	ldw	240($key),$rounds
    658 	ldw	0($key),$t0
    659 	ldw	4($key),$t1
    660 	ldw	8($key),$t2
    661 	ldw	12($key),$t3
    662 	_srm	$rounds,1,$rounds
    663 	xor	$t0,$s0,$s0
    664 	ldw	16($key),$t0
    665 	xor	$t1,$s1,$s1
    666 	ldw	20($key),$t1
    667 	_srm	$s0,24,$acc0
    668 	xor	$t2,$s2,$s2
    669 	ldw	24($key),$t2
    670 	xor	$t3,$s3,$s3
    671 	ldw	28($key),$t3
    672 	_srm	$s3,16,$acc1
    673 L\$dec_loop
    674 	_srm	$s2,8,$acc2
    675 	ldwx,s	$acc0($tbl),$acc0
    676 	_srm	$s1,0,$acc3
    677 	ldwx,s	$acc1($tbl),$acc1
    678 	_srm	$s1,24,$acc4
    679 	ldwx,s	$acc2($tbl),$acc2
    680 	_srm	$s0,16,$acc5
    681 	ldwx,s	$acc3($tbl),$acc3
    682 	_srm	$s3,8,$acc6
    683 	ldwx,s	$acc4($tbl),$acc4
    684 	_srm	$s2,0,$acc7
    685 	ldwx,s	$acc5($tbl),$acc5
    686 	_srm	$s2,24,$acc8
    687 	ldwx,s	$acc6($tbl),$acc6
    688 	_srm	$s1,16,$acc9
    689 	ldwx,s	$acc7($tbl),$acc7
    690 	_srm	$s0,8,$acc10
    691 	ldwx,s	$acc8($tbl),$acc8
    692 	_srm	$s3,0,$acc11
    693 	ldwx,s	$acc9($tbl),$acc9
    694 	_srm	$s3,24,$acc12
    695 	ldwx,s	$acc10($tbl),$acc10
    696 	_srm	$s2,16,$acc13
    697 	ldwx,s	$acc11($tbl),$acc11
    698 	_srm	$s1,8,$acc14
    699 	ldwx,s	$acc12($tbl),$acc12
    700 	_srm	$s0,0,$acc15
    701 	ldwx,s	$acc13($tbl),$acc13
    702 	ldwx,s	$acc14($tbl),$acc14
    703 	ldwx,s	$acc15($tbl),$acc15
    704 	addib,= -1,$rounds,L\$dec_last
    705 	ldo	32($key),$key
    706 
    707 		_ror	$acc1,8,$acc1
    708 		xor	$acc0,$t0,$t0
    709 	ldw	0($key),$s0
    710 		_ror	$acc2,16,$acc2
    711 		xor	$acc1,$t0,$t0
    712 	ldw	4($key),$s1
    713 		_ror	$acc3,24,$acc3
    714 		xor	$acc2,$t0,$t0
    715 	ldw	8($key),$s2
    716 		_ror	$acc5,8,$acc5
    717 		xor	$acc3,$t0,$t0
    718 	ldw	12($key),$s3
    719 		_ror	$acc6,16,$acc6
    720 		xor	$acc4,$t1,$t1
    721 		_ror	$acc7,24,$acc7
    722 		xor	$acc5,$t1,$t1
    723 		_ror	$acc9,8,$acc9
    724 		xor	$acc6,$t1,$t1
    725 		_ror	$acc10,16,$acc10
    726 		xor	$acc7,$t1,$t1
    727 		_ror	$acc11,24,$acc11
    728 		xor	$acc8,$t2,$t2
    729 		_ror	$acc13,8,$acc13
    730 		xor	$acc9,$t2,$t2
    731 		_ror	$acc14,16,$acc14
    732 		xor	$acc10,$t2,$t2
    733 		_ror	$acc15,24,$acc15
    734 		xor	$acc11,$t2,$t2
    735 		xor	$acc12,$acc14,$acc14
    736 		xor	$acc13,$t3,$t3
    737 	_srm	$t0,24,$acc0
    738 		xor	$acc14,$t3,$t3
    739 		xor	$acc15,$t3,$t3
    740 	_srm	$t3,16,$acc1
    741 
    742 	_srm	$t2,8,$acc2
    743 	ldwx,s	$acc0($tbl),$acc0
    744 	_srm	$t1,0,$acc3
    745 	ldwx,s	$acc1($tbl),$acc1
    746 	_srm	$t1,24,$acc4
    747 	ldwx,s	$acc2($tbl),$acc2
    748 	_srm	$t0,16,$acc5
    749 	ldwx,s	$acc3($tbl),$acc3
    750 	_srm	$t3,8,$acc6
    751 	ldwx,s	$acc4($tbl),$acc4
    752 	_srm	$t2,0,$acc7
    753 	ldwx,s	$acc5($tbl),$acc5
    754 	_srm	$t2,24,$acc8
    755 	ldwx,s	$acc6($tbl),$acc6
    756 	_srm	$t1,16,$acc9
    757 	ldwx,s	$acc7($tbl),$acc7
    758 	_srm	$t0,8,$acc10
    759 	ldwx,s	$acc8($tbl),$acc8
    760 	_srm	$t3,0,$acc11
    761 	ldwx,s	$acc9($tbl),$acc9
    762 	_srm	$t3,24,$acc12
    763 	ldwx,s	$acc10($tbl),$acc10
    764 	_srm	$t2,16,$acc13
    765 	ldwx,s	$acc11($tbl),$acc11
    766 	_srm	$t1,8,$acc14
    767 	ldwx,s	$acc12($tbl),$acc12
    768 	_srm	$t0,0,$acc15
    769 	ldwx,s	$acc13($tbl),$acc13
    770 		_ror	$acc1,8,$acc1
    771 	ldwx,s	$acc14($tbl),$acc14
    772 
    773 		_ror	$acc2,16,$acc2
    774 		xor	$acc0,$s0,$s0
    775 	ldwx,s	$acc15($tbl),$acc15
    776 		_ror	$acc3,24,$acc3
    777 		xor	$acc1,$s0,$s0
    778 	ldw	16($key),$t0
    779 		_ror	$acc5,8,$acc5
    780 		xor	$acc2,$s0,$s0
    781 	ldw	20($key),$t1
    782 		_ror	$acc6,16,$acc6
    783 		xor	$acc3,$s0,$s0
    784 	ldw	24($key),$t2
    785 		_ror	$acc7,24,$acc7
    786 		xor	$acc4,$s1,$s1
    787 	ldw	28($key),$t3
    788 		_ror	$acc9,8,$acc9
    789 		xor	$acc5,$s1,$s1
    790 	ldw	1024+0($tbl),%r0		; prefetch td4
    791 		_ror	$acc10,16,$acc10
    792 		xor	$acc6,$s1,$s1
    793 	ldw	1024+32($tbl),%r0		; prefetch td4
    794 		_ror	$acc11,24,$acc11
    795 		xor	$acc7,$s1,$s1
    796 	ldw	1024+64($tbl),%r0		; prefetch td4
    797 		_ror	$acc13,8,$acc13
    798 		xor	$acc8,$s2,$s2
    799 	ldw	1024+96($tbl),%r0		; prefetch td4
    800 		_ror	$acc14,16,$acc14
    801 		xor	$acc9,$s2,$s2
    802 	ldw	1024+128($tbl),%r0		; prefetch td4
    803 		_ror	$acc15,24,$acc15
    804 		xor	$acc10,$s2,$s2
    805 	ldw	1024+160($tbl),%r0		; prefetch td4
    806 	_srm	$s0,24,$acc0
    807 		xor	$acc11,$s2,$s2
    808 	ldw	1024+192($tbl),%r0		; prefetch td4
    809 		xor	$acc12,$acc14,$acc14
    810 		xor	$acc13,$s3,$s3
    811 	ldw	1024+224($tbl),%r0		; prefetch td4
    812 		xor	$acc14,$s3,$s3
    813 		xor	$acc15,$s3,$s3
    814 	b	L\$dec_loop
    815 	_srm	$s3,16,$acc1
    816 
    817 	.ALIGN	16
    818 L\$dec_last
    819 	ldo	1024($tbl),$rounds
    820 		_ror	$acc1,8,$acc1
    821 		xor	$acc0,$t0,$t0
    822 	ldw	0($key),$s0
    823 		_ror	$acc2,16,$acc2
    824 		xor	$acc1,$t0,$t0
    825 	ldw	4($key),$s1
    826 		_ror	$acc3,24,$acc3
    827 		xor	$acc2,$t0,$t0
    828 	ldw	8($key),$s2
    829 		_ror	$acc5,8,$acc5
    830 		xor	$acc3,$t0,$t0
    831 	ldw	12($key),$s3
    832 		_ror	$acc6,16,$acc6
    833 		xor	$acc4,$t1,$t1
    834 		_ror	$acc7,24,$acc7
    835 		xor	$acc5,$t1,$t1
    836 		_ror	$acc9,8,$acc9
    837 		xor	$acc6,$t1,$t1
    838 		_ror	$acc10,16,$acc10
    839 		xor	$acc7,$t1,$t1
    840 		_ror	$acc11,24,$acc11
    841 		xor	$acc8,$t2,$t2
    842 		_ror	$acc13,8,$acc13
    843 		xor	$acc9,$t2,$t2
    844 		_ror	$acc14,16,$acc14
    845 		xor	$acc10,$t2,$t2
    846 		_ror	$acc15,24,$acc15
    847 		xor	$acc11,$t2,$t2
    848 		xor	$acc12,$acc14,$acc14
    849 		xor	$acc13,$t3,$t3
    850 	_srm	$t0,24,$acc0
    851 		xor	$acc14,$t3,$t3
    852 		xor	$acc15,$t3,$t3
    853 	_srm	$t3,16,$acc1
    854 
    855 	_srm	$t2,8,$acc2
    856 	ldbx	$acc0($rounds),$acc0
    857 	_srm	$t1,24,$acc4
    858 	ldbx	$acc1($rounds),$acc1
    859 	_srm	$t0,16,$acc5
    860 	_srm	$t1,0,$acc3
    861 	ldbx	$acc2($rounds),$acc2
    862 	ldbx	$acc3($rounds),$acc3
    863 	_srm	$t3,8,$acc6
    864 	ldbx	$acc4($rounds),$acc4
    865 	_srm	$t2,24,$acc8
    866 	ldbx	$acc5($rounds),$acc5
    867 	_srm	$t1,16,$acc9
    868 	_srm	$t2,0,$acc7
    869 	ldbx	$acc6($rounds),$acc6
    870 	ldbx	$acc7($rounds),$acc7
    871 	_srm	$t0,8,$acc10
    872 	ldbx	$acc8($rounds),$acc8
    873 	_srm	$t3,24,$acc12
    874 	ldbx	$acc9($rounds),$acc9
    875 	_srm	$t2,16,$acc13
    876 	_srm	$t3,0,$acc11
    877 	ldbx	$acc10($rounds),$acc10
    878 	_srm	$t1,8,$acc14
    879 	ldbx	$acc11($rounds),$acc11
    880 	ldbx	$acc12($rounds),$acc12
    881 	ldbx	$acc13($rounds),$acc13
    882 	_srm	$t0,0,$acc15
    883 	ldbx	$acc14($rounds),$acc14
    884 
    885 		dep	$acc0,7,8,$acc3
    886 	ldbx	$acc15($rounds),$acc15
    887 		dep	$acc4,7,8,$acc7
    888 		dep	$acc1,15,8,$acc3
    889 		dep	$acc5,15,8,$acc7
    890 		dep	$acc2,23,8,$acc3
    891 		dep	$acc6,23,8,$acc7
    892 		xor	$acc3,$s0,$s0
    893 		xor	$acc7,$s1,$s1
    894 		dep	$acc8,7,8,$acc11
    895 		dep	$acc12,7,8,$acc15
    896 		dep	$acc9,15,8,$acc11
    897 		dep	$acc13,15,8,$acc15
    898 		dep	$acc10,23,8,$acc11
    899 		dep	$acc14,23,8,$acc15
    900 		xor	$acc11,$s2,$s2
    901 
    902 	bv	(%r31)
    903 	.EXIT
    904 		xor	$acc15,$s3,$s3
    905 	.PROCEND
    906 
    907 	.ALIGN	64
    908 L\$AES_Td
    909 	.WORD	0x51f4a750, 0x7e416553, 0x1a17a4c3, 0x3a275e96
    910 	.WORD	0x3bab6bcb, 0x1f9d45f1, 0xacfa58ab, 0x4be30393
    911 	.WORD	0x2030fa55, 0xad766df6, 0x88cc7691, 0xf5024c25
    912 	.WORD	0x4fe5d7fc, 0xc52acbd7, 0x26354480, 0xb562a38f
    913 	.WORD	0xdeb15a49, 0x25ba1b67, 0x45ea0e98, 0x5dfec0e1
    914 	.WORD	0xc32f7502, 0x814cf012, 0x8d4697a3, 0x6bd3f9c6
    915 	.WORD	0x038f5fe7, 0x15929c95, 0xbf6d7aeb, 0x955259da
    916 	.WORD	0xd4be832d, 0x587421d3, 0x49e06929, 0x8ec9c844
    917 	.WORD	0x75c2896a, 0xf48e7978, 0x99583e6b, 0x27b971dd
    918 	.WORD	0xbee14fb6, 0xf088ad17, 0xc920ac66, 0x7dce3ab4
    919 	.WORD	0x63df4a18, 0xe51a3182, 0x97513360, 0x62537f45
    920 	.WORD	0xb16477e0, 0xbb6bae84, 0xfe81a01c, 0xf9082b94
    921 	.WORD	0x70486858, 0x8f45fd19, 0x94de6c87, 0x527bf8b7
    922 	.WORD	0xab73d323, 0x724b02e2, 0xe31f8f57, 0x6655ab2a
    923 	.WORD	0xb2eb2807, 0x2fb5c203, 0x86c57b9a, 0xd33708a5
    924 	.WORD	0x302887f2, 0x23bfa5b2, 0x02036aba, 0xed16825c
    925 	.WORD	0x8acf1c2b, 0xa779b492, 0xf307f2f0, 0x4e69e2a1
    926 	.WORD	0x65daf4cd, 0x0605bed5, 0xd134621f, 0xc4a6fe8a
    927 	.WORD	0x342e539d, 0xa2f355a0, 0x058ae132, 0xa4f6eb75
    928 	.WORD	0x0b83ec39, 0x4060efaa, 0x5e719f06, 0xbd6e1051
    929 	.WORD	0x3e218af9, 0x96dd063d, 0xdd3e05ae, 0x4de6bd46
    930 	.WORD	0x91548db5, 0x71c45d05, 0x0406d46f, 0x605015ff
    931 	.WORD	0x1998fb24, 0xd6bde997, 0x894043cc, 0x67d99e77
    932 	.WORD	0xb0e842bd, 0x07898b88, 0xe7195b38, 0x79c8eedb
    933 	.WORD	0xa17c0a47, 0x7c420fe9, 0xf8841ec9, 0x00000000
    934 	.WORD	0x09808683, 0x322bed48, 0x1e1170ac, 0x6c5a724e
    935 	.WORD	0xfd0efffb, 0x0f853856, 0x3daed51e, 0x362d3927
    936 	.WORD	0x0a0fd964, 0x685ca621, 0x9b5b54d1, 0x24362e3a
    937 	.WORD	0x0c0a67b1, 0x9357e70f, 0xb4ee96d2, 0x1b9b919e
    938 	.WORD	0x80c0c54f, 0x61dc20a2, 0x5a774b69, 0x1c121a16
    939 	.WORD	0xe293ba0a, 0xc0a02ae5, 0x3c22e043, 0x121b171d
    940 	.WORD	0x0e090d0b, 0xf28bc7ad, 0x2db6a8b9, 0x141ea9c8
    941 	.WORD	0x57f11985, 0xaf75074c, 0xee99ddbb, 0xa37f60fd
    942 	.WORD	0xf701269f, 0x5c72f5bc, 0x44663bc5, 0x5bfb7e34
    943 	.WORD	0x8b432976, 0xcb23c6dc, 0xb6edfc68, 0xb8e4f163
    944 	.WORD	0xd731dcca, 0x42638510, 0x13972240, 0x84c61120
    945 	.WORD	0x854a247d, 0xd2bb3df8, 0xaef93211, 0xc729a16d
    946 	.WORD	0x1d9e2f4b, 0xdcb230f3, 0x0d8652ec, 0x77c1e3d0
    947 	.WORD	0x2bb3166c, 0xa970b999, 0x119448fa, 0x47e96422
    948 	.WORD	0xa8fc8cc4, 0xa0f03f1a, 0x567d2cd8, 0x223390ef
    949 	.WORD	0x87494ec7, 0xd938d1c1, 0x8ccaa2fe, 0x98d40b36
    950 	.WORD	0xa6f581cf, 0xa57ade28, 0xdab78e26, 0x3fadbfa4
    951 	.WORD	0x2c3a9de4, 0x5078920d, 0x6a5fcc9b, 0x547e4662
    952 	.WORD	0xf68d13c2, 0x90d8b8e8, 0x2e39f75e, 0x82c3aff5
    953 	.WORD	0x9f5d80be, 0x69d0937c, 0x6fd52da9, 0xcf2512b3
    954 	.WORD	0xc8ac993b, 0x10187da7, 0xe89c636e, 0xdb3bbb7b
    955 	.WORD	0xcd267809, 0x6e5918f4, 0xec9ab701, 0x834f9aa8
    956 	.WORD	0xe6956e65, 0xaaffe67e, 0x21bccf08, 0xef15e8e6
    957 	.WORD	0xbae79bd9, 0x4a6f36ce, 0xea9f09d4, 0x29b07cd6
    958 	.WORD	0x31a4b2af, 0x2a3f2331, 0xc6a59430, 0x35a266c0
    959 	.WORD	0x744ebc37, 0xfc82caa6, 0xe090d0b0, 0x33a7d815
    960 	.WORD	0xf104984a, 0x41ecdaf7, 0x7fcd500e, 0x1791f62f
    961 	.WORD	0x764dd68d, 0x43efb04d, 0xccaa4d54, 0xe49604df
    962 	.WORD	0x9ed1b5e3, 0x4c6a881b, 0xc12c1fb8, 0x4665517f
    963 	.WORD	0x9d5eea04, 0x018c355d, 0xfa877473, 0xfb0b412e
    964 	.WORD	0xb3671d5a, 0x92dbd252, 0xe9105633, 0x6dd64713
    965 	.WORD	0x9ad7618c, 0x37a10c7a, 0x59f8148e, 0xeb133c89
    966 	.WORD	0xcea927ee, 0xb761c935, 0xe11ce5ed, 0x7a47b13c
    967 	.WORD	0x9cd2df59, 0x55f2733f, 0x1814ce79, 0x73c737bf
    968 	.WORD	0x53f7cdea, 0x5ffdaa5b, 0xdf3d6f14, 0x7844db86
    969 	.WORD	0xcaaff381, 0xb968c43e, 0x3824342c, 0xc2a3405f
    970 	.WORD	0x161dc372, 0xbce2250c, 0x283c498b, 0xff0d9541
    971 	.WORD	0x39a80171, 0x080cb3de, 0xd8b4e49c, 0x6456c190
    972 	.WORD	0x7bcb8461, 0xd532b670, 0x486c5c74, 0xd0b85742
    973 	.BYTE	0x52, 0x09, 0x6a, 0xd5, 0x30, 0x36, 0xa5, 0x38
    974 	.BYTE	0xbf, 0x40, 0xa3, 0x9e, 0x81, 0xf3, 0xd7, 0xfb
    975 	.BYTE	0x7c, 0xe3, 0x39, 0x82, 0x9b, 0x2f, 0xff, 0x87
    976 	.BYTE	0x34, 0x8e, 0x43, 0x44, 0xc4, 0xde, 0xe9, 0xcb
    977 	.BYTE	0x54, 0x7b, 0x94, 0x32, 0xa6, 0xc2, 0x23, 0x3d
    978 	.BYTE	0xee, 0x4c, 0x95, 0x0b, 0x42, 0xfa, 0xc3, 0x4e
    979 	.BYTE	0x08, 0x2e, 0xa1, 0x66, 0x28, 0xd9, 0x24, 0xb2
    980 	.BYTE	0x76, 0x5b, 0xa2, 0x49, 0x6d, 0x8b, 0xd1, 0x25
    981 	.BYTE	0x72, 0xf8, 0xf6, 0x64, 0x86, 0x68, 0x98, 0x16
    982 	.BYTE	0xd4, 0xa4, 0x5c, 0xcc, 0x5d, 0x65, 0xb6, 0x92
    983 	.BYTE	0x6c, 0x70, 0x48, 0x50, 0xfd, 0xed, 0xb9, 0xda
    984 	.BYTE	0x5e, 0x15, 0x46, 0x57, 0xa7, 0x8d, 0x9d, 0x84
    985 	.BYTE	0x90, 0xd8, 0xab, 0x00, 0x8c, 0xbc, 0xd3, 0x0a
    986 	.BYTE	0xf7, 0xe4, 0x58, 0x05, 0xb8, 0xb3, 0x45, 0x06
    987 	.BYTE	0xd0, 0x2c, 0x1e, 0x8f, 0xca, 0x3f, 0x0f, 0x02
    988 	.BYTE	0xc1, 0xaf, 0xbd, 0x03, 0x01, 0x13, 0x8a, 0x6b
    989 	.BYTE	0x3a, 0x91, 0x11, 0x41, 0x4f, 0x67, 0xdc, 0xea
    990 	.BYTE	0x97, 0xf2, 0xcf, 0xce, 0xf0, 0xb4, 0xe6, 0x73
    991 	.BYTE	0x96, 0xac, 0x74, 0x22, 0xe7, 0xad, 0x35, 0x85
    992 	.BYTE	0xe2, 0xf9, 0x37, 0xe8, 0x1c, 0x75, 0xdf, 0x6e
    993 	.BYTE	0x47, 0xf1, 0x1a, 0x71, 0x1d, 0x29, 0xc5, 0x89
    994 	.BYTE	0x6f, 0xb7, 0x62, 0x0e, 0xaa, 0x18, 0xbe, 0x1b
    995 	.BYTE	0xfc, 0x56, 0x3e, 0x4b, 0xc6, 0xd2, 0x79, 0x20
    996 	.BYTE	0x9a, 0xdb, 0xc0, 0xfe, 0x78, 0xcd, 0x5a, 0xf4
    997 	.BYTE	0x1f, 0xdd, 0xa8, 0x33, 0x88, 0x07, 0xc7, 0x31
    998 	.BYTE	0xb1, 0x12, 0x10, 0x59, 0x27, 0x80, 0xec, 0x5f
    999 	.BYTE	0x60, 0x51, 0x7f, 0xa9, 0x19, 0xb5, 0x4a, 0x0d
   1000 	.BYTE	0x2d, 0xe5, 0x7a, 0x9f, 0x93, 0xc9, 0x9c, 0xef
   1001 	.BYTE	0xa0, 0xe0, 0x3b, 0x4d, 0xae, 0x2a, 0xf5, 0xb0
   1002 	.BYTE	0xc8, 0xeb, 0xbb, 0x3c, 0x83, 0x53, 0x99, 0x61
   1003 	.BYTE	0x17, 0x2b, 0x04, 0x7e, 0xba, 0x77, 0xd6, 0x26
   1004 	.BYTE	0xe1, 0x69, 0x14, 0x63, 0x55, 0x21, 0x0c, 0x7d
   1005 	.STRINGZ "AES for PA-RISC, CRYPTOGAMS by <appro\@openssl.org>"
   1006 ___
   1007 
   1008 foreach (split("\n",$code)) {
   1009 	s/\`([^\`]*)\`/eval $1/ge;
   1010 
   1011 	# translate made up instructons: _ror, _srm
   1012 	s/_ror(\s+)(%r[0-9]+),/shd$1$2,$2,/				or
   1013 
   1014 	s/_srm(\s+%r[0-9]+),([0-9]+),/
   1015 		$SIZE_T==4 ? sprintf("extru%s,%d,8,",$1,31-$2)
   1016 		:            sprintf("extrd,u%s,%d,8,",$1,63-$2)/e;
   1017 
   1018 	s/,\*/,/ if ($SIZE_T==4);
   1019 	print $_,"\n";
   1020 }
   1021 close STDOUT;
   1022