aes-parisc.pl revision 392aa7cc7d2b122614c5393c3e357da07fd07af3
1#!/usr/bin/env perl
2
3# ====================================================================
4# Written by Andy Polyakov <appro@fy.chalmers.se> for the OpenSSL
5# project. The module is, however, dual licensed under OpenSSL and
6# CRYPTOGAMS licenses depending on where you obtain it. For further
7# details see http://www.openssl.org/~appro/cryptogams/.
8# ====================================================================
9
10# AES for PA-RISC.
11#
12# June 2009.
13#
14# The module is mechanical transliteration of aes-sparcv9.pl, but with
15# a twist: S-boxes are compressed even further down to 1K+256B. On
16# PA-7100LC performance is ~40% better than gcc 3.2 generated code and
17# is about 33 cycles per byte processed with 128-bit key. Newer CPUs
18# perform at 16 cycles per byte. It's not faster than code generated
19# by vendor compiler, but recall that it has compressed S-boxes, which
20# requires extra processing.
21#
22# Special thanks to polarhome.com for providing HP-UX account.
23
# Command line: <flavour> [<output file>].
# $flavour is matched against /64/ further down to pick the ABI
# parameters; $output names the file that receives the generated
# assembly.
$flavour = shift;
$output = shift;

# Redirect STDOUT only when an output file was actually named; otherwise
# keep writing to the inherited STDOUT.  (A failed open on STDOUT leaves
# the handle closed, which would silently discard everything printed
# later.)  Three-argument open keeps the file name from being parsed for
# a mode, and a failure aborts instead of going unnoticed.
if (defined($output) && $output ne "") {
	open STDOUT,">",$output or die "can't open $output: $!";
}
27
# ABI-dependent parameters, one row per flavour.  Columns, in order:
#   $LEVEL         argument of the .LEVEL directive
#   $SIZE_T        size of a saved register slot in bytes
#   $FRAME_MARKER  size of the frame marker in bytes
#   $SAVED_RP      distance below %sp at which %r2 is saved on entry
#   $PUSH/$PUSHMA  store / store-and-modify mnemonics
#   $POP/$POPMB    load / load-and-modify mnemonics
my %abi = (
	64 => [ "2.0W", 8, 80, 16, "std", "std,ma", "ldd", "ldd,mb" ],
	32 => [ "1.0",  4, 48, 20, "stw", "stwm",   "ldw", "ldwm"   ],
);

# Any flavour string containing "64" selects the 64-bit row.
($LEVEL, $SIZE_T, $FRAME_MARKER, $SAVED_RP,
 $PUSH,  $PUSHMA, $POP,          $POPMB) =
	@{ $abi{ $flavour =~ /64/ ? 64 : 32 } };
47
# Stack frame size: frame marker plus slots for 16 saved registers
# [+ argument transfer].
$FRAME=$FRAME_MARKER+16*$SIZE_T;

# Incoming arguments: arg0, arg1, arg2.
($inp,$out,$key) = ("%r26","%r25","%r24");

# Four state words in %r1-%r4 and four temporaries in %r5-%r8.
($s0,$s1,$s2,$s3) = map("%r$_",1..4);
($t0,$t1,$t2,$t3) = map("%r$_",5..8);

# Sixteen accumulators: %r9-%r23, plus %r26 for the last one
# (the same register as $inp).
($acc0, $acc1, $acc2, $acc3, $acc4, $acc5, $acc6, $acc7,
 $acc8, $acc9,$acc10,$acc11,$acc12,$acc13,$acc14,$acc15) =
	map("%r$_",9..23,26);

# Table base pointer and round counter.
($tbl,$rounds) = ("%r28","%r29");
64
# Assembly template, first part.  The heredoc below holds, in order:
#   - the assembler preamble (.LEVEL/.SPACE/.SUBSPA);
#   - AES_encrypt, the exported entry point taking $inp, $out and $key:
#     it saves %r2 and %r3-%r18, loads the input block into $s0-$s3
#     (realigning with vshd when $inp is not word aligned), calls
#     _parisc_AES_encrypt, and stores the result with stw or, when
#     $out is not word aligned, byte by byte with stb;
#   - _parisc_AES_encrypt, the internal routine that loads its loop
#     counter from offset 240 of $key and returns through %r31;
#   - L$AES_Te, 256 words followed by 256 bytes of lookup table (the
#     byte part is addressed as 1024($tbl) in the last round).
# The text is interpolated, so $-signs meant for the assembler are
# written as \$.  Backticked expressions and the pseudo-instructions
# _ror/_srm are expanded by the loop at the end of this file.
65$code=<<___;
66	.LEVEL	$LEVEL
67	.SPACE	\$TEXT\$
68	.SUBSPA	\$CODE\$,QUAD=0,ALIGN=8,ACCESS=0x2C,CODE_ONLY
69
70	.EXPORT	AES_encrypt,ENTRY,ARGW0=GR,ARGW1=GR,ARGW2=GR
71	.ALIGN	64
72AES_encrypt
73	.PROC
74	.CALLINFO	FRAME=`$FRAME-16*$SIZE_T`,NO_CALLS,SAVE_RP,ENTRY_GR=18
75	.ENTRY
76	$PUSH	%r2,-$SAVED_RP(%sp)	; standard prologue
77	$PUSHMA	%r3,$FRAME(%sp)
78	$PUSH	%r4,`-$FRAME+1*$SIZE_T`(%sp)
79	$PUSH	%r5,`-$FRAME+2*$SIZE_T`(%sp)
80	$PUSH	%r6,`-$FRAME+3*$SIZE_T`(%sp)
81	$PUSH	%r7,`-$FRAME+4*$SIZE_T`(%sp)
82	$PUSH	%r8,`-$FRAME+5*$SIZE_T`(%sp)
83	$PUSH	%r9,`-$FRAME+6*$SIZE_T`(%sp)
84	$PUSH	%r10,`-$FRAME+7*$SIZE_T`(%sp)
85	$PUSH	%r11,`-$FRAME+8*$SIZE_T`(%sp)
86	$PUSH	%r12,`-$FRAME+9*$SIZE_T`(%sp)
87	$PUSH	%r13,`-$FRAME+10*$SIZE_T`(%sp)
88	$PUSH	%r14,`-$FRAME+11*$SIZE_T`(%sp)
89	$PUSH	%r15,`-$FRAME+12*$SIZE_T`(%sp)
90	$PUSH	%r16,`-$FRAME+13*$SIZE_T`(%sp)
91	$PUSH	%r17,`-$FRAME+14*$SIZE_T`(%sp)
92	$PUSH	%r18,`-$FRAME+15*$SIZE_T`(%sp)
93
94	blr	%r0,$tbl
95	ldi	3,$t0
96L\$enc_pic
97	andcm	$tbl,$t0,$tbl
98	ldo	L\$AES_Te-L\$enc_pic($tbl),$tbl
99
100	and	$inp,$t0,$t0
101	sub	$inp,$t0,$inp
102	ldw	0($inp),$s0
103	ldw	4($inp),$s1
104	ldw	8($inp),$s2
105	comib,=	0,$t0,L\$enc_inp_aligned
106	ldw	12($inp),$s3
107
108	sh3addl	$t0,%r0,$t0
109	subi	32,$t0,$t0
110	mtctl	$t0,%cr11
111	ldw	16($inp),$t1
112	vshd	$s0,$s1,$s0
113	vshd	$s1,$s2,$s1
114	vshd	$s2,$s3,$s2
115	vshd	$s3,$t1,$s3
116
117L\$enc_inp_aligned
118	bl	_parisc_AES_encrypt,%r31
119	nop
120
121	extru,<> $out,31,2,%r0
122	b	L\$enc_out_aligned
123	nop
124
125	_srm	$s0,24,$acc0
126	_srm	$s0,16,$acc1
127	stb	$acc0,0($out)
128	_srm	$s0,8,$acc2
129	stb	$acc1,1($out)
130	_srm	$s1,24,$acc4
131	stb	$acc2,2($out)
132	_srm	$s1,16,$acc5
133	stb	$s0,3($out)
134	_srm	$s1,8,$acc6
135	stb	$acc4,4($out)
136	_srm	$s2,24,$acc0
137	stb	$acc5,5($out)
138	_srm	$s2,16,$acc1
139	stb	$acc6,6($out)
140	_srm	$s2,8,$acc2
141	stb	$s1,7($out)
142	_srm	$s3,24,$acc4
143	stb	$acc0,8($out)
144	_srm	$s3,16,$acc5
145	stb	$acc1,9($out)
146	_srm	$s3,8,$acc6
147	stb	$acc2,10($out)
148	stb	$s2,11($out)
149	stb	$acc4,12($out)
150	stb	$acc5,13($out)
151	stb	$acc6,14($out)
152	b	L\$enc_done
153	stb	$s3,15($out)
154
155L\$enc_out_aligned
156	stw	$s0,0($out)
157	stw	$s1,4($out)
158	stw	$s2,8($out)
159	stw	$s3,12($out)
160
161L\$enc_done
162	$POP	`-$FRAME-$SAVED_RP`(%sp),%r2	; standard epilogue
163	$POP	`-$FRAME+1*$SIZE_T`(%sp),%r4
164	$POP	`-$FRAME+2*$SIZE_T`(%sp),%r5
165	$POP	`-$FRAME+3*$SIZE_T`(%sp),%r6
166	$POP	`-$FRAME+4*$SIZE_T`(%sp),%r7
167	$POP	`-$FRAME+5*$SIZE_T`(%sp),%r8
168	$POP	`-$FRAME+6*$SIZE_T`(%sp),%r9
169	$POP	`-$FRAME+7*$SIZE_T`(%sp),%r10
170	$POP	`-$FRAME+8*$SIZE_T`(%sp),%r11
171	$POP	`-$FRAME+9*$SIZE_T`(%sp),%r12
172	$POP	`-$FRAME+10*$SIZE_T`(%sp),%r13
173	$POP	`-$FRAME+11*$SIZE_T`(%sp),%r14
174	$POP	`-$FRAME+12*$SIZE_T`(%sp),%r15
175	$POP	`-$FRAME+13*$SIZE_T`(%sp),%r16
176	$POP	`-$FRAME+14*$SIZE_T`(%sp),%r17
177	$POP	`-$FRAME+15*$SIZE_T`(%sp),%r18
178	bv	(%r2)
179	.EXIT
180	$POPMB	-$FRAME(%sp),%r3
181	.PROCEND
182
183	.ALIGN	16
184_parisc_AES_encrypt
185	.PROC
186	.CALLINFO	MILLICODE
187	.ENTRY
188	ldw	240($key),$rounds
189	ldw	0($key),$t0
190	ldw	4($key),$t1
191	ldw	8($key),$t2
192	_srm	$rounds,1,$rounds
193	xor	$t0,$s0,$s0
194	ldw	12($key),$t3
195	_srm	$s0,24,$acc0
196	xor	$t1,$s1,$s1
197	ldw	16($key),$t0
198	_srm	$s1,16,$acc1
199	xor	$t2,$s2,$s2
200	ldw	20($key),$t1
201	xor	$t3,$s3,$s3
202	ldw	24($key),$t2
203	ldw	28($key),$t3
204L\$enc_loop
205	_srm	$s2,8,$acc2
206	ldwx,s	$acc0($tbl),$acc0
207	_srm	$s3,0,$acc3
208	ldwx,s	$acc1($tbl),$acc1
209	_srm	$s1,24,$acc4
210	ldwx,s	$acc2($tbl),$acc2
211	_srm	$s2,16,$acc5
212	ldwx,s	$acc3($tbl),$acc3
213	_srm	$s3,8,$acc6
214	ldwx,s	$acc4($tbl),$acc4
215	_srm	$s0,0,$acc7
216	ldwx,s	$acc5($tbl),$acc5
217	_srm	$s2,24,$acc8
218	ldwx,s	$acc6($tbl),$acc6
219	_srm	$s3,16,$acc9
220	ldwx,s	$acc7($tbl),$acc7
221	_srm	$s0,8,$acc10
222	ldwx,s	$acc8($tbl),$acc8
223	_srm	$s1,0,$acc11
224	ldwx,s	$acc9($tbl),$acc9
225	_srm	$s3,24,$acc12
226	ldwx,s	$acc10($tbl),$acc10
227	_srm	$s0,16,$acc13
228	ldwx,s	$acc11($tbl),$acc11
229	_srm	$s1,8,$acc14
230	ldwx,s	$acc12($tbl),$acc12
231	_srm	$s2,0,$acc15
232	ldwx,s	$acc13($tbl),$acc13
233	ldwx,s	$acc14($tbl),$acc14
234	ldwx,s	$acc15($tbl),$acc15
235	addib,= -1,$rounds,L\$enc_last
236	ldo	32($key),$key
237
238		_ror	$acc1,8,$acc1
239		xor	$acc0,$t0,$t0
240	ldw	0($key),$s0
241		_ror	$acc2,16,$acc2
242		xor	$acc1,$t0,$t0
243	ldw	4($key),$s1
244		_ror	$acc3,24,$acc3
245		xor	$acc2,$t0,$t0
246	ldw	8($key),$s2
247		_ror	$acc5,8,$acc5
248		xor	$acc3,$t0,$t0
249	ldw	12($key),$s3
250		_ror	$acc6,16,$acc6
251		xor	$acc4,$t1,$t1
252		_ror	$acc7,24,$acc7
253		xor	$acc5,$t1,$t1
254		_ror	$acc9,8,$acc9
255		xor	$acc6,$t1,$t1
256		_ror	$acc10,16,$acc10
257		xor	$acc7,$t1,$t1
258		_ror	$acc11,24,$acc11
259		xor	$acc8,$t2,$t2
260		_ror	$acc13,8,$acc13
261		xor	$acc9,$t2,$t2
262		_ror	$acc14,16,$acc14
263		xor	$acc10,$t2,$t2
264		_ror	$acc15,24,$acc15
265		xor	$acc11,$t2,$t2
266		xor	$acc12,$acc14,$acc14
267		xor	$acc13,$t3,$t3
268	_srm	$t0,24,$acc0
269		xor	$acc14,$t3,$t3
270	_srm	$t1,16,$acc1
271		xor	$acc15,$t3,$t3
272
273	_srm	$t2,8,$acc2
274	ldwx,s	$acc0($tbl),$acc0
275	_srm	$t3,0,$acc3
276	ldwx,s	$acc1($tbl),$acc1
277	_srm	$t1,24,$acc4
278	ldwx,s	$acc2($tbl),$acc2
279	_srm	$t2,16,$acc5
280	ldwx,s	$acc3($tbl),$acc3
281	_srm	$t3,8,$acc6
282	ldwx,s	$acc4($tbl),$acc4
283	_srm	$t0,0,$acc7
284	ldwx,s	$acc5($tbl),$acc5
285	_srm	$t2,24,$acc8
286	ldwx,s	$acc6($tbl),$acc6
287	_srm	$t3,16,$acc9
288	ldwx,s	$acc7($tbl),$acc7
289	_srm	$t0,8,$acc10
290	ldwx,s	$acc8($tbl),$acc8
291	_srm	$t1,0,$acc11
292	ldwx,s	$acc9($tbl),$acc9
293	_srm	$t3,24,$acc12
294	ldwx,s	$acc10($tbl),$acc10
295	_srm	$t0,16,$acc13
296	ldwx,s	$acc11($tbl),$acc11
297	_srm	$t1,8,$acc14
298	ldwx,s	$acc12($tbl),$acc12
299	_srm	$t2,0,$acc15
300	ldwx,s	$acc13($tbl),$acc13
301		_ror	$acc1,8,$acc1
302	ldwx,s	$acc14($tbl),$acc14
303
304		_ror	$acc2,16,$acc2
305		xor	$acc0,$s0,$s0
306	ldwx,s	$acc15($tbl),$acc15
307		_ror	$acc3,24,$acc3
308		xor	$acc1,$s0,$s0
309	ldw	16($key),$t0
310		_ror	$acc5,8,$acc5
311		xor	$acc2,$s0,$s0
312	ldw	20($key),$t1
313		_ror	$acc6,16,$acc6
314		xor	$acc3,$s0,$s0
315	ldw	24($key),$t2
316		_ror	$acc7,24,$acc7
317		xor	$acc4,$s1,$s1
318	ldw	28($key),$t3
319		_ror	$acc9,8,$acc9
320		xor	$acc5,$s1,$s1
321	ldw	1024+0($tbl),%r0		; prefetch te4
322		_ror	$acc10,16,$acc10
323		xor	$acc6,$s1,$s1
324	ldw	1024+32($tbl),%r0		; prefetch te4
325		_ror	$acc11,24,$acc11
326		xor	$acc7,$s1,$s1
327	ldw	1024+64($tbl),%r0		; prefetch te4
328		_ror	$acc13,8,$acc13
329		xor	$acc8,$s2,$s2
330	ldw	1024+96($tbl),%r0		; prefetch te4
331		_ror	$acc14,16,$acc14
332		xor	$acc9,$s2,$s2
333	ldw	1024+128($tbl),%r0		; prefetch te4
334		_ror	$acc15,24,$acc15
335		xor	$acc10,$s2,$s2
336	ldw	1024+160($tbl),%r0		; prefetch te4
337	_srm	$s0,24,$acc0
338		xor	$acc11,$s2,$s2
339	ldw	1024+192($tbl),%r0		; prefetch te4
340		xor	$acc12,$acc14,$acc14
341		xor	$acc13,$s3,$s3
342	ldw	1024+224($tbl),%r0		; prefetch te4
343	_srm	$s1,16,$acc1
344		xor	$acc14,$s3,$s3
345	b	L\$enc_loop
346		xor	$acc15,$s3,$s3
347
348	.ALIGN	16
349L\$enc_last
350	ldo	1024($tbl),$rounds
351		_ror	$acc1,8,$acc1
352		xor	$acc0,$t0,$t0
353	ldw	0($key),$s0
354		_ror	$acc2,16,$acc2
355		xor	$acc1,$t0,$t0
356	ldw	4($key),$s1
357		_ror	$acc3,24,$acc3
358		xor	$acc2,$t0,$t0
359	ldw	8($key),$s2
360		_ror	$acc5,8,$acc5
361		xor	$acc3,$t0,$t0
362	ldw	12($key),$s3
363		_ror	$acc6,16,$acc6
364		xor	$acc4,$t1,$t1
365		_ror	$acc7,24,$acc7
366		xor	$acc5,$t1,$t1
367		_ror	$acc9,8,$acc9
368		xor	$acc6,$t1,$t1
369		_ror	$acc10,16,$acc10
370		xor	$acc7,$t1,$t1
371		_ror	$acc11,24,$acc11
372		xor	$acc8,$t2,$t2
373		_ror	$acc13,8,$acc13
374		xor	$acc9,$t2,$t2
375		_ror	$acc14,16,$acc14
376		xor	$acc10,$t2,$t2
377		_ror	$acc15,24,$acc15
378		xor	$acc11,$t2,$t2
379		xor	$acc12,$acc14,$acc14
380		xor	$acc13,$t3,$t3
381	_srm	$t0,24,$acc0
382		xor	$acc14,$t3,$t3
383	_srm	$t1,16,$acc1
384		xor	$acc15,$t3,$t3
385
386	_srm	$t2,8,$acc2
387	ldbx	$acc0($rounds),$acc0
388	_srm	$t1,24,$acc4
389	ldbx	$acc1($rounds),$acc1
390	_srm	$t2,16,$acc5
391	_srm	$t3,0,$acc3
392	ldbx	$acc2($rounds),$acc2
393	ldbx	$acc3($rounds),$acc3
394	_srm	$t3,8,$acc6
395	ldbx	$acc4($rounds),$acc4
396	_srm	$t2,24,$acc8
397	ldbx	$acc5($rounds),$acc5
398	_srm	$t3,16,$acc9
399	_srm	$t0,0,$acc7
400	ldbx	$acc6($rounds),$acc6
401	ldbx	$acc7($rounds),$acc7
402	_srm	$t0,8,$acc10
403	ldbx	$acc8($rounds),$acc8
404	_srm	$t3,24,$acc12
405	ldbx	$acc9($rounds),$acc9
406	_srm	$t0,16,$acc13
407	_srm	$t1,0,$acc11
408	ldbx	$acc10($rounds),$acc10
409	_srm	$t1,8,$acc14
410	ldbx	$acc11($rounds),$acc11
411	ldbx	$acc12($rounds),$acc12
412	ldbx	$acc13($rounds),$acc13
413	_srm	$t2,0,$acc15
414	ldbx	$acc14($rounds),$acc14
415
416		dep	$acc0,7,8,$acc3
417	ldbx	$acc15($rounds),$acc15
418		dep	$acc4,7,8,$acc7
419		dep	$acc1,15,8,$acc3
420		dep	$acc5,15,8,$acc7
421		dep	$acc2,23,8,$acc3
422		dep	$acc6,23,8,$acc7
423		xor	$acc3,$s0,$s0
424		xor	$acc7,$s1,$s1
425		dep	$acc8,7,8,$acc11
426		dep	$acc12,7,8,$acc15
427		dep	$acc9,15,8,$acc11
428		dep	$acc13,15,8,$acc15
429		dep	$acc10,23,8,$acc11
430		dep	$acc14,23,8,$acc15
431		xor	$acc11,$s2,$s2
432
433	bv	(%r31)
434	.EXIT
435		xor	$acc15,$s3,$s3
436	.PROCEND
437
438	.ALIGN	64
439L\$AES_Te
440	.WORD	0xc66363a5, 0xf87c7c84, 0xee777799, 0xf67b7b8d
441	.WORD	0xfff2f20d, 0xd66b6bbd, 0xde6f6fb1, 0x91c5c554
442	.WORD	0x60303050, 0x02010103, 0xce6767a9, 0x562b2b7d
443	.WORD	0xe7fefe19, 0xb5d7d762, 0x4dababe6, 0xec76769a
444	.WORD	0x8fcaca45, 0x1f82829d, 0x89c9c940, 0xfa7d7d87
445	.WORD	0xeffafa15, 0xb25959eb, 0x8e4747c9, 0xfbf0f00b
446	.WORD	0x41adadec, 0xb3d4d467, 0x5fa2a2fd, 0x45afafea
447	.WORD	0x239c9cbf, 0x53a4a4f7, 0xe4727296, 0x9bc0c05b
448	.WORD	0x75b7b7c2, 0xe1fdfd1c, 0x3d9393ae, 0x4c26266a
449	.WORD	0x6c36365a, 0x7e3f3f41, 0xf5f7f702, 0x83cccc4f
450	.WORD	0x6834345c, 0x51a5a5f4, 0xd1e5e534, 0xf9f1f108
451	.WORD	0xe2717193, 0xabd8d873, 0x62313153, 0x2a15153f
452	.WORD	0x0804040c, 0x95c7c752, 0x46232365, 0x9dc3c35e
453	.WORD	0x30181828, 0x379696a1, 0x0a05050f, 0x2f9a9ab5
454	.WORD	0x0e070709, 0x24121236, 0x1b80809b, 0xdfe2e23d
455	.WORD	0xcdebeb26, 0x4e272769, 0x7fb2b2cd, 0xea75759f
456	.WORD	0x1209091b, 0x1d83839e, 0x582c2c74, 0x341a1a2e
457	.WORD	0x361b1b2d, 0xdc6e6eb2, 0xb45a5aee, 0x5ba0a0fb
458	.WORD	0xa45252f6, 0x763b3b4d, 0xb7d6d661, 0x7db3b3ce
459	.WORD	0x5229297b, 0xdde3e33e, 0x5e2f2f71, 0x13848497
460	.WORD	0xa65353f5, 0xb9d1d168, 0x00000000, 0xc1eded2c
461	.WORD	0x40202060, 0xe3fcfc1f, 0x79b1b1c8, 0xb65b5bed
462	.WORD	0xd46a6abe, 0x8dcbcb46, 0x67bebed9, 0x7239394b
463	.WORD	0x944a4ade, 0x984c4cd4, 0xb05858e8, 0x85cfcf4a
464	.WORD	0xbbd0d06b, 0xc5efef2a, 0x4faaaae5, 0xedfbfb16
465	.WORD	0x864343c5, 0x9a4d4dd7, 0x66333355, 0x11858594
466	.WORD	0x8a4545cf, 0xe9f9f910, 0x04020206, 0xfe7f7f81
467	.WORD	0xa05050f0, 0x783c3c44, 0x259f9fba, 0x4ba8a8e3
468	.WORD	0xa25151f3, 0x5da3a3fe, 0x804040c0, 0x058f8f8a
469	.WORD	0x3f9292ad, 0x219d9dbc, 0x70383848, 0xf1f5f504
470	.WORD	0x63bcbcdf, 0x77b6b6c1, 0xafdada75, 0x42212163
471	.WORD	0x20101030, 0xe5ffff1a, 0xfdf3f30e, 0xbfd2d26d
472	.WORD	0x81cdcd4c, 0x180c0c14, 0x26131335, 0xc3ecec2f
473	.WORD	0xbe5f5fe1, 0x359797a2, 0x884444cc, 0x2e171739
474	.WORD	0x93c4c457, 0x55a7a7f2, 0xfc7e7e82, 0x7a3d3d47
475	.WORD	0xc86464ac, 0xba5d5de7, 0x3219192b, 0xe6737395
476	.WORD	0xc06060a0, 0x19818198, 0x9e4f4fd1, 0xa3dcdc7f
477	.WORD	0x44222266, 0x542a2a7e, 0x3b9090ab, 0x0b888883
478	.WORD	0x8c4646ca, 0xc7eeee29, 0x6bb8b8d3, 0x2814143c
479	.WORD	0xa7dede79, 0xbc5e5ee2, 0x160b0b1d, 0xaddbdb76
480	.WORD	0xdbe0e03b, 0x64323256, 0x743a3a4e, 0x140a0a1e
481	.WORD	0x924949db, 0x0c06060a, 0x4824246c, 0xb85c5ce4
482	.WORD	0x9fc2c25d, 0xbdd3d36e, 0x43acacef, 0xc46262a6
483	.WORD	0x399191a8, 0x319595a4, 0xd3e4e437, 0xf279798b
484	.WORD	0xd5e7e732, 0x8bc8c843, 0x6e373759, 0xda6d6db7
485	.WORD	0x018d8d8c, 0xb1d5d564, 0x9c4e4ed2, 0x49a9a9e0
486	.WORD	0xd86c6cb4, 0xac5656fa, 0xf3f4f407, 0xcfeaea25
487	.WORD	0xca6565af, 0xf47a7a8e, 0x47aeaee9, 0x10080818
488	.WORD	0x6fbabad5, 0xf0787888, 0x4a25256f, 0x5c2e2e72
489	.WORD	0x381c1c24, 0x57a6a6f1, 0x73b4b4c7, 0x97c6c651
490	.WORD	0xcbe8e823, 0xa1dddd7c, 0xe874749c, 0x3e1f1f21
491	.WORD	0x964b4bdd, 0x61bdbddc, 0x0d8b8b86, 0x0f8a8a85
492	.WORD	0xe0707090, 0x7c3e3e42, 0x71b5b5c4, 0xcc6666aa
493	.WORD	0x904848d8, 0x06030305, 0xf7f6f601, 0x1c0e0e12
494	.WORD	0xc26161a3, 0x6a35355f, 0xae5757f9, 0x69b9b9d0
495	.WORD	0x17868691, 0x99c1c158, 0x3a1d1d27, 0x279e9eb9
496	.WORD	0xd9e1e138, 0xebf8f813, 0x2b9898b3, 0x22111133
497	.WORD	0xd26969bb, 0xa9d9d970, 0x078e8e89, 0x339494a7
498	.WORD	0x2d9b9bb6, 0x3c1e1e22, 0x15878792, 0xc9e9e920
499	.WORD	0x87cece49, 0xaa5555ff, 0x50282878, 0xa5dfdf7a
500	.WORD	0x038c8c8f, 0x59a1a1f8, 0x09898980, 0x1a0d0d17
501	.WORD	0x65bfbfda, 0xd7e6e631, 0x844242c6, 0xd06868b8
502	.WORD	0x824141c3, 0x299999b0, 0x5a2d2d77, 0x1e0f0f11
503	.WORD	0x7bb0b0cb, 0xa85454fc, 0x6dbbbbd6, 0x2c16163a
504	.BYTE	0x63, 0x7c, 0x77, 0x7b, 0xf2, 0x6b, 0x6f, 0xc5
505	.BYTE	0x30, 0x01, 0x67, 0x2b, 0xfe, 0xd7, 0xab, 0x76
506	.BYTE	0xca, 0x82, 0xc9, 0x7d, 0xfa, 0x59, 0x47, 0xf0
507	.BYTE	0xad, 0xd4, 0xa2, 0xaf, 0x9c, 0xa4, 0x72, 0xc0
508	.BYTE	0xb7, 0xfd, 0x93, 0x26, 0x36, 0x3f, 0xf7, 0xcc
509	.BYTE	0x34, 0xa5, 0xe5, 0xf1, 0x71, 0xd8, 0x31, 0x15
510	.BYTE	0x04, 0xc7, 0x23, 0xc3, 0x18, 0x96, 0x05, 0x9a
511	.BYTE	0x07, 0x12, 0x80, 0xe2, 0xeb, 0x27, 0xb2, 0x75
512	.BYTE	0x09, 0x83, 0x2c, 0x1a, 0x1b, 0x6e, 0x5a, 0xa0
513	.BYTE	0x52, 0x3b, 0xd6, 0xb3, 0x29, 0xe3, 0x2f, 0x84
514	.BYTE	0x53, 0xd1, 0x00, 0xed, 0x20, 0xfc, 0xb1, 0x5b
515	.BYTE	0x6a, 0xcb, 0xbe, 0x39, 0x4a, 0x4c, 0x58, 0xcf
516	.BYTE	0xd0, 0xef, 0xaa, 0xfb, 0x43, 0x4d, 0x33, 0x85
517	.BYTE	0x45, 0xf9, 0x02, 0x7f, 0x50, 0x3c, 0x9f, 0xa8
518	.BYTE	0x51, 0xa3, 0x40, 0x8f, 0x92, 0x9d, 0x38, 0xf5
519	.BYTE	0xbc, 0xb6, 0xda, 0x21, 0x10, 0xff, 0xf3, 0xd2
520	.BYTE	0xcd, 0x0c, 0x13, 0xec, 0x5f, 0x97, 0x44, 0x17
521	.BYTE	0xc4, 0xa7, 0x7e, 0x3d, 0x64, 0x5d, 0x19, 0x73
522	.BYTE	0x60, 0x81, 0x4f, 0xdc, 0x22, 0x2a, 0x90, 0x88
523	.BYTE	0x46, 0xee, 0xb8, 0x14, 0xde, 0x5e, 0x0b, 0xdb
524	.BYTE	0xe0, 0x32, 0x3a, 0x0a, 0x49, 0x06, 0x24, 0x5c
525	.BYTE	0xc2, 0xd3, 0xac, 0x62, 0x91, 0x95, 0xe4, 0x79
526	.BYTE	0xe7, 0xc8, 0x37, 0x6d, 0x8d, 0xd5, 0x4e, 0xa9
527	.BYTE	0x6c, 0x56, 0xf4, 0xea, 0x65, 0x7a, 0xae, 0x08
528	.BYTE	0xba, 0x78, 0x25, 0x2e, 0x1c, 0xa6, 0xb4, 0xc6
529	.BYTE	0xe8, 0xdd, 0x74, 0x1f, 0x4b, 0xbd, 0x8b, 0x8a
530	.BYTE	0x70, 0x3e, 0xb5, 0x66, 0x48, 0x03, 0xf6, 0x0e
531	.BYTE	0x61, 0x35, 0x57, 0xb9, 0x86, 0xc1, 0x1d, 0x9e
532	.BYTE	0xe1, 0xf8, 0x98, 0x11, 0x69, 0xd9, 0x8e, 0x94
533	.BYTE	0x9b, 0x1e, 0x87, 0xe9, 0xce, 0x55, 0x28, 0xdf
534	.BYTE	0x8c, 0xa1, 0x89, 0x0d, 0xbf, 0xe6, 0x42, 0x68
535	.BYTE	0x41, 0x99, 0x2d, 0x0f, 0xb0, 0x54, 0xbb, 0x16
536___
537
# Assembly template, second part, appended to $code.  The heredoc below
# holds, in order:
#   - AES_decrypt, the exported entry point taking $inp, $out and $key:
#     it saves %r2 and %r3-%r18, loads the input block into $s0-$s3
#     (realigning with vshd when $inp is not word aligned), calls
#     _parisc_AES_decrypt, and stores the result with stw or, when
#     $out is not word aligned, byte by byte with stb;
#   - _parisc_AES_decrypt, the internal routine that loads its loop
#     counter from offset 240 of $key and returns through %r31;
#   - L$AES_Td, 256 words followed by 256 bytes of lookup table (the
#     byte part is addressed as 1024($tbl) in the last round);
#   - a .STRINGZ identification string.
# The text is interpolated, so $-signs meant for the assembler are
# written as \$.  Backticked expressions and the pseudo-instructions
# _ror/_srm are expanded by the loop at the end of this file.
538$code.=<<___;
539	.EXPORT	AES_decrypt,ENTRY,ARGW0=GR,ARGW1=GR,ARGW2=GR
540	.ALIGN	16
541AES_decrypt
542	.PROC
543	.CALLINFO	FRAME=`$FRAME-16*$SIZE_T`,NO_CALLS,SAVE_RP,ENTRY_GR=18
544	.ENTRY
545	$PUSH	%r2,-$SAVED_RP(%sp)	; standard prologue
546	$PUSHMA	%r3,$FRAME(%sp)
547	$PUSH	%r4,`-$FRAME+1*$SIZE_T`(%sp)
548	$PUSH	%r5,`-$FRAME+2*$SIZE_T`(%sp)
549	$PUSH	%r6,`-$FRAME+3*$SIZE_T`(%sp)
550	$PUSH	%r7,`-$FRAME+4*$SIZE_T`(%sp)
551	$PUSH	%r8,`-$FRAME+5*$SIZE_T`(%sp)
552	$PUSH	%r9,`-$FRAME+6*$SIZE_T`(%sp)
553	$PUSH	%r10,`-$FRAME+7*$SIZE_T`(%sp)
554	$PUSH	%r11,`-$FRAME+8*$SIZE_T`(%sp)
555	$PUSH	%r12,`-$FRAME+9*$SIZE_T`(%sp)
556	$PUSH	%r13,`-$FRAME+10*$SIZE_T`(%sp)
557	$PUSH	%r14,`-$FRAME+11*$SIZE_T`(%sp)
558	$PUSH	%r15,`-$FRAME+12*$SIZE_T`(%sp)
559	$PUSH	%r16,`-$FRAME+13*$SIZE_T`(%sp)
560	$PUSH	%r17,`-$FRAME+14*$SIZE_T`(%sp)
561	$PUSH	%r18,`-$FRAME+15*$SIZE_T`(%sp)
562
563	blr	%r0,$tbl
564	ldi	3,$t0
565L\$dec_pic
566	andcm	$tbl,$t0,$tbl
567	ldo	L\$AES_Td-L\$dec_pic($tbl),$tbl
568
569	and	$inp,$t0,$t0
570	sub	$inp,$t0,$inp
571	ldw	0($inp),$s0
572	ldw	4($inp),$s1
573	ldw	8($inp),$s2
574	comib,=	0,$t0,L\$dec_inp_aligned
575	ldw	12($inp),$s3
576
577	sh3addl	$t0,%r0,$t0
578	subi	32,$t0,$t0
579	mtctl	$t0,%cr11
580	ldw	16($inp),$t1
581	vshd	$s0,$s1,$s0
582	vshd	$s1,$s2,$s1
583	vshd	$s2,$s3,$s2
584	vshd	$s3,$t1,$s3
585
586L\$dec_inp_aligned
587	bl	_parisc_AES_decrypt,%r31
588	nop
589
590	extru,<> $out,31,2,%r0
591	b	L\$dec_out_aligned
592	nop
593
594	_srm	$s0,24,$acc0
595	_srm	$s0,16,$acc1
596	stb	$acc0,0($out)
597	_srm	$s0,8,$acc2
598	stb	$acc1,1($out)
599	_srm	$s1,24,$acc4
600	stb	$acc2,2($out)
601	_srm	$s1,16,$acc5
602	stb	$s0,3($out)
603	_srm	$s1,8,$acc6
604	stb	$acc4,4($out)
605	_srm	$s2,24,$acc0
606	stb	$acc5,5($out)
607	_srm	$s2,16,$acc1
608	stb	$acc6,6($out)
609	_srm	$s2,8,$acc2
610	stb	$s1,7($out)
611	_srm	$s3,24,$acc4
612	stb	$acc0,8($out)
613	_srm	$s3,16,$acc5
614	stb	$acc1,9($out)
615	_srm	$s3,8,$acc6
616	stb	$acc2,10($out)
617	stb	$s2,11($out)
618	stb	$acc4,12($out)
619	stb	$acc5,13($out)
620	stb	$acc6,14($out)
621	b	L\$dec_done
622	stb	$s3,15($out)
623
624L\$dec_out_aligned
625	stw	$s0,0($out)
626	stw	$s1,4($out)
627	stw	$s2,8($out)
628	stw	$s3,12($out)
629
630L\$dec_done
631	$POP	`-$FRAME-$SAVED_RP`(%sp),%r2	; standard epilogue
632	$POP	`-$FRAME+1*$SIZE_T`(%sp),%r4
633	$POP	`-$FRAME+2*$SIZE_T`(%sp),%r5
634	$POP	`-$FRAME+3*$SIZE_T`(%sp),%r6
635	$POP	`-$FRAME+4*$SIZE_T`(%sp),%r7
636	$POP	`-$FRAME+5*$SIZE_T`(%sp),%r8
637	$POP	`-$FRAME+6*$SIZE_T`(%sp),%r9
638	$POP	`-$FRAME+7*$SIZE_T`(%sp),%r10
639	$POP	`-$FRAME+8*$SIZE_T`(%sp),%r11
640	$POP	`-$FRAME+9*$SIZE_T`(%sp),%r12
641	$POP	`-$FRAME+10*$SIZE_T`(%sp),%r13
642	$POP	`-$FRAME+11*$SIZE_T`(%sp),%r14
643	$POP	`-$FRAME+12*$SIZE_T`(%sp),%r15
644	$POP	`-$FRAME+13*$SIZE_T`(%sp),%r16
645	$POP	`-$FRAME+14*$SIZE_T`(%sp),%r17
646	$POP	`-$FRAME+15*$SIZE_T`(%sp),%r18
647	bv	(%r2)
648	.EXIT
649	$POPMB	-$FRAME(%sp),%r3
650	.PROCEND
651
652	.ALIGN	16
653_parisc_AES_decrypt
654	.PROC
655	.CALLINFO	MILLICODE
656	.ENTRY
657	ldw	240($key),$rounds
658	ldw	0($key),$t0
659	ldw	4($key),$t1
660	ldw	8($key),$t2
661	ldw	12($key),$t3
662	_srm	$rounds,1,$rounds
663	xor	$t0,$s0,$s0
664	ldw	16($key),$t0
665	xor	$t1,$s1,$s1
666	ldw	20($key),$t1
667	_srm	$s0,24,$acc0
668	xor	$t2,$s2,$s2
669	ldw	24($key),$t2
670	xor	$t3,$s3,$s3
671	ldw	28($key),$t3
672	_srm	$s3,16,$acc1
673L\$dec_loop
674	_srm	$s2,8,$acc2
675	ldwx,s	$acc0($tbl),$acc0
676	_srm	$s1,0,$acc3
677	ldwx,s	$acc1($tbl),$acc1
678	_srm	$s1,24,$acc4
679	ldwx,s	$acc2($tbl),$acc2
680	_srm	$s0,16,$acc5
681	ldwx,s	$acc3($tbl),$acc3
682	_srm	$s3,8,$acc6
683	ldwx,s	$acc4($tbl),$acc4
684	_srm	$s2,0,$acc7
685	ldwx,s	$acc5($tbl),$acc5
686	_srm	$s2,24,$acc8
687	ldwx,s	$acc6($tbl),$acc6
688	_srm	$s1,16,$acc9
689	ldwx,s	$acc7($tbl),$acc7
690	_srm	$s0,8,$acc10
691	ldwx,s	$acc8($tbl),$acc8
692	_srm	$s3,0,$acc11
693	ldwx,s	$acc9($tbl),$acc9
694	_srm	$s3,24,$acc12
695	ldwx,s	$acc10($tbl),$acc10
696	_srm	$s2,16,$acc13
697	ldwx,s	$acc11($tbl),$acc11
698	_srm	$s1,8,$acc14
699	ldwx,s	$acc12($tbl),$acc12
700	_srm	$s0,0,$acc15
701	ldwx,s	$acc13($tbl),$acc13
702	ldwx,s	$acc14($tbl),$acc14
703	ldwx,s	$acc15($tbl),$acc15
704	addib,= -1,$rounds,L\$dec_last
705	ldo	32($key),$key
706
707		_ror	$acc1,8,$acc1
708		xor	$acc0,$t0,$t0
709	ldw	0($key),$s0
710		_ror	$acc2,16,$acc2
711		xor	$acc1,$t0,$t0
712	ldw	4($key),$s1
713		_ror	$acc3,24,$acc3
714		xor	$acc2,$t0,$t0
715	ldw	8($key),$s2
716		_ror	$acc5,8,$acc5
717		xor	$acc3,$t0,$t0
718	ldw	12($key),$s3
719		_ror	$acc6,16,$acc6
720		xor	$acc4,$t1,$t1
721		_ror	$acc7,24,$acc7
722		xor	$acc5,$t1,$t1
723		_ror	$acc9,8,$acc9
724		xor	$acc6,$t1,$t1
725		_ror	$acc10,16,$acc10
726		xor	$acc7,$t1,$t1
727		_ror	$acc11,24,$acc11
728		xor	$acc8,$t2,$t2
729		_ror	$acc13,8,$acc13
730		xor	$acc9,$t2,$t2
731		_ror	$acc14,16,$acc14
732		xor	$acc10,$t2,$t2
733		_ror	$acc15,24,$acc15
734		xor	$acc11,$t2,$t2
735		xor	$acc12,$acc14,$acc14
736		xor	$acc13,$t3,$t3
737	_srm	$t0,24,$acc0
738		xor	$acc14,$t3,$t3
739		xor	$acc15,$t3,$t3
740	_srm	$t3,16,$acc1
741
742	_srm	$t2,8,$acc2
743	ldwx,s	$acc0($tbl),$acc0
744	_srm	$t1,0,$acc3
745	ldwx,s	$acc1($tbl),$acc1
746	_srm	$t1,24,$acc4
747	ldwx,s	$acc2($tbl),$acc2
748	_srm	$t0,16,$acc5
749	ldwx,s	$acc3($tbl),$acc3
750	_srm	$t3,8,$acc6
751	ldwx,s	$acc4($tbl),$acc4
752	_srm	$t2,0,$acc7
753	ldwx,s	$acc5($tbl),$acc5
754	_srm	$t2,24,$acc8
755	ldwx,s	$acc6($tbl),$acc6
756	_srm	$t1,16,$acc9
757	ldwx,s	$acc7($tbl),$acc7
758	_srm	$t0,8,$acc10
759	ldwx,s	$acc8($tbl),$acc8
760	_srm	$t3,0,$acc11
761	ldwx,s	$acc9($tbl),$acc9
762	_srm	$t3,24,$acc12
763	ldwx,s	$acc10($tbl),$acc10
764	_srm	$t2,16,$acc13
765	ldwx,s	$acc11($tbl),$acc11
766	_srm	$t1,8,$acc14
767	ldwx,s	$acc12($tbl),$acc12
768	_srm	$t0,0,$acc15
769	ldwx,s	$acc13($tbl),$acc13
770		_ror	$acc1,8,$acc1
771	ldwx,s	$acc14($tbl),$acc14
772
773		_ror	$acc2,16,$acc2
774		xor	$acc0,$s0,$s0
775	ldwx,s	$acc15($tbl),$acc15
776		_ror	$acc3,24,$acc3
777		xor	$acc1,$s0,$s0
778	ldw	16($key),$t0
779		_ror	$acc5,8,$acc5
780		xor	$acc2,$s0,$s0
781	ldw	20($key),$t1
782		_ror	$acc6,16,$acc6
783		xor	$acc3,$s0,$s0
784	ldw	24($key),$t2
785		_ror	$acc7,24,$acc7
786		xor	$acc4,$s1,$s1
787	ldw	28($key),$t3
788		_ror	$acc9,8,$acc9
789		xor	$acc5,$s1,$s1
790	ldw	1024+0($tbl),%r0		; prefetch td4
791		_ror	$acc10,16,$acc10
792		xor	$acc6,$s1,$s1
793	ldw	1024+32($tbl),%r0		; prefetch td4
794		_ror	$acc11,24,$acc11
795		xor	$acc7,$s1,$s1
796	ldw	1024+64($tbl),%r0		; prefetch td4
797		_ror	$acc13,8,$acc13
798		xor	$acc8,$s2,$s2
799	ldw	1024+96($tbl),%r0		; prefetch td4
800		_ror	$acc14,16,$acc14
801		xor	$acc9,$s2,$s2
802	ldw	1024+128($tbl),%r0		; prefetch td4
803		_ror	$acc15,24,$acc15
804		xor	$acc10,$s2,$s2
805	ldw	1024+160($tbl),%r0		; prefetch td4
806	_srm	$s0,24,$acc0
807		xor	$acc11,$s2,$s2
808	ldw	1024+192($tbl),%r0		; prefetch td4
809		xor	$acc12,$acc14,$acc14
810		xor	$acc13,$s3,$s3
811	ldw	1024+224($tbl),%r0		; prefetch td4
812		xor	$acc14,$s3,$s3
813		xor	$acc15,$s3,$s3
814	b	L\$dec_loop
815	_srm	$s3,16,$acc1
816
817	.ALIGN	16
818L\$dec_last
819	ldo	1024($tbl),$rounds
820		_ror	$acc1,8,$acc1
821		xor	$acc0,$t0,$t0
822	ldw	0($key),$s0
823		_ror	$acc2,16,$acc2
824		xor	$acc1,$t0,$t0
825	ldw	4($key),$s1
826		_ror	$acc3,24,$acc3
827		xor	$acc2,$t0,$t0
828	ldw	8($key),$s2
829		_ror	$acc5,8,$acc5
830		xor	$acc3,$t0,$t0
831	ldw	12($key),$s3
832		_ror	$acc6,16,$acc6
833		xor	$acc4,$t1,$t1
834		_ror	$acc7,24,$acc7
835		xor	$acc5,$t1,$t1
836		_ror	$acc9,8,$acc9
837		xor	$acc6,$t1,$t1
838		_ror	$acc10,16,$acc10
839		xor	$acc7,$t1,$t1
840		_ror	$acc11,24,$acc11
841		xor	$acc8,$t2,$t2
842		_ror	$acc13,8,$acc13
843		xor	$acc9,$t2,$t2
844		_ror	$acc14,16,$acc14
845		xor	$acc10,$t2,$t2
846		_ror	$acc15,24,$acc15
847		xor	$acc11,$t2,$t2
848		xor	$acc12,$acc14,$acc14
849		xor	$acc13,$t3,$t3
850	_srm	$t0,24,$acc0
851		xor	$acc14,$t3,$t3
852		xor	$acc15,$t3,$t3
853	_srm	$t3,16,$acc1
854
855	_srm	$t2,8,$acc2
856	ldbx	$acc0($rounds),$acc0
857	_srm	$t1,24,$acc4
858	ldbx	$acc1($rounds),$acc1
859	_srm	$t0,16,$acc5
860	_srm	$t1,0,$acc3
861	ldbx	$acc2($rounds),$acc2
862	ldbx	$acc3($rounds),$acc3
863	_srm	$t3,8,$acc6
864	ldbx	$acc4($rounds),$acc4
865	_srm	$t2,24,$acc8
866	ldbx	$acc5($rounds),$acc5
867	_srm	$t1,16,$acc9
868	_srm	$t2,0,$acc7
869	ldbx	$acc6($rounds),$acc6
870	ldbx	$acc7($rounds),$acc7
871	_srm	$t0,8,$acc10
872	ldbx	$acc8($rounds),$acc8
873	_srm	$t3,24,$acc12
874	ldbx	$acc9($rounds),$acc9
875	_srm	$t2,16,$acc13
876	_srm	$t3,0,$acc11
877	ldbx	$acc10($rounds),$acc10
878	_srm	$t1,8,$acc14
879	ldbx	$acc11($rounds),$acc11
880	ldbx	$acc12($rounds),$acc12
881	ldbx	$acc13($rounds),$acc13
882	_srm	$t0,0,$acc15
883	ldbx	$acc14($rounds),$acc14
884
885		dep	$acc0,7,8,$acc3
886	ldbx	$acc15($rounds),$acc15
887		dep	$acc4,7,8,$acc7
888		dep	$acc1,15,8,$acc3
889		dep	$acc5,15,8,$acc7
890		dep	$acc2,23,8,$acc3
891		dep	$acc6,23,8,$acc7
892		xor	$acc3,$s0,$s0
893		xor	$acc7,$s1,$s1
894		dep	$acc8,7,8,$acc11
895		dep	$acc12,7,8,$acc15
896		dep	$acc9,15,8,$acc11
897		dep	$acc13,15,8,$acc15
898		dep	$acc10,23,8,$acc11
899		dep	$acc14,23,8,$acc15
900		xor	$acc11,$s2,$s2
901
902	bv	(%r31)
903	.EXIT
904		xor	$acc15,$s3,$s3
905	.PROCEND
906
907	.ALIGN	64
908L\$AES_Td
909	.WORD	0x51f4a750, 0x7e416553, 0x1a17a4c3, 0x3a275e96
910	.WORD	0x3bab6bcb, 0x1f9d45f1, 0xacfa58ab, 0x4be30393
911	.WORD	0x2030fa55, 0xad766df6, 0x88cc7691, 0xf5024c25
912	.WORD	0x4fe5d7fc, 0xc52acbd7, 0x26354480, 0xb562a38f
913	.WORD	0xdeb15a49, 0x25ba1b67, 0x45ea0e98, 0x5dfec0e1
914	.WORD	0xc32f7502, 0x814cf012, 0x8d4697a3, 0x6bd3f9c6
915	.WORD	0x038f5fe7, 0x15929c95, 0xbf6d7aeb, 0x955259da
916	.WORD	0xd4be832d, 0x587421d3, 0x49e06929, 0x8ec9c844
917	.WORD	0x75c2896a, 0xf48e7978, 0x99583e6b, 0x27b971dd
918	.WORD	0xbee14fb6, 0xf088ad17, 0xc920ac66, 0x7dce3ab4
919	.WORD	0x63df4a18, 0xe51a3182, 0x97513360, 0x62537f45
920	.WORD	0xb16477e0, 0xbb6bae84, 0xfe81a01c, 0xf9082b94
921	.WORD	0x70486858, 0x8f45fd19, 0x94de6c87, 0x527bf8b7
922	.WORD	0xab73d323, 0x724b02e2, 0xe31f8f57, 0x6655ab2a
923	.WORD	0xb2eb2807, 0x2fb5c203, 0x86c57b9a, 0xd33708a5
924	.WORD	0x302887f2, 0x23bfa5b2, 0x02036aba, 0xed16825c
925	.WORD	0x8acf1c2b, 0xa779b492, 0xf307f2f0, 0x4e69e2a1
926	.WORD	0x65daf4cd, 0x0605bed5, 0xd134621f, 0xc4a6fe8a
927	.WORD	0x342e539d, 0xa2f355a0, 0x058ae132, 0xa4f6eb75
928	.WORD	0x0b83ec39, 0x4060efaa, 0x5e719f06, 0xbd6e1051
929	.WORD	0x3e218af9, 0x96dd063d, 0xdd3e05ae, 0x4de6bd46
930	.WORD	0x91548db5, 0x71c45d05, 0x0406d46f, 0x605015ff
931	.WORD	0x1998fb24, 0xd6bde997, 0x894043cc, 0x67d99e77
932	.WORD	0xb0e842bd, 0x07898b88, 0xe7195b38, 0x79c8eedb
933	.WORD	0xa17c0a47, 0x7c420fe9, 0xf8841ec9, 0x00000000
934	.WORD	0x09808683, 0x322bed48, 0x1e1170ac, 0x6c5a724e
935	.WORD	0xfd0efffb, 0x0f853856, 0x3daed51e, 0x362d3927
936	.WORD	0x0a0fd964, 0x685ca621, 0x9b5b54d1, 0x24362e3a
937	.WORD	0x0c0a67b1, 0x9357e70f, 0xb4ee96d2, 0x1b9b919e
938	.WORD	0x80c0c54f, 0x61dc20a2, 0x5a774b69, 0x1c121a16
939	.WORD	0xe293ba0a, 0xc0a02ae5, 0x3c22e043, 0x121b171d
940	.WORD	0x0e090d0b, 0xf28bc7ad, 0x2db6a8b9, 0x141ea9c8
941	.WORD	0x57f11985, 0xaf75074c, 0xee99ddbb, 0xa37f60fd
942	.WORD	0xf701269f, 0x5c72f5bc, 0x44663bc5, 0x5bfb7e34
943	.WORD	0x8b432976, 0xcb23c6dc, 0xb6edfc68, 0xb8e4f163
944	.WORD	0xd731dcca, 0x42638510, 0x13972240, 0x84c61120
945	.WORD	0x854a247d, 0xd2bb3df8, 0xaef93211, 0xc729a16d
946	.WORD	0x1d9e2f4b, 0xdcb230f3, 0x0d8652ec, 0x77c1e3d0
947	.WORD	0x2bb3166c, 0xa970b999, 0x119448fa, 0x47e96422
948	.WORD	0xa8fc8cc4, 0xa0f03f1a, 0x567d2cd8, 0x223390ef
949	.WORD	0x87494ec7, 0xd938d1c1, 0x8ccaa2fe, 0x98d40b36
950	.WORD	0xa6f581cf, 0xa57ade28, 0xdab78e26, 0x3fadbfa4
951	.WORD	0x2c3a9de4, 0x5078920d, 0x6a5fcc9b, 0x547e4662
952	.WORD	0xf68d13c2, 0x90d8b8e8, 0x2e39f75e, 0x82c3aff5
953	.WORD	0x9f5d80be, 0x69d0937c, 0x6fd52da9, 0xcf2512b3
954	.WORD	0xc8ac993b, 0x10187da7, 0xe89c636e, 0xdb3bbb7b
955	.WORD	0xcd267809, 0x6e5918f4, 0xec9ab701, 0x834f9aa8
956	.WORD	0xe6956e65, 0xaaffe67e, 0x21bccf08, 0xef15e8e6
957	.WORD	0xbae79bd9, 0x4a6f36ce, 0xea9f09d4, 0x29b07cd6
958	.WORD	0x31a4b2af, 0x2a3f2331, 0xc6a59430, 0x35a266c0
959	.WORD	0x744ebc37, 0xfc82caa6, 0xe090d0b0, 0x33a7d815
960	.WORD	0xf104984a, 0x41ecdaf7, 0x7fcd500e, 0x1791f62f
961	.WORD	0x764dd68d, 0x43efb04d, 0xccaa4d54, 0xe49604df
962	.WORD	0x9ed1b5e3, 0x4c6a881b, 0xc12c1fb8, 0x4665517f
963	.WORD	0x9d5eea04, 0x018c355d, 0xfa877473, 0xfb0b412e
964	.WORD	0xb3671d5a, 0x92dbd252, 0xe9105633, 0x6dd64713
965	.WORD	0x9ad7618c, 0x37a10c7a, 0x59f8148e, 0xeb133c89
966	.WORD	0xcea927ee, 0xb761c935, 0xe11ce5ed, 0x7a47b13c
967	.WORD	0x9cd2df59, 0x55f2733f, 0x1814ce79, 0x73c737bf
968	.WORD	0x53f7cdea, 0x5ffdaa5b, 0xdf3d6f14, 0x7844db86
969	.WORD	0xcaaff381, 0xb968c43e, 0x3824342c, 0xc2a3405f
970	.WORD	0x161dc372, 0xbce2250c, 0x283c498b, 0xff0d9541
971	.WORD	0x39a80171, 0x080cb3de, 0xd8b4e49c, 0x6456c190
972	.WORD	0x7bcb8461, 0xd532b670, 0x486c5c74, 0xd0b85742
973	.BYTE	0x52, 0x09, 0x6a, 0xd5, 0x30, 0x36, 0xa5, 0x38
974	.BYTE	0xbf, 0x40, 0xa3, 0x9e, 0x81, 0xf3, 0xd7, 0xfb
975	.BYTE	0x7c, 0xe3, 0x39, 0x82, 0x9b, 0x2f, 0xff, 0x87
976	.BYTE	0x34, 0x8e, 0x43, 0x44, 0xc4, 0xde, 0xe9, 0xcb
977	.BYTE	0x54, 0x7b, 0x94, 0x32, 0xa6, 0xc2, 0x23, 0x3d
978	.BYTE	0xee, 0x4c, 0x95, 0x0b, 0x42, 0xfa, 0xc3, 0x4e
979	.BYTE	0x08, 0x2e, 0xa1, 0x66, 0x28, 0xd9, 0x24, 0xb2
980	.BYTE	0x76, 0x5b, 0xa2, 0x49, 0x6d, 0x8b, 0xd1, 0x25
981	.BYTE	0x72, 0xf8, 0xf6, 0x64, 0x86, 0x68, 0x98, 0x16
982	.BYTE	0xd4, 0xa4, 0x5c, 0xcc, 0x5d, 0x65, 0xb6, 0x92
983	.BYTE	0x6c, 0x70, 0x48, 0x50, 0xfd, 0xed, 0xb9, 0xda
984	.BYTE	0x5e, 0x15, 0x46, 0x57, 0xa7, 0x8d, 0x9d, 0x84
985	.BYTE	0x90, 0xd8, 0xab, 0x00, 0x8c, 0xbc, 0xd3, 0x0a
986	.BYTE	0xf7, 0xe4, 0x58, 0x05, 0xb8, 0xb3, 0x45, 0x06
987	.BYTE	0xd0, 0x2c, 0x1e, 0x8f, 0xca, 0x3f, 0x0f, 0x02
988	.BYTE	0xc1, 0xaf, 0xbd, 0x03, 0x01, 0x13, 0x8a, 0x6b
989	.BYTE	0x3a, 0x91, 0x11, 0x41, 0x4f, 0x67, 0xdc, 0xea
990	.BYTE	0x97, 0xf2, 0xcf, 0xce, 0xf0, 0xb4, 0xe6, 0x73
991	.BYTE	0x96, 0xac, 0x74, 0x22, 0xe7, 0xad, 0x35, 0x85
992	.BYTE	0xe2, 0xf9, 0x37, 0xe8, 0x1c, 0x75, 0xdf, 0x6e
993	.BYTE	0x47, 0xf1, 0x1a, 0x71, 0x1d, 0x29, 0xc5, 0x89
994	.BYTE	0x6f, 0xb7, 0x62, 0x0e, 0xaa, 0x18, 0xbe, 0x1b
995	.BYTE	0xfc, 0x56, 0x3e, 0x4b, 0xc6, 0xd2, 0x79, 0x20
996	.BYTE	0x9a, 0xdb, 0xc0, 0xfe, 0x78, 0xcd, 0x5a, 0xf4
997	.BYTE	0x1f, 0xdd, 0xa8, 0x33, 0x88, 0x07, 0xc7, 0x31
998	.BYTE	0xb1, 0x12, 0x10, 0x59, 0x27, 0x80, 0xec, 0x5f
999	.BYTE	0x60, 0x51, 0x7f, 0xa9, 0x19, 0xb5, 0x4a, 0x0d
1000	.BYTE	0x2d, 0xe5, 0x7a, 0x9f, 0x93, 0xc9, 0x9c, 0xef
1001	.BYTE	0xa0, 0xe0, 0x3b, 0x4d, 0xae, 0x2a, 0xf5, 0xb0
1002	.BYTE	0xc8, 0xeb, 0xbb, 0x3c, 0x83, 0x53, 0x99, 0x61
1003	.BYTE	0x17, 0x2b, 0x04, 0x7e, 0xba, 0x77, 0xd6, 0x26
1004	.BYTE	0xe1, 0x69, 0x14, 0x63, 0x55, 0x21, 0x0c, 0x7d
1005	.STRINGZ "AES for PA-RISC, CRYPTOGAMS by <appro\@openssl.org>"
1006___
1007
# Post-process the accumulated assembly template line by line and write
# the result to STDOUT.
foreach (split("\n",$code)) {
	# Replace every `expr` span with the value of the Perl expression
	# between the backticks (used for offsets built from $FRAME,
	# $SIZE_T and $SAVED_RP).
	s/\`([^\`]*)\`/eval $1/ge;

	# Translate made-up instructions: _ror, _srm.
	#   _ror r,n,...  becomes  shd r,r,n,...
	#   _srm r,n,...  becomes  extru   r,31-n,8,...  when $SIZE_T==4
	#                          extrd,u r,63-n,8,...  otherwise
	# The _srm substitution is attempted only when _ror did not match.
	s/_ror(\s+)(%r[0-9]+),/shd$1$2,$2,/				or

	s/_srm(\s+%r[0-9]+),([0-9]+),/
		$SIZE_T==4 ? sprintf("extru%s,%d,8,",$1,31-$2)
		:            sprintf("extrd,u%s,%d,8,",$1,63-$2)/e;

	# With 4-byte $SIZE_T, drop a "*" that directly follows a comma.
	s/,\*/,/ if ($SIZE_T==4);
	print $_,"\n";
}

# Output is buffered, so a write failure (full disk, I/O error) may only
# be reported by close.  Abort rather than leave a truncated file behind
# with a successful exit status.
close STDOUT or die "error closing STDOUT: $!";
1022