xref: /openssl/crypto/md5/asm/md5-586.pl (revision 572e6df7)
1#! /usr/bin/env perl
2# Copyright 1995-2020 The OpenSSL Project Authors. All Rights Reserved.
3#
4# Licensed under the Apache License 2.0 (the "License").  You may not use
5# this file except in compliance with the License.  You can obtain a copy
6# in the file LICENSE in the source distribution or at
7# https://www.openssl.org/source/license.html
8
9
10# Normal is the
11# md5_block_x86(MD5_CTX *c, ULONG *X);
12# version, non-normal is the
13# md5_block_x86(MD5_CTX *c, ULONG *X,int blocks);
14
# When zero, the generated routine loops over its input: the "start" label,
# the advance of the data pointer by 64 and the closing compare/branch are
# emitted.  Any true value suppresses those instructions.
$normal=0;

# Find the directory this script lives in so the perlasm support code can be
# loaded.  When $0 carries no directory component $dir is explicitly empty
# instead of depending on whatever $1 happened to hold.
$dir = ($0 =~ m/(.*[\/\\])[^\/\\]+$/) ? $1 : "";
push(@INC,"${dir}","${dir}../../perlasm");
require "x86asm.pl";

# $output is the last argument if it looks like a file (it has an extension)
$output = $#ARGV >= 0 && $ARGV[$#ARGV] =~ m|\.\w+$| ? pop : undef;

# Send the generated assembly to the requested file.  The three-argument form
# keeps the file name from being parsed as part of the open mode, and a failed
# open aborts instead of silently writing to the original STDOUT.
if ($output)
	{
	open(STDOUT,">",$output) or die "can't open $output: $!";
	}

&asm_init($ARGV[0]);

# Register assignment: the four MD5 state words, two scratch registers and
# the pointer to the 16 message words of the current block.
$A="eax";
$B="ebx";
$C="ecx";
$D="edx";
$tmp1="edi";
$tmp2="ebp";
$X="esi";

# What we need to load into $tmp for the next round
# NOTE(review): %Ltmp1 is not referenced anywhere else in the visible file.
%Ltmp1=("R0",&Np($C), "R1",&Np($C), "R2",&Np($C), "R3",&Np($D));

# Index of the message word consumed by each of the 64 steps, one row of 16
# entries per round.
@xo=(
 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15,	# R0
 1, 6, 11, 0, 5, 10, 15, 4, 9, 14, 3, 8, 13, 2, 7, 12,	# R1
 5, 8, 11, 14, 1, 4, 7, 10, 13, 0, 3, 6, 9, 12, 15, 2,	# R2
 0, 7, 14, 5, 12, 3, 10, 1, 8, 15, 6, 13, 4, 11, 2, 9,	# R3
 );

&md5_block("ossl_md5_block_asm_data_order");
&asm_finish();

# Buffered write errors only surface at close time, so check it.
close STDOUT or die "error closing STDOUT: $!";
49
# Np(REG): given one of the four state registers, return the register that
# takes over its role in the next step, where the (a,b,c,d) roles rotate
# from (A,B,C,D) to (D,A,B,C).  Any other argument yields undef.
sub Np
	{
	my ($reg)=@_;

	my %successor=(
		$A => $D,
		$B => $A,
		$C => $B,
		$D => $C,
		);

	return($successor{$reg});
	}
56
# R0: emit one step of the first MD5 round, which uses
#	F(b,c,d) = d ^ (b & (c ^ d)).
#
# Arguments, in order:
#	pos	 <0 for the very first step (scratch registers are primed here),
#		 2 suppresses the preload of the next message word; any value
#		 up to and including 1 reloads $tmp1 for the following step
#	a,b,c,d	 registers playing the four roles in this step
#	K	 register pointing at the message words
#	ki	 step number, used to index @xo
#	s	 left-rotate amount
#	t	 additive constant for the step
#
# On entry $tmp1 holds register c and $tmp2 the current message word; both
# are refreshed for the next step before returning.
sub R0
	{
	my ($pos,$ra,$rb,$rc,$rd,$base,$step,$rot,$const)=@_;

	if ($pos < 0)
		{
		# very first step: nothing has primed the scratch registers yet
		&mov($tmp1,$C);
		&mov($tmp2,&DWP($xo[$step]*4,$base,"",0));
		}

	&comment("R0 $step");

	&xor($tmp1,$rd);				# c ^ d
	&and($tmp1,$rb);				# b & (c ^ d)
	&lea($ra,&DWP($const,$ra,$tmp2,1));		# a += X[k] + t
	&xor($tmp1,$rd);				# F(b,c,d)

	# fetch the message word of the following step
	&mov($tmp2,&DWP($xo[$step+1]*4,$base,"",0)) unless $pos == 2;

	&add($ra,$tmp1);
	&rotl($ra,$rot);

	# the next step's c register goes into $tmp1
	&mov($tmp1,&Np($rc)) if $pos <= 1;

	&add($ra,$rb);
	}
84
# R1: emit one step of the second MD5 round, which uses
#	G(b,c,d) = c ^ (d & (b ^ c)).
#
# Arguments, in order: pos, the registers for roles a,b,c,d, the register
# pointing at the message words, the step number (index into @xo), the
# left-rotate amount and the additive constant.  A pos of 2 suppresses the
# preload of the next message word; any pos up to and including 1 reloads
# $tmp1 for the following step.
#
# On entry $tmp1 holds register c and $tmp2 the current message word.
sub R1
	{
	my ($pos,$ra,$rb,$rc,$rd,$base,$step,$rot,$const)=@_;

	&comment("R1 $step");

	&xor($tmp1,$rb);				# b ^ c
	&and($tmp1,$rd);				# d & (b ^ c)
	&lea($ra,&DWP($const,$ra,$tmp2,1));		# a += X[k] + t
	&xor($tmp1,$rc);				# G(b,c,d)

	# fetch the message word of the following step
	&mov($tmp2,&DWP($xo[$step+1]*4,$base,"",0)) unless $pos == 2;

	&add($ra,$tmp1);

	# the next step's c register goes into $tmp1
	&mov($tmp1,&Np($rc)) if $pos <= 1;

	&rotl($ra,$rot);
	&add($ra,$rb);
	}
106
# R2: emit one step of the third MD5 round, which uses
#	H(b,c,d) = b ^ c ^ d
# and therefore needs only two logical operations on $tmp1.
#
# Arguments, in order: n (position of the step inside the round; only its
# parity matters), pos, the registers for roles a,b,c,d, the register pointing
# at the message words, the step number (index into @xo), the left-rotate
# amount and the additive constant.
#
# Steps come in pairs.  An even step stops after the rotate and leaves out
# its final "a += b"; the odd step that follows performs that add first (its
# b,c are the even step's a,b) and then runs a complete step of its own.
# In an odd step a pos of 1 loads -1 into $tmp1 for the round that follows,
# and a pos of 2 suppresses the preload of the next message word.
sub R2
	{
	my ($n,$pos,$ra,$rb,$rc,$rd,$base,$step,$rot,$const)=@_;
	my $odd_step=$n & 1;

	&comment("R2 $step");

	# In both variants d is folded in before b, so that the xor does not
	# collide with the add that produces b.
	if (!$odd_step)
		{
		&xor($tmp1,$rd);				# c ^ d
		&xor($tmp1,$rb);				# H(b,c,d)
		&lea($ra,&DWP($const,$ra,$tmp2,1));		# a += X[k] + t

		&add($ra,$tmp1);
		&mov($tmp2,&DWP($xo[$step+1]*4,$base,"",0));	# next message word

		&rotl($ra,$rot);

		# next step's c register; the closing add is left to that step
		&mov($tmp1,&Np($rc));
		}
	else
		{
		&add($rb,$rc);					# add deferred by the even step
		&xor($tmp1,$rd);				# c ^ d
		&lea($ra,&DWP($const,$ra,$tmp2,1));		# a += X[k] + t
		&xor($tmp1,$rb);				# H(b,c,d)

		# fetch the message word of the following step
		&mov($tmp2,&DWP($xo[$step+1]*4,$base,"",0)) unless $pos == 2;

		&add($ra,$tmp1);

		if ($pos < 1)
			{
			&mov($tmp1,&Np($rc));			# next step's c register
			}
		elsif ($pos == 1)
			{
			&mov($tmp1,-1);				# all ones for the next round
			}

		&rotl($ra,$rot);
		&add($ra,$rb);
		}
	}
153
# R3: emit one step of the fourth MD5 round, which uses
#	I(b,c,d) = c ^ (b | ~d).
#
# Arguments, in order: pos, the registers for roles a,b,c,d, the register
# pointing at the message words, the step number (index into @xo), the
# left-rotate amount and the additive constant.
#
# $tmp1 is expected to hold ~d when the "or" executes.  For the first step
# (pos < 0) it arrives as -1 and is xor-ed with d here; every step with
# pos <= 0 prepares the value for its successor.  The final step (pos == 2)
# instead loads the first function argument into $tmp2, reads the word at
# offset 0 from it into $tmp1 and, unless $normal is set, moves the
# message pointer on by 64.
sub R3
	{
	my ($pos,$ra,$rb,$rc,$rd,$base,$step,$rot,$const)=@_;

	&comment("R3 $step");

	&xor($tmp1,$rd) if $pos < 0;			# -1 ^ d == ~d

	&or($tmp1,$rb);					# b | ~d
	&lea($ra,&DWP($const,$ra,$tmp2,1));		# a += X[k] + t
	&xor($tmp1,$rc);				# I(b,c,d)

	if ($pos != 2)
		{
		# fetch the message word of the following step
		&mov($tmp2,&DWP($xo[$step+1]*4,$base,"",0));
		}
	else
		{
		# last step: $tmp2 is free, use it for the first argument
		&mov($tmp2,&wparam(0));
		}

	&add($ra,$tmp1);

	if ($pos < 1)
		{
		&mov($tmp1,-1);				# all ones, turned into ~d below
		}
	elsif (!$normal)
		{
		&add($base,64);				# move on to the next block
		}

	&rotl($ra,$rot);

	if ($pos <= 0)
		{
		&xor($tmp1,&Np($rd));			# ~d for the following step
		}
	else
		{
		&mov($tmp1,&DWP( 0,$tmp2,"",0));	# word at offset 0 of the argument
		}

	&add($ra,$rb);
	}
180
181
# md5_block(NAME): emit the complete x86 routine NAME.
#
# The emitted code reads three arguments: a pointer to the four 32-bit state
# words A,B,C,D (at offsets 0,4,8,12), a pointer to the input data and a
# count that is multiplied by 64.  It runs the 64 MD5 steps on each 64-byte
# block, adds the result into the state and, unless $normal is set, loops
# until the data pointer has passed the last block.
sub md5_block
	{
	my ($name)=@_;

	&function_begin_B($name,"",3);

	# Prologue.  Register saves are interleaved with the argument loads;
	# the order is kept exactly as is because the argument accessors are
	# presumably sensitive to the current stack depth.
	&push("esi");
	&push("edi");
	&mov($tmp1,&wparam(0));			# edi = state pointer
	&mov($X,&wparam(1));			# esi = input data
	&mov($C,&wparam(2));
	&push("ebp");
	&shl($C,6);				# count * 64
	&push("ebx");
	&add($C,$X);				# offset we end at
	&sub($C,64);				# ... minus one block
	&mov($A,&DWP( 0,$tmp1,"",0));
	&push($C);				# keep it on top of the stack
	&mov($B,&DWP( 4,$tmp1,"",0));
	&mov($C,&DWP( 8,$tmp1,"",0));
	&mov($D,&DWP(12,$tmp1,"",0));

	&set_label("start") unless $normal;

	# The (a,b,c,d) roles rotate through these four orderings, one per step.
	my @roles=(
		[$A,$B,$C,$D],
		[$D,$A,$B,$C],
		[$C,$D,$A,$B],
		[$B,$C,$D,$A],
		);

	# One entry per round: the emitter, the pos value handed to the first
	# and to the last step (every step in between gets 0), the four rotate
	# amounts and the sixteen additive constants.  An "indexed" emitter
	# also receives the step's position within the round as first argument.
	my @rounds=(
		{
		tag	=> "R0",
		emit	=> \&R0,
		head	=> -2,
		tail	=> 1,
		indexed	=> 0,
		shifts	=> [ 7,12,17,22],
		consts	=> [
			0xd76aa478,0xe8c7b756,0x242070db,0xc1bdceee,
			0xf57c0faf,0x4787c62a,0xa8304613,0xfd469501,
			0x698098d8,0x8b44f7af,0xffff5bb1,0x895cd7be,
			0x6b901122,0xfd987193,0xa679438e,0x49b40821,
			],
		},
		{
		tag	=> "R1",
		emit	=> \&R1,
		head	=> -1,
		tail	=> 1,
		indexed	=> 0,
		shifts	=> [ 5, 9,14,20],
		consts	=> [
			0xf61e2562,0xc040b340,0x265e5a51,0xe9b6c7aa,
			0xd62f105d,0x02441453,0xd8a1e681,0xe7d3fbc8,
			0x21e1cde6,0xc33707d6,0xf4d50d87,0x455a14ed,
			0xa9e3e905,0xfcefa3f8,0x676f02d9,0x8d2a4c8a,
			],
		},
		{
		tag	=> "R2",
		emit	=> \&R2,
		head	=> -1,
		tail	=> 1,
		indexed	=> 1,
		shifts	=> [ 4,11,16,23],
		consts	=> [
			0xfffa3942,0x8771f681,0x6d9d6122,0xfde5380c,
			0xa4beea44,0x4bdecfa9,0xf6bb4b60,0xbebfbc70,
			0x289b7ec6,0xeaa127fa,0xd4ef3085,0x04881d05,
			0xd9d4d039,0xe6db99e5,0x1fa27cf8,0xc4ac5665,
			],
		},
		{
		tag	=> "R3",
		emit	=> \&R3,
		head	=> -1,
		tail	=> 2,
		indexed	=> 0,
		shifts	=> [ 6,10,15,21],
		consts	=> [
			0xf4292244,0x432aff97,0xab9423a7,0xfc93a039,
			0x655b59c3,0x8f0ccc92,0xffeff47d,0x85845dd1,
			0x6fa87e4f,0xfe2ce6e0,0xa3014314,0x4e0811a1,
			0xf7537e82,0xbd3af235,0x2ad7d2bb,0xeb86d391,
			],
		},
		);

	my $ki=0;				# running step number, 0..63
	foreach my $round (@rounds)
		{
		&comment("");
		&comment("$round->{tag} section");

		foreach my $i (0..15)
			{
			my $pos=0;
			$pos=$round->{head} if $i == 0;
			$pos=$round->{tail} if $i == 15;

			my @args=(
				$pos,
				@{$roles[$i % 4]},
				$X,
				$ki,
				$round->{shifts}[$i % 4],
				$round->{consts}[$i],
				);
			unshift(@args,$i) if $round->{indexed};

			$round->{emit}->(@args);
			$ki++;
			}
		}

	# The last R3 step has already put the state pointer into $tmp2 and the
	# old A into $tmp1.  Add the old state into the working registers ...
	my @state=($A,$B,$C,$D);
	foreach my $i (0..3)
		{
		&add($state[$i],$tmp1);
		&mov($tmp1,&DWP(4*($i+1),$tmp2,"",0)) if $i < 3;
		}

	# ... and write the sums back.
	&mov(&DWP( 0,$tmp2,"",0),$A);
	&mov(&DWP( 4,$tmp2,"",0),$B);
	# presumably the end offset pushed in the prologue - TODO confirm swtmp
	&mov($tmp1,&swtmp(0)) if !$normal;
	&mov(&DWP( 8,$tmp2,"",0),$C);
	&mov(&DWP(12,$tmp2,"",0),$D);

	if (!$normal)
		{
		&cmp($tmp1,$X);			# check count
		&jae(&label("start"));
		}

	# Epilogue: the first pop discards the temporary pushed in the prologue,
	# the rest restore the saved registers.
	foreach my $reg ("eax","ebx","ebp","edi","esi")
		{
		&pop($reg);
		}
	&ret();
	&function_end_B($name);
	}
320
321