#! /usr/bin/env perl
# Copyright 1995-2020 The OpenSSL Project Authors. All Rights Reserved.
#
# Licensed under the Apache License 2.0 (the "License"). You may not use
# this file except in compliance with the License. You can obtain a copy
# in the file LICENSE in the source distribution or at
# https://www.openssl.org/source/license.html


# Normal is the
# md5_block_x86(MD5_CTX *c, ULONG *X);
# version, non-normal is the
# md5_block_x86(MD5_CTX *c, ULONG *X,int blocks);

# Selects the generated variant.  The subs below emit the per-call block
# loop (the "start" label, the data-pointer advance and the end-of-data
# compare) only when this is false.
$normal=0;

# Make x86asm.pl loadable from this script's own directory or from
# ../../perlasm relative to it.  $dir falls back to "" when $0 carries no
# directory part, rather than depending on whatever $1 happens to hold
# after a failed match.
$dir = ($0 =~ m/(.*[\/\\])[^\/\\]+$/) ? $1 : "";
push(@INC,"${dir}","${dir}../../perlasm");
require "x86asm.pl";

# $output is the last argument if it looks like a file (it has an extension)
$output = (@ARGV && $ARGV[-1] =~ m|\.\w+$|) ? pop(@ARGV) : undef;

# Send the generated code to the requested file.  The three-argument form
# keeps the file name from being interpreted as part of the open mode, and
# a failure to open is fatal instead of being silently ignored.
if ($output) {
    open(STDOUT, ">", $output) or die "can't open $output: $!";
}

&asm_init($ARGV[0]);

# Register assignment: the four MD5 working variables, two scratch
# registers, and the register used as base address for the message words.
$A="eax";
$B="ebx";
$C="ecx";
$D="edx";
$tmp1="edi";
$tmp2="ebp";
$X="esi";

# What we need to load into $tmp for the next round
%Ltmp1=("R0",&Np($C), "R1",&Np($C), "R2",&Np($C), "R3",&Np($D));

# Message-word index used by each of the 64 steps, 16 per round.
@xo=(
     0,  1,  2,  3,  4,  5,  6,  7,  8,  9, 10, 11, 12, 13, 14, 15,  # R0
     1,  6, 11,  0,  5, 10, 15,  4,  9, 14,  3,  8, 13,  2,  7, 12,  # R1
     5,  8, 11, 14,  1,  4,  7, 10, 13,  0,  3,  6,  9, 12, 15,  2,  # R2
     0,  7, 14,  5, 12,  3, 10,  1,  8, 15,  6, 13,  4, 11,  2,  9,  # R3
    );

&md5_block("ossl_md5_block_asm_data_order");
&asm_finish();

# Buffered write errors only surface here, so the close is checked.
close STDOUT or die "error closing STDOUT: $!";

# Np(reg) - return the working register that precedes `reg` in the
# A, B, C, D cycle: $A maps to $D, $B to $A, $C to $B and $D to $C.
# An argument that is none of the four yields undef.
sub Np {
    my ($reg) = @_;

    # Each key is paired with its predecessor in the cycle.
    my %prev;
    @prev{ $A, $B, $C, $D } = ( $D, $A, $B, $C );

    return $prev{$reg};
}

# R0 - emit the instructions for one step of the first round.
#
# Arguments, in order:
#   $pos              position flag.  Negative marks the very first step,
#                     which primes $tmp1 and $tmp2 itself; 2 suppresses the
#                     prefetch of the next message word; any value up to 1
#                     reloads $tmp1 for the step that follows.
#   $ra,$rb,$rc,$rd   register names filling the a, b, c, d roles.
#   $K                register used as base address of the message words.
#   $ki               step number; indexes @xo.
#   $s                rotate count.
#   $t                additive constant of the step.
#
# On entry $tmp1 is expected to hold c and $tmp2 the message word for this
# step; with that, the xor/and/xor sequence leaves ((c ^ d) & b) ^ d in
# $tmp1.
#
# The '&' sigil on the emitter calls is required: several of the names
# (and, xor, ...) are Perl operators or built-ins.
sub R0 {
    my ($pos, $ra, $rb, $rc, $rd, $K, $ki, $s, $t) = @_;

    if ($pos < 0) {
        # very first one: nothing has loaded the temporaries yet
        &mov($tmp1, $C);
        &mov($tmp2, &DWP($xo[$ki] * 4, $K, "", 0));
    }

    # body proper
    &comment("R0 $ki");

    &xor($tmp1, $rd);                           # F function - part 2
    &and($tmp1, $rb);                           # F function - part 3
    &lea($ra, &DWP($t, $ra, $tmp2, 1));         # fold in constant and word
    &xor($tmp1, $rd);                           # F function - part 4

    if ($pos != 2) {
        # fetch the message word for the following step early
        &mov($tmp2, &DWP($xo[$ki + 1] * 4, $K, "", 0));
    }

    &add($ra, $tmp1);
    &rotl($ra, $s);

    if ($pos <= 1) {
        # next tmp1, whether the following step is in R0 or opens R1
        &mov($tmp1, &Np($rc));
    }

    &add($ra, $rb);
}

# R1 - emit the instructions for one step of the second round.
#
# Arguments, in order:
#   $pos              position flag: 2 suppresses the prefetch of the next
#                     message word; any value up to 1 reloads $tmp1 for the
#                     step that follows.
#   $ra,$rb,$rc,$rd   register names filling the a, b, c, d roles.
#   $K                register used as base address of the message words.
#   $ki               step number; indexes @xo.
#   $s                rotate count.
#   $t                additive constant of the step.
#
# On entry $tmp1 is expected to hold c and $tmp2 the message word for this
# step; the xor/and/xor sequence then leaves ((c ^ b) & d) ^ c in $tmp1.
#
# The '&' sigil on the emitter calls is required: several of the names
# (and, xor, ...) are Perl operators or built-ins.
sub R1 {
    my ($pos, $ra, $rb, $rc, $rd, $K, $ki, $s, $t) = @_;

    &comment("R1 $ki");

    &xor($tmp1, $rb);                           # G function - part 2
    &and($tmp1, $rd);                           # G function - part 3
    &lea($ra, &DWP($t, $ra, $tmp2, 1));         # fold in constant and word
    &xor($tmp1, $rc);                           # G function - part 4

    if ($pos != 2) {
        # fetch the message word for the following step early
        &mov($tmp2, &DWP($xo[$ki + 1] * 4, $K, "", 0));
    }

    &add($ra, $tmp1);

    if ($pos <= 1) {
        # part 1 of the function used by the following step
        &mov($tmp1, &Np($rc));
    }

    &rotl($ra, $s);
    &add($ra, $rb);
}

# R2 - emit the instructions for one step of the third round.
#
# This one is different, only 3 logical operations: with c already in
# $tmp1, two xors leave b ^ c ^ d there.
#
# Arguments, in order:
#   $n                step counter within the round; only its parity is
#                     used.  Even steps leave out their closing add, and the
#                     odd step that follows emits it first.
#   $pos              position flag, consulted by odd steps only: 2
#                     suppresses the prefetch of the next message word,
#                     values below 1 reload $tmp1 with the next c, and 1
#                     loads -1 for the round that follows.
#   $ra,$rb,$rc,$rd   register names filling the a, b, c, d roles.
#   $K                register used as base address of the message words.
#   $ki               step number; indexes @xo.
#   $s                rotate count.
#   $t                additive constant of the step.
#
# The '&' sigil on the emitter calls is required: several of the names
# (xor, ...) are Perl operators or built-ins.
sub R2 {
    my ($n, $pos, $ra, $rb, $rc, $rd, $K, $ki, $s, $t) = @_;

    &comment("R2 $ki");

    # In both variants make sure to do 'D' first, not 'B', else we clash
    # with the last add from the previous round.

    if ($n & 1) {
        # Odd step.  $rb/$rc here are the a/b registers of the preceding
        # even step, so this is that step's closing add, MOVED FORWARD.
        &add($rb, $rc);
        &xor($tmp1, $rd);                       # H function - part 2

        &lea($ra, &DWP($t, $ra, $tmp2, 1));     # fold in constant and word

        &xor($tmp1, $rb);                       # H function - part 3
        if ($pos != 2) {
            &mov($tmp2, &DWP($xo[$ki + 1] * 4, $K, "", 0));
        }

        &add($ra, $tmp1);
        if ($pos < 1) {
            &mov($tmp1, &Np($rc));              # H function - part 1
        }
        elsif ($pos == 1) {
            &mov($tmp1, -1);                    # I function - part 1
        }

        &rotl($ra, $s);
        &add($ra, $rb);
    }
    else {
        # Even step.  The closing add of $rb into $ra is not emitted here.
        &xor($tmp1, $rd);                       # H function - part 2
        &xor($tmp1, $rb);                       # H function - part 3
        &lea($ra, &DWP($t, $ra, $tmp2, 1));     # fold in constant and word

        &add($ra, $tmp1);
        &mov($tmp2, &DWP($xo[$ki + 1] * 4, $K, "", 0));

        &rotl($ra, $s);

        &mov($tmp1, &Np($rc));                  # next tmp1
    }
}

# R3 - emit the instructions for one step of the fourth round.
#
# No separate &not($tmp1) is emitted: $tmp1 is loaded with -1 and xor-ed
# with d, which leaves the complement of d.  The or/xor that follow turn
# that into (b | ~d) ^ c.
#
# Arguments, in order:
#   $pos              position flag.  Negative marks the first step of the
#                     round, where $tmp1 still holds -1 and the xor with d
#                     is done here.  2 marks the last step: instead of
#                     prefetching a message word, $tmp2 is loaded from
#                     &wparam(0) and $tmp1 from offset 0 of that address.
#   $ra,$rb,$rc,$rd   register names filling the a, b, c, d roles.
#   $K                register used as base address of the message words;
#                     advanced by 64 when $pos >= 1 and $normal is false.
#   $ki               step number; indexes @xo.
#   $s                rotate count.
#   $t                additive constant of the step.
#
# The '&' sigil on the emitter calls is required: several of the names
# (or, xor, ...) are Perl operators or built-ins.
sub R3 {
    my ($pos, $ra, $rb, $rc, $rd, $K, $ki, $s, $t) = @_;

    &comment("R3 $ki");

    if ($pos < 0) {
        &xor($tmp1, $rd);                       # I function - part 2
    }

    &or($tmp1, $rb);                            # I function - part 3
    &lea($ra, &DWP($t, $ra, $tmp2, 1));         # fold in constant and word

    &xor($tmp1, $rc);                           # I function - part 4
    if ($pos != 2) {
        &mov($tmp2, &DWP($xo[$ki + 1] * 4, $K, "", 0));    # load X/k value
    }
    else {
        &mov($tmp2, &wparam(0));
    }

    &add($ra, $tmp1);
    if ($pos < 1) {
        &mov($tmp1, -1);                        # part 1 for the next step
    }
    elsif (!$normal) {
        &add($K, 64);                           # step past this block
    }

    &rotl($ra, $s);

    if ($pos <= 0) {
        # part 2 for the next step, done ahead of time
        &xor($tmp1, &Np($rd));
    }
    else {
        &mov($tmp1, &DWP(0, $tmp2, "", 0));
    }
    &add($ra, $rb);
}

# md5_block - emit the whole routine, under the symbol $name.
#
# The generated code takes three word parameters:
#   0  pointer to the MD5_CTX structure (A at offset 0, B at 4, C at 8,
#      D at 12),
#   1  pointer to the input data, kept in $X,
#   2  count, shifted left by 6 (i.e. multiplied by 64) to form a byte
#      length.
# The address "data + 64*count - 64" is pushed as a stack temporary.  Unless
# $normal is set, that temporary is re-read through &swtmp(0) after each
# block and the code jumps back to "start" while it is not below $X.
#
# The 64 steps are driven from tables; every emitter receives exactly the
# arguments it would get from 64 spelled-out calls, in the same order.
#
# The '&' sigil on the emitter calls is required: push, pop, sub, cmp and
# others are Perl built-ins.
sub md5_block {
    my ($name) = @_;

    # Additive constants, one row per round, in step order.
    my @consts = (
        [ 0xd76aa478, 0xe8c7b756, 0x242070db, 0xc1bdceee,
          0xf57c0faf, 0x4787c62a, 0xa8304613, 0xfd469501,
          0x698098d8, 0x8b44f7af, 0xffff5bb1, 0x895cd7be,
          0x6b901122, 0xfd987193, 0xa679438e, 0x49b40821 ],
        [ 0xf61e2562, 0xc040b340, 0x265e5a51, 0xe9b6c7aa,
          0xd62f105d, 0x02441453, 0xd8a1e681, 0xe7d3fbc8,
          0x21e1cde6, 0xc33707d6, 0xf4d50d87, 0x455a14ed,
          0xa9e3e905, 0xfcefa3f8, 0x676f02d9, 0x8d2a4c8a ],
        [ 0xfffa3942, 0x8771f681, 0x6d9d6122, 0xfde5380c,
          0xa4beea44, 0x4bdecfa9, 0xf6bb4b60, 0xbebfbc70,
          0x289b7ec6, 0xeaa127fa, 0xd4ef3085, 0x04881d05,
          0xd9d4d039, 0xe6db99e5, 0x1fa27cf8, 0xc4ac5665 ],
        [ 0xf4292244, 0x432aff97, 0xab9423a7, 0xfc93a039,
          0x655b59c3, 0x8f0ccc92, 0xffeff47d, 0x85845dd1,
          0x6fa87e4f, 0xfe2ce6e0, 0xa3014314, 0x4e0811a1,
          0xf7537e82, 0xbd3af235, 0x2ad7d2bb, 0xeb86d391 ],
    );

    # Rotate counts; each round cycles through its four values.
    my @shifts = (
        [ 7, 12, 17, 22 ],
        [ 5,  9, 14, 20 ],
        [ 4, 11, 16, 23 ],
        [ 6, 10, 15, 21 ],
    );

    # Position flag handed to the first and the last step of each round;
    # every step in between gets 0.
    my @first_pos = ( -2, -1, -1, -1 );
    my @last_pos  = (  1,  1,  1,  2 );

    my @section = ( "R0 section", "R1 section", "R2 section", "R3 section" );
    my @emit    = ( \&R0, \&R1, \&R2, \&R3 );

    &function_begin_B($name, "", 3);

    # parameter 1 is the MD5_CTX structure.
    # A      0
    # B      4
    # C      8
    # D      12

    &push("esi");
    &push("edi");
    &mov($tmp1, &wparam(0));                    # edi
    &mov($X, &wparam(1));                       # esi
    &mov($C, &wparam(2));
    &push("ebp");
    &shl($C, 6);
    &push("ebx");
    &add($C, $X);                               # offset we end at
    &sub($C, 64);
    &mov($A, &DWP(0, $tmp1, "", 0));
    &push($C);                                  # Put on the TOS
    &mov($B, &DWP(4, $tmp1, "", 0));
    &mov($C, &DWP(8, $tmp1, "", 0));
    &mov($D, &DWP(12, $tmp1, "", 0));

    if (!$normal) {
        &set_label("start");
    }

    foreach my $round (0 .. 3) {
        &comment("");
        &comment($section[$round]);

        # Registers in a, b, c, d role order for the current step.
        my @regs = ($A, $B, $C, $D);

        foreach my $step (0 .. 15) {
            my $pos = $step == 0  ? $first_pos[$round]
                    : $step == 15 ? $last_pos[$round]
                    :               0;

            my @args = ($pos, @regs, $X, 16 * $round + $step,
                        $shifts[$round][$step % 4], $consts[$round][$step]);

            # R2 additionally takes the step counter as its first argument.
            @args = ($step, @args) if $round == 2;

            $emit[$round]->(@args);

            # The roles shift by one register for the next step:
            # (a,b,c,d) becomes (d,a,b,c).
            @regs = @regs[3, 0, 1, 2];
        }
    }

    # $tmp2 (the parameter-0 pointer) and $tmp1 (the word at its offset 0)
    # were already loaded by the last R3 step.

    # Add the values stored at offsets 0..12 to the working registers ...
    &add($A, $tmp1);
    foreach my $slot ([ 4, $B ], [ 8, $C ], [ 12, $D ]) {
        my ($offset, $reg) = @$slot;
        &mov($tmp1, &DWP($offset, $tmp2, "", 0));
        &add($reg, $tmp1);
    }

    # ... and store the sums back, with the reload of the stack temporary
    # interleaved between the stores.
    &mov(&DWP(0, $tmp2, "", 0), $A);
    &mov(&DWP(4, $tmp2, "", 0), $B);
    if (!$normal) {
        &mov($tmp1, &swtmp(0));
    }
    &mov(&DWP(8, $tmp2, "", 0), $C);
    &mov(&DWP(12, $tmp2, "", 0), $D);

    if (!$normal) {
        &cmp($tmp1, $X);                        # check count
        &jae(&label("start"));
    }

    &pop("eax");            # pop the temp variable off the stack
    &pop("ebx");
    &pop("ebp");
    &pop("edi");
    &pop("esi");
    &ret();
    &function_end_B($name);
}
