#!/usr/local/bin/perl

# Generates x86 assembler for the MD5 block function through the perlasm
# helpers loaded from x86asm.pl.
#
# Historically two entry-point shapes were described for this generator:
#   "normal"     - md5_block_x86(MD5_CTX *c, ULONG *X);
#   "non-normal" - md5_block_x86(MD5_CTX *c, ULONG *X, int blocks);
# $normal selects between them.  With $normal=0 (the setting below) the
# generated routine takes a third argument and loops over that many
# 64-byte blocks.  The routine is emitted under the name handed to
# &md5_block() at the bottom of this section.

$normal=0;

# Make x86asm.pl reachable from the script's own directory and from its
# ../../perlasm sibling.  When $0 has no directory component the prefix
# is empty and both entries are relative to the current directory.
$dir = ($0 =~ m/(.*[\/\\])[^\/\\]+$/) ? $1 : "";
push(@INC,"${dir}","${dir}../../perlasm");
require "x86asm.pl";

&asm_init($ARGV[0],$0);

# Register allocation: the four MD5 chaining variables, two scratch
# registers and the pointer to the current input block.
$A="eax";
$B="ebx";
$C="ecx";
$D="edx";
$tmp1="edi";
$tmp2="ebp";
$X="esi";

# What we need to load into $tmp for the next round.
# NOTE(review): nothing in this file reads %Ltmp1; kept in case external
# code depends on it.
%Ltmp1=("R0",&Np($C), "R1",&Np($C), "R2",&Np($C), "R3",&Np($D));

# Index of the input word consumed by each of the 64 steps, 16 per round.
@xo=(
 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15,	# R0
 1, 6, 11, 0, 5, 10, 15, 4, 9, 14, 3, 8, 13, 2, 7, 12,	# R1
 5, 8, 11, 14, 1, 4, 7, 10, 13, 0, 3, 6, 9, 12, 15, 2,	# R2
 0, 7, 14, 5, 12, 3, 10, 1, 8, 15, 6, 13, 4, 11, 2, 9,	# R3
 );

&md5_block("md5_block_asm_data_order");
&asm_finish();

# Np(REG)
# Return the register that precedes REG in the A,B,C,D rotation
# (A->D, B->A, C->B, D->C).  Returns undef when REG is not one of the
# four state registers.  The mapping is rebuilt from the globals
# $A,$B,$C,$D on every call.
sub Np
	{
	my($p)=@_;
	my(%prev)=($A,$D, $B,$A, $C,$B, $D,$C);
	return($prev{$p});
	}

# R0(POS,A,B,C,D,K,KI,S,T)
# Emit one step of the first MD5 round (F function).
#   POS      - position flag: negative for the very first step (the
#              scratch registers are not pre-loaded yet), 0 for middle
#              steps, 1 for the last step of the round.
#   A,B,C,D  - register names in this step's rotation; A is updated.
#   K        - register holding the input block pointer.
#   KI       - step number, used to index @xo for the input word.
#   S        - left-rotate count.
#   T        - additive constant for this step.
# On entry (except for POS<0) $tmp1 is expected to hold C and $tmp2 the
# input word for this step; both are pre-loaded by the previous step.
sub R0
	{
	my($pos,$a,$b,$c,$d,$K,$ki,$s,$t)=@_;

	if ($pos < 0)
		{
		# very first one: nobody has primed the scratch registers
		&mov($tmp1,$C);
		&mov($tmp2,&DWP($xo[$ki]*4,$K,"",0));
		}

	# body proper

	&comment("R0 $ki");
	&xor($tmp1,$d); # F function - part 2

	&and($tmp1,$b); # F function - part 3
	&lea($a,&DWP($t,$a,$tmp2,1));	# a += T + input word (in $tmp2)

	&xor($tmp1,$d); # F function - part 4

	&add($a,$tmp1);
	# Pre-load $tmp1 with what the following step treats as its C: the
	# next R0 step when $pos < 1, the first R1 step when $pos == 1.
	&mov($tmp1,&Np($c)) if $pos <= 1;

	&rotl($a,$s);

	# fetch the input word for the following step
	&mov($tmp2,&DWP($xo[$ki+1]*4,$K,"",0)) if ($pos != 2);

	&add($a,$b);
	}

# R1(POS,A,B,C,D,K,KI,S,T)
# Emit one step of the second MD5 round (G function).  Arguments have
# the same meaning as for R0.  On entry $tmp1 is expected to hold C and
# $tmp2 the input word for this step; both are pre-loaded by the
# previous step.
sub R1
	{
	my($pos,$a,$b,$c,$d,$K,$ki,$s,$t)=@_;

	&comment("R1 $ki");

	&lea($a,&DWP($t,$a,$tmp2,1));	# a += T + input word (in $tmp2)

	&xor($tmp1,$b); # G function - part 2
	&and($tmp1,$d); # G function - part 3

	# fetch the input word for the following step
	&mov($tmp2,&DWP($xo[$ki+1]*4,$K,"",0)) if ($pos != 2);
	&xor($tmp1,$c);			# G function - part 4

	&add($a,$tmp1);
	# Pre-load $tmp1 for the following step: G function - part 1 while
	# still inside R1 ($pos < 1), H function - part 1 when this is the
	# last R1 step ($pos == 1).
	&mov($tmp1,&Np($c)) if $pos <= 1;

	&rotl($a,$s);

	&add($a,$b);
	}

# R2(N,POS,A,B,C,D,K,KI,S,T)
# Emit one step of the third MD5 round (H function).
#   N    - step counter within the round; its parity selects one of two
#          instruction schedules (see below).
#   POS  - position flag, only consulted on odd N: 1 marks the last
#          step of the round.
# The remaining arguments have the same meaning as for R0.
#
# Even steps leave out the final "add a,b"; the following odd step
# performs it first (as "add b,c" in its own rotated register naming).
sub R2
	{
	my($n,$pos,$a,$b,$c,$d,$K,$ki,$s,$t)=@_;
	# This one is different, only 3 logical operations

	if (($n & 1) == 0)
		{
		&comment("R2 $ki");
		# make sure to do 'D' first, not 'B', else we clash with
		# the last add from the previous round.

		&xor($tmp1,$d); # H function - part 2

		&xor($tmp1,$b); # H function - part 3
		&lea($a,&DWP($t,$a,$tmp2,1));	# a += T + input word (in $tmp2)

		&add($a,$tmp1);

		&rotl($a,$s);

		# fetch the input word and pre-load $tmp1 for the next step;
		# the "add a,b" is left to that step
		&mov($tmp2,&DWP($xo[$ki+1]*4,$K,"",0));
		&mov($tmp1,&Np($c));
		}
	else
		{
		&comment("R2 $ki");
		# $b still lacks the closing add of the previous (even) step;
		# it is applied below before $b is read.

		&lea($a,&DWP($t,$a,$tmp2,1));	# a += T + input word (in $tmp2)

		&add($b,$c);			# MOVED FORWARD
		&xor($tmp1,$d); # H function - part 2

		&xor($tmp1,$b); # H function - part 3
		&mov($tmp2,&DWP($xo[$ki+1]*4,$K,"",0)) if ($pos != 2);

		&add($a,$tmp1);
		&mov($tmp1,&Np($c)) if $pos < 1;	# H function - part 1
		&mov($tmp1,-1) if $pos == 1;		# I function - part 1

		&rotl($a,$s);

		&add($a,$b);
		}
	}

# R3(POS,A,B,C,D,K,KI,S,T)
# Emit one step of the fourth MD5 round (I function).
#   POS - position flag: negative for the first step of the round, 0 for
#         middle steps, 2 for the very last step of the block.
# The remaining arguments have the same meaning as for R0.
#
# On entry $tmp1 holds -1 (first step) or the complement of D (later
# steps, prepared by the previous step).  The last step additionally
# reloads the first function argument into $tmp2, advances K by 64
# (when !$normal) and fetches the dword at offset 0 of that argument
# into $tmp1 for the caller's final accumulation.
sub R3
	{
	my($pos,$a,$b,$c,$d,$K,$ki,$s,$t)=@_;

	&comment("R3 $ki");

	# &not($tmp1)
	&xor($tmp1,$d) if $pos < 0; 	# I function - part 2

	&or($tmp1,$b);				# I function - part 3
	&lea($a,&DWP($t,$a,$tmp2,1));	# a += T + input word (in $tmp2)

	&xor($tmp1,$c); 			# I function - part 4
	&mov($tmp2,&DWP($xo[$ki+1]*4,$K,"",0))	if $pos != 2; # load X/k value
	&mov($tmp2,&wparam(0)) if $pos == 2;

	&add($a,$tmp1);
	&mov($tmp1,-1) if $pos < 1;	# I function - part 1
	&add($K,64) if $pos >=1 && !$normal;

	&rotl($a,$s);

	# -1 xor (next step's D) gives its complement: I function - part 2
	# for the following step, done ahead of time.
	&xor($tmp1,&Np($d)) if $pos <= 0; 	# I function - part = first time
	&mov($tmp1,&DWP( 0,$tmp2,"",0)) if $pos > 0;
	&add($a,$b);
	}


# md5_block(NAME)
# Emit the complete MD5 block routine under the symbol NAME.
#
# The generated code reads three word-sized arguments: the context
# pointer (state words A,B,C,D at offsets 0,4,8,12), the input data
# pointer, and a block count.  It saves esi/edi/ebp/ebx, keeps the
# address of the last 64-byte block on top of the stack, runs the four
# 16-step rounds, adds the result into the context and, when !$normal,
# repeats until the data pointer has moved past that saved address.
#
# The order of the emitter calls below is the instruction schedule of
# the generated routine; do not reorder them.
sub md5_block
	{
	my($name)=@_;

	&function_begin_B($name,"",3);

	# parameter 1 is the MD5_CTX structure.
	# A	0
	# B	4
	# C	8
	# D 	12

	&push("esi");
	 &push("edi");
	&mov($tmp1,	&wparam(0)); # edi
	 &mov($X,	&wparam(1)); # esi
	&mov($C,	&wparam(2));
	 &push("ebp");
	&shl($C,	6);		# block count * 64 = byte length
	&push("ebx");
	 &add($C,	$X); # offset we end at
	&sub($C,	64);		# back up to the start of the last block
	 &mov($A,	&DWP( 0,$tmp1,"",0));
	&push($C);	# Put on the TOS
	 &mov($B,	&DWP( 4,$tmp1,"",0));
	&mov($C,	&DWP( 8,$tmp1,"",0));
	 &mov($D,	&DWP(12,$tmp1,"",0));

	&set_label("start") unless $normal;
	&comment("");
	&comment("R0 section");

	&R0(-2,$A,$B,$C,$D,$X, 0, 7,0xd76aa478);
	&R0( 0,$D,$A,$B,$C,$X, 1,12,0xe8c7b756);
	&R0( 0,$C,$D,$A,$B,$X, 2,17,0x242070db);
	&R0( 0,$B,$C,$D,$A,$X, 3,22,0xc1bdceee);
	&R0( 0,$A,$B,$C,$D,$X, 4, 7,0xf57c0faf);
	&R0( 0,$D,$A,$B,$C,$X, 5,12,0x4787c62a);
	&R0( 0,$C,$D,$A,$B,$X, 6,17,0xa8304613);
	&R0( 0,$B,$C,$D,$A,$X, 7,22,0xfd469501);
	&R0( 0,$A,$B,$C,$D,$X, 8, 7,0x698098d8);
	&R0( 0,$D,$A,$B,$C,$X, 9,12,0x8b44f7af);
	&R0( 0,$C,$D,$A,$B,$X,10,17,0xffff5bb1);
	&R0( 0,$B,$C,$D,$A,$X,11,22,0x895cd7be);
	&R0( 0,$A,$B,$C,$D,$X,12, 7,0x6b901122);
	&R0( 0,$D,$A,$B,$C,$X,13,12,0xfd987193);
	&R0( 0,$C,$D,$A,$B,$X,14,17,0xa679438e);
	&R0( 1,$B,$C,$D,$A,$X,15,22,0x49b40821);

	&comment("");
	&comment("R1 section");
	&R1(-1,$A,$B,$C,$D,$X,16, 5,0xf61e2562);
	&R1( 0,$D,$A,$B,$C,$X,17, 9,0xc040b340);
	&R1( 0,$C,$D,$A,$B,$X,18,14,0x265e5a51);
	&R1( 0,$B,$C,$D,$A,$X,19,20,0xe9b6c7aa);
	&R1( 0,$A,$B,$C,$D,$X,20, 5,0xd62f105d);
	&R1( 0,$D,$A,$B,$C,$X,21, 9,0x02441453);
	&R1( 0,$C,$D,$A,$B,$X,22,14,0xd8a1e681);
	&R1( 0,$B,$C,$D,$A,$X,23,20,0xe7d3fbc8);
	&R1( 0,$A,$B,$C,$D,$X,24, 5,0x21e1cde6);
	&R1( 0,$D,$A,$B,$C,$X,25, 9,0xc33707d6);
	&R1( 0,$C,$D,$A,$B,$X,26,14,0xf4d50d87);
	&R1( 0,$B,$C,$D,$A,$X,27,20,0x455a14ed);
	&R1( 0,$A,$B,$C,$D,$X,28, 5,0xa9e3e905);
	&R1( 0,$D,$A,$B,$C,$X,29, 9,0xfcefa3f8);
	&R1( 0,$C,$D,$A,$B,$X,30,14,0x676f02d9);
	&R1( 1,$B,$C,$D,$A,$X,31,20,0x8d2a4c8a);

	&comment("");
	&comment("R2 section");
	&R2( 0,-1,$A,$B,$C,$D,$X,32, 4,0xfffa3942);
	&R2( 1, 0,$D,$A,$B,$C,$X,33,11,0x8771f681);
	&R2( 2, 0,$C,$D,$A,$B,$X,34,16,0x6d9d6122);
	&R2( 3, 0,$B,$C,$D,$A,$X,35,23,0xfde5380c);
	&R2( 4, 0,$A,$B,$C,$D,$X,36, 4,0xa4beea44);
	&R2( 5, 0,$D,$A,$B,$C,$X,37,11,0x4bdecfa9);
	&R2( 6, 0,$C,$D,$A,$B,$X,38,16,0xf6bb4b60);
	&R2( 7, 0,$B,$C,$D,$A,$X,39,23,0xbebfbc70);
	&R2( 8, 0,$A,$B,$C,$D,$X,40, 4,0x289b7ec6);
	&R2( 9, 0,$D,$A,$B,$C,$X,41,11,0xeaa127fa);
	&R2(10, 0,$C,$D,$A,$B,$X,42,16,0xd4ef3085);
	&R2(11, 0,$B,$C,$D,$A,$X,43,23,0x04881d05);
	&R2(12, 0,$A,$B,$C,$D,$X,44, 4,0xd9d4d039);
	&R2(13, 0,$D,$A,$B,$C,$X,45,11,0xe6db99e5);
	&R2(14, 0,$C,$D,$A,$B,$X,46,16,0x1fa27cf8);
	&R2(15, 1,$B,$C,$D,$A,$X,47,23,0xc4ac5665);

	&comment("");
	&comment("R3 section");
	&R3(-1,$A,$B,$C,$D,$X,48, 6,0xf4292244);
	&R3( 0,$D,$A,$B,$C,$X,49,10,0x432aff97);
	&R3( 0,$C,$D,$A,$B,$X,50,15,0xab9423a7);
	&R3( 0,$B,$C,$D,$A,$X,51,21,0xfc93a039);
	&R3( 0,$A,$B,$C,$D,$X,52, 6,0x655b59c3);
	&R3( 0,$D,$A,$B,$C,$X,53,10,0x8f0ccc92);
	&R3( 0,$C,$D,$A,$B,$X,54,15,0xffeff47d);
	&R3( 0,$B,$C,$D,$A,$X,55,21,0x85845dd1);
	&R3( 0,$A,$B,$C,$D,$X,56, 6,0x6fa87e4f);
	&R3( 0,$D,$A,$B,$C,$X,57,10,0xfe2ce6e0);
	&R3( 0,$C,$D,$A,$B,$X,58,15,0xa3014314);
	&R3( 0,$B,$C,$D,$A,$X,59,21,0x4e0811a1);
	&R3( 0,$A,$B,$C,$D,$X,60, 6,0xf7537e82);
	&R3( 0,$D,$A,$B,$C,$X,61,10,0xbd3af235);
	&R3( 0,$C,$D,$A,$B,$X,62,15,0x2ad7d2bb);
	&R3( 2,$B,$C,$D,$A,$X,63,21,0xeb86d391);

	# &mov($tmp2,&wparam(0));	# done in the last R3
	# &mov($tmp1,	&DWP( 0,$tmp2,"",0)); # done in the last R3

	# Fold this block's result into the context: each state word is
	# added to the stored value, then written back.
	&add($A,$tmp1);
	 &mov($tmp1,	&DWP( 4,$tmp2,"",0));

	&add($B,$tmp1);
	&mov($tmp1,	&DWP( 8,$tmp2,"",0));

	&add($C,$tmp1);
	&mov($tmp1,	&DWP(12,$tmp2,"",0));

	&add($D,$tmp1);
	&mov(&DWP( 0,$tmp2,"",0),$A);

	&mov(&DWP( 4,$tmp2,"",0),$B);
	&mov($tmp1,&swtmp(0)) unless $normal;	# saved last-block address

	&mov(&DWP( 8,$tmp2,"",0),$C);
	 &mov(&DWP(12,$tmp2,"",0),$D);

	# $X was advanced by 64 in the last R3 step; keep going while it
	# has not passed the saved last-block address.
	&cmp($tmp1,$X) unless $normal;			# check count
	 &jae(&label("start")) unless $normal;

	&pop("eax"); # pop the temp variable off the stack
	 &pop("ebx");
	&pop("ebp");
	 &pop("edi");
	&pop("esi");
	 &ret();
	&function_end_B($name);
	}
