xref: /openssl/crypto/perlasm/x86asm.pl (revision 27213879)
1#! /usr/bin/env perl
2# Copyright 1995-2018 The OpenSSL Project Authors. All Rights Reserved.
3#
4# Licensed under the Apache License 2.0 (the "License").  You may not use
5# this file except in compliance with the License.  You can obtain a copy
6# in the file LICENSE in the source distribution or at
7# https://www.openssl.org/source/license.html
8
9
10# require 'x86asm.pl';
11# &asm_init(<flavor>[,$i386only]);
12# &function_begin("foo");
13# ...
14# &function_end("foo");
15# &asm_finish
16
# Accumulated assembler output.  The subroutines in this file push finished
# lines onto @out and asm_finish prints the array, so it is the array (not
# an unrelated scalar of the same name) that has to start out empty.
@out=();
# Non-zero when the generated code must be limited to the i386 instruction
# set (see bswap); asm_init overwrites it with its second argument.
$i386=0;
19
# AUTOLOAD in this context has a quite unpleasant side effect, namely
# that typos in function calls effectively go to assembler output,
# but on the plus side we don't have to implement one subroutine
# per opcode...
# Catch-all for every sub that is not defined explicitly: the name of the
# missing sub is taken to be an opcode and is handed, together with its
# operands, to generic().  Opcodes starting with "push"/"pop" additionally
# move the tracked stack depth ($stack) by one 32-bit slot.
# Dies when more than four operands are passed or when generic() returns a
# false value.
sub ::AUTOLOAD
{   # perl stores the fully qualified name of the missing sub in $AUTOLOAD
    my $mnemonic = $AUTOLOAD;

    die "more than 4 arguments passed to $mnemonic" if (scalar(@_)>4);

    # drop the package qualifier, leaving the bare opcode
    $mnemonic =~ s/.*:://;

    my $delta = ($mnemonic =~ /^push/) ?  4
	      : ($mnemonic =~ /^pop/)  ? -4
	      :				  0;
    # leave $stack completely untouched for every other opcode
    $stack += $delta if ($delta);

    &generic($mnemonic,@_) or die "undefined subroutine \&$AUTOLOAD";
}
35
# Append one instruction line to @out: a tab, the opcode and, when operands
# are given, another tab followed by the comma-separated operand list.
sub ::emit
{   my ($mnemonic,@operands) = @_;
    my $line = "\t$mnemonic";

    $line .= "\t".join(',',@operands) if (@operands);
    push(@out,$line."\n");
}
42
# Map a register of the a/b/c/d family ("eax", "bx", ...) to the name of its
# low byte register ("al", "bl", ...).  Dies for any other argument.
sub ::LB
{   my ($family) = ($_[0] =~ m/^e?([a-d])x$/o)
	or die "$_[0] does not have a 'low byte'";

    return $family."l";
}
# Map a register of the a/b/c/d family ("eax", "bx", ...) to the name of its
# high byte register ("ah", "bh", ...).  Dies for any other argument.
sub ::HB
{   my ($family) = ($_[0] =~ m/^e?([a-d])x$/o)
	or die "$_[0] does not have a 'high byte'";

    return $family."h";
}
# Reserve $_[0] 32-bit slots: record them in the tracked stack depth and
# emit the matching "sub esp,<bytes>".
sub ::stack_push
{   my $bytes = 4*$_[0];

    $stack += $bytes;
    &sub("esp",$bytes);
}
# Release $_[0] 32-bit slots: remove them from the tracked stack depth and
# emit the matching "add esp,<bytes>".
sub ::stack_pop
{   my $bytes = 4*$_[0];

    $stack -= $bytes;
    &add("esp",$bytes);
}
# Emit a pop whose effect on the tracked stack depth is cancelled: the pop
# itself goes through AUTOLOAD, which subtracts 4 from $stack, and the same
# amount is added back right away.
sub ::blindpop
{   my ($target) = @_;

    &pop($target);
    $stack += 4;
}
# Operand for the 32-bit word at esp + tracked stack depth + 4*index;
# presumably the index-th argument of the current function, given that
# function_begin starts the depth at 4 (to be confirmed against callers).
sub ::wparam
{   my ($index) = @_;

    &DWP($stack+4*$index,"esp");
}
# Operand for the 32-bit word at esp + 4*index, i.e. a slot counted from
# the current stack pointer rather than from the tracked depth.
sub ::swtmp
{   my ($index) = @_;

    &DWP(4*$index,"esp");
}
56
# Byte-swap a 32-bit register.  Normally the bswap opcode is emitted as is;
# when $i386 is set it is emulated instead.
sub ::bswap
{   return &generic("bswap",@_) if (!$i386);

    # emulate bswap for i386: swap the two bytes of the low word, rotate
    # the other word into its place and swap that one too
    &comment("bswap @_");
    &xchg(&HB(@_),&LB(@_));
    &ror (@_,16);
    &xchg(&HB(@_),&LB(@_));
}
66}
67# These are made-up opcodes introduced over the years essentially
68# by ignorance, just alias them to real ones...
# Each alias hands its complete argument list, unchanged, to the real
# opcode named on the right.
sub ::movb	{ return &mov(@_);	}
sub ::xorb	{ return &xor(@_);	}
sub ::rotl	{ return &rol(@_);	}
sub ::rotr	{ return &ror(@_);	}
sub ::exch	{ return &xchg(@_);	}
sub ::halt	{ return &hlt(@_);	}
sub ::movz	{ return &movzx(@_);	}
sub ::pushf	{ return &pushfd(@_);	}
sub ::popf	{ return &popfd(@_);	}
78
79# 3 argument instructions
# Emit a movq.
#   $p1, $p2   destination and source operands
#   $optimize  optional flag; when true and both operands are MMX registers
#              the move is emitted as an equivalent pshufw instead
# The flag is never forwarded to the assembler: movq takes two operands and
# a stray third one would end up in the output as a bogus operand.
sub ::movq
{ my($p1,$p2,$optimize)=@_;

    if ($optimize && $p1=~/^mm[0-7]$/ && $p2=~/^mm[0-7]$/)
    # movq between mmx registers can sink Intel CPUs
    {	# 0xe4 is binary 11 10 01 00: every word stays in place, so the
	# shuffle acts as a plain register copy
	&::pshufw($p1,$p2,0xe4);
    }
    else
    {	# pass on the real operands only, dropping the optimize flag
	my @operands = (@_>2) ? @_[0,1] : @_;
	&::generic("movq",@operands);
    }
}
89
90# SSE>2 instructions
# 32-bit general purpose register name => register number as it is OR-ed
# into the hand-assembled ModR/M bytes below.
my %regrm;
@regrm{qw(eax ecx edx ebx esp ebp esi edi)} = (0..7);
# pextrd dst,src,imm.  For a 32-bit general purpose register destination and
# an xmm0..xmm7 source the instruction is emitted as raw bytes; every other
# operand combination is passed to the assembler as a regular opcode.
sub ::pextrd
{ my($dst,$src,$imm)=@_;

    return &::generic("pextrd",@_)
	unless ("$dst:$src" =~ /(e[a-dsd][ixp]):xmm([0-7])/);

    my ($gpr,$xmm) = ($1,$2);
    my $modrm = 0xc0|($xmm<<3)|$regrm{$gpr};	# register-direct form
    &::data_byte(0x66,0x0f,0x3a,0x16,$modrm,$imm);
}
100
# pinsrd dst,src,imm.  For an xmm0..xmm7 destination and a 32-bit general
# purpose register source the instruction is emitted as raw bytes; every
# other operand combination is passed to the assembler as a regular opcode.
sub ::pinsrd
{ my($dst,$src,$imm)=@_;

    return &::generic("pinsrd",@_)
	unless ("$dst:$src" =~ /xmm([0-7]):(e[a-dsd][ixp])/);

    my ($xmm,$gpr) = ($1,$2);
    my $modrm = 0xc0|($xmm<<3)|$regrm{$gpr};	# register-direct form
    &::data_byte(0x66,0x0f,0x3a,0x22,$modrm,$imm);
}
108
# pshufb dst,src.  When both operands are xmm0..xmm7 the instruction is
# emitted as raw bytes; otherwise it is passed on as a regular opcode.
sub ::pshufb
{ my($dst,$src)=@_;

    return &::generic("pshufb",@_)
	unless ("$dst:$src" =~ /xmm([0-7]):xmm([0-7])/);

    my ($to,$from) = ($1,$2);
    my $modrm = 0xc0|($to<<3)|$from;		# register-direct form
    &data_byte(0x66,0x0f,0x38,0x00,$modrm);
}
116
# palignr dst,src,imm.  When both register operands are xmm0..xmm7 the
# instruction is emitted as raw bytes followed by the immediate; otherwise
# it is passed on as a regular opcode.
sub ::palignr
{ my($dst,$src,$imm)=@_;

    return &::generic("palignr",@_)
	unless ("$dst:$src" =~ /xmm([0-7]):xmm([0-7])/);

    my ($to,$from) = ($1,$2);
    my $modrm = 0xc0|($to<<3)|$from;		# register-direct form
    &::data_byte(0x66,0x0f,0x3a,0x0f,$modrm,$imm);
}
124
# pclmulqdq dst,src,imm.  When both register operands are xmm0..xmm7 the
# instruction is emitted as raw bytes followed by the immediate; otherwise
# it is passed on as a regular opcode.
sub ::pclmulqdq
{ my($dst,$src,$imm)=@_;

    return &::generic("pclmulqdq",@_)
	unless ("$dst:$src" =~ /xmm([0-7]):xmm([0-7])/);

    my ($to,$from) = ($1,$2);
    my $modrm = 0xc0|($to<<3)|$from;		# register-direct form
    &::data_byte(0x66,0x0f,0x3a,0x44,$modrm,$imm);
}
132
# rdrand dst.  A 32-bit general purpose register destination is emitted as
# raw bytes (0f c7 f0+reg); anything else is passed on as a regular opcode.
sub ::rdrand
{ my ($dst)=@_;

    return &::generic("rdrand",@_) unless ($dst =~ /(e[a-dsd][ixp])/);

    # the register number is looked up under the complete operand string
    &::data_byte(0x0f,0xc7,0xf0|$regrm{$dst});
}
140
# rdseed dst.  A 32-bit general purpose register destination is emitted as
# raw bytes (0f c7 f8+reg); anything else is passed on to the assembler as
# a regular rdseed opcode.
sub ::rdseed
{ my ($dst)=@_;
    if ($dst =~ /(e[a-dsd][ixp])/)
    {	# the register number is looked up under the complete operand string
	&::data_byte(0x0f,0xc7,0xf8|$regrm{$dst});
    }
    else
    {	# must name rdseed itself; emitting "rdrand" here would silently
	# assemble a different instruction
	&::generic("rdseed",@_);
    }
}
148
# Append the byte carrying the three register-extension bits (bits 7..5) to
# the opcode array passed by reference as first argument.
#   $dst, $src1, $src2	register numbers; a number >= 8 clears "its" bit
#   $rxb		low bits of the byte, OR-ed in unchanged
# The bits are stored inverted: all three start out set and a bit is
# cleared only for a register that needs the extension.
sub rxb {
 my ($bytes,$dst,$src1,$src2,$rxb)=@_;
 my $extended=0;

   $extended|=(0x04<<5) if($dst>=8);
   $extended|=(0x01<<5) if($src1>=8);
   $extended|=(0x02<<5) if($src2>=8);

   $rxb=($rxb|0x7<<5)&~$extended;
   push @$bytes,$rxb;
}
159
# vprotd dst,src,imm.  With xmm0..xmm7 registers and a numeric immediate the
# instruction is emitted as raw bytes; any other form is passed on as a
# regular opcode.
sub ::vprotd
{ my $operands=join(',',@_);

    return &::generic("vprotd",@_)
	unless ($operands =~ /xmm([0-7]),xmm([0-7]),([x0-9a-f]+)/);

    my ($dst,$src,$imm)=($1,$2,$3);
    my @encoding=(0x8f);

    rxb(\@encoding,$dst,$src,-1,0x08);
    push @encoding,0x78,0xc2;
    push @encoding,0xc0|($src&7)|(($dst&7)<<3);		# ModR/M
    # immediates with a leading 0 (0x.., 0b.., octal) are converted with oct
    push @encoding,($imm=~/^0/ ? oct($imm) : $imm);
    &::data_byte(@encoding);
}
174
# Emit the four bytes f3 0f 1e fb (the encoding of endbr32), wrapped in
# "#ifdef __CET__" / "#endif" so that they take effect only when the
# generated file is preprocessed with __CET__ defined.
sub ::endbranch
{ my @endbr32=(0xf3,0x0f,0x1e,0xfb);

    &::generic("#ifdef __CET__\n");
    &::data_byte(@endbr32);
    &::generic("#endif\n");
}
181
182# label management
# $lbdecor: local label decoration, set by package.
# $label:   three-digit serial woven into function-scope labels; it is kept
#           as a string so that ++ in label() preserves the leading zeros.
($lbdecor,$label)=("L","000");
185
sub ::islabel		# see if argument is a known label
{ my ($name)=@_;

    # an argument that already is a decorated label is returned as is ...
    for my $decorated (values %label)
    {	return $decorated if ($decorated eq $name);	}

    # ... otherwise it is looked up as an undecorated name
    $label{$name};	# can be undef
}
191
sub ::label		# instantiate a function-scope label
{ my ($name)=@_;

    unless (defined($label{$name}))
    {	# decoration, running serial and the name itself; the serial is
	# consumed so that the next new label gets a fresh one
	$label{$name}=$lbdecor.$label.$name;
	$label++;
    }
    $label{$name};
}
197
sub ::LABEL		# instantiate a file-scope label
{ my ($name,$symbol)=@_;

    # the first registration wins, later ones only read the stored value
    unless (defined($label{$name}))
    {	$label{$name}=$symbol;	}

    $label{$name};
}
202
# Register a file-scope label whose symbol is the name prefixed with the
# local label decoration.
sub ::static_label
{ my ($name)=@_;

    &::LABEL($name,$lbdecor.$name);
}
204
# Append a bare "<label>:" line to @out; the arguments are joined with the
# list separator ($") exactly as string interpolation of @_ would do.
sub ::set_label_B
{   push(@out,join($",@_).":\n");
}
# Place a function-scope label at the current position, preceded by an
# alignment request when the second argument is greater than 1.  Returns
# the decorated label.
sub ::set_label
{ my ($name,$alignment)=@_;
  my $decorated=&::label($name);

    &::align($alignment) if ($alignment>1);
    &::set_label_B($decorated);
    $decorated;
}
212
sub ::wipe_labels	# wipes function-scope labels
{   # function-scope labels are the ones whose value starts with the
    # decoration followed by the three-digit serial
    for my $name (keys %label)
    {	next unless ($label{$name} =~ /^\Q${lbdecor}\E[0-9]{3}/);
	delete $label{$name};
    }
}
217
218# subroutine management
# Open a function: emit the header through function_begin_B, restart the
# stack bookkeeping at 4 and save ebp, ebx, esi and edi.  Each push goes
# through AUTOLOAD and thereby adds 4 to $stack.
sub ::function_begin
{   &function_begin_B(@_);
    $stack=4;

    foreach my $reg ("ebp","ebx","esi","edi")
    {	&push($reg);	}
}
227
# Close a function: restore edi, esi, ebx and ebp, return, emit the trailer
# through function_end_B, zero the stack bookkeeping and forget the
# function-scope labels.
sub ::function_end
{   foreach my $reg ("edi","esi","ebx","ebp")
    {	&pop($reg);	}
    &ret();

    &function_end_B(@_);
    $stack=0;
    &wipe_labels();
}
238
# Emit the register-restoring epilogue and ret without closing the
# function, so that more code of the same function can follow.
sub ::function_end_A
{   foreach my $reg ("edi","esi","ebx","ebp")
    {	&pop($reg);	}
    &ret();

    $stack+=4*4;	# readjust esp as if we didn't pop anything
}
247
# Emit a string as data bytes followed by a terminating zero, in rows of 16
# bytes; the last row carries between 1 and 16 bytes.
sub ::asciz
{ my @bytes=(unpack("C*",shift),0);

    # full rows are emitted only while more than 16 bytes are left
    &data_byte(splice(@bytes,0,16)) while (@bytes>16);

    &data_byte(@bytes) if (@bytes);
}
257
# Finish the output: call file_end (not defined in this file, presumably
# supplied by the back-end that asm_init loaded) and then print everything
# collected in @out to the currently selected file handle.
sub ::asm_finish
{   &file_end();

    print(@out);
}
262
# Select the output flavour and load the matching back-end.
#   $type  target flavour, one of the keys of the table below
#   $cpu   stored in $i386; true limits the output to i386 instructions
# Resets all flavour flags, raises the ones belonging to $type, loads the
# back-end, sets $pic when a -fPIC/-KPIC style option is found in @ARGV and
# finally calls file().  An unknown flavour prints a usage text to STDERR
# and exits with status 1.
sub ::asm_init
{ my ($type,$cpu)=@_;

    # flavour => [ back-end to load, code raising that flavour's flags ]
    my %flavours = (
	"elf"	  => [ "x86gas.pl",  sub { $elf=1;		} ],
	"elf-1"	  => [ "x86gas.pl",  sub { $elf=-1;		} ],
	"a.out"	  => [ "x86gas.pl",  sub { $aout=1;		} ],
	"coff"	  => [ "x86gas.pl",  sub { $coff=1;		} ],
	"gaswin"  => [ "x86gas.pl",  sub { $coff=1;		} ],
	"win32n"  => [ "x86nasm.pl", sub { $win32=1;		} ],
	"win32"	  => [ "x86masm.pl", sub { $win32=1;		} ],
	"macosx"  => [ "x86gas.pl",  sub { $aout=1; $macosx=1;	} ],
	"android" => [ "x86gas.pl",  sub { $elf=1; $android=1;	} ],
    );

    $i386=$cpu;

    $elf=$cpp=$coff=$aout=$macosx=$win32=$mwerks=$android=0;

    my $flavour=$flavours{$type};
    if (!defined($flavour))
    {	print STDERR <<"EOF";
Pick one target type from
	elf	- Linux, FreeBSD, Solaris x86, etc.
	a.out	- DJGPP, elder OpenBSD, etc.
	coff	- GAS/COFF such as Win32 targets
	win32n	- Windows 95/Windows NT NASM format
	macosx	- Mac OS X
EOF
	exit(1);
    }

    # raise the flags before loading, in case the back-end consults them
    # while it is being loaded
    my ($backend,$raise_flags)=@$flavour;
    $raise_flags->();
    require $backend;

    $pic=(grep { /\-[fK]PIC/i } @ARGV) ? 1 : 0;

    &file();
}
302
# Deliberate no-op that accepts and ignores any arguments; presumably a
# default for back-ends that do not provide their own ::hidden.
sub ::hidden { return; }

# a file pulled in with require has to end in a true value
1;
306