1 /*
2  *    Stack-less Just-In-Time compiler
3  *
4  *    Copyright Zoltan Herczeg (hzmester@freemail.hu). All rights reserved.
5  *
6  * Redistribution and use in source and binary forms, with or without modification, are
7  * permitted provided that the following conditions are met:
8  *
9  *   1. Redistributions of source code must retain the above copyright notice, this list of
10  *      conditions and the following disclaimer.
11  *
12  *   2. Redistributions in binary form must reproduce the above copyright notice, this list
13  *      of conditions and the following disclaimer in the documentation and/or other materials
14  *      provided with the distribution.
15  *
16  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDER(S) AND CONTRIBUTORS ``AS IS'' AND ANY
17  * EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
18  * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT
19  * SHALL THE COPYRIGHT HOLDER(S) OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,
20  * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED
21  * TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
22  * BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
23  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN
24  * ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
25  */
26 
27 /* ppc 64-bit arch dependent functions. */
28 
29 #if defined(__GNUC__) || (defined(__IBM_GCC_ASM) && __IBM_GCC_ASM)
30 #define ASM_SLJIT_CLZ(src, dst) \
31 	__asm__ volatile ( "cntlzd %0, %1" : "=r"(dst) : "r"(src) )
32 #elif defined(__xlc__)
33 #error "Please enable GCC syntax for inline assembly statements"
34 #else
35 #error "Must implement count leading zeroes"
36 #endif
37 
38 /* Computes SLDI(63 - shift). */
39 #define PUSH_SLDI_NEG(reg, shift) \
40 	push_inst(compiler, RLDICR | S(reg) | A(reg) | RLDI_SH(63 - shift) | RLDI_ME(shift))
41 
load_immediate(struct sljit_compiler * compiler,sljit_s32 reg,sljit_sw imm)42 static sljit_s32 load_immediate(struct sljit_compiler *compiler, sljit_s32 reg, sljit_sw imm)
43 {
44 	sljit_uw tmp;
45 	sljit_uw shift;
46 	sljit_uw tmp2;
47 	sljit_uw shift2;
48 
49 	if (imm <= SIMM_MAX && imm >= SIMM_MIN)
50 		return push_inst(compiler, ADDI | D(reg) | A(0) | IMM(imm));
51 
52 	if (((sljit_uw)imm >> 16) == 0)
53 		return push_inst(compiler, ORI | S(TMP_ZERO) | A(reg) | IMM(imm));
54 
55 	if (imm <= 0x7fffffffl && imm >= -0x80000000l) {
56 		FAIL_IF(push_inst(compiler, ADDIS | D(reg) | A(0) | IMM(imm >> 16)));
57 		return (imm & 0xffff) ? push_inst(compiler, ORI | S(reg) | A(reg) | IMM(imm)) : SLJIT_SUCCESS;
58 	}
59 
60 	if (((sljit_uw)imm >> 32) == 0) {
61 		FAIL_IF(push_inst(compiler, ORIS | S(TMP_ZERO) | A(reg) | IMM(imm >> 16)));
62 		return (imm & 0xffff) ? push_inst(compiler, ORI | S(reg) | A(reg) | IMM(imm)) : SLJIT_SUCCESS;
63 	}
64 
65 	/* Count leading zeroes. */
66 	tmp = (sljit_uw)((imm >= 0) ? imm : ~imm);
67 	ASM_SLJIT_CLZ(tmp, shift);
68 	SLJIT_ASSERT(shift > 0);
69 	shift--;
70 	tmp = ((sljit_uw)imm << shift);
71 
72 	if ((tmp & ~0xffff000000000000ul) == 0) {
73 		FAIL_IF(push_inst(compiler, ADDI | D(reg) | A(0) | (sljit_ins)(tmp >> 48)));
74 		shift += 15;
75 		return PUSH_SLDI_NEG(reg, shift);
76 	}
77 
78 	if ((tmp & ~0xffffffff00000000ul) == 0) {
79 		FAIL_IF(push_inst(compiler, ADDIS | D(reg) | A(0) | (sljit_ins)(tmp >> 48)));
80 		FAIL_IF(push_inst(compiler, ORI | S(reg) | A(reg) | IMM(tmp >> 32)));
81 		shift += 31;
82 		return PUSH_SLDI_NEG(reg, shift);
83 	}
84 
85 	/* Cut out the 16 bit from immediate. */
86 	shift += 15;
87 	tmp2 = (sljit_uw)imm & (((sljit_uw)1 << (63 - shift)) - 1);
88 
89 	if (tmp2 <= 0xffff) {
90 		FAIL_IF(push_inst(compiler, ADDI | D(reg) | A(0) | (sljit_ins)(tmp >> 48)));
91 		FAIL_IF(PUSH_SLDI_NEG(reg, shift));
92 		return push_inst(compiler, ORI | S(reg) | A(reg) | (sljit_ins)tmp2);
93 	}
94 
95 	if (tmp2 <= 0xffffffff) {
96 		FAIL_IF(push_inst(compiler, ADDI | D(reg) | A(0) | IMM(tmp >> 48)));
97 		FAIL_IF(PUSH_SLDI_NEG(reg, shift));
98 		FAIL_IF(push_inst(compiler, ORIS | S(reg) | A(reg) | (sljit_ins)(tmp2 >> 16)));
99 		return (imm & 0xffff) ? push_inst(compiler, ORI | S(reg) | A(reg) | IMM(tmp2)) : SLJIT_SUCCESS;
100 	}
101 
102 	ASM_SLJIT_CLZ(tmp2, shift2);
103 	tmp2 <<= shift2;
104 
105 	if ((tmp2 & ~0xffff000000000000ul) == 0) {
106 		FAIL_IF(push_inst(compiler, ADDI | D(reg) | A(0) | (sljit_ins)(tmp >> 48)));
107 		shift2 += 15;
108 		shift += (63 - shift2);
109 		FAIL_IF(PUSH_SLDI_NEG(reg, shift));
110 		FAIL_IF(push_inst(compiler, ORI | S(reg) | A(reg) | (sljit_ins)(tmp2 >> 48)));
111 		return PUSH_SLDI_NEG(reg, shift2);
112 	}
113 
114 	/* The general version. */
115 	FAIL_IF(push_inst(compiler, ADDIS | D(reg) | A(0) | (sljit_ins)((sljit_uw)imm >> 48)));
116 	FAIL_IF(push_inst(compiler, ORI | S(reg) | A(reg) | IMM(imm >> 32)));
117 	FAIL_IF(PUSH_SLDI_NEG(reg, 31));
118 	FAIL_IF(push_inst(compiler, ORIS | S(reg) | A(reg) | IMM(imm >> 16)));
119 	return push_inst(compiler, ORI | S(reg) | A(reg) | IMM(imm));
120 }
121 
122 #undef PUSH_SLDI_NEG
123 
124 #define CLRLDI(dst, src, n) \
125 	(RLDICL | S(src) | A(dst) | RLDI_SH(0) | RLDI_MB(n))
126 
127 /* Sign extension for integer operations. */
128 #define UN_EXTS() \
129 	if ((flags & (ALT_SIGN_EXT | REG2_SOURCE)) == (ALT_SIGN_EXT | REG2_SOURCE)) { \
130 		FAIL_IF(push_inst(compiler, EXTSW | S(src2) | A(TMP_REG2))); \
131 		src2 = TMP_REG2; \
132 	}
133 
134 #define BIN_EXTS() \
135 	if (flags & ALT_SIGN_EXT) { \
136 		if (flags & REG1_SOURCE) { \
137 			FAIL_IF(push_inst(compiler, EXTSW | S(src1) | A(TMP_REG1))); \
138 			src1 = TMP_REG1; \
139 		} \
140 		if (flags & REG2_SOURCE) { \
141 			FAIL_IF(push_inst(compiler, EXTSW | S(src2) | A(TMP_REG2))); \
142 			src2 = TMP_REG2; \
143 		} \
144 	}
145 
146 #define BIN_IMM_EXTS() \
147 	if ((flags & (ALT_SIGN_EXT | REG1_SOURCE)) == (ALT_SIGN_EXT | REG1_SOURCE)) { \
148 		FAIL_IF(push_inst(compiler, EXTSW | S(src1) | A(TMP_REG1))); \
149 		src1 = TMP_REG1; \
150 	}
151 
emit_single_op(struct sljit_compiler * compiler,sljit_s32 op,sljit_s32 flags,sljit_s32 dst,sljit_s32 src1,sljit_s32 src2)152 static SLJIT_INLINE sljit_s32 emit_single_op(struct sljit_compiler *compiler, sljit_s32 op, sljit_s32 flags,
153 	sljit_s32 dst, sljit_s32 src1, sljit_s32 src2)
154 {
155 	sljit_u32 imm;
156 
157 	switch (op) {
158 	case SLJIT_MOV:
159 	case SLJIT_MOV_P:
160 		SLJIT_ASSERT(src1 == TMP_REG1);
161 		if (dst != src2)
162 			return push_inst(compiler, OR | S(src2) | A(dst) | B(src2));
163 		return SLJIT_SUCCESS;
164 
165 	case SLJIT_MOV_U32:
166 	case SLJIT_MOV_S32:
167 		SLJIT_ASSERT(src1 == TMP_REG1);
168 		if ((flags & (REG_DEST | REG2_SOURCE)) == (REG_DEST | REG2_SOURCE)) {
169 			if (op == SLJIT_MOV_S32)
170 				return push_inst(compiler, EXTSW | S(src2) | A(dst));
171 			return push_inst(compiler, CLRLDI(dst, src2, 32));
172 		}
173 		else {
174 			SLJIT_ASSERT(dst == src2);
175 		}
176 		return SLJIT_SUCCESS;
177 
178 	case SLJIT_MOV_U8:
179 	case SLJIT_MOV_S8:
180 		SLJIT_ASSERT(src1 == TMP_REG1);
181 		if ((flags & (REG_DEST | REG2_SOURCE)) == (REG_DEST | REG2_SOURCE)) {
182 			if (op == SLJIT_MOV_S8)
183 				return push_inst(compiler, EXTSB | S(src2) | A(dst));
184 			return push_inst(compiler, CLRLDI(dst, src2, 56));
185 		}
186 		else if ((flags & REG_DEST) && op == SLJIT_MOV_S8)
187 			return push_inst(compiler, EXTSB | S(src2) | A(dst));
188 		else {
189 			SLJIT_ASSERT(dst == src2);
190 		}
191 		return SLJIT_SUCCESS;
192 
193 	case SLJIT_MOV_U16:
194 	case SLJIT_MOV_S16:
195 		SLJIT_ASSERT(src1 == TMP_REG1);
196 		if ((flags & (REG_DEST | REG2_SOURCE)) == (REG_DEST | REG2_SOURCE)) {
197 			if (op == SLJIT_MOV_S16)
198 				return push_inst(compiler, EXTSH | S(src2) | A(dst));
199 			return push_inst(compiler, CLRLDI(dst, src2, 48));
200 		}
201 		else {
202 			SLJIT_ASSERT(dst == src2);
203 		}
204 		return SLJIT_SUCCESS;
205 
206 	case SLJIT_CLZ:
207 		SLJIT_ASSERT(src1 == TMP_REG1);
208 		return push_inst(compiler, ((flags & ALT_FORM1) ? CNTLZW : CNTLZD) | S(src2) | A(dst));
209 
210 	case SLJIT_CTZ:
211 		SLJIT_ASSERT(src1 == TMP_REG1);
212 		FAIL_IF(push_inst(compiler, NEG | D(TMP_REG1) | A(src2)));
213 		FAIL_IF(push_inst(compiler, AND | S(src2) | A(dst) | B(TMP_REG1)));
214 		FAIL_IF(push_inst(compiler, ((flags & ALT_FORM1) ? CNTLZW : CNTLZD) | S(dst) | A(dst)));
215 		FAIL_IF(push_inst(compiler, ADDI | D(TMP_REG1) | A(dst) | IMM((flags & ALT_FORM1) ? -32 : -64)));
216 		/* The highest bits are set, if dst < bit width, zero otherwise. */
217 		FAIL_IF(push_inst(compiler, ((flags & ALT_FORM1) ? SRWI(27) : SRDI(58)) | S(TMP_REG1) | A(TMP_REG1)));
218 		return push_inst(compiler, XOR | S(dst) | A(dst) | B(TMP_REG1));
219 
220 	case SLJIT_ADD:
221 		if (flags & ALT_FORM1) {
222 			if (flags & ALT_SIGN_EXT) {
223 				FAIL_IF(push_inst(compiler, SLDI(32) | S(src1) | A(TMP_REG1)));
224 				src1 = TMP_REG1;
225 				FAIL_IF(push_inst(compiler, SLDI(32) | S(src2) | A(TMP_REG2)));
226 				src2 = TMP_REG2;
227 			}
228 			/* Setting XER SO is not enough, CR SO is also needed. */
229 			FAIL_IF(push_inst(compiler, ADD | OE(ALT_SET_FLAGS) | RC(ALT_SET_FLAGS) | D(dst) | A(src1) | B(src2)));
230 			if (flags & ALT_SIGN_EXT)
231 				return push_inst(compiler, SRDI(32) | S(dst) | A(dst));
232 			return SLJIT_SUCCESS;
233 		}
234 
235 		if (flags & ALT_FORM2) {
236 			/* Flags does not set: BIN_IMM_EXTS unnecessary. */
237 			SLJIT_ASSERT(src2 == TMP_REG2);
238 
239 			if (flags & ALT_FORM3)
240 				return push_inst(compiler, ADDIS | D(dst) | A(src1) | compiler->imm);
241 
242 			imm = compiler->imm;
243 
244 			if (flags & ALT_FORM4) {
245 				FAIL_IF(push_inst(compiler, ADDIS | D(dst) | A(src1) | (((imm >> 16) & 0xffff) + ((imm >> 15) & 0x1))));
246 				src1 = dst;
247 			}
248 
249 			return push_inst(compiler, ADDI | D(dst) | A(src1) | (imm & 0xffff));
250 		}
251 		if (flags & ALT_FORM3) {
252 			SLJIT_ASSERT(src2 == TMP_REG2);
253 			BIN_IMM_EXTS();
254 			return push_inst(compiler, ADDIC | D(dst) | A(src1) | compiler->imm);
255 		}
256 		if (flags & ALT_FORM4) {
257 			if (flags & ALT_FORM5)
258 				FAIL_IF(push_inst(compiler, ADDI | D(dst) | A(src1) | compiler->imm));
259 			else
260 				FAIL_IF(push_inst(compiler, ADD | D(dst) | A(src1) | B(src2)));
261 			return push_inst(compiler, CMPI | A(dst) | 0);
262 		}
263 		if (!(flags & ALT_SET_FLAGS))
264 			return push_inst(compiler, ADD | D(dst) | A(src1) | B(src2));
265 		BIN_EXTS();
266 		if (flags & ALT_FORM5)
267 			return push_inst(compiler, ADDC | RC(ALT_SET_FLAGS) | D(dst) | A(src1) | B(src2));
268 		return push_inst(compiler, ADD | RC(flags) | D(dst) | A(src1) | B(src2));
269 
270 	case SLJIT_ADDC:
271 		BIN_EXTS();
272 		return push_inst(compiler, ADDE | D(dst) | A(src1) | B(src2));
273 
274 	case SLJIT_SUB:
275 		if (flags & ALT_FORM1) {
276 			if (flags & ALT_FORM2) {
277 				FAIL_IF(push_inst(compiler, CMPLI | CRD(0 | ((flags & ALT_SIGN_EXT) ? 0 : 1)) | A(src1) | compiler->imm));
278 				if (!(flags & ALT_FORM3))
279 					return SLJIT_SUCCESS;
280 				return push_inst(compiler, ADDI | D(dst) | A(src1) | (-compiler->imm & 0xffff));
281 			}
282 			FAIL_IF(push_inst(compiler, CMPL | CRD(0 | ((flags & ALT_SIGN_EXT) ? 0 : 1)) | A(src1) | B(src2)));
283 			if (!(flags & ALT_FORM3))
284 				return SLJIT_SUCCESS;
285 			return push_inst(compiler, SUBF | D(dst) | A(src2) | B(src1));
286 		}
287 
288 		if (flags & ALT_FORM2) {
289 			if (flags & ALT_FORM3) {
290 				FAIL_IF(push_inst(compiler, CMPI | CRD(0 | ((flags & ALT_SIGN_EXT) ? 0 : 1)) | A(src1) | compiler->imm));
291 				if (!(flags & ALT_FORM4))
292 					return SLJIT_SUCCESS;
293 				return push_inst(compiler, ADDI | D(dst) | A(src1) | (-compiler->imm & 0xffff));
294 			}
295 			FAIL_IF(push_inst(compiler, CMP | CRD(0 | ((flags & ALT_SIGN_EXT) ? 0 : 1)) | A(src1) | B(src2)));
296 			if (!(flags & ALT_FORM4))
297 				return SLJIT_SUCCESS;
298 			return push_inst(compiler, SUBF | D(dst) | A(src2) | B(src1));
299 		}
300 
301 		if (flags & ALT_FORM3) {
302 			if (flags & ALT_SIGN_EXT) {
303 				if (src1 != TMP_ZERO) {
304 					FAIL_IF(push_inst(compiler, SLDI(32) | S(src1) | A(TMP_REG1)));
305 					src1 = TMP_REG1;
306 				}
307 				if (src2 != TMP_ZERO) {
308 					FAIL_IF(push_inst(compiler, SLDI(32) | S(src2) | A(TMP_REG2)));
309 					src2 = TMP_REG2;
310 				}
311 			}
312 
313 			/* Setting XER SO is not enough, CR SO is also needed. */
314 			if (src1 != TMP_ZERO)
315 				FAIL_IF(push_inst(compiler, SUBF | OE(ALT_SET_FLAGS) | RC(ALT_SET_FLAGS) | D(dst) | A(src2) | B(src1)));
316 			else
317 				FAIL_IF(push_inst(compiler, NEG | OE(ALT_SET_FLAGS) | RC(ALT_SET_FLAGS) | D(dst) | A(src2)));
318 
319 			if (flags & ALT_SIGN_EXT)
320 				return push_inst(compiler, SRDI(32) | S(dst) | A(dst));
321 			return SLJIT_SUCCESS;
322 		}
323 
324 		if (flags & ALT_FORM4) {
325 			/* Flags does not set: BIN_IMM_EXTS unnecessary. */
326 			SLJIT_ASSERT(src2 == TMP_REG2);
327 			return push_inst(compiler, SUBFIC | D(dst) | A(src1) | compiler->imm);
328 		}
329 
330 		if (!(flags & ALT_SET_FLAGS)) {
331 			SLJIT_ASSERT(src1 != TMP_ZERO);
332 			return push_inst(compiler, SUBF | D(dst) | A(src2) | B(src1));
333 		}
334 
335 		BIN_EXTS();
336 		if (flags & ALT_FORM5)
337 			return push_inst(compiler, SUBFC | RC(ALT_SET_FLAGS) | D(dst) | A(src2) | B(src1));
338 
339 		if (src1 != TMP_ZERO)
340 			return push_inst(compiler, SUBF | RC(ALT_SET_FLAGS) | D(dst) | A(src2) | B(src1));
341 		return push_inst(compiler, NEG | RC(ALT_SET_FLAGS) | D(dst) | A(src2));
342 
343 	case SLJIT_SUBC:
344 		BIN_EXTS();
345 		return push_inst(compiler, SUBFE | D(dst) | A(src2) | B(src1));
346 
347 	case SLJIT_MUL:
348 		if (flags & ALT_FORM1) {
349 			SLJIT_ASSERT(src2 == TMP_REG2);
350 			return push_inst(compiler, MULLI | D(dst) | A(src1) | compiler->imm);
351 		}
352 		BIN_EXTS();
353 		if (flags & ALT_FORM2)
354 			return push_inst(compiler, MULLW | OE(flags) | RC(flags) | D(dst) | A(src2) | B(src1));
355 		return push_inst(compiler, MULLD | OE(flags) | RC(flags) | D(dst) | A(src2) | B(src1));
356 
357 	case SLJIT_AND:
358 		if (flags & ALT_FORM1) {
359 			SLJIT_ASSERT(src2 == TMP_REG2);
360 			return push_inst(compiler, ANDI | S(src1) | A(dst) | compiler->imm);
361 		}
362 		if (flags & ALT_FORM2) {
363 			SLJIT_ASSERT(src2 == TMP_REG2);
364 			return push_inst(compiler, ANDIS | S(src1) | A(dst) | compiler->imm);
365 		}
366 		return push_inst(compiler, AND | RC(flags) | S(src1) | A(dst) | B(src2));
367 
368 	case SLJIT_OR:
369 		if (flags & ALT_FORM1) {
370 			SLJIT_ASSERT(src2 == TMP_REG2);
371 			return push_inst(compiler, ORI | S(src1) | A(dst) | compiler->imm);
372 		}
373 		if (flags & ALT_FORM2) {
374 			SLJIT_ASSERT(src2 == TMP_REG2);
375 			return push_inst(compiler, ORIS | S(src1) | A(dst) | compiler->imm);
376 		}
377 		if (flags & ALT_FORM3) {
378 			SLJIT_ASSERT(src2 == TMP_REG2);
379 			imm = compiler->imm;
380 
381 			FAIL_IF(push_inst(compiler, ORI | S(src1) | A(dst) | IMM(imm)));
382 			return push_inst(compiler, ORIS | S(dst) | A(dst) | IMM(imm >> 16));
383 		}
384 		return push_inst(compiler, OR | RC(flags) | S(src1) | A(dst) | B(src2));
385 
386 	case SLJIT_XOR:
387 		if (flags & ALT_FORM1) {
388 			SLJIT_ASSERT(src2 == TMP_REG2);
389 			return push_inst(compiler, XORI | S(src1) | A(dst) | compiler->imm);
390 		}
391 		if (flags & ALT_FORM2) {
392 			SLJIT_ASSERT(src2 == TMP_REG2);
393 			return push_inst(compiler, XORIS | S(src1) | A(dst) | compiler->imm);
394 		}
395 		if (flags & ALT_FORM3) {
396 			SLJIT_ASSERT(src2 == TMP_REG2);
397 			imm = compiler->imm;
398 
399 			FAIL_IF(push_inst(compiler, XORI | S(src1) | A(dst) | IMM(imm)));
400 			return push_inst(compiler, XORIS | S(dst) | A(dst) | IMM(imm >> 16));
401 		}
402 		if (flags & ALT_FORM4) {
403 			SLJIT_ASSERT(src1 == TMP_REG1);
404 			UN_EXTS();
405 			return push_inst(compiler, NOR | RC(flags) | S(src2) | A(dst) | B(src2));
406 		}
407 		return push_inst(compiler, XOR | RC(flags) | S(src1) | A(dst) | B(src2));
408 
409 	case SLJIT_SHL:
410 	case SLJIT_MSHL:
411 		if (flags & ALT_FORM1) {
412 			SLJIT_ASSERT(src2 == TMP_REG2);
413 			imm = compiler->imm;
414 
415 			if (flags & ALT_FORM2) {
416 				imm &= 0x1f;
417 				return push_inst(compiler, SLWI(imm) | RC(flags) | S(src1) | A(dst));
418 			}
419 
420 			imm &= 0x3f;
421 			return push_inst(compiler, SLDI(imm) | RC(flags) | S(src1) | A(dst));
422 		}
423 
424 		if (op == SLJIT_MSHL) {
425 			FAIL_IF(push_inst(compiler, ANDI | S(src2) | A(TMP_REG2) | ((flags & ALT_FORM2) ? 0x1f : 0x3f)));
426 			src2 = TMP_REG2;
427 		}
428 
429 		return push_inst(compiler, ((flags & ALT_FORM2) ? SLW : SLD) | RC(flags) | S(src1) | A(dst) | B(src2));
430 
431 	case SLJIT_LSHR:
432 	case SLJIT_MLSHR:
433 		if (flags & ALT_FORM1) {
434 			SLJIT_ASSERT(src2 == TMP_REG2);
435 			imm = compiler->imm;
436 
437 			if (flags & ALT_FORM2) {
438 				imm &= 0x1f;
439 				/* Since imm can be 0, SRWI() cannot be used. */
440 				return push_inst(compiler, RLWINM | RC(flags) | S(src1) | A(dst) | RLWI_SH((32 - imm) & 0x1f) | RLWI_MBE(imm, 31));
441 			}
442 
443 			imm &= 0x3f;
444 			/* Since imm can be 0, SRDI() cannot be used. */
445 			return push_inst(compiler, RLDICL | RC(flags) | S(src1) | A(dst) | RLDI_SH((64 - imm) & 0x3f) | RLDI_MB(imm));
446 		}
447 
448 		if (op == SLJIT_MLSHR) {
449 			FAIL_IF(push_inst(compiler, ANDI | S(src2) | A(TMP_REG2) | ((flags & ALT_FORM2) ? 0x1f : 0x3f)));
450 			src2 = TMP_REG2;
451 		}
452 
453 		return push_inst(compiler, ((flags & ALT_FORM2) ? SRW : SRD) | RC(flags) | S(src1) | A(dst) | B(src2));
454 
455 	case SLJIT_ASHR:
456 	case SLJIT_MASHR:
457 		if (flags & ALT_FORM1) {
458 			SLJIT_ASSERT(src2 == TMP_REG2);
459 			imm = compiler->imm;
460 
461 			if (flags & ALT_FORM2) {
462 				imm &= 0x1f;
463 				return push_inst(compiler, SRAWI | RC(flags) | S(src1) | A(dst) | (imm << 11));
464 			}
465 
466 			imm &= 0x3f;
467 			return push_inst(compiler, SRADI | RC(flags) | S(src1) | A(dst) | RLDI_SH(imm));
468 		}
469 
470 		if (op == SLJIT_MASHR) {
471 			FAIL_IF(push_inst(compiler, ANDI | S(src2) | A(TMP_REG2) | ((flags & ALT_FORM2) ? 0x1f : 0x3f)));
472 			src2 = TMP_REG2;
473 		}
474 
475 		return push_inst(compiler, ((flags & ALT_FORM2) ? SRAW : SRAD) | RC(flags) | S(src1) | A(dst) | B(src2));
476 
477 	case SLJIT_ROTL:
478 	case SLJIT_ROTR:
479 		if (flags & ALT_FORM1) {
480 			SLJIT_ASSERT(src2 == TMP_REG2);
481 			imm = compiler->imm;
482 
483 			if (op == SLJIT_ROTR)
484 				imm = (sljit_u32)(-(sljit_s32)imm);
485 
486 			if (flags & ALT_FORM2) {
487 				imm &= 0x1f;
488 				return push_inst(compiler, RLWINM | S(src1) | A(dst) | RLWI_SH(imm) | RLWI_MBE(0, 31));
489 			}
490 
491 			imm &= 0x3f;
492 			return push_inst(compiler, RLDICL | S(src1) | A(dst) | RLDI_SH(imm));
493 		}
494 
495 		if (op == SLJIT_ROTR) {
496 			FAIL_IF(push_inst(compiler, SUBFIC | D(TMP_REG2) | A(src2) | 0));
497 			src2 = TMP_REG2;
498 		}
499 
500 		return push_inst(compiler, ((flags & ALT_FORM2) ? (RLWNM | RLWI_MBE(0, 31)) : (RLDCL | RLDI_MB(0))) | S(src1) | A(dst) | B(src2));
501 	}
502 
503 	SLJIT_UNREACHABLE();
504 	return SLJIT_SUCCESS;
505 }
506 
call_with_args(struct sljit_compiler * compiler,sljit_s32 arg_types,sljit_s32 * src)507 static sljit_s32 call_with_args(struct sljit_compiler *compiler, sljit_s32 arg_types, sljit_s32 *src)
508 {
509 	sljit_s32 arg_count = 0;
510 	sljit_s32 word_arg_count = 0;
511 	sljit_s32 types = 0;
512 	sljit_s32 reg = 0;
513 
514 	if (src)
515 		reg = *src & REG_MASK;
516 
517 	arg_types >>= SLJIT_ARG_SHIFT;
518 
519 	while (arg_types) {
520 		types = (types << SLJIT_ARG_SHIFT) | (arg_types & SLJIT_ARG_MASK);
521 
522 		switch (arg_types & SLJIT_ARG_MASK) {
523 		case SLJIT_ARG_TYPE_F64:
524 		case SLJIT_ARG_TYPE_F32:
525 			arg_count++;
526 			break;
527 		default:
528 			arg_count++;
529 			word_arg_count++;
530 
531 			if (arg_count != word_arg_count && arg_count == reg) {
532 				FAIL_IF(push_inst(compiler, OR | S(reg) | A(TMP_CALL_REG) | B(reg)));
533 				*src = TMP_CALL_REG;
534 			}
535 			break;
536 		}
537 
538 		arg_types >>= SLJIT_ARG_SHIFT;
539 	}
540 
541 	while (types) {
542 		switch (types & SLJIT_ARG_MASK) {
543 		case SLJIT_ARG_TYPE_F64:
544 		case SLJIT_ARG_TYPE_F32:
545 			arg_count--;
546 			break;
547 		default:
548 			if (arg_count != word_arg_count)
549 				FAIL_IF(push_inst(compiler, OR | S(word_arg_count) | A(arg_count) | B(word_arg_count)));
550 
551 			arg_count--;
552 			word_arg_count--;
553 			break;
554 		}
555 
556 		types >>= SLJIT_ARG_SHIFT;
557 	}
558 
559 	return SLJIT_SUCCESS;
560 }
561 
emit_const(struct sljit_compiler * compiler,sljit_s32 reg,sljit_sw init_value)562 static SLJIT_INLINE sljit_s32 emit_const(struct sljit_compiler *compiler, sljit_s32 reg, sljit_sw init_value)
563 {
564 	FAIL_IF(push_inst(compiler, ADDIS | D(reg) | A(0) | IMM(init_value >> 48)));
565 	FAIL_IF(push_inst(compiler, ORI | S(reg) | A(reg) | IMM(init_value >> 32)));
566 	FAIL_IF(push_inst(compiler, SLDI(32) | S(reg) | A(reg)));
567 	FAIL_IF(push_inst(compiler, ORIS | S(reg) | A(reg) | IMM(init_value >> 16)));
568 	return push_inst(compiler, ORI | S(reg) | A(reg) | IMM(init_value));
569 }
570 
sljit_emit_fop1_conv_f64_from_sw(struct sljit_compiler * compiler,sljit_s32 op,sljit_s32 dst,sljit_sw dstw,sljit_s32 src,sljit_sw srcw)571 static SLJIT_INLINE sljit_s32 sljit_emit_fop1_conv_f64_from_sw(struct sljit_compiler *compiler, sljit_s32 op,
572 	sljit_s32 dst, sljit_sw dstw,
573 	sljit_s32 src, sljit_sw srcw)
574 {
575 	sljit_s32 dst_r = FAST_IS_REG(dst) ? dst : TMP_FREG1;
576 
577 	if (src == SLJIT_IMM) {
578 		if (GET_OPCODE(op) == SLJIT_CONV_F64_FROM_S32)
579 			srcw = (sljit_s32)srcw;
580 
581 		FAIL_IF(load_immediate(compiler, TMP_REG1, srcw));
582 		src = TMP_REG1;
583 	} else if (GET_OPCODE(op) == SLJIT_CONV_F64_FROM_S32) {
584 		if (FAST_IS_REG(src))
585 			FAIL_IF(push_inst(compiler, EXTSW | S(src) | A(TMP_REG1)));
586 		else
587 			FAIL_IF(emit_op_mem(compiler, INT_DATA | SIGNED_DATA | LOAD_DATA, TMP_REG1, src, srcw, TMP_REG1));
588 		src = TMP_REG1;
589 	}
590 
591 	if (FAST_IS_REG(src)) {
592 		FAIL_IF(push_inst(compiler, STD | S(src) | A(SLJIT_SP) | TMP_MEM_OFFSET));
593 		FAIL_IF(push_inst(compiler, LFD | FS(TMP_FREG1) | A(SLJIT_SP) | TMP_MEM_OFFSET));
594 	} else
595 		FAIL_IF(emit_op_mem(compiler, DOUBLE_DATA | LOAD_DATA, TMP_FREG1, src, srcw, TMP_REG1));
596 
597 	FAIL_IF(push_inst(compiler, FCFID | FD(dst_r) | FB(TMP_FREG1)));
598 
599 	if (op & SLJIT_32)
600 		FAIL_IF(push_inst(compiler, FRSP | FD(dst_r) | FB(dst_r)));
601 
602 	if (dst & SLJIT_MEM)
603 		return emit_op_mem(compiler, FLOAT_DATA(op), TMP_FREG1, dst, dstw, TMP_REG1);
604 	return SLJIT_SUCCESS;
605 }
606 
sljit_emit_fop1_conv_f64_from_uw(struct sljit_compiler * compiler,sljit_s32 op,sljit_s32 dst,sljit_sw dstw,sljit_s32 src,sljit_sw srcw)607 static SLJIT_INLINE sljit_s32 sljit_emit_fop1_conv_f64_from_uw(struct sljit_compiler *compiler, sljit_s32 op,
608 	sljit_s32 dst, sljit_sw dstw,
609 	sljit_s32 src, sljit_sw srcw)
610 {
611 	sljit_s32 dst_r = FAST_IS_REG(dst) ? dst : TMP_FREG1;
612 
613 	if (GET_OPCODE(op) == SLJIT_CONV_F64_FROM_U32) {
614 		if (src == SLJIT_IMM) {
615 			FAIL_IF(load_immediate(compiler, TMP_REG1, (sljit_u32)srcw));
616 			src = TMP_REG1;
617 		} else {
618 			if (FAST_IS_REG(src))
619 				FAIL_IF(push_inst(compiler, CLRLDI(TMP_REG1, src, 32)));
620 			else
621 				FAIL_IF(emit_op_mem(compiler, INT_DATA | LOAD_DATA, TMP_REG1, src, srcw, TMP_REG1));
622 			src = TMP_REG1;
623 		}
624 
625 		FAIL_IF(push_inst(compiler, STD | S(src) | A(SLJIT_SP) | TMP_MEM_OFFSET));
626 		FAIL_IF(push_inst(compiler, LFD | FS(TMP_FREG1) | A(SLJIT_SP) | TMP_MEM_OFFSET));
627 		FAIL_IF(push_inst(compiler, FCFID | FD(dst_r) | FB(TMP_FREG1)));
628 	} else {
629 		if (src == SLJIT_IMM) {
630 			FAIL_IF(load_immediate(compiler, TMP_REG1, srcw));
631 			src = TMP_REG1;
632 		} else if (src & SLJIT_MEM) {
633 			FAIL_IF(emit_op_mem(compiler, WORD_DATA | LOAD_DATA, TMP_REG1, src, srcw, TMP_REG1));
634 			src = TMP_REG1;
635 		}
636 
637 		FAIL_IF(push_inst(compiler, CMPI | CRD(0 | 1) | A(src) | 0));
638 		FAIL_IF(push_inst(compiler, BCx | (12 << 21) | (0 << 16) | 20));
639 		FAIL_IF(push_inst(compiler, STD | S(src) | A(SLJIT_SP) | TMP_MEM_OFFSET));
640 		FAIL_IF(push_inst(compiler, LFD | FS(TMP_FREG1) | A(SLJIT_SP) | TMP_MEM_OFFSET));
641 		FAIL_IF(push_inst(compiler, FCFID | FD(dst_r) | FB(TMP_FREG1)));
642 		FAIL_IF(push_inst(compiler, Bx | ((op & SLJIT_32) ? 36 : 32)));
643 
644 		if (op & SLJIT_32)
645 			FAIL_IF(push_inst(compiler, RLWINM | S(src) | A(TMP_REG2) | RLWI_SH(10) | RLWI_MBE(10, 21)));
646 		else
647 			FAIL_IF(push_inst(compiler, ANDI | S(src) | A(TMP_REG2) | 0x1));
648 
649 		/* Shift right. */
650 		FAIL_IF(push_inst(compiler, RLDICL | S(src) | A(TMP_REG1) | RLDI_SH(63) | RLDI_MB(1)));
651 
652 		if (op & SLJIT_32)
653 			FAIL_IF(push_inst(compiler, RLDICR | S(TMP_REG1) | A(TMP_REG1) | RLDI_SH(0) | RLDI_ME(53)));
654 
655 		FAIL_IF(push_inst(compiler, OR | S(TMP_REG1) | A(TMP_REG1) | B(TMP_REG2)));
656 
657 		FAIL_IF(push_inst(compiler, STD | S(TMP_REG1) | A(SLJIT_SP) | TMP_MEM_OFFSET));
658 		FAIL_IF(push_inst(compiler, LFD | FS(TMP_FREG1) | A(SLJIT_SP) | TMP_MEM_OFFSET));
659 		FAIL_IF(push_inst(compiler, FCFID | FD(dst_r) | FB(TMP_FREG1)));
660 		FAIL_IF(push_inst(compiler, FADD | FD(dst_r) | FA(dst_r) | FB(dst_r)));
661 	}
662 
663 	if (op & SLJIT_32)
664 		FAIL_IF(push_inst(compiler, FRSP | FD(dst_r) | FB(dst_r)));
665 
666 	if (dst & SLJIT_MEM)
667 		return emit_op_mem(compiler, FLOAT_DATA(op), TMP_FREG1, dst, dstw, TMP_REG1);
668 	return SLJIT_SUCCESS;
669 }
670 
sljit_emit_fset64(struct sljit_compiler * compiler,sljit_s32 freg,sljit_f64 value)671 SLJIT_API_FUNC_ATTRIBUTE sljit_s32 sljit_emit_fset64(struct sljit_compiler *compiler,
672 	sljit_s32 freg, sljit_f64 value)
673 {
674 	union {
675 		sljit_sw imm;
676 		sljit_f64 value;
677 	} u;
678 
679 	CHECK_ERROR();
680 	CHECK(check_sljit_emit_fset64(compiler, freg, value));
681 
682 	u.value = value;
683 
684 	if (u.imm != 0)
685 		FAIL_IF(load_immediate(compiler, TMP_REG1, u.imm));
686 
687 	FAIL_IF(push_inst(compiler, STD | S(u.imm != 0 ? TMP_REG1 : TMP_ZERO) | A(SLJIT_SP) | TMP_MEM_OFFSET));
688 	return push_inst(compiler, LFD | FS(freg) | A(SLJIT_SP) | TMP_MEM_OFFSET);
689 }
690 
sljit_emit_fcopy(struct sljit_compiler * compiler,sljit_s32 op,sljit_s32 freg,sljit_s32 reg)691 SLJIT_API_FUNC_ATTRIBUTE sljit_s32 sljit_emit_fcopy(struct sljit_compiler *compiler, sljit_s32 op,
692 	sljit_s32 freg, sljit_s32 reg)
693 {
694 	CHECK_ERROR();
695 	CHECK(check_sljit_emit_fcopy(compiler, op, freg, reg));
696 
697 	if (GET_OPCODE(op) == SLJIT_COPY_TO_F64) {
698 		FAIL_IF(push_inst(compiler, ((op & SLJIT_32) ? STW : STD) | S(reg) | A(SLJIT_SP) | TMP_MEM_OFFSET));
699 		return push_inst(compiler, ((op & SLJIT_32) ? LFS : LFD) | FS(freg) | A(SLJIT_SP) | TMP_MEM_OFFSET);
700 	}
701 
702 	FAIL_IF(push_inst(compiler, ((op & SLJIT_32) ? STFS : STFD) | FS(freg) | A(SLJIT_SP) | TMP_MEM_OFFSET));
703 	return push_inst(compiler, ((op & SLJIT_32) ? LWZ : LD) | S(reg) | A(SLJIT_SP) | TMP_MEM_OFFSET);
704 }
705 
sljit_set_jump_addr(sljit_uw addr,sljit_uw new_target,sljit_sw executable_offset)706 SLJIT_API_FUNC_ATTRIBUTE void sljit_set_jump_addr(sljit_uw addr, sljit_uw new_target, sljit_sw executable_offset)
707 {
708 	sljit_ins *inst = (sljit_ins*)addr;
709 	SLJIT_UNUSED_ARG(executable_offset);
710 
711 	SLJIT_UPDATE_WX_FLAGS(inst, inst + 5, 0);
712 	inst[0] = (inst[0] & 0xffff0000u) | ((sljit_ins)(new_target >> 48) & 0xffff);
713 	inst[1] = (inst[1] & 0xffff0000u) | ((sljit_ins)(new_target >> 32) & 0xffff);
714 	inst[3] = (inst[3] & 0xffff0000u) | ((sljit_ins)(new_target >> 16) & 0xffff);
715 	inst[4] = (inst[4] & 0xffff0000u) | ((sljit_ins)new_target & 0xffff);
716 	SLJIT_UPDATE_WX_FLAGS(inst, inst + 5, 1);
717 	inst = (sljit_ins *)SLJIT_ADD_EXEC_OFFSET(inst, executable_offset);
718 	SLJIT_CACHE_FLUSH(inst, inst + 5);
719 }
720