1 /*
2  *    Stack-less Just-In-Time compiler
3  *
4  *    Copyright Zoltan Herczeg (hzmester@freemail.hu). All rights reserved.
5  *
6  * Redistribution and use in source and binary forms, with or without modification, are
7  * permitted provided that the following conditions are met:
8  *
9  *   1. Redistributions of source code must retain the above copyright notice, this list of
10  *      conditions and the following disclaimer.
11  *
12  *   2. Redistributions in binary form must reproduce the above copyright notice, this list
13  *      of conditions and the following disclaimer in the documentation and/or other materials
14  *      provided with the distribution.
15  *
16  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDER(S) AND CONTRIBUTORS ``AS IS'' AND ANY
17  * EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
18  * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT
19  * SHALL THE COPYRIGHT HOLDER(S) OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,
20  * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED
21  * TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
22  * BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
23  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN
24  * ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
25  */
26 
27 /* ppc 64-bit arch dependent functions. */
28 
29 #if defined(__GNUC__) || (defined(__IBM_GCC_ASM) && __IBM_GCC_ASM)
30 #define ASM_SLJIT_CLZ(src, dst) \
31 	__asm__ volatile ( "cntlzd %0, %1" : "=r"(dst) : "r"(src) )
32 #elif defined(__xlc__)
33 #error "Please enable GCC syntax for inline assembly statements"
34 #else
35 #error "Must implement count leading zeroes"
36 #endif
37 
38 /* Computes SLDI(63 - shift). */
39 #define PUSH_SLDI_NEG(reg, shift) \
40 	push_inst(compiler, RLDICR | S(reg) | A(reg) | RLDI_SH(63 - shift) | RLDI_ME(shift))
41 
load_immediate(struct sljit_compiler * compiler,sljit_s32 reg,sljit_sw imm)42 static sljit_s32 load_immediate(struct sljit_compiler *compiler, sljit_s32 reg, sljit_sw imm)
43 {
44 	sljit_uw tmp;
45 	sljit_uw shift;
46 	sljit_uw tmp2;
47 	sljit_uw shift2;
48 
49 	if (imm <= SIMM_MAX && imm >= SIMM_MIN)
50 		return push_inst(compiler, ADDI | D(reg) | A(0) | IMM(imm));
51 
52 	if (!(imm & ~0xffff))
53 		return push_inst(compiler, ORI | S(TMP_ZERO) | A(reg) | IMM(imm));
54 
55 	if (imm <= 0x7fffffffl && imm >= -0x80000000l) {
56 		FAIL_IF(push_inst(compiler, ADDIS | D(reg) | A(0) | IMM(imm >> 16)));
57 		return (imm & 0xffff) ? push_inst(compiler, ORI | S(reg) | A(reg) | IMM(imm)) : SLJIT_SUCCESS;
58 	}
59 
60 	/* Count leading zeroes. */
61 	tmp = (sljit_uw)((imm >= 0) ? imm : ~imm);
62 	ASM_SLJIT_CLZ(tmp, shift);
63 	SLJIT_ASSERT(shift > 0);
64 	shift--;
65 	tmp = ((sljit_uw)imm << shift);
66 
67 	if ((tmp & ~0xffff000000000000ul) == 0) {
68 		FAIL_IF(push_inst(compiler, ADDI | D(reg) | A(0) | (sljit_ins)(tmp >> 48)));
69 		shift += 15;
70 		return PUSH_SLDI_NEG(reg, shift);
71 	}
72 
73 	if ((tmp & ~0xffffffff00000000ul) == 0) {
74 		FAIL_IF(push_inst(compiler, ADDIS | D(reg) | A(0) | (sljit_ins)(tmp >> 48)));
75 		FAIL_IF(push_inst(compiler, ORI | S(reg) | A(reg) | IMM(tmp >> 32)));
76 		shift += 31;
77 		return PUSH_SLDI_NEG(reg, shift);
78 	}
79 
80 	/* Cut out the 16 bit from immediate. */
81 	shift += 15;
82 	tmp2 = (sljit_uw)imm & (((sljit_uw)1 << (63 - shift)) - 1);
83 
84 	if (tmp2 <= 0xffff) {
85 		FAIL_IF(push_inst(compiler, ADDI | D(reg) | A(0) | (sljit_ins)(tmp >> 48)));
86 		FAIL_IF(PUSH_SLDI_NEG(reg, shift));
87 		return push_inst(compiler, ORI | S(reg) | A(reg) | (sljit_ins)tmp2);
88 	}
89 
90 	if (tmp2 <= 0xffffffff) {
91 		FAIL_IF(push_inst(compiler, ADDI | D(reg) | A(0) | IMM(tmp >> 48)));
92 		FAIL_IF(PUSH_SLDI_NEG(reg, shift));
93 		FAIL_IF(push_inst(compiler, ORIS | S(reg) | A(reg) | (sljit_ins)(tmp2 >> 16)));
94 		return (imm & 0xffff) ? push_inst(compiler, ORI | S(reg) | A(reg) | IMM(tmp2)) : SLJIT_SUCCESS;
95 	}
96 
97 	ASM_SLJIT_CLZ(tmp2, shift2);
98 	tmp2 <<= shift2;
99 
100 	if ((tmp2 & ~0xffff000000000000ul) == 0) {
101 		FAIL_IF(push_inst(compiler, ADDI | D(reg) | A(0) | (sljit_ins)(tmp >> 48)));
102 		shift2 += 15;
103 		shift += (63 - shift2);
104 		FAIL_IF(PUSH_SLDI_NEG(reg, shift));
105 		FAIL_IF(push_inst(compiler, ORI | S(reg) | A(reg) | (sljit_ins)(tmp2 >> 48)));
106 		return PUSH_SLDI_NEG(reg, shift2);
107 	}
108 
109 	/* The general version. */
110 	FAIL_IF(push_inst(compiler, ADDIS | D(reg) | A(0) | (sljit_ins)((sljit_uw)imm >> 48)));
111 	FAIL_IF(push_inst(compiler, ORI | S(reg) | A(reg) | IMM(imm >> 32)));
112 	FAIL_IF(PUSH_SLDI_NEG(reg, 31));
113 	FAIL_IF(push_inst(compiler, ORIS | S(reg) | A(reg) | IMM(imm >> 16)));
114 	return push_inst(compiler, ORI | S(reg) | A(reg) | IMM(imm));
115 }
116 
117 #undef PUSH_SLDI_NEG
118 
119 #define CLRLDI(dst, src, n) \
120 	(RLDICL | S(src) | A(dst) | RLDI_SH(0) | RLDI_MB(n))
121 
122 /* Sign extension for integer operations. */
123 #define UN_EXTS() \
124 	if ((flags & (ALT_SIGN_EXT | REG2_SOURCE)) == (ALT_SIGN_EXT | REG2_SOURCE)) { \
125 		FAIL_IF(push_inst(compiler, EXTSW | S(src2) | A(TMP_REG2))); \
126 		src2 = TMP_REG2; \
127 	}
128 
129 #define BIN_EXTS() \
130 	if (flags & ALT_SIGN_EXT) { \
131 		if (flags & REG1_SOURCE) { \
132 			FAIL_IF(push_inst(compiler, EXTSW | S(src1) | A(TMP_REG1))); \
133 			src1 = TMP_REG1; \
134 		} \
135 		if (flags & REG2_SOURCE) { \
136 			FAIL_IF(push_inst(compiler, EXTSW | S(src2) | A(TMP_REG2))); \
137 			src2 = TMP_REG2; \
138 		} \
139 	}
140 
141 #define BIN_IMM_EXTS() \
142 	if ((flags & (ALT_SIGN_EXT | REG1_SOURCE)) == (ALT_SIGN_EXT | REG1_SOURCE)) { \
143 		FAIL_IF(push_inst(compiler, EXTSW | S(src1) | A(TMP_REG1))); \
144 		src1 = TMP_REG1; \
145 	}
146 
emit_single_op(struct sljit_compiler * compiler,sljit_s32 op,sljit_s32 flags,sljit_s32 dst,sljit_s32 src1,sljit_s32 src2)147 static SLJIT_INLINE sljit_s32 emit_single_op(struct sljit_compiler *compiler, sljit_s32 op, sljit_s32 flags,
148 	sljit_s32 dst, sljit_s32 src1, sljit_s32 src2)
149 {
150 	sljit_u32 imm;
151 
152 	switch (op) {
153 	case SLJIT_MOV:
154 	case SLJIT_MOV_P:
155 		SLJIT_ASSERT(src1 == TMP_REG1);
156 		if (dst != src2)
157 			return push_inst(compiler, OR | S(src2) | A(dst) | B(src2));
158 		return SLJIT_SUCCESS;
159 
160 	case SLJIT_MOV_U32:
161 	case SLJIT_MOV_S32:
162 		SLJIT_ASSERT(src1 == TMP_REG1);
163 		if ((flags & (REG_DEST | REG2_SOURCE)) == (REG_DEST | REG2_SOURCE)) {
164 			if (op == SLJIT_MOV_S32)
165 				return push_inst(compiler, EXTSW | S(src2) | A(dst));
166 			return push_inst(compiler, CLRLDI(dst, src2, 32));
167 		}
168 		else {
169 			SLJIT_ASSERT(dst == src2);
170 		}
171 		return SLJIT_SUCCESS;
172 
173 	case SLJIT_MOV_U8:
174 	case SLJIT_MOV_S8:
175 		SLJIT_ASSERT(src1 == TMP_REG1);
176 		if ((flags & (REG_DEST | REG2_SOURCE)) == (REG_DEST | REG2_SOURCE)) {
177 			if (op == SLJIT_MOV_S8)
178 				return push_inst(compiler, EXTSB | S(src2) | A(dst));
179 			return push_inst(compiler, CLRLDI(dst, src2, 56));
180 		}
181 		else if ((flags & REG_DEST) && op == SLJIT_MOV_S8)
182 			return push_inst(compiler, EXTSB | S(src2) | A(dst));
183 		else {
184 			SLJIT_ASSERT(dst == src2);
185 		}
186 		return SLJIT_SUCCESS;
187 
188 	case SLJIT_MOV_U16:
189 	case SLJIT_MOV_S16:
190 		SLJIT_ASSERT(src1 == TMP_REG1);
191 		if ((flags & (REG_DEST | REG2_SOURCE)) == (REG_DEST | REG2_SOURCE)) {
192 			if (op == SLJIT_MOV_S16)
193 				return push_inst(compiler, EXTSH | S(src2) | A(dst));
194 			return push_inst(compiler, CLRLDI(dst, src2, 48));
195 		}
196 		else {
197 			SLJIT_ASSERT(dst == src2);
198 		}
199 		return SLJIT_SUCCESS;
200 
201 	case SLJIT_NOT:
202 		SLJIT_ASSERT(src1 == TMP_REG1);
203 		UN_EXTS();
204 		return push_inst(compiler, NOR | RC(flags) | S(src2) | A(dst) | B(src2));
205 
206 	case SLJIT_CLZ:
207 		SLJIT_ASSERT(src1 == TMP_REG1);
208 		return push_inst(compiler, ((flags & ALT_FORM1) ? CNTLZW : CNTLZD) | S(src2) | A(dst));
209 
210 	case SLJIT_CTZ:
211 		SLJIT_ASSERT(src1 == TMP_REG1);
212 		FAIL_IF(push_inst(compiler, NEG | D(TMP_REG1) | A(src2)));
213 		FAIL_IF(push_inst(compiler, AND | S(src2) | A(dst) | B(TMP_REG1)));
214 		FAIL_IF(push_inst(compiler, ((flags & ALT_FORM1) ? CNTLZW : CNTLZD) | S(dst) | A(dst)));
215 		FAIL_IF(push_inst(compiler, ADDI | D(TMP_REG1) | A(dst) | IMM((flags & ALT_FORM1) ? -32 : -64)));
216 		/* The highest bits are set, if dst < bit width, zero otherwise. */
217 		FAIL_IF(push_inst(compiler, ((flags & ALT_FORM1) ? SRWI(27) : SRDI(58)) | S(TMP_REG1) | A(TMP_REG1)));
218 		return push_inst(compiler, XOR | S(dst) | A(dst) | B(TMP_REG1));
219 
220 	case SLJIT_ADD:
221 		if (flags & ALT_FORM1) {
222 			if (flags & ALT_SIGN_EXT) {
223 				FAIL_IF(push_inst(compiler, SLDI(32) | S(src1) | A(TMP_REG1)));
224 				src1 = TMP_REG1;
225 				FAIL_IF(push_inst(compiler, SLDI(32) | S(src2) | A(TMP_REG2)));
226 				src2 = TMP_REG2;
227 			}
228 			/* Setting XER SO is not enough, CR SO is also needed. */
229 			FAIL_IF(push_inst(compiler, ADD | OE(ALT_SET_FLAGS) | RC(ALT_SET_FLAGS) | D(dst) | A(src1) | B(src2)));
230 			if (flags & ALT_SIGN_EXT)
231 				return push_inst(compiler, SRDI(32) | S(dst) | A(dst));
232 			return SLJIT_SUCCESS;
233 		}
234 
235 		if (flags & ALT_FORM2) {
236 			/* Flags does not set: BIN_IMM_EXTS unnecessary. */
237 			SLJIT_ASSERT(src2 == TMP_REG2);
238 
239 			if (flags & ALT_FORM3)
240 				return push_inst(compiler, ADDIS | D(dst) | A(src1) | compiler->imm);
241 
242 			imm = compiler->imm;
243 
244 			if (flags & ALT_FORM4) {
245 				FAIL_IF(push_inst(compiler, ADDIS | D(dst) | A(src1) | (((imm >> 16) & 0xffff) + ((imm >> 15) & 0x1))));
246 				src1 = dst;
247 			}
248 
249 			return push_inst(compiler, ADDI | D(dst) | A(src1) | (imm & 0xffff));
250 		}
251 		if (flags & ALT_FORM3) {
252 			SLJIT_ASSERT(src2 == TMP_REG2);
253 			BIN_IMM_EXTS();
254 			return push_inst(compiler, ADDIC | D(dst) | A(src1) | compiler->imm);
255 		}
256 		if (flags & ALT_FORM4) {
257 			if (flags & ALT_FORM5)
258 				FAIL_IF(push_inst(compiler, ADDI | D(dst) | A(src1) | compiler->imm));
259 			else
260 				FAIL_IF(push_inst(compiler, ADD | D(dst) | A(src1) | B(src2)));
261 			return push_inst(compiler, CMPI | A(dst) | 0);
262 		}
263 		if (!(flags & ALT_SET_FLAGS))
264 			return push_inst(compiler, ADD | D(dst) | A(src1) | B(src2));
265 		BIN_EXTS();
266 		if (flags & ALT_FORM5)
267 			return push_inst(compiler, ADDC | RC(ALT_SET_FLAGS) | D(dst) | A(src1) | B(src2));
268 		return push_inst(compiler, ADD | RC(flags) | D(dst) | A(src1) | B(src2));
269 
270 	case SLJIT_ADDC:
271 		BIN_EXTS();
272 		return push_inst(compiler, ADDE | D(dst) | A(src1) | B(src2));
273 
274 	case SLJIT_SUB:
275 		if (flags & ALT_FORM1) {
276 			if (flags & ALT_FORM2) {
277 				FAIL_IF(push_inst(compiler, CMPLI | CRD(0 | ((flags & ALT_SIGN_EXT) ? 0 : 1)) | A(src1) | compiler->imm));
278 				if (!(flags & ALT_FORM3))
279 					return SLJIT_SUCCESS;
280 				return push_inst(compiler, ADDI | D(dst) | A(src1) | (-compiler->imm & 0xffff));
281 			}
282 			FAIL_IF(push_inst(compiler, CMPL | CRD(0 | ((flags & ALT_SIGN_EXT) ? 0 : 1)) | A(src1) | B(src2)));
283 			if (!(flags & ALT_FORM3))
284 				return SLJIT_SUCCESS;
285 			return push_inst(compiler, SUBF | D(dst) | A(src2) | B(src1));
286 		}
287 
288 		if (flags & ALT_FORM2) {
289 			if (flags & ALT_FORM3) {
290 				FAIL_IF(push_inst(compiler, CMPI | CRD(0 | ((flags & ALT_SIGN_EXT) ? 0 : 1)) | A(src1) | compiler->imm));
291 				if (!(flags & ALT_FORM4))
292 					return SLJIT_SUCCESS;
293 				return push_inst(compiler, ADDI | D(dst) | A(src1) | (-compiler->imm & 0xffff));
294 			}
295 			FAIL_IF(push_inst(compiler, CMP | CRD(0 | ((flags & ALT_SIGN_EXT) ? 0 : 1)) | A(src1) | B(src2)));
296 			if (!(flags & ALT_FORM4))
297 				return SLJIT_SUCCESS;
298 			return push_inst(compiler, SUBF | D(dst) | A(src2) | B(src1));
299 		}
300 
301 		if (flags & ALT_FORM3) {
302 			if (flags & ALT_SIGN_EXT) {
303 				if (src1 != TMP_ZERO) {
304 					FAIL_IF(push_inst(compiler, SLDI(32) | S(src1) | A(TMP_REG1)));
305 					src1 = TMP_REG1;
306 				}
307 				if (src2 != TMP_ZERO) {
308 					FAIL_IF(push_inst(compiler, SLDI(32) | S(src2) | A(TMP_REG2)));
309 					src2 = TMP_REG2;
310 				}
311 			}
312 
313 			/* Setting XER SO is not enough, CR SO is also needed. */
314 			if (src1 != TMP_ZERO)
315 				FAIL_IF(push_inst(compiler, SUBF | OE(ALT_SET_FLAGS) | RC(ALT_SET_FLAGS) | D(dst) | A(src2) | B(src1)));
316 			else
317 				FAIL_IF(push_inst(compiler, NEG | OE(ALT_SET_FLAGS) | RC(ALT_SET_FLAGS) | D(dst) | A(src2)));
318 
319 			if (flags & ALT_SIGN_EXT)
320 				return push_inst(compiler, SRDI(32) | S(dst) | A(dst));
321 			return SLJIT_SUCCESS;
322 		}
323 
324 		if (flags & ALT_FORM4) {
325 			/* Flags does not set: BIN_IMM_EXTS unnecessary. */
326 			SLJIT_ASSERT(src2 == TMP_REG2);
327 			return push_inst(compiler, SUBFIC | D(dst) | A(src1) | compiler->imm);
328 		}
329 
330 		if (!(flags & ALT_SET_FLAGS)) {
331 			SLJIT_ASSERT(src1 != TMP_ZERO);
332 			return push_inst(compiler, SUBF | D(dst) | A(src2) | B(src1));
333 		}
334 
335 		BIN_EXTS();
336 		if (flags & ALT_FORM5)
337 			return push_inst(compiler, SUBFC | RC(ALT_SET_FLAGS) | D(dst) | A(src2) | B(src1));
338 
339 		if (src1 != TMP_ZERO)
340 			return push_inst(compiler, SUBF | RC(ALT_SET_FLAGS) | D(dst) | A(src2) | B(src1));
341 		return push_inst(compiler, NEG | RC(ALT_SET_FLAGS) | D(dst) | A(src2));
342 
343 	case SLJIT_SUBC:
344 		BIN_EXTS();
345 		return push_inst(compiler, SUBFE | D(dst) | A(src2) | B(src1));
346 
347 	case SLJIT_MUL:
348 		if (flags & ALT_FORM1) {
349 			SLJIT_ASSERT(src2 == TMP_REG2);
350 			return push_inst(compiler, MULLI | D(dst) | A(src1) | compiler->imm);
351 		}
352 		BIN_EXTS();
353 		if (flags & ALT_FORM2)
354 			return push_inst(compiler, MULLW | OE(flags) | RC(flags) | D(dst) | A(src2) | B(src1));
355 		return push_inst(compiler, MULLD | OE(flags) | RC(flags) | D(dst) | A(src2) | B(src1));
356 
357 	case SLJIT_AND:
358 		if (flags & ALT_FORM1) {
359 			SLJIT_ASSERT(src2 == TMP_REG2);
360 			return push_inst(compiler, ANDI | S(src1) | A(dst) | compiler->imm);
361 		}
362 		if (flags & ALT_FORM2) {
363 			SLJIT_ASSERT(src2 == TMP_REG2);
364 			return push_inst(compiler, ANDIS | S(src1) | A(dst) | compiler->imm);
365 		}
366 		return push_inst(compiler, AND | RC(flags) | S(src1) | A(dst) | B(src2));
367 
368 	case SLJIT_OR:
369 		if (flags & ALT_FORM1) {
370 			SLJIT_ASSERT(src2 == TMP_REG2);
371 			return push_inst(compiler, ORI | S(src1) | A(dst) | compiler->imm);
372 		}
373 		if (flags & ALT_FORM2) {
374 			SLJIT_ASSERT(src2 == TMP_REG2);
375 			return push_inst(compiler, ORIS | S(src1) | A(dst) | compiler->imm);
376 		}
377 		if (flags & ALT_FORM3) {
378 			SLJIT_ASSERT(src2 == TMP_REG2);
379 			imm = compiler->imm;
380 
381 			FAIL_IF(push_inst(compiler, ORI | S(src1) | A(dst) | IMM(imm)));
382 			return push_inst(compiler, ORIS | S(dst) | A(dst) | IMM(imm >> 16));
383 		}
384 		return push_inst(compiler, OR | RC(flags) | S(src1) | A(dst) | B(src2));
385 
386 	case SLJIT_XOR:
387 		if (flags & ALT_FORM1) {
388 			SLJIT_ASSERT(src2 == TMP_REG2);
389 			return push_inst(compiler, XORI | S(src1) | A(dst) | compiler->imm);
390 		}
391 		if (flags & ALT_FORM2) {
392 			SLJIT_ASSERT(src2 == TMP_REG2);
393 			return push_inst(compiler, XORIS | S(src1) | A(dst) | compiler->imm);
394 		}
395 		if (flags & ALT_FORM3) {
396 			SLJIT_ASSERT(src2 == TMP_REG2);
397 			imm = compiler->imm;
398 
399 			FAIL_IF(push_inst(compiler, XORI | S(src1) | A(dst) | IMM(imm)));
400 			return push_inst(compiler, XORIS | S(dst) | A(dst) | IMM(imm >> 16));
401 		}
402 		return push_inst(compiler, XOR | RC(flags) | S(src1) | A(dst) | B(src2));
403 
404 	case SLJIT_SHL:
405 	case SLJIT_MSHL:
406 		if (flags & ALT_FORM1) {
407 			SLJIT_ASSERT(src2 == TMP_REG2);
408 			imm = compiler->imm;
409 
410 			if (flags & ALT_FORM2) {
411 				imm &= 0x1f;
412 				return push_inst(compiler, SLWI(imm) | RC(flags) | S(src1) | A(dst));
413 			}
414 
415 			imm &= 0x3f;
416 			return push_inst(compiler, SLDI(imm) | RC(flags) | S(src1) | A(dst));
417 		}
418 
419 		if (op == SLJIT_MSHL) {
420 			FAIL_IF(push_inst(compiler, ANDI | S(src2) | A(TMP_REG2) | ((flags & ALT_FORM2) ? 0x1f : 0x3f)));
421 			src2 = TMP_REG2;
422 		}
423 
424 		return push_inst(compiler, ((flags & ALT_FORM2) ? SLW : SLD) | RC(flags) | S(src1) | A(dst) | B(src2));
425 
426 	case SLJIT_LSHR:
427 	case SLJIT_MLSHR:
428 		if (flags & ALT_FORM1) {
429 			SLJIT_ASSERT(src2 == TMP_REG2);
430 			imm = compiler->imm;
431 
432 			if (flags & ALT_FORM2) {
433 				imm &= 0x1f;
434 				/* Since imm can be 0, SRWI() cannot be used. */
435 				return push_inst(compiler, RLWINM | RC(flags) | S(src1) | A(dst) | RLWI_SH((32 - imm) & 0x1f) | RLWI_MBE(imm, 31));
436 			}
437 
438 			imm &= 0x3f;
439 			/* Since imm can be 0, SRDI() cannot be used. */
440 			return push_inst(compiler, RLDICL | RC(flags) | S(src1) | A(dst) | RLDI_SH((64 - imm) & 0x3f) | RLDI_MB(imm));
441 		}
442 
443 		if (op == SLJIT_MLSHR) {
444 			FAIL_IF(push_inst(compiler, ANDI | S(src2) | A(TMP_REG2) | ((flags & ALT_FORM2) ? 0x1f : 0x3f)));
445 			src2 = TMP_REG2;
446 		}
447 
448 		return push_inst(compiler, ((flags & ALT_FORM2) ? SRW : SRD) | RC(flags) | S(src1) | A(dst) | B(src2));
449 
450 	case SLJIT_ASHR:
451 	case SLJIT_MASHR:
452 		if (flags & ALT_FORM1) {
453 			SLJIT_ASSERT(src2 == TMP_REG2);
454 			imm = compiler->imm;
455 
456 			if (flags & ALT_FORM2) {
457 				imm &= 0x1f;
458 				return push_inst(compiler, SRAWI | RC(flags) | S(src1) | A(dst) | (imm << 11));
459 			}
460 
461 			imm &= 0x3f;
462 			return push_inst(compiler, SRADI | RC(flags) | S(src1) | A(dst) | RLDI_SH(imm));
463 		}
464 
465 		if (op == SLJIT_MASHR) {
466 			FAIL_IF(push_inst(compiler, ANDI | S(src2) | A(TMP_REG2) | ((flags & ALT_FORM2) ? 0x1f : 0x3f)));
467 			src2 = TMP_REG2;
468 		}
469 
470 		return push_inst(compiler, ((flags & ALT_FORM2) ? SRAW : SRAD) | RC(flags) | S(src1) | A(dst) | B(src2));
471 
472 	case SLJIT_ROTL:
473 	case SLJIT_ROTR:
474 		if (flags & ALT_FORM1) {
475 			SLJIT_ASSERT(src2 == TMP_REG2);
476 			imm = compiler->imm;
477 
478 			if (op == SLJIT_ROTR)
479 				imm = (sljit_u32)(-(sljit_s32)imm);
480 
481 			if (flags & ALT_FORM2) {
482 				imm &= 0x1f;
483 				return push_inst(compiler, RLWINM | S(src1) | A(dst) | RLWI_SH(imm) | RLWI_MBE(0, 31));
484 			}
485 
486 			imm &= 0x3f;
487 			return push_inst(compiler, RLDICL | S(src1) | A(dst) | RLDI_SH(imm));
488 		}
489 
490 		if (op == SLJIT_ROTR) {
491 			FAIL_IF(push_inst(compiler, SUBFIC | D(TMP_REG2) | A(src2) | 0));
492 			src2 = TMP_REG2;
493 		}
494 
495 		return push_inst(compiler, ((flags & ALT_FORM2) ? (RLWNM | RLWI_MBE(0, 31)) : (RLDCL | RLDI_MB(0))) | S(src1) | A(dst) | B(src2));
496 	}
497 
498 	SLJIT_UNREACHABLE();
499 	return SLJIT_SUCCESS;
500 }
501 
call_with_args(struct sljit_compiler * compiler,sljit_s32 arg_types,sljit_s32 * src)502 static sljit_s32 call_with_args(struct sljit_compiler *compiler, sljit_s32 arg_types, sljit_s32 *src)
503 {
504 	sljit_s32 arg_count = 0;
505 	sljit_s32 word_arg_count = 0;
506 	sljit_s32 types = 0;
507 	sljit_s32 reg = 0;
508 
509 	if (src)
510 		reg = *src & REG_MASK;
511 
512 	arg_types >>= SLJIT_ARG_SHIFT;
513 
514 	while (arg_types) {
515 		types = (types << SLJIT_ARG_SHIFT) | (arg_types & SLJIT_ARG_MASK);
516 
517 		switch (arg_types & SLJIT_ARG_MASK) {
518 		case SLJIT_ARG_TYPE_F64:
519 		case SLJIT_ARG_TYPE_F32:
520 			arg_count++;
521 			break;
522 		default:
523 			arg_count++;
524 			word_arg_count++;
525 
526 			if (arg_count != word_arg_count && arg_count == reg) {
527 				FAIL_IF(push_inst(compiler, OR | S(reg) | A(TMP_CALL_REG) | B(reg)));
528 				*src = TMP_CALL_REG;
529 			}
530 			break;
531 		}
532 
533 		arg_types >>= SLJIT_ARG_SHIFT;
534 	}
535 
536 	while (types) {
537 		switch (types & SLJIT_ARG_MASK) {
538 		case SLJIT_ARG_TYPE_F64:
539 		case SLJIT_ARG_TYPE_F32:
540 			arg_count--;
541 			break;
542 		default:
543 			if (arg_count != word_arg_count)
544 				FAIL_IF(push_inst(compiler, OR | S(word_arg_count) | A(arg_count) | B(word_arg_count)));
545 
546 			arg_count--;
547 			word_arg_count--;
548 			break;
549 		}
550 
551 		types >>= SLJIT_ARG_SHIFT;
552 	}
553 
554 	return SLJIT_SUCCESS;
555 }
556 
emit_const(struct sljit_compiler * compiler,sljit_s32 reg,sljit_sw init_value)557 static SLJIT_INLINE sljit_s32 emit_const(struct sljit_compiler *compiler, sljit_s32 reg, sljit_sw init_value)
558 {
559 	FAIL_IF(push_inst(compiler, ADDIS | D(reg) | A(0) | IMM(init_value >> 48)));
560 	FAIL_IF(push_inst(compiler, ORI | S(reg) | A(reg) | IMM(init_value >> 32)));
561 	FAIL_IF(push_inst(compiler, SLDI(32) | S(reg) | A(reg)));
562 	FAIL_IF(push_inst(compiler, ORIS | S(reg) | A(reg) | IMM(init_value >> 16)));
563 	return push_inst(compiler, ORI | S(reg) | A(reg) | IMM(init_value));
564 }
565 
sljit_set_jump_addr(sljit_uw addr,sljit_uw new_target,sljit_sw executable_offset)566 SLJIT_API_FUNC_ATTRIBUTE void sljit_set_jump_addr(sljit_uw addr, sljit_uw new_target, sljit_sw executable_offset)
567 {
568 	sljit_ins *inst = (sljit_ins*)addr;
569 	SLJIT_UNUSED_ARG(executable_offset);
570 
571 	SLJIT_UPDATE_WX_FLAGS(inst, inst + 5, 0);
572 	inst[0] = (inst[0] & 0xffff0000u) | ((sljit_ins)(new_target >> 48) & 0xffff);
573 	inst[1] = (inst[1] & 0xffff0000u) | ((sljit_ins)(new_target >> 32) & 0xffff);
574 	inst[3] = (inst[3] & 0xffff0000u) | ((sljit_ins)(new_target >> 16) & 0xffff);
575 	inst[4] = (inst[4] & 0xffff0000u) | ((sljit_ins)new_target & 0xffff);
576 	SLJIT_UPDATE_WX_FLAGS(inst, inst + 5, 1);
577 	inst = (sljit_ins *)SLJIT_ADD_EXEC_OFFSET(inst, executable_offset);
578 	SLJIT_CACHE_FLUSH(inst, inst + 5);
579 }
580