1 /*
2 * Stack-less Just-In-Time compiler
3 *
4 * Copyright Zoltan Herczeg (hzmester@freemail.hu). All rights reserved.
5 *
6 * Redistribution and use in source and binary forms, with or without modification, are
7 * permitted provided that the following conditions are met:
8 *
9 * 1. Redistributions of source code must retain the above copyright notice, this list of
10 * conditions and the following disclaimer.
11 *
12 * 2. Redistributions in binary form must reproduce the above copyright notice, this list
13 * of conditions and the following disclaimer in the documentation and/or other materials
14 * provided with the distribution.
15 *
16 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDER(S) AND CONTRIBUTORS ``AS IS'' AND ANY
17 * EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
18 * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT
19 * SHALL THE COPYRIGHT HOLDER(S) OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,
20 * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED
21 * TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
22 * BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
23 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN
24 * ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
25 */
26
27 /* ppc 64-bit arch dependent functions. */
28
29 #if defined(__GNUC__) || (defined(__IBM_GCC_ASM) && __IBM_GCC_ASM)
30 #define ASM_SLJIT_CLZ(src, dst) \
31 __asm__ volatile ( "cntlzd %0, %1" : "=r"(dst) : "r"(src) )
32 #elif defined(__xlc__)
33 #error "Please enable GCC syntax for inline assembly statements"
34 #else
35 #error "Must implement count leading zeroes"
36 #endif
37
38 /* Computes SLDI(63 - shift). */
39 #define PUSH_SLDI_NEG(reg, shift) \
40 push_inst(compiler, RLDICR | S(reg) | A(reg) | RLDI_SH(63 - shift) | RLDI_ME(shift))
41
load_immediate(struct sljit_compiler * compiler,sljit_s32 reg,sljit_sw imm)42 static sljit_s32 load_immediate(struct sljit_compiler *compiler, sljit_s32 reg, sljit_sw imm)
43 {
44 sljit_uw tmp;
45 sljit_uw shift;
46 sljit_uw tmp2;
47 sljit_uw shift2;
48
49 if (imm <= SIMM_MAX && imm >= SIMM_MIN)
50 return push_inst(compiler, ADDI | D(reg) | A(0) | IMM(imm));
51
52 if (!(imm & ~0xffff))
53 return push_inst(compiler, ORI | S(TMP_ZERO) | A(reg) | IMM(imm));
54
55 if (imm <= 0x7fffffffl && imm >= -0x80000000l) {
56 FAIL_IF(push_inst(compiler, ADDIS | D(reg) | A(0) | IMM(imm >> 16)));
57 return (imm & 0xffff) ? push_inst(compiler, ORI | S(reg) | A(reg) | IMM(imm)) : SLJIT_SUCCESS;
58 }
59
60 /* Count leading zeroes. */
61 tmp = (sljit_uw)((imm >= 0) ? imm : ~imm);
62 ASM_SLJIT_CLZ(tmp, shift);
63 SLJIT_ASSERT(shift > 0);
64 shift--;
65 tmp = ((sljit_uw)imm << shift);
66
67 if ((tmp & ~0xffff000000000000ul) == 0) {
68 FAIL_IF(push_inst(compiler, ADDI | D(reg) | A(0) | (sljit_ins)(tmp >> 48)));
69 shift += 15;
70 return PUSH_SLDI_NEG(reg, shift);
71 }
72
73 if ((tmp & ~0xffffffff00000000ul) == 0) {
74 FAIL_IF(push_inst(compiler, ADDIS | D(reg) | A(0) | (sljit_ins)(tmp >> 48)));
75 FAIL_IF(push_inst(compiler, ORI | S(reg) | A(reg) | IMM(tmp >> 32)));
76 shift += 31;
77 return PUSH_SLDI_NEG(reg, shift);
78 }
79
80 /* Cut out the 16 bit from immediate. */
81 shift += 15;
82 tmp2 = (sljit_uw)imm & (((sljit_uw)1 << (63 - shift)) - 1);
83
84 if (tmp2 <= 0xffff) {
85 FAIL_IF(push_inst(compiler, ADDI | D(reg) | A(0) | (sljit_ins)(tmp >> 48)));
86 FAIL_IF(PUSH_SLDI_NEG(reg, shift));
87 return push_inst(compiler, ORI | S(reg) | A(reg) | (sljit_ins)tmp2);
88 }
89
90 if (tmp2 <= 0xffffffff) {
91 FAIL_IF(push_inst(compiler, ADDI | D(reg) | A(0) | IMM(tmp >> 48)));
92 FAIL_IF(PUSH_SLDI_NEG(reg, shift));
93 FAIL_IF(push_inst(compiler, ORIS | S(reg) | A(reg) | (sljit_ins)(tmp2 >> 16)));
94 return (imm & 0xffff) ? push_inst(compiler, ORI | S(reg) | A(reg) | IMM(tmp2)) : SLJIT_SUCCESS;
95 }
96
97 ASM_SLJIT_CLZ(tmp2, shift2);
98 tmp2 <<= shift2;
99
100 if ((tmp2 & ~0xffff000000000000ul) == 0) {
101 FAIL_IF(push_inst(compiler, ADDI | D(reg) | A(0) | (sljit_ins)(tmp >> 48)));
102 shift2 += 15;
103 shift += (63 - shift2);
104 FAIL_IF(PUSH_SLDI_NEG(reg, shift));
105 FAIL_IF(push_inst(compiler, ORI | S(reg) | A(reg) | (sljit_ins)(tmp2 >> 48)));
106 return PUSH_SLDI_NEG(reg, shift2);
107 }
108
109 /* The general version. */
110 FAIL_IF(push_inst(compiler, ADDIS | D(reg) | A(0) | (sljit_ins)((sljit_uw)imm >> 48)));
111 FAIL_IF(push_inst(compiler, ORI | S(reg) | A(reg) | IMM(imm >> 32)));
112 FAIL_IF(PUSH_SLDI_NEG(reg, 31));
113 FAIL_IF(push_inst(compiler, ORIS | S(reg) | A(reg) | IMM(imm >> 16)));
114 return push_inst(compiler, ORI | S(reg) | A(reg) | IMM(imm));
115 }
116
117 #undef PUSH_SLDI_NEG
118
119 #define CLRLDI(dst, src, n) \
120 (RLDICL | S(src) | A(dst) | RLDI_SH(0) | RLDI_MB(n))
121
122 /* Sign extension for integer operations. */
123 #define UN_EXTS() \
124 if ((flags & (ALT_SIGN_EXT | REG2_SOURCE)) == (ALT_SIGN_EXT | REG2_SOURCE)) { \
125 FAIL_IF(push_inst(compiler, EXTSW | S(src2) | A(TMP_REG2))); \
126 src2 = TMP_REG2; \
127 }
128
129 #define BIN_EXTS() \
130 if (flags & ALT_SIGN_EXT) { \
131 if (flags & REG1_SOURCE) { \
132 FAIL_IF(push_inst(compiler, EXTSW | S(src1) | A(TMP_REG1))); \
133 src1 = TMP_REG1; \
134 } \
135 if (flags & REG2_SOURCE) { \
136 FAIL_IF(push_inst(compiler, EXTSW | S(src2) | A(TMP_REG2))); \
137 src2 = TMP_REG2; \
138 } \
139 }
140
141 #define BIN_IMM_EXTS() \
142 if ((flags & (ALT_SIGN_EXT | REG1_SOURCE)) == (ALT_SIGN_EXT | REG1_SOURCE)) { \
143 FAIL_IF(push_inst(compiler, EXTSW | S(src1) | A(TMP_REG1))); \
144 src1 = TMP_REG1; \
145 }
146
emit_single_op(struct sljit_compiler * compiler,sljit_s32 op,sljit_s32 flags,sljit_s32 dst,sljit_s32 src1,sljit_s32 src2)147 static SLJIT_INLINE sljit_s32 emit_single_op(struct sljit_compiler *compiler, sljit_s32 op, sljit_s32 flags,
148 sljit_s32 dst, sljit_s32 src1, sljit_s32 src2)
149 {
150 sljit_u32 imm;
151
152 switch (op) {
153 case SLJIT_MOV:
154 case SLJIT_MOV_P:
155 SLJIT_ASSERT(src1 == TMP_REG1);
156 if (dst != src2)
157 return push_inst(compiler, OR | S(src2) | A(dst) | B(src2));
158 return SLJIT_SUCCESS;
159
160 case SLJIT_MOV_U32:
161 case SLJIT_MOV_S32:
162 SLJIT_ASSERT(src1 == TMP_REG1);
163 if ((flags & (REG_DEST | REG2_SOURCE)) == (REG_DEST | REG2_SOURCE)) {
164 if (op == SLJIT_MOV_S32)
165 return push_inst(compiler, EXTSW | S(src2) | A(dst));
166 return push_inst(compiler, CLRLDI(dst, src2, 32));
167 }
168 else {
169 SLJIT_ASSERT(dst == src2);
170 }
171 return SLJIT_SUCCESS;
172
173 case SLJIT_MOV_U8:
174 case SLJIT_MOV_S8:
175 SLJIT_ASSERT(src1 == TMP_REG1);
176 if ((flags & (REG_DEST | REG2_SOURCE)) == (REG_DEST | REG2_SOURCE)) {
177 if (op == SLJIT_MOV_S8)
178 return push_inst(compiler, EXTSB | S(src2) | A(dst));
179 return push_inst(compiler, CLRLDI(dst, src2, 56));
180 }
181 else if ((flags & REG_DEST) && op == SLJIT_MOV_S8)
182 return push_inst(compiler, EXTSB | S(src2) | A(dst));
183 else {
184 SLJIT_ASSERT(dst == src2);
185 }
186 return SLJIT_SUCCESS;
187
188 case SLJIT_MOV_U16:
189 case SLJIT_MOV_S16:
190 SLJIT_ASSERT(src1 == TMP_REG1);
191 if ((flags & (REG_DEST | REG2_SOURCE)) == (REG_DEST | REG2_SOURCE)) {
192 if (op == SLJIT_MOV_S16)
193 return push_inst(compiler, EXTSH | S(src2) | A(dst));
194 return push_inst(compiler, CLRLDI(dst, src2, 48));
195 }
196 else {
197 SLJIT_ASSERT(dst == src2);
198 }
199 return SLJIT_SUCCESS;
200
201 case SLJIT_NOT:
202 SLJIT_ASSERT(src1 == TMP_REG1);
203 UN_EXTS();
204 return push_inst(compiler, NOR | RC(flags) | S(src2) | A(dst) | B(src2));
205
206 case SLJIT_CLZ:
207 SLJIT_ASSERT(src1 == TMP_REG1);
208 return push_inst(compiler, ((flags & ALT_FORM1) ? CNTLZW : CNTLZD) | S(src2) | A(dst));
209
210 case SLJIT_CTZ:
211 SLJIT_ASSERT(src1 == TMP_REG1);
212 FAIL_IF(push_inst(compiler, NEG | D(TMP_REG1) | A(src2)));
213 FAIL_IF(push_inst(compiler, AND | S(src2) | A(dst) | B(TMP_REG1)));
214 FAIL_IF(push_inst(compiler, ((flags & ALT_FORM1) ? CNTLZW : CNTLZD) | S(dst) | A(dst)));
215 FAIL_IF(push_inst(compiler, ADDI | D(TMP_REG1) | A(dst) | IMM((flags & ALT_FORM1) ? -32 : -64)));
216 /* The highest bits are set, if dst < bit width, zero otherwise. */
217 FAIL_IF(push_inst(compiler, ((flags & ALT_FORM1) ? SRWI(27) : SRDI(58)) | S(TMP_REG1) | A(TMP_REG1)));
218 return push_inst(compiler, XOR | S(dst) | A(dst) | B(TMP_REG1));
219
220 case SLJIT_ADD:
221 if (flags & ALT_FORM1) {
222 if (flags & ALT_SIGN_EXT) {
223 FAIL_IF(push_inst(compiler, SLDI(32) | S(src1) | A(TMP_REG1)));
224 src1 = TMP_REG1;
225 FAIL_IF(push_inst(compiler, SLDI(32) | S(src2) | A(TMP_REG2)));
226 src2 = TMP_REG2;
227 }
228 /* Setting XER SO is not enough, CR SO is also needed. */
229 FAIL_IF(push_inst(compiler, ADD | OE(ALT_SET_FLAGS) | RC(ALT_SET_FLAGS) | D(dst) | A(src1) | B(src2)));
230 if (flags & ALT_SIGN_EXT)
231 return push_inst(compiler, SRDI(32) | S(dst) | A(dst));
232 return SLJIT_SUCCESS;
233 }
234
235 if (flags & ALT_FORM2) {
236 /* Flags does not set: BIN_IMM_EXTS unnecessary. */
237 SLJIT_ASSERT(src2 == TMP_REG2);
238
239 if (flags & ALT_FORM3)
240 return push_inst(compiler, ADDIS | D(dst) | A(src1) | compiler->imm);
241
242 imm = compiler->imm;
243
244 if (flags & ALT_FORM4) {
245 FAIL_IF(push_inst(compiler, ADDIS | D(dst) | A(src1) | (((imm >> 16) & 0xffff) + ((imm >> 15) & 0x1))));
246 src1 = dst;
247 }
248
249 return push_inst(compiler, ADDI | D(dst) | A(src1) | (imm & 0xffff));
250 }
251 if (flags & ALT_FORM3) {
252 SLJIT_ASSERT(src2 == TMP_REG2);
253 BIN_IMM_EXTS();
254 return push_inst(compiler, ADDIC | D(dst) | A(src1) | compiler->imm);
255 }
256 if (flags & ALT_FORM4) {
257 if (flags & ALT_FORM5)
258 FAIL_IF(push_inst(compiler, ADDI | D(dst) | A(src1) | compiler->imm));
259 else
260 FAIL_IF(push_inst(compiler, ADD | D(dst) | A(src1) | B(src2)));
261 return push_inst(compiler, CMPI | A(dst) | 0);
262 }
263 if (!(flags & ALT_SET_FLAGS))
264 return push_inst(compiler, ADD | D(dst) | A(src1) | B(src2));
265 BIN_EXTS();
266 if (flags & ALT_FORM5)
267 return push_inst(compiler, ADDC | RC(ALT_SET_FLAGS) | D(dst) | A(src1) | B(src2));
268 return push_inst(compiler, ADD | RC(flags) | D(dst) | A(src1) | B(src2));
269
270 case SLJIT_ADDC:
271 BIN_EXTS();
272 return push_inst(compiler, ADDE | D(dst) | A(src1) | B(src2));
273
274 case SLJIT_SUB:
275 if (flags & ALT_FORM1) {
276 if (flags & ALT_FORM2) {
277 FAIL_IF(push_inst(compiler, CMPLI | CRD(0 | ((flags & ALT_SIGN_EXT) ? 0 : 1)) | A(src1) | compiler->imm));
278 if (!(flags & ALT_FORM3))
279 return SLJIT_SUCCESS;
280 return push_inst(compiler, ADDI | D(dst) | A(src1) | (-compiler->imm & 0xffff));
281 }
282 FAIL_IF(push_inst(compiler, CMPL | CRD(0 | ((flags & ALT_SIGN_EXT) ? 0 : 1)) | A(src1) | B(src2)));
283 if (!(flags & ALT_FORM3))
284 return SLJIT_SUCCESS;
285 return push_inst(compiler, SUBF | D(dst) | A(src2) | B(src1));
286 }
287
288 if (flags & ALT_FORM2) {
289 if (flags & ALT_FORM3) {
290 FAIL_IF(push_inst(compiler, CMPI | CRD(0 | ((flags & ALT_SIGN_EXT) ? 0 : 1)) | A(src1) | compiler->imm));
291 if (!(flags & ALT_FORM4))
292 return SLJIT_SUCCESS;
293 return push_inst(compiler, ADDI | D(dst) | A(src1) | (-compiler->imm & 0xffff));
294 }
295 FAIL_IF(push_inst(compiler, CMP | CRD(0 | ((flags & ALT_SIGN_EXT) ? 0 : 1)) | A(src1) | B(src2)));
296 if (!(flags & ALT_FORM4))
297 return SLJIT_SUCCESS;
298 return push_inst(compiler, SUBF | D(dst) | A(src2) | B(src1));
299 }
300
301 if (flags & ALT_FORM3) {
302 if (flags & ALT_SIGN_EXT) {
303 if (src1 != TMP_ZERO) {
304 FAIL_IF(push_inst(compiler, SLDI(32) | S(src1) | A(TMP_REG1)));
305 src1 = TMP_REG1;
306 }
307 if (src2 != TMP_ZERO) {
308 FAIL_IF(push_inst(compiler, SLDI(32) | S(src2) | A(TMP_REG2)));
309 src2 = TMP_REG2;
310 }
311 }
312
313 /* Setting XER SO is not enough, CR SO is also needed. */
314 if (src1 != TMP_ZERO)
315 FAIL_IF(push_inst(compiler, SUBF | OE(ALT_SET_FLAGS) | RC(ALT_SET_FLAGS) | D(dst) | A(src2) | B(src1)));
316 else
317 FAIL_IF(push_inst(compiler, NEG | OE(ALT_SET_FLAGS) | RC(ALT_SET_FLAGS) | D(dst) | A(src2)));
318
319 if (flags & ALT_SIGN_EXT)
320 return push_inst(compiler, SRDI(32) | S(dst) | A(dst));
321 return SLJIT_SUCCESS;
322 }
323
324 if (flags & ALT_FORM4) {
325 /* Flags does not set: BIN_IMM_EXTS unnecessary. */
326 SLJIT_ASSERT(src2 == TMP_REG2);
327 return push_inst(compiler, SUBFIC | D(dst) | A(src1) | compiler->imm);
328 }
329
330 if (!(flags & ALT_SET_FLAGS)) {
331 SLJIT_ASSERT(src1 != TMP_ZERO);
332 return push_inst(compiler, SUBF | D(dst) | A(src2) | B(src1));
333 }
334
335 BIN_EXTS();
336 if (flags & ALT_FORM5)
337 return push_inst(compiler, SUBFC | RC(ALT_SET_FLAGS) | D(dst) | A(src2) | B(src1));
338
339 if (src1 != TMP_ZERO)
340 return push_inst(compiler, SUBF | RC(ALT_SET_FLAGS) | D(dst) | A(src2) | B(src1));
341 return push_inst(compiler, NEG | RC(ALT_SET_FLAGS) | D(dst) | A(src2));
342
343 case SLJIT_SUBC:
344 BIN_EXTS();
345 return push_inst(compiler, SUBFE | D(dst) | A(src2) | B(src1));
346
347 case SLJIT_MUL:
348 if (flags & ALT_FORM1) {
349 SLJIT_ASSERT(src2 == TMP_REG2);
350 return push_inst(compiler, MULLI | D(dst) | A(src1) | compiler->imm);
351 }
352 BIN_EXTS();
353 if (flags & ALT_FORM2)
354 return push_inst(compiler, MULLW | OE(flags) | RC(flags) | D(dst) | A(src2) | B(src1));
355 return push_inst(compiler, MULLD | OE(flags) | RC(flags) | D(dst) | A(src2) | B(src1));
356
357 case SLJIT_AND:
358 if (flags & ALT_FORM1) {
359 SLJIT_ASSERT(src2 == TMP_REG2);
360 return push_inst(compiler, ANDI | S(src1) | A(dst) | compiler->imm);
361 }
362 if (flags & ALT_FORM2) {
363 SLJIT_ASSERT(src2 == TMP_REG2);
364 return push_inst(compiler, ANDIS | S(src1) | A(dst) | compiler->imm);
365 }
366 return push_inst(compiler, AND | RC(flags) | S(src1) | A(dst) | B(src2));
367
368 case SLJIT_OR:
369 if (flags & ALT_FORM1) {
370 SLJIT_ASSERT(src2 == TMP_REG2);
371 return push_inst(compiler, ORI | S(src1) | A(dst) | compiler->imm);
372 }
373 if (flags & ALT_FORM2) {
374 SLJIT_ASSERT(src2 == TMP_REG2);
375 return push_inst(compiler, ORIS | S(src1) | A(dst) | compiler->imm);
376 }
377 if (flags & ALT_FORM3) {
378 SLJIT_ASSERT(src2 == TMP_REG2);
379 imm = compiler->imm;
380
381 FAIL_IF(push_inst(compiler, ORI | S(src1) | A(dst) | IMM(imm)));
382 return push_inst(compiler, ORIS | S(dst) | A(dst) | IMM(imm >> 16));
383 }
384 return push_inst(compiler, OR | RC(flags) | S(src1) | A(dst) | B(src2));
385
386 case SLJIT_XOR:
387 if (flags & ALT_FORM1) {
388 SLJIT_ASSERT(src2 == TMP_REG2);
389 return push_inst(compiler, XORI | S(src1) | A(dst) | compiler->imm);
390 }
391 if (flags & ALT_FORM2) {
392 SLJIT_ASSERT(src2 == TMP_REG2);
393 return push_inst(compiler, XORIS | S(src1) | A(dst) | compiler->imm);
394 }
395 if (flags & ALT_FORM3) {
396 SLJIT_ASSERT(src2 == TMP_REG2);
397 imm = compiler->imm;
398
399 FAIL_IF(push_inst(compiler, XORI | S(src1) | A(dst) | IMM(imm)));
400 return push_inst(compiler, XORIS | S(dst) | A(dst) | IMM(imm >> 16));
401 }
402 return push_inst(compiler, XOR | RC(flags) | S(src1) | A(dst) | B(src2));
403
404 case SLJIT_SHL:
405 case SLJIT_MSHL:
406 if (flags & ALT_FORM1) {
407 SLJIT_ASSERT(src2 == TMP_REG2);
408 imm = compiler->imm;
409
410 if (flags & ALT_FORM2) {
411 imm &= 0x1f;
412 return push_inst(compiler, SLWI(imm) | RC(flags) | S(src1) | A(dst));
413 }
414
415 imm &= 0x3f;
416 return push_inst(compiler, SLDI(imm) | RC(flags) | S(src1) | A(dst));
417 }
418
419 if (op == SLJIT_MSHL) {
420 FAIL_IF(push_inst(compiler, ANDI | S(src2) | A(TMP_REG2) | ((flags & ALT_FORM2) ? 0x1f : 0x3f)));
421 src2 = TMP_REG2;
422 }
423
424 return push_inst(compiler, ((flags & ALT_FORM2) ? SLW : SLD) | RC(flags) | S(src1) | A(dst) | B(src2));
425
426 case SLJIT_LSHR:
427 case SLJIT_MLSHR:
428 if (flags & ALT_FORM1) {
429 SLJIT_ASSERT(src2 == TMP_REG2);
430 imm = compiler->imm;
431
432 if (flags & ALT_FORM2) {
433 imm &= 0x1f;
434 /* Since imm can be 0, SRWI() cannot be used. */
435 return push_inst(compiler, RLWINM | RC(flags) | S(src1) | A(dst) | RLWI_SH((32 - imm) & 0x1f) | RLWI_MBE(imm, 31));
436 }
437
438 imm &= 0x3f;
439 /* Since imm can be 0, SRDI() cannot be used. */
440 return push_inst(compiler, RLDICL | RC(flags) | S(src1) | A(dst) | RLDI_SH((64 - imm) & 0x3f) | RLDI_MB(imm));
441 }
442
443 if (op == SLJIT_MLSHR) {
444 FAIL_IF(push_inst(compiler, ANDI | S(src2) | A(TMP_REG2) | ((flags & ALT_FORM2) ? 0x1f : 0x3f)));
445 src2 = TMP_REG2;
446 }
447
448 return push_inst(compiler, ((flags & ALT_FORM2) ? SRW : SRD) | RC(flags) | S(src1) | A(dst) | B(src2));
449
450 case SLJIT_ASHR:
451 case SLJIT_MASHR:
452 if (flags & ALT_FORM1) {
453 SLJIT_ASSERT(src2 == TMP_REG2);
454 imm = compiler->imm;
455
456 if (flags & ALT_FORM2) {
457 imm &= 0x1f;
458 return push_inst(compiler, SRAWI | RC(flags) | S(src1) | A(dst) | (imm << 11));
459 }
460
461 imm &= 0x3f;
462 return push_inst(compiler, SRADI | RC(flags) | S(src1) | A(dst) | RLDI_SH(imm));
463 }
464
465 if (op == SLJIT_MASHR) {
466 FAIL_IF(push_inst(compiler, ANDI | S(src2) | A(TMP_REG2) | ((flags & ALT_FORM2) ? 0x1f : 0x3f)));
467 src2 = TMP_REG2;
468 }
469
470 return push_inst(compiler, ((flags & ALT_FORM2) ? SRAW : SRAD) | RC(flags) | S(src1) | A(dst) | B(src2));
471
472 case SLJIT_ROTL:
473 case SLJIT_ROTR:
474 if (flags & ALT_FORM1) {
475 SLJIT_ASSERT(src2 == TMP_REG2);
476 imm = compiler->imm;
477
478 if (op == SLJIT_ROTR)
479 imm = (sljit_u32)(-(sljit_s32)imm);
480
481 if (flags & ALT_FORM2) {
482 imm &= 0x1f;
483 return push_inst(compiler, RLWINM | S(src1) | A(dst) | RLWI_SH(imm) | RLWI_MBE(0, 31));
484 }
485
486 imm &= 0x3f;
487 return push_inst(compiler, RLDICL | S(src1) | A(dst) | RLDI_SH(imm));
488 }
489
490 if (op == SLJIT_ROTR) {
491 FAIL_IF(push_inst(compiler, SUBFIC | D(TMP_REG2) | A(src2) | 0));
492 src2 = TMP_REG2;
493 }
494
495 return push_inst(compiler, ((flags & ALT_FORM2) ? (RLWNM | RLWI_MBE(0, 31)) : (RLDCL | RLDI_MB(0))) | S(src1) | A(dst) | B(src2));
496 }
497
498 SLJIT_UNREACHABLE();
499 return SLJIT_SUCCESS;
500 }
501
call_with_args(struct sljit_compiler * compiler,sljit_s32 arg_types,sljit_s32 * src)502 static sljit_s32 call_with_args(struct sljit_compiler *compiler, sljit_s32 arg_types, sljit_s32 *src)
503 {
504 sljit_s32 arg_count = 0;
505 sljit_s32 word_arg_count = 0;
506 sljit_s32 types = 0;
507 sljit_s32 reg = 0;
508
509 if (src)
510 reg = *src & REG_MASK;
511
512 arg_types >>= SLJIT_ARG_SHIFT;
513
514 while (arg_types) {
515 types = (types << SLJIT_ARG_SHIFT) | (arg_types & SLJIT_ARG_MASK);
516
517 switch (arg_types & SLJIT_ARG_MASK) {
518 case SLJIT_ARG_TYPE_F64:
519 case SLJIT_ARG_TYPE_F32:
520 arg_count++;
521 break;
522 default:
523 arg_count++;
524 word_arg_count++;
525
526 if (arg_count != word_arg_count && arg_count == reg) {
527 FAIL_IF(push_inst(compiler, OR | S(reg) | A(TMP_CALL_REG) | B(reg)));
528 *src = TMP_CALL_REG;
529 }
530 break;
531 }
532
533 arg_types >>= SLJIT_ARG_SHIFT;
534 }
535
536 while (types) {
537 switch (types & SLJIT_ARG_MASK) {
538 case SLJIT_ARG_TYPE_F64:
539 case SLJIT_ARG_TYPE_F32:
540 arg_count--;
541 break;
542 default:
543 if (arg_count != word_arg_count)
544 FAIL_IF(push_inst(compiler, OR | S(word_arg_count) | A(arg_count) | B(word_arg_count)));
545
546 arg_count--;
547 word_arg_count--;
548 break;
549 }
550
551 types >>= SLJIT_ARG_SHIFT;
552 }
553
554 return SLJIT_SUCCESS;
555 }
556
emit_const(struct sljit_compiler * compiler,sljit_s32 reg,sljit_sw init_value)557 static SLJIT_INLINE sljit_s32 emit_const(struct sljit_compiler *compiler, sljit_s32 reg, sljit_sw init_value)
558 {
559 FAIL_IF(push_inst(compiler, ADDIS | D(reg) | A(0) | IMM(init_value >> 48)));
560 FAIL_IF(push_inst(compiler, ORI | S(reg) | A(reg) | IMM(init_value >> 32)));
561 FAIL_IF(push_inst(compiler, SLDI(32) | S(reg) | A(reg)));
562 FAIL_IF(push_inst(compiler, ORIS | S(reg) | A(reg) | IMM(init_value >> 16)));
563 return push_inst(compiler, ORI | S(reg) | A(reg) | IMM(init_value));
564 }
565
sljit_set_jump_addr(sljit_uw addr,sljit_uw new_target,sljit_sw executable_offset)566 SLJIT_API_FUNC_ATTRIBUTE void sljit_set_jump_addr(sljit_uw addr, sljit_uw new_target, sljit_sw executable_offset)
567 {
568 sljit_ins *inst = (sljit_ins*)addr;
569 SLJIT_UNUSED_ARG(executable_offset);
570
571 SLJIT_UPDATE_WX_FLAGS(inst, inst + 5, 0);
572 inst[0] = (inst[0] & 0xffff0000u) | ((sljit_ins)(new_target >> 48) & 0xffff);
573 inst[1] = (inst[1] & 0xffff0000u) | ((sljit_ins)(new_target >> 32) & 0xffff);
574 inst[3] = (inst[3] & 0xffff0000u) | ((sljit_ins)(new_target >> 16) & 0xffff);
575 inst[4] = (inst[4] & 0xffff0000u) | ((sljit_ins)new_target & 0xffff);
576 SLJIT_UPDATE_WX_FLAGS(inst, inst + 5, 1);
577 inst = (sljit_ins *)SLJIT_ADD_EXEC_OFFSET(inst, executable_offset);
578 SLJIT_CACHE_FLUSH(inst, inst + 5);
579 }
580