1 /*
2  *    Stack-less Just-In-Time compiler
3  *
4  *    Copyright Zoltan Herczeg (hzmester@freemail.hu). All rights reserved.
5  *
6  * Redistribution and use in source and binary forms, with or without modification, are
7  * permitted provided that the following conditions are met:
8  *
9  *   1. Redistributions of source code must retain the above copyright notice, this list of
10  *      conditions and the following disclaimer.
11  *
12  *   2. Redistributions in binary form must reproduce the above copyright notice, this list
13  *      of conditions and the following disclaimer in the documentation and/or other materials
14  *      provided with the distribution.
15  *
16  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDER(S) AND CONTRIBUTORS ``AS IS'' AND ANY
17  * EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
18  * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT
19  * SHALL THE COPYRIGHT HOLDER(S) OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,
20  * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED
21  * TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
22  * BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
23  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN
24  * ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
25  */
26 
27 /* mips 32-bit arch dependent functions. */
28 
load_immediate(struct sljit_compiler * compiler,sljit_s32 dst_ar,sljit_sw imm)29 static sljit_s32 load_immediate(struct sljit_compiler *compiler, sljit_s32 dst_ar, sljit_sw imm)
30 {
31 	if (!(imm & ~0xffff))
32 		return push_inst(compiler, ORI | SA(0) | TA(dst_ar) | IMM(imm), dst_ar);
33 
34 	if (imm < 0 && imm >= SIMM_MIN)
35 		return push_inst(compiler, ADDIU | SA(0) | TA(dst_ar) | IMM(imm), dst_ar);
36 
37 	FAIL_IF(push_inst(compiler, LUI | TA(dst_ar) | IMM(imm >> 16), dst_ar));
38 	return (imm & 0xffff) ? push_inst(compiler, ORI | SA(dst_ar) | TA(dst_ar) | IMM(imm), dst_ar) : SLJIT_SUCCESS;
39 }
40 
41 #define EMIT_LOGICAL(op_imm, op_norm) \
42 	if (flags & SRC2_IMM) { \
43 		if (op & SLJIT_SET_Z) \
44 			FAIL_IF(push_inst(compiler, op_imm | S(src1) | TA(EQUAL_FLAG) | IMM(src2), EQUAL_FLAG)); \
45 		if (!(flags & UNUSED_DEST)) \
46 			FAIL_IF(push_inst(compiler, op_imm | S(src1) | T(dst) | IMM(src2), DR(dst))); \
47 	} \
48 	else { \
49 		if (op & SLJIT_SET_Z) \
50 			FAIL_IF(push_inst(compiler, op_norm | S(src1) | T(src2) | DA(EQUAL_FLAG), EQUAL_FLAG)); \
51 		if (!(flags & UNUSED_DEST)) \
52 			FAIL_IF(push_inst(compiler, op_norm | S(src1) | T(src2) | D(dst), DR(dst))); \
53 	}
54 
55 #define EMIT_SHIFT(op_imm, op_v) \
56 	if (flags & SRC2_IMM) { \
57 		if (op & SLJIT_SET_Z) \
58 			FAIL_IF(push_inst(compiler, op_imm | T(src1) | DA(EQUAL_FLAG) | SH_IMM(src2), EQUAL_FLAG)); \
59 		if (!(flags & UNUSED_DEST)) \
60 			FAIL_IF(push_inst(compiler, op_imm | T(src1) | D(dst) | SH_IMM(src2), DR(dst))); \
61 	} \
62 	else { \
63 		if (op & SLJIT_SET_Z) \
64 			FAIL_IF(push_inst(compiler, op_v | S(src2) | T(src1) | DA(EQUAL_FLAG), EQUAL_FLAG)); \
65 		if (!(flags & UNUSED_DEST)) \
66 			FAIL_IF(push_inst(compiler, op_v | S(src2) | T(src1) | D(dst), DR(dst))); \
67 	}
68 
emit_single_op(struct sljit_compiler * compiler,sljit_s32 op,sljit_s32 flags,sljit_s32 dst,sljit_s32 src1,sljit_sw src2)69 static SLJIT_INLINE sljit_s32 emit_single_op(struct sljit_compiler *compiler, sljit_s32 op, sljit_s32 flags,
70 	sljit_s32 dst, sljit_s32 src1, sljit_sw src2)
71 {
72 	sljit_s32 is_overflow, is_carry, is_handled;
73 
74 	switch (GET_OPCODE(op)) {
75 	case SLJIT_MOV:
76 	case SLJIT_MOV_U32:
77 	case SLJIT_MOV_S32:
78 	case SLJIT_MOV_P:
79 		SLJIT_ASSERT(src1 == TMP_REG1 && !(flags & SRC2_IMM));
80 		if (dst != src2)
81 			return push_inst(compiler, ADDU | S(src2) | TA(0) | D(dst), DR(dst));
82 		return SLJIT_SUCCESS;
83 
84 	case SLJIT_MOV_U8:
85 	case SLJIT_MOV_S8:
86 		SLJIT_ASSERT(src1 == TMP_REG1 && !(flags & SRC2_IMM));
87 		if ((flags & (REG_DEST | REG2_SOURCE)) == (REG_DEST | REG2_SOURCE)) {
88 			if (op == SLJIT_MOV_S8) {
89 #if (defined SLJIT_MIPS_REV && SLJIT_MIPS_REV >= 1)
90 				return push_inst(compiler, SEB | T(src2) | D(dst), DR(dst));
91 #else /* SLJIT_MIPS_REV < 1 */
92 				FAIL_IF(push_inst(compiler, SLL | T(src2) | D(dst) | SH_IMM(24), DR(dst)));
93 				return push_inst(compiler, SRA | T(dst) | D(dst) | SH_IMM(24), DR(dst));
94 #endif /* SLJIT_MIPS_REV >= 1 */
95 			}
96 			return push_inst(compiler, ANDI | S(src2) | T(dst) | IMM(0xff), DR(dst));
97 		}
98 		else {
99 			SLJIT_ASSERT(dst == src2);
100 		}
101 		return SLJIT_SUCCESS;
102 
103 	case SLJIT_MOV_U16:
104 	case SLJIT_MOV_S16:
105 		SLJIT_ASSERT(src1 == TMP_REG1 && !(flags & SRC2_IMM));
106 		if ((flags & (REG_DEST | REG2_SOURCE)) == (REG_DEST | REG2_SOURCE)) {
107 			if (op == SLJIT_MOV_S16) {
108 #if (defined SLJIT_MIPS_REV && SLJIT_MIPS_REV >= 1)
109 				return push_inst(compiler, SEH | T(src2) | D(dst), DR(dst));
110 #else /* SLJIT_MIPS_REV < 1 */
111 				FAIL_IF(push_inst(compiler, SLL | T(src2) | D(dst) | SH_IMM(16), DR(dst)));
112 				return push_inst(compiler, SRA | T(dst) | D(dst) | SH_IMM(16), DR(dst));
113 #endif /* SLJIT_MIPS_REV >= 1 */
114 			}
115 			return push_inst(compiler, ANDI | S(src2) | T(dst) | IMM(0xffff), DR(dst));
116 		}
117 		else {
118 			SLJIT_ASSERT(dst == src2);
119 		}
120 		return SLJIT_SUCCESS;
121 
122 	case SLJIT_NOT:
123 		SLJIT_ASSERT(src1 == TMP_REG1 && !(flags & SRC2_IMM));
124 		if (op & SLJIT_SET_Z)
125 			FAIL_IF(push_inst(compiler, NOR | S(src2) | T(src2) | DA(EQUAL_FLAG), EQUAL_FLAG));
126 		if (!(flags & UNUSED_DEST))
127 			FAIL_IF(push_inst(compiler, NOR | S(src2) | T(src2) | D(dst), DR(dst)));
128 		return SLJIT_SUCCESS;
129 
130 	case SLJIT_CLZ:
131 		SLJIT_ASSERT(src1 == TMP_REG1 && !(flags & SRC2_IMM));
132 #if (defined SLJIT_MIPS_REV && SLJIT_MIPS_REV >= 1)
133 		if (op & SLJIT_SET_Z)
134 			FAIL_IF(push_inst(compiler, CLZ | S(src2) | TA(EQUAL_FLAG) | DA(EQUAL_FLAG), EQUAL_FLAG));
135 		if (!(flags & UNUSED_DEST))
136 			FAIL_IF(push_inst(compiler, CLZ | S(src2) | T(dst) | D(dst), DR(dst)));
137 #else /* SLJIT_MIPS_REV < 1 */
138 		if (SLJIT_UNLIKELY(flags & UNUSED_DEST)) {
139 			FAIL_IF(push_inst(compiler, SRL | T(src2) | DA(EQUAL_FLAG) | SH_IMM(31), EQUAL_FLAG));
140 			return push_inst(compiler, XORI | SA(EQUAL_FLAG) | TA(EQUAL_FLAG) | IMM(1), EQUAL_FLAG);
141 		}
142 		/* Nearly all instructions are unmovable in the following sequence. */
143 		FAIL_IF(push_inst(compiler, ADDU | S(src2) | TA(0) | D(TMP_REG1), DR(TMP_REG1)));
144 		/* Check zero. */
145 		FAIL_IF(push_inst(compiler, BEQ | S(TMP_REG1) | TA(0) | IMM(5), UNMOVABLE_INS));
146 		FAIL_IF(push_inst(compiler, ORI | SA(0) | T(dst) | IMM(32), UNMOVABLE_INS));
147 		FAIL_IF(push_inst(compiler, ADDIU | SA(0) | T(dst) | IMM(-1), DR(dst)));
148 		/* Loop for searching the highest bit. */
149 		FAIL_IF(push_inst(compiler, ADDIU | S(dst) | T(dst) | IMM(1), DR(dst)));
150 		FAIL_IF(push_inst(compiler, BGEZ | S(TMP_REG1) | IMM(-2), UNMOVABLE_INS));
151 		FAIL_IF(push_inst(compiler, SLL | T(TMP_REG1) | D(TMP_REG1) | SH_IMM(1), UNMOVABLE_INS));
152 #endif /* SLJIT_MIPS_REV >= 1 */
153 		return SLJIT_SUCCESS;
154 
155 	case SLJIT_ADD:
156 		is_overflow = GET_FLAG_TYPE(op) == SLJIT_OVERFLOW;
157 		is_carry = GET_FLAG_TYPE(op) == GET_FLAG_TYPE(SLJIT_SET_CARRY);
158 
159 		if (flags & SRC2_IMM) {
160 			if (is_overflow) {
161 				if (src2 >= 0)
162 					FAIL_IF(push_inst(compiler, OR | S(src1) | T(src1) | DA(EQUAL_FLAG), EQUAL_FLAG));
163 				else
164 					FAIL_IF(push_inst(compiler, NOR | S(src1) | T(src1) | DA(EQUAL_FLAG), EQUAL_FLAG));
165 			}
166 			else if (op & SLJIT_SET_Z)
167 				FAIL_IF(push_inst(compiler, ADDIU | S(src1) | TA(EQUAL_FLAG) | IMM(src2), EQUAL_FLAG));
168 
169 			if (is_overflow || is_carry) {
170 				if (src2 >= 0)
171 					FAIL_IF(push_inst(compiler, ORI | S(src1) | TA(OTHER_FLAG) | IMM(src2), OTHER_FLAG));
172 				else {
173 					FAIL_IF(push_inst(compiler, ADDIU | SA(0) | TA(OTHER_FLAG) | IMM(src2), OTHER_FLAG));
174 					FAIL_IF(push_inst(compiler, OR | S(src1) | TA(OTHER_FLAG) | DA(OTHER_FLAG), OTHER_FLAG));
175 				}
176 			}
177 			/* dst may be the same as src1 or src2. */
178 			if (!(flags & UNUSED_DEST) || (op & VARIABLE_FLAG_MASK))
179 				FAIL_IF(push_inst(compiler, ADDIU | S(src1) | T(dst) | IMM(src2), DR(dst)));
180 		}
181 		else {
182 			if (is_overflow)
183 				FAIL_IF(push_inst(compiler, XOR | S(src1) | T(src2) | DA(EQUAL_FLAG), EQUAL_FLAG));
184 			else if (op & SLJIT_SET_Z)
185 				FAIL_IF(push_inst(compiler, ADDU | S(src1) | T(src2) | DA(EQUAL_FLAG), EQUAL_FLAG));
186 
187 			if (is_overflow || is_carry)
188 				FAIL_IF(push_inst(compiler, OR | S(src1) | T(src2) | DA(OTHER_FLAG), OTHER_FLAG));
189 			/* dst may be the same as src1 or src2. */
190 			if (!(flags & UNUSED_DEST) || (op & VARIABLE_FLAG_MASK))
191 				FAIL_IF(push_inst(compiler, ADDU | S(src1) | T(src2) | D(dst), DR(dst)));
192 		}
193 
194 		/* a + b >= a | b (otherwise, the carry should be set to 1). */
195 		if (is_overflow || is_carry)
196 			FAIL_IF(push_inst(compiler, SLTU | S(dst) | TA(OTHER_FLAG) | DA(OTHER_FLAG), OTHER_FLAG));
197 		if (!is_overflow)
198 			return SLJIT_SUCCESS;
199 		FAIL_IF(push_inst(compiler, SLL | TA(OTHER_FLAG) | D(TMP_REG1) | SH_IMM(31), DR(TMP_REG1)));
200 		FAIL_IF(push_inst(compiler, XOR | S(TMP_REG1) | TA(EQUAL_FLAG) | DA(EQUAL_FLAG), EQUAL_FLAG));
201 		FAIL_IF(push_inst(compiler, XOR | S(dst) | TA(EQUAL_FLAG) | DA(OTHER_FLAG), OTHER_FLAG));
202 		if (op & SLJIT_SET_Z)
203 			FAIL_IF(push_inst(compiler, ADDU | S(dst) | TA(0) | DA(EQUAL_FLAG), EQUAL_FLAG));
204 		return push_inst(compiler, SRL | TA(OTHER_FLAG) | DA(OTHER_FLAG) | SH_IMM(31), OTHER_FLAG);
205 
206 	case SLJIT_ADDC:
207 		is_carry = GET_FLAG_TYPE(op) == GET_FLAG_TYPE(SLJIT_SET_CARRY);
208 
209 		if (flags & SRC2_IMM) {
210 			if (is_carry) {
211 				if (src2 >= 0)
212 					FAIL_IF(push_inst(compiler, ORI | S(src1) | TA(EQUAL_FLAG) | IMM(src2), EQUAL_FLAG));
213 				else {
214 					FAIL_IF(push_inst(compiler, ADDIU | SA(0) | TA(EQUAL_FLAG) | IMM(src2), EQUAL_FLAG));
215 					FAIL_IF(push_inst(compiler, OR | S(src1) | TA(EQUAL_FLAG) | DA(EQUAL_FLAG), EQUAL_FLAG));
216 				}
217 			}
218 			FAIL_IF(push_inst(compiler, ADDIU | S(src1) | T(dst) | IMM(src2), DR(dst)));
219 		} else {
220 			if (is_carry)
221 				FAIL_IF(push_inst(compiler, OR | S(src1) | T(src2) | DA(EQUAL_FLAG), EQUAL_FLAG));
222 			/* dst may be the same as src1 or src2. */
223 			FAIL_IF(push_inst(compiler, ADDU | S(src1) | T(src2) | D(dst), DR(dst)));
224 		}
225 		if (is_carry)
226 			FAIL_IF(push_inst(compiler, SLTU | S(dst) | TA(EQUAL_FLAG) | DA(EQUAL_FLAG), EQUAL_FLAG));
227 
228 		FAIL_IF(push_inst(compiler, ADDU | S(dst) | TA(OTHER_FLAG) | D(dst), DR(dst)));
229 		if (!is_carry)
230 			return SLJIT_SUCCESS;
231 
232 		/* Set ULESS_FLAG (dst == 0) && (OTHER_FLAG == 1). */
233 		FAIL_IF(push_inst(compiler, SLTU | S(dst) | TA(OTHER_FLAG) | DA(OTHER_FLAG), OTHER_FLAG));
234 		/* Set carry flag. */
235 		return push_inst(compiler, OR | SA(OTHER_FLAG) | TA(EQUAL_FLAG) | DA(OTHER_FLAG), OTHER_FLAG);
236 
237 	case SLJIT_SUB:
238 		if ((flags & SRC2_IMM) && src2 == SIMM_MIN) {
239 			FAIL_IF(push_inst(compiler, ADDIU | SA(0) | T(TMP_REG2) | IMM(src2), DR(TMP_REG2)));
240 			src2 = TMP_REG2;
241 			flags &= ~SRC2_IMM;
242 		}
243 
244 		is_handled = 0;
245 
246 		if (flags & SRC2_IMM) {
247 			if (GET_FLAG_TYPE(op) == SLJIT_LESS || GET_FLAG_TYPE(op) == SLJIT_GREATER_EQUAL) {
248 				FAIL_IF(push_inst(compiler, SLTIU | S(src1) | TA(OTHER_FLAG) | IMM(src2), OTHER_FLAG));
249 				is_handled = 1;
250 			}
251 			else if (GET_FLAG_TYPE(op) == SLJIT_SIG_LESS || GET_FLAG_TYPE(op) == SLJIT_SIG_GREATER_EQUAL) {
252 				FAIL_IF(push_inst(compiler, SLTI | S(src1) | TA(OTHER_FLAG) | IMM(src2), OTHER_FLAG));
253 				is_handled = 1;
254 			}
255 		}
256 
257 		if (!is_handled && GET_FLAG_TYPE(op) >= SLJIT_LESS && GET_FLAG_TYPE(op) <= SLJIT_SIG_LESS_EQUAL) {
258 			is_handled = 1;
259 
260 			if (flags & SRC2_IMM) {
261 				FAIL_IF(push_inst(compiler, ADDIU | SA(0) | T(TMP_REG2) | IMM(src2), DR(TMP_REG2)));
262 				src2 = TMP_REG2;
263 				flags &= ~SRC2_IMM;
264 			}
265 
266 			if (GET_FLAG_TYPE(op) == SLJIT_LESS || GET_FLAG_TYPE(op) == SLJIT_GREATER_EQUAL) {
267 				FAIL_IF(push_inst(compiler, SLTU | S(src1) | T(src2) | DA(OTHER_FLAG), OTHER_FLAG));
268 			}
269 			else if (GET_FLAG_TYPE(op) == SLJIT_GREATER || GET_FLAG_TYPE(op) == SLJIT_LESS_EQUAL)
270 			{
271 				FAIL_IF(push_inst(compiler, SLTU | S(src2) | T(src1) | DA(OTHER_FLAG), OTHER_FLAG));
272 			}
273 			else if (GET_FLAG_TYPE(op) == SLJIT_SIG_LESS || GET_FLAG_TYPE(op) == SLJIT_SIG_GREATER_EQUAL) {
274 				FAIL_IF(push_inst(compiler, SLT | S(src1) | T(src2) | DA(OTHER_FLAG), OTHER_FLAG));
275 			}
276 			else if (GET_FLAG_TYPE(op) == SLJIT_SIG_GREATER || GET_FLAG_TYPE(op) == SLJIT_SIG_LESS_EQUAL)
277 			{
278 				FAIL_IF(push_inst(compiler, SLT | S(src2) | T(src1) | DA(OTHER_FLAG), OTHER_FLAG));
279 			}
280 		}
281 
282 		if (is_handled) {
283 			if (flags & SRC2_IMM) {
284 				if (op & SLJIT_SET_Z)
285 					FAIL_IF(push_inst(compiler, ADDIU | S(src1) | TA(EQUAL_FLAG) | IMM(-src2), EQUAL_FLAG));
286 				if (!(flags & UNUSED_DEST))
287 					return push_inst(compiler, ADDIU | S(src1) | T(dst) | IMM(-src2), DR(dst));
288 			}
289 			else {
290 				if (op & SLJIT_SET_Z)
291 					FAIL_IF(push_inst(compiler, SUBU | S(src1) | T(src2) | DA(EQUAL_FLAG), EQUAL_FLAG));
292 				if (!(flags & UNUSED_DEST))
293 					return push_inst(compiler, SUBU | S(src1) | T(src2) | D(dst), DR(dst));
294 			}
295 			return SLJIT_SUCCESS;
296 		}
297 
298 		is_overflow = GET_FLAG_TYPE(op) == SLJIT_OVERFLOW;
299 		is_carry = GET_FLAG_TYPE(op) == GET_FLAG_TYPE(SLJIT_SET_CARRY);
300 
301 		if (flags & SRC2_IMM) {
302 			if (is_overflow) {
303 				if (src2 >= 0)
304 					FAIL_IF(push_inst(compiler, OR | S(src1) | T(src1) | DA(EQUAL_FLAG), EQUAL_FLAG));
305 				else
306 					FAIL_IF(push_inst(compiler, NOR | S(src1) | T(src1) | DA(EQUAL_FLAG), EQUAL_FLAG));
307 			}
308 			else if (op & SLJIT_SET_Z)
309 				FAIL_IF(push_inst(compiler, ADDIU | S(src1) | TA(EQUAL_FLAG) | IMM(-src2), EQUAL_FLAG));
310 
311 			if (is_overflow || is_carry)
312 				FAIL_IF(push_inst(compiler, SLTIU | S(src1) | TA(OTHER_FLAG) | IMM(src2), OTHER_FLAG));
313 			/* dst may be the same as src1 or src2. */
314 			if (!(flags & UNUSED_DEST) || (op & VARIABLE_FLAG_MASK))
315 				FAIL_IF(push_inst(compiler, ADDIU | S(src1) | T(dst) | IMM(-src2), DR(dst)));
316 		}
317 		else {
318 			if (is_overflow)
319 				FAIL_IF(push_inst(compiler, XOR | S(src1) | T(src2) | DA(EQUAL_FLAG), EQUAL_FLAG));
320 			else if (op & SLJIT_SET_Z)
321 				FAIL_IF(push_inst(compiler, SUBU | S(src1) | T(src2) | DA(EQUAL_FLAG), EQUAL_FLAG));
322 
323 			if (is_overflow || is_carry)
324 				FAIL_IF(push_inst(compiler, SLTU | S(src1) | T(src2) | DA(OTHER_FLAG), OTHER_FLAG));
325 			/* dst may be the same as src1 or src2. */
326 			if (!(flags & UNUSED_DEST) || (op & VARIABLE_FLAG_MASK))
327 				FAIL_IF(push_inst(compiler, SUBU | S(src1) | T(src2) | D(dst), DR(dst)));
328 		}
329 
330 		if (!is_overflow)
331 			return SLJIT_SUCCESS;
332 		FAIL_IF(push_inst(compiler, SLL | TA(OTHER_FLAG) | D(TMP_REG1) | SH_IMM(31), DR(TMP_REG1)));
333 		FAIL_IF(push_inst(compiler, XOR | S(TMP_REG1) | TA(EQUAL_FLAG) | DA(EQUAL_FLAG), EQUAL_FLAG));
334 		FAIL_IF(push_inst(compiler, XOR | S(dst) | TA(EQUAL_FLAG) | DA(OTHER_FLAG), OTHER_FLAG));
335 		if (op & SLJIT_SET_Z)
336 			FAIL_IF(push_inst(compiler, ADDU | S(dst) | TA(0) | DA(EQUAL_FLAG), EQUAL_FLAG));
337 		return push_inst(compiler, SRL | TA(OTHER_FLAG) | DA(OTHER_FLAG) | SH_IMM(31), OTHER_FLAG);
338 
339 	case SLJIT_SUBC:
340 		if ((flags & SRC2_IMM) && src2 == SIMM_MIN) {
341 			FAIL_IF(push_inst(compiler, ADDIU | SA(0) | T(TMP_REG2) | IMM(src2), DR(TMP_REG2)));
342 			src2 = TMP_REG2;
343 			flags &= ~SRC2_IMM;
344 		}
345 
346 		is_carry = GET_FLAG_TYPE(op) == GET_FLAG_TYPE(SLJIT_SET_CARRY);
347 
348 		if (flags & SRC2_IMM) {
349 			if (is_carry)
350 				FAIL_IF(push_inst(compiler, SLTIU | S(src1) | TA(EQUAL_FLAG) | IMM(src2), EQUAL_FLAG));
351 			/* dst may be the same as src1 or src2. */
352 			FAIL_IF(push_inst(compiler, ADDIU | S(src1) | T(dst) | IMM(-src2), DR(dst)));
353 		}
354 		else {
355 			if (is_carry)
356 				FAIL_IF(push_inst(compiler, SLTU | S(src1) | T(src2) | DA(EQUAL_FLAG), EQUAL_FLAG));
357 			/* dst may be the same as src1 or src2. */
358 			FAIL_IF(push_inst(compiler, SUBU | S(src1) | T(src2) | D(dst), DR(dst)));
359 		}
360 
361 		if (is_carry)
362 			FAIL_IF(push_inst(compiler, SLTU | S(dst) | TA(OTHER_FLAG) | D(TMP_REG1), DR(TMP_REG1)));
363 
364 		FAIL_IF(push_inst(compiler, SUBU | S(dst) | TA(OTHER_FLAG) | D(dst), DR(dst)));
365 		return (is_carry) ? push_inst(compiler, OR | SA(EQUAL_FLAG) | T(TMP_REG1) | DA(OTHER_FLAG), OTHER_FLAG) : SLJIT_SUCCESS;
366 
367 	case SLJIT_MUL:
368 		SLJIT_ASSERT(!(flags & SRC2_IMM));
369 
370 		if (GET_FLAG_TYPE(op) != SLJIT_MUL_OVERFLOW) {
371 #if (defined SLJIT_MIPS_REV && SLJIT_MIPS_REV >= 1)
372 			return push_inst(compiler, MUL | S(src1) | T(src2) | D(dst), DR(dst));
373 #else /* SLJIT_MIPS_REV < 1 */
374 			FAIL_IF(push_inst(compiler, MULT | S(src1) | T(src2), MOVABLE_INS));
375 			return push_inst(compiler, MFLO | D(dst), DR(dst));
376 #endif /* SLJIT_MIPS_REV >= 1 */
377 		}
378 
379 #if (defined SLJIT_MIPS_REV && SLJIT_MIPS_REV >= 6)
380 		FAIL_IF(push_inst(compiler, MUL | S(src1) | T(src2) | D(dst), DR(dst)));
381 		FAIL_IF(push_inst(compiler, MUH | S(src1) | T(src2) | DA(EQUAL_FLAG), EQUAL_FLAG));
382 #else /* SLJIT_MIPS_REV < 6 */
383 		FAIL_IF(push_inst(compiler, MULT | S(src1) | T(src2), MOVABLE_INS));
384 		FAIL_IF(push_inst(compiler, MFHI | DA(EQUAL_FLAG), EQUAL_FLAG));
385 		FAIL_IF(push_inst(compiler, MFLO | D(dst), DR(dst)));
386 #endif /* SLJIT_MIPS_REV >= 6 */
387 		FAIL_IF(push_inst(compiler, SRA | T(dst) | DA(OTHER_FLAG) | SH_IMM(31), OTHER_FLAG));
388 		return push_inst(compiler, SUBU | SA(EQUAL_FLAG) | TA(OTHER_FLAG) | DA(OTHER_FLAG), OTHER_FLAG);
389 
390 	case SLJIT_AND:
391 		EMIT_LOGICAL(ANDI, AND);
392 		return SLJIT_SUCCESS;
393 
394 	case SLJIT_OR:
395 		EMIT_LOGICAL(ORI, OR);
396 		return SLJIT_SUCCESS;
397 
398 	case SLJIT_XOR:
399 		EMIT_LOGICAL(XORI, XOR);
400 		return SLJIT_SUCCESS;
401 
402 	case SLJIT_SHL:
403 		EMIT_SHIFT(SLL, SLLV);
404 		return SLJIT_SUCCESS;
405 
406 	case SLJIT_LSHR:
407 		EMIT_SHIFT(SRL, SRLV);
408 		return SLJIT_SUCCESS;
409 
410 	case SLJIT_ASHR:
411 		EMIT_SHIFT(SRA, SRAV);
412 		return SLJIT_SUCCESS;
413 	}
414 
415 	SLJIT_UNREACHABLE();
416 	return SLJIT_SUCCESS;
417 }
418 
emit_const(struct sljit_compiler * compiler,sljit_s32 dst,sljit_sw init_value)419 static SLJIT_INLINE sljit_s32 emit_const(struct sljit_compiler *compiler, sljit_s32 dst, sljit_sw init_value)
420 {
421 	FAIL_IF(push_inst(compiler, LUI | T(dst) | IMM(init_value >> 16), DR(dst)));
422 	return push_inst(compiler, ORI | S(dst) | T(dst) | IMM(init_value), DR(dst));
423 }
424 
sljit_set_jump_addr(sljit_uw addr,sljit_uw new_target,sljit_sw executable_offset)425 SLJIT_API_FUNC_ATTRIBUTE void sljit_set_jump_addr(sljit_uw addr, sljit_uw new_target, sljit_sw executable_offset)
426 {
427 	sljit_ins *inst = (sljit_ins *)addr;
428 
429 	SLJIT_ASSERT((inst[0] & 0xffe00000) == LUI && (inst[1] & 0xfc000000) == ORI);
430 	inst[0] = (inst[0] & 0xffff0000) | ((new_target >> 16) & 0xffff);
431 	inst[1] = (inst[1] & 0xffff0000) | (new_target & 0xffff);
432 	inst = (sljit_ins *)SLJIT_ADD_EXEC_OFFSET(inst, executable_offset);
433 	SLJIT_CACHE_FLUSH(inst, inst + 2);
434 }
435 
sljit_set_const(sljit_uw addr,sljit_sw new_constant,sljit_sw executable_offset)436 SLJIT_API_FUNC_ATTRIBUTE void sljit_set_const(sljit_uw addr, sljit_sw new_constant, sljit_sw executable_offset)
437 {
438 	sljit_ins *inst = (sljit_ins *)addr;
439 
440 	SLJIT_ASSERT((inst[0] & 0xffe00000) == LUI && (inst[1] & 0xfc000000) == ORI);
441 	inst[0] = (inst[0] & 0xffff0000) | ((new_constant >> 16) & 0xffff);
442 	inst[1] = (inst[1] & 0xffff0000) | (new_constant & 0xffff);
443 	inst = (sljit_ins *)SLJIT_ADD_EXEC_OFFSET(inst, executable_offset);
444 	SLJIT_CACHE_FLUSH(inst, inst + 2);
445 }
446 
call_with_args(struct sljit_compiler * compiler,sljit_s32 arg_types,sljit_ins * ins_ptr)447 static sljit_s32 call_with_args(struct sljit_compiler *compiler, sljit_s32 arg_types, sljit_ins *ins_ptr)
448 {
449 	sljit_s32 stack_offset = 0;
450 	sljit_s32 arg_count = 0;
451 	sljit_s32 float_arg_count = 0;
452 	sljit_s32 word_arg_count = 0;
453 	sljit_s32 types = 0;
454 	sljit_s32 arg_count_save, types_save;
455 	sljit_ins prev_ins = NOP;
456 	sljit_ins ins = NOP;
457 	sljit_u8 offsets[4];
458 
459 	SLJIT_ASSERT(reg_map[TMP_REG1] == 4 && freg_map[TMP_FREG1] == 12);
460 
461 	arg_types >>= SLJIT_DEF_SHIFT;
462 
463 	while (arg_types) {
464 		types = (types << SLJIT_DEF_SHIFT) | (arg_types & SLJIT_DEF_MASK);
465 
466 		switch (arg_types & SLJIT_DEF_MASK) {
467 		case SLJIT_ARG_TYPE_F32:
468 			offsets[arg_count] = (sljit_u8)stack_offset;
469 
470 			if (word_arg_count == 0 && arg_count <= 1)
471 				offsets[arg_count] = 254 + arg_count;
472 
473 			stack_offset += sizeof(sljit_f32);
474 			arg_count++;
475 			float_arg_count++;
476 			break;
477 		case SLJIT_ARG_TYPE_F64:
478 			if (stack_offset & 0x7)
479 				stack_offset += sizeof(sljit_sw);
480 			offsets[arg_count] = (sljit_u8)stack_offset;
481 
482 			if (word_arg_count == 0 && arg_count <= 1)
483 				offsets[arg_count] = 254 + arg_count;
484 
485 			stack_offset += sizeof(sljit_f64);
486 			arg_count++;
487 			float_arg_count++;
488 			break;
489 		default:
490 			offsets[arg_count] = (sljit_u8)stack_offset;
491 			stack_offset += sizeof(sljit_sw);
492 			arg_count++;
493 			word_arg_count++;
494 			break;
495 		}
496 
497 		arg_types >>= SLJIT_DEF_SHIFT;
498 	}
499 
500 	/* Stack is aligned to 16 bytes, max two doubles can be placed on the stack. */
501 	if (stack_offset > 16)
502 		FAIL_IF(push_inst(compiler, ADDIU | S(SLJIT_SP) | T(SLJIT_SP) | IMM(-16), DR(SLJIT_SP)));
503 
504 	types_save = types;
505 	arg_count_save = arg_count;
506 
507 	while (types) {
508 		switch (types & SLJIT_DEF_MASK) {
509 		case SLJIT_ARG_TYPE_F32:
510 			arg_count--;
511 			if (offsets[arg_count] < 254)
512 				ins = SWC1 | S(SLJIT_SP) | FT(float_arg_count) | IMM(offsets[arg_count]);
513 			float_arg_count--;
514 			break;
515 		case SLJIT_ARG_TYPE_F64:
516 			arg_count--;
517 			if (offsets[arg_count] < 254)
518 				ins = SDC1 | S(SLJIT_SP) | FT(float_arg_count) | IMM(offsets[arg_count]);
519 			float_arg_count--;
520 			break;
521 		default:
522 			if (offsets[arg_count - 1] >= 16)
523 				ins = SW | S(SLJIT_SP) | T(word_arg_count) | IMM(offsets[arg_count - 1]);
524 			else if (arg_count != word_arg_count)
525 				ins = ADDU | S(word_arg_count) | TA(0) | DA(4 + (offsets[arg_count - 1] >> 2));
526 			else if (arg_count == 1)
527 				ins = ADDU | S(SLJIT_R0) | TA(0) | DA(4);
528 
529 			arg_count--;
530 			word_arg_count--;
531 			break;
532 		}
533 
534 		if (ins != NOP) {
535 			if (prev_ins != NOP)
536 				FAIL_IF(push_inst(compiler, prev_ins, MOVABLE_INS));
537 			prev_ins = ins;
538 			ins = NOP;
539 		}
540 
541 		types >>= SLJIT_DEF_SHIFT;
542 	}
543 
544 	types = types_save;
545 	arg_count = arg_count_save;
546 
547 	while (types) {
548 		switch (types & SLJIT_DEF_MASK) {
549 		case SLJIT_ARG_TYPE_F32:
550 			arg_count--;
551 			if (offsets[arg_count] == 254)
552 				ins = MOV_S | FMT_S | FS(SLJIT_FR0) | FD(TMP_FREG1);
553 			else if (offsets[arg_count] < 16)
554 				ins = LW | S(SLJIT_SP) | TA(4 + (offsets[arg_count] >> 2)) | IMM(offsets[arg_count]);
555 			break;
556 		case SLJIT_ARG_TYPE_F64:
557 			arg_count--;
558 			if (offsets[arg_count] == 254)
559 				ins = MOV_S | FMT_D | FS(SLJIT_FR0) | FD(TMP_FREG1);
560 			else if (offsets[arg_count] < 16) {
561 				if (prev_ins != NOP)
562 					FAIL_IF(push_inst(compiler, prev_ins, MOVABLE_INS));
563 				prev_ins = LW | S(SLJIT_SP) | TA(4 + (offsets[arg_count] >> 2)) | IMM(offsets[arg_count]);
564 				ins = LW | S(SLJIT_SP) | TA(5 + (offsets[arg_count] >> 2)) | IMM(offsets[arg_count] + sizeof(sljit_sw));
565 			}
566 			break;
567 		default:
568 			arg_count--;
569 			break;
570 		}
571 
572 		if (ins != NOP) {
573 			if (prev_ins != NOP)
574 				FAIL_IF(push_inst(compiler, prev_ins, MOVABLE_INS));
575 			prev_ins = ins;
576 			ins = NOP;
577 		}
578 
579 		types >>= SLJIT_DEF_SHIFT;
580 	}
581 
582 	*ins_ptr = prev_ins;
583 
584 	return SLJIT_SUCCESS;
585 }
586 
post_call_with_args(struct sljit_compiler * compiler,sljit_s32 arg_types)587 static sljit_s32 post_call_with_args(struct sljit_compiler *compiler, sljit_s32 arg_types)
588 {
589 	sljit_s32 stack_offset = 0;
590 
591 	arg_types >>= SLJIT_DEF_SHIFT;
592 
593 	while (arg_types) {
594 		switch (arg_types & SLJIT_DEF_MASK) {
595 		case SLJIT_ARG_TYPE_F32:
596 			stack_offset += sizeof(sljit_f32);
597 			break;
598 		case SLJIT_ARG_TYPE_F64:
599 			if (stack_offset & 0x7)
600 				stack_offset += sizeof(sljit_sw);
601 			stack_offset += sizeof(sljit_f64);
602 			break;
603 		default:
604 			stack_offset += sizeof(sljit_sw);
605 			break;
606 		}
607 
608 		arg_types >>= SLJIT_DEF_SHIFT;
609 	}
610 
611 	/* Stack is aligned to 16 bytes, max two doubles can be placed on the stack. */
612 	if (stack_offset > 16)
613 		return push_inst(compiler, ADDIU | S(SLJIT_SP) | T(SLJIT_SP) | IMM(16), DR(SLJIT_SP));
614 
615 	return SLJIT_SUCCESS;
616 }
617 
sljit_emit_call(struct sljit_compiler * compiler,sljit_s32 type,sljit_s32 arg_types)618 SLJIT_API_FUNC_ATTRIBUTE struct sljit_jump* sljit_emit_call(struct sljit_compiler *compiler, sljit_s32 type,
619 	sljit_s32 arg_types)
620 {
621 	struct sljit_jump *jump;
622 	sljit_ins ins;
623 
624 	CHECK_ERROR_PTR();
625 	CHECK_PTR(check_sljit_emit_call(compiler, type, arg_types));
626 
627 	jump = (struct sljit_jump*)ensure_abuf(compiler, sizeof(struct sljit_jump));
628 	PTR_FAIL_IF(!jump);
629 	set_jump(jump, compiler, type & SLJIT_REWRITABLE_JUMP);
630 	type &= 0xff;
631 
632 	PTR_FAIL_IF(call_with_args(compiler, arg_types, &ins));
633 
634 	SLJIT_ASSERT(DR(PIC_ADDR_REG) == 25 && PIC_ADDR_REG == TMP_REG2);
635 
636 	PTR_FAIL_IF(emit_const(compiler, PIC_ADDR_REG, 0));
637 
638 	jump->flags |= IS_JAL | IS_CALL;
639 	PTR_FAIL_IF(push_inst(compiler, JALR | S(PIC_ADDR_REG) | DA(RETURN_ADDR_REG), UNMOVABLE_INS));
640 	jump->addr = compiler->size;
641 	PTR_FAIL_IF(push_inst(compiler, ins, UNMOVABLE_INS));
642 
643 	PTR_FAIL_IF(post_call_with_args(compiler, arg_types));
644 
645 	return jump;
646 }
647 
sljit_emit_icall(struct sljit_compiler * compiler,sljit_s32 type,sljit_s32 arg_types,sljit_s32 src,sljit_sw srcw)648 SLJIT_API_FUNC_ATTRIBUTE sljit_s32 sljit_emit_icall(struct sljit_compiler *compiler, sljit_s32 type,
649 	sljit_s32 arg_types,
650 	sljit_s32 src, sljit_sw srcw)
651 {
652 	sljit_ins ins;
653 
654 	CHECK_ERROR();
655 	CHECK(check_sljit_emit_icall(compiler, type, arg_types, src, srcw));
656 
657 	SLJIT_ASSERT(DR(PIC_ADDR_REG) == 25 && PIC_ADDR_REG == TMP_REG2);
658 
659 	if (src & SLJIT_IMM)
660 		FAIL_IF(load_immediate(compiler, DR(PIC_ADDR_REG), srcw));
661 	else if (FAST_IS_REG(src))
662 		FAIL_IF(push_inst(compiler, ADDU | S(src) | TA(0) | D(PIC_ADDR_REG), DR(PIC_ADDR_REG)));
663 	else if (src & SLJIT_MEM) {
664 		ADJUST_LOCAL_OFFSET(src, srcw);
665 		FAIL_IF(emit_op_mem(compiler, WORD_DATA | LOAD_DATA, DR(PIC_ADDR_REG), src, srcw));
666 	}
667 
668 	FAIL_IF(call_with_args(compiler, arg_types, &ins));
669 
670 	/* Register input. */
671 	FAIL_IF(push_inst(compiler, JALR | S(PIC_ADDR_REG) | DA(RETURN_ADDR_REG), UNMOVABLE_INS));
672 	FAIL_IF(push_inst(compiler, ins, UNMOVABLE_INS));
673 	return post_call_with_args(compiler, arg_types);
674 }
675