1 /* $NetBSD: sljitNativeSPARC_common.c,v 1.2 2014/06/17 19:33:20 alnsn Exp $ */ 2 3 /* 4 * Stack-less Just-In-Time compiler 5 * 6 * Copyright 2009-2012 Zoltan Herczeg (hzmester@freemail.hu). All rights reserved. 7 * 8 * Redistribution and use in source and binary forms, with or without modification, are 9 * permitted provided that the following conditions are met: 10 * 11 * 1. Redistributions of source code must retain the above copyright notice, this list of 12 * conditions and the following disclaimer. 13 * 14 * 2. Redistributions in binary form must reproduce the above copyright notice, this list 15 * of conditions and the following disclaimer in the documentation and/or other materials 16 * provided with the distribution. 17 * 18 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDER(S) AND CONTRIBUTORS ``AS IS'' AND ANY 19 * EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES 20 * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT 21 * SHALL THE COPYRIGHT HOLDER(S) OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, 22 * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED 23 * TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR 24 * BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN 25 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN 26 * ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 
27  */
28
/* Returns the platform name: the string literal "SPARC" immediately
   followed by whatever SLJIT_CPUINFO expands to. */
29 SLJIT_API_FUNC_ATTRIBUTE SLJIT_CONST char* sljit_get_platform_name(void)
30 {
31 	return "SPARC" SLJIT_CPUINFO;
32 }
33
34 /* Length of an instruction word
35    Both for sparc-32 and sparc-64 */
36 typedef sljit_ui sljit_ins;
37
/* Issues the SPARC `flush` instruction over the instruction words in
   the range [from, to).

   from: first instruction word of the range.
   to:   one past the last instruction word; nothing is done when
         from == to.

   Each iteration flushes at `from` and then advances by two words
   (the assembly variant adds 8 bytes). When the loop stops exactly at
   `to`, one extra flush is issued for the word just before `to`.

   Two implementations are provided: hand-written assembly when
   __SUNPRO_C is defined and below 0x590, extended inline asm otherwise.
   NOTE(review): the assembly variant reads %i0/%i1 directly, so it
   presumably relies on from/to arriving in those registers - confirm. */
38 static void sparc_cache_flush(sljit_ins *from, sljit_ins *to)
39 {
40 #if defined(__SUNPRO_C) && __SUNPRO_C < 0x590
41 	__asm (
42 		/* if (from == to) return */
43 		"cmp %i0, %i1\n"
44 		"be .leave\n"
45 		"nop\n"
46
47 		/* loop until from >= to */
48 		".mainloop:\n"
49 		"flush %i0\n"
50 		"add %i0, 8, %i0\n"
51 		"cmp %i0, %i1\n"
52 		"bcs .mainloop\n"
53 		"nop\n"
54
55 		/* The comparison was done above. */
56 		"bne .leave\n"
57 		/* nop is not necessary here, since the
58 		   sub operation has no side effect. */
59 		"sub %i0, 4, %i0\n"
60 		"flush %i0\n"
61 		".leave:"
62 	);
63 #else
64 	if (SLJIT_UNLIKELY(from == to))
65 		return;
66
67 	do {
68 		__asm__ volatile (
69 			"flush %0\n"
70 			: : "r"(from)
71 		);
72 		/* Operates at least on doubleword. */
73 		from += 2;
74 	} while (from < to);
75
76 	if (from == to) {
77 		/* Flush the last word. */
78 		from --;
79 		__asm__ volatile (
80 			"flush %0\n"
81 			: : "r"(from)
82 		);
83 	}
84 #endif
85 }
86
/* Internal temporary registers. Their indices follow the
   SLJIT_NO_REGISTERS public registers and are translated through
   reg_map like every other register index. */
87 /* TMP_REG2 is not used by getput_arg */
88 #define TMP_REG1	(SLJIT_NO_REGISTERS + 1)
89 #define TMP_REG2	(SLJIT_NO_REGISTERS + 2)
90 #define TMP_REG3	(SLJIT_NO_REGISTERS + 3)
91 #define TMP_REG4	(SLJIT_NO_REGISTERS + 4)
92 #define TMP_LINK	(SLJIT_NO_REGISTERS + 5)
93
/* Temporary floating point registers. These are used with the raw
   (unmapped) field macros DA/S1A/S2A; the << 1 matches the doubling
   done by sljit_get_float_register_index() in this file. */
94 #define TMP_FREG1	(0)
95 #define TMP_FREG2	((SLJIT_FLOAT_REG6 + 1) << 1)
96
/* Translates a register index (public registers followed by the TMP_*
   indices above) into the machine register number that is encoded into
   instructions by D(), S1(), S2() and DR(). */
97 static SLJIT_CONST sljit_ub reg_map[SLJIT_NO_REGISTERS + 7] = {
98 	0, 8, 9, 10, 11, 12, 16, 17, 18, 19, 20, 14, 1, 24, 25, 26, 15
99 };
100
101 /* --------------------------------------------------------------------- */
102 /*  Instruction forms                                                     */
103 /* --------------------------------------------------------------------- */
104
/* Field builders. D/S1/S2 map the register index through reg_map and
   place it at bit 25, bit 14 and bit 0 respectively; DA/S1A/S2A place a
   raw register number in the same fields without mapping.
   IMM_ARG is bit 13 (0x2000); IMM() masks its argument to 13 bits and
   sets IMM_ARG. DOP() places a value at bit 5. */
105 #define D(d)		(reg_map[d] << 25)
106 #define DA(d)		((d) << 25)
107 #define S1(s1)		(reg_map[s1] << 14)
108 #define S2(s2)		(reg_map[s2])
109 #define S1A(s1)		((s1) << 14)
110 #define S2A(s2)		(s2)
111 #define IMM_ARG		0x2000
112 #define DOP(op)		((op) << 5)
113 #define IMM(imm)	(((imm) & 0x1fff) | IMM_ARG)
114
/* DR() yields the mapped machine register number itself (no shift); it
   is passed as the delay_slot argument of push_inst to name the
   destination register of an instruction.
   OPC1/OPC2/OPC3 place opcode fields at bits 30, 22 and 19.
   SET_FLAGS is OPC3(0x10), OR-ed into an opcode by callers that request
   flag updates. */
115 #define DR(dr)		(reg_map[dr])
116 #define OPC1(opcode)	((opcode) << 30)
117 #define OPC2(opcode)	((opcode) << 22)
118 #define OPC3(opcode)	((opcode) << 19)
119 #define SET_FLAGS	OPC3(0x10)
120
/* Base encodings of the instructions emitted by this backend. Register
   and immediate fields are OR-ed in with the macros above.
   Note that NOP and SETHI are defined with the same value. */
121 #define ADD		(OPC1(0x2) | OPC3(0x00))
122 #define ADDC		(OPC1(0x2) | OPC3(0x08))
123 #define AND		(OPC1(0x2) | OPC3(0x01))
124 #define ANDN		(OPC1(0x2) | OPC3(0x05))
125 #define CALL		(OPC1(0x1))
126 #define FABSS		(OPC1(0x2) | OPC3(0x34) | DOP(0x09))
127 #define FADDD		(OPC1(0x2) | OPC3(0x34) | DOP(0x42))
128 #define FADDS		(OPC1(0x2) | OPC3(0x34) | DOP(0x41))
129 #define FCMPD		(OPC1(0x2) | OPC3(0x35) | DOP(0x52))
130 #define FCMPS		(OPC1(0x2) | OPC3(0x35) | DOP(0x51))
131 #define FDIVD		(OPC1(0x2) | OPC3(0x34) | DOP(0x4e))
132 #define FDIVS		(OPC1(0x2) | OPC3(0x34) | DOP(0x4d))
133 #define FMOVS		(OPC1(0x2) | OPC3(0x34) | DOP(0x01))
134 #define FMULD		(OPC1(0x2) | OPC3(0x34) | DOP(0x4a))
135 #define FMULS		(OPC1(0x2) | OPC3(0x34) | DOP(0x49))
136 #define FNEGS		(OPC1(0x2) | OPC3(0x34) | DOP(0x05))
137 #define FSUBD		(OPC1(0x2) | OPC3(0x34) | DOP(0x46))
138 #define FSUBS		(OPC1(0x2) | OPC3(0x34) | DOP(0x45))
139 #define JMPL		(OPC1(0x2) | OPC3(0x38))
140 #define NOP		(OPC1(0x0) | OPC2(0x04))
141 #define OR		(OPC1(0x2) | OPC3(0x02))
142 #define ORN		(OPC1(0x2) | OPC3(0x06))
143 #define RDY		(OPC1(0x2) | OPC3(0x28) | S1A(0))
144 #define RESTORE		(OPC1(0x2) | OPC3(0x3d))
145 #define SAVE		(OPC1(0x2) | OPC3(0x3c))
146 #define SETHI		(OPC1(0x0) | OPC2(0x04))
147 #define SLL		(OPC1(0x2) | OPC3(0x25))
148 #define SLLX		(OPC1(0x2) | OPC3(0x25) | (1 << 12))
149 #define SRA		(OPC1(0x2) | OPC3(0x27))
150 #define SRAX		(OPC1(0x2) | OPC3(0x27) | (1 << 12))
151 #define SRL		(OPC1(0x2) | OPC3(0x26))
152 #define SRLX		(OPC1(0x2) | OPC3(0x26) | (1 << 12))
153 #define SUB		(OPC1(0x2) | OPC3(0x04))
154 #define SUBC		(OPC1(0x2) | OPC3(0x0c))
155 #define TA		(OPC1(0x2) | OPC3(0x3a) | (8 << 25))
156 #define WRY		(OPC1(0x2) | OPC3(0x30) | DA(0))
157 #define XOR		(OPC1(0x2) | OPC3(0x03))
158 #define XNOR		(OPC1(0x2) | OPC3(0x07))
159
/* Definitions that exist only for the 32 bit configuration.
   MAX_DISP / MIN_DISP bound the branch displacement accepted by
   detect_jump_type (a signed 22 bit value, counted in instruction
   words since the byte difference is shifted right by 2 there);
   DISP_MASK selects that 22 bit field when the branch is patched.
   SLL_W is the shift used for scaled index registers: SLL here,
   SLLX in the other configuration. */
160 #if (defined SLJIT_CONFIG_SPARC_32 && SLJIT_CONFIG_SPARC_32)
161 #define MAX_DISP	(0x1fffff)
162 #define MIN_DISP	(-0x200000)
163 #define DISP_MASK	(0x3fffff)
164
165 #define BICC		(OPC1(0x0) | OPC2(0x2))
166 #define FBFCC		(OPC1(0x0) | OPC2(0x6))
167 #define SLL_W		SLL
168 #define SDIV		(OPC1(0x2) | OPC3(0x0f))
169 #define SMUL		(OPC1(0x2) | OPC3(0x0b))
170 #define UDIV		(OPC1(0x2) | OPC3(0x0e))
171 #define UMUL		(OPC1(0x2) | OPC3(0x0a))
172 #else
173 #define SLL_W		SLLX
174 #endif
175
/* Inclusive range of values that fit the signed 13 bit field built by
   IMM(). */
176 #define SIMM_MAX	(0x0fff)
177 #define SIMM_MIN	(-0x1000)
178
179 /* dest_reg is the absolute name of the register
180    Useful for reordering instructions in the delay slot.
*/
/* Appends one instruction word to the compiler's instruction buffer.

   compiler:   compiler instance that owns the buffer.
   ins:        fully encoded instruction word.
   delay_slot: value stored into compiler->delay_slot. The assertion
               accepts, after masking with DST_INS_MASK, either
               UNMOVABLE_INS, MOVABLE_INS, or the value of bits 25-29
               of ins (the field written by D()/DA()).

   Returns SLJIT_SUCCESS after storing the word and incrementing
   compiler->size. A NULL result from ensure_buf is handled by FAIL_IF
   (macro defined elsewhere; presumably returns the compiler error). */
181 static sljit_si push_inst(struct sljit_compiler *compiler, sljit_ins ins, sljit_si delay_slot)
182 {
183 	sljit_ins *ptr;
184 	SLJIT_ASSERT((delay_slot & DST_INS_MASK) == UNMOVABLE_INS
185 		|| (delay_slot & DST_INS_MASK) == MOVABLE_INS
186 		|| (delay_slot & DST_INS_MASK) == ((ins >> 25) & 0x1f));
187 	ptr = (sljit_ins*)ensure_buf(compiler, sizeof(sljit_ins));
188 	FAIL_IF(!ptr);
189 	*ptr = ins;
190 	compiler->size++;
191 	compiler->delay_slot = delay_slot;
192 	return SLJIT_SUCCESS;
193 }
194
/* Tries to replace the generic jump sequence that ends at code_ptr with
   a shorter call or branch.

   jump:     jump descriptor; jump->addr must already hold the address
             of the first word of the sequence (sljit_generate_code sets
             it just before calling).
   code_ptr: address of the last word copied so far.
   code:     start of the generated code; label targets are computed as
             code + label->size.

   Returns the address that the caller should treat as the last written
   word: code_ptr unchanged when nothing was rewritten, otherwise an
   address inside the original sequence, so later words overwrite the
   rest of it. When a rewrite happens, PATCH_CALL or PATCH_B is set in
   jump->flags and jump->addr is updated to the word that the second
   pass of sljit_generate_code must patch. */
195 static SLJIT_INLINE sljit_ins* detect_jump_type(struct sljit_jump *jump, sljit_ins *code_ptr, sljit_ins *code)
196 {
197 	sljit_sw diff;
198 	sljit_uw target_addr;
199 	sljit_ins *inst;
200 	sljit_ins saved_inst;
201
	/* Rewritable jumps always keep the full sequence. */
202 	if (jump->flags & SLJIT_REWRITABLE_JUMP)
203 		return code_ptr;
204
205 	if (jump->flags & JUMP_ADDR)
206 		target_addr = jump->u.target;
207 	else {
208 		SLJIT_ASSERT(jump->flags & JUMP_LABEL);
209 		target_addr = (sljit_uw)(code + jump->u.label->size);
210 	}
211 	inst = (sljit_ins*)jump->addr;
212
213 #if (defined SLJIT_CONFIG_SPARC_32 && SLJIT_CONFIG_SPARC_32)
214 	if (jump->flags & IS_CALL) {
215 		/* Call is always patchable on sparc 32. */
216 		jump->flags |= PATCH_CALL;
217 		if (jump->flags & IS_MOVABLE) {
			/* Swap: the preceding instruction is placed after
			   the CALL, which takes its former position. */
218 			inst[0] = inst[-1];
219 			inst[-1] = CALL;
220 			jump->addr -= sizeof(sljit_ins);
221 			return inst;
222 		}
223 		inst[0] = CALL;
224 		inst[1] = NOP;
225 		return inst + 1;
226 	}
227 #else
228 	/* Both calls and BPr instructions shall not pass this point. */
229 #error "Implementation required"
230 #endif
231
	/* NOTE(review): for conditional jumps the word before the sequence
	   is included; presumably it is the branch emitted ahead of it. */
232 	if (jump->flags & IS_COND)
233 		inst--;
234
235 	if (jump->flags & IS_MOVABLE) {
		/* Displacement in words, measured from the slot one word
		   earlier, where the branch will be placed. */
236 		diff = ((sljit_sw)target_addr - (sljit_sw)(inst - 1)) >> 2;
237 		if (diff <= MAX_DISP && diff >= MIN_DISP) {
238 			jump->flags |= PATCH_B;
239 			inst--;
240 			if (jump->flags & IS_COND) {
				/* Exchange the two words and toggle bit 28 of
				   the branch. NOTE(review): presumably this
				   inverts the branch condition - confirm. */
241 				saved_inst = inst[0];
242 				inst[0] = inst[1] ^ (1 << 28);
243 				inst[1] = saved_inst;
244 			} else {
				/* Move the previous instruction behind a BICC
				   whose bits 25+ hold 0x8. */
245 				inst[1] = inst[0];
246 				inst[0] = BICC | DA(0x8);
247 			}
248 			jump->addr = (sljit_uw)inst;
249 			return inst + 1;
250 		}
251 	}
252
	/* Same attempt without moving the previous instruction: the branch
	   is followed by a NOP. */
253 	diff = ((sljit_sw)target_addr - (sljit_sw)(inst)) >> 2;
254 	if (diff <= MAX_DISP && diff >= MIN_DISP) {
255 		jump->flags |= PATCH_B;
256 		if (jump->flags & IS_COND)
257 			inst[0] ^= (1 << 28);
258 		else
259 			inst[0] = BICC | DA(0x8);
260 		inst[1] = NOP;
261 		jump->addr = (sljit_uw)inst;
262 		return inst + 1;
263 	}
264
265 	return code_ptr;
266 }
267
/* Produces the final machine code from the instruction words collected
   in the compiler.

   First pass: copies every word from the compiler's fragment list into
   memory obtained from SLJIT_MALLOC_EXEC, records the final address of
   each label, jump and const when its word index is reached, and lets
   detect_jump_type shorten jump sequences.
   Second pass: walks the jump list and writes the target into each
   jump, either as a CALL displacement (PATCH_CALL), a branch
   displacement (PATCH_B), or into the immediate fields of a two word
   sequence.

   Returns the start of the generated code. On the way out it sets
   compiler->error to SLJIT_ERR_COMPILED, stores the code size in bytes
   in compiler->executable_size and calls SLJIT_CACHE_FLUSH on the
   generated range. Early exits are handled by CHECK_ERROR_PTR and
   PTR_FAIL_WITH_EXEC_IF (macros defined elsewhere). */
268 SLJIT_API_FUNC_ATTRIBUTE void* sljit_generate_code(struct sljit_compiler *compiler)
269 {
270 	struct sljit_memory_fragment *buf;
271 	sljit_ins *code;
272 	sljit_ins *code_ptr;
273 	sljit_ins *buf_ptr;
274 	sljit_ins *buf_end;
275 	sljit_uw word_count;
276 	sljit_uw addr;
277
278 	struct sljit_label *label;
279 	struct sljit_jump *jump;
280 	struct sljit_const *const_;
281
282 	CHECK_ERROR_PTR();
283 	check_sljit_generate_code(compiler);
284 	reverse_buf(compiler);
285
286 	code = (sljit_ins*)SLJIT_MALLOC_EXEC(compiler->size * sizeof(sljit_ins));
287 	PTR_FAIL_WITH_EXEC_IF(code);
288 	buf = compiler->buf;
289
290 	code_ptr = code;
291 	word_count = 0;
292 	label = compiler->labels;
293 	jump = compiler->jumps;
294 	const_ = compiler->consts;
295 	do {
296 		buf_ptr = (sljit_ins*)buf->memory;
		/* used_size >> 2: used_size divided by 4 gives the number of
		   instruction words in this fragment. */
297 		buf_end = buf_ptr + (buf->used_size >> 2);
298 		do {
299 			*code_ptr = *buf_ptr++;
300 			SLJIT_ASSERT(!label || label->size >= word_count);
301 			SLJIT_ASSERT(!jump || jump->addr >= word_count);
302 			SLJIT_ASSERT(!const_ || const_->addr >= word_count);
303 			/* These structures are ordered by their address. */
304 			if (label && label->size == word_count) {
305 				/* Just recording the address. */
306 				label->addr = (sljit_uw)code_ptr;
				/* size now holds the word offset in the output,
				   which detect_jump_type reads for labels. */
307 				label->size = code_ptr - code;
308 				label = label->next;
309 			}
310 			if (jump && jump->addr == word_count) {
				/* Point jump->addr at the start of the jump
				   sequence: 3 words back here, 6 otherwise. */
311 #if (defined SLJIT_CONFIG_SPARC_32 && SLJIT_CONFIG_SPARC_32)
312 				jump->addr = (sljit_uw)(code_ptr - 3);
313 #else
314 				jump->addr = (sljit_uw)(code_ptr - 6);
315 #endif
316 				code_ptr = detect_jump_type(jump, code_ptr, code);
317 				jump = jump->next;
318 			}
319 			if (const_ && const_->addr == word_count) {
320 				/* Just recording the address. */
321 				const_->addr = (sljit_uw)code_ptr;
322 				const_ = const_->next;
323 			}
324 			code_ptr ++;
325 			word_count ++;
326 		} while (buf_ptr < buf_end);
327
328 		buf = buf->next;
329 	} while (buf);
330
	/* A label may be placed right after the last instruction. */
331 	if (label && label->size == word_count) {
332 		label->addr = (sljit_uw)code_ptr;
333 		label->size = code_ptr - code;
334 		label = label->next;
335 	}
336
337 	SLJIT_ASSERT(!label);
338 	SLJIT_ASSERT(!jump);
339 	SLJIT_ASSERT(!const_);
340 	SLJIT_ASSERT(code_ptr - code <= (sljit_si)compiler->size);
341
342 	jump = compiler->jumps;
343 	while (jump) {
		/* do { } while (0) lets each case leave with break. */
344 		do {
345 			addr = (jump->flags & JUMP_LABEL) ? jump->u.label->addr : jump->u.target;
346 			buf_ptr = (sljit_ins*)jump->addr;
347
348 			if (jump->flags & PATCH_CALL) {
				/* Word displacement stored in the low 30 bits. */
349 				addr = (sljit_sw)(addr - jump->addr) >> 2;
350 				SLJIT_ASSERT((sljit_sw)addr <= 0x1fffffff && (sljit_sw)addr >= -0x20000000);
351 				buf_ptr[0] = CALL | (addr & 0x3fffffff);
352 				break;
353 			}
354 			if (jump->flags & PATCH_B) {
				/* Word displacement stored in the DISP_MASK
				   field; the other bits are kept. */
355 				addr = (sljit_sw)(addr - jump->addr) >> 2;
356 				SLJIT_ASSERT((sljit_sw)addr <= MAX_DISP && (sljit_sw)addr >= MIN_DISP);
357 				buf_ptr[0] = (buf_ptr[0] & ~DISP_MASK) | (addr & DISP_MASK);
358 				break;
359 			}
360
361 			/* Set the fields of immediate loads. */
			/* The upper 22 bits of addr go into the first word,
			   the lower 10 bits into the second. */
362 #if (defined SLJIT_CONFIG_SPARC_32 && SLJIT_CONFIG_SPARC_32)
363 			buf_ptr[0] = (buf_ptr[0] & 0xffc00000) | ((addr >> 10) & 0x3fffff);
364 			buf_ptr[1] = (buf_ptr[1] & 0xfffffc00) | (addr & 0x3ff);
365 #else
366 #error "Implementation required"
367 #endif
368 		} while (0);
369 		jump = jump->next;
370 	}
371
372
373 	compiler->error = SLJIT_ERR_COMPILED;
374 	compiler->executable_size = (code_ptr - code) * sizeof(sljit_ins);
375 	SLJIT_CACHE_FLUSH(code, code_ptr);
376 	return code;
377 }
378
379 /* --------------------------------------------------------------------- */
380 /*  Entry, exit                                                          */
381 /* --------------------------------------------------------------------- */
382
383 /* Creates an index in data_transfer_insts array. */
/* The low bits select the table row: LOAD_DATA picks load over store,
   the *_DATA values pick the operand size and SIGNED_DATA the signed
   variants. */
384 #define LOAD_DATA	0x01
385 #define WORD_DATA	0x00
386 #define BYTE_DATA	0x02
387 #define HALF_DATA	0x04
388 #define INT_DATA	0x06
389 #define SIGNED_DATA	0x08
390 /* Separates integer and floating point registers */
/* Code tests (flags & MEM_MASK) <= GPR_REG to recognise an integer
   transfer; DOUBLE_DATA is the first floating point row. */
391 #define GPR_REG		0x0f
392 #define DOUBLE_DATA	0x10
393
/* Mask that extracts the data_transfer_insts index from flags. */
394 #define MEM_MASK	0x1f
395
/* Request flags read by emit_op and the getput_arg helpers:
   WRITE_BACK     - the base register is updated after the access.
   ARG_TEST       - getput_arg_fast only reports whether it could emit.
   ALT_KEEP_CACHE - emit_op does not reset the address cache.
   CUMULATIVE_OP  - emit_op may swap the two sources.
   IMM_OP         - a small immediate source may be encoded directly.
   SRC2_IMM       - set by emit_op once src2 is such an immediate. */
396 #define WRITE_BACK	0x00020
397 #define ARG_TEST	0x00040
398 #define ALT_KEEP_CACHE	0x00080
399 #define CUMULATIVE_OP	0x00100
400 #define IMM_OP		0x00200
401 #define SRC2_IMM	0x00400
402
/* State flags set inside emit_op: destination / second source is a
   register, or an operand could not be handled by getput_arg_fast. */
403 #define REG_DEST	0x00800
404 #define REG2_SOURCE	0x01000
405 #define SLOW_SRC1	0x02000
406 #define SLOW_SRC2	0x04000
407 #define SLOW_DEST	0x08000
408
409 /* SET_FLAGS (0x10 << 19) also belong here!
*/
410
/* Pulls in the word-size specific part of the backend. It is included
   here, after the definitions above; functions used in this file but
   not defined in it (load_immediate, emit_single_op,
   emit_mov_before_return) presumably come from the included file. */
411 #if (defined SLJIT_CONFIG_SPARC_32 && SLJIT_CONFIG_SPARC_32)
412 #include "sljitNativeSPARC_32.c"
413 #else
414 #include "sljitNativeSPARC_64.c"
415 #endif
416
/* Emits the function prologue.

   args:       number of incoming arguments to copy (1 to 3 handled).
   scratches:  stored in compiler->scratches.
   saveds:     stored in compiler->saveds.
   local_size: requested local area in bytes; 23 machine words are added
               and the sum is rounded up to a multiple of 8 before it is
               stored in compiler->local_size.
               NOTE(review): the reason for the 23 extra words is not
               visible here - presumably ABI reserved stack space.

   A SAVE instruction subtracts the final size from SLJIT_LOCALS_REG,
   using an immediate when the size fits SIMM_MAX and TMP_REG1
   otherwise. Then raw machine registers 24, 25 and 26 are copied into
   SLJIT_SAVED_REG1..3 according to args.

   Returns SLJIT_SUCCESS, or leaves early through CHECK_ERROR / FAIL_IF
   (macros defined elsewhere). */
417 SLJIT_API_FUNC_ATTRIBUTE sljit_si sljit_emit_enter(struct sljit_compiler *compiler, sljit_si args, sljit_si scratches, sljit_si saveds, sljit_si local_size)
418 {
419 	CHECK_ERROR();
420 	check_sljit_emit_enter(compiler, args, scratches, saveds, local_size);
421
422 	compiler->scratches = scratches;
423 	compiler->saveds = saveds;
424 #if (defined SLJIT_DEBUG && SLJIT_DEBUG)
425 	compiler->logical_local_size = local_size;
426 #endif
427
428 	local_size += 23 * sizeof(sljit_sw);
	/* Round up to a multiple of 8. */
429 	local_size = (local_size + 7) & ~0x7;
430 	compiler->local_size = local_size;
431
432 	if (local_size <= SIMM_MAX) {
433 		FAIL_IF(push_inst(compiler, SAVE | D(SLJIT_LOCALS_REG) | S1(SLJIT_LOCALS_REG) | IMM(-local_size), UNMOVABLE_INS));
434 	}
435 	else {
436 		FAIL_IF(load_immediate(compiler, TMP_REG1, -local_size));
437 		FAIL_IF(push_inst(compiler, SAVE | D(SLJIT_LOCALS_REG) | S1(SLJIT_LOCALS_REG) | S2(TMP_REG1), UNMOVABLE_INS));
438 	}
439
	/* OR with register 0 as first source acts as a register copy.
	   S2A takes the raw machine register number. */
440 	if (args >= 1)
441 		FAIL_IF(push_inst(compiler, OR | D(SLJIT_SAVED_REG1) | S1(0) | S2A(24), DR(SLJIT_SAVED_REG1)));
442 	if (args >= 2)
443 		FAIL_IF(push_inst(compiler, OR | D(SLJIT_SAVED_REG2) | S1(0) | S2A(25), DR(SLJIT_SAVED_REG2)));
444 	if (args >= 3)
445 		FAIL_IF(push_inst(compiler, OR | D(SLJIT_SAVED_REG3) | S1(0) | S2A(26), DR(SLJIT_SAVED_REG3)));
446
447 	return SLJIT_SUCCESS;
448 }
449
/* Records the same frame information as sljit_emit_enter (scratches,
   saveds and the adjusted, 8 byte rounded local_size) without emitting
   any instruction. args is only passed to the checker. */
450 SLJIT_API_FUNC_ATTRIBUTE void sljit_set_context(struct sljit_compiler *compiler, sljit_si args, sljit_si scratches, sljit_si saveds, sljit_si local_size)
451 {
452 	CHECK_ERROR_VOID();
453 	check_sljit_set_context(compiler, args, scratches, saveds, local_size);
454
455 	compiler->scratches = scratches;
456 	compiler->saveds = saveds;
457 #if (defined SLJIT_DEBUG && SLJIT_DEBUG)
458 	compiler->logical_local_size = local_size;
459 #endif
460
461 	local_size += 23 * sizeof(sljit_sw);
462 	compiler->local_size = (local_size + 7) & ~0x7;
463 }
464
/* Emits the function epilogue.

   op, src, srcw: describe the return value. Unless op is SLJIT_MOV and
   src is a register, emit_mov_before_return is called first and the
   value is then taken from SLJIT_SCRATCH_REG1.

   Two unmovable instructions are emitted: JMPL to raw register 31 plus
   8 with destination register 0, followed by RESTORE, which writes src
   into SLJIT_SCRATCH_REG1.

   Returns the result of the last push_inst, or leaves early through
   CHECK_ERROR / FAIL_IF. */
465 SLJIT_API_FUNC_ATTRIBUTE sljit_si sljit_emit_return(struct sljit_compiler *compiler, sljit_si op, sljit_si src, sljit_sw srcw)
466 {
467 	CHECK_ERROR();
468 	check_sljit_emit_return(compiler, op, src, srcw);
469
470 	if (op != SLJIT_MOV || !FAST_IS_REG(src)) {
471 		FAIL_IF(emit_mov_before_return(compiler, op, src, srcw));
472 		src = SLJIT_SCRATCH_REG1;
473 	}
474
475 	FAIL_IF(push_inst(compiler, JMPL | D(0) | S1A(31) | IMM(8), UNMOVABLE_INS));
476 	return push_inst(compiler, RESTORE | D(SLJIT_SCRATCH_REG1) | S1(src) | S2(0), UNMOVABLE_INS);
477 }
478
479 /* --------------------------------------------------------------------- */
480 /*  Operators                                                            */
481 /* --------------------------------------------------------------------- */
482
/* Selects the first argument in the 32 bit configuration and the second
   one otherwise. Only used for the table below, then undefined. */
483 #if (defined SLJIT_CONFIG_SPARC_32 && SLJIT_CONFIG_SPARC_32)
484 #define ARCH_32_64(a, b)	a
485 #else
486 #define ARCH_32_64(a, b)	b
487 #endif
488
/* Load / store opcodes indexed by (flags & MEM_MASK).
   Row legend used in the per-row comments: first letter u / s for
   unsigned / signed, second letter w / b / h / i for word / byte /
   half / int, last letter s / l for store / load. The final four rows
   start at DOUBLE_DATA: d / s there means double / single precision,
   followed by s / l for store / load. */
489 static SLJIT_CONST sljit_ins data_transfer_insts[16 + 4] = {
490 /* u w s */ ARCH_32_64(OPC1(3) | OPC3(0x04) /* stw */, OPC1(3) | OPC3(0x0e) /* stx */),
491 /* u w l */ ARCH_32_64(OPC1(3) | OPC3(0x00) /* lduw */, OPC1(3) | OPC3(0x0b) /* ldx */),
492 /* u b s */ OPC1(3) | OPC3(0x05) /* stb */,
493 /* u b l */ OPC1(3) | OPC3(0x01) /* ldub */,
494 /* u h s */ OPC1(3) | OPC3(0x06) /* sth */,
495 /* u h l */ OPC1(3) | OPC3(0x02) /* lduh */,
496 /* u i s */ OPC1(3) | OPC3(0x04) /* stw */,
497 /* u i l */ OPC1(3) | OPC3(0x00) /* lduw */,
498
499 /* s w s */ ARCH_32_64(OPC1(3) | OPC3(0x04) /* stw */, OPC1(3) | OPC3(0x0e) /* stx */),
500 /* s w l */ ARCH_32_64(OPC1(3) | OPC3(0x00) /* lduw */, OPC1(3) | OPC3(0x0b) /* ldx */),
501 /* s b s */ OPC1(3) | OPC3(0x05) /* stb */,
502 /* s b l */ OPC1(3) | OPC3(0x09) /* ldsb */,
503 /* s h s */ OPC1(3) | OPC3(0x06) /* sth */,
504 /* s h l */ OPC1(3) | OPC3(0x0a) /* ldsh */,
505 /* s i s */ OPC1(3) | OPC3(0x04) /* stw */,
506 /* s i l */ ARCH_32_64(OPC1(3) | OPC3(0x00) /* lduw */, OPC1(3) | OPC3(0x08) /* ldsw */),
507
508 /* d s */ OPC1(3) | OPC3(0x27),
509 /* d l */ OPC1(3) | OPC3(0x23),
510 /* s s */ OPC1(3) | OPC3(0x24),
511 /* s l */ OPC1(3) | OPC3(0x20),
512 };
513
514 #undef ARCH_32_64
515
516 /* Can perform an operation using at most 1 instruction. */
/* flags: data transfer index plus WRITE_BACK / ARG_TEST / LOAD_DATA.
   reg:   register index (integer transfer) or raw register number
          (floating point transfer) that is loaded or stored.
   arg, argw: memory operand; arg must have SLJIT_MEM set.

   The single instruction form is possible when write back is not
   requested (or there is no base register) and the address is either
   base + offset with offset inside SIMM_MIN..SIMM_MAX, or base + index
   with no shift ((argw & 0x3) == 0).

   Returns 1 when ARG_TEST is set and the form is possible (nothing is
   emitted), -1 after emitting the instruction, 0 when the form is not
   possible. */
517 static sljit_si getput_arg_fast(struct sljit_compiler *compiler, sljit_si flags, sljit_si reg, sljit_si arg, sljit_sw argw)
518 {
519 	SLJIT_ASSERT(arg & SLJIT_MEM);
520
521 	if (!(flags & WRITE_BACK) || !(arg & REG_MASK)) {
522 		if ((!(arg & OFFS_REG_MASK) && argw <= SIMM_MAX && argw >= SIMM_MIN)
523 				|| ((arg & OFFS_REG_MASK) && (argw & 0x3) == 0)) {
524 			/* Works for both absolute and relative addresses (immediate case). */
525 			if (SLJIT_UNLIKELY(flags & ARG_TEST))
526 				return 1;
			/* The delay slot tag names the destination only for
			   integer loads; everything else is MOVABLE_INS. */
527 			FAIL_IF(push_inst(compiler, data_transfer_insts[flags & MEM_MASK]
528 				| ((flags & MEM_MASK) <= GPR_REG ? D(reg) : DA(reg))
529 				| S1(arg & REG_MASK) | ((arg & OFFS_REG_MASK) ? S2(OFFS_REG(arg)) : IMM(argw)),
530 				((flags & MEM_MASK) <= GPR_REG && (flags & LOAD_DATA)) ? DR(reg) : MOVABLE_INS));
531 			return -1;
532 		}
533 	}
534 	return 0;
535 }
536
537 /* See getput_arg below.
538    Note: can_cache is called only for binary operators. Those
539    operators always use word arguments without write back. */
/* Reports whether the address part computed for (arg, argw) could be
   reused for (next_arg, next_argw). Both operands must be memory
   operands.
   Returns 1 when both use the same index register with the same shift,
   or, without an index register, when next_argw - argw fits
   SIMM_MIN..SIMM_MAX; returns 0 otherwise. */
540 static sljit_si can_cache(sljit_si arg, sljit_sw argw, sljit_si next_arg, sljit_sw next_argw)
541 {
542 	SLJIT_ASSERT((arg & SLJIT_MEM) && (next_arg & SLJIT_MEM));
543
544 	/* Simple operation except for updates. */
545 	if (arg & OFFS_REG_MASK) {
		/* Only the low two bits of argw (the shift) matter here. */
546 		argw &= 0x3;
547 		SLJIT_ASSERT(argw);
548 		next_argw &= 0x3;
549 		if ((arg & OFFS_REG_MASK) == (next_arg & OFFS_REG_MASK) && argw == next_argw)
550 			return 1;
551 		return 0;
552 	}
553
554 	if (((next_argw - argw) <= SIMM_MAX && (next_argw - argw) >= SIMM_MIN))
555 		return 1;
556 	return 0;
557 }
558
559 /* Emit the necessary instructions. See can_cache above.
*/
/* General memory access: handles the operands that getput_arg_fast
   rejected.

   flags:     data transfer index plus LOAD_DATA / WRITE_BACK.
   reg:       register that is loaded or stored.
   arg, argw: memory operand (SLJIT_MEM must be set).
   next_arg, next_argw: the memory operand that will be accessed next,
              or a non-memory value when there is none; used to decide
              whether the computed address part is kept in TMP_REG3
              (tracked by compiler->cache_arg / cache_argw).

   The index (shifted index register or loaded offset) is placed in
   arg2, which is TMP_REG3 when cached, reg itself for integer loads
   when reg is not part of the address, or TMP_REG1 otherwise. With
   WRITE_BACK an ADD that updates the base register follows the access.

   Returns the result of the last push_inst, or leaves early through
   FAIL_IF. */
560 static sljit_si getput_arg(struct sljit_compiler *compiler, sljit_si flags, sljit_si reg, sljit_si arg, sljit_sw argw, sljit_si next_arg, sljit_sw next_argw)
561 {
562 	sljit_si base, arg2, delay_slot;
563 	sljit_ins dest;
564
565 	SLJIT_ASSERT(arg & SLJIT_MEM);
566 	if (!(next_arg & SLJIT_MEM)) {
567 		next_arg = 0;
568 		next_argw = 0;
569 	}
570
571 	base = arg & REG_MASK;
572 	if (SLJIT_UNLIKELY(arg & OFFS_REG_MASK)) {
		/* base + (index << shift); a zero shift is handled by
		   getput_arg_fast, hence the assertion. */
573 		argw &= 0x3;
574 		SLJIT_ASSERT(argw != 0);
575
576 		/* Using the cache. */
577 		if (((SLJIT_MEM | (arg & OFFS_REG_MASK)) == compiler->cache_arg) && (argw == compiler->cache_argw))
578 			arg2 = TMP_REG3;
579 		else {
580 			if ((arg & OFFS_REG_MASK) == (next_arg & OFFS_REG_MASK) && argw == (next_argw & 0x3)) {
581 				compiler->cache_arg = SLJIT_MEM | (arg & OFFS_REG_MASK);
582 				compiler->cache_argw = argw;
583 				arg2 = TMP_REG3;
584 			}
585 			else if ((flags & LOAD_DATA) && ((flags & MEM_MASK) <= GPR_REG) && reg != base && reg != OFFS_REG(arg))
586 				arg2 = reg;
587 			else /* It must be a mov operation, so tmp1 must be free to use. */
588 				arg2 = TMP_REG1;
589 			FAIL_IF(push_inst(compiler, SLL_W | D(arg2) | S1(OFFS_REG(arg)) | IMM_ARG | argw, DR(arg2)));
590 		}
591 	}
592 	else {
593 		/* Using the cache. */
594 		if ((compiler->cache_arg == SLJIT_MEM) && (argw - compiler->cache_argw) <= SIMM_MAX && (argw - compiler->cache_argw) >= SIMM_MIN) {
			/* Adjust the cached offset by the difference. */
595 			if (argw != compiler->cache_argw) {
596 				FAIL_IF(push_inst(compiler, ADD | D(TMP_REG3) | S1(TMP_REG3) | IMM(argw - compiler->cache_argw), DR(TMP_REG3)));
597 				compiler->cache_argw = argw;
598 			}
599 			arg2 = TMP_REG3;
600 		} else {
601 			if ((next_argw - argw) <= SIMM_MAX && (next_argw - argw) >= SIMM_MIN) {
602 				compiler->cache_arg = SLJIT_MEM;
603 				compiler->cache_argw = argw;
604 				arg2 = TMP_REG3;
605 			}
606 			else if ((flags & LOAD_DATA) && ((flags & MEM_MASK) <= GPR_REG) && reg != base)
607 				arg2 = reg;
608 			else /* It must be a mov operation, so tmp1 must be free to use. */
609 				arg2 = TMP_REG1;
610 			FAIL_IF(load_immediate(compiler, arg2, argw));
611 		}
612 	}
613
614 	dest = ((flags & MEM_MASK) <= GPR_REG ? D(reg) : DA(reg));
615 	delay_slot = ((flags & MEM_MASK) <= GPR_REG && (flags & LOAD_DATA)) ? DR(reg) : MOVABLE_INS;
	/* No base register: arg2 alone is the address. */
616 	if (!base)
617 		return push_inst(compiler, data_transfer_insts[flags & MEM_MASK] | dest | S1(arg2) | IMM(0), delay_slot);
618 	if (!(flags & WRITE_BACK))
619 		return push_inst(compiler, data_transfer_insts[flags & MEM_MASK] | dest | S1(base) | S2(arg2), delay_slot);
620 	FAIL_IF(push_inst(compiler, data_transfer_insts[flags & MEM_MASK] | dest | S1(base) | S2(arg2), delay_slot));
621 	return push_inst(compiler, ADD | D(base) | S1(base) | S2(arg2), DR(base));
622 }
623
/* Single memory access: tries getput_arg_fast first; otherwise resets
   the address cache and calls getput_arg with no following operand.
   Returns compiler->error after the fast path, or the getput_arg
   result. */
624 static SLJIT_INLINE sljit_si emit_op_mem(struct sljit_compiler *compiler, sljit_si flags, sljit_si reg, sljit_si arg, sljit_sw argw)
625 {
626 	if (getput_arg_fast(compiler, flags, reg, arg, argw))
627 		return compiler->error;
628 	compiler->cache_arg = 0;
629 	compiler->cache_argw = 0;
630 	return getput_arg(compiler, flags, reg, arg, argw, 0, 0);
631 }
632
/* Same as emit_op_mem but keeps the address cache and passes
   (arg2, arg2w) to getput_arg as the operand that is accessed next. */
633 static SLJIT_INLINE sljit_si emit_op_mem2(struct sljit_compiler *compiler, sljit_si flags, sljit_si reg, sljit_si arg1, sljit_sw arg1w, sljit_si arg2, sljit_sw arg2w)
634 {
635 	if (getput_arg_fast(compiler, flags, reg, arg1, arg1w))
636 		return compiler->error;
637 	return getput_arg(compiler, flags, reg, arg1, arg1w, arg2, arg2w);
638 }
639
/* Common driver for integer operations: brings both sources into
   registers (or an immediate), calls emit_single_op and stores the
   result when the destination is in memory.

   op:    opcode handed to emit_single_op.
   flags: data size, SET_FLAGS and the request flags (IMM_OP,
          CUMULATIVE_OP, WRITE_BACK, ALT_KEEP_CACHE); the state flags
          REG_DEST, REG2_SOURCE, SRC2_IMM and SLOW_* are added here.
   dst, dstw / src1, src1w / src2, src2w: operands.

   Returns SLJIT_SUCCESS, compiler->error after a fast store, or the
   result of getput_arg; leaves early through FAIL_IF. */
640 static sljit_si emit_op(struct sljit_compiler *compiler, sljit_si op, sljit_si flags,
641 	sljit_si dst, sljit_sw dstw,
642 	sljit_si src1, sljit_sw src1w,
643 	sljit_si src2, sljit_sw src2w)
644 {
645 	/* arg1 goes to TMP_REG1 or src reg
646 	   arg2 goes to TMP_REG2, imm or src reg
647 	   TMP_REG3 can be used for caching
648 	   result goes to TMP_REG2, so put result can use TMP_REG1 and TMP_REG3. */
649 	sljit_si dst_r = TMP_REG2;
650 	sljit_si src1_r;
651 	sljit_sw src2_r = 0;
652 	sljit_si sugg_src2_r = TMP_REG2;
653
654 	if (!(flags & ALT_KEEP_CACHE)) {
655 		compiler->cache_arg = 0;
656 		compiler->cache_argw = 0;
657 	}
658
659 	if (SLJIT_UNLIKELY(dst == SLJIT_UNUSED)) {
		/* A move with unused destination and a non-memory source
		   emits nothing. */
660 		if (op >= SLJIT_MOV && op <= SLJIT_MOVU_SI && !(src2 & SLJIT_MEM))
661 			return SLJIT_SUCCESS;
662 	}
663 	else if (FAST_IS_REG(dst)) {
664 		dst_r = dst;
665 		flags |= REG_DEST;
		/* For moves, load the source directly into dst. */
666 		if (op >= SLJIT_MOV && op <= SLJIT_MOVU_SI)
667 			sugg_src2_r = dst_r;
668 	}
669 	else if ((dst & SLJIT_MEM) && !getput_arg_fast(compiler, flags | ARG_TEST, TMP_REG1, dst, dstw))
670 		flags |= SLOW_DEST;
671
672 	if (flags & IMM_OP) {
673 		if ((src2 & SLJIT_IMM) && src2w) {
674 			if (src2w <= SIMM_MAX && src2w >= SIMM_MIN) {
675 				flags |= SRC2_IMM;
676 				src2_r = src2w;
677 			}
678 		}
679 		if (!(flags & SRC2_IMM) && (flags & CUMULATIVE_OP) && (src1 & SLJIT_IMM) && src1w) {
680 			if (src1w <= SIMM_MAX && src1w >= SIMM_MIN) {
681 				flags |= SRC2_IMM;
682 				src2_r = src1w;
683
684 				/* And swap arguments. */
685 				src1 = src2;
686 				src1w = src2w;
687 				src2 = SLJIT_IMM;
688 				/* src2w = src2_r unneeded. */
689 			}
690 		}
691 	}
692
693 	/* Source 1. */
694 	if (FAST_IS_REG(src1))
695 		src1_r = src1;
696 	else if (src1 & SLJIT_IMM) {
697 		if (src1w) {
698 			FAIL_IF(load_immediate(compiler, TMP_REG1, src1w));
699 			src1_r = TMP_REG1;
700 		}
701 		else
			/* A zero immediate is taken from register index 0. */
702 			src1_r = 0;
703 	}
704 	else {
705 		if (getput_arg_fast(compiler, flags | LOAD_DATA, TMP_REG1, src1, src1w))
706 			FAIL_IF(compiler->error);
707 		else
708 			flags |= SLOW_SRC1;
709 		src1_r = TMP_REG1;
710 	}
711
712 	/* Source 2. */
713 	if (FAST_IS_REG(src2)) {
714 		src2_r = src2;
715 		flags |= REG2_SOURCE;
		/* Register to memory move: store the source register
		   directly. */
716 		if (!(flags & REG_DEST) && op >= SLJIT_MOV && op <= SLJIT_MOVU_SI)
717 			dst_r = src2_r;
718 	}
719 	else if (src2 & SLJIT_IMM) {
720 		if (!(flags & SRC2_IMM)) {
721 			if (src2w) {
722 				FAIL_IF(load_immediate(compiler, sugg_src2_r, src2w));
723 				src2_r = sugg_src2_r;
724 			}
725 			else {
726 				src2_r = 0;
				/* Storing zero: use register index 0 as the
				   stored register. */
727 				if ((op >= SLJIT_MOV && op <= SLJIT_MOVU_SI) && (dst & SLJIT_MEM))
728 					dst_r = 0;
729 			}
730 		}
731 	}
732 	else {
733 		if (getput_arg_fast(compiler, flags | LOAD_DATA, sugg_src2_r, src2, src2w))
734 			FAIL_IF(compiler->error);
735 		else
736 			flags |= SLOW_SRC2;
737 		src2_r = sugg_src2_r;
738 	}
739
	/* Load the slow operands. With two of them, the order is chosen so
	   that the address cache can be shared with the next access. */
740 	if ((flags & (SLOW_SRC1 | SLOW_SRC2)) == (SLOW_SRC1 | SLOW_SRC2)) {
741 		SLJIT_ASSERT(src2_r == TMP_REG2);
742 		if (!can_cache(src1, src1w, src2, src2w) && can_cache(src1, src1w, dst, dstw)) {
743 			FAIL_IF(getput_arg(compiler, flags | LOAD_DATA, TMP_REG2, src2, src2w, src1, src1w));
744 			FAIL_IF(getput_arg(compiler, flags | LOAD_DATA, TMP_REG1, src1, src1w, dst, dstw));
745 		}
746 		else {
747 			FAIL_IF(getput_arg(compiler, flags | LOAD_DATA, TMP_REG1, src1, src1w, src2, src2w));
748 			FAIL_IF(getput_arg(compiler, flags | LOAD_DATA, TMP_REG2, src2, src2w, dst, dstw));
749 		}
750 	}
751 	else if (flags & SLOW_SRC1)
752 		FAIL_IF(getput_arg(compiler, flags | LOAD_DATA, TMP_REG1, src1, src1w, dst, dstw));
753 	else if (flags & SLOW_SRC2)
754 		FAIL_IF(getput_arg(compiler, flags | LOAD_DATA, sugg_src2_r, src2, src2w, dst, dstw));
755
756 	FAIL_IF(emit_single_op(compiler, op, flags, dst_r, src1_r, src2_r));
757
758 	if (dst & SLJIT_MEM) {
759 		if (!(flags & SLOW_DEST)) {
			/* The ARG_TEST probe above succeeded, so the fast
			   form is used; its status is in compiler->error. */
760 			getput_arg_fast(compiler, flags, dst_r, dst, dstw);
761 			return compiler->error;
762 		}
763 		return getput_arg(compiler, flags, dst_r, dst, dstw, 0, 0);
764 	}
765
766 	return SLJIT_SUCCESS;
767 }
768
/* Emits an operation without explicit operands.

   SLJIT_BREAKPOINT: emits TA.  SLJIT_NOP: emits NOP.
   SLJIT_UMUL / SLJIT_SMUL: multiplies SLJIT_SCRATCH_REG1 by
   SLJIT_SCRATCH_REG2 into SLJIT_SCRATCH_REG1, then RDY writes into
   SLJIT_SCRATCH_REG2.
   SLJIT_UDIV / SLJIT_SDIV: quotient ends up in SLJIT_SCRATCH_REG1 and
   the value (old SCRATCH_REG1 - quotient * SCRATCH_REG2) in
   SLJIT_SCRATCH_REG2.

   Only the 32 bit configuration is implemented. Returns SLJIT_SUCCESS
   (also for opcodes not listed), or leaves early through FAIL_IF. */
769 SLJIT_API_FUNC_ATTRIBUTE sljit_si sljit_emit_op0(struct sljit_compiler *compiler, sljit_si op)
770 {
771 	CHECK_ERROR();
772 	check_sljit_emit_op0(compiler, op);
773
774 	op = GET_OPCODE(op);
775 	switch (op) {
776 	case SLJIT_BREAKPOINT:
777 		return push_inst(compiler, TA, UNMOVABLE_INS);
778 	case SLJIT_NOP:
779 		return push_inst(compiler, NOP, UNMOVABLE_INS);
780 	case SLJIT_UMUL:
781 	case SLJIT_SMUL:
782 #if (defined SLJIT_CONFIG_SPARC_32 && SLJIT_CONFIG_SPARC_32)
783 		FAIL_IF(push_inst(compiler, (op == SLJIT_UMUL ? UMUL : SMUL) | D(SLJIT_SCRATCH_REG1) | S1(SLJIT_SCRATCH_REG1) | S2(SLJIT_SCRATCH_REG2), DR(SLJIT_SCRATCH_REG1)));
784 		return push_inst(compiler, RDY | D(SLJIT_SCRATCH_REG2), DR(SLJIT_SCRATCH_REG2));
785 #else
786 #error "Implementation required"
787 #endif
788 	case SLJIT_UDIV:
789 	case SLJIT_SDIV:
790 #if (defined SLJIT_CONFIG_SPARC_32 && SLJIT_CONFIG_SPARC_32)
		/* WRY is given register index 0 for the unsigned case and
		   SCRATCH_REG1 shifted right arithmetically by 31 (its
		   sign) for the signed case. */
791 		if (op == SLJIT_UDIV)
792 			FAIL_IF(push_inst(compiler, WRY | S1(0), MOVABLE_INS));
793 		else {
794 			FAIL_IF(push_inst(compiler, SRA | D(TMP_REG1) | S1(SLJIT_SCRATCH_REG1) | IMM(31), DR(TMP_REG1)));
795 			FAIL_IF(push_inst(compiler, WRY | S1(TMP_REG1), MOVABLE_INS));
796 		}
		/* Keep a copy of the dividend for the final subtraction. */
797 		FAIL_IF(push_inst(compiler, OR | D(TMP_REG2) | S1(0) | S2(SLJIT_SCRATCH_REG1), DR(TMP_REG2)));
798 		FAIL_IF(push_inst(compiler, (op == SLJIT_UDIV ? UDIV : SDIV) | D(SLJIT_SCRATCH_REG1) | S1(SLJIT_SCRATCH_REG1) | S2(SLJIT_SCRATCH_REG2), DR(SLJIT_SCRATCH_REG1)));
799 		FAIL_IF(push_inst(compiler, SMUL | D(SLJIT_SCRATCH_REG2) | S1(SLJIT_SCRATCH_REG1) | S2(SLJIT_SCRATCH_REG2), DR(SLJIT_SCRATCH_REG2)));
800 		FAIL_IF(push_inst(compiler, SUB | D(SLJIT_SCRATCH_REG2) | S1(TMP_REG2) | S2(SLJIT_SCRATCH_REG2), DR(SLJIT_SCRATCH_REG2)));
801 		return SLJIT_SUCCESS;
802 #else
803 #error "Implementation required"
804 #endif
805 	}
806
807 	return SLJIT_SUCCESS;
808 }
809
/* Emits a one-source operation by forwarding to emit_op.

   The move family maps onto the matching SLJIT_MOV* opcode with the
   data size flags; the SLJIT_MOVU* variants add WRITE_BACK. For byte
   and half-word moves an immediate source is truncated with a cast to
   the target type first. SLJIT_NOT and SLJIT_CLZ are forwarded as is,
   and SLJIT_NEG is emitted as SLJIT_SUB with an immediate 0 as first
   source. TMP_REG1 is passed as the src1 placeholder for the moves.

   Returns the emit_op result, or SLJIT_SUCCESS for an opcode that is
   not listed. */
810 SLJIT_API_FUNC_ATTRIBUTE sljit_si sljit_emit_op1(struct sljit_compiler *compiler, sljit_si op,
811 	sljit_si dst, sljit_sw dstw,
812 	sljit_si src, sljit_sw srcw)
813 {
814 	sljit_si flags = GET_FLAGS(op) ? SET_FLAGS : 0;
815
816 	CHECK_ERROR();
817 	check_sljit_emit_op1(compiler, op, dst, dstw, src, srcw);
818 	ADJUST_LOCAL_OFFSET(dst, dstw);
819 	ADJUST_LOCAL_OFFSET(src, srcw);
820
821 	op = GET_OPCODE(op);
822 	switch (op) {
823 	case SLJIT_MOV:
824 	case SLJIT_MOV_P:
825 		return emit_op(compiler, SLJIT_MOV, flags | WORD_DATA, dst, dstw, TMP_REG1, 0, src, srcw);
826
827 	case SLJIT_MOV_UI:
828 		return emit_op(compiler, SLJIT_MOV_UI, flags | INT_DATA, dst, dstw, TMP_REG1, 0, src, srcw);
829
830 	case SLJIT_MOV_SI:
831 		return emit_op(compiler, SLJIT_MOV_SI, flags | INT_DATA | SIGNED_DATA, dst, dstw, TMP_REG1, 0, src, srcw);
832
833 	case SLJIT_MOV_UB:
834 		return emit_op(compiler, SLJIT_MOV_UB, flags | BYTE_DATA, dst, dstw, TMP_REG1, 0, src, (src & SLJIT_IMM) ? (sljit_ub)srcw : srcw);
835
836 	case SLJIT_MOV_SB:
837 		return emit_op(compiler, SLJIT_MOV_SB, flags | BYTE_DATA | SIGNED_DATA, dst, dstw, TMP_REG1, 0, src, (src & SLJIT_IMM) ? (sljit_sb)srcw : srcw);
838
839 	case SLJIT_MOV_UH:
840 		return emit_op(compiler, SLJIT_MOV_UH, flags | HALF_DATA, dst, dstw, TMP_REG1, 0, src, (src & SLJIT_IMM) ? (sljit_uh)srcw : srcw);
841
842 	case SLJIT_MOV_SH:
843 		return emit_op(compiler, SLJIT_MOV_SH, flags | HALF_DATA | SIGNED_DATA, dst, dstw, TMP_REG1, 0, src, (src & SLJIT_IMM) ? (sljit_sh)srcw : srcw);
844
845 	case SLJIT_MOVU:
846 	case SLJIT_MOVU_P:
847 		return emit_op(compiler, SLJIT_MOV, flags | WORD_DATA | WRITE_BACK, dst, dstw, TMP_REG1, 0, src, srcw);
848
849 	case SLJIT_MOVU_UI:
850 		return emit_op(compiler, SLJIT_MOV_UI, flags | INT_DATA | WRITE_BACK, dst, dstw, TMP_REG1, 0, src, srcw);
851
852 	case SLJIT_MOVU_SI:
853 		return emit_op(compiler, SLJIT_MOV_SI, flags | INT_DATA | SIGNED_DATA | WRITE_BACK, dst, dstw, TMP_REG1, 0, src, srcw);
854
855 	case SLJIT_MOVU_UB:
856 		return emit_op(compiler, SLJIT_MOV_UB, flags | BYTE_DATA | WRITE_BACK, dst, dstw, TMP_REG1, 0, src, (src & SLJIT_IMM) ? (sljit_ub)srcw : srcw);
857
858 	case SLJIT_MOVU_SB:
859 		return emit_op(compiler, SLJIT_MOV_SB, flags | BYTE_DATA | SIGNED_DATA | WRITE_BACK, dst, dstw, TMP_REG1, 0, src, (src & SLJIT_IMM) ? (sljit_sb)srcw : srcw);
860
861 	case SLJIT_MOVU_UH:
862 		return emit_op(compiler, SLJIT_MOV_UH, flags | HALF_DATA | WRITE_BACK, dst, dstw, TMP_REG1, 0, src, (src & SLJIT_IMM) ? (sljit_uh)srcw : srcw);
863
864 	case SLJIT_MOVU_SH:
865 		return emit_op(compiler, SLJIT_MOV_SH, flags | HALF_DATA | SIGNED_DATA | WRITE_BACK, dst, dstw, TMP_REG1, 0, src, (src & SLJIT_IMM) ? (sljit_sh)srcw : srcw);
866
867 	case SLJIT_NOT:
868 	case SLJIT_CLZ:
869 		return emit_op(compiler, op, flags, dst, dstw, TMP_REG1, 0, src, srcw);
870
871 	case SLJIT_NEG:
872 		return emit_op(compiler, SLJIT_SUB, flags | IMM_OP, dst, dstw, SLJIT_IMM, 0, src, srcw);
873 	}
874
875 	return SLJIT_SUCCESS;
876 }
877
/* Emits a two-source operation by forwarding to emit_op.

   ADD, ADDC, MUL, AND, OR and XOR are passed with CUMULATIVE_OP so
   emit_op may swap the sources; SUB and SUBC only get IMM_OP. For the
   shifts an immediate count is masked to 5 bits in the 32 bit
   configuration; the other configuration stops on an assertion.

   Returns the emit_op result, or SLJIT_SUCCESS for an opcode that is
   not listed. */
878 SLJIT_API_FUNC_ATTRIBUTE sljit_si sljit_emit_op2(struct sljit_compiler *compiler, sljit_si op,
879 	sljit_si dst, sljit_sw dstw,
880 	sljit_si src1, sljit_sw src1w,
881 	sljit_si src2, sljit_sw src2w)
882 {
883 	sljit_si flags = GET_FLAGS(op) ? SET_FLAGS : 0;
884
885 	CHECK_ERROR();
886 	check_sljit_emit_op2(compiler, op, dst, dstw, src1, src1w, src2, src2w);
887 	ADJUST_LOCAL_OFFSET(dst, dstw);
888 	ADJUST_LOCAL_OFFSET(src1, src1w);
889 	ADJUST_LOCAL_OFFSET(src2, src2w);
890
891 	op = GET_OPCODE(op);
892 	switch (op) {
893 	case SLJIT_ADD:
894 	case SLJIT_ADDC:
895 	case SLJIT_MUL:
896 	case SLJIT_AND:
897 	case SLJIT_OR:
898 	case SLJIT_XOR:
899 		return emit_op(compiler, op, flags | CUMULATIVE_OP | IMM_OP, dst, dstw, src1, src1w, src2, src2w);
900
901 	case SLJIT_SUB:
902 	case SLJIT_SUBC:
903 		return emit_op(compiler, op, flags | IMM_OP, dst, dstw, src1, src1w, src2, src2w);
904
905 	case SLJIT_SHL:
906 	case SLJIT_LSHR:
907 	case SLJIT_ASHR:
908 #if (defined SLJIT_CONFIG_SPARC_32 && SLJIT_CONFIG_SPARC_32)
909 		if (src2 & SLJIT_IMM)
910 			src2w &= 0x1f;
911 #else
912 		SLJIT_ASSERT_STOP();
913 #endif
914 		return emit_op(compiler, op, flags | IMM_OP, dst, dstw, src1, src1w, src2, src2w);
915 	}
916
917 	return SLJIT_SUCCESS;
918 }
919
/* Returns the machine register number that reg_map assigns to the
   given register index. */
920 SLJIT_API_FUNC_ATTRIBUTE sljit_si sljit_get_register_index(sljit_si reg)
921 {
922 	check_sljit_get_register_index(reg);
923 	return reg_map[reg];
924 }
925
/* Returns the floating point register number for the given index,
   which is the index multiplied by two. */
926 SLJIT_API_FUNC_ATTRIBUTE sljit_si sljit_get_float_register_index(sljit_si reg)
927 {
928 	check_sljit_get_float_register_index(reg);
929 	return reg << 1;
930 }
931
/* Appends a caller supplied instruction word as an unmovable
   instruction.
   instruction: points to the word, which is read through a
                sljit_ins pointer.
   size:        must be 4; this is only checked by SLJIT_ASSERT. */
932 SLJIT_API_FUNC_ATTRIBUTE sljit_si sljit_emit_op_custom(struct sljit_compiler *compiler,
933 	void *instruction, sljit_si size)
934 {
935 	CHECK_ERROR();
936 	check_sljit_emit_op_custom(compiler, instruction, size);
937 	SLJIT_ASSERT(size == 4);
938
939 	return push_inst(compiler, *(sljit_ins*)instruction, UNMOVABLE_INS);
940 }
941
942 /* --------------------------------------------------------------------- */
943 /*  Floating point operators                                             */
944 /* --------------------------------------------------------------------- */
945
/* Returns SLJIT_IS_FPU_AVAILABLE when that macro is defined, and 1
   otherwise. */
946 SLJIT_API_FUNC_ATTRIBUTE sljit_si sljit_is_fpu_available(void)
947 {
948 #ifdef SLJIT_IS_FPU_AVAILABLE
949 	return SLJIT_IS_FPU_AVAILABLE;
950 #else
951 	/* Available by default. */
952 	return 1;
953 #endif
954 }
955
/* FLOAT_DATA: data_transfer_insts index for a floating point access.
   The SLJIT_SINGLE_OP bit (0x100, see the compile time assertion in
   sljit_emit_fop1) is shifted down to 0x2, which selects the single
   precision rows that follow the double precision ones.
   SELECT_FOP: picks the single or the double precision opcode
   according to the same bit.
   Note that the op argument is not parenthesised in either macro. */
956 #define FLOAT_DATA(op) (DOUBLE_DATA | ((op & SLJIT_SINGLE_OP) >> 7))
957 #define SELECT_FOP(op, single, double) ((op & SLJIT_SINGLE_OP) ? single : double)
958
/* Emits a one-source floating point operation.

   SLJIT_CMPD: both operands are brought into registers (memory
   operands go to TMP_FREG1 / TMP_FREG2) and a compare is emitted with
   the FCC_IS_SET tag.
   SLJIT_MOVD, SLJIT_NEGD, SLJIT_ABSD: the source is loaded into the
   destination register when it is in memory; the operation is applied
   to the first register of the pair and, for double precision with
   different source and destination, the second register is copied
   with FMOVS. A memory destination is written from TMP_FREG1, or
   directly from the source register for SLJIT_MOVD.

   Register operands are converted to register numbers by doubling
   them. Returns SLJIT_SUCCESS or the result of push_inst; leaves
   early through CHECK_ERROR / FAIL_IF. */
959 SLJIT_API_FUNC_ATTRIBUTE sljit_si sljit_emit_fop1(struct sljit_compiler *compiler, sljit_si op,
960 	sljit_si dst, sljit_sw dstw,
961 	sljit_si src, sljit_sw srcw)
962 {
963 	sljit_si dst_fr;
964
965 	CHECK_ERROR();
966 	check_sljit_emit_fop1(compiler, op, dst, dstw, src, srcw);
967 	SLJIT_COMPILE_ASSERT((SLJIT_SINGLE_OP == 0x100) && !(DOUBLE_DATA & 0x2), float_transfer_bit_error);
968
969 	compiler->cache_arg = 0;
970 	compiler->cache_argw = 0;
971
972 	if (GET_OPCODE(op) == SLJIT_CMPD) {
		/* For a compare, dst is the first operand, not a result. */
973 		if (dst & SLJIT_MEM) {
974 			FAIL_IF(emit_op_mem2(compiler, FLOAT_DATA(op) | LOAD_DATA, TMP_FREG1, dst, dstw, src, srcw));
975 			dst = TMP_FREG1;
976 		}
977 		else
978 			dst <<= 1;
979
980 		if (src & SLJIT_MEM) {
981 			FAIL_IF(emit_op_mem2(compiler, FLOAT_DATA(op) | LOAD_DATA, TMP_FREG2, src, srcw, 0, 0));
982 			src = TMP_FREG2;
983 		}
984 		else
985 			src <<= 1;
986
987 		return push_inst(compiler, SELECT_FOP(op, FCMPS, FCMPD) | S1A(dst) | S2A(src), FCC_IS_SET | MOVABLE_INS);
988 	}
989
990 	dst_fr = FAST_IS_REG(dst) ? (dst << 1) : TMP_FREG1;
991
992 	if (src & SLJIT_MEM) {
993 		FAIL_IF(emit_op_mem2(compiler, FLOAT_DATA(op) | LOAD_DATA, dst_fr, src, srcw, dst, dstw));
994 		src = dst_fr;
995 	}
996 	else
997 		src <<= 1;
998
999 	switch (GET_OPCODE(op)) {
1000 	case SLJIT_MOVD:
		/* Nothing to copy when the destination is memory: the
		   store below reads the source register directly. */
1001 		if (src != dst_fr && dst_fr != TMP_FREG1) {
1002 			FAIL_IF(push_inst(compiler, FMOVS | DA(dst_fr) | S2A(src), MOVABLE_INS));
1003 			if (!(op & SLJIT_SINGLE_OP))
1004 				FAIL_IF(push_inst(compiler, FMOVS | DA(dst_fr | 1) | S2A(src | 1), MOVABLE_INS));
1005 		}
1006 		break;
1007 	case SLJIT_NEGD:
1008 		FAIL_IF(push_inst(compiler, FNEGS | DA(dst_fr) | S2A(src), MOVABLE_INS));
1009 		if (dst_fr != src && !(op & SLJIT_SINGLE_OP))
1010 			FAIL_IF(push_inst(compiler, FMOVS | DA(dst_fr | 1) | S2A(src | 1), MOVABLE_INS));
1011 		break;
1012 	case SLJIT_ABSD:
1013 		FAIL_IF(push_inst(compiler, FABSS | DA(dst_fr) | S2A(src), MOVABLE_INS));
1014 		if (dst_fr != src && !(op & SLJIT_SINGLE_OP))
1015 			FAIL_IF(push_inst(compiler, FMOVS | DA(dst_fr | 1) | S2A(src | 1), MOVABLE_INS));
1016 		break;
1017 	}
1018
1019 	if (dst_fr == TMP_FREG1) {
1020 		if (GET_OPCODE(op) == SLJIT_MOVD)
1021 			dst_fr = src;
1022 		FAIL_IF(emit_op_mem2(compiler, FLOAT_DATA(op), dst_fr, dst, dstw, 0, 0));
1023 	}
1024
1025 	return SLJIT_SUCCESS;
1026 }
1027
1028 SLJIT_API_FUNC_ATTRIBUTE sljit_si sljit_emit_fop2(struct sljit_compiler *compiler, sljit_si op,
1029 	sljit_si dst, sljit_sw dstw,
1030 	sljit_si src1, sljit_sw src1w,
1031 	sljit_si src2, sljit_sw src2w)
1032 {
1033 	sljit_si dst_fr, flags = 0;
1034
1035 	CHECK_ERROR();
1036 	check_sljit_emit_fop2(compiler, op, dst, dstw, src1, src1w, src2, src2w);
1037
1038 	compiler->cache_arg = 0;
1039 	compiler->cache_argw = 0;
1040
1041 	dst_fr = FAST_IS_REG(dst) ?
(dst << 1) : TMP_FREG2; 1042 1043 if (src1 & SLJIT_MEM) { 1044 if (getput_arg_fast(compiler, FLOAT_DATA(op) | LOAD_DATA, TMP_FREG1, src1, src1w)) { 1045 FAIL_IF(compiler->error); 1046 src1 = TMP_FREG1; 1047 } else 1048 flags |= SLOW_SRC1; 1049 } 1050 else 1051 src1 <<= 1; 1052 1053 if (src2 & SLJIT_MEM) { 1054 if (getput_arg_fast(compiler, FLOAT_DATA(op) | LOAD_DATA, TMP_FREG2, src2, src2w)) { 1055 FAIL_IF(compiler->error); 1056 src2 = TMP_FREG2; 1057 } else 1058 flags |= SLOW_SRC2; 1059 } 1060 else 1061 src2 <<= 1; 1062 1063 if ((flags & (SLOW_SRC1 | SLOW_SRC2)) == (SLOW_SRC1 | SLOW_SRC2)) { 1064 if (!can_cache(src1, src1w, src2, src2w) && can_cache(src1, src1w, dst, dstw)) { 1065 FAIL_IF(getput_arg(compiler, FLOAT_DATA(op) | LOAD_DATA, TMP_FREG2, src2, src2w, src1, src1w)); 1066 FAIL_IF(getput_arg(compiler, FLOAT_DATA(op) | LOAD_DATA, TMP_FREG1, src1, src1w, dst, dstw)); 1067 } 1068 else { 1069 FAIL_IF(getput_arg(compiler, FLOAT_DATA(op) | LOAD_DATA, TMP_FREG1, src1, src1w, src2, src2w)); 1070 FAIL_IF(getput_arg(compiler, FLOAT_DATA(op) | LOAD_DATA, TMP_FREG2, src2, src2w, dst, dstw)); 1071 } 1072 } 1073 else if (flags & SLOW_SRC1) 1074 FAIL_IF(getput_arg(compiler, FLOAT_DATA(op) | LOAD_DATA, TMP_FREG1, src1, src1w, dst, dstw)); 1075 else if (flags & SLOW_SRC2) 1076 FAIL_IF(getput_arg(compiler, FLOAT_DATA(op) | LOAD_DATA, TMP_FREG2, src2, src2w, dst, dstw)); 1077 1078 if (flags & SLOW_SRC1) 1079 src1 = TMP_FREG1; 1080 if (flags & SLOW_SRC2) 1081 src2 = TMP_FREG2; 1082 1083 switch (GET_OPCODE(op)) { 1084 case SLJIT_ADDD: 1085 FAIL_IF(push_inst(compiler, SELECT_FOP(op, FADDS, FADDD) | DA(dst_fr) | S1A(src1) | S2A(src2), MOVABLE_INS)); 1086 break; 1087 1088 case SLJIT_SUBD: 1089 FAIL_IF(push_inst(compiler, SELECT_FOP(op, FSUBS, FSUBD) | DA(dst_fr) | S1A(src1) | S2A(src2), MOVABLE_INS)); 1090 break; 1091 1092 case SLJIT_MULD: 1093 FAIL_IF(push_inst(compiler, SELECT_FOP(op, FMULS, FMULD) | DA(dst_fr) | S1A(src1) | S2A(src2), MOVABLE_INS)); 1094 break; 1095 1096 case 
SLJIT_DIVD: 1097 FAIL_IF(push_inst(compiler, SELECT_FOP(op, FDIVS, FDIVD) | DA(dst_fr) | S1A(src1) | S2A(src2), MOVABLE_INS)); 1098 break; 1099 } 1100 1101 if (dst_fr == TMP_FREG2) 1102 FAIL_IF(emit_op_mem2(compiler, FLOAT_DATA(op), TMP_FREG2, dst, dstw, 0, 0)); 1103 1104 return SLJIT_SUCCESS; 1105 } 1106 1107 #undef FLOAT_DATA 1108 #undef SELECT_FOP 1109 1110 /* --------------------------------------------------------------------- */ 1111 /* Other instructions */ 1112 /* --------------------------------------------------------------------- */ 1113 1114 SLJIT_API_FUNC_ATTRIBUTE sljit_si sljit_emit_fast_enter(struct sljit_compiler *compiler, sljit_si dst, sljit_sw dstw) 1115 { 1116 CHECK_ERROR(); 1117 check_sljit_emit_fast_enter(compiler, dst, dstw); 1118 ADJUST_LOCAL_OFFSET(dst, dstw); 1119 1120 /* For UNUSED dst. Uncommon, but possible. */ 1121 if (dst == SLJIT_UNUSED) 1122 return SLJIT_SUCCESS; 1123 1124 if (FAST_IS_REG(dst)) 1125 return push_inst(compiler, OR | D(dst) | S1(0) | S2(TMP_LINK), DR(dst)); 1126 1127 /* Memory. 
*/ 1128 return emit_op_mem(compiler, WORD_DATA, TMP_LINK, dst, dstw); 1129 } 1130 1131 SLJIT_API_FUNC_ATTRIBUTE sljit_si sljit_emit_fast_return(struct sljit_compiler *compiler, sljit_si src, sljit_sw srcw) 1132 { 1133 CHECK_ERROR(); 1134 check_sljit_emit_fast_return(compiler, src, srcw); 1135 ADJUST_LOCAL_OFFSET(src, srcw); 1136 1137 if (FAST_IS_REG(src)) 1138 FAIL_IF(push_inst(compiler, OR | D(TMP_LINK) | S1(0) | S2(src), DR(TMP_LINK))); 1139 else if (src & SLJIT_MEM) 1140 FAIL_IF(emit_op_mem(compiler, WORD_DATA | LOAD_DATA, TMP_LINK, src, srcw)); 1141 else if (src & SLJIT_IMM) 1142 FAIL_IF(load_immediate(compiler, TMP_LINK, srcw)); 1143 1144 FAIL_IF(push_inst(compiler, JMPL | D(0) | S1(TMP_LINK) | IMM(8), UNMOVABLE_INS)); 1145 return push_inst(compiler, NOP, UNMOVABLE_INS); 1146 } 1147 1148 /* --------------------------------------------------------------------- */ 1149 /* Conditional instructions */ 1150 /* --------------------------------------------------------------------- */ 1151 1152 SLJIT_API_FUNC_ATTRIBUTE struct sljit_label* sljit_emit_label(struct sljit_compiler *compiler) 1153 { 1154 struct sljit_label *label; 1155 1156 CHECK_ERROR_PTR(); 1157 check_sljit_emit_label(compiler); 1158 1159 if (compiler->last_label && compiler->last_label->size == compiler->size) 1160 return compiler->last_label; 1161 1162 label = (struct sljit_label*)ensure_abuf(compiler, sizeof(struct sljit_label)); 1163 PTR_FAIL_IF(!label); 1164 set_label(label, compiler); 1165 compiler->delay_slot = UNMOVABLE_INS; 1166 return label; 1167 } 1168 1169 static sljit_ins get_cc(sljit_si type) 1170 { 1171 switch (type) { 1172 case SLJIT_C_EQUAL: 1173 case SLJIT_C_MUL_NOT_OVERFLOW: 1174 return DA(0x1); 1175 1176 case SLJIT_C_NOT_EQUAL: 1177 case SLJIT_C_MUL_OVERFLOW: 1178 return DA(0x9); 1179 1180 case SLJIT_C_LESS: 1181 return DA(0x5); 1182 1183 case SLJIT_C_GREATER_EQUAL: 1184 return DA(0xd); 1185 1186 case SLJIT_C_GREATER: 1187 return DA(0xc); 1188 1189 case SLJIT_C_LESS_EQUAL: 1190 return 
DA(0x4); 1191 1192 case SLJIT_C_SIG_LESS: 1193 return DA(0x3); 1194 1195 case SLJIT_C_SIG_GREATER_EQUAL: 1196 return DA(0xb); 1197 1198 case SLJIT_C_SIG_GREATER: 1199 return DA(0xa); 1200 1201 case SLJIT_C_SIG_LESS_EQUAL: 1202 return DA(0x2); 1203 1204 case SLJIT_C_OVERFLOW: 1205 return DA(0x7); 1206 1207 case SLJIT_C_NOT_OVERFLOW: 1208 return DA(0xf); 1209 1210 case SLJIT_C_FLOAT_EQUAL: 1211 return DA(0x9); 1212 1213 case SLJIT_C_FLOAT_NOT_EQUAL: /* Unordered. */ 1214 return DA(0x1); 1215 1216 case SLJIT_C_FLOAT_LESS: 1217 return DA(0x4); 1218 1219 case SLJIT_C_FLOAT_GREATER_EQUAL: /* Unordered. */ 1220 return DA(0xc); 1221 1222 case SLJIT_C_FLOAT_LESS_EQUAL: 1223 return DA(0xd); 1224 1225 case SLJIT_C_FLOAT_GREATER: /* Unordered. */ 1226 return DA(0x5); 1227 1228 case SLJIT_C_FLOAT_UNORDERED: 1229 return DA(0x7); 1230 1231 case SLJIT_C_FLOAT_ORDERED: 1232 return DA(0xf); 1233 1234 default: 1235 SLJIT_ASSERT_STOP(); 1236 return DA(0x8); 1237 } 1238 } 1239 1240 SLJIT_API_FUNC_ATTRIBUTE struct sljit_jump* sljit_emit_jump(struct sljit_compiler *compiler, sljit_si type) 1241 { 1242 struct sljit_jump *jump; 1243 1244 CHECK_ERROR_PTR(); 1245 check_sljit_emit_jump(compiler, type); 1246 1247 jump = (struct sljit_jump*)ensure_abuf(compiler, sizeof(struct sljit_jump)); 1248 PTR_FAIL_IF(!jump); 1249 set_jump(jump, compiler, type & SLJIT_REWRITABLE_JUMP); 1250 type &= 0xff; 1251 1252 if (type < SLJIT_C_FLOAT_EQUAL) { 1253 jump->flags |= IS_COND; 1254 if (((compiler->delay_slot & DST_INS_MASK) != UNMOVABLE_INS) && !(compiler->delay_slot & ICC_IS_SET)) 1255 jump->flags |= IS_MOVABLE; 1256 #if (defined SLJIT_CONFIG_SPARC_32 && SLJIT_CONFIG_SPARC_32) 1257 PTR_FAIL_IF(push_inst(compiler, BICC | get_cc(type ^ 1) | 5, UNMOVABLE_INS)); 1258 #else 1259 #error "Implementation required" 1260 #endif 1261 } 1262 else if (type < SLJIT_JUMP) { 1263 jump->flags |= IS_COND; 1264 if (((compiler->delay_slot & DST_INS_MASK) != UNMOVABLE_INS) && !(compiler->delay_slot & FCC_IS_SET)) 1265 
jump->flags |= IS_MOVABLE; 1266 #if (defined SLJIT_CONFIG_SPARC_32 && SLJIT_CONFIG_SPARC_32) 1267 PTR_FAIL_IF(push_inst(compiler, FBFCC | get_cc(type ^ 1) | 5, UNMOVABLE_INS)); 1268 #else 1269 #error "Implementation required" 1270 #endif 1271 } else { 1272 if ((compiler->delay_slot & DST_INS_MASK) != UNMOVABLE_INS) 1273 jump->flags |= IS_MOVABLE; 1274 if (type >= SLJIT_FAST_CALL) 1275 jump->flags |= IS_CALL; 1276 } 1277 1278 PTR_FAIL_IF(emit_const(compiler, TMP_REG2, 0)); 1279 PTR_FAIL_IF(push_inst(compiler, JMPL | D(type >= SLJIT_FAST_CALL ? TMP_LINK : 0) | S1(TMP_REG2) | IMM(0), UNMOVABLE_INS)); 1280 jump->addr = compiler->size; 1281 PTR_FAIL_IF(push_inst(compiler, NOP, UNMOVABLE_INS)); 1282 1283 return jump; 1284 } 1285 1286 SLJIT_API_FUNC_ATTRIBUTE sljit_si sljit_emit_ijump(struct sljit_compiler *compiler, sljit_si type, sljit_si src, sljit_sw srcw) 1287 { 1288 struct sljit_jump *jump = NULL; 1289 sljit_si src_r; 1290 1291 CHECK_ERROR(); 1292 check_sljit_emit_ijump(compiler, type, src, srcw); 1293 ADJUST_LOCAL_OFFSET(src, srcw); 1294 1295 if (FAST_IS_REG(src)) 1296 src_r = src; 1297 else if (src & SLJIT_IMM) { 1298 jump = (struct sljit_jump*)ensure_abuf(compiler, sizeof(struct sljit_jump)); 1299 FAIL_IF(!jump); 1300 set_jump(jump, compiler, JUMP_ADDR); 1301 jump->u.target = srcw; 1302 if ((compiler->delay_slot & DST_INS_MASK) != UNMOVABLE_INS) 1303 jump->flags |= IS_MOVABLE; 1304 if (type >= SLJIT_FAST_CALL) 1305 jump->flags |= IS_CALL; 1306 1307 FAIL_IF(emit_const(compiler, TMP_REG2, 0)); 1308 src_r = TMP_REG2; 1309 } 1310 else { 1311 FAIL_IF(emit_op_mem(compiler, WORD_DATA | LOAD_DATA, TMP_REG2, src, srcw)); 1312 src_r = TMP_REG2; 1313 } 1314 1315 FAIL_IF(push_inst(compiler, JMPL | D(type >= SLJIT_FAST_CALL ? 
TMP_LINK : 0) | S1(src_r) | IMM(0), UNMOVABLE_INS)); 1316 if (jump) 1317 jump->addr = compiler->size; 1318 return push_inst(compiler, NOP, UNMOVABLE_INS); 1319 } 1320 1321 SLJIT_API_FUNC_ATTRIBUTE sljit_si sljit_emit_op_flags(struct sljit_compiler *compiler, sljit_si op, 1322 sljit_si dst, sljit_sw dstw, 1323 sljit_si src, sljit_sw srcw, 1324 sljit_si type) 1325 { 1326 sljit_si reg, flags = (GET_FLAGS(op) ? SET_FLAGS : 0); 1327 1328 CHECK_ERROR(); 1329 check_sljit_emit_op_flags(compiler, op, dst, dstw, src, srcw, type); 1330 ADJUST_LOCAL_OFFSET(dst, dstw); 1331 1332 if (dst == SLJIT_UNUSED) 1333 return SLJIT_SUCCESS; 1334 1335 #if (defined SLJIT_CONFIG_SPARC_32 && SLJIT_CONFIG_SPARC_32) 1336 op = GET_OPCODE(op); 1337 reg = (op < SLJIT_ADD && FAST_IS_REG(dst)) ? dst : TMP_REG2; 1338 1339 compiler->cache_arg = 0; 1340 compiler->cache_argw = 0; 1341 if (op >= SLJIT_ADD && (src & SLJIT_MEM)) { 1342 ADJUST_LOCAL_OFFSET(src, srcw); 1343 FAIL_IF(emit_op_mem2(compiler, WORD_DATA | LOAD_DATA, TMP_REG1, src, srcw, dst, dstw)); 1344 src = TMP_REG1; 1345 srcw = 0; 1346 } 1347 1348 if (type < SLJIT_C_FLOAT_EQUAL) 1349 FAIL_IF(push_inst(compiler, BICC | get_cc(type) | 3, UNMOVABLE_INS)); 1350 else 1351 FAIL_IF(push_inst(compiler, FBFCC | get_cc(type) | 3, UNMOVABLE_INS)); 1352 1353 FAIL_IF(push_inst(compiler, OR | D(reg) | S1(0) | IMM(1), UNMOVABLE_INS)); 1354 FAIL_IF(push_inst(compiler, OR | D(reg) | S1(0) | IMM(0), UNMOVABLE_INS)); 1355 1356 if (op >= SLJIT_ADD) 1357 return emit_op(compiler, op, flags | CUMULATIVE_OP | IMM_OP | ALT_KEEP_CACHE, dst, dstw, src, srcw, TMP_REG2, 0); 1358 1359 return (reg == TMP_REG2) ? 
emit_op_mem(compiler, WORD_DATA, TMP_REG2, dst, dstw) : SLJIT_SUCCESS; 1360 #else 1361 #error "Implementation required" 1362 #endif 1363 } 1364 1365 SLJIT_API_FUNC_ATTRIBUTE struct sljit_const* sljit_emit_const(struct sljit_compiler *compiler, sljit_si dst, sljit_sw dstw, sljit_sw init_value) 1366 { 1367 sljit_si reg; 1368 struct sljit_const *const_; 1369 1370 CHECK_ERROR_PTR(); 1371 check_sljit_emit_const(compiler, dst, dstw, init_value); 1372 ADJUST_LOCAL_OFFSET(dst, dstw); 1373 1374 const_ = (struct sljit_const*)ensure_abuf(compiler, sizeof(struct sljit_const)); 1375 PTR_FAIL_IF(!const_); 1376 set_const(const_, compiler); 1377 1378 reg = SLOW_IS_REG(dst) ? dst : TMP_REG2; 1379 1380 PTR_FAIL_IF(emit_const(compiler, reg, init_value)); 1381 1382 if (dst & SLJIT_MEM) 1383 PTR_FAIL_IF(emit_op_mem(compiler, WORD_DATA, TMP_REG2, dst, dstw)); 1384 return const_; 1385 } 1386