1 /* Subroutines used for MIPS code generation. 2 Copyright (C) 1989, 1990, 1991, 1993, 1994, 1995, 1996, 1997, 1998, 3 1999, 2000, 2001, 2002, 2003, 2004, 2005, 2006, 2007, 2008, 2009 4 Free Software Foundation, Inc. 5 Contributed by A. Lichnewsky, lich@inria.inria.fr. 6 Changes by Michael Meissner, meissner@osf.org. 7 64-bit r4000 support by Ian Lance Taylor, ian@cygnus.com, and 8 Brendan Eich, brendan@microunity.com. 9 10 This file is part of GCC. 11 12 GCC is free software; you can redistribute it and/or modify 13 it under the terms of the GNU General Public License as published by 14 the Free Software Foundation; either version 3, or (at your option) 15 any later version. 16 17 GCC is distributed in the hope that it will be useful, 18 but WITHOUT ANY WARRANTY; without even the implied warranty of 19 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the 20 GNU General Public License for more details. 21 22 You should have received a copy of the GNU General Public License 23 along with GCC; see the file COPYING3. If not see 24 <http://www.gnu.org/licenses/>. */ 25 26 #include "config.h" 27 #include "system.h" 28 #include "coretypes.h" 29 #include "tm.h" 30 #include <signal.h> 31 #include "rtl.h" 32 #include "regs.h" 33 #include "hard-reg-set.h" 34 #include "real.h" 35 #include "insn-config.h" 36 #include "conditions.h" 37 #include "insn-attr.h" 38 #include "recog.h" 39 #include "toplev.h" 40 #include "output.h" 41 #include "tree.h" 42 #include "function.h" 43 #include "expr.h" 44 #include "optabs.h" 45 #include "libfuncs.h" 46 #include "flags.h" 47 #include "reload.h" 48 #include "tm_p.h" 49 #include "ggc.h" 50 #include "gstab.h" 51 #include "hashtab.h" 52 #include "debug.h" 53 #include "target.h" 54 #include "target-def.h" 55 #include "integrate.h" 56 #include "langhooks.h" 57 #include "cfglayout.h" 58 #include "sched-int.h" 59 #include "gimple.h" 60 #include "bitmap.h" 61 #include "diagnostic.h" 62 63 /* True if X is an UNSPEC wrapper around a SYMBOL_REF or LABEL_REF. */ 64 #define UNSPEC_ADDRESS_P(X) \ 65 (GET_CODE (X) == UNSPEC \ 66 && XINT (X, 1) >= UNSPEC_ADDRESS_FIRST \ 67 && XINT (X, 1) < UNSPEC_ADDRESS_FIRST + NUM_SYMBOL_TYPES) 68 69 /* Extract the symbol or label from UNSPEC wrapper X. */ 70 #define UNSPEC_ADDRESS(X) \ 71 XVECEXP (X, 0, 0) 72 73 /* Extract the symbol type from UNSPEC wrapper X. */ 74 #define UNSPEC_ADDRESS_TYPE(X) \ 75 ((enum mips_symbol_type) (XINT (X, 1) - UNSPEC_ADDRESS_FIRST)) 76 77 /* The maximum distance between the top of the stack frame and the 78 value $sp has when we save and restore registers. 79 80 The value for normal-mode code must be a SMALL_OPERAND and must 81 preserve the maximum stack alignment. We therefore use a value 82 of 0x7ff0 in this case. 83 84 MIPS16e SAVE and RESTORE instructions can adjust the stack pointer by 85 up to 0x7f8 bytes and can usually save or restore all the registers 86 that we need to save or restore. (Note that we can only use these 87 instructions for o32, for which the stack alignment is 8 bytes.) 88 89 We use a maximum gap of 0x100 or 0x400 for MIPS16 code when SAVE and 90 RESTORE are not available. We can then use unextended instructions 91 to save and restore registers, and to allocate and deallocate the top 92 part of the frame. */ 93 #define MIPS_MAX_FIRST_STACK_STEP \ 94 (!TARGET_MIPS16 ? 0x7ff0 \ 95 : GENERATE_MIPS16E_SAVE_RESTORE ? 0x7f8 \ 96 : TARGET_64BIT ? 0x100 : 0x400) 97 98 /* True if INSN is a mips.md pattern or asm statement. */ 99 #define USEFUL_INSN_P(INSN) \ 100 (NONDEBUG_INSN_P (INSN) \ 101 && GET_CODE (PATTERN (INSN)) != USE \ 102 && GET_CODE (PATTERN (INSN)) != CLOBBER \ 103 && GET_CODE (PATTERN (INSN)) != ADDR_VEC \ 104 && GET_CODE (PATTERN (INSN)) != ADDR_DIFF_VEC) 105 106 /* If INSN is a delayed branch sequence, return the first instruction 107 in the sequence, otherwise return INSN itself. */ 108 #define SEQ_BEGIN(INSN) \ 109 (INSN_P (INSN) && GET_CODE (PATTERN (INSN)) == SEQUENCE \ 110 ? XVECEXP (PATTERN (INSN), 0, 0) \ 111 : (INSN)) 112 113 /* Likewise for the last instruction in a delayed branch sequence. */ 114 #define SEQ_END(INSN) \ 115 (INSN_P (INSN) && GET_CODE (PATTERN (INSN)) == SEQUENCE \ 116 ? XVECEXP (PATTERN (INSN), 0, XVECLEN (PATTERN (INSN), 0) - 1) \ 117 : (INSN)) 118 119 /* Execute the following loop body with SUBINSN set to each instruction 120 between SEQ_BEGIN (INSN) and SEQ_END (INSN) inclusive. */ 121 #define FOR_EACH_SUBINSN(SUBINSN, INSN) \ 122 for ((SUBINSN) = SEQ_BEGIN (INSN); \ 123 (SUBINSN) != NEXT_INSN (SEQ_END (INSN)); \ 124 (SUBINSN) = NEXT_INSN (SUBINSN)) 125 126 /* True if bit BIT is set in VALUE. */ 127 #define BITSET_P(VALUE, BIT) (((VALUE) & (1 << (BIT))) != 0) 128 129 /* Return the opcode for a ptr_mode load of the form: 130 131 l[wd] DEST, OFFSET(BASE). */ 132 #define MIPS_LOAD_PTR(DEST, OFFSET, BASE) \ 133 (((ptr_mode == DImode ? 0x37 : 0x23) << 26) \ 134 | ((BASE) << 21) \ 135 | ((DEST) << 16) \ 136 | (OFFSET)) 137 138 /* Return the opcode to move register SRC into register DEST. */ 139 #define MIPS_MOVE(DEST, SRC) \ 140 ((TARGET_64BIT ? 0x2d : 0x21) \ 141 | ((DEST) << 11) \ 142 | ((SRC) << 21)) 143 144 /* Return the opcode for: 145 146 lui DEST, VALUE. */ 147 #define MIPS_LUI(DEST, VALUE) \ 148 ((0xf << 26) | ((DEST) << 16) | (VALUE)) 149 150 /* Return the opcode to jump to register DEST. */ 151 #define MIPS_JR(DEST) \ 152 (((DEST) << 21) | 0x8) 153 154 /* Return the opcode for: 155 156 bal . + (1 + OFFSET) * 4. */ 157 #define MIPS_BAL(OFFSET) \ 158 ((0x1 << 26) | (0x11 << 16) | (OFFSET)) 159 160 /* Return the usual opcode for a nop. */ 161 #define MIPS_NOP 0 162 163 /* Classifies an address. 164 165 ADDRESS_REG 166 A natural register + offset address. The register satisfies 167 mips_valid_base_register_p and the offset is a const_arith_operand. 168 169 ADDRESS_LO_SUM 170 A LO_SUM rtx. The first operand is a valid base register and 171 the second operand is a symbolic address. 172 173 ADDRESS_CONST_INT 174 A signed 16-bit constant address. 175 176 ADDRESS_SYMBOLIC: 177 A constant symbolic address. */ 178 enum mips_address_type { 179 ADDRESS_REG, 180 ADDRESS_LO_SUM, 181 ADDRESS_CONST_INT, 182 ADDRESS_SYMBOLIC 183 }; 184 185 /* Enumerates the setting of the -mr10k-cache-barrier option. */ 186 enum mips_r10k_cache_barrier_setting { 187 R10K_CACHE_BARRIER_NONE, 188 R10K_CACHE_BARRIER_STORE, 189 R10K_CACHE_BARRIER_LOAD_STORE 190 }; 191 192 /* Macros to create an enumeration identifier for a function prototype. */ 193 #define MIPS_FTYPE_NAME1(A, B) MIPS_##A##_FTYPE_##B 194 #define MIPS_FTYPE_NAME2(A, B, C) MIPS_##A##_FTYPE_##B##_##C 195 #define MIPS_FTYPE_NAME3(A, B, C, D) MIPS_##A##_FTYPE_##B##_##C##_##D 196 #define MIPS_FTYPE_NAME4(A, B, C, D, E) MIPS_##A##_FTYPE_##B##_##C##_##D##_##E 197 198 /* Classifies the prototype of a built-in function. */ 199 enum mips_function_type { 200 #define DEF_MIPS_FTYPE(NARGS, LIST) MIPS_FTYPE_NAME##NARGS LIST, 201 #include "config/mips/mips-ftypes.def" 202 #undef DEF_MIPS_FTYPE 203 MIPS_MAX_FTYPE_MAX 204 }; 205 206 /* Specifies how a built-in function should be converted into rtl. */ 207 enum mips_builtin_type { 208 /* The function corresponds directly to an .md pattern. The return 209 value is mapped to operand 0 and the arguments are mapped to 210 operands 1 and above. */ 211 MIPS_BUILTIN_DIRECT, 212 213 /* The function corresponds directly to an .md pattern. There is no return 214 value and the arguments are mapped to operands 0 and above. */ 215 MIPS_BUILTIN_DIRECT_NO_TARGET, 216 217 /* The function corresponds to a comparison instruction followed by 218 a mips_cond_move_tf_ps pattern. The first two arguments are the 219 values to compare and the second two arguments are the vector 220 operands for the movt.ps or movf.ps instruction (in assembly order). */ 221 MIPS_BUILTIN_MOVF, 222 MIPS_BUILTIN_MOVT, 223 224 /* The function corresponds to a V2SF comparison instruction. Operand 0 225 of this instruction is the result of the comparison, which has mode 226 CCV2 or CCV4. The function arguments are mapped to operands 1 and 227 above. The function's return value is an SImode boolean that is 228 true under the following conditions: 229 230 MIPS_BUILTIN_CMP_ANY: one of the registers is true 231 MIPS_BUILTIN_CMP_ALL: all of the registers are true 232 MIPS_BUILTIN_CMP_LOWER: the first register is true 233 MIPS_BUILTIN_CMP_UPPER: the second register is true. */ 234 MIPS_BUILTIN_CMP_ANY, 235 MIPS_BUILTIN_CMP_ALL, 236 MIPS_BUILTIN_CMP_UPPER, 237 MIPS_BUILTIN_CMP_LOWER, 238 239 /* As above, but the instruction only sets a single $fcc register. */ 240 MIPS_BUILTIN_CMP_SINGLE, 241 242 /* For generating bposge32 branch instructions in MIPS32 DSP ASE. */ 243 MIPS_BUILTIN_BPOSGE32 244 }; 245 246 /* Invoke MACRO (COND) for each C.cond.fmt condition. */ 247 #define MIPS_FP_CONDITIONS(MACRO) \ 248 MACRO (f), \ 249 MACRO (un), \ 250 MACRO (eq), \ 251 MACRO (ueq), \ 252 MACRO (olt), \ 253 MACRO (ult), \ 254 MACRO (ole), \ 255 MACRO (ule), \ 256 MACRO (sf), \ 257 MACRO (ngle), \ 258 MACRO (seq), \ 259 MACRO (ngl), \ 260 MACRO (lt), \ 261 MACRO (nge), \ 262 MACRO (le), \ 263 MACRO (ngt) 264 265 /* Enumerates the codes above as MIPS_FP_COND_<X>. */ 266 #define DECLARE_MIPS_COND(X) MIPS_FP_COND_ ## X 267 enum mips_fp_condition { 268 MIPS_FP_CONDITIONS (DECLARE_MIPS_COND) 269 }; 270 271 /* Index X provides the string representation of MIPS_FP_COND_<X>. */ 272 #define STRINGIFY(X) #X 273 static const char *const mips_fp_conditions[] = { 274 MIPS_FP_CONDITIONS (STRINGIFY) 275 }; 276 277 /* Information about a function's frame layout. */ 278 struct GTY(()) mips_frame_info { 279 /* The size of the frame in bytes. */ 280 HOST_WIDE_INT total_size; 281 282 /* The number of bytes allocated to variables. */ 283 HOST_WIDE_INT var_size; 284 285 /* The number of bytes allocated to outgoing function arguments. */ 286 HOST_WIDE_INT args_size; 287 288 /* The number of bytes allocated to the .cprestore slot, or 0 if there 289 is no such slot. */ 290 HOST_WIDE_INT cprestore_size; 291 292 /* Bit X is set if the function saves or restores GPR X. */ 293 unsigned int mask; 294 295 /* Likewise FPR X. */ 296 unsigned int fmask; 297 298 /* Likewise doubleword accumulator X ($acX). */ 299 unsigned int acc_mask; 300 301 /* The number of GPRs, FPRs, doubleword accumulators and COP0 302 registers saved. */ 303 unsigned int num_gp; 304 unsigned int num_fp; 305 unsigned int num_acc; 306 unsigned int num_cop0_regs; 307 308 /* The offset of the topmost GPR, FPR, accumulator and COP0-register 309 save slots from the top of the frame, or zero if no such slots are 310 needed. */ 311 HOST_WIDE_INT gp_save_offset; 312 HOST_WIDE_INT fp_save_offset; 313 HOST_WIDE_INT acc_save_offset; 314 HOST_WIDE_INT cop0_save_offset; 315 316 /* Likewise, but giving offsets from the bottom of the frame. */ 317 HOST_WIDE_INT gp_sp_offset; 318 HOST_WIDE_INT fp_sp_offset; 319 HOST_WIDE_INT acc_sp_offset; 320 HOST_WIDE_INT cop0_sp_offset; 321 322 /* Similar, but the value passed to _mcount. */ 323 HOST_WIDE_INT ra_fp_offset; 324 325 /* The offset of arg_pointer_rtx from the bottom of the frame. */ 326 HOST_WIDE_INT arg_pointer_offset; 327 328 /* The offset of hard_frame_pointer_rtx from the bottom of the frame. */ 329 HOST_WIDE_INT hard_frame_pointer_offset; 330 }; 331 332 struct GTY(()) machine_function { 333 /* The register returned by mips16_gp_pseudo_reg; see there for details. */ 334 rtx mips16_gp_pseudo_rtx; 335 336 /* The number of extra stack bytes taken up by register varargs. 337 This area is allocated by the callee at the very top of the frame. */ 338 int varargs_size; 339 340 /* The current frame information, calculated by mips_compute_frame_info. */ 341 struct mips_frame_info frame; 342 343 /* The register to use as the function's global pointer, or INVALID_REGNUM 344 if the function doesn't need one. */ 345 unsigned int global_pointer; 346 347 /* How many instructions it takes to load a label into $AT, or 0 if 348 this property hasn't yet been calculated. */ 349 unsigned int load_label_num_insns; 350 351 /* True if mips_adjust_insn_length should ignore an instruction's 352 hazard attribute. */ 353 bool ignore_hazard_length_p; 354 355 /* True if the whole function is suitable for .set noreorder and 356 .set nomacro. */ 357 bool all_noreorder_p; 358 359 /* True if the function has "inflexible" and "flexible" references 360 to the global pointer. See mips_cfun_has_inflexible_gp_ref_p 361 and mips_cfun_has_flexible_gp_ref_p for details. */ 362 bool has_inflexible_gp_insn_p; 363 bool has_flexible_gp_insn_p; 364 365 /* True if the function's prologue must load the global pointer 366 value into pic_offset_table_rtx and store the same value in 367 the function's cprestore slot (if any). Even if this value 368 is currently false, we may decide to set it to true later; 369 see mips_must_initialize_gp_p () for details. */ 370 bool must_initialize_gp_p; 371 372 /* True if the current function must restore $gp after any potential 373 clobber. This value is only meaningful during the first post-epilogue 374 split_insns pass; see mips_must_initialize_gp_p () for details. */ 375 bool must_restore_gp_when_clobbered_p; 376 377 /* True if we have emitted an instruction to initialize 378 mips16_gp_pseudo_rtx. */ 379 bool initialized_mips16_gp_pseudo_p; 380 381 /* True if this is an interrupt handler. */ 382 bool interrupt_handler_p; 383 384 /* True if this is an interrupt handler that uses shadow registers. */ 385 bool use_shadow_register_set_p; 386 387 /* True if this is an interrupt handler that should keep interrupts 388 masked. */ 389 bool keep_interrupts_masked_p; 390 391 /* True if this is an interrupt handler that should use DERET 392 instead of ERET. */ 393 bool use_debug_exception_return_p; 394 }; 395 396 /* Information about a single argument. */ 397 struct mips_arg_info { 398 /* True if the argument is passed in a floating-point register, or 399 would have been if we hadn't run out of registers. */ 400 bool fpr_p; 401 402 /* The number of words passed in registers, rounded up. */ 403 unsigned int reg_words; 404 405 /* For EABI, the offset of the first register from GP_ARG_FIRST or 406 FP_ARG_FIRST. For other ABIs, the offset of the first register from 407 the start of the ABI's argument structure (see the CUMULATIVE_ARGS 408 comment for details). 409 410 The value is MAX_ARGS_IN_REGISTERS if the argument is passed entirely 411 on the stack. */ 412 unsigned int reg_offset; 413 414 /* The number of words that must be passed on the stack, rounded up. */ 415 unsigned int stack_words; 416 417 /* The offset from the start of the stack overflow area of the argument's 418 first stack word. Only meaningful when STACK_WORDS is nonzero. */ 419 unsigned int stack_offset; 420 }; 421 422 /* Information about an address described by mips_address_type. 423 424 ADDRESS_CONST_INT 425 No fields are used. 426 427 ADDRESS_REG 428 REG is the base register and OFFSET is the constant offset. 429 430 ADDRESS_LO_SUM 431 REG and OFFSET are the operands to the LO_SUM and SYMBOL_TYPE 432 is the type of symbol it references. 433 434 ADDRESS_SYMBOLIC 435 SYMBOL_TYPE is the type of symbol that the address references. */ 436 struct mips_address_info { 437 enum mips_address_type type; 438 rtx reg; 439 rtx offset; 440 enum mips_symbol_type symbol_type; 441 }; 442 443 /* One stage in a constant building sequence. These sequences have 444 the form: 445 446 A = VALUE[0] 447 A = A CODE[1] VALUE[1] 448 A = A CODE[2] VALUE[2] 449 ... 450 451 where A is an accumulator, each CODE[i] is a binary rtl operation 452 and each VALUE[i] is a constant integer. CODE[0] is undefined. */ 453 struct mips_integer_op { 454 enum rtx_code code; 455 unsigned HOST_WIDE_INT value; 456 }; 457 458 /* The largest number of operations needed to load an integer constant. 459 The worst accepted case for 64-bit constants is LUI,ORI,SLL,ORI,SLL,ORI. 460 When the lowest bit is clear, we can try, but reject a sequence with 461 an extra SLL at the end. */ 462 #define MIPS_MAX_INTEGER_OPS 7 463 464 /* Information about a MIPS16e SAVE or RESTORE instruction. */ 465 struct mips16e_save_restore_info { 466 /* The number of argument registers saved by a SAVE instruction. 467 0 for RESTORE instructions. */ 468 unsigned int nargs; 469 470 /* Bit X is set if the instruction saves or restores GPR X. */ 471 unsigned int mask; 472 473 /* The total number of bytes to allocate. */ 474 HOST_WIDE_INT size; 475 }; 476 477 /* Global variables for machine-dependent things. */ 478 479 /* The -G setting, or the configuration's default small-data limit if 480 no -G option is given. */ 481 static unsigned int mips_small_data_threshold; 482 483 /* The number of file directives written by mips_output_filename. */ 484 int num_source_filenames; 485 486 /* The name that appeared in the last .file directive written by 487 mips_output_filename, or "" if mips_output_filename hasn't 488 written anything yet. */ 489 const char *current_function_file = ""; 490 491 /* A label counter used by PUT_SDB_BLOCK_START and PUT_SDB_BLOCK_END. */ 492 int sdb_label_count; 493 494 /* Arrays that map GCC register numbers to debugger register numbers. */ 495 int mips_dbx_regno[FIRST_PSEUDO_REGISTER]; 496 int mips_dwarf_regno[FIRST_PSEUDO_REGISTER]; 497 498 /* The nesting depth of the PRINT_OPERAND '%(', '%<' and '%[' constructs. */ 499 struct mips_asm_switch mips_noreorder = { "reorder", 0 }; 500 struct mips_asm_switch mips_nomacro = { "macro", 0 }; 501 struct mips_asm_switch mips_noat = { "at", 0 }; 502 503 /* True if we're writing out a branch-likely instruction rather than a 504 normal branch. */ 505 static bool mips_branch_likely; 506 507 /* The current instruction-set architecture. */ 508 enum processor_type mips_arch; 509 const struct mips_cpu_info *mips_arch_info; 510 511 /* The processor that we should tune the code for. */ 512 enum processor_type mips_tune; 513 const struct mips_cpu_info *mips_tune_info; 514 515 /* The ISA level associated with mips_arch. */ 516 int mips_isa; 517 518 /* The architecture selected by -mipsN, or null if -mipsN wasn't used. */ 519 static const struct mips_cpu_info *mips_isa_option_info; 520 521 /* Which ABI to use. */ 522 int mips_abi = MIPS_ABI_DEFAULT; 523 524 /* Which cost information to use. */ 525 const struct mips_rtx_cost_data *mips_cost; 526 527 /* The ambient target flags, excluding MASK_MIPS16. */ 528 static int mips_base_target_flags; 529 530 /* True if MIPS16 is the default mode. */ 531 bool mips_base_mips16; 532 533 /* The ambient values of other global variables. */ 534 static int mips_base_schedule_insns; /* flag_schedule_insns */ 535 static int mips_base_reorder_blocks_and_partition; /* flag_reorder... */ 536 static int mips_base_move_loop_invariants; /* flag_move_loop_invariants */ 537 static int mips_base_align_loops; /* align_loops */ 538 static int mips_base_align_jumps; /* align_jumps */ 539 static int mips_base_align_functions; /* align_functions */ 540 541 /* The -mcode-readable setting. */ 542 enum mips_code_readable_setting mips_code_readable = CODE_READABLE_YES; 543 544 /* The -mr10k-cache-barrier setting. */ 545 static enum mips_r10k_cache_barrier_setting mips_r10k_cache_barrier; 546 547 /* Index [M][R] is true if register R is allowed to hold a value of mode M. */ 548 bool mips_hard_regno_mode_ok[(int) MAX_MACHINE_MODE][FIRST_PSEUDO_REGISTER]; 549 550 /* Index C is true if character C is a valid PRINT_OPERAND punctation 551 character. */ 552 bool mips_print_operand_punct[256]; 553 554 static GTY (()) int mips_output_filename_first_time = 1; 555 556 /* mips_split_p[X] is true if symbols of type X can be split by 557 mips_split_symbol. */ 558 bool mips_split_p[NUM_SYMBOL_TYPES]; 559 560 /* mips_split_hi_p[X] is true if the high parts of symbols of type X 561 can be split by mips_split_symbol. */ 562 bool mips_split_hi_p[NUM_SYMBOL_TYPES]; 563 564 /* mips_lo_relocs[X] is the relocation to use when a symbol of type X 565 appears in a LO_SUM. It can be null if such LO_SUMs aren't valid or 566 if they are matched by a special .md file pattern. */ 567 static const char *mips_lo_relocs[NUM_SYMBOL_TYPES]; 568 569 /* Likewise for HIGHs. */ 570 static const char *mips_hi_relocs[NUM_SYMBOL_TYPES]; 571 572 /* Index R is the smallest register class that contains register R. */ 573 const enum reg_class mips_regno_to_class[FIRST_PSEUDO_REGISTER] = { 574 LEA_REGS, LEA_REGS, M16_REGS, V1_REG, 575 M16_REGS, M16_REGS, M16_REGS, M16_REGS, 576 LEA_REGS, LEA_REGS, LEA_REGS, LEA_REGS, 577 LEA_REGS, LEA_REGS, LEA_REGS, LEA_REGS, 578 M16_REGS, M16_REGS, LEA_REGS, LEA_REGS, 579 LEA_REGS, LEA_REGS, LEA_REGS, LEA_REGS, 580 T_REG, PIC_FN_ADDR_REG, LEA_REGS, LEA_REGS, 581 LEA_REGS, LEA_REGS, LEA_REGS, LEA_REGS, 582 FP_REGS, FP_REGS, FP_REGS, FP_REGS, 583 FP_REGS, FP_REGS, FP_REGS, FP_REGS, 584 FP_REGS, FP_REGS, FP_REGS, FP_REGS, 585 FP_REGS, FP_REGS, FP_REGS, FP_REGS, 586 FP_REGS, FP_REGS, FP_REGS, FP_REGS, 587 FP_REGS, FP_REGS, FP_REGS, FP_REGS, 588 FP_REGS, FP_REGS, FP_REGS, FP_REGS, 589 FP_REGS, FP_REGS, FP_REGS, FP_REGS, 590 MD0_REG, MD1_REG, NO_REGS, ST_REGS, 591 ST_REGS, ST_REGS, ST_REGS, ST_REGS, 592 ST_REGS, ST_REGS, ST_REGS, NO_REGS, 593 NO_REGS, FRAME_REGS, FRAME_REGS, NO_REGS, 594 COP0_REGS, COP0_REGS, COP0_REGS, COP0_REGS, 595 COP0_REGS, COP0_REGS, COP0_REGS, COP0_REGS, 596 COP0_REGS, COP0_REGS, COP0_REGS, COP0_REGS, 597 COP0_REGS, COP0_REGS, COP0_REGS, COP0_REGS, 598 COP0_REGS, COP0_REGS, COP0_REGS, COP0_REGS, 599 COP0_REGS, COP0_REGS, COP0_REGS, COP0_REGS, 600 COP0_REGS, COP0_REGS, COP0_REGS, COP0_REGS, 601 COP0_REGS, COP0_REGS, COP0_REGS, COP0_REGS, 602 COP2_REGS, COP2_REGS, COP2_REGS, COP2_REGS, 603 COP2_REGS, COP2_REGS, COP2_REGS, COP2_REGS, 604 COP2_REGS, COP2_REGS, COP2_REGS, COP2_REGS, 605 COP2_REGS, COP2_REGS, COP2_REGS, COP2_REGS, 606 COP2_REGS, COP2_REGS, COP2_REGS, COP2_REGS, 607 COP2_REGS, COP2_REGS, COP2_REGS, COP2_REGS, 608 COP2_REGS, COP2_REGS, COP2_REGS, COP2_REGS, 609 COP2_REGS, COP2_REGS, COP2_REGS, COP2_REGS, 610 COP3_REGS, COP3_REGS, COP3_REGS, COP3_REGS, 611 COP3_REGS, COP3_REGS, COP3_REGS, COP3_REGS, 612 COP3_REGS, COP3_REGS, COP3_REGS, COP3_REGS, 613 COP3_REGS, COP3_REGS, COP3_REGS, COP3_REGS, 614 COP3_REGS, COP3_REGS, COP3_REGS, COP3_REGS, 615 COP3_REGS, COP3_REGS, COP3_REGS, COP3_REGS, 616 COP3_REGS, COP3_REGS, COP3_REGS, COP3_REGS, 617 COP3_REGS, COP3_REGS, COP3_REGS, COP3_REGS, 618 DSP_ACC_REGS, DSP_ACC_REGS, DSP_ACC_REGS, DSP_ACC_REGS, 619 DSP_ACC_REGS, DSP_ACC_REGS, ALL_REGS, ALL_REGS, 620 ALL_REGS, ALL_REGS, ALL_REGS, ALL_REGS 621 }; 622 623 /* The value of TARGET_ATTRIBUTE_TABLE. */ 624 static const struct attribute_spec mips_attribute_table[] = { 625 /* { name, min_len, max_len, decl_req, type_req, fn_type_req, handler } */ 626 { "long_call", 0, 0, false, true, true, NULL }, 627 { "far", 0, 0, false, true, true, NULL }, 628 { "near", 0, 0, false, true, true, NULL }, 629 /* We would really like to treat "mips16" and "nomips16" as type 630 attributes, but GCC doesn't provide the hooks we need to support 631 the right conversion rules. As declaration attributes, they affect 632 code generation but don't carry other semantics. */ 633 { "mips16", 0, 0, true, false, false, NULL }, 634 { "nomips16", 0, 0, true, false, false, NULL }, 635 /* Allow functions to be specified as interrupt handlers */ 636 { "interrupt", 0, 0, false, true, true, NULL }, 637 { "use_shadow_register_set", 0, 0, false, true, true, NULL }, 638 { "keep_interrupts_masked", 0, 0, false, true, true, NULL }, 639 { "use_debug_exception_return", 0, 0, false, true, true, NULL }, 640 { NULL, 0, 0, false, false, false, NULL } 641 }; 642 643 /* A table describing all the processors GCC knows about. Names are 644 matched in the order listed. The first mention of an ISA level is 645 taken as the canonical name for that ISA. 646 647 To ease comparison, please keep this table in the same order 648 as GAS's mips_cpu_info_table. Please also make sure that 649 MIPS_ISA_LEVEL_SPEC and MIPS_ARCH_FLOAT_SPEC handle all -march 650 options correctly. */ 651 static const struct mips_cpu_info mips_cpu_info_table[] = { 652 /* Entries for generic ISAs. */ 653 { "mips1", PROCESSOR_R3000, 1, 0 }, 654 { "mips2", PROCESSOR_R6000, 2, 0 }, 655 { "mips3", PROCESSOR_R4000, 3, 0 }, 656 { "mips4", PROCESSOR_R8000, 4, 0 }, 657 /* Prefer not to use branch-likely instructions for generic MIPS32rX 658 and MIPS64rX code. The instructions were officially deprecated 659 in revisions 2 and earlier, but revision 3 is likely to downgrade 660 that to a recommendation to avoid the instructions in code that 661 isn't tuned to a specific processor. */ 662 { "mips32", PROCESSOR_4KC, 32, PTF_AVOID_BRANCHLIKELY }, 663 { "mips32r2", PROCESSOR_M4K, 33, PTF_AVOID_BRANCHLIKELY }, 664 { "mips64", PROCESSOR_5KC, 64, PTF_AVOID_BRANCHLIKELY }, 665 /* ??? For now just tune the generic MIPS64r2 for 5KC as well. */ 666 { "mips64r2", PROCESSOR_5KC, 65, PTF_AVOID_BRANCHLIKELY }, 667 668 /* MIPS I processors. */ 669 { "r3000", PROCESSOR_R3000, 1, 0 }, 670 { "r2000", PROCESSOR_R3000, 1, 0 }, 671 { "r3900", PROCESSOR_R3900, 1, 0 }, 672 673 /* MIPS II processors. */ 674 { "r6000", PROCESSOR_R6000, 2, 0 }, 675 676 /* MIPS III processors. */ 677 { "r4000", PROCESSOR_R4000, 3, 0 }, 678 { "vr4100", PROCESSOR_R4100, 3, 0 }, 679 { "vr4111", PROCESSOR_R4111, 3, 0 }, 680 { "vr4120", PROCESSOR_R4120, 3, 0 }, 681 { "vr4130", PROCESSOR_R4130, 3, 0 }, 682 { "vr4300", PROCESSOR_R4300, 3, 0 }, 683 { "r4400", PROCESSOR_R4000, 3, 0 }, 684 { "r4600", PROCESSOR_R4600, 3, 0 }, 685 { "orion", PROCESSOR_R4600, 3, 0 }, 686 { "r4650", PROCESSOR_R4650, 3, 0 }, 687 /* ST Loongson 2E/2F processors. */ 688 { "loongson2e", PROCESSOR_LOONGSON_2E, 3, PTF_AVOID_BRANCHLIKELY }, 689 { "loongson2f", PROCESSOR_LOONGSON_2F, 3, PTF_AVOID_BRANCHLIKELY }, 690 691 /* MIPS IV processors. */ 692 { "r8000", PROCESSOR_R8000, 4, 0 }, 693 { "r10000", PROCESSOR_R10000, 4, 0 }, 694 { "r12000", PROCESSOR_R10000, 4, 0 }, 695 { "r14000", PROCESSOR_R10000, 4, 0 }, 696 { "r16000", PROCESSOR_R10000, 4, 0 }, 697 { "vr5000", PROCESSOR_R5000, 4, 0 }, 698 { "vr5400", PROCESSOR_R5400, 4, 0 }, 699 { "vr5500", PROCESSOR_R5500, 4, PTF_AVOID_BRANCHLIKELY }, 700 { "rm7000", PROCESSOR_R7000, 4, 0 }, 701 { "rm9000", PROCESSOR_R9000, 4, 0 }, 702 703 /* MIPS32 processors. */ 704 { "4kc", PROCESSOR_4KC, 32, 0 }, 705 { "4km", PROCESSOR_4KC, 32, 0 }, 706 { "4kp", PROCESSOR_4KP, 32, 0 }, 707 { "4ksc", PROCESSOR_4KC, 32, 0 }, 708 709 /* MIPS32 Release 2 processors. */ 710 { "m4k", PROCESSOR_M4K, 33, 0 }, 711 { "4kec", PROCESSOR_4KC, 33, 0 }, 712 { "4kem", PROCESSOR_4KC, 33, 0 }, 713 { "4kep", PROCESSOR_4KP, 33, 0 }, 714 { "4ksd", PROCESSOR_4KC, 33, 0 }, 715 716 { "24kc", PROCESSOR_24KC, 33, 0 }, 717 { "24kf2_1", PROCESSOR_24KF2_1, 33, 0 }, 718 { "24kf", PROCESSOR_24KF2_1, 33, 0 }, 719 { "24kf1_1", PROCESSOR_24KF1_1, 33, 0 }, 720 { "24kfx", PROCESSOR_24KF1_1, 33, 0 }, 721 { "24kx", PROCESSOR_24KF1_1, 33, 0 }, 722 723 { "24kec", PROCESSOR_24KC, 33, 0 }, /* 24K with DSP. */ 724 { "24kef2_1", PROCESSOR_24KF2_1, 33, 0 }, 725 { "24kef", PROCESSOR_24KF2_1, 33, 0 }, 726 { "24kef1_1", PROCESSOR_24KF1_1, 33, 0 }, 727 { "24kefx", PROCESSOR_24KF1_1, 33, 0 }, 728 { "24kex", PROCESSOR_24KF1_1, 33, 0 }, 729 730 { "34kc", PROCESSOR_24KC, 33, 0 }, /* 34K with MT/DSP. */ 731 { "34kf2_1", PROCESSOR_24KF2_1, 33, 0 }, 732 { "34kf", PROCESSOR_24KF2_1, 33, 0 }, 733 { "34kf1_1", PROCESSOR_24KF1_1, 33, 0 }, 734 { "34kfx", PROCESSOR_24KF1_1, 33, 0 }, 735 { "34kx", PROCESSOR_24KF1_1, 33, 0 }, 736 737 { "74kc", PROCESSOR_74KC, 33, 0 }, /* 74K with DSPr2. */ 738 { "74kf2_1", PROCESSOR_74KF2_1, 33, 0 }, 739 { "74kf", PROCESSOR_74KF2_1, 33, 0 }, 740 { "74kf1_1", PROCESSOR_74KF1_1, 33, 0 }, 741 { "74kfx", PROCESSOR_74KF1_1, 33, 0 }, 742 { "74kx", PROCESSOR_74KF1_1, 33, 0 }, 743 { "74kf3_2", PROCESSOR_74KF3_2, 33, 0 }, 744 745 { "1004kc", PROCESSOR_24KC, 33, 0 }, /* 1004K with MT/DSP. */ 746 { "1004kf2_1", PROCESSOR_24KF2_1, 33, 0 }, 747 { "1004kf", PROCESSOR_24KF2_1, 33, 0 }, 748 { "1004kf1_1", PROCESSOR_24KF1_1, 33, 0 }, 749 750 /* MIPS64 processors. */ 751 { "5kc", PROCESSOR_5KC, 64, 0 }, 752 { "5kf", PROCESSOR_5KF, 64, 0 }, 753 { "20kc", PROCESSOR_20KC, 64, PTF_AVOID_BRANCHLIKELY }, 754 { "sb1", PROCESSOR_SB1, 64, PTF_AVOID_BRANCHLIKELY }, 755 { "sb1a", PROCESSOR_SB1A, 64, PTF_AVOID_BRANCHLIKELY }, 756 { "sr71000", PROCESSOR_SR71000, 64, PTF_AVOID_BRANCHLIKELY }, 757 { "xlr", PROCESSOR_XLR, 64, 0 }, 758 759 /* MIPS64 Release 2 processors. */ 760 { "octeon", PROCESSOR_OCTEON, 65, PTF_AVOID_BRANCHLIKELY } 761 }; 762 763 /* Default costs. If these are used for a processor we should look 764 up the actual costs. */ 765 #define DEFAULT_COSTS COSTS_N_INSNS (6), /* fp_add */ \ 766 COSTS_N_INSNS (7), /* fp_mult_sf */ \ 767 COSTS_N_INSNS (8), /* fp_mult_df */ \ 768 COSTS_N_INSNS (23), /* fp_div_sf */ \ 769 COSTS_N_INSNS (36), /* fp_div_df */ \ 770 COSTS_N_INSNS (10), /* int_mult_si */ \ 771 COSTS_N_INSNS (10), /* int_mult_di */ \ 772 COSTS_N_INSNS (69), /* int_div_si */ \ 773 COSTS_N_INSNS (69), /* int_div_di */ \ 774 2, /* branch_cost */ \ 775 4 /* memory_latency */ 776 777 /* Floating-point costs for processors without an FPU. Just assume that 778 all floating-point libcalls are very expensive. */ 779 #define SOFT_FP_COSTS COSTS_N_INSNS (256), /* fp_add */ \ 780 COSTS_N_INSNS (256), /* fp_mult_sf */ \ 781 COSTS_N_INSNS (256), /* fp_mult_df */ \ 782 COSTS_N_INSNS (256), /* fp_div_sf */ \ 783 COSTS_N_INSNS (256) /* fp_div_df */ 784 785 /* Costs to use when optimizing for size. */ 786 static const struct mips_rtx_cost_data mips_rtx_cost_optimize_size = { 787 COSTS_N_INSNS (1), /* fp_add */ 788 COSTS_N_INSNS (1), /* fp_mult_sf */ 789 COSTS_N_INSNS (1), /* fp_mult_df */ 790 COSTS_N_INSNS (1), /* fp_div_sf */ 791 COSTS_N_INSNS (1), /* fp_div_df */ 792 COSTS_N_INSNS (1), /* int_mult_si */ 793 COSTS_N_INSNS (1), /* int_mult_di */ 794 COSTS_N_INSNS (1), /* int_div_si */ 795 COSTS_N_INSNS (1), /* int_div_di */ 796 2, /* branch_cost */ 797 4 /* memory_latency */ 798 }; 799 800 /* Costs to use when optimizing for speed, indexed by processor. */ 801 static const struct mips_rtx_cost_data mips_rtx_cost_data[PROCESSOR_MAX] = { 802 { /* R3000 */ 803 COSTS_N_INSNS (2), /* fp_add */ 804 COSTS_N_INSNS (4), /* fp_mult_sf */ 805 COSTS_N_INSNS (5), /* fp_mult_df */ 806 COSTS_N_INSNS (12), /* fp_div_sf */ 807 COSTS_N_INSNS (19), /* fp_div_df */ 808 COSTS_N_INSNS (12), /* int_mult_si */ 809 COSTS_N_INSNS (12), /* int_mult_di */ 810 COSTS_N_INSNS (35), /* int_div_si */ 811 COSTS_N_INSNS (35), /* int_div_di */ 812 1, /* branch_cost */ 813 4 /* memory_latency */ 814 }, 815 { /* 4KC */ 816 SOFT_FP_COSTS, 817 COSTS_N_INSNS (6), /* int_mult_si */ 818 COSTS_N_INSNS (6), /* int_mult_di */ 819 COSTS_N_INSNS (36), /* int_div_si */ 820 COSTS_N_INSNS (36), /* int_div_di */ 821 1, /* branch_cost */ 822 4 /* memory_latency */ 823 }, 824 { /* 4KP */ 825 SOFT_FP_COSTS, 826 COSTS_N_INSNS (36), /* int_mult_si */ 827 COSTS_N_INSNS (36), /* int_mult_di */ 828 COSTS_N_INSNS (37), /* int_div_si */ 829 COSTS_N_INSNS (37), /* int_div_di */ 830 1, /* branch_cost */ 831 4 /* memory_latency */ 832 }, 833 { /* 5KC */ 834 SOFT_FP_COSTS, 835 COSTS_N_INSNS (4), /* int_mult_si */ 836 COSTS_N_INSNS (11), /* int_mult_di */ 837 COSTS_N_INSNS (36), /* int_div_si */ 838 COSTS_N_INSNS (68), /* int_div_di */ 839 1, /* branch_cost */ 840 4 /* memory_latency */ 841 }, 842 { /* 5KF */ 843 COSTS_N_INSNS (4), /* fp_add */ 844 COSTS_N_INSNS (4), /* fp_mult_sf */ 845 COSTS_N_INSNS (5), /* fp_mult_df */ 846 COSTS_N_INSNS (17), /* fp_div_sf */ 847 COSTS_N_INSNS (32), /* fp_div_df */ 848 COSTS_N_INSNS (4), /* int_mult_si */ 849 COSTS_N_INSNS (11), /* int_mult_di */ 850 COSTS_N_INSNS (36), /* int_div_si */ 851 COSTS_N_INSNS (68), /* int_div_di */ 852 1, /* branch_cost */ 853 4 /* memory_latency */ 854 }, 855 { /* 20KC */ 856 COSTS_N_INSNS (4), /* fp_add */ 857 COSTS_N_INSNS (4), /* fp_mult_sf */ 858 COSTS_N_INSNS (5), /* fp_mult_df */ 859 COSTS_N_INSNS (17), /* fp_div_sf */ 860 COSTS_N_INSNS (32), /* fp_div_df */ 861 COSTS_N_INSNS (4), /* int_mult_si */ 862 COSTS_N_INSNS (7), /* int_mult_di */ 863 COSTS_N_INSNS (42), /* int_div_si */ 864 COSTS_N_INSNS (72), /* int_div_di */ 865 1, /* branch_cost */ 866 4 /* memory_latency */ 867 }, 868 { /* 24KC */ 869 SOFT_FP_COSTS, 870 COSTS_N_INSNS (5), /* int_mult_si */ 871 COSTS_N_INSNS (5), /* int_mult_di */ 872 COSTS_N_INSNS (41), /* int_div_si */ 873 COSTS_N_INSNS (41), /* int_div_di */ 874 1, /* branch_cost */ 875 4 /* memory_latency */ 876 }, 877 { /* 24KF2_1 */ 878 COSTS_N_INSNS (8), /* fp_add */ 879 COSTS_N_INSNS (8), /* fp_mult_sf */ 880 COSTS_N_INSNS (10), /* fp_mult_df */ 881 COSTS_N_INSNS (34), /* fp_div_sf */ 882 COSTS_N_INSNS (64), /* fp_div_df */ 883 COSTS_N_INSNS (5), /* int_mult_si */ 884 COSTS_N_INSNS (5), /* int_mult_di */ 885 COSTS_N_INSNS (41), /* int_div_si */ 886 COSTS_N_INSNS (41), /* int_div_di */ 887 1, /* branch_cost */ 888 4 /* memory_latency */ 889 }, 890 { /* 24KF1_1 */ 891 COSTS_N_INSNS (4), /* fp_add */ 892 COSTS_N_INSNS (4), /* fp_mult_sf */ 893 COSTS_N_INSNS (5), /* fp_mult_df */ 894 COSTS_N_INSNS (17), /* fp_div_sf */ 895 COSTS_N_INSNS (32), /* fp_div_df */ 896 COSTS_N_INSNS (5), /* int_mult_si */ 897 COSTS_N_INSNS (5), /* int_mult_di */ 898 COSTS_N_INSNS (41), /* int_div_si */ 899 COSTS_N_INSNS (41), /* int_div_di */ 900 1, /* branch_cost */ 901 4 /* memory_latency */ 902 }, 903 { /* 74KC */ 904 SOFT_FP_COSTS, 905 COSTS_N_INSNS (5), /* int_mult_si */ 906 COSTS_N_INSNS (5), /* int_mult_di */ 907 COSTS_N_INSNS (41), /* int_div_si */ 908 COSTS_N_INSNS (41), /* int_div_di */ 909 1, /* branch_cost */ 910 4 /* memory_latency */ 911 }, 912 { /* 74KF2_1 */ 913 COSTS_N_INSNS (8), /* fp_add */ 914 COSTS_N_INSNS (8), /* fp_mult_sf */ 915 COSTS_N_INSNS (10), /* fp_mult_df */ 916 COSTS_N_INSNS (34), /* fp_div_sf */ 917 COSTS_N_INSNS (64), /* fp_div_df */ 918 COSTS_N_INSNS (5), /* int_mult_si */ 919 COSTS_N_INSNS (5), /* int_mult_di */ 920 COSTS_N_INSNS (41), /* int_div_si */ 921 COSTS_N_INSNS (41), /* int_div_di */ 922 1, /* branch_cost */ 923 4 /* memory_latency */ 924 }, 925 { /* 74KF1_1 */ 926 COSTS_N_INSNS (4), /* fp_add */ 927 COSTS_N_INSNS (4), /* fp_mult_sf */ 928 COSTS_N_INSNS (5), /* fp_mult_df */ 929 COSTS_N_INSNS (17), /* fp_div_sf */ 930 COSTS_N_INSNS (32), /* fp_div_df */ 931 COSTS_N_INSNS (5), /* int_mult_si */ 932 COSTS_N_INSNS (5), /* int_mult_di */ 933 COSTS_N_INSNS (41), /* int_div_si */ 934 COSTS_N_INSNS (41), /* int_div_di */ 935 1, /* branch_cost */ 936 4 /* memory_latency */ 937 }, 938 { /* 74KF3_2 */ 939 COSTS_N_INSNS (6), /* fp_add */ 940 COSTS_N_INSNS (6), /* fp_mult_sf */ 941 COSTS_N_INSNS (7), /* fp_mult_df */ 942 COSTS_N_INSNS (25), /* fp_div_sf */ 943 COSTS_N_INSNS (48), /* fp_div_df */ 944 COSTS_N_INSNS (5), /* int_mult_si */ 945 COSTS_N_INSNS (5), /* int_mult_di */ 946 COSTS_N_INSNS (41), /* int_div_si */ 947 COSTS_N_INSNS (41), /* int_div_di */ 948 1, /* branch_cost */ 949 4 /* memory_latency */ 950 }, 951 { /* Loongson-2E */ 952 DEFAULT_COSTS 953 }, 954 { /* Loongson-2F */ 955 DEFAULT_COSTS 956 }, 957 { /* M4k */ 958 DEFAULT_COSTS 959 }, 960 /* Octeon */ 961 { 962 SOFT_FP_COSTS, 963 COSTS_N_INSNS (5), /* int_mult_si */ 964 COSTS_N_INSNS (5), /* int_mult_di */ 965 COSTS_N_INSNS (72), /* int_div_si */ 966 COSTS_N_INSNS (72), /* int_div_di */ 967 1, /* branch_cost */ 968 4 /* memory_latency */ 969 }, 970 { /* R3900 */ 971 COSTS_N_INSNS (2), /* fp_add */ 972 COSTS_N_INSNS (4), /* fp_mult_sf */ 973 COSTS_N_INSNS (5), /* fp_mult_df */ 974 COSTS_N_INSNS (12), /* fp_div_sf */ 975 COSTS_N_INSNS (19), /* fp_div_df */ 976 COSTS_N_INSNS (2), /* int_mult_si */ 977 COSTS_N_INSNS (2), /* int_mult_di */ 978 COSTS_N_INSNS (35), /* int_div_si */ 979 COSTS_N_INSNS (35), /* int_div_di */ 980 1, /* branch_cost */ 981 4 /* memory_latency */ 982 }, 983 { /* R6000 */ 984 COSTS_N_INSNS (3), /* fp_add */ 985 COSTS_N_INSNS (5), /* fp_mult_sf */ 986 COSTS_N_INSNS (6), /* fp_mult_df */ 987 COSTS_N_INSNS (15), /* fp_div_sf */ 988 COSTS_N_INSNS (16), /* fp_div_df */ 989 COSTS_N_INSNS (17), /* int_mult_si */ 990 COSTS_N_INSNS (17), /* int_mult_di */ 991 COSTS_N_INSNS (38), /* int_div_si */ 992 COSTS_N_INSNS (38), /* int_div_di */ 993 2, /* branch_cost */ 994 6 /* memory_latency */ 995 }, 996 { /* R4000 */ 997 COSTS_N_INSNS (6), /* fp_add */ 998 COSTS_N_INSNS (7), /* fp_mult_sf */ 999 COSTS_N_INSNS (8), /* fp_mult_df */ 1000 COSTS_N_INSNS (23), /* fp_div_sf */ 1001 COSTS_N_INSNS (36), /* fp_div_df */ 1002 COSTS_N_INSNS (10), /* int_mult_si */ 1003 COSTS_N_INSNS (10), /* int_mult_di */ 1004 COSTS_N_INSNS (69), /* int_div_si */ 1005 COSTS_N_INSNS (69), /* int_div_di */ 1006 2, /* branch_cost */ 1007 6 /* memory_latency */ 1008 }, 1009 { /* R4100 */ 1010 DEFAULT_COSTS 1011 }, 1012 { /* R4111 */ 1013 DEFAULT_COSTS 1014 }, 1015 { /* R4120 */ 1016 DEFAULT_COSTS 1017 }, 1018 { /* R4130 */ 1019 /* The only costs that appear to be updated here are 1020 integer multiplication. */ 1021 SOFT_FP_COSTS, 1022 COSTS_N_INSNS (4), /* int_mult_si */ 1023 COSTS_N_INSNS (6), /* int_mult_di */ 1024 COSTS_N_INSNS (69), /* int_div_si */ 1025 COSTS_N_INSNS (69), /* int_div_di */ 1026 1, /* branch_cost */ 1027 4 /* memory_latency */ 1028 }, 1029 { /* R4300 */ 1030 DEFAULT_COSTS 1031 }, 1032 { /* R4600 */ 1033 DEFAULT_COSTS 1034 }, 1035 { /* R4650 */ 1036 DEFAULT_COSTS 1037 }, 1038 { /* R5000 */ 1039 COSTS_N_INSNS (6), /* fp_add */ 1040 COSTS_N_INSNS (4), /* fp_mult_sf */ 1041 COSTS_N_INSNS (5), /* fp_mult_df */ 1042 COSTS_N_INSNS (23), /* fp_div_sf */ 1043 COSTS_N_INSNS (36), /* fp_div_df */ 1044 COSTS_N_INSNS (5), /* int_mult_si */ 1045 COSTS_N_INSNS (5), /* int_mult_di */ 1046 COSTS_N_INSNS (36), /* int_div_si */ 1047 COSTS_N_INSNS (36), /* int_div_di */ 1048 1, /* branch_cost */ 1049 4 /* memory_latency */ 1050 }, 1051 { /* R5400 */ 1052 COSTS_N_INSNS (6), /* fp_add */ 1053 COSTS_N_INSNS (5), /* fp_mult_sf */ 1054 COSTS_N_INSNS (6), /* fp_mult_df */ 1055 COSTS_N_INSNS (30), /* fp_div_sf */ 1056 COSTS_N_INSNS (59), /* fp_div_df */ 1057 COSTS_N_INSNS (3), /* int_mult_si */ 1058 COSTS_N_INSNS (4), /* int_mult_di */ 1059 COSTS_N_INSNS (42), /* int_div_si */ 1060 COSTS_N_INSNS (74), /* int_div_di */ 1061 1, /* branch_cost */ 1062 4 /* memory_latency */ 1063 }, 1064 { /* R5500 */ 1065 COSTS_N_INSNS (6), /* fp_add */ 1066 COSTS_N_INSNS (5), /* fp_mult_sf */ 1067 COSTS_N_INSNS (6), /* fp_mult_df */ 1068 COSTS_N_INSNS (30), /* fp_div_sf */ 1069 COSTS_N_INSNS (59), /* fp_div_df */ 1070 COSTS_N_INSNS (5), /* int_mult_si */ 1071 COSTS_N_INSNS (9), /* int_mult_di */ 1072 COSTS_N_INSNS (42), /* int_div_si */ 1073 COSTS_N_INSNS (74), /* int_div_di */ 1074 1, /* branch_cost */ 1075 4 /* memory_latency */ 1076 }, 1077 { /* R7000 */ 1078 /* The only costs that are changed here are 1079 integer multiplication. */ 1080 COSTS_N_INSNS (6), /* fp_add */ 1081 COSTS_N_INSNS (7), /* fp_mult_sf */ 1082 COSTS_N_INSNS (8), /* fp_mult_df */ 1083 COSTS_N_INSNS (23), /* fp_div_sf */ 1084 COSTS_N_INSNS (36), /* fp_div_df */ 1085 COSTS_N_INSNS (5), /* int_mult_si */ 1086 COSTS_N_INSNS (9), /* int_mult_di */ 1087 COSTS_N_INSNS (69), /* int_div_si */ 1088 COSTS_N_INSNS (69), /* int_div_di */ 1089 1, /* branch_cost */ 1090 4 /* memory_latency */ 1091 }, 1092 { /* R8000 */ 1093 DEFAULT_COSTS 1094 }, 1095 { /* R9000 */ 1096 /* The only costs that are changed here are 1097 integer multiplication. */ 1098 COSTS_N_INSNS (6), /* fp_add */ 1099 COSTS_N_INSNS (7), /* fp_mult_sf */ 1100 COSTS_N_INSNS (8), /* fp_mult_df */ 1101 COSTS_N_INSNS (23), /* fp_div_sf */ 1102 COSTS_N_INSNS (36), /* fp_div_df */ 1103 COSTS_N_INSNS (3), /* int_mult_si */ 1104 COSTS_N_INSNS (8), /* int_mult_di */ 1105 COSTS_N_INSNS (69), /* int_div_si */ 1106 COSTS_N_INSNS (69), /* int_div_di */ 1107 1, /* branch_cost */ 1108 4 /* memory_latency */ 1109 }, 1110 { /* R1x000 */ 1111 COSTS_N_INSNS (2), /* fp_add */ 1112 COSTS_N_INSNS (2), /* fp_mult_sf */ 1113 COSTS_N_INSNS (2), /* fp_mult_df */ 1114 COSTS_N_INSNS (12), /* fp_div_sf */ 1115 COSTS_N_INSNS (19), /* fp_div_df */ 1116 COSTS_N_INSNS (5), /* int_mult_si */ 1117 COSTS_N_INSNS (9), /* int_mult_di */ 1118 COSTS_N_INSNS (34), /* int_div_si */ 1119 COSTS_N_INSNS (66), /* int_div_di */ 1120 1, /* branch_cost */ 1121 4 /* memory_latency */ 1122 }, 1123 { /* SB1 */ 1124 /* These costs are the same as the SB-1A below. */ 1125 COSTS_N_INSNS (4), /* fp_add */ 1126 COSTS_N_INSNS (4), /* fp_mult_sf */ 1127 COSTS_N_INSNS (4), /* fp_mult_df */ 1128 COSTS_N_INSNS (24), /* fp_div_sf */ 1129 COSTS_N_INSNS (32), /* fp_div_df */ 1130 COSTS_N_INSNS (3), /* int_mult_si */ 1131 COSTS_N_INSNS (4), /* int_mult_di */ 1132 COSTS_N_INSNS (36), /* int_div_si */ 1133 COSTS_N_INSNS (68), /* int_div_di */ 1134 1, /* branch_cost */ 1135 4 /* memory_latency */ 1136 }, 1137 { /* SB1-A */ 1138 /* These costs are the same as the SB-1 above. */ 1139 COSTS_N_INSNS (4), /* fp_add */ 1140 COSTS_N_INSNS (4), /* fp_mult_sf */ 1141 COSTS_N_INSNS (4), /* fp_mult_df */ 1142 COSTS_N_INSNS (24), /* fp_div_sf */ 1143 COSTS_N_INSNS (32), /* fp_div_df */ 1144 COSTS_N_INSNS (3), /* int_mult_si */ 1145 COSTS_N_INSNS (4), /* int_mult_di */ 1146 COSTS_N_INSNS (36), /* int_div_si */ 1147 COSTS_N_INSNS (68), /* int_div_di */ 1148 1, /* branch_cost */ 1149 4 /* memory_latency */ 1150 }, 1151 { /* SR71000 */ 1152 DEFAULT_COSTS 1153 }, 1154 { /* XLR */ 1155 SOFT_FP_COSTS, 1156 COSTS_N_INSNS (8), /* int_mult_si */ 1157 COSTS_N_INSNS (8), /* int_mult_di */ 1158 COSTS_N_INSNS (72), /* int_div_si */ 1159 COSTS_N_INSNS (72), /* int_div_di */ 1160 1, /* branch_cost */ 1161 4 /* memory_latency */ 1162 } 1163 }; 1164 1165 static rtx mips_find_pic_call_symbol (rtx, rtx, bool); 1166 1167 /* This hash table keeps track of implicit "mips16" and "nomips16" attributes 1168 for -mflip_mips16. It maps decl names onto a boolean mode setting. */ 1169 struct GTY (()) mflip_mips16_entry { 1170 const char *name; 1171 bool mips16_p; 1172 }; 1173 static GTY ((param_is (struct mflip_mips16_entry))) htab_t mflip_mips16_htab; 1174 1175 /* Hash table callbacks for mflip_mips16_htab. */ 1176 1177 static hashval_t 1178 mflip_mips16_htab_hash (const void *entry) 1179 { 1180 return htab_hash_string (((const struct mflip_mips16_entry *) entry)->name); 1181 } 1182 1183 static int 1184 mflip_mips16_htab_eq (const void *entry, const void *name) 1185 { 1186 return strcmp (((const struct mflip_mips16_entry *) entry)->name, 1187 (const char *) name) == 0; 1188 } 1189 1190 /* True if -mflip-mips16 should next add an attribute for the default MIPS16 1191 mode, false if it should next add an attribute for the opposite mode. */ 1192 static GTY(()) bool mips16_flipper; 1193 1194 /* DECL is a function that needs a default "mips16" or "nomips16" attribute 1195 for -mflip-mips16. Return true if it should use "mips16" and false if 1196 it should use "nomips16". */ 1197 1198 static bool 1199 mflip_mips16_use_mips16_p (tree decl) 1200 { 1201 struct mflip_mips16_entry *entry; 1202 const char *name; 1203 hashval_t hash; 1204 void **slot; 1205 1206 /* Use the opposite of the command-line setting for anonymous decls. */ 1207 if (!DECL_NAME (decl)) 1208 return !mips_base_mips16; 1209 1210 if (!mflip_mips16_htab) 1211 mflip_mips16_htab = htab_create_ggc (37, mflip_mips16_htab_hash, 1212 mflip_mips16_htab_eq, NULL); 1213 1214 name = IDENTIFIER_POINTER (DECL_NAME (decl)); 1215 hash = htab_hash_string (name); 1216 slot = htab_find_slot_with_hash (mflip_mips16_htab, name, hash, INSERT); 1217 entry = (struct mflip_mips16_entry *) *slot; 1218 if (!entry) 1219 { 1220 mips16_flipper = !mips16_flipper; 1221 entry = GGC_NEW (struct mflip_mips16_entry); 1222 entry->name = name; 1223 entry->mips16_p = mips16_flipper ? !mips_base_mips16 : mips_base_mips16; 1224 *slot = entry; 1225 } 1226 return entry->mips16_p; 1227 } 1228 1229 /* Predicates to test for presence of "near" and "far"/"long_call" 1230 attributes on the given TYPE. */ 1231 1232 static bool 1233 mips_near_type_p (const_tree type) 1234 { 1235 return lookup_attribute ("near", TYPE_ATTRIBUTES (type)) != NULL; 1236 } 1237 1238 static bool 1239 mips_far_type_p (const_tree type) 1240 { 1241 return (lookup_attribute ("long_call", TYPE_ATTRIBUTES (type)) != NULL 1242 || lookup_attribute ("far", TYPE_ATTRIBUTES (type)) != NULL); 1243 } 1244 1245 /* Similar predicates for "mips16"/"nomips16" function attributes. */ 1246 1247 static bool 1248 mips_mips16_decl_p (const_tree decl) 1249 { 1250 return lookup_attribute ("mips16", DECL_ATTRIBUTES (decl)) != NULL; 1251 } 1252 1253 static bool 1254 mips_nomips16_decl_p (const_tree decl) 1255 { 1256 return lookup_attribute ("nomips16", DECL_ATTRIBUTES (decl)) != NULL; 1257 } 1258 1259 /* Check if the interrupt attribute is set for a function. */ 1260 1261 static bool 1262 mips_interrupt_type_p (tree type) 1263 { 1264 return lookup_attribute ("interrupt", TYPE_ATTRIBUTES (type)) != NULL; 1265 } 1266 1267 /* Check if the attribute to use shadow register set is set for a function. */ 1268 1269 static bool 1270 mips_use_shadow_register_set_p (tree type) 1271 { 1272 return lookup_attribute ("use_shadow_register_set", 1273 TYPE_ATTRIBUTES (type)) != NULL; 1274 } 1275 1276 /* Check if the attribute to keep interrupts masked is set for a function. */ 1277 1278 static bool 1279 mips_keep_interrupts_masked_p (tree type) 1280 { 1281 return lookup_attribute ("keep_interrupts_masked", 1282 TYPE_ATTRIBUTES (type)) != NULL; 1283 } 1284 1285 /* Check if the attribute to use debug exception return is set for 1286 a function. */ 1287 1288 static bool 1289 mips_use_debug_exception_return_p (tree type) 1290 { 1291 return lookup_attribute ("use_debug_exception_return", 1292 TYPE_ATTRIBUTES (type)) != NULL; 1293 } 1294 1295 /* Return true if function DECL is a MIPS16 function. Return the ambient 1296 setting if DECL is null. */ 1297 1298 static bool 1299 mips_use_mips16_mode_p (tree decl) 1300 { 1301 if (decl) 1302 { 1303 /* Nested functions must use the same frame pointer as their 1304 parent and must therefore use the same ISA mode. */ 1305 tree parent = decl_function_context (decl); 1306 if (parent) 1307 decl = parent; 1308 if (mips_mips16_decl_p (decl)) 1309 return true; 1310 if (mips_nomips16_decl_p (decl)) 1311 return false; 1312 } 1313 return mips_base_mips16; 1314 } 1315 1316 /* Implement TARGET_COMP_TYPE_ATTRIBUTES. */ 1317 1318 static int 1319 mips_comp_type_attributes (const_tree type1, const_tree type2) 1320 { 1321 /* Disallow mixed near/far attributes. */ 1322 if (mips_far_type_p (type1) && mips_near_type_p (type2)) 1323 return 0; 1324 if (mips_near_type_p (type1) && mips_far_type_p (type2)) 1325 return 0; 1326 return 1; 1327 } 1328 1329 /* Implement TARGET_INSERT_ATTRIBUTES. */ 1330 1331 static void 1332 mips_insert_attributes (tree decl, tree *attributes) 1333 { 1334 const char *name; 1335 bool mips16_p, nomips16_p; 1336 1337 /* Check for "mips16" and "nomips16" attributes. */ 1338 mips16_p = lookup_attribute ("mips16", *attributes) != NULL; 1339 nomips16_p = lookup_attribute ("nomips16", *attributes) != NULL; 1340 if (TREE_CODE (decl) != FUNCTION_DECL) 1341 { 1342 if (mips16_p) 1343 error ("%qs attribute only applies to functions", "mips16"); 1344 if (nomips16_p) 1345 error ("%qs attribute only applies to functions", "nomips16"); 1346 } 1347 else 1348 { 1349 mips16_p |= mips_mips16_decl_p (decl); 1350 nomips16_p |= mips_nomips16_decl_p (decl); 1351 if (mips16_p || nomips16_p) 1352 { 1353 /* DECL cannot be simultaneously "mips16" and "nomips16". */ 1354 if (mips16_p && nomips16_p) 1355 error ("%qE cannot have both %<mips16%> and " 1356 "%<nomips16%> attributes", 1357 DECL_NAME (decl)); 1358 } 1359 else if (TARGET_FLIP_MIPS16 && !DECL_ARTIFICIAL (decl)) 1360 { 1361 /* Implement -mflip-mips16. If DECL has neither a "nomips16" nor a 1362 "mips16" attribute, arbitrarily pick one. We must pick the same 1363 setting for duplicate declarations of a function. */ 1364 name = mflip_mips16_use_mips16_p (decl) ? "mips16" : "nomips16"; 1365 *attributes = tree_cons (get_identifier (name), NULL, *attributes); 1366 } 1367 } 1368 } 1369 1370 /* Implement TARGET_MERGE_DECL_ATTRIBUTES. */ 1371 1372 static tree 1373 mips_merge_decl_attributes (tree olddecl, tree newdecl) 1374 { 1375 /* The decls' "mips16" and "nomips16" attributes must match exactly. */ 1376 if (mips_mips16_decl_p (olddecl) != mips_mips16_decl_p (newdecl)) 1377 error ("%qE redeclared with conflicting %qs attributes", 1378 DECL_NAME (newdecl), "mips16"); 1379 if (mips_nomips16_decl_p (olddecl) != mips_nomips16_decl_p (newdecl)) 1380 error ("%qE redeclared with conflicting %qs attributes", 1381 DECL_NAME (newdecl), "nomips16"); 1382 1383 return merge_attributes (DECL_ATTRIBUTES (olddecl), 1384 DECL_ATTRIBUTES (newdecl)); 1385 } 1386 1387 /* If X is a PLUS of a CONST_INT, return the two terms in *BASE_PTR 1388 and *OFFSET_PTR. Return X in *BASE_PTR and 0 in *OFFSET_PTR otherwise. */ 1389 1390 static void 1391 mips_split_plus (rtx x, rtx *base_ptr, HOST_WIDE_INT *offset_ptr) 1392 { 1393 if (GET_CODE (x) == PLUS && CONST_INT_P (XEXP (x, 1))) 1394 { 1395 *base_ptr = XEXP (x, 0); 1396 *offset_ptr = INTVAL (XEXP (x, 1)); 1397 } 1398 else 1399 { 1400 *base_ptr = x; 1401 *offset_ptr = 0; 1402 } 1403 } 1404 1405 static unsigned int mips_build_integer (struct mips_integer_op *, 1406 unsigned HOST_WIDE_INT); 1407 1408 /* A subroutine of mips_build_integer, with the same interface. 1409 Assume that the final action in the sequence should be a left shift. */ 1410 1411 static unsigned int 1412 mips_build_shift (struct mips_integer_op *codes, HOST_WIDE_INT value) 1413 { 1414 unsigned int i, shift; 1415 1416 /* Shift VALUE right until its lowest bit is set. Shift arithmetically 1417 since signed numbers are easier to load than unsigned ones. */ 1418 shift = 0; 1419 while ((value & 1) == 0) 1420 value /= 2, shift++; 1421 1422 i = mips_build_integer (codes, value); 1423 codes[i].code = ASHIFT; 1424 codes[i].value = shift; 1425 return i + 1; 1426 } 1427 1428 /* As for mips_build_shift, but assume that the final action will be 1429 an IOR or PLUS operation. */ 1430 1431 static unsigned int 1432 mips_build_lower (struct mips_integer_op *codes, unsigned HOST_WIDE_INT value) 1433 { 1434 unsigned HOST_WIDE_INT high; 1435 unsigned int i; 1436 1437 high = value & ~(unsigned HOST_WIDE_INT) 0xffff; 1438 if (!LUI_OPERAND (high) && (value & 0x18000) == 0x18000) 1439 { 1440 /* The constant is too complex to load with a simple LUI/ORI pair, 1441 so we want to give the recursive call as many trailing zeros as 1442 possible. In this case, we know bit 16 is set and that the 1443 low 16 bits form a negative number. If we subtract that number 1444 from VALUE, we will clear at least the lowest 17 bits, maybe more. */ 1445 i = mips_build_integer (codes, CONST_HIGH_PART (value)); 1446 codes[i].code = PLUS; 1447 codes[i].value = CONST_LOW_PART (value); 1448 } 1449 else 1450 { 1451 /* Either this is a simple LUI/ORI pair, or clearing the lowest 16 1452 bits gives a value with at least 17 trailing zeros. */ 1453 i = mips_build_integer (codes, high); 1454 codes[i].code = IOR; 1455 codes[i].value = value & 0xffff; 1456 } 1457 return i + 1; 1458 } 1459 1460 /* Fill CODES with a sequence of rtl operations to load VALUE. 1461 Return the number of operations needed. */ 1462 1463 static unsigned int 1464 mips_build_integer (struct mips_integer_op *codes, 1465 unsigned HOST_WIDE_INT value) 1466 { 1467 if (SMALL_OPERAND (value) 1468 || SMALL_OPERAND_UNSIGNED (value) 1469 || LUI_OPERAND (value)) 1470 { 1471 /* The value can be loaded with a single instruction. */ 1472 codes[0].code = UNKNOWN; 1473 codes[0].value = value; 1474 return 1; 1475 } 1476 else if ((value & 1) != 0 || LUI_OPERAND (CONST_HIGH_PART (value))) 1477 { 1478 /* Either the constant is a simple LUI/ORI combination or its 1479 lowest bit is set. We don't want to shift in this case. */ 1480 return mips_build_lower (codes, value); 1481 } 1482 else if ((value & 0xffff) == 0) 1483 { 1484 /* The constant will need at least three actions. The lowest 1485 16 bits are clear, so the final action will be a shift. */ 1486 return mips_build_shift (codes, value); 1487 } 1488 else 1489 { 1490 /* The final action could be a shift, add or inclusive OR. 1491 Rather than use a complex condition to select the best 1492 approach, try both mips_build_shift and mips_build_lower 1493 and pick the one that gives the shortest sequence. 1494 Note that this case is only used once per constant. */ 1495 struct mips_integer_op alt_codes[MIPS_MAX_INTEGER_OPS]; 1496 unsigned int cost, alt_cost; 1497 1498 cost = mips_build_shift (codes, value); 1499 alt_cost = mips_build_lower (alt_codes, value); 1500 if (alt_cost < cost) 1501 { 1502 memcpy (codes, alt_codes, alt_cost * sizeof (codes[0])); 1503 cost = alt_cost; 1504 } 1505 return cost; 1506 } 1507 } 1508 1509 /* Return true if symbols of type TYPE require a GOT access. */ 1510 1511 static bool 1512 mips_got_symbol_type_p (enum mips_symbol_type type) 1513 { 1514 switch (type) 1515 { 1516 case SYMBOL_GOT_PAGE_OFST: 1517 case SYMBOL_GOT_DISP: 1518 return true; 1519 1520 default: 1521 return false; 1522 } 1523 } 1524 1525 /* Return true if X is a thread-local symbol. */ 1526 1527 static bool 1528 mips_tls_symbol_p (rtx x) 1529 { 1530 return GET_CODE (x) == SYMBOL_REF && SYMBOL_REF_TLS_MODEL (x) != 0; 1531 } 1532 1533 /* Return true if SYMBOL_REF X is associated with a global symbol 1534 (in the STB_GLOBAL sense). */ 1535 1536 static bool 1537 mips_global_symbol_p (const_rtx x) 1538 { 1539 const_tree decl = SYMBOL_REF_DECL (x); 1540 1541 if (!decl) 1542 return !SYMBOL_REF_LOCAL_P (x) || SYMBOL_REF_EXTERNAL_P (x); 1543 1544 /* Weakref symbols are not TREE_PUBLIC, but their targets are global 1545 or weak symbols. Relocations in the object file will be against 1546 the target symbol, so it's that symbol's binding that matters here. */ 1547 return DECL_P (decl) && (TREE_PUBLIC (decl) || DECL_WEAK (decl)); 1548 } 1549 1550 /* Return true if function X is a libgcc MIPS16 stub function. */ 1551 1552 static bool 1553 mips16_stub_function_p (const_rtx x) 1554 { 1555 return (GET_CODE (x) == SYMBOL_REF 1556 && strncmp (XSTR (x, 0), "__mips16_", 9) == 0); 1557 } 1558 1559 /* Return true if function X is a locally-defined and locally-binding 1560 MIPS16 function. */ 1561 1562 static bool 1563 mips16_local_function_p (const_rtx x) 1564 { 1565 return (GET_CODE (x) == SYMBOL_REF 1566 && SYMBOL_REF_LOCAL_P (x) 1567 && !SYMBOL_REF_EXTERNAL_P (x) 1568 && mips_use_mips16_mode_p (SYMBOL_REF_DECL (x))); 1569 } 1570 1571 /* Return true if SYMBOL_REF X binds locally. */ 1572 1573 static bool 1574 mips_symbol_binds_local_p (const_rtx x) 1575 { 1576 return (SYMBOL_REF_DECL (x) 1577 ? targetm.binds_local_p (SYMBOL_REF_DECL (x)) 1578 : SYMBOL_REF_LOCAL_P (x)); 1579 } 1580 1581 /* Return true if rtx constants of mode MODE should be put into a small 1582 data section. */ 1583 1584 static bool 1585 mips_rtx_constant_in_small_data_p (enum machine_mode mode) 1586 { 1587 return (!TARGET_EMBEDDED_DATA 1588 && TARGET_LOCAL_SDATA 1589 && GET_MODE_SIZE (mode) <= mips_small_data_threshold); 1590 } 1591 1592 /* Return true if X should not be moved directly into register $25. 1593 We need this because many versions of GAS will treat "la $25,foo" as 1594 part of a call sequence and so allow a global "foo" to be lazily bound. */ 1595 1596 bool 1597 mips_dangerous_for_la25_p (rtx x) 1598 { 1599 return (!TARGET_EXPLICIT_RELOCS 1600 && TARGET_USE_GOT 1601 && GET_CODE (x) == SYMBOL_REF 1602 && mips_global_symbol_p (x)); 1603 } 1604 1605 /* Return true if calls to X might need $25 to be valid on entry. */ 1606 1607 bool 1608 mips_use_pic_fn_addr_reg_p (const_rtx x) 1609 { 1610 if (!TARGET_USE_PIC_FN_ADDR_REG) 1611 return false; 1612 1613 /* MIPS16 stub functions are guaranteed not to use $25. */ 1614 if (mips16_stub_function_p (x)) 1615 return false; 1616 1617 if (GET_CODE (x) == SYMBOL_REF) 1618 { 1619 /* If PLTs and copy relocations are available, the static linker 1620 will make sure that $25 is valid on entry to the target function. */ 1621 if (TARGET_ABICALLS_PIC0) 1622 return false; 1623 1624 /* Locally-defined functions use absolute accesses to set up 1625 the global pointer. */ 1626 if (TARGET_ABSOLUTE_ABICALLS 1627 && mips_symbol_binds_local_p (x) 1628 && !SYMBOL_REF_EXTERNAL_P (x)) 1629 return false; 1630 } 1631 1632 return true; 1633 } 1634 1635 /* Return the method that should be used to access SYMBOL_REF or 1636 LABEL_REF X in context CONTEXT. */ 1637 1638 static enum mips_symbol_type 1639 mips_classify_symbol (const_rtx x, enum mips_symbol_context context) 1640 { 1641 if (TARGET_RTP_PIC) 1642 return SYMBOL_GOT_DISP; 1643 1644 if (GET_CODE (x) == LABEL_REF) 1645 { 1646 /* LABEL_REFs are used for jump tables as well as text labels. 1647 Only return SYMBOL_PC_RELATIVE if we know the label is in 1648 the text section. */ 1649 if (TARGET_MIPS16_SHORT_JUMP_TABLES) 1650 return SYMBOL_PC_RELATIVE; 1651 1652 if (TARGET_ABICALLS && !TARGET_ABSOLUTE_ABICALLS) 1653 return SYMBOL_GOT_PAGE_OFST; 1654 1655 return SYMBOL_ABSOLUTE; 1656 } 1657 1658 gcc_assert (GET_CODE (x) == SYMBOL_REF); 1659 1660 if (SYMBOL_REF_TLS_MODEL (x)) 1661 return SYMBOL_TLS; 1662 1663 if (CONSTANT_POOL_ADDRESS_P (x)) 1664 { 1665 if (TARGET_MIPS16_TEXT_LOADS) 1666 return SYMBOL_PC_RELATIVE; 1667 1668 if (TARGET_MIPS16_PCREL_LOADS && context == SYMBOL_CONTEXT_MEM) 1669 return SYMBOL_PC_RELATIVE; 1670 1671 if (mips_rtx_constant_in_small_data_p (get_pool_mode (x))) 1672 return SYMBOL_GP_RELATIVE; 1673 } 1674 1675 /* Do not use small-data accesses for weak symbols; they may end up 1676 being zero. */ 1677 if (TARGET_GPOPT && SYMBOL_REF_SMALL_P (x) && !SYMBOL_REF_WEAK (x)) 1678 return SYMBOL_GP_RELATIVE; 1679 1680 /* Don't use GOT accesses for locally-binding symbols when -mno-shared 1681 is in effect. */ 1682 if (TARGET_ABICALLS_PIC2 1683 && !(TARGET_ABSOLUTE_ABICALLS && mips_symbol_binds_local_p (x))) 1684 { 1685 /* There are three cases to consider: 1686 1687 - o32 PIC (either with or without explicit relocs) 1688 - n32/n64 PIC without explicit relocs 1689 - n32/n64 PIC with explicit relocs 1690 1691 In the first case, both local and global accesses will use an 1692 R_MIPS_GOT16 relocation. We must correctly predict which of 1693 the two semantics (local or global) the assembler and linker 1694 will apply. The choice depends on the symbol's binding rather 1695 than its visibility. 1696 1697 In the second case, the assembler will not use R_MIPS_GOT16 1698 relocations, but it chooses between local and global accesses 1699 in the same way as for o32 PIC. 1700 1701 In the third case we have more freedom since both forms of 1702 access will work for any kind of symbol. However, there seems 1703 little point in doing things differently. */ 1704 if (mips_global_symbol_p (x)) 1705 return SYMBOL_GOT_DISP; 1706 1707 return SYMBOL_GOT_PAGE_OFST; 1708 } 1709 1710 if (TARGET_MIPS16_PCREL_LOADS && context != SYMBOL_CONTEXT_CALL) 1711 return SYMBOL_FORCE_TO_MEM; 1712 1713 return SYMBOL_ABSOLUTE; 1714 } 1715 1716 /* Classify the base of symbolic expression X, given that X appears in 1717 context CONTEXT. */ 1718 1719 static enum mips_symbol_type 1720 mips_classify_symbolic_expression (rtx x, enum mips_symbol_context context) 1721 { 1722 rtx offset; 1723 1724 split_const (x, &x, &offset); 1725 if (UNSPEC_ADDRESS_P (x)) 1726 return UNSPEC_ADDRESS_TYPE (x); 1727 1728 return mips_classify_symbol (x, context); 1729 } 1730 1731 /* Return true if OFFSET is within the range [0, ALIGN), where ALIGN 1732 is the alignment in bytes of SYMBOL_REF X. */ 1733 1734 static bool 1735 mips_offset_within_alignment_p (rtx x, HOST_WIDE_INT offset) 1736 { 1737 HOST_WIDE_INT align; 1738 1739 align = SYMBOL_REF_DECL (x) ? DECL_ALIGN_UNIT (SYMBOL_REF_DECL (x)) : 1; 1740 return IN_RANGE (offset, 0, align - 1); 1741 } 1742 1743 /* Return true if X is a symbolic constant that can be used in context 1744 CONTEXT. If it is, store the type of the symbol in *SYMBOL_TYPE. */ 1745 1746 bool 1747 mips_symbolic_constant_p (rtx x, enum mips_symbol_context context, 1748 enum mips_symbol_type *symbol_type) 1749 { 1750 rtx offset; 1751 1752 split_const (x, &x, &offset); 1753 if (UNSPEC_ADDRESS_P (x)) 1754 { 1755 *symbol_type = UNSPEC_ADDRESS_TYPE (x); 1756 x = UNSPEC_ADDRESS (x); 1757 } 1758 else if (GET_CODE (x) == SYMBOL_REF || GET_CODE (x) == LABEL_REF) 1759 { 1760 *symbol_type = mips_classify_symbol (x, context); 1761 if (*symbol_type == SYMBOL_TLS) 1762 return false; 1763 } 1764 else 1765 return false; 1766 1767 if (offset == const0_rtx) 1768 return true; 1769 1770 /* Check whether a nonzero offset is valid for the underlying 1771 relocations. */ 1772 switch (*symbol_type) 1773 { 1774 case SYMBOL_ABSOLUTE: 1775 case SYMBOL_FORCE_TO_MEM: 1776 case SYMBOL_32_HIGH: 1777 case SYMBOL_64_HIGH: 1778 case SYMBOL_64_MID: 1779 case SYMBOL_64_LOW: 1780 /* If the target has 64-bit pointers and the object file only 1781 supports 32-bit symbols, the values of those symbols will be 1782 sign-extended. In this case we can't allow an arbitrary offset 1783 in case the 32-bit value X + OFFSET has a different sign from X. */ 1784 if (Pmode == DImode && !ABI_HAS_64BIT_SYMBOLS) 1785 return offset_within_block_p (x, INTVAL (offset)); 1786 1787 /* In other cases the relocations can handle any offset. */ 1788 return true; 1789 1790 case SYMBOL_PC_RELATIVE: 1791 /* Allow constant pool references to be converted to LABEL+CONSTANT. 1792 In this case, we no longer have access to the underlying constant, 1793 but the original symbol-based access was known to be valid. */ 1794 if (GET_CODE (x) == LABEL_REF) 1795 return true; 1796 1797 /* Fall through. */ 1798 1799 case SYMBOL_GP_RELATIVE: 1800 /* Make sure that the offset refers to something within the 1801 same object block. This should guarantee that the final 1802 PC- or GP-relative offset is within the 16-bit limit. */ 1803 return offset_within_block_p (x, INTVAL (offset)); 1804 1805 case SYMBOL_GOT_PAGE_OFST: 1806 case SYMBOL_GOTOFF_PAGE: 1807 /* If the symbol is global, the GOT entry will contain the symbol's 1808 address, and we will apply a 16-bit offset after loading it. 1809 If the symbol is local, the linker should provide enough local 1810 GOT entries for a 16-bit offset, but larger offsets may lead 1811 to GOT overflow. */ 1812 return SMALL_INT (offset); 1813 1814 case SYMBOL_TPREL: 1815 case SYMBOL_DTPREL: 1816 /* There is no carry between the HI and LO REL relocations, so the 1817 offset is only valid if we know it won't lead to such a carry. */ 1818 return mips_offset_within_alignment_p (x, INTVAL (offset)); 1819 1820 case SYMBOL_GOT_DISP: 1821 case SYMBOL_GOTOFF_DISP: 1822 case SYMBOL_GOTOFF_CALL: 1823 case SYMBOL_GOTOFF_LOADGP: 1824 case SYMBOL_TLSGD: 1825 case SYMBOL_TLSLDM: 1826 case SYMBOL_GOTTPREL: 1827 case SYMBOL_TLS: 1828 case SYMBOL_HALF: 1829 return false; 1830 } 1831 gcc_unreachable (); 1832 } 1833 1834 /* Like mips_symbol_insns, but treat extended MIPS16 instructions as a 1835 single instruction. We rely on the fact that, in the worst case, 1836 all instructions involved in a MIPS16 address calculation are usually 1837 extended ones. */ 1838 1839 static int 1840 mips_symbol_insns_1 (enum mips_symbol_type type, enum machine_mode mode) 1841 { 1842 switch (type) 1843 { 1844 case SYMBOL_ABSOLUTE: 1845 /* When using 64-bit symbols, we need 5 preparatory instructions, 1846 such as: 1847 1848 lui $at,%highest(symbol) 1849 daddiu $at,$at,%higher(symbol) 1850 dsll $at,$at,16 1851 daddiu $at,$at,%hi(symbol) 1852 dsll $at,$at,16 1853 1854 The final address is then $at + %lo(symbol). With 32-bit 1855 symbols we just need a preparatory LUI for normal mode and 1856 a preparatory LI and SLL for MIPS16. */ 1857 return ABI_HAS_64BIT_SYMBOLS ? 6 : TARGET_MIPS16 ? 3 : 2; 1858 1859 case SYMBOL_GP_RELATIVE: 1860 /* Treat GP-relative accesses as taking a single instruction on 1861 MIPS16 too; the copy of $gp can often be shared. */ 1862 return 1; 1863 1864 case SYMBOL_PC_RELATIVE: 1865 /* PC-relative constants can be only be used with ADDIUPC, 1866 DADDIUPC, LWPC and LDPC. */ 1867 if (mode == MAX_MACHINE_MODE 1868 || GET_MODE_SIZE (mode) == 4 1869 || GET_MODE_SIZE (mode) == 8) 1870 return 1; 1871 1872 /* The constant must be loaded using ADDIUPC or DADDIUPC first. */ 1873 return 0; 1874 1875 case SYMBOL_FORCE_TO_MEM: 1876 /* LEAs will be converted into constant-pool references by 1877 mips_reorg. */ 1878 if (mode == MAX_MACHINE_MODE) 1879 return 1; 1880 1881 /* The constant must be loaded and then dereferenced. */ 1882 return 0; 1883 1884 case SYMBOL_GOT_DISP: 1885 /* The constant will have to be loaded from the GOT before it 1886 is used in an address. */ 1887 if (mode != MAX_MACHINE_MODE) 1888 return 0; 1889 1890 /* Fall through. */ 1891 1892 case SYMBOL_GOT_PAGE_OFST: 1893 /* Unless -funit-at-a-time is in effect, we can't be sure whether the 1894 local/global classification is accurate. The worst cases are: 1895 1896 (1) For local symbols when generating o32 or o64 code. The assembler 1897 will use: 1898 1899 lw $at,%got(symbol) 1900 nop 1901 1902 ...and the final address will be $at + %lo(symbol). 1903 1904 (2) For global symbols when -mxgot. The assembler will use: 1905 1906 lui $at,%got_hi(symbol) 1907 (d)addu $at,$at,$gp 1908 1909 ...and the final address will be $at + %got_lo(symbol). */ 1910 return 3; 1911 1912 case SYMBOL_GOTOFF_PAGE: 1913 case SYMBOL_GOTOFF_DISP: 1914 case SYMBOL_GOTOFF_CALL: 1915 case SYMBOL_GOTOFF_LOADGP: 1916 case SYMBOL_32_HIGH: 1917 case SYMBOL_64_HIGH: 1918 case SYMBOL_64_MID: 1919 case SYMBOL_64_LOW: 1920 case SYMBOL_TLSGD: 1921 case SYMBOL_TLSLDM: 1922 case SYMBOL_DTPREL: 1923 case SYMBOL_GOTTPREL: 1924 case SYMBOL_TPREL: 1925 case SYMBOL_HALF: 1926 /* A 16-bit constant formed by a single relocation, or a 32-bit 1927 constant formed from a high 16-bit relocation and a low 16-bit 1928 relocation. Use mips_split_p to determine which. 32-bit 1929 constants need an "lui; addiu" sequence for normal mode and 1930 an "li; sll; addiu" sequence for MIPS16 mode. */ 1931 return !mips_split_p[type] ? 1 : TARGET_MIPS16 ? 3 : 2; 1932 1933 case SYMBOL_TLS: 1934 /* We don't treat a bare TLS symbol as a constant. */ 1935 return 0; 1936 } 1937 gcc_unreachable (); 1938 } 1939 1940 /* If MODE is MAX_MACHINE_MODE, return the number of instructions needed 1941 to load symbols of type TYPE into a register. Return 0 if the given 1942 type of symbol cannot be used as an immediate operand. 1943 1944 Otherwise, return the number of instructions needed to load or store 1945 values of mode MODE to or from addresses of type TYPE. Return 0 if 1946 the given type of symbol is not valid in addresses. 1947 1948 In both cases, treat extended MIPS16 instructions as two instructions. */ 1949 1950 static int 1951 mips_symbol_insns (enum mips_symbol_type type, enum machine_mode mode) 1952 { 1953 return mips_symbol_insns_1 (type, mode) * (TARGET_MIPS16 ? 2 : 1); 1954 } 1955 1956 /* A for_each_rtx callback. Stop the search if *X references a 1957 thread-local symbol. */ 1958 1959 static int 1960 mips_tls_symbol_ref_1 (rtx *x, void *data ATTRIBUTE_UNUSED) 1961 { 1962 return mips_tls_symbol_p (*x); 1963 } 1964 1965 /* Implement TARGET_CANNOT_FORCE_CONST_MEM. */ 1966 1967 static bool 1968 mips_cannot_force_const_mem (rtx x) 1969 { 1970 enum mips_symbol_type type; 1971 rtx base, offset; 1972 1973 /* There is no assembler syntax for expressing an address-sized 1974 high part. */ 1975 if (GET_CODE (x) == HIGH) 1976 return true; 1977 1978 /* As an optimization, reject constants that mips_legitimize_move 1979 can expand inline. 1980 1981 Suppose we have a multi-instruction sequence that loads constant C 1982 into register R. If R does not get allocated a hard register, and 1983 R is used in an operand that allows both registers and memory 1984 references, reload will consider forcing C into memory and using 1985 one of the instruction's memory alternatives. Returning false 1986 here will force it to use an input reload instead. */ 1987 if (CONST_INT_P (x) && LEGITIMATE_CONSTANT_P (x)) 1988 return true; 1989 1990 split_const (x, &base, &offset); 1991 if (mips_symbolic_constant_p (base, SYMBOL_CONTEXT_LEA, &type) 1992 && type != SYMBOL_FORCE_TO_MEM) 1993 { 1994 /* The same optimization as for CONST_INT. */ 1995 if (SMALL_INT (offset) && mips_symbol_insns (type, MAX_MACHINE_MODE) > 0) 1996 return true; 1997 1998 /* If MIPS16 constant pools live in the text section, they should 1999 not refer to anything that might need run-time relocation. */ 2000 if (TARGET_MIPS16_PCREL_LOADS && mips_got_symbol_type_p (type)) 2001 return true; 2002 } 2003 2004 /* TLS symbols must be computed by mips_legitimize_move. */ 2005 if (for_each_rtx (&x, &mips_tls_symbol_ref_1, NULL)) 2006 return true; 2007 2008 return false; 2009 } 2010 2011 /* Implement TARGET_USE_BLOCKS_FOR_CONSTANT_P. We can't use blocks for 2012 constants when we're using a per-function constant pool. */ 2013 2014 static bool 2015 mips_use_blocks_for_constant_p (enum machine_mode mode ATTRIBUTE_UNUSED, 2016 const_rtx x ATTRIBUTE_UNUSED) 2017 { 2018 return !TARGET_MIPS16_PCREL_LOADS; 2019 } 2020 2021 /* Return true if register REGNO is a valid base register for mode MODE. 2022 STRICT_P is true if REG_OK_STRICT is in effect. */ 2023 2024 int 2025 mips_regno_mode_ok_for_base_p (int regno, enum machine_mode mode, 2026 bool strict_p) 2027 { 2028 if (!HARD_REGISTER_NUM_P (regno)) 2029 { 2030 if (!strict_p) 2031 return true; 2032 regno = reg_renumber[regno]; 2033 } 2034 2035 /* These fake registers will be eliminated to either the stack or 2036 hard frame pointer, both of which are usually valid base registers. 2037 Reload deals with the cases where the eliminated form isn't valid. */ 2038 if (regno == ARG_POINTER_REGNUM || regno == FRAME_POINTER_REGNUM) 2039 return true; 2040 2041 /* In MIPS16 mode, the stack pointer can only address word and doubleword 2042 values, nothing smaller. There are two problems here: 2043 2044 (a) Instantiating virtual registers can introduce new uses of the 2045 stack pointer. If these virtual registers are valid addresses, 2046 the stack pointer should be too. 2047 2048 (b) Most uses of the stack pointer are not made explicit until 2049 FRAME_POINTER_REGNUM and ARG_POINTER_REGNUM have been eliminated. 2050 We don't know until that stage whether we'll be eliminating to the 2051 stack pointer (which needs the restriction) or the hard frame 2052 pointer (which doesn't). 2053 2054 All in all, it seems more consistent to only enforce this restriction 2055 during and after reload. */ 2056 if (TARGET_MIPS16 && regno == STACK_POINTER_REGNUM) 2057 return !strict_p || GET_MODE_SIZE (mode) == 4 || GET_MODE_SIZE (mode) == 8; 2058 2059 return TARGET_MIPS16 ? M16_REG_P (regno) : GP_REG_P (regno); 2060 } 2061 2062 /* Return true if X is a valid base register for mode MODE. 2063 STRICT_P is true if REG_OK_STRICT is in effect. */ 2064 2065 static bool 2066 mips_valid_base_register_p (rtx x, enum machine_mode mode, bool strict_p) 2067 { 2068 if (!strict_p && GET_CODE (x) == SUBREG) 2069 x = SUBREG_REG (x); 2070 2071 return (REG_P (x) 2072 && mips_regno_mode_ok_for_base_p (REGNO (x), mode, strict_p)); 2073 } 2074 2075 /* Return true if, for every base register BASE_REG, (plus BASE_REG X) 2076 can address a value of mode MODE. */ 2077 2078 static bool 2079 mips_valid_offset_p (rtx x, enum machine_mode mode) 2080 { 2081 /* Check that X is a signed 16-bit number. */ 2082 if (!const_arith_operand (x, Pmode)) 2083 return false; 2084 2085 /* We may need to split multiword moves, so make sure that every word 2086 is accessible. */ 2087 if (GET_MODE_SIZE (mode) > UNITS_PER_WORD 2088 && !SMALL_OPERAND (INTVAL (x) + GET_MODE_SIZE (mode) - UNITS_PER_WORD)) 2089 return false; 2090 2091 return true; 2092 } 2093 2094 /* Return true if a LO_SUM can address a value of mode MODE when the 2095 LO_SUM symbol has type SYMBOL_TYPE. */ 2096 2097 static bool 2098 mips_valid_lo_sum_p (enum mips_symbol_type symbol_type, enum machine_mode mode) 2099 { 2100 /* Check that symbols of type SYMBOL_TYPE can be used to access values 2101 of mode MODE. */ 2102 if (mips_symbol_insns (symbol_type, mode) == 0) 2103 return false; 2104 2105 /* Check that there is a known low-part relocation. */ 2106 if (mips_lo_relocs[symbol_type] == NULL) 2107 return false; 2108 2109 /* We may need to split multiword moves, so make sure that each word 2110 can be accessed without inducing a carry. This is mainly needed 2111 for o64, which has historically only guaranteed 64-bit alignment 2112 for 128-bit types. */ 2113 if (GET_MODE_SIZE (mode) > UNITS_PER_WORD 2114 && GET_MODE_BITSIZE (mode) > GET_MODE_ALIGNMENT (mode)) 2115 return false; 2116 2117 return true; 2118 } 2119 2120 /* Return true if X is a valid address for machine mode MODE. If it is, 2121 fill in INFO appropriately. STRICT_P is true if REG_OK_STRICT is in 2122 effect. */ 2123 2124 static bool 2125 mips_classify_address (struct mips_address_info *info, rtx x, 2126 enum machine_mode mode, bool strict_p) 2127 { 2128 switch (GET_CODE (x)) 2129 { 2130 case REG: 2131 case SUBREG: 2132 info->type = ADDRESS_REG; 2133 info->reg = x; 2134 info->offset = const0_rtx; 2135 return mips_valid_base_register_p (info->reg, mode, strict_p); 2136 2137 case PLUS: 2138 info->type = ADDRESS_REG; 2139 info->reg = XEXP (x, 0); 2140 info->offset = XEXP (x, 1); 2141 return (mips_valid_base_register_p (info->reg, mode, strict_p) 2142 && mips_valid_offset_p (info->offset, mode)); 2143 2144 case LO_SUM: 2145 info->type = ADDRESS_LO_SUM; 2146 info->reg = XEXP (x, 0); 2147 info->offset = XEXP (x, 1); 2148 /* We have to trust the creator of the LO_SUM to do something vaguely 2149 sane. Target-independent code that creates a LO_SUM should also 2150 create and verify the matching HIGH. Target-independent code that 2151 adds an offset to a LO_SUM must prove that the offset will not 2152 induce a carry. Failure to do either of these things would be 2153 a bug, and we are not required to check for it here. The MIPS 2154 backend itself should only create LO_SUMs for valid symbolic 2155 constants, with the high part being either a HIGH or a copy 2156 of _gp. */ 2157 info->symbol_type 2158 = mips_classify_symbolic_expression (info->offset, SYMBOL_CONTEXT_MEM); 2159 return (mips_valid_base_register_p (info->reg, mode, strict_p) 2160 && mips_valid_lo_sum_p (info->symbol_type, mode)); 2161 2162 case CONST_INT: 2163 /* Small-integer addresses don't occur very often, but they 2164 are legitimate if $0 is a valid base register. */ 2165 info->type = ADDRESS_CONST_INT; 2166 return !TARGET_MIPS16 && SMALL_INT (x); 2167 2168 case CONST: 2169 case LABEL_REF: 2170 case SYMBOL_REF: 2171 info->type = ADDRESS_SYMBOLIC; 2172 return (mips_symbolic_constant_p (x, SYMBOL_CONTEXT_MEM, 2173 &info->symbol_type) 2174 && mips_symbol_insns (info->symbol_type, mode) > 0 2175 && !mips_split_p[info->symbol_type]); 2176 2177 default: 2178 return false; 2179 } 2180 } 2181 2182 /* Implement TARGET_LEGITIMATE_ADDRESS_P. */ 2183 2184 static bool 2185 mips_legitimate_address_p (enum machine_mode mode, rtx x, bool strict_p) 2186 { 2187 struct mips_address_info addr; 2188 2189 return mips_classify_address (&addr, x, mode, strict_p); 2190 } 2191 2192 /* Return true if X is a legitimate $sp-based address for mode MDOE. */ 2193 2194 bool 2195 mips_stack_address_p (rtx x, enum machine_mode mode) 2196 { 2197 struct mips_address_info addr; 2198 2199 return (mips_classify_address (&addr, x, mode, false) 2200 && addr.type == ADDRESS_REG 2201 && addr.reg == stack_pointer_rtx); 2202 } 2203 2204 /* Return true if ADDR matches the pattern for the LWXS load scaled indexed 2205 address instruction. Note that such addresses are not considered 2206 legitimate in the TARGET_LEGITIMATE_ADDRESS_P sense, because their use 2207 is so restricted. */ 2208 2209 static bool 2210 mips_lwxs_address_p (rtx addr) 2211 { 2212 if (ISA_HAS_LWXS 2213 && GET_CODE (addr) == PLUS 2214 && REG_P (XEXP (addr, 1))) 2215 { 2216 rtx offset = XEXP (addr, 0); 2217 if (GET_CODE (offset) == MULT 2218 && REG_P (XEXP (offset, 0)) 2219 && CONST_INT_P (XEXP (offset, 1)) 2220 && INTVAL (XEXP (offset, 1)) == 4) 2221 return true; 2222 } 2223 return false; 2224 } 2225 2226 /* Return true if a value at OFFSET bytes from base register BASE can be 2227 accessed using an unextended MIPS16 instruction. MODE is the mode of 2228 the value. 2229 2230 Usually the offset in an unextended instruction is a 5-bit field. 2231 The offset is unsigned and shifted left once for LH and SH, twice 2232 for LW and SW, and so on. An exception is LWSP and SWSP, which have 2233 an 8-bit immediate field that's shifted left twice. */ 2234 2235 static bool 2236 mips16_unextended_reference_p (enum machine_mode mode, rtx base, 2237 unsigned HOST_WIDE_INT offset) 2238 { 2239 if (offset % GET_MODE_SIZE (mode) == 0) 2240 { 2241 if (GET_MODE_SIZE (mode) == 4 && base == stack_pointer_rtx) 2242 return offset < 256U * GET_MODE_SIZE (mode); 2243 return offset < 32U * GET_MODE_SIZE (mode); 2244 } 2245 return false; 2246 } 2247 2248 /* Return the number of instructions needed to load or store a value 2249 of mode MODE at address X. Return 0 if X isn't valid for MODE. 2250 Assume that multiword moves may need to be split into word moves 2251 if MIGHT_SPLIT_P, otherwise assume that a single load or store is 2252 enough. 2253 2254 For MIPS16 code, count extended instructions as two instructions. */ 2255 2256 int 2257 mips_address_insns (rtx x, enum machine_mode mode, bool might_split_p) 2258 { 2259 struct mips_address_info addr; 2260 int factor; 2261 2262 /* BLKmode is used for single unaligned loads and stores and should 2263 not count as a multiword mode. (GET_MODE_SIZE (BLKmode) is pretty 2264 meaningless, so we have to single it out as a special case one way 2265 or the other.) */ 2266 if (mode != BLKmode && might_split_p) 2267 factor = (GET_MODE_SIZE (mode) + UNITS_PER_WORD - 1) / UNITS_PER_WORD; 2268 else 2269 factor = 1; 2270 2271 if (mips_classify_address (&addr, x, mode, false)) 2272 switch (addr.type) 2273 { 2274 case ADDRESS_REG: 2275 if (TARGET_MIPS16 2276 && !mips16_unextended_reference_p (mode, addr.reg, 2277 UINTVAL (addr.offset))) 2278 return factor * 2; 2279 return factor; 2280 2281 case ADDRESS_LO_SUM: 2282 return TARGET_MIPS16 ? factor * 2 : factor; 2283 2284 case ADDRESS_CONST_INT: 2285 return factor; 2286 2287 case ADDRESS_SYMBOLIC: 2288 return factor * mips_symbol_insns (addr.symbol_type, mode); 2289 } 2290 return 0; 2291 } 2292 2293 /* Return the number of instructions needed to load constant X. 2294 Return 0 if X isn't a valid constant. */ 2295 2296 int 2297 mips_const_insns (rtx x) 2298 { 2299 struct mips_integer_op codes[MIPS_MAX_INTEGER_OPS]; 2300 enum mips_symbol_type symbol_type; 2301 rtx offset; 2302 2303 switch (GET_CODE (x)) 2304 { 2305 case HIGH: 2306 if (!mips_symbolic_constant_p (XEXP (x, 0), SYMBOL_CONTEXT_LEA, 2307 &symbol_type) 2308 || !mips_split_p[symbol_type]) 2309 return 0; 2310 2311 /* This is simply an LUI for normal mode. It is an extended 2312 LI followed by an extended SLL for MIPS16. */ 2313 return TARGET_MIPS16 ? 4 : 1; 2314 2315 case CONST_INT: 2316 if (TARGET_MIPS16) 2317 /* Unsigned 8-bit constants can be loaded using an unextended 2318 LI instruction. Unsigned 16-bit constants can be loaded 2319 using an extended LI. Negative constants must be loaded 2320 using LI and then negated. */ 2321 return (IN_RANGE (INTVAL (x), 0, 255) ? 1 2322 : SMALL_OPERAND_UNSIGNED (INTVAL (x)) ? 2 2323 : IN_RANGE (-INTVAL (x), 0, 255) ? 2 2324 : SMALL_OPERAND_UNSIGNED (-INTVAL (x)) ? 3 2325 : 0); 2326 2327 return mips_build_integer (codes, INTVAL (x)); 2328 2329 case CONST_DOUBLE: 2330 case CONST_VECTOR: 2331 /* Allow zeros for normal mode, where we can use $0. */ 2332 return !TARGET_MIPS16 && x == CONST0_RTX (GET_MODE (x)) ? 1 : 0; 2333 2334 case CONST: 2335 if (CONST_GP_P (x)) 2336 return 1; 2337 2338 /* See if we can refer to X directly. */ 2339 if (mips_symbolic_constant_p (x, SYMBOL_CONTEXT_LEA, &symbol_type)) 2340 return mips_symbol_insns (symbol_type, MAX_MACHINE_MODE); 2341 2342 /* Otherwise try splitting the constant into a base and offset. 2343 If the offset is a 16-bit value, we can load the base address 2344 into a register and then use (D)ADDIU to add in the offset. 2345 If the offset is larger, we can load the base and offset 2346 into separate registers and add them together with (D)ADDU. 2347 However, the latter is only possible before reload; during 2348 and after reload, we must have the option of forcing the 2349 constant into the pool instead. */ 2350 split_const (x, &x, &offset); 2351 if (offset != 0) 2352 { 2353 int n = mips_const_insns (x); 2354 if (n != 0) 2355 { 2356 if (SMALL_INT (offset)) 2357 return n + 1; 2358 else if (!targetm.cannot_force_const_mem (x)) 2359 return n + 1 + mips_build_integer (codes, INTVAL (offset)); 2360 } 2361 } 2362 return 0; 2363 2364 case SYMBOL_REF: 2365 case LABEL_REF: 2366 return mips_symbol_insns (mips_classify_symbol (x, SYMBOL_CONTEXT_LEA), 2367 MAX_MACHINE_MODE); 2368 2369 default: 2370 return 0; 2371 } 2372 } 2373 2374 /* X is a doubleword constant that can be handled by splitting it into 2375 two words and loading each word separately. Return the number of 2376 instructions required to do this. */ 2377 2378 int 2379 mips_split_const_insns (rtx x) 2380 { 2381 unsigned int low, high; 2382 2383 low = mips_const_insns (mips_subword (x, false)); 2384 high = mips_const_insns (mips_subword (x, true)); 2385 gcc_assert (low > 0 && high > 0); 2386 return low + high; 2387 } 2388 2389 /* Return the number of instructions needed to implement INSN, 2390 given that it loads from or stores to MEM. Count extended 2391 MIPS16 instructions as two instructions. */ 2392 2393 int 2394 mips_load_store_insns (rtx mem, rtx insn) 2395 { 2396 enum machine_mode mode; 2397 bool might_split_p; 2398 rtx set; 2399 2400 gcc_assert (MEM_P (mem)); 2401 mode = GET_MODE (mem); 2402 2403 /* Try to prove that INSN does not need to be split. */ 2404 might_split_p = true; 2405 if (GET_MODE_BITSIZE (mode) == 64) 2406 { 2407 set = single_set (insn); 2408 if (set && !mips_split_64bit_move_p (SET_DEST (set), SET_SRC (set))) 2409 might_split_p = false; 2410 } 2411 2412 return mips_address_insns (XEXP (mem, 0), mode, might_split_p); 2413 } 2414 2415 /* Return the number of instructions needed for an integer division. */ 2416 2417 int 2418 mips_idiv_insns (void) 2419 { 2420 int count; 2421 2422 count = 1; 2423 if (TARGET_CHECK_ZERO_DIV) 2424 { 2425 if (GENERATE_DIVIDE_TRAPS) 2426 count++; 2427 else 2428 count += 2; 2429 } 2430 2431 if (TARGET_FIX_R4000 || TARGET_FIX_R4400) 2432 count++; 2433 return count; 2434 } 2435 2436 /* Emit a move from SRC to DEST. Assume that the move expanders can 2437 handle all moves if !can_create_pseudo_p (). The distinction is 2438 important because, unlike emit_move_insn, the move expanders know 2439 how to force Pmode objects into the constant pool even when the 2440 constant pool address is not itself legitimate. */ 2441 2442 rtx 2443 mips_emit_move (rtx dest, rtx src) 2444 { 2445 return (can_create_pseudo_p () 2446 ? emit_move_insn (dest, src) 2447 : emit_move_insn_1 (dest, src)); 2448 } 2449 2450 /* Emit an instruction of the form (set TARGET (CODE OP0)). */ 2451 2452 static void 2453 mips_emit_unary (enum rtx_code code, rtx target, rtx op0) 2454 { 2455 emit_insn (gen_rtx_SET (VOIDmode, target, 2456 gen_rtx_fmt_e (code, GET_MODE (op0), op0))); 2457 } 2458 2459 /* Compute (CODE OP0) and store the result in a new register of mode MODE. 2460 Return that new register. */ 2461 2462 static rtx 2463 mips_force_unary (enum machine_mode mode, enum rtx_code code, rtx op0) 2464 { 2465 rtx reg; 2466 2467 reg = gen_reg_rtx (mode); 2468 mips_emit_unary (code, reg, op0); 2469 return reg; 2470 } 2471 2472 /* Emit an instruction of the form (set TARGET (CODE OP0 OP1)). */ 2473 2474 static void 2475 mips_emit_binary (enum rtx_code code, rtx target, rtx op0, rtx op1) 2476 { 2477 emit_insn (gen_rtx_SET (VOIDmode, target, 2478 gen_rtx_fmt_ee (code, GET_MODE (target), op0, op1))); 2479 } 2480 2481 /* Compute (CODE OP0 OP1) and store the result in a new register 2482 of mode MODE. Return that new register. */ 2483 2484 static rtx 2485 mips_force_binary (enum machine_mode mode, enum rtx_code code, rtx op0, rtx op1) 2486 { 2487 rtx reg; 2488 2489 reg = gen_reg_rtx (mode); 2490 mips_emit_binary (code, reg, op0, op1); 2491 return reg; 2492 } 2493 2494 /* Copy VALUE to a register and return that register. If new pseudos 2495 are allowed, copy it into a new register, otherwise use DEST. */ 2496 2497 static rtx 2498 mips_force_temporary (rtx dest, rtx value) 2499 { 2500 if (can_create_pseudo_p ()) 2501 return force_reg (Pmode, value); 2502 else 2503 { 2504 mips_emit_move (dest, value); 2505 return dest; 2506 } 2507 } 2508 2509 /* Emit a call sequence with call pattern PATTERN and return the call 2510 instruction itself (which is not necessarily the last instruction 2511 emitted). ORIG_ADDR is the original, unlegitimized address, 2512 ADDR is the legitimized form, and LAZY_P is true if the call 2513 address is lazily-bound. */ 2514 2515 static rtx 2516 mips_emit_call_insn (rtx pattern, rtx orig_addr, rtx addr, bool lazy_p) 2517 { 2518 rtx insn, reg; 2519 2520 insn = emit_call_insn (pattern); 2521 2522 if (TARGET_MIPS16 && mips_use_pic_fn_addr_reg_p (orig_addr)) 2523 { 2524 /* MIPS16 JALRs only take MIPS16 registers. If the target 2525 function requires $25 to be valid on entry, we must copy it 2526 there separately. The move instruction can be put in the 2527 call's delay slot. */ 2528 reg = gen_rtx_REG (Pmode, PIC_FUNCTION_ADDR_REGNUM); 2529 emit_insn_before (gen_move_insn (reg, addr), insn); 2530 use_reg (&CALL_INSN_FUNCTION_USAGE (insn), reg); 2531 } 2532 2533 if (lazy_p) 2534 /* Lazy-binding stubs require $gp to be valid on entry. */ 2535 use_reg (&CALL_INSN_FUNCTION_USAGE (insn), pic_offset_table_rtx); 2536 2537 if (TARGET_USE_GOT) 2538 { 2539 /* See the comment above load_call<mode> for details. */ 2540 use_reg (&CALL_INSN_FUNCTION_USAGE (insn), 2541 gen_rtx_REG (Pmode, GOT_VERSION_REGNUM)); 2542 emit_insn (gen_update_got_version ()); 2543 } 2544 return insn; 2545 } 2546 2547 /* Wrap symbol or label BASE in an UNSPEC address of type SYMBOL_TYPE, 2548 then add CONST_INT OFFSET to the result. */ 2549 2550 static rtx 2551 mips_unspec_address_offset (rtx base, rtx offset, 2552 enum mips_symbol_type symbol_type) 2553 { 2554 base = gen_rtx_UNSPEC (Pmode, gen_rtvec (1, base), 2555 UNSPEC_ADDRESS_FIRST + symbol_type); 2556 if (offset != const0_rtx) 2557 base = gen_rtx_PLUS (Pmode, base, offset); 2558 return gen_rtx_CONST (Pmode, base); 2559 } 2560 2561 /* Return an UNSPEC address with underlying address ADDRESS and symbol 2562 type SYMBOL_TYPE. */ 2563 2564 rtx 2565 mips_unspec_address (rtx address, enum mips_symbol_type symbol_type) 2566 { 2567 rtx base, offset; 2568 2569 split_const (address, &base, &offset); 2570 return mips_unspec_address_offset (base, offset, symbol_type); 2571 } 2572 2573 /* If OP is an UNSPEC address, return the address to which it refers, 2574 otherwise return OP itself. */ 2575 2576 static rtx 2577 mips_strip_unspec_address (rtx op) 2578 { 2579 rtx base, offset; 2580 2581 split_const (op, &base, &offset); 2582 if (UNSPEC_ADDRESS_P (base)) 2583 op = plus_constant (UNSPEC_ADDRESS (base), INTVAL (offset)); 2584 return op; 2585 } 2586 2587 /* If mips_unspec_address (ADDR, SYMBOL_TYPE) is a 32-bit value, add the 2588 high part to BASE and return the result. Just return BASE otherwise. 2589 TEMP is as for mips_force_temporary. 2590 2591 The returned expression can be used as the first operand to a LO_SUM. */ 2592 2593 static rtx 2594 mips_unspec_offset_high (rtx temp, rtx base, rtx addr, 2595 enum mips_symbol_type symbol_type) 2596 { 2597 if (mips_split_p[symbol_type]) 2598 { 2599 addr = gen_rtx_HIGH (Pmode, mips_unspec_address (addr, symbol_type)); 2600 addr = mips_force_temporary (temp, addr); 2601 base = mips_force_temporary (temp, gen_rtx_PLUS (Pmode, addr, base)); 2602 } 2603 return base; 2604 } 2605 2606 /* Return an instruction that copies $gp into register REG. We want 2607 GCC to treat the register's value as constant, so that its value 2608 can be rematerialized on demand. */ 2609 2610 static rtx 2611 gen_load_const_gp (rtx reg) 2612 { 2613 return (Pmode == SImode 2614 ? gen_load_const_gp_si (reg) 2615 : gen_load_const_gp_di (reg)); 2616 } 2617 2618 /* Return a pseudo register that contains the value of $gp throughout 2619 the current function. Such registers are needed by MIPS16 functions, 2620 for which $gp itself is not a valid base register or addition operand. */ 2621 2622 static rtx 2623 mips16_gp_pseudo_reg (void) 2624 { 2625 if (cfun->machine->mips16_gp_pseudo_rtx == NULL_RTX) 2626 cfun->machine->mips16_gp_pseudo_rtx = gen_reg_rtx (Pmode); 2627 2628 /* Don't emit an instruction to initialize the pseudo register if 2629 we are being called from the tree optimizers' cost-calculation 2630 routines. */ 2631 if (!cfun->machine->initialized_mips16_gp_pseudo_p 2632 && (current_ir_type () != IR_GIMPLE || currently_expanding_to_rtl)) 2633 { 2634 rtx insn, scan; 2635 2636 push_topmost_sequence (); 2637 2638 scan = get_insns (); 2639 while (NEXT_INSN (scan) && !INSN_P (NEXT_INSN (scan))) 2640 scan = NEXT_INSN (scan); 2641 2642 insn = gen_load_const_gp (cfun->machine->mips16_gp_pseudo_rtx); 2643 emit_insn_after (insn, scan); 2644 2645 pop_topmost_sequence (); 2646 2647 cfun->machine->initialized_mips16_gp_pseudo_p = true; 2648 } 2649 2650 return cfun->machine->mips16_gp_pseudo_rtx; 2651 } 2652 2653 /* Return a base register that holds pic_offset_table_rtx. 2654 TEMP, if nonnull, is a scratch Pmode base register. */ 2655 2656 rtx 2657 mips_pic_base_register (rtx temp) 2658 { 2659 if (!TARGET_MIPS16) 2660 return pic_offset_table_rtx; 2661 2662 if (can_create_pseudo_p ()) 2663 return mips16_gp_pseudo_reg (); 2664 2665 if (TARGET_USE_GOT) 2666 /* The first post-reload split exposes all references to $gp 2667 (both uses and definitions). All references must remain 2668 explicit after that point. 2669 2670 It is safe to introduce uses of $gp at any time, so for 2671 simplicity, we do that before the split too. */ 2672 mips_emit_move (temp, pic_offset_table_rtx); 2673 else 2674 emit_insn (gen_load_const_gp (temp)); 2675 return temp; 2676 } 2677 2678 /* Return the RHS of a load_call<mode> insn. */ 2679 2680 static rtx 2681 mips_unspec_call (rtx reg, rtx symbol) 2682 { 2683 rtvec vec; 2684 2685 vec = gen_rtvec (3, reg, symbol, gen_rtx_REG (SImode, GOT_VERSION_REGNUM)); 2686 return gen_rtx_UNSPEC (Pmode, vec, UNSPEC_LOAD_CALL); 2687 } 2688 2689 /* If SRC is the RHS of a load_call<mode> insn, return the underlying symbol 2690 reference. Return NULL_RTX otherwise. */ 2691 2692 static rtx 2693 mips_strip_unspec_call (rtx src) 2694 { 2695 if (GET_CODE (src) == UNSPEC && XINT (src, 1) == UNSPEC_LOAD_CALL) 2696 return mips_strip_unspec_address (XVECEXP (src, 0, 1)); 2697 return NULL_RTX; 2698 } 2699 2700 /* Create and return a GOT reference of type TYPE for address ADDR. 2701 TEMP, if nonnull, is a scratch Pmode base register. */ 2702 2703 rtx 2704 mips_got_load (rtx temp, rtx addr, enum mips_symbol_type type) 2705 { 2706 rtx base, high, lo_sum_symbol; 2707 2708 base = mips_pic_base_register (temp); 2709 2710 /* If we used the temporary register to load $gp, we can't use 2711 it for the high part as well. */ 2712 if (temp != NULL && reg_overlap_mentioned_p (base, temp)) 2713 temp = NULL; 2714 2715 high = mips_unspec_offset_high (temp, base, addr, type); 2716 lo_sum_symbol = mips_unspec_address (addr, type); 2717 2718 if (type == SYMBOL_GOTOFF_CALL) 2719 return mips_unspec_call (high, lo_sum_symbol); 2720 else 2721 return (Pmode == SImode 2722 ? gen_unspec_gotsi (high, lo_sum_symbol) 2723 : gen_unspec_gotdi (high, lo_sum_symbol)); 2724 } 2725 2726 /* If MODE is MAX_MACHINE_MODE, ADDR appears as a move operand, otherwise 2727 it appears in a MEM of that mode. Return true if ADDR is a legitimate 2728 constant in that context and can be split into high and low parts. 2729 If so, and if LOW_OUT is nonnull, emit the high part and store the 2730 low part in *LOW_OUT. Leave *LOW_OUT unchanged otherwise. 2731 2732 TEMP is as for mips_force_temporary and is used to load the high 2733 part into a register. 2734 2735 When MODE is MAX_MACHINE_MODE, the low part is guaranteed to be 2736 a legitimize SET_SRC for an .md pattern, otherwise the low part 2737 is guaranteed to be a legitimate address for mode MODE. */ 2738 2739 bool 2740 mips_split_symbol (rtx temp, rtx addr, enum machine_mode mode, rtx *low_out) 2741 { 2742 enum mips_symbol_context context; 2743 enum mips_symbol_type symbol_type; 2744 rtx high; 2745 2746 context = (mode == MAX_MACHINE_MODE 2747 ? SYMBOL_CONTEXT_LEA 2748 : SYMBOL_CONTEXT_MEM); 2749 if (GET_CODE (addr) == HIGH && context == SYMBOL_CONTEXT_LEA) 2750 { 2751 addr = XEXP (addr, 0); 2752 if (mips_symbolic_constant_p (addr, context, &symbol_type) 2753 && mips_symbol_insns (symbol_type, mode) > 0 2754 && mips_split_hi_p[symbol_type]) 2755 { 2756 if (low_out) 2757 switch (symbol_type) 2758 { 2759 case SYMBOL_GOT_PAGE_OFST: 2760 /* The high part of a page/ofst pair is loaded from the GOT. */ 2761 *low_out = mips_got_load (temp, addr, SYMBOL_GOTOFF_PAGE); 2762 break; 2763 2764 default: 2765 gcc_unreachable (); 2766 } 2767 return true; 2768 } 2769 } 2770 else 2771 { 2772 if (mips_symbolic_constant_p (addr, context, &symbol_type) 2773 && mips_symbol_insns (symbol_type, mode) > 0 2774 && mips_split_p[symbol_type]) 2775 { 2776 if (low_out) 2777 switch (symbol_type) 2778 { 2779 case SYMBOL_GOT_DISP: 2780 /* SYMBOL_GOT_DISP symbols are loaded from the GOT. */ 2781 *low_out = mips_got_load (temp, addr, SYMBOL_GOTOFF_DISP); 2782 break; 2783 2784 case SYMBOL_GP_RELATIVE: 2785 high = mips_pic_base_register (temp); 2786 *low_out = gen_rtx_LO_SUM (Pmode, high, addr); 2787 break; 2788 2789 default: 2790 high = gen_rtx_HIGH (Pmode, copy_rtx (addr)); 2791 high = mips_force_temporary (temp, high); 2792 *low_out = gen_rtx_LO_SUM (Pmode, high, addr); 2793 break; 2794 } 2795 return true; 2796 } 2797 } 2798 return false; 2799 } 2800 2801 /* Return a legitimate address for REG + OFFSET. TEMP is as for 2802 mips_force_temporary; it is only needed when OFFSET is not a 2803 SMALL_OPERAND. */ 2804 2805 static rtx 2806 mips_add_offset (rtx temp, rtx reg, HOST_WIDE_INT offset) 2807 { 2808 if (!SMALL_OPERAND (offset)) 2809 { 2810 rtx high; 2811 2812 if (TARGET_MIPS16) 2813 { 2814 /* Load the full offset into a register so that we can use 2815 an unextended instruction for the address itself. */ 2816 high = GEN_INT (offset); 2817 offset = 0; 2818 } 2819 else 2820 { 2821 /* Leave OFFSET as a 16-bit offset and put the excess in HIGH. 2822 The addition inside the macro CONST_HIGH_PART may cause an 2823 overflow, so we need to force a sign-extension check. */ 2824 high = gen_int_mode (CONST_HIGH_PART (offset), Pmode); 2825 offset = CONST_LOW_PART (offset); 2826 } 2827 high = mips_force_temporary (temp, high); 2828 reg = mips_force_temporary (temp, gen_rtx_PLUS (Pmode, high, reg)); 2829 } 2830 return plus_constant (reg, offset); 2831 } 2832 2833 /* The __tls_get_attr symbol. */ 2834 static GTY(()) rtx mips_tls_symbol; 2835 2836 /* Return an instruction sequence that calls __tls_get_addr. SYM is 2837 the TLS symbol we are referencing and TYPE is the symbol type to use 2838 (either global dynamic or local dynamic). V0 is an RTX for the 2839 return value location. */ 2840 2841 static rtx 2842 mips_call_tls_get_addr (rtx sym, enum mips_symbol_type type, rtx v0) 2843 { 2844 rtx insn, loc, a0; 2845 2846 a0 = gen_rtx_REG (Pmode, GP_ARG_FIRST); 2847 2848 if (!mips_tls_symbol) 2849 mips_tls_symbol = init_one_libfunc ("__tls_get_addr"); 2850 2851 loc = mips_unspec_address (sym, type); 2852 2853 start_sequence (); 2854 2855 emit_insn (gen_rtx_SET (Pmode, a0, 2856 gen_rtx_LO_SUM (Pmode, pic_offset_table_rtx, loc))); 2857 insn = mips_expand_call (MIPS_CALL_NORMAL, v0, mips_tls_symbol, 2858 const0_rtx, NULL_RTX, false); 2859 RTL_CONST_CALL_P (insn) = 1; 2860 use_reg (&CALL_INSN_FUNCTION_USAGE (insn), a0); 2861 insn = get_insns (); 2862 2863 end_sequence (); 2864 2865 return insn; 2866 } 2867 2868 /* Return a pseudo register that contains the current thread pointer. */ 2869 2870 static rtx 2871 mips_get_tp (void) 2872 { 2873 rtx tp; 2874 2875 tp = gen_reg_rtx (Pmode); 2876 if (Pmode == DImode) 2877 emit_insn (gen_tls_get_tp_di (tp)); 2878 else 2879 emit_insn (gen_tls_get_tp_si (tp)); 2880 return tp; 2881 } 2882 2883 /* Generate the code to access LOC, a thread-local SYMBOL_REF, and return 2884 its address. The return value will be both a valid address and a valid 2885 SET_SRC (either a REG or a LO_SUM). */ 2886 2887 static rtx 2888 mips_legitimize_tls_address (rtx loc) 2889 { 2890 rtx dest, insn, v0, tp, tmp1, tmp2, eqv; 2891 enum tls_model model; 2892 2893 if (TARGET_MIPS16) 2894 { 2895 sorry ("MIPS16 TLS"); 2896 return gen_reg_rtx (Pmode); 2897 } 2898 2899 model = SYMBOL_REF_TLS_MODEL (loc); 2900 /* Only TARGET_ABICALLS code can have more than one module; other 2901 code must be be static and should not use a GOT. All TLS models 2902 reduce to local exec in this situation. */ 2903 if (!TARGET_ABICALLS) 2904 model = TLS_MODEL_LOCAL_EXEC; 2905 2906 switch (model) 2907 { 2908 case TLS_MODEL_GLOBAL_DYNAMIC: 2909 v0 = gen_rtx_REG (Pmode, GP_RETURN); 2910 insn = mips_call_tls_get_addr (loc, SYMBOL_TLSGD, v0); 2911 dest = gen_reg_rtx (Pmode); 2912 emit_libcall_block (insn, dest, v0, loc); 2913 break; 2914 2915 case TLS_MODEL_LOCAL_DYNAMIC: 2916 v0 = gen_rtx_REG (Pmode, GP_RETURN); 2917 insn = mips_call_tls_get_addr (loc, SYMBOL_TLSLDM, v0); 2918 tmp1 = gen_reg_rtx (Pmode); 2919 2920 /* Attach a unique REG_EQUIV, to allow the RTL optimizers to 2921 share the LDM result with other LD model accesses. */ 2922 eqv = gen_rtx_UNSPEC (Pmode, gen_rtvec (1, const0_rtx), 2923 UNSPEC_TLS_LDM); 2924 emit_libcall_block (insn, tmp1, v0, eqv); 2925 2926 tmp2 = mips_unspec_offset_high (NULL, tmp1, loc, SYMBOL_DTPREL); 2927 dest = gen_rtx_LO_SUM (Pmode, tmp2, 2928 mips_unspec_address (loc, SYMBOL_DTPREL)); 2929 break; 2930 2931 case TLS_MODEL_INITIAL_EXEC: 2932 tp = mips_get_tp (); 2933 tmp1 = gen_reg_rtx (Pmode); 2934 tmp2 = mips_unspec_address (loc, SYMBOL_GOTTPREL); 2935 if (Pmode == DImode) 2936 emit_insn (gen_load_gotdi (tmp1, pic_offset_table_rtx, tmp2)); 2937 else 2938 emit_insn (gen_load_gotsi (tmp1, pic_offset_table_rtx, tmp2)); 2939 dest = gen_reg_rtx (Pmode); 2940 emit_insn (gen_add3_insn (dest, tmp1, tp)); 2941 break; 2942 2943 case TLS_MODEL_LOCAL_EXEC: 2944 tp = mips_get_tp (); 2945 tmp1 = mips_unspec_offset_high (NULL, tp, loc, SYMBOL_TPREL); 2946 dest = gen_rtx_LO_SUM (Pmode, tmp1, 2947 mips_unspec_address (loc, SYMBOL_TPREL)); 2948 break; 2949 2950 default: 2951 gcc_unreachable (); 2952 } 2953 return dest; 2954 } 2955 2956 /* If X is not a valid address for mode MODE, force it into a register. */ 2957 2958 static rtx 2959 mips_force_address (rtx x, enum machine_mode mode) 2960 { 2961 if (!mips_legitimate_address_p (mode, x, false)) 2962 x = force_reg (Pmode, x); 2963 return x; 2964 } 2965 2966 /* This function is used to implement LEGITIMIZE_ADDRESS. If X can 2967 be legitimized in a way that the generic machinery might not expect, 2968 return a new address, otherwise return NULL. MODE is the mode of 2969 the memory being accessed. */ 2970 2971 static rtx 2972 mips_legitimize_address (rtx x, rtx oldx ATTRIBUTE_UNUSED, 2973 enum machine_mode mode) 2974 { 2975 rtx base, addr; 2976 HOST_WIDE_INT offset; 2977 2978 if (mips_tls_symbol_p (x)) 2979 return mips_legitimize_tls_address (x); 2980 2981 /* See if the address can split into a high part and a LO_SUM. */ 2982 if (mips_split_symbol (NULL, x, mode, &addr)) 2983 return mips_force_address (addr, mode); 2984 2985 /* Handle BASE + OFFSET using mips_add_offset. */ 2986 mips_split_plus (x, &base, &offset); 2987 if (offset != 0) 2988 { 2989 if (!mips_valid_base_register_p (base, mode, false)) 2990 base = copy_to_mode_reg (Pmode, base); 2991 addr = mips_add_offset (NULL, base, offset); 2992 return mips_force_address (addr, mode); 2993 } 2994 2995 return x; 2996 } 2997 2998 /* Load VALUE into DEST. TEMP is as for mips_force_temporary. */ 2999 3000 void 3001 mips_move_integer (rtx temp, rtx dest, unsigned HOST_WIDE_INT value) 3002 { 3003 struct mips_integer_op codes[MIPS_MAX_INTEGER_OPS]; 3004 enum machine_mode mode; 3005 unsigned int i, num_ops; 3006 rtx x; 3007 3008 mode = GET_MODE (dest); 3009 num_ops = mips_build_integer (codes, value); 3010 3011 /* Apply each binary operation to X. Invariant: X is a legitimate 3012 source operand for a SET pattern. */ 3013 x = GEN_INT (codes[0].value); 3014 for (i = 1; i < num_ops; i++) 3015 { 3016 if (!can_create_pseudo_p ()) 3017 { 3018 emit_insn (gen_rtx_SET (VOIDmode, temp, x)); 3019 x = temp; 3020 } 3021 else 3022 x = force_reg (mode, x); 3023 x = gen_rtx_fmt_ee (codes[i].code, mode, x, GEN_INT (codes[i].value)); 3024 } 3025 3026 emit_insn (gen_rtx_SET (VOIDmode, dest, x)); 3027 } 3028 3029 /* Subroutine of mips_legitimize_move. Move constant SRC into register 3030 DEST given that SRC satisfies immediate_operand but doesn't satisfy 3031 move_operand. */ 3032 3033 static void 3034 mips_legitimize_const_move (enum machine_mode mode, rtx dest, rtx src) 3035 { 3036 rtx base, offset; 3037 3038 /* Split moves of big integers into smaller pieces. */ 3039 if (splittable_const_int_operand (src, mode)) 3040 { 3041 mips_move_integer (dest, dest, INTVAL (src)); 3042 return; 3043 } 3044 3045 /* Split moves of symbolic constants into high/low pairs. */ 3046 if (mips_split_symbol (dest, src, MAX_MACHINE_MODE, &src)) 3047 { 3048 emit_insn (gen_rtx_SET (VOIDmode, dest, src)); 3049 return; 3050 } 3051 3052 /* Generate the appropriate access sequences for TLS symbols. */ 3053 if (mips_tls_symbol_p (src)) 3054 { 3055 mips_emit_move (dest, mips_legitimize_tls_address (src)); 3056 return; 3057 } 3058 3059 /* If we have (const (plus symbol offset)), and that expression cannot 3060 be forced into memory, load the symbol first and add in the offset. 3061 In non-MIPS16 mode, prefer to do this even if the constant _can_ be 3062 forced into memory, as it usually produces better code. */ 3063 split_const (src, &base, &offset); 3064 if (offset != const0_rtx 3065 && (targetm.cannot_force_const_mem (src) 3066 || (!TARGET_MIPS16 && can_create_pseudo_p ()))) 3067 { 3068 base = mips_force_temporary (dest, base); 3069 mips_emit_move (dest, mips_add_offset (NULL, base, INTVAL (offset))); 3070 return; 3071 } 3072 3073 src = force_const_mem (mode, src); 3074 3075 /* When using explicit relocs, constant pool references are sometimes 3076 not legitimate addresses. */ 3077 mips_split_symbol (dest, XEXP (src, 0), mode, &XEXP (src, 0)); 3078 mips_emit_move (dest, src); 3079 } 3080 3081 /* If (set DEST SRC) is not a valid move instruction, emit an equivalent 3082 sequence that is valid. */ 3083 3084 bool 3085 mips_legitimize_move (enum machine_mode mode, rtx dest, rtx src) 3086 { 3087 if (!register_operand (dest, mode) && !reg_or_0_operand (src, mode)) 3088 { 3089 mips_emit_move (dest, force_reg (mode, src)); 3090 return true; 3091 } 3092 3093 /* We need to deal with constants that would be legitimate 3094 immediate_operands but aren't legitimate move_operands. */ 3095 if (CONSTANT_P (src) && !move_operand (src, mode)) 3096 { 3097 mips_legitimize_const_move (mode, dest, src); 3098 set_unique_reg_note (get_last_insn (), REG_EQUAL, copy_rtx (src)); 3099 return true; 3100 } 3101 return false; 3102 } 3103 3104 /* Return true if value X in context CONTEXT is a small-data address 3105 that can be rewritten as a LO_SUM. */ 3106 3107 static bool 3108 mips_rewrite_small_data_p (rtx x, enum mips_symbol_context context) 3109 { 3110 enum mips_symbol_type symbol_type; 3111 3112 return (mips_lo_relocs[SYMBOL_GP_RELATIVE] 3113 && !mips_split_p[SYMBOL_GP_RELATIVE] 3114 && mips_symbolic_constant_p (x, context, &symbol_type) 3115 && symbol_type == SYMBOL_GP_RELATIVE); 3116 } 3117 3118 /* A for_each_rtx callback for mips_small_data_pattern_p. DATA is the 3119 containing MEM, or null if none. */ 3120 3121 static int 3122 mips_small_data_pattern_1 (rtx *loc, void *data) 3123 { 3124 enum mips_symbol_context context; 3125 3126 if (GET_CODE (*loc) == LO_SUM) 3127 return -1; 3128 3129 if (MEM_P (*loc)) 3130 { 3131 if (for_each_rtx (&XEXP (*loc, 0), mips_small_data_pattern_1, *loc)) 3132 return 1; 3133 return -1; 3134 } 3135 3136 context = data ? SYMBOL_CONTEXT_MEM : SYMBOL_CONTEXT_LEA; 3137 return mips_rewrite_small_data_p (*loc, context); 3138 } 3139 3140 /* Return true if OP refers to small data symbols directly, not through 3141 a LO_SUM. */ 3142 3143 bool 3144 mips_small_data_pattern_p (rtx op) 3145 { 3146 return for_each_rtx (&op, mips_small_data_pattern_1, NULL); 3147 } 3148 3149 /* A for_each_rtx callback, used by mips_rewrite_small_data. 3150 DATA is the containing MEM, or null if none. */ 3151 3152 static int 3153 mips_rewrite_small_data_1 (rtx *loc, void *data) 3154 { 3155 enum mips_symbol_context context; 3156 3157 if (MEM_P (*loc)) 3158 { 3159 for_each_rtx (&XEXP (*loc, 0), mips_rewrite_small_data_1, *loc); 3160 return -1; 3161 } 3162 3163 context = data ? SYMBOL_CONTEXT_MEM : SYMBOL_CONTEXT_LEA; 3164 if (mips_rewrite_small_data_p (*loc, context)) 3165 *loc = gen_rtx_LO_SUM (Pmode, pic_offset_table_rtx, *loc); 3166 3167 if (GET_CODE (*loc) == LO_SUM) 3168 return -1; 3169 3170 return 0; 3171 } 3172 3173 /* Rewrite instruction pattern PATTERN so that it refers to small data 3174 using explicit relocations. */ 3175 3176 rtx 3177 mips_rewrite_small_data (rtx pattern) 3178 { 3179 pattern = copy_insn (pattern); 3180 for_each_rtx (&pattern, mips_rewrite_small_data_1, NULL); 3181 return pattern; 3182 } 3183 3184 /* We need a lot of little routines to check the range of MIPS16 immediate 3185 operands. */ 3186 3187 static int 3188 m16_check_op (rtx op, int low, int high, int mask) 3189 { 3190 return (CONST_INT_P (op) 3191 && IN_RANGE (INTVAL (op), low, high) 3192 && (INTVAL (op) & mask) == 0); 3193 } 3194 3195 int 3196 m16_uimm3_b (rtx op, enum machine_mode mode ATTRIBUTE_UNUSED) 3197 { 3198 return m16_check_op (op, 0x1, 0x8, 0); 3199 } 3200 3201 int 3202 m16_simm4_1 (rtx op, enum machine_mode mode ATTRIBUTE_UNUSED) 3203 { 3204 return m16_check_op (op, -0x8, 0x7, 0); 3205 } 3206 3207 int 3208 m16_nsimm4_1 (rtx op, enum machine_mode mode ATTRIBUTE_UNUSED) 3209 { 3210 return m16_check_op (op, -0x7, 0x8, 0); 3211 } 3212 3213 int 3214 m16_simm5_1 (rtx op, enum machine_mode mode ATTRIBUTE_UNUSED) 3215 { 3216 return m16_check_op (op, -0x10, 0xf, 0); 3217 } 3218 3219 int 3220 m16_nsimm5_1 (rtx op, enum machine_mode mode ATTRIBUTE_UNUSED) 3221 { 3222 return m16_check_op (op, -0xf, 0x10, 0); 3223 } 3224 3225 int 3226 m16_uimm5_4 (rtx op, enum machine_mode mode ATTRIBUTE_UNUSED) 3227 { 3228 return m16_check_op (op, -0x10 << 2, 0xf << 2, 3); 3229 } 3230 3231 int 3232 m16_nuimm5_4 (rtx op, enum machine_mode mode ATTRIBUTE_UNUSED) 3233 { 3234 return m16_check_op (op, -0xf << 2, 0x10 << 2, 3); 3235 } 3236 3237 int 3238 m16_simm8_1 (rtx op, enum machine_mode mode ATTRIBUTE_UNUSED) 3239 { 3240 return m16_check_op (op, -0x80, 0x7f, 0); 3241 } 3242 3243 int 3244 m16_nsimm8_1 (rtx op, enum machine_mode mode ATTRIBUTE_UNUSED) 3245 { 3246 return m16_check_op (op, -0x7f, 0x80, 0); 3247 } 3248 3249 int 3250 m16_uimm8_1 (rtx op, enum machine_mode mode ATTRIBUTE_UNUSED) 3251 { 3252 return m16_check_op (op, 0x0, 0xff, 0); 3253 } 3254 3255 int 3256 m16_nuimm8_1 (rtx op, enum machine_mode mode ATTRIBUTE_UNUSED) 3257 { 3258 return m16_check_op (op, -0xff, 0x0, 0); 3259 } 3260 3261 int 3262 m16_uimm8_m1_1 (rtx op, enum machine_mode mode ATTRIBUTE_UNUSED) 3263 { 3264 return m16_check_op (op, -0x1, 0xfe, 0); 3265 } 3266 3267 int 3268 m16_uimm8_4 (rtx op, enum machine_mode mode ATTRIBUTE_UNUSED) 3269 { 3270 return m16_check_op (op, 0x0, 0xff << 2, 3); 3271 } 3272 3273 int 3274 m16_nuimm8_4 (rtx op, enum machine_mode mode ATTRIBUTE_UNUSED) 3275 { 3276 return m16_check_op (op, -0xff << 2, 0x0, 3); 3277 } 3278 3279 int 3280 m16_simm8_8 (rtx op, enum machine_mode mode ATTRIBUTE_UNUSED) 3281 { 3282 return m16_check_op (op, -0x80 << 3, 0x7f << 3, 7); 3283 } 3284 3285 int 3286 m16_nsimm8_8 (rtx op, enum machine_mode mode ATTRIBUTE_UNUSED) 3287 { 3288 return m16_check_op (op, -0x7f << 3, 0x80 << 3, 7); 3289 } 3290 3291 /* The cost of loading values from the constant pool. It should be 3292 larger than the cost of any constant we want to synthesize inline. */ 3293 #define CONSTANT_POOL_COST COSTS_N_INSNS (TARGET_MIPS16 ? 4 : 8) 3294 3295 /* Return the cost of X when used as an operand to the MIPS16 instruction 3296 that implements CODE. Return -1 if there is no such instruction, or if 3297 X is not a valid immediate operand for it. */ 3298 3299 static int 3300 mips16_constant_cost (int code, HOST_WIDE_INT x) 3301 { 3302 switch (code) 3303 { 3304 case ASHIFT: 3305 case ASHIFTRT: 3306 case LSHIFTRT: 3307 /* Shifts by between 1 and 8 bits (inclusive) are unextended, 3308 other shifts are extended. The shift patterns truncate the shift 3309 count to the right size, so there are no out-of-range values. */ 3310 if (IN_RANGE (x, 1, 8)) 3311 return 0; 3312 return COSTS_N_INSNS (1); 3313 3314 case PLUS: 3315 if (IN_RANGE (x, -128, 127)) 3316 return 0; 3317 if (SMALL_OPERAND (x)) 3318 return COSTS_N_INSNS (1); 3319 return -1; 3320 3321 case LEU: 3322 /* Like LE, but reject the always-true case. */ 3323 if (x == -1) 3324 return -1; 3325 case LE: 3326 /* We add 1 to the immediate and use SLT. */ 3327 x += 1; 3328 case XOR: 3329 /* We can use CMPI for an xor with an unsigned 16-bit X. */ 3330 case LT: 3331 case LTU: 3332 if (IN_RANGE (x, 0, 255)) 3333 return 0; 3334 if (SMALL_OPERAND_UNSIGNED (x)) 3335 return COSTS_N_INSNS (1); 3336 return -1; 3337 3338 case EQ: 3339 case NE: 3340 /* Equality comparisons with 0 are cheap. */ 3341 if (x == 0) 3342 return 0; 3343 return -1; 3344 3345 default: 3346 return -1; 3347 } 3348 } 3349 3350 /* Return true if there is a non-MIPS16 instruction that implements CODE 3351 and if that instruction accepts X as an immediate operand. */ 3352 3353 static int 3354 mips_immediate_operand_p (int code, HOST_WIDE_INT x) 3355 { 3356 switch (code) 3357 { 3358 case ASHIFT: 3359 case ASHIFTRT: 3360 case LSHIFTRT: 3361 /* All shift counts are truncated to a valid constant. */ 3362 return true; 3363 3364 case ROTATE: 3365 case ROTATERT: 3366 /* Likewise rotates, if the target supports rotates at all. */ 3367 return ISA_HAS_ROR; 3368 3369 case AND: 3370 case IOR: 3371 case XOR: 3372 /* These instructions take 16-bit unsigned immediates. */ 3373 return SMALL_OPERAND_UNSIGNED (x); 3374 3375 case PLUS: 3376 case LT: 3377 case LTU: 3378 /* These instructions take 16-bit signed immediates. */ 3379 return SMALL_OPERAND (x); 3380 3381 case EQ: 3382 case NE: 3383 case GT: 3384 case GTU: 3385 /* The "immediate" forms of these instructions are really 3386 implemented as comparisons with register 0. */ 3387 return x == 0; 3388 3389 case GE: 3390 case GEU: 3391 /* Likewise, meaning that the only valid immediate operand is 1. */ 3392 return x == 1; 3393 3394 case LE: 3395 /* We add 1 to the immediate and use SLT. */ 3396 return SMALL_OPERAND (x + 1); 3397 3398 case LEU: 3399 /* Likewise SLTU, but reject the always-true case. */ 3400 return SMALL_OPERAND (x + 1) && x + 1 != 0; 3401 3402 case SIGN_EXTRACT: 3403 case ZERO_EXTRACT: 3404 /* The bit position and size are immediate operands. */ 3405 return ISA_HAS_EXT_INS; 3406 3407 default: 3408 /* By default assume that $0 can be used for 0. */ 3409 return x == 0; 3410 } 3411 } 3412 3413 /* Return the cost of binary operation X, given that the instruction 3414 sequence for a word-sized or smaller operation has cost SINGLE_COST 3415 and that the sequence of a double-word operation has cost DOUBLE_COST. 3416 If SPEED is true, optimize for speed otherwise optimize for size. */ 3417 3418 static int 3419 mips_binary_cost (rtx x, int single_cost, int double_cost, bool speed) 3420 { 3421 int cost; 3422 3423 if (GET_MODE_SIZE (GET_MODE (x)) == UNITS_PER_WORD * 2) 3424 cost = double_cost; 3425 else 3426 cost = single_cost; 3427 return (cost 3428 + rtx_cost (XEXP (x, 0), SET, speed) 3429 + rtx_cost (XEXP (x, 1), GET_CODE (x), speed)); 3430 } 3431 3432 /* Return the cost of floating-point multiplications of mode MODE. */ 3433 3434 static int 3435 mips_fp_mult_cost (enum machine_mode mode) 3436 { 3437 return mode == DFmode ? mips_cost->fp_mult_df : mips_cost->fp_mult_sf; 3438 } 3439 3440 /* Return the cost of floating-point divisions of mode MODE. */ 3441 3442 static int 3443 mips_fp_div_cost (enum machine_mode mode) 3444 { 3445 return mode == DFmode ? mips_cost->fp_div_df : mips_cost->fp_div_sf; 3446 } 3447 3448 /* Return the cost of sign-extending OP to mode MODE, not including the 3449 cost of OP itself. */ 3450 3451 static int 3452 mips_sign_extend_cost (enum machine_mode mode, rtx op) 3453 { 3454 if (MEM_P (op)) 3455 /* Extended loads are as cheap as unextended ones. */ 3456 return 0; 3457 3458 if (TARGET_64BIT && mode == DImode && GET_MODE (op) == SImode) 3459 /* A sign extension from SImode to DImode in 64-bit mode is free. */ 3460 return 0; 3461 3462 if (ISA_HAS_SEB_SEH || GENERATE_MIPS16E) 3463 /* We can use SEB or SEH. */ 3464 return COSTS_N_INSNS (1); 3465 3466 /* We need to use a shift left and a shift right. */ 3467 return COSTS_N_INSNS (TARGET_MIPS16 ? 4 : 2); 3468 } 3469 3470 /* Return the cost of zero-extending OP to mode MODE, not including the 3471 cost of OP itself. */ 3472 3473 static int 3474 mips_zero_extend_cost (enum machine_mode mode, rtx op) 3475 { 3476 if (MEM_P (op)) 3477 /* Extended loads are as cheap as unextended ones. */ 3478 return 0; 3479 3480 if (TARGET_64BIT && mode == DImode && GET_MODE (op) == SImode) 3481 /* We need a shift left by 32 bits and a shift right by 32 bits. */ 3482 return COSTS_N_INSNS (TARGET_MIPS16 ? 4 : 2); 3483 3484 if (GENERATE_MIPS16E) 3485 /* We can use ZEB or ZEH. */ 3486 return COSTS_N_INSNS (1); 3487 3488 if (TARGET_MIPS16) 3489 /* We need to load 0xff or 0xffff into a register and use AND. */ 3490 return COSTS_N_INSNS (GET_MODE (op) == QImode ? 2 : 3); 3491 3492 /* We can use ANDI. */ 3493 return COSTS_N_INSNS (1); 3494 } 3495 3496 /* Implement TARGET_RTX_COSTS. */ 3497 3498 static bool 3499 mips_rtx_costs (rtx x, int code, int outer_code, int *total, bool speed) 3500 { 3501 enum machine_mode mode = GET_MODE (x); 3502 bool float_mode_p = FLOAT_MODE_P (mode); 3503 int cost; 3504 rtx addr; 3505 3506 /* The cost of a COMPARE is hard to define for MIPS. COMPAREs don't 3507 appear in the instruction stream, and the cost of a comparison is 3508 really the cost of the branch or scc condition. At the time of 3509 writing, GCC only uses an explicit outer COMPARE code when optabs 3510 is testing whether a constant is expensive enough to force into a 3511 register. We want optabs to pass such constants through the MIPS 3512 expanders instead, so make all constants very cheap here. */ 3513 if (outer_code == COMPARE) 3514 { 3515 gcc_assert (CONSTANT_P (x)); 3516 *total = 0; 3517 return true; 3518 } 3519 3520 switch (code) 3521 { 3522 case CONST_INT: 3523 /* Treat *clear_upper32-style ANDs as having zero cost in the 3524 second operand. The cost is entirely in the first operand. 3525 3526 ??? This is needed because we would otherwise try to CSE 3527 the constant operand. Although that's the right thing for 3528 instructions that continue to be a register operation throughout 3529 compilation, it is disastrous for instructions that could 3530 later be converted into a memory operation. */ 3531 if (TARGET_64BIT 3532 && outer_code == AND 3533 && UINTVAL (x) == 0xffffffff) 3534 { 3535 *total = 0; 3536 return true; 3537 } 3538 3539 if (TARGET_MIPS16) 3540 { 3541 cost = mips16_constant_cost (outer_code, INTVAL (x)); 3542 if (cost >= 0) 3543 { 3544 *total = cost; 3545 return true; 3546 } 3547 } 3548 else 3549 { 3550 /* When not optimizing for size, we care more about the cost 3551 of hot code, and hot code is often in a loop. If a constant 3552 operand needs to be forced into a register, we will often be 3553 able to hoist the constant load out of the loop, so the load 3554 should not contribute to the cost. */ 3555 if (speed || mips_immediate_operand_p (outer_code, INTVAL (x))) 3556 { 3557 *total = 0; 3558 return true; 3559 } 3560 } 3561 /* Fall through. */ 3562 3563 case CONST: 3564 case SYMBOL_REF: 3565 case LABEL_REF: 3566 case CONST_DOUBLE: 3567 if (force_to_mem_operand (x, VOIDmode)) 3568 { 3569 *total = COSTS_N_INSNS (1); 3570 return true; 3571 } 3572 cost = mips_const_insns (x); 3573 if (cost > 0) 3574 { 3575 /* If the constant is likely to be stored in a GPR, SETs of 3576 single-insn constants are as cheap as register sets; we 3577 never want to CSE them. 3578 3579 Don't reduce the cost of storing a floating-point zero in 3580 FPRs. If we have a zero in an FPR for other reasons, we 3581 can get better cfg-cleanup and delayed-branch results by 3582 using it consistently, rather than using $0 sometimes and 3583 an FPR at other times. Also, moves between floating-point 3584 registers are sometimes cheaper than (D)MTC1 $0. */ 3585 if (cost == 1 3586 && outer_code == SET 3587 && !(float_mode_p && TARGET_HARD_FLOAT)) 3588 cost = 0; 3589 /* When non-MIPS16 code loads a constant N>1 times, we rarely 3590 want to CSE the constant itself. It is usually better to 3591 have N copies of the last operation in the sequence and one 3592 shared copy of the other operations. (Note that this is 3593 not true for MIPS16 code, where the final operation in the 3594 sequence is often an extended instruction.) 3595 3596 Also, if we have a CONST_INT, we don't know whether it is 3597 for a word or doubleword operation, so we cannot rely on 3598 the result of mips_build_integer. */ 3599 else if (!TARGET_MIPS16 3600 && (outer_code == SET || mode == VOIDmode)) 3601 cost = 1; 3602 *total = COSTS_N_INSNS (cost); 3603 return true; 3604 } 3605 /* The value will need to be fetched from the constant pool. */ 3606 *total = CONSTANT_POOL_COST; 3607 return true; 3608 3609 case MEM: 3610 /* If the address is legitimate, return the number of 3611 instructions it needs. */ 3612 addr = XEXP (x, 0); 3613 cost = mips_address_insns (addr, mode, true); 3614 if (cost > 0) 3615 { 3616 *total = COSTS_N_INSNS (cost + 1); 3617 return true; 3618 } 3619 /* Check for a scaled indexed address. */ 3620 if (mips_lwxs_address_p (addr)) 3621 { 3622 *total = COSTS_N_INSNS (2); 3623 return true; 3624 } 3625 /* Otherwise use the default handling. */ 3626 return false; 3627 3628 case FFS: 3629 *total = COSTS_N_INSNS (6); 3630 return false; 3631 3632 case NOT: 3633 *total = COSTS_N_INSNS (GET_MODE_SIZE (mode) > UNITS_PER_WORD ? 2 : 1); 3634 return false; 3635 3636 case AND: 3637 /* Check for a *clear_upper32 pattern and treat it like a zero 3638 extension. See the pattern's comment for details. */ 3639 if (TARGET_64BIT 3640 && mode == DImode 3641 && CONST_INT_P (XEXP (x, 1)) 3642 && UINTVAL (XEXP (x, 1)) == 0xffffffff) 3643 { 3644 *total = (mips_zero_extend_cost (mode, XEXP (x, 0)) 3645 + rtx_cost (XEXP (x, 0), SET, speed)); 3646 return true; 3647 } 3648 /* Fall through. */ 3649 3650 case IOR: 3651 case XOR: 3652 /* Double-word operations use two single-word operations. */ 3653 *total = mips_binary_cost (x, COSTS_N_INSNS (1), COSTS_N_INSNS (2), 3654 speed); 3655 return true; 3656 3657 case ASHIFT: 3658 case ASHIFTRT: 3659 case LSHIFTRT: 3660 case ROTATE: 3661 case ROTATERT: 3662 if (CONSTANT_P (XEXP (x, 1))) 3663 *total = mips_binary_cost (x, COSTS_N_INSNS (1), COSTS_N_INSNS (4), 3664 speed); 3665 else 3666 *total = mips_binary_cost (x, COSTS_N_INSNS (1), COSTS_N_INSNS (12), 3667 speed); 3668 return true; 3669 3670 case ABS: 3671 if (float_mode_p) 3672 *total = mips_cost->fp_add; 3673 else 3674 *total = COSTS_N_INSNS (4); 3675 return false; 3676 3677 case LO_SUM: 3678 /* Low-part immediates need an extended MIPS16 instruction. */ 3679 *total = (COSTS_N_INSNS (TARGET_MIPS16 ? 2 : 1) 3680 + rtx_cost (XEXP (x, 0), SET, speed)); 3681 return true; 3682 3683 case LT: 3684 case LTU: 3685 case LE: 3686 case LEU: 3687 case GT: 3688 case GTU: 3689 case GE: 3690 case GEU: 3691 case EQ: 3692 case NE: 3693 case UNORDERED: 3694 case LTGT: 3695 /* Branch comparisons have VOIDmode, so use the first operand's 3696 mode instead. */ 3697 mode = GET_MODE (XEXP (x, 0)); 3698 if (FLOAT_MODE_P (mode)) 3699 { 3700 *total = mips_cost->fp_add; 3701 return false; 3702 } 3703 *total = mips_binary_cost (x, COSTS_N_INSNS (1), COSTS_N_INSNS (4), 3704 speed); 3705 return true; 3706 3707 case MINUS: 3708 if (float_mode_p 3709 && (ISA_HAS_NMADD4_NMSUB4 (mode) || ISA_HAS_NMADD3_NMSUB3 (mode)) 3710 && TARGET_FUSED_MADD 3711 && !HONOR_NANS (mode) 3712 && !HONOR_SIGNED_ZEROS (mode)) 3713 { 3714 /* See if we can use NMADD or NMSUB. See mips.md for the 3715 associated patterns. */ 3716 rtx op0 = XEXP (x, 0); 3717 rtx op1 = XEXP (x, 1); 3718 if (GET_CODE (op0) == MULT && GET_CODE (XEXP (op0, 0)) == NEG) 3719 { 3720 *total = (mips_fp_mult_cost (mode) 3721 + rtx_cost (XEXP (XEXP (op0, 0), 0), SET, speed) 3722 + rtx_cost (XEXP (op0, 1), SET, speed) 3723 + rtx_cost (op1, SET, speed)); 3724 return true; 3725 } 3726 if (GET_CODE (op1) == MULT) 3727 { 3728 *total = (mips_fp_mult_cost (mode) 3729 + rtx_cost (op0, SET, speed) 3730 + rtx_cost (XEXP (op1, 0), SET, speed) 3731 + rtx_cost (XEXP (op1, 1), SET, speed)); 3732 return true; 3733 } 3734 } 3735 /* Fall through. */ 3736 3737 case PLUS: 3738 if (float_mode_p) 3739 { 3740 /* If this is part of a MADD or MSUB, treat the PLUS as 3741 being free. */ 3742 if (ISA_HAS_FP4 3743 && TARGET_FUSED_MADD 3744 && GET_CODE (XEXP (x, 0)) == MULT) 3745 *total = 0; 3746 else 3747 *total = mips_cost->fp_add; 3748 return false; 3749 } 3750 3751 /* Double-word operations require three single-word operations and 3752 an SLTU. The MIPS16 version then needs to move the result of 3753 the SLTU from $24 to a MIPS16 register. */ 3754 *total = mips_binary_cost (x, COSTS_N_INSNS (1), 3755 COSTS_N_INSNS (TARGET_MIPS16 ? 5 : 4), 3756 speed); 3757 return true; 3758 3759 case NEG: 3760 if (float_mode_p 3761 && (ISA_HAS_NMADD4_NMSUB4 (mode) || ISA_HAS_NMADD3_NMSUB3 (mode)) 3762 && TARGET_FUSED_MADD 3763 && !HONOR_NANS (mode) 3764 && HONOR_SIGNED_ZEROS (mode)) 3765 { 3766 /* See if we can use NMADD or NMSUB. See mips.md for the 3767 associated patterns. */ 3768 rtx op = XEXP (x, 0); 3769 if ((GET_CODE (op) == PLUS || GET_CODE (op) == MINUS) 3770 && GET_CODE (XEXP (op, 0)) == MULT) 3771 { 3772 *total = (mips_fp_mult_cost (mode) 3773 + rtx_cost (XEXP (XEXP (op, 0), 0), SET, speed) 3774 + rtx_cost (XEXP (XEXP (op, 0), 1), SET, speed) 3775 + rtx_cost (XEXP (op, 1), SET, speed)); 3776 return true; 3777 } 3778 } 3779 3780 if (float_mode_p) 3781 *total = mips_cost->fp_add; 3782 else 3783 *total = COSTS_N_INSNS (GET_MODE_SIZE (mode) > UNITS_PER_WORD ? 4 : 1); 3784 return false; 3785 3786 case MULT: 3787 if (float_mode_p) 3788 *total = mips_fp_mult_cost (mode); 3789 else if (mode == DImode && !TARGET_64BIT) 3790 /* Synthesized from 2 mulsi3s, 1 mulsidi3 and two additions, 3791 where the mulsidi3 always includes an MFHI and an MFLO. */ 3792 *total = (speed 3793 ? mips_cost->int_mult_si * 3 + 6 3794 : COSTS_N_INSNS (ISA_HAS_MUL3 ? 7 : 9)); 3795 else if (!speed) 3796 *total = (ISA_HAS_MUL3 ? 1 : 2); 3797 else if (mode == DImode) 3798 *total = mips_cost->int_mult_di; 3799 else 3800 *total = mips_cost->int_mult_si; 3801 return false; 3802 3803 case DIV: 3804 /* Check for a reciprocal. */ 3805 if (float_mode_p 3806 && ISA_HAS_FP4 3807 && flag_unsafe_math_optimizations 3808 && XEXP (x, 0) == CONST1_RTX (mode)) 3809 { 3810 if (outer_code == SQRT || GET_CODE (XEXP (x, 1)) == SQRT) 3811 /* An rsqrt<mode>a or rsqrt<mode>b pattern. Count the 3812 division as being free. */ 3813 *total = rtx_cost (XEXP (x, 1), SET, speed); 3814 else 3815 *total = (mips_fp_div_cost (mode) 3816 + rtx_cost (XEXP (x, 1), SET, speed)); 3817 return true; 3818 } 3819 /* Fall through. */ 3820 3821 case SQRT: 3822 case MOD: 3823 if (float_mode_p) 3824 { 3825 *total = mips_fp_div_cost (mode); 3826 return false; 3827 } 3828 /* Fall through. */ 3829 3830 case UDIV: 3831 case UMOD: 3832 if (!speed) 3833 { 3834 /* It is our responsibility to make division by a power of 2 3835 as cheap as 2 register additions if we want the division 3836 expanders to be used for such operations; see the setting 3837 of sdiv_pow2_cheap in optabs.c. Using (D)DIV for MIPS16 3838 should always produce shorter code than using 3839 expand_sdiv2_pow2. */ 3840 if (TARGET_MIPS16 3841 && CONST_INT_P (XEXP (x, 1)) 3842 && exact_log2 (INTVAL (XEXP (x, 1))) >= 0) 3843 { 3844 *total = COSTS_N_INSNS (2) + rtx_cost (XEXP (x, 0), SET, speed); 3845 return true; 3846 } 3847 *total = COSTS_N_INSNS (mips_idiv_insns ()); 3848 } 3849 else if (mode == DImode) 3850 *total = mips_cost->int_div_di; 3851 else 3852 *total = mips_cost->int_div_si; 3853 return false; 3854 3855 case SIGN_EXTEND: 3856 *total = mips_sign_extend_cost (mode, XEXP (x, 0)); 3857 return false; 3858 3859 case ZERO_EXTEND: 3860 *total = mips_zero_extend_cost (mode, XEXP (x, 0)); 3861 return false; 3862 3863 case FLOAT: 3864 case UNSIGNED_FLOAT: 3865 case FIX: 3866 case FLOAT_EXTEND: 3867 case FLOAT_TRUNCATE: 3868 *total = mips_cost->fp_add; 3869 return false; 3870 3871 default: 3872 return false; 3873 } 3874 } 3875 3876 /* Implement TARGET_ADDRESS_COST. */ 3877 3878 static int 3879 mips_address_cost (rtx addr, bool speed ATTRIBUTE_UNUSED) 3880 { 3881 return mips_address_insns (addr, SImode, false); 3882 } 3883 3884 /* Information about a single instruction in a multi-instruction 3885 asm sequence. */ 3886 struct mips_multi_member { 3887 /* True if this is a label, false if it is code. */ 3888 bool is_label_p; 3889 3890 /* The output_asm_insn format of the instruction. */ 3891 const char *format; 3892 3893 /* The operands to the instruction. */ 3894 rtx operands[MAX_RECOG_OPERANDS]; 3895 }; 3896 typedef struct mips_multi_member mips_multi_member; 3897 3898 /* Vector definitions for the above. */ 3899 DEF_VEC_O(mips_multi_member); 3900 DEF_VEC_ALLOC_O(mips_multi_member, heap); 3901 3902 /* The instructions that make up the current multi-insn sequence. */ 3903 static VEC (mips_multi_member, heap) *mips_multi_members; 3904 3905 /* How many instructions (as opposed to labels) are in the current 3906 multi-insn sequence. */ 3907 static unsigned int mips_multi_num_insns; 3908 3909 /* Start a new multi-insn sequence. */ 3910 3911 static void 3912 mips_multi_start (void) 3913 { 3914 VEC_truncate (mips_multi_member, mips_multi_members, 0); 3915 mips_multi_num_insns = 0; 3916 } 3917 3918 /* Add a new, uninitialized member to the current multi-insn sequence. */ 3919 3920 static struct mips_multi_member * 3921 mips_multi_add (void) 3922 { 3923 return VEC_safe_push (mips_multi_member, heap, mips_multi_members, 0); 3924 } 3925 3926 /* Add a normal insn with the given asm format to the current multi-insn 3927 sequence. The other arguments are a null-terminated list of operands. */ 3928 3929 static void 3930 mips_multi_add_insn (const char *format, ...) 3931 { 3932 struct mips_multi_member *member; 3933 va_list ap; 3934 unsigned int i; 3935 rtx op; 3936 3937 member = mips_multi_add (); 3938 member->is_label_p = false; 3939 member->format = format; 3940 va_start (ap, format); 3941 i = 0; 3942 while ((op = va_arg (ap, rtx))) 3943 member->operands[i++] = op; 3944 va_end (ap); 3945 mips_multi_num_insns++; 3946 } 3947 3948 /* Add the given label definition to the current multi-insn sequence. 3949 The definition should include the colon. */ 3950 3951 static void 3952 mips_multi_add_label (const char *label) 3953 { 3954 struct mips_multi_member *member; 3955 3956 member = mips_multi_add (); 3957 member->is_label_p = true; 3958 member->format = label; 3959 } 3960 3961 /* Return the index of the last member of the current multi-insn sequence. */ 3962 3963 static unsigned int 3964 mips_multi_last_index (void) 3965 { 3966 return VEC_length (mips_multi_member, mips_multi_members) - 1; 3967 } 3968 3969 /* Add a copy of an existing instruction to the current multi-insn 3970 sequence. I is the index of the instruction that should be copied. */ 3971 3972 static void 3973 mips_multi_copy_insn (unsigned int i) 3974 { 3975 struct mips_multi_member *member; 3976 3977 member = mips_multi_add (); 3978 memcpy (member, VEC_index (mips_multi_member, mips_multi_members, i), 3979 sizeof (*member)); 3980 gcc_assert (!member->is_label_p); 3981 } 3982 3983 /* Change the operand of an existing instruction in the current 3984 multi-insn sequence. I is the index of the instruction, 3985 OP is the index of the operand, and X is the new value. */ 3986 3987 static void 3988 mips_multi_set_operand (unsigned int i, unsigned int op, rtx x) 3989 { 3990 VEC_index (mips_multi_member, mips_multi_members, i)->operands[op] = x; 3991 } 3992 3993 /* Write out the asm code for the current multi-insn sequence. */ 3994 3995 static void 3996 mips_multi_write (void) 3997 { 3998 struct mips_multi_member *member; 3999 unsigned int i; 4000 4001 for (i = 0; 4002 VEC_iterate (mips_multi_member, mips_multi_members, i, member); 4003 i++) 4004 if (member->is_label_p) 4005 fprintf (asm_out_file, "%s\n", member->format); 4006 else 4007 output_asm_insn (member->format, member->operands); 4008 } 4009 4010 /* Return one word of double-word value OP, taking into account the fixed 4011 endianness of certain registers. HIGH_P is true to select the high part, 4012 false to select the low part. */ 4013 4014 rtx 4015 mips_subword (rtx op, bool high_p) 4016 { 4017 unsigned int byte, offset; 4018 enum machine_mode mode; 4019 4020 mode = GET_MODE (op); 4021 if (mode == VOIDmode) 4022 mode = TARGET_64BIT ? TImode : DImode; 4023 4024 if (TARGET_BIG_ENDIAN ? !high_p : high_p) 4025 byte = UNITS_PER_WORD; 4026 else 4027 byte = 0; 4028 4029 if (FP_REG_RTX_P (op)) 4030 { 4031 /* Paired FPRs are always ordered little-endian. */ 4032 offset = (UNITS_PER_WORD < UNITS_PER_HWFPVALUE ? high_p : byte != 0); 4033 return gen_rtx_REG (word_mode, REGNO (op) + offset); 4034 } 4035 4036 if (MEM_P (op)) 4037 return mips_rewrite_small_data (adjust_address (op, word_mode, byte)); 4038 4039 return simplify_gen_subreg (word_mode, op, mode, byte); 4040 } 4041 4042 /* Return true if a 64-bit move from SRC to DEST should be split into two. */ 4043 4044 bool 4045 mips_split_64bit_move_p (rtx dest, rtx src) 4046 { 4047 if (TARGET_64BIT) 4048 return false; 4049 4050 /* FPR-to-FPR moves can be done in a single instruction, if they're 4051 allowed at all. */ 4052 if (FP_REG_RTX_P (src) && FP_REG_RTX_P (dest)) 4053 return false; 4054 4055 /* Check for floating-point loads and stores. */ 4056 if (ISA_HAS_LDC1_SDC1) 4057 { 4058 if (FP_REG_RTX_P (dest) && MEM_P (src)) 4059 return false; 4060 if (FP_REG_RTX_P (src) && MEM_P (dest)) 4061 return false; 4062 } 4063 return true; 4064 } 4065 4066 /* Split a doubleword move from SRC to DEST. On 32-bit targets, 4067 this function handles 64-bit moves for which mips_split_64bit_move_p 4068 holds. For 64-bit targets, this function handles 128-bit moves. */ 4069 4070 void 4071 mips_split_doubleword_move (rtx dest, rtx src) 4072 { 4073 rtx low_dest; 4074 4075 if (FP_REG_RTX_P (dest) || FP_REG_RTX_P (src)) 4076 { 4077 if (!TARGET_64BIT && GET_MODE (dest) == DImode) 4078 emit_insn (gen_move_doubleword_fprdi (dest, src)); 4079 else if (!TARGET_64BIT && GET_MODE (dest) == DFmode) 4080 emit_insn (gen_move_doubleword_fprdf (dest, src)); 4081 else if (!TARGET_64BIT && GET_MODE (dest) == V2SFmode) 4082 emit_insn (gen_move_doubleword_fprv2sf (dest, src)); 4083 else if (!TARGET_64BIT && GET_MODE (dest) == V2SImode) 4084 emit_insn (gen_move_doubleword_fprv2si (dest, src)); 4085 else if (!TARGET_64BIT && GET_MODE (dest) == V4HImode) 4086 emit_insn (gen_move_doubleword_fprv4hi (dest, src)); 4087 else if (!TARGET_64BIT && GET_MODE (dest) == V8QImode) 4088 emit_insn (gen_move_doubleword_fprv8qi (dest, src)); 4089 else if (TARGET_64BIT && GET_MODE (dest) == TFmode) 4090 emit_insn (gen_move_doubleword_fprtf (dest, src)); 4091 else 4092 gcc_unreachable (); 4093 } 4094 else if (REG_P (dest) && REGNO (dest) == MD_REG_FIRST) 4095 { 4096 low_dest = mips_subword (dest, false); 4097 mips_emit_move (low_dest, mips_subword (src, false)); 4098 if (TARGET_64BIT) 4099 emit_insn (gen_mthidi_ti (dest, mips_subword (src, true), low_dest)); 4100 else 4101 emit_insn (gen_mthisi_di (dest, mips_subword (src, true), low_dest)); 4102 } 4103 else if (REG_P (src) && REGNO (src) == MD_REG_FIRST) 4104 { 4105 mips_emit_move (mips_subword (dest, false), mips_subword (src, false)); 4106 if (TARGET_64BIT) 4107 emit_insn (gen_mfhidi_ti (mips_subword (dest, true), src)); 4108 else 4109 emit_insn (gen_mfhisi_di (mips_subword (dest, true), src)); 4110 } 4111 else 4112 { 4113 /* The operation can be split into two normal moves. Decide in 4114 which order to do them. */ 4115 low_dest = mips_subword (dest, false); 4116 if (REG_P (low_dest) 4117 && reg_overlap_mentioned_p (low_dest, src)) 4118 { 4119 mips_emit_move (mips_subword (dest, true), mips_subword (src, true)); 4120 mips_emit_move (low_dest, mips_subword (src, false)); 4121 } 4122 else 4123 { 4124 mips_emit_move (low_dest, mips_subword (src, false)); 4125 mips_emit_move (mips_subword (dest, true), mips_subword (src, true)); 4126 } 4127 } 4128 } 4129 4130 /* Return the appropriate instructions to move SRC into DEST. Assume 4131 that SRC is operand 1 and DEST is operand 0. */ 4132 4133 const char * 4134 mips_output_move (rtx dest, rtx src) 4135 { 4136 enum rtx_code dest_code, src_code; 4137 enum machine_mode mode; 4138 enum mips_symbol_type symbol_type; 4139 bool dbl_p; 4140 4141 dest_code = GET_CODE (dest); 4142 src_code = GET_CODE (src); 4143 mode = GET_MODE (dest); 4144 dbl_p = (GET_MODE_SIZE (mode) == 8); 4145 4146 if (dbl_p && mips_split_64bit_move_p (dest, src)) 4147 return "#"; 4148 4149 if ((src_code == REG && GP_REG_P (REGNO (src))) 4150 || (!TARGET_MIPS16 && src == CONST0_RTX (mode))) 4151 { 4152 if (dest_code == REG) 4153 { 4154 if (GP_REG_P (REGNO (dest))) 4155 return "move\t%0,%z1"; 4156 4157 /* Moves to HI are handled by special .md insns. */ 4158 if (REGNO (dest) == LO_REGNUM) 4159 return "mtlo\t%z1"; 4160 4161 if (DSP_ACC_REG_P (REGNO (dest))) 4162 { 4163 static char retval[] = "mt__\t%z1,%q0"; 4164 4165 retval[2] = reg_names[REGNO (dest)][4]; 4166 retval[3] = reg_names[REGNO (dest)][5]; 4167 return retval; 4168 } 4169 4170 if (FP_REG_P (REGNO (dest))) 4171 return dbl_p ? "dmtc1\t%z1,%0" : "mtc1\t%z1,%0"; 4172 4173 if (ALL_COP_REG_P (REGNO (dest))) 4174 { 4175 static char retval[] = "dmtc_\t%z1,%0"; 4176 4177 retval[4] = COPNUM_AS_CHAR_FROM_REGNUM (REGNO (dest)); 4178 return dbl_p ? retval : retval + 1; 4179 } 4180 } 4181 if (dest_code == MEM) 4182 switch (GET_MODE_SIZE (mode)) 4183 { 4184 case 1: return "sb\t%z1,%0"; 4185 case 2: return "sh\t%z1,%0"; 4186 case 4: return "sw\t%z1,%0"; 4187 case 8: return "sd\t%z1,%0"; 4188 } 4189 } 4190 if (dest_code == REG && GP_REG_P (REGNO (dest))) 4191 { 4192 if (src_code == REG) 4193 { 4194 /* Moves from HI are handled by special .md insns. */ 4195 if (REGNO (src) == LO_REGNUM) 4196 { 4197 /* When generating VR4120 or VR4130 code, we use MACC and 4198 DMACC instead of MFLO. This avoids both the normal 4199 MIPS III HI/LO hazards and the errata related to 4200 -mfix-vr4130. */ 4201 if (ISA_HAS_MACCHI) 4202 return dbl_p ? "dmacc\t%0,%.,%." : "macc\t%0,%.,%."; 4203 return "mflo\t%0"; 4204 } 4205 4206 if (DSP_ACC_REG_P (REGNO (src))) 4207 { 4208 static char retval[] = "mf__\t%0,%q1"; 4209 4210 retval[2] = reg_names[REGNO (src)][4]; 4211 retval[3] = reg_names[REGNO (src)][5]; 4212 return retval; 4213 } 4214 4215 if (FP_REG_P (REGNO (src))) 4216 return dbl_p ? "dmfc1\t%0,%1" : "mfc1\t%0,%1"; 4217 4218 if (ALL_COP_REG_P (REGNO (src))) 4219 { 4220 static char retval[] = "dmfc_\t%0,%1"; 4221 4222 retval[4] = COPNUM_AS_CHAR_FROM_REGNUM (REGNO (src)); 4223 return dbl_p ? retval : retval + 1; 4224 } 4225 4226 if (ST_REG_P (REGNO (src)) && ISA_HAS_8CC) 4227 return "lui\t%0,0x3f80\n\tmovf\t%0,%.,%1"; 4228 } 4229 4230 if (src_code == MEM) 4231 switch (GET_MODE_SIZE (mode)) 4232 { 4233 case 1: return "lbu\t%0,%1"; 4234 case 2: return "lhu\t%0,%1"; 4235 case 4: return "lw\t%0,%1"; 4236 case 8: return "ld\t%0,%1"; 4237 } 4238 4239 if (src_code == CONST_INT) 4240 { 4241 /* Don't use the X format for the operand itself, because that 4242 will give out-of-range numbers for 64-bit hosts and 32-bit 4243 targets. */ 4244 if (!TARGET_MIPS16) 4245 return "li\t%0,%1\t\t\t# %X1"; 4246 4247 if (SMALL_OPERAND_UNSIGNED (INTVAL (src))) 4248 return "li\t%0,%1"; 4249 4250 if (SMALL_OPERAND_UNSIGNED (-INTVAL (src))) 4251 return "#"; 4252 } 4253 4254 if (src_code == HIGH) 4255 return TARGET_MIPS16 ? "#" : "lui\t%0,%h1"; 4256 4257 if (CONST_GP_P (src)) 4258 return "move\t%0,%1"; 4259 4260 if (mips_symbolic_constant_p (src, SYMBOL_CONTEXT_LEA, &symbol_type) 4261 && mips_lo_relocs[symbol_type] != 0) 4262 { 4263 /* A signed 16-bit constant formed by applying a relocation 4264 operator to a symbolic address. */ 4265 gcc_assert (!mips_split_p[symbol_type]); 4266 return "li\t%0,%R1"; 4267 } 4268 4269 if (symbolic_operand (src, VOIDmode)) 4270 { 4271 gcc_assert (TARGET_MIPS16 4272 ? TARGET_MIPS16_TEXT_LOADS 4273 : !TARGET_EXPLICIT_RELOCS); 4274 return dbl_p ? "dla\t%0,%1" : "la\t%0,%1"; 4275 } 4276 } 4277 if (src_code == REG && FP_REG_P (REGNO (src))) 4278 { 4279 if (dest_code == REG && FP_REG_P (REGNO (dest))) 4280 { 4281 if (GET_MODE (dest) == V2SFmode) 4282 return "mov.ps\t%0,%1"; 4283 else 4284 return dbl_p ? "mov.d\t%0,%1" : "mov.s\t%0,%1"; 4285 } 4286 4287 if (dest_code == MEM) 4288 return dbl_p ? "sdc1\t%1,%0" : "swc1\t%1,%0"; 4289 } 4290 if (dest_code == REG && FP_REG_P (REGNO (dest))) 4291 { 4292 if (src_code == MEM) 4293 return dbl_p ? "ldc1\t%0,%1" : "lwc1\t%0,%1"; 4294 } 4295 if (dest_code == REG && ALL_COP_REG_P (REGNO (dest)) && src_code == MEM) 4296 { 4297 static char retval[] = "l_c_\t%0,%1"; 4298 4299 retval[1] = (dbl_p ? 'd' : 'w'); 4300 retval[3] = COPNUM_AS_CHAR_FROM_REGNUM (REGNO (dest)); 4301 return retval; 4302 } 4303 if (dest_code == MEM && src_code == REG && ALL_COP_REG_P (REGNO (src))) 4304 { 4305 static char retval[] = "s_c_\t%1,%0"; 4306 4307 retval[1] = (dbl_p ? 'd' : 'w'); 4308 retval[3] = COPNUM_AS_CHAR_FROM_REGNUM (REGNO (src)); 4309 return retval; 4310 } 4311 gcc_unreachable (); 4312 } 4313 4314 /* Return true if CMP1 is a suitable second operand for integer ordering 4315 test CODE. See also the *sCC patterns in mips.md. */ 4316 4317 static bool 4318 mips_int_order_operand_ok_p (enum rtx_code code, rtx cmp1) 4319 { 4320 switch (code) 4321 { 4322 case GT: 4323 case GTU: 4324 return reg_or_0_operand (cmp1, VOIDmode); 4325 4326 case GE: 4327 case GEU: 4328 return !TARGET_MIPS16 && cmp1 == const1_rtx; 4329 4330 case LT: 4331 case LTU: 4332 return arith_operand (cmp1, VOIDmode); 4333 4334 case LE: 4335 return sle_operand (cmp1, VOIDmode); 4336 4337 case LEU: 4338 return sleu_operand (cmp1, VOIDmode); 4339 4340 default: 4341 gcc_unreachable (); 4342 } 4343 } 4344 4345 /* Return true if *CMP1 (of mode MODE) is a valid second operand for 4346 integer ordering test *CODE, or if an equivalent combination can 4347 be formed by adjusting *CODE and *CMP1. When returning true, update 4348 *CODE and *CMP1 with the chosen code and operand, otherwise leave 4349 them alone. */ 4350 4351 static bool 4352 mips_canonicalize_int_order_test (enum rtx_code *code, rtx *cmp1, 4353 enum machine_mode mode) 4354 { 4355 HOST_WIDE_INT plus_one; 4356 4357 if (mips_int_order_operand_ok_p (*code, *cmp1)) 4358 return true; 4359 4360 if (CONST_INT_P (*cmp1)) 4361 switch (*code) 4362 { 4363 case LE: 4364 plus_one = trunc_int_for_mode (UINTVAL (*cmp1) + 1, mode); 4365 if (INTVAL (*cmp1) < plus_one) 4366 { 4367 *code = LT; 4368 *cmp1 = force_reg (mode, GEN_INT (plus_one)); 4369 return true; 4370 } 4371 break; 4372 4373 case LEU: 4374 plus_one = trunc_int_for_mode (UINTVAL (*cmp1) + 1, mode); 4375 if (plus_one != 0) 4376 { 4377 *code = LTU; 4378 *cmp1 = force_reg (mode, GEN_INT (plus_one)); 4379 return true; 4380 } 4381 break; 4382 4383 default: 4384 break; 4385 } 4386 return false; 4387 } 4388 4389 /* Compare CMP0 and CMP1 using ordering test CODE and store the result 4390 in TARGET. CMP0 and TARGET are register_operands. If INVERT_PTR 4391 is nonnull, it's OK to set TARGET to the inverse of the result and 4392 flip *INVERT_PTR instead. */ 4393 4394 static void 4395 mips_emit_int_order_test (enum rtx_code code, bool *invert_ptr, 4396 rtx target, rtx cmp0, rtx cmp1) 4397 { 4398 enum machine_mode mode; 4399 4400 /* First see if there is a MIPS instruction that can do this operation. 4401 If not, try doing the same for the inverse operation. If that also 4402 fails, force CMP1 into a register and try again. */ 4403 mode = GET_MODE (cmp0); 4404 if (mips_canonicalize_int_order_test (&code, &cmp1, mode)) 4405 mips_emit_binary (code, target, cmp0, cmp1); 4406 else 4407 { 4408 enum rtx_code inv_code = reverse_condition (code); 4409 if (!mips_canonicalize_int_order_test (&inv_code, &cmp1, mode)) 4410 { 4411 cmp1 = force_reg (mode, cmp1); 4412 mips_emit_int_order_test (code, invert_ptr, target, cmp0, cmp1); 4413 } 4414 else if (invert_ptr == 0) 4415 { 4416 rtx inv_target; 4417 4418 inv_target = mips_force_binary (GET_MODE (target), 4419 inv_code, cmp0, cmp1); 4420 mips_emit_binary (XOR, target, inv_target, const1_rtx); 4421 } 4422 else 4423 { 4424 *invert_ptr = !*invert_ptr; 4425 mips_emit_binary (inv_code, target, cmp0, cmp1); 4426 } 4427 } 4428 } 4429 4430 /* Return a register that is zero iff CMP0 and CMP1 are equal. 4431 The register will have the same mode as CMP0. */ 4432 4433 static rtx 4434 mips_zero_if_equal (rtx cmp0, rtx cmp1) 4435 { 4436 if (cmp1 == const0_rtx) 4437 return cmp0; 4438 4439 if (uns_arith_operand (cmp1, VOIDmode)) 4440 return expand_binop (GET_MODE (cmp0), xor_optab, 4441 cmp0, cmp1, 0, 0, OPTAB_DIRECT); 4442 4443 return expand_binop (GET_MODE (cmp0), sub_optab, 4444 cmp0, cmp1, 0, 0, OPTAB_DIRECT); 4445 } 4446 4447 /* Convert *CODE into a code that can be used in a floating-point 4448 scc instruction (C.cond.fmt). Return true if the values of 4449 the condition code registers will be inverted, with 0 indicating 4450 that the condition holds. */ 4451 4452 static bool 4453 mips_reversed_fp_cond (enum rtx_code *code) 4454 { 4455 switch (*code) 4456 { 4457 case NE: 4458 case LTGT: 4459 case ORDERED: 4460 *code = reverse_condition_maybe_unordered (*code); 4461 return true; 4462 4463 default: 4464 return false; 4465 } 4466 } 4467 4468 /* Convert a comparison into something that can be used in a branch or 4469 conditional move. On entry, *OP0 and *OP1 are the values being 4470 compared and *CODE is the code used to compare them. 4471 4472 Update *CODE, *OP0 and *OP1 so that they describe the final comparison. 4473 If NEED_EQ_NE_P, then only EQ or NE comparisons against zero are possible, 4474 otherwise any standard branch condition can be used. The standard branch 4475 conditions are: 4476 4477 - EQ or NE between two registers. 4478 - any comparison between a register and zero. */ 4479 4480 static void 4481 mips_emit_compare (enum rtx_code *code, rtx *op0, rtx *op1, bool need_eq_ne_p) 4482 { 4483 rtx cmp_op0 = *op0; 4484 rtx cmp_op1 = *op1; 4485 4486 if (GET_MODE_CLASS (GET_MODE (*op0)) == MODE_INT) 4487 { 4488 if (!need_eq_ne_p && *op1 == const0_rtx) 4489 ; 4490 else if (*code == EQ || *code == NE) 4491 { 4492 if (need_eq_ne_p) 4493 { 4494 *op0 = mips_zero_if_equal (cmp_op0, cmp_op1); 4495 *op1 = const0_rtx; 4496 } 4497 else 4498 *op1 = force_reg (GET_MODE (cmp_op0), cmp_op1); 4499 } 4500 else 4501 { 4502 /* The comparison needs a separate scc instruction. Store the 4503 result of the scc in *OP0 and compare it against zero. */ 4504 bool invert = false; 4505 *op0 = gen_reg_rtx (GET_MODE (cmp_op0)); 4506 mips_emit_int_order_test (*code, &invert, *op0, cmp_op0, cmp_op1); 4507 *code = (invert ? EQ : NE); 4508 *op1 = const0_rtx; 4509 } 4510 } 4511 else if (ALL_FIXED_POINT_MODE_P (GET_MODE (cmp_op0))) 4512 { 4513 *op0 = gen_rtx_REG (CCDSPmode, CCDSP_CC_REGNUM); 4514 mips_emit_binary (*code, *op0, cmp_op0, cmp_op1); 4515 *code = NE; 4516 *op1 = const0_rtx; 4517 } 4518 else 4519 { 4520 enum rtx_code cmp_code; 4521 4522 /* Floating-point tests use a separate C.cond.fmt comparison to 4523 set a condition code register. The branch or conditional move 4524 will then compare that register against zero. 4525 4526 Set CMP_CODE to the code of the comparison instruction and 4527 *CODE to the code that the branch or move should use. */ 4528 cmp_code = *code; 4529 *code = mips_reversed_fp_cond (&cmp_code) ? EQ : NE; 4530 *op0 = (ISA_HAS_8CC 4531 ? gen_reg_rtx (CCmode) 4532 : gen_rtx_REG (CCmode, FPSW_REGNUM)); 4533 *op1 = const0_rtx; 4534 mips_emit_binary (cmp_code, *op0, cmp_op0, cmp_op1); 4535 } 4536 } 4537 4538 /* Try performing the comparison in OPERANDS[1], whose arms are OPERANDS[2] 4539 and OPERAND[3]. Store the result in OPERANDS[0]. 4540 4541 On 64-bit targets, the mode of the comparison and target will always be 4542 SImode, thus possibly narrower than that of the comparison's operands. */ 4543 4544 void 4545 mips_expand_scc (rtx operands[]) 4546 { 4547 rtx target = operands[0]; 4548 enum rtx_code code = GET_CODE (operands[1]); 4549 rtx op0 = operands[2]; 4550 rtx op1 = operands[3]; 4551 4552 gcc_assert (GET_MODE_CLASS (GET_MODE (op0)) == MODE_INT); 4553 4554 if (code == EQ || code == NE) 4555 { 4556 if (ISA_HAS_SEQ_SNE 4557 && reg_imm10_operand (op1, GET_MODE (op1))) 4558 mips_emit_binary (code, target, op0, op1); 4559 else 4560 { 4561 rtx zie = mips_zero_if_equal (op0, op1); 4562 mips_emit_binary (code, target, zie, const0_rtx); 4563 } 4564 } 4565 else 4566 mips_emit_int_order_test (code, 0, target, op0, op1); 4567 } 4568 4569 /* Compare OPERANDS[1] with OPERANDS[2] using comparison code 4570 CODE and jump to OPERANDS[3] if the condition holds. */ 4571 4572 void 4573 mips_expand_conditional_branch (rtx *operands) 4574 { 4575 enum rtx_code code = GET_CODE (operands[0]); 4576 rtx op0 = operands[1]; 4577 rtx op1 = operands[2]; 4578 rtx condition; 4579 4580 mips_emit_compare (&code, &op0, &op1, TARGET_MIPS16); 4581 condition = gen_rtx_fmt_ee (code, VOIDmode, op0, op1); 4582 emit_jump_insn (gen_condjump (condition, operands[3])); 4583 } 4584 4585 /* Implement: 4586 4587 (set temp (COND:CCV2 CMP_OP0 CMP_OP1)) 4588 (set DEST (unspec [TRUE_SRC FALSE_SRC temp] UNSPEC_MOVE_TF_PS)) */ 4589 4590 void 4591 mips_expand_vcondv2sf (rtx dest, rtx true_src, rtx false_src, 4592 enum rtx_code cond, rtx cmp_op0, rtx cmp_op1) 4593 { 4594 rtx cmp_result; 4595 bool reversed_p; 4596 4597 reversed_p = mips_reversed_fp_cond (&cond); 4598 cmp_result = gen_reg_rtx (CCV2mode); 4599 emit_insn (gen_scc_ps (cmp_result, 4600 gen_rtx_fmt_ee (cond, VOIDmode, cmp_op0, cmp_op1))); 4601 if (reversed_p) 4602 emit_insn (gen_mips_cond_move_tf_ps (dest, false_src, true_src, 4603 cmp_result)); 4604 else 4605 emit_insn (gen_mips_cond_move_tf_ps (dest, true_src, false_src, 4606 cmp_result)); 4607 } 4608 4609 /* Perform the comparison in OPERANDS[1]. Move OPERANDS[2] into OPERANDS[0] 4610 if the condition holds, otherwise move OPERANDS[3] into OPERANDS[0]. */ 4611 4612 void 4613 mips_expand_conditional_move (rtx *operands) 4614 { 4615 rtx cond; 4616 enum rtx_code code = GET_CODE (operands[1]); 4617 rtx op0 = XEXP (operands[1], 0); 4618 rtx op1 = XEXP (operands[1], 1); 4619 4620 mips_emit_compare (&code, &op0, &op1, true); 4621 cond = gen_rtx_fmt_ee (code, GET_MODE (op0), op0, op1); 4622 emit_insn (gen_rtx_SET (VOIDmode, operands[0], 4623 gen_rtx_IF_THEN_ELSE (GET_MODE (operands[0]), cond, 4624 operands[2], operands[3]))); 4625 } 4626 4627 /* Perform the comparison in COMPARISON, then trap if the condition holds. */ 4628 4629 void 4630 mips_expand_conditional_trap (rtx comparison) 4631 { 4632 rtx op0, op1; 4633 enum machine_mode mode; 4634 enum rtx_code code; 4635 4636 /* MIPS conditional trap instructions don't have GT or LE flavors, 4637 so we must swap the operands and convert to LT and GE respectively. */ 4638 code = GET_CODE (comparison); 4639 switch (code) 4640 { 4641 case GT: 4642 case LE: 4643 case GTU: 4644 case LEU: 4645 code = swap_condition (code); 4646 op0 = XEXP (comparison, 1); 4647 op1 = XEXP (comparison, 0); 4648 break; 4649 4650 default: 4651 op0 = XEXP (comparison, 0); 4652 op1 = XEXP (comparison, 1); 4653 break; 4654 } 4655 4656 mode = GET_MODE (XEXP (comparison, 0)); 4657 op0 = force_reg (mode, op0); 4658 if (!arith_operand (op1, mode)) 4659 op1 = force_reg (mode, op1); 4660 4661 emit_insn (gen_rtx_TRAP_IF (VOIDmode, 4662 gen_rtx_fmt_ee (code, mode, op0, op1), 4663 const0_rtx)); 4664 } 4665 4666 /* Initialize *CUM for a call to a function of type FNTYPE. */ 4667 4668 void 4669 mips_init_cumulative_args (CUMULATIVE_ARGS *cum, tree fntype) 4670 { 4671 memset (cum, 0, sizeof (*cum)); 4672 cum->prototype = (fntype && prototype_p (fntype)); 4673 cum->gp_reg_found = (cum->prototype && stdarg_p (fntype)); 4674 } 4675 4676 /* Fill INFO with information about a single argument. CUM is the 4677 cumulative state for earlier arguments. MODE is the mode of this 4678 argument and TYPE is its type (if known). NAMED is true if this 4679 is a named (fixed) argument rather than a variable one. */ 4680 4681 static void 4682 mips_get_arg_info (struct mips_arg_info *info, const CUMULATIVE_ARGS *cum, 4683 enum machine_mode mode, tree type, int named) 4684 { 4685 bool doubleword_aligned_p; 4686 unsigned int num_bytes, num_words, max_regs; 4687 4688 /* Work out the size of the argument. */ 4689 num_bytes = type ? int_size_in_bytes (type) : GET_MODE_SIZE (mode); 4690 num_words = (num_bytes + UNITS_PER_WORD - 1) / UNITS_PER_WORD; 4691 4692 /* Decide whether it should go in a floating-point register, assuming 4693 one is free. Later code checks for availability. 4694 4695 The checks against UNITS_PER_FPVALUE handle the soft-float and 4696 single-float cases. */ 4697 switch (mips_abi) 4698 { 4699 case ABI_EABI: 4700 /* The EABI conventions have traditionally been defined in terms 4701 of TYPE_MODE, regardless of the actual type. */ 4702 info->fpr_p = ((GET_MODE_CLASS (mode) == MODE_FLOAT 4703 || GET_MODE_CLASS (mode) == MODE_VECTOR_FLOAT) 4704 && GET_MODE_SIZE (mode) <= UNITS_PER_FPVALUE); 4705 break; 4706 4707 case ABI_32: 4708 case ABI_O64: 4709 /* Only leading floating-point scalars are passed in 4710 floating-point registers. We also handle vector floats the same 4711 say, which is OK because they are not covered by the standard ABI. */ 4712 info->fpr_p = (!cum->gp_reg_found 4713 && cum->arg_number < 2 4714 && (type == 0 4715 || SCALAR_FLOAT_TYPE_P (type) 4716 || VECTOR_FLOAT_TYPE_P (type)) 4717 && (GET_MODE_CLASS (mode) == MODE_FLOAT 4718 || GET_MODE_CLASS (mode) == MODE_VECTOR_FLOAT) 4719 && GET_MODE_SIZE (mode) <= UNITS_PER_FPVALUE); 4720 break; 4721 4722 case ABI_N32: 4723 case ABI_64: 4724 /* Scalar, complex and vector floating-point types are passed in 4725 floating-point registers, as long as this is a named rather 4726 than a variable argument. */ 4727 info->fpr_p = (named 4728 && (type == 0 || FLOAT_TYPE_P (type)) 4729 && (GET_MODE_CLASS (mode) == MODE_FLOAT 4730 || GET_MODE_CLASS (mode) == MODE_COMPLEX_FLOAT 4731 || GET_MODE_CLASS (mode) == MODE_VECTOR_FLOAT) 4732 && GET_MODE_UNIT_SIZE (mode) <= UNITS_PER_FPVALUE); 4733 4734 /* ??? According to the ABI documentation, the real and imaginary 4735 parts of complex floats should be passed in individual registers. 4736 The real and imaginary parts of stack arguments are supposed 4737 to be contiguous and there should be an extra word of padding 4738 at the end. 4739 4740 This has two problems. First, it makes it impossible to use a 4741 single "void *" va_list type, since register and stack arguments 4742 are passed differently. (At the time of writing, MIPSpro cannot 4743 handle complex float varargs correctly.) Second, it's unclear 4744 what should happen when there is only one register free. 4745 4746 For now, we assume that named complex floats should go into FPRs 4747 if there are two FPRs free, otherwise they should be passed in the 4748 same way as a struct containing two floats. */ 4749 if (info->fpr_p 4750 && GET_MODE_CLASS (mode) == MODE_COMPLEX_FLOAT 4751 && GET_MODE_UNIT_SIZE (mode) < UNITS_PER_FPVALUE) 4752 { 4753 if (cum->num_gprs >= MAX_ARGS_IN_REGISTERS - 1) 4754 info->fpr_p = false; 4755 else 4756 num_words = 2; 4757 } 4758 break; 4759 4760 default: 4761 gcc_unreachable (); 4762 } 4763 4764 /* See whether the argument has doubleword alignment. */ 4765 doubleword_aligned_p = FUNCTION_ARG_BOUNDARY (mode, type) > BITS_PER_WORD; 4766 4767 /* Set REG_OFFSET to the register count we're interested in. 4768 The EABI allocates the floating-point registers separately, 4769 but the other ABIs allocate them like integer registers. */ 4770 info->reg_offset = (mips_abi == ABI_EABI && info->fpr_p 4771 ? cum->num_fprs 4772 : cum->num_gprs); 4773 4774 /* Advance to an even register if the argument is doubleword-aligned. */ 4775 if (doubleword_aligned_p) 4776 info->reg_offset += info->reg_offset & 1; 4777 4778 /* Work out the offset of a stack argument. */ 4779 info->stack_offset = cum->stack_words; 4780 if (doubleword_aligned_p) 4781 info->stack_offset += info->stack_offset & 1; 4782 4783 max_regs = MAX_ARGS_IN_REGISTERS - info->reg_offset; 4784 4785 /* Partition the argument between registers and stack. */ 4786 info->reg_words = MIN (num_words, max_regs); 4787 info->stack_words = num_words - info->reg_words; 4788 } 4789 4790 /* INFO describes a register argument that has the normal format for the 4791 argument's mode. Return the register it uses, assuming that FPRs are 4792 available if HARD_FLOAT_P. */ 4793 4794 static unsigned int 4795 mips_arg_regno (const struct mips_arg_info *info, bool hard_float_p) 4796 { 4797 if (!info->fpr_p || !hard_float_p) 4798 return GP_ARG_FIRST + info->reg_offset; 4799 else if (mips_abi == ABI_32 && TARGET_DOUBLE_FLOAT && info->reg_offset > 0) 4800 /* In o32, the second argument is always passed in $f14 4801 for TARGET_DOUBLE_FLOAT, regardless of whether the 4802 first argument was a word or doubleword. */ 4803 return FP_ARG_FIRST + 2; 4804 else 4805 return FP_ARG_FIRST + info->reg_offset; 4806 } 4807 4808 /* Implement TARGET_STRICT_ARGUMENT_NAMING. */ 4809 4810 static bool 4811 mips_strict_argument_naming (CUMULATIVE_ARGS *ca ATTRIBUTE_UNUSED) 4812 { 4813 return !TARGET_OLDABI; 4814 } 4815 4816 /* Implement FUNCTION_ARG. */ 4817 4818 rtx 4819 mips_function_arg (const CUMULATIVE_ARGS *cum, enum machine_mode mode, 4820 tree type, int named) 4821 { 4822 struct mips_arg_info info; 4823 4824 /* We will be called with a mode of VOIDmode after the last argument 4825 has been seen. Whatever we return will be passed to the call expander. 4826 If we need a MIPS16 fp_code, return a REG with the code stored as 4827 the mode. */ 4828 if (mode == VOIDmode) 4829 { 4830 if (TARGET_MIPS16 && cum->fp_code != 0) 4831 return gen_rtx_REG ((enum machine_mode) cum->fp_code, 0); 4832 else 4833 return NULL; 4834 } 4835 4836 mips_get_arg_info (&info, cum, mode, type, named); 4837 4838 /* Return straight away if the whole argument is passed on the stack. */ 4839 if (info.reg_offset == MAX_ARGS_IN_REGISTERS) 4840 return NULL; 4841 4842 /* The n32 and n64 ABIs say that if any 64-bit chunk of the structure 4843 contains a double in its entirety, then that 64-bit chunk is passed 4844 in a floating-point register. */ 4845 if (TARGET_NEWABI 4846 && TARGET_HARD_FLOAT 4847 && named 4848 && type != 0 4849 && TREE_CODE (type) == RECORD_TYPE 4850 && TYPE_SIZE_UNIT (type) 4851 && host_integerp (TYPE_SIZE_UNIT (type), 1)) 4852 { 4853 tree field; 4854 4855 /* First check to see if there is any such field. */ 4856 for (field = TYPE_FIELDS (type); field; field = TREE_CHAIN (field)) 4857 if (TREE_CODE (field) == FIELD_DECL 4858 && SCALAR_FLOAT_TYPE_P (TREE_TYPE (field)) 4859 && TYPE_PRECISION (TREE_TYPE (field)) == BITS_PER_WORD 4860 && host_integerp (bit_position (field), 0) 4861 && int_bit_position (field) % BITS_PER_WORD == 0) 4862 break; 4863 4864 if (field != 0) 4865 { 4866 /* Now handle the special case by returning a PARALLEL 4867 indicating where each 64-bit chunk goes. INFO.REG_WORDS 4868 chunks are passed in registers. */ 4869 unsigned int i; 4870 HOST_WIDE_INT bitpos; 4871 rtx ret; 4872 4873 /* assign_parms checks the mode of ENTRY_PARM, so we must 4874 use the actual mode here. */ 4875 ret = gen_rtx_PARALLEL (mode, rtvec_alloc (info.reg_words)); 4876 4877 bitpos = 0; 4878 field = TYPE_FIELDS (type); 4879 for (i = 0; i < info.reg_words; i++) 4880 { 4881 rtx reg; 4882 4883 for (; field; field = TREE_CHAIN (field)) 4884 if (TREE_CODE (field) == FIELD_DECL 4885 && int_bit_position (field) >= bitpos) 4886 break; 4887 4888 if (field 4889 && int_bit_position (field) == bitpos 4890 && SCALAR_FLOAT_TYPE_P (TREE_TYPE (field)) 4891 && TYPE_PRECISION (TREE_TYPE (field)) == BITS_PER_WORD) 4892 reg = gen_rtx_REG (DFmode, FP_ARG_FIRST + info.reg_offset + i); 4893 else 4894 reg = gen_rtx_REG (DImode, GP_ARG_FIRST + info.reg_offset + i); 4895 4896 XVECEXP (ret, 0, i) 4897 = gen_rtx_EXPR_LIST (VOIDmode, reg, 4898 GEN_INT (bitpos / BITS_PER_UNIT)); 4899 4900 bitpos += BITS_PER_WORD; 4901 } 4902 return ret; 4903 } 4904 } 4905 4906 /* Handle the n32/n64 conventions for passing complex floating-point 4907 arguments in FPR pairs. The real part goes in the lower register 4908 and the imaginary part goes in the upper register. */ 4909 if (TARGET_NEWABI 4910 && info.fpr_p 4911 && GET_MODE_CLASS (mode) == MODE_COMPLEX_FLOAT) 4912 { 4913 rtx real, imag; 4914 enum machine_mode inner; 4915 unsigned int regno; 4916 4917 inner = GET_MODE_INNER (mode); 4918 regno = FP_ARG_FIRST + info.reg_offset; 4919 if (info.reg_words * UNITS_PER_WORD == GET_MODE_SIZE (inner)) 4920 { 4921 /* Real part in registers, imaginary part on stack. */ 4922 gcc_assert (info.stack_words == info.reg_words); 4923 return gen_rtx_REG (inner, regno); 4924 } 4925 else 4926 { 4927 gcc_assert (info.stack_words == 0); 4928 real = gen_rtx_EXPR_LIST (VOIDmode, 4929 gen_rtx_REG (inner, regno), 4930 const0_rtx); 4931 imag = gen_rtx_EXPR_LIST (VOIDmode, 4932 gen_rtx_REG (inner, 4933 regno + info.reg_words / 2), 4934 GEN_INT (GET_MODE_SIZE (inner))); 4935 return gen_rtx_PARALLEL (mode, gen_rtvec (2, real, imag)); 4936 } 4937 } 4938 4939 return gen_rtx_REG (mode, mips_arg_regno (&info, TARGET_HARD_FLOAT)); 4940 } 4941 4942 /* Implement FUNCTION_ARG_ADVANCE. */ 4943 4944 void 4945 mips_function_arg_advance (CUMULATIVE_ARGS *cum, enum machine_mode mode, 4946 tree type, int named) 4947 { 4948 struct mips_arg_info info; 4949 4950 mips_get_arg_info (&info, cum, mode, type, named); 4951 4952 if (!info.fpr_p) 4953 cum->gp_reg_found = true; 4954 4955 /* See the comment above the CUMULATIVE_ARGS structure in mips.h for 4956 an explanation of what this code does. It assumes that we're using 4957 either the o32 or the o64 ABI, both of which pass at most 2 arguments 4958 in FPRs. */ 4959 if (cum->arg_number < 2 && info.fpr_p) 4960 cum->fp_code += (mode == SFmode ? 1 : 2) << (cum->arg_number * 2); 4961 4962 /* Advance the register count. This has the effect of setting 4963 num_gprs to MAX_ARGS_IN_REGISTERS if a doubleword-aligned 4964 argument required us to skip the final GPR and pass the whole 4965 argument on the stack. */ 4966 if (mips_abi != ABI_EABI || !info.fpr_p) 4967 cum->num_gprs = info.reg_offset + info.reg_words; 4968 else if (info.reg_words > 0) 4969 cum->num_fprs += MAX_FPRS_PER_FMT; 4970 4971 /* Advance the stack word count. */ 4972 if (info.stack_words > 0) 4973 cum->stack_words = info.stack_offset + info.stack_words; 4974 4975 cum->arg_number++; 4976 } 4977 4978 /* Implement TARGET_ARG_PARTIAL_BYTES. */ 4979 4980 static int 4981 mips_arg_partial_bytes (CUMULATIVE_ARGS *cum, 4982 enum machine_mode mode, tree type, bool named) 4983 { 4984 struct mips_arg_info info; 4985 4986 mips_get_arg_info (&info, cum, mode, type, named); 4987 return info.stack_words > 0 ? info.reg_words * UNITS_PER_WORD : 0; 4988 } 4989 4990 /* Implement FUNCTION_ARG_BOUNDARY. Every parameter gets at least 4991 PARM_BOUNDARY bits of alignment, but will be given anything up 4992 to STACK_BOUNDARY bits if the type requires it. */ 4993 4994 int 4995 mips_function_arg_boundary (enum machine_mode mode, tree type) 4996 { 4997 unsigned int alignment; 4998 4999 alignment = type ? TYPE_ALIGN (type) : GET_MODE_ALIGNMENT (mode); 5000 if (alignment < PARM_BOUNDARY) 5001 alignment = PARM_BOUNDARY; 5002 if (alignment > STACK_BOUNDARY) 5003 alignment = STACK_BOUNDARY; 5004 return alignment; 5005 } 5006 5007 /* Return true if FUNCTION_ARG_PADDING (MODE, TYPE) should return 5008 upward rather than downward. In other words, return true if the 5009 first byte of the stack slot has useful data, false if the last 5010 byte does. */ 5011 5012 bool 5013 mips_pad_arg_upward (enum machine_mode mode, const_tree type) 5014 { 5015 /* On little-endian targets, the first byte of every stack argument 5016 is passed in the first byte of the stack slot. */ 5017 if (!BYTES_BIG_ENDIAN) 5018 return true; 5019 5020 /* Otherwise, integral types are padded downward: the last byte of a 5021 stack argument is passed in the last byte of the stack slot. */ 5022 if (type != 0 5023 ? (INTEGRAL_TYPE_P (type) 5024 || POINTER_TYPE_P (type) 5025 || FIXED_POINT_TYPE_P (type)) 5026 : (SCALAR_INT_MODE_P (mode) 5027 || ALL_SCALAR_FIXED_POINT_MODE_P (mode))) 5028 return false; 5029 5030 /* Big-endian o64 pads floating-point arguments downward. */ 5031 if (mips_abi == ABI_O64) 5032 if (type != 0 ? FLOAT_TYPE_P (type) : GET_MODE_CLASS (mode) == MODE_FLOAT) 5033 return false; 5034 5035 /* Other types are padded upward for o32, o64, n32 and n64. */ 5036 if (mips_abi != ABI_EABI) 5037 return true; 5038 5039 /* Arguments smaller than a stack slot are padded downward. */ 5040 if (mode != BLKmode) 5041 return GET_MODE_BITSIZE (mode) >= PARM_BOUNDARY; 5042 else 5043 return int_size_in_bytes (type) >= (PARM_BOUNDARY / BITS_PER_UNIT); 5044 } 5045 5046 /* Likewise BLOCK_REG_PADDING (MODE, TYPE, ...). Return !BYTES_BIG_ENDIAN 5047 if the least significant byte of the register has useful data. Return 5048 the opposite if the most significant byte does. */ 5049 5050 bool 5051 mips_pad_reg_upward (enum machine_mode mode, tree type) 5052 { 5053 /* No shifting is required for floating-point arguments. */ 5054 if (type != 0 ? FLOAT_TYPE_P (type) : GET_MODE_CLASS (mode) == MODE_FLOAT) 5055 return !BYTES_BIG_ENDIAN; 5056 5057 /* Otherwise, apply the same padding to register arguments as we do 5058 to stack arguments. */ 5059 return mips_pad_arg_upward (mode, type); 5060 } 5061 5062 /* Return nonzero when an argument must be passed by reference. */ 5063 5064 static bool 5065 mips_pass_by_reference (CUMULATIVE_ARGS *cum ATTRIBUTE_UNUSED, 5066 enum machine_mode mode, const_tree type, 5067 bool named ATTRIBUTE_UNUSED) 5068 { 5069 if (mips_abi == ABI_EABI) 5070 { 5071 int size; 5072 5073 /* ??? How should SCmode be handled? */ 5074 if (mode == DImode || mode == DFmode 5075 || mode == DQmode || mode == UDQmode 5076 || mode == DAmode || mode == UDAmode) 5077 return 0; 5078 5079 size = type ? int_size_in_bytes (type) : GET_MODE_SIZE (mode); 5080 return size == -1 || size > UNITS_PER_WORD; 5081 } 5082 else 5083 { 5084 /* If we have a variable-sized parameter, we have no choice. */ 5085 return targetm.calls.must_pass_in_stack (mode, type); 5086 } 5087 } 5088 5089 /* Implement TARGET_CALLEE_COPIES. */ 5090 5091 static bool 5092 mips_callee_copies (CUMULATIVE_ARGS *cum ATTRIBUTE_UNUSED, 5093 enum machine_mode mode ATTRIBUTE_UNUSED, 5094 const_tree type ATTRIBUTE_UNUSED, bool named) 5095 { 5096 return mips_abi == ABI_EABI && named; 5097 } 5098 5099 /* See whether VALTYPE is a record whose fields should be returned in 5100 floating-point registers. If so, return the number of fields and 5101 list them in FIELDS (which should have two elements). Return 0 5102 otherwise. 5103 5104 For n32 & n64, a structure with one or two fields is returned in 5105 floating-point registers as long as every field has a floating-point 5106 type. */ 5107 5108 static int 5109 mips_fpr_return_fields (const_tree valtype, tree *fields) 5110 { 5111 tree field; 5112 int i; 5113 5114 if (!TARGET_NEWABI) 5115 return 0; 5116 5117 if (TREE_CODE (valtype) != RECORD_TYPE) 5118 return 0; 5119 5120 i = 0; 5121 for (field = TYPE_FIELDS (valtype); field != 0; field = TREE_CHAIN (field)) 5122 { 5123 if (TREE_CODE (field) != FIELD_DECL) 5124 continue; 5125 5126 if (!SCALAR_FLOAT_TYPE_P (TREE_TYPE (field))) 5127 return 0; 5128 5129 if (i == 2) 5130 return 0; 5131 5132 fields[i++] = field; 5133 } 5134 return i; 5135 } 5136 5137 /* Implement TARGET_RETURN_IN_MSB. For n32 & n64, we should return 5138 a value in the most significant part of $2/$3 if: 5139 5140 - the target is big-endian; 5141 5142 - the value has a structure or union type (we generalize this to 5143 cover aggregates from other languages too); and 5144 5145 - the structure is not returned in floating-point registers. */ 5146 5147 static bool 5148 mips_return_in_msb (const_tree valtype) 5149 { 5150 tree fields[2]; 5151 5152 return (TARGET_NEWABI 5153 && TARGET_BIG_ENDIAN 5154 && AGGREGATE_TYPE_P (valtype) 5155 && mips_fpr_return_fields (valtype, fields) == 0); 5156 } 5157 5158 /* Return true if the function return value MODE will get returned in a 5159 floating-point register. */ 5160 5161 static bool 5162 mips_return_mode_in_fpr_p (enum machine_mode mode) 5163 { 5164 return ((GET_MODE_CLASS (mode) == MODE_FLOAT 5165 || GET_MODE_CLASS (mode) == MODE_VECTOR_FLOAT 5166 || GET_MODE_CLASS (mode) == MODE_COMPLEX_FLOAT) 5167 && GET_MODE_UNIT_SIZE (mode) <= UNITS_PER_HWFPVALUE); 5168 } 5169 5170 /* Return the representation of an FPR return register when the 5171 value being returned in FP_RETURN has mode VALUE_MODE and the 5172 return type itself has mode TYPE_MODE. On NewABI targets, 5173 the two modes may be different for structures like: 5174 5175 struct __attribute__((packed)) foo { float f; } 5176 5177 where we return the SFmode value of "f" in FP_RETURN, but where 5178 the structure itself has mode BLKmode. */ 5179 5180 static rtx 5181 mips_return_fpr_single (enum machine_mode type_mode, 5182 enum machine_mode value_mode) 5183 { 5184 rtx x; 5185 5186 x = gen_rtx_REG (value_mode, FP_RETURN); 5187 if (type_mode != value_mode) 5188 { 5189 x = gen_rtx_EXPR_LIST (VOIDmode, x, const0_rtx); 5190 x = gen_rtx_PARALLEL (type_mode, gen_rtvec (1, x)); 5191 } 5192 return x; 5193 } 5194 5195 /* Return a composite value in a pair of floating-point registers. 5196 MODE1 and OFFSET1 are the mode and byte offset for the first value, 5197 likewise MODE2 and OFFSET2 for the second. MODE is the mode of the 5198 complete value. 5199 5200 For n32 & n64, $f0 always holds the first value and $f2 the second. 5201 Otherwise the values are packed together as closely as possible. */ 5202 5203 static rtx 5204 mips_return_fpr_pair (enum machine_mode mode, 5205 enum machine_mode mode1, HOST_WIDE_INT offset1, 5206 enum machine_mode mode2, HOST_WIDE_INT offset2) 5207 { 5208 int inc; 5209 5210 inc = (TARGET_NEWABI ? 2 : MAX_FPRS_PER_FMT); 5211 return gen_rtx_PARALLEL 5212 (mode, 5213 gen_rtvec (2, 5214 gen_rtx_EXPR_LIST (VOIDmode, 5215 gen_rtx_REG (mode1, FP_RETURN), 5216 GEN_INT (offset1)), 5217 gen_rtx_EXPR_LIST (VOIDmode, 5218 gen_rtx_REG (mode2, FP_RETURN + inc), 5219 GEN_INT (offset2)))); 5220 5221 } 5222 5223 /* Implement FUNCTION_VALUE and LIBCALL_VALUE. For normal calls, 5224 VALTYPE is the return type and MODE is VOIDmode. For libcalls, 5225 VALTYPE is null and MODE is the mode of the return value. */ 5226 5227 rtx 5228 mips_function_value (const_tree valtype, const_tree func, enum machine_mode mode) 5229 { 5230 if (valtype) 5231 { 5232 tree fields[2]; 5233 int unsigned_p; 5234 5235 mode = TYPE_MODE (valtype); 5236 unsigned_p = TYPE_UNSIGNED (valtype); 5237 5238 /* Since TARGET_PROMOTE_FUNCTION_MODE unconditionally promotes, 5239 return values, promote the mode here too. */ 5240 mode = promote_function_mode (valtype, mode, &unsigned_p, func, 1); 5241 5242 /* Handle structures whose fields are returned in $f0/$f2. */ 5243 switch (mips_fpr_return_fields (valtype, fields)) 5244 { 5245 case 1: 5246 return mips_return_fpr_single (mode, 5247 TYPE_MODE (TREE_TYPE (fields[0]))); 5248 5249 case 2: 5250 return mips_return_fpr_pair (mode, 5251 TYPE_MODE (TREE_TYPE (fields[0])), 5252 int_byte_position (fields[0]), 5253 TYPE_MODE (TREE_TYPE (fields[1])), 5254 int_byte_position (fields[1])); 5255 } 5256 5257 /* If a value is passed in the most significant part of a register, see 5258 whether we have to round the mode up to a whole number of words. */ 5259 if (mips_return_in_msb (valtype)) 5260 { 5261 HOST_WIDE_INT size = int_size_in_bytes (valtype); 5262 if (size % UNITS_PER_WORD != 0) 5263 { 5264 size += UNITS_PER_WORD - size % UNITS_PER_WORD; 5265 mode = mode_for_size (size * BITS_PER_UNIT, MODE_INT, 0); 5266 } 5267 } 5268 5269 /* For EABI, the class of return register depends entirely on MODE. 5270 For example, "struct { some_type x; }" and "union { some_type x; }" 5271 are returned in the same way as a bare "some_type" would be. 5272 Other ABIs only use FPRs for scalar, complex or vector types. */ 5273 if (mips_abi != ABI_EABI && !FLOAT_TYPE_P (valtype)) 5274 return gen_rtx_REG (mode, GP_RETURN); 5275 } 5276 5277 if (!TARGET_MIPS16) 5278 { 5279 /* Handle long doubles for n32 & n64. */ 5280 if (mode == TFmode) 5281 return mips_return_fpr_pair (mode, 5282 DImode, 0, 5283 DImode, GET_MODE_SIZE (mode) / 2); 5284 5285 if (mips_return_mode_in_fpr_p (mode)) 5286 { 5287 if (GET_MODE_CLASS (mode) == MODE_COMPLEX_FLOAT) 5288 return mips_return_fpr_pair (mode, 5289 GET_MODE_INNER (mode), 0, 5290 GET_MODE_INNER (mode), 5291 GET_MODE_SIZE (mode) / 2); 5292 else 5293 return gen_rtx_REG (mode, FP_RETURN); 5294 } 5295 } 5296 5297 return gen_rtx_REG (mode, GP_RETURN); 5298 } 5299 5300 /* Implement TARGET_RETURN_IN_MEMORY. Under the o32 and o64 ABIs, 5301 all BLKmode objects are returned in memory. Under the n32, n64 5302 and embedded ABIs, small structures are returned in a register. 5303 Objects with varying size must still be returned in memory, of 5304 course. */ 5305 5306 static bool 5307 mips_return_in_memory (const_tree type, const_tree fndecl ATTRIBUTE_UNUSED) 5308 { 5309 return (TARGET_OLDABI 5310 ? TYPE_MODE (type) == BLKmode 5311 : !IN_RANGE (int_size_in_bytes (type), 0, 2 * UNITS_PER_WORD)); 5312 } 5313 5314 /* Implement TARGET_SETUP_INCOMING_VARARGS. */ 5315 5316 static void 5317 mips_setup_incoming_varargs (CUMULATIVE_ARGS *cum, enum machine_mode mode, 5318 tree type, int *pretend_size ATTRIBUTE_UNUSED, 5319 int no_rtl) 5320 { 5321 CUMULATIVE_ARGS local_cum; 5322 int gp_saved, fp_saved; 5323 5324 /* The caller has advanced CUM up to, but not beyond, the last named 5325 argument. Advance a local copy of CUM past the last "real" named 5326 argument, to find out how many registers are left over. */ 5327 local_cum = *cum; 5328 FUNCTION_ARG_ADVANCE (local_cum, mode, type, true); 5329 5330 /* Found out how many registers we need to save. */ 5331 gp_saved = MAX_ARGS_IN_REGISTERS - local_cum.num_gprs; 5332 fp_saved = (EABI_FLOAT_VARARGS_P 5333 ? MAX_ARGS_IN_REGISTERS - local_cum.num_fprs 5334 : 0); 5335 5336 if (!no_rtl) 5337 { 5338 if (gp_saved > 0) 5339 { 5340 rtx ptr, mem; 5341 5342 ptr = plus_constant (virtual_incoming_args_rtx, 5343 REG_PARM_STACK_SPACE (cfun->decl) 5344 - gp_saved * UNITS_PER_WORD); 5345 mem = gen_frame_mem (BLKmode, ptr); 5346 set_mem_alias_set (mem, get_varargs_alias_set ()); 5347 5348 move_block_from_reg (local_cum.num_gprs + GP_ARG_FIRST, 5349 mem, gp_saved); 5350 } 5351 if (fp_saved > 0) 5352 { 5353 /* We can't use move_block_from_reg, because it will use 5354 the wrong mode. */ 5355 enum machine_mode mode; 5356 int off, i; 5357 5358 /* Set OFF to the offset from virtual_incoming_args_rtx of 5359 the first float register. The FP save area lies below 5360 the integer one, and is aligned to UNITS_PER_FPVALUE bytes. */ 5361 off = (-gp_saved * UNITS_PER_WORD) & -UNITS_PER_FPVALUE; 5362 off -= fp_saved * UNITS_PER_FPREG; 5363 5364 mode = TARGET_SINGLE_FLOAT ? SFmode : DFmode; 5365 5366 for (i = local_cum.num_fprs; i < MAX_ARGS_IN_REGISTERS; 5367 i += MAX_FPRS_PER_FMT) 5368 { 5369 rtx ptr, mem; 5370 5371 ptr = plus_constant (virtual_incoming_args_rtx, off); 5372 mem = gen_frame_mem (mode, ptr); 5373 set_mem_alias_set (mem, get_varargs_alias_set ()); 5374 mips_emit_move (mem, gen_rtx_REG (mode, FP_ARG_FIRST + i)); 5375 off += UNITS_PER_HWFPVALUE; 5376 } 5377 } 5378 } 5379 if (REG_PARM_STACK_SPACE (cfun->decl) == 0) 5380 cfun->machine->varargs_size = (gp_saved * UNITS_PER_WORD 5381 + fp_saved * UNITS_PER_FPREG); 5382 } 5383 5384 /* Implement TARGET_BUILTIN_VA_LIST. */ 5385 5386 static tree 5387 mips_build_builtin_va_list (void) 5388 { 5389 if (EABI_FLOAT_VARARGS_P) 5390 { 5391 /* We keep 3 pointers, and two offsets. 5392 5393 Two pointers are to the overflow area, which starts at the CFA. 5394 One of these is constant, for addressing into the GPR save area 5395 below it. The other is advanced up the stack through the 5396 overflow region. 5397 5398 The third pointer is to the bottom of the GPR save area. 5399 Since the FPR save area is just below it, we can address 5400 FPR slots off this pointer. 5401 5402 We also keep two one-byte offsets, which are to be subtracted 5403 from the constant pointers to yield addresses in the GPR and 5404 FPR save areas. These are downcounted as float or non-float 5405 arguments are used, and when they get to zero, the argument 5406 must be obtained from the overflow region. */ 5407 tree f_ovfl, f_gtop, f_ftop, f_goff, f_foff, f_res, record; 5408 tree array, index; 5409 5410 record = lang_hooks.types.make_type (RECORD_TYPE); 5411 5412 f_ovfl = build_decl (BUILTINS_LOCATION, 5413 FIELD_DECL, get_identifier ("__overflow_argptr"), 5414 ptr_type_node); 5415 f_gtop = build_decl (BUILTINS_LOCATION, 5416 FIELD_DECL, get_identifier ("__gpr_top"), 5417 ptr_type_node); 5418 f_ftop = build_decl (BUILTINS_LOCATION, 5419 FIELD_DECL, get_identifier ("__fpr_top"), 5420 ptr_type_node); 5421 f_goff = build_decl (BUILTINS_LOCATION, 5422 FIELD_DECL, get_identifier ("__gpr_offset"), 5423 unsigned_char_type_node); 5424 f_foff = build_decl (BUILTINS_LOCATION, 5425 FIELD_DECL, get_identifier ("__fpr_offset"), 5426 unsigned_char_type_node); 5427 /* Explicitly pad to the size of a pointer, so that -Wpadded won't 5428 warn on every user file. */ 5429 index = build_int_cst (NULL_TREE, GET_MODE_SIZE (ptr_mode) - 2 - 1); 5430 array = build_array_type (unsigned_char_type_node, 5431 build_index_type (index)); 5432 f_res = build_decl (BUILTINS_LOCATION, 5433 FIELD_DECL, get_identifier ("__reserved"), array); 5434 5435 DECL_FIELD_CONTEXT (f_ovfl) = record; 5436 DECL_FIELD_CONTEXT (f_gtop) = record; 5437 DECL_FIELD_CONTEXT (f_ftop) = record; 5438 DECL_FIELD_CONTEXT (f_goff) = record; 5439 DECL_FIELD_CONTEXT (f_foff) = record; 5440 DECL_FIELD_CONTEXT (f_res) = record; 5441 5442 TYPE_FIELDS (record) = f_ovfl; 5443 TREE_CHAIN (f_ovfl) = f_gtop; 5444 TREE_CHAIN (f_gtop) = f_ftop; 5445 TREE_CHAIN (f_ftop) = f_goff; 5446 TREE_CHAIN (f_goff) = f_foff; 5447 TREE_CHAIN (f_foff) = f_res; 5448 5449 layout_type (record); 5450 return record; 5451 } 5452 else if (TARGET_IRIX && TARGET_IRIX6) 5453 /* On IRIX 6, this type is 'char *'. */ 5454 return build_pointer_type (char_type_node); 5455 else 5456 /* Otherwise, we use 'void *'. */ 5457 return ptr_type_node; 5458 } 5459 5460 /* Implement TARGET_EXPAND_BUILTIN_VA_START. */ 5461 5462 static void 5463 mips_va_start (tree valist, rtx nextarg) 5464 { 5465 if (EABI_FLOAT_VARARGS_P) 5466 { 5467 const CUMULATIVE_ARGS *cum; 5468 tree f_ovfl, f_gtop, f_ftop, f_goff, f_foff; 5469 tree ovfl, gtop, ftop, goff, foff; 5470 tree t; 5471 int gpr_save_area_size; 5472 int fpr_save_area_size; 5473 int fpr_offset; 5474 5475 cum = &crtl->args.info; 5476 gpr_save_area_size 5477 = (MAX_ARGS_IN_REGISTERS - cum->num_gprs) * UNITS_PER_WORD; 5478 fpr_save_area_size 5479 = (MAX_ARGS_IN_REGISTERS - cum->num_fprs) * UNITS_PER_FPREG; 5480 5481 f_ovfl = TYPE_FIELDS (va_list_type_node); 5482 f_gtop = TREE_CHAIN (f_ovfl); 5483 f_ftop = TREE_CHAIN (f_gtop); 5484 f_goff = TREE_CHAIN (f_ftop); 5485 f_foff = TREE_CHAIN (f_goff); 5486 5487 ovfl = build3 (COMPONENT_REF, TREE_TYPE (f_ovfl), valist, f_ovfl, 5488 NULL_TREE); 5489 gtop = build3 (COMPONENT_REF, TREE_TYPE (f_gtop), valist, f_gtop, 5490 NULL_TREE); 5491 ftop = build3 (COMPONENT_REF, TREE_TYPE (f_ftop), valist, f_ftop, 5492 NULL_TREE); 5493 goff = build3 (COMPONENT_REF, TREE_TYPE (f_goff), valist, f_goff, 5494 NULL_TREE); 5495 foff = build3 (COMPONENT_REF, TREE_TYPE (f_foff), valist, f_foff, 5496 NULL_TREE); 5497 5498 /* Emit code to initialize OVFL, which points to the next varargs 5499 stack argument. CUM->STACK_WORDS gives the number of stack 5500 words used by named arguments. */ 5501 t = make_tree (TREE_TYPE (ovfl), virtual_incoming_args_rtx); 5502 if (cum->stack_words > 0) 5503 t = build2 (POINTER_PLUS_EXPR, TREE_TYPE (ovfl), t, 5504 size_int (cum->stack_words * UNITS_PER_WORD)); 5505 t = build2 (MODIFY_EXPR, TREE_TYPE (ovfl), ovfl, t); 5506 expand_expr (t, const0_rtx, VOIDmode, EXPAND_NORMAL); 5507 5508 /* Emit code to initialize GTOP, the top of the GPR save area. */ 5509 t = make_tree (TREE_TYPE (gtop), virtual_incoming_args_rtx); 5510 t = build2 (MODIFY_EXPR, TREE_TYPE (gtop), gtop, t); 5511 expand_expr (t, const0_rtx, VOIDmode, EXPAND_NORMAL); 5512 5513 /* Emit code to initialize FTOP, the top of the FPR save area. 5514 This address is gpr_save_area_bytes below GTOP, rounded 5515 down to the next fp-aligned boundary. */ 5516 t = make_tree (TREE_TYPE (ftop), virtual_incoming_args_rtx); 5517 fpr_offset = gpr_save_area_size + UNITS_PER_FPVALUE - 1; 5518 fpr_offset &= -UNITS_PER_FPVALUE; 5519 if (fpr_offset) 5520 t = build2 (POINTER_PLUS_EXPR, TREE_TYPE (ftop), t, 5521 size_int (-fpr_offset)); 5522 t = build2 (MODIFY_EXPR, TREE_TYPE (ftop), ftop, t); 5523 expand_expr (t, const0_rtx, VOIDmode, EXPAND_NORMAL); 5524 5525 /* Emit code to initialize GOFF, the offset from GTOP of the 5526 next GPR argument. */ 5527 t = build2 (MODIFY_EXPR, TREE_TYPE (goff), goff, 5528 build_int_cst (TREE_TYPE (goff), gpr_save_area_size)); 5529 expand_expr (t, const0_rtx, VOIDmode, EXPAND_NORMAL); 5530 5531 /* Likewise emit code to initialize FOFF, the offset from FTOP 5532 of the next FPR argument. */ 5533 t = build2 (MODIFY_EXPR, TREE_TYPE (foff), foff, 5534 build_int_cst (TREE_TYPE (foff), fpr_save_area_size)); 5535 expand_expr (t, const0_rtx, VOIDmode, EXPAND_NORMAL); 5536 } 5537 else 5538 { 5539 nextarg = plus_constant (nextarg, -cfun->machine->varargs_size); 5540 std_expand_builtin_va_start (valist, nextarg); 5541 } 5542 } 5543 5544 /* Implement TARGET_GIMPLIFY_VA_ARG_EXPR. */ 5545 5546 static tree 5547 mips_gimplify_va_arg_expr (tree valist, tree type, gimple_seq *pre_p, 5548 gimple_seq *post_p) 5549 { 5550 tree addr; 5551 bool indirect_p; 5552 5553 indirect_p = pass_by_reference (NULL, TYPE_MODE (type), type, 0); 5554 if (indirect_p) 5555 type = build_pointer_type (type); 5556 5557 if (!EABI_FLOAT_VARARGS_P) 5558 addr = std_gimplify_va_arg_expr (valist, type, pre_p, post_p); 5559 else 5560 { 5561 tree f_ovfl, f_gtop, f_ftop, f_goff, f_foff; 5562 tree ovfl, top, off, align; 5563 HOST_WIDE_INT size, rsize, osize; 5564 tree t, u; 5565 5566 f_ovfl = TYPE_FIELDS (va_list_type_node); 5567 f_gtop = TREE_CHAIN (f_ovfl); 5568 f_ftop = TREE_CHAIN (f_gtop); 5569 f_goff = TREE_CHAIN (f_ftop); 5570 f_foff = TREE_CHAIN (f_goff); 5571 5572 /* Let: 5573 5574 TOP be the top of the GPR or FPR save area; 5575 OFF be the offset from TOP of the next register; 5576 ADDR_RTX be the address of the argument; 5577 SIZE be the number of bytes in the argument type; 5578 RSIZE be the number of bytes used to store the argument 5579 when it's in the register save area; and 5580 OSIZE be the number of bytes used to store it when it's 5581 in the stack overflow area. 5582 5583 The code we want is: 5584 5585 1: off &= -rsize; // round down 5586 2: if (off != 0) 5587 3: { 5588 4: addr_rtx = top - off + (BYTES_BIG_ENDIAN ? RSIZE - SIZE : 0); 5589 5: off -= rsize; 5590 6: } 5591 7: else 5592 8: { 5593 9: ovfl = ((intptr_t) ovfl + osize - 1) & -osize; 5594 10: addr_rtx = ovfl + (BYTES_BIG_ENDIAN ? OSIZE - SIZE : 0); 5595 11: ovfl += osize; 5596 14: } 5597 5598 [1] and [9] can sometimes be optimized away. */ 5599 5600 ovfl = build3 (COMPONENT_REF, TREE_TYPE (f_ovfl), valist, f_ovfl, 5601 NULL_TREE); 5602 size = int_size_in_bytes (type); 5603 5604 if (GET_MODE_CLASS (TYPE_MODE (type)) == MODE_FLOAT 5605 && GET_MODE_SIZE (TYPE_MODE (type)) <= UNITS_PER_FPVALUE) 5606 { 5607 top = build3 (COMPONENT_REF, TREE_TYPE (f_ftop), 5608 unshare_expr (valist), f_ftop, NULL_TREE); 5609 off = build3 (COMPONENT_REF, TREE_TYPE (f_foff), 5610 unshare_expr (valist), f_foff, NULL_TREE); 5611 5612 /* When va_start saves FPR arguments to the stack, each slot 5613 takes up UNITS_PER_HWFPVALUE bytes, regardless of the 5614 argument's precision. */ 5615 rsize = UNITS_PER_HWFPVALUE; 5616 5617 /* Overflow arguments are padded to UNITS_PER_WORD bytes 5618 (= PARM_BOUNDARY bits). This can be different from RSIZE 5619 in two cases: 5620 5621 (1) On 32-bit targets when TYPE is a structure such as: 5622 5623 struct s { float f; }; 5624 5625 Such structures are passed in paired FPRs, so RSIZE 5626 will be 8 bytes. However, the structure only takes 5627 up 4 bytes of memory, so OSIZE will only be 4. 5628 5629 (2) In combinations such as -mgp64 -msingle-float 5630 -fshort-double. Doubles passed in registers will then take 5631 up 4 (UNITS_PER_HWFPVALUE) bytes, but those passed on the 5632 stack take up UNITS_PER_WORD bytes. */ 5633 osize = MAX (GET_MODE_SIZE (TYPE_MODE (type)), UNITS_PER_WORD); 5634 } 5635 else 5636 { 5637 top = build3 (COMPONENT_REF, TREE_TYPE (f_gtop), 5638 unshare_expr (valist), f_gtop, NULL_TREE); 5639 off = build3 (COMPONENT_REF, TREE_TYPE (f_goff), 5640 unshare_expr (valist), f_goff, NULL_TREE); 5641 rsize = (size + UNITS_PER_WORD - 1) & -UNITS_PER_WORD; 5642 if (rsize > UNITS_PER_WORD) 5643 { 5644 /* [1] Emit code for: off &= -rsize. */ 5645 t = build2 (BIT_AND_EXPR, TREE_TYPE (off), unshare_expr (off), 5646 build_int_cst (TREE_TYPE (off), -rsize)); 5647 gimplify_assign (unshare_expr (off), t, pre_p); 5648 } 5649 osize = rsize; 5650 } 5651 5652 /* [2] Emit code to branch if off == 0. */ 5653 t = build2 (NE_EXPR, boolean_type_node, off, 5654 build_int_cst (TREE_TYPE (off), 0)); 5655 addr = build3 (COND_EXPR, ptr_type_node, t, NULL_TREE, NULL_TREE); 5656 5657 /* [5] Emit code for: off -= rsize. We do this as a form of 5658 post-decrement not available to C. */ 5659 t = fold_convert (TREE_TYPE (off), build_int_cst (NULL_TREE, rsize)); 5660 t = build2 (POSTDECREMENT_EXPR, TREE_TYPE (off), off, t); 5661 5662 /* [4] Emit code for: 5663 addr_rtx = top - off + (BYTES_BIG_ENDIAN ? RSIZE - SIZE : 0). */ 5664 t = fold_convert (sizetype, t); 5665 t = fold_build1 (NEGATE_EXPR, sizetype, t); 5666 t = build2 (POINTER_PLUS_EXPR, TREE_TYPE (top), top, t); 5667 if (BYTES_BIG_ENDIAN && rsize > size) 5668 { 5669 u = size_int (rsize - size); 5670 t = build2 (POINTER_PLUS_EXPR, TREE_TYPE (t), t, u); 5671 } 5672 COND_EXPR_THEN (addr) = t; 5673 5674 if (osize > UNITS_PER_WORD) 5675 { 5676 /* [9] Emit: ovfl = ((intptr_t) ovfl + osize - 1) & -osize. */ 5677 u = size_int (osize - 1); 5678 t = build2 (POINTER_PLUS_EXPR, TREE_TYPE (ovfl), 5679 unshare_expr (ovfl), u); 5680 t = fold_convert (sizetype, t); 5681 u = size_int (-osize); 5682 t = build2 (BIT_AND_EXPR, sizetype, t, u); 5683 t = fold_convert (TREE_TYPE (ovfl), t); 5684 align = build2 (MODIFY_EXPR, TREE_TYPE (ovfl), 5685 unshare_expr (ovfl), t); 5686 } 5687 else 5688 align = NULL; 5689 5690 /* [10, 11] Emit code for: 5691 addr_rtx = ovfl + (BYTES_BIG_ENDIAN ? OSIZE - SIZE : 0) 5692 ovfl += osize. */ 5693 u = fold_convert (TREE_TYPE (ovfl), build_int_cst (NULL_TREE, osize)); 5694 t = build2 (POSTINCREMENT_EXPR, TREE_TYPE (ovfl), ovfl, u); 5695 if (BYTES_BIG_ENDIAN && osize > size) 5696 { 5697 u = size_int (osize - size); 5698 t = build2 (POINTER_PLUS_EXPR, TREE_TYPE (t), t, u); 5699 } 5700 5701 /* String [9] and [10, 11] together. */ 5702 if (align) 5703 t = build2 (COMPOUND_EXPR, TREE_TYPE (t), align, t); 5704 COND_EXPR_ELSE (addr) = t; 5705 5706 addr = fold_convert (build_pointer_type (type), addr); 5707 addr = build_va_arg_indirect_ref (addr); 5708 } 5709 5710 if (indirect_p) 5711 addr = build_va_arg_indirect_ref (addr); 5712 5713 return addr; 5714 } 5715 5716 /* Start a definition of function NAME. MIPS16_P indicates whether the 5717 function contains MIPS16 code. */ 5718 5719 static void 5720 mips_start_function_definition (const char *name, bool mips16_p) 5721 { 5722 if (mips16_p) 5723 fprintf (asm_out_file, "\t.set\tmips16\n"); 5724 else 5725 fprintf (asm_out_file, "\t.set\tnomips16\n"); 5726 5727 if (!flag_inhibit_size_directive) 5728 { 5729 fputs ("\t.ent\t", asm_out_file); 5730 assemble_name (asm_out_file, name); 5731 fputs ("\n", asm_out_file); 5732 } 5733 5734 ASM_OUTPUT_TYPE_DIRECTIVE (asm_out_file, name, "function"); 5735 5736 /* Start the definition proper. */ 5737 assemble_name (asm_out_file, name); 5738 fputs (":\n", asm_out_file); 5739 } 5740 5741 /* End a function definition started by mips_start_function_definition. */ 5742 5743 static void 5744 mips_end_function_definition (const char *name) 5745 { 5746 if (!flag_inhibit_size_directive) 5747 { 5748 fputs ("\t.end\t", asm_out_file); 5749 assemble_name (asm_out_file, name); 5750 fputs ("\n", asm_out_file); 5751 } 5752 } 5753 5754 /* Return true if calls to X can use R_MIPS_CALL* relocations. */ 5755 5756 static bool 5757 mips_ok_for_lazy_binding_p (rtx x) 5758 { 5759 return (TARGET_USE_GOT 5760 && GET_CODE (x) == SYMBOL_REF 5761 && !SYMBOL_REF_BIND_NOW_P (x) 5762 && !mips_symbol_binds_local_p (x)); 5763 } 5764 5765 /* Load function address ADDR into register DEST. TYPE is as for 5766 mips_expand_call. Return true if we used an explicit lazy-binding 5767 sequence. */ 5768 5769 static bool 5770 mips_load_call_address (enum mips_call_type type, rtx dest, rtx addr) 5771 { 5772 /* If we're generating PIC, and this call is to a global function, 5773 try to allow its address to be resolved lazily. This isn't 5774 possible for sibcalls when $gp is call-saved because the value 5775 of $gp on entry to the stub would be our caller's gp, not ours. */ 5776 if (TARGET_EXPLICIT_RELOCS 5777 && !(type == MIPS_CALL_SIBCALL && TARGET_CALL_SAVED_GP) 5778 && mips_ok_for_lazy_binding_p (addr)) 5779 { 5780 addr = mips_got_load (dest, addr, SYMBOL_GOTOFF_CALL); 5781 emit_insn (gen_rtx_SET (VOIDmode, dest, addr)); 5782 return true; 5783 } 5784 else 5785 { 5786 mips_emit_move (dest, addr); 5787 return false; 5788 } 5789 } 5790 5791 /* Each locally-defined hard-float MIPS16 function has a local symbol 5792 associated with it. This hash table maps the function symbol (FUNC) 5793 to the local symbol (LOCAL). */ 5794 struct GTY(()) mips16_local_alias { 5795 rtx func; 5796 rtx local; 5797 }; 5798 static GTY ((param_is (struct mips16_local_alias))) htab_t mips16_local_aliases; 5799 5800 /* Hash table callbacks for mips16_local_aliases. */ 5801 5802 static hashval_t 5803 mips16_local_aliases_hash (const void *entry) 5804 { 5805 const struct mips16_local_alias *alias; 5806 5807 alias = (const struct mips16_local_alias *) entry; 5808 return htab_hash_string (XSTR (alias->func, 0)); 5809 } 5810 5811 static int 5812 mips16_local_aliases_eq (const void *entry1, const void *entry2) 5813 { 5814 const struct mips16_local_alias *alias1, *alias2; 5815 5816 alias1 = (const struct mips16_local_alias *) entry1; 5817 alias2 = (const struct mips16_local_alias *) entry2; 5818 return rtx_equal_p (alias1->func, alias2->func); 5819 } 5820 5821 /* FUNC is the symbol for a locally-defined hard-float MIPS16 function. 5822 Return a local alias for it, creating a new one if necessary. */ 5823 5824 static rtx 5825 mips16_local_alias (rtx func) 5826 { 5827 struct mips16_local_alias *alias, tmp_alias; 5828 void **slot; 5829 5830 /* Create the hash table if this is the first call. */ 5831 if (mips16_local_aliases == NULL) 5832 mips16_local_aliases = htab_create_ggc (37, mips16_local_aliases_hash, 5833 mips16_local_aliases_eq, NULL); 5834 5835 /* Look up the function symbol, creating a new entry if need be. */ 5836 tmp_alias.func = func; 5837 slot = htab_find_slot (mips16_local_aliases, &tmp_alias, INSERT); 5838 gcc_assert (slot != NULL); 5839 5840 alias = (struct mips16_local_alias *) *slot; 5841 if (alias == NULL) 5842 { 5843 const char *func_name, *local_name; 5844 rtx local; 5845 5846 /* Create a new SYMBOL_REF for the local symbol. The choice of 5847 __fn_local_* is based on the __fn_stub_* names that we've 5848 traditionally used for the non-MIPS16 stub. */ 5849 func_name = targetm.strip_name_encoding (XSTR (func, 0)); 5850 local_name = ACONCAT (("__fn_local_", func_name, NULL)); 5851 local = gen_rtx_SYMBOL_REF (Pmode, ggc_strdup (local_name)); 5852 SYMBOL_REF_FLAGS (local) = SYMBOL_REF_FLAGS (func) | SYMBOL_FLAG_LOCAL; 5853 5854 /* Create a new structure to represent the mapping. */ 5855 alias = GGC_NEW (struct mips16_local_alias); 5856 alias->func = func; 5857 alias->local = local; 5858 *slot = alias; 5859 } 5860 return alias->local; 5861 } 5862 5863 /* A chained list of functions for which mips16_build_call_stub has already 5864 generated a stub. NAME is the name of the function and FP_RET_P is true 5865 if the function returns a value in floating-point registers. */ 5866 struct mips16_stub { 5867 struct mips16_stub *next; 5868 char *name; 5869 bool fp_ret_p; 5870 }; 5871 static struct mips16_stub *mips16_stubs; 5872 5873 /* Return a SYMBOL_REF for a MIPS16 function called NAME. */ 5874 5875 static rtx 5876 mips16_stub_function (const char *name) 5877 { 5878 rtx x; 5879 5880 x = gen_rtx_SYMBOL_REF (Pmode, ggc_strdup (name)); 5881 SYMBOL_REF_FLAGS (x) |= (SYMBOL_FLAG_EXTERNAL | SYMBOL_FLAG_FUNCTION); 5882 return x; 5883 } 5884 5885 /* Return the two-character string that identifies floating-point 5886 return mode MODE in the name of a MIPS16 function stub. */ 5887 5888 static const char * 5889 mips16_call_stub_mode_suffix (enum machine_mode mode) 5890 { 5891 if (mode == SFmode) 5892 return "sf"; 5893 else if (mode == DFmode) 5894 return "df"; 5895 else if (mode == SCmode) 5896 return "sc"; 5897 else if (mode == DCmode) 5898 return "dc"; 5899 else if (mode == V2SFmode) 5900 return "df"; 5901 else 5902 gcc_unreachable (); 5903 } 5904 5905 /* Write instructions to move a 32-bit value between general register 5906 GPREG and floating-point register FPREG. DIRECTION is 't' to move 5907 from GPREG to FPREG and 'f' to move in the opposite direction. */ 5908 5909 static void 5910 mips_output_32bit_xfer (char direction, unsigned int gpreg, unsigned int fpreg) 5911 { 5912 fprintf (asm_out_file, "\tm%cc1\t%s,%s\n", direction, 5913 reg_names[gpreg], reg_names[fpreg]); 5914 } 5915 5916 /* Likewise for 64-bit values. */ 5917 5918 static void 5919 mips_output_64bit_xfer (char direction, unsigned int gpreg, unsigned int fpreg) 5920 { 5921 if (TARGET_64BIT) 5922 fprintf (asm_out_file, "\tdm%cc1\t%s,%s\n", direction, 5923 reg_names[gpreg], reg_names[fpreg]); 5924 else if (TARGET_FLOAT64) 5925 { 5926 fprintf (asm_out_file, "\tm%cc1\t%s,%s\n", direction, 5927 reg_names[gpreg + TARGET_BIG_ENDIAN], reg_names[fpreg]); 5928 fprintf (asm_out_file, "\tm%chc1\t%s,%s\n", direction, 5929 reg_names[gpreg + TARGET_LITTLE_ENDIAN], reg_names[fpreg]); 5930 } 5931 else 5932 { 5933 /* Move the least-significant word. */ 5934 fprintf (asm_out_file, "\tm%cc1\t%s,%s\n", direction, 5935 reg_names[gpreg + TARGET_BIG_ENDIAN], reg_names[fpreg]); 5936 /* ...then the most significant word. */ 5937 fprintf (asm_out_file, "\tm%cc1\t%s,%s\n", direction, 5938 reg_names[gpreg + TARGET_LITTLE_ENDIAN], reg_names[fpreg + 1]); 5939 } 5940 } 5941 5942 /* Write out code to move floating-point arguments into or out of 5943 general registers. FP_CODE is the code describing which arguments 5944 are present (see the comment above the definition of CUMULATIVE_ARGS 5945 in mips.h). DIRECTION is as for mips_output_32bit_xfer. */ 5946 5947 static void 5948 mips_output_args_xfer (int fp_code, char direction) 5949 { 5950 unsigned int gparg, fparg, f; 5951 CUMULATIVE_ARGS cum; 5952 5953 /* This code only works for o32 and o64. */ 5954 gcc_assert (TARGET_OLDABI); 5955 5956 mips_init_cumulative_args (&cum, NULL); 5957 5958 for (f = (unsigned int) fp_code; f != 0; f >>= 2) 5959 { 5960 enum machine_mode mode; 5961 struct mips_arg_info info; 5962 5963 if ((f & 3) == 1) 5964 mode = SFmode; 5965 else if ((f & 3) == 2) 5966 mode = DFmode; 5967 else 5968 gcc_unreachable (); 5969 5970 mips_get_arg_info (&info, &cum, mode, NULL, true); 5971 gparg = mips_arg_regno (&info, false); 5972 fparg = mips_arg_regno (&info, true); 5973 5974 if (mode == SFmode) 5975 mips_output_32bit_xfer (direction, gparg, fparg); 5976 else 5977 mips_output_64bit_xfer (direction, gparg, fparg); 5978 5979 mips_function_arg_advance (&cum, mode, NULL, true); 5980 } 5981 } 5982 5983 /* Write a MIPS16 stub for the current function. This stub is used 5984 for functions which take arguments in the floating-point registers. 5985 It is normal-mode code that moves the floating-point arguments 5986 into the general registers and then jumps to the MIPS16 code. */ 5987 5988 static void 5989 mips16_build_function_stub (void) 5990 { 5991 const char *fnname, *alias_name, *separator; 5992 char *secname, *stubname; 5993 tree stubdecl; 5994 unsigned int f; 5995 rtx symbol, alias; 5996 5997 /* Create the name of the stub, and its unique section. */ 5998 symbol = XEXP (DECL_RTL (current_function_decl), 0); 5999 alias = mips16_local_alias (symbol); 6000 6001 fnname = targetm.strip_name_encoding (XSTR (symbol, 0)); 6002 alias_name = targetm.strip_name_encoding (XSTR (alias, 0)); 6003 secname = ACONCAT ((".mips16.fn.", fnname, NULL)); 6004 stubname = ACONCAT (("__fn_stub_", fnname, NULL)); 6005 6006 /* Build a decl for the stub. */ 6007 stubdecl = build_decl (BUILTINS_LOCATION, 6008 FUNCTION_DECL, get_identifier (stubname), 6009 build_function_type (void_type_node, NULL_TREE)); 6010 DECL_SECTION_NAME (stubdecl) = build_string (strlen (secname), secname); 6011 DECL_RESULT (stubdecl) = build_decl (BUILTINS_LOCATION, 6012 RESULT_DECL, NULL_TREE, void_type_node); 6013 6014 /* Output a comment. */ 6015 fprintf (asm_out_file, "\t# Stub function for %s (", 6016 current_function_name ()); 6017 separator = ""; 6018 for (f = (unsigned int) crtl->args.info.fp_code; f != 0; f >>= 2) 6019 { 6020 fprintf (asm_out_file, "%s%s", separator, 6021 (f & 3) == 1 ? "float" : "double"); 6022 separator = ", "; 6023 } 6024 fprintf (asm_out_file, ")\n"); 6025 6026 /* Start the function definition. */ 6027 assemble_start_function (stubdecl, stubname); 6028 mips_start_function_definition (stubname, false); 6029 6030 /* If generating pic2 code, either set up the global pointer or 6031 switch to pic0. */ 6032 if (TARGET_ABICALLS_PIC2) 6033 { 6034 if (TARGET_ABSOLUTE_ABICALLS) 6035 fprintf (asm_out_file, "\t.option\tpic0\n"); 6036 else 6037 { 6038 output_asm_insn ("%(.cpload\t%^%)", NULL); 6039 /* Emit an R_MIPS_NONE relocation to tell the linker what the 6040 target function is. Use a local GOT access when loading the 6041 symbol, to cut down on the number of unnecessary GOT entries 6042 for stubs that aren't needed. */ 6043 output_asm_insn (".reloc\t0,R_MIPS_NONE,%0", &symbol); 6044 symbol = alias; 6045 } 6046 } 6047 6048 /* Load the address of the MIPS16 function into $25. Do this first so 6049 that targets with coprocessor interlocks can use an MFC1 to fill the 6050 delay slot. */ 6051 output_asm_insn ("la\t%^,%0", &symbol); 6052 6053 /* Move the arguments from floating-point registers to general registers. */ 6054 mips_output_args_xfer (crtl->args.info.fp_code, 'f'); 6055 6056 /* Jump to the MIPS16 function. */ 6057 output_asm_insn ("jr\t%^", NULL); 6058 6059 if (TARGET_ABICALLS_PIC2 && TARGET_ABSOLUTE_ABICALLS) 6060 fprintf (asm_out_file, "\t.option\tpic2\n"); 6061 6062 mips_end_function_definition (stubname); 6063 6064 /* If the linker needs to create a dynamic symbol for the target 6065 function, it will associate the symbol with the stub (which, 6066 unlike the target function, follows the proper calling conventions). 6067 It is therefore useful to have a local alias for the target function, 6068 so that it can still be identified as MIPS16 code. As an optimization, 6069 this symbol can also be used for indirect MIPS16 references from 6070 within this file. */ 6071 ASM_OUTPUT_DEF (asm_out_file, alias_name, fnname); 6072 6073 switch_to_section (function_section (current_function_decl)); 6074 } 6075 6076 /* The current function is a MIPS16 function that returns a value in an FPR. 6077 Copy the return value from its soft-float to its hard-float location. 6078 libgcc2 has special non-MIPS16 helper functions for each case. */ 6079 6080 static void 6081 mips16_copy_fpr_return_value (void) 6082 { 6083 rtx fn, insn, retval; 6084 tree return_type; 6085 enum machine_mode return_mode; 6086 const char *name; 6087 6088 return_type = DECL_RESULT (current_function_decl); 6089 return_mode = DECL_MODE (return_type); 6090 6091 name = ACONCAT (("__mips16_ret_", 6092 mips16_call_stub_mode_suffix (return_mode), 6093 NULL)); 6094 fn = mips16_stub_function (name); 6095 6096 /* The function takes arguments in $2 (and possibly $3), so calls 6097 to it cannot be lazily bound. */ 6098 SYMBOL_REF_FLAGS (fn) |= SYMBOL_FLAG_BIND_NOW; 6099 6100 /* Model the call as something that takes the GPR return value as 6101 argument and returns an "updated" value. */ 6102 retval = gen_rtx_REG (return_mode, GP_RETURN); 6103 insn = mips_expand_call (MIPS_CALL_EPILOGUE, retval, fn, 6104 const0_rtx, NULL_RTX, false); 6105 use_reg (&CALL_INSN_FUNCTION_USAGE (insn), retval); 6106 } 6107 6108 /* Consider building a stub for a MIPS16 call to function *FN_PTR. 6109 RETVAL is the location of the return value, or null if this is 6110 a "call" rather than a "call_value". ARGS_SIZE is the size of the 6111 arguments and FP_CODE is the code built by mips_function_arg; 6112 see the comment before the fp_code field in CUMULATIVE_ARGS for details. 6113 6114 There are three alternatives: 6115 6116 - If a stub was needed, emit the call and return the call insn itself. 6117 6118 - If we can avoid using a stub by redirecting the call, set *FN_PTR 6119 to the new target and return null. 6120 6121 - If *FN_PTR doesn't need a stub, return null and leave *FN_PTR 6122 unmodified. 6123 6124 A stub is needed for calls to functions that, in normal mode, 6125 receive arguments in FPRs or return values in FPRs. The stub 6126 copies the arguments from their soft-float positions to their 6127 hard-float positions, calls the real function, then copies the 6128 return value from its hard-float position to its soft-float 6129 position. 6130 6131 We can emit a JAL to *FN_PTR even when *FN_PTR might need a stub. 6132 If *FN_PTR turns out to be to a non-MIPS16 function, the linker 6133 automatically redirects the JAL to the stub, otherwise the JAL 6134 continues to call FN directly. */ 6135 6136 static rtx 6137 mips16_build_call_stub (rtx retval, rtx *fn_ptr, rtx args_size, int fp_code) 6138 { 6139 const char *fnname; 6140 bool fp_ret_p; 6141 struct mips16_stub *l; 6142 rtx insn, fn; 6143 6144 /* We don't need to do anything if we aren't in MIPS16 mode, or if 6145 we were invoked with the -msoft-float option. */ 6146 if (!TARGET_MIPS16 || TARGET_SOFT_FLOAT_ABI) 6147 return NULL_RTX; 6148 6149 /* Figure out whether the value might come back in a floating-point 6150 register. */ 6151 fp_ret_p = retval && mips_return_mode_in_fpr_p (GET_MODE (retval)); 6152 6153 /* We don't need to do anything if there were no floating-point 6154 arguments and the value will not be returned in a floating-point 6155 register. */ 6156 if (fp_code == 0 && !fp_ret_p) 6157 return NULL_RTX; 6158 6159 /* We don't need to do anything if this is a call to a special 6160 MIPS16 support function. */ 6161 fn = *fn_ptr; 6162 if (mips16_stub_function_p (fn)) 6163 return NULL_RTX; 6164 6165 /* This code will only work for o32 and o64 abis. The other ABI's 6166 require more sophisticated support. */ 6167 gcc_assert (TARGET_OLDABI); 6168 6169 /* If we're calling via a function pointer, use one of the magic 6170 libgcc.a stubs provided for each (FP_CODE, FP_RET_P) combination. 6171 Each stub expects the function address to arrive in register $2. */ 6172 if (GET_CODE (fn) != SYMBOL_REF 6173 || !call_insn_operand (fn, VOIDmode)) 6174 { 6175 char buf[30]; 6176 rtx stub_fn, insn, addr; 6177 bool lazy_p; 6178 6179 /* If this is a locally-defined and locally-binding function, 6180 avoid the stub by calling the local alias directly. */ 6181 if (mips16_local_function_p (fn)) 6182 { 6183 *fn_ptr = mips16_local_alias (fn); 6184 return NULL_RTX; 6185 } 6186 6187 /* Create a SYMBOL_REF for the libgcc.a function. */ 6188 if (fp_ret_p) 6189 sprintf (buf, "__mips16_call_stub_%s_%d", 6190 mips16_call_stub_mode_suffix (GET_MODE (retval)), 6191 fp_code); 6192 else 6193 sprintf (buf, "__mips16_call_stub_%d", fp_code); 6194 stub_fn = mips16_stub_function (buf); 6195 6196 /* The function uses $2 as an argument, so calls to it 6197 cannot be lazily bound. */ 6198 SYMBOL_REF_FLAGS (stub_fn) |= SYMBOL_FLAG_BIND_NOW; 6199 6200 /* Load the target function into $2. */ 6201 addr = gen_rtx_REG (Pmode, GP_REG_FIRST + 2); 6202 lazy_p = mips_load_call_address (MIPS_CALL_NORMAL, addr, fn); 6203 6204 /* Emit the call. */ 6205 insn = mips_expand_call (MIPS_CALL_NORMAL, retval, stub_fn, 6206 args_size, NULL_RTX, lazy_p); 6207 6208 /* Tell GCC that this call does indeed use the value of $2. */ 6209 use_reg (&CALL_INSN_FUNCTION_USAGE (insn), addr); 6210 6211 /* If we are handling a floating-point return value, we need to 6212 save $18 in the function prologue. Putting a note on the 6213 call will mean that df_regs_ever_live_p ($18) will be true if the 6214 call is not eliminated, and we can check that in the prologue 6215 code. */ 6216 if (fp_ret_p) 6217 CALL_INSN_FUNCTION_USAGE (insn) = 6218 gen_rtx_EXPR_LIST (VOIDmode, 6219 gen_rtx_CLOBBER (VOIDmode, 6220 gen_rtx_REG (word_mode, 18)), 6221 CALL_INSN_FUNCTION_USAGE (insn)); 6222 6223 return insn; 6224 } 6225 6226 /* We know the function we are going to call. If we have already 6227 built a stub, we don't need to do anything further. */ 6228 fnname = targetm.strip_name_encoding (XSTR (fn, 0)); 6229 for (l = mips16_stubs; l != NULL; l = l->next) 6230 if (strcmp (l->name, fnname) == 0) 6231 break; 6232 6233 if (l == NULL) 6234 { 6235 const char *separator; 6236 char *secname, *stubname; 6237 tree stubid, stubdecl; 6238 unsigned int f; 6239 6240 /* If the function does not return in FPRs, the special stub 6241 section is named 6242 .mips16.call.FNNAME 6243 6244 If the function does return in FPRs, the stub section is named 6245 .mips16.call.fp.FNNAME 6246 6247 Build a decl for the stub. */ 6248 secname = ACONCAT ((".mips16.call.", fp_ret_p ? "fp." : "", 6249 fnname, NULL)); 6250 stubname = ACONCAT (("__call_stub_", fp_ret_p ? "fp_" : "", 6251 fnname, NULL)); 6252 stubid = get_identifier (stubname); 6253 stubdecl = build_decl (BUILTINS_LOCATION, 6254 FUNCTION_DECL, stubid, 6255 build_function_type (void_type_node, NULL_TREE)); 6256 DECL_SECTION_NAME (stubdecl) = build_string (strlen (secname), secname); 6257 DECL_RESULT (stubdecl) = build_decl (BUILTINS_LOCATION, 6258 RESULT_DECL, NULL_TREE, 6259 void_type_node); 6260 6261 /* Output a comment. */ 6262 fprintf (asm_out_file, "\t# Stub function to call %s%s (", 6263 (fp_ret_p 6264 ? (GET_MODE (retval) == SFmode ? "float " : "double ") 6265 : ""), 6266 fnname); 6267 separator = ""; 6268 for (f = (unsigned int) fp_code; f != 0; f >>= 2) 6269 { 6270 fprintf (asm_out_file, "%s%s", separator, 6271 (f & 3) == 1 ? "float" : "double"); 6272 separator = ", "; 6273 } 6274 fprintf (asm_out_file, ")\n"); 6275 6276 /* Start the function definition. */ 6277 assemble_start_function (stubdecl, stubname); 6278 mips_start_function_definition (stubname, false); 6279 6280 if (!fp_ret_p) 6281 { 6282 /* Load the address of the MIPS16 function into $25. Do this 6283 first so that targets with coprocessor interlocks can use 6284 an MFC1 to fill the delay slot. */ 6285 if (TARGET_EXPLICIT_RELOCS) 6286 { 6287 output_asm_insn ("lui\t%^,%%hi(%0)", &fn); 6288 output_asm_insn ("addiu\t%^,%^,%%lo(%0)", &fn); 6289 } 6290 else 6291 output_asm_insn ("la\t%^,%0", &fn); 6292 } 6293 6294 /* Move the arguments from general registers to floating-point 6295 registers. */ 6296 mips_output_args_xfer (fp_code, 't'); 6297 6298 if (!fp_ret_p) 6299 { 6300 /* Jump to the previously-loaded address. */ 6301 output_asm_insn ("jr\t%^", NULL); 6302 } 6303 else 6304 { 6305 /* Save the return address in $18 and call the non-MIPS16 function. 6306 The stub's caller knows that $18 might be clobbered, even though 6307 $18 is usually a call-saved register. */ 6308 fprintf (asm_out_file, "\tmove\t%s,%s\n", 6309 reg_names[GP_REG_FIRST + 18], reg_names[RETURN_ADDR_REGNUM]); 6310 output_asm_insn (MIPS_CALL ("jal", &fn, 0, -1), &fn); 6311 6312 /* Move the result from floating-point registers to 6313 general registers. */ 6314 switch (GET_MODE (retval)) 6315 { 6316 case SCmode: 6317 mips_output_32bit_xfer ('f', GP_RETURN + 1, 6318 FP_REG_FIRST + MAX_FPRS_PER_FMT); 6319 /* Fall though. */ 6320 case SFmode: 6321 mips_output_32bit_xfer ('f', GP_RETURN, FP_REG_FIRST); 6322 if (GET_MODE (retval) == SCmode && TARGET_64BIT) 6323 { 6324 /* On 64-bit targets, complex floats are returned in 6325 a single GPR, such that "sd" on a suitably-aligned 6326 target would store the value correctly. */ 6327 fprintf (asm_out_file, "\tdsll\t%s,%s,32\n", 6328 reg_names[GP_RETURN + TARGET_LITTLE_ENDIAN], 6329 reg_names[GP_RETURN + TARGET_LITTLE_ENDIAN]); 6330 fprintf (asm_out_file, "\tor\t%s,%s,%s\n", 6331 reg_names[GP_RETURN], 6332 reg_names[GP_RETURN], 6333 reg_names[GP_RETURN + 1]); 6334 } 6335 break; 6336 6337 case DCmode: 6338 mips_output_64bit_xfer ('f', GP_RETURN + (8 / UNITS_PER_WORD), 6339 FP_REG_FIRST + MAX_FPRS_PER_FMT); 6340 /* Fall though. */ 6341 case DFmode: 6342 case V2SFmode: 6343 mips_output_64bit_xfer ('f', GP_RETURN, FP_REG_FIRST); 6344 break; 6345 6346 default: 6347 gcc_unreachable (); 6348 } 6349 fprintf (asm_out_file, "\tjr\t%s\n", reg_names[GP_REG_FIRST + 18]); 6350 } 6351 6352 #ifdef ASM_DECLARE_FUNCTION_SIZE 6353 ASM_DECLARE_FUNCTION_SIZE (asm_out_file, stubname, stubdecl); 6354 #endif 6355 6356 mips_end_function_definition (stubname); 6357 6358 /* Record this stub. */ 6359 l = XNEW (struct mips16_stub); 6360 l->name = xstrdup (fnname); 6361 l->fp_ret_p = fp_ret_p; 6362 l->next = mips16_stubs; 6363 mips16_stubs = l; 6364 } 6365 6366 /* If we expect a floating-point return value, but we've built a 6367 stub which does not expect one, then we're in trouble. We can't 6368 use the existing stub, because it won't handle the floating-point 6369 value. We can't build a new stub, because the linker won't know 6370 which stub to use for the various calls in this object file. 6371 Fortunately, this case is illegal, since it means that a function 6372 was declared in two different ways in a single compilation. */ 6373 if (fp_ret_p && !l->fp_ret_p) 6374 error ("cannot handle inconsistent calls to %qs", fnname); 6375 6376 if (retval == NULL_RTX) 6377 insn = gen_call_internal_direct (fn, args_size); 6378 else 6379 insn = gen_call_value_internal_direct (retval, fn, args_size); 6380 insn = mips_emit_call_insn (insn, fn, fn, false); 6381 6382 /* If we are calling a stub which handles a floating-point return 6383 value, we need to arrange to save $18 in the prologue. We do this 6384 by marking the function call as using the register. The prologue 6385 will later see that it is used, and emit code to save it. */ 6386 if (fp_ret_p) 6387 CALL_INSN_FUNCTION_USAGE (insn) = 6388 gen_rtx_EXPR_LIST (VOIDmode, 6389 gen_rtx_CLOBBER (VOIDmode, 6390 gen_rtx_REG (word_mode, 18)), 6391 CALL_INSN_FUNCTION_USAGE (insn)); 6392 6393 return insn; 6394 } 6395 6396 /* Expand a call of type TYPE. RESULT is where the result will go (null 6397 for "call"s and "sibcall"s), ADDR is the address of the function, 6398 ARGS_SIZE is the size of the arguments and AUX is the value passed 6399 to us by mips_function_arg. LAZY_P is true if this call already 6400 involves a lazily-bound function address (such as when calling 6401 functions through a MIPS16 hard-float stub). 6402 6403 Return the call itself. */ 6404 6405 rtx 6406 mips_expand_call (enum mips_call_type type, rtx result, rtx addr, 6407 rtx args_size, rtx aux, bool lazy_p) 6408 { 6409 rtx orig_addr, pattern, insn; 6410 int fp_code; 6411 6412 fp_code = aux == 0 ? 0 : (int) GET_MODE (aux); 6413 insn = mips16_build_call_stub (result, &addr, args_size, fp_code); 6414 if (insn) 6415 { 6416 gcc_assert (!lazy_p && type == MIPS_CALL_NORMAL); 6417 return insn; 6418 } 6419 ; 6420 orig_addr = addr; 6421 if (!call_insn_operand (addr, VOIDmode)) 6422 { 6423 if (type == MIPS_CALL_EPILOGUE) 6424 addr = MIPS_EPILOGUE_TEMP (Pmode); 6425 else 6426 addr = gen_reg_rtx (Pmode); 6427 lazy_p |= mips_load_call_address (type, addr, orig_addr); 6428 } 6429 6430 if (result == 0) 6431 { 6432 rtx (*fn) (rtx, rtx); 6433 6434 if (type == MIPS_CALL_SIBCALL) 6435 fn = gen_sibcall_internal; 6436 else 6437 fn = gen_call_internal; 6438 6439 pattern = fn (addr, args_size); 6440 } 6441 else if (GET_CODE (result) == PARALLEL && XVECLEN (result, 0) == 2) 6442 { 6443 /* Handle return values created by mips_return_fpr_pair. */ 6444 rtx (*fn) (rtx, rtx, rtx, rtx); 6445 rtx reg1, reg2; 6446 6447 if (type == MIPS_CALL_SIBCALL) 6448 fn = gen_sibcall_value_multiple_internal; 6449 else 6450 fn = gen_call_value_multiple_internal; 6451 6452 reg1 = XEXP (XVECEXP (result, 0, 0), 0); 6453 reg2 = XEXP (XVECEXP (result, 0, 1), 0); 6454 pattern = fn (reg1, addr, args_size, reg2); 6455 } 6456 else 6457 { 6458 rtx (*fn) (rtx, rtx, rtx); 6459 6460 if (type == MIPS_CALL_SIBCALL) 6461 fn = gen_sibcall_value_internal; 6462 else 6463 fn = gen_call_value_internal; 6464 6465 /* Handle return values created by mips_return_fpr_single. */ 6466 if (GET_CODE (result) == PARALLEL && XVECLEN (result, 0) == 1) 6467 result = XEXP (XVECEXP (result, 0, 0), 0); 6468 pattern = fn (result, addr, args_size); 6469 } 6470 6471 return mips_emit_call_insn (pattern, orig_addr, addr, lazy_p); 6472 } 6473 6474 /* Split call instruction INSN into a $gp-clobbering call and 6475 (where necessary) an instruction to restore $gp from its save slot. 6476 CALL_PATTERN is the pattern of the new call. */ 6477 6478 void 6479 mips_split_call (rtx insn, rtx call_pattern) 6480 { 6481 rtx new_insn; 6482 6483 new_insn = emit_call_insn (call_pattern); 6484 CALL_INSN_FUNCTION_USAGE (new_insn) 6485 = copy_rtx (CALL_INSN_FUNCTION_USAGE (insn)); 6486 if (!find_reg_note (insn, REG_NORETURN, 0)) 6487 /* Pick a temporary register that is suitable for both MIPS16 and 6488 non-MIPS16 code. $4 and $5 are used for returning complex double 6489 values in soft-float code, so $6 is the first suitable candidate. */ 6490 mips_restore_gp_from_cprestore_slot (gen_rtx_REG (Pmode, GP_ARG_FIRST + 2)); 6491 } 6492 6493 /* Implement TARGET_FUNCTION_OK_FOR_SIBCALL. */ 6494 6495 static bool 6496 mips_function_ok_for_sibcall (tree decl, tree exp ATTRIBUTE_UNUSED) 6497 { 6498 if (!TARGET_SIBCALLS) 6499 return false; 6500 6501 /* Interrupt handlers need special epilogue code and therefore can't 6502 use sibcalls. */ 6503 if (mips_interrupt_type_p (TREE_TYPE (current_function_decl))) 6504 return false; 6505 6506 /* We can't do a sibcall if the called function is a MIPS16 function 6507 because there is no direct "jx" instruction equivalent to "jalx" to 6508 switch the ISA mode. We only care about cases where the sibling 6509 and normal calls would both be direct. */ 6510 if (decl 6511 && mips_use_mips16_mode_p (decl) 6512 && const_call_insn_operand (XEXP (DECL_RTL (decl), 0), VOIDmode)) 6513 return false; 6514 6515 /* When -minterlink-mips16 is in effect, assume that non-locally-binding 6516 functions could be MIPS16 ones unless an attribute explicitly tells 6517 us otherwise. */ 6518 if (TARGET_INTERLINK_MIPS16 6519 && decl 6520 && (DECL_EXTERNAL (decl) || !targetm.binds_local_p (decl)) 6521 && !mips_nomips16_decl_p (decl) 6522 && const_call_insn_operand (XEXP (DECL_RTL (decl), 0), VOIDmode)) 6523 return false; 6524 6525 /* Sibling calls should not prevent lazy binding. Lazy-binding stubs 6526 require $gp to be valid on entry, so sibcalls can only use stubs 6527 if $gp is call-clobbered. */ 6528 if (decl 6529 && TARGET_CALL_SAVED_GP 6530 && !TARGET_ABICALLS_PIC0 6531 && !targetm.binds_local_p (decl)) 6532 return false; 6533 6534 /* Otherwise OK. */ 6535 return true; 6536 } 6537 6538 /* Emit code to move general operand SRC into condition-code 6539 register DEST given that SCRATCH is a scratch TFmode FPR. 6540 The sequence is: 6541 6542 FP1 = SRC 6543 FP2 = 0.0f 6544 DEST = FP2 < FP1 6545 6546 where FP1 and FP2 are single-precision FPRs taken from SCRATCH. */ 6547 6548 void 6549 mips_expand_fcc_reload (rtx dest, rtx src, rtx scratch) 6550 { 6551 rtx fp1, fp2; 6552 6553 /* Change the source to SFmode. */ 6554 if (MEM_P (src)) 6555 src = adjust_address (src, SFmode, 0); 6556 else if (REG_P (src) || GET_CODE (src) == SUBREG) 6557 src = gen_rtx_REG (SFmode, true_regnum (src)); 6558 6559 fp1 = gen_rtx_REG (SFmode, REGNO (scratch)); 6560 fp2 = gen_rtx_REG (SFmode, REGNO (scratch) + MAX_FPRS_PER_FMT); 6561 6562 mips_emit_move (copy_rtx (fp1), src); 6563 mips_emit_move (copy_rtx (fp2), CONST0_RTX (SFmode)); 6564 emit_insn (gen_slt_sf (dest, fp2, fp1)); 6565 } 6566 6567 /* Emit straight-line code to move LENGTH bytes from SRC to DEST. 6568 Assume that the areas do not overlap. */ 6569 6570 static void 6571 mips_block_move_straight (rtx dest, rtx src, HOST_WIDE_INT length) 6572 { 6573 HOST_WIDE_INT offset, delta; 6574 unsigned HOST_WIDE_INT bits; 6575 int i; 6576 enum machine_mode mode; 6577 rtx *regs; 6578 6579 /* Work out how many bits to move at a time. If both operands have 6580 half-word alignment, it is usually better to move in half words. 6581 For instance, lh/lh/sh/sh is usually better than lwl/lwr/swl/swr 6582 and lw/lw/sw/sw is usually better than ldl/ldr/sdl/sdr. 6583 Otherwise move word-sized chunks. */ 6584 if (MEM_ALIGN (src) == BITS_PER_WORD / 2 6585 && MEM_ALIGN (dest) == BITS_PER_WORD / 2) 6586 bits = BITS_PER_WORD / 2; 6587 else 6588 bits = BITS_PER_WORD; 6589 6590 mode = mode_for_size (bits, MODE_INT, 0); 6591 delta = bits / BITS_PER_UNIT; 6592 6593 /* Allocate a buffer for the temporary registers. */ 6594 regs = XALLOCAVEC (rtx, length / delta); 6595 6596 /* Load as many BITS-sized chunks as possible. Use a normal load if 6597 the source has enough alignment, otherwise use left/right pairs. */ 6598 for (offset = 0, i = 0; offset + delta <= length; offset += delta, i++) 6599 { 6600 regs[i] = gen_reg_rtx (mode); 6601 if (MEM_ALIGN (src) >= bits) 6602 mips_emit_move (regs[i], adjust_address (src, mode, offset)); 6603 else 6604 { 6605 rtx part = adjust_address (src, BLKmode, offset); 6606 if (!mips_expand_ext_as_unaligned_load (regs[i], part, bits, 0)) 6607 gcc_unreachable (); 6608 } 6609 } 6610 6611 /* Copy the chunks to the destination. */ 6612 for (offset = 0, i = 0; offset + delta <= length; offset += delta, i++) 6613 if (MEM_ALIGN (dest) >= bits) 6614 mips_emit_move (adjust_address (dest, mode, offset), regs[i]); 6615 else 6616 { 6617 rtx part = adjust_address (dest, BLKmode, offset); 6618 if (!mips_expand_ins_as_unaligned_store (part, regs[i], bits, 0)) 6619 gcc_unreachable (); 6620 } 6621 6622 /* Mop up any left-over bytes. */ 6623 if (offset < length) 6624 { 6625 src = adjust_address (src, BLKmode, offset); 6626 dest = adjust_address (dest, BLKmode, offset); 6627 move_by_pieces (dest, src, length - offset, 6628 MIN (MEM_ALIGN (src), MEM_ALIGN (dest)), 0); 6629 } 6630 } 6631 6632 /* Helper function for doing a loop-based block operation on memory 6633 reference MEM. Each iteration of the loop will operate on LENGTH 6634 bytes of MEM. 6635 6636 Create a new base register for use within the loop and point it to 6637 the start of MEM. Create a new memory reference that uses this 6638 register. Store them in *LOOP_REG and *LOOP_MEM respectively. */ 6639 6640 static void 6641 mips_adjust_block_mem (rtx mem, HOST_WIDE_INT length, 6642 rtx *loop_reg, rtx *loop_mem) 6643 { 6644 *loop_reg = copy_addr_to_reg (XEXP (mem, 0)); 6645 6646 /* Although the new mem does not refer to a known location, 6647 it does keep up to LENGTH bytes of alignment. */ 6648 *loop_mem = change_address (mem, BLKmode, *loop_reg); 6649 set_mem_align (*loop_mem, MIN (MEM_ALIGN (mem), length * BITS_PER_UNIT)); 6650 } 6651 6652 /* Move LENGTH bytes from SRC to DEST using a loop that moves BYTES_PER_ITER 6653 bytes at a time. LENGTH must be at least BYTES_PER_ITER. Assume that 6654 the memory regions do not overlap. */ 6655 6656 static void 6657 mips_block_move_loop (rtx dest, rtx src, HOST_WIDE_INT length, 6658 HOST_WIDE_INT bytes_per_iter) 6659 { 6660 rtx label, src_reg, dest_reg, final_src, test; 6661 HOST_WIDE_INT leftover; 6662 6663 leftover = length % bytes_per_iter; 6664 length -= leftover; 6665 6666 /* Create registers and memory references for use within the loop. */ 6667 mips_adjust_block_mem (src, bytes_per_iter, &src_reg, &src); 6668 mips_adjust_block_mem (dest, bytes_per_iter, &dest_reg, &dest); 6669 6670 /* Calculate the value that SRC_REG should have after the last iteration 6671 of the loop. */ 6672 final_src = expand_simple_binop (Pmode, PLUS, src_reg, GEN_INT (length), 6673 0, 0, OPTAB_WIDEN); 6674 6675 /* Emit the start of the loop. */ 6676 label = gen_label_rtx (); 6677 emit_label (label); 6678 6679 /* Emit the loop body. */ 6680 mips_block_move_straight (dest, src, bytes_per_iter); 6681 6682 /* Move on to the next block. */ 6683 mips_emit_move (src_reg, plus_constant (src_reg, bytes_per_iter)); 6684 mips_emit_move (dest_reg, plus_constant (dest_reg, bytes_per_iter)); 6685 6686 /* Emit the loop condition. */ 6687 test = gen_rtx_NE (VOIDmode, src_reg, final_src); 6688 if (Pmode == DImode) 6689 emit_jump_insn (gen_cbranchdi4 (test, src_reg, final_src, label)); 6690 else 6691 emit_jump_insn (gen_cbranchsi4 (test, src_reg, final_src, label)); 6692 6693 /* Mop up any left-over bytes. */ 6694 if (leftover) 6695 mips_block_move_straight (dest, src, leftover); 6696 } 6697 6698 /* Expand a movmemsi instruction, which copies LENGTH bytes from 6699 memory reference SRC to memory reference DEST. */ 6700 6701 bool 6702 mips_expand_block_move (rtx dest, rtx src, rtx length) 6703 { 6704 if (CONST_INT_P (length)) 6705 { 6706 if (INTVAL (length) <= MIPS_MAX_MOVE_BYTES_STRAIGHT) 6707 { 6708 mips_block_move_straight (dest, src, INTVAL (length)); 6709 return true; 6710 } 6711 else if (optimize) 6712 { 6713 mips_block_move_loop (dest, src, INTVAL (length), 6714 MIPS_MAX_MOVE_BYTES_PER_LOOP_ITER); 6715 return true; 6716 } 6717 } 6718 return false; 6719 } 6720 6721 /* Expand a loop of synci insns for the address range [BEGIN, END). */ 6722 6723 void 6724 mips_expand_synci_loop (rtx begin, rtx end) 6725 { 6726 rtx inc, label, end_label, cmp_result, mask, length; 6727 6728 /* Create end_label. */ 6729 end_label = gen_label_rtx (); 6730 6731 /* Check if begin equals end. */ 6732 cmp_result = gen_rtx_EQ (VOIDmode, begin, end); 6733 emit_jump_insn (gen_condjump (cmp_result, end_label)); 6734 6735 /* Load INC with the cache line size (rdhwr INC,$1). */ 6736 inc = gen_reg_rtx (Pmode); 6737 emit_insn (Pmode == SImode 6738 ? gen_rdhwr_synci_step_si (inc) 6739 : gen_rdhwr_synci_step_di (inc)); 6740 6741 /* Check if inc is 0. */ 6742 cmp_result = gen_rtx_EQ (VOIDmode, inc, const0_rtx); 6743 emit_jump_insn (gen_condjump (cmp_result, end_label)); 6744 6745 /* Calculate mask. */ 6746 mask = mips_force_unary (Pmode, NEG, inc); 6747 6748 /* Mask out begin by mask. */ 6749 begin = mips_force_binary (Pmode, AND, begin, mask); 6750 6751 /* Calculate length. */ 6752 length = mips_force_binary (Pmode, MINUS, end, begin); 6753 6754 /* Loop back to here. */ 6755 label = gen_label_rtx (); 6756 emit_label (label); 6757 6758 emit_insn (gen_synci (begin)); 6759 6760 /* Update length. */ 6761 mips_emit_binary (MINUS, length, length, inc); 6762 6763 /* Update begin. */ 6764 mips_emit_binary (PLUS, begin, begin, inc); 6765 6766 /* Check if length is greater than 0. */ 6767 cmp_result = gen_rtx_GT (VOIDmode, length, const0_rtx); 6768 emit_jump_insn (gen_condjump (cmp_result, label)); 6769 6770 emit_label (end_label); 6771 } 6772 6773 /* Expand a QI or HI mode atomic memory operation. 6774 6775 GENERATOR contains a pointer to the gen_* function that generates 6776 the SI mode underlying atomic operation using masks that we 6777 calculate. 6778 6779 RESULT is the return register for the operation. Its value is NULL 6780 if unused. 6781 6782 MEM is the location of the atomic access. 6783 6784 OLDVAL is the first operand for the operation. 6785 6786 NEWVAL is the optional second operand for the operation. Its value 6787 is NULL if unused. */ 6788 6789 void 6790 mips_expand_atomic_qihi (union mips_gen_fn_ptrs generator, 6791 rtx result, rtx mem, rtx oldval, rtx newval) 6792 { 6793 rtx orig_addr, memsi_addr, memsi, shift, shiftsi, unshifted_mask; 6794 rtx unshifted_mask_reg, mask, inverted_mask, si_op; 6795 rtx res = NULL; 6796 enum machine_mode mode; 6797 6798 mode = GET_MODE (mem); 6799 6800 /* Compute the address of the containing SImode value. */ 6801 orig_addr = force_reg (Pmode, XEXP (mem, 0)); 6802 memsi_addr = mips_force_binary (Pmode, AND, orig_addr, 6803 force_reg (Pmode, GEN_INT (-4))); 6804 6805 /* Create a memory reference for it. */ 6806 memsi = gen_rtx_MEM (SImode, memsi_addr); 6807 set_mem_alias_set (memsi, ALIAS_SET_MEMORY_BARRIER); 6808 MEM_VOLATILE_P (memsi) = MEM_VOLATILE_P (mem); 6809 6810 /* Work out the byte offset of the QImode or HImode value, 6811 counting from the least significant byte. */ 6812 shift = mips_force_binary (Pmode, AND, orig_addr, GEN_INT (3)); 6813 if (TARGET_BIG_ENDIAN) 6814 mips_emit_binary (XOR, shift, shift, GEN_INT (mode == QImode ? 3 : 2)); 6815 6816 /* Multiply by eight to convert the shift value from bytes to bits. */ 6817 mips_emit_binary (ASHIFT, shift, shift, GEN_INT (3)); 6818 6819 /* Make the final shift an SImode value, so that it can be used in 6820 SImode operations. */ 6821 shiftsi = force_reg (SImode, gen_lowpart (SImode, shift)); 6822 6823 /* Set MASK to an inclusive mask of the QImode or HImode value. */ 6824 unshifted_mask = GEN_INT (GET_MODE_MASK (mode)); 6825 unshifted_mask_reg = force_reg (SImode, unshifted_mask); 6826 mask = mips_force_binary (SImode, ASHIFT, unshifted_mask_reg, shiftsi); 6827 6828 /* Compute the equivalent exclusive mask. */ 6829 inverted_mask = gen_reg_rtx (SImode); 6830 emit_insn (gen_rtx_SET (VOIDmode, inverted_mask, 6831 gen_rtx_NOT (SImode, mask))); 6832 6833 /* Shift the old value into place. */ 6834 if (oldval != const0_rtx) 6835 { 6836 oldval = convert_modes (SImode, mode, oldval, true); 6837 oldval = force_reg (SImode, oldval); 6838 oldval = mips_force_binary (SImode, ASHIFT, oldval, shiftsi); 6839 } 6840 6841 /* Do the same for the new value. */ 6842 if (newval && newval != const0_rtx) 6843 { 6844 newval = convert_modes (SImode, mode, newval, true); 6845 newval = force_reg (SImode, newval); 6846 newval = mips_force_binary (SImode, ASHIFT, newval, shiftsi); 6847 } 6848 6849 /* Do the SImode atomic access. */ 6850 if (result) 6851 res = gen_reg_rtx (SImode); 6852 if (newval) 6853 si_op = generator.fn_6 (res, memsi, mask, inverted_mask, oldval, newval); 6854 else if (result) 6855 si_op = generator.fn_5 (res, memsi, mask, inverted_mask, oldval); 6856 else 6857 si_op = generator.fn_4 (memsi, mask, inverted_mask, oldval); 6858 6859 emit_insn (si_op); 6860 6861 if (result) 6862 { 6863 /* Shift and convert the result. */ 6864 mips_emit_binary (AND, res, res, mask); 6865 mips_emit_binary (LSHIFTRT, res, res, shiftsi); 6866 mips_emit_move (result, gen_lowpart (GET_MODE (result), res)); 6867 } 6868 } 6869 6870 /* Return true if it is possible to use left/right accesses for a 6871 bitfield of WIDTH bits starting BITPOS bits into *OP. When 6872 returning true, update *OP, *LEFT and *RIGHT as follows: 6873 6874 *OP is a BLKmode reference to the whole field. 6875 6876 *LEFT is a QImode reference to the first byte if big endian or 6877 the last byte if little endian. This address can be used in the 6878 left-side instructions (LWL, SWL, LDL, SDL). 6879 6880 *RIGHT is a QImode reference to the opposite end of the field and 6881 can be used in the patterning right-side instruction. */ 6882 6883 static bool 6884 mips_get_unaligned_mem (rtx *op, HOST_WIDE_INT width, HOST_WIDE_INT bitpos, 6885 rtx *left, rtx *right) 6886 { 6887 rtx first, last; 6888 6889 /* Check that the operand really is a MEM. Not all the extv and 6890 extzv predicates are checked. */ 6891 if (!MEM_P (*op)) 6892 return false; 6893 6894 /* Check that the size is valid. */ 6895 if (width != 32 && (!TARGET_64BIT || width != 64)) 6896 return false; 6897 6898 /* We can only access byte-aligned values. Since we are always passed 6899 a reference to the first byte of the field, it is not necessary to 6900 do anything with BITPOS after this check. */ 6901 if (bitpos % BITS_PER_UNIT != 0) 6902 return false; 6903 6904 /* Reject aligned bitfields: we want to use a normal load or store 6905 instead of a left/right pair. */ 6906 if (MEM_ALIGN (*op) >= width) 6907 return false; 6908 6909 /* Adjust *OP to refer to the whole field. This also has the effect 6910 of legitimizing *OP's address for BLKmode, possibly simplifying it. */ 6911 *op = adjust_address (*op, BLKmode, 0); 6912 set_mem_size (*op, GEN_INT (width / BITS_PER_UNIT)); 6913 6914 /* Get references to both ends of the field. We deliberately don't 6915 use the original QImode *OP for FIRST since the new BLKmode one 6916 might have a simpler address. */ 6917 first = adjust_address (*op, QImode, 0); 6918 last = adjust_address (*op, QImode, width / BITS_PER_UNIT - 1); 6919 6920 /* Allocate to LEFT and RIGHT according to endianness. LEFT should 6921 correspond to the MSB and RIGHT to the LSB. */ 6922 if (TARGET_BIG_ENDIAN) 6923 *left = first, *right = last; 6924 else 6925 *left = last, *right = first; 6926 6927 return true; 6928 } 6929 6930 /* Try to use left/right loads to expand an "extv" or "extzv" pattern. 6931 DEST, SRC, WIDTH and BITPOS are the operands passed to the expander; 6932 the operation is the equivalent of: 6933 6934 (set DEST (*_extract SRC WIDTH BITPOS)) 6935 6936 Return true on success. */ 6937 6938 bool 6939 mips_expand_ext_as_unaligned_load (rtx dest, rtx src, HOST_WIDE_INT width, 6940 HOST_WIDE_INT bitpos) 6941 { 6942 rtx left, right, temp; 6943 6944 /* If TARGET_64BIT, the destination of a 32-bit "extz" or "extzv" will 6945 be a paradoxical word_mode subreg. This is the only case in which 6946 we allow the destination to be larger than the source. */ 6947 if (GET_CODE (dest) == SUBREG 6948 && GET_MODE (dest) == DImode 6949 && GET_MODE (SUBREG_REG (dest)) == SImode) 6950 dest = SUBREG_REG (dest); 6951 6952 /* After the above adjustment, the destination must be the same 6953 width as the source. */ 6954 if (GET_MODE_BITSIZE (GET_MODE (dest)) != width) 6955 return false; 6956 6957 if (!mips_get_unaligned_mem (&src, width, bitpos, &left, &right)) 6958 return false; 6959 6960 temp = gen_reg_rtx (GET_MODE (dest)); 6961 if (GET_MODE (dest) == DImode) 6962 { 6963 emit_insn (gen_mov_ldl (temp, src, left)); 6964 emit_insn (gen_mov_ldr (dest, copy_rtx (src), right, temp)); 6965 } 6966 else 6967 { 6968 emit_insn (gen_mov_lwl (temp, src, left)); 6969 emit_insn (gen_mov_lwr (dest, copy_rtx (src), right, temp)); 6970 } 6971 return true; 6972 } 6973 6974 /* Try to use left/right stores to expand an "ins" pattern. DEST, WIDTH, 6975 BITPOS and SRC are the operands passed to the expander; the operation 6976 is the equivalent of: 6977 6978 (set (zero_extract DEST WIDTH BITPOS) SRC) 6979 6980 Return true on success. */ 6981 6982 bool 6983 mips_expand_ins_as_unaligned_store (rtx dest, rtx src, HOST_WIDE_INT width, 6984 HOST_WIDE_INT bitpos) 6985 { 6986 rtx left, right; 6987 enum machine_mode mode; 6988 6989 if (!mips_get_unaligned_mem (&dest, width, bitpos, &left, &right)) 6990 return false; 6991 6992 mode = mode_for_size (width, MODE_INT, 0); 6993 src = gen_lowpart (mode, src); 6994 if (mode == DImode) 6995 { 6996 emit_insn (gen_mov_sdl (dest, src, left)); 6997 emit_insn (gen_mov_sdr (copy_rtx (dest), copy_rtx (src), right)); 6998 } 6999 else 7000 { 7001 emit_insn (gen_mov_swl (dest, src, left)); 7002 emit_insn (gen_mov_swr (copy_rtx (dest), copy_rtx (src), right)); 7003 } 7004 return true; 7005 } 7006 7007 /* Return true if X is a MEM with the same size as MODE. */ 7008 7009 bool 7010 mips_mem_fits_mode_p (enum machine_mode mode, rtx x) 7011 { 7012 rtx size; 7013 7014 if (!MEM_P (x)) 7015 return false; 7016 7017 size = MEM_SIZE (x); 7018 return size && INTVAL (size) == GET_MODE_SIZE (mode); 7019 } 7020 7021 /* Return true if (zero_extract OP WIDTH BITPOS) can be used as the 7022 source of an "ext" instruction or the destination of an "ins" 7023 instruction. OP must be a register operand and the following 7024 conditions must hold: 7025 7026 0 <= BITPOS < GET_MODE_BITSIZE (GET_MODE (op)) 7027 0 < WIDTH <= GET_MODE_BITSIZE (GET_MODE (op)) 7028 0 < BITPOS + WIDTH <= GET_MODE_BITSIZE (GET_MODE (op)) 7029 7030 Also reject lengths equal to a word as they are better handled 7031 by the move patterns. */ 7032 7033 bool 7034 mips_use_ins_ext_p (rtx op, HOST_WIDE_INT width, HOST_WIDE_INT bitpos) 7035 { 7036 if (!ISA_HAS_EXT_INS 7037 || !register_operand (op, VOIDmode) 7038 || GET_MODE_BITSIZE (GET_MODE (op)) > BITS_PER_WORD) 7039 return false; 7040 7041 if (!IN_RANGE (width, 1, GET_MODE_BITSIZE (GET_MODE (op)) - 1)) 7042 return false; 7043 7044 if (bitpos < 0 || bitpos + width > GET_MODE_BITSIZE (GET_MODE (op))) 7045 return false; 7046 7047 return true; 7048 } 7049 7050 /* Check if MASK and SHIFT are valid in mask-low-and-shift-left 7051 operation if MAXLEN is the maxium length of consecutive bits that 7052 can make up MASK. MODE is the mode of the operation. See 7053 mask_low_and_shift_len for the actual definition. */ 7054 7055 bool 7056 mask_low_and_shift_p (enum machine_mode mode, rtx mask, rtx shift, int maxlen) 7057 { 7058 return IN_RANGE (mask_low_and_shift_len (mode, mask, shift), 1, maxlen); 7059 } 7060 7061 /* Return true iff OP1 and OP2 are valid operands together for the 7062 *and<MODE>3 and *and<MODE>3_mips16 patterns. For the cases to consider, 7063 see the table in the comment before the pattern. */ 7064 7065 bool 7066 and_operands_ok (enum machine_mode mode, rtx op1, rtx op2) 7067 { 7068 return (memory_operand (op1, mode) 7069 ? and_load_operand (op2, mode) 7070 : and_reg_operand (op2, mode)); 7071 } 7072 7073 /* The canonical form of a mask-low-and-shift-left operation is 7074 (and (ashift X SHIFT) MASK) where MASK has the lower SHIFT number of bits 7075 cleared. Thus we need to shift MASK to the right before checking if it 7076 is a valid mask value. MODE is the mode of the operation. If true 7077 return the length of the mask, otherwise return -1. */ 7078 7079 int 7080 mask_low_and_shift_len (enum machine_mode mode, rtx mask, rtx shift) 7081 { 7082 HOST_WIDE_INT shval; 7083 7084 shval = INTVAL (shift) & (GET_MODE_BITSIZE (mode) - 1); 7085 return exact_log2 ((UINTVAL (mask) >> shval) + 1); 7086 } 7087 7088 /* Return true if -msplit-addresses is selected and should be honored. 7089 7090 -msplit-addresses is a half-way house between explicit relocations 7091 and the traditional assembler macros. It can split absolute 32-bit 7092 symbolic constants into a high/lo_sum pair but uses macros for other 7093 sorts of access. 7094 7095 Like explicit relocation support for REL targets, it relies 7096 on GNU extensions in the assembler and the linker. 7097 7098 Although this code should work for -O0, it has traditionally 7099 been treated as an optimization. */ 7100 7101 static bool 7102 mips_split_addresses_p (void) 7103 { 7104 return (TARGET_SPLIT_ADDRESSES 7105 && optimize 7106 && !TARGET_MIPS16 7107 && !flag_pic 7108 && !ABI_HAS_64BIT_SYMBOLS); 7109 } 7110 7111 /* (Re-)Initialize mips_split_p, mips_lo_relocs and mips_hi_relocs. */ 7112 7113 static void 7114 mips_init_relocs (void) 7115 { 7116 memset (mips_split_p, '\0', sizeof (mips_split_p)); 7117 memset (mips_split_hi_p, '\0', sizeof (mips_split_hi_p)); 7118 memset (mips_hi_relocs, '\0', sizeof (mips_hi_relocs)); 7119 memset (mips_lo_relocs, '\0', sizeof (mips_lo_relocs)); 7120 7121 if (ABI_HAS_64BIT_SYMBOLS) 7122 { 7123 if (TARGET_EXPLICIT_RELOCS) 7124 { 7125 mips_split_p[SYMBOL_64_HIGH] = true; 7126 mips_hi_relocs[SYMBOL_64_HIGH] = "%highest("; 7127 mips_lo_relocs[SYMBOL_64_HIGH] = "%higher("; 7128 7129 mips_split_p[SYMBOL_64_MID] = true; 7130 mips_hi_relocs[SYMBOL_64_MID] = "%higher("; 7131 mips_lo_relocs[SYMBOL_64_MID] = "%hi("; 7132 7133 mips_split_p[SYMBOL_64_LOW] = true; 7134 mips_hi_relocs[SYMBOL_64_LOW] = "%hi("; 7135 mips_lo_relocs[SYMBOL_64_LOW] = "%lo("; 7136 7137 mips_split_p[SYMBOL_ABSOLUTE] = true; 7138 mips_lo_relocs[SYMBOL_ABSOLUTE] = "%lo("; 7139 } 7140 } 7141 else 7142 { 7143 if (TARGET_EXPLICIT_RELOCS || mips_split_addresses_p () || TARGET_MIPS16) 7144 { 7145 mips_split_p[SYMBOL_ABSOLUTE] = true; 7146 mips_hi_relocs[SYMBOL_ABSOLUTE] = "%hi("; 7147 mips_lo_relocs[SYMBOL_ABSOLUTE] = "%lo("; 7148 7149 mips_lo_relocs[SYMBOL_32_HIGH] = "%hi("; 7150 } 7151 } 7152 7153 if (TARGET_MIPS16) 7154 { 7155 /* The high part is provided by a pseudo copy of $gp. */ 7156 mips_split_p[SYMBOL_GP_RELATIVE] = true; 7157 mips_lo_relocs[SYMBOL_GP_RELATIVE] = "%gprel("; 7158 } 7159 else if (TARGET_EXPLICIT_RELOCS) 7160 /* Small data constants are kept whole until after reload, 7161 then lowered by mips_rewrite_small_data. */ 7162 mips_lo_relocs[SYMBOL_GP_RELATIVE] = "%gp_rel("; 7163 7164 if (TARGET_EXPLICIT_RELOCS) 7165 { 7166 mips_split_p[SYMBOL_GOT_PAGE_OFST] = true; 7167 if (TARGET_NEWABI) 7168 { 7169 mips_lo_relocs[SYMBOL_GOTOFF_PAGE] = "%got_page("; 7170 mips_lo_relocs[SYMBOL_GOT_PAGE_OFST] = "%got_ofst("; 7171 } 7172 else 7173 { 7174 mips_lo_relocs[SYMBOL_GOTOFF_PAGE] = "%got("; 7175 mips_lo_relocs[SYMBOL_GOT_PAGE_OFST] = "%lo("; 7176 } 7177 if (TARGET_MIPS16) 7178 /* Expose the use of $28 as soon as possible. */ 7179 mips_split_hi_p[SYMBOL_GOT_PAGE_OFST] = true; 7180 7181 if (TARGET_XGOT) 7182 { 7183 /* The HIGH and LO_SUM are matched by special .md patterns. */ 7184 mips_split_p[SYMBOL_GOT_DISP] = true; 7185 7186 mips_split_p[SYMBOL_GOTOFF_DISP] = true; 7187 mips_hi_relocs[SYMBOL_GOTOFF_DISP] = "%got_hi("; 7188 mips_lo_relocs[SYMBOL_GOTOFF_DISP] = "%got_lo("; 7189 7190 mips_split_p[SYMBOL_GOTOFF_CALL] = true; 7191 mips_hi_relocs[SYMBOL_GOTOFF_CALL] = "%call_hi("; 7192 mips_lo_relocs[SYMBOL_GOTOFF_CALL] = "%call_lo("; 7193 } 7194 else 7195 { 7196 if (TARGET_NEWABI) 7197 mips_lo_relocs[SYMBOL_GOTOFF_DISP] = "%got_disp("; 7198 else 7199 mips_lo_relocs[SYMBOL_GOTOFF_DISP] = "%got("; 7200 mips_lo_relocs[SYMBOL_GOTOFF_CALL] = "%call16("; 7201 if (TARGET_MIPS16) 7202 /* Expose the use of $28 as soon as possible. */ 7203 mips_split_p[SYMBOL_GOT_DISP] = true; 7204 } 7205 } 7206 7207 if (TARGET_NEWABI) 7208 { 7209 mips_split_p[SYMBOL_GOTOFF_LOADGP] = true; 7210 mips_hi_relocs[SYMBOL_GOTOFF_LOADGP] = "%hi(%neg(%gp_rel("; 7211 mips_lo_relocs[SYMBOL_GOTOFF_LOADGP] = "%lo(%neg(%gp_rel("; 7212 } 7213 7214 mips_lo_relocs[SYMBOL_TLSGD] = "%tlsgd("; 7215 mips_lo_relocs[SYMBOL_TLSLDM] = "%tlsldm("; 7216 7217 mips_split_p[SYMBOL_DTPREL] = true; 7218 mips_hi_relocs[SYMBOL_DTPREL] = "%dtprel_hi("; 7219 mips_lo_relocs[SYMBOL_DTPREL] = "%dtprel_lo("; 7220 7221 mips_lo_relocs[SYMBOL_GOTTPREL] = "%gottprel("; 7222 7223 mips_split_p[SYMBOL_TPREL] = true; 7224 mips_hi_relocs[SYMBOL_TPREL] = "%tprel_hi("; 7225 mips_lo_relocs[SYMBOL_TPREL] = "%tprel_lo("; 7226 7227 mips_lo_relocs[SYMBOL_HALF] = "%half("; 7228 } 7229 7230 /* Print symbolic operand OP, which is part of a HIGH or LO_SUM 7231 in context CONTEXT. RELOCS is the array of relocations to use. */ 7232 7233 static void 7234 mips_print_operand_reloc (FILE *file, rtx op, enum mips_symbol_context context, 7235 const char **relocs) 7236 { 7237 enum mips_symbol_type symbol_type; 7238 const char *p; 7239 7240 symbol_type = mips_classify_symbolic_expression (op, context); 7241 gcc_assert (relocs[symbol_type]); 7242 7243 fputs (relocs[symbol_type], file); 7244 output_addr_const (file, mips_strip_unspec_address (op)); 7245 for (p = relocs[symbol_type]; *p != 0; p++) 7246 if (*p == '(') 7247 fputc (')', file); 7248 } 7249 7250 /* Start a new block with the given asm switch enabled. If we need 7251 to print a directive, emit PREFIX before it and SUFFIX after it. */ 7252 7253 static void 7254 mips_push_asm_switch_1 (struct mips_asm_switch *asm_switch, 7255 const char *prefix, const char *suffix) 7256 { 7257 if (asm_switch->nesting_level == 0) 7258 fprintf (asm_out_file, "%s.set\tno%s%s", prefix, asm_switch->name, suffix); 7259 asm_switch->nesting_level++; 7260 } 7261 7262 /* Likewise, but end a block. */ 7263 7264 static void 7265 mips_pop_asm_switch_1 (struct mips_asm_switch *asm_switch, 7266 const char *prefix, const char *suffix) 7267 { 7268 gcc_assert (asm_switch->nesting_level); 7269 asm_switch->nesting_level--; 7270 if (asm_switch->nesting_level == 0) 7271 fprintf (asm_out_file, "%s.set\t%s%s", prefix, asm_switch->name, suffix); 7272 } 7273 7274 /* Wrappers around mips_push_asm_switch_1 and mips_pop_asm_switch_1 7275 that either print a complete line or print nothing. */ 7276 7277 void 7278 mips_push_asm_switch (struct mips_asm_switch *asm_switch) 7279 { 7280 mips_push_asm_switch_1 (asm_switch, "\t", "\n"); 7281 } 7282 7283 void 7284 mips_pop_asm_switch (struct mips_asm_switch *asm_switch) 7285 { 7286 mips_pop_asm_switch_1 (asm_switch, "\t", "\n"); 7287 } 7288 7289 /* Print the text for PRINT_OPERAND punctation character CH to FILE. 7290 The punctuation characters are: 7291 7292 '(' Start a nested ".set noreorder" block. 7293 ')' End a nested ".set noreorder" block. 7294 '[' Start a nested ".set noat" block. 7295 ']' End a nested ".set noat" block. 7296 '<' Start a nested ".set nomacro" block. 7297 '>' End a nested ".set nomacro" block. 7298 '*' Behave like %(%< if generating a delayed-branch sequence. 7299 '#' Print a nop if in a ".set noreorder" block. 7300 '/' Like '#', but do nothing within a delayed-branch sequence. 7301 '?' Print "l" if mips_branch_likely is true 7302 '~' Print a nop if mips_branch_likely is true 7303 '.' Print the name of the register with a hard-wired zero (zero or $0). 7304 '@' Print the name of the assembler temporary register (at or $1). 7305 '^' Print the name of the pic call-through register (t9 or $25). 7306 '+' Print the name of the gp register (usually gp or $28). 7307 '$' Print the name of the stack pointer register (sp or $29). 7308 7309 See also mips_init_print_operand_pucnt. */ 7310 7311 static void 7312 mips_print_operand_punctuation (FILE *file, int ch) 7313 { 7314 switch (ch) 7315 { 7316 case '(': 7317 mips_push_asm_switch_1 (&mips_noreorder, "", "\n\t"); 7318 break; 7319 7320 case ')': 7321 mips_pop_asm_switch_1 (&mips_noreorder, "\n\t", ""); 7322 break; 7323 7324 case '[': 7325 mips_push_asm_switch_1 (&mips_noat, "", "\n\t"); 7326 break; 7327 7328 case ']': 7329 mips_pop_asm_switch_1 (&mips_noat, "\n\t", ""); 7330 break; 7331 7332 case '<': 7333 mips_push_asm_switch_1 (&mips_nomacro, "", "\n\t"); 7334 break; 7335 7336 case '>': 7337 mips_pop_asm_switch_1 (&mips_nomacro, "\n\t", ""); 7338 break; 7339 7340 case '*': 7341 if (final_sequence != 0) 7342 { 7343 mips_print_operand_punctuation (file, '('); 7344 mips_print_operand_punctuation (file, '<'); 7345 } 7346 break; 7347 7348 case '#': 7349 if (mips_noreorder.nesting_level > 0) 7350 fputs ("\n\tnop", file); 7351 break; 7352 7353 case '/': 7354 /* Print an extra newline so that the delayed insn is separated 7355 from the following ones. This looks neater and is consistent 7356 with non-nop delayed sequences. */ 7357 if (mips_noreorder.nesting_level > 0 && final_sequence == 0) 7358 fputs ("\n\tnop\n", file); 7359 break; 7360 7361 case '?': 7362 if (mips_branch_likely) 7363 putc ('l', file); 7364 break; 7365 7366 case '~': 7367 if (mips_branch_likely) 7368 fputs ("\n\tnop", file); 7369 break; 7370 7371 case '.': 7372 fputs (reg_names[GP_REG_FIRST + 0], file); 7373 break; 7374 7375 case '@': 7376 fputs (reg_names[AT_REGNUM], file); 7377 break; 7378 7379 case '^': 7380 fputs (reg_names[PIC_FUNCTION_ADDR_REGNUM], file); 7381 break; 7382 7383 case '+': 7384 fputs (reg_names[PIC_OFFSET_TABLE_REGNUM], file); 7385 break; 7386 7387 case '$': 7388 fputs (reg_names[STACK_POINTER_REGNUM], file); 7389 break; 7390 7391 default: 7392 gcc_unreachable (); 7393 break; 7394 } 7395 } 7396 7397 /* Initialize mips_print_operand_punct. */ 7398 7399 static void 7400 mips_init_print_operand_punct (void) 7401 { 7402 const char *p; 7403 7404 for (p = "()[]<>*#/?~.@^+$"; *p; p++) 7405 mips_print_operand_punct[(unsigned char) *p] = true; 7406 } 7407 7408 /* PRINT_OPERAND prefix LETTER refers to the integer branch instruction 7409 associated with condition CODE. Print the condition part of the 7410 opcode to FILE. */ 7411 7412 static void 7413 mips_print_int_branch_condition (FILE *file, enum rtx_code code, int letter) 7414 { 7415 switch (code) 7416 { 7417 case EQ: 7418 case NE: 7419 case GT: 7420 case GE: 7421 case LT: 7422 case LE: 7423 case GTU: 7424 case GEU: 7425 case LTU: 7426 case LEU: 7427 /* Conveniently, the MIPS names for these conditions are the same 7428 as their RTL equivalents. */ 7429 fputs (GET_RTX_NAME (code), file); 7430 break; 7431 7432 default: 7433 output_operand_lossage ("'%%%c' is not a valid operand prefix", letter); 7434 break; 7435 } 7436 } 7437 7438 /* Likewise floating-point branches. */ 7439 7440 static void 7441 mips_print_float_branch_condition (FILE *file, enum rtx_code code, int letter) 7442 { 7443 switch (code) 7444 { 7445 case EQ: 7446 fputs ("c1f", file); 7447 break; 7448 7449 case NE: 7450 fputs ("c1t", file); 7451 break; 7452 7453 default: 7454 output_operand_lossage ("'%%%c' is not a valid operand prefix", letter); 7455 break; 7456 } 7457 } 7458 7459 /* Implement the PRINT_OPERAND macro. The MIPS-specific operand codes are: 7460 7461 'X' Print CONST_INT OP in hexadecimal format. 7462 'x' Print the low 16 bits of CONST_INT OP in hexadecimal format. 7463 'd' Print CONST_INT OP in decimal. 7464 'm' Print one less than CONST_INT OP in decimal. 7465 'h' Print the high-part relocation associated with OP, after stripping 7466 any outermost HIGH. 7467 'R' Print the low-part relocation associated with OP. 7468 'C' Print the integer branch condition for comparison OP. 7469 'N' Print the inverse of the integer branch condition for comparison OP. 7470 'F' Print the FPU branch condition for comparison OP. 7471 'W' Print the inverse of the FPU branch condition for comparison OP. 7472 'T' Print 'f' for (eq:CC ...), 't' for (ne:CC ...), 7473 'z' for (eq:?I ...), 'n' for (ne:?I ...). 7474 't' Like 'T', but with the EQ/NE cases reversed 7475 'Y' Print mips_fp_conditions[INTVAL (OP)] 7476 'Z' Print OP and a comma for ISA_HAS_8CC, otherwise print nothing. 7477 'q' Print a DSP accumulator register. 7478 'D' Print the second part of a double-word register or memory operand. 7479 'L' Print the low-order register in a double-word register operand. 7480 'M' Print high-order register in a double-word register operand. 7481 'z' Print $0 if OP is zero, otherwise print OP normally. */ 7482 7483 void 7484 mips_print_operand (FILE *file, rtx op, int letter) 7485 { 7486 enum rtx_code code; 7487 7488 if (PRINT_OPERAND_PUNCT_VALID_P (letter)) 7489 { 7490 mips_print_operand_punctuation (file, letter); 7491 return; 7492 } 7493 7494 gcc_assert (op); 7495 code = GET_CODE (op); 7496 7497 switch (letter) 7498 { 7499 case 'X': 7500 if (CONST_INT_P (op)) 7501 fprintf (file, HOST_WIDE_INT_PRINT_HEX, INTVAL (op)); 7502 else 7503 output_operand_lossage ("invalid use of '%%%c'", letter); 7504 break; 7505 7506 case 'x': 7507 if (CONST_INT_P (op)) 7508 fprintf (file, HOST_WIDE_INT_PRINT_HEX, INTVAL (op) & 0xffff); 7509 else 7510 output_operand_lossage ("invalid use of '%%%c'", letter); 7511 break; 7512 7513 case 'd': 7514 if (CONST_INT_P (op)) 7515 fprintf (file, HOST_WIDE_INT_PRINT_DEC, INTVAL (op)); 7516 else 7517 output_operand_lossage ("invalid use of '%%%c'", letter); 7518 break; 7519 7520 case 'm': 7521 if (CONST_INT_P (op)) 7522 fprintf (file, HOST_WIDE_INT_PRINT_DEC, INTVAL (op) - 1); 7523 else 7524 output_operand_lossage ("invalid use of '%%%c'", letter); 7525 break; 7526 7527 case 'h': 7528 if (code == HIGH) 7529 op = XEXP (op, 0); 7530 mips_print_operand_reloc (file, op, SYMBOL_CONTEXT_LEA, mips_hi_relocs); 7531 break; 7532 7533 case 'R': 7534 mips_print_operand_reloc (file, op, SYMBOL_CONTEXT_LEA, mips_lo_relocs); 7535 break; 7536 7537 case 'C': 7538 mips_print_int_branch_condition (file, code, letter); 7539 break; 7540 7541 case 'N': 7542 mips_print_int_branch_condition (file, reverse_condition (code), letter); 7543 break; 7544 7545 case 'F': 7546 mips_print_float_branch_condition (file, code, letter); 7547 break; 7548 7549 case 'W': 7550 mips_print_float_branch_condition (file, reverse_condition (code), 7551 letter); 7552 break; 7553 7554 case 'T': 7555 case 't': 7556 { 7557 int truth = (code == NE) == (letter == 'T'); 7558 fputc ("zfnt"[truth * 2 + (GET_MODE (op) == CCmode)], file); 7559 } 7560 break; 7561 7562 case 'Y': 7563 if (code == CONST_INT && UINTVAL (op) < ARRAY_SIZE (mips_fp_conditions)) 7564 fputs (mips_fp_conditions[UINTVAL (op)], file); 7565 else 7566 output_operand_lossage ("'%%%c' is not a valid operand prefix", 7567 letter); 7568 break; 7569 7570 case 'Z': 7571 if (ISA_HAS_8CC) 7572 { 7573 mips_print_operand (file, op, 0); 7574 fputc (',', file); 7575 } 7576 break; 7577 7578 case 'q': 7579 if (code == REG && MD_REG_P (REGNO (op))) 7580 fprintf (file, "$ac0"); 7581 else if (code == REG && DSP_ACC_REG_P (REGNO (op))) 7582 fprintf (file, "$ac%c", reg_names[REGNO (op)][3]); 7583 else 7584 output_operand_lossage ("invalid use of '%%%c'", letter); 7585 break; 7586 7587 default: 7588 switch (code) 7589 { 7590 case REG: 7591 { 7592 unsigned int regno = REGNO (op); 7593 if ((letter == 'M' && TARGET_LITTLE_ENDIAN) 7594 || (letter == 'L' && TARGET_BIG_ENDIAN) 7595 || letter == 'D') 7596 regno++; 7597 else if (letter && letter != 'z' && letter != 'M' && letter != 'L') 7598 output_operand_lossage ("invalid use of '%%%c'", letter); 7599 /* We need to print $0 .. $31 for COP0 registers. */ 7600 if (COP0_REG_P (regno)) 7601 fprintf (file, "$%s", ®_names[regno][4]); 7602 else 7603 fprintf (file, "%s", reg_names[regno]); 7604 } 7605 break; 7606 7607 case MEM: 7608 if (letter == 'D') 7609 output_address (plus_constant (XEXP (op, 0), 4)); 7610 else if (letter && letter != 'z') 7611 output_operand_lossage ("invalid use of '%%%c'", letter); 7612 else 7613 output_address (XEXP (op, 0)); 7614 break; 7615 7616 default: 7617 if (letter == 'z' && op == CONST0_RTX (GET_MODE (op))) 7618 fputs (reg_names[GP_REG_FIRST], file); 7619 else if (letter && letter != 'z') 7620 output_operand_lossage ("invalid use of '%%%c'", letter); 7621 else if (CONST_GP_P (op)) 7622 fputs (reg_names[GLOBAL_POINTER_REGNUM], file); 7623 else 7624 output_addr_const (file, mips_strip_unspec_address (op)); 7625 break; 7626 } 7627 } 7628 } 7629 7630 /* Output address operand X to FILE. */ 7631 7632 void 7633 mips_print_operand_address (FILE *file, rtx x) 7634 { 7635 struct mips_address_info addr; 7636 7637 if (mips_classify_address (&addr, x, word_mode, true)) 7638 switch (addr.type) 7639 { 7640 case ADDRESS_REG: 7641 mips_print_operand (file, addr.offset, 0); 7642 fprintf (file, "(%s)", reg_names[REGNO (addr.reg)]); 7643 return; 7644 7645 case ADDRESS_LO_SUM: 7646 mips_print_operand_reloc (file, addr.offset, SYMBOL_CONTEXT_MEM, 7647 mips_lo_relocs); 7648 fprintf (file, "(%s)", reg_names[REGNO (addr.reg)]); 7649 return; 7650 7651 case ADDRESS_CONST_INT: 7652 output_addr_const (file, x); 7653 fprintf (file, "(%s)", reg_names[GP_REG_FIRST]); 7654 return; 7655 7656 case ADDRESS_SYMBOLIC: 7657 output_addr_const (file, mips_strip_unspec_address (x)); 7658 return; 7659 } 7660 gcc_unreachable (); 7661 } 7662 7663 /* Implement TARGET_ENCODE_SECTION_INFO. */ 7664 7665 static void 7666 mips_encode_section_info (tree decl, rtx rtl, int first) 7667 { 7668 default_encode_section_info (decl, rtl, first); 7669 7670 if (TREE_CODE (decl) == FUNCTION_DECL) 7671 { 7672 rtx symbol = XEXP (rtl, 0); 7673 tree type = TREE_TYPE (decl); 7674 7675 /* Encode whether the symbol is short or long. */ 7676 if ((TARGET_LONG_CALLS && !mips_near_type_p (type)) 7677 || mips_far_type_p (type)) 7678 SYMBOL_REF_FLAGS (symbol) |= SYMBOL_FLAG_LONG_CALL; 7679 } 7680 } 7681 7682 /* Implement TARGET_SELECT_RTX_SECTION. */ 7683 7684 static section * 7685 mips_select_rtx_section (enum machine_mode mode, rtx x, 7686 unsigned HOST_WIDE_INT align) 7687 { 7688 /* ??? Consider using mergeable small data sections. */ 7689 if (mips_rtx_constant_in_small_data_p (mode)) 7690 return get_named_section (NULL, ".sdata", 0); 7691 7692 return default_elf_select_rtx_section (mode, x, align); 7693 } 7694 7695 /* Implement TARGET_ASM_FUNCTION_RODATA_SECTION. 7696 7697 The complication here is that, with the combination TARGET_ABICALLS 7698 && !TARGET_ABSOLUTE_ABICALLS && !TARGET_GPWORD, jump tables will use 7699 absolute addresses, and should therefore not be included in the 7700 read-only part of a DSO. Handle such cases by selecting a normal 7701 data section instead of a read-only one. The logic apes that in 7702 default_function_rodata_section. */ 7703 7704 static section * 7705 mips_function_rodata_section (tree decl) 7706 { 7707 if (!TARGET_ABICALLS || TARGET_ABSOLUTE_ABICALLS || TARGET_GPWORD) 7708 return default_function_rodata_section (decl); 7709 7710 if (decl && DECL_SECTION_NAME (decl)) 7711 { 7712 const char *name = TREE_STRING_POINTER (DECL_SECTION_NAME (decl)); 7713 if (DECL_ONE_ONLY (decl) && strncmp (name, ".gnu.linkonce.t.", 16) == 0) 7714 { 7715 char *rname = ASTRDUP (name); 7716 rname[14] = 'd'; 7717 return get_section (rname, SECTION_LINKONCE | SECTION_WRITE, decl); 7718 } 7719 else if (flag_function_sections 7720 && flag_data_sections 7721 && strncmp (name, ".text.", 6) == 0) 7722 { 7723 char *rname = ASTRDUP (name); 7724 memcpy (rname + 1, "data", 4); 7725 return get_section (rname, SECTION_WRITE, decl); 7726 } 7727 } 7728 return data_section; 7729 } 7730 7731 /* Implement TARGET_IN_SMALL_DATA_P. */ 7732 7733 static bool 7734 mips_in_small_data_p (const_tree decl) 7735 { 7736 unsigned HOST_WIDE_INT size; 7737 7738 if (TREE_CODE (decl) == STRING_CST || TREE_CODE (decl) == FUNCTION_DECL) 7739 return false; 7740 7741 /* We don't yet generate small-data references for -mabicalls 7742 or VxWorks RTP code. See the related -G handling in 7743 mips_override_options. */ 7744 if (TARGET_ABICALLS || TARGET_VXWORKS_RTP) 7745 return false; 7746 7747 if (TREE_CODE (decl) == VAR_DECL && DECL_SECTION_NAME (decl) != 0) 7748 { 7749 const char *name; 7750 7751 /* Reject anything that isn't in a known small-data section. */ 7752 name = TREE_STRING_POINTER (DECL_SECTION_NAME (decl)); 7753 if (strcmp (name, ".sdata") != 0 && strcmp (name, ".sbss") != 0) 7754 return false; 7755 7756 /* If a symbol is defined externally, the assembler will use the 7757 usual -G rules when deciding how to implement macros. */ 7758 if (mips_lo_relocs[SYMBOL_GP_RELATIVE] || !DECL_EXTERNAL (decl)) 7759 return true; 7760 } 7761 else if (TARGET_EMBEDDED_DATA) 7762 { 7763 /* Don't put constants into the small data section: we want them 7764 to be in ROM rather than RAM. */ 7765 if (TREE_CODE (decl) != VAR_DECL) 7766 return false; 7767 7768 if (TREE_READONLY (decl) 7769 && !TREE_SIDE_EFFECTS (decl) 7770 && (!DECL_INITIAL (decl) || TREE_CONSTANT (DECL_INITIAL (decl)))) 7771 return false; 7772 } 7773 7774 /* Enforce -mlocal-sdata. */ 7775 if (!TARGET_LOCAL_SDATA && !TREE_PUBLIC (decl)) 7776 return false; 7777 7778 /* Enforce -mextern-sdata. */ 7779 if (!TARGET_EXTERN_SDATA && DECL_P (decl)) 7780 { 7781 if (DECL_EXTERNAL (decl)) 7782 return false; 7783 if (DECL_COMMON (decl) && DECL_INITIAL (decl) == NULL) 7784 return false; 7785 } 7786 7787 /* We have traditionally not treated zero-sized objects as small data, 7788 so this is now effectively part of the ABI. */ 7789 size = int_size_in_bytes (TREE_TYPE (decl)); 7790 return size > 0 && size <= mips_small_data_threshold; 7791 } 7792 7793 /* Implement TARGET_USE_ANCHORS_FOR_SYMBOL_P. We don't want to use 7794 anchors for small data: the GP register acts as an anchor in that 7795 case. We also don't want to use them for PC-relative accesses, 7796 where the PC acts as an anchor. */ 7797 7798 static bool 7799 mips_use_anchors_for_symbol_p (const_rtx symbol) 7800 { 7801 switch (mips_classify_symbol (symbol, SYMBOL_CONTEXT_MEM)) 7802 { 7803 case SYMBOL_PC_RELATIVE: 7804 case SYMBOL_GP_RELATIVE: 7805 return false; 7806 7807 default: 7808 return default_use_anchors_for_symbol_p (symbol); 7809 } 7810 } 7811 7812 /* The MIPS debug format wants all automatic variables and arguments 7813 to be in terms of the virtual frame pointer (stack pointer before 7814 any adjustment in the function), while the MIPS 3.0 linker wants 7815 the frame pointer to be the stack pointer after the initial 7816 adjustment. So, we do the adjustment here. The arg pointer (which 7817 is eliminated) points to the virtual frame pointer, while the frame 7818 pointer (which may be eliminated) points to the stack pointer after 7819 the initial adjustments. */ 7820 7821 HOST_WIDE_INT 7822 mips_debugger_offset (rtx addr, HOST_WIDE_INT offset) 7823 { 7824 rtx offset2 = const0_rtx; 7825 rtx reg = eliminate_constant_term (addr, &offset2); 7826 7827 if (offset == 0) 7828 offset = INTVAL (offset2); 7829 7830 if (reg == stack_pointer_rtx 7831 || reg == frame_pointer_rtx 7832 || reg == hard_frame_pointer_rtx) 7833 { 7834 offset -= cfun->machine->frame.total_size; 7835 if (reg == hard_frame_pointer_rtx) 7836 offset += cfun->machine->frame.hard_frame_pointer_offset; 7837 } 7838 7839 /* sdbout_parms does not want this to crash for unrecognized cases. */ 7840 #if 0 7841 else if (reg != arg_pointer_rtx) 7842 fatal_insn ("mips_debugger_offset called with non stack/frame/arg pointer", 7843 addr); 7844 #endif 7845 7846 return offset; 7847 } 7848 7849 /* Implement ASM_OUTPUT_EXTERNAL. */ 7850 7851 void 7852 mips_output_external (FILE *file, tree decl, const char *name) 7853 { 7854 default_elf_asm_output_external (file, decl, name); 7855 7856 /* We output the name if and only if TREE_SYMBOL_REFERENCED is 7857 set in order to avoid putting out names that are never really 7858 used. */ 7859 if (TREE_SYMBOL_REFERENCED (DECL_ASSEMBLER_NAME (decl))) 7860 { 7861 if (!TARGET_EXPLICIT_RELOCS && mips_in_small_data_p (decl)) 7862 { 7863 /* When using assembler macros, emit .extern directives for 7864 all small-data externs so that the assembler knows how 7865 big they are. 7866 7867 In most cases it would be safe (though pointless) to emit 7868 .externs for other symbols too. One exception is when an 7869 object is within the -G limit but declared by the user to 7870 be in a section other than .sbss or .sdata. */ 7871 fputs ("\t.extern\t", file); 7872 assemble_name (file, name); 7873 fprintf (file, ", " HOST_WIDE_INT_PRINT_DEC "\n", 7874 int_size_in_bytes (TREE_TYPE (decl))); 7875 } 7876 else if (TARGET_IRIX 7877 && mips_abi == ABI_32 7878 && TREE_CODE (decl) == FUNCTION_DECL) 7879 { 7880 /* In IRIX 5 or IRIX 6 for the O32 ABI, we must output a 7881 `.global name .text' directive for every used but 7882 undefined function. If we don't, the linker may perform 7883 an optimization (skipping over the insns that set $gp) 7884 when it is unsafe. */ 7885 fputs ("\t.globl ", file); 7886 assemble_name (file, name); 7887 fputs (" .text\n", file); 7888 } 7889 } 7890 } 7891 7892 /* Implement ASM_OUTPUT_SOURCE_FILENAME. */ 7893 7894 void 7895 mips_output_filename (FILE *stream, const char *name) 7896 { 7897 /* If we are emitting DWARF-2, let dwarf2out handle the ".file" 7898 directives. */ 7899 if (write_symbols == DWARF2_DEBUG) 7900 return; 7901 else if (mips_output_filename_first_time) 7902 { 7903 mips_output_filename_first_time = 0; 7904 num_source_filenames += 1; 7905 current_function_file = name; 7906 fprintf (stream, "\t.file\t%d ", num_source_filenames); 7907 output_quoted_string (stream, name); 7908 putc ('\n', stream); 7909 } 7910 /* If we are emitting stabs, let dbxout.c handle this (except for 7911 the mips_output_filename_first_time case). */ 7912 else if (write_symbols == DBX_DEBUG) 7913 return; 7914 else if (name != current_function_file 7915 && strcmp (name, current_function_file) != 0) 7916 { 7917 num_source_filenames += 1; 7918 current_function_file = name; 7919 fprintf (stream, "\t.file\t%d ", num_source_filenames); 7920 output_quoted_string (stream, name); 7921 putc ('\n', stream); 7922 } 7923 } 7924 7925 /* Implement TARGET_ASM_OUTPUT_DWARF_DTPREL. */ 7926 7927 static void ATTRIBUTE_UNUSED 7928 mips_output_dwarf_dtprel (FILE *file, int size, rtx x) 7929 { 7930 switch (size) 7931 { 7932 case 4: 7933 fputs ("\t.dtprelword\t", file); 7934 break; 7935 7936 case 8: 7937 fputs ("\t.dtpreldword\t", file); 7938 break; 7939 7940 default: 7941 gcc_unreachable (); 7942 } 7943 output_addr_const (file, x); 7944 fputs ("+0x8000", file); 7945 } 7946 7947 /* Implement TARGET_DWARF_REGISTER_SPAN. */ 7948 7949 static rtx 7950 mips_dwarf_register_span (rtx reg) 7951 { 7952 rtx high, low; 7953 enum machine_mode mode; 7954 7955 /* By default, GCC maps increasing register numbers to increasing 7956 memory locations, but paired FPRs are always little-endian, 7957 regardless of the prevailing endianness. */ 7958 mode = GET_MODE (reg); 7959 if (FP_REG_P (REGNO (reg)) 7960 && TARGET_BIG_ENDIAN 7961 && MAX_FPRS_PER_FMT > 1 7962 && GET_MODE_SIZE (mode) > UNITS_PER_FPREG) 7963 { 7964 gcc_assert (GET_MODE_SIZE (mode) == UNITS_PER_HWFPVALUE); 7965 high = mips_subword (reg, true); 7966 low = mips_subword (reg, false); 7967 return gen_rtx_PARALLEL (VOIDmode, gen_rtvec (2, high, low)); 7968 } 7969 7970 return NULL_RTX; 7971 } 7972 7973 /* Implement ASM_OUTPUT_ASCII. */ 7974 7975 void 7976 mips_output_ascii (FILE *stream, const char *string, size_t len) 7977 { 7978 size_t i; 7979 int cur_pos; 7980 7981 cur_pos = 17; 7982 fprintf (stream, "\t.ascii\t\""); 7983 for (i = 0; i < len; i++) 7984 { 7985 int c; 7986 7987 c = (unsigned char) string[i]; 7988 if (ISPRINT (c)) 7989 { 7990 if (c == '\\' || c == '\"') 7991 { 7992 putc ('\\', stream); 7993 cur_pos++; 7994 } 7995 putc (c, stream); 7996 cur_pos++; 7997 } 7998 else 7999 { 8000 fprintf (stream, "\\%03o", c); 8001 cur_pos += 4; 8002 } 8003 8004 if (cur_pos > 72 && i+1 < len) 8005 { 8006 cur_pos = 17; 8007 fprintf (stream, "\"\n\t.ascii\t\""); 8008 } 8009 } 8010 fprintf (stream, "\"\n"); 8011 } 8012 8013 /* Emit either a label, .comm, or .lcomm directive. When using assembler 8014 macros, mark the symbol as written so that mips_asm_output_external 8015 won't emit an .extern for it. STREAM is the output file, NAME is the 8016 name of the symbol, INIT_STRING is the string that should be written 8017 before the symbol and FINAL_STRING is the string that should be 8018 written after it. FINAL_STRING is a printf format that consumes the 8019 remaining arguments. */ 8020 8021 void 8022 mips_declare_object (FILE *stream, const char *name, const char *init_string, 8023 const char *final_string, ...) 8024 { 8025 va_list ap; 8026 8027 fputs (init_string, stream); 8028 assemble_name (stream, name); 8029 va_start (ap, final_string); 8030 vfprintf (stream, final_string, ap); 8031 va_end (ap); 8032 8033 if (!TARGET_EXPLICIT_RELOCS) 8034 { 8035 tree name_tree = get_identifier (name); 8036 TREE_ASM_WRITTEN (name_tree) = 1; 8037 } 8038 } 8039 8040 /* Declare a common object of SIZE bytes using asm directive INIT_STRING. 8041 NAME is the name of the object and ALIGN is the required alignment 8042 in bytes. TAKES_ALIGNMENT_P is true if the directive takes a third 8043 alignment argument. */ 8044 8045 void 8046 mips_declare_common_object (FILE *stream, const char *name, 8047 const char *init_string, 8048 unsigned HOST_WIDE_INT size, 8049 unsigned int align, bool takes_alignment_p) 8050 { 8051 if (!takes_alignment_p) 8052 { 8053 size += (align / BITS_PER_UNIT) - 1; 8054 size -= size % (align / BITS_PER_UNIT); 8055 mips_declare_object (stream, name, init_string, 8056 "," HOST_WIDE_INT_PRINT_UNSIGNED "\n", size); 8057 } 8058 else 8059 mips_declare_object (stream, name, init_string, 8060 "," HOST_WIDE_INT_PRINT_UNSIGNED ",%u\n", 8061 size, align / BITS_PER_UNIT); 8062 } 8063 8064 /* Implement ASM_OUTPUT_ALIGNED_DECL_COMMON. This is usually the same as the 8065 elfos.h version, but we also need to handle -muninit-const-in-rodata. */ 8066 8067 void 8068 mips_output_aligned_decl_common (FILE *stream, tree decl, const char *name, 8069 unsigned HOST_WIDE_INT size, 8070 unsigned int align) 8071 { 8072 /* If the target wants uninitialized const declarations in 8073 .rdata then don't put them in .comm. */ 8074 if (TARGET_EMBEDDED_DATA 8075 && TARGET_UNINIT_CONST_IN_RODATA 8076 && TREE_CODE (decl) == VAR_DECL 8077 && TREE_READONLY (decl) 8078 && (DECL_INITIAL (decl) == 0 || DECL_INITIAL (decl) == error_mark_node)) 8079 { 8080 if (TREE_PUBLIC (decl) && DECL_NAME (decl)) 8081 targetm.asm_out.globalize_label (stream, name); 8082 8083 switch_to_section (readonly_data_section); 8084 ASM_OUTPUT_ALIGN (stream, floor_log2 (align / BITS_PER_UNIT)); 8085 mips_declare_object (stream, name, "", 8086 ":\n\t.space\t" HOST_WIDE_INT_PRINT_UNSIGNED "\n", 8087 size); 8088 } 8089 else 8090 mips_declare_common_object (stream, name, "\n\t.comm\t", 8091 size, align, true); 8092 } 8093 8094 #ifdef ASM_OUTPUT_SIZE_DIRECTIVE 8095 extern int size_directive_output; 8096 8097 /* Implement ASM_DECLARE_OBJECT_NAME. This is like most of the standard ELF 8098 definitions except that it uses mips_declare_object to emit the label. */ 8099 8100 void 8101 mips_declare_object_name (FILE *stream, const char *name, 8102 tree decl ATTRIBUTE_UNUSED) 8103 { 8104 #ifdef ASM_OUTPUT_TYPE_DIRECTIVE 8105 ASM_OUTPUT_TYPE_DIRECTIVE (stream, name, "object"); 8106 #endif 8107 8108 size_directive_output = 0; 8109 if (!flag_inhibit_size_directive && DECL_SIZE (decl)) 8110 { 8111 HOST_WIDE_INT size; 8112 8113 size_directive_output = 1; 8114 size = int_size_in_bytes (TREE_TYPE (decl)); 8115 ASM_OUTPUT_SIZE_DIRECTIVE (stream, name, size); 8116 } 8117 8118 mips_declare_object (stream, name, "", ":\n"); 8119 } 8120 8121 /* Implement ASM_FINISH_DECLARE_OBJECT. This is generic ELF stuff. */ 8122 8123 void 8124 mips_finish_declare_object (FILE *stream, tree decl, int top_level, int at_end) 8125 { 8126 const char *name; 8127 8128 name = XSTR (XEXP (DECL_RTL (decl), 0), 0); 8129 if (!flag_inhibit_size_directive 8130 && DECL_SIZE (decl) != 0 8131 && !at_end 8132 && top_level 8133 && DECL_INITIAL (decl) == error_mark_node 8134 && !size_directive_output) 8135 { 8136 HOST_WIDE_INT size; 8137 8138 size_directive_output = 1; 8139 size = int_size_in_bytes (TREE_TYPE (decl)); 8140 ASM_OUTPUT_SIZE_DIRECTIVE (stream, name, size); 8141 } 8142 } 8143 #endif 8144 8145 /* Return the FOO in the name of the ".mdebug.FOO" section associated 8146 with the current ABI. */ 8147 8148 static const char * 8149 mips_mdebug_abi_name (void) 8150 { 8151 switch (mips_abi) 8152 { 8153 case ABI_32: 8154 return "abi32"; 8155 case ABI_O64: 8156 return "abiO64"; 8157 case ABI_N32: 8158 return "abiN32"; 8159 case ABI_64: 8160 return "abi64"; 8161 case ABI_EABI: 8162 return TARGET_64BIT ? "eabi64" : "eabi32"; 8163 default: 8164 gcc_unreachable (); 8165 } 8166 } 8167 8168 /* Implement TARGET_ASM_FILE_START. */ 8169 8170 static void 8171 mips_file_start (void) 8172 { 8173 default_file_start (); 8174 8175 /* Generate a special section to describe the ABI switches used to 8176 produce the resultant binary. This is unnecessary on IRIX and 8177 causes unwanted warnings from the native linker. */ 8178 if (!TARGET_IRIX) 8179 { 8180 /* Record the ABI itself. Modern versions of binutils encode 8181 this information in the ELF header flags, but GDB needs the 8182 information in order to correctly debug binaries produced by 8183 older binutils. See the function mips_gdbarch_init in 8184 gdb/mips-tdep.c. */ 8185 fprintf (asm_out_file, "\t.section .mdebug.%s\n\t.previous\n", 8186 mips_mdebug_abi_name ()); 8187 8188 /* There is no ELF header flag to distinguish long32 forms of the 8189 EABI from long64 forms. Emit a special section to help tools 8190 such as GDB. Do the same for o64, which is sometimes used with 8191 -mlong64. */ 8192 if (mips_abi == ABI_EABI || mips_abi == ABI_O64) 8193 fprintf (asm_out_file, "\t.section .gcc_compiled_long%d\n" 8194 "\t.previous\n", TARGET_LONG64 ? 64 : 32); 8195 8196 #ifdef HAVE_AS_GNU_ATTRIBUTE 8197 fprintf (asm_out_file, "\t.gnu_attribute 4, %d\n", 8198 (TARGET_HARD_FLOAT_ABI 8199 ? (TARGET_DOUBLE_FLOAT 8200 ? ((!TARGET_64BIT && TARGET_FLOAT64) ? 4 : 1) : 2) : 3)); 8201 #endif 8202 } 8203 8204 /* If TARGET_ABICALLS, tell GAS to generate -KPIC code. */ 8205 if (TARGET_ABICALLS) 8206 { 8207 fprintf (asm_out_file, "\t.abicalls\n"); 8208 if (TARGET_ABICALLS_PIC0) 8209 fprintf (asm_out_file, "\t.option\tpic0\n"); 8210 } 8211 8212 if (flag_verbose_asm) 8213 fprintf (asm_out_file, "\n%s -G value = %d, Arch = %s, ISA = %d\n", 8214 ASM_COMMENT_START, 8215 mips_small_data_threshold, mips_arch_info->name, mips_isa); 8216 } 8217 8218 /* Make the last instruction frame-related and note that it performs 8219 the operation described by FRAME_PATTERN. */ 8220 8221 static void 8222 mips_set_frame_expr (rtx frame_pattern) 8223 { 8224 rtx insn; 8225 8226 insn = get_last_insn (); 8227 RTX_FRAME_RELATED_P (insn) = 1; 8228 REG_NOTES (insn) = alloc_EXPR_LIST (REG_FRAME_RELATED_EXPR, 8229 frame_pattern, 8230 REG_NOTES (insn)); 8231 } 8232 8233 /* Return a frame-related rtx that stores REG at MEM. 8234 REG must be a single register. */ 8235 8236 static rtx 8237 mips_frame_set (rtx mem, rtx reg) 8238 { 8239 rtx set; 8240 8241 /* If we're saving the return address register and the DWARF return 8242 address column differs from the hard register number, adjust the 8243 note reg to refer to the former. */ 8244 if (REGNO (reg) == RETURN_ADDR_REGNUM 8245 && DWARF_FRAME_RETURN_COLUMN != RETURN_ADDR_REGNUM) 8246 reg = gen_rtx_REG (GET_MODE (reg), DWARF_FRAME_RETURN_COLUMN); 8247 8248 set = gen_rtx_SET (VOIDmode, mem, reg); 8249 RTX_FRAME_RELATED_P (set) = 1; 8250 8251 return set; 8252 } 8253 8254 /* If a MIPS16e SAVE or RESTORE instruction saves or restores register 8255 mips16e_s2_s8_regs[X], it must also save the registers in indexes 8256 X + 1 onwards. Likewise mips16e_a0_a3_regs. */ 8257 static const unsigned char mips16e_s2_s8_regs[] = { 8258 30, 23, 22, 21, 20, 19, 18 8259 }; 8260 static const unsigned char mips16e_a0_a3_regs[] = { 8261 4, 5, 6, 7 8262 }; 8263 8264 /* A list of the registers that can be saved by the MIPS16e SAVE instruction, 8265 ordered from the uppermost in memory to the lowest in memory. */ 8266 static const unsigned char mips16e_save_restore_regs[] = { 8267 31, 30, 23, 22, 21, 20, 19, 18, 17, 16, 7, 6, 5, 4 8268 }; 8269 8270 /* Return the index of the lowest X in the range [0, SIZE) for which 8271 bit REGS[X] is set in MASK. Return SIZE if there is no such X. */ 8272 8273 static unsigned int 8274 mips16e_find_first_register (unsigned int mask, const unsigned char *regs, 8275 unsigned int size) 8276 { 8277 unsigned int i; 8278 8279 for (i = 0; i < size; i++) 8280 if (BITSET_P (mask, regs[i])) 8281 break; 8282 8283 return i; 8284 } 8285 8286 /* *MASK_PTR is a mask of general-purpose registers and *NUM_REGS_PTR 8287 is the number of set bits. If *MASK_PTR contains REGS[X] for some X 8288 in [0, SIZE), adjust *MASK_PTR and *NUM_REGS_PTR so that the same 8289 is true for all indexes (X, SIZE). */ 8290 8291 static void 8292 mips16e_mask_registers (unsigned int *mask_ptr, const unsigned char *regs, 8293 unsigned int size, unsigned int *num_regs_ptr) 8294 { 8295 unsigned int i; 8296 8297 i = mips16e_find_first_register (*mask_ptr, regs, size); 8298 for (i++; i < size; i++) 8299 if (!BITSET_P (*mask_ptr, regs[i])) 8300 { 8301 *num_regs_ptr += 1; 8302 *mask_ptr |= 1 << regs[i]; 8303 } 8304 } 8305 8306 /* Return a simplified form of X using the register values in REG_VALUES. 8307 REG_VALUES[R] is the last value assigned to hard register R, or null 8308 if R has not been modified. 8309 8310 This function is rather limited, but is good enough for our purposes. */ 8311 8312 static rtx 8313 mips16e_collect_propagate_value (rtx x, rtx *reg_values) 8314 { 8315 x = avoid_constant_pool_reference (x); 8316 8317 if (UNARY_P (x)) 8318 { 8319 rtx x0 = mips16e_collect_propagate_value (XEXP (x, 0), reg_values); 8320 return simplify_gen_unary (GET_CODE (x), GET_MODE (x), 8321 x0, GET_MODE (XEXP (x, 0))); 8322 } 8323 8324 if (ARITHMETIC_P (x)) 8325 { 8326 rtx x0 = mips16e_collect_propagate_value (XEXP (x, 0), reg_values); 8327 rtx x1 = mips16e_collect_propagate_value (XEXP (x, 1), reg_values); 8328 return simplify_gen_binary (GET_CODE (x), GET_MODE (x), x0, x1); 8329 } 8330 8331 if (REG_P (x) 8332 && reg_values[REGNO (x)] 8333 && !rtx_unstable_p (reg_values[REGNO (x)])) 8334 return reg_values[REGNO (x)]; 8335 8336 return x; 8337 } 8338 8339 /* Return true if (set DEST SRC) stores an argument register into its 8340 caller-allocated save slot, storing the number of that argument 8341 register in *REGNO_PTR if so. REG_VALUES is as for 8342 mips16e_collect_propagate_value. */ 8343 8344 static bool 8345 mips16e_collect_argument_save_p (rtx dest, rtx src, rtx *reg_values, 8346 unsigned int *regno_ptr) 8347 { 8348 unsigned int argno, regno; 8349 HOST_WIDE_INT offset, required_offset; 8350 rtx addr, base; 8351 8352 /* Check that this is a word-mode store. */ 8353 if (!MEM_P (dest) || !REG_P (src) || GET_MODE (dest) != word_mode) 8354 return false; 8355 8356 /* Check that the register being saved is an unmodified argument 8357 register. */ 8358 regno = REGNO (src); 8359 if (!IN_RANGE (regno, GP_ARG_FIRST, GP_ARG_LAST) || reg_values[regno]) 8360 return false; 8361 argno = regno - GP_ARG_FIRST; 8362 8363 /* Check whether the address is an appropriate stack-pointer or 8364 frame-pointer access. */ 8365 addr = mips16e_collect_propagate_value (XEXP (dest, 0), reg_values); 8366 mips_split_plus (addr, &base, &offset); 8367 required_offset = cfun->machine->frame.total_size + argno * UNITS_PER_WORD; 8368 if (base == hard_frame_pointer_rtx) 8369 required_offset -= cfun->machine->frame.hard_frame_pointer_offset; 8370 else if (base != stack_pointer_rtx) 8371 return false; 8372 if (offset != required_offset) 8373 return false; 8374 8375 *regno_ptr = regno; 8376 return true; 8377 } 8378 8379 /* A subroutine of mips_expand_prologue, called only when generating 8380 MIPS16e SAVE instructions. Search the start of the function for any 8381 instructions that save argument registers into their caller-allocated 8382 save slots. Delete such instructions and return a value N such that 8383 saving [GP_ARG_FIRST, GP_ARG_FIRST + N) would make all the deleted 8384 instructions redundant. */ 8385 8386 static unsigned int 8387 mips16e_collect_argument_saves (void) 8388 { 8389 rtx reg_values[FIRST_PSEUDO_REGISTER]; 8390 rtx insn, next, set, dest, src; 8391 unsigned int nargs, regno; 8392 8393 push_topmost_sequence (); 8394 nargs = 0; 8395 memset (reg_values, 0, sizeof (reg_values)); 8396 for (insn = get_insns (); insn; insn = next) 8397 { 8398 next = NEXT_INSN (insn); 8399 if (NOTE_P (insn) || DEBUG_INSN_P (insn)) 8400 continue; 8401 8402 if (!INSN_P (insn)) 8403 break; 8404 8405 set = PATTERN (insn); 8406 if (GET_CODE (set) != SET) 8407 break; 8408 8409 dest = SET_DEST (set); 8410 src = SET_SRC (set); 8411 if (mips16e_collect_argument_save_p (dest, src, reg_values, ®no)) 8412 { 8413 if (!BITSET_P (cfun->machine->frame.mask, regno)) 8414 { 8415 delete_insn (insn); 8416 nargs = MAX (nargs, (regno - GP_ARG_FIRST) + 1); 8417 } 8418 } 8419 else if (REG_P (dest) && GET_MODE (dest) == word_mode) 8420 reg_values[REGNO (dest)] 8421 = mips16e_collect_propagate_value (src, reg_values); 8422 else 8423 break; 8424 } 8425 pop_topmost_sequence (); 8426 8427 return nargs; 8428 } 8429 8430 /* Return a move between register REGNO and memory location SP + OFFSET. 8431 Make the move a load if RESTORE_P, otherwise make it a frame-related 8432 store. */ 8433 8434 static rtx 8435 mips16e_save_restore_reg (bool restore_p, HOST_WIDE_INT offset, 8436 unsigned int regno) 8437 { 8438 rtx reg, mem; 8439 8440 mem = gen_frame_mem (SImode, plus_constant (stack_pointer_rtx, offset)); 8441 reg = gen_rtx_REG (SImode, regno); 8442 return (restore_p 8443 ? gen_rtx_SET (VOIDmode, reg, mem) 8444 : mips_frame_set (mem, reg)); 8445 } 8446 8447 /* Return RTL for a MIPS16e SAVE or RESTORE instruction; RESTORE_P says which. 8448 The instruction must: 8449 8450 - Allocate or deallocate SIZE bytes in total; SIZE is known 8451 to be nonzero. 8452 8453 - Save or restore as many registers in *MASK_PTR as possible. 8454 The instruction saves the first registers at the top of the 8455 allocated area, with the other registers below it. 8456 8457 - Save NARGS argument registers above the allocated area. 8458 8459 (NARGS is always zero if RESTORE_P.) 8460 8461 The SAVE and RESTORE instructions cannot save and restore all general 8462 registers, so there may be some registers left over for the caller to 8463 handle. Destructively modify *MASK_PTR so that it contains the registers 8464 that still need to be saved or restored. The caller can save these 8465 registers in the memory immediately below *OFFSET_PTR, which is a 8466 byte offset from the bottom of the allocated stack area. */ 8467 8468 static rtx 8469 mips16e_build_save_restore (bool restore_p, unsigned int *mask_ptr, 8470 HOST_WIDE_INT *offset_ptr, unsigned int nargs, 8471 HOST_WIDE_INT size) 8472 { 8473 rtx pattern, set; 8474 HOST_WIDE_INT offset, top_offset; 8475 unsigned int i, regno; 8476 int n; 8477 8478 gcc_assert (cfun->machine->frame.num_fp == 0); 8479 8480 /* Calculate the number of elements in the PARALLEL. We need one element 8481 for the stack adjustment, one for each argument register save, and one 8482 for each additional register move. */ 8483 n = 1 + nargs; 8484 for (i = 0; i < ARRAY_SIZE (mips16e_save_restore_regs); i++) 8485 if (BITSET_P (*mask_ptr, mips16e_save_restore_regs[i])) 8486 n++; 8487 8488 /* Create the final PARALLEL. */ 8489 pattern = gen_rtx_PARALLEL (VOIDmode, rtvec_alloc (n)); 8490 n = 0; 8491 8492 /* Add the stack pointer adjustment. */ 8493 set = gen_rtx_SET (VOIDmode, stack_pointer_rtx, 8494 plus_constant (stack_pointer_rtx, 8495 restore_p ? size : -size)); 8496 RTX_FRAME_RELATED_P (set) = 1; 8497 XVECEXP (pattern, 0, n++) = set; 8498 8499 /* Stack offsets in the PARALLEL are relative to the old stack pointer. */ 8500 top_offset = restore_p ? size : 0; 8501 8502 /* Save the arguments. */ 8503 for (i = 0; i < nargs; i++) 8504 { 8505 offset = top_offset + i * UNITS_PER_WORD; 8506 set = mips16e_save_restore_reg (restore_p, offset, GP_ARG_FIRST + i); 8507 XVECEXP (pattern, 0, n++) = set; 8508 } 8509 8510 /* Then fill in the other register moves. */ 8511 offset = top_offset; 8512 for (i = 0; i < ARRAY_SIZE (mips16e_save_restore_regs); i++) 8513 { 8514 regno = mips16e_save_restore_regs[i]; 8515 if (BITSET_P (*mask_ptr, regno)) 8516 { 8517 offset -= UNITS_PER_WORD; 8518 set = mips16e_save_restore_reg (restore_p, offset, regno); 8519 XVECEXP (pattern, 0, n++) = set; 8520 *mask_ptr &= ~(1 << regno); 8521 } 8522 } 8523 8524 /* Tell the caller what offset it should use for the remaining registers. */ 8525 *offset_ptr = size + (offset - top_offset); 8526 8527 gcc_assert (n == XVECLEN (pattern, 0)); 8528 8529 return pattern; 8530 } 8531 8532 /* PATTERN is a PARALLEL whose first element adds ADJUST to the stack 8533 pointer. Return true if PATTERN matches the kind of instruction 8534 generated by mips16e_build_save_restore. If INFO is nonnull, 8535 initialize it when returning true. */ 8536 8537 bool 8538 mips16e_save_restore_pattern_p (rtx pattern, HOST_WIDE_INT adjust, 8539 struct mips16e_save_restore_info *info) 8540 { 8541 unsigned int i, nargs, mask, extra; 8542 HOST_WIDE_INT top_offset, save_offset, offset; 8543 rtx set, reg, mem, base; 8544 int n; 8545 8546 if (!GENERATE_MIPS16E_SAVE_RESTORE) 8547 return false; 8548 8549 /* Stack offsets in the PARALLEL are relative to the old stack pointer. */ 8550 top_offset = adjust > 0 ? adjust : 0; 8551 8552 /* Interpret all other members of the PARALLEL. */ 8553 save_offset = top_offset - UNITS_PER_WORD; 8554 mask = 0; 8555 nargs = 0; 8556 i = 0; 8557 for (n = 1; n < XVECLEN (pattern, 0); n++) 8558 { 8559 /* Check that we have a SET. */ 8560 set = XVECEXP (pattern, 0, n); 8561 if (GET_CODE (set) != SET) 8562 return false; 8563 8564 /* Check that the SET is a load (if restoring) or a store 8565 (if saving). */ 8566 mem = adjust > 0 ? SET_SRC (set) : SET_DEST (set); 8567 if (!MEM_P (mem)) 8568 return false; 8569 8570 /* Check that the address is the sum of the stack pointer and a 8571 possibly-zero constant offset. */ 8572 mips_split_plus (XEXP (mem, 0), &base, &offset); 8573 if (base != stack_pointer_rtx) 8574 return false; 8575 8576 /* Check that SET's other operand is a register. */ 8577 reg = adjust > 0 ? SET_DEST (set) : SET_SRC (set); 8578 if (!REG_P (reg)) 8579 return false; 8580 8581 /* Check for argument saves. */ 8582 if (offset == top_offset + nargs * UNITS_PER_WORD 8583 && REGNO (reg) == GP_ARG_FIRST + nargs) 8584 nargs++; 8585 else if (offset == save_offset) 8586 { 8587 while (mips16e_save_restore_regs[i++] != REGNO (reg)) 8588 if (i == ARRAY_SIZE (mips16e_save_restore_regs)) 8589 return false; 8590 8591 mask |= 1 << REGNO (reg); 8592 save_offset -= UNITS_PER_WORD; 8593 } 8594 else 8595 return false; 8596 } 8597 8598 /* Check that the restrictions on register ranges are met. */ 8599 extra = 0; 8600 mips16e_mask_registers (&mask, mips16e_s2_s8_regs, 8601 ARRAY_SIZE (mips16e_s2_s8_regs), &extra); 8602 mips16e_mask_registers (&mask, mips16e_a0_a3_regs, 8603 ARRAY_SIZE (mips16e_a0_a3_regs), &extra); 8604 if (extra != 0) 8605 return false; 8606 8607 /* Make sure that the topmost argument register is not saved twice. 8608 The checks above ensure that the same is then true for the other 8609 argument registers. */ 8610 if (nargs > 0 && BITSET_P (mask, GP_ARG_FIRST + nargs - 1)) 8611 return false; 8612 8613 /* Pass back information, if requested. */ 8614 if (info) 8615 { 8616 info->nargs = nargs; 8617 info->mask = mask; 8618 info->size = (adjust > 0 ? adjust : -adjust); 8619 } 8620 8621 return true; 8622 } 8623 8624 /* Add a MIPS16e SAVE or RESTORE register-range argument to string S 8625 for the register range [MIN_REG, MAX_REG]. Return a pointer to 8626 the null terminator. */ 8627 8628 static char * 8629 mips16e_add_register_range (char *s, unsigned int min_reg, 8630 unsigned int max_reg) 8631 { 8632 if (min_reg != max_reg) 8633 s += sprintf (s, ",%s-%s", reg_names[min_reg], reg_names[max_reg]); 8634 else 8635 s += sprintf (s, ",%s", reg_names[min_reg]); 8636 return s; 8637 } 8638 8639 /* Return the assembly instruction for a MIPS16e SAVE or RESTORE instruction. 8640 PATTERN and ADJUST are as for mips16e_save_restore_pattern_p. */ 8641 8642 const char * 8643 mips16e_output_save_restore (rtx pattern, HOST_WIDE_INT adjust) 8644 { 8645 static char buffer[300]; 8646 8647 struct mips16e_save_restore_info info; 8648 unsigned int i, end; 8649 char *s; 8650 8651 /* Parse the pattern. */ 8652 if (!mips16e_save_restore_pattern_p (pattern, adjust, &info)) 8653 gcc_unreachable (); 8654 8655 /* Add the mnemonic. */ 8656 s = strcpy (buffer, adjust > 0 ? "restore\t" : "save\t"); 8657 s += strlen (s); 8658 8659 /* Save the arguments. */ 8660 if (info.nargs > 1) 8661 s += sprintf (s, "%s-%s,", reg_names[GP_ARG_FIRST], 8662 reg_names[GP_ARG_FIRST + info.nargs - 1]); 8663 else if (info.nargs == 1) 8664 s += sprintf (s, "%s,", reg_names[GP_ARG_FIRST]); 8665 8666 /* Emit the amount of stack space to allocate or deallocate. */ 8667 s += sprintf (s, "%d", (int) info.size); 8668 8669 /* Save or restore $16. */ 8670 if (BITSET_P (info.mask, 16)) 8671 s += sprintf (s, ",%s", reg_names[GP_REG_FIRST + 16]); 8672 8673 /* Save or restore $17. */ 8674 if (BITSET_P (info.mask, 17)) 8675 s += sprintf (s, ",%s", reg_names[GP_REG_FIRST + 17]); 8676 8677 /* Save or restore registers in the range $s2...$s8, which 8678 mips16e_s2_s8_regs lists in decreasing order. Note that this 8679 is a software register range; the hardware registers are not 8680 numbered consecutively. */ 8681 end = ARRAY_SIZE (mips16e_s2_s8_regs); 8682 i = mips16e_find_first_register (info.mask, mips16e_s2_s8_regs, end); 8683 if (i < end) 8684 s = mips16e_add_register_range (s, mips16e_s2_s8_regs[end - 1], 8685 mips16e_s2_s8_regs[i]); 8686 8687 /* Save or restore registers in the range $a0...$a3. */ 8688 end = ARRAY_SIZE (mips16e_a0_a3_regs); 8689 i = mips16e_find_first_register (info.mask, mips16e_a0_a3_regs, end); 8690 if (i < end) 8691 s = mips16e_add_register_range (s, mips16e_a0_a3_regs[i], 8692 mips16e_a0_a3_regs[end - 1]); 8693 8694 /* Save or restore $31. */ 8695 if (BITSET_P (info.mask, RETURN_ADDR_REGNUM)) 8696 s += sprintf (s, ",%s", reg_names[RETURN_ADDR_REGNUM]); 8697 8698 return buffer; 8699 } 8700 8701 /* Return true if the current function returns its value in a floating-point 8702 register in MIPS16 mode. */ 8703 8704 static bool 8705 mips16_cfun_returns_in_fpr_p (void) 8706 { 8707 tree return_type = DECL_RESULT (current_function_decl); 8708 return (TARGET_MIPS16 8709 && TARGET_HARD_FLOAT_ABI 8710 && !aggregate_value_p (return_type, current_function_decl) 8711 && mips_return_mode_in_fpr_p (DECL_MODE (return_type))); 8712 } 8713 8714 /* Return true if predicate PRED is true for at least one instruction. 8715 Cache the result in *CACHE, and assume that the result is true 8716 if *CACHE is already true. */ 8717 8718 static bool 8719 mips_find_gp_ref (bool *cache, bool (*pred) (rtx)) 8720 { 8721 rtx insn; 8722 8723 if (!*cache) 8724 { 8725 push_topmost_sequence (); 8726 for (insn = get_insns (); insn; insn = NEXT_INSN (insn)) 8727 if (USEFUL_INSN_P (insn) && pred (insn)) 8728 { 8729 *cache = true; 8730 break; 8731 } 8732 pop_topmost_sequence (); 8733 } 8734 return *cache; 8735 } 8736 8737 /* Return true if INSN refers to the global pointer in an "inflexible" way. 8738 See mips_cfun_has_inflexible_gp_ref_p for details. */ 8739 8740 static bool 8741 mips_insn_has_inflexible_gp_ref_p (rtx insn) 8742 { 8743 /* Uses of pic_offset_table_rtx in CALL_INSN_FUNCTION_USAGE 8744 indicate that the target could be a traditional MIPS 8745 lazily-binding stub. */ 8746 return find_reg_fusage (insn, USE, pic_offset_table_rtx); 8747 } 8748 8749 /* Return true if the current function refers to the global pointer 8750 in a way that forces $28 to be valid. This means that we can't 8751 change the choice of global pointer, even for NewABI code. 8752 8753 One example of this (and one which needs several checks) is that 8754 $28 must be valid when calling traditional MIPS lazy-binding stubs. 8755 (This restriction does not apply to PLTs.) */ 8756 8757 static bool 8758 mips_cfun_has_inflexible_gp_ref_p (void) 8759 { 8760 /* If the function has a nonlocal goto, $28 must hold the correct 8761 global pointer for the target function. That is, the target 8762 of the goto implicitly uses $28. */ 8763 if (crtl->has_nonlocal_goto) 8764 return true; 8765 8766 if (TARGET_ABICALLS_PIC2) 8767 { 8768 /* Symbolic accesses implicitly use the global pointer unless 8769 -mexplicit-relocs is in effect. JAL macros to symbolic addresses 8770 might go to traditional MIPS lazy-binding stubs. */ 8771 if (!TARGET_EXPLICIT_RELOCS) 8772 return true; 8773 8774 /* FUNCTION_PROFILER includes a JAL to _mcount, which again 8775 can be lazily-bound. */ 8776 if (crtl->profile) 8777 return true; 8778 8779 /* MIPS16 functions that return in FPRs need to call an 8780 external libgcc routine. This call is only made explict 8781 during mips_expand_epilogue, and it too might be lazily bound. */ 8782 if (mips16_cfun_returns_in_fpr_p ()) 8783 return true; 8784 } 8785 8786 return mips_find_gp_ref (&cfun->machine->has_inflexible_gp_insn_p, 8787 mips_insn_has_inflexible_gp_ref_p); 8788 } 8789 8790 /* Return true if INSN refers to the global pointer in a "flexible" way. 8791 See mips_cfun_has_flexible_gp_ref_p for details. */ 8792 8793 static bool 8794 mips_insn_has_flexible_gp_ref_p (rtx insn) 8795 { 8796 return (get_attr_got (insn) != GOT_UNSET 8797 || mips_small_data_pattern_p (PATTERN (insn)) 8798 || reg_overlap_mentioned_p (pic_offset_table_rtx, PATTERN (insn))); 8799 } 8800 8801 /* Return true if the current function references the global pointer, 8802 but if those references do not inherently require the global pointer 8803 to be $28. Assume !mips_cfun_has_inflexible_gp_ref_p (). */ 8804 8805 static bool 8806 mips_cfun_has_flexible_gp_ref_p (void) 8807 { 8808 /* Reload can sometimes introduce constant pool references 8809 into a function that otherwise didn't need them. For example, 8810 suppose we have an instruction like: 8811 8812 (set (reg:DF R1) (float:DF (reg:SI R2))) 8813 8814 If R2 turns out to be a constant such as 1, the instruction may 8815 have a REG_EQUAL note saying that R1 == 1.0. Reload then has 8816 the option of using this constant if R2 doesn't get allocated 8817 to a register. 8818 8819 In cases like these, reload will have added the constant to the 8820 pool but no instruction will yet refer to it. */ 8821 if (TARGET_ABICALLS_PIC2 && !reload_completed && crtl->uses_const_pool) 8822 return true; 8823 8824 return mips_find_gp_ref (&cfun->machine->has_flexible_gp_insn_p, 8825 mips_insn_has_flexible_gp_ref_p); 8826 } 8827 8828 /* Return the register that should be used as the global pointer 8829 within this function. Return INVALID_REGNUM if the function 8830 doesn't need a global pointer. */ 8831 8832 static unsigned int 8833 mips_global_pointer (void) 8834 { 8835 unsigned int regno; 8836 8837 /* $gp is always available unless we're using a GOT. */ 8838 if (!TARGET_USE_GOT) 8839 return GLOBAL_POINTER_REGNUM; 8840 8841 /* If there are inflexible references to $gp, we must use the 8842 standard register. */ 8843 if (mips_cfun_has_inflexible_gp_ref_p ()) 8844 return GLOBAL_POINTER_REGNUM; 8845 8846 /* If there are no current references to $gp, then the only uses 8847 we can introduce later are those involved in long branches. */ 8848 if (TARGET_ABSOLUTE_JUMPS && !mips_cfun_has_flexible_gp_ref_p ()) 8849 return INVALID_REGNUM; 8850 8851 /* If the global pointer is call-saved, try to use a call-clobbered 8852 alternative. */ 8853 if (TARGET_CALL_SAVED_GP && current_function_is_leaf) 8854 for (regno = GP_REG_FIRST; regno <= GP_REG_LAST; regno++) 8855 if (!df_regs_ever_live_p (regno) 8856 && call_really_used_regs[regno] 8857 && !fixed_regs[regno] 8858 && regno != PIC_FUNCTION_ADDR_REGNUM) 8859 return regno; 8860 8861 return GLOBAL_POINTER_REGNUM; 8862 } 8863 8864 /* Return true if the current function's prologue must load the global 8865 pointer value into pic_offset_table_rtx and store the same value in 8866 the function's cprestore slot (if any). 8867 8868 One problem we have to deal with is that, when emitting GOT-based 8869 position independent code, long-branch sequences will need to load 8870 the address of the branch target from the GOT. We don't know until 8871 the very end of compilation whether (and where) the function needs 8872 long branches, so we must ensure that _any_ branch can access the 8873 global pointer in some form. However, we do not want to pessimize 8874 the usual case in which all branches are short. 8875 8876 We handle this as follows: 8877 8878 (1) During reload, we set cfun->machine->global_pointer to 8879 INVALID_REGNUM if we _know_ that the current function 8880 doesn't need a global pointer. This is only valid if 8881 long branches don't need the GOT. 8882 8883 Otherwise, we assume that we might need a global pointer 8884 and pick an appropriate register. 8885 8886 (2) If cfun->machine->global_pointer != INVALID_REGNUM, 8887 we ensure that the global pointer is available at every 8888 block boundary bar entry and exit. We do this in one of two ways: 8889 8890 - If the function has a cprestore slot, we ensure that this 8891 slot is valid at every branch. However, as explained in 8892 point (6) below, there is no guarantee that pic_offset_table_rtx 8893 itself is valid if new uses of the global pointer are introduced 8894 after the first post-epilogue split. 8895 8896 We guarantee that the cprestore slot is valid by loading it 8897 into a fake register, CPRESTORE_SLOT_REGNUM. We then make 8898 this register live at every block boundary bar function entry 8899 and exit. It is then invalid to move the load (and thus the 8900 preceding store) across a block boundary. 8901 8902 - If the function has no cprestore slot, we guarantee that 8903 pic_offset_table_rtx itself is valid at every branch. 8904 8905 See mips_eh_uses for the handling of the register liveness. 8906 8907 (3) During prologue and epilogue generation, we emit "ghost" 8908 placeholder instructions to manipulate the global pointer. 8909 8910 (4) During prologue generation, we set cfun->machine->must_initialize_gp_p 8911 and cfun->machine->must_restore_gp_when_clobbered_p if we already know 8912 that the function needs a global pointer. (There is no need to set 8913 them earlier than this, and doing it as late as possible leads to 8914 fewer false positives.) 8915 8916 (5) If cfun->machine->must_initialize_gp_p is true during a 8917 split_insns pass, we split the ghost instructions into real 8918 instructions. These split instructions can then be optimized in 8919 the usual way. Otherwise, we keep the ghost instructions intact, 8920 and optimize for the case where they aren't needed. We still 8921 have the option of splitting them later, if we need to introduce 8922 new uses of the global pointer. 8923 8924 For example, the scheduler ignores a ghost instruction that 8925 stores $28 to the stack, but it handles the split form of 8926 the ghost instruction as an ordinary store. 8927 8928 (6) [OldABI only.] If cfun->machine->must_restore_gp_when_clobbered_p 8929 is true during the first post-epilogue split_insns pass, we split 8930 calls and restore_gp patterns into instructions that explicitly 8931 load pic_offset_table_rtx from the cprestore slot. Otherwise, 8932 we split these patterns into instructions that _don't_ load from 8933 the cprestore slot. 8934 8935 If cfun->machine->must_restore_gp_when_clobbered_p is true at the 8936 time of the split, then any instructions that exist at that time 8937 can make free use of pic_offset_table_rtx. However, if we want 8938 to introduce new uses of the global pointer after the split, 8939 we must explicitly load the value from the cprestore slot, since 8940 pic_offset_table_rtx itself might not be valid at a given point 8941 in the function. 8942 8943 The idea is that we want to be able to delete redundant 8944 loads from the cprestore slot in the usual case where no 8945 long branches are needed. 8946 8947 (7) If cfun->machine->must_initialize_gp_p is still false at the end 8948 of md_reorg, we decide whether the global pointer is needed for 8949 long branches. If so, we set cfun->machine->must_initialize_gp_p 8950 to true and split the ghost instructions into real instructions 8951 at that stage. 8952 8953 Note that the ghost instructions must have a zero length for three reasons: 8954 8955 - Giving the length of the underlying $gp sequence might cause 8956 us to use long branches in cases where they aren't really needed. 8957 8958 - They would perturb things like alignment calculations. 8959 8960 - More importantly, the hazard detection in md_reorg relies on 8961 empty instructions having a zero length. 8962 8963 If we find a long branch and split the ghost instructions at the 8964 end of md_reorg, the split could introduce more long branches. 8965 That isn't a problem though, because we still do the split before 8966 the final shorten_branches pass. 8967 8968 This is extremely ugly, but it seems like the best compromise between 8969 correctness and efficiency. */ 8970 8971 bool 8972 mips_must_initialize_gp_p (void) 8973 { 8974 return cfun->machine->must_initialize_gp_p; 8975 } 8976 8977 /* Return true if REGNO is a register that is ordinarily call-clobbered 8978 but must nevertheless be preserved by an interrupt handler. */ 8979 8980 static bool 8981 mips_interrupt_extra_call_saved_reg_p (unsigned int regno) 8982 { 8983 if (MD_REG_P (regno)) 8984 return true; 8985 8986 if (TARGET_DSP && DSP_ACC_REG_P (regno)) 8987 return true; 8988 8989 if (GP_REG_P (regno) && !cfun->machine->use_shadow_register_set_p) 8990 { 8991 /* $0 is hard-wired. */ 8992 if (regno == GP_REG_FIRST) 8993 return false; 8994 8995 /* The interrupt handler can treat kernel registers as 8996 scratch registers. */ 8997 if (KERNEL_REG_P (regno)) 8998 return false; 8999 9000 /* The function will return the stack pointer to its original value 9001 anyway. */ 9002 if (regno == STACK_POINTER_REGNUM) 9003 return false; 9004 9005 /* Otherwise, return true for registers that aren't ordinarily 9006 call-clobbered. */ 9007 return call_really_used_regs[regno]; 9008 } 9009 9010 return false; 9011 } 9012 9013 /* Return true if the current function should treat register REGNO 9014 as call-saved. */ 9015 9016 static bool 9017 mips_cfun_call_saved_reg_p (unsigned int regno) 9018 { 9019 /* If the user makes an ordinarily-call-saved register global, 9020 that register is no longer call-saved. */ 9021 if (global_regs[regno]) 9022 return false; 9023 9024 /* Interrupt handlers need to save extra registers. */ 9025 if (cfun->machine->interrupt_handler_p 9026 && mips_interrupt_extra_call_saved_reg_p (regno)) 9027 return true; 9028 9029 /* call_insns preserve $28 unless they explicitly say otherwise, 9030 so call_really_used_regs[] treats $28 as call-saved. However, 9031 we want the ABI property rather than the default call_insn 9032 property here. */ 9033 return (regno == GLOBAL_POINTER_REGNUM 9034 ? TARGET_CALL_SAVED_GP 9035 : !call_really_used_regs[regno]); 9036 } 9037 9038 /* Return true if the function body might clobber register REGNO. 9039 We know that REGNO is call-saved. */ 9040 9041 static bool 9042 mips_cfun_might_clobber_call_saved_reg_p (unsigned int regno) 9043 { 9044 /* Some functions should be treated as clobbering all call-saved 9045 registers. */ 9046 if (crtl->saves_all_registers) 9047 return true; 9048 9049 /* DF handles cases where a register is explicitly referenced in 9050 the rtl. Incoming values are passed in call-clobbered registers, 9051 so we can assume that any live call-saved register is set within 9052 the function. */ 9053 if (df_regs_ever_live_p (regno)) 9054 return true; 9055 9056 /* Check for registers that are clobbered by FUNCTION_PROFILER. 9057 These clobbers are not explicit in the rtl. */ 9058 if (crtl->profile && MIPS_SAVE_REG_FOR_PROFILING_P (regno)) 9059 return true; 9060 9061 /* If we're using a call-saved global pointer, the function's 9062 prologue will need to set it up. */ 9063 if (cfun->machine->global_pointer == regno) 9064 return true; 9065 9066 /* The function's prologue will need to set the frame pointer if 9067 frame_pointer_needed. */ 9068 if (regno == HARD_FRAME_POINTER_REGNUM && frame_pointer_needed) 9069 return true; 9070 9071 /* If a MIPS16 function returns a value in FPRs, its epilogue 9072 will need to call an external libgcc routine. This yet-to-be 9073 generated call_insn will clobber $31. */ 9074 if (regno == RETURN_ADDR_REGNUM && mips16_cfun_returns_in_fpr_p ()) 9075 return true; 9076 9077 /* If REGNO is ordinarily call-clobbered, we must assume that any 9078 called function could modify it. */ 9079 if (cfun->machine->interrupt_handler_p 9080 && !current_function_is_leaf 9081 && mips_interrupt_extra_call_saved_reg_p (regno)) 9082 return true; 9083 9084 return false; 9085 } 9086 9087 /* Return true if the current function must save register REGNO. */ 9088 9089 static bool 9090 mips_save_reg_p (unsigned int regno) 9091 { 9092 if (mips_cfun_call_saved_reg_p (regno)) 9093 { 9094 if (mips_cfun_might_clobber_call_saved_reg_p (regno)) 9095 return true; 9096 9097 /* Save both registers in an FPR pair if either one is used. This is 9098 needed for the case when MIN_FPRS_PER_FMT == 1, which allows the odd 9099 register to be used without the even register. */ 9100 if (FP_REG_P (regno) 9101 && MAX_FPRS_PER_FMT == 2 9102 && mips_cfun_might_clobber_call_saved_reg_p (regno + 1)) 9103 return true; 9104 } 9105 9106 /* We need to save the incoming return address if __builtin_eh_return 9107 is being used to set a different return address. */ 9108 if (regno == RETURN_ADDR_REGNUM && crtl->calls_eh_return) 9109 return true; 9110 9111 return false; 9112 } 9113 9114 /* Populate the current function's mips_frame_info structure. 9115 9116 MIPS stack frames look like: 9117 9118 +-------------------------------+ 9119 | | 9120 | incoming stack arguments | 9121 | | 9122 +-------------------------------+ 9123 | | 9124 | caller-allocated save area | 9125 A | for register arguments | 9126 | | 9127 +-------------------------------+ <-- incoming stack pointer 9128 | | 9129 | callee-allocated save area | 9130 B | for arguments that are | 9131 | split between registers and | 9132 | the stack | 9133 | | 9134 +-------------------------------+ <-- arg_pointer_rtx 9135 | | 9136 C | callee-allocated save area | 9137 | for register varargs | 9138 | | 9139 +-------------------------------+ <-- frame_pointer_rtx 9140 | | + cop0_sp_offset 9141 | COP0 reg save area | + UNITS_PER_WORD 9142 | | 9143 +-------------------------------+ <-- frame_pointer_rtx + acc_sp_offset 9144 | | + UNITS_PER_WORD 9145 | accumulator save area | 9146 | | 9147 +-------------------------------+ <-- stack_pointer_rtx + fp_sp_offset 9148 | | + UNITS_PER_HWFPVALUE 9149 | FPR save area | 9150 | | 9151 +-------------------------------+ <-- stack_pointer_rtx + gp_sp_offset 9152 | | + UNITS_PER_WORD 9153 | GPR save area | 9154 | | 9155 +-------------------------------+ <-- frame_pointer_rtx with 9156 | | \ -fstack-protector 9157 | local variables | | var_size 9158 | | / 9159 +-------------------------------+ 9160 | | \ 9161 | $gp save area | | cprestore_size 9162 | | / 9163 P +-------------------------------+ <-- hard_frame_pointer_rtx for 9164 | | \ MIPS16 code 9165 | outgoing stack arguments | | 9166 | | | 9167 +-------------------------------+ | args_size 9168 | | | 9169 | caller-allocated save area | | 9170 | for register arguments | | 9171 | | / 9172 +-------------------------------+ <-- stack_pointer_rtx 9173 frame_pointer_rtx without 9174 -fstack-protector 9175 hard_frame_pointer_rtx for 9176 non-MIPS16 code. 9177 9178 At least two of A, B and C will be empty. 9179 9180 Dynamic stack allocations such as alloca insert data at point P. 9181 They decrease stack_pointer_rtx but leave frame_pointer_rtx and 9182 hard_frame_pointer_rtx unchanged. */ 9183 9184 static void 9185 mips_compute_frame_info (void) 9186 { 9187 struct mips_frame_info *frame; 9188 HOST_WIDE_INT offset, size; 9189 unsigned int regno, i; 9190 9191 /* Set this function's interrupt properties. */ 9192 if (mips_interrupt_type_p (TREE_TYPE (current_function_decl))) 9193 { 9194 if (!ISA_MIPS32R2) 9195 error ("the %<interrupt%> attribute requires a MIPS32r2 processor"); 9196 else if (TARGET_HARD_FLOAT) 9197 error ("the %<interrupt%> attribute requires %<-msoft-float%>"); 9198 else if (TARGET_MIPS16) 9199 error ("interrupt handlers cannot be MIPS16 functions"); 9200 else 9201 { 9202 cfun->machine->interrupt_handler_p = true; 9203 cfun->machine->use_shadow_register_set_p = 9204 mips_use_shadow_register_set_p (TREE_TYPE (current_function_decl)); 9205 cfun->machine->keep_interrupts_masked_p = 9206 mips_keep_interrupts_masked_p (TREE_TYPE (current_function_decl)); 9207 cfun->machine->use_debug_exception_return_p = 9208 mips_use_debug_exception_return_p (TREE_TYPE 9209 (current_function_decl)); 9210 } 9211 } 9212 9213 frame = &cfun->machine->frame; 9214 memset (frame, 0, sizeof (*frame)); 9215 size = get_frame_size (); 9216 9217 cfun->machine->global_pointer = mips_global_pointer (); 9218 9219 /* The first two blocks contain the outgoing argument area and the $gp save 9220 slot. This area isn't needed in leaf functions, but if the 9221 target-independent frame size is nonzero, we have already committed to 9222 allocating these in STARTING_FRAME_OFFSET for !FRAME_GROWS_DOWNWARD. */ 9223 if ((size == 0 || FRAME_GROWS_DOWNWARD) && current_function_is_leaf) 9224 { 9225 /* The MIPS 3.0 linker does not like functions that dynamically 9226 allocate the stack and have 0 for STACK_DYNAMIC_OFFSET, since it 9227 looks like we are trying to create a second frame pointer to the 9228 function, so allocate some stack space to make it happy. */ 9229 if (cfun->calls_alloca) 9230 frame->args_size = REG_PARM_STACK_SPACE (cfun->decl); 9231 else 9232 frame->args_size = 0; 9233 frame->cprestore_size = 0; 9234 } 9235 else 9236 { 9237 frame->args_size = crtl->outgoing_args_size; 9238 frame->cprestore_size = MIPS_GP_SAVE_AREA_SIZE; 9239 } 9240 offset = frame->args_size + frame->cprestore_size; 9241 9242 /* Move above the local variables. */ 9243 frame->var_size = MIPS_STACK_ALIGN (size); 9244 offset += frame->var_size; 9245 9246 /* Find out which GPRs we need to save. */ 9247 for (regno = GP_REG_FIRST; regno <= GP_REG_LAST; regno++) 9248 if (mips_save_reg_p (regno)) 9249 { 9250 frame->num_gp++; 9251 frame->mask |= 1 << (regno - GP_REG_FIRST); 9252 } 9253 9254 /* If this function calls eh_return, we must also save and restore the 9255 EH data registers. */ 9256 if (crtl->calls_eh_return) 9257 for (i = 0; EH_RETURN_DATA_REGNO (i) != INVALID_REGNUM; i++) 9258 { 9259 frame->num_gp++; 9260 frame->mask |= 1 << (EH_RETURN_DATA_REGNO (i) - GP_REG_FIRST); 9261 } 9262 9263 /* The MIPS16e SAVE and RESTORE instructions have two ranges of registers: 9264 $a3-$a0 and $s2-$s8. If we save one register in the range, we must 9265 save all later registers too. */ 9266 if (GENERATE_MIPS16E_SAVE_RESTORE) 9267 { 9268 mips16e_mask_registers (&frame->mask, mips16e_s2_s8_regs, 9269 ARRAY_SIZE (mips16e_s2_s8_regs), &frame->num_gp); 9270 mips16e_mask_registers (&frame->mask, mips16e_a0_a3_regs, 9271 ARRAY_SIZE (mips16e_a0_a3_regs), &frame->num_gp); 9272 } 9273 9274 /* Move above the GPR save area. */ 9275 if (frame->num_gp > 0) 9276 { 9277 offset += MIPS_STACK_ALIGN (frame->num_gp * UNITS_PER_WORD); 9278 frame->gp_sp_offset = offset - UNITS_PER_WORD; 9279 } 9280 9281 /* Find out which FPRs we need to save. This loop must iterate over 9282 the same space as its companion in mips_for_each_saved_gpr_and_fpr. */ 9283 if (TARGET_HARD_FLOAT) 9284 for (regno = FP_REG_FIRST; regno <= FP_REG_LAST; regno += MAX_FPRS_PER_FMT) 9285 if (mips_save_reg_p (regno)) 9286 { 9287 frame->num_fp += MAX_FPRS_PER_FMT; 9288 frame->fmask |= ~(~0 << MAX_FPRS_PER_FMT) << (regno - FP_REG_FIRST); 9289 } 9290 9291 /* Move above the FPR save area. */ 9292 if (frame->num_fp > 0) 9293 { 9294 offset += MIPS_STACK_ALIGN (frame->num_fp * UNITS_PER_FPREG); 9295 frame->fp_sp_offset = offset - UNITS_PER_HWFPVALUE; 9296 } 9297 9298 /* Add in space for the interrupt context information. */ 9299 if (cfun->machine->interrupt_handler_p) 9300 { 9301 /* Check HI/LO. */ 9302 if (mips_save_reg_p (LO_REGNUM) || mips_save_reg_p (HI_REGNUM)) 9303 { 9304 frame->num_acc++; 9305 frame->acc_mask |= (1 << 0); 9306 } 9307 9308 /* Check accumulators 1, 2, 3. */ 9309 for (i = DSP_ACC_REG_FIRST; i <= DSP_ACC_REG_LAST; i += 2) 9310 if (mips_save_reg_p (i) || mips_save_reg_p (i + 1)) 9311 { 9312 frame->num_acc++; 9313 frame->acc_mask |= 1 << (((i - DSP_ACC_REG_FIRST) / 2) + 1); 9314 } 9315 9316 /* All interrupt context functions need space to preserve STATUS. */ 9317 frame->num_cop0_regs++; 9318 9319 /* If we don't keep interrupts masked, we need to save EPC. */ 9320 if (!cfun->machine->keep_interrupts_masked_p) 9321 frame->num_cop0_regs++; 9322 } 9323 9324 /* Move above the accumulator save area. */ 9325 if (frame->num_acc > 0) 9326 { 9327 /* Each accumulator needs 2 words. */ 9328 offset += frame->num_acc * 2 * UNITS_PER_WORD; 9329 frame->acc_sp_offset = offset - UNITS_PER_WORD; 9330 } 9331 9332 /* Move above the COP0 register save area. */ 9333 if (frame->num_cop0_regs > 0) 9334 { 9335 offset += frame->num_cop0_regs * UNITS_PER_WORD; 9336 frame->cop0_sp_offset = offset - UNITS_PER_WORD; 9337 } 9338 9339 /* Move above the callee-allocated varargs save area. */ 9340 offset += MIPS_STACK_ALIGN (cfun->machine->varargs_size); 9341 frame->arg_pointer_offset = offset; 9342 9343 /* Move above the callee-allocated area for pretend stack arguments. */ 9344 offset += crtl->args.pretend_args_size; 9345 frame->total_size = offset; 9346 9347 /* Work out the offsets of the save areas from the top of the frame. */ 9348 if (frame->gp_sp_offset > 0) 9349 frame->gp_save_offset = frame->gp_sp_offset - offset; 9350 if (frame->fp_sp_offset > 0) 9351 frame->fp_save_offset = frame->fp_sp_offset - offset; 9352 if (frame->acc_sp_offset > 0) 9353 frame->acc_save_offset = frame->acc_sp_offset - offset; 9354 if (frame->num_cop0_regs > 0) 9355 frame->cop0_save_offset = frame->cop0_sp_offset - offset; 9356 9357 /* MIPS16 code offsets the frame pointer by the size of the outgoing 9358 arguments. This tends to increase the chances of using unextended 9359 instructions for local variables and incoming arguments. */ 9360 if (TARGET_MIPS16) 9361 frame->hard_frame_pointer_offset = frame->args_size; 9362 } 9363 9364 /* Return the style of GP load sequence that is being used for the 9365 current function. */ 9366 9367 enum mips_loadgp_style 9368 mips_current_loadgp_style (void) 9369 { 9370 if (!TARGET_USE_GOT || cfun->machine->global_pointer == INVALID_REGNUM) 9371 return LOADGP_NONE; 9372 9373 if (TARGET_RTP_PIC) 9374 return LOADGP_RTP; 9375 9376 if (TARGET_ABSOLUTE_ABICALLS) 9377 return LOADGP_ABSOLUTE; 9378 9379 return TARGET_NEWABI ? LOADGP_NEWABI : LOADGP_OLDABI; 9380 } 9381 9382 /* Implement TARGET_FRAME_POINTER_REQUIRED. */ 9383 9384 static bool 9385 mips_frame_pointer_required (void) 9386 { 9387 /* If the function contains dynamic stack allocations, we need to 9388 use the frame pointer to access the static parts of the frame. */ 9389 if (cfun->calls_alloca) 9390 return true; 9391 9392 /* In MIPS16 mode, we need a frame pointer for a large frame; otherwise, 9393 reload may be unable to compute the address of a local variable, 9394 since there is no way to add a large constant to the stack pointer 9395 without using a second temporary register. */ 9396 if (TARGET_MIPS16) 9397 { 9398 mips_compute_frame_info (); 9399 if (!SMALL_OPERAND (cfun->machine->frame.total_size)) 9400 return true; 9401 } 9402 9403 return false; 9404 } 9405 9406 /* Make sure that we're not trying to eliminate to the wrong hard frame 9407 pointer. */ 9408 9409 static bool 9410 mips_can_eliminate (const int from ATTRIBUTE_UNUSED, const int to) 9411 { 9412 return (to == HARD_FRAME_POINTER_REGNUM || to == STACK_POINTER_REGNUM); 9413 } 9414 9415 /* Implement INITIAL_ELIMINATION_OFFSET. FROM is either the frame pointer 9416 or argument pointer. TO is either the stack pointer or hard frame 9417 pointer. */ 9418 9419 HOST_WIDE_INT 9420 mips_initial_elimination_offset (int from, int to) 9421 { 9422 HOST_WIDE_INT offset; 9423 9424 mips_compute_frame_info (); 9425 9426 /* Set OFFSET to the offset from the end-of-prologue stack pointer. */ 9427 switch (from) 9428 { 9429 case FRAME_POINTER_REGNUM: 9430 if (FRAME_GROWS_DOWNWARD) 9431 offset = (cfun->machine->frame.args_size 9432 + cfun->machine->frame.cprestore_size 9433 + cfun->machine->frame.var_size); 9434 else 9435 offset = 0; 9436 break; 9437 9438 case ARG_POINTER_REGNUM: 9439 offset = cfun->machine->frame.arg_pointer_offset; 9440 break; 9441 9442 default: 9443 gcc_unreachable (); 9444 } 9445 9446 if (to == HARD_FRAME_POINTER_REGNUM) 9447 offset -= cfun->machine->frame.hard_frame_pointer_offset; 9448 9449 return offset; 9450 } 9451 9452 /* Implement TARGET_EXTRA_LIVE_ON_ENTRY. */ 9453 9454 static void 9455 mips_extra_live_on_entry (bitmap regs) 9456 { 9457 if (TARGET_USE_GOT) 9458 { 9459 /* PIC_FUNCTION_ADDR_REGNUM is live if we need it to set up 9460 the global pointer. */ 9461 if (!TARGET_ABSOLUTE_ABICALLS) 9462 bitmap_set_bit (regs, PIC_FUNCTION_ADDR_REGNUM); 9463 9464 /* The prologue may set MIPS16_PIC_TEMP_REGNUM to the value of 9465 the global pointer. */ 9466 if (TARGET_MIPS16) 9467 bitmap_set_bit (regs, MIPS16_PIC_TEMP_REGNUM); 9468 9469 /* See the comment above load_call<mode> for details. */ 9470 bitmap_set_bit (regs, GOT_VERSION_REGNUM); 9471 } 9472 } 9473 9474 /* Implement RETURN_ADDR_RTX. We do not support moving back to a 9475 previous frame. */ 9476 9477 rtx 9478 mips_return_addr (int count, rtx frame ATTRIBUTE_UNUSED) 9479 { 9480 if (count != 0) 9481 return const0_rtx; 9482 9483 return get_hard_reg_initial_val (Pmode, RETURN_ADDR_REGNUM); 9484 } 9485 9486 /* Emit code to change the current function's return address to 9487 ADDRESS. SCRATCH is available as a scratch register, if needed. 9488 ADDRESS and SCRATCH are both word-mode GPRs. */ 9489 9490 void 9491 mips_set_return_address (rtx address, rtx scratch) 9492 { 9493 rtx slot_address; 9494 9495 gcc_assert (BITSET_P (cfun->machine->frame.mask, RETURN_ADDR_REGNUM)); 9496 slot_address = mips_add_offset (scratch, stack_pointer_rtx, 9497 cfun->machine->frame.gp_sp_offset); 9498 mips_emit_move (gen_frame_mem (GET_MODE (address), slot_address), address); 9499 } 9500 9501 /* Return true if the current function has a cprestore slot. */ 9502 9503 bool 9504 mips_cfun_has_cprestore_slot_p (void) 9505 { 9506 return (cfun->machine->global_pointer != INVALID_REGNUM 9507 && cfun->machine->frame.cprestore_size > 0); 9508 } 9509 9510 /* Fill *BASE and *OFFSET such that *BASE + *OFFSET refers to the 9511 cprestore slot. LOAD_P is true if the caller wants to load from 9512 the cprestore slot; it is false if the caller wants to store to 9513 the slot. */ 9514 9515 static void 9516 mips_get_cprestore_base_and_offset (rtx *base, HOST_WIDE_INT *offset, 9517 bool load_p) 9518 { 9519 const struct mips_frame_info *frame; 9520 9521 frame = &cfun->machine->frame; 9522 /* .cprestore always uses the stack pointer instead of the frame pointer. 9523 We have a free choice for direct stores for non-MIPS16 functions, 9524 and for MIPS16 functions whose cprestore slot is in range of the 9525 stack pointer. Using the stack pointer would sometimes give more 9526 (early) scheduling freedom, but using the frame pointer would 9527 sometimes give more (late) scheduling freedom. It's hard to 9528 predict which applies to a given function, so let's keep things 9529 simple. 9530 9531 Loads must always use the frame pointer in functions that call 9532 alloca, and there's little benefit to using the stack pointer 9533 otherwise. */ 9534 if (frame_pointer_needed && !(TARGET_CPRESTORE_DIRECTIVE && !load_p)) 9535 { 9536 *base = hard_frame_pointer_rtx; 9537 *offset = frame->args_size - frame->hard_frame_pointer_offset; 9538 } 9539 else 9540 { 9541 *base = stack_pointer_rtx; 9542 *offset = frame->args_size; 9543 } 9544 } 9545 9546 /* Return true if X is the load or store address of the cprestore slot; 9547 LOAD_P says which. */ 9548 9549 bool 9550 mips_cprestore_address_p (rtx x, bool load_p) 9551 { 9552 rtx given_base, required_base; 9553 HOST_WIDE_INT given_offset, required_offset; 9554 9555 mips_split_plus (x, &given_base, &given_offset); 9556 mips_get_cprestore_base_and_offset (&required_base, &required_offset, load_p); 9557 return given_base == required_base && given_offset == required_offset; 9558 } 9559 9560 /* Return a MEM rtx for the cprestore slot. LOAD_P is true if we are 9561 going to load from it, false if we are going to store to it. 9562 Use TEMP as a temporary register if need be. */ 9563 9564 static rtx 9565 mips_cprestore_slot (rtx temp, bool load_p) 9566 { 9567 rtx base; 9568 HOST_WIDE_INT offset; 9569 9570 mips_get_cprestore_base_and_offset (&base, &offset, load_p); 9571 return gen_frame_mem (Pmode, mips_add_offset (temp, base, offset)); 9572 } 9573 9574 /* Emit instructions to save global pointer value GP into cprestore 9575 slot MEM. OFFSET is the offset that MEM applies to the base register. 9576 9577 MEM may not be a legitimate address. If it isn't, TEMP is a 9578 temporary register that can be used, otherwise it is a SCRATCH. */ 9579 9580 void 9581 mips_save_gp_to_cprestore_slot (rtx mem, rtx offset, rtx gp, rtx temp) 9582 { 9583 if (TARGET_CPRESTORE_DIRECTIVE) 9584 { 9585 gcc_assert (gp == pic_offset_table_rtx); 9586 emit_insn (gen_cprestore (mem, offset)); 9587 } 9588 else 9589 mips_emit_move (mips_cprestore_slot (temp, false), gp); 9590 } 9591 9592 /* Restore $gp from its save slot, using TEMP as a temporary base register 9593 if need be. This function is for o32 and o64 abicalls only. 9594 9595 See mips_must_initialize_gp_p for details about how we manage the 9596 global pointer. */ 9597 9598 void 9599 mips_restore_gp_from_cprestore_slot (rtx temp) 9600 { 9601 gcc_assert (TARGET_ABICALLS && TARGET_OLDABI && epilogue_completed); 9602 9603 if (!cfun->machine->must_restore_gp_when_clobbered_p) 9604 { 9605 emit_note (NOTE_INSN_DELETED); 9606 return; 9607 } 9608 9609 if (TARGET_MIPS16) 9610 { 9611 mips_emit_move (temp, mips_cprestore_slot (temp, true)); 9612 mips_emit_move (pic_offset_table_rtx, temp); 9613 } 9614 else 9615 mips_emit_move (pic_offset_table_rtx, mips_cprestore_slot (temp, true)); 9616 if (!TARGET_EXPLICIT_RELOCS) 9617 emit_insn (gen_blockage ()); 9618 } 9619 9620 /* A function to save or store a register. The first argument is the 9621 register and the second is the stack slot. */ 9622 typedef void (*mips_save_restore_fn) (rtx, rtx); 9623 9624 /* Use FN to save or restore register REGNO. MODE is the register's 9625 mode and OFFSET is the offset of its save slot from the current 9626 stack pointer. */ 9627 9628 static void 9629 mips_save_restore_reg (enum machine_mode mode, int regno, 9630 HOST_WIDE_INT offset, mips_save_restore_fn fn) 9631 { 9632 rtx mem; 9633 9634 mem = gen_frame_mem (mode, plus_constant (stack_pointer_rtx, offset)); 9635 fn (gen_rtx_REG (mode, regno), mem); 9636 } 9637 9638 /* Call FN for each accumlator that is saved by the current function. 9639 SP_OFFSET is the offset of the current stack pointer from the start 9640 of the frame. */ 9641 9642 static void 9643 mips_for_each_saved_acc (HOST_WIDE_INT sp_offset, mips_save_restore_fn fn) 9644 { 9645 HOST_WIDE_INT offset; 9646 int regno; 9647 9648 offset = cfun->machine->frame.acc_sp_offset - sp_offset; 9649 if (BITSET_P (cfun->machine->frame.acc_mask, 0)) 9650 { 9651 mips_save_restore_reg (word_mode, LO_REGNUM, offset, fn); 9652 offset -= UNITS_PER_WORD; 9653 mips_save_restore_reg (word_mode, HI_REGNUM, offset, fn); 9654 offset -= UNITS_PER_WORD; 9655 } 9656 9657 for (regno = DSP_ACC_REG_FIRST; regno <= DSP_ACC_REG_LAST; regno++) 9658 if (BITSET_P (cfun->machine->frame.acc_mask, 9659 ((regno - DSP_ACC_REG_FIRST) / 2) + 1)) 9660 { 9661 mips_save_restore_reg (word_mode, regno, offset, fn); 9662 offset -= UNITS_PER_WORD; 9663 } 9664 } 9665 9666 /* Call FN for each register that is saved by the current function. 9667 SP_OFFSET is the offset of the current stack pointer from the start 9668 of the frame. */ 9669 9670 static void 9671 mips_for_each_saved_gpr_and_fpr (HOST_WIDE_INT sp_offset, 9672 mips_save_restore_fn fn) 9673 { 9674 enum machine_mode fpr_mode; 9675 HOST_WIDE_INT offset; 9676 int regno; 9677 9678 /* Save registers starting from high to low. The debuggers prefer at least 9679 the return register be stored at func+4, and also it allows us not to 9680 need a nop in the epilogue if at least one register is reloaded in 9681 addition to return address. */ 9682 offset = cfun->machine->frame.gp_sp_offset - sp_offset; 9683 for (regno = GP_REG_LAST; regno >= GP_REG_FIRST; regno--) 9684 if (BITSET_P (cfun->machine->frame.mask, regno - GP_REG_FIRST)) 9685 { 9686 /* Record the ra offset for use by mips_function_profiler. */ 9687 if (regno == RETURN_ADDR_REGNUM) 9688 cfun->machine->frame.ra_fp_offset = offset + sp_offset; 9689 mips_save_restore_reg (word_mode, regno, offset, fn); 9690 offset -= UNITS_PER_WORD; 9691 } 9692 9693 /* This loop must iterate over the same space as its companion in 9694 mips_compute_frame_info. */ 9695 offset = cfun->machine->frame.fp_sp_offset - sp_offset; 9696 fpr_mode = (TARGET_SINGLE_FLOAT ? SFmode : DFmode); 9697 for (regno = FP_REG_LAST - MAX_FPRS_PER_FMT + 1; 9698 regno >= FP_REG_FIRST; 9699 regno -= MAX_FPRS_PER_FMT) 9700 if (BITSET_P (cfun->machine->frame.fmask, regno - FP_REG_FIRST)) 9701 { 9702 mips_save_restore_reg (fpr_mode, regno, offset, fn); 9703 offset -= GET_MODE_SIZE (fpr_mode); 9704 } 9705 } 9706 9707 /* Return true if a move between register REGNO and its save slot (MEM) 9708 can be done in a single move. LOAD_P is true if we are loading 9709 from the slot, false if we are storing to it. */ 9710 9711 static bool 9712 mips_direct_save_slot_move_p (unsigned int regno, rtx mem, bool load_p) 9713 { 9714 /* There is a specific MIPS16 instruction for saving $31 to the stack. */ 9715 if (TARGET_MIPS16 && !load_p && regno == RETURN_ADDR_REGNUM) 9716 return false; 9717 9718 return mips_secondary_reload_class (REGNO_REG_CLASS (regno), 9719 GET_MODE (mem), mem, load_p) == NO_REGS; 9720 } 9721 9722 /* Emit a move from SRC to DEST, given that one of them is a register 9723 save slot and that the other is a register. TEMP is a temporary 9724 GPR of the same mode that is available if need be. */ 9725 9726 void 9727 mips_emit_save_slot_move (rtx dest, rtx src, rtx temp) 9728 { 9729 unsigned int regno; 9730 rtx mem; 9731 9732 if (REG_P (src)) 9733 { 9734 regno = REGNO (src); 9735 mem = dest; 9736 } 9737 else 9738 { 9739 regno = REGNO (dest); 9740 mem = src; 9741 } 9742 9743 if (regno == cfun->machine->global_pointer && !mips_must_initialize_gp_p ()) 9744 { 9745 /* We don't yet know whether we'll need this instruction or not. 9746 Postpone the decision by emitting a ghost move. This move 9747 is specifically not frame-related; only the split version is. */ 9748 if (TARGET_64BIT) 9749 emit_insn (gen_move_gpdi (dest, src)); 9750 else 9751 emit_insn (gen_move_gpsi (dest, src)); 9752 return; 9753 } 9754 9755 if (regno == HI_REGNUM) 9756 { 9757 if (REG_P (dest)) 9758 { 9759 mips_emit_move (temp, src); 9760 if (TARGET_64BIT) 9761 emit_insn (gen_mthisi_di (gen_rtx_REG (TImode, MD_REG_FIRST), 9762 temp, gen_rtx_REG (DImode, LO_REGNUM))); 9763 else 9764 emit_insn (gen_mthisi_di (gen_rtx_REG (DImode, MD_REG_FIRST), 9765 temp, gen_rtx_REG (SImode, LO_REGNUM))); 9766 } 9767 else 9768 { 9769 if (TARGET_64BIT) 9770 emit_insn (gen_mfhidi_ti (temp, 9771 gen_rtx_REG (TImode, MD_REG_FIRST))); 9772 else 9773 emit_insn (gen_mfhisi_di (temp, 9774 gen_rtx_REG (DImode, MD_REG_FIRST))); 9775 mips_emit_move (dest, temp); 9776 } 9777 } 9778 else if (mips_direct_save_slot_move_p (regno, mem, mem == src)) 9779 mips_emit_move (dest, src); 9780 else 9781 { 9782 gcc_assert (!reg_overlap_mentioned_p (dest, temp)); 9783 mips_emit_move (temp, src); 9784 mips_emit_move (dest, temp); 9785 } 9786 if (MEM_P (dest)) 9787 mips_set_frame_expr (mips_frame_set (dest, src)); 9788 } 9789 9790 /* If we're generating n32 or n64 abicalls, and the current function 9791 does not use $28 as its global pointer, emit a cplocal directive. 9792 Use pic_offset_table_rtx as the argument to the directive. */ 9793 9794 static void 9795 mips_output_cplocal (void) 9796 { 9797 if (!TARGET_EXPLICIT_RELOCS 9798 && mips_must_initialize_gp_p () 9799 && cfun->machine->global_pointer != GLOBAL_POINTER_REGNUM) 9800 output_asm_insn (".cplocal %+", 0); 9801 } 9802 9803 /* Implement TARGET_OUTPUT_FUNCTION_PROLOGUE. */ 9804 9805 static void 9806 mips_output_function_prologue (FILE *file, HOST_WIDE_INT size ATTRIBUTE_UNUSED) 9807 { 9808 const char *fnname; 9809 9810 #ifdef SDB_DEBUGGING_INFO 9811 if (debug_info_level != DINFO_LEVEL_TERSE && write_symbols == SDB_DEBUG) 9812 SDB_OUTPUT_SOURCE_LINE (file, DECL_SOURCE_LINE (current_function_decl)); 9813 #endif 9814 9815 /* In MIPS16 mode, we may need to generate a non-MIPS16 stub to handle 9816 floating-point arguments. */ 9817 if (TARGET_MIPS16 9818 && TARGET_HARD_FLOAT_ABI 9819 && crtl->args.info.fp_code != 0) 9820 mips16_build_function_stub (); 9821 9822 /* Get the function name the same way that toplev.c does before calling 9823 assemble_start_function. This is needed so that the name used here 9824 exactly matches the name used in ASM_DECLARE_FUNCTION_NAME. */ 9825 fnname = XSTR (XEXP (DECL_RTL (current_function_decl), 0), 0); 9826 mips_start_function_definition (fnname, TARGET_MIPS16); 9827 9828 /* Stop mips_file_end from treating this function as external. */ 9829 if (TARGET_IRIX && mips_abi == ABI_32) 9830 TREE_ASM_WRITTEN (DECL_NAME (cfun->decl)) = 1; 9831 9832 /* Output MIPS-specific frame information. */ 9833 if (!flag_inhibit_size_directive) 9834 { 9835 const struct mips_frame_info *frame; 9836 9837 frame = &cfun->machine->frame; 9838 9839 /* .frame FRAMEREG, FRAMESIZE, RETREG. */ 9840 fprintf (file, 9841 "\t.frame\t%s," HOST_WIDE_INT_PRINT_DEC ",%s\t\t" 9842 "# vars= " HOST_WIDE_INT_PRINT_DEC 9843 ", regs= %d/%d" 9844 ", args= " HOST_WIDE_INT_PRINT_DEC 9845 ", gp= " HOST_WIDE_INT_PRINT_DEC "\n", 9846 reg_names[frame_pointer_needed 9847 ? HARD_FRAME_POINTER_REGNUM 9848 : STACK_POINTER_REGNUM], 9849 (frame_pointer_needed 9850 ? frame->total_size - frame->hard_frame_pointer_offset 9851 : frame->total_size), 9852 reg_names[RETURN_ADDR_REGNUM], 9853 frame->var_size, 9854 frame->num_gp, frame->num_fp, 9855 frame->args_size, 9856 frame->cprestore_size); 9857 9858 /* .mask MASK, OFFSET. */ 9859 fprintf (file, "\t.mask\t0x%08x," HOST_WIDE_INT_PRINT_DEC "\n", 9860 frame->mask, frame->gp_save_offset); 9861 9862 /* .fmask MASK, OFFSET. */ 9863 fprintf (file, "\t.fmask\t0x%08x," HOST_WIDE_INT_PRINT_DEC "\n", 9864 frame->fmask, frame->fp_save_offset); 9865 } 9866 9867 /* Handle the initialization of $gp for SVR4 PIC, if applicable. 9868 Also emit the ".set noreorder; .set nomacro" sequence for functions 9869 that need it. */ 9870 if (mips_must_initialize_gp_p () 9871 && mips_current_loadgp_style () == LOADGP_OLDABI) 9872 { 9873 if (TARGET_MIPS16) 9874 { 9875 /* This is a fixed-form sequence. The position of the 9876 first two instructions is important because of the 9877 way _gp_disp is defined. */ 9878 output_asm_insn ("li\t$2,%%hi(_gp_disp)", 0); 9879 output_asm_insn ("addiu\t$3,$pc,%%lo(_gp_disp)", 0); 9880 output_asm_insn ("sll\t$2,16", 0); 9881 output_asm_insn ("addu\t$2,$3", 0); 9882 } 9883 else 9884 { 9885 /* .cpload must be in a .set noreorder but not a 9886 .set nomacro block. */ 9887 mips_push_asm_switch (&mips_noreorder); 9888 output_asm_insn (".cpload\t%^", 0); 9889 if (!cfun->machine->all_noreorder_p) 9890 mips_pop_asm_switch (&mips_noreorder); 9891 else 9892 mips_push_asm_switch (&mips_nomacro); 9893 } 9894 } 9895 else if (cfun->machine->all_noreorder_p) 9896 { 9897 mips_push_asm_switch (&mips_noreorder); 9898 mips_push_asm_switch (&mips_nomacro); 9899 } 9900 9901 /* Tell the assembler which register we're using as the global 9902 pointer. This is needed for thunks, since they can use either 9903 explicit relocs or assembler macros. */ 9904 mips_output_cplocal (); 9905 } 9906 9907 /* Implement TARGET_OUTPUT_FUNCTION_EPILOGUE. */ 9908 9909 static void 9910 mips_output_function_epilogue (FILE *file ATTRIBUTE_UNUSED, 9911 HOST_WIDE_INT size ATTRIBUTE_UNUSED) 9912 { 9913 const char *fnname; 9914 9915 /* Reinstate the normal $gp. */ 9916 SET_REGNO (pic_offset_table_rtx, GLOBAL_POINTER_REGNUM); 9917 mips_output_cplocal (); 9918 9919 if (cfun->machine->all_noreorder_p) 9920 { 9921 mips_pop_asm_switch (&mips_nomacro); 9922 mips_pop_asm_switch (&mips_noreorder); 9923 } 9924 9925 /* Get the function name the same way that toplev.c does before calling 9926 assemble_start_function. This is needed so that the name used here 9927 exactly matches the name used in ASM_DECLARE_FUNCTION_NAME. */ 9928 fnname = XSTR (XEXP (DECL_RTL (current_function_decl), 0), 0); 9929 mips_end_function_definition (fnname); 9930 } 9931 9932 /* Save register REG to MEM. Make the instruction frame-related. */ 9933 9934 static void 9935 mips_save_reg (rtx reg, rtx mem) 9936 { 9937 if (GET_MODE (reg) == DFmode && !TARGET_FLOAT64) 9938 { 9939 rtx x1, x2; 9940 9941 if (mips_split_64bit_move_p (mem, reg)) 9942 mips_split_doubleword_move (mem, reg); 9943 else 9944 mips_emit_move (mem, reg); 9945 9946 x1 = mips_frame_set (mips_subword (mem, false), 9947 mips_subword (reg, false)); 9948 x2 = mips_frame_set (mips_subword (mem, true), 9949 mips_subword (reg, true)); 9950 mips_set_frame_expr (gen_rtx_PARALLEL (VOIDmode, gen_rtvec (2, x1, x2))); 9951 } 9952 else 9953 mips_emit_save_slot_move (mem, reg, MIPS_PROLOGUE_TEMP (GET_MODE (reg))); 9954 } 9955 9956 /* The __gnu_local_gp symbol. */ 9957 9958 static GTY(()) rtx mips_gnu_local_gp; 9959 9960 /* If we're generating n32 or n64 abicalls, emit instructions 9961 to set up the global pointer. */ 9962 9963 static void 9964 mips_emit_loadgp (void) 9965 { 9966 rtx addr, offset, incoming_address, base, index, pic_reg; 9967 9968 pic_reg = TARGET_MIPS16 ? MIPS16_PIC_TEMP : pic_offset_table_rtx; 9969 switch (mips_current_loadgp_style ()) 9970 { 9971 case LOADGP_ABSOLUTE: 9972 if (mips_gnu_local_gp == NULL) 9973 { 9974 mips_gnu_local_gp = gen_rtx_SYMBOL_REF (Pmode, "__gnu_local_gp"); 9975 SYMBOL_REF_FLAGS (mips_gnu_local_gp) |= SYMBOL_FLAG_LOCAL; 9976 } 9977 emit_insn (Pmode == SImode 9978 ? gen_loadgp_absolute_si (pic_reg, mips_gnu_local_gp) 9979 : gen_loadgp_absolute_di (pic_reg, mips_gnu_local_gp)); 9980 break; 9981 9982 case LOADGP_OLDABI: 9983 /* Added by mips_output_function_prologue. */ 9984 break; 9985 9986 case LOADGP_NEWABI: 9987 addr = XEXP (DECL_RTL (current_function_decl), 0); 9988 offset = mips_unspec_address (addr, SYMBOL_GOTOFF_LOADGP); 9989 incoming_address = gen_rtx_REG (Pmode, PIC_FUNCTION_ADDR_REGNUM); 9990 emit_insn (Pmode == SImode 9991 ? gen_loadgp_newabi_si (pic_reg, offset, incoming_address) 9992 : gen_loadgp_newabi_di (pic_reg, offset, incoming_address)); 9993 break; 9994 9995 case LOADGP_RTP: 9996 base = gen_rtx_SYMBOL_REF (Pmode, ggc_strdup (VXWORKS_GOTT_BASE)); 9997 index = gen_rtx_SYMBOL_REF (Pmode, ggc_strdup (VXWORKS_GOTT_INDEX)); 9998 emit_insn (Pmode == SImode 9999 ? gen_loadgp_rtp_si (pic_reg, base, index) 10000 : gen_loadgp_rtp_di (pic_reg, base, index)); 10001 break; 10002 10003 default: 10004 return; 10005 } 10006 10007 if (TARGET_MIPS16) 10008 emit_insn (gen_copygp_mips16 (pic_offset_table_rtx, pic_reg)); 10009 10010 /* Emit a blockage if there are implicit uses of the GP register. 10011 This includes profiled functions, because FUNCTION_PROFILE uses 10012 a jal macro. */ 10013 if (!TARGET_EXPLICIT_RELOCS || crtl->profile) 10014 emit_insn (gen_loadgp_blockage ()); 10015 } 10016 10017 /* A for_each_rtx callback. Stop the search if *X is a kernel register. */ 10018 10019 static int 10020 mips_kernel_reg_p (rtx *x, void *data ATTRIBUTE_UNUSED) 10021 { 10022 return REG_P (*x) && KERNEL_REG_P (REGNO (*x)); 10023 } 10024 10025 /* Expand the "prologue" pattern. */ 10026 10027 void 10028 mips_expand_prologue (void) 10029 { 10030 const struct mips_frame_info *frame; 10031 HOST_WIDE_INT size; 10032 unsigned int nargs; 10033 rtx insn; 10034 10035 if (cfun->machine->global_pointer != INVALID_REGNUM) 10036 { 10037 /* Check whether an insn uses pic_offset_table_rtx, either explicitly 10038 or implicitly. If so, we can commit to using a global pointer 10039 straight away, otherwise we need to defer the decision. */ 10040 if (mips_cfun_has_inflexible_gp_ref_p () 10041 || mips_cfun_has_flexible_gp_ref_p ()) 10042 { 10043 cfun->machine->must_initialize_gp_p = true; 10044 cfun->machine->must_restore_gp_when_clobbered_p = true; 10045 } 10046 10047 SET_REGNO (pic_offset_table_rtx, cfun->machine->global_pointer); 10048 } 10049 10050 frame = &cfun->machine->frame; 10051 size = frame->total_size; 10052 10053 /* Save the registers. Allocate up to MIPS_MAX_FIRST_STACK_STEP 10054 bytes beforehand; this is enough to cover the register save area 10055 without going out of range. */ 10056 if (((frame->mask | frame->fmask | frame->acc_mask) != 0) 10057 || frame->num_cop0_regs > 0) 10058 { 10059 HOST_WIDE_INT step1; 10060 10061 step1 = MIN (size, MIPS_MAX_FIRST_STACK_STEP); 10062 if (GENERATE_MIPS16E_SAVE_RESTORE) 10063 { 10064 HOST_WIDE_INT offset; 10065 unsigned int mask, regno; 10066 10067 /* Try to merge argument stores into the save instruction. */ 10068 nargs = mips16e_collect_argument_saves (); 10069 10070 /* Build the save instruction. */ 10071 mask = frame->mask; 10072 insn = mips16e_build_save_restore (false, &mask, &offset, 10073 nargs, step1); 10074 RTX_FRAME_RELATED_P (emit_insn (insn)) = 1; 10075 size -= step1; 10076 10077 /* Check if we need to save other registers. */ 10078 for (regno = GP_REG_FIRST; regno < GP_REG_LAST; regno++) 10079 if (BITSET_P (mask, regno - GP_REG_FIRST)) 10080 { 10081 offset -= UNITS_PER_WORD; 10082 mips_save_restore_reg (word_mode, regno, 10083 offset, mips_save_reg); 10084 } 10085 } 10086 else 10087 { 10088 if (cfun->machine->interrupt_handler_p) 10089 { 10090 HOST_WIDE_INT offset; 10091 rtx mem; 10092 10093 /* If this interrupt is using a shadow register set, we need to 10094 get the stack pointer from the previous register set. */ 10095 if (cfun->machine->use_shadow_register_set_p) 10096 emit_insn (gen_mips_rdpgpr (stack_pointer_rtx, 10097 stack_pointer_rtx)); 10098 10099 if (!cfun->machine->keep_interrupts_masked_p) 10100 { 10101 /* Move from COP0 Cause to K0. */ 10102 emit_insn (gen_cop0_move (gen_rtx_REG (SImode, K0_REG_NUM), 10103 gen_rtx_REG (SImode, 10104 COP0_CAUSE_REG_NUM))); 10105 /* Move from COP0 EPC to K1. */ 10106 emit_insn (gen_cop0_move (gen_rtx_REG (SImode, K1_REG_NUM), 10107 gen_rtx_REG (SImode, 10108 COP0_EPC_REG_NUM))); 10109 } 10110 10111 /* Allocate the first part of the frame. */ 10112 insn = gen_add3_insn (stack_pointer_rtx, stack_pointer_rtx, 10113 GEN_INT (-step1)); 10114 RTX_FRAME_RELATED_P (emit_insn (insn)) = 1; 10115 size -= step1; 10116 10117 /* Start at the uppermost location for saving. */ 10118 offset = frame->cop0_sp_offset - size; 10119 if (!cfun->machine->keep_interrupts_masked_p) 10120 { 10121 /* Push EPC into its stack slot. */ 10122 mem = gen_frame_mem (word_mode, 10123 plus_constant (stack_pointer_rtx, 10124 offset)); 10125 mips_emit_move (mem, gen_rtx_REG (word_mode, K1_REG_NUM)); 10126 offset -= UNITS_PER_WORD; 10127 } 10128 10129 /* Move from COP0 Status to K1. */ 10130 emit_insn (gen_cop0_move (gen_rtx_REG (SImode, K1_REG_NUM), 10131 gen_rtx_REG (SImode, 10132 COP0_STATUS_REG_NUM))); 10133 10134 /* Right justify the RIPL in k0. */ 10135 if (!cfun->machine->keep_interrupts_masked_p) 10136 emit_insn (gen_lshrsi3 (gen_rtx_REG (SImode, K0_REG_NUM), 10137 gen_rtx_REG (SImode, K0_REG_NUM), 10138 GEN_INT (CAUSE_IPL))); 10139 10140 /* Push Status into its stack slot. */ 10141 mem = gen_frame_mem (word_mode, 10142 plus_constant (stack_pointer_rtx, offset)); 10143 mips_emit_move (mem, gen_rtx_REG (word_mode, K1_REG_NUM)); 10144 offset -= UNITS_PER_WORD; 10145 10146 /* Insert the RIPL into our copy of SR (k1) as the new IPL. */ 10147 if (!cfun->machine->keep_interrupts_masked_p) 10148 emit_insn (gen_insvsi (gen_rtx_REG (SImode, K1_REG_NUM), 10149 GEN_INT (6), 10150 GEN_INT (SR_IPL), 10151 gen_rtx_REG (SImode, K0_REG_NUM))); 10152 10153 if (!cfun->machine->keep_interrupts_masked_p) 10154 /* Enable interrupts by clearing the KSU ERL and EXL bits. 10155 IE is already the correct value, so we don't have to do 10156 anything explicit. */ 10157 emit_insn (gen_insvsi (gen_rtx_REG (SImode, K1_REG_NUM), 10158 GEN_INT (4), 10159 GEN_INT (SR_EXL), 10160 gen_rtx_REG (SImode, GP_REG_FIRST))); 10161 else 10162 /* Disable interrupts by clearing the KSU, ERL, EXL, 10163 and IE bits. */ 10164 emit_insn (gen_insvsi (gen_rtx_REG (SImode, K1_REG_NUM), 10165 GEN_INT (5), 10166 GEN_INT (SR_IE), 10167 gen_rtx_REG (SImode, GP_REG_FIRST))); 10168 } 10169 else 10170 { 10171 insn = gen_add3_insn (stack_pointer_rtx, 10172 stack_pointer_rtx, 10173 GEN_INT (-step1)); 10174 RTX_FRAME_RELATED_P (emit_insn (insn)) = 1; 10175 size -= step1; 10176 } 10177 mips_for_each_saved_acc (size, mips_save_reg); 10178 mips_for_each_saved_gpr_and_fpr (size, mips_save_reg); 10179 } 10180 } 10181 10182 /* Allocate the rest of the frame. */ 10183 if (size > 0) 10184 { 10185 if (SMALL_OPERAND (-size)) 10186 RTX_FRAME_RELATED_P (emit_insn (gen_add3_insn (stack_pointer_rtx, 10187 stack_pointer_rtx, 10188 GEN_INT (-size)))) = 1; 10189 else 10190 { 10191 mips_emit_move (MIPS_PROLOGUE_TEMP (Pmode), GEN_INT (size)); 10192 if (TARGET_MIPS16) 10193 { 10194 /* There are no instructions to add or subtract registers 10195 from the stack pointer, so use the frame pointer as a 10196 temporary. We should always be using a frame pointer 10197 in this case anyway. */ 10198 gcc_assert (frame_pointer_needed); 10199 mips_emit_move (hard_frame_pointer_rtx, stack_pointer_rtx); 10200 emit_insn (gen_sub3_insn (hard_frame_pointer_rtx, 10201 hard_frame_pointer_rtx, 10202 MIPS_PROLOGUE_TEMP (Pmode))); 10203 mips_emit_move (stack_pointer_rtx, hard_frame_pointer_rtx); 10204 } 10205 else 10206 emit_insn (gen_sub3_insn (stack_pointer_rtx, 10207 stack_pointer_rtx, 10208 MIPS_PROLOGUE_TEMP (Pmode))); 10209 10210 /* Describe the combined effect of the previous instructions. */ 10211 mips_set_frame_expr 10212 (gen_rtx_SET (VOIDmode, stack_pointer_rtx, 10213 plus_constant (stack_pointer_rtx, -size))); 10214 } 10215 } 10216 10217 /* Set up the frame pointer, if we're using one. */ 10218 if (frame_pointer_needed) 10219 { 10220 HOST_WIDE_INT offset; 10221 10222 offset = frame->hard_frame_pointer_offset; 10223 if (offset == 0) 10224 { 10225 insn = mips_emit_move (hard_frame_pointer_rtx, stack_pointer_rtx); 10226 RTX_FRAME_RELATED_P (insn) = 1; 10227 } 10228 else if (SMALL_OPERAND (offset)) 10229 { 10230 insn = gen_add3_insn (hard_frame_pointer_rtx, 10231 stack_pointer_rtx, GEN_INT (offset)); 10232 RTX_FRAME_RELATED_P (emit_insn (insn)) = 1; 10233 } 10234 else 10235 { 10236 mips_emit_move (MIPS_PROLOGUE_TEMP (Pmode), GEN_INT (offset)); 10237 mips_emit_move (hard_frame_pointer_rtx, stack_pointer_rtx); 10238 emit_insn (gen_add3_insn (hard_frame_pointer_rtx, 10239 hard_frame_pointer_rtx, 10240 MIPS_PROLOGUE_TEMP (Pmode))); 10241 mips_set_frame_expr 10242 (gen_rtx_SET (VOIDmode, hard_frame_pointer_rtx, 10243 plus_constant (stack_pointer_rtx, offset))); 10244 } 10245 } 10246 10247 mips_emit_loadgp (); 10248 10249 /* Initialize the $gp save slot. */ 10250 if (mips_cfun_has_cprestore_slot_p ()) 10251 { 10252 rtx base, mem, gp, temp; 10253 HOST_WIDE_INT offset; 10254 10255 mips_get_cprestore_base_and_offset (&base, &offset, false); 10256 mem = gen_frame_mem (Pmode, plus_constant (base, offset)); 10257 gp = TARGET_MIPS16 ? MIPS16_PIC_TEMP : pic_offset_table_rtx; 10258 temp = (SMALL_OPERAND (offset) 10259 ? gen_rtx_SCRATCH (Pmode) 10260 : MIPS_PROLOGUE_TEMP (Pmode)); 10261 emit_insn (gen_potential_cprestore (mem, GEN_INT (offset), gp, temp)); 10262 10263 mips_get_cprestore_base_and_offset (&base, &offset, true); 10264 mem = gen_frame_mem (Pmode, plus_constant (base, offset)); 10265 emit_insn (gen_use_cprestore (mem)); 10266 } 10267 10268 /* We need to search back to the last use of K0 or K1. */ 10269 if (cfun->machine->interrupt_handler_p) 10270 { 10271 for (insn = get_last_insn (); insn != NULL_RTX; insn = PREV_INSN (insn)) 10272 if (INSN_P (insn) 10273 && for_each_rtx (&PATTERN (insn), mips_kernel_reg_p, NULL)) 10274 break; 10275 /* Emit a move from K1 to COP0 Status after insn. */ 10276 gcc_assert (insn != NULL_RTX); 10277 emit_insn_after (gen_cop0_move (gen_rtx_REG (SImode, COP0_STATUS_REG_NUM), 10278 gen_rtx_REG (SImode, K1_REG_NUM)), 10279 insn); 10280 } 10281 10282 /* If we are profiling, make sure no instructions are scheduled before 10283 the call to mcount. */ 10284 if (crtl->profile) 10285 emit_insn (gen_blockage ()); 10286 } 10287 10288 /* Emit instructions to restore register REG from slot MEM. */ 10289 10290 static void 10291 mips_restore_reg (rtx reg, rtx mem) 10292 { 10293 /* There's no MIPS16 instruction to load $31 directly. Load into 10294 $7 instead and adjust the return insn appropriately. */ 10295 if (TARGET_MIPS16 && REGNO (reg) == RETURN_ADDR_REGNUM) 10296 reg = gen_rtx_REG (GET_MODE (reg), GP_REG_FIRST + 7); 10297 10298 mips_emit_save_slot_move (reg, mem, MIPS_EPILOGUE_TEMP (GET_MODE (reg))); 10299 } 10300 10301 /* Emit any instructions needed before a return. */ 10302 10303 void 10304 mips_expand_before_return (void) 10305 { 10306 /* When using a call-clobbered gp, we start out with unified call 10307 insns that include instructions to restore the gp. We then split 10308 these unified calls after reload. These split calls explicitly 10309 clobber gp, so there is no need to define 10310 PIC_OFFSET_TABLE_REG_CALL_CLOBBERED. 10311 10312 For consistency, we should also insert an explicit clobber of $28 10313 before return insns, so that the post-reload optimizers know that 10314 the register is not live on exit. */ 10315 if (TARGET_CALL_CLOBBERED_GP) 10316 emit_clobber (pic_offset_table_rtx); 10317 } 10318 10319 /* Expand an "epilogue" or "sibcall_epilogue" pattern; SIBCALL_P 10320 says which. */ 10321 10322 void 10323 mips_expand_epilogue (bool sibcall_p) 10324 { 10325 const struct mips_frame_info *frame; 10326 HOST_WIDE_INT step1, step2; 10327 rtx base, target, insn; 10328 10329 if (!sibcall_p && mips_can_use_return_insn ()) 10330 { 10331 emit_jump_insn (gen_return ()); 10332 return; 10333 } 10334 10335 /* In MIPS16 mode, if the return value should go into a floating-point 10336 register, we need to call a helper routine to copy it over. */ 10337 if (mips16_cfun_returns_in_fpr_p ()) 10338 mips16_copy_fpr_return_value (); 10339 10340 /* Split the frame into two. STEP1 is the amount of stack we should 10341 deallocate before restoring the registers. STEP2 is the amount we 10342 should deallocate afterwards. 10343 10344 Start off by assuming that no registers need to be restored. */ 10345 frame = &cfun->machine->frame; 10346 step1 = frame->total_size; 10347 step2 = 0; 10348 10349 /* Work out which register holds the frame address. */ 10350 if (!frame_pointer_needed) 10351 base = stack_pointer_rtx; 10352 else 10353 { 10354 base = hard_frame_pointer_rtx; 10355 step1 -= frame->hard_frame_pointer_offset; 10356 } 10357 10358 /* If we need to restore registers, deallocate as much stack as 10359 possible in the second step without going out of range. */ 10360 if ((frame->mask | frame->fmask | frame->acc_mask) != 0 10361 || frame->num_cop0_regs > 0) 10362 { 10363 step2 = MIN (step1, MIPS_MAX_FIRST_STACK_STEP); 10364 step1 -= step2; 10365 } 10366 10367 /* Set TARGET to BASE + STEP1. */ 10368 target = base; 10369 if (step1 > 0) 10370 { 10371 rtx adjust; 10372 10373 /* Get an rtx for STEP1 that we can add to BASE. */ 10374 adjust = GEN_INT (step1); 10375 if (!SMALL_OPERAND (step1)) 10376 { 10377 mips_emit_move (MIPS_EPILOGUE_TEMP (Pmode), adjust); 10378 adjust = MIPS_EPILOGUE_TEMP (Pmode); 10379 } 10380 10381 /* Normal mode code can copy the result straight into $sp. */ 10382 if (!TARGET_MIPS16) 10383 target = stack_pointer_rtx; 10384 10385 emit_insn (gen_add3_insn (target, base, adjust)); 10386 } 10387 10388 /* Copy TARGET into the stack pointer. */ 10389 if (target != stack_pointer_rtx) 10390 mips_emit_move (stack_pointer_rtx, target); 10391 10392 /* If we're using addressing macros, $gp is implicitly used by all 10393 SYMBOL_REFs. We must emit a blockage insn before restoring $gp 10394 from the stack. */ 10395 if (TARGET_CALL_SAVED_GP && !TARGET_EXPLICIT_RELOCS) 10396 emit_insn (gen_blockage ()); 10397 10398 if (GENERATE_MIPS16E_SAVE_RESTORE && frame->mask != 0) 10399 { 10400 unsigned int regno, mask; 10401 HOST_WIDE_INT offset; 10402 rtx restore; 10403 10404 /* Generate the restore instruction. */ 10405 mask = frame->mask; 10406 restore = mips16e_build_save_restore (true, &mask, &offset, 0, step2); 10407 10408 /* Restore any other registers manually. */ 10409 for (regno = GP_REG_FIRST; regno < GP_REG_LAST; regno++) 10410 if (BITSET_P (mask, regno - GP_REG_FIRST)) 10411 { 10412 offset -= UNITS_PER_WORD; 10413 mips_save_restore_reg (word_mode, regno, offset, mips_restore_reg); 10414 } 10415 10416 /* Restore the remaining registers and deallocate the final bit 10417 of the frame. */ 10418 emit_insn (restore); 10419 } 10420 else 10421 { 10422 /* Restore the registers. */ 10423 mips_for_each_saved_acc (frame->total_size - step2, mips_restore_reg); 10424 mips_for_each_saved_gpr_and_fpr (frame->total_size - step2, 10425 mips_restore_reg); 10426 10427 if (cfun->machine->interrupt_handler_p) 10428 { 10429 HOST_WIDE_INT offset; 10430 rtx mem; 10431 10432 offset = frame->cop0_sp_offset - (frame->total_size - step2); 10433 if (!cfun->machine->keep_interrupts_masked_p) 10434 { 10435 /* Restore the original EPC. */ 10436 mem = gen_frame_mem (word_mode, 10437 plus_constant (stack_pointer_rtx, offset)); 10438 mips_emit_move (gen_rtx_REG (word_mode, K0_REG_NUM), mem); 10439 offset -= UNITS_PER_WORD; 10440 10441 /* Move to COP0 EPC. */ 10442 emit_insn (gen_cop0_move (gen_rtx_REG (SImode, COP0_EPC_REG_NUM), 10443 gen_rtx_REG (SImode, K0_REG_NUM))); 10444 } 10445 10446 /* Restore the original Status. */ 10447 mem = gen_frame_mem (word_mode, 10448 plus_constant (stack_pointer_rtx, offset)); 10449 mips_emit_move (gen_rtx_REG (word_mode, K0_REG_NUM), mem); 10450 offset -= UNITS_PER_WORD; 10451 10452 /* If we don't use shoadow register set, we need to update SP. */ 10453 if (!cfun->machine->use_shadow_register_set_p && step2 > 0) 10454 emit_insn (gen_add3_insn (stack_pointer_rtx, 10455 stack_pointer_rtx, 10456 GEN_INT (step2))); 10457 10458 /* Move to COP0 Status. */ 10459 emit_insn (gen_cop0_move (gen_rtx_REG (SImode, COP0_STATUS_REG_NUM), 10460 gen_rtx_REG (SImode, K0_REG_NUM))); 10461 } 10462 else 10463 { 10464 /* Deallocate the final bit of the frame. */ 10465 if (step2 > 0) 10466 emit_insn (gen_add3_insn (stack_pointer_rtx, 10467 stack_pointer_rtx, 10468 GEN_INT (step2))); 10469 } 10470 } 10471 10472 /* Add in the __builtin_eh_return stack adjustment. We need to 10473 use a temporary in MIPS16 code. */ 10474 if (crtl->calls_eh_return) 10475 { 10476 if (TARGET_MIPS16) 10477 { 10478 mips_emit_move (MIPS_EPILOGUE_TEMP (Pmode), stack_pointer_rtx); 10479 emit_insn (gen_add3_insn (MIPS_EPILOGUE_TEMP (Pmode), 10480 MIPS_EPILOGUE_TEMP (Pmode), 10481 EH_RETURN_STACKADJ_RTX)); 10482 mips_emit_move (stack_pointer_rtx, MIPS_EPILOGUE_TEMP (Pmode)); 10483 } 10484 else 10485 emit_insn (gen_add3_insn (stack_pointer_rtx, 10486 stack_pointer_rtx, 10487 EH_RETURN_STACKADJ_RTX)); 10488 } 10489 10490 if (!sibcall_p) 10491 { 10492 mips_expand_before_return (); 10493 if (cfun->machine->interrupt_handler_p) 10494 { 10495 /* Interrupt handlers generate eret or deret. */ 10496 if (cfun->machine->use_debug_exception_return_p) 10497 emit_jump_insn (gen_mips_deret ()); 10498 else 10499 emit_jump_insn (gen_mips_eret ()); 10500 } 10501 else 10502 { 10503 unsigned int regno; 10504 10505 /* When generating MIPS16 code, the normal 10506 mips_for_each_saved_gpr_and_fpr path will restore the return 10507 address into $7 rather than $31. */ 10508 if (TARGET_MIPS16 10509 && !GENERATE_MIPS16E_SAVE_RESTORE 10510 && BITSET_P (frame->mask, RETURN_ADDR_REGNUM)) 10511 regno = GP_REG_FIRST + 7; 10512 else 10513 regno = RETURN_ADDR_REGNUM; 10514 emit_jump_insn (gen_return_internal (gen_rtx_REG (Pmode, regno))); 10515 } 10516 } 10517 10518 /* Search from the beginning to the first use of K0 or K1. */ 10519 if (cfun->machine->interrupt_handler_p 10520 && !cfun->machine->keep_interrupts_masked_p) 10521 { 10522 for (insn = get_insns (); insn != NULL_RTX; insn = NEXT_INSN (insn)) 10523 if (INSN_P (insn) 10524 && for_each_rtx (&PATTERN(insn), mips_kernel_reg_p, NULL)) 10525 break; 10526 gcc_assert (insn != NULL_RTX); 10527 /* Insert disable interrupts before the first use of K0 or K1. */ 10528 emit_insn_before (gen_mips_di (), insn); 10529 emit_insn_before (gen_mips_ehb (), insn); 10530 } 10531 } 10532 10533 /* Return nonzero if this function is known to have a null epilogue. 10534 This allows the optimizer to omit jumps to jumps if no stack 10535 was created. */ 10536 10537 bool 10538 mips_can_use_return_insn (void) 10539 { 10540 /* Interrupt handlers need to go through the epilogue. */ 10541 if (cfun->machine->interrupt_handler_p) 10542 return false; 10543 10544 if (!reload_completed) 10545 return false; 10546 10547 if (crtl->profile) 10548 return false; 10549 10550 /* In MIPS16 mode, a function that returns a floating-point value 10551 needs to arrange to copy the return value into the floating-point 10552 registers. */ 10553 if (mips16_cfun_returns_in_fpr_p ()) 10554 return false; 10555 10556 return cfun->machine->frame.total_size == 0; 10557 } 10558 10559 /* Return true if register REGNO can store a value of mode MODE. 10560 The result of this function is cached in mips_hard_regno_mode_ok. */ 10561 10562 static bool 10563 mips_hard_regno_mode_ok_p (unsigned int regno, enum machine_mode mode) 10564 { 10565 unsigned int size; 10566 enum mode_class mclass; 10567 10568 if (mode == CCV2mode) 10569 return (ISA_HAS_8CC 10570 && ST_REG_P (regno) 10571 && (regno - ST_REG_FIRST) % 2 == 0); 10572 10573 if (mode == CCV4mode) 10574 return (ISA_HAS_8CC 10575 && ST_REG_P (regno) 10576 && (regno - ST_REG_FIRST) % 4 == 0); 10577 10578 if (mode == CCmode) 10579 { 10580 if (!ISA_HAS_8CC) 10581 return regno == FPSW_REGNUM; 10582 10583 return (ST_REG_P (regno) 10584 || GP_REG_P (regno) 10585 || FP_REG_P (regno)); 10586 } 10587 10588 size = GET_MODE_SIZE (mode); 10589 mclass = GET_MODE_CLASS (mode); 10590 10591 if (GP_REG_P (regno)) 10592 return ((regno - GP_REG_FIRST) & 1) == 0 || size <= UNITS_PER_WORD; 10593 10594 if (FP_REG_P (regno) 10595 && (((regno - FP_REG_FIRST) % MAX_FPRS_PER_FMT) == 0 10596 || (MIN_FPRS_PER_FMT == 1 && size <= UNITS_PER_FPREG))) 10597 { 10598 /* Allow TFmode for CCmode reloads. */ 10599 if (mode == TFmode && ISA_HAS_8CC) 10600 return true; 10601 10602 /* Allow 64-bit vector modes for Loongson-2E/2F. */ 10603 if (TARGET_LOONGSON_VECTORS 10604 && (mode == V2SImode 10605 || mode == V4HImode 10606 || mode == V8QImode 10607 || mode == DImode)) 10608 return true; 10609 10610 if (mclass == MODE_FLOAT 10611 || mclass == MODE_COMPLEX_FLOAT 10612 || mclass == MODE_VECTOR_FLOAT) 10613 return size <= UNITS_PER_FPVALUE; 10614 10615 /* Allow integer modes that fit into a single register. We need 10616 to put integers into FPRs when using instructions like CVT 10617 and TRUNC. There's no point allowing sizes smaller than a word, 10618 because the FPU has no appropriate load/store instructions. */ 10619 if (mclass == MODE_INT) 10620 return size >= MIN_UNITS_PER_WORD && size <= UNITS_PER_FPREG; 10621 } 10622 10623 if (ACC_REG_P (regno) 10624 && (INTEGRAL_MODE_P (mode) || ALL_FIXED_POINT_MODE_P (mode))) 10625 { 10626 if (MD_REG_P (regno)) 10627 { 10628 /* After a multiplication or division, clobbering HI makes 10629 the value of LO unpredictable, and vice versa. This means 10630 that, for all interesting cases, HI and LO are effectively 10631 a single register. 10632 10633 We model this by requiring that any value that uses HI 10634 also uses LO. */ 10635 if (size <= UNITS_PER_WORD * 2) 10636 return regno == (size <= UNITS_PER_WORD ? LO_REGNUM : MD_REG_FIRST); 10637 } 10638 else 10639 { 10640 /* DSP accumulators do not have the same restrictions as 10641 HI and LO, so we can treat them as normal doubleword 10642 registers. */ 10643 if (size <= UNITS_PER_WORD) 10644 return true; 10645 10646 if (size <= UNITS_PER_WORD * 2 10647 && ((regno - DSP_ACC_REG_FIRST) & 1) == 0) 10648 return true; 10649 } 10650 } 10651 10652 if (ALL_COP_REG_P (regno)) 10653 return mclass == MODE_INT && size <= UNITS_PER_WORD; 10654 10655 if (regno == GOT_VERSION_REGNUM) 10656 return mode == SImode; 10657 10658 return false; 10659 } 10660 10661 /* Implement HARD_REGNO_NREGS. */ 10662 10663 unsigned int 10664 mips_hard_regno_nregs (int regno, enum machine_mode mode) 10665 { 10666 if (ST_REG_P (regno)) 10667 /* The size of FP status registers is always 4, because they only hold 10668 CCmode values, and CCmode is always considered to be 4 bytes wide. */ 10669 return (GET_MODE_SIZE (mode) + 3) / 4; 10670 10671 if (FP_REG_P (regno)) 10672 return (GET_MODE_SIZE (mode) + UNITS_PER_FPREG - 1) / UNITS_PER_FPREG; 10673 10674 /* All other registers are word-sized. */ 10675 return (GET_MODE_SIZE (mode) + UNITS_PER_WORD - 1) / UNITS_PER_WORD; 10676 } 10677 10678 /* Implement CLASS_MAX_NREGS, taking the maximum of the cases 10679 in mips_hard_regno_nregs. */ 10680 10681 int 10682 mips_class_max_nregs (enum reg_class rclass, enum machine_mode mode) 10683 { 10684 int size; 10685 HARD_REG_SET left; 10686 10687 size = 0x8000; 10688 COPY_HARD_REG_SET (left, reg_class_contents[(int) rclass]); 10689 if (hard_reg_set_intersect_p (left, reg_class_contents[(int) ST_REGS])) 10690 { 10691 size = MIN (size, 4); 10692 AND_COMPL_HARD_REG_SET (left, reg_class_contents[(int) ST_REGS]); 10693 } 10694 if (hard_reg_set_intersect_p (left, reg_class_contents[(int) FP_REGS])) 10695 { 10696 size = MIN (size, UNITS_PER_FPREG); 10697 AND_COMPL_HARD_REG_SET (left, reg_class_contents[(int) FP_REGS]); 10698 } 10699 if (!hard_reg_set_empty_p (left)) 10700 size = MIN (size, UNITS_PER_WORD); 10701 return (GET_MODE_SIZE (mode) + size - 1) / size; 10702 } 10703 10704 /* Implement CANNOT_CHANGE_MODE_CLASS. */ 10705 10706 bool 10707 mips_cannot_change_mode_class (enum machine_mode from ATTRIBUTE_UNUSED, 10708 enum machine_mode to ATTRIBUTE_UNUSED, 10709 enum reg_class rclass) 10710 { 10711 /* There are several problems with changing the modes of values 10712 in floating-point registers: 10713 10714 - When a multi-word value is stored in paired floating-point 10715 registers, the first register always holds the low word. 10716 We therefore can't allow FPRs to change between single-word 10717 and multi-word modes on big-endian targets. 10718 10719 - GCC assumes that each word of a multiword register can be accessed 10720 individually using SUBREGs. This is not true for floating-point 10721 registers if they are bigger than a word. 10722 10723 - Loading a 32-bit value into a 64-bit floating-point register 10724 will not sign-extend the value, despite what LOAD_EXTEND_OP says. 10725 We can't allow FPRs to change from SImode to to a wider mode on 10726 64-bit targets. 10727 10728 - If the FPU has already interpreted a value in one format, we must 10729 not ask it to treat the value as having a different format. 10730 10731 We therefore disallow all mode changes involving FPRs. */ 10732 return reg_classes_intersect_p (FP_REGS, rclass); 10733 } 10734 10735 /* Return true if moves in mode MODE can use the FPU's mov.fmt instruction. */ 10736 10737 static bool 10738 mips_mode_ok_for_mov_fmt_p (enum machine_mode mode) 10739 { 10740 switch (mode) 10741 { 10742 case SFmode: 10743 return TARGET_HARD_FLOAT; 10744 10745 case DFmode: 10746 return TARGET_HARD_FLOAT && TARGET_DOUBLE_FLOAT; 10747 10748 case V2SFmode: 10749 return TARGET_HARD_FLOAT && TARGET_PAIRED_SINGLE_FLOAT; 10750 10751 default: 10752 return false; 10753 } 10754 } 10755 10756 /* Implement MODES_TIEABLE_P. */ 10757 10758 bool 10759 mips_modes_tieable_p (enum machine_mode mode1, enum machine_mode mode2) 10760 { 10761 /* FPRs allow no mode punning, so it's not worth tying modes if we'd 10762 prefer to put one of them in FPRs. */ 10763 return (mode1 == mode2 10764 || (!mips_mode_ok_for_mov_fmt_p (mode1) 10765 && !mips_mode_ok_for_mov_fmt_p (mode2))); 10766 } 10767 10768 /* Implement PREFERRED_RELOAD_CLASS. */ 10769 10770 enum reg_class 10771 mips_preferred_reload_class (rtx x, enum reg_class rclass) 10772 { 10773 if (mips_dangerous_for_la25_p (x) && reg_class_subset_p (LEA_REGS, rclass)) 10774 return LEA_REGS; 10775 10776 if (reg_class_subset_p (FP_REGS, rclass) 10777 && mips_mode_ok_for_mov_fmt_p (GET_MODE (x))) 10778 return FP_REGS; 10779 10780 if (reg_class_subset_p (GR_REGS, rclass)) 10781 rclass = GR_REGS; 10782 10783 if (TARGET_MIPS16 && reg_class_subset_p (M16_REGS, rclass)) 10784 rclass = M16_REGS; 10785 10786 return rclass; 10787 } 10788 10789 /* RCLASS is a class involved in a REGISTER_MOVE_COST calculation. 10790 Return a "canonical" class to represent it in later calculations. */ 10791 10792 static enum reg_class 10793 mips_canonicalize_move_class (enum reg_class rclass) 10794 { 10795 /* All moves involving accumulator registers have the same cost. */ 10796 if (reg_class_subset_p (rclass, ACC_REGS)) 10797 rclass = ACC_REGS; 10798 10799 /* Likewise promote subclasses of general registers to the most 10800 interesting containing class. */ 10801 if (TARGET_MIPS16 && reg_class_subset_p (rclass, M16_REGS)) 10802 rclass = M16_REGS; 10803 else if (reg_class_subset_p (rclass, GENERAL_REGS)) 10804 rclass = GENERAL_REGS; 10805 10806 return rclass; 10807 } 10808 10809 /* Return the cost of moving a value of mode MODE from a register of 10810 class FROM to a GPR. Return 0 for classes that are unions of other 10811 classes handled by this function. */ 10812 10813 static int 10814 mips_move_to_gpr_cost (enum machine_mode mode ATTRIBUTE_UNUSED, 10815 enum reg_class from) 10816 { 10817 switch (from) 10818 { 10819 case GENERAL_REGS: 10820 /* A MIPS16 MOVE instruction, or a non-MIPS16 MOVE macro. */ 10821 return 2; 10822 10823 case ACC_REGS: 10824 /* MFLO and MFHI. */ 10825 return 6; 10826 10827 case FP_REGS: 10828 /* MFC1, etc. */ 10829 return 4; 10830 10831 case ST_REGS: 10832 /* LUI followed by MOVF. */ 10833 return 4; 10834 10835 case COP0_REGS: 10836 case COP2_REGS: 10837 case COP3_REGS: 10838 /* This choice of value is historical. */ 10839 return 5; 10840 10841 default: 10842 return 0; 10843 } 10844 } 10845 10846 /* Return the cost of moving a value of mode MODE from a GPR to a 10847 register of class TO. Return 0 for classes that are unions of 10848 other classes handled by this function. */ 10849 10850 static int 10851 mips_move_from_gpr_cost (enum machine_mode mode, enum reg_class to) 10852 { 10853 switch (to) 10854 { 10855 case GENERAL_REGS: 10856 /* A MIPS16 MOVE instruction, or a non-MIPS16 MOVE macro. */ 10857 return 2; 10858 10859 case ACC_REGS: 10860 /* MTLO and MTHI. */ 10861 return 6; 10862 10863 case FP_REGS: 10864 /* MTC1, etc. */ 10865 return 4; 10866 10867 case ST_REGS: 10868 /* A secondary reload through an FPR scratch. */ 10869 return (mips_register_move_cost (mode, GENERAL_REGS, FP_REGS) 10870 + mips_register_move_cost (mode, FP_REGS, ST_REGS)); 10871 10872 case COP0_REGS: 10873 case COP2_REGS: 10874 case COP3_REGS: 10875 /* This choice of value is historical. */ 10876 return 5; 10877 10878 default: 10879 return 0; 10880 } 10881 } 10882 10883 /* Implement REGISTER_MOVE_COST. Return 0 for classes that are the 10884 maximum of the move costs for subclasses; regclass will work out 10885 the maximum for us. */ 10886 10887 int 10888 mips_register_move_cost (enum machine_mode mode, 10889 enum reg_class from, enum reg_class to) 10890 { 10891 enum reg_class dregs; 10892 int cost1, cost2; 10893 10894 from = mips_canonicalize_move_class (from); 10895 to = mips_canonicalize_move_class (to); 10896 10897 /* Handle moves that can be done without using general-purpose registers. */ 10898 if (from == FP_REGS) 10899 { 10900 if (to == FP_REGS && mips_mode_ok_for_mov_fmt_p (mode)) 10901 /* MOV.FMT. */ 10902 return 4; 10903 if (to == ST_REGS) 10904 /* The sequence generated by mips_expand_fcc_reload. */ 10905 return 8; 10906 } 10907 10908 /* Handle cases in which only one class deviates from the ideal. */ 10909 dregs = TARGET_MIPS16 ? M16_REGS : GENERAL_REGS; 10910 if (from == dregs) 10911 return mips_move_from_gpr_cost (mode, to); 10912 if (to == dregs) 10913 return mips_move_to_gpr_cost (mode, from); 10914 10915 /* Handles cases that require a GPR temporary. */ 10916 cost1 = mips_move_to_gpr_cost (mode, from); 10917 if (cost1 != 0) 10918 { 10919 cost2 = mips_move_from_gpr_cost (mode, to); 10920 if (cost2 != 0) 10921 return cost1 + cost2; 10922 } 10923 10924 return 0; 10925 } 10926 10927 /* Implement TARGET_IRA_COVER_CLASSES. */ 10928 10929 static const enum reg_class * 10930 mips_ira_cover_classes (void) 10931 { 10932 static const enum reg_class acc_classes[] = { 10933 GR_AND_ACC_REGS, FP_REGS, COP0_REGS, COP2_REGS, COP3_REGS, 10934 ST_REGS, LIM_REG_CLASSES 10935 }; 10936 static const enum reg_class no_acc_classes[] = { 10937 GR_REGS, FP_REGS, COP0_REGS, COP2_REGS, COP3_REGS, 10938 ST_REGS, LIM_REG_CLASSES 10939 }; 10940 10941 /* Don't allow the register allocators to use LO and HI in MIPS16 mode, 10942 which has no MTLO or MTHI instructions. Also, using GR_AND_ACC_REGS 10943 as a cover class only works well when we keep per-register costs. 10944 Using it when not optimizing can cause us to think accumulators 10945 have the same cost as GPRs in cases where GPRs are actually much 10946 cheaper. */ 10947 return TARGET_MIPS16 || !optimize ? no_acc_classes : acc_classes; 10948 } 10949 10950 /* Return the register class required for a secondary register when 10951 copying between one of the registers in RCLASS and value X, which 10952 has mode MODE. X is the source of the move if IN_P, otherwise it 10953 is the destination. Return NO_REGS if no secondary register is 10954 needed. */ 10955 10956 enum reg_class 10957 mips_secondary_reload_class (enum reg_class rclass, 10958 enum machine_mode mode, rtx x, bool in_p) 10959 { 10960 int regno; 10961 10962 /* If X is a constant that cannot be loaded into $25, it must be loaded 10963 into some other GPR. No other register class allows a direct move. */ 10964 if (mips_dangerous_for_la25_p (x)) 10965 return reg_class_subset_p (rclass, LEA_REGS) ? NO_REGS : LEA_REGS; 10966 10967 regno = true_regnum (x); 10968 if (TARGET_MIPS16) 10969 { 10970 /* In MIPS16 mode, every move must involve a member of M16_REGS. */ 10971 if (!reg_class_subset_p (rclass, M16_REGS) && !M16_REG_P (regno)) 10972 return M16_REGS; 10973 10974 return NO_REGS; 10975 } 10976 10977 /* Copying from accumulator registers to anywhere other than a general 10978 register requires a temporary general register. */ 10979 if (reg_class_subset_p (rclass, ACC_REGS)) 10980 return GP_REG_P (regno) ? NO_REGS : GR_REGS; 10981 if (ACC_REG_P (regno)) 10982 return reg_class_subset_p (rclass, GR_REGS) ? NO_REGS : GR_REGS; 10983 10984 /* We can only copy a value to a condition code register from a 10985 floating-point register, and even then we require a scratch 10986 floating-point register. We can only copy a value out of a 10987 condition-code register into a general register. */ 10988 if (reg_class_subset_p (rclass, ST_REGS)) 10989 { 10990 if (in_p) 10991 return FP_REGS; 10992 return GP_REG_P (regno) ? NO_REGS : GR_REGS; 10993 } 10994 if (ST_REG_P (regno)) 10995 { 10996 if (!in_p) 10997 return FP_REGS; 10998 return reg_class_subset_p (rclass, GR_REGS) ? NO_REGS : GR_REGS; 10999 } 11000 11001 if (reg_class_subset_p (rclass, FP_REGS)) 11002 { 11003 if (MEM_P (x) 11004 && (GET_MODE_SIZE (mode) == 4 || GET_MODE_SIZE (mode) == 8)) 11005 /* In this case we can use lwc1, swc1, ldc1 or sdc1. We'll use 11006 pairs of lwc1s and swc1s if ldc1 and sdc1 are not supported. */ 11007 return NO_REGS; 11008 11009 if (GP_REG_P (regno) || x == CONST0_RTX (mode)) 11010 /* In this case we can use mtc1, mfc1, dmtc1 or dmfc1. */ 11011 return NO_REGS; 11012 11013 if (CONSTANT_P (x) && !targetm.cannot_force_const_mem (x)) 11014 /* We can force the constant to memory and use lwc1 11015 and ldc1. As above, we will use pairs of lwc1s if 11016 ldc1 is not supported. */ 11017 return NO_REGS; 11018 11019 if (FP_REG_P (regno) && mips_mode_ok_for_mov_fmt_p (mode)) 11020 /* In this case we can use mov.fmt. */ 11021 return NO_REGS; 11022 11023 /* Otherwise, we need to reload through an integer register. */ 11024 return GR_REGS; 11025 } 11026 if (FP_REG_P (regno)) 11027 return reg_class_subset_p (rclass, GR_REGS) ? NO_REGS : GR_REGS; 11028 11029 return NO_REGS; 11030 } 11031 11032 /* Implement TARGET_MODE_REP_EXTENDED. */ 11033 11034 static int 11035 mips_mode_rep_extended (enum machine_mode mode, enum machine_mode mode_rep) 11036 { 11037 /* On 64-bit targets, SImode register values are sign-extended to DImode. */ 11038 if (TARGET_64BIT && mode == SImode && mode_rep == DImode) 11039 return SIGN_EXTEND; 11040 11041 return UNKNOWN; 11042 } 11043 11044 /* Implement TARGET_VALID_POINTER_MODE. */ 11045 11046 static bool 11047 mips_valid_pointer_mode (enum machine_mode mode) 11048 { 11049 return mode == SImode || (TARGET_64BIT && mode == DImode); 11050 } 11051 11052 /* Implement TARGET_VECTOR_MODE_SUPPORTED_P. */ 11053 11054 static bool 11055 mips_vector_mode_supported_p (enum machine_mode mode) 11056 { 11057 switch (mode) 11058 { 11059 case V2SFmode: 11060 return TARGET_PAIRED_SINGLE_FLOAT; 11061 11062 case V2HImode: 11063 case V4QImode: 11064 case V2HQmode: 11065 case V2UHQmode: 11066 case V2HAmode: 11067 case V2UHAmode: 11068 case V4QQmode: 11069 case V4UQQmode: 11070 return TARGET_DSP; 11071 11072 case V2SImode: 11073 case V4HImode: 11074 case V8QImode: 11075 return TARGET_LOONGSON_VECTORS; 11076 11077 default: 11078 return false; 11079 } 11080 } 11081 11082 /* Implement TARGET_SCALAR_MODE_SUPPORTED_P. */ 11083 11084 static bool 11085 mips_scalar_mode_supported_p (enum machine_mode mode) 11086 { 11087 if (ALL_FIXED_POINT_MODE_P (mode) 11088 && GET_MODE_PRECISION (mode) <= 2 * BITS_PER_WORD) 11089 return true; 11090 11091 return default_scalar_mode_supported_p (mode); 11092 } 11093 11094 /* Implement TARGET_INIT_LIBFUNCS. */ 11095 11096 #include "config/gofast.h" 11097 11098 static void 11099 mips_init_libfuncs (void) 11100 { 11101 if (TARGET_FIX_VR4120) 11102 { 11103 /* Register the special divsi3 and modsi3 functions needed to work 11104 around VR4120 division errata. */ 11105 set_optab_libfunc (sdiv_optab, SImode, "__vr4120_divsi3"); 11106 set_optab_libfunc (smod_optab, SImode, "__vr4120_modsi3"); 11107 } 11108 11109 if (TARGET_MIPS16 && TARGET_HARD_FLOAT_ABI) 11110 { 11111 /* Register the MIPS16 -mhard-float stubs. */ 11112 set_optab_libfunc (add_optab, SFmode, "__mips16_addsf3"); 11113 set_optab_libfunc (sub_optab, SFmode, "__mips16_subsf3"); 11114 set_optab_libfunc (smul_optab, SFmode, "__mips16_mulsf3"); 11115 set_optab_libfunc (sdiv_optab, SFmode, "__mips16_divsf3"); 11116 11117 set_optab_libfunc (eq_optab, SFmode, "__mips16_eqsf2"); 11118 set_optab_libfunc (ne_optab, SFmode, "__mips16_nesf2"); 11119 set_optab_libfunc (gt_optab, SFmode, "__mips16_gtsf2"); 11120 set_optab_libfunc (ge_optab, SFmode, "__mips16_gesf2"); 11121 set_optab_libfunc (lt_optab, SFmode, "__mips16_ltsf2"); 11122 set_optab_libfunc (le_optab, SFmode, "__mips16_lesf2"); 11123 set_optab_libfunc (unord_optab, SFmode, "__mips16_unordsf2"); 11124 11125 set_conv_libfunc (sfix_optab, SImode, SFmode, "__mips16_fix_truncsfsi"); 11126 set_conv_libfunc (sfloat_optab, SFmode, SImode, "__mips16_floatsisf"); 11127 set_conv_libfunc (ufloat_optab, SFmode, SImode, "__mips16_floatunsisf"); 11128 11129 if (TARGET_DOUBLE_FLOAT) 11130 { 11131 set_optab_libfunc (add_optab, DFmode, "__mips16_adddf3"); 11132 set_optab_libfunc (sub_optab, DFmode, "__mips16_subdf3"); 11133 set_optab_libfunc (smul_optab, DFmode, "__mips16_muldf3"); 11134 set_optab_libfunc (sdiv_optab, DFmode, "__mips16_divdf3"); 11135 11136 set_optab_libfunc (eq_optab, DFmode, "__mips16_eqdf2"); 11137 set_optab_libfunc (ne_optab, DFmode, "__mips16_nedf2"); 11138 set_optab_libfunc (gt_optab, DFmode, "__mips16_gtdf2"); 11139 set_optab_libfunc (ge_optab, DFmode, "__mips16_gedf2"); 11140 set_optab_libfunc (lt_optab, DFmode, "__mips16_ltdf2"); 11141 set_optab_libfunc (le_optab, DFmode, "__mips16_ledf2"); 11142 set_optab_libfunc (unord_optab, DFmode, "__mips16_unorddf2"); 11143 11144 set_conv_libfunc (sext_optab, DFmode, SFmode, 11145 "__mips16_extendsfdf2"); 11146 set_conv_libfunc (trunc_optab, SFmode, DFmode, 11147 "__mips16_truncdfsf2"); 11148 set_conv_libfunc (sfix_optab, SImode, DFmode, 11149 "__mips16_fix_truncdfsi"); 11150 set_conv_libfunc (sfloat_optab, DFmode, SImode, 11151 "__mips16_floatsidf"); 11152 set_conv_libfunc (ufloat_optab, DFmode, SImode, 11153 "__mips16_floatunsidf"); 11154 } 11155 } 11156 else 11157 /* Register the gofast functions if selected using --enable-gofast. */ 11158 gofast_maybe_init_libfuncs (); 11159 11160 /* The MIPS16 ISA does not have an encoding for "sync", so we rely 11161 on an external non-MIPS16 routine to implement __sync_synchronize. */ 11162 if (TARGET_MIPS16) 11163 synchronize_libfunc = init_one_libfunc ("__sync_synchronize"); 11164 } 11165 11166 /* Build up a multi-insn sequence that loads label TARGET into $AT. */ 11167 11168 static void 11169 mips_process_load_label (rtx target) 11170 { 11171 rtx base, gp, intop; 11172 HOST_WIDE_INT offset; 11173 11174 mips_multi_start (); 11175 switch (mips_abi) 11176 { 11177 case ABI_N32: 11178 mips_multi_add_insn ("lw\t%@,%%got_page(%0)(%+)", target, 0); 11179 mips_multi_add_insn ("addiu\t%@,%@,%%got_ofst(%0)", target, 0); 11180 break; 11181 11182 case ABI_64: 11183 mips_multi_add_insn ("ld\t%@,%%got_page(%0)(%+)", target, 0); 11184 mips_multi_add_insn ("daddiu\t%@,%@,%%got_ofst(%0)", target, 0); 11185 break; 11186 11187 default: 11188 gp = pic_offset_table_rtx; 11189 if (mips_cfun_has_cprestore_slot_p ()) 11190 { 11191 gp = gen_rtx_REG (Pmode, AT_REGNUM); 11192 mips_get_cprestore_base_and_offset (&base, &offset, true); 11193 if (!SMALL_OPERAND (offset)) 11194 { 11195 intop = GEN_INT (CONST_HIGH_PART (offset)); 11196 mips_multi_add_insn ("lui\t%0,%1", gp, intop, 0); 11197 mips_multi_add_insn ("addu\t%0,%0,%1", gp, base, 0); 11198 11199 base = gp; 11200 offset = CONST_LOW_PART (offset); 11201 } 11202 intop = GEN_INT (offset); 11203 if (ISA_HAS_LOAD_DELAY) 11204 mips_multi_add_insn ("lw\t%0,%1(%2)%#", gp, intop, base, 0); 11205 else 11206 mips_multi_add_insn ("lw\t%0,%1(%2)", gp, intop, base, 0); 11207 } 11208 if (ISA_HAS_LOAD_DELAY) 11209 mips_multi_add_insn ("lw\t%@,%%got(%0)(%1)%#", target, gp, 0); 11210 else 11211 mips_multi_add_insn ("lw\t%@,%%got(%0)(%1)", target, gp, 0); 11212 mips_multi_add_insn ("addiu\t%@,%@,%%lo(%0)", target, 0); 11213 break; 11214 } 11215 } 11216 11217 /* Return the number of instructions needed to load a label into $AT. */ 11218 11219 static unsigned int 11220 mips_load_label_num_insns (void) 11221 { 11222 if (cfun->machine->load_label_num_insns == 0) 11223 { 11224 mips_process_load_label (pc_rtx); 11225 cfun->machine->load_label_num_insns = mips_multi_num_insns; 11226 } 11227 return cfun->machine->load_label_num_insns; 11228 } 11229 11230 /* Emit an asm sequence to start a noat block and load the address 11231 of a label into $1. */ 11232 11233 void 11234 mips_output_load_label (rtx target) 11235 { 11236 mips_push_asm_switch (&mips_noat); 11237 if (TARGET_EXPLICIT_RELOCS) 11238 { 11239 mips_process_load_label (target); 11240 mips_multi_write (); 11241 } 11242 else 11243 { 11244 if (Pmode == DImode) 11245 output_asm_insn ("dla\t%@,%0", &target); 11246 else 11247 output_asm_insn ("la\t%@,%0", &target); 11248 } 11249 } 11250 11251 /* Return the length of INSN. LENGTH is the initial length computed by 11252 attributes in the machine-description file. */ 11253 11254 int 11255 mips_adjust_insn_length (rtx insn, int length) 11256 { 11257 /* mips.md uses MAX_PIC_BRANCH_LENGTH as a placeholder for the length 11258 of a PIC long-branch sequence. Substitute the correct value. */ 11259 if (length == MAX_PIC_BRANCH_LENGTH 11260 && INSN_CODE (insn) >= 0 11261 && get_attr_type (insn) == TYPE_BRANCH) 11262 { 11263 /* Add the branch-over instruction and its delay slot, if this 11264 is a conditional branch. */ 11265 length = simplejump_p (insn) ? 0 : 8; 11266 11267 /* Load the label into $AT and jump to it. Ignore the delay 11268 slot of the jump. */ 11269 length += 4 * mips_load_label_num_insns() + 4; 11270 } 11271 11272 /* A unconditional jump has an unfilled delay slot if it is not part 11273 of a sequence. A conditional jump normally has a delay slot, but 11274 does not on MIPS16. */ 11275 if (CALL_P (insn) || (TARGET_MIPS16 ? simplejump_p (insn) : JUMP_P (insn))) 11276 length += 4; 11277 11278 /* See how many nops might be needed to avoid hardware hazards. */ 11279 if (!cfun->machine->ignore_hazard_length_p && INSN_CODE (insn) >= 0) 11280 switch (get_attr_hazard (insn)) 11281 { 11282 case HAZARD_NONE: 11283 break; 11284 11285 case HAZARD_DELAY: 11286 length += 4; 11287 break; 11288 11289 case HAZARD_HILO: 11290 length += 8; 11291 break; 11292 } 11293 11294 /* In order to make it easier to share MIPS16 and non-MIPS16 patterns, 11295 the .md file length attributes are 4-based for both modes. 11296 Adjust the MIPS16 ones here. */ 11297 if (TARGET_MIPS16) 11298 length /= 2; 11299 11300 return length; 11301 } 11302 11303 /* Return the assembly code for INSN, which has the operands given by 11304 OPERANDS, and which branches to OPERANDS[0] if some condition is true. 11305 BRANCH_IF_TRUE is the asm template that should be used if OPERANDS[0] 11306 is in range of a direct branch. BRANCH_IF_FALSE is an inverted 11307 version of BRANCH_IF_TRUE. */ 11308 11309 const char * 11310 mips_output_conditional_branch (rtx insn, rtx *operands, 11311 const char *branch_if_true, 11312 const char *branch_if_false) 11313 { 11314 unsigned int length; 11315 rtx taken, not_taken; 11316 11317 gcc_assert (LABEL_P (operands[0])); 11318 11319 length = get_attr_length (insn); 11320 if (length <= 8) 11321 { 11322 /* Just a simple conditional branch. */ 11323 mips_branch_likely = (final_sequence && INSN_ANNULLED_BRANCH_P (insn)); 11324 return branch_if_true; 11325 } 11326 11327 /* Generate a reversed branch around a direct jump. This fallback does 11328 not use branch-likely instructions. */ 11329 mips_branch_likely = false; 11330 not_taken = gen_label_rtx (); 11331 taken = operands[0]; 11332 11333 /* Generate the reversed branch to NOT_TAKEN. */ 11334 operands[0] = not_taken; 11335 output_asm_insn (branch_if_false, operands); 11336 11337 /* If INSN has a delay slot, we must provide delay slots for both the 11338 branch to NOT_TAKEN and the conditional jump. We must also ensure 11339 that INSN's delay slot is executed in the appropriate cases. */ 11340 if (final_sequence) 11341 { 11342 /* This first delay slot will always be executed, so use INSN's 11343 delay slot if is not annulled. */ 11344 if (!INSN_ANNULLED_BRANCH_P (insn)) 11345 { 11346 final_scan_insn (XVECEXP (final_sequence, 0, 1), 11347 asm_out_file, optimize, 1, NULL); 11348 INSN_DELETED_P (XVECEXP (final_sequence, 0, 1)) = 1; 11349 } 11350 else 11351 output_asm_insn ("nop", 0); 11352 fprintf (asm_out_file, "\n"); 11353 } 11354 11355 /* Output the unconditional branch to TAKEN. */ 11356 if (TARGET_ABSOLUTE_JUMPS) 11357 output_asm_insn (MIPS_ABSOLUTE_JUMP ("j\t%0%/"), &taken); 11358 else 11359 { 11360 mips_output_load_label (taken); 11361 output_asm_insn ("jr\t%@%]%/", 0); 11362 } 11363 11364 /* Now deal with its delay slot; see above. */ 11365 if (final_sequence) 11366 { 11367 /* This delay slot will only be executed if the branch is taken. 11368 Use INSN's delay slot if is annulled. */ 11369 if (INSN_ANNULLED_BRANCH_P (insn)) 11370 { 11371 final_scan_insn (XVECEXP (final_sequence, 0, 1), 11372 asm_out_file, optimize, 1, NULL); 11373 INSN_DELETED_P (XVECEXP (final_sequence, 0, 1)) = 1; 11374 } 11375 else 11376 output_asm_insn ("nop", 0); 11377 fprintf (asm_out_file, "\n"); 11378 } 11379 11380 /* Output NOT_TAKEN. */ 11381 targetm.asm_out.internal_label (asm_out_file, "L", 11382 CODE_LABEL_NUMBER (not_taken)); 11383 return ""; 11384 } 11385 11386 /* Return the assembly code for INSN, which branches to OPERANDS[0] 11387 if some ordering condition is true. The condition is given by 11388 OPERANDS[1] if !INVERTED_P, otherwise it is the inverse of 11389 OPERANDS[1]. OPERANDS[2] is the comparison's first operand; 11390 its second is always zero. */ 11391 11392 const char * 11393 mips_output_order_conditional_branch (rtx insn, rtx *operands, bool inverted_p) 11394 { 11395 const char *branch[2]; 11396 11397 /* Make BRANCH[1] branch to OPERANDS[0] when the condition is true. 11398 Make BRANCH[0] branch on the inverse condition. */ 11399 switch (GET_CODE (operands[1])) 11400 { 11401 /* These cases are equivalent to comparisons against zero. */ 11402 case LEU: 11403 inverted_p = !inverted_p; 11404 /* Fall through. */ 11405 case GTU: 11406 branch[!inverted_p] = MIPS_BRANCH ("bne", "%2,%.,%0"); 11407 branch[inverted_p] = MIPS_BRANCH ("beq", "%2,%.,%0"); 11408 break; 11409 11410 /* These cases are always true or always false. */ 11411 case LTU: 11412 inverted_p = !inverted_p; 11413 /* Fall through. */ 11414 case GEU: 11415 branch[!inverted_p] = MIPS_BRANCH ("beq", "%.,%.,%0"); 11416 branch[inverted_p] = MIPS_BRANCH ("bne", "%.,%.,%0"); 11417 break; 11418 11419 default: 11420 branch[!inverted_p] = MIPS_BRANCH ("b%C1z", "%2,%0"); 11421 branch[inverted_p] = MIPS_BRANCH ("b%N1z", "%2,%0"); 11422 break; 11423 } 11424 return mips_output_conditional_branch (insn, operands, branch[1], branch[0]); 11425 } 11426 11427 /* Start a block of code that needs access to the LL, SC and SYNC 11428 instructions. */ 11429 11430 static void 11431 mips_start_ll_sc_sync_block (void) 11432 { 11433 if (!ISA_HAS_LL_SC) 11434 { 11435 output_asm_insn (".set\tpush", 0); 11436 output_asm_insn (".set\tmips2", 0); 11437 } 11438 } 11439 11440 /* End a block started by mips_start_ll_sc_sync_block. */ 11441 11442 static void 11443 mips_end_ll_sc_sync_block (void) 11444 { 11445 if (!ISA_HAS_LL_SC) 11446 output_asm_insn (".set\tpop", 0); 11447 } 11448 11449 /* Output and/or return the asm template for a sync instruction. */ 11450 11451 const char * 11452 mips_output_sync (void) 11453 { 11454 mips_start_ll_sc_sync_block (); 11455 output_asm_insn ("sync", 0); 11456 mips_end_ll_sc_sync_block (); 11457 return ""; 11458 } 11459 11460 /* Return the asm template associated with sync_insn1 value TYPE. 11461 IS_64BIT_P is true if we want a 64-bit rather than 32-bit operation. */ 11462 11463 static const char * 11464 mips_sync_insn1_template (enum attr_sync_insn1 type, bool is_64bit_p) 11465 { 11466 switch (type) 11467 { 11468 case SYNC_INSN1_MOVE: 11469 return "move\t%0,%z2"; 11470 case SYNC_INSN1_LI: 11471 return "li\t%0,%2"; 11472 case SYNC_INSN1_ADDU: 11473 return is_64bit_p ? "daddu\t%0,%1,%z2" : "addu\t%0,%1,%z2"; 11474 case SYNC_INSN1_ADDIU: 11475 return is_64bit_p ? "daddiu\t%0,%1,%2" : "addiu\t%0,%1,%2"; 11476 case SYNC_INSN1_SUBU: 11477 return is_64bit_p ? "dsubu\t%0,%1,%z2" : "subu\t%0,%1,%z2"; 11478 case SYNC_INSN1_AND: 11479 return "and\t%0,%1,%z2"; 11480 case SYNC_INSN1_ANDI: 11481 return "andi\t%0,%1,%2"; 11482 case SYNC_INSN1_OR: 11483 return "or\t%0,%1,%z2"; 11484 case SYNC_INSN1_ORI: 11485 return "ori\t%0,%1,%2"; 11486 case SYNC_INSN1_XOR: 11487 return "xor\t%0,%1,%z2"; 11488 case SYNC_INSN1_XORI: 11489 return "xori\t%0,%1,%2"; 11490 } 11491 gcc_unreachable (); 11492 } 11493 11494 /* Return the asm template associated with sync_insn2 value TYPE. */ 11495 11496 static const char * 11497 mips_sync_insn2_template (enum attr_sync_insn2 type) 11498 { 11499 switch (type) 11500 { 11501 case SYNC_INSN2_NOP: 11502 gcc_unreachable (); 11503 case SYNC_INSN2_AND: 11504 return "and\t%0,%1,%z2"; 11505 case SYNC_INSN2_XOR: 11506 return "xor\t%0,%1,%z2"; 11507 case SYNC_INSN2_NOT: 11508 return "nor\t%0,%1,%."; 11509 } 11510 gcc_unreachable (); 11511 } 11512 11513 /* OPERANDS are the operands to a sync loop instruction and INDEX is 11514 the value of the one of the sync_* attributes. Return the operand 11515 referred to by the attribute, or DEFAULT_VALUE if the insn doesn't 11516 have the associated attribute. */ 11517 11518 static rtx 11519 mips_get_sync_operand (rtx *operands, int index, rtx default_value) 11520 { 11521 if (index > 0) 11522 default_value = operands[index - 1]; 11523 return default_value; 11524 } 11525 11526 /* INSN is a sync loop with operands OPERANDS. Build up a multi-insn 11527 sequence for it. */ 11528 11529 static void 11530 mips_process_sync_loop (rtx insn, rtx *operands) 11531 { 11532 rtx at, mem, oldval, newval, inclusive_mask, exclusive_mask; 11533 rtx required_oldval, insn1_op2, tmp1, tmp2, tmp3; 11534 unsigned int tmp3_insn; 11535 enum attr_sync_insn1 insn1; 11536 enum attr_sync_insn2 insn2; 11537 bool is_64bit_p; 11538 11539 /* Read an operand from the sync_WHAT attribute and store it in 11540 variable WHAT. DEFAULT is the default value if no attribute 11541 is specified. */ 11542 #define READ_OPERAND(WHAT, DEFAULT) \ 11543 WHAT = mips_get_sync_operand (operands, (int) get_attr_sync_##WHAT (insn), \ 11544 DEFAULT) 11545 11546 /* Read the memory. */ 11547 READ_OPERAND (mem, 0); 11548 gcc_assert (mem); 11549 is_64bit_p = (GET_MODE_BITSIZE (GET_MODE (mem)) == 64); 11550 11551 /* Read the other attributes. */ 11552 at = gen_rtx_REG (GET_MODE (mem), AT_REGNUM); 11553 READ_OPERAND (oldval, at); 11554 READ_OPERAND (newval, at); 11555 READ_OPERAND (inclusive_mask, 0); 11556 READ_OPERAND (exclusive_mask, 0); 11557 READ_OPERAND (required_oldval, 0); 11558 READ_OPERAND (insn1_op2, 0); 11559 insn1 = get_attr_sync_insn1 (insn); 11560 insn2 = get_attr_sync_insn2 (insn); 11561 11562 mips_multi_start (); 11563 11564 /* Output the release side of the memory barrier. */ 11565 if (get_attr_sync_release_barrier (insn) == SYNC_RELEASE_BARRIER_YES) 11566 { 11567 if (required_oldval == 0 && TARGET_OCTEON) 11568 { 11569 /* Octeon doesn't reorder reads, so a full barrier can be 11570 created by using SYNCW to order writes combined with the 11571 write from the following SC. When the SC successfully 11572 completes, we know that all preceding writes are also 11573 committed to the coherent memory system. It is possible 11574 for a single SYNCW to fail, but a pair of them will never 11575 fail, so we use two. */ 11576 mips_multi_add_insn ("syncw", NULL); 11577 mips_multi_add_insn ("syncw", NULL); 11578 } 11579 else 11580 mips_multi_add_insn ("sync", NULL); 11581 } 11582 11583 /* Output the branch-back label. */ 11584 mips_multi_add_label ("1:"); 11585 11586 /* OLDVAL = *MEM. */ 11587 mips_multi_add_insn (is_64bit_p ? "lld\t%0,%1" : "ll\t%0,%1", 11588 oldval, mem, NULL); 11589 11590 /* if ((OLDVAL & INCLUSIVE_MASK) != REQUIRED_OLDVAL) goto 2. */ 11591 if (required_oldval) 11592 { 11593 if (inclusive_mask == 0) 11594 tmp1 = oldval; 11595 else 11596 { 11597 gcc_assert (oldval != at); 11598 mips_multi_add_insn ("and\t%0,%1,%2", 11599 at, oldval, inclusive_mask, NULL); 11600 tmp1 = at; 11601 } 11602 mips_multi_add_insn ("bne\t%0,%z1,2f", tmp1, required_oldval, NULL); 11603 } 11604 11605 /* $TMP1 = OLDVAL & EXCLUSIVE_MASK. */ 11606 if (exclusive_mask == 0) 11607 tmp1 = const0_rtx; 11608 else 11609 { 11610 gcc_assert (oldval != at); 11611 mips_multi_add_insn ("and\t%0,%1,%z2", 11612 at, oldval, exclusive_mask, NULL); 11613 tmp1 = at; 11614 } 11615 11616 /* $TMP2 = INSN1 (OLDVAL, INSN1_OP2). 11617 11618 We can ignore moves if $TMP4 != INSN1_OP2, since we'll still emit 11619 at least one instruction in that case. */ 11620 if (insn1 == SYNC_INSN1_MOVE 11621 && (tmp1 != const0_rtx || insn2 != SYNC_INSN2_NOP)) 11622 tmp2 = insn1_op2; 11623 else 11624 { 11625 mips_multi_add_insn (mips_sync_insn1_template (insn1, is_64bit_p), 11626 newval, oldval, insn1_op2, NULL); 11627 tmp2 = newval; 11628 } 11629 11630 /* $TMP3 = INSN2 ($TMP2, INCLUSIVE_MASK). */ 11631 if (insn2 == SYNC_INSN2_NOP) 11632 tmp3 = tmp2; 11633 else 11634 { 11635 mips_multi_add_insn (mips_sync_insn2_template (insn2), 11636 newval, tmp2, inclusive_mask, NULL); 11637 tmp3 = newval; 11638 } 11639 tmp3_insn = mips_multi_last_index (); 11640 11641 /* $AT = $TMP1 | $TMP3. */ 11642 if (tmp1 == const0_rtx || tmp3 == const0_rtx) 11643 { 11644 mips_multi_set_operand (tmp3_insn, 0, at); 11645 tmp3 = at; 11646 } 11647 else 11648 { 11649 gcc_assert (tmp1 != tmp3); 11650 mips_multi_add_insn ("or\t%0,%1,%2", at, tmp1, tmp3, NULL); 11651 } 11652 11653 /* if (!commit (*MEM = $AT)) goto 1. 11654 11655 This will sometimes be a delayed branch; see the write code below 11656 for details. */ 11657 mips_multi_add_insn (is_64bit_p ? "scd\t%0,%1" : "sc\t%0,%1", at, mem, NULL); 11658 mips_multi_add_insn ("beq%?\t%0,%.,1b", at, NULL); 11659 11660 /* if (INSN1 != MOVE && INSN1 != LI) NEWVAL = $TMP3 [delay slot]. */ 11661 if (insn1 != SYNC_INSN1_MOVE && insn1 != SYNC_INSN1_LI && tmp3 != newval) 11662 { 11663 mips_multi_copy_insn (tmp3_insn); 11664 mips_multi_set_operand (mips_multi_last_index (), 0, newval); 11665 } 11666 else 11667 mips_multi_add_insn ("nop", NULL); 11668 11669 /* Output the acquire side of the memory barrier. */ 11670 if (TARGET_SYNC_AFTER_SC) 11671 mips_multi_add_insn ("sync", NULL); 11672 11673 /* Output the exit label, if needed. */ 11674 if (required_oldval) 11675 mips_multi_add_label ("2:"); 11676 11677 #undef READ_OPERAND 11678 } 11679 11680 /* Output and/or return the asm template for sync loop INSN, which has 11681 the operands given by OPERANDS. */ 11682 11683 const char * 11684 mips_output_sync_loop (rtx insn, rtx *operands) 11685 { 11686 mips_process_sync_loop (insn, operands); 11687 11688 /* Use branch-likely instructions to work around the LL/SC R10000 11689 errata. */ 11690 mips_branch_likely = TARGET_FIX_R10000; 11691 11692 mips_push_asm_switch (&mips_noreorder); 11693 mips_push_asm_switch (&mips_nomacro); 11694 mips_push_asm_switch (&mips_noat); 11695 mips_start_ll_sc_sync_block (); 11696 11697 mips_multi_write (); 11698 11699 mips_end_ll_sc_sync_block (); 11700 mips_pop_asm_switch (&mips_noat); 11701 mips_pop_asm_switch (&mips_nomacro); 11702 mips_pop_asm_switch (&mips_noreorder); 11703 11704 return ""; 11705 } 11706 11707 /* Return the number of individual instructions in sync loop INSN, 11708 which has the operands given by OPERANDS. */ 11709 11710 unsigned int 11711 mips_sync_loop_insns (rtx insn, rtx *operands) 11712 { 11713 mips_process_sync_loop (insn, operands); 11714 return mips_multi_num_insns; 11715 } 11716 11717 /* Return the assembly code for DIV or DDIV instruction DIVISION, which has 11718 the operands given by OPERANDS. Add in a divide-by-zero check if needed. 11719 11720 When working around R4000 and R4400 errata, we need to make sure that 11721 the division is not immediately followed by a shift[1][2]. We also 11722 need to stop the division from being put into a branch delay slot[3]. 11723 The easiest way to avoid both problems is to add a nop after the 11724 division. When a divide-by-zero check is needed, this nop can be 11725 used to fill the branch delay slot. 11726 11727 [1] If a double-word or a variable shift executes immediately 11728 after starting an integer division, the shift may give an 11729 incorrect result. See quotations of errata #16 and #28 from 11730 "MIPS R4000PC/SC Errata, Processor Revision 2.2 and 3.0" 11731 in mips.md for details. 11732 11733 [2] A similar bug to [1] exists for all revisions of the 11734 R4000 and the R4400 when run in an MC configuration. 11735 From "MIPS R4000MC Errata, Processor Revision 2.2 and 3.0": 11736 11737 "19. In this following sequence: 11738 11739 ddiv (or ddivu or div or divu) 11740 dsll32 (or dsrl32, dsra32) 11741 11742 if an MPT stall occurs, while the divide is slipping the cpu 11743 pipeline, then the following double shift would end up with an 11744 incorrect result. 11745 11746 Workaround: The compiler needs to avoid generating any 11747 sequence with divide followed by extended double shift." 11748 11749 This erratum is also present in "MIPS R4400MC Errata, Processor 11750 Revision 1.0" and "MIPS R4400MC Errata, Processor Revision 2.0 11751 & 3.0" as errata #10 and #4, respectively. 11752 11753 [3] From "MIPS R4000PC/SC Errata, Processor Revision 2.2 and 3.0" 11754 (also valid for MIPS R4000MC processors): 11755 11756 "52. R4000SC: This bug does not apply for the R4000PC. 11757 11758 There are two flavors of this bug: 11759 11760 1) If the instruction just after divide takes an RF exception 11761 (tlb-refill, tlb-invalid) and gets an instruction cache 11762 miss (both primary and secondary) and the line which is 11763 currently in secondary cache at this index had the first 11764 data word, where the bits 5..2 are set, then R4000 would 11765 get a wrong result for the div. 11766 11767 ##1 11768 nop 11769 div r8, r9 11770 ------------------- # end-of page. -tlb-refill 11771 nop 11772 ##2 11773 nop 11774 div r8, r9 11775 ------------------- # end-of page. -tlb-invalid 11776 nop 11777 11778 2) If the divide is in the taken branch delay slot, where the 11779 target takes RF exception and gets an I-cache miss for the 11780 exception vector or where I-cache miss occurs for the 11781 target address, under the above mentioned scenarios, the 11782 div would get wrong results. 11783 11784 ##1 11785 j r2 # to next page mapped or unmapped 11786 div r8,r9 # this bug would be there as long 11787 # as there is an ICache miss and 11788 nop # the "data pattern" is present 11789 11790 ##2 11791 beq r0, r0, NextPage # to Next page 11792 div r8,r9 11793 nop 11794 11795 This bug is present for div, divu, ddiv, and ddivu 11796 instructions. 11797 11798 Workaround: For item 1), OS could make sure that the next page 11799 after the divide instruction is also mapped. For item 2), the 11800 compiler could make sure that the divide instruction is not in 11801 the branch delay slot." 11802 11803 These processors have PRId values of 0x00004220 and 0x00004300 for 11804 the R4000 and 0x00004400, 0x00004500 and 0x00004600 for the R4400. */ 11805 11806 const char * 11807 mips_output_division (const char *division, rtx *operands) 11808 { 11809 const char *s; 11810 11811 s = division; 11812 if (TARGET_FIX_R4000 || TARGET_FIX_R4400) 11813 { 11814 output_asm_insn (s, operands); 11815 s = "nop"; 11816 } 11817 if (TARGET_CHECK_ZERO_DIV) 11818 { 11819 if (TARGET_MIPS16) 11820 { 11821 output_asm_insn (s, operands); 11822 s = "bnez\t%2,1f\n\tbreak\t7\n1:"; 11823 } 11824 else if (GENERATE_DIVIDE_TRAPS) 11825 { 11826 output_asm_insn (s, operands); 11827 s = "teq\t%2,%.,7"; 11828 } 11829 else 11830 { 11831 output_asm_insn ("%(bne\t%2,%.,1f", operands); 11832 output_asm_insn (s, operands); 11833 s = "break\t7%)\n1:"; 11834 } 11835 } 11836 return s; 11837 } 11838 11839 /* Return true if IN_INSN is a multiply-add or multiply-subtract 11840 instruction and if OUT_INSN assigns to the accumulator operand. */ 11841 11842 bool 11843 mips_linked_madd_p (rtx out_insn, rtx in_insn) 11844 { 11845 rtx x; 11846 11847 x = single_set (in_insn); 11848 if (x == 0) 11849 return false; 11850 11851 x = SET_SRC (x); 11852 11853 if (GET_CODE (x) == PLUS 11854 && GET_CODE (XEXP (x, 0)) == MULT 11855 && reg_set_p (XEXP (x, 1), out_insn)) 11856 return true; 11857 11858 if (GET_CODE (x) == MINUS 11859 && GET_CODE (XEXP (x, 1)) == MULT 11860 && reg_set_p (XEXP (x, 0), out_insn)) 11861 return true; 11862 11863 return false; 11864 } 11865 11866 /* True if the dependency between OUT_INSN and IN_INSN is on the store 11867 data rather than the address. We need this because the cprestore 11868 pattern is type "store", but is defined using an UNSPEC_VOLATILE, 11869 which causes the default routine to abort. We just return false 11870 for that case. */ 11871 11872 bool 11873 mips_store_data_bypass_p (rtx out_insn, rtx in_insn) 11874 { 11875 if (GET_CODE (PATTERN (in_insn)) == UNSPEC_VOLATILE) 11876 return false; 11877 11878 return !store_data_bypass_p (out_insn, in_insn); 11879 } 11880 11881 11882 /* Variables and flags used in scheduler hooks when tuning for 11883 Loongson 2E/2F. */ 11884 static struct 11885 { 11886 /* Variables to support Loongson 2E/2F round-robin [F]ALU1/2 dispatch 11887 strategy. */ 11888 11889 /* If true, then next ALU1/2 instruction will go to ALU1. */ 11890 bool alu1_turn_p; 11891 11892 /* If true, then next FALU1/2 unstruction will go to FALU1. */ 11893 bool falu1_turn_p; 11894 11895 /* Codes to query if [f]alu{1,2}_core units are subscribed or not. */ 11896 int alu1_core_unit_code; 11897 int alu2_core_unit_code; 11898 int falu1_core_unit_code; 11899 int falu2_core_unit_code; 11900 11901 /* True if current cycle has a multi instruction. 11902 This flag is used in mips_ls2_dfa_post_advance_cycle. */ 11903 bool cycle_has_multi_p; 11904 11905 /* Instructions to subscribe ls2_[f]alu{1,2}_turn_enabled units. 11906 These are used in mips_ls2_dfa_post_advance_cycle to initialize 11907 DFA state. 11908 E.g., when alu1_turn_enabled_insn is issued it makes next ALU1/2 11909 instruction to go ALU1. */ 11910 rtx alu1_turn_enabled_insn; 11911 rtx alu2_turn_enabled_insn; 11912 rtx falu1_turn_enabled_insn; 11913 rtx falu2_turn_enabled_insn; 11914 } mips_ls2; 11915 11916 /* Implement TARGET_SCHED_ADJUST_COST. We assume that anti and output 11917 dependencies have no cost, except on the 20Kc where output-dependence 11918 is treated like input-dependence. */ 11919 11920 static int 11921 mips_adjust_cost (rtx insn ATTRIBUTE_UNUSED, rtx link, 11922 rtx dep ATTRIBUTE_UNUSED, int cost) 11923 { 11924 if (REG_NOTE_KIND (link) == REG_DEP_OUTPUT 11925 && TUNE_20KC) 11926 return cost; 11927 if (REG_NOTE_KIND (link) != 0) 11928 return 0; 11929 return cost; 11930 } 11931 11932 /* Return the number of instructions that can be issued per cycle. */ 11933 11934 static int 11935 mips_issue_rate (void) 11936 { 11937 switch (mips_tune) 11938 { 11939 case PROCESSOR_74KC: 11940 case PROCESSOR_74KF2_1: 11941 case PROCESSOR_74KF1_1: 11942 case PROCESSOR_74KF3_2: 11943 /* The 74k is not strictly quad-issue cpu, but can be seen as one 11944 by the scheduler. It can issue 1 ALU, 1 AGEN and 2 FPU insns, 11945 but in reality only a maximum of 3 insns can be issued as 11946 floating-point loads and stores also require a slot in the 11947 AGEN pipe. */ 11948 case PROCESSOR_R10000: 11949 /* All R10K Processors are quad-issue (being the first MIPS 11950 processors to support this feature). */ 11951 return 4; 11952 11953 case PROCESSOR_20KC: 11954 case PROCESSOR_R4130: 11955 case PROCESSOR_R5400: 11956 case PROCESSOR_R5500: 11957 case PROCESSOR_R7000: 11958 case PROCESSOR_R9000: 11959 case PROCESSOR_OCTEON: 11960 return 2; 11961 11962 case PROCESSOR_SB1: 11963 case PROCESSOR_SB1A: 11964 /* This is actually 4, but we get better performance if we claim 3. 11965 This is partly because of unwanted speculative code motion with the 11966 larger number, and partly because in most common cases we can't 11967 reach the theoretical max of 4. */ 11968 return 3; 11969 11970 case PROCESSOR_LOONGSON_2E: 11971 case PROCESSOR_LOONGSON_2F: 11972 return 4; 11973 11974 default: 11975 return 1; 11976 } 11977 } 11978 11979 /* Implement TARGET_SCHED_INIT_DFA_POST_CYCLE_INSN hook for Loongson2. */ 11980 11981 static void 11982 mips_ls2_init_dfa_post_cycle_insn (void) 11983 { 11984 start_sequence (); 11985 emit_insn (gen_ls2_alu1_turn_enabled_insn ()); 11986 mips_ls2.alu1_turn_enabled_insn = get_insns (); 11987 end_sequence (); 11988 11989 start_sequence (); 11990 emit_insn (gen_ls2_alu2_turn_enabled_insn ()); 11991 mips_ls2.alu2_turn_enabled_insn = get_insns (); 11992 end_sequence (); 11993 11994 start_sequence (); 11995 emit_insn (gen_ls2_falu1_turn_enabled_insn ()); 11996 mips_ls2.falu1_turn_enabled_insn = get_insns (); 11997 end_sequence (); 11998 11999 start_sequence (); 12000 emit_insn (gen_ls2_falu2_turn_enabled_insn ()); 12001 mips_ls2.falu2_turn_enabled_insn = get_insns (); 12002 end_sequence (); 12003 12004 mips_ls2.alu1_core_unit_code = get_cpu_unit_code ("ls2_alu1_core"); 12005 mips_ls2.alu2_core_unit_code = get_cpu_unit_code ("ls2_alu2_core"); 12006 mips_ls2.falu1_core_unit_code = get_cpu_unit_code ("ls2_falu1_core"); 12007 mips_ls2.falu2_core_unit_code = get_cpu_unit_code ("ls2_falu2_core"); 12008 } 12009 12010 /* Implement TARGET_SCHED_INIT_DFA_POST_CYCLE_INSN hook. 12011 Init data used in mips_dfa_post_advance_cycle. */ 12012 12013 static void 12014 mips_init_dfa_post_cycle_insn (void) 12015 { 12016 if (TUNE_LOONGSON_2EF) 12017 mips_ls2_init_dfa_post_cycle_insn (); 12018 } 12019 12020 /* Initialize STATE when scheduling for Loongson 2E/2F. 12021 Support round-robin dispatch scheme by enabling only one of 12022 ALU1/ALU2 and one of FALU1/FALU2 units for ALU1/2 and FALU1/2 instructions 12023 respectively. */ 12024 12025 static void 12026 mips_ls2_dfa_post_advance_cycle (state_t state) 12027 { 12028 if (cpu_unit_reservation_p (state, mips_ls2.alu1_core_unit_code)) 12029 { 12030 /* Though there are no non-pipelined ALU1 insns, 12031 we can get an instruction of type 'multi' before reload. */ 12032 gcc_assert (mips_ls2.cycle_has_multi_p); 12033 mips_ls2.alu1_turn_p = false; 12034 } 12035 12036 mips_ls2.cycle_has_multi_p = false; 12037 12038 if (cpu_unit_reservation_p (state, mips_ls2.alu2_core_unit_code)) 12039 /* We have a non-pipelined alu instruction in the core, 12040 adjust round-robin counter. */ 12041 mips_ls2.alu1_turn_p = true; 12042 12043 if (mips_ls2.alu1_turn_p) 12044 { 12045 if (state_transition (state, mips_ls2.alu1_turn_enabled_insn) >= 0) 12046 gcc_unreachable (); 12047 } 12048 else 12049 { 12050 if (state_transition (state, mips_ls2.alu2_turn_enabled_insn) >= 0) 12051 gcc_unreachable (); 12052 } 12053 12054 if (cpu_unit_reservation_p (state, mips_ls2.falu1_core_unit_code)) 12055 { 12056 /* There are no non-pipelined FALU1 insns. */ 12057 gcc_unreachable (); 12058 mips_ls2.falu1_turn_p = false; 12059 } 12060 12061 if (cpu_unit_reservation_p (state, mips_ls2.falu2_core_unit_code)) 12062 /* We have a non-pipelined falu instruction in the core, 12063 adjust round-robin counter. */ 12064 mips_ls2.falu1_turn_p = true; 12065 12066 if (mips_ls2.falu1_turn_p) 12067 { 12068 if (state_transition (state, mips_ls2.falu1_turn_enabled_insn) >= 0) 12069 gcc_unreachable (); 12070 } 12071 else 12072 { 12073 if (state_transition (state, mips_ls2.falu2_turn_enabled_insn) >= 0) 12074 gcc_unreachable (); 12075 } 12076 } 12077 12078 /* Implement TARGET_SCHED_DFA_POST_ADVANCE_CYCLE. 12079 This hook is being called at the start of each cycle. */ 12080 12081 static void 12082 mips_dfa_post_advance_cycle (void) 12083 { 12084 if (TUNE_LOONGSON_2EF) 12085 mips_ls2_dfa_post_advance_cycle (curr_state); 12086 } 12087 12088 /* Implement TARGET_SCHED_FIRST_CYCLE_MULTIPASS_DFA_LOOKAHEAD. This should 12089 be as wide as the scheduling freedom in the DFA. */ 12090 12091 static int 12092 mips_multipass_dfa_lookahead (void) 12093 { 12094 /* Can schedule up to 4 of the 6 function units in any one cycle. */ 12095 if (TUNE_SB1) 12096 return 4; 12097 12098 if (TUNE_LOONGSON_2EF) 12099 return 4; 12100 12101 if (TUNE_OCTEON) 12102 return 2; 12103 12104 return 0; 12105 } 12106 12107 /* Remove the instruction at index LOWER from ready queue READY and 12108 reinsert it in front of the instruction at index HIGHER. LOWER must 12109 be <= HIGHER. */ 12110 12111 static void 12112 mips_promote_ready (rtx *ready, int lower, int higher) 12113 { 12114 rtx new_head; 12115 int i; 12116 12117 new_head = ready[lower]; 12118 for (i = lower; i < higher; i++) 12119 ready[i] = ready[i + 1]; 12120 ready[i] = new_head; 12121 } 12122 12123 /* If the priority of the instruction at POS2 in the ready queue READY 12124 is within LIMIT units of that of the instruction at POS1, swap the 12125 instructions if POS2 is not already less than POS1. */ 12126 12127 static void 12128 mips_maybe_swap_ready (rtx *ready, int pos1, int pos2, int limit) 12129 { 12130 if (pos1 < pos2 12131 && INSN_PRIORITY (ready[pos1]) + limit >= INSN_PRIORITY (ready[pos2])) 12132 { 12133 rtx temp; 12134 12135 temp = ready[pos1]; 12136 ready[pos1] = ready[pos2]; 12137 ready[pos2] = temp; 12138 } 12139 } 12140 12141 /* Used by TUNE_MACC_CHAINS to record the last scheduled instruction 12142 that may clobber hi or lo. */ 12143 static rtx mips_macc_chains_last_hilo; 12144 12145 /* A TUNE_MACC_CHAINS helper function. Record that instruction INSN has 12146 been scheduled, updating mips_macc_chains_last_hilo appropriately. */ 12147 12148 static void 12149 mips_macc_chains_record (rtx insn) 12150 { 12151 if (get_attr_may_clobber_hilo (insn)) 12152 mips_macc_chains_last_hilo = insn; 12153 } 12154 12155 /* A TUNE_MACC_CHAINS helper function. Search ready queue READY, which 12156 has NREADY elements, looking for a multiply-add or multiply-subtract 12157 instruction that is cumulative with mips_macc_chains_last_hilo. 12158 If there is one, promote it ahead of anything else that might 12159 clobber hi or lo. */ 12160 12161 static void 12162 mips_macc_chains_reorder (rtx *ready, int nready) 12163 { 12164 int i, j; 12165 12166 if (mips_macc_chains_last_hilo != 0) 12167 for (i = nready - 1; i >= 0; i--) 12168 if (mips_linked_madd_p (mips_macc_chains_last_hilo, ready[i])) 12169 { 12170 for (j = nready - 1; j > i; j--) 12171 if (recog_memoized (ready[j]) >= 0 12172 && get_attr_may_clobber_hilo (ready[j])) 12173 { 12174 mips_promote_ready (ready, i, j); 12175 break; 12176 } 12177 break; 12178 } 12179 } 12180 12181 /* The last instruction to be scheduled. */ 12182 static rtx vr4130_last_insn; 12183 12184 /* A note_stores callback used by vr4130_true_reg_dependence_p. DATA 12185 points to an rtx that is initially an instruction. Nullify the rtx 12186 if the instruction uses the value of register X. */ 12187 12188 static void 12189 vr4130_true_reg_dependence_p_1 (rtx x, const_rtx pat ATTRIBUTE_UNUSED, 12190 void *data) 12191 { 12192 rtx *insn_ptr; 12193 12194 insn_ptr = (rtx *) data; 12195 if (REG_P (x) 12196 && *insn_ptr != 0 12197 && reg_referenced_p (x, PATTERN (*insn_ptr))) 12198 *insn_ptr = 0; 12199 } 12200 12201 /* Return true if there is true register dependence between vr4130_last_insn 12202 and INSN. */ 12203 12204 static bool 12205 vr4130_true_reg_dependence_p (rtx insn) 12206 { 12207 note_stores (PATTERN (vr4130_last_insn), 12208 vr4130_true_reg_dependence_p_1, &insn); 12209 return insn == 0; 12210 } 12211 12212 /* A TUNE_MIPS4130 helper function. Given that INSN1 is at the head of 12213 the ready queue and that INSN2 is the instruction after it, return 12214 true if it is worth promoting INSN2 ahead of INSN1. Look for cases 12215 in which INSN1 and INSN2 can probably issue in parallel, but for 12216 which (INSN2, INSN1) should be less sensitive to instruction 12217 alignment than (INSN1, INSN2). See 4130.md for more details. */ 12218 12219 static bool 12220 vr4130_swap_insns_p (rtx insn1, rtx insn2) 12221 { 12222 sd_iterator_def sd_it; 12223 dep_t dep; 12224 12225 /* Check for the following case: 12226 12227 1) there is some other instruction X with an anti dependence on INSN1; 12228 2) X has a higher priority than INSN2; and 12229 3) X is an arithmetic instruction (and thus has no unit restrictions). 12230 12231 If INSN1 is the last instruction blocking X, it would better to 12232 choose (INSN1, X) over (INSN2, INSN1). */ 12233 FOR_EACH_DEP (insn1, SD_LIST_FORW, sd_it, dep) 12234 if (DEP_TYPE (dep) == REG_DEP_ANTI 12235 && INSN_PRIORITY (DEP_CON (dep)) > INSN_PRIORITY (insn2) 12236 && recog_memoized (DEP_CON (dep)) >= 0 12237 && get_attr_vr4130_class (DEP_CON (dep)) == VR4130_CLASS_ALU) 12238 return false; 12239 12240 if (vr4130_last_insn != 0 12241 && recog_memoized (insn1) >= 0 12242 && recog_memoized (insn2) >= 0) 12243 { 12244 /* See whether INSN1 and INSN2 use different execution units, 12245 or if they are both ALU-type instructions. If so, they can 12246 probably execute in parallel. */ 12247 enum attr_vr4130_class class1 = get_attr_vr4130_class (insn1); 12248 enum attr_vr4130_class class2 = get_attr_vr4130_class (insn2); 12249 if (class1 != class2 || class1 == VR4130_CLASS_ALU) 12250 { 12251 /* If only one of the instructions has a dependence on 12252 vr4130_last_insn, prefer to schedule the other one first. */ 12253 bool dep1_p = vr4130_true_reg_dependence_p (insn1); 12254 bool dep2_p = vr4130_true_reg_dependence_p (insn2); 12255 if (dep1_p != dep2_p) 12256 return dep1_p; 12257 12258 /* Prefer to schedule INSN2 ahead of INSN1 if vr4130_last_insn 12259 is not an ALU-type instruction and if INSN1 uses the same 12260 execution unit. (Note that if this condition holds, we already 12261 know that INSN2 uses a different execution unit.) */ 12262 if (class1 != VR4130_CLASS_ALU 12263 && recog_memoized (vr4130_last_insn) >= 0 12264 && class1 == get_attr_vr4130_class (vr4130_last_insn)) 12265 return true; 12266 } 12267 } 12268 return false; 12269 } 12270 12271 /* A TUNE_MIPS4130 helper function. (READY, NREADY) describes a ready 12272 queue with at least two instructions. Swap the first two if 12273 vr4130_swap_insns_p says that it could be worthwhile. */ 12274 12275 static void 12276 vr4130_reorder (rtx *ready, int nready) 12277 { 12278 if (vr4130_swap_insns_p (ready[nready - 1], ready[nready - 2])) 12279 mips_promote_ready (ready, nready - 2, nready - 1); 12280 } 12281 12282 /* Record whether last 74k AGEN instruction was a load or store. */ 12283 static enum attr_type mips_last_74k_agen_insn = TYPE_UNKNOWN; 12284 12285 /* Initialize mips_last_74k_agen_insn from INSN. A null argument 12286 resets to TYPE_UNKNOWN state. */ 12287 12288 static void 12289 mips_74k_agen_init (rtx insn) 12290 { 12291 if (!insn || CALL_P (insn) || JUMP_P (insn)) 12292 mips_last_74k_agen_insn = TYPE_UNKNOWN; 12293 else 12294 { 12295 enum attr_type type = get_attr_type (insn); 12296 if (type == TYPE_LOAD || type == TYPE_STORE) 12297 mips_last_74k_agen_insn = type; 12298 } 12299 } 12300 12301 /* A TUNE_74K helper function. The 74K AGEN pipeline likes multiple 12302 loads to be grouped together, and multiple stores to be grouped 12303 together. Swap things around in the ready queue to make this happen. */ 12304 12305 static void 12306 mips_74k_agen_reorder (rtx *ready, int nready) 12307 { 12308 int i; 12309 int store_pos, load_pos; 12310 12311 store_pos = -1; 12312 load_pos = -1; 12313 12314 for (i = nready - 1; i >= 0; i--) 12315 { 12316 rtx insn = ready[i]; 12317 if (USEFUL_INSN_P (insn)) 12318 switch (get_attr_type (insn)) 12319 { 12320 case TYPE_STORE: 12321 if (store_pos == -1) 12322 store_pos = i; 12323 break; 12324 12325 case TYPE_LOAD: 12326 if (load_pos == -1) 12327 load_pos = i; 12328 break; 12329 12330 default: 12331 break; 12332 } 12333 } 12334 12335 if (load_pos == -1 || store_pos == -1) 12336 return; 12337 12338 switch (mips_last_74k_agen_insn) 12339 { 12340 case TYPE_UNKNOWN: 12341 /* Prefer to schedule loads since they have a higher latency. */ 12342 case TYPE_LOAD: 12343 /* Swap loads to the front of the queue. */ 12344 mips_maybe_swap_ready (ready, load_pos, store_pos, 4); 12345 break; 12346 case TYPE_STORE: 12347 /* Swap stores to the front of the queue. */ 12348 mips_maybe_swap_ready (ready, store_pos, load_pos, 4); 12349 break; 12350 default: 12351 break; 12352 } 12353 } 12354 12355 /* Implement TARGET_SCHED_INIT. */ 12356 12357 static void 12358 mips_sched_init (FILE *file ATTRIBUTE_UNUSED, int verbose ATTRIBUTE_UNUSED, 12359 int max_ready ATTRIBUTE_UNUSED) 12360 { 12361 mips_macc_chains_last_hilo = 0; 12362 vr4130_last_insn = 0; 12363 mips_74k_agen_init (NULL_RTX); 12364 12365 /* When scheduling for Loongson2, branch instructions go to ALU1, 12366 therefore basic block is most likely to start with round-robin counter 12367 pointed to ALU2. */ 12368 mips_ls2.alu1_turn_p = false; 12369 mips_ls2.falu1_turn_p = true; 12370 } 12371 12372 /* Implement TARGET_SCHED_REORDER and TARGET_SCHED_REORDER2. */ 12373 12374 static int 12375 mips_sched_reorder (FILE *file ATTRIBUTE_UNUSED, int verbose ATTRIBUTE_UNUSED, 12376 rtx *ready, int *nreadyp, int cycle ATTRIBUTE_UNUSED) 12377 { 12378 if (!reload_completed 12379 && TUNE_MACC_CHAINS 12380 && *nreadyp > 0) 12381 mips_macc_chains_reorder (ready, *nreadyp); 12382 12383 if (reload_completed 12384 && TUNE_MIPS4130 12385 && !TARGET_VR4130_ALIGN 12386 && *nreadyp > 1) 12387 vr4130_reorder (ready, *nreadyp); 12388 12389 if (TUNE_74K) 12390 mips_74k_agen_reorder (ready, *nreadyp); 12391 12392 return mips_issue_rate (); 12393 } 12394 12395 /* Update round-robin counters for ALU1/2 and FALU1/2. */ 12396 12397 static void 12398 mips_ls2_variable_issue (rtx insn) 12399 { 12400 if (mips_ls2.alu1_turn_p) 12401 { 12402 if (cpu_unit_reservation_p (curr_state, mips_ls2.alu1_core_unit_code)) 12403 mips_ls2.alu1_turn_p = false; 12404 } 12405 else 12406 { 12407 if (cpu_unit_reservation_p (curr_state, mips_ls2.alu2_core_unit_code)) 12408 mips_ls2.alu1_turn_p = true; 12409 } 12410 12411 if (mips_ls2.falu1_turn_p) 12412 { 12413 if (cpu_unit_reservation_p (curr_state, mips_ls2.falu1_core_unit_code)) 12414 mips_ls2.falu1_turn_p = false; 12415 } 12416 else 12417 { 12418 if (cpu_unit_reservation_p (curr_state, mips_ls2.falu2_core_unit_code)) 12419 mips_ls2.falu1_turn_p = true; 12420 } 12421 12422 if (recog_memoized (insn) >= 0) 12423 mips_ls2.cycle_has_multi_p |= (get_attr_type (insn) == TYPE_MULTI); 12424 } 12425 12426 /* Implement TARGET_SCHED_VARIABLE_ISSUE. */ 12427 12428 static int 12429 mips_variable_issue (FILE *file ATTRIBUTE_UNUSED, int verbose ATTRIBUTE_UNUSED, 12430 rtx insn, int more) 12431 { 12432 /* Ignore USEs and CLOBBERs; don't count them against the issue rate. */ 12433 if (USEFUL_INSN_P (insn)) 12434 { 12435 if (get_attr_type (insn) != TYPE_GHOST) 12436 more--; 12437 if (!reload_completed && TUNE_MACC_CHAINS) 12438 mips_macc_chains_record (insn); 12439 vr4130_last_insn = insn; 12440 if (TUNE_74K) 12441 mips_74k_agen_init (insn); 12442 else if (TUNE_LOONGSON_2EF) 12443 mips_ls2_variable_issue (insn); 12444 } 12445 12446 /* Instructions of type 'multi' should all be split before 12447 the second scheduling pass. */ 12448 gcc_assert (!reload_completed 12449 || recog_memoized (insn) < 0 12450 || get_attr_type (insn) != TYPE_MULTI); 12451 12452 return more; 12453 } 12454 12455 /* Given that we have an rtx of the form (prefetch ... WRITE LOCALITY), 12456 return the first operand of the associated PREF or PREFX insn. */ 12457 12458 rtx 12459 mips_prefetch_cookie (rtx write, rtx locality) 12460 { 12461 /* store_streamed / load_streamed. */ 12462 if (INTVAL (locality) <= 0) 12463 return GEN_INT (INTVAL (write) + 4); 12464 12465 /* store / load. */ 12466 if (INTVAL (locality) <= 2) 12467 return write; 12468 12469 /* store_retained / load_retained. */ 12470 return GEN_INT (INTVAL (write) + 6); 12471 } 12472 12473 /* Flags that indicate when a built-in function is available. 12474 12475 BUILTIN_AVAIL_NON_MIPS16 12476 The function is available on the current target, but only 12477 in non-MIPS16 mode. */ 12478 #define BUILTIN_AVAIL_NON_MIPS16 1 12479 12480 /* Declare an availability predicate for built-in functions that 12481 require non-MIPS16 mode and also require COND to be true. 12482 NAME is the main part of the predicate's name. */ 12483 #define AVAIL_NON_MIPS16(NAME, COND) \ 12484 static unsigned int \ 12485 mips_builtin_avail_##NAME (void) \ 12486 { \ 12487 return (COND) ? BUILTIN_AVAIL_NON_MIPS16 : 0; \ 12488 } 12489 12490 /* This structure describes a single built-in function. */ 12491 struct mips_builtin_description { 12492 /* The code of the main .md file instruction. See mips_builtin_type 12493 for more information. */ 12494 enum insn_code icode; 12495 12496 /* The floating-point comparison code to use with ICODE, if any. */ 12497 enum mips_fp_condition cond; 12498 12499 /* The name of the built-in function. */ 12500 const char *name; 12501 12502 /* Specifies how the function should be expanded. */ 12503 enum mips_builtin_type builtin_type; 12504 12505 /* The function's prototype. */ 12506 enum mips_function_type function_type; 12507 12508 /* Whether the function is available. */ 12509 unsigned int (*avail) (void); 12510 }; 12511 12512 AVAIL_NON_MIPS16 (paired_single, TARGET_PAIRED_SINGLE_FLOAT) 12513 AVAIL_NON_MIPS16 (sb1_paired_single, TARGET_SB1 && TARGET_PAIRED_SINGLE_FLOAT) 12514 AVAIL_NON_MIPS16 (mips3d, TARGET_MIPS3D) 12515 AVAIL_NON_MIPS16 (dsp, TARGET_DSP) 12516 AVAIL_NON_MIPS16 (dspr2, TARGET_DSPR2) 12517 AVAIL_NON_MIPS16 (dsp_32, !TARGET_64BIT && TARGET_DSP) 12518 AVAIL_NON_MIPS16 (dspr2_32, !TARGET_64BIT && TARGET_DSPR2) 12519 AVAIL_NON_MIPS16 (loongson, TARGET_LOONGSON_VECTORS) 12520 AVAIL_NON_MIPS16 (cache, TARGET_CACHE_BUILTIN) 12521 12522 /* Construct a mips_builtin_description from the given arguments. 12523 12524 INSN is the name of the associated instruction pattern, without the 12525 leading CODE_FOR_mips_. 12526 12527 CODE is the floating-point condition code associated with the 12528 function. It can be 'f' if the field is not applicable. 12529 12530 NAME is the name of the function itself, without the leading 12531 "__builtin_mips_". 12532 12533 BUILTIN_TYPE and FUNCTION_TYPE are mips_builtin_description fields. 12534 12535 AVAIL is the name of the availability predicate, without the leading 12536 mips_builtin_avail_. */ 12537 #define MIPS_BUILTIN(INSN, COND, NAME, BUILTIN_TYPE, \ 12538 FUNCTION_TYPE, AVAIL) \ 12539 { CODE_FOR_mips_ ## INSN, MIPS_FP_COND_ ## COND, \ 12540 "__builtin_mips_" NAME, BUILTIN_TYPE, FUNCTION_TYPE, \ 12541 mips_builtin_avail_ ## AVAIL } 12542 12543 /* Define __builtin_mips_<INSN>, which is a MIPS_BUILTIN_DIRECT function 12544 mapped to instruction CODE_FOR_mips_<INSN>, FUNCTION_TYPE and AVAIL 12545 are as for MIPS_BUILTIN. */ 12546 #define DIRECT_BUILTIN(INSN, FUNCTION_TYPE, AVAIL) \ 12547 MIPS_BUILTIN (INSN, f, #INSN, MIPS_BUILTIN_DIRECT, FUNCTION_TYPE, AVAIL) 12548 12549 /* Define __builtin_mips_<INSN>_<COND>_{s,d} functions, both of which 12550 are subject to mips_builtin_avail_<AVAIL>. */ 12551 #define CMP_SCALAR_BUILTINS(INSN, COND, AVAIL) \ 12552 MIPS_BUILTIN (INSN ## _cond_s, COND, #INSN "_" #COND "_s", \ 12553 MIPS_BUILTIN_CMP_SINGLE, MIPS_INT_FTYPE_SF_SF, AVAIL), \ 12554 MIPS_BUILTIN (INSN ## _cond_d, COND, #INSN "_" #COND "_d", \ 12555 MIPS_BUILTIN_CMP_SINGLE, MIPS_INT_FTYPE_DF_DF, AVAIL) 12556 12557 /* Define __builtin_mips_{any,all,upper,lower}_<INSN>_<COND>_ps. 12558 The lower and upper forms are subject to mips_builtin_avail_<AVAIL> 12559 while the any and all forms are subject to mips_builtin_avail_mips3d. */ 12560 #define CMP_PS_BUILTINS(INSN, COND, AVAIL) \ 12561 MIPS_BUILTIN (INSN ## _cond_ps, COND, "any_" #INSN "_" #COND "_ps", \ 12562 MIPS_BUILTIN_CMP_ANY, MIPS_INT_FTYPE_V2SF_V2SF, \ 12563 mips3d), \ 12564 MIPS_BUILTIN (INSN ## _cond_ps, COND, "all_" #INSN "_" #COND "_ps", \ 12565 MIPS_BUILTIN_CMP_ALL, MIPS_INT_FTYPE_V2SF_V2SF, \ 12566 mips3d), \ 12567 MIPS_BUILTIN (INSN ## _cond_ps, COND, "lower_" #INSN "_" #COND "_ps", \ 12568 MIPS_BUILTIN_CMP_LOWER, MIPS_INT_FTYPE_V2SF_V2SF, \ 12569 AVAIL), \ 12570 MIPS_BUILTIN (INSN ## _cond_ps, COND, "upper_" #INSN "_" #COND "_ps", \ 12571 MIPS_BUILTIN_CMP_UPPER, MIPS_INT_FTYPE_V2SF_V2SF, \ 12572 AVAIL) 12573 12574 /* Define __builtin_mips_{any,all}_<INSN>_<COND>_4s. The functions 12575 are subject to mips_builtin_avail_mips3d. */ 12576 #define CMP_4S_BUILTINS(INSN, COND) \ 12577 MIPS_BUILTIN (INSN ## _cond_4s, COND, "any_" #INSN "_" #COND "_4s", \ 12578 MIPS_BUILTIN_CMP_ANY, \ 12579 MIPS_INT_FTYPE_V2SF_V2SF_V2SF_V2SF, mips3d), \ 12580 MIPS_BUILTIN (INSN ## _cond_4s, COND, "all_" #INSN "_" #COND "_4s", \ 12581 MIPS_BUILTIN_CMP_ALL, \ 12582 MIPS_INT_FTYPE_V2SF_V2SF_V2SF_V2SF, mips3d) 12583 12584 /* Define __builtin_mips_mov{t,f}_<INSN>_<COND>_ps. The comparison 12585 instruction requires mips_builtin_avail_<AVAIL>. */ 12586 #define MOVTF_BUILTINS(INSN, COND, AVAIL) \ 12587 MIPS_BUILTIN (INSN ## _cond_ps, COND, "movt_" #INSN "_" #COND "_ps", \ 12588 MIPS_BUILTIN_MOVT, MIPS_V2SF_FTYPE_V2SF_V2SF_V2SF_V2SF, \ 12589 AVAIL), \ 12590 MIPS_BUILTIN (INSN ## _cond_ps, COND, "movf_" #INSN "_" #COND "_ps", \ 12591 MIPS_BUILTIN_MOVF, MIPS_V2SF_FTYPE_V2SF_V2SF_V2SF_V2SF, \ 12592 AVAIL) 12593 12594 /* Define all the built-in functions related to C.cond.fmt condition COND. */ 12595 #define CMP_BUILTINS(COND) \ 12596 MOVTF_BUILTINS (c, COND, paired_single), \ 12597 MOVTF_BUILTINS (cabs, COND, mips3d), \ 12598 CMP_SCALAR_BUILTINS (cabs, COND, mips3d), \ 12599 CMP_PS_BUILTINS (c, COND, paired_single), \ 12600 CMP_PS_BUILTINS (cabs, COND, mips3d), \ 12601 CMP_4S_BUILTINS (c, COND), \ 12602 CMP_4S_BUILTINS (cabs, COND) 12603 12604 /* Define __builtin_mips_<INSN>, which is a MIPS_BUILTIN_DIRECT_NO_TARGET 12605 function mapped to instruction CODE_FOR_mips_<INSN>, FUNCTION_TYPE 12606 and AVAIL are as for MIPS_BUILTIN. */ 12607 #define DIRECT_NO_TARGET_BUILTIN(INSN, FUNCTION_TYPE, AVAIL) \ 12608 MIPS_BUILTIN (INSN, f, #INSN, MIPS_BUILTIN_DIRECT_NO_TARGET, \ 12609 FUNCTION_TYPE, AVAIL) 12610 12611 /* Define __builtin_mips_bposge<VALUE>. <VALUE> is 32 for the MIPS32 DSP 12612 branch instruction. AVAIL is as for MIPS_BUILTIN. */ 12613 #define BPOSGE_BUILTIN(VALUE, AVAIL) \ 12614 MIPS_BUILTIN (bposge, f, "bposge" #VALUE, \ 12615 MIPS_BUILTIN_BPOSGE ## VALUE, MIPS_SI_FTYPE_VOID, AVAIL) 12616 12617 /* Define a Loongson MIPS_BUILTIN_DIRECT function __builtin_loongson_<FN_NAME> 12618 for instruction CODE_FOR_loongson_<INSN>. FUNCTION_TYPE is a 12619 builtin_description field. */ 12620 #define LOONGSON_BUILTIN_ALIAS(INSN, FN_NAME, FUNCTION_TYPE) \ 12621 { CODE_FOR_loongson_ ## INSN, MIPS_FP_COND_f, \ 12622 "__builtin_loongson_" #FN_NAME, MIPS_BUILTIN_DIRECT, \ 12623 FUNCTION_TYPE, mips_builtin_avail_loongson } 12624 12625 /* Define a Loongson MIPS_BUILTIN_DIRECT function __builtin_loongson_<INSN> 12626 for instruction CODE_FOR_loongson_<INSN>. FUNCTION_TYPE is a 12627 builtin_description field. */ 12628 #define LOONGSON_BUILTIN(INSN, FUNCTION_TYPE) \ 12629 LOONGSON_BUILTIN_ALIAS (INSN, INSN, FUNCTION_TYPE) 12630 12631 /* Like LOONGSON_BUILTIN, but add _<SUFFIX> to the end of the function name. 12632 We use functions of this form when the same insn can be usefully applied 12633 to more than one datatype. */ 12634 #define LOONGSON_BUILTIN_SUFFIX(INSN, SUFFIX, FUNCTION_TYPE) \ 12635 LOONGSON_BUILTIN_ALIAS (INSN, INSN ## _ ## SUFFIX, FUNCTION_TYPE) 12636 12637 #define CODE_FOR_mips_sqrt_ps CODE_FOR_sqrtv2sf2 12638 #define CODE_FOR_mips_addq_ph CODE_FOR_addv2hi3 12639 #define CODE_FOR_mips_addu_qb CODE_FOR_addv4qi3 12640 #define CODE_FOR_mips_subq_ph CODE_FOR_subv2hi3 12641 #define CODE_FOR_mips_subu_qb CODE_FOR_subv4qi3 12642 #define CODE_FOR_mips_mul_ph CODE_FOR_mulv2hi3 12643 12644 #define CODE_FOR_loongson_packsswh CODE_FOR_vec_pack_ssat_v2si 12645 #define CODE_FOR_loongson_packsshb CODE_FOR_vec_pack_ssat_v4hi 12646 #define CODE_FOR_loongson_packushb CODE_FOR_vec_pack_usat_v4hi 12647 #define CODE_FOR_loongson_paddw CODE_FOR_addv2si3 12648 #define CODE_FOR_loongson_paddh CODE_FOR_addv4hi3 12649 #define CODE_FOR_loongson_paddb CODE_FOR_addv8qi3 12650 #define CODE_FOR_loongson_paddsh CODE_FOR_ssaddv4hi3 12651 #define CODE_FOR_loongson_paddsb CODE_FOR_ssaddv8qi3 12652 #define CODE_FOR_loongson_paddush CODE_FOR_usaddv4hi3 12653 #define CODE_FOR_loongson_paddusb CODE_FOR_usaddv8qi3 12654 #define CODE_FOR_loongson_pmaxsh CODE_FOR_smaxv4hi3 12655 #define CODE_FOR_loongson_pmaxub CODE_FOR_umaxv8qi3 12656 #define CODE_FOR_loongson_pminsh CODE_FOR_sminv4hi3 12657 #define CODE_FOR_loongson_pminub CODE_FOR_uminv8qi3 12658 #define CODE_FOR_loongson_pmulhuh CODE_FOR_umulv4hi3_highpart 12659 #define CODE_FOR_loongson_pmulhh CODE_FOR_smulv4hi3_highpart 12660 #define CODE_FOR_loongson_psubw CODE_FOR_subv2si3 12661 #define CODE_FOR_loongson_psubh CODE_FOR_subv4hi3 12662 #define CODE_FOR_loongson_psubb CODE_FOR_subv8qi3 12663 #define CODE_FOR_loongson_psubsh CODE_FOR_sssubv4hi3 12664 #define CODE_FOR_loongson_psubsb CODE_FOR_sssubv8qi3 12665 #define CODE_FOR_loongson_psubush CODE_FOR_ussubv4hi3 12666 #define CODE_FOR_loongson_psubusb CODE_FOR_ussubv8qi3 12667 #define CODE_FOR_loongson_punpckhbh CODE_FOR_vec_interleave_highv8qi 12668 #define CODE_FOR_loongson_punpckhhw CODE_FOR_vec_interleave_highv4hi 12669 #define CODE_FOR_loongson_punpckhwd CODE_FOR_vec_interleave_highv2si 12670 #define CODE_FOR_loongson_punpcklbh CODE_FOR_vec_interleave_lowv8qi 12671 #define CODE_FOR_loongson_punpcklhw CODE_FOR_vec_interleave_lowv4hi 12672 #define CODE_FOR_loongson_punpcklwd CODE_FOR_vec_interleave_lowv2si 12673 12674 static const struct mips_builtin_description mips_builtins[] = { 12675 DIRECT_BUILTIN (pll_ps, MIPS_V2SF_FTYPE_V2SF_V2SF, paired_single), 12676 DIRECT_BUILTIN (pul_ps, MIPS_V2SF_FTYPE_V2SF_V2SF, paired_single), 12677 DIRECT_BUILTIN (plu_ps, MIPS_V2SF_FTYPE_V2SF_V2SF, paired_single), 12678 DIRECT_BUILTIN (puu_ps, MIPS_V2SF_FTYPE_V2SF_V2SF, paired_single), 12679 DIRECT_BUILTIN (cvt_ps_s, MIPS_V2SF_FTYPE_SF_SF, paired_single), 12680 DIRECT_BUILTIN (cvt_s_pl, MIPS_SF_FTYPE_V2SF, paired_single), 12681 DIRECT_BUILTIN (cvt_s_pu, MIPS_SF_FTYPE_V2SF, paired_single), 12682 DIRECT_BUILTIN (abs_ps, MIPS_V2SF_FTYPE_V2SF, paired_single), 12683 12684 DIRECT_BUILTIN (alnv_ps, MIPS_V2SF_FTYPE_V2SF_V2SF_INT, paired_single), 12685 DIRECT_BUILTIN (addr_ps, MIPS_V2SF_FTYPE_V2SF_V2SF, mips3d), 12686 DIRECT_BUILTIN (mulr_ps, MIPS_V2SF_FTYPE_V2SF_V2SF, mips3d), 12687 DIRECT_BUILTIN (cvt_pw_ps, MIPS_V2SF_FTYPE_V2SF, mips3d), 12688 DIRECT_BUILTIN (cvt_ps_pw, MIPS_V2SF_FTYPE_V2SF, mips3d), 12689 12690 DIRECT_BUILTIN (recip1_s, MIPS_SF_FTYPE_SF, mips3d), 12691 DIRECT_BUILTIN (recip1_d, MIPS_DF_FTYPE_DF, mips3d), 12692 DIRECT_BUILTIN (recip1_ps, MIPS_V2SF_FTYPE_V2SF, mips3d), 12693 DIRECT_BUILTIN (recip2_s, MIPS_SF_FTYPE_SF_SF, mips3d), 12694 DIRECT_BUILTIN (recip2_d, MIPS_DF_FTYPE_DF_DF, mips3d), 12695 DIRECT_BUILTIN (recip2_ps, MIPS_V2SF_FTYPE_V2SF_V2SF, mips3d), 12696 12697 DIRECT_BUILTIN (rsqrt1_s, MIPS_SF_FTYPE_SF, mips3d), 12698 DIRECT_BUILTIN (rsqrt1_d, MIPS_DF_FTYPE_DF, mips3d), 12699 DIRECT_BUILTIN (rsqrt1_ps, MIPS_V2SF_FTYPE_V2SF, mips3d), 12700 DIRECT_BUILTIN (rsqrt2_s, MIPS_SF_FTYPE_SF_SF, mips3d), 12701 DIRECT_BUILTIN (rsqrt2_d, MIPS_DF_FTYPE_DF_DF, mips3d), 12702 DIRECT_BUILTIN (rsqrt2_ps, MIPS_V2SF_FTYPE_V2SF_V2SF, mips3d), 12703 12704 MIPS_FP_CONDITIONS (CMP_BUILTINS), 12705 12706 /* Built-in functions for the SB-1 processor. */ 12707 DIRECT_BUILTIN (sqrt_ps, MIPS_V2SF_FTYPE_V2SF, sb1_paired_single), 12708 12709 /* Built-in functions for the DSP ASE (32-bit and 64-bit). */ 12710 DIRECT_BUILTIN (addq_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dsp), 12711 DIRECT_BUILTIN (addq_s_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dsp), 12712 DIRECT_BUILTIN (addq_s_w, MIPS_SI_FTYPE_SI_SI, dsp), 12713 DIRECT_BUILTIN (addu_qb, MIPS_V4QI_FTYPE_V4QI_V4QI, dsp), 12714 DIRECT_BUILTIN (addu_s_qb, MIPS_V4QI_FTYPE_V4QI_V4QI, dsp), 12715 DIRECT_BUILTIN (subq_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dsp), 12716 DIRECT_BUILTIN (subq_s_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dsp), 12717 DIRECT_BUILTIN (subq_s_w, MIPS_SI_FTYPE_SI_SI, dsp), 12718 DIRECT_BUILTIN (subu_qb, MIPS_V4QI_FTYPE_V4QI_V4QI, dsp), 12719 DIRECT_BUILTIN (subu_s_qb, MIPS_V4QI_FTYPE_V4QI_V4QI, dsp), 12720 DIRECT_BUILTIN (addsc, MIPS_SI_FTYPE_SI_SI, dsp), 12721 DIRECT_BUILTIN (addwc, MIPS_SI_FTYPE_SI_SI, dsp), 12722 DIRECT_BUILTIN (modsub, MIPS_SI_FTYPE_SI_SI, dsp), 12723 DIRECT_BUILTIN (raddu_w_qb, MIPS_SI_FTYPE_V4QI, dsp), 12724 DIRECT_BUILTIN (absq_s_ph, MIPS_V2HI_FTYPE_V2HI, dsp), 12725 DIRECT_BUILTIN (absq_s_w, MIPS_SI_FTYPE_SI, dsp), 12726 DIRECT_BUILTIN (precrq_qb_ph, MIPS_V4QI_FTYPE_V2HI_V2HI, dsp), 12727 DIRECT_BUILTIN (precrq_ph_w, MIPS_V2HI_FTYPE_SI_SI, dsp), 12728 DIRECT_BUILTIN (precrq_rs_ph_w, MIPS_V2HI_FTYPE_SI_SI, dsp), 12729 DIRECT_BUILTIN (precrqu_s_qb_ph, MIPS_V4QI_FTYPE_V2HI_V2HI, dsp), 12730 DIRECT_BUILTIN (preceq_w_phl, MIPS_SI_FTYPE_V2HI, dsp), 12731 DIRECT_BUILTIN (preceq_w_phr, MIPS_SI_FTYPE_V2HI, dsp), 12732 DIRECT_BUILTIN (precequ_ph_qbl, MIPS_V2HI_FTYPE_V4QI, dsp), 12733 DIRECT_BUILTIN (precequ_ph_qbr, MIPS_V2HI_FTYPE_V4QI, dsp), 12734 DIRECT_BUILTIN (precequ_ph_qbla, MIPS_V2HI_FTYPE_V4QI, dsp), 12735 DIRECT_BUILTIN (precequ_ph_qbra, MIPS_V2HI_FTYPE_V4QI, dsp), 12736 DIRECT_BUILTIN (preceu_ph_qbl, MIPS_V2HI_FTYPE_V4QI, dsp), 12737 DIRECT_BUILTIN (preceu_ph_qbr, MIPS_V2HI_FTYPE_V4QI, dsp), 12738 DIRECT_BUILTIN (preceu_ph_qbla, MIPS_V2HI_FTYPE_V4QI, dsp), 12739 DIRECT_BUILTIN (preceu_ph_qbra, MIPS_V2HI_FTYPE_V4QI, dsp), 12740 DIRECT_BUILTIN (shll_qb, MIPS_V4QI_FTYPE_V4QI_SI, dsp), 12741 DIRECT_BUILTIN (shll_ph, MIPS_V2HI_FTYPE_V2HI_SI, dsp), 12742 DIRECT_BUILTIN (shll_s_ph, MIPS_V2HI_FTYPE_V2HI_SI, dsp), 12743 DIRECT_BUILTIN (shll_s_w, MIPS_SI_FTYPE_SI_SI, dsp), 12744 DIRECT_BUILTIN (shrl_qb, MIPS_V4QI_FTYPE_V4QI_SI, dsp), 12745 DIRECT_BUILTIN (shra_ph, MIPS_V2HI_FTYPE_V2HI_SI, dsp), 12746 DIRECT_BUILTIN (shra_r_ph, MIPS_V2HI_FTYPE_V2HI_SI, dsp), 12747 DIRECT_BUILTIN (shra_r_w, MIPS_SI_FTYPE_SI_SI, dsp), 12748 DIRECT_BUILTIN (muleu_s_ph_qbl, MIPS_V2HI_FTYPE_V4QI_V2HI, dsp), 12749 DIRECT_BUILTIN (muleu_s_ph_qbr, MIPS_V2HI_FTYPE_V4QI_V2HI, dsp), 12750 DIRECT_BUILTIN (mulq_rs_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dsp), 12751 DIRECT_BUILTIN (muleq_s_w_phl, MIPS_SI_FTYPE_V2HI_V2HI, dsp), 12752 DIRECT_BUILTIN (muleq_s_w_phr, MIPS_SI_FTYPE_V2HI_V2HI, dsp), 12753 DIRECT_BUILTIN (bitrev, MIPS_SI_FTYPE_SI, dsp), 12754 DIRECT_BUILTIN (insv, MIPS_SI_FTYPE_SI_SI, dsp), 12755 DIRECT_BUILTIN (repl_qb, MIPS_V4QI_FTYPE_SI, dsp), 12756 DIRECT_BUILTIN (repl_ph, MIPS_V2HI_FTYPE_SI, dsp), 12757 DIRECT_NO_TARGET_BUILTIN (cmpu_eq_qb, MIPS_VOID_FTYPE_V4QI_V4QI, dsp), 12758 DIRECT_NO_TARGET_BUILTIN (cmpu_lt_qb, MIPS_VOID_FTYPE_V4QI_V4QI, dsp), 12759 DIRECT_NO_TARGET_BUILTIN (cmpu_le_qb, MIPS_VOID_FTYPE_V4QI_V4QI, dsp), 12760 DIRECT_BUILTIN (cmpgu_eq_qb, MIPS_SI_FTYPE_V4QI_V4QI, dsp), 12761 DIRECT_BUILTIN (cmpgu_lt_qb, MIPS_SI_FTYPE_V4QI_V4QI, dsp), 12762 DIRECT_BUILTIN (cmpgu_le_qb, MIPS_SI_FTYPE_V4QI_V4QI, dsp), 12763 DIRECT_NO_TARGET_BUILTIN (cmp_eq_ph, MIPS_VOID_FTYPE_V2HI_V2HI, dsp), 12764 DIRECT_NO_TARGET_BUILTIN (cmp_lt_ph, MIPS_VOID_FTYPE_V2HI_V2HI, dsp), 12765 DIRECT_NO_TARGET_BUILTIN (cmp_le_ph, MIPS_VOID_FTYPE_V2HI_V2HI, dsp), 12766 DIRECT_BUILTIN (pick_qb, MIPS_V4QI_FTYPE_V4QI_V4QI, dsp), 12767 DIRECT_BUILTIN (pick_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dsp), 12768 DIRECT_BUILTIN (packrl_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dsp), 12769 DIRECT_NO_TARGET_BUILTIN (wrdsp, MIPS_VOID_FTYPE_SI_SI, dsp), 12770 DIRECT_BUILTIN (rddsp, MIPS_SI_FTYPE_SI, dsp), 12771 DIRECT_BUILTIN (lbux, MIPS_SI_FTYPE_POINTER_SI, dsp), 12772 DIRECT_BUILTIN (lhx, MIPS_SI_FTYPE_POINTER_SI, dsp), 12773 DIRECT_BUILTIN (lwx, MIPS_SI_FTYPE_POINTER_SI, dsp), 12774 BPOSGE_BUILTIN (32, dsp), 12775 12776 /* The following are for the MIPS DSP ASE REV 2 (32-bit and 64-bit). */ 12777 DIRECT_BUILTIN (absq_s_qb, MIPS_V4QI_FTYPE_V4QI, dspr2), 12778 DIRECT_BUILTIN (addu_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dspr2), 12779 DIRECT_BUILTIN (addu_s_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dspr2), 12780 DIRECT_BUILTIN (adduh_qb, MIPS_V4QI_FTYPE_V4QI_V4QI, dspr2), 12781 DIRECT_BUILTIN (adduh_r_qb, MIPS_V4QI_FTYPE_V4QI_V4QI, dspr2), 12782 DIRECT_BUILTIN (append, MIPS_SI_FTYPE_SI_SI_SI, dspr2), 12783 DIRECT_BUILTIN (balign, MIPS_SI_FTYPE_SI_SI_SI, dspr2), 12784 DIRECT_BUILTIN (cmpgdu_eq_qb, MIPS_SI_FTYPE_V4QI_V4QI, dspr2), 12785 DIRECT_BUILTIN (cmpgdu_lt_qb, MIPS_SI_FTYPE_V4QI_V4QI, dspr2), 12786 DIRECT_BUILTIN (cmpgdu_le_qb, MIPS_SI_FTYPE_V4QI_V4QI, dspr2), 12787 DIRECT_BUILTIN (mul_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dspr2), 12788 DIRECT_BUILTIN (mul_s_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dspr2), 12789 DIRECT_BUILTIN (mulq_rs_w, MIPS_SI_FTYPE_SI_SI, dspr2), 12790 DIRECT_BUILTIN (mulq_s_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dspr2), 12791 DIRECT_BUILTIN (mulq_s_w, MIPS_SI_FTYPE_SI_SI, dspr2), 12792 DIRECT_BUILTIN (precr_qb_ph, MIPS_V4QI_FTYPE_V2HI_V2HI, dspr2), 12793 DIRECT_BUILTIN (precr_sra_ph_w, MIPS_V2HI_FTYPE_SI_SI_SI, dspr2), 12794 DIRECT_BUILTIN (precr_sra_r_ph_w, MIPS_V2HI_FTYPE_SI_SI_SI, dspr2), 12795 DIRECT_BUILTIN (prepend, MIPS_SI_FTYPE_SI_SI_SI, dspr2), 12796 DIRECT_BUILTIN (shra_qb, MIPS_V4QI_FTYPE_V4QI_SI, dspr2), 12797 DIRECT_BUILTIN (shra_r_qb, MIPS_V4QI_FTYPE_V4QI_SI, dspr2), 12798 DIRECT_BUILTIN (shrl_ph, MIPS_V2HI_FTYPE_V2HI_SI, dspr2), 12799 DIRECT_BUILTIN (subu_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dspr2), 12800 DIRECT_BUILTIN (subu_s_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dspr2), 12801 DIRECT_BUILTIN (subuh_qb, MIPS_V4QI_FTYPE_V4QI_V4QI, dspr2), 12802 DIRECT_BUILTIN (subuh_r_qb, MIPS_V4QI_FTYPE_V4QI_V4QI, dspr2), 12803 DIRECT_BUILTIN (addqh_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dspr2), 12804 DIRECT_BUILTIN (addqh_r_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dspr2), 12805 DIRECT_BUILTIN (addqh_w, MIPS_SI_FTYPE_SI_SI, dspr2), 12806 DIRECT_BUILTIN (addqh_r_w, MIPS_SI_FTYPE_SI_SI, dspr2), 12807 DIRECT_BUILTIN (subqh_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dspr2), 12808 DIRECT_BUILTIN (subqh_r_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dspr2), 12809 DIRECT_BUILTIN (subqh_w, MIPS_SI_FTYPE_SI_SI, dspr2), 12810 DIRECT_BUILTIN (subqh_r_w, MIPS_SI_FTYPE_SI_SI, dspr2), 12811 12812 /* Built-in functions for the DSP ASE (32-bit only). */ 12813 DIRECT_BUILTIN (dpau_h_qbl, MIPS_DI_FTYPE_DI_V4QI_V4QI, dsp_32), 12814 DIRECT_BUILTIN (dpau_h_qbr, MIPS_DI_FTYPE_DI_V4QI_V4QI, dsp_32), 12815 DIRECT_BUILTIN (dpsu_h_qbl, MIPS_DI_FTYPE_DI_V4QI_V4QI, dsp_32), 12816 DIRECT_BUILTIN (dpsu_h_qbr, MIPS_DI_FTYPE_DI_V4QI_V4QI, dsp_32), 12817 DIRECT_BUILTIN (dpaq_s_w_ph, MIPS_DI_FTYPE_DI_V2HI_V2HI, dsp_32), 12818 DIRECT_BUILTIN (dpsq_s_w_ph, MIPS_DI_FTYPE_DI_V2HI_V2HI, dsp_32), 12819 DIRECT_BUILTIN (mulsaq_s_w_ph, MIPS_DI_FTYPE_DI_V2HI_V2HI, dsp_32), 12820 DIRECT_BUILTIN (dpaq_sa_l_w, MIPS_DI_FTYPE_DI_SI_SI, dsp_32), 12821 DIRECT_BUILTIN (dpsq_sa_l_w, MIPS_DI_FTYPE_DI_SI_SI, dsp_32), 12822 DIRECT_BUILTIN (maq_s_w_phl, MIPS_DI_FTYPE_DI_V2HI_V2HI, dsp_32), 12823 DIRECT_BUILTIN (maq_s_w_phr, MIPS_DI_FTYPE_DI_V2HI_V2HI, dsp_32), 12824 DIRECT_BUILTIN (maq_sa_w_phl, MIPS_DI_FTYPE_DI_V2HI_V2HI, dsp_32), 12825 DIRECT_BUILTIN (maq_sa_w_phr, MIPS_DI_FTYPE_DI_V2HI_V2HI, dsp_32), 12826 DIRECT_BUILTIN (extr_w, MIPS_SI_FTYPE_DI_SI, dsp_32), 12827 DIRECT_BUILTIN (extr_r_w, MIPS_SI_FTYPE_DI_SI, dsp_32), 12828 DIRECT_BUILTIN (extr_rs_w, MIPS_SI_FTYPE_DI_SI, dsp_32), 12829 DIRECT_BUILTIN (extr_s_h, MIPS_SI_FTYPE_DI_SI, dsp_32), 12830 DIRECT_BUILTIN (extp, MIPS_SI_FTYPE_DI_SI, dsp_32), 12831 DIRECT_BUILTIN (extpdp, MIPS_SI_FTYPE_DI_SI, dsp_32), 12832 DIRECT_BUILTIN (shilo, MIPS_DI_FTYPE_DI_SI, dsp_32), 12833 DIRECT_BUILTIN (mthlip, MIPS_DI_FTYPE_DI_SI, dsp_32), 12834 12835 /* The following are for the MIPS DSP ASE REV 2 (32-bit only). */ 12836 DIRECT_BUILTIN (dpa_w_ph, MIPS_DI_FTYPE_DI_V2HI_V2HI, dspr2_32), 12837 DIRECT_BUILTIN (dps_w_ph, MIPS_DI_FTYPE_DI_V2HI_V2HI, dspr2_32), 12838 DIRECT_BUILTIN (madd, MIPS_DI_FTYPE_DI_SI_SI, dspr2_32), 12839 DIRECT_BUILTIN (maddu, MIPS_DI_FTYPE_DI_USI_USI, dspr2_32), 12840 DIRECT_BUILTIN (msub, MIPS_DI_FTYPE_DI_SI_SI, dspr2_32), 12841 DIRECT_BUILTIN (msubu, MIPS_DI_FTYPE_DI_USI_USI, dspr2_32), 12842 DIRECT_BUILTIN (mulsa_w_ph, MIPS_DI_FTYPE_DI_V2HI_V2HI, dspr2_32), 12843 DIRECT_BUILTIN (mult, MIPS_DI_FTYPE_SI_SI, dspr2_32), 12844 DIRECT_BUILTIN (multu, MIPS_DI_FTYPE_USI_USI, dspr2_32), 12845 DIRECT_BUILTIN (dpax_w_ph, MIPS_DI_FTYPE_DI_V2HI_V2HI, dspr2_32), 12846 DIRECT_BUILTIN (dpsx_w_ph, MIPS_DI_FTYPE_DI_V2HI_V2HI, dspr2_32), 12847 DIRECT_BUILTIN (dpaqx_s_w_ph, MIPS_DI_FTYPE_DI_V2HI_V2HI, dspr2_32), 12848 DIRECT_BUILTIN (dpaqx_sa_w_ph, MIPS_DI_FTYPE_DI_V2HI_V2HI, dspr2_32), 12849 DIRECT_BUILTIN (dpsqx_s_w_ph, MIPS_DI_FTYPE_DI_V2HI_V2HI, dspr2_32), 12850 DIRECT_BUILTIN (dpsqx_sa_w_ph, MIPS_DI_FTYPE_DI_V2HI_V2HI, dspr2_32), 12851 12852 /* Builtin functions for ST Microelectronics Loongson-2E/2F cores. */ 12853 LOONGSON_BUILTIN (packsswh, MIPS_V4HI_FTYPE_V2SI_V2SI), 12854 LOONGSON_BUILTIN (packsshb, MIPS_V8QI_FTYPE_V4HI_V4HI), 12855 LOONGSON_BUILTIN (packushb, MIPS_UV8QI_FTYPE_UV4HI_UV4HI), 12856 LOONGSON_BUILTIN_SUFFIX (paddw, u, MIPS_UV2SI_FTYPE_UV2SI_UV2SI), 12857 LOONGSON_BUILTIN_SUFFIX (paddh, u, MIPS_UV4HI_FTYPE_UV4HI_UV4HI), 12858 LOONGSON_BUILTIN_SUFFIX (paddb, u, MIPS_UV8QI_FTYPE_UV8QI_UV8QI), 12859 LOONGSON_BUILTIN_SUFFIX (paddw, s, MIPS_V2SI_FTYPE_V2SI_V2SI), 12860 LOONGSON_BUILTIN_SUFFIX (paddh, s, MIPS_V4HI_FTYPE_V4HI_V4HI), 12861 LOONGSON_BUILTIN_SUFFIX (paddb, s, MIPS_V8QI_FTYPE_V8QI_V8QI), 12862 LOONGSON_BUILTIN_SUFFIX (paddd, u, MIPS_UDI_FTYPE_UDI_UDI), 12863 LOONGSON_BUILTIN_SUFFIX (paddd, s, MIPS_DI_FTYPE_DI_DI), 12864 LOONGSON_BUILTIN (paddsh, MIPS_V4HI_FTYPE_V4HI_V4HI), 12865 LOONGSON_BUILTIN (paddsb, MIPS_V8QI_FTYPE_V8QI_V8QI), 12866 LOONGSON_BUILTIN (paddush, MIPS_UV4HI_FTYPE_UV4HI_UV4HI), 12867 LOONGSON_BUILTIN (paddusb, MIPS_UV8QI_FTYPE_UV8QI_UV8QI), 12868 LOONGSON_BUILTIN_ALIAS (pandn_d, pandn_ud, MIPS_UDI_FTYPE_UDI_UDI), 12869 LOONGSON_BUILTIN_ALIAS (pandn_w, pandn_uw, MIPS_UV2SI_FTYPE_UV2SI_UV2SI), 12870 LOONGSON_BUILTIN_ALIAS (pandn_h, pandn_uh, MIPS_UV4HI_FTYPE_UV4HI_UV4HI), 12871 LOONGSON_BUILTIN_ALIAS (pandn_b, pandn_ub, MIPS_UV8QI_FTYPE_UV8QI_UV8QI), 12872 LOONGSON_BUILTIN_ALIAS (pandn_d, pandn_sd, MIPS_DI_FTYPE_DI_DI), 12873 LOONGSON_BUILTIN_ALIAS (pandn_w, pandn_sw, MIPS_V2SI_FTYPE_V2SI_V2SI), 12874 LOONGSON_BUILTIN_ALIAS (pandn_h, pandn_sh, MIPS_V4HI_FTYPE_V4HI_V4HI), 12875 LOONGSON_BUILTIN_ALIAS (pandn_b, pandn_sb, MIPS_V8QI_FTYPE_V8QI_V8QI), 12876 LOONGSON_BUILTIN (pavgh, MIPS_UV4HI_FTYPE_UV4HI_UV4HI), 12877 LOONGSON_BUILTIN (pavgb, MIPS_UV8QI_FTYPE_UV8QI_UV8QI), 12878 LOONGSON_BUILTIN_SUFFIX (pcmpeqw, u, MIPS_UV2SI_FTYPE_UV2SI_UV2SI), 12879 LOONGSON_BUILTIN_SUFFIX (pcmpeqh, u, MIPS_UV4HI_FTYPE_UV4HI_UV4HI), 12880 LOONGSON_BUILTIN_SUFFIX (pcmpeqb, u, MIPS_UV8QI_FTYPE_UV8QI_UV8QI), 12881 LOONGSON_BUILTIN_SUFFIX (pcmpeqw, s, MIPS_V2SI_FTYPE_V2SI_V2SI), 12882 LOONGSON_BUILTIN_SUFFIX (pcmpeqh, s, MIPS_V4HI_FTYPE_V4HI_V4HI), 12883 LOONGSON_BUILTIN_SUFFIX (pcmpeqb, s, MIPS_V8QI_FTYPE_V8QI_V8QI), 12884 LOONGSON_BUILTIN_SUFFIX (pcmpgtw, u, MIPS_UV2SI_FTYPE_UV2SI_UV2SI), 12885 LOONGSON_BUILTIN_SUFFIX (pcmpgth, u, MIPS_UV4HI_FTYPE_UV4HI_UV4HI), 12886 LOONGSON_BUILTIN_SUFFIX (pcmpgtb, u, MIPS_UV8QI_FTYPE_UV8QI_UV8QI), 12887 LOONGSON_BUILTIN_SUFFIX (pcmpgtw, s, MIPS_V2SI_FTYPE_V2SI_V2SI), 12888 LOONGSON_BUILTIN_SUFFIX (pcmpgth, s, MIPS_V4HI_FTYPE_V4HI_V4HI), 12889 LOONGSON_BUILTIN_SUFFIX (pcmpgtb, s, MIPS_V8QI_FTYPE_V8QI_V8QI), 12890 LOONGSON_BUILTIN_SUFFIX (pextrh, u, MIPS_UV4HI_FTYPE_UV4HI_USI), 12891 LOONGSON_BUILTIN_SUFFIX (pextrh, s, MIPS_V4HI_FTYPE_V4HI_USI), 12892 LOONGSON_BUILTIN_SUFFIX (pinsrh_0, u, MIPS_UV4HI_FTYPE_UV4HI_UV4HI), 12893 LOONGSON_BUILTIN_SUFFIX (pinsrh_1, u, MIPS_UV4HI_FTYPE_UV4HI_UV4HI), 12894 LOONGSON_BUILTIN_SUFFIX (pinsrh_2, u, MIPS_UV4HI_FTYPE_UV4HI_UV4HI), 12895 LOONGSON_BUILTIN_SUFFIX (pinsrh_3, u, MIPS_UV4HI_FTYPE_UV4HI_UV4HI), 12896 LOONGSON_BUILTIN_SUFFIX (pinsrh_0, s, MIPS_V4HI_FTYPE_V4HI_V4HI), 12897 LOONGSON_BUILTIN_SUFFIX (pinsrh_1, s, MIPS_V4HI_FTYPE_V4HI_V4HI), 12898 LOONGSON_BUILTIN_SUFFIX (pinsrh_2, s, MIPS_V4HI_FTYPE_V4HI_V4HI), 12899 LOONGSON_BUILTIN_SUFFIX (pinsrh_3, s, MIPS_V4HI_FTYPE_V4HI_V4HI), 12900 LOONGSON_BUILTIN (pmaddhw, MIPS_V2SI_FTYPE_V4HI_V4HI), 12901 LOONGSON_BUILTIN (pmaxsh, MIPS_V4HI_FTYPE_V4HI_V4HI), 12902 LOONGSON_BUILTIN (pmaxub, MIPS_UV8QI_FTYPE_UV8QI_UV8QI), 12903 LOONGSON_BUILTIN (pminsh, MIPS_V4HI_FTYPE_V4HI_V4HI), 12904 LOONGSON_BUILTIN (pminub, MIPS_UV8QI_FTYPE_UV8QI_UV8QI), 12905 LOONGSON_BUILTIN_SUFFIX (pmovmskb, u, MIPS_UV8QI_FTYPE_UV8QI), 12906 LOONGSON_BUILTIN_SUFFIX (pmovmskb, s, MIPS_V8QI_FTYPE_V8QI), 12907 LOONGSON_BUILTIN (pmulhuh, MIPS_UV4HI_FTYPE_UV4HI_UV4HI), 12908 LOONGSON_BUILTIN (pmulhh, MIPS_V4HI_FTYPE_V4HI_V4HI), 12909 LOONGSON_BUILTIN (pmullh, MIPS_V4HI_FTYPE_V4HI_V4HI), 12910 LOONGSON_BUILTIN (pmuluw, MIPS_UDI_FTYPE_UV2SI_UV2SI), 12911 LOONGSON_BUILTIN (pasubub, MIPS_UV8QI_FTYPE_UV8QI_UV8QI), 12912 LOONGSON_BUILTIN (biadd, MIPS_UV4HI_FTYPE_UV8QI), 12913 LOONGSON_BUILTIN (psadbh, MIPS_UV4HI_FTYPE_UV8QI_UV8QI), 12914 LOONGSON_BUILTIN_SUFFIX (pshufh, u, MIPS_UV4HI_FTYPE_UV4HI_UV4HI_UQI), 12915 LOONGSON_BUILTIN_SUFFIX (pshufh, s, MIPS_V4HI_FTYPE_V4HI_V4HI_UQI), 12916 LOONGSON_BUILTIN_SUFFIX (psllh, u, MIPS_UV4HI_FTYPE_UV4HI_UQI), 12917 LOONGSON_BUILTIN_SUFFIX (psllh, s, MIPS_V4HI_FTYPE_V4HI_UQI), 12918 LOONGSON_BUILTIN_SUFFIX (psllw, u, MIPS_UV2SI_FTYPE_UV2SI_UQI), 12919 LOONGSON_BUILTIN_SUFFIX (psllw, s, MIPS_V2SI_FTYPE_V2SI_UQI), 12920 LOONGSON_BUILTIN_SUFFIX (psrah, u, MIPS_UV4HI_FTYPE_UV4HI_UQI), 12921 LOONGSON_BUILTIN_SUFFIX (psrah, s, MIPS_V4HI_FTYPE_V4HI_UQI), 12922 LOONGSON_BUILTIN_SUFFIX (psraw, u, MIPS_UV2SI_FTYPE_UV2SI_UQI), 12923 LOONGSON_BUILTIN_SUFFIX (psraw, s, MIPS_V2SI_FTYPE_V2SI_UQI), 12924 LOONGSON_BUILTIN_SUFFIX (psrlh, u, MIPS_UV4HI_FTYPE_UV4HI_UQI), 12925 LOONGSON_BUILTIN_SUFFIX (psrlh, s, MIPS_V4HI_FTYPE_V4HI_UQI), 12926 LOONGSON_BUILTIN_SUFFIX (psrlw, u, MIPS_UV2SI_FTYPE_UV2SI_UQI), 12927 LOONGSON_BUILTIN_SUFFIX (psrlw, s, MIPS_V2SI_FTYPE_V2SI_UQI), 12928 LOONGSON_BUILTIN_SUFFIX (psubw, u, MIPS_UV2SI_FTYPE_UV2SI_UV2SI), 12929 LOONGSON_BUILTIN_SUFFIX (psubh, u, MIPS_UV4HI_FTYPE_UV4HI_UV4HI), 12930 LOONGSON_BUILTIN_SUFFIX (psubb, u, MIPS_UV8QI_FTYPE_UV8QI_UV8QI), 12931 LOONGSON_BUILTIN_SUFFIX (psubw, s, MIPS_V2SI_FTYPE_V2SI_V2SI), 12932 LOONGSON_BUILTIN_SUFFIX (psubh, s, MIPS_V4HI_FTYPE_V4HI_V4HI), 12933 LOONGSON_BUILTIN_SUFFIX (psubb, s, MIPS_V8QI_FTYPE_V8QI_V8QI), 12934 LOONGSON_BUILTIN_SUFFIX (psubd, u, MIPS_UDI_FTYPE_UDI_UDI), 12935 LOONGSON_BUILTIN_SUFFIX (psubd, s, MIPS_DI_FTYPE_DI_DI), 12936 LOONGSON_BUILTIN (psubsh, MIPS_V4HI_FTYPE_V4HI_V4HI), 12937 LOONGSON_BUILTIN (psubsb, MIPS_V8QI_FTYPE_V8QI_V8QI), 12938 LOONGSON_BUILTIN (psubush, MIPS_UV4HI_FTYPE_UV4HI_UV4HI), 12939 LOONGSON_BUILTIN (psubusb, MIPS_UV8QI_FTYPE_UV8QI_UV8QI), 12940 LOONGSON_BUILTIN_SUFFIX (punpckhbh, u, MIPS_UV8QI_FTYPE_UV8QI_UV8QI), 12941 LOONGSON_BUILTIN_SUFFIX (punpckhhw, u, MIPS_UV4HI_FTYPE_UV4HI_UV4HI), 12942 LOONGSON_BUILTIN_SUFFIX (punpckhwd, u, MIPS_UV2SI_FTYPE_UV2SI_UV2SI), 12943 LOONGSON_BUILTIN_SUFFIX (punpckhbh, s, MIPS_V8QI_FTYPE_V8QI_V8QI), 12944 LOONGSON_BUILTIN_SUFFIX (punpckhhw, s, MIPS_V4HI_FTYPE_V4HI_V4HI), 12945 LOONGSON_BUILTIN_SUFFIX (punpckhwd, s, MIPS_V2SI_FTYPE_V2SI_V2SI), 12946 LOONGSON_BUILTIN_SUFFIX (punpcklbh, u, MIPS_UV8QI_FTYPE_UV8QI_UV8QI), 12947 LOONGSON_BUILTIN_SUFFIX (punpcklhw, u, MIPS_UV4HI_FTYPE_UV4HI_UV4HI), 12948 LOONGSON_BUILTIN_SUFFIX (punpcklwd, u, MIPS_UV2SI_FTYPE_UV2SI_UV2SI), 12949 LOONGSON_BUILTIN_SUFFIX (punpcklbh, s, MIPS_V8QI_FTYPE_V8QI_V8QI), 12950 LOONGSON_BUILTIN_SUFFIX (punpcklhw, s, MIPS_V4HI_FTYPE_V4HI_V4HI), 12951 LOONGSON_BUILTIN_SUFFIX (punpcklwd, s, MIPS_V2SI_FTYPE_V2SI_V2SI), 12952 12953 /* Sundry other built-in functions. */ 12954 DIRECT_NO_TARGET_BUILTIN (cache, MIPS_VOID_FTYPE_SI_CVPOINTER, cache) 12955 }; 12956 12957 /* MODE is a vector mode whose elements have type TYPE. Return the type 12958 of the vector itself. */ 12959 12960 static tree 12961 mips_builtin_vector_type (tree type, enum machine_mode mode) 12962 { 12963 static tree types[2 * (int) MAX_MACHINE_MODE]; 12964 int mode_index; 12965 12966 mode_index = (int) mode; 12967 12968 if (TREE_CODE (type) == INTEGER_TYPE && TYPE_UNSIGNED (type)) 12969 mode_index += MAX_MACHINE_MODE; 12970 12971 if (types[mode_index] == NULL_TREE) 12972 types[mode_index] = build_vector_type_for_mode (type, mode); 12973 return types[mode_index]; 12974 } 12975 12976 /* Return a type for 'const volatile void *'. */ 12977 12978 static tree 12979 mips_build_cvpointer_type (void) 12980 { 12981 static tree cache; 12982 12983 if (cache == NULL_TREE) 12984 cache = build_pointer_type (build_qualified_type 12985 (void_type_node, 12986 TYPE_QUAL_CONST | TYPE_QUAL_VOLATILE)); 12987 return cache; 12988 } 12989 12990 /* Source-level argument types. */ 12991 #define MIPS_ATYPE_VOID void_type_node 12992 #define MIPS_ATYPE_INT integer_type_node 12993 #define MIPS_ATYPE_POINTER ptr_type_node 12994 #define MIPS_ATYPE_CVPOINTER mips_build_cvpointer_type () 12995 12996 /* Standard mode-based argument types. */ 12997 #define MIPS_ATYPE_UQI unsigned_intQI_type_node 12998 #define MIPS_ATYPE_SI intSI_type_node 12999 #define MIPS_ATYPE_USI unsigned_intSI_type_node 13000 #define MIPS_ATYPE_DI intDI_type_node 13001 #define MIPS_ATYPE_UDI unsigned_intDI_type_node 13002 #define MIPS_ATYPE_SF float_type_node 13003 #define MIPS_ATYPE_DF double_type_node 13004 13005 /* Vector argument types. */ 13006 #define MIPS_ATYPE_V2SF mips_builtin_vector_type (float_type_node, V2SFmode) 13007 #define MIPS_ATYPE_V2HI mips_builtin_vector_type (intHI_type_node, V2HImode) 13008 #define MIPS_ATYPE_V2SI mips_builtin_vector_type (intSI_type_node, V2SImode) 13009 #define MIPS_ATYPE_V4QI mips_builtin_vector_type (intQI_type_node, V4QImode) 13010 #define MIPS_ATYPE_V4HI mips_builtin_vector_type (intHI_type_node, V4HImode) 13011 #define MIPS_ATYPE_V8QI mips_builtin_vector_type (intQI_type_node, V8QImode) 13012 #define MIPS_ATYPE_UV2SI \ 13013 mips_builtin_vector_type (unsigned_intSI_type_node, V2SImode) 13014 #define MIPS_ATYPE_UV4HI \ 13015 mips_builtin_vector_type (unsigned_intHI_type_node, V4HImode) 13016 #define MIPS_ATYPE_UV8QI \ 13017 mips_builtin_vector_type (unsigned_intQI_type_node, V8QImode) 13018 13019 /* MIPS_FTYPE_ATYPESN takes N MIPS_FTYPES-like type codes and lists 13020 their associated MIPS_ATYPEs. */ 13021 #define MIPS_FTYPE_ATYPES1(A, B) \ 13022 MIPS_ATYPE_##A, MIPS_ATYPE_##B 13023 13024 #define MIPS_FTYPE_ATYPES2(A, B, C) \ 13025 MIPS_ATYPE_##A, MIPS_ATYPE_##B, MIPS_ATYPE_##C 13026 13027 #define MIPS_FTYPE_ATYPES3(A, B, C, D) \ 13028 MIPS_ATYPE_##A, MIPS_ATYPE_##B, MIPS_ATYPE_##C, MIPS_ATYPE_##D 13029 13030 #define MIPS_FTYPE_ATYPES4(A, B, C, D, E) \ 13031 MIPS_ATYPE_##A, MIPS_ATYPE_##B, MIPS_ATYPE_##C, MIPS_ATYPE_##D, \ 13032 MIPS_ATYPE_##E 13033 13034 /* Return the function type associated with function prototype TYPE. */ 13035 13036 static tree 13037 mips_build_function_type (enum mips_function_type type) 13038 { 13039 static tree types[(int) MIPS_MAX_FTYPE_MAX]; 13040 13041 if (types[(int) type] == NULL_TREE) 13042 switch (type) 13043 { 13044 #define DEF_MIPS_FTYPE(NUM, ARGS) \ 13045 case MIPS_FTYPE_NAME##NUM ARGS: \ 13046 types[(int) type] \ 13047 = build_function_type_list (MIPS_FTYPE_ATYPES##NUM ARGS, \ 13048 NULL_TREE); \ 13049 break; 13050 #include "config/mips/mips-ftypes.def" 13051 #undef DEF_MIPS_FTYPE 13052 default: 13053 gcc_unreachable (); 13054 } 13055 13056 return types[(int) type]; 13057 } 13058 13059 /* Implement TARGET_INIT_BUILTINS. */ 13060 13061 static void 13062 mips_init_builtins (void) 13063 { 13064 const struct mips_builtin_description *d; 13065 unsigned int i; 13066 13067 /* Iterate through all of the bdesc arrays, initializing all of the 13068 builtin functions. */ 13069 for (i = 0; i < ARRAY_SIZE (mips_builtins); i++) 13070 { 13071 d = &mips_builtins[i]; 13072 if (d->avail ()) 13073 add_builtin_function (d->name, 13074 mips_build_function_type (d->function_type), 13075 i, BUILT_IN_MD, NULL, NULL); 13076 } 13077 } 13078 13079 /* Take argument ARGNO from EXP's argument list and convert it into a 13080 form suitable for input operand OPNO of instruction ICODE. Return the 13081 value. */ 13082 13083 static rtx 13084 mips_prepare_builtin_arg (enum insn_code icode, 13085 unsigned int opno, tree exp, unsigned int argno) 13086 { 13087 tree arg; 13088 rtx value; 13089 enum machine_mode mode; 13090 13091 arg = CALL_EXPR_ARG (exp, argno); 13092 value = expand_normal (arg); 13093 mode = insn_data[icode].operand[opno].mode; 13094 if (!insn_data[icode].operand[opno].predicate (value, mode)) 13095 { 13096 /* We need to get the mode from ARG for two reasons: 13097 13098 - to cope with address operands, where MODE is the mode of the 13099 memory, rather than of VALUE itself. 13100 13101 - to cope with special predicates like pmode_register_operand, 13102 where MODE is VOIDmode. */ 13103 value = copy_to_mode_reg (TYPE_MODE (TREE_TYPE (arg)), value); 13104 13105 /* Check the predicate again. */ 13106 if (!insn_data[icode].operand[opno].predicate (value, mode)) 13107 { 13108 error ("invalid argument to built-in function"); 13109 return const0_rtx; 13110 } 13111 } 13112 13113 return value; 13114 } 13115 13116 /* Return an rtx suitable for output operand OP of instruction ICODE. 13117 If TARGET is non-null, try to use it where possible. */ 13118 13119 static rtx 13120 mips_prepare_builtin_target (enum insn_code icode, unsigned int op, rtx target) 13121 { 13122 enum machine_mode mode; 13123 13124 mode = insn_data[icode].operand[op].mode; 13125 if (target == 0 || !insn_data[icode].operand[op].predicate (target, mode)) 13126 target = gen_reg_rtx (mode); 13127 13128 return target; 13129 } 13130 13131 /* Expand a MIPS_BUILTIN_DIRECT or MIPS_BUILTIN_DIRECT_NO_TARGET function; 13132 HAS_TARGET_P says which. EXP is the CALL_EXPR that calls the function 13133 and ICODE is the code of the associated .md pattern. TARGET, if nonnull, 13134 suggests a good place to put the result. */ 13135 13136 static rtx 13137 mips_expand_builtin_direct (enum insn_code icode, rtx target, tree exp, 13138 bool has_target_p) 13139 { 13140 rtx ops[MAX_RECOG_OPERANDS]; 13141 int opno, argno; 13142 13143 /* Map any target to operand 0. */ 13144 opno = 0; 13145 if (has_target_p) 13146 { 13147 target = mips_prepare_builtin_target (icode, opno, target); 13148 ops[opno] = target; 13149 opno++; 13150 } 13151 13152 /* Map the arguments to the other operands. The n_operands value 13153 for an expander includes match_dups and match_scratches as well as 13154 match_operands, so n_operands is only an upper bound on the number 13155 of arguments to the expander function. */ 13156 gcc_assert (opno + call_expr_nargs (exp) <= insn_data[icode].n_operands); 13157 for (argno = 0; argno < call_expr_nargs (exp); argno++, opno++) 13158 ops[opno] = mips_prepare_builtin_arg (icode, opno, exp, argno); 13159 13160 switch (opno) 13161 { 13162 case 2: 13163 emit_insn (GEN_FCN (icode) (ops[0], ops[1])); 13164 break; 13165 13166 case 3: 13167 emit_insn (GEN_FCN (icode) (ops[0], ops[1], ops[2])); 13168 break; 13169 13170 case 4: 13171 emit_insn (GEN_FCN (icode) (ops[0], ops[1], ops[2], ops[3])); 13172 break; 13173 13174 default: 13175 gcc_unreachable (); 13176 } 13177 return target; 13178 } 13179 13180 /* Expand a __builtin_mips_movt_*_ps or __builtin_mips_movf_*_ps 13181 function; TYPE says which. EXP is the CALL_EXPR that calls the 13182 function, ICODE is the instruction that should be used to compare 13183 the first two arguments, and COND is the condition it should test. 13184 TARGET, if nonnull, suggests a good place to put the result. */ 13185 13186 static rtx 13187 mips_expand_builtin_movtf (enum mips_builtin_type type, 13188 enum insn_code icode, enum mips_fp_condition cond, 13189 rtx target, tree exp) 13190 { 13191 rtx cmp_result, op0, op1; 13192 13193 cmp_result = mips_prepare_builtin_target (icode, 0, 0); 13194 op0 = mips_prepare_builtin_arg (icode, 1, exp, 0); 13195 op1 = mips_prepare_builtin_arg (icode, 2, exp, 1); 13196 emit_insn (GEN_FCN (icode) (cmp_result, op0, op1, GEN_INT (cond))); 13197 13198 icode = CODE_FOR_mips_cond_move_tf_ps; 13199 target = mips_prepare_builtin_target (icode, 0, target); 13200 if (type == MIPS_BUILTIN_MOVT) 13201 { 13202 op1 = mips_prepare_builtin_arg (icode, 2, exp, 2); 13203 op0 = mips_prepare_builtin_arg (icode, 1, exp, 3); 13204 } 13205 else 13206 { 13207 op0 = mips_prepare_builtin_arg (icode, 1, exp, 2); 13208 op1 = mips_prepare_builtin_arg (icode, 2, exp, 3); 13209 } 13210 emit_insn (gen_mips_cond_move_tf_ps (target, op0, op1, cmp_result)); 13211 return target; 13212 } 13213 13214 /* Move VALUE_IF_TRUE into TARGET if CONDITION is true; move VALUE_IF_FALSE 13215 into TARGET otherwise. Return TARGET. */ 13216 13217 static rtx 13218 mips_builtin_branch_and_move (rtx condition, rtx target, 13219 rtx value_if_true, rtx value_if_false) 13220 { 13221 rtx true_label, done_label; 13222 13223 true_label = gen_label_rtx (); 13224 done_label = gen_label_rtx (); 13225 13226 /* First assume that CONDITION is false. */ 13227 mips_emit_move (target, value_if_false); 13228 13229 /* Branch to TRUE_LABEL if CONDITION is true and DONE_LABEL otherwise. */ 13230 emit_jump_insn (gen_condjump (condition, true_label)); 13231 emit_jump_insn (gen_jump (done_label)); 13232 emit_barrier (); 13233 13234 /* Fix TARGET if CONDITION is true. */ 13235 emit_label (true_label); 13236 mips_emit_move (target, value_if_true); 13237 13238 emit_label (done_label); 13239 return target; 13240 } 13241 13242 /* Expand a comparison built-in function of type BUILTIN_TYPE. EXP is 13243 the CALL_EXPR that calls the function, ICODE is the code of the 13244 comparison instruction, and COND is the condition it should test. 13245 TARGET, if nonnull, suggests a good place to put the boolean result. */ 13246 13247 static rtx 13248 mips_expand_builtin_compare (enum mips_builtin_type builtin_type, 13249 enum insn_code icode, enum mips_fp_condition cond, 13250 rtx target, tree exp) 13251 { 13252 rtx offset, condition, cmp_result, args[MAX_RECOG_OPERANDS]; 13253 int argno; 13254 13255 if (target == 0 || GET_MODE (target) != SImode) 13256 target = gen_reg_rtx (SImode); 13257 13258 /* The instruction should have a target operand, an operand for each 13259 argument, and an operand for COND. */ 13260 gcc_assert (call_expr_nargs (exp) + 2 == insn_data[icode].n_operands); 13261 13262 /* Prepare the operands to the comparison. */ 13263 cmp_result = mips_prepare_builtin_target (icode, 0, 0); 13264 for (argno = 0; argno < call_expr_nargs (exp); argno++) 13265 args[argno] = mips_prepare_builtin_arg (icode, argno + 1, exp, argno); 13266 13267 switch (insn_data[icode].n_operands) 13268 { 13269 case 4: 13270 emit_insn (GEN_FCN (icode) (cmp_result, args[0], args[1], 13271 GEN_INT (cond))); 13272 break; 13273 13274 case 6: 13275 emit_insn (GEN_FCN (icode) (cmp_result, args[0], args[1], 13276 args[2], args[3], GEN_INT (cond))); 13277 break; 13278 13279 default: 13280 gcc_unreachable (); 13281 } 13282 13283 /* If the comparison sets more than one register, we define the result 13284 to be 0 if all registers are false and -1 if all registers are true. 13285 The value of the complete result is indeterminate otherwise. */ 13286 switch (builtin_type) 13287 { 13288 case MIPS_BUILTIN_CMP_ALL: 13289 condition = gen_rtx_NE (VOIDmode, cmp_result, constm1_rtx); 13290 return mips_builtin_branch_and_move (condition, target, 13291 const0_rtx, const1_rtx); 13292 13293 case MIPS_BUILTIN_CMP_UPPER: 13294 case MIPS_BUILTIN_CMP_LOWER: 13295 offset = GEN_INT (builtin_type == MIPS_BUILTIN_CMP_UPPER); 13296 condition = gen_single_cc (cmp_result, offset); 13297 return mips_builtin_branch_and_move (condition, target, 13298 const1_rtx, const0_rtx); 13299 13300 default: 13301 condition = gen_rtx_NE (VOIDmode, cmp_result, const0_rtx); 13302 return mips_builtin_branch_and_move (condition, target, 13303 const1_rtx, const0_rtx); 13304 } 13305 } 13306 13307 /* Expand a bposge built-in function of type BUILTIN_TYPE. TARGET, 13308 if nonnull, suggests a good place to put the boolean result. */ 13309 13310 static rtx 13311 mips_expand_builtin_bposge (enum mips_builtin_type builtin_type, rtx target) 13312 { 13313 rtx condition, cmp_result; 13314 int cmp_value; 13315 13316 if (target == 0 || GET_MODE (target) != SImode) 13317 target = gen_reg_rtx (SImode); 13318 13319 cmp_result = gen_rtx_REG (CCDSPmode, CCDSP_PO_REGNUM); 13320 13321 if (builtin_type == MIPS_BUILTIN_BPOSGE32) 13322 cmp_value = 32; 13323 else 13324 gcc_assert (0); 13325 13326 condition = gen_rtx_GE (VOIDmode, cmp_result, GEN_INT (cmp_value)); 13327 return mips_builtin_branch_and_move (condition, target, 13328 const1_rtx, const0_rtx); 13329 } 13330 13331 /* Implement TARGET_EXPAND_BUILTIN. */ 13332 13333 static rtx 13334 mips_expand_builtin (tree exp, rtx target, rtx subtarget ATTRIBUTE_UNUSED, 13335 enum machine_mode mode, int ignore) 13336 { 13337 tree fndecl; 13338 unsigned int fcode, avail; 13339 const struct mips_builtin_description *d; 13340 13341 fndecl = TREE_OPERAND (CALL_EXPR_FN (exp), 0); 13342 fcode = DECL_FUNCTION_CODE (fndecl); 13343 gcc_assert (fcode < ARRAY_SIZE (mips_builtins)); 13344 d = &mips_builtins[fcode]; 13345 avail = d->avail (); 13346 gcc_assert (avail != 0); 13347 if (TARGET_MIPS16) 13348 { 13349 error ("built-in function %qE not supported for MIPS16", 13350 DECL_NAME (fndecl)); 13351 return ignore ? const0_rtx : CONST0_RTX (mode); 13352 } 13353 switch (d->builtin_type) 13354 { 13355 case MIPS_BUILTIN_DIRECT: 13356 return mips_expand_builtin_direct (d->icode, target, exp, true); 13357 13358 case MIPS_BUILTIN_DIRECT_NO_TARGET: 13359 return mips_expand_builtin_direct (d->icode, target, exp, false); 13360 13361 case MIPS_BUILTIN_MOVT: 13362 case MIPS_BUILTIN_MOVF: 13363 return mips_expand_builtin_movtf (d->builtin_type, d->icode, 13364 d->cond, target, exp); 13365 13366 case MIPS_BUILTIN_CMP_ANY: 13367 case MIPS_BUILTIN_CMP_ALL: 13368 case MIPS_BUILTIN_CMP_UPPER: 13369 case MIPS_BUILTIN_CMP_LOWER: 13370 case MIPS_BUILTIN_CMP_SINGLE: 13371 return mips_expand_builtin_compare (d->builtin_type, d->icode, 13372 d->cond, target, exp); 13373 13374 case MIPS_BUILTIN_BPOSGE32: 13375 return mips_expand_builtin_bposge (d->builtin_type, target); 13376 } 13377 gcc_unreachable (); 13378 } 13379 13380 /* An entry in the MIPS16 constant pool. VALUE is the pool constant, 13381 MODE is its mode, and LABEL is the CODE_LABEL associated with it. */ 13382 struct mips16_constant { 13383 struct mips16_constant *next; 13384 rtx value; 13385 rtx label; 13386 enum machine_mode mode; 13387 }; 13388 13389 /* Information about an incomplete MIPS16 constant pool. FIRST is the 13390 first constant, HIGHEST_ADDRESS is the highest address that the first 13391 byte of the pool can have, and INSN_ADDRESS is the current instruction 13392 address. */ 13393 struct mips16_constant_pool { 13394 struct mips16_constant *first; 13395 int highest_address; 13396 int insn_address; 13397 }; 13398 13399 /* Add constant VALUE to POOL and return its label. MODE is the 13400 value's mode (used for CONST_INTs, etc.). */ 13401 13402 static rtx 13403 mips16_add_constant (struct mips16_constant_pool *pool, 13404 rtx value, enum machine_mode mode) 13405 { 13406 struct mips16_constant **p, *c; 13407 bool first_of_size_p; 13408 13409 /* See whether the constant is already in the pool. If so, return the 13410 existing label, otherwise leave P pointing to the place where the 13411 constant should be added. 13412 13413 Keep the pool sorted in increasing order of mode size so that we can 13414 reduce the number of alignments needed. */ 13415 first_of_size_p = true; 13416 for (p = &pool->first; *p != 0; p = &(*p)->next) 13417 { 13418 if (mode == (*p)->mode && rtx_equal_p (value, (*p)->value)) 13419 return (*p)->label; 13420 if (GET_MODE_SIZE (mode) < GET_MODE_SIZE ((*p)->mode)) 13421 break; 13422 if (GET_MODE_SIZE (mode) == GET_MODE_SIZE ((*p)->mode)) 13423 first_of_size_p = false; 13424 } 13425 13426 /* In the worst case, the constant needed by the earliest instruction 13427 will end up at the end of the pool. The entire pool must then be 13428 accessible from that instruction. 13429 13430 When adding the first constant, set the pool's highest address to 13431 the address of the first out-of-range byte. Adjust this address 13432 downwards each time a new constant is added. */ 13433 if (pool->first == 0) 13434 /* For LWPC, ADDIUPC and DADDIUPC, the base PC value is the address 13435 of the instruction with the lowest two bits clear. The base PC 13436 value for LDPC has the lowest three bits clear. Assume the worst 13437 case here; namely that the PC-relative instruction occupies the 13438 last 2 bytes in an aligned word. */ 13439 pool->highest_address = pool->insn_address - (UNITS_PER_WORD - 2) + 0x8000; 13440 pool->highest_address -= GET_MODE_SIZE (mode); 13441 if (first_of_size_p) 13442 /* Take into account the worst possible padding due to alignment. */ 13443 pool->highest_address -= GET_MODE_SIZE (mode) - 1; 13444 13445 /* Create a new entry. */ 13446 c = XNEW (struct mips16_constant); 13447 c->value = value; 13448 c->mode = mode; 13449 c->label = gen_label_rtx (); 13450 c->next = *p; 13451 *p = c; 13452 13453 return c->label; 13454 } 13455 13456 /* Output constant VALUE after instruction INSN and return the last 13457 instruction emitted. MODE is the mode of the constant. */ 13458 13459 static rtx 13460 mips16_emit_constants_1 (enum machine_mode mode, rtx value, rtx insn) 13461 { 13462 if (SCALAR_INT_MODE_P (mode) || ALL_SCALAR_FIXED_POINT_MODE_P (mode)) 13463 { 13464 rtx size = GEN_INT (GET_MODE_SIZE (mode)); 13465 return emit_insn_after (gen_consttable_int (value, size), insn); 13466 } 13467 13468 if (SCALAR_FLOAT_MODE_P (mode)) 13469 return emit_insn_after (gen_consttable_float (value), insn); 13470 13471 if (VECTOR_MODE_P (mode)) 13472 { 13473 int i; 13474 13475 for (i = 0; i < CONST_VECTOR_NUNITS (value); i++) 13476 insn = mips16_emit_constants_1 (GET_MODE_INNER (mode), 13477 CONST_VECTOR_ELT (value, i), insn); 13478 return insn; 13479 } 13480 13481 gcc_unreachable (); 13482 } 13483 13484 /* Dump out the constants in CONSTANTS after INSN. */ 13485 13486 static void 13487 mips16_emit_constants (struct mips16_constant *constants, rtx insn) 13488 { 13489 struct mips16_constant *c, *next; 13490 int align; 13491 13492 align = 0; 13493 for (c = constants; c != NULL; c = next) 13494 { 13495 /* If necessary, increase the alignment of PC. */ 13496 if (align < GET_MODE_SIZE (c->mode)) 13497 { 13498 int align_log = floor_log2 (GET_MODE_SIZE (c->mode)); 13499 insn = emit_insn_after (gen_align (GEN_INT (align_log)), insn); 13500 } 13501 align = GET_MODE_SIZE (c->mode); 13502 13503 insn = emit_label_after (c->label, insn); 13504 insn = mips16_emit_constants_1 (c->mode, c->value, insn); 13505 13506 next = c->next; 13507 free (c); 13508 } 13509 13510 emit_barrier_after (insn); 13511 } 13512 13513 /* Return the length of instruction INSN. */ 13514 13515 static int 13516 mips16_insn_length (rtx insn) 13517 { 13518 if (JUMP_P (insn)) 13519 { 13520 rtx body = PATTERN (insn); 13521 if (GET_CODE (body) == ADDR_VEC) 13522 return GET_MODE_SIZE (GET_MODE (body)) * XVECLEN (body, 0); 13523 if (GET_CODE (body) == ADDR_DIFF_VEC) 13524 return GET_MODE_SIZE (GET_MODE (body)) * XVECLEN (body, 1); 13525 } 13526 return get_attr_length (insn); 13527 } 13528 13529 /* If *X is a symbolic constant that refers to the constant pool, add 13530 the constant to POOL and rewrite *X to use the constant's label. */ 13531 13532 static void 13533 mips16_rewrite_pool_constant (struct mips16_constant_pool *pool, rtx *x) 13534 { 13535 rtx base, offset, label; 13536 13537 split_const (*x, &base, &offset); 13538 if (GET_CODE (base) == SYMBOL_REF && CONSTANT_POOL_ADDRESS_P (base)) 13539 { 13540 label = mips16_add_constant (pool, get_pool_constant (base), 13541 get_pool_mode (base)); 13542 base = gen_rtx_LABEL_REF (Pmode, label); 13543 *x = mips_unspec_address_offset (base, offset, SYMBOL_PC_RELATIVE); 13544 } 13545 } 13546 13547 /* This structure is used to communicate with mips16_rewrite_pool_refs. 13548 INSN is the instruction we're rewriting and POOL points to the current 13549 constant pool. */ 13550 struct mips16_rewrite_pool_refs_info { 13551 rtx insn; 13552 struct mips16_constant_pool *pool; 13553 }; 13554 13555 /* Rewrite *X so that constant pool references refer to the constant's 13556 label instead. DATA points to a mips16_rewrite_pool_refs_info 13557 structure. */ 13558 13559 static int 13560 mips16_rewrite_pool_refs (rtx *x, void *data) 13561 { 13562 struct mips16_rewrite_pool_refs_info *info = 13563 (struct mips16_rewrite_pool_refs_info *) data; 13564 13565 if (force_to_mem_operand (*x, Pmode)) 13566 { 13567 rtx mem = force_const_mem (GET_MODE (*x), *x); 13568 validate_change (info->insn, x, mem, false); 13569 } 13570 13571 if (MEM_P (*x)) 13572 { 13573 mips16_rewrite_pool_constant (info->pool, &XEXP (*x, 0)); 13574 return -1; 13575 } 13576 13577 if (TARGET_MIPS16_TEXT_LOADS) 13578 mips16_rewrite_pool_constant (info->pool, x); 13579 13580 return GET_CODE (*x) == CONST ? -1 : 0; 13581 } 13582 13583 /* Return whether CFG is used in mips_reorg. */ 13584 13585 static bool 13586 mips_cfg_in_reorg (void) 13587 { 13588 return (mips_r10k_cache_barrier != R10K_CACHE_BARRIER_NONE 13589 || TARGET_RELAX_PIC_CALLS); 13590 } 13591 13592 /* Build MIPS16 constant pools. */ 13593 13594 static void 13595 mips16_lay_out_constants (void) 13596 { 13597 struct mips16_constant_pool pool; 13598 struct mips16_rewrite_pool_refs_info info; 13599 rtx insn, barrier; 13600 13601 if (!TARGET_MIPS16_PCREL_LOADS) 13602 return; 13603 13604 if (mips_cfg_in_reorg ()) 13605 split_all_insns (); 13606 else 13607 split_all_insns_noflow (); 13608 barrier = 0; 13609 memset (&pool, 0, sizeof (pool)); 13610 for (insn = get_insns (); insn; insn = NEXT_INSN (insn)) 13611 { 13612 /* Rewrite constant pool references in INSN. */ 13613 if (USEFUL_INSN_P (insn)) 13614 { 13615 info.insn = insn; 13616 info.pool = &pool; 13617 for_each_rtx (&PATTERN (insn), mips16_rewrite_pool_refs, &info); 13618 } 13619 13620 pool.insn_address += mips16_insn_length (insn); 13621 13622 if (pool.first != NULL) 13623 { 13624 /* If there are no natural barriers between the first user of 13625 the pool and the highest acceptable address, we'll need to 13626 create a new instruction to jump around the constant pool. 13627 In the worst case, this instruction will be 4 bytes long. 13628 13629 If it's too late to do this transformation after INSN, 13630 do it immediately before INSN. */ 13631 if (barrier == 0 && pool.insn_address + 4 > pool.highest_address) 13632 { 13633 rtx label, jump; 13634 13635 label = gen_label_rtx (); 13636 13637 jump = emit_jump_insn_before (gen_jump (label), insn); 13638 JUMP_LABEL (jump) = label; 13639 LABEL_NUSES (label) = 1; 13640 barrier = emit_barrier_after (jump); 13641 13642 emit_label_after (label, barrier); 13643 pool.insn_address += 4; 13644 } 13645 13646 /* See whether the constant pool is now out of range of the first 13647 user. If so, output the constants after the previous barrier. 13648 Note that any instructions between BARRIER and INSN (inclusive) 13649 will use negative offsets to refer to the pool. */ 13650 if (pool.insn_address > pool.highest_address) 13651 { 13652 mips16_emit_constants (pool.first, barrier); 13653 pool.first = NULL; 13654 barrier = 0; 13655 } 13656 else if (BARRIER_P (insn)) 13657 barrier = insn; 13658 } 13659 } 13660 mips16_emit_constants (pool.first, get_last_insn ()); 13661 } 13662 13663 /* Return true if it is worth r10k_simplify_address's while replacing 13664 an address with X. We are looking for constants, and for addresses 13665 at a known offset from the incoming stack pointer. */ 13666 13667 static bool 13668 r10k_simplified_address_p (rtx x) 13669 { 13670 if (GET_CODE (x) == PLUS && CONST_INT_P (XEXP (x, 1))) 13671 x = XEXP (x, 0); 13672 return x == virtual_incoming_args_rtx || CONSTANT_P (x); 13673 } 13674 13675 /* X is an expression that appears in INSN. Try to use the UD chains 13676 to simplify it, returning the simplified form on success and the 13677 original form otherwise. Replace the incoming value of $sp with 13678 virtual_incoming_args_rtx (which should never occur in X otherwise). */ 13679 13680 static rtx 13681 r10k_simplify_address (rtx x, rtx insn) 13682 { 13683 rtx newx, op0, op1, set, def_insn, note; 13684 df_ref use, def; 13685 struct df_link *defs; 13686 13687 newx = NULL_RTX; 13688 if (UNARY_P (x)) 13689 { 13690 op0 = r10k_simplify_address (XEXP (x, 0), insn); 13691 if (op0 != XEXP (x, 0)) 13692 newx = simplify_gen_unary (GET_CODE (x), GET_MODE (x), 13693 op0, GET_MODE (XEXP (x, 0))); 13694 } 13695 else if (BINARY_P (x)) 13696 { 13697 op0 = r10k_simplify_address (XEXP (x, 0), insn); 13698 op1 = r10k_simplify_address (XEXP (x, 1), insn); 13699 if (op0 != XEXP (x, 0) || op1 != XEXP (x, 1)) 13700 newx = simplify_gen_binary (GET_CODE (x), GET_MODE (x), op0, op1); 13701 } 13702 else if (GET_CODE (x) == LO_SUM) 13703 { 13704 /* LO_SUMs can be offset from HIGHs, if we know they won't 13705 overflow. See mips_classify_address for the rationale behind 13706 the lax check. */ 13707 op0 = r10k_simplify_address (XEXP (x, 0), insn); 13708 if (GET_CODE (op0) == HIGH) 13709 newx = XEXP (x, 1); 13710 } 13711 else if (REG_P (x)) 13712 { 13713 /* Uses are recorded by regno_reg_rtx, not X itself. */ 13714 use = df_find_use (insn, regno_reg_rtx[REGNO (x)]); 13715 gcc_assert (use); 13716 defs = DF_REF_CHAIN (use); 13717 13718 /* Require a single definition. */ 13719 if (defs && defs->next == NULL) 13720 { 13721 def = defs->ref; 13722 if (DF_REF_IS_ARTIFICIAL (def)) 13723 { 13724 /* Replace the incoming value of $sp with 13725 virtual_incoming_args_rtx. */ 13726 if (x == stack_pointer_rtx 13727 && DF_REF_BB (def) == ENTRY_BLOCK_PTR) 13728 newx = virtual_incoming_args_rtx; 13729 } 13730 else if (dominated_by_p (CDI_DOMINATORS, DF_REF_BB (use), 13731 DF_REF_BB (def))) 13732 { 13733 /* Make sure that DEF_INSN is a single set of REG. */ 13734 def_insn = DF_REF_INSN (def); 13735 if (NONJUMP_INSN_P (def_insn)) 13736 { 13737 set = single_set (def_insn); 13738 if (set && rtx_equal_p (SET_DEST (set), x)) 13739 { 13740 /* Prefer to use notes, since the def-use chains 13741 are often shorter. */ 13742 note = find_reg_equal_equiv_note (def_insn); 13743 if (note) 13744 newx = XEXP (note, 0); 13745 else 13746 newx = SET_SRC (set); 13747 newx = r10k_simplify_address (newx, def_insn); 13748 } 13749 } 13750 } 13751 } 13752 } 13753 if (newx && r10k_simplified_address_p (newx)) 13754 return newx; 13755 return x; 13756 } 13757 13758 /* Return true if ADDRESS is known to be an uncached address 13759 on R10K systems. */ 13760 13761 static bool 13762 r10k_uncached_address_p (unsigned HOST_WIDE_INT address) 13763 { 13764 unsigned HOST_WIDE_INT upper; 13765 13766 /* Check for KSEG1. */ 13767 if (address + 0x60000000 < 0x20000000) 13768 return true; 13769 13770 /* Check for uncached XKPHYS addresses. */ 13771 if (Pmode == DImode) 13772 { 13773 upper = (address >> 40) & 0xf9ffff; 13774 if (upper == 0x900000 || upper == 0xb80000) 13775 return true; 13776 } 13777 return false; 13778 } 13779 13780 /* Return true if we can prove that an access to address X in instruction 13781 INSN would be safe from R10K speculation. This X is a general 13782 expression; it might not be a legitimate address. */ 13783 13784 static bool 13785 r10k_safe_address_p (rtx x, rtx insn) 13786 { 13787 rtx base, offset; 13788 HOST_WIDE_INT offset_val; 13789 13790 x = r10k_simplify_address (x, insn); 13791 13792 /* Check for references to the stack frame. It doesn't really matter 13793 how much of the frame has been allocated at INSN; -mr10k-cache-barrier 13794 allows us to assume that accesses to any part of the eventual frame 13795 is safe from speculation at any point in the function. */ 13796 mips_split_plus (x, &base, &offset_val); 13797 if (base == virtual_incoming_args_rtx 13798 && offset_val >= -cfun->machine->frame.total_size 13799 && offset_val < cfun->machine->frame.args_size) 13800 return true; 13801 13802 /* Check for uncached addresses. */ 13803 if (CONST_INT_P (x)) 13804 return r10k_uncached_address_p (INTVAL (x)); 13805 13806 /* Check for accesses to a static object. */ 13807 split_const (x, &base, &offset); 13808 return offset_within_block_p (base, INTVAL (offset)); 13809 } 13810 13811 /* Return true if a MEM with MEM_EXPR EXPR and MEM_OFFSET OFFSET is 13812 an in-range access to an automatic variable, or to an object with 13813 a link-time-constant address. */ 13814 13815 static bool 13816 r10k_safe_mem_expr_p (tree expr, rtx offset) 13817 { 13818 if (expr == NULL_TREE 13819 || offset == NULL_RTX 13820 || !CONST_INT_P (offset) 13821 || INTVAL (offset) < 0 13822 || INTVAL (offset) >= int_size_in_bytes (TREE_TYPE (expr))) 13823 return false; 13824 13825 while (TREE_CODE (expr) == COMPONENT_REF) 13826 { 13827 expr = TREE_OPERAND (expr, 0); 13828 if (expr == NULL_TREE) 13829 return false; 13830 } 13831 13832 return DECL_P (expr); 13833 } 13834 13835 /* A for_each_rtx callback for which DATA points to the instruction 13836 containing *X. Stop the search if we find a MEM that is not safe 13837 from R10K speculation. */ 13838 13839 static int 13840 r10k_needs_protection_p_1 (rtx *loc, void *data) 13841 { 13842 rtx mem; 13843 13844 mem = *loc; 13845 if (!MEM_P (mem)) 13846 return 0; 13847 13848 if (r10k_safe_mem_expr_p (MEM_EXPR (mem), MEM_OFFSET (mem))) 13849 return -1; 13850 13851 if (r10k_safe_address_p (XEXP (mem, 0), (rtx) data)) 13852 return -1; 13853 13854 return 1; 13855 } 13856 13857 /* A note_stores callback for which DATA points to an instruction pointer. 13858 If *DATA is nonnull, make it null if it X contains a MEM that is not 13859 safe from R10K speculation. */ 13860 13861 static void 13862 r10k_needs_protection_p_store (rtx x, const_rtx pat ATTRIBUTE_UNUSED, 13863 void *data) 13864 { 13865 rtx *insn_ptr; 13866 13867 insn_ptr = (rtx *) data; 13868 if (*insn_ptr && for_each_rtx (&x, r10k_needs_protection_p_1, *insn_ptr)) 13869 *insn_ptr = NULL_RTX; 13870 } 13871 13872 /* A for_each_rtx callback that iterates over the pattern of a CALL_INSN. 13873 Return nonzero if the call is not to a declared function. */ 13874 13875 static int 13876 r10k_needs_protection_p_call (rtx *loc, void *data ATTRIBUTE_UNUSED) 13877 { 13878 rtx x; 13879 13880 x = *loc; 13881 if (!MEM_P (x)) 13882 return 0; 13883 13884 x = XEXP (x, 0); 13885 if (GET_CODE (x) == SYMBOL_REF && SYMBOL_REF_DECL (x)) 13886 return -1; 13887 13888 return 1; 13889 } 13890 13891 /* Return true if instruction INSN needs to be protected by an R10K 13892 cache barrier. */ 13893 13894 static bool 13895 r10k_needs_protection_p (rtx insn) 13896 { 13897 if (CALL_P (insn)) 13898 return for_each_rtx (&PATTERN (insn), r10k_needs_protection_p_call, NULL); 13899 13900 if (mips_r10k_cache_barrier == R10K_CACHE_BARRIER_STORE) 13901 { 13902 note_stores (PATTERN (insn), r10k_needs_protection_p_store, &insn); 13903 return insn == NULL_RTX; 13904 } 13905 13906 return for_each_rtx (&PATTERN (insn), r10k_needs_protection_p_1, insn); 13907 } 13908 13909 /* Return true if BB is only reached by blocks in PROTECTED_BBS and if every 13910 edge is unconditional. */ 13911 13912 static bool 13913 r10k_protected_bb_p (basic_block bb, sbitmap protected_bbs) 13914 { 13915 edge_iterator ei; 13916 edge e; 13917 13918 FOR_EACH_EDGE (e, ei, bb->preds) 13919 if (!single_succ_p (e->src) 13920 || !TEST_BIT (protected_bbs, e->src->index) 13921 || (e->flags & EDGE_COMPLEX) != 0) 13922 return false; 13923 return true; 13924 } 13925 13926 /* Implement -mr10k-cache-barrier= for the current function. */ 13927 13928 static void 13929 r10k_insert_cache_barriers (void) 13930 { 13931 int *rev_post_order; 13932 unsigned int i, n; 13933 basic_block bb; 13934 sbitmap protected_bbs; 13935 rtx insn, end, unprotected_region; 13936 13937 if (TARGET_MIPS16) 13938 { 13939 sorry ("%qs does not support MIPS16 code", "-mr10k-cache-barrier"); 13940 return; 13941 } 13942 13943 /* Calculate dominators. */ 13944 calculate_dominance_info (CDI_DOMINATORS); 13945 13946 /* Bit X of PROTECTED_BBS is set if the last operation in basic block 13947 X is protected by a cache barrier. */ 13948 protected_bbs = sbitmap_alloc (last_basic_block); 13949 sbitmap_zero (protected_bbs); 13950 13951 /* Iterate over the basic blocks in reverse post-order. */ 13952 rev_post_order = XNEWVEC (int, last_basic_block); 13953 n = pre_and_rev_post_order_compute (NULL, rev_post_order, false); 13954 for (i = 0; i < n; i++) 13955 { 13956 bb = BASIC_BLOCK (rev_post_order[i]); 13957 13958 /* If this block is only reached by unconditional edges, and if the 13959 source of every edge is protected, the beginning of the block is 13960 also protected. */ 13961 if (r10k_protected_bb_p (bb, protected_bbs)) 13962 unprotected_region = NULL_RTX; 13963 else 13964 unprotected_region = pc_rtx; 13965 end = NEXT_INSN (BB_END (bb)); 13966 13967 /* UNPROTECTED_REGION is: 13968 13969 - null if we are processing a protected region, 13970 - pc_rtx if we are processing an unprotected region but have 13971 not yet found the first instruction in it 13972 - the first instruction in an unprotected region otherwise. */ 13973 for (insn = BB_HEAD (bb); insn != end; insn = NEXT_INSN (insn)) 13974 { 13975 if (unprotected_region && USEFUL_INSN_P (insn)) 13976 { 13977 if (recog_memoized (insn) == CODE_FOR_mips_cache) 13978 /* This CACHE instruction protects the following code. */ 13979 unprotected_region = NULL_RTX; 13980 else 13981 { 13982 /* See if INSN is the first instruction in this 13983 unprotected region. */ 13984 if (unprotected_region == pc_rtx) 13985 unprotected_region = insn; 13986 13987 /* See if INSN needs to be protected. If so, 13988 we must insert a cache barrier somewhere between 13989 PREV_INSN (UNPROTECTED_REGION) and INSN. It isn't 13990 clear which position is better performance-wise, 13991 but as a tie-breaker, we assume that it is better 13992 to allow delay slots to be back-filled where 13993 possible, and that it is better not to insert 13994 barriers in the middle of already-scheduled code. 13995 We therefore insert the barrier at the beginning 13996 of the region. */ 13997 if (r10k_needs_protection_p (insn)) 13998 { 13999 emit_insn_before (gen_r10k_cache_barrier (), 14000 unprotected_region); 14001 unprotected_region = NULL_RTX; 14002 } 14003 } 14004 } 14005 14006 if (CALL_P (insn)) 14007 /* The called function is not required to protect the exit path. 14008 The code that follows a call is therefore unprotected. */ 14009 unprotected_region = pc_rtx; 14010 } 14011 14012 /* Record whether the end of this block is protected. */ 14013 if (unprotected_region == NULL_RTX) 14014 SET_BIT (protected_bbs, bb->index); 14015 } 14016 XDELETEVEC (rev_post_order); 14017 14018 sbitmap_free (protected_bbs); 14019 14020 free_dominance_info (CDI_DOMINATORS); 14021 } 14022 14023 /* If INSN is a call, return the underlying CALL expr. Return NULL_RTX 14024 otherwise. If INSN has two call rtx, then store the second one in 14025 SECOND_CALL. */ 14026 14027 static rtx 14028 mips_call_expr_from_insn (rtx insn, rtx *second_call) 14029 { 14030 rtx x; 14031 rtx x2; 14032 14033 if (!CALL_P (insn)) 14034 return NULL_RTX; 14035 14036 x = PATTERN (insn); 14037 if (GET_CODE (x) == PARALLEL) 14038 { 14039 /* Calls returning complex values have two CALL rtx. Look for the second 14040 one here, and return it via the SECOND_CALL arg. */ 14041 x2 = XVECEXP (x, 0, 1); 14042 if (GET_CODE (x2) == SET) 14043 x2 = XEXP (x2, 1); 14044 if (GET_CODE (x2) == CALL) 14045 *second_call = x2; 14046 14047 x = XVECEXP (x, 0, 0); 14048 } 14049 if (GET_CODE (x) == SET) 14050 x = XEXP (x, 1); 14051 gcc_assert (GET_CODE (x) == CALL); 14052 14053 return x; 14054 } 14055 14056 /* REG is set in DEF. See if the definition is one of the ways we load a 14057 register with a symbol address for a mips_use_pic_fn_addr_reg_p call. 14058 If it is, return the symbol reference of the function, otherwise return 14059 NULL_RTX. 14060 14061 If RECURSE_P is true, use mips_find_pic_call_symbol to interpret 14062 the values of source registers, otherwise treat such registers as 14063 having an unknown value. */ 14064 14065 static rtx 14066 mips_pic_call_symbol_from_set (df_ref def, rtx reg, bool recurse_p) 14067 { 14068 rtx def_insn, set; 14069 14070 if (DF_REF_IS_ARTIFICIAL (def)) 14071 return NULL_RTX; 14072 14073 def_insn = DF_REF_INSN (def); 14074 set = single_set (def_insn); 14075 if (set && rtx_equal_p (SET_DEST (set), reg)) 14076 { 14077 rtx note, src, symbol; 14078 14079 /* First, look at REG_EQUAL/EQUIV notes. */ 14080 note = find_reg_equal_equiv_note (def_insn); 14081 if (note && GET_CODE (XEXP (note, 0)) == SYMBOL_REF) 14082 return XEXP (note, 0); 14083 14084 /* For %call16 references we don't have REG_EQUAL. */ 14085 src = SET_SRC (set); 14086 symbol = mips_strip_unspec_call (src); 14087 if (symbol) 14088 { 14089 gcc_assert (GET_CODE (symbol) == SYMBOL_REF); 14090 return symbol; 14091 } 14092 14093 /* Follow at most one simple register copy. Such copies are 14094 interesting in cases like: 14095 14096 for (...) 14097 { 14098 locally_binding_fn (...); 14099 } 14100 14101 and: 14102 14103 locally_binding_fn (...); 14104 ... 14105 locally_binding_fn (...); 14106 14107 where the load of locally_binding_fn can legitimately be 14108 hoisted or shared. However, we do not expect to see complex 14109 chains of copies, so a full worklist solution to the problem 14110 would probably be overkill. */ 14111 if (recurse_p && REG_P (src)) 14112 return mips_find_pic_call_symbol (def_insn, src, false); 14113 } 14114 14115 return NULL_RTX; 14116 } 14117 14118 /* Find the definition of the use of REG in INSN. See if the definition 14119 is one of the ways we load a register with a symbol address for a 14120 mips_use_pic_fn_addr_reg_p call. If it is return the symbol reference 14121 of the function, otherwise return NULL_RTX. RECURSE_P is as for 14122 mips_pic_call_symbol_from_set. */ 14123 14124 static rtx 14125 mips_find_pic_call_symbol (rtx insn, rtx reg, bool recurse_p) 14126 { 14127 df_ref use; 14128 struct df_link *defs; 14129 rtx symbol; 14130 14131 use = df_find_use (insn, regno_reg_rtx[REGNO (reg)]); 14132 if (!use) 14133 return NULL_RTX; 14134 defs = DF_REF_CHAIN (use); 14135 if (!defs) 14136 return NULL_RTX; 14137 symbol = mips_pic_call_symbol_from_set (defs->ref, reg, recurse_p); 14138 if (!symbol) 14139 return NULL_RTX; 14140 14141 /* If we have more than one definition, they need to be identical. */ 14142 for (defs = defs->next; defs; defs = defs->next) 14143 { 14144 rtx other; 14145 14146 other = mips_pic_call_symbol_from_set (defs->ref, reg, recurse_p); 14147 if (!rtx_equal_p (symbol, other)) 14148 return NULL_RTX; 14149 } 14150 14151 return symbol; 14152 } 14153 14154 /* Replace the args_size operand of the call expression CALL with the 14155 call-attribute UNSPEC and fill in SYMBOL as the function symbol. */ 14156 14157 static void 14158 mips_annotate_pic_call_expr (rtx call, rtx symbol) 14159 { 14160 rtx args_size; 14161 14162 args_size = XEXP (call, 1); 14163 XEXP (call, 1) = gen_rtx_UNSPEC (GET_MODE (args_size), 14164 gen_rtvec (2, args_size, symbol), 14165 UNSPEC_CALL_ATTR); 14166 } 14167 14168 /* OPERANDS[ARGS_SIZE_OPNO] is the arg_size operand of a CALL expression. See 14169 if instead of the arg_size argument it contains the call attributes. If 14170 yes return true along with setting OPERANDS[ARGS_SIZE_OPNO] to the function 14171 symbol from the call attributes. Also return false if ARGS_SIZE_OPNO is 14172 -1. */ 14173 14174 bool 14175 mips_get_pic_call_symbol (rtx *operands, int args_size_opno) 14176 { 14177 rtx args_size, symbol; 14178 14179 if (!TARGET_RELAX_PIC_CALLS || args_size_opno == -1) 14180 return false; 14181 14182 args_size = operands[args_size_opno]; 14183 if (GET_CODE (args_size) != UNSPEC) 14184 return false; 14185 gcc_assert (XINT (args_size, 1) == UNSPEC_CALL_ATTR); 14186 14187 symbol = XVECEXP (args_size, 0, 1); 14188 gcc_assert (GET_CODE (symbol) == SYMBOL_REF); 14189 14190 operands[args_size_opno] = symbol; 14191 return true; 14192 } 14193 14194 /* Use DF to annotate PIC indirect calls with the function symbol they 14195 dispatch to. */ 14196 14197 static void 14198 mips_annotate_pic_calls (void) 14199 { 14200 basic_block bb; 14201 rtx insn; 14202 14203 FOR_EACH_BB (bb) 14204 FOR_BB_INSNS (bb, insn) 14205 { 14206 rtx call, reg, symbol, second_call; 14207 14208 second_call = 0; 14209 call = mips_call_expr_from_insn (insn, &second_call); 14210 if (!call) 14211 continue; 14212 gcc_assert (MEM_P (XEXP (call, 0))); 14213 reg = XEXP (XEXP (call, 0), 0); 14214 if (!REG_P (reg)) 14215 continue; 14216 14217 symbol = mips_find_pic_call_symbol (insn, reg, true); 14218 if (symbol) 14219 { 14220 mips_annotate_pic_call_expr (call, symbol); 14221 if (second_call) 14222 mips_annotate_pic_call_expr (second_call, symbol); 14223 } 14224 } 14225 } 14226 14227 /* A temporary variable used by for_each_rtx callbacks, etc. */ 14228 static rtx mips_sim_insn; 14229 14230 /* A structure representing the state of the processor pipeline. 14231 Used by the mips_sim_* family of functions. */ 14232 struct mips_sim { 14233 /* The maximum number of instructions that can be issued in a cycle. 14234 (Caches mips_issue_rate.) */ 14235 unsigned int issue_rate; 14236 14237 /* The current simulation time. */ 14238 unsigned int time; 14239 14240 /* How many more instructions can be issued in the current cycle. */ 14241 unsigned int insns_left; 14242 14243 /* LAST_SET[X].INSN is the last instruction to set register X. 14244 LAST_SET[X].TIME is the time at which that instruction was issued. 14245 INSN is null if no instruction has yet set register X. */ 14246 struct { 14247 rtx insn; 14248 unsigned int time; 14249 } last_set[FIRST_PSEUDO_REGISTER]; 14250 14251 /* The pipeline's current DFA state. */ 14252 state_t dfa_state; 14253 }; 14254 14255 /* Reset STATE to the initial simulation state. */ 14256 14257 static void 14258 mips_sim_reset (struct mips_sim *state) 14259 { 14260 state->time = 0; 14261 state->insns_left = state->issue_rate; 14262 memset (&state->last_set, 0, sizeof (state->last_set)); 14263 state_reset (state->dfa_state); 14264 } 14265 14266 /* Initialize STATE before its first use. DFA_STATE points to an 14267 allocated but uninitialized DFA state. */ 14268 14269 static void 14270 mips_sim_init (struct mips_sim *state, state_t dfa_state) 14271 { 14272 state->issue_rate = mips_issue_rate (); 14273 state->dfa_state = dfa_state; 14274 mips_sim_reset (state); 14275 } 14276 14277 /* Advance STATE by one clock cycle. */ 14278 14279 static void 14280 mips_sim_next_cycle (struct mips_sim *state) 14281 { 14282 state->time++; 14283 state->insns_left = state->issue_rate; 14284 state_transition (state->dfa_state, 0); 14285 } 14286 14287 /* Advance simulation state STATE until instruction INSN can read 14288 register REG. */ 14289 14290 static void 14291 mips_sim_wait_reg (struct mips_sim *state, rtx insn, rtx reg) 14292 { 14293 unsigned int regno, end_regno; 14294 14295 end_regno = END_REGNO (reg); 14296 for (regno = REGNO (reg); regno < end_regno; regno++) 14297 if (state->last_set[regno].insn != 0) 14298 { 14299 unsigned int t; 14300 14301 t = (state->last_set[regno].time 14302 + insn_latency (state->last_set[regno].insn, insn)); 14303 while (state->time < t) 14304 mips_sim_next_cycle (state); 14305 } 14306 } 14307 14308 /* A for_each_rtx callback. If *X is a register, advance simulation state 14309 DATA until mips_sim_insn can read the register's value. */ 14310 14311 static int 14312 mips_sim_wait_regs_2 (rtx *x, void *data) 14313 { 14314 if (REG_P (*x)) 14315 mips_sim_wait_reg ((struct mips_sim *) data, mips_sim_insn, *x); 14316 return 0; 14317 } 14318 14319 /* Call mips_sim_wait_regs_2 (R, DATA) for each register R mentioned in *X. */ 14320 14321 static void 14322 mips_sim_wait_regs_1 (rtx *x, void *data) 14323 { 14324 for_each_rtx (x, mips_sim_wait_regs_2, data); 14325 } 14326 14327 /* Advance simulation state STATE until all of INSN's register 14328 dependencies are satisfied. */ 14329 14330 static void 14331 mips_sim_wait_regs (struct mips_sim *state, rtx insn) 14332 { 14333 mips_sim_insn = insn; 14334 note_uses (&PATTERN (insn), mips_sim_wait_regs_1, state); 14335 } 14336 14337 /* Advance simulation state STATE until the units required by 14338 instruction INSN are available. */ 14339 14340 static void 14341 mips_sim_wait_units (struct mips_sim *state, rtx insn) 14342 { 14343 state_t tmp_state; 14344 14345 tmp_state = alloca (state_size ()); 14346 while (state->insns_left == 0 14347 || (memcpy (tmp_state, state->dfa_state, state_size ()), 14348 state_transition (tmp_state, insn) >= 0)) 14349 mips_sim_next_cycle (state); 14350 } 14351 14352 /* Advance simulation state STATE until INSN is ready to issue. */ 14353 14354 static void 14355 mips_sim_wait_insn (struct mips_sim *state, rtx insn) 14356 { 14357 mips_sim_wait_regs (state, insn); 14358 mips_sim_wait_units (state, insn); 14359 } 14360 14361 /* mips_sim_insn has just set X. Update the LAST_SET array 14362 in simulation state DATA. */ 14363 14364 static void 14365 mips_sim_record_set (rtx x, const_rtx pat ATTRIBUTE_UNUSED, void *data) 14366 { 14367 struct mips_sim *state; 14368 14369 state = (struct mips_sim *) data; 14370 if (REG_P (x)) 14371 { 14372 unsigned int regno, end_regno; 14373 14374 end_regno = END_REGNO (x); 14375 for (regno = REGNO (x); regno < end_regno; regno++) 14376 { 14377 state->last_set[regno].insn = mips_sim_insn; 14378 state->last_set[regno].time = state->time; 14379 } 14380 } 14381 } 14382 14383 /* Issue instruction INSN in scheduler state STATE. Assume that INSN 14384 can issue immediately (i.e., that mips_sim_wait_insn has already 14385 been called). */ 14386 14387 static void 14388 mips_sim_issue_insn (struct mips_sim *state, rtx insn) 14389 { 14390 state_transition (state->dfa_state, insn); 14391 state->insns_left--; 14392 14393 mips_sim_insn = insn; 14394 note_stores (PATTERN (insn), mips_sim_record_set, state); 14395 } 14396 14397 /* Simulate issuing a NOP in state STATE. */ 14398 14399 static void 14400 mips_sim_issue_nop (struct mips_sim *state) 14401 { 14402 if (state->insns_left == 0) 14403 mips_sim_next_cycle (state); 14404 state->insns_left--; 14405 } 14406 14407 /* Update simulation state STATE so that it's ready to accept the instruction 14408 after INSN. INSN should be part of the main rtl chain, not a member of a 14409 SEQUENCE. */ 14410 14411 static void 14412 mips_sim_finish_insn (struct mips_sim *state, rtx insn) 14413 { 14414 /* If INSN is a jump with an implicit delay slot, simulate a nop. */ 14415 if (JUMP_P (insn)) 14416 mips_sim_issue_nop (state); 14417 14418 switch (GET_CODE (SEQ_BEGIN (insn))) 14419 { 14420 case CODE_LABEL: 14421 case CALL_INSN: 14422 /* We can't predict the processor state after a call or label. */ 14423 mips_sim_reset (state); 14424 break; 14425 14426 case JUMP_INSN: 14427 /* The delay slots of branch likely instructions are only executed 14428 when the branch is taken. Therefore, if the caller has simulated 14429 the delay slot instruction, STATE does not really reflect the state 14430 of the pipeline for the instruction after the delay slot. Also, 14431 branch likely instructions tend to incur a penalty when not taken, 14432 so there will probably be an extra delay between the branch and 14433 the instruction after the delay slot. */ 14434 if (INSN_ANNULLED_BRANCH_P (SEQ_BEGIN (insn))) 14435 mips_sim_reset (state); 14436 break; 14437 14438 default: 14439 break; 14440 } 14441 } 14442 14443 /* The VR4130 pipeline issues aligned pairs of instructions together, 14444 but it stalls the second instruction if it depends on the first. 14445 In order to cut down the amount of logic required, this dependence 14446 check is not based on a full instruction decode. Instead, any non-SPECIAL 14447 instruction is assumed to modify the register specified by bits 20-16 14448 (which is usually the "rt" field). 14449 14450 In BEQ, BEQL, BNE and BNEL instructions, the rt field is actually an 14451 input, so we can end up with a false dependence between the branch 14452 and its delay slot. If this situation occurs in instruction INSN, 14453 try to avoid it by swapping rs and rt. */ 14454 14455 static void 14456 vr4130_avoid_branch_rt_conflict (rtx insn) 14457 { 14458 rtx first, second; 14459 14460 first = SEQ_BEGIN (insn); 14461 second = SEQ_END (insn); 14462 if (JUMP_P (first) 14463 && NONJUMP_INSN_P (second) 14464 && GET_CODE (PATTERN (first)) == SET 14465 && GET_CODE (SET_DEST (PATTERN (first))) == PC 14466 && GET_CODE (SET_SRC (PATTERN (first))) == IF_THEN_ELSE) 14467 { 14468 /* Check for the right kind of condition. */ 14469 rtx cond = XEXP (SET_SRC (PATTERN (first)), 0); 14470 if ((GET_CODE (cond) == EQ || GET_CODE (cond) == NE) 14471 && REG_P (XEXP (cond, 0)) 14472 && REG_P (XEXP (cond, 1)) 14473 && reg_referenced_p (XEXP (cond, 1), PATTERN (second)) 14474 && !reg_referenced_p (XEXP (cond, 0), PATTERN (second))) 14475 { 14476 /* SECOND mentions the rt register but not the rs register. */ 14477 rtx tmp = XEXP (cond, 0); 14478 XEXP (cond, 0) = XEXP (cond, 1); 14479 XEXP (cond, 1) = tmp; 14480 } 14481 } 14482 } 14483 14484 /* Implement -mvr4130-align. Go through each basic block and simulate the 14485 processor pipeline. If we find that a pair of instructions could execute 14486 in parallel, and the first of those instructions is not 8-byte aligned, 14487 insert a nop to make it aligned. */ 14488 14489 static void 14490 vr4130_align_insns (void) 14491 { 14492 struct mips_sim state; 14493 rtx insn, subinsn, last, last2, next; 14494 bool aligned_p; 14495 14496 dfa_start (); 14497 14498 /* LAST is the last instruction before INSN to have a nonzero length. 14499 LAST2 is the last such instruction before LAST. */ 14500 last = 0; 14501 last2 = 0; 14502 14503 /* ALIGNED_P is true if INSN is known to be at an aligned address. */ 14504 aligned_p = true; 14505 14506 mips_sim_init (&state, alloca (state_size ())); 14507 for (insn = get_insns (); insn != 0; insn = next) 14508 { 14509 unsigned int length; 14510 14511 next = NEXT_INSN (insn); 14512 14513 /* See the comment above vr4130_avoid_branch_rt_conflict for details. 14514 This isn't really related to the alignment pass, but we do it on 14515 the fly to avoid a separate instruction walk. */ 14516 vr4130_avoid_branch_rt_conflict (insn); 14517 14518 if (USEFUL_INSN_P (insn)) 14519 FOR_EACH_SUBINSN (subinsn, insn) 14520 { 14521 mips_sim_wait_insn (&state, subinsn); 14522 14523 /* If we want this instruction to issue in parallel with the 14524 previous one, make sure that the previous instruction is 14525 aligned. There are several reasons why this isn't worthwhile 14526 when the second instruction is a call: 14527 14528 - Calls are less likely to be performance critical, 14529 - There's a good chance that the delay slot can execute 14530 in parallel with the call. 14531 - The return address would then be unaligned. 14532 14533 In general, if we're going to insert a nop between instructions 14534 X and Y, it's better to insert it immediately after X. That 14535 way, if the nop makes Y aligned, it will also align any labels 14536 between X and Y. */ 14537 if (state.insns_left != state.issue_rate 14538 && !CALL_P (subinsn)) 14539 { 14540 if (subinsn == SEQ_BEGIN (insn) && aligned_p) 14541 { 14542 /* SUBINSN is the first instruction in INSN and INSN is 14543 aligned. We want to align the previous instruction 14544 instead, so insert a nop between LAST2 and LAST. 14545 14546 Note that LAST could be either a single instruction 14547 or a branch with a delay slot. In the latter case, 14548 LAST, like INSN, is already aligned, but the delay 14549 slot must have some extra delay that stops it from 14550 issuing at the same time as the branch. We therefore 14551 insert a nop before the branch in order to align its 14552 delay slot. */ 14553 emit_insn_after (gen_nop (), last2); 14554 aligned_p = false; 14555 } 14556 else if (subinsn != SEQ_BEGIN (insn) && !aligned_p) 14557 { 14558 /* SUBINSN is the delay slot of INSN, but INSN is 14559 currently unaligned. Insert a nop between 14560 LAST and INSN to align it. */ 14561 emit_insn_after (gen_nop (), last); 14562 aligned_p = true; 14563 } 14564 } 14565 mips_sim_issue_insn (&state, subinsn); 14566 } 14567 mips_sim_finish_insn (&state, insn); 14568 14569 /* Update LAST, LAST2 and ALIGNED_P for the next instruction. */ 14570 length = get_attr_length (insn); 14571 if (length > 0) 14572 { 14573 /* If the instruction is an asm statement or multi-instruction 14574 mips.md patern, the length is only an estimate. Insert an 14575 8 byte alignment after it so that the following instructions 14576 can be handled correctly. */ 14577 if (NONJUMP_INSN_P (SEQ_BEGIN (insn)) 14578 && (recog_memoized (insn) < 0 || length >= 8)) 14579 { 14580 next = emit_insn_after (gen_align (GEN_INT (3)), insn); 14581 next = NEXT_INSN (next); 14582 mips_sim_next_cycle (&state); 14583 aligned_p = true; 14584 } 14585 else if (length & 4) 14586 aligned_p = !aligned_p; 14587 last2 = last; 14588 last = insn; 14589 } 14590 14591 /* See whether INSN is an aligned label. */ 14592 if (LABEL_P (insn) && label_to_alignment (insn) >= 3) 14593 aligned_p = true; 14594 } 14595 dfa_finish (); 14596 } 14597 14598 /* This structure records that the current function has a LO_SUM 14599 involving SYMBOL_REF or LABEL_REF BASE and that MAX_OFFSET is 14600 the largest offset applied to BASE by all such LO_SUMs. */ 14601 struct mips_lo_sum_offset { 14602 rtx base; 14603 HOST_WIDE_INT offset; 14604 }; 14605 14606 /* Return a hash value for SYMBOL_REF or LABEL_REF BASE. */ 14607 14608 static hashval_t 14609 mips_hash_base (rtx base) 14610 { 14611 int do_not_record_p; 14612 14613 return hash_rtx (base, GET_MODE (base), &do_not_record_p, NULL, false); 14614 } 14615 14616 /* Hash-table callbacks for mips_lo_sum_offsets. */ 14617 14618 static hashval_t 14619 mips_lo_sum_offset_hash (const void *entry) 14620 { 14621 return mips_hash_base (((const struct mips_lo_sum_offset *) entry)->base); 14622 } 14623 14624 static int 14625 mips_lo_sum_offset_eq (const void *entry, const void *value) 14626 { 14627 return rtx_equal_p (((const struct mips_lo_sum_offset *) entry)->base, 14628 (const_rtx) value); 14629 } 14630 14631 /* Look up symbolic constant X in HTAB, which is a hash table of 14632 mips_lo_sum_offsets. If OPTION is NO_INSERT, return true if X can be 14633 paired with a recorded LO_SUM, otherwise record X in the table. */ 14634 14635 static bool 14636 mips_lo_sum_offset_lookup (htab_t htab, rtx x, enum insert_option option) 14637 { 14638 rtx base, offset; 14639 void **slot; 14640 struct mips_lo_sum_offset *entry; 14641 14642 /* Split X into a base and offset. */ 14643 split_const (x, &base, &offset); 14644 if (UNSPEC_ADDRESS_P (base)) 14645 base = UNSPEC_ADDRESS (base); 14646 14647 /* Look up the base in the hash table. */ 14648 slot = htab_find_slot_with_hash (htab, base, mips_hash_base (base), option); 14649 if (slot == NULL) 14650 return false; 14651 14652 entry = (struct mips_lo_sum_offset *) *slot; 14653 if (option == INSERT) 14654 { 14655 if (entry == NULL) 14656 { 14657 entry = XNEW (struct mips_lo_sum_offset); 14658 entry->base = base; 14659 entry->offset = INTVAL (offset); 14660 *slot = entry; 14661 } 14662 else 14663 { 14664 if (INTVAL (offset) > entry->offset) 14665 entry->offset = INTVAL (offset); 14666 } 14667 } 14668 return INTVAL (offset) <= entry->offset; 14669 } 14670 14671 /* A for_each_rtx callback for which DATA is a mips_lo_sum_offset hash table. 14672 Record every LO_SUM in *LOC. */ 14673 14674 static int 14675 mips_record_lo_sum (rtx *loc, void *data) 14676 { 14677 if (GET_CODE (*loc) == LO_SUM) 14678 mips_lo_sum_offset_lookup ((htab_t) data, XEXP (*loc, 1), INSERT); 14679 return 0; 14680 } 14681 14682 /* Return true if INSN is a SET of an orphaned high-part relocation. 14683 HTAB is a hash table of mips_lo_sum_offsets that describes all the 14684 LO_SUMs in the current function. */ 14685 14686 static bool 14687 mips_orphaned_high_part_p (htab_t htab, rtx insn) 14688 { 14689 enum mips_symbol_type type; 14690 rtx x, set; 14691 14692 set = single_set (insn); 14693 if (set) 14694 { 14695 /* Check for %his. */ 14696 x = SET_SRC (set); 14697 if (GET_CODE (x) == HIGH 14698 && absolute_symbolic_operand (XEXP (x, 0), VOIDmode)) 14699 return !mips_lo_sum_offset_lookup (htab, XEXP (x, 0), NO_INSERT); 14700 14701 /* Check for local %gots (and %got_pages, which is redundant but OK). */ 14702 if (GET_CODE (x) == UNSPEC 14703 && XINT (x, 1) == UNSPEC_LOAD_GOT 14704 && mips_symbolic_constant_p (XVECEXP (x, 0, 1), 14705 SYMBOL_CONTEXT_LEA, &type) 14706 && type == SYMBOL_GOTOFF_PAGE) 14707 return !mips_lo_sum_offset_lookup (htab, XVECEXP (x, 0, 1), NO_INSERT); 14708 } 14709 return false; 14710 } 14711 14712 /* Subroutine of mips_reorg_process_insns. If there is a hazard between 14713 INSN and a previous instruction, avoid it by inserting nops after 14714 instruction AFTER. 14715 14716 *DELAYED_REG and *HILO_DELAY describe the hazards that apply at 14717 this point. If *DELAYED_REG is non-null, INSN must wait a cycle 14718 before using the value of that register. *HILO_DELAY counts the 14719 number of instructions since the last hilo hazard (that is, 14720 the number of instructions since the last MFLO or MFHI). 14721 14722 After inserting nops for INSN, update *DELAYED_REG and *HILO_DELAY 14723 for the next instruction. 14724 14725 LO_REG is an rtx for the LO register, used in dependence checking. */ 14726 14727 static void 14728 mips_avoid_hazard (rtx after, rtx insn, int *hilo_delay, 14729 rtx *delayed_reg, rtx lo_reg) 14730 { 14731 rtx pattern, set; 14732 int nops, ninsns; 14733 14734 pattern = PATTERN (insn); 14735 14736 /* Do not put the whole function in .set noreorder if it contains 14737 an asm statement. We don't know whether there will be hazards 14738 between the asm statement and the gcc-generated code. */ 14739 if (GET_CODE (pattern) == ASM_INPUT || asm_noperands (pattern) >= 0) 14740 cfun->machine->all_noreorder_p = false; 14741 14742 /* Ignore zero-length instructions (barriers and the like). */ 14743 ninsns = get_attr_length (insn) / 4; 14744 if (ninsns == 0) 14745 return; 14746 14747 /* Work out how many nops are needed. Note that we only care about 14748 registers that are explicitly mentioned in the instruction's pattern. 14749 It doesn't matter that calls use the argument registers or that they 14750 clobber hi and lo. */ 14751 if (*hilo_delay < 2 && reg_set_p (lo_reg, pattern)) 14752 nops = 2 - *hilo_delay; 14753 else if (*delayed_reg != 0 && reg_referenced_p (*delayed_reg, pattern)) 14754 nops = 1; 14755 else 14756 nops = 0; 14757 14758 /* Insert the nops between this instruction and the previous one. 14759 Each new nop takes us further from the last hilo hazard. */ 14760 *hilo_delay += nops; 14761 while (nops-- > 0) 14762 emit_insn_after (gen_hazard_nop (), after); 14763 14764 /* Set up the state for the next instruction. */ 14765 *hilo_delay += ninsns; 14766 *delayed_reg = 0; 14767 if (INSN_CODE (insn) >= 0) 14768 switch (get_attr_hazard (insn)) 14769 { 14770 case HAZARD_NONE: 14771 break; 14772 14773 case HAZARD_HILO: 14774 *hilo_delay = 0; 14775 break; 14776 14777 case HAZARD_DELAY: 14778 set = single_set (insn); 14779 gcc_assert (set); 14780 *delayed_reg = SET_DEST (set); 14781 break; 14782 } 14783 } 14784 14785 /* Go through the instruction stream and insert nops where necessary. 14786 Also delete any high-part relocations whose partnering low parts 14787 are now all dead. See if the whole function can then be put into 14788 .set noreorder and .set nomacro. */ 14789 14790 static void 14791 mips_reorg_process_insns (void) 14792 { 14793 rtx insn, last_insn, subinsn, next_insn, lo_reg, delayed_reg; 14794 int hilo_delay; 14795 htab_t htab; 14796 14797 /* Force all instructions to be split into their final form. */ 14798 split_all_insns_noflow (); 14799 14800 /* Recalculate instruction lengths without taking nops into account. */ 14801 cfun->machine->ignore_hazard_length_p = true; 14802 shorten_branches (get_insns ()); 14803 14804 cfun->machine->all_noreorder_p = true; 14805 14806 /* We don't track MIPS16 PC-relative offsets closely enough to make 14807 a good job of "set .noreorder" code in MIPS16 mode. */ 14808 if (TARGET_MIPS16) 14809 cfun->machine->all_noreorder_p = false; 14810 14811 /* Code that doesn't use explicit relocs can't be ".set nomacro". */ 14812 if (!TARGET_EXPLICIT_RELOCS) 14813 cfun->machine->all_noreorder_p = false; 14814 14815 /* Profiled functions can't be all noreorder because the profiler 14816 support uses assembler macros. */ 14817 if (crtl->profile) 14818 cfun->machine->all_noreorder_p = false; 14819 14820 /* Code compiled with -mfix-vr4120 can't be all noreorder because 14821 we rely on the assembler to work around some errata. */ 14822 if (TARGET_FIX_VR4120) 14823 cfun->machine->all_noreorder_p = false; 14824 14825 /* The same is true for -mfix-vr4130 if we might generate MFLO or 14826 MFHI instructions. Note that we avoid using MFLO and MFHI if 14827 the VR4130 MACC and DMACC instructions are available instead; 14828 see the *mfhilo_{si,di}_macc patterns. */ 14829 if (TARGET_FIX_VR4130 && !ISA_HAS_MACCHI) 14830 cfun->machine->all_noreorder_p = false; 14831 14832 htab = htab_create (37, mips_lo_sum_offset_hash, 14833 mips_lo_sum_offset_eq, free); 14834 14835 /* Make a first pass over the instructions, recording all the LO_SUMs. */ 14836 for (insn = get_insns (); insn != 0; insn = NEXT_INSN (insn)) 14837 FOR_EACH_SUBINSN (subinsn, insn) 14838 if (USEFUL_INSN_P (subinsn)) 14839 for_each_rtx (&PATTERN (subinsn), mips_record_lo_sum, htab); 14840 14841 last_insn = 0; 14842 hilo_delay = 2; 14843 delayed_reg = 0; 14844 lo_reg = gen_rtx_REG (SImode, LO_REGNUM); 14845 14846 /* Make a second pass over the instructions. Delete orphaned 14847 high-part relocations or turn them into NOPs. Avoid hazards 14848 by inserting NOPs. */ 14849 for (insn = get_insns (); insn != 0; insn = next_insn) 14850 { 14851 next_insn = NEXT_INSN (insn); 14852 if (USEFUL_INSN_P (insn)) 14853 { 14854 if (GET_CODE (PATTERN (insn)) == SEQUENCE) 14855 { 14856 /* If we find an orphaned high-part relocation in a delay 14857 slot, it's easier to turn that instruction into a NOP than 14858 to delete it. The delay slot will be a NOP either way. */ 14859 FOR_EACH_SUBINSN (subinsn, insn) 14860 if (INSN_P (subinsn)) 14861 { 14862 if (mips_orphaned_high_part_p (htab, subinsn)) 14863 { 14864 PATTERN (subinsn) = gen_nop (); 14865 INSN_CODE (subinsn) = CODE_FOR_nop; 14866 } 14867 mips_avoid_hazard (last_insn, subinsn, &hilo_delay, 14868 &delayed_reg, lo_reg); 14869 } 14870 last_insn = insn; 14871 } 14872 else 14873 { 14874 /* INSN is a single instruction. Delete it if it's an 14875 orphaned high-part relocation. */ 14876 if (mips_orphaned_high_part_p (htab, insn)) 14877 delete_insn (insn); 14878 /* Also delete cache barriers if the last instruction 14879 was an annulled branch. INSN will not be speculatively 14880 executed. */ 14881 else if (recog_memoized (insn) == CODE_FOR_r10k_cache_barrier 14882 && last_insn 14883 && INSN_ANNULLED_BRANCH_P (SEQ_BEGIN (last_insn))) 14884 delete_insn (insn); 14885 else 14886 { 14887 mips_avoid_hazard (last_insn, insn, &hilo_delay, 14888 &delayed_reg, lo_reg); 14889 last_insn = insn; 14890 } 14891 } 14892 } 14893 } 14894 14895 htab_delete (htab); 14896 } 14897 14898 /* If we are using a GOT, but have not decided to use a global pointer yet, 14899 see whether we need one to implement long branches. Convert the ghost 14900 global-pointer instructions into real ones if so. */ 14901 14902 static bool 14903 mips_expand_ghost_gp_insns (void) 14904 { 14905 rtx insn; 14906 int normal_length; 14907 14908 /* Quick exit if we already know that we will or won't need a 14909 global pointer. */ 14910 if (!TARGET_USE_GOT 14911 || cfun->machine->global_pointer == INVALID_REGNUM 14912 || mips_must_initialize_gp_p ()) 14913 return false; 14914 14915 shorten_branches (get_insns ()); 14916 14917 /* Look for a branch that is longer than normal. The normal length for 14918 non-MIPS16 branches is 8, because the length includes the delay slot. 14919 It is 4 for MIPS16, because MIPS16 branches are extended instructions, 14920 but they have no delay slot. */ 14921 normal_length = (TARGET_MIPS16 ? 4 : 8); 14922 for (insn = get_insns (); insn; insn = NEXT_INSN (insn)) 14923 if (JUMP_P (insn) 14924 && USEFUL_INSN_P (insn) 14925 && get_attr_length (insn) > normal_length) 14926 break; 14927 14928 if (insn == NULL_RTX) 14929 return false; 14930 14931 /* We've now established that we need $gp. */ 14932 cfun->machine->must_initialize_gp_p = true; 14933 split_all_insns_noflow (); 14934 14935 return true; 14936 } 14937 14938 /* Subroutine of mips_reorg to manage passes that require DF. */ 14939 14940 static void 14941 mips_df_reorg (void) 14942 { 14943 /* Create def-use chains. */ 14944 df_set_flags (DF_EQ_NOTES); 14945 df_chain_add_problem (DF_UD_CHAIN); 14946 df_analyze (); 14947 14948 if (TARGET_RELAX_PIC_CALLS) 14949 mips_annotate_pic_calls (); 14950 14951 if (mips_r10k_cache_barrier != R10K_CACHE_BARRIER_NONE) 14952 r10k_insert_cache_barriers (); 14953 14954 df_finish_pass (false); 14955 } 14956 14957 /* Implement TARGET_MACHINE_DEPENDENT_REORG. */ 14958 14959 static void 14960 mips_reorg (void) 14961 { 14962 /* Restore the BLOCK_FOR_INSN pointers, which are needed by DF. Also during 14963 insn splitting in mips16_lay_out_constants, DF insn info is only kept up 14964 to date if the CFG is available. */ 14965 if (mips_cfg_in_reorg ()) 14966 compute_bb_for_insn (); 14967 mips16_lay_out_constants (); 14968 if (mips_cfg_in_reorg ()) 14969 { 14970 mips_df_reorg (); 14971 free_bb_for_insn (); 14972 } 14973 14974 if (optimize > 0 && flag_delayed_branch) 14975 dbr_schedule (get_insns ()); 14976 mips_reorg_process_insns (); 14977 if (!TARGET_MIPS16 14978 && TARGET_EXPLICIT_RELOCS 14979 && TUNE_MIPS4130 14980 && TARGET_VR4130_ALIGN) 14981 vr4130_align_insns (); 14982 if (mips_expand_ghost_gp_insns ()) 14983 /* The expansion could invalidate some of the VR4130 alignment 14984 optimizations, but this should be an extremely rare case anyhow. */ 14985 mips_reorg_process_insns (); 14986 } 14987 14988 /* Implement TARGET_ASM_OUTPUT_MI_THUNK. Generate rtl rather than asm text 14989 in order to avoid duplicating too much logic from elsewhere. */ 14990 14991 static void 14992 mips_output_mi_thunk (FILE *file, tree thunk_fndecl ATTRIBUTE_UNUSED, 14993 HOST_WIDE_INT delta, HOST_WIDE_INT vcall_offset, 14994 tree function) 14995 { 14996 rtx this_rtx, temp1, temp2, insn, fnaddr; 14997 bool use_sibcall_p; 14998 14999 /* Pretend to be a post-reload pass while generating rtl. */ 15000 reload_completed = 1; 15001 15002 /* Mark the end of the (empty) prologue. */ 15003 emit_note (NOTE_INSN_PROLOGUE_END); 15004 15005 /* Determine if we can use a sibcall to call FUNCTION directly. */ 15006 fnaddr = XEXP (DECL_RTL (function), 0); 15007 use_sibcall_p = (mips_function_ok_for_sibcall (function, NULL) 15008 && const_call_insn_operand (fnaddr, Pmode)); 15009 15010 /* Determine if we need to load FNADDR from the GOT. */ 15011 if (!use_sibcall_p 15012 && (mips_got_symbol_type_p 15013 (mips_classify_symbol (fnaddr, SYMBOL_CONTEXT_LEA)))) 15014 { 15015 /* Pick a global pointer. Use a call-clobbered register if 15016 TARGET_CALL_SAVED_GP. */ 15017 cfun->machine->global_pointer 15018 = TARGET_CALL_SAVED_GP ? 15 : GLOBAL_POINTER_REGNUM; 15019 cfun->machine->must_initialize_gp_p = true; 15020 SET_REGNO (pic_offset_table_rtx, cfun->machine->global_pointer); 15021 15022 /* Set up the global pointer for n32 or n64 abicalls. */ 15023 mips_emit_loadgp (); 15024 } 15025 15026 /* We need two temporary registers in some cases. */ 15027 temp1 = gen_rtx_REG (Pmode, 2); 15028 temp2 = gen_rtx_REG (Pmode, 3); 15029 15030 /* Find out which register contains the "this" pointer. */ 15031 if (aggregate_value_p (TREE_TYPE (TREE_TYPE (function)), function)) 15032 this_rtx = gen_rtx_REG (Pmode, GP_ARG_FIRST + 1); 15033 else 15034 this_rtx = gen_rtx_REG (Pmode, GP_ARG_FIRST); 15035 15036 /* Add DELTA to THIS_RTX. */ 15037 if (delta != 0) 15038 { 15039 rtx offset = GEN_INT (delta); 15040 if (!SMALL_OPERAND (delta)) 15041 { 15042 mips_emit_move (temp1, offset); 15043 offset = temp1; 15044 } 15045 emit_insn (gen_add3_insn (this_rtx, this_rtx, offset)); 15046 } 15047 15048 /* If needed, add *(*THIS_RTX + VCALL_OFFSET) to THIS_RTX. */ 15049 if (vcall_offset != 0) 15050 { 15051 rtx addr; 15052 15053 /* Set TEMP1 to *THIS_RTX. */ 15054 mips_emit_move (temp1, gen_rtx_MEM (Pmode, this_rtx)); 15055 15056 /* Set ADDR to a legitimate address for *THIS_RTX + VCALL_OFFSET. */ 15057 addr = mips_add_offset (temp2, temp1, vcall_offset); 15058 15059 /* Load the offset and add it to THIS_RTX. */ 15060 mips_emit_move (temp1, gen_rtx_MEM (Pmode, addr)); 15061 emit_insn (gen_add3_insn (this_rtx, this_rtx, temp1)); 15062 } 15063 15064 /* Jump to the target function. Use a sibcall if direct jumps are 15065 allowed, otherwise load the address into a register first. */ 15066 if (use_sibcall_p) 15067 { 15068 insn = emit_call_insn (gen_sibcall_internal (fnaddr, const0_rtx)); 15069 SIBLING_CALL_P (insn) = 1; 15070 } 15071 else 15072 { 15073 /* This is messy. GAS treats "la $25,foo" as part of a call 15074 sequence and may allow a global "foo" to be lazily bound. 15075 The general move patterns therefore reject this combination. 15076 15077 In this context, lazy binding would actually be OK 15078 for TARGET_CALL_CLOBBERED_GP, but it's still wrong for 15079 TARGET_CALL_SAVED_GP; see mips_load_call_address. 15080 We must therefore load the address via a temporary 15081 register if mips_dangerous_for_la25_p. 15082 15083 If we jump to the temporary register rather than $25, 15084 the assembler can use the move insn to fill the jump's 15085 delay slot. 15086 15087 We can use the same technique for MIPS16 code, where $25 15088 is not a valid JR register. */ 15089 if (TARGET_USE_PIC_FN_ADDR_REG 15090 && !TARGET_MIPS16 15091 && !mips_dangerous_for_la25_p (fnaddr)) 15092 temp1 = gen_rtx_REG (Pmode, PIC_FUNCTION_ADDR_REGNUM); 15093 mips_load_call_address (MIPS_CALL_SIBCALL, temp1, fnaddr); 15094 15095 if (TARGET_USE_PIC_FN_ADDR_REG 15096 && REGNO (temp1) != PIC_FUNCTION_ADDR_REGNUM) 15097 mips_emit_move (gen_rtx_REG (Pmode, PIC_FUNCTION_ADDR_REGNUM), temp1); 15098 emit_jump_insn (gen_indirect_jump (temp1)); 15099 } 15100 15101 /* Run just enough of rest_of_compilation. This sequence was 15102 "borrowed" from alpha.c. */ 15103 insn = get_insns (); 15104 insn_locators_alloc (); 15105 split_all_insns_noflow (); 15106 mips16_lay_out_constants (); 15107 shorten_branches (insn); 15108 final_start_function (insn, file, 1); 15109 final (insn, file, 1); 15110 final_end_function (); 15111 15112 /* Clean up the vars set above. Note that final_end_function resets 15113 the global pointer for us. */ 15114 reload_completed = 0; 15115 } 15116 15117 /* The last argument passed to mips_set_mips16_mode, or negative if the 15118 function hasn't been called yet. 15119 15120 There are two copies of this information. One is saved and restored 15121 by the PCH process while the other is specific to this compiler 15122 invocation. The information calculated by mips_set_mips16_mode 15123 is invalid unless the two variables are the same. */ 15124 static int was_mips16_p = -1; 15125 static GTY(()) int was_mips16_pch_p = -1; 15126 15127 /* Set up the target-dependent global state so that it matches the 15128 current function's ISA mode. */ 15129 15130 static void 15131 mips_set_mips16_mode (int mips16_p) 15132 { 15133 if (mips16_p == was_mips16_p 15134 && mips16_p == was_mips16_pch_p) 15135 return; 15136 15137 /* Restore base settings of various flags. */ 15138 target_flags = mips_base_target_flags; 15139 flag_schedule_insns = mips_base_schedule_insns; 15140 flag_reorder_blocks_and_partition = mips_base_reorder_blocks_and_partition; 15141 flag_move_loop_invariants = mips_base_move_loop_invariants; 15142 align_loops = mips_base_align_loops; 15143 align_jumps = mips_base_align_jumps; 15144 align_functions = mips_base_align_functions; 15145 15146 if (mips16_p) 15147 { 15148 /* Switch to MIPS16 mode. */ 15149 target_flags |= MASK_MIPS16; 15150 15151 /* Don't run the scheduler before reload, since it tends to 15152 increase register pressure. */ 15153 flag_schedule_insns = 0; 15154 15155 /* Don't do hot/cold partitioning. mips16_lay_out_constants expects 15156 the whole function to be in a single section. */ 15157 flag_reorder_blocks_and_partition = 0; 15158 15159 /* Don't move loop invariants, because it tends to increase 15160 register pressure. It also introduces an extra move in cases 15161 where the constant is the first operand in a two-operand binary 15162 instruction, or when it forms a register argument to a functon 15163 call. */ 15164 flag_move_loop_invariants = 0; 15165 15166 target_flags |= MASK_EXPLICIT_RELOCS; 15167 15168 /* Experiments suggest we get the best overall section-anchor 15169 results from using the range of an unextended LW or SW. Code 15170 that makes heavy use of byte or short accesses can do better 15171 with ranges of 0...31 and 0...63 respectively, but most code is 15172 sensitive to the range of LW and SW instead. */ 15173 targetm.min_anchor_offset = 0; 15174 targetm.max_anchor_offset = 127; 15175 15176 targetm.const_anchor = 0; 15177 15178 /* MIPS16 has no BAL instruction. */ 15179 target_flags &= ~MASK_RELAX_PIC_CALLS; 15180 15181 if (flag_pic && !TARGET_OLDABI) 15182 sorry ("MIPS16 PIC for ABIs other than o32 and o64"); 15183 15184 if (TARGET_XGOT) 15185 sorry ("MIPS16 -mxgot code"); 15186 15187 if (TARGET_HARD_FLOAT_ABI && !TARGET_OLDABI) 15188 sorry ("hard-float MIPS16 code for ABIs other than o32 and o64"); 15189 } 15190 else 15191 { 15192 /* Switch to normal (non-MIPS16) mode. */ 15193 target_flags &= ~MASK_MIPS16; 15194 15195 /* Provide default values for align_* for 64-bit targets. */ 15196 if (TARGET_64BIT) 15197 { 15198 if (align_loops == 0) 15199 align_loops = 8; 15200 if (align_jumps == 0) 15201 align_jumps = 8; 15202 if (align_functions == 0) 15203 align_functions = 8; 15204 } 15205 15206 targetm.min_anchor_offset = -32768; 15207 targetm.max_anchor_offset = 32767; 15208 15209 targetm.const_anchor = 0x8000; 15210 } 15211 15212 /* (Re)initialize MIPS target internals for new ISA. */ 15213 mips_init_relocs (); 15214 15215 if (was_mips16_p >= 0 || was_mips16_pch_p >= 0) 15216 /* Reinitialize target-dependent state. */ 15217 target_reinit (); 15218 15219 was_mips16_p = mips16_p; 15220 was_mips16_pch_p = mips16_p; 15221 } 15222 15223 /* Implement TARGET_SET_CURRENT_FUNCTION. Decide whether the current 15224 function should use the MIPS16 ISA and switch modes accordingly. */ 15225 15226 static void 15227 mips_set_current_function (tree fndecl) 15228 { 15229 mips_set_mips16_mode (mips_use_mips16_mode_p (fndecl)); 15230 } 15231 15232 /* Allocate a chunk of memory for per-function machine-dependent data. */ 15233 15234 static struct machine_function * 15235 mips_init_machine_status (void) 15236 { 15237 return ((struct machine_function *) 15238 ggc_alloc_cleared (sizeof (struct machine_function))); 15239 } 15240 15241 /* Return the processor associated with the given ISA level, or null 15242 if the ISA isn't valid. */ 15243 15244 static const struct mips_cpu_info * 15245 mips_cpu_info_from_isa (int isa) 15246 { 15247 unsigned int i; 15248 15249 for (i = 0; i < ARRAY_SIZE (mips_cpu_info_table); i++) 15250 if (mips_cpu_info_table[i].isa == isa) 15251 return mips_cpu_info_table + i; 15252 15253 return NULL; 15254 } 15255 15256 /* Return true if GIVEN is the same as CANONICAL, or if it is CANONICAL 15257 with a final "000" replaced by "k". Ignore case. 15258 15259 Note: this function is shared between GCC and GAS. */ 15260 15261 static bool 15262 mips_strict_matching_cpu_name_p (const char *canonical, const char *given) 15263 { 15264 while (*given != 0 && TOLOWER (*given) == TOLOWER (*canonical)) 15265 given++, canonical++; 15266 15267 return ((*given == 0 && *canonical == 0) 15268 || (strcmp (canonical, "000") == 0 && strcasecmp (given, "k") == 0)); 15269 } 15270 15271 /* Return true if GIVEN matches CANONICAL, where GIVEN is a user-supplied 15272 CPU name. We've traditionally allowed a lot of variation here. 15273 15274 Note: this function is shared between GCC and GAS. */ 15275 15276 static bool 15277 mips_matching_cpu_name_p (const char *canonical, const char *given) 15278 { 15279 /* First see if the name matches exactly, or with a final "000" 15280 turned into "k". */ 15281 if (mips_strict_matching_cpu_name_p (canonical, given)) 15282 return true; 15283 15284 /* If not, try comparing based on numerical designation alone. 15285 See if GIVEN is an unadorned number, or 'r' followed by a number. */ 15286 if (TOLOWER (*given) == 'r') 15287 given++; 15288 if (!ISDIGIT (*given)) 15289 return false; 15290 15291 /* Skip over some well-known prefixes in the canonical name, 15292 hoping to find a number there too. */ 15293 if (TOLOWER (canonical[0]) == 'v' && TOLOWER (canonical[1]) == 'r') 15294 canonical += 2; 15295 else if (TOLOWER (canonical[0]) == 'r' && TOLOWER (canonical[1]) == 'm') 15296 canonical += 2; 15297 else if (TOLOWER (canonical[0]) == 'r') 15298 canonical += 1; 15299 15300 return mips_strict_matching_cpu_name_p (canonical, given); 15301 } 15302 15303 /* Return the mips_cpu_info entry for the processor or ISA given 15304 by CPU_STRING. Return null if the string isn't recognized. 15305 15306 A similar function exists in GAS. */ 15307 15308 static const struct mips_cpu_info * 15309 mips_parse_cpu (const char *cpu_string) 15310 { 15311 unsigned int i; 15312 const char *s; 15313 15314 /* In the past, we allowed upper-case CPU names, but it doesn't 15315 work well with the multilib machinery. */ 15316 for (s = cpu_string; *s != 0; s++) 15317 if (ISUPPER (*s)) 15318 { 15319 warning (0, "CPU names must be lower case"); 15320 break; 15321 } 15322 15323 /* 'from-abi' selects the most compatible architecture for the given 15324 ABI: MIPS I for 32-bit ABIs and MIPS III for 64-bit ABIs. For the 15325 EABIs, we have to decide whether we're using the 32-bit or 64-bit 15326 version. */ 15327 if (strcasecmp (cpu_string, "from-abi") == 0) 15328 return mips_cpu_info_from_isa (ABI_NEEDS_32BIT_REGS ? 1 15329 : ABI_NEEDS_64BIT_REGS ? 3 15330 : (TARGET_64BIT ? 3 : 1)); 15331 15332 /* 'default' has traditionally been a no-op. Probably not very useful. */ 15333 if (strcasecmp (cpu_string, "default") == 0) 15334 return NULL; 15335 15336 for (i = 0; i < ARRAY_SIZE (mips_cpu_info_table); i++) 15337 if (mips_matching_cpu_name_p (mips_cpu_info_table[i].name, cpu_string)) 15338 return mips_cpu_info_table + i; 15339 15340 return NULL; 15341 } 15342 15343 /* Set up globals to generate code for the ISA or processor 15344 described by INFO. */ 15345 15346 static void 15347 mips_set_architecture (const struct mips_cpu_info *info) 15348 { 15349 if (info != 0) 15350 { 15351 mips_arch_info = info; 15352 mips_arch = info->cpu; 15353 mips_isa = info->isa; 15354 } 15355 } 15356 15357 /* Likewise for tuning. */ 15358 15359 static void 15360 mips_set_tune (const struct mips_cpu_info *info) 15361 { 15362 if (info != 0) 15363 { 15364 mips_tune_info = info; 15365 mips_tune = info->cpu; 15366 } 15367 } 15368 15369 /* Implement TARGET_HANDLE_OPTION. */ 15370 15371 static bool 15372 mips_handle_option (size_t code, const char *arg, int value ATTRIBUTE_UNUSED) 15373 { 15374 switch (code) 15375 { 15376 case OPT_mabi_: 15377 if (strcmp (arg, "32") == 0) 15378 mips_abi = ABI_32; 15379 else if (strcmp (arg, "o64") == 0) 15380 mips_abi = ABI_O64; 15381 else if (strcmp (arg, "n32") == 0) 15382 mips_abi = ABI_N32; 15383 else if (strcmp (arg, "64") == 0) 15384 mips_abi = ABI_64; 15385 else if (strcmp (arg, "eabi") == 0) 15386 mips_abi = ABI_EABI; 15387 else 15388 return false; 15389 return true; 15390 15391 case OPT_march_: 15392 case OPT_mtune_: 15393 return mips_parse_cpu (arg) != 0; 15394 15395 case OPT_mips: 15396 mips_isa_option_info = mips_parse_cpu (ACONCAT (("mips", arg, NULL))); 15397 return mips_isa_option_info != 0; 15398 15399 case OPT_mno_flush_func: 15400 mips_cache_flush_func = NULL; 15401 return true; 15402 15403 case OPT_mcode_readable_: 15404 if (strcmp (arg, "yes") == 0) 15405 mips_code_readable = CODE_READABLE_YES; 15406 else if (strcmp (arg, "pcrel") == 0) 15407 mips_code_readable = CODE_READABLE_PCREL; 15408 else if (strcmp (arg, "no") == 0) 15409 mips_code_readable = CODE_READABLE_NO; 15410 else 15411 return false; 15412 return true; 15413 15414 case OPT_mr10k_cache_barrier_: 15415 if (strcmp (arg, "load-store") == 0) 15416 mips_r10k_cache_barrier = R10K_CACHE_BARRIER_LOAD_STORE; 15417 else if (strcmp (arg, "store") == 0) 15418 mips_r10k_cache_barrier = R10K_CACHE_BARRIER_STORE; 15419 else if (strcmp (arg, "none") == 0) 15420 mips_r10k_cache_barrier = R10K_CACHE_BARRIER_NONE; 15421 else 15422 return false; 15423 return true; 15424 15425 default: 15426 return true; 15427 } 15428 } 15429 15430 /* Implement OVERRIDE_OPTIONS. */ 15431 15432 void 15433 mips_override_options (void) 15434 { 15435 int i, start, regno, mode; 15436 15437 /* Process flags as though we were generating non-MIPS16 code. */ 15438 mips_base_mips16 = TARGET_MIPS16; 15439 target_flags &= ~MASK_MIPS16; 15440 15441 #ifdef SUBTARGET_OVERRIDE_OPTIONS 15442 SUBTARGET_OVERRIDE_OPTIONS; 15443 #endif 15444 15445 /* Set the small data limit. */ 15446 mips_small_data_threshold = (g_switch_set 15447 ? g_switch_value 15448 : MIPS_DEFAULT_GVALUE); 15449 15450 /* The following code determines the architecture and register size. 15451 Similar code was added to GAS 2.14 (see tc-mips.c:md_after_parse_args()). 15452 The GAS and GCC code should be kept in sync as much as possible. */ 15453 15454 if (mips_arch_string != 0) 15455 mips_set_architecture (mips_parse_cpu (mips_arch_string)); 15456 15457 if (mips_isa_option_info != 0) 15458 { 15459 if (mips_arch_info == 0) 15460 mips_set_architecture (mips_isa_option_info); 15461 else if (mips_arch_info->isa != mips_isa_option_info->isa) 15462 error ("%<-%s%> conflicts with the other architecture options, " 15463 "which specify a %s processor", 15464 mips_isa_option_info->name, 15465 mips_cpu_info_from_isa (mips_arch_info->isa)->name); 15466 } 15467 15468 if (mips_arch_info == 0) 15469 { 15470 #ifdef MIPS_CPU_STRING_DEFAULT 15471 mips_set_architecture (mips_parse_cpu (MIPS_CPU_STRING_DEFAULT)); 15472 #else 15473 mips_set_architecture (mips_cpu_info_from_isa (MIPS_ISA_DEFAULT)); 15474 #endif 15475 } 15476 15477 if (ABI_NEEDS_64BIT_REGS && !ISA_HAS_64BIT_REGS) 15478 error ("%<-march=%s%> is not compatible with the selected ABI", 15479 mips_arch_info->name); 15480 15481 /* Optimize for mips_arch, unless -mtune selects a different processor. */ 15482 if (mips_tune_string != 0) 15483 mips_set_tune (mips_parse_cpu (mips_tune_string)); 15484 15485 if (mips_tune_info == 0) 15486 mips_set_tune (mips_arch_info); 15487 15488 if ((target_flags_explicit & MASK_64BIT) != 0) 15489 { 15490 /* The user specified the size of the integer registers. Make sure 15491 it agrees with the ABI and ISA. */ 15492 if (TARGET_64BIT && !ISA_HAS_64BIT_REGS) 15493 error ("%<-mgp64%> used with a 32-bit processor"); 15494 else if (!TARGET_64BIT && ABI_NEEDS_64BIT_REGS) 15495 error ("%<-mgp32%> used with a 64-bit ABI"); 15496 else if (TARGET_64BIT && ABI_NEEDS_32BIT_REGS) 15497 error ("%<-mgp64%> used with a 32-bit ABI"); 15498 } 15499 else 15500 { 15501 /* Infer the integer register size from the ABI and processor. 15502 Restrict ourselves to 32-bit registers if that's all the 15503 processor has, or if the ABI cannot handle 64-bit registers. */ 15504 if (ABI_NEEDS_32BIT_REGS || !ISA_HAS_64BIT_REGS) 15505 target_flags &= ~MASK_64BIT; 15506 else 15507 target_flags |= MASK_64BIT; 15508 } 15509 15510 if ((target_flags_explicit & MASK_FLOAT64) != 0) 15511 { 15512 if (TARGET_SINGLE_FLOAT && TARGET_FLOAT64) 15513 error ("unsupported combination: %s", "-mfp64 -msingle-float"); 15514 else if (TARGET_64BIT && TARGET_DOUBLE_FLOAT && !TARGET_FLOAT64) 15515 error ("unsupported combination: %s", "-mgp64 -mfp32 -mdouble-float"); 15516 else if (!TARGET_64BIT && TARGET_FLOAT64) 15517 { 15518 if (!ISA_HAS_MXHC1) 15519 error ("%<-mgp32%> and %<-mfp64%> can only be combined if" 15520 " the target supports the mfhc1 and mthc1 instructions"); 15521 else if (mips_abi != ABI_32) 15522 error ("%<-mgp32%> and %<-mfp64%> can only be combined when using" 15523 " the o32 ABI"); 15524 } 15525 } 15526 else 15527 { 15528 /* -msingle-float selects 32-bit float registers. Otherwise the 15529 float registers should be the same size as the integer ones. */ 15530 if (TARGET_64BIT && TARGET_DOUBLE_FLOAT) 15531 target_flags |= MASK_FLOAT64; 15532 else 15533 target_flags &= ~MASK_FLOAT64; 15534 } 15535 15536 /* End of code shared with GAS. */ 15537 15538 /* If no -mlong* option was given, infer it from the other options. */ 15539 if ((target_flags_explicit & MASK_LONG64) == 0) 15540 { 15541 if ((mips_abi == ABI_EABI && TARGET_64BIT) || mips_abi == ABI_64) 15542 target_flags |= MASK_LONG64; 15543 else 15544 target_flags &= ~MASK_LONG64; 15545 } 15546 15547 if (!TARGET_OLDABI) 15548 flag_pcc_struct_return = 0; 15549 15550 /* Decide which rtx_costs structure to use. */ 15551 if (optimize_size) 15552 mips_cost = &mips_rtx_cost_optimize_size; 15553 else 15554 mips_cost = &mips_rtx_cost_data[mips_tune]; 15555 15556 /* If the user hasn't specified a branch cost, use the processor's 15557 default. */ 15558 if (mips_branch_cost == 0) 15559 mips_branch_cost = mips_cost->branch_cost; 15560 15561 /* If neither -mbranch-likely nor -mno-branch-likely was given 15562 on the command line, set MASK_BRANCHLIKELY based on the target 15563 architecture and tuning flags. Annulled delay slots are a 15564 size win, so we only consider the processor-specific tuning 15565 for !optimize_size. */ 15566 if ((target_flags_explicit & MASK_BRANCHLIKELY) == 0) 15567 { 15568 if (ISA_HAS_BRANCHLIKELY 15569 && (optimize_size 15570 || (mips_tune_info->tune_flags & PTF_AVOID_BRANCHLIKELY) == 0)) 15571 target_flags |= MASK_BRANCHLIKELY; 15572 else 15573 target_flags &= ~MASK_BRANCHLIKELY; 15574 } 15575 else if (TARGET_BRANCHLIKELY && !ISA_HAS_BRANCHLIKELY) 15576 warning (0, "the %qs architecture does not support branch-likely" 15577 " instructions", mips_arch_info->name); 15578 15579 /* The effect of -mabicalls isn't defined for the EABI. */ 15580 if (mips_abi == ABI_EABI && TARGET_ABICALLS) 15581 { 15582 error ("unsupported combination: %s", "-mabicalls -mabi=eabi"); 15583 target_flags &= ~MASK_ABICALLS; 15584 } 15585 15586 if (TARGET_ABICALLS_PIC2) 15587 /* We need to set flag_pic for executables as well as DSOs 15588 because we may reference symbols that are not defined in 15589 the final executable. (MIPS does not use things like 15590 copy relocs, for example.) 15591 15592 There is a body of code that uses __PIC__ to distinguish 15593 between -mabicalls and -mno-abicalls code. The non-__PIC__ 15594 variant is usually appropriate for TARGET_ABICALLS_PIC0, as 15595 long as any indirect jumps use $25. */ 15596 flag_pic = 1; 15597 15598 /* -mvr4130-align is a "speed over size" optimization: it usually produces 15599 faster code, but at the expense of more nops. Enable it at -O3 and 15600 above. */ 15601 if (optimize > 2 && (target_flags_explicit & MASK_VR4130_ALIGN) == 0) 15602 target_flags |= MASK_VR4130_ALIGN; 15603 15604 /* Prefer a call to memcpy over inline code when optimizing for size, 15605 though see MOVE_RATIO in mips.h. */ 15606 if (optimize_size && (target_flags_explicit & MASK_MEMCPY) == 0) 15607 target_flags |= MASK_MEMCPY; 15608 15609 /* If we have a nonzero small-data limit, check that the -mgpopt 15610 setting is consistent with the other target flags. */ 15611 if (mips_small_data_threshold > 0) 15612 { 15613 if (!TARGET_GPOPT) 15614 { 15615 if (!TARGET_EXPLICIT_RELOCS) 15616 error ("%<-mno-gpopt%> needs %<-mexplicit-relocs%>"); 15617 15618 TARGET_LOCAL_SDATA = false; 15619 TARGET_EXTERN_SDATA = false; 15620 } 15621 else 15622 { 15623 if (TARGET_VXWORKS_RTP) 15624 warning (0, "cannot use small-data accesses for %qs", "-mrtp"); 15625 15626 if (TARGET_ABICALLS) 15627 warning (0, "cannot use small-data accesses for %qs", 15628 "-mabicalls"); 15629 } 15630 } 15631 15632 #ifdef MIPS_TFMODE_FORMAT 15633 REAL_MODE_FORMAT (TFmode) = &MIPS_TFMODE_FORMAT; 15634 #endif 15635 15636 /* Make sure that the user didn't turn off paired single support when 15637 MIPS-3D support is requested. */ 15638 if (TARGET_MIPS3D 15639 && (target_flags_explicit & MASK_PAIRED_SINGLE_FLOAT) 15640 && !TARGET_PAIRED_SINGLE_FLOAT) 15641 error ("%<-mips3d%> requires %<-mpaired-single%>"); 15642 15643 /* If TARGET_MIPS3D, enable MASK_PAIRED_SINGLE_FLOAT. */ 15644 if (TARGET_MIPS3D) 15645 target_flags |= MASK_PAIRED_SINGLE_FLOAT; 15646 15647 /* Make sure that when TARGET_PAIRED_SINGLE_FLOAT is true, TARGET_FLOAT64 15648 and TARGET_HARD_FLOAT_ABI are both true. */ 15649 if (TARGET_PAIRED_SINGLE_FLOAT && !(TARGET_FLOAT64 && TARGET_HARD_FLOAT_ABI)) 15650 error ("%qs must be used with %qs", 15651 TARGET_MIPS3D ? "-mips3d" : "-mpaired-single", 15652 TARGET_HARD_FLOAT_ABI ? "-mfp64" : "-mhard-float"); 15653 15654 /* Make sure that the ISA supports TARGET_PAIRED_SINGLE_FLOAT when it is 15655 enabled. */ 15656 if (TARGET_PAIRED_SINGLE_FLOAT && !ISA_HAS_PAIRED_SINGLE) 15657 warning (0, "the %qs architecture does not support paired-single" 15658 " instructions", mips_arch_info->name); 15659 15660 if (mips_r10k_cache_barrier != R10K_CACHE_BARRIER_NONE 15661 && !TARGET_CACHE_BUILTIN) 15662 { 15663 error ("%qs requires a target that provides the %qs instruction", 15664 "-mr10k-cache-barrier", "cache"); 15665 mips_r10k_cache_barrier = R10K_CACHE_BARRIER_NONE; 15666 } 15667 15668 /* If TARGET_DSPR2, enable MASK_DSP. */ 15669 if (TARGET_DSPR2) 15670 target_flags |= MASK_DSP; 15671 15672 /* .eh_frame addresses should be the same width as a C pointer. 15673 Most MIPS ABIs support only one pointer size, so the assembler 15674 will usually know exactly how big an .eh_frame address is. 15675 15676 Unfortunately, this is not true of the 64-bit EABI. The ABI was 15677 originally defined to use 64-bit pointers (i.e. it is LP64), and 15678 this is still the default mode. However, we also support an n32-like 15679 ILP32 mode, which is selected by -mlong32. The problem is that the 15680 assembler has traditionally not had an -mlong option, so it has 15681 traditionally not known whether we're using the ILP32 or LP64 form. 15682 15683 As it happens, gas versions up to and including 2.19 use _32-bit_ 15684 addresses for EABI64 .cfi_* directives. This is wrong for the 15685 default LP64 mode, so we can't use the directives by default. 15686 Moreover, since gas's current behavior is at odds with gcc's 15687 default behavior, it seems unwise to rely on future versions 15688 of gas behaving the same way. We therefore avoid using .cfi 15689 directives for -mlong32 as well. */ 15690 if (mips_abi == ABI_EABI && TARGET_64BIT) 15691 flag_dwarf2_cfi_asm = 0; 15692 15693 /* .cfi_* directives generate a read-only section, so fall back on 15694 manual .eh_frame creation if we need the section to be writable. */ 15695 if (TARGET_WRITABLE_EH_FRAME) 15696 flag_dwarf2_cfi_asm = 0; 15697 15698 mips_init_print_operand_punct (); 15699 15700 /* Set up array to map GCC register number to debug register number. 15701 Ignore the special purpose register numbers. */ 15702 15703 for (i = 0; i < FIRST_PSEUDO_REGISTER; i++) 15704 { 15705 mips_dbx_regno[i] = INVALID_REGNUM; 15706 if (GP_REG_P (i) || FP_REG_P (i) || ALL_COP_REG_P (i)) 15707 mips_dwarf_regno[i] = i; 15708 else 15709 mips_dwarf_regno[i] = INVALID_REGNUM; 15710 } 15711 15712 start = GP_DBX_FIRST - GP_REG_FIRST; 15713 for (i = GP_REG_FIRST; i <= GP_REG_LAST; i++) 15714 mips_dbx_regno[i] = i + start; 15715 15716 start = FP_DBX_FIRST - FP_REG_FIRST; 15717 for (i = FP_REG_FIRST; i <= FP_REG_LAST; i++) 15718 mips_dbx_regno[i] = i + start; 15719 15720 /* Accumulator debug registers use big-endian ordering. */ 15721 mips_dbx_regno[HI_REGNUM] = MD_DBX_FIRST + 0; 15722 mips_dbx_regno[LO_REGNUM] = MD_DBX_FIRST + 1; 15723 mips_dwarf_regno[HI_REGNUM] = MD_REG_FIRST + 0; 15724 mips_dwarf_regno[LO_REGNUM] = MD_REG_FIRST + 1; 15725 for (i = DSP_ACC_REG_FIRST; i <= DSP_ACC_REG_LAST; i += 2) 15726 { 15727 mips_dwarf_regno[i + TARGET_LITTLE_ENDIAN] = i; 15728 mips_dwarf_regno[i + TARGET_BIG_ENDIAN] = i + 1; 15729 } 15730 15731 /* Set up mips_hard_regno_mode_ok. */ 15732 for (mode = 0; mode < MAX_MACHINE_MODE; mode++) 15733 for (regno = 0; regno < FIRST_PSEUDO_REGISTER; regno++) 15734 mips_hard_regno_mode_ok[mode][regno] 15735 = mips_hard_regno_mode_ok_p (regno, (enum machine_mode) mode); 15736 15737 /* Function to allocate machine-dependent function status. */ 15738 init_machine_status = &mips_init_machine_status; 15739 15740 /* Default to working around R4000 errata only if the processor 15741 was selected explicitly. */ 15742 if ((target_flags_explicit & MASK_FIX_R4000) == 0 15743 && mips_matching_cpu_name_p (mips_arch_info->name, "r4000")) 15744 target_flags |= MASK_FIX_R4000; 15745 15746 /* Default to working around R4400 errata only if the processor 15747 was selected explicitly. */ 15748 if ((target_flags_explicit & MASK_FIX_R4400) == 0 15749 && mips_matching_cpu_name_p (mips_arch_info->name, "r4400")) 15750 target_flags |= MASK_FIX_R4400; 15751 15752 /* Default to working around R10000 errata only if the processor 15753 was selected explicitly. */ 15754 if ((target_flags_explicit & MASK_FIX_R10000) == 0 15755 && mips_matching_cpu_name_p (mips_arch_info->name, "r10000")) 15756 target_flags |= MASK_FIX_R10000; 15757 15758 /* Make sure that branch-likely instructions available when using 15759 -mfix-r10000. The instructions are not available if either: 15760 15761 1. -mno-branch-likely was passed. 15762 2. The selected ISA does not support branch-likely and 15763 the command line does not include -mbranch-likely. */ 15764 if (TARGET_FIX_R10000 15765 && ((target_flags_explicit & MASK_BRANCHLIKELY) == 0 15766 ? !ISA_HAS_BRANCHLIKELY 15767 : !TARGET_BRANCHLIKELY)) 15768 sorry ("%qs requires branch-likely instructions", "-mfix-r10000"); 15769 15770 if (TARGET_SYNCI && !ISA_HAS_SYNCI) 15771 { 15772 warning (0, "the %qs architecture does not support the synci " 15773 "instruction", mips_arch_info->name); 15774 target_flags &= ~MASK_SYNCI; 15775 } 15776 15777 /* Only optimize PIC indirect calls if they are actually required. */ 15778 if (!TARGET_USE_GOT || !TARGET_EXPLICIT_RELOCS) 15779 target_flags &= ~MASK_RELAX_PIC_CALLS; 15780 15781 /* Save base state of options. */ 15782 mips_base_target_flags = target_flags; 15783 mips_base_schedule_insns = flag_schedule_insns; 15784 mips_base_reorder_blocks_and_partition = flag_reorder_blocks_and_partition; 15785 mips_base_move_loop_invariants = flag_move_loop_invariants; 15786 mips_base_align_loops = align_loops; 15787 mips_base_align_jumps = align_jumps; 15788 mips_base_align_functions = align_functions; 15789 15790 /* Now select the ISA mode. 15791 15792 Do all CPP-sensitive stuff in non-MIPS16 mode; we'll switch to 15793 MIPS16 mode afterwards if need be. */ 15794 mips_set_mips16_mode (false); 15795 } 15796 15797 /* Swap the register information for registers I and I + 1, which 15798 currently have the wrong endianness. Note that the registers' 15799 fixedness and call-clobberedness might have been set on the 15800 command line. */ 15801 15802 static void 15803 mips_swap_registers (unsigned int i) 15804 { 15805 int tmpi; 15806 const char *tmps; 15807 15808 #define SWAP_INT(X, Y) (tmpi = (X), (X) = (Y), (Y) = tmpi) 15809 #define SWAP_STRING(X, Y) (tmps = (X), (X) = (Y), (Y) = tmps) 15810 15811 SWAP_INT (fixed_regs[i], fixed_regs[i + 1]); 15812 SWAP_INT (call_used_regs[i], call_used_regs[i + 1]); 15813 SWAP_INT (call_really_used_regs[i], call_really_used_regs[i + 1]); 15814 SWAP_STRING (reg_names[i], reg_names[i + 1]); 15815 15816 #undef SWAP_STRING 15817 #undef SWAP_INT 15818 } 15819 15820 /* Implement CONDITIONAL_REGISTER_USAGE. */ 15821 15822 void 15823 mips_conditional_register_usage (void) 15824 { 15825 15826 if (ISA_HAS_DSP) 15827 { 15828 /* These DSP control register fields are global. */ 15829 global_regs[CCDSP_PO_REGNUM] = 1; 15830 global_regs[CCDSP_SC_REGNUM] = 1; 15831 } 15832 else 15833 { 15834 int regno; 15835 15836 for (regno = DSP_ACC_REG_FIRST; regno <= DSP_ACC_REG_LAST; regno++) 15837 fixed_regs[regno] = call_used_regs[regno] = 1; 15838 } 15839 if (!TARGET_HARD_FLOAT) 15840 { 15841 int regno; 15842 15843 for (regno = FP_REG_FIRST; regno <= FP_REG_LAST; regno++) 15844 fixed_regs[regno] = call_used_regs[regno] = 1; 15845 for (regno = ST_REG_FIRST; regno <= ST_REG_LAST; regno++) 15846 fixed_regs[regno] = call_used_regs[regno] = 1; 15847 } 15848 else if (! ISA_HAS_8CC) 15849 { 15850 int regno; 15851 15852 /* We only have a single condition-code register. We implement 15853 this by fixing all the condition-code registers and generating 15854 RTL that refers directly to ST_REG_FIRST. */ 15855 for (regno = ST_REG_FIRST; regno <= ST_REG_LAST; regno++) 15856 fixed_regs[regno] = call_used_regs[regno] = 1; 15857 } 15858 /* In MIPS16 mode, we permit the $t temporary registers to be used 15859 for reload. We prohibit the unused $s registers, since they 15860 are call-saved, and saving them via a MIPS16 register would 15861 probably waste more time than just reloading the value. */ 15862 if (TARGET_MIPS16) 15863 { 15864 fixed_regs[18] = call_used_regs[18] = 1; 15865 fixed_regs[19] = call_used_regs[19] = 1; 15866 fixed_regs[20] = call_used_regs[20] = 1; 15867 fixed_regs[21] = call_used_regs[21] = 1; 15868 fixed_regs[22] = call_used_regs[22] = 1; 15869 fixed_regs[23] = call_used_regs[23] = 1; 15870 fixed_regs[26] = call_used_regs[26] = 1; 15871 fixed_regs[27] = call_used_regs[27] = 1; 15872 fixed_regs[30] = call_used_regs[30] = 1; 15873 } 15874 /* $f20-$f23 are call-clobbered for n64. */ 15875 if (mips_abi == ABI_64) 15876 { 15877 int regno; 15878 for (regno = FP_REG_FIRST + 20; regno < FP_REG_FIRST + 24; regno++) 15879 call_really_used_regs[regno] = call_used_regs[regno] = 1; 15880 } 15881 /* Odd registers in the range $f21-$f31 (inclusive) are call-clobbered 15882 for n32. */ 15883 if (mips_abi == ABI_N32) 15884 { 15885 int regno; 15886 for (regno = FP_REG_FIRST + 21; regno <= FP_REG_FIRST + 31; regno+=2) 15887 call_really_used_regs[regno] = call_used_regs[regno] = 1; 15888 } 15889 /* Make sure that double-register accumulator values are correctly 15890 ordered for the current endianness. */ 15891 if (TARGET_LITTLE_ENDIAN) 15892 { 15893 unsigned int regno; 15894 15895 mips_swap_registers (MD_REG_FIRST); 15896 for (regno = DSP_ACC_REG_FIRST; regno <= DSP_ACC_REG_LAST; regno += 2) 15897 mips_swap_registers (regno); 15898 } 15899 } 15900 15901 /* Initialize vector TARGET to VALS. */ 15902 15903 void 15904 mips_expand_vector_init (rtx target, rtx vals) 15905 { 15906 enum machine_mode mode; 15907 enum machine_mode inner; 15908 unsigned int i, n_elts; 15909 rtx mem; 15910 15911 mode = GET_MODE (target); 15912 inner = GET_MODE_INNER (mode); 15913 n_elts = GET_MODE_NUNITS (mode); 15914 15915 gcc_assert (VECTOR_MODE_P (mode)); 15916 15917 mem = assign_stack_temp (mode, GET_MODE_SIZE (mode), 0); 15918 for (i = 0; i < n_elts; i++) 15919 emit_move_insn (adjust_address_nv (mem, inner, i * GET_MODE_SIZE (inner)), 15920 XVECEXP (vals, 0, i)); 15921 15922 emit_move_insn (target, mem); 15923 } 15924 15925 /* When generating MIPS16 code, we want to allocate $24 (T_REG) before 15926 other registers for instructions for which it is possible. This 15927 encourages the compiler to use CMP in cases where an XOR would 15928 require some register shuffling. */ 15929 15930 void 15931 mips_order_regs_for_local_alloc (void) 15932 { 15933 int i; 15934 15935 for (i = 0; i < FIRST_PSEUDO_REGISTER; i++) 15936 reg_alloc_order[i] = i; 15937 15938 if (TARGET_MIPS16) 15939 { 15940 /* It really doesn't matter where we put register 0, since it is 15941 a fixed register anyhow. */ 15942 reg_alloc_order[0] = 24; 15943 reg_alloc_order[24] = 0; 15944 } 15945 } 15946 15947 /* Implement EH_USES. */ 15948 15949 bool 15950 mips_eh_uses (unsigned int regno) 15951 { 15952 if (reload_completed && !TARGET_ABSOLUTE_JUMPS) 15953 { 15954 /* We need to force certain registers to be live in order to handle 15955 PIC long branches correctly. See mips_must_initialize_gp_p for 15956 details. */ 15957 if (mips_cfun_has_cprestore_slot_p ()) 15958 { 15959 if (regno == CPRESTORE_SLOT_REGNUM) 15960 return true; 15961 } 15962 else 15963 { 15964 if (cfun->machine->global_pointer == regno) 15965 return true; 15966 } 15967 } 15968 15969 return false; 15970 } 15971 15972 /* Implement EPILOGUE_USES. */ 15973 15974 bool 15975 mips_epilogue_uses (unsigned int regno) 15976 { 15977 /* Say that the epilogue uses the return address register. Note that 15978 in the case of sibcalls, the values "used by the epilogue" are 15979 considered live at the start of the called function. */ 15980 if (regno == RETURN_ADDR_REGNUM) 15981 return true; 15982 15983 /* If using a GOT, say that the epilogue also uses GOT_VERSION_REGNUM. 15984 See the comment above load_call<mode> for details. */ 15985 if (TARGET_USE_GOT && (regno) == GOT_VERSION_REGNUM) 15986 return true; 15987 15988 /* An interrupt handler must preserve some registers that are 15989 ordinarily call-clobbered. */ 15990 if (cfun->machine->interrupt_handler_p 15991 && mips_interrupt_extra_call_saved_reg_p (regno)) 15992 return true; 15993 15994 return false; 15995 } 15996 15997 /* A for_each_rtx callback. Stop the search if *X is an AT register. */ 15998 15999 static int 16000 mips_at_reg_p (rtx *x, void *data ATTRIBUTE_UNUSED) 16001 { 16002 return REG_P (*x) && REGNO (*x) == AT_REGNUM; 16003 } 16004 16005 /* Return true if INSN needs to be wrapped in ".set noat". 16006 INSN has NOPERANDS operands, stored in OPVEC. */ 16007 16008 static bool 16009 mips_need_noat_wrapper_p (rtx insn, rtx *opvec, int noperands) 16010 { 16011 int i; 16012 16013 if (recog_memoized (insn) >= 0) 16014 for (i = 0; i < noperands; i++) 16015 if (for_each_rtx (&opvec[i], mips_at_reg_p, NULL)) 16016 return true; 16017 return false; 16018 } 16019 16020 /* Implement FINAL_PRESCAN_INSN. */ 16021 16022 void 16023 mips_final_prescan_insn (rtx insn, rtx *opvec, int noperands) 16024 { 16025 if (mips_need_noat_wrapper_p (insn, opvec, noperands)) 16026 mips_push_asm_switch (&mips_noat); 16027 } 16028 16029 /* Implement TARGET_ASM_FINAL_POSTSCAN_INSN. */ 16030 16031 static void 16032 mips_final_postscan_insn (FILE *file ATTRIBUTE_UNUSED, rtx insn, 16033 rtx *opvec, int noperands) 16034 { 16035 if (mips_need_noat_wrapper_p (insn, opvec, noperands)) 16036 mips_pop_asm_switch (&mips_noat); 16037 } 16038 16039 /* Return the function that is used to expand the <u>mulsidi3 pattern. 16040 EXT_CODE is the code of the extension used. Return NULL if widening 16041 multiplication shouldn't be used. */ 16042 16043 mulsidi3_gen_fn 16044 mips_mulsidi3_gen_fn (enum rtx_code ext_code) 16045 { 16046 bool signed_p; 16047 16048 signed_p = ext_code == SIGN_EXTEND; 16049 if (TARGET_64BIT) 16050 { 16051 /* Don't use widening multiplication with MULT when we have DMUL. Even 16052 with the extension of its input operands DMUL is faster. Note that 16053 the extension is not needed for signed multiplication. In order to 16054 ensure that we always remove the redundant sign-extension in this 16055 case we still expand mulsidi3 for DMUL. */ 16056 if (ISA_HAS_DMUL3) 16057 return signed_p ? gen_mulsidi3_64bit_dmul : NULL; 16058 if (TARGET_FIX_R4000) 16059 return NULL; 16060 return signed_p ? gen_mulsidi3_64bit : gen_umulsidi3_64bit; 16061 } 16062 else 16063 { 16064 if (TARGET_FIX_R4000) 16065 return signed_p ? gen_mulsidi3_32bit_r4000 : gen_umulsidi3_32bit_r4000; 16066 if (ISA_HAS_DSPR2) 16067 return signed_p ? gen_mips_mult : gen_mips_multu; 16068 return signed_p ? gen_mulsidi3_32bit : gen_umulsidi3_32bit; 16069 } 16070 } 16071 16072 /* Return the size in bytes of the trampoline code, padded to 16073 TRAMPOLINE_ALIGNMENT bits. The static chain pointer and target 16074 function address immediately follow. */ 16075 16076 int 16077 mips_trampoline_code_size (void) 16078 { 16079 if (TARGET_USE_PIC_FN_ADDR_REG) 16080 return 4 * 4; 16081 else if (ptr_mode == DImode) 16082 return 8 * 4; 16083 else if (ISA_HAS_LOAD_DELAY) 16084 return 6 * 4; 16085 else 16086 return 4 * 4; 16087 } 16088 16089 /* Implement TARGET_TRAMPOLINE_INIT. */ 16090 16091 static void 16092 mips_trampoline_init (rtx m_tramp, tree fndecl, rtx chain_value) 16093 { 16094 rtx addr, end_addr, high, low, opcode, mem; 16095 rtx trampoline[8]; 16096 unsigned int i, j; 16097 HOST_WIDE_INT end_addr_offset, static_chain_offset, target_function_offset; 16098 16099 /* Work out the offsets of the pointers from the start of the 16100 trampoline code. */ 16101 end_addr_offset = mips_trampoline_code_size (); 16102 static_chain_offset = end_addr_offset; 16103 target_function_offset = static_chain_offset + GET_MODE_SIZE (ptr_mode); 16104 16105 /* Get pointers to the beginning and end of the code block. */ 16106 addr = force_reg (Pmode, XEXP (m_tramp, 0)); 16107 end_addr = mips_force_binary (Pmode, PLUS, addr, GEN_INT (end_addr_offset)); 16108 16109 #define OP(X) gen_int_mode (X, SImode) 16110 16111 /* Build up the code in TRAMPOLINE. */ 16112 i = 0; 16113 if (TARGET_USE_PIC_FN_ADDR_REG) 16114 { 16115 /* $25 contains the address of the trampoline. Emit code of the form: 16116 16117 l[wd] $1, target_function_offset($25) 16118 l[wd] $static_chain, static_chain_offset($25) 16119 jr $1 16120 move $25,$1. */ 16121 trampoline[i++] = OP (MIPS_LOAD_PTR (AT_REGNUM, 16122 target_function_offset, 16123 PIC_FUNCTION_ADDR_REGNUM)); 16124 trampoline[i++] = OP (MIPS_LOAD_PTR (STATIC_CHAIN_REGNUM, 16125 static_chain_offset, 16126 PIC_FUNCTION_ADDR_REGNUM)); 16127 trampoline[i++] = OP (MIPS_JR (AT_REGNUM)); 16128 trampoline[i++] = OP (MIPS_MOVE (PIC_FUNCTION_ADDR_REGNUM, AT_REGNUM)); 16129 } 16130 else if (ptr_mode == DImode) 16131 { 16132 /* It's too cumbersome to create the full 64-bit address, so let's 16133 instead use: 16134 16135 move $1, $31 16136 bal 1f 16137 nop 16138 1: l[wd] $25, target_function_offset - 12($31) 16139 l[wd] $static_chain, static_chain_offset - 12($31) 16140 jr $25 16141 move $31, $1 16142 16143 where 12 is the offset of "1:" from the start of the code block. */ 16144 trampoline[i++] = OP (MIPS_MOVE (AT_REGNUM, RETURN_ADDR_REGNUM)); 16145 trampoline[i++] = OP (MIPS_BAL (1)); 16146 trampoline[i++] = OP (MIPS_NOP); 16147 trampoline[i++] = OP (MIPS_LOAD_PTR (PIC_FUNCTION_ADDR_REGNUM, 16148 target_function_offset - 12, 16149 RETURN_ADDR_REGNUM)); 16150 trampoline[i++] = OP (MIPS_LOAD_PTR (STATIC_CHAIN_REGNUM, 16151 static_chain_offset - 12, 16152 RETURN_ADDR_REGNUM)); 16153 trampoline[i++] = OP (MIPS_JR (PIC_FUNCTION_ADDR_REGNUM)); 16154 trampoline[i++] = OP (MIPS_MOVE (RETURN_ADDR_REGNUM, AT_REGNUM)); 16155 } 16156 else 16157 { 16158 /* If the target has load delays, emit: 16159 16160 lui $1, %hi(end_addr) 16161 lw $25, %lo(end_addr + ...)($1) 16162 lw $static_chain, %lo(end_addr + ...)($1) 16163 jr $25 16164 nop 16165 16166 Otherwise emit: 16167 16168 lui $1, %hi(end_addr) 16169 lw $25, %lo(end_addr + ...)($1) 16170 jr $25 16171 lw $static_chain, %lo(end_addr + ...)($1). */ 16172 16173 /* Split END_ADDR into %hi and %lo values. Trampolines are aligned 16174 to 64 bits, so the %lo value will have the bottom 3 bits clear. */ 16175 high = expand_simple_binop (SImode, PLUS, end_addr, GEN_INT (0x8000), 16176 NULL, false, OPTAB_WIDEN); 16177 high = expand_simple_binop (SImode, LSHIFTRT, high, GEN_INT (16), 16178 NULL, false, OPTAB_WIDEN); 16179 low = convert_to_mode (SImode, gen_lowpart (HImode, end_addr), true); 16180 16181 /* Emit the LUI. */ 16182 opcode = OP (MIPS_LUI (AT_REGNUM, 0)); 16183 trampoline[i++] = expand_simple_binop (SImode, IOR, opcode, high, 16184 NULL, false, OPTAB_WIDEN); 16185 16186 /* Emit the load of the target function. */ 16187 opcode = OP (MIPS_LOAD_PTR (PIC_FUNCTION_ADDR_REGNUM, 16188 target_function_offset - end_addr_offset, 16189 AT_REGNUM)); 16190 trampoline[i++] = expand_simple_binop (SImode, IOR, opcode, low, 16191 NULL, false, OPTAB_WIDEN); 16192 16193 /* Emit the JR here, if we can. */ 16194 if (!ISA_HAS_LOAD_DELAY) 16195 trampoline[i++] = OP (MIPS_JR (PIC_FUNCTION_ADDR_REGNUM)); 16196 16197 /* Emit the load of the static chain register. */ 16198 opcode = OP (MIPS_LOAD_PTR (STATIC_CHAIN_REGNUM, 16199 static_chain_offset - end_addr_offset, 16200 AT_REGNUM)); 16201 trampoline[i++] = expand_simple_binop (SImode, IOR, opcode, low, 16202 NULL, false, OPTAB_WIDEN); 16203 16204 /* Emit the JR, if we couldn't above. */ 16205 if (ISA_HAS_LOAD_DELAY) 16206 { 16207 trampoline[i++] = OP (MIPS_JR (PIC_FUNCTION_ADDR_REGNUM)); 16208 trampoline[i++] = OP (MIPS_NOP); 16209 } 16210 } 16211 16212 #undef OP 16213 16214 /* Copy the trampoline code. Leave any padding uninitialized. */ 16215 for (j = 0; j < i; j++) 16216 { 16217 mem = adjust_address (m_tramp, SImode, j * GET_MODE_SIZE (SImode)); 16218 mips_emit_move (mem, trampoline[j]); 16219 } 16220 16221 /* Set up the static chain pointer field. */ 16222 mem = adjust_address (m_tramp, ptr_mode, static_chain_offset); 16223 mips_emit_move (mem, chain_value); 16224 16225 /* Set up the target function field. */ 16226 mem = adjust_address (m_tramp, ptr_mode, target_function_offset); 16227 mips_emit_move (mem, XEXP (DECL_RTL (fndecl), 0)); 16228 16229 /* Flush the code part of the trampoline. */ 16230 emit_insn (gen_add3_insn (end_addr, addr, GEN_INT (TRAMPOLINE_SIZE))); 16231 emit_insn (gen_clear_cache (addr, end_addr)); 16232 } 16233 16234 /* Implement FUNCTION_PROFILER. */ 16235 16236 void mips_function_profiler (FILE *file) 16237 { 16238 if (TARGET_MIPS16) 16239 sorry ("mips16 function profiling"); 16240 if (TARGET_LONG_CALLS) 16241 { 16242 /* For TARGET_LONG_CALLS use $3 for the address of _mcount. */ 16243 if (Pmode == DImode) 16244 fprintf (file, "\tdla\t%s,_mcount\n", reg_names[3]); 16245 else 16246 fprintf (file, "\tla\t%s,_mcount\n", reg_names[3]); 16247 } 16248 mips_push_asm_switch (&mips_noat); 16249 fprintf (file, "\tmove\t%s,%s\t\t# save current return address\n", 16250 reg_names[AT_REGNUM], reg_names[RETURN_ADDR_REGNUM]); 16251 /* _mcount treats $2 as the static chain register. */ 16252 if (cfun->static_chain_decl != NULL) 16253 fprintf (file, "\tmove\t%s,%s\n", reg_names[2], 16254 reg_names[STATIC_CHAIN_REGNUM]); 16255 if (TARGET_MCOUNT_RA_ADDRESS) 16256 { 16257 /* If TARGET_MCOUNT_RA_ADDRESS load $12 with the address of the 16258 ra save location. */ 16259 if (cfun->machine->frame.ra_fp_offset == 0) 16260 /* ra not saved, pass zero. */ 16261 fprintf (file, "\tmove\t%s,%s\n", reg_names[12], reg_names[0]); 16262 else 16263 fprintf (file, "\t%s\t%s," HOST_WIDE_INT_PRINT_DEC "(%s)\n", 16264 Pmode == DImode ? "dla" : "la", reg_names[12], 16265 cfun->machine->frame.ra_fp_offset, 16266 reg_names[STACK_POINTER_REGNUM]); 16267 } 16268 if (!TARGET_NEWABI) 16269 fprintf (file, 16270 "\t%s\t%s,%s,%d\t\t# _mcount pops 2 words from stack\n", 16271 TARGET_64BIT ? "dsubu" : "subu", 16272 reg_names[STACK_POINTER_REGNUM], 16273 reg_names[STACK_POINTER_REGNUM], 16274 Pmode == DImode ? 16 : 8); 16275 16276 if (TARGET_LONG_CALLS) 16277 fprintf (file, "\tjalr\t%s\n", reg_names[3]); 16278 else 16279 fprintf (file, "\tjal\t_mcount\n"); 16280 mips_pop_asm_switch (&mips_noat); 16281 /* _mcount treats $2 as the static chain register. */ 16282 if (cfun->static_chain_decl != NULL) 16283 fprintf (file, "\tmove\t%s,%s\n", reg_names[STATIC_CHAIN_REGNUM], 16284 reg_names[2]); 16285 } 16286 16287 /* Initialize the GCC target structure. */ 16288 #undef TARGET_ASM_ALIGNED_HI_OP 16289 #define TARGET_ASM_ALIGNED_HI_OP "\t.half\t" 16290 #undef TARGET_ASM_ALIGNED_SI_OP 16291 #define TARGET_ASM_ALIGNED_SI_OP "\t.word\t" 16292 #undef TARGET_ASM_ALIGNED_DI_OP 16293 #define TARGET_ASM_ALIGNED_DI_OP "\t.dword\t" 16294 16295 #undef TARGET_LEGITIMIZE_ADDRESS 16296 #define TARGET_LEGITIMIZE_ADDRESS mips_legitimize_address 16297 16298 #undef TARGET_ASM_FUNCTION_PROLOGUE 16299 #define TARGET_ASM_FUNCTION_PROLOGUE mips_output_function_prologue 16300 #undef TARGET_ASM_FUNCTION_EPILOGUE 16301 #define TARGET_ASM_FUNCTION_EPILOGUE mips_output_function_epilogue 16302 #undef TARGET_ASM_SELECT_RTX_SECTION 16303 #define TARGET_ASM_SELECT_RTX_SECTION mips_select_rtx_section 16304 #undef TARGET_ASM_FUNCTION_RODATA_SECTION 16305 #define TARGET_ASM_FUNCTION_RODATA_SECTION mips_function_rodata_section 16306 16307 #undef TARGET_SCHED_INIT 16308 #define TARGET_SCHED_INIT mips_sched_init 16309 #undef TARGET_SCHED_REORDER 16310 #define TARGET_SCHED_REORDER mips_sched_reorder 16311 #undef TARGET_SCHED_REORDER2 16312 #define TARGET_SCHED_REORDER2 mips_sched_reorder 16313 #undef TARGET_SCHED_VARIABLE_ISSUE 16314 #define TARGET_SCHED_VARIABLE_ISSUE mips_variable_issue 16315 #undef TARGET_SCHED_ADJUST_COST 16316 #define TARGET_SCHED_ADJUST_COST mips_adjust_cost 16317 #undef TARGET_SCHED_ISSUE_RATE 16318 #define TARGET_SCHED_ISSUE_RATE mips_issue_rate 16319 #undef TARGET_SCHED_INIT_DFA_POST_CYCLE_INSN 16320 #define TARGET_SCHED_INIT_DFA_POST_CYCLE_INSN mips_init_dfa_post_cycle_insn 16321 #undef TARGET_SCHED_DFA_POST_ADVANCE_CYCLE 16322 #define TARGET_SCHED_DFA_POST_ADVANCE_CYCLE mips_dfa_post_advance_cycle 16323 #undef TARGET_SCHED_FIRST_CYCLE_MULTIPASS_DFA_LOOKAHEAD 16324 #define TARGET_SCHED_FIRST_CYCLE_MULTIPASS_DFA_LOOKAHEAD \ 16325 mips_multipass_dfa_lookahead 16326 16327 #undef TARGET_DEFAULT_TARGET_FLAGS 16328 #define TARGET_DEFAULT_TARGET_FLAGS \ 16329 (TARGET_DEFAULT \ 16330 | TARGET_CPU_DEFAULT \ 16331 | TARGET_ENDIAN_DEFAULT \ 16332 | TARGET_FP_EXCEPTIONS_DEFAULT \ 16333 | MASK_CHECK_ZERO_DIV \ 16334 | MASK_FUSED_MADD) 16335 #undef TARGET_HANDLE_OPTION 16336 #define TARGET_HANDLE_OPTION mips_handle_option 16337 16338 #undef TARGET_FUNCTION_OK_FOR_SIBCALL 16339 #define TARGET_FUNCTION_OK_FOR_SIBCALL mips_function_ok_for_sibcall 16340 16341 #undef TARGET_INSERT_ATTRIBUTES 16342 #define TARGET_INSERT_ATTRIBUTES mips_insert_attributes 16343 #undef TARGET_MERGE_DECL_ATTRIBUTES 16344 #define TARGET_MERGE_DECL_ATTRIBUTES mips_merge_decl_attributes 16345 #undef TARGET_SET_CURRENT_FUNCTION 16346 #define TARGET_SET_CURRENT_FUNCTION mips_set_current_function 16347 16348 #undef TARGET_VALID_POINTER_MODE 16349 #define TARGET_VALID_POINTER_MODE mips_valid_pointer_mode 16350 #undef TARGET_RTX_COSTS 16351 #define TARGET_RTX_COSTS mips_rtx_costs 16352 #undef TARGET_ADDRESS_COST 16353 #define TARGET_ADDRESS_COST mips_address_cost 16354 16355 #undef TARGET_IN_SMALL_DATA_P 16356 #define TARGET_IN_SMALL_DATA_P mips_in_small_data_p 16357 16358 #undef TARGET_MACHINE_DEPENDENT_REORG 16359 #define TARGET_MACHINE_DEPENDENT_REORG mips_reorg 16360 16361 #undef TARGET_ASM_FILE_START 16362 #define TARGET_ASM_FILE_START mips_file_start 16363 #undef TARGET_ASM_FILE_START_FILE_DIRECTIVE 16364 #define TARGET_ASM_FILE_START_FILE_DIRECTIVE true 16365 16366 #undef TARGET_INIT_LIBFUNCS 16367 #define TARGET_INIT_LIBFUNCS mips_init_libfuncs 16368 16369 #undef TARGET_BUILD_BUILTIN_VA_LIST 16370 #define TARGET_BUILD_BUILTIN_VA_LIST mips_build_builtin_va_list 16371 #undef TARGET_EXPAND_BUILTIN_VA_START 16372 #define TARGET_EXPAND_BUILTIN_VA_START mips_va_start 16373 #undef TARGET_GIMPLIFY_VA_ARG_EXPR 16374 #define TARGET_GIMPLIFY_VA_ARG_EXPR mips_gimplify_va_arg_expr 16375 16376 #undef TARGET_PROMOTE_FUNCTION_MODE 16377 #define TARGET_PROMOTE_FUNCTION_MODE default_promote_function_mode_always_promote 16378 #undef TARGET_PROMOTE_PROTOTYPES 16379 #define TARGET_PROMOTE_PROTOTYPES hook_bool_const_tree_true 16380 16381 #undef TARGET_RETURN_IN_MEMORY 16382 #define TARGET_RETURN_IN_MEMORY mips_return_in_memory 16383 #undef TARGET_RETURN_IN_MSB 16384 #define TARGET_RETURN_IN_MSB mips_return_in_msb 16385 16386 #undef TARGET_ASM_OUTPUT_MI_THUNK 16387 #define TARGET_ASM_OUTPUT_MI_THUNK mips_output_mi_thunk 16388 #undef TARGET_ASM_CAN_OUTPUT_MI_THUNK 16389 #define TARGET_ASM_CAN_OUTPUT_MI_THUNK hook_bool_const_tree_hwi_hwi_const_tree_true 16390 16391 #undef TARGET_SETUP_INCOMING_VARARGS 16392 #define TARGET_SETUP_INCOMING_VARARGS mips_setup_incoming_varargs 16393 #undef TARGET_STRICT_ARGUMENT_NAMING 16394 #define TARGET_STRICT_ARGUMENT_NAMING mips_strict_argument_naming 16395 #undef TARGET_MUST_PASS_IN_STACK 16396 #define TARGET_MUST_PASS_IN_STACK must_pass_in_stack_var_size 16397 #undef TARGET_PASS_BY_REFERENCE 16398 #define TARGET_PASS_BY_REFERENCE mips_pass_by_reference 16399 #undef TARGET_CALLEE_COPIES 16400 #define TARGET_CALLEE_COPIES mips_callee_copies 16401 #undef TARGET_ARG_PARTIAL_BYTES 16402 #define TARGET_ARG_PARTIAL_BYTES mips_arg_partial_bytes 16403 16404 #undef TARGET_MODE_REP_EXTENDED 16405 #define TARGET_MODE_REP_EXTENDED mips_mode_rep_extended 16406 16407 #undef TARGET_VECTOR_MODE_SUPPORTED_P 16408 #define TARGET_VECTOR_MODE_SUPPORTED_P mips_vector_mode_supported_p 16409 16410 #undef TARGET_SCALAR_MODE_SUPPORTED_P 16411 #define TARGET_SCALAR_MODE_SUPPORTED_P mips_scalar_mode_supported_p 16412 16413 #undef TARGET_INIT_BUILTINS 16414 #define TARGET_INIT_BUILTINS mips_init_builtins 16415 #undef TARGET_EXPAND_BUILTIN 16416 #define TARGET_EXPAND_BUILTIN mips_expand_builtin 16417 16418 #undef TARGET_HAVE_TLS 16419 #define TARGET_HAVE_TLS HAVE_AS_TLS 16420 16421 #undef TARGET_CANNOT_FORCE_CONST_MEM 16422 #define TARGET_CANNOT_FORCE_CONST_MEM mips_cannot_force_const_mem 16423 16424 #undef TARGET_ENCODE_SECTION_INFO 16425 #define TARGET_ENCODE_SECTION_INFO mips_encode_section_info 16426 16427 #undef TARGET_ATTRIBUTE_TABLE 16428 #define TARGET_ATTRIBUTE_TABLE mips_attribute_table 16429 /* All our function attributes are related to how out-of-line copies should 16430 be compiled or called. They don't in themselves prevent inlining. */ 16431 #undef TARGET_FUNCTION_ATTRIBUTE_INLINABLE_P 16432 #define TARGET_FUNCTION_ATTRIBUTE_INLINABLE_P hook_bool_const_tree_true 16433 16434 #undef TARGET_EXTRA_LIVE_ON_ENTRY 16435 #define TARGET_EXTRA_LIVE_ON_ENTRY mips_extra_live_on_entry 16436 16437 #undef TARGET_USE_BLOCKS_FOR_CONSTANT_P 16438 #define TARGET_USE_BLOCKS_FOR_CONSTANT_P mips_use_blocks_for_constant_p 16439 #undef TARGET_USE_ANCHORS_FOR_SYMBOL_P 16440 #define TARGET_USE_ANCHORS_FOR_SYMBOL_P mips_use_anchors_for_symbol_p 16441 16442 #undef TARGET_COMP_TYPE_ATTRIBUTES 16443 #define TARGET_COMP_TYPE_ATTRIBUTES mips_comp_type_attributes 16444 16445 #ifdef HAVE_AS_DTPRELWORD 16446 #undef TARGET_ASM_OUTPUT_DWARF_DTPREL 16447 #define TARGET_ASM_OUTPUT_DWARF_DTPREL mips_output_dwarf_dtprel 16448 #endif 16449 #undef TARGET_DWARF_REGISTER_SPAN 16450 #define TARGET_DWARF_REGISTER_SPAN mips_dwarf_register_span 16451 16452 #undef TARGET_IRA_COVER_CLASSES 16453 #define TARGET_IRA_COVER_CLASSES mips_ira_cover_classes 16454 16455 #undef TARGET_ASM_FINAL_POSTSCAN_INSN 16456 #define TARGET_ASM_FINAL_POSTSCAN_INSN mips_final_postscan_insn 16457 16458 #undef TARGET_LEGITIMATE_ADDRESS_P 16459 #define TARGET_LEGITIMATE_ADDRESS_P mips_legitimate_address_p 16460 16461 #undef TARGET_FRAME_POINTER_REQUIRED 16462 #define TARGET_FRAME_POINTER_REQUIRED mips_frame_pointer_required 16463 16464 #undef TARGET_CAN_ELIMINATE 16465 #define TARGET_CAN_ELIMINATE mips_can_eliminate 16466 16467 #undef TARGET_TRAMPOLINE_INIT 16468 #define TARGET_TRAMPOLINE_INIT mips_trampoline_init 16469 16470 struct gcc_target targetm = TARGET_INITIALIZER; 16471 16472 #include "gt-mips.h" 16473