/* Target Definitions for NVPTX.
   Copyright (C) 2014-2015 Free Software Foundation, Inc.
   Contributed by Bernd Schmidt <bernds@codesourcery.com>

   This file is part of GCC.

   GCC is free software; you can redistribute it and/or modify it
   under the terms of the GNU General Public License as published
   by the Free Software Foundation; either version 3, or (at your
   option) any later version.

   GCC is distributed in the hope that it will be useful, but WITHOUT
   ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
   or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public
   License for more details.

   You should have received a copy of the GNU General Public License
   along with GCC; see the file COPYING3.  If not see
   <http://www.gnu.org/licenses/>.  */

#ifndef GCC_NVPTX_H
#define GCC_NVPTX_H

/* Run-time Target.  */

/* Link crt0.o only when -mmainkernel is given.  */
#define STARTFILE_SPEC "%{mmainkernel:crt0.o}"

#define TARGET_CPU_CPP_BUILTINS()               \
  do                                            \
    {                                           \
      builtin_assert ("machine=nvptx");         \
      builtin_assert ("cpu=nvptx");             \
      builtin_define ("__nvptx__");             \
    }                                           \
  while (0)

/* Avoid the default in ../../gcc.c, which adds "-pthread", which is not
   supported for nvptx.  */
#define GOMP_SELF_SPECS ""

/* Storage Layout.  */

#define BITS_BIG_ENDIAN 0
#define BYTES_BIG_ENDIAN 0
#define WORDS_BIG_ENDIAN 0

/* Chosen such that we won't have to deal with multi-word subregs.  */
#define UNITS_PER_WORD 8

#define PARM_BOUNDARY 8
#define STACK_BOUNDARY 64
#define FUNCTION_BOUNDARY 32
#define BIGGEST_ALIGNMENT 64
#define STRICT_ALIGNMENT 1

/* Copied from elf.h and other places.  We'd otherwise use
   BIGGEST_ALIGNMENT and fail a number of testcases.  */
#define MAX_OFILE_ALIGNMENT (32768 * 8)

/* Type Layout.  */

#define DEFAULT_SIGNED_CHAR 1

/* `long', size_t, ptrdiff_t and pointers all follow TARGET_ABI64:
   64 bits when it is set, 32 bits otherwise.  */
#define SHORT_TYPE_SIZE 16
#define INT_TYPE_SIZE 32
#define LONG_TYPE_SIZE (TARGET_ABI64 ? 64 : 32)
#define LONG_LONG_TYPE_SIZE 64
#define FLOAT_TYPE_SIZE 32
#define DOUBLE_TYPE_SIZE 64
#define LONG_DOUBLE_TYPE_SIZE 64

#undef SIZE_TYPE
#define SIZE_TYPE (TARGET_ABI64 ? "long unsigned int" : "unsigned int")
#undef PTRDIFF_TYPE
#define PTRDIFF_TYPE (TARGET_ABI64 ? "long int" : "int")

#define POINTER_SIZE (TARGET_ABI64 ? 64 : 32)

#define Pmode (TARGET_ABI64 ? DImode : SImode)

/* Registers.  Since ptx is a virtual target, we just define a few
   hard registers for special purposes and leave pseudos unallocated.  */

#define FIRST_PSEUDO_REGISTER 16
/* Hard registers 3 through 8 are the only ones not marked fixed.  */
#define FIXED_REGISTERS                                         \
  { 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1 }
#define CALL_USED_REGISTERS                                     \
  { 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1 }

/* Every value, whatever its mode, occupies exactly one hard register.  */
#define HARD_REGNO_NREGS(regno, mode) 1
#define CANNOT_CHANGE_MODE_CLASS(M1, M2, CLS) ((CLS) == RETURN_REG)
#define HARD_REGNO_MODE_OK(REG, MODE) nvptx_hard_regno_mode_ok (REG, MODE)

/* Register Classes.  */

enum reg_class
  {
    NO_REGS,
    RETURN_REG,
    ALL_REGS,
    LIM_REG_CLASSES
  };

#define N_REG_CLASSES (int) LIM_REG_CLASSES

/* Names are indexed by enum reg_class value, so they must be listed in
   exactly the order in which the enumerators are declared above.  */
#define REG_CLASS_NAMES {                       \
    "NO_REGS",                                  \
    "RETURN_REG",                               \
    "ALL_REGS" }

/* One bit per hard register; bit N set means register N is a member of
   the class.  RETURN_REG holds only NVPTX_RETURN_REGNUM (register 4),
   hence bit 4, in agreement with REGNO_REG_CLASS below.  */
#define REG_CLASS_CONTENTS                      \
{                                               \
  /* NO_REGS.  */                               \
  { 0x0000 },                                   \
  /* RETURN_REG.  */                            \
  { 0x0010 },                                   \
  /* ALL_REGS.  */                              \
  { 0xFFFF },                                   \
}

#define GENERAL_REGS ALL_REGS

/* The return-value register gets its own class; every other register
   is reported as ALL_REGS.  */
#define REGNO_REG_CLASS(R) \
  ((R) == NVPTX_RETURN_REGNUM ? RETURN_REG : ALL_REGS)

/* Addresses use a single base register and never an index register.  */
#define BASE_REG_CLASS ALL_REGS
#define INDEX_REG_CLASS NO_REGS

#define REGNO_OK_FOR_BASE_P(X) true
#define REGNO_OK_FOR_INDEX_P(X) false

#define CLASS_MAX_NREGS(class, mode) \
  ((GET_MODE_SIZE (mode) + UNITS_PER_WORD - 1) / UNITS_PER_WORD)

#define MODES_TIEABLE_P(M1, M2) false

/* Widen integer modes narrower than SImode to SImode.  UNSIGNEDP and
   TYPE are not examined.  */
#define PROMOTE_MODE(MODE, UNSIGNEDP, TYPE)             \
  if (GET_MODE_CLASS (MODE) == MODE_INT                 \
      && GET_MODE_SIZE (MODE) < GET_MODE_SIZE (SImode)) \
    {                                                   \
      (MODE) = SImode;                                  \
    }

/* Address spaces.  */
#define ADDR_SPACE_GLOBAL 1
#define ADDR_SPACE_SHARED 3
#define ADDR_SPACE_CONST 4
#define ADDR_SPACE_LOCAL 5
#define ADDR_SPACE_PARAM 101

/* Stack and Calling.  */

#define STARTING_FRAME_OFFSET 0
#define FRAME_GROWS_DOWNWARD 0
#define STACK_GROWS_DOWNWARD

/* Special-purpose hard register numbers.  The entries of REGISTER_NAMES
   further down are indexed by these numbers.  */
#define STACK_POINTER_REGNUM 1
#define HARD_FRAME_POINTER_REGNUM 2
#define NVPTX_PUNNING_BUFFER_REGNUM 3
#define NVPTX_RETURN_REGNUM 4
#define FRAME_POINTER_REGNUM 15
#define ARG_POINTER_REGNUM 14
#define RETURN_ADDR_REGNO 13

#define STATIC_CHAIN_REGNUM 12
#define OUTGOING_ARG_POINTER_REGNUM 11
#define OUTGOING_STATIC_CHAIN_REGNUM 10

#define FIRST_PARM_OFFSET(FNDECL) 0
#define PUSH_ARGS_REVERSED 1

#define ACCUMULATE_OUTGOING_ARGS 1

/* Only declared when HOST_WIDE_INT is available as a macro, since the
   structure has a member of that type.  */
#ifdef HOST_WIDE_INT
struct nvptx_args {
  union tree_node *fntype;
  /* Number of arguments passed in registers so far.  */
  int count;
  /* Offset into the stdarg area so far.  */
  HOST_WIDE_INT off;
};
#endif

#define CUMULATIVE_ARGS struct nvptx_args

/* Record the function type and reset both running counters.  LIBNAME,
   FNDECL and N_NAMED_ARGS are ignored.  */
#define INIT_CUMULATIVE_ARGS(CUM, FNTYPE, LIBNAME, FNDECL, N_NAMED_ARGS) \
  do { (CUM).fntype = (FNTYPE); (CUM).count = 0; (CUM).off = 0; } while (0)

#define FUNCTION_ARG_REGNO_P(r) 0

#define DEFAULT_PCC_STRUCT_RETURN 0

#define FUNCTION_PROFILER(file, labelno) \
  fatal_error (input_location, \
	       "profiling is not yet implemented for this architecture")

#define TRAMPOLINE_SIZE 32
#define TRAMPOLINE_ALIGNMENT 256

/* We don't run reload, so this isn't actually used, but it still needs to be
   defined.  Showing an argp->fp elimination also stops
   expand_builtin_setjmp_receiver from generating invalid insns.  */
#define ELIMINABLE_REGS                                 \
  {                                                     \
    { FRAME_POINTER_REGNUM, HARD_FRAME_POINTER_REGNUM}, \
    { ARG_POINTER_REGNUM, HARD_FRAME_POINTER_REGNUM}    \
  }

/* Define the offset between two registers, one to be eliminated, and the other
   its replacement, at the start of a routine.  */

#define INITIAL_ELIMINATION_OFFSET(FROM, TO, OFFSET) \
  ((OFFSET) = 0)

/* Addressing Modes.  */

#define MAX_REGS_PER_ADDRESS 1

#define LEGITIMATE_PIC_OPERAND_P(X) 1


struct nvptx_pseudo_info
{
  int true_size;
  int renumber;
};

/* Per-function target state.  As with struct nvptx_args, only declared
   when HOST_WIDE_INT is available.  */
#if defined HOST_WIDE_INT
struct GTY(()) machine_function
{
  rtx_expr_list *call_args;
  rtx start_call;
  tree funtype;
  bool has_call_with_varargs;
  bool has_call_with_sc;
  struct GTY((skip)) nvptx_pseudo_info *pseudos;
  HOST_WIDE_INT outgoing_stdarg_size;
  int ret_reg_mode;
  int punning_buffer_size;
};
#endif

/* Costs.  */

#define NO_FUNCTION_CSE 1
#define SLOW_BYTE_ACCESS 0
#define BRANCH_COST(speed_p, predictable_p) 6

/* Assembler Format.  */

#undef ASM_DECLARE_FUNCTION_NAME
#define ASM_DECLARE_FUNCTION_NAME(FILE, NAME, DECL) \
  nvptx_declare_function_name (FILE, NAME, DECL)

#undef ASM_DECLARE_FUNCTION_SIZE
#define ASM_DECLARE_FUNCTION_SIZE(STREAM, NAME, DECL) \
  nvptx_function_end (STREAM)

#define DWARF2_ASM_LINE_DEBUG_INFO 1

#undef ASM_APP_ON
#define ASM_APP_ON "\t// #APP \n"
#undef ASM_APP_OFF
#define ASM_APP_OFF "\t// #NO_APP \n"

/* Both deliberately expand to nothing.  */
#define ASM_OUTPUT_COMMON(stream, name, size, rounded)
#define ASM_OUTPUT_LOCAL(stream, name, size, rounded)

/* Indexed by hard register number; see the *_REGNUM definitions above.  */
#define REGISTER_NAMES                                                  \
  {                                                                     \
    "%hr0", "%outargs", "%hfp", "%punbuffer", "%retval", "%retval_in",  \
    "%hr6", "%hr7", "%hr8", "%hr9", "%hr10", "%hr11", "%hr12", "%hr13", \
    "%argp", "%frame"                                                   \
  }

#define DBX_REGISTER_NUMBER(N) N

#define TEXT_SECTION_ASM_OP ""
#define DATA_SECTION_ASM_OP ""

/* Build an internal label of the form `$' PREFIX NUM in LABEL.  */
#undef ASM_GENERATE_INTERNAL_LABEL
#define ASM_GENERATE_INTERNAL_LABEL(LABEL, PREFIX, NUM)         \
  do                                                            \
    {                                                           \
      char *__p;                                                \
      __p = stpcpy (&(LABEL)[1], PREFIX);                       \
      (LABEL)[0] = '$';                                         \
      sprint_ul (__p, (unsigned long) (NUM));                   \
    }                                                           \
  while (0)

/* Emits nothing; the arguments are only evaluated to avoid
   unused-value diagnostics.  */
#define ASM_OUTPUT_ALIGN(FILE, POWER)           \
  do                                            \
    {                                           \
      (void) (FILE);                            \
      (void) (POWER);                           \
    }                                           \
  while (0)

#define ASM_OUTPUT_SKIP(FILE, N) \
  nvptx_output_skip (FILE, N)

/* No trailing semicolon here: the user of the macro supplies it, so that
   the macro can be used as the body of an if/else.  */
#undef ASM_OUTPUT_ASCII
#define ASM_OUTPUT_ASCII(FILE, STR, LENGTH) \
  nvptx_output_ascii (FILE, STR, LENGTH)

#define ASM_DECLARE_OBJECT_NAME(FILE, NAME, DECL) \
  nvptx_declare_object_name (FILE, NAME, DECL)

/* Emit a marker comment followed by a .visible byte-array declaration
   for NAME; the array bound is printed only when SIZE is positive.
   The string literals around HOST_WIDE_INT_PRINT_DEC are separated by
   spaces so that C++11 does not lex the macro name as a literal
   suffix.  */
#undef ASM_OUTPUT_ALIGNED_DECL_COMMON
#define ASM_OUTPUT_ALIGNED_DECL_COMMON(FILE, DECL, NAME, SIZE, ALIGN)   \
  do                                                                    \
    {                                                                   \
      fprintf (FILE, "// BEGIN%s VAR DEF: ",                            \
	       TREE_PUBLIC (DECL) ? " GLOBAL" : "");                    \
      assemble_name_raw (FILE, NAME);                                   \
      fputc ('\n', FILE);                                               \
      const char *sec = nvptx_section_for_decl (DECL);                  \
      fprintf (FILE, ".visible%s.align %d .b8 ", sec,                   \
	       (ALIGN) / BITS_PER_UNIT);                                \
      assemble_name ((FILE), (NAME));                                   \
      if ((SIZE) > 0)                                                   \
	fprintf (FILE, "[" HOST_WIDE_INT_PRINT_DEC "]", (SIZE));        \
      fprintf (FILE, ";\n");                                            \
    }                                                                   \
  while (0)

/* Same output as ASM_OUTPUT_ALIGNED_DECL_COMMON, except that the marker
   comment never carries the " GLOBAL" tag.  */
#undef ASM_OUTPUT_ALIGNED_DECL_LOCAL
#define ASM_OUTPUT_ALIGNED_DECL_LOCAL(FILE, DECL, NAME, SIZE, ALIGN)    \
  do                                                                    \
    {                                                                   \
      fprintf (FILE, "// BEGIN VAR DEF: ");                             \
      assemble_name_raw (FILE, NAME);                                   \
      fputc ('\n', FILE);                                               \
      const char *sec = nvptx_section_for_decl (DECL);                  \
      fprintf (FILE, ".visible%s.align %d .b8 ", sec,                   \
	       (ALIGN) / BITS_PER_UNIT);                                \
      assemble_name ((FILE), (NAME));                                   \
      if ((SIZE) > 0)                                                   \
	fprintf (FILE, "[" HOST_WIDE_INT_PRINT_DEC "]", (SIZE));        \
      fprintf (FILE, ";\n");                                            \
    }                                                                   \
  while (0)

#define CASE_VECTOR_PC_RELATIVE flag_pic
#define JUMP_TABLES_IN_TEXT_SECTION flag_pic

#define ADDR_VEC_ALIGN(VEC) (JUMP_TABLES_IN_TEXT_SECTION ? 5 : 2)

/* Misc.  */

#define DWARF2_DEBUGGING_INFO 1

/* Both macros store the bit size of MODE in VALUE and evaluate to 2.  */
#define CLZ_DEFINED_VALUE_AT_ZERO(MODE, VALUE) \
  ((VALUE) = GET_MODE_BITSIZE ((MODE)), 2)
#define CTZ_DEFINED_VALUE_AT_ZERO(MODE, VALUE) \
  ((VALUE) = GET_MODE_BITSIZE ((MODE)), 2)

#define NO_DOT_IN_LABEL
#define ASM_COMMENT_START "//"

#define STORE_FLAG_VALUE -1
#define FLOAT_STORE_FLAG_VALUE(MODE) REAL_VALUE_ATOF("1.0", (MODE))

#define CASE_VECTOR_MODE SImode
#define MOVE_MAX 4
#define MOVE_RATIO(SPEED) 4
#define TRULY_NOOP_TRUNCATION(outprec, inprec) 1
#define FUNCTION_MODE QImode
#define HAS_INIT_SECTION 1

/* The C++ front end insists to link against libstdc++ -- which we don't build.
   Tell it to instead link against the innocuous libgcc.  */
#define LIBSTDCXX "gcc"

#endif /* GCC_NVPTX_H */