xref: /netbsd-src/external/gpl3/gcc.old/dist/gcc/common/config/aarch64/aarch64-common.c (revision 8feb0f0b7eaff0608f8350bbfa3098827b4bb91b)
1 /* Common hooks for AArch64.
2    Copyright (C) 2012-2020 Free Software Foundation, Inc.
3    Contributed by ARM Ltd.
4 
5    This file is part of GCC.
6 
7    GCC is free software; you can redistribute it and/or modify it
8    under the terms of the GNU General Public License as published
9    by the Free Software Foundation; either version 3, or (at your
10    option) any later version.
11 
12    GCC is distributed in the hope that it will be useful, but WITHOUT
13    ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
14    or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public
15    License for more details.
16 
17    You should have received a copy of the GNU General Public License
18    along with GCC; see the file COPYING3.  If not see
19    <http://www.gnu.org/licenses/>.  */
20 
21 #include "config.h"
22 #define INCLUDE_STRING
23 #include "system.h"
24 #include "coretypes.h"
25 #include "tm.h"
26 #include "memmodel.h"
27 #include "tm_p.h"
28 #include "common/common-target.h"
29 #include "common/common-target-def.h"
30 #include "opts.h"
31 #include "flags.h"
32 #include "diagnostic.h"
33 
34 #ifdef  TARGET_BIG_ENDIAN_DEFAULT
35 #undef  TARGET_DEFAULT_TARGET_FLAGS
36 #define TARGET_DEFAULT_TARGET_FLAGS (MASK_BIG_END)
37 #endif
38 
39 #undef  TARGET_HANDLE_OPTION
40 #define TARGET_HANDLE_OPTION aarch64_handle_option
41 
42 #undef	TARGET_OPTION_OPTIMIZATION_TABLE
43 #define TARGET_OPTION_OPTIMIZATION_TABLE aarch_option_optimization_table
44 #undef TARGET_OPTION_INIT_STRUCT
45 #define TARGET_OPTION_INIT_STRUCT aarch64_option_init_struct
46 
47 /* Set default optimization options.  */
48 static const struct default_options aarch_option_optimization_table[] =
49   {
50     /* Enable section anchors by default at -O1 or higher.  */
51     { OPT_LEVELS_1_PLUS, OPT_fsection_anchors, NULL, 1 },
52     /* Disable fomit-frame-pointer by default.  */
53     { OPT_LEVELS_ALL, OPT_fomit_frame_pointer, NULL, 0 },
54     /* Enable -fsched-pressure by default when optimizing.  */
55     { OPT_LEVELS_1_PLUS, OPT_fsched_pressure, NULL, 1 },
56     /* Enable redundant extension instructions removal at -O2 and higher.  */
57     { OPT_LEVELS_2_PLUS, OPT_free, NULL, 1 },
58 #if (TARGET_DEFAULT_ASYNC_UNWIND_TABLES == 1)
59     { OPT_LEVELS_ALL, OPT_fasynchronous_unwind_tables, NULL, 1 },
60     { OPT_LEVELS_ALL, OPT_funwind_tables, NULL, 1},
61 #endif
62     { OPT_LEVELS_ALL, OPT__param_stack_clash_protection_guard_size_, NULL,
63       DEFAULT_STK_CLASH_GUARD_SIZE == 0 ? 16 : DEFAULT_STK_CLASH_GUARD_SIZE },
64 
65     { OPT_LEVELS_NONE, 0, NULL, 0 }
66   };
67 
68 /* Implement TARGET_HANDLE_OPTION.
69    This function handles the target specific options for CPU/target selection.
70 
71    -mcpu=CPU is shorthand for -march=ARCH_FOR_CPU, -mtune=CPU.
72    If either of -march or -mtune is given, they override their
73    respective component of -mcpu.  This logic is implemented
74    in config/aarch64/aarch64.c:aarch64_override_options.  */
75 
76 bool
aarch64_handle_option(struct gcc_options * opts,struct gcc_options * opts_set ATTRIBUTE_UNUSED,const struct cl_decoded_option * decoded,location_t loc ATTRIBUTE_UNUSED)77 aarch64_handle_option (struct gcc_options *opts,
78 		       struct gcc_options *opts_set ATTRIBUTE_UNUSED,
79 		       const struct cl_decoded_option *decoded,
80 		       location_t loc ATTRIBUTE_UNUSED)
81 {
82   size_t code = decoded->opt_index;
83   const char *arg = decoded->arg;
84   int val = decoded->value;
85 
86   switch (code)
87     {
88     case OPT_march_:
89       opts->x_aarch64_arch_string = arg;
90       return true;
91 
92     case OPT_mcpu_:
93       opts->x_aarch64_cpu_string = arg;
94       return true;
95 
96     case OPT_mtune_:
97       opts->x_aarch64_tune_string = arg;
98       return true;
99 
100     case OPT_mgeneral_regs_only:
101       opts->x_target_flags |= MASK_GENERAL_REGS_ONLY;
102       return true;
103 
104     case OPT_mfix_cortex_a53_835769:
105       opts->x_aarch64_fix_a53_err835769 = val;
106       return true;
107 
108     case OPT_mstrict_align:
109       if (val)
110 	opts->x_target_flags |= MASK_STRICT_ALIGN;
111       else
112 	opts->x_target_flags &= ~MASK_STRICT_ALIGN;
113       return true;
114 
115     case OPT_momit_leaf_frame_pointer:
116       opts->x_flag_omit_leaf_frame_pointer = val;
117       return true;
118 
119     case OPT_moutline_atomics:
120       opts->x_aarch64_flag_outline_atomics = val;
121       return true;
122 
123     default:
124       return true;
125     }
126 }
127 
128 /* An ISA extension in the co-processor and main instruction set space.  */
129 struct aarch64_option_extension
130 {
131   const char *const name;
132   const uint64_t flag_canonical;
133   const uint64_t flags_on;
134   const uint64_t flags_off;
135   const bool is_synthetic;
136 };
137 
138 /* ISA extensions in AArch64.  */
139 static const struct aarch64_option_extension all_extensions[] =
140 {
141 #define AARCH64_OPT_EXTENSION(NAME, FLAG_CANONICAL, FLAGS_ON, FLAGS_OFF, \
142 			      SYNTHETIC, Z) \
143   {NAME, FLAG_CANONICAL, FLAGS_ON, FLAGS_OFF, SYNTHETIC},
144 #include "config/aarch64/aarch64-option-extensions.def"
145   {NULL, 0, 0, 0, false}
146 };
147 
148 /* A copy of the ISA extensions list for AArch64 sorted by the popcount of
149    bits and extension turned on.  Cached for efficiency.  */
150 static struct aarch64_option_extension all_extensions_by_on[] =
151 {
152 #define AARCH64_OPT_EXTENSION(NAME, FLAG_CANONICAL, FLAGS_ON, FLAGS_OFF, \
153 			      SYNTHETIC, Z) \
154   {NAME, FLAG_CANONICAL, FLAGS_ON, FLAGS_OFF, SYNTHETIC},
155 #include "config/aarch64/aarch64-option-extensions.def"
156   {NULL, 0, 0, 0, false}
157 };
158 
159 struct processor_name_to_arch
160 {
161   const std::string processor_name;
162   const enum aarch64_arch arch;
163   const uint64_t flags;
164 };
165 
166 struct arch_to_arch_name
167 {
168   const enum aarch64_arch arch;
169   const std::string arch_name;
170   const uint64_t flags;
171 };
172 
173 /* Map processor names to the architecture revision they implement and
174    the default set of architectural feature flags they support.  */
175 static const struct processor_name_to_arch all_cores[] =
176 {
177 #define AARCH64_CORE(NAME, X, IDENT, ARCH_IDENT, FLAGS, COSTS, IMP, PART, VARIANT) \
178   {NAME, AARCH64_ARCH_##ARCH_IDENT, FLAGS},
179 #include "config/aarch64/aarch64-cores.def"
180   {"generic", AARCH64_ARCH_8A, AARCH64_FL_FOR_ARCH8},
181   {"", aarch64_no_arch, 0}
182 };
183 
184 /* Map architecture revisions to their string representation.  */
185 static const struct arch_to_arch_name all_architectures[] =
186 {
187 #define AARCH64_ARCH(NAME, CORE, ARCH_IDENT, ARCH, FLAGS) \
188   {AARCH64_ARCH_##ARCH_IDENT, NAME, FLAGS},
189 #include "config/aarch64/aarch64-arches.def"
190   {aarch64_no_arch, "", 0}
191 };
192 
193 /* Parse the architecture extension string STR and update ISA_FLAGS
194    with the architecture features turned on or off.  Return a
195    aarch64_parse_opt_result describing the result.
196    When the STR string contains an invalid extension,
197    a copy of the string is created and stored to INVALID_EXTENSION.  */
198 
199 enum aarch64_parse_opt_result
aarch64_parse_extension(const char * str,uint64_t * isa_flags,std::string * invalid_extension)200 aarch64_parse_extension (const char *str, uint64_t *isa_flags,
201 			 std::string *invalid_extension)
202 {
203   /* The extension string is parsed left to right.  */
204   const struct aarch64_option_extension *opt = NULL;
205 
206   /* Flag to say whether we are adding or removing an extension.  */
207   int adding_ext = -1;
208 
209   while (str != NULL && *str != 0)
210     {
211       const char *ext;
212       size_t len;
213 
214       str++;
215       ext = strchr (str, '+');
216 
217       if (ext != NULL)
218 	len = ext - str;
219       else
220 	len = strlen (str);
221 
222       if (len >= 2 && strncmp (str, "no", 2) == 0)
223 	{
224 	  adding_ext = 0;
225 	  len -= 2;
226 	  str += 2;
227 	}
228       else if (len > 0)
229 	adding_ext = 1;
230 
231       if (len == 0)
232 	return AARCH64_PARSE_MISSING_ARG;
233 
234 
235       /* Scan over the extensions table trying to find an exact match.  */
236       for (opt = all_extensions; opt->name != NULL; opt++)
237 	{
238 	  if (strlen (opt->name) == len && strncmp (opt->name, str, len) == 0)
239 	    {
240 	      /* Add or remove the extension.  */
241 	      if (adding_ext)
242 		*isa_flags |= (opt->flags_on | opt->flag_canonical);
243 	      else
244 		*isa_flags &= ~(opt->flags_off | opt->flag_canonical);
245 	      break;
246 	    }
247 	}
248 
249       if (opt->name == NULL)
250 	{
251 	  /* Extension not found in list.  */
252 	  if (invalid_extension)
253 	    *invalid_extension = std::string (str, len);
254 	  return AARCH64_PARSE_INVALID_FEATURE;
255 	}
256 
257       str = ext;
258     };
259 
260   return AARCH64_PARSE_OK;
261 }
262 
263 /* Append all architecture extension candidates to the CANDIDATES vector.  */
264 
265 void
aarch64_get_all_extension_candidates(auto_vec<const char * > * candidates)266 aarch64_get_all_extension_candidates (auto_vec<const char *> *candidates)
267 {
268   const struct aarch64_option_extension *opt;
269   for (opt = all_extensions; opt->name != NULL; opt++)
270     candidates->safe_push (opt->name);
271 }
272 
273 /* Comparer to sort aarch64's feature extensions by population count. Largest
274    first.  */
275 
276 typedef const struct aarch64_option_extension opt_ext;
277 
opt_ext_cmp(const void * a,const void * b)278 int opt_ext_cmp (const void* a, const void* b)
279 {
280   opt_ext *opt_a = (opt_ext *)a;
281   opt_ext *opt_b = (opt_ext *)b;
282 
283   /* We consider the total set of bits an options turns on to be the union of
284      the singleton set containing the option itself and the set of options it
285      turns on as a dependency.  As an example +dotprod turns on FL_DOTPROD and
286      FL_SIMD.  As such the set of bits represented by this option is
287      {FL_DOTPROD, FL_SIMD}. */
288   uint64_t total_flags_a = opt_a->flag_canonical & opt_a->flags_on;
289   uint64_t total_flags_b = opt_b->flag_canonical & opt_b->flags_on;
290   int popcnt_a = popcount_hwi ((HOST_WIDE_INT)total_flags_a);
291   int popcnt_b = popcount_hwi ((HOST_WIDE_INT)total_flags_b);
292   int order = popcnt_b - popcnt_a;
293 
294   /* If they have the same amount of bits set, give it a more
295      deterministic ordering by using the value of the bits themselves.  */
296   if (order != 0)
297     return order;
298 
299   if (total_flags_a != total_flags_b)
300     return total_flags_a < total_flags_b ? 1 : -1;
301 
302   return 0;
303 }
304 
305 /* Implement TARGET_OPTION_INIT_STRUCT.  */
306 
307 static void
aarch64_option_init_struct(struct gcc_options * opts ATTRIBUTE_UNUSED)308 aarch64_option_init_struct (struct gcc_options *opts ATTRIBUTE_UNUSED)
309 {
310     /* Sort the extensions based on how many bits they set, order the larger
311        counts first.  We sort the list because this makes processing the
312        feature bits O(n) instead of O(n^2).  While n is small, the function
313        to calculate the feature strings is called on every options push,
314        pop and attribute change (arm_neon headers, lto etc all cause this to
315        happen quite frequently).  It is a trade-off between time and space and
316        so time won.  Keep NULL entry last.  */
317     int n_extensions
318       = sizeof (all_extensions_by_on) / sizeof (all_extensions_by_on[0]) - 1;
319     qsort (&all_extensions_by_on, n_extensions,
320 	   sizeof (struct aarch64_option_extension), opt_ext_cmp);
321 }
322 
323 /* Checks to see if enough bits from the option OPT are enabled in
324    ISA_FLAG_BITS to be able to replace the individual options with the
325    canonicalized version of the option.  This is done based on two rules:
326 
327    1) Synthetic groups, such as +crypto we only care about the bits that are
328       turned on. e.g. +aes+sha2 can be replaced with +crypto.
329 
330    2) Options that themselves have a bit, such as +rdma, in this case, all the
331       feature bits they turn on must be available and the bit for the option
332       itself must be.  In this case it's effectively a reduction rather than a
333       grouping. e.g. +fp+simd is not enough to turn on +rdma, for that you would
334       need +rdma+fp+simd which is reduced down to +rdma.
335 */
336 
337 static bool
aarch64_contains_opt(uint64_t isa_flag_bits,opt_ext * opt)338 aarch64_contains_opt (uint64_t isa_flag_bits, opt_ext *opt)
339 {
340   uint64_t flags_check
341     = opt->is_synthetic ? opt->flags_on : opt->flag_canonical;
342 
343   return (isa_flag_bits & flags_check) == flags_check;
344 }
345 
346 /* Return a string representation of ISA_FLAGS.  DEFAULT_ARCH_FLAGS
347    gives the default set of flags which are implied by whatever -march
348    we'd put out.  Our job is to figure out the minimal set of "+" and
349    "+no" feature flags to put out, and to put them out grouped such
350    that all the "+" flags come before the "+no" flags.  */
351 
352 std::string
aarch64_get_extension_string_for_isa_flags(uint64_t isa_flags,uint64_t default_arch_flags)353 aarch64_get_extension_string_for_isa_flags (uint64_t isa_flags,
354 					    uint64_t default_arch_flags)
355 {
356   const struct aarch64_option_extension *opt = NULL;
357   std::string outstr = "";
358 
359   uint64_t isa_flag_bits = isa_flags;
360 
361   /* Pass one: Minimize the search space by reducing the set of options
362      to the smallest set that still turns on the same features as before in
363      conjunction with the bits that are turned on by default for the selected
364      architecture.  */
365   for (opt = all_extensions_by_on; opt->name != NULL; opt++)
366     {
367       /* If the bit is on by default, then all the options it turns on are also
368 	 on by default due to the transitive dependencies.
369 
370          If the option is enabled explicitly in the set then we need to emit
371 	 an option for it.  Since this list is sorted by extensions setting the
372 	 largest number of featers first, we can be sure that nothing else will
373 	 ever need to set the bits we already set.  Consider the following
374 	 situation:
375 
376 	  Feat1 = A + B + C
377 	  Feat2 = A + B
378 	  Feat3 = A + D
379 	  Feat4 = B + C
380 	  Feat5 = C
381 
382 	The following results are expected:
383 
384 	  A + C = A + Feat5
385 	  B + C = Feat4
386 	  Feat4 + A = Feat1
387 	  Feat2 + Feat5 = Feat1
388 	  Feat1 + C = Feat1
389           Feat3 + Feat4 = Feat1 + D
390 
391 	This search assumes that all invidual feature bits are use visible,
392 	in other words the user must be able to do +A, +B, +C and +D.  */
393       if (aarch64_contains_opt (isa_flag_bits | default_arch_flags, opt))
394       {
395 	/* We remove all the dependent bits, to prevent them from being turned
396 	   on twice.  This only works because we assume that all there are
397 	   individual options to set all bits standalone.  */
398 
399 	/* PR target/94396.
400 
401 	   For flags which would already imply a bit that's on by default (e.g
402 	   fp16fml which implies +fp,+fp16) we must emit the flags that are not
403 	   on by default.  i.e. in Armv8.4-a +fp16fml is default if +fp16.  So
404 	   if a user passes armv8.4-a+fp16 (or +fp16fml) then we need to emit
405 	   +fp16.  But if +fp16fml is used in an architecture where it is
406 	   completely optional we only have to emit the canonical flag.  */
407 	uint64_t toggle_bits = opt->flags_on & default_arch_flags;
408 	/* Now check to see if the canonical flag is on by default.  If it
409 	   is not then enabling it will enable all bits in flags_on.  */
410 	if ((opt->flag_canonical & default_arch_flags) == 0)
411 	  toggle_bits = opt->flags_on;
412 
413 	isa_flag_bits &= ~toggle_bits;
414 	isa_flag_bits |= opt->flag_canonical;
415       }
416     }
417 
418    /* By toggling bits on and off, we may have set bits on that are already
419       enabled by default.  So we mask the default set out so we don't emit an
420       option for them.  Instead of checking for this each time during Pass One
421       we just mask all default bits away at the end.  */
422    isa_flag_bits &= ~default_arch_flags;
423 
424    /* We now have the smallest set of features we need to process.  A subsequent
425       linear scan of the bits in isa_flag_bits will allow us to print the ext
426       names.  However as a special case if CRC was enabled before, always print
427       it.  This is required because some CPUs have an incorrect specification
428       in older assemblers.  Even though CRC should be the default for these
429       cases the -mcpu values won't turn it on.  */
430   if (isa_flags & AARCH64_ISA_CRC)
431     isa_flag_bits |= AARCH64_ISA_CRC;
432 
433   /* Pass Two:
434      Print the option names that we're sure we must turn on.  These are only
435      optional extension names.  Mandatory ones have already been removed and
436      ones we explicitly want off have been too.  */
437   for (opt = all_extensions_by_on; opt->name != NULL; opt++)
438     {
439       if (isa_flag_bits & opt->flag_canonical)
440 	{
441 	  outstr += "+";
442 	  outstr += opt->name;
443 	}
444     }
445 
446   /* Pass Three:
447      Print out a +no for any mandatory extension that we are
448      turning off.  By this point aarch64_parse_extension would have ensured
449      that any optional extensions are turned off.  The only things left are
450      things that can't be turned off usually, e.g. something that is on by
451      default because it's mandatory and we want it off.  For turning off bits
452      we don't guarantee the smallest set of flags, but instead just emit all
453      options the user has specified.
454 
455      The assembler requires all +<opts> to be printed before +no<opts>.  */
456   for (opt = all_extensions_by_on; opt->name != NULL; opt++)
457     {
458       if ((~isa_flags) & opt->flag_canonical
459 		&& !((~default_arch_flags) & opt->flag_canonical))
460 	{
461 	  outstr += "+no";
462 	  outstr += opt->name;
463 	}
464     }
465 
466   return outstr;
467 }
468 
469 /* Attempt to rewrite NAME, which has been passed on the command line
470    as a -mcpu option to an equivalent -march value.  If we can do so,
471    return the new string, otherwise return an error.  */
472 
473 const char *
aarch64_rewrite_selected_cpu(const char * name)474 aarch64_rewrite_selected_cpu (const char *name)
475 {
476   std::string original_string (name);
477   std::string extension_str;
478   std::string processor;
479   size_t extension_pos = original_string.find_first_of ('+');
480 
481   /* Strip and save the extension string.  */
482   if (extension_pos != std::string::npos)
483     {
484       processor = original_string.substr (0, extension_pos);
485       extension_str = original_string.substr (extension_pos,
486 					      std::string::npos);
487     }
488   else
489     {
490       /* No extensions.  */
491       processor = original_string;
492     }
493 
494   const struct processor_name_to_arch* p_to_a;
495   for (p_to_a = all_cores;
496        p_to_a->arch != aarch64_no_arch;
497        p_to_a++)
498     {
499       if (p_to_a->processor_name == processor)
500 	break;
501     }
502 
503   const struct arch_to_arch_name* a_to_an;
504   for (a_to_an = all_architectures;
505        a_to_an->arch != aarch64_no_arch;
506        a_to_an++)
507     {
508       if (a_to_an->arch == p_to_a->arch)
509 	break;
510     }
511 
512   /* We couldn't find that proceesor name, or the processor name we
513      found does not map to an architecture we understand.  */
514   if (p_to_a->arch == aarch64_no_arch
515       || a_to_an->arch == aarch64_no_arch)
516     fatal_error (input_location, "unknown value %qs for %<-mcpu%>", name);
517 
518   uint64_t extensions = p_to_a->flags;
519   aarch64_parse_extension (extension_str.c_str (), &extensions, NULL);
520 
521   std::string outstr = a_to_an->arch_name
522 	+ aarch64_get_extension_string_for_isa_flags (extensions,
523 						      a_to_an->flags);
524 
525   /* We are going to memory leak here, nobody elsewhere
526      in the callchain is going to clean up after us.  The alternative is
527      to allocate a static buffer, and assert that it is big enough for our
528      modified string, which seems much worse!  */
529   return xstrdup (outstr.c_str ());
530 }
531 
532 /* Called by the driver to rewrite a name passed to the -mcpu
533    argument in preparation to be passed to the assembler.  The
534    names passed from the commend line will be in ARGV, we want
535    to use the right-most argument, which should be in
536    ARGV[ARGC - 1].  ARGC should always be greater than 0.  */
537 
538 const char *
aarch64_rewrite_mcpu(int argc,const char ** argv)539 aarch64_rewrite_mcpu (int argc, const char **argv)
540 {
541   gcc_assert (argc);
542   return aarch64_rewrite_selected_cpu (argv[argc - 1]);
543 }
544 
545 struct gcc_targetm_common targetm_common = TARGETM_COMMON_INITIALIZER;
546 
547 #undef AARCH64_CPU_NAME_LENGTH
548 
549