xref: /netbsd-src/external/lgpl3/gmp/dist/mpn/x86_64/fat/gmp-mparam.h (revision d11b170b9000ada93db553723522a63d5deac310)
1 /* Fat binary x86_64 gmp-mparam.h -- Compiler/machine parameter header file.
2 
3 Copyright 1991, 1993, 1994, 2000, 2001, 2002, 2003, 2009, 2011 Free Software
4 Foundation, Inc.
5 
6 This file is part of the GNU MP Library.
7 
8 The GNU MP Library is free software; you can redistribute it and/or modify
9 it under the terms of the GNU Lesser General Public License as published by
10 the Free Software Foundation; either version 3 of the License, or (at your
11 option) any later version.
12 
13 The GNU MP Library is distributed in the hope that it will be useful, but
14 WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
15 or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public
16 License for more details.
17 
18 You should have received a copy of the GNU Lesser General Public License
19 along with the GNU MP Library.  If not, see http://www.gnu.org/licenses/.  */
20 
/* Limb size used by this header, given both in bits and in bytes.  The two
   values describe the same quantity (8 bytes * 8 bits = 64 bits), so they
   must be changed together.  */
21 #define GMP_LIMB_BITS 64
22 #define BYTES_PER_MP_LIMB 8
23 
24 
25 /* mpn_divexact_1 is faster than mpn_divrem_1 at all sizes.  The only time
26    this might not be true currently is for actual 80386 and 80486 chips,
27    where mpn/x86/dive_1.asm might be slower than mpn/x86/divrem_1.asm, but
28    that's not worth worrying about.  */
/* NOTE(review): the 80386/80486 caveat above names files under mpn/x86 (the
   32-bit tree) and chips that are 32-bit only, so it looks inherited from a
   32-bit x86 header and should not apply to this x86_64 file -- confirm.
   A threshold of 0 presumably selects mpn_divexact_1 at every size, matching
   the "at all sizes" statement above -- confirm against users of the macro.  */
29 #define DIVEXACT_1_THRESHOLD  0
30 
31 /* Only some of the x86s have an mpn_preinv_divrem_1, but we set
32    USE_PREINV_DIVREM_1 so that all callers use it, and then let the
33    __gmpn_cpuvec pointer go to plain mpn_divrem_1 if there's not an actual
34    preinv.  */
/* In other words: this flag is unconditionally 1 here, and per the comment
   above the choice between a real preinv routine and plain mpn_divrem_1 is
   made through the __gmpn_cpuvec pointer rather than by this macro.  */
35 #define USE_PREINV_DIVREM_1   1
36 
/* No rationale for this value is recorded in this file.
   NOTE(review): presumably a generic, untuned value in the same spirit as
   the "sensible fallbacks" given for the Toom thresholds in this header --
   confirm before changing.  */
37 #define BMOD_1_TO_MOD_1_THRESHOLD           20
38 
39 /* mpn_sqr_basecase is faster than mpn_mul_basecase at all sizes, no need
40    for mpn_sqr to call the latter.  */
/* NOTE(review): 0 presumably means "use mpn_sqr_basecase from the smallest
   size upward", consistent with the comment above -- confirm against the
   code that tests this macro.  */
41 #define SQR_BASECASE_THRESHOLD 0
42 
43 /* Sensible fallbacks for these, when not taken from a cpu-specific
44    gmp-mparam.h.  */
/* Within each pair the first threshold is below the second (20 < 130 for
   multiplication, 30 < 200 for squaring).
   NOTE(review): presumably that ordering must be kept if these values are
   retuned -- confirm against the code that consumes them.  */
45 #define MUL_TOOM22_THRESHOLD      20
46 #define MUL_TOOM33_THRESHOLD     130
47 #define SQR_TOOM2_THRESHOLD       30
48 #define SQR_TOOM3_THRESHOLD      200
49 
50 /* These are values more or less in the middle of what the typical x86 chips
51    come out as.  For a fat binary it's necessary to have values for these,
52    since the defaults for MUL_FFT_TABLE and SQR_FFT_TABLE otherwise come out
53    as non-constant array initializers.  FIXME: Perhaps these should be done
54    in the cpuvec structure like other thresholds.  */
/* Each *_FFT_TABLE expands to a brace-enclosed initializer list of six
   increasing values followed by a final 0.
   NOTE(review): the trailing 0 is presumably an end-of-table marker --
   confirm against the code that reads the table before editing.
   In both groups the MODF threshold is below the plain FFT threshold
   (400 < 2000 for multiplication, 500 < 3000 for squaring).  */
55 #define MUL_FFT_TABLE  { 464, 928, 1920, 3584, 10240, 40960, 0 }
56 #define MUL_FFT_MODF_THRESHOLD          400
57 #define MUL_FFT_THRESHOLD              2000
58 
/* Squaring counterparts of the three multiplication FFT parameters above.  */
59 #define SQR_FFT_TABLE  { 528, 1184, 1920, 4608, 14336, 40960, 0 }
60 #define SQR_FFT_MODF_THRESHOLD          500
61 #define SQR_FFT_THRESHOLD              3000
62