xref: /netbsd-src/external/lgpl3/gmp/dist/mpn/x86/atom/gmp-mparam.h (revision 72c7faa4dbb41dbb0238d6b4a109da0d4b236dd4)
1 /* Intel Atom/32 gmp-mparam.h -- Compiler/machine parameter header file.
2 
3 Copyright 2019 Free Software Foundation, Inc.
4 
5 This file is part of the GNU MP Library.
6 
7 The GNU MP Library is free software; you can redistribute it and/or modify
8 it under the terms of either:
9 
10   * the GNU Lesser General Public License as published by the Free
11     Software Foundation; either version 3 of the License, or (at your
12     option) any later version.
13 
14 or
15 
16   * the GNU General Public License as published by the Free Software
17     Foundation; either version 2 of the License, or (at your option) any
18     later version.
19 
20 or both in parallel, as here.
21 
22 The GNU MP Library is distributed in the hope that it will be useful, but
23 WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
24 or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
25 for more details.
26 
27 You should have received copies of the GNU General Public License and the
28 GNU Lesser General Public License along with the GNU MP Library.  If not,
29 see https://www.gnu.org/licenses/.  */
30 
/* Limb geometry for this configuration (the file header calls it
   "Intel Atom/32"): 32 bits per limb, stored in 4 bytes.  The two
   values agree with each other (4 bytes * 8 bits = 32 bits).  */
31 #define GMP_LIMB_BITS 32
32 #define GMP_LIMB_BYTES 4
33 
34 /* 1600 MHz Diamondville (Atom 330) */
35 /* FFT tuning limit = 67,000,000 */
36 /* Generated by tuneup.c, 2019-10-18, gcc 8.3 */
37 
/* Tuned parameters for the MOD_1, PREINV, DIV_QR, DIVEXACT_1 and BMOD_1
   families.  This file states that its values were generated by
   tuneup.c; the trailing "never" / "always" / "native" / "N% faster"
   remarks are part of that generated output.

   Three DIV_QR thresholds are set to MP_SIZE_T_MAX, which is not defined
   in this file and must come from elsewhere; they are annotated "never".
   Two thresholds are 0; one is annotated "always (native)", the other
   "never mpn_mod_1s_2p".

   NOTE(review): the *_THRESHOLD values are presumably operand sizes in
   limbs at which the named routine takes over, and the *_METHOD /
   USE_* values presumably select among alternative implementations --
   confirm against the GMP tuning documentation.  */
38 #define MOD_1_NORM_THRESHOLD                 3
39 #define MOD_1_UNNORM_THRESHOLD               5
40 #define MOD_1N_TO_MOD_1_1_THRESHOLD         11
41 #define MOD_1U_TO_MOD_1_1_THRESHOLD          5
42 #define MOD_1_1_TO_MOD_1_2_THRESHOLD        10
43 #define MOD_1_2_TO_MOD_1_4_THRESHOLD         0  /* never mpn_mod_1s_2p */
44 #define PREINV_MOD_1_TO_MOD_1_THRESHOLD     17
45 #define USE_PREINV_DIVREM_1                  1  /* native */
46 #define DIV_QR_1N_PI1_METHOD                 1  /* 72.60% faster than 2 */
47 #define DIV_QR_1_NORM_THRESHOLD          MP_SIZE_T_MAX  /* never */
48 #define DIV_QR_1_UNNORM_THRESHOLD        MP_SIZE_T_MAX  /* never */
49 #define DIV_QR_2_PI2_THRESHOLD           MP_SIZE_T_MAX  /* never */
50 #define DIVEXACT_1_THRESHOLD                 0  /* always (native) */
51 #define BMOD_1_TO_MOD_1_THRESHOLD           35
52 
/* Unlike its neighbours this is named as a percentage, not a threshold.
   NOTE(review): presumably the measured cost of the DIV_1 operation
   relative to MUL_1 (i.e. 236%) -- confirm against tuneup.c.  */
53 #define DIV_1_VS_MUL_1_PERCENT             236
54 
/* Multiplication thresholds, one per Toom variant named in the macro.
   The values are strictly increasing: 22 < 81 < 178 < 270 < 399.
   NOTE(review): presumably the operand size in limbs at which
   multiplication switches to the named variant -- confirm against the
   GMP algorithm documentation.  */
55 #define MUL_TOOM22_THRESHOLD                22
56 #define MUL_TOOM33_THRESHOLD                81
57 #define MUL_TOOM44_THRESHOLD               178
58 #define MUL_TOOM6H_THRESHOLD               270
59 #define MUL_TOOM8H_THRESHOLD               399
60 
/* Crossover values between the two Toom variants named in each macro
   (FROM_TO_TO form).
   NOTE(review): presumably consulted when the two multiplication
   operands differ in size -- confirm in the multiplication code that
   reads these macros.  */
61 #define MUL_TOOM32_TO_TOOM43_THRESHOLD      97
62 #define MUL_TOOM32_TO_TOOM53_THRESHOLD     126
63 #define MUL_TOOM42_TO_TOOM53_THRESHOLD     115
64 #define MUL_TOOM42_TO_TOOM63_THRESHOLD     129
65 #define MUL_TOOM43_TO_TOOM54_THRESHOLD     115
66 
/* Squaring thresholds.  The values are strictly increasing:
   0 < 32 < 117 < 178 < 366 < 527.  The basecase entry is 0 and is
   annotated "always (native)" by the generator.
   NOTE(review): presumably operand sizes in limbs at which squaring
   switches to the named algorithm -- confirm against the GMP
   documentation.  */
67 #define SQR_BASECASE_THRESHOLD               0  /* always (native) */
68 #define SQR_TOOM2_THRESHOLD                 32
69 #define SQR_TOOM3_THRESHOLD                117
70 #define SQR_TOOM4_THRESHOLD                178
71 #define SQR_TOOM6_THRESHOLD                366
72 #define SQR_TOOM8_THRESHOLD                527
73 
/* NOTE(review): presumably the size at which the MULMID operation
   switches to its TOOM42 variant -- confirm against the code that
   reads this macro.  */
74 #define MULMID_TOOM42_THRESHOLD             50
75 
/* Paired thresholds for the multiply (MULMOD) and square (SQRMOD)
   forms of the BNM1 operation.
   NOTE(review): BNM1 presumably denotes arithmetic modulo B^n - 1 --
   confirm against the GMP sources.  */
76 #define MULMOD_BNM1_THRESHOLD               13
77 #define SQRMOD_BNM1_THRESHOLD               17
78 
/* FFT multiplication parameters.

   MUL_FFT_TABLE3 expands to a brace-enclosed list of { value, k } pairs.
   It holds 158 pairs (39 rows of four plus a final row of two), which
   matches MUL_FFT_TABLE3_SIZE; keep the two in step if the table is ever
   regenerated.  The first pair, { 404, 5 }, repeats
   MUL_FFT_MODF_THRESHOLD and its "k = 5" annotation.

   NOTE(review): each pair presumably maps a size bound to the FFT split
   parameter k to use from that size on -- confirm against the FFT
   multiplication code that consumes this table.  */
79 #define MUL_FFT_MODF_THRESHOLD             404  /* k = 5 */
80 #define MUL_FFT_TABLE3                                      \
81   { {    404, 5}, {     21, 6}, {     11, 5}, {     23, 6}, \
82     {     12, 5}, {     25, 6}, {     13, 5}, {     27, 6}, \
83     {     21, 7}, {     11, 6}, {     25, 7}, {     13, 6}, \
84     {     27, 7}, {     15, 6}, {     31, 7}, {     21, 8}, \
85     {     11, 7}, {     27, 8}, {     15, 7}, {     35, 8}, \
86     {     19, 7}, {     39, 8}, {     23, 7}, {     47, 8}, \
87     {     27, 9}, {     15, 8}, {     39, 9}, {     23, 8}, \
88     {     51,10}, {     15, 9}, {     31, 8}, {     67, 9}, \
89     {     39, 8}, {     79, 9}, {     47, 8}, {     95,10}, \
90     {     31, 9}, {     79,10}, {     47, 9}, {     95,11}, \
91     {     31,10}, {     63, 9}, {    135,10}, {     79, 9}, \
92     {    159,10}, {     95, 9}, {    191,10}, {    111,11}, \
93     {     63,10}, {    127, 9}, {    255, 8}, {    511,10}, \
94     {    143, 9}, {    287, 8}, {    575, 9}, {    303,10}, \
95     {    159,11}, {     95,10}, {    191, 9}, {    383,12}, \
96     {     63,11}, {    127,10}, {    255, 9}, {    511,10}, \
97     {    271, 9}, {    543,10}, {    287, 9}, {    575,10}, \
98     {    303,11}, {    159,10}, {    351, 9}, {    703,10}, \
99     {    367, 9}, {    735,11}, {    191,10}, {    383, 9}, \
100     {    767,10}, {    415,11}, {    223,10}, {    447,12}, \
101     {    127,11}, {    255,10}, {    543,11}, {    287,10}, \
102     {    607,11}, {    319,10}, {    671,11}, {    351,10}, \
103     {    735,12}, {    191,11}, {    383,10}, {    767,11}, \
104     {    415,10}, {    831,11}, {    447,13}, {    127,12}, \
105     {    255,11}, {    543,10}, {   1087,11}, {    607,12}, \
106     {    319,11}, {    735,12}, {    383,11}, {    831,12}, \
107     {    447,11}, {    959,13}, {    255,12}, {    511,11}, \
108     {   1087,12}, {    575,11}, {   1215,12}, {    639,11}, \
109     {   1279,12}, {    703,11}, {   1407,13}, {    383,12}, \
110     {    831,11}, {   1663,12}, {    959,14}, {    255,13}, \
111     {    511,12}, {   1215,13}, {    639,12}, {   1471,13}, \
112     {    767,12}, {   1599,13}, {    895,12}, {   1791,14}, \
113     {    511,13}, {   1023,12}, {   2111,13}, {   1151,12}, \
114     {   2431,13}, {   1407,14}, {    767,13}, {   1663,12}, \
115     {   3455,13}, {   1791,15}, {    511,14}, {   1023,13}, \
116     {   2431,14}, {   1279,13}, {   2943,12}, {   5887,14}, \
117     {   1535,13}, {   3455,14}, {   1791,13}, {   3839,15}, \
118     {   1023,14}, {   2047,13}, {   4223,14}, {   2303,13}, \
119     {   4991,12}, {   9983,14}, {   2815,13}, {   5887,15}, \
120     {   1535,14}, {   3839,16} }
121 #define MUL_FFT_TABLE3_SIZE 158
122 #define MUL_FFT_THRESHOLD                 4544
123 
/* FFT squaring parameters.

   SQR_FFT_TABLE3 expands to a brace-enclosed list of { value, k } pairs.
   It holds 161 pairs (40 rows of four plus a final row of one), which
   matches SQR_FFT_TABLE3_SIZE; keep the two in step if the table is ever
   regenerated.  The first pair, { 368, 5 }, repeats
   SQR_FFT_MODF_THRESHOLD and its "k = 5" annotation.

   NOTE(review): each pair presumably maps a size bound to the FFT split
   parameter k to use from that size on -- confirm against the FFT
   code that consumes this table.  */
124 #define SQR_FFT_MODF_THRESHOLD             368  /* k = 5 */
125 #define SQR_FFT_TABLE3                                      \
126   { {    368, 5}, {     23, 6}, {     12, 5}, {     25, 6}, \
127     {     13, 5}, {     27, 6}, {     25, 7}, {     13, 6}, \
128     {     28, 7}, {     15, 6}, {     31, 7}, {     17, 6}, \
129     {     35, 7}, {     21, 8}, {     11, 7}, {     27, 8}, \
130     {     15, 7}, {     35, 8}, {     19, 7}, {     41, 8}, \
131     {     23, 7}, {     47, 8}, {     27, 9}, {     15, 8}, \
132     {     39, 9}, {     23, 8}, {     51,10}, {     15, 9}, \
133     {     31, 8}, {     63, 9}, {     39, 8}, {     79, 9}, \
134     {     47,10}, {     31, 9}, {     79,10}, {     47, 9}, \
135     {     95,11}, {     31,10}, {     63, 9}, {    127, 8}, \
136     {    255, 9}, {    135,10}, {     79, 9}, {    159, 8}, \
137     {    319,10}, {     95, 9}, {    191,11}, {     63,10}, \
138     {    127, 9}, {    255, 8}, {    511, 9}, {    271,10}, \
139     {    143, 9}, {    287, 8}, {    575, 9}, {    303,10}, \
140     {    159, 9}, {    319,11}, {     95,10}, {    191, 9}, \
141     {    383,12}, {     63,11}, {    127,10}, {    255, 9}, \
142     {    511,10}, {    271, 9}, {    543,10}, {    287, 9}, \
143     {    575,10}, {    303, 9}, {    607,11}, {    159,10}, \
144     {    319, 9}, {    639,10}, {    335, 9}, {    671,10}, \
145     {    351, 9}, {    703,11}, {    191,10}, {    383, 9}, \
146     {    767,10}, {    415,11}, {    223,10}, {    447,12}, \
147     {    127,11}, {    255,10}, {    543,11}, {    287,10}, \
148     {    607,11}, {    319,10}, {    671,11}, {    351,10}, \
149     {    703,12}, {    191,11}, {    383,10}, {    767,11}, \
150     {    415,10}, {    831,11}, {    447,13}, {    127,12}, \
151     {    255,11}, {    543,10}, {   1087,11}, {    607,12}, \
152     {    319,11}, {    671,10}, {   1343,11}, {    735,12}, \
153     {    383,11}, {    831,12}, {    447,11}, {    959,13}, \
154     {    255,12}, {    511,11}, {   1087,12}, {    575,11}, \
155     {   1215,12}, {    639,11}, {   1343,12}, {    703,13}, \
156     {    383,12}, {    959,14}, {    255,13}, {    511,12}, \
157     {   1215,13}, {    639,12}, {   1471,13}, {    767,12}, \
158     {   1599,13}, {    895,14}, {    511,13}, {   1023,12}, \
159     {   2111,13}, {   1151,12}, {   2431,13}, {   1407,14}, \
160     {    767,13}, {   1663,12}, {   3455,15}, {    511,14}, \
161     {   1023,13}, {   2175,12}, {   4351,13}, {   2431,14}, \
162     {   1279,13}, {   2943,12}, {   5887,14}, {   1535,13}, \
163     {   3455,14}, {   1791,13}, {   3839,15}, {   1023,14}, \
164     {   2047,13}, {   4351,14}, {   2303,13}, {   4991,12}, \
165     {   9983,14}, {   2815,13}, {   5887,15}, {   1535,14}, \
166     {   3839,16} }
167 #define SQR_FFT_TABLE3_SIZE 161
168 #define SQR_FFT_THRESHOLD                 3712
169 
/* Thresholds for the MULLO and SQRLO families, three each.  Within each
   family the values increase (0 < 56 < 8907 and 6 < 111 < 6654).  The
   MULLO basecase entry is 0, annotated "always" by the generator.
   NOTE(review): MULLO/SQRLO presumably compute only the low half of a
   product/square, with sizes measured in limbs -- confirm against the
   GMP sources.  */
170 #define MULLO_BASECASE_THRESHOLD             0  /* always */
171 #define MULLO_DC_THRESHOLD                  56
172 #define MULLO_MUL_N_THRESHOLD             8907
173 #define SQRLO_BASECASE_THRESHOLD             6
174 #define SQRLO_DC_THRESHOLD                 111
175 #define SQRLO_SQR_THRESHOLD               6654
176 
/* Thresholds for the DC_* division routines: DIV_QR, DIVAPPR_Q,
   BDIV_QR and BDIV_Q.
   NOTE(review): DC presumably stands for divide-and-conquer, and each
   value for the size in limbs at which that variant takes over from
   the basecase -- confirm against the GMP division documentation.  */
177 #define DC_DIV_QR_THRESHOLD                 67
178 #define DC_DIVAPPR_Q_THRESHOLD             252
179 #define DC_BDIV_QR_THRESHOLD                63
180 #define DC_BDIV_Q_THRESHOLD                172
181 
/* Thresholds for the INV_* family.  INV_NEWTON_THRESHOLD and
   INV_APPR_THRESHOLD carry the same tuned value (250).
   NOTE(review): presumably these govern algorithm selection inside the
   inverse-computation routines -- confirm against the GMP sources.  */
182 #define INV_MULMOD_BNM1_THRESHOLD           42
183 #define INV_NEWTON_THRESHOLD               250
184 #define INV_APPR_THRESHOLD                 250
185 
/* NOTE(review): BINV_NEWTON presumably selects a Newton iteration for
   the BINV operation, and REDC_1_TO_REDC_N the crossover between the
   REDC_1 and REDC_N reduction variants -- confirm against the GMP
   sources.  */
186 #define BINV_NEWTON_THRESHOLD              276
187 #define REDC_1_TO_REDC_N_THRESHOLD          68
188 
/* Thresholds for the MU_* (and MUPI_*) division routines.  These mirror
   the operation names used by the DC_* thresholds elsewhere in this
   file (DIV_QR, DIVAPPR_Q, BDIV_QR, BDIV_Q), with values above 1000
   except for MUPI_DIV_QR_THRESHOLD.
   NOTE(review): presumably the sizes in limbs at which the MU variants
   replace the DC ones -- confirm against the GMP division
   documentation.  */
189 #define MU_DIV_QR_THRESHOLD               1334
190 #define MU_DIVAPPR_Q_THRESHOLD            1442
191 #define MUPI_DIV_QR_THRESHOLD              116
192 #define MU_BDIV_QR_THRESHOLD              1142
193 #define MU_BDIV_Q_THRESHOLD               1341
194 
/* Expands to a bare comma-separated list of five increasing integers
   with no surrounding braces, so the code that uses this macro must
   supply the enclosing initializer itself.
   NOTE(review): presumably size breakpoints for a POWM_SEC routine --
   confirm against the code that reads this macro.  */
195 #define POWM_SEC_TABLE  1,16,98,376,1259
196 
/* Thresholds for the GET_STR and SET_STR families, each with a DC and a
   PRECOMPUTE entry.  The SET_STR values (298, 1037) are much larger
   than the GET_STR ones (12, 23).
   NOTE(review): presumably these govern number-to-string and
   string-to-number conversion respectively -- confirm against the GMP
   sources.  */
197 #define GET_STR_DC_THRESHOLD                12
198 #define GET_STR_PRECOMPUTE_THRESHOLD        23
199 #define SET_STR_DC_THRESHOLD               298
200 #define SET_STR_PRECOMPUTE_THRESHOLD      1037
201 
/* NOTE(review): presumably thresholds used by the factorial code to
   choose between its algorithms -- confirm against the code that reads
   these macros.  */
202 #define FAC_DSC_THRESHOLD                  171
203 #define FAC_ODD_THRESHOLD                   34
204 
/* Parameters for the MATRIX22, HGCD, GCD, GCDEXT and JACOBI families.
   Two entries are *_METHOD selectors rather than thresholds; both are
   set to 3, and the generator's remarks record the margin by which
   that choice beat another method (3.71% over method 1, 2.58% over
   method 2).
   NOTE(review): the *_THRESHOLD values are presumably operand sizes in
   limbs -- confirm against the GMP GCD documentation.  */
205 #define MATRIX22_STRASSEN_THRESHOLD         17
206 #define HGCD2_DIV1_METHOD                    3  /* 3.71% faster than 1 */
207 #define HGCD_THRESHOLD                     128
208 #define HGCD_APPR_THRESHOLD                186
209 #define HGCD_REDUCE_THRESHOLD             2479
210 #define GCD_DC_THRESHOLD                   465
211 #define GCDEXT_DC_THRESHOLD                339
212 #define JACOBI_BASE_METHOD                   3  /* 2.58% faster than 2 */
213 
214 /* Tuneup completed successfully, took 214190 seconds */
215