/* Intel Atom/64 gmp-mparam.h -- Compiler/machine parameter header file.

Copyright 2019 Free Software Foundation, Inc.

This file is part of the GNU MP Library.

The GNU MP Library is free software; you can redistribute it and/or modify
it under the terms of either:

  * the GNU Lesser General Public License as published by the Free
    Software Foundation; either version 3 of the License, or (at your
    option) any later version.

or

  * the GNU General Public License as published by the Free Software
    Foundation; either version 2 of the License, or (at your option) any
    later version.

or both in parallel, as here.

The GNU MP Library is distributed in the hope that it will be useful, but
WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
for more details.

You should have received copies of the GNU General Public License and the
GNU Lesser General Public License along with the GNU MP Library.  If not,
see https://www.gnu.org/licenses/.  */

/* Limb geometry for this target: 64 bits per limb, i.e. 8 bytes.  */
#define GMP_LIMB_BITS 64
#define GMP_LIMB_BYTES 8

/* Both double-shift flags are switched on.  Presumably they steer the
   library away from the x86 shld/shrd instructions on this CPU --
   TODO confirm against the code that tests these macros.  */
#define SHLD_SLOW 1
#define SHRD_SLOW 1

/* 1600 MHz Diamondville (Atom 330) */
/* FFT tuning limit = 50,646,641 */
/* Generated by tuneup.c, 2019-10-16, gcc 8.3 */

/* Tuned cutoffs for the single-limb modulo/division routines.  A value of 0
   is annotated "always" (or, for MOD_1_2_TO_MOD_1_4_THRESHOLD, "never
   mpn_mod_1s_2p"); MP_SIZE_T_MAX is annotated "never".  MP_SIZE_T_MAX is
   not defined in this header and is expected to be provided by the
   including code.  */
#define MOD_1_NORM_THRESHOLD                 0  /* always */
#define MOD_1_UNNORM_THRESHOLD               0  /* always */
#define MOD_1N_TO_MOD_1_1_THRESHOLD          5
#define MOD_1U_TO_MOD_1_1_THRESHOLD          3
#define MOD_1_1_TO_MOD_1_2_THRESHOLD     MP_SIZE_T_MAX
#define MOD_1_2_TO_MOD_1_4_THRESHOLD         0  /* never mpn_mod_1s_2p */
#define PREINV_MOD_1_TO_MOD_1_THRESHOLD     12
#define USE_PREINV_DIVREM_1                  1  /* native */
#define DIV_QR_1_NORM_THRESHOLD              1
#define DIV_QR_1_UNNORM_THRESHOLD        MP_SIZE_T_MAX  /* never */
#define DIV_QR_2_PI2_THRESHOLD           MP_SIZE_T_MAX  /* never */
#define DIVEXACT_1_THRESHOLD                 0  /* always (native) */
#define BMOD_1_TO_MOD_1_THRESHOLD           16

/* Expressed as a percentage (see the macro name); presumably the measured
   cost of div_1 relative to mul_1 -- TODO confirm against tuneup.c.  */
#define DIV_1_VS_MUL_1_PERCENT             201

/* Tuned cutoffs for the balanced Toom multiplication variants named in each
   macro.  The values increase from TOOM22 up to TOOM8H.  */
#define MUL_TOOM22_THRESHOLD                12
#define MUL_TOOM33_THRESHOLD                74
#define MUL_TOOM44_THRESHOLD               106
#define MUL_TOOM6H_THRESHOLD               155
#define MUL_TOOM8H_THRESHOLD               212

/* Tuned cutoffs for moving from one Toom variant to another, as named in
   each macro (presumably for unbalanced operands -- TODO confirm).  */
#define MUL_TOOM32_TO_TOOM43_THRESHOLD      73
#define MUL_TOOM32_TO_TOOM53_THRESHOLD      77
#define MUL_TOOM42_TO_TOOM53_THRESHOLD      73
#define MUL_TOOM42_TO_TOOM63_THRESHOLD      72
#define MUL_TOOM43_TO_TOOM54_THRESHOLD      58

/* Tuned cutoffs for the squaring routines named in each macro.  The values
   increase from the basecase up to TOOM8.  */
#define SQR_BASECASE_THRESHOLD               5
#define SQR_TOOM2_THRESHOLD                 22
#define SQR_TOOM3_THRESHOLD                 73
#define SQR_TOOM4_THRESHOLD                130
#define SQR_TOOM6_THRESHOLD                159
#define SQR_TOOM8_THRESHOLD                236

/* Tuned cutoff for the toom42 variant of mulmid.  */
#define MULMID_TOOM42_THRESHOLD             16

/* Tuned cutoffs for the bnm1 mulmod/sqrmod routines; both are 9 here.  */
#define MULMOD_BNM1_THRESHOLD                9
#define SQRMOD_BNM1_THRESHOLD                9

/* FFT multiplication tuning.

   MUL_FFT_TABLE3 expands to a brace-enclosed initializer holding
   MUL_FFT_TABLE3_SIZE (169) two-element entries.  Its first entry repeats
   MUL_FFT_MODF_THRESHOLD together with the k value noted beside that macro
   (k = 5); the second element of every entry is likewise a k value in the
   range 5..24.  The table is tuneup output and must not be edited by hand
   without keeping MUL_FFT_TABLE3_SIZE in step.  */
#define MUL_FFT_MODF_THRESHOLD             220  /* k = 5 */
#define MUL_FFT_TABLE3                                      \
  { {    220, 5}, {     11, 6}, {      6, 5}, {     13, 6}, \
    {     13, 7}, {      7, 6}, {     15, 7}, {      8, 6}, \
    {     17, 7}, {     13, 8}, {      7, 7}, {     17, 8}, \
    {      9, 7}, {     19, 8}, {     11, 7}, {     23, 8}, \
    {     13, 9}, {      7, 8}, {     19, 9}, {     11, 8}, \
    {     25,10}, {      7, 9}, {     15, 8}, {     33, 9}, \
    {     19, 8}, {     39, 9}, {     23, 8}, {     47, 9}, \
    {     27,10}, {     15, 9}, {     39,10}, {     23, 9}, \
    {     47,11}, {     15,10}, {     31, 9}, {     67,10}, \
    {     39, 9}, {     79,10}, {     47, 9}, {     95,11}, \
    {     31,10}, {     63, 9}, {    127, 8}, {    255,10}, \
    {     71, 9}, {    143, 8}, {    287,10}, {     79,11}, \
    {     47,10}, {     95, 9}, {    191,12}, {     31,11}, \
    {     63,10}, {    127, 9}, {    255, 8}, {    511,10}, \
    {    143, 9}, {    287,11}, {     79,10}, {    159, 9}, \
    {    319,10}, {    175, 9}, {    351,11}, {     95,10}, \
    {    191, 9}, {    383,10}, {    207,11}, {    111,10}, \
    {    223,12}, {     63,11}, {    127,10}, {    255, 9}, \
    {    511,11}, {    143,10}, {    287, 9}, {    575,11}, \
    {    159,10}, {    319,11}, {    175,10}, {    351,12}, \
    {     95,11}, {    191,10}, {    383,11}, {    207,10}, \
    {    415,11}, {    223,13}, {     63,12}, {    127,11}, \
    {    255,10}, {    511,11}, {    287,10}, {    575,12}, \
    {    159,11}, {    319,10}, {    639,11}, {    351,12}, \
    {    191,11}, {    383,10}, {    767,12}, {    223,11}, \
    {    447,13}, {    127,12}, {    255,11}, {    511,12}, \
    {    287,11}, {    575,12}, {    319,11}, {    639,12}, \
    {    351,13}, {    191,12}, {    383,11}, {    767,12}, \
    {    447,14}, {    127,13}, {    255,12}, {    575,13}, \
    {    319,12}, {    703,13}, {    383,12}, {    767,13}, \
    {    447,14}, {    255,13}, {    511,12}, {   1023,13}, \
    {    575,12}, {   1151,13}, {    703,14}, {    383,13}, \
    {    831,12}, {   1663,15}, {    255,14}, {    511,13}, \
    {   1087,12}, {   2175,13}, {   1151,14}, {    639,13}, \
    {   1407,12}, {   2815,14}, {    767,13}, {   1663,14}, \
    {    895,13}, {   1791,15}, {    511,14}, {   1023,13}, \
    {   2175,14}, {   1151,13}, {   2431,12}, {   4863,14}, \
    {   1407,13}, {   2815,15}, {    767,14}, {   1791,16}, \
    {    511,15}, {   1023,14}, {   2431,13}, {   4863,15}, \
    {   1279,14}, {   2943,15}, {   1535,14}, {  16384,15}, \
    {  32768,16}, {  65536,17}, { 131072,18}, { 262144,19}, \
    { 524288,20}, {1048576,21}, {2097152,22}, {4194304,23}, \
    {8388608,24} }
#define MUL_FFT_TABLE3_SIZE 169
#define MUL_FFT_THRESHOLD                 2240

/* FFT squaring tuning.

   SQR_FFT_TABLE3 expands to a brace-enclosed initializer holding
   SQR_FFT_TABLE3_SIZE (172) two-element entries.  Its first entry repeats
   SQR_FFT_MODF_THRESHOLD together with the k value noted beside that macro
   (k = 5); the second element of every entry is likewise a k value in the
   range 5..24.  The table is tuneup output and must not be edited by hand
   without keeping SQR_FFT_TABLE3_SIZE in step.  */
#define SQR_FFT_MODF_THRESHOLD             184  /* k = 5 */
#define SQR_FFT_TABLE3                                      \
  { {    184, 5}, {     11, 6}, {     13, 7}, {      7, 6}, \
    {     15, 7}, {      8, 6}, {     17, 7}, {     13, 8}, \
    {      7, 7}, {     17, 8}, {      9, 7}, {     19, 8}, \
    {     11, 7}, {     23, 8}, {     13, 9}, {      7, 8}, \
    {     19, 9}, {     11, 8}, {     25,10}, {      7, 9}, \
    {     15, 8}, {     33, 9}, {     19, 8}, {     39, 9}, \
    {     23,10}, {     15, 9}, {     39,10}, {     23, 9}, \
    {     47,11}, {     15,10}, {     31, 9}, {     63, 8}, \
    {    127, 7}, {    255,10}, {     39, 8}, {    159,10}, \
    {     47, 9}, {     95, 8}, {    191,11}, {     31,10}, \
    {     63, 9}, {    127, 8}, {    255, 7}, {    511,10}, \
    {     71, 9}, {    143, 8}, {    287, 7}, {    575, 9}, \
    {    159, 8}, {    319,11}, {     47,10}, {     95, 9}, \
    {    191, 8}, {    383,12}, {     31,11}, {     63,10}, \
    {    127, 9}, {    255, 8}, {    511,10}, {    143, 9}, \
    {    287, 8}, {    575,10}, {    159, 9}, {    319, 8}, \
    {    639,10}, {    175, 9}, {    351,11}, {     95,10}, \
    {    191, 9}, {    383,11}, {    111,10}, {    223, 9}, \
    {    447,12}, {     63,11}, {    127,10}, {    255, 9}, \
    {    511,11}, {    143,10}, {    287, 9}, {    575,11}, \
    {    159,10}, {    319, 9}, {    639,11}, {    175,10}, \
    {    351,12}, {     95,11}, {    191,10}, {    383, 9}, \
    {    767,11}, {    223,10}, {    447,13}, {     63,12}, \
    {    127,11}, {    255,10}, {    511,11}, {    287,10}, \
    {    575,12}, {    159,11}, {    319,10}, {    639,11}, \
    {    351,12}, {    191,11}, {    383,10}, {    767,12}, \
    {    223,11}, {    447,13}, {    127,12}, {    255,11}, \
    {    511,12}, {    287,11}, {    575,12}, {    319,11}, \
    {    639,12}, {    351,13}, {    191,12}, {    383,11}, \
    {    767,12}, {    447,14}, {    127,13}, {    255,12}, \
    {    575,13}, {    319,12}, {    703,13}, {    383,12}, \
    {    767,13}, {    447,14}, {    255,13}, {    511,12}, \
    {   1023,13}, {    575,12}, {   1151,13}, {    703,14}, \
    {    383,13}, {    831,12}, {   1663,15}, {    255,14}, \
    {    511,13}, {   1151,14}, {    639,13}, {   1407,12}, \
    {   2815,14}, {    767,13}, {   1663,14}, {    895,13}, \
    {   1791,15}, {    511,14}, {   1023,13}, {   2047,14}, \
    {   1151,13}, {   2431,12}, {   4863,14}, {   1407,13}, \
    {   2815,15}, {    767,14}, {   1791,16}, {    511,15}, \
    {   1023,14}, {   2431,13}, {   4863,15}, {   1279,14}, \
    {   2943,15}, {   1535,14}, {  16384,15}, {  32768,16}, \
    {  65536,17}, { 131072,18}, { 262144,19}, { 524288,20}, \
    {1048576,21}, {2097152,22}, {4194304,23}, {8388608,24} }
#define SQR_FFT_TABLE3_SIZE 172
#define SQR_FFT_THRESHOLD                 1728

/* Tuned cutoffs for the mullo/sqrlo routines named in each macro.  A value
   of 0 is annotated "always".  */
#define MULLO_BASECASE_THRESHOLD             0  /* always */
#define MULLO_DC_THRESHOLD                  33
#define MULLO_MUL_N_THRESHOLD             4392
#define SQRLO_BASECASE_THRESHOLD             0  /* always */
#define SQRLO_DC_THRESHOLD                  85
#define SQRLO_SQR_THRESHOLD               3176

/* Tuned cutoffs for the "DC" division variants named in each macro
   (presumably divide-and-conquer -- TODO confirm).  */
#define DC_DIV_QR_THRESHOLD                 34
#define DC_DIVAPPR_Q_THRESHOLD             119
#define DC_BDIV_QR_THRESHOLD                31
#define DC_BDIV_Q_THRESHOLD                 76

/* Tuned cutoffs for the inversion routines named in each macro.  */
#define INV_MULMOD_BNM1_THRESHOLD           22
#define INV_NEWTON_THRESHOLD               149
#define INV_APPR_THRESHOLD                 123

/* Tuned cutoffs for binv and for moving between the REDC variants.  */
#define BINV_NEWTON_THRESHOLD              179
#define REDC_1_TO_REDC_2_THRESHOLD          24
#define REDC_2_TO_REDC_N_THRESHOLD          39

/* Tuned cutoffs for the "MU" division variants named in each macro.  */
#define MU_DIV_QR_THRESHOLD                807
#define MU_DIVAPPR_Q_THRESHOLD             807
#define MUPI_DIV_QR_THRESHOLD               77
#define MU_BDIV_QR_THRESHOLD               748
#define MU_BDIV_Q_THRESHOLD                807

/* Comma-separated list of five values with no enclosing braces; the user
   of this macro has to supply its own braces or argument context.  */
#define POWM_SEC_TABLE  1,22,114,326,1486

/* Tuned cutoffs for the get_str/set_str routines named in each macro.  */
#define GET_STR_DC_THRESHOLD                16
#define GET_STR_PRECOMPUTE_THRESHOLD        30
#define SET_STR_DC_THRESHOLD               381
#define SET_STR_PRECOMPUTE_THRESHOLD      1565

/* Tuned cutoffs for the factorial code.  A value of 0 is annotated
   "always".  */
#define FAC_DSC_THRESHOLD                  960
#define FAC_ODD_THRESHOLD                    0  /* always */

/* Tuned parameters for the GCD-family code.  The *_METHOD macros pick one
   of several numbered implementations; the trailing comments record how
   much faster the chosen method measured than the runner-up.  */
#define MATRIX22_STRASSEN_THRESHOLD         13
#define HGCD2_DIV1_METHOD                    3  /* 5.86% faster than 4 */
#define HGCD_THRESHOLD                      88
#define HGCD_APPR_THRESHOLD                 88
#define HGCD_REDUCE_THRESHOLD             1182
#define GCD_DC_THRESHOLD                   241
#define GCDEXT_DC_THRESHOLD                192
#define JACOBI_BASE_METHOD                   3  /* 9.43% faster than 2 */

/* Tuneup completed successfully, took 193098 seconds */
223