diff options
author | Torbjorn Granlund <tege@gmplib.org> | 2011-11-28 23:11:55 +0100 |
---|---|---|
committer | Torbjorn Granlund <tege@gmplib.org> | 2011-11-28 23:11:55 +0100 |
commit | d4f5eddea43f682b380e85a9db69b4e8fd8ea54a (patch) | |
tree | 3ad00b0a4190b2f887e66f5c1f87ec5111601897 /mpn | |
parent | dc3473c8e0d2c4e84a698901cc82327b7df24286 (diff) | |
download | gmp-d4f5eddea43f682b380e85a9db69b4e8fd8ea54a.tar.gz |
Retune.
Diffstat (limited to 'mpn')
-rw-r--r-- | mpn/ia64/gmp-mparam.h | 16 | ||||
-rw-r--r-- | mpn/s390_32/esame/gmp-mparam.h | 86 | ||||
-rw-r--r-- | mpn/s390_64/gmp-mparam.h | 8 | ||||
-rw-r--r-- | mpn/x86/bobcat/gmp-mparam.h | 113 |
4 files changed, 114 insertions, 109 deletions
diff --git a/mpn/ia64/gmp-mparam.h b/mpn/ia64/gmp-mparam.h index f080b876e..77e02f518 100644 --- a/mpn/ia64/gmp-mparam.h +++ b/mpn/ia64/gmp-mparam.h @@ -26,10 +26,10 @@ along with the GNU MP Library. If not, see http://www.gnu.org/licenses/. */ #define MOD_1_1P_METHOD 2 #define MOD_1_NORM_THRESHOLD 0 /* always */ #define MOD_1_UNNORM_THRESHOLD 0 /* always */ -#define MOD_1N_TO_MOD_1_1_THRESHOLD 3 -#define MOD_1U_TO_MOD_1_1_THRESHOLD 8 -#define MOD_1_1_TO_MOD_1_2_THRESHOLD 0 /* never mpn_mod_1_1p */ -#define MOD_1_2_TO_MOD_1_4_THRESHOLD 21 +#define MOD_1N_TO_MOD_1_1_THRESHOLD 4 +#define MOD_1U_TO_MOD_1_1_THRESHOLD 5 +#define MOD_1_1_TO_MOD_1_2_THRESHOLD 26 +#define MOD_1_2_TO_MOD_1_4_THRESHOLD 0 /* never mpn_mod_1s_2p */ #define PREINV_MOD_1_TO_MOD_1_THRESHOLD 10 #define USE_PREINV_DIVREM_1 1 /* native */ #define DIV_QR_2_PI2_THRESHOLD 12 @@ -54,6 +54,8 @@ along with the GNU MP Library. If not, see http://www.gnu.org/licenses/. */ #define SQR_TOOM6_THRESHOLD 0 /* always */ #define SQR_TOOM8_THRESHOLD 0 /* always */ +#define MULMID_TOOM42_THRESHOLD 98 + #define MULMOD_BNM1_THRESHOLD 23 #define SQRMOD_BNM1_THRESHOLD 28 @@ -171,9 +173,9 @@ along with the GNU MP Library. If not, see http://www.gnu.org/licenses/. */ #define MATRIX22_STRASSEN_THRESHOLD 23 #define HGCD_THRESHOLD 117 -#define HGCD_APPR_THRESHOLD 50 -#define HGCD_REDUCE_THRESHOLD 3389 -#define GCD_DC_THRESHOLD 496 +#define HGCD_APPR_THRESHOLD 111 +#define HGCD_REDUCE_THRESHOLD 3014 +#define GCD_DC_THRESHOLD 555 #define GCDEXT_DC_THRESHOLD 368 #define JACOBI_BASE_METHOD 4 diff --git a/mpn/s390_32/esame/gmp-mparam.h b/mpn/s390_32/esame/gmp-mparam.h index 5dedeeb81..a6508be1a 100644 --- a/mpn/s390_32/esame/gmp-mparam.h +++ b/mpn/s390_32/esame/gmp-mparam.h @@ -24,43 +24,45 @@ along with the GNU MP Library. If not, see http://www.gnu.org/licenses/. */ /* 1200 MHz IBM z990 running in 32-bit mode */ #define DIVREM_1_NORM_THRESHOLD 0 /* always */ -#define DIVREM_1_UNNORM_THRESHOLD 3 -#define MOD_1_1P_METHOD 1 +#define DIVREM_1_UNNORM_THRESHOLD 4 +#define MOD_1_1P_METHOD 2 #define MOD_1_NORM_THRESHOLD 0 /* always */ #define MOD_1_UNNORM_THRESHOLD 3 -#define MOD_1N_TO_MOD_1_1_THRESHOLD 12 -#define MOD_1U_TO_MOD_1_1_THRESHOLD 7 -#define MOD_1_1_TO_MOD_1_2_THRESHOLD 15 -#define MOD_1_2_TO_MOD_1_4_THRESHOLD 0 /* never mpn_mod_1s_2p */ -#define PREINV_MOD_1_TO_MOD_1_THRESHOLD 21 +#define MOD_1N_TO_MOD_1_1_THRESHOLD 17 +#define MOD_1U_TO_MOD_1_1_THRESHOLD 8 +#define MOD_1_1_TO_MOD_1_2_THRESHOLD 0 /* never mpn_mod_1_1p */ +#define MOD_1_2_TO_MOD_1_4_THRESHOLD 34 +#define PREINV_MOD_1_TO_MOD_1_THRESHOLD 42 #define USE_PREINV_DIVREM_1 1 #define DIV_QR_2_PI2_THRESHOLD MP_SIZE_T_MAX /* never */ #define DIVEXACT_1_THRESHOLD 0 /* always */ -#define BMOD_1_TO_MOD_1_THRESHOLD 50 +#define BMOD_1_TO_MOD_1_THRESHOLD 30 #define MUL_TOOM22_THRESHOLD 16 -#define MUL_TOOM33_THRESHOLD 66 -#define MUL_TOOM44_THRESHOLD 169 -#define MUL_TOOM6H_THRESHOLD 369 -#define MUL_TOOM8H_THRESHOLD 517 +#define MUL_TOOM33_THRESHOLD 57 +#define MUL_TOOM44_THRESHOLD 147 +#define MUL_TOOM6H_THRESHOLD 226 +#define MUL_TOOM8H_THRESHOLD 333 -#define MUL_TOOM32_TO_TOOM43_THRESHOLD 106 -#define MUL_TOOM32_TO_TOOM53_THRESHOLD 114 -#define MUL_TOOM42_TO_TOOM53_THRESHOLD 114 -#define MUL_TOOM42_TO_TOOM63_THRESHOLD 187 +#define MUL_TOOM32_TO_TOOM43_THRESHOLD 65 +#define MUL_TOOM32_TO_TOOM53_THRESHOLD 100 +#define MUL_TOOM42_TO_TOOM53_THRESHOLD 97 +#define MUL_TOOM42_TO_TOOM63_THRESHOLD 102 #define SQR_BASECASE_THRESHOLD 0 /* always (native) */ -#define SQR_TOOM2_THRESHOLD 28 -#define SQR_TOOM3_THRESHOLD 93 -#define SQR_TOOM4_THRESHOLD 387 -#define SQR_TOOM6_THRESHOLD 552 -#define SQR_TOOM8_THRESHOLD 0 /* always */ +#define SQR_TOOM2_THRESHOLD 26 +#define SQR_TOOM3_THRESHOLD 81 +#define SQR_TOOM4_THRESHOLD 154 +#define SQR_TOOM6_THRESHOLD 318 +#define SQR_TOOM8_THRESHOLD 478 #define MULMID_TOOM42_THRESHOLD 38 #define MULMOD_BNM1_THRESHOLD 13 #define SQRMOD_BNM1_THRESHOLD 15 +#define POWM_SEC_TABLE 4,23,262,892,2500 + #define MUL_FFT_MODF_THRESHOLD 336 /* k = 5 */ #define MUL_FFT_TABLE3 \ { { 336, 5}, { 19, 6}, { 11, 5}, { 23, 6}, \ @@ -91,37 +93,37 @@ along with the GNU MP Library. If not, see http://www.gnu.org/licenses/. */ #define SQR_FFT_TABLE3_SIZE 35 #define SQR_FFT_THRESHOLD 2368 -#define MULLO_BASECASE_THRESHOLD 6 -#define MULLO_DC_THRESHOLD 45 +#define MULLO_BASECASE_THRESHOLD 5 +#define MULLO_DC_THRESHOLD 49 #define MULLO_MUL_N_THRESHOLD 5397 -#define DC_DIV_QR_THRESHOLD 40 -#define DC_DIVAPPR_Q_THRESHOLD 152 +#define DC_DIV_QR_THRESHOLD 42 +#define DC_DIVAPPR_Q_THRESHOLD 146 #define DC_BDIV_QR_THRESHOLD 51 -#define DC_BDIV_Q_THRESHOLD 136 +#define DC_BDIV_Q_THRESHOLD 124 #define INV_MULMOD_BNM1_THRESHOLD 46 -#define INV_NEWTON_THRESHOLD 197 -#define INV_APPR_THRESHOLD 157 +#define INV_NEWTON_THRESHOLD 179 +#define INV_APPR_THRESHOLD 153 -#define BINV_NEWTON_THRESHOLD 114 +#define BINV_NEWTON_THRESHOLD 214 #define REDC_1_TO_REDC_N_THRESHOLD 55 -#define MU_DIV_QR_THRESHOLD 1210 -#define MU_DIVAPPR_Q_THRESHOLD 1334 -#define MUPI_DIV_QR_THRESHOLD 81 -#define MU_BDIV_QR_THRESHOLD 942 -#define MU_BDIV_Q_THRESHOLD 1258 - -#define MATRIX22_STRASSEN_THRESHOLD 17 -#define HGCD_THRESHOLD 104 -#define GCD_DC_THRESHOLD 278 +#define MU_DIV_QR_THRESHOLD 1078 +#define MU_DIVAPPR_Q_THRESHOLD 1078 +#define MUPI_DIV_QR_THRESHOLD 74 +#define MU_BDIV_QR_THRESHOLD 872 +#define MU_BDIV_Q_THRESHOLD 1078 + +#define MATRIX22_STRASSEN_THRESHOLD 14 +#define HGCD_THRESHOLD 90 +#define HGCD_APPR_THRESHOLD 111 +#define HGCD_REDUCE_THRESHOLD 1962 +#define GCD_DC_THRESHOLD 225 #define GCDEXT_DC_THRESHOLD 217 #define JACOBI_BASE_METHOD 2 -#define GET_STR_DC_THRESHOLD 16 -#define GET_STR_PRECOMPUTE_THRESHOLD 30 +#define GET_STR_DC_THRESHOLD 13 +#define GET_STR_PRECOMPUTE_THRESHOLD 27 #define SET_STR_DC_THRESHOLD 274 #define SET_STR_PRECOMPUTE_THRESHOLD 824 - -/* Tuneup completed successfully, took 108 seconds */ diff --git a/mpn/s390_64/gmp-mparam.h b/mpn/s390_64/gmp-mparam.h index 46ca86726..c0ade71c2 100644 --- a/mpn/s390_64/gmp-mparam.h +++ b/mpn/s390_64/gmp-mparam.h @@ -28,19 +28,19 @@ along with the GNU MP Library. If not, see http://www.gnu.org/licenses/. */ #define MOD_1_1P_METHOD 2 #define MOD_1_NORM_THRESHOLD 0 /* always */ #define MOD_1_UNNORM_THRESHOLD 0 /* always */ -#define MOD_1N_TO_MOD_1_1_THRESHOLD 9 +#define MOD_1N_TO_MOD_1_1_THRESHOLD 8 #define MOD_1U_TO_MOD_1_1_THRESHOLD 5 -#define MOD_1_1_TO_MOD_1_2_THRESHOLD 58 +#define MOD_1_1_TO_MOD_1_2_THRESHOLD 38 #define MOD_1_2_TO_MOD_1_4_THRESHOLD 0 #define PREINV_MOD_1_TO_MOD_1_THRESHOLD 19 #define USE_PREINV_DIVREM_1 1 #define DIV_QR_2_PI2_THRESHOLD MP_SIZE_T_MAX /* never */ #define DIVEXACT_1_THRESHOLD 0 /* always */ -#define BMOD_1_TO_MOD_1_THRESHOLD 47 +#define BMOD_1_TO_MOD_1_THRESHOLD 88 #define MUL_TOOM22_THRESHOLD 10 #define MUL_TOOM33_THRESHOLD 41 -#define MUL_TOOM44_THRESHOLD 99 +#define MUL_TOOM44_THRESHOLD 104 #define MUL_TOOM6H_THRESHOLD 149 #define MUL_TOOM8H_THRESHOLD 212 diff --git a/mpn/x86/bobcat/gmp-mparam.h b/mpn/x86/bobcat/gmp-mparam.h index 58dfee1cf..e14ba39f5 100644 --- a/mpn/x86/bobcat/gmp-mparam.h +++ b/mpn/x86/bobcat/gmp-mparam.h @@ -25,30 +25,30 @@ along with the GNU MP Library. If not, see http://www.gnu.org/licenses/. */ #define MOD_1_NORM_THRESHOLD 0 /* always */ #define MOD_1_UNNORM_THRESHOLD 0 /* always */ -#define MOD_1N_TO_MOD_1_1_THRESHOLD 12 -#define MOD_1U_TO_MOD_1_1_THRESHOLD 5 -#define MOD_1_1_TO_MOD_1_2_THRESHOLD 18 -#define MOD_1_2_TO_MOD_1_4_THRESHOLD 0 /* never mpn_mod_1s_2p */ -#define PREINV_MOD_1_TO_MOD_1_THRESHOLD 7 +#define MOD_1N_TO_MOD_1_1_THRESHOLD 9 +#define MOD_1U_TO_MOD_1_1_THRESHOLD 3 +#define MOD_1_1_TO_MOD_1_2_THRESHOLD 12 +#define MOD_1_2_TO_MOD_1_4_THRESHOLD 23 +#define PREINV_MOD_1_TO_MOD_1_THRESHOLD 13 #define USE_PREINV_DIVREM_1 1 /* native */ #define DIV_QR_2_PI2_THRESHOLD MP_SIZE_T_MAX /* never */ #define DIVEXACT_1_THRESHOLD 0 /* always (native) */ -#define BMOD_1_TO_MOD_1_THRESHOLD 40 +#define BMOD_1_TO_MOD_1_THRESHOLD 42 #define MUL_TOOM22_THRESHOLD 28 -#define MUL_TOOM33_THRESHOLD 85 +#define MUL_TOOM33_THRESHOLD 90 #define MUL_TOOM44_THRESHOLD 147 -#define MUL_TOOM6H_THRESHOLD 270 +#define MUL_TOOM6H_THRESHOLD 274 #define MUL_TOOM8H_THRESHOLD 454 -#define MUL_TOOM32_TO_TOOM43_THRESHOLD 93 -#define MUL_TOOM32_TO_TOOM53_THRESHOLD 107 -#define MUL_TOOM42_TO_TOOM53_THRESHOLD 97 -#define MUL_TOOM42_TO_TOOM63_THRESHOLD 111 +#define MUL_TOOM32_TO_TOOM43_THRESHOLD 89 +#define MUL_TOOM32_TO_TOOM53_THRESHOLD 122 +#define MUL_TOOM42_TO_TOOM53_THRESHOLD 93 +#define MUL_TOOM42_TO_TOOM63_THRESHOLD 113 #define SQR_BASECASE_THRESHOLD 0 /* always (native) */ #define SQR_TOOM2_THRESHOLD 38 -#define SQR_TOOM3_THRESHOLD 101 +#define SQR_TOOM3_THRESHOLD 89 #define SQR_TOOM4_THRESHOLD 220 #define SQR_TOOM6_THRESHOLD 303 #define SQR_TOOM8_THRESHOLD 454 @@ -58,84 +58,85 @@ along with the GNU MP Library. If not, see http://www.gnu.org/licenses/. */ #define MULMOD_BNM1_THRESHOLD 19 #define SQRMOD_BNM1_THRESHOLD 23 -#define POWM_SEC_TABLE 2,17,225,357,2212 +#define POWM_SEC_TABLE 4,14,290,357,2178 #define MUL_FFT_MODF_THRESHOLD 888 /* k = 6 */ #define MUL_FFT_TABLE3 \ - { { 888, 6}, { 27, 7}, { 15, 6}, { 33, 7}, \ - { 17, 6}, { 35, 7}, { 19, 6}, { 39, 7}, \ - { 23, 6}, { 47, 7}, { 27, 8}, { 15, 7}, \ - { 31, 6}, { 63, 7}, { 35, 8}, { 19, 7}, \ - { 41, 8}, { 23, 7}, { 49, 8}, { 31, 7}, \ - { 63, 8}, { 39, 7}, { 79, 9}, { 23, 8}, \ - { 51, 9}, { 31, 8}, { 67, 9}, { 39, 8}, \ - { 79, 9}, { 47, 8}, { 95, 9}, { 55,10}, \ - { 31, 9}, { 63, 8}, { 127, 9}, { 79,10}, \ - { 47, 9}, { 95,11}, { 31,10}, { 63, 9}, \ - { 135,10}, { 79, 9}, { 159,10}, { 95, 9}, \ - { 191,11}, { 63,10}, { 127, 9}, { 255,10}, \ - { 159,11}, { 95,10}, { 191,12}, { 63,11}, \ - { 127,10}, { 271,11}, { 159,10}, { 319, 9}, \ - { 639,10}, { 335,11}, { 191,10}, { 383, 9}, \ - { 767,11}, { 223,12}, { 4096,13}, { 8192,14}, \ + { { 888, 6}, { 25, 7}, { 13, 6}, { 27, 7}, \ + { 15, 6}, { 33, 7}, { 17, 6}, { 35, 7}, \ + { 19, 6}, { 39, 7}, { 23, 6}, { 47, 7}, \ + { 27, 8}, { 15, 7}, { 31, 6}, { 63, 7}, \ + { 35, 8}, { 19, 7}, { 41, 8}, { 23, 7}, \ + { 49, 8}, { 31, 7}, { 63, 8}, { 39, 7}, \ + { 79, 8}, { 43, 9}, { 23, 8}, { 51, 9}, \ + { 31, 8}, { 67, 9}, { 39, 8}, { 79, 9}, \ + { 47, 8}, { 95, 9}, { 55,10}, { 31, 9}, \ + { 63, 8}, { 127, 9}, { 79,10}, { 47, 9}, \ + { 95,11}, { 31,10}, { 63, 9}, { 135,10}, \ + { 79, 9}, { 159,10}, { 95, 9}, { 191,11}, \ + { 63,10}, { 127, 9}, { 255,10}, { 159,11}, \ + { 95,10}, { 191,12}, { 63,11}, { 127,10}, \ + { 255, 9}, { 511,10}, { 271, 9}, { 543,11}, \ + { 159,10}, { 319, 9}, { 671,11}, { 191,10}, \ + { 383, 9}, { 767,12}, { 4096,13}, { 8192,14}, \ { 16384,15}, { 32768,16} } -#define MUL_FFT_TABLE3_SIZE 66 +#define MUL_FFT_TABLE3_SIZE 70 #define MUL_FFT_THRESHOLD 7552 -#define SQR_FFT_MODF_THRESHOLD 730 /* k = 5 */ +#define SQR_FFT_MODF_THRESHOLD 723 /* k = 5 */ #define SQR_FFT_TABLE3 \ - { { 730, 5}, { 25, 6}, { 13, 5}, { 28, 6}, \ + { { 723, 5}, { 25, 6}, { 13, 5}, { 28, 6}, \ { 15, 5}, { 31, 6}, { 27, 7}, { 15, 6}, \ { 33, 7}, { 17, 6}, { 35, 7}, { 19, 6}, \ { 39, 7}, { 23, 6}, { 47, 7}, { 27, 8}, \ { 15, 7}, { 31, 6}, { 63, 7}, { 35, 8}, \ - { 19, 7}, { 41, 8}, { 23, 7}, { 49, 8}, \ - { 31, 7}, { 63, 8}, { 39, 7}, { 79, 8}, \ - { 43, 9}, { 23, 8}, { 51, 9}, { 31, 8}, \ + { 19, 7}, { 41, 8}, { 23, 7}, { 47, 8}, \ + { 31, 7}, { 63, 8}, { 43, 9}, { 23, 8}, \ + { 47, 7}, { 95, 8}, { 51, 9}, { 31, 8}, \ { 67, 9}, { 39, 8}, { 79, 9}, { 47, 8}, \ { 95,10}, { 31, 9}, { 63, 8}, { 127, 9}, \ { 79,10}, { 47, 9}, { 95,11}, { 31,10}, \ { 63, 9}, { 135,10}, { 79, 9}, { 159,10}, \ { 95, 9}, { 191,11}, { 63,10}, { 127, 9}, \ { 255,10}, { 159,11}, { 95,10}, { 191,12}, \ - { 63,11}, { 127,10}, { 255, 9}, { 511,10}, \ - { 271,11}, { 159,10}, { 319, 9}, { 671,11}, \ - { 191, 9}, { 767,12}, { 4096,13}, { 8192,14}, \ - { 16384,15}, { 32768,16} } -#define SQR_FFT_TABLE3_SIZE 70 -#define SQR_FFT_THRESHOLD 7296 + { 63,11}, { 127,10}, { 255, 9}, { 543,11}, \ + { 159, 9}, { 671,11}, { 191,10}, { 383, 9}, \ + { 799,12}, { 4096,13}, { 8192,14}, { 16384,15}, \ + { 32768,16} } +#define SQR_FFT_TABLE3_SIZE 69 +#define SQR_FFT_THRESHOLD 5760 #define MULLO_BASECASE_THRESHOLD 5 #define MULLO_DC_THRESHOLD 45 #define MULLO_MUL_N_THRESHOLD 13463 -#define DC_DIV_QR_THRESHOLD 72 -#define DC_DIVAPPR_Q_THRESHOLD 214 +#define DC_DIV_QR_THRESHOLD 75 +#define DC_DIVAPPR_Q_THRESHOLD 216 #define DC_BDIV_QR_THRESHOLD 67 -#define DC_BDIV_Q_THRESHOLD 142 +#define DC_BDIV_Q_THRESHOLD 143 -#define INV_MULMOD_BNM1_THRESHOLD 71 -#define INV_NEWTON_THRESHOLD 250 +#define INV_MULMOD_BNM1_THRESHOLD 75 +#define INV_NEWTON_THRESHOLD 244 #define INV_APPR_THRESHOLD 228 -#define BINV_NEWTON_THRESHOLD 270 +#define BINV_NEWTON_THRESHOLD 276 #define REDC_1_TO_REDC_N_THRESHOLD 71 -#define MU_DIV_QR_THRESHOLD 2089 +#define MU_DIV_QR_THRESHOLD 1858 #define MU_DIVAPPR_Q_THRESHOLD 1822 #define MUPI_DIV_QR_THRESHOLD 122 #define MU_BDIV_QR_THRESHOLD 1787 #define MU_BDIV_Q_THRESHOLD 1787 -#define MATRIX22_STRASSEN_THRESHOLD 21 -#define HGCD_THRESHOLD 81 -#define HGCD_APPR_THRESHOLD 128 -#define HGCD_REDUCE_THRESHOLD 4455 -#define GCD_DC_THRESHOLD 465 +#define MATRIX22_STRASSEN_THRESHOLD 19 +#define HGCD_THRESHOLD 78 +#define HGCD_APPR_THRESHOLD 55 +#define HGCD_REDUCE_THRESHOLD 4633 +#define GCD_DC_THRESHOLD 474 #define GCDEXT_DC_THRESHOLD 345 #define JACOBI_BASE_METHOD 4 -#define GET_STR_DC_THRESHOLD 11 -#define GET_STR_PRECOMPUTE_THRESHOLD 32 +#define GET_STR_DC_THRESHOLD 14 +#define GET_STR_PRECOMPUTE_THRESHOLD 31 #define SET_STR_DC_THRESHOLD 270 #define SET_STR_PRECOMPUTE_THRESHOLD 812 |