Source-Changes-HG archive

[Date Prev][Date Next][Thread Prev][Thread Next][Date Index][Thread Index][Old Index]

[src/trunk]: src/external/lgpl3/gmp/lib/libgmp/arch re-run native-gmp for gmp...



details:   https://anonhg.NetBSD.org/src/rev/d1dd7fbbb1c0
branches:  trunk
changeset: 939698:d1dd7fbbb1c0
user:      mrg <mrg%NetBSD.org@localhost>
date:      Sun Sep 27 21:19:36 2020 +0000

description:
re-run native-gmp for gmp 6.2.0 and arm:  run with a v4 toolchain
instead of a v7 toolchain, so it works on all.

should fix latest build mess.

future: test the speed of this vs armv[567] specific on armv[567].

diffstat:

 external/lgpl3/gmp/lib/libgmp/arch/arm/config.h       |   28 +-
 external/lgpl3/gmp/lib/libgmp/arch/arm/config.m4      |    7 +-
 external/lgpl3/gmp/lib/libgmp/arch/arm/gmp-mparam.h   |  228 +++++------------
 external/lgpl3/gmp/lib/libgmp/arch/arm/gmp.h          |   11 +-
 external/lgpl3/gmp/lib/libgmp/arch/arm/srcs.mk        |   36 +-
 external/lgpl3/gmp/lib/libgmp/arch/armeb/config.h     |   28 +-
 external/lgpl3/gmp/lib/libgmp/arch/armeb/config.m4    |    7 +-
 external/lgpl3/gmp/lib/libgmp/arch/armeb/gmp-mparam.h |  228 +++++------------
 external/lgpl3/gmp/lib/libgmp/arch/armeb/gmp.h        |   11 +-
 external/lgpl3/gmp/lib/libgmp/arch/armeb/srcs.mk      |   36 +-
 10 files changed, 232 insertions(+), 388 deletions(-)

diffs (truncated from 1110 to 300 lines):

diff -r 24c78990d10b -r d1dd7fbbb1c0 external/lgpl3/gmp/lib/libgmp/arch/arm/config.h
--- a/external/lgpl3/gmp/lib/libgmp/arch/arm/config.h   Sun Sep 27 20:13:44 2020 +0000
+++ b/external/lgpl3/gmp/lib/libgmp/arch/arm/config.h   Sun Sep 27 21:19:36 2020 +0000
@@ -37,7 +37,7 @@
 
 /* The gmp-mparam.h file (a string) the tune program should suggest updating.
    */
-#define GMP_MPARAM_H_SUGGEST "./mpn/arm/v7a/cora5/gmp-mparam.h"
+#define GMP_MPARAM_H_SUGGEST "./mpn/arm/gmp-mparam.h"
 
 /* Define to 1 if you have the `alarm' function. */
 #define HAVE_ALARM 1
@@ -278,8 +278,8 @@
 /* #undef HAVE_NATIVE_mpn_addlsh2_nc_ip2 */
 /* #undef HAVE_NATIVE_mpn_addlsh_nc_ip2 */
 /* #undef HAVE_NATIVE_mpn_addmul_1c */
-#define HAVE_NATIVE_mpn_addmul_2 1
-#define HAVE_NATIVE_mpn_addmul_3 1
+/* #undef HAVE_NATIVE_mpn_addmul_2 */
+/* #undef HAVE_NATIVE_mpn_addmul_3 */
 /* #undef HAVE_NATIVE_mpn_addmul_4 */
 /* #undef HAVE_NATIVE_mpn_addmul_5 */
 /* #undef HAVE_NATIVE_mpn_addmul_6 */
@@ -300,13 +300,13 @@
 /* #undef HAVE_NATIVE_mpn_div_qr_2 */
 #define HAVE_NATIVE_mpn_divexact_1 1
 /* #undef HAVE_NATIVE_mpn_divexact_by3c */
-#define HAVE_NATIVE_mpn_divrem_1 1
+/* #undef HAVE_NATIVE_mpn_divrem_1 */
 /* #undef HAVE_NATIVE_mpn_divrem_1c */
 /* #undef HAVE_NATIVE_mpn_divrem_2 */
 /* #undef HAVE_NATIVE_mpn_gcd_1 */
-#define HAVE_NATIVE_mpn_gcd_11 1
-#define HAVE_NATIVE_mpn_gcd_22 1
-#define HAVE_NATIVE_mpn_hamdist 1
+/* #undef HAVE_NATIVE_mpn_gcd_11 */
+/* #undef HAVE_NATIVE_mpn_gcd_22 */
+/* #undef HAVE_NATIVE_mpn_hamdist */
 #define HAVE_NATIVE_mpn_invert_limb 1
 #define HAVE_NATIVE_mpn_ior_n 1
 #define HAVE_NATIVE_mpn_iorn_n 1
@@ -314,16 +314,16 @@
 #define HAVE_NATIVE_mpn_lshiftc 1
 /* #undef HAVE_NATIVE_mpn_lshsub_n */
 /* #undef HAVE_NATIVE_mpn_mod_1 */
-#define HAVE_NATIVE_mpn_mod_1_1p 1
+/* #undef HAVE_NATIVE_mpn_mod_1_1p */
 /* #undef HAVE_NATIVE_mpn_mod_1c */
-#define HAVE_NATIVE_mpn_mod_1s_2p 1
+/* #undef HAVE_NATIVE_mpn_mod_1s_2p */
 /* #undef HAVE_NATIVE_mpn_mod_1s_4p */
 #define HAVE_NATIVE_mpn_mod_34lsub1 1
 /* #undef HAVE_NATIVE_mpn_modexact_1_odd */
 #define HAVE_NATIVE_mpn_modexact_1c_odd 1
 #define HAVE_NATIVE_mpn_mul_1 1
 /* #undef HAVE_NATIVE_mpn_mul_1c */
-#define HAVE_NATIVE_mpn_mul_2 1
+/* #undef HAVE_NATIVE_mpn_mul_2 */
 /* #undef HAVE_NATIVE_mpn_mul_3 */
 /* #undef HAVE_NATIVE_mpn_mul_4 */
 /* #undef HAVE_NATIVE_mpn_mul_5 */
@@ -332,8 +332,8 @@
 /* #undef HAVE_NATIVE_mpn_mullo_basecase */
 #define HAVE_NATIVE_mpn_nand_n 1
 #define HAVE_NATIVE_mpn_nior_n 1
-#define HAVE_NATIVE_mpn_popcount 1
-#define HAVE_NATIVE_mpn_preinv_divrem_1 1
+/* #undef HAVE_NATIVE_mpn_popcount */
+/* #undef HAVE_NATIVE_mpn_preinv_divrem_1 */
 /* #undef HAVE_NATIVE_mpn_preinv_mod_1 */
 /* #undef HAVE_NATIVE_mpn_redc_1 */
 /* #undef HAVE_NATIVE_mpn_redc_2 */
@@ -349,7 +349,7 @@
 /* #undef HAVE_NATIVE_mpn_rsh1sub_nc */
 #define HAVE_NATIVE_mpn_rshift 1
 /* #undef HAVE_NATIVE_mpn_sbpi1_bdiv_r */
-#define HAVE_NATIVE_mpn_sqr_basecase 1
+/* #undef HAVE_NATIVE_mpn_sqr_basecase */
 /* #undef HAVE_NATIVE_mpn_sqr_diagonal */
 /* #undef HAVE_NATIVE_mpn_sqr_diag_addlsh1 */
 #define HAVE_NATIVE_mpn_sub_n 1
@@ -587,7 +587,7 @@
 #define TIME_WITH_SYS_TIME 1
 
 /* Maximum size the tune program can test for SQR_TOOM2_THRESHOLD */
-/* #undef TUNE_SQR_TOOM2_MAX */
+#define TUNE_SQR_TOOM2_MAX SQR_TOOM2_MAX_GENERIC
 
 /* Version number of package */
 #define VERSION "6.2.0"
diff -r 24c78990d10b -r d1dd7fbbb1c0 external/lgpl3/gmp/lib/libgmp/arch/arm/config.m4
--- a/external/lgpl3/gmp/lib/libgmp/arch/arm/config.m4  Sun Sep 27 20:13:44 2020 +0000
+++ b/external/lgpl3/gmp/lib/libgmp/arch/arm/config.m4  Sun Sep 27 21:19:36 2020 +0000
@@ -4,6 +4,7 @@
 
 define(<WANT_ASSERT>,0)
 define(<WANT_PROFILING>,<`no'>)
+define(<NOTHUMB>,1)
 define(<M4WRAP_SPURIOUS>,<no>)
 define(<TEXT>, <.text>)
 define(<DATA>, <.data>)
@@ -17,8 +18,8 @@
 define(<LSYM_PREFIX>, <.L>)
 define(<W32>, <.long>)
 define(<ALIGN_LOGARITHMIC>,<yes>)
-define(<SQR_TOOM2_THRESHOLD>,<66>)
-define(<BMOD_1_TO_MOD_1_THRESHOLD>,<52>)
+define(<SQR_TOOM2_THRESHOLD>,<78>)
+define(<BMOD_1_TO_MOD_1_THRESHOLD>,<41>)
 define(<SIZEOF_UNSIGNED>,<4>)
 define(<GMP_LIMB_BITS>,32)
 define(<GMP_NAIL_BITS>,0)
@@ -28,7 +29,7 @@
 ifdef(`__CONFIG_M4_INCLUDED__',,`
 include(CONFIG_TOP_SRCDIR`/mpn/asm-defs.m4')
 include_mpn(`arm/arm-defs.m4')
-define_not_for_expansion(`HAVE_HOST_CPU_armv7')
+define_not_for_expansion(`HAVE_HOST_CPU_armv4')
 define_not_for_expansion(`HAVE_ABI_32')
 define_not_for_expansion(`HAVE_LIMB_LITTLE_ENDIAN')
 define_not_for_expansion(`HAVE_DOUBLE_IEEE_LITTLE_ENDIAN')
diff -r 24c78990d10b -r d1dd7fbbb1c0 external/lgpl3/gmp/lib/libgmp/arch/arm/gmp-mparam.h
--- a/external/lgpl3/gmp/lib/libgmp/arch/arm/gmp-mparam.h       Sun Sep 27 20:13:44 2020 +0000
+++ b/external/lgpl3/gmp/lib/libgmp/arch/arm/gmp-mparam.h       Sun Sep 27 21:19:36 2020 +0000
@@ -1,6 +1,7 @@
 /* gmp-mparam.h -- Compiler/machine parameter header file.
 
-Copyright 2019 Free Software Foundation, Inc.
+Copyright 1991, 1993, 1994, 1999-2003, 2009, 2010 Free Software Foundation,
+Inc.
 
 This file is part of the GNU MP Library.
 
@@ -31,175 +32,96 @@
 #define GMP_LIMB_BITS 32
 #define GMP_LIMB_BYTES 4
 
-/* 1500 MHz Cortex-A5 (odroid c1) */
-/* FFT tuning limit = 18,235,562 */
-/* Generated by tuneup.c, 2019-10-22, gcc 4.9 */
+/* 1193MHz ARM (gcc55.fsffrance.org) */
 
+#define DIVREM_1_NORM_THRESHOLD              0  /* preinv always */
+#define DIVREM_1_UNNORM_THRESHOLD            0  /* always */
 #define MOD_1_NORM_THRESHOLD                 0  /* always */
 #define MOD_1_UNNORM_THRESHOLD               0  /* always */
-#define MOD_1N_TO_MOD_1_1_THRESHOLD          7
-#define MOD_1U_TO_MOD_1_1_THRESHOLD          7
-#define MOD_1_1_TO_MOD_1_2_THRESHOLD         8
+#define MOD_1N_TO_MOD_1_1_THRESHOLD         56
+#define MOD_1U_TO_MOD_1_1_THRESHOLD         11
+#define MOD_1_1_TO_MOD_1_2_THRESHOLD         0  /* never mpn_mod_1_1p */
 #define MOD_1_2_TO_MOD_1_4_THRESHOLD     MP_SIZE_T_MAX
-#define PREINV_MOD_1_TO_MOD_1_THRESHOLD     23
-#define USE_PREINV_DIVREM_1                  1  /* native */
-#define DIV_QR_1N_PI1_METHOD                 1  /* 132.79% faster than 2 */
-#define DIV_QR_1_NORM_THRESHOLD          MP_SIZE_T_MAX  /* never */
-#define DIV_QR_1_UNNORM_THRESHOLD        MP_SIZE_T_MAX  /* never */
-#define DIV_QR_2_PI2_THRESHOLD           MP_SIZE_T_MAX  /* never */
-#define DIVEXACT_1_THRESHOLD                 0  /* always (native) */
-#define BMOD_1_TO_MOD_1_THRESHOLD           52
+#define PREINV_MOD_1_TO_MOD_1_THRESHOLD     71
+#define USE_PREINV_DIVREM_1                  1  /* preinv always */
+#define DIVREM_2_THRESHOLD                   0  /* preinv always */
+#define DIVEXACT_1_THRESHOLD                 0  /* always */
+#define BMOD_1_TO_MOD_1_THRESHOLD           41
 
-#define DIV_1_VS_MUL_1_PERCENT             213
+#define MUL_TOOM22_THRESHOLD                36
+#define MUL_TOOM33_THRESHOLD               125
+#define MUL_TOOM44_THRESHOLD               193
+#define MUL_TOOM6H_THRESHOLD               303
+#define MUL_TOOM8H_THRESHOLD               418
 
-#define MUL_TOOM22_THRESHOLD                48
-#define MUL_TOOM33_THRESHOLD               143
-#define MUL_TOOM44_THRESHOLD               262
-#define MUL_TOOM6H_THRESHOLD               414
-#define MUL_TOOM8H_THRESHOLD               527
-
-#define MUL_TOOM32_TO_TOOM43_THRESHOLD     153
-#define MUL_TOOM32_TO_TOOM53_THRESHOLD     168
-#define MUL_TOOM42_TO_TOOM53_THRESHOLD     152
-#define MUL_TOOM42_TO_TOOM63_THRESHOLD     180
-#define MUL_TOOM43_TO_TOOM54_THRESHOLD     226
+#define MUL_TOOM32_TO_TOOM43_THRESHOLD     125
+#define MUL_TOOM32_TO_TOOM53_THRESHOLD     176
+#define MUL_TOOM42_TO_TOOM53_THRESHOLD     114
+#define MUL_TOOM42_TO_TOOM63_THRESHOLD     129
 
-#define SQR_BASECASE_THRESHOLD               0  /* always (native) */
-#define SQR_TOOM2_THRESHOLD                 66
-#define SQR_TOOM3_THRESHOLD                149
-#define SQR_TOOM4_THRESHOLD                348
-#define SQR_TOOM6_THRESHOLD                517
-#define SQR_TOOM8_THRESHOLD                608
+#define SQR_BASECASE_THRESHOLD              12
+#define SQR_TOOM2_THRESHOLD                 78
+#define SQR_TOOM3_THRESHOLD                137
+#define SQR_TOOM4_THRESHOLD                212
+#define SQR_TOOM6_THRESHOLD                306
+#define SQR_TOOM8_THRESHOLD                422
 
-#define MULMID_TOOM42_THRESHOLD             70
+#define MULMOD_BNM1_THRESHOLD               20
+#define SQRMOD_BNM1_THRESHOLD               26
 
-#define MULMOD_BNM1_THRESHOLD               26
-#define SQRMOD_BNM1_THRESHOLD               28
-
-#define MUL_FFT_MODF_THRESHOLD             660  /* k = 5 */
+#define MUL_FFT_MODF_THRESHOLD             436  /* k = 5 */
 #define MUL_FFT_TABLE3                                      \
-  { {    660, 5}, {     29, 6}, {     15, 5}, {     33, 6}, \
-    {     17, 5}, {     35, 6}, {     29, 7}, {     15, 6}, \
-    {     37, 7}, {     19, 6}, {     40, 7}, {     21, 6}, \
-    {     43, 7}, {     37, 8}, {     19, 7}, {     43, 8}, \
-    {     23, 7}, {     51, 8}, {     27, 7}, {     55, 8}, \
-    {     31, 7}, {     63, 8}, {     43, 9}, {     23, 8}, \
-    {     55, 9}, {     31, 8}, {     71, 9}, {     39, 8}, \
-    {     83, 9}, {     47, 8}, {     99, 9}, {     55,10}, \
-    {     31, 9}, {     63, 8}, {    127, 9}, {     79,10}, \
-    {     47, 9}, {    103,11}, {     31,10}, {     63, 9}, \
-    {    135,10}, {     79, 9}, {    167,10}, {     95, 9}, \
-    {    191,10}, {    111,11}, {     63,10}, {    159,11}, \
-    {     95,10}, {    191, 9}, {    383,12}, {     63,11}, \
-    {    127,10}, {    255, 9}, {    511,10}, {    271,11}, \
-    {    159,10}, {    319, 9}, {    639,10}, {    335, 9}, \
-    {    671,11}, {    191,10}, {    383, 9}, {    767,10}, \
-    {    399, 9}, {    799,10}, {    415,11}, {    223,12}, \
-    {    127,11}, {    255,10}, {    511, 9}, {   1023,10}, \
-    {    543,11}, {    287,10}, {    607,11}, {    319,10}, \
-    {    671,11}, {    351,12}, {    191,11}, {    383,10}, \
-    {    799,11}, {    415,10}, {    831,13}, {    127,12}, \
-    {    255,11}, {    511,10}, {   1023,11}, {    543,10}, \
-    {   1087,11}, {    575,10}, {   1151,11}, {    607,12}, \
-    {    319,11}, {    703,12}, {    383,11}, {    831,12}, \
-    {    447,11}, {    895,13}, {    255,12}, {    511,11}, \
-    {   1087,12}, {    575,11}, {   1183,12}, {    639,11}, \
-    {   1279,12}, {    703,13}, {    383,12}, {    767,11}, \
-    {   1535,12}, {    895,14}, {    255,13}, {    511,12}, \
-    {   1151,13}, {    639,12}, {   1407,13}, {    767,12}, \
-    {   1599,13}, {    895,12}, {   1791,14}, {    511,13}, \
-    {   1023,12}, {   2111,13}, {   1151,12}, {   2367,13}, \
-    {   1279,12}, {   2559,13}, {   1407,14}, {    767,13}, \
-    {   1535,12}, {   3071,13}, {   1663,12}, {   3327,13}, \
-    {   1791,15}, {    511,14}, {   1023,13}, {   2175,12}, \
-    {   4351,13}, {   8192,14}, {  16384,15}, {  32768,16} }
-#define MUL_FFT_TABLE3_SIZE 140
-#define MUL_FFT_THRESHOLD                 7552
+  { {    436, 5}, {     27, 6}, {     28, 7}, {     15, 6}, \
+    {     32, 7}, {     17, 6}, {     35, 7}, {     19, 6}, \
+    {     39, 7}, {     29, 8}, {     15, 7}, {     35, 8}, \
+    {     19, 7}, {     41, 8}, {     23, 7}, {     49, 8}, \
+    {     27, 9}, {     15, 8}, {     31, 7}, {     63, 8}, \
+    {    256, 9}, {    512,10}, {   1024,11}, {   2048,12}, \
+    {   4096,13}, {   8192,14}, {  16384,15}, {  32768,16} }
+#define MUL_FFT_TABLE3_SIZE 28
+#define MUL_FFT_THRESHOLD                 5760
 
-#define SQR_FFT_MODF_THRESHOLD             590  /* k = 5 */
+#define SQR_FFT_MODF_THRESHOLD             404  /* k = 5 */
 #define SQR_FFT_TABLE3                                      \
-  { {    590, 5}, {     33, 6}, {     17, 5}, {     35, 6}, \
-    {     36, 7}, {     19, 6}, {     40, 7}, {     21, 6}, \
-    {     43, 7}, {     23, 6}, {     47, 7}, {     37, 8}, \
-    {     19, 7}, {     43, 8}, {     23, 7}, {     49, 8}, \
-    {     27, 7}, {     55, 8}, {     31, 7}, {     63, 8}, \
-    {     43, 9}, {     23, 8}, {     55, 9}, {     31, 8}, \
-    {     67, 9}, {     39, 8}, {     83, 9}, {     47, 8}, \
-    {     95, 9}, {     55,10}, {     31, 9}, {     79,10}, \
-    {     47, 9}, {    103,11}, {     31,10}, {     63, 9}, \
-    {    135,10}, {     79, 9}, {    167,10}, {     95, 9}, \
-    {    191,10}, {    111,11}, {     63,10}, {    159,11}, \
-    {     95,10}, {    191, 9}, {    383,12}, {     63,11}, \
-    {    127,10}, {    255, 9}, {    511,10}, {    271, 9}, \
-    {    543,11}, {    159,10}, {    319, 9}, {    639,10}, \
-    {    335, 9}, {    671,10}, {    351,11}, {    191,10}, \
-    {    383, 9}, {    767,10}, {    415,12}, {    127,11}, \
-    {    255,10}, {    511, 9}, {   1023,10}, {    543, 9}, \
-    {   1087,11}, {    287,10}, {    575, 9}, {   1151,10}, \
-    {    607,11}, {    319,10}, {    671,11}, {    351,12}, \
-    {    191,11}, {    383,10}, {    799,11}, {    415,10}, \
-    {    831,13}, {    127,12}, {    255,11}, {    511,10}, \
-    {   1023,11}, {    543,10}, {   1087,11}, {    575,10}, \
-    {   1151,11}, {    607,12}, {    319,11}, {    735,12}, \
-    {    383,11}, {    831,12}, {    447,11}, {    927,13}, \
-    {    255,12}, {    511,11}, {   1087,12}, {    575,11}, \
-    {   1151,12}, {    639,11}, {   1279,12}, {    703,13}, \
-    {    383,12}, {    767,11}, {   1535,12}, {    831,11}, \
-    {   1663,12}, {    895,11}, {   1791,12}, {    959,14}, \
-    {    255,13}, {    511,12}, {   1023,11}, {   2047,12}, \
-    {   1151,13}, {    639,12}, {   1407,13}, {    767,12}, \
-    {   1599,13}, {    895,12}, {   1791,14}, {    511,13}, \
-    {   1023,12}, {   2111,13}, {   1151,12}, {   2367,13}, \
-    {   1279,12}, {   2559,13}, {   1407,14}, {    767,13}, \
-    {   1535,12}, {   3071,13}, {   1663,12}, {   3327,13}, \
-    {   1791,15}, {    511,14}, {   1023,13}, {   2175,12}, \
-    {   4351,13}, {   8192,14}, {  16384,15}, {  32768,16} }
-#define SQR_FFT_TABLE3_SIZE 144



Home | Main Index | Thread Index | Old Index