Skip to content

Commit 9f1799e

Browse files
committed
[armdmav] prepare to merge Daniele's fix-arm-support - revert 4 non-CODEGEN commits
Revert "[fix-arm-support] gg_tt.mad: undefine__ARM_NEON for cppnone on arm/apple (with DanieleM)"
This reverts commit d427fcf.

Revert "[fix-arm-support] gg_tt.mad: use builtin __ARM_NEON for aarch64 simd (with DanieleM)"
This reverts commit 82645d2.

Revert "[fix-arm-support] gg_tt.mad: use higher tolerance for constexpr_tan tests on aarch64 (with DanieleM)"
This reverts commit 625bca8.

Revert "Regenerate processes"
This reverts commit 1e1c899.
1 parent 91a98e1 commit 9f1799e

202 files changed

Lines changed: 1273 additions & 1678 deletions

File tree

Some content is hidden

Large Commits have some content hidden by default. Use the searchbox below for content that may be hidden.

epochX/cudacpp/ee_mumu.mad/CODEGEN_mad_ee_mumu_log.txt

Lines changed: 26 additions & 26 deletions
Original file line numberDiff line numberDiff line change
@@ -48,7 +48,7 @@ Note that you can still compile and run aMC@NLO with the built-in PDFs
4848

4949
Using default eps viewer "evince". Set another one in ./input/mg5_configuration.txt
5050
Using default web browser "firefox". Set another one in ./input/mg5_configuration.txt
51-
import /home/dmass/Development/madgraph4gpu/fix-arm-support/MG5aMC/TMPOUT/CODEGEN_mad_ee_mumu.mg
51+
import /home/dmass/Development/madgraph4gpu/release-v1.01.01/MG5aMC/TMPOUT/CODEGEN_mad_ee_mumu.mg
5252
The import format was not given, so we guess it as command
5353
set stdout_level DEBUG
5454
set output information to level: 10
@@ -57,7 +57,7 @@ generate e+ e- > mu+ mu-
5757
No model currently active, so we import the Standard Model
5858
INFO: load particles
5959
INFO: load vertices
60-
DEBUG: model prefixing takes 0.004563808441162109 
60+
DEBUG: model prefixing takes 0.004445075988769531 
6161
INFO: Restrict model sm with file models/sm/restrict_default.dat .
6262
DEBUG: Simplifying conditional expressions 
6363
DEBUG: remove interactions: u s w+ at order: QED=1 
@@ -160,10 +160,10 @@ output madevent_simd ../TMPOUT/CODEGEN_mad_ee_mumu --hel_recycling=False --vecto
160160
INFO: initialize a new directory: CODEGEN_mad_ee_mumu
161161
INFO: remove old information in CODEGEN_mad_ee_mumu
162162
DEBUG: Entering PLUGIN_ProcessExporter.copy_template (initialise the directory) [output.py at line 180] 
163-
WARNING: File exists /home/dmass/Development/madgraph4gpu/fix-arm-support/MG5aMC/TMPOUT/CODEGEN_mad_ee_mumu 
164-
INFO: Creating subdirectories in directory /home/dmass/Development/madgraph4gpu/fix-arm-support/MG5aMC/TMPOUT/CODEGEN_mad_ee_mumu
165-
WARNING: File exists /home/dmass/Development/madgraph4gpu/fix-arm-support/MG5aMC/TMPOUT/CODEGEN_mad_ee_mumu/Cards 
166-
WARNING: File exists /home/dmass/Development/madgraph4gpu/fix-arm-support/MG5aMC/TMPOUT/CODEGEN_mad_ee_mumu/SubProcesses 
163+
WARNING: File exists /home/dmass/Development/madgraph4gpu/release-v1.01.01/MG5aMC/TMPOUT/CODEGEN_mad_ee_mumu 
164+
INFO: Creating subdirectories in directory /home/dmass/Development/madgraph4gpu/release-v1.01.01/MG5aMC/TMPOUT/CODEGEN_mad_ee_mumu
165+
WARNING: File exists /home/dmass/Development/madgraph4gpu/release-v1.01.01/MG5aMC/TMPOUT/CODEGEN_mad_ee_mumu/Cards 
166+
WARNING: File exists /home/dmass/Development/madgraph4gpu/release-v1.01.01/MG5aMC/TMPOUT/CODEGEN_mad_ee_mumu/SubProcesses 
167167
INFO: Organizing processes into subprocess groups
168168
INFO: Generating Helas calls for process: e+ e- > mu+ mu- WEIGHTED<=4 @1
169169
INFO: Processing color information for process: e+ e- > mu+ mu- @1
@@ -179,18 +179,18 @@ INFO: Finding symmetric diagrams for subprocess group epem_mupmum
179179
DEBUG: iconfig_to_diag =  {1: 1, 2: 2} [model_handling.py at line 1576] 
180180
DEBUG: diag_to_iconfig =  {1: 1, 2: 2} [model_handling.py at line 1577] 
181181
Generated helas calls for 1 subprocesses (2 diagrams) in 0.004 s
182-
Wrote files for 8 helas calls in 0.058 s
182+
Wrote files for 8 helas calls in 0.060 s
183183
ALOHA: aloha starts to compute helicity amplitudes
184184
ALOHA: aloha creates FFV1 routines
185185
ALOHA: aloha creates FFV2 routines
186186
ALOHA: aloha creates FFV4 routines
187-
ALOHA: aloha creates 3 routines in 0.138 s
187+
ALOHA: aloha creates 3 routines in 0.170 s
188188
ALOHA: aloha starts to compute helicity amplitudes
189189
ALOHA: aloha creates FFV1 routines
190190
ALOHA: aloha creates FFV2 routines
191191
ALOHA: aloha creates FFV4 routines
192192
ALOHA: aloha creates FFV2_4 routines
193-
ALOHA: aloha creates 7 routines in 0.166 s
193+
ALOHA: aloha creates 7 routines in 0.184 s
194194
<class 'aloha.create_aloha.AbstractRoutine'> FFV1
195195
<class 'aloha.create_aloha.AbstractRoutine'> FFV1
196196
<class 'aloha.create_aloha.AbstractRoutine'> FFV2
@@ -199,31 +199,31 @@ ALOHA: aloha creates 7 routines in 0.166 s
199199
<class 'aloha.create_aloha.AbstractRoutine'> FFV4
200200
<class 'aloha.create_aloha.AbstractRoutine'> FFV2_4
201201
<class 'aloha.create_aloha.AbstractRoutine'> FFV2_4
202-
FileWriter <class 'MG5aMC_PLUGIN.CUDACPP_OUTPUT.model_handling.PLUGIN_CPPWriter'> for /home/dmass/Development/madgraph4gpu/fix-arm-support/MG5aMC/TMPOUT/CODEGEN_mad_ee_mumu/src/./HelAmps_sm.h
203-
INFO: Created file HelAmps_sm.h in directory /home/dmass/Development/madgraph4gpu/fix-arm-support/MG5aMC/TMPOUT/CODEGEN_mad_ee_mumu/src/.
202+
FileWriter <class 'MG5aMC_PLUGIN.CUDACPP_OUTPUT.model_handling.PLUGIN_CPPWriter'> for /home/dmass/Development/madgraph4gpu/release-v1.01.01/MG5aMC/TMPOUT/CODEGEN_mad_ee_mumu/src/./HelAmps_sm.h
203+
INFO: Created file HelAmps_sm.h in directory /home/dmass/Development/madgraph4gpu/release-v1.01.01/MG5aMC/TMPOUT/CODEGEN_mad_ee_mumu/src/.
204204
super_write_set_parameters_onlyfixMajorana (hardcoded=False)
205205
super_write_set_parameters_onlyfixMajorana (hardcoded=True)
206-
FileWriter <class 'MG5aMC_PLUGIN.CUDACPP_OUTPUT.model_handling.PLUGIN_CPPWriter'> for /home/dmass/Development/madgraph4gpu/fix-arm-support/MG5aMC/TMPOUT/CODEGEN_mad_ee_mumu/src/./Parameters_sm.h
207-
FileWriter <class 'MG5aMC_PLUGIN.CUDACPP_OUTPUT.model_handling.PLUGIN_CPPWriter'> for /home/dmass/Development/madgraph4gpu/fix-arm-support/MG5aMC/TMPOUT/CODEGEN_mad_ee_mumu/src/./Parameters_sm.cc
206+
FileWriter <class 'MG5aMC_PLUGIN.CUDACPP_OUTPUT.model_handling.PLUGIN_CPPWriter'> for /home/dmass/Development/madgraph4gpu/release-v1.01.01/MG5aMC/TMPOUT/CODEGEN_mad_ee_mumu/src/./Parameters_sm.h
207+
FileWriter <class 'MG5aMC_PLUGIN.CUDACPP_OUTPUT.model_handling.PLUGIN_CPPWriter'> for /home/dmass/Development/madgraph4gpu/release-v1.01.01/MG5aMC/TMPOUT/CODEGEN_mad_ee_mumu/src/./Parameters_sm.cc
208208
INFO: Created files Parameters_sm.h and Parameters_sm.cc in directory
209-
INFO: /home/dmass/Development/madgraph4gpu/fix-arm-support/MG5aMC/TMPOUT/CODEGEN_mad_ee_mumu/src/. and /home/dmass/Development/madgraph4gpu/fix-arm-support/MG5aMC/TMPOUT/CODEGEN_mad_ee_mumu/src/.
209+
INFO: /home/dmass/Development/madgraph4gpu/release-v1.01.01/MG5aMC/TMPOUT/CODEGEN_mad_ee_mumu/src/. and /home/dmass/Development/madgraph4gpu/release-v1.01.01/MG5aMC/TMPOUT/CODEGEN_mad_ee_mumu/src/.
210210
The option zerowidth_tchannel is modified [True] but will not be written in the configuration files.
211211
If you want to make this value the default for future session, you can run 'save options --all'
212-
save configuration file to /home/dmass/Development/madgraph4gpu/fix-arm-support/MG5aMC/TMPOUT/CODEGEN_mad_ee_mumu/Cards/me5_configuration.txt
212+
save configuration file to /home/dmass/Development/madgraph4gpu/release-v1.01.01/MG5aMC/TMPOUT/CODEGEN_mad_ee_mumu/Cards/me5_configuration.txt
213213
INFO: Use Fortran compiler gfortran
214214
INFO: Use c++ compiler g++
215215
INFO: Generate jpeg diagrams
216216
INFO: Generate web pages
217217
DEBUG: result.returncode =  0 [output.py at line 273] 
218-
Output to directory /home/dmass/Development/madgraph4gpu/fix-arm-support/MG5aMC/TMPOUT/CODEGEN_mad_ee_mumu done.
218+
Output to directory /home/dmass/Development/madgraph4gpu/release-v1.01.01/MG5aMC/TMPOUT/CODEGEN_mad_ee_mumu done.
219219
Type "launch" to generate events from this process, or see
220-
/home/dmass/Development/madgraph4gpu/fix-arm-support/MG5aMC/TMPOUT/CODEGEN_mad_ee_mumu/README
220+
/home/dmass/Development/madgraph4gpu/release-v1.01.01/MG5aMC/TMPOUT/CODEGEN_mad_ee_mumu/README
221221
Run "open index.html" to see more information about this process.
222222
quit
223223

224-
real 0m2.272s
225-
user 0m1.761s
226-
sys 0m0.429s
224+
real 0m2.396s
225+
user 0m1.798s
226+
sys 0m0.425s
227227
Code generation completed in 2 seconds
228228
************************************************************
229229
* *
@@ -245,9 +245,9 @@ Code generation completed in 2 seconds
245245
* Type 'help' for in-line help. *
246246
* *
247247
************************************************************
248-
INFO: load configuration from /home/dmass/Development/madgraph4gpu/fix-arm-support/MG5aMC/TMPOUT/CODEGEN_mad_ee_mumu/Cards/me5_configuration.txt
249-
INFO: load configuration from /home/dmass/Development/madgraph4gpu/fix-arm-support/MG5aMC/mg5amcnlo/input/mg5_configuration.txt
250-
INFO: load configuration from /home/dmass/Development/madgraph4gpu/fix-arm-support/MG5aMC/TMPOUT/CODEGEN_mad_ee_mumu/Cards/me5_configuration.txt
248+
INFO: load configuration from /home/dmass/Development/madgraph4gpu/release-v1.01.01/MG5aMC/TMPOUT/CODEGEN_mad_ee_mumu/Cards/me5_configuration.txt
249+
INFO: load configuration from /home/dmass/Development/madgraph4gpu/release-v1.01.01/MG5aMC/mg5amcnlo/input/mg5_configuration.txt
250+
INFO: load configuration from /home/dmass/Development/madgraph4gpu/release-v1.01.01/MG5aMC/TMPOUT/CODEGEN_mad_ee_mumu/Cards/me5_configuration.txt
251251
Using default eps viewer "evince". Set another one in ./input/mg5_configuration.txt
252252
Using default web browser "firefox". Set another one in ./input/mg5_configuration.txt
253253
treatcards run
@@ -274,9 +274,9 @@ launch in debug mode
274274
* Type 'help' for in-line help. *
275275
* *
276276
************************************************************
277-
INFO: load configuration from /home/dmass/Development/madgraph4gpu/fix-arm-support/MG5aMC/TMPOUT/CODEGEN_mad_ee_mumu/Cards/me5_configuration.txt
278-
INFO: load configuration from /home/dmass/Development/madgraph4gpu/fix-arm-support/MG5aMC/mg5amcnlo/input/mg5_configuration.txt
279-
INFO: load configuration from /home/dmass/Development/madgraph4gpu/fix-arm-support/MG5aMC/TMPOUT/CODEGEN_mad_ee_mumu/Cards/me5_configuration.txt
277+
INFO: load configuration from /home/dmass/Development/madgraph4gpu/release-v1.01.01/MG5aMC/TMPOUT/CODEGEN_mad_ee_mumu/Cards/me5_configuration.txt
278+
INFO: load configuration from /home/dmass/Development/madgraph4gpu/release-v1.01.01/MG5aMC/mg5amcnlo/input/mg5_configuration.txt
279+
INFO: load configuration from /home/dmass/Development/madgraph4gpu/release-v1.01.01/MG5aMC/TMPOUT/CODEGEN_mad_ee_mumu/Cards/me5_configuration.txt
280280
Using default eps viewer "evince". Set another one in ./input/mg5_configuration.txt
281281
Using default web browser "firefox". Set another one in ./input/mg5_configuration.txt
282282
treatcards param

epochX/cudacpp/ee_mumu.mad/Cards/me5_configuration.txt

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -235,7 +235,7 @@
235235
# pineappl = pineappl
236236

237237

238-
#mg5_path = /home/dmass/Development/madgraph4gpu/fix-arm-support/MG5aMC/mg5amcnlo
238+
#mg5_path = /home/dmass/Development/madgraph4gpu/release-v1.01.01/MG5aMC/mg5amcnlo
239239

240240
# MG5 MAIN DIRECTORY
241-
#mg5_path = /home/dmass/Development/madgraph4gpu/fix-arm-support/MG5aMC/mg5amcnlo
241+
#mg5_path = /home/dmass/Development/madgraph4gpu/release-v1.01.01/MG5aMC/mg5amcnlo

epochX/cudacpp/ee_mumu.mad/SubProcesses/MatrixElementKernels.cc

Lines changed: 8 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -250,23 +250,25 @@ namespace mg5amcCpu
250250
bool known = true;
251251
bool ok = __builtin_cpu_supports( "vsx" );
252252
const std::string tag = "powerpc vsx (128bit as in SSE4.2)";
253+
#elif defined __ARM_NEON__ // consider using __BUILTIN_CPU_SUPPORTS__
254+
bool known = false; // __builtin_cpu_supports is not supported
255+
// See https://gcc.gnu.org/onlinedocs/gcc/Basic-PowerPC-Built-in-Functions-Available-on-all-Configurations.html
256+
// See https://stackoverflow.com/q/62783908
257+
// See https://community.arm.com/arm-community-blogs/b/operating-systems-blog/posts/runtime-detection-of-cpu-features-on-an-armv8-a-cpu
258+
bool ok = true; // this is just an assumption!
259+
const std::string tag = "arm neon (128bit as in SSE4.2)";
253260
#elif defined( __x86_64__ ) || defined( __i386__ )
254261
bool known = true;
255262
bool ok = __builtin_cpu_supports( "sse4.2" );
256263
const std::string tag = "nehalem (SSE4.2)";
257264
#else // AV FIXME! Added by OM for Mac, should identify the correct __xxx__ flag that should be targeted
258-
// DM now we have an explicit NEON target for ARM
259-
bool known = false; // __builtin_cpu_supports is not supported
260-
bool ok = true; // this is just an assumption!
261-
const std::string tag = "simd arch not defined";
262-
#endif
263-
#elif defined __ARM_NEON__ // consider using __BUILTIN_CPU_SUPPORTS__
264265
bool known = false; // __builtin_cpu_supports is not supported
265266
// See https://gcc.gnu.org/onlinedocs/gcc/Basic-PowerPC-Built-in-Functions-Available-on-all-Configurations.html
266267
// See https://stackoverflow.com/q/62783908
267268
// See https://community.arm.com/arm-community-blogs/b/operating-systems-blog/posts/runtime-detection-of-cpu-features-on-an-armv8-a-cpu
268269
bool ok = true; // this is just an assumption!
269270
const std::string tag = "arm neon (128bit as in SSE4.2)";
271+
#endif
270272
#else
271273
bool known = true;
272274
bool ok = true;

epochX/cudacpp/ee_mumu.mad/SubProcesses/P1_epem_mupmum/check_sa.cc

Lines changed: 5 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -912,13 +912,13 @@ main( int argc, char** argv )
912912
#elif defined __SSE4_2__
913913
#ifdef __PPC__
914914
wrkflwtxt += "/ppcv";
915+
#elif defined __ARM_NEON__
916+
wrkflwtxt += "/neon";
915917
#else
916918
wrkflwtxt += "/sse4";
917919
#endif
918-
#elif defined __ARM_NEON__
919-
wrkflwtxt += "/neon";
920920
#else
921-
wrkflwtxt += "/????"; // no path to this statement
921+
wrkflwtxt += "/????"; // no path to this statement
922922
#endif
923923
// -- Has cxtype_v::operator[] bracket with non-const reference?
924924
#if defined MGONGPU_CPPSIMD
@@ -1028,12 +1028,11 @@ main( int argc, char** argv )
10281028
<< "Internal loops fptype_sv = VECTOR[" << neppV
10291029
#ifdef __PPC__
10301030
<< "] ('sse4': PPC VSX, 128bit)" << cxtref << std::endl
1031+
#elif defined __ARM_NEON__
1032+
<< "] ('sse4': ARM NEON, 128bit)" << cxtref << std::endl
10311033
#else
10321034
<< "] ('sse4': SSE4.2, 128bit)" << cxtref << std::endl
10331035
#endif
1034-
#elif defined __ARM_NEON__
1035-
<< "Internal loops fptype_sv = VECTOR[" << neppV
1036-
<< "] ('sse4': ARM NEON, 128bit)" << cxtref << std::endl
10371036
#else
10381037
#error Internal error: unknown SIMD build configuration
10391038
#endif

epochX/cudacpp/ee_mumu.mad/SubProcesses/cudacpp.mk

Lines changed: 3 additions & 15 deletions
Original file line numberDiff line numberDiff line change
@@ -60,7 +60,7 @@ endif
6060
ifeq ($(BACKEND),cppauto)
6161
ifeq ($(UNAME_P),ppc64le)
6262
override BACKEND = cppsse4
63-
else ifneq (,$(filter $(UNAME_P),arm aarch64))
63+
else ifeq ($(UNAME_P),arm)
6464
override BACKEND = cppsse4
6565
else ifeq ($(wildcard /proc/cpuinfo),)
6666
override BACKEND = cppnone
@@ -528,26 +528,14 @@ ifeq ($(UNAME_P),ppc64le)
528528
endif
529529
else ifeq ($(UNAME_P),arm)
530530
ifeq ($(BACKEND),cppsse4)
531-
override AVXFLAGS = -D__ARM_NEON__ # ARM NEON with 128 width (Q/quadword registers)
531+
override AVXFLAGS = -D__SSE4_2__ # ARM NEON with 128 width (Q/quadword registers)
532532
else ifeq ($(BACKEND),cppavx2)
533533
$(error Invalid SIMD BACKEND='$(BACKEND)': only 'cppnone' and 'cppsse4' are supported on ARM for the moment)
534534
else ifeq ($(BACKEND),cpp512y)
535535
$(error Invalid SIMD BACKEND='$(BACKEND)': only 'cppnone' and 'cppsse4' are supported on ARM for the moment)
536536
else ifeq ($(BACKEND),cpp512z)
537537
$(error Invalid SIMD BACKEND='$(BACKEND)': only 'cppnone' and 'cppsse4' are supported on ARM for the moment)
538538
endif
539-
else ifeq ($(UNAME_P),aarch64)
540-
ifeq ($(BACKEND),cppnone)
541-
override AVXFLAGS = -march=armv8-a+nosimd
542-
else ifeq ($(BACKEND),cppsse4)
543-
override AVXFLAGS = -march=armv8-a+simd -D__ARM_NEON__
544-
else ifeq ($(BACKEND),cppavx2)
545-
$(error Invalid SIMD BACKEND='$(BACKEND)': only 'cppnone' and 'cppsse4' are supported on aarch64 for the moment)
546-
else ifeq ($(BACKEND),cpp512y)
547-
$(error Invalid SIMD BACKEND='$(BACKEND)': only 'cppnone' and 'cppsse4' are supported on aarch64 for the moment)
548-
else ifeq ($(BACKEND),cpp512z)
549-
$(error Invalid SIMD BACKEND='$(BACKEND)': only 'cppnone' and 'cppsse4' are supported on aarch64 for the moment)
550-
endif
551539
else ifneq ($(shell $(CXX) --version | grep ^nvc++),) # support nvc++ #531
552540
ifeq ($(BACKEND),cppnone)
553541
override AVXFLAGS = -mno-sse3 # no SIMD
@@ -1104,7 +1092,7 @@ bld512z:
11041092
ifeq ($(UNAME_P),ppc64le)
11051093
###bldavxs: $(INCDIR)/fbridge.inc bldnone bldsse4
11061094
bldavxs: bldnone bldsse4
1107-
else ifneq (,$(filter $(UNAME_P),arm aarch64))
1095+
else ifeq ($(UNAME_P),arm)
11081096
###bldavxs: $(INCDIR)/fbridge.inc bldnone bldsse4
11091097
bldavxs: bldnone bldsse4
11101098
else

epochX/cudacpp/ee_mumu.mad/SubProcesses/cudacpp_overlay.mk

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -114,7 +114,7 @@ $(LIBS): .libs
114114
touch $@
115115

116116
$(CUDACPP_BUILDDIR)/.cudacpplibs:
117-
$(MAKE) VERBOSE=1 -f $(CUDACPP_MAKEFILE)
117+
$(MAKE) -f $(CUDACPP_MAKEFILE)
118118
touch $@
119119

120120
# Remove per-library recipes from makefile to avoid duplicate sub-makes
@@ -225,7 +225,7 @@ madevent_%_link:
225225
# Cudacpp bldall targets
226226
ifeq ($(UNAME_P),ppc64le)
227227
bldavxs: bldnone bldsse4
228-
else ifneq (,$(filter $(UNAME_P),arm aarch64))
228+
else ifeq ($(UNAME_P),arm)
229229
bldavxs: bldnone bldsse4
230230
else
231231
bldavxs: bldnone bldsse4 bldavx2 bld512y bld512z

epochX/cudacpp/ee_mumu.mad/src/mgOnGpuConfig.h

Lines changed: 1 addition & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -235,13 +235,7 @@ using mgOnGpu::fptype2;
235235
#else
236236
#define MGONGPU_CPPSIMD 8
237237
#endif
238-
#elif defined __SSE4_2__ // C++ "sse4" SSE4.2 (128-bit ie 16-byte): 2 (DOUBLE) or 4 (FLOAT) [Power9 default]
239-
#ifdef MGONGPU_FPTYPE_DOUBLE
240-
#define MGONGPU_CPPSIMD 2
241-
#else
242-
#define MGONGPU_CPPSIMD 4
243-
#endif
244-
#elif defined __ARM_NEON__ // C++ "sse4" ARM NEON (128-bit ie 16-byte): 2 (DOUBLE) or 4 (FLOAT) [ARM default]
238+
#elif defined __SSE4_2__ // C++ "sse4" SSE4.2 (128-bit ie 16-byte): 2 (DOUBLE) or 4 (FLOAT) [Power9 and ARM default]
245239
#ifdef MGONGPU_FPTYPE_DOUBLE
246240
#define MGONGPU_CPPSIMD 2
247241
#else

epochX/cudacpp/ee_mumu.mad/test/cudacpp_test.mk

Lines changed: 1 addition & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -7,13 +7,10 @@ THISDIR = $(dir $(abspath $(lastword $(MAKEFILE_LIST))))
77

88
# Host detection
99
UNAME_S := $(shell uname -s)
10-
UNAME_P := $(shell uname -p)
1110

12-
# Only add AVX2/FMA on non-mac and non-ARM hosts
11+
# Only add AVX2/FMA on non-mac hosts
1312
ifeq ($(UNAME_S),Darwin)
1413
GTEST_CMAKE_FLAGS :=
15-
else ifeq ($(UNAME_P),aarch64)
16-
GTEST_CMAKE_FLAGS :=
1714
else
1815
GTEST_CMAKE_FLAGS := -DCMAKE_CXX_FLAGS="-mavx2 -mfma"
1916
endif

0 commit comments

Comments
 (0)