Skip to content

Commit 63ddd4d

Browse files
authored
Merge pull request #780 from valassi/oct23av
Patches and test results over the latest PRs
2 parents 00dbc53 + f53166d commit 63ddd4d

591 files changed

Lines changed: 34691 additions & 28177 deletions

File tree

Some content is hidden

Large commits have some content hidden by default. Use the search box below to find content that may be hidden.

.github/workflows/c-cpp.yml

Lines changed: 10 additions & 10 deletions
Original file line number | Diff line number | Diff line change
@@ -15,40 +15,40 @@ jobs:
1515
fail-fast: false
1616
steps:
1717
- uses: actions/checkout@v2
18-
- name: make epoch1
18+
- name: make debug
1919
run: make -C ${{ matrix.folder }} debug
2020
CPU:
2121
runs-on: ubuntu-latest
2222
strategy:
2323
matrix:
24-
folder: [ epochX/cudacpp/ee_mumu.sa/SubProcesses/P1_Sigma_sm_epem_mupmum , epochX/cudacpp/gg_ttgg.sa/SubProcesses/P1_Sigma_sm_gg_ttxgg ]
24+
folder: [ epochX/cudacpp/ee_mumu.mad/SubProcesses/P1_epem_mupmum , epochX/cudacpp/gg_ttgg.mad/SubProcesses/P1_gg_ttxgg ]
2525
precision: [ d , f , m ]
2626
fail-fast: false
2727
steps:
2828
- uses: actions/checkout@v2
2929
- name: make info
30-
run: make FPTYPE=${{ matrix.precision }} -C ${{ matrix.folder }} info
30+
run: make FPTYPE=${{ matrix.precision }} -C ${{ matrix.folder }} -f cudacpp.mk info
3131
- name: make
3232
run: make FPTYPE=${{ matrix.precision }} -C ${{ matrix.folder }}
3333
- name: make check
34-
run: make FPTYPE=${{ matrix.precision }} -C ${{ matrix.folder }} check
34+
run: make FPTYPE=${{ matrix.precision }} -C ${{ matrix.folder }} -f cudacpp.mk check
3535
CPU_MAC:
3636
runs-on: macos-latest
3737
env:
3838
FC: gfortran-11
3939
strategy:
4040
matrix:
41-
folder: [ epochX/cudacpp/ee_mumu.sa/SubProcesses/P1_Sigma_sm_epem_mupmum, epochX/cudacpp/gg_ttgg.sa/SubProcesses/P1_Sigma_sm_gg_ttxgg ]
41+
folder: [ epochX/cudacpp/ee_mumu.mad/SubProcesses/P1_epem_mupmum, epochX/cudacpp/gg_ttgg.mad/SubProcesses/P1_gg_ttxgg ]
4242
precision: [ d , f , m ]
4343
fail-fast: false
4444
steps:
4545
- uses: actions/checkout@v2
4646
- name: make info
47-
run: make AVX=none OMPFLAGS= FPTYPE=${{ matrix.precision }} -C ${{ matrix.folder }} info
47+
run: make AVX=none OMPFLAGS= FPTYPE=${{ matrix.precision }} -C ${{ matrix.folder }} -f cudacpp.mk info
4848
- name: make
4949
run: make AVX=none OMPFLAGS= FPTYPE=${{ matrix.precision }} -C ${{ matrix.folder }}
5050
- name: make check
51-
run: make AVX=none OMPFLAGS= FPTYPE=${{ matrix.precision }} -C ${{ matrix.folder }} check
51+
run: make AVX=none OMPFLAGS= FPTYPE=${{ matrix.precision }} -C ${{ matrix.folder }} -f cudacpp.mk check
5252
GPU:
5353
runs-on: self-hosted
5454
env:
@@ -57,16 +57,16 @@ jobs:
5757
REQUIRE_CUDA: 1
5858
strategy:
5959
matrix:
60-
folder: [ epochX/cudacpp/ee_mumu.sa/SubProcesses/P1_Sigma_sm_epem_mupmum , epochX/cudacpp/gg_ttgg.sa/SubProcesses/P1_Sigma_sm_gg_ttxgg ]
60+
folder: [ epochX/cudacpp/ee_mumu.mad/SubProcesses/P1_epem_mupmum , epochX/cudacpp/gg_ttgg.mad/SubProcesses/P1_gg_ttxgg ]
6161
precision: [ d , f , m ]
6262
fail-fast: false
6363
steps:
6464
- uses: actions/checkout@v2
6565
- name: path
6666
run: echo "PATH=$PATH"
6767
- name: make info
68-
run: make FPTYPE=${{ matrix.precision }} -C ${{ matrix.folder }} info
68+
run: make FPTYPE=${{ matrix.precision }} -C ${{ matrix.folder }} -f cudacpp.mk info
6969
- name: make
7070
run: make FPTYPE=${{ matrix.precision }} -C ${{ matrix.folder }}
7171
- name: make check
72-
run: make FPTYPE=${{ matrix.precision }} -C ${{ matrix.folder }} check
72+
run: make FPTYPE=${{ matrix.precision }} -C ${{ matrix.folder }} -f cudacpp.mk check

epochX/cudacpp/CODEGEN/PLUGIN/CUDACPP_SA_OUTPUT/MG5aMC_patches/PROD/counters.cc

Lines changed: 1 addition & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -1,7 +1,7 @@
11
// Copyright (C) 2020-2023 CERN and UCLouvain.
22
// Licensed under the GNU Lesser General Public License (version 3 or later).
33
// Created by: A. Valassi (Dec 2022) for the MG5aMC CUDACPP plugin.
4-
// Further modified by: A. Valassi (2022-2023) for the MG5aMC CUDACPP plugin.
4+
// Further modified by: S. Hageboeck, A. Valassi (2022-2023) for the MG5aMC CUDACPP plugin.
55

66
#include "timer.h"
77
#define TIMERTYPE std::chrono::high_resolution_clock
@@ -40,7 +40,6 @@ extern "C"
4040
static float smatrix1_totaltime = 0;
4141
static mgOnGpu::Timer<TIMERTYPE> smatrix1multi_timer[nimplC];
4242
static float smatrix1multi_totaltime[nimplC] = { 0 };
43-
static int matrix1_counter = 0;
4443
static int smatrix1_counter = 0;
4544
static int smatrix1multi_counter[nimplC] = { 0 };
4645

epochX/cudacpp/CODEGEN/PLUGIN/CUDACPP_SA_OUTPUT/MG5aMC_patches/PROD/patch.P1

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -1,8 +1,8 @@
11
diff --git b/epochX/cudacpp/gg_tt.mad/SubProcesses/P1_gg_ttx/auto_dsig1.f a/epochX/cudacpp/gg_tt.mad/SubProcesses/P1_gg_ttx/auto_dsig1.f
2-
index 27ed1439e..3b24a9924 100644
2+
index 880769442..5a3da931f 100644
33
--- b/epochX/cudacpp/gg_tt.mad/SubProcesses/P1_gg_ttx/auto_dsig1.f
44
+++ a/epochX/cudacpp/gg_tt.mad/SubProcesses/P1_gg_ttx/auto_dsig1.f
5-
@@ -469,23 +469,140 @@ C
5+
@@ -484,23 +484,140 @@ C
66
INTEGER VECSIZE_USED
77

88
INTEGER IVEC
@@ -284,7 +284,7 @@ index 71fbf2b25..0f1d199fc 100644
284284
open(unit=lun,file=tempname,status='old',ERR=20)
285285
fopened=.true.
286286
diff --git b/epochX/cudacpp/gg_tt.mad/SubProcesses/P1_gg_ttx/matrix1.f a/epochX/cudacpp/gg_tt.mad/SubProcesses/P1_gg_ttx/matrix1.f
287-
index 3ac962688..ef18aff22 100644
287+
index 3ac962688..daea73a6d 100644
288288
--- b/epochX/cudacpp/gg_tt.mad/SubProcesses/P1_gg_ttx/matrix1.f
289289
+++ a/epochX/cudacpp/gg_tt.mad/SubProcesses/P1_gg_ttx/matrix1.f
290290
@@ -72,7 +72,10 @@ C

epochX/cudacpp/CODEGEN/PLUGIN/CUDACPP_SA_OUTPUT/MG5aMC_patches/PROD/patch.common

Lines changed: 36 additions & 26 deletions
Original file line number | Diff line number | Diff line change
@@ -13,7 +13,7 @@ index a59181c70..af7e0efbc 100644
1313
PARAMETER(MAXTRIES=25)
1414
C To pass the helicity configuration chosen by the DiscreteSampler to
1515
diff --git b/epochX/cudacpp/gg_tt.mad/Source/makefile a/epochX/cudacpp/gg_tt.mad/Source/makefile
16-
index 617f10b93..dbe08b846 100644
16+
index 617f10b93..00c73099a 100644
1717
--- b/epochX/cudacpp/gg_tt.mad/Source/makefile
1818
+++ a/epochX/cudacpp/gg_tt.mad/Source/makefile
1919
@@ -120,7 +120,7 @@ $(LIBDIR)libiregi.a: $(IREGIDIR)
@@ -37,12 +37,11 @@ index 617f10b93..dbe08b846 100644
3737
+ for i in `ls -d ../SubProcesses/P*`; do cd $$i; make cleanavxs; cd -; done;
3838
+cleanall: cleanSource # THIS IS THE ONE
3939
+ for i in `ls -d ../SubProcesses/P*`; do cd $$i; make cleanavxs; cd -; done;
40-
+
4140
diff --git b/epochX/cudacpp/gg_tt.mad/SubProcesses/makefile a/epochX/cudacpp/gg_tt.mad/SubProcesses/makefile
42-
index 348c283be..74db44d84 100644
41+
index 348c283be..65369d610 100644
4342
--- b/epochX/cudacpp/gg_tt.mad/SubProcesses/makefile
4443
+++ a/epochX/cudacpp/gg_tt.mad/SubProcesses/makefile
45-
@@ -1,6 +1,22 @@
44+
@@ -1,6 +1,28 @@
4645
+SHELL := /bin/bash
4746
+
4847
include ../../Source/make_opts
@@ -54,6 +53,12 @@ index 348c283be..74db44d84 100644
5453
+# Compile counters with -O3 as in the cudacpp makefile (avoid being "unfair" to Fortran #740)
5554
+CXXFLAGS = -O3 -Wall -Wshadow -Wextra
5655
+
56+
+# Add -std=c++17 explicitly to avoid build errors on macOS
57+
+# Add -mmacosx-version-min=11.3 to avoid "ld: warning: object file was built for newer macOS version than being linked"
58+
+ifneq ($(shell $(CXX) --version | egrep '^Apple clang'),)
59+
+CXXFLAGS += -std=c++17 -mmacosx-version-min=11.3
60+
+endif
61+
+
5762
+# Enable ccache if USECCACHE=1
5863
+ifeq ($(USECCACHE)$(shell echo $(CXX) | grep ccache),1)
5964
+ override CXX:=ccache $(CXX)
@@ -65,7 +70,7 @@ index 348c283be..74db44d84 100644
6570
# Load additional dependencies of the bias module, if present
6671
ifeq (,$(wildcard ../bias_dependencies))
6772
BIASDEPENDENCIES =
68-
@@ -24,7 +40,26 @@ else
73+
@@ -24,7 +46,26 @@ else
6974
MADLOOP_LIB =
7075
endif
7176

@@ -81,19 +86,19 @@ index 348c283be..74db44d84 100644
8186
+CUDACPP_MAKEENV:=$(shell echo '$(.VARIABLES)' | tr " " "\n" | egrep "(USEBUILDDIR|AVX|FPTYPE|HELINL|HRDCOD)")
8287
+###$(info CUDACPP_MAKEENV=$(CUDACPP_MAKEENV))
8388
+###$(info $(foreach v,$(CUDACPP_MAKEENV),$(v)="$($(v))"))
84-
+CUDACPP_BUILDDIR:=$(shell $(MAKE) $(foreach v,$(CUDACPP_MAKEENV),$(v)="$($(v))") -f $(CUDACPP_MAKEFILE) -pn 2>/dev/null | awk '/Building/{print $$3}' | sed s/BUILDDIR=//)
85-
+#ifeq ($(CUDACPP_BUILDDIR),)
86-
+#$(error CUDACPP_BUILDDIR='$(CUDACPP_BUILDDIR)' should not be empty!)
87-
+#else
89+
+CUDACPP_BUILDDIR:=$(shell $(MAKE) $(foreach v,$(CUDACPP_MAKEENV),$(v)="$($(v))") -f $(CUDACPP_MAKEFILE) -pn 2>&1 | awk '/Building/{print $$3}' | sed s/BUILDDIR=//)
90+
+ifeq ($(CUDACPP_BUILDDIR),)
91+
+$(error CUDACPP_BUILDDIR='$(CUDACPP_BUILDDIR)' should not be empty!)
92+
+else
8893
+$(info CUDACPP_BUILDDIR='$(CUDACPP_BUILDDIR)')
89-
+#endif
94+
+endif
9095
+CUDACPP_COMMONLIB=mg5amc_common
9196
+CUDACPP_CXXLIB=mg5amc_$(processid_short)_cpp
9297
+CUDACPP_CULIB=mg5amc_$(processid_short)_cuda
9398

9499
LIBS = $(LIBDIR)libbias.$(libext) $(LIBDIR)libdhelas.$(libext) $(LIBDIR)libdsample.$(libext) $(LIBDIR)libgeneric.$(libext) $(LIBDIR)libpdf.$(libext) $(LIBDIR)libgammaUPC.$(libext) $(LIBDIR)libmodel.$(libext) $(LIBDIR)libcernlib.$(libext) $(MADLOOP_LIB) $(LOOP_LIBS)
95100

96-
@@ -43,41 +78,112 @@ ifeq ($(strip $(MATRIX_HEL)),)
101+
@@ -43,41 +84,117 @@ ifeq ($(strip $(MATRIX_HEL)),)
97102
endif
98103

99104

@@ -113,7 +118,12 @@ index 348c283be..74db44d84 100644
113118

114119
-$(PROG): $(PROCESS) auto_dsig.o $(LIBS) $(MATRIX)
115120
- $(FC) -o $(PROG) $(PROCESS) $(MATRIX) $(LINKLIBS) $(LDFLAGS) $(BIASDEPENDENCIES) -fopenmp
116-
+#LDFLAGS+=-Wl,--no-relax # avoid 'failed to convert GOTPCREL relocation' error #458 (flag not universal -> skip?)
121+
+ifeq ($(UNAME),Darwin)
122+
+LDFLAGS += -lc++ # avoid 'Undefined symbols' for chrono::steady_clock on macOS (checked with otool -L libmg5amc_gg_ttx_cpp.so)
123+
+LDFLAGS += -mmacosx-version-min=11.3 # avoid "ld: warning: object file was built for newer macOS version than being linked"
124+
+else
125+
+LDFLAGS += -Wl,--no-relax # avoid 'failed to convert GOTPCREL relocation' error #458 (not supported on macOS)
126+
+endif
117127

118128
-$(PROG)_forhel: $(PROCESS) auto_dsig.o $(LIBS) $(MATRIX_HEL)
119129
- $(FC) -o $(PROG)_forhel $(PROCESS) $(MATRIX_HEL) $(LINKLIBS) $(LDFLAGS) $(BIASDEPENDENCIES) -fopenmp
@@ -128,8 +138,8 @@ index 348c283be..74db44d84 100644
128138
+else ifneq ($(shell $(CXX) --version | egrep '^clang'),)
129139
+override OMPFLAGS = -fopenmp
130140
+$(CUDACPP_BUILDDIR)/$(PROG)_cpp: LINKLIBS += -L $(shell dirname $(shell $(CXX) -print-file-name=libc++.so)) -lomp # see #604
131-
+###else ifneq ($(shell $(CXX) --version | egrep '^Apple clang'),)
132-
+###override OMPFLAGS = -fopenmp # OMP is not supported yet by cudacpp for Apple clang
141+
+else ifneq ($(shell $(CXX) --version | egrep '^Apple clang'),)
142+
+override OMPFLAGS = # OMP is not supported yet by cudacpp for Apple clang
133143
+else
134144
+override OMPFLAGS = -fopenmp
135145
+endif
@@ -166,24 +176,24 @@ index 348c283be..74db44d84 100644
166176
+madevent_fortran_link: $(PROG)_fortran
167177
+ rm -f $(PROG)
168178
+ ln -s $(PROG)_fortran $(PROG)
169-
+
179+
180+
-$(LIBDIR)libpdf.$(libext):
181+
- cd ../../Source/PDF; make
170182
+madevent_cpp_link: $(CUDACPP_BUILDDIR)/$(PROG)_cpp
171183
+ rm -f $(PROG)
172184
+ ln -s $(CUDACPP_BUILDDIR)/$(PROG)_cpp $(PROG)
173-
+
185+
186+
-$(LIBDIR)libgammaUPC.$(libext):
187+
- cd ../../Source/PDF/gammaUPC; make
174188
+madevent_cuda_link: $(CUDACPP_BUILDDIR)/$(PROG)_cuda
175189
+ rm -f $(PROG)
176190
+ ln -s $(CUDACPP_BUILDDIR)/$(PROG)_cuda $(PROG)
177-
178-
-$(LIBDIR)libpdf.$(libext):
179-
- cd ../../Source/PDF; make
191+
+
180192
+# Building $(PROG)_cpp also builds $(PROG)_cuda if $(CUDACPP_CULIB) exists (improved patch for cpp-only builds #503)
181193
+$(CUDACPP_BUILDDIR)/$(PROG)_cpp: $(PROCESS) $(DSIG_cudacpp) auto_dsig.o $(LIBS) $(MATRIX) counters.o ompnumthreads.o $(CUDACPP_BUILDDIR)/.cudacpplibs
182194
+ $(FC) -o $(CUDACPP_BUILDDIR)/$(PROG)_cpp $(PROCESS) $(DSIG_cudacpp) auto_dsig.o $(MATRIX) $(LINKLIBS) $(BIASDEPENDENCIES) $(OMPFLAGS) counters.o ompnumthreads.o -L$(LIBDIR)/$(CUDACPP_BUILDDIR) -l$(CUDACPP_COMMONLIB) -l$(CUDACPP_CXXLIB) $(LIBFLAGSRPATH) $(LDFLAGS)
183195
+ if [ -f $(LIBDIR)/$(CUDACPP_BUILDDIR)/lib$(CUDACPP_CULIB).* ]; then $(FC) -o $(CUDACPP_BUILDDIR)/$(PROG)_cuda $(PROCESS) $(DSIG_cudacpp) auto_dsig.o $(MATRIX) $(LINKLIBS) $(BIASDEPENDENCIES) $(OMPFLAGS) counters.o ompnumthreads.o -L$(LIBDIR)/$(CUDACPP_BUILDDIR) -l$(CUDACPP_COMMONLIB) -l$(CUDACPP_CULIB) $(LIBFLAGSRPATH) $(LDFLAGS); fi
184-
185-
-$(LIBDIR)libgammaUPC.$(libext):
186-
- cd ../../Source/PDF/gammaUPC; make
196+
+
187197
+$(CUDACPP_BUILDDIR)/$(PROG)_cuda: $(CUDACPP_BUILDDIR)/$(PROG)_cpp
188198
+
189199
+counters.o: counters.cc timer.h
@@ -222,7 +232,7 @@ index 348c283be..74db44d84 100644
222232

223233
# Dependencies
224234

225-
@@ -97,5 +203,61 @@ unwgt.o: genps.inc nexternal.inc symswap.inc cluster.inc run.inc message.inc \
235+
@@ -97,5 +214,61 @@ unwgt.o: genps.inc nexternal.inc symswap.inc cluster.inc run.inc message.inc \
226236
run_config.inc
227237
initcluster.o: message.inc
228238

@@ -287,10 +297,10 @@ index 348c283be..74db44d84 100644
287297
+distclean: cleanall # Clean all fortran and cudacpp builds as well as the googletest installation
288298
+ $(MAKE) -f $(CUDACPP_MAKEFILE) distclean
289299
diff --git b/epochX/cudacpp/gg_tt.mad/bin/internal/gen_ximprove.py a/epochX/cudacpp/gg_tt.mad/bin/internal/gen_ximprove.py
290-
index 4dd71db86..3b8ec3121 100755
300+
index ebbc1ac1d..a88d60b28 100755
291301
--- b/epochX/cudacpp/gg_tt.mad/bin/internal/gen_ximprove.py
292302
+++ a/epochX/cudacpp/gg_tt.mad/bin/internal/gen_ximprove.py
293-
@@ -380,8 +380,20 @@ class gensym(object):
303+
@@ -385,8 +385,20 @@ class gensym(object):
294304
done = True
295305
if not done:
296306
raise Exception('Parsing error in gensym: %s' % stdout)
@@ -314,7 +324,7 @@ index 4dd71db86..3b8ec3121 100755
314324
self.submit_to_cluster(job_list)
315325
job_list = {}
316326
diff --git b/epochX/cudacpp/gg_tt.mad/bin/internal/madevent_interface.py a/epochX/cudacpp/gg_tt.mad/bin/internal/madevent_interface.py
317-
index a056d3861..b70b548e5 100755
327+
index 389b93ab8..d72270289 100755
318328
--- b/epochX/cudacpp/gg_tt.mad/bin/internal/madevent_interface.py
319329
+++ a/epochX/cudacpp/gg_tt.mad/bin/internal/madevent_interface.py
320330
@@ -3614,8 +3614,20 @@ Beware that this can be dangerous for local multicore runs.""")

epochX/cudacpp/CODEGEN/PLUGIN/CUDACPP_SA_OUTPUT/launch_plugin.py

Lines changed: 13 additions & 19 deletions
Original file line number | Diff line number | Diff line change
@@ -1,3 +1,7 @@
1+
# Copyright (C) 2020-2023 CERN and UCLouvain.
2+
# Licensed under the GNU Lesser General Public License (version 3 or later).
3+
# Created by: O. Mattelaer (Aug 2023) for the MG5aMC CUDACPP plugin.
4+
# Further modified by: O. Mattelaer, A. Valassi (2023) for the MG5aMC CUDACPP plugin.
15

26
import logging
37
import os
@@ -19,22 +23,15 @@
1923
import madgraph.various.banner as banner_mod
2024

2125
class CPPMEInterface(madevent_interface.MadEventCmdShell):
22-
2326
def compile(self, *args, **opts):
2427
""" """
25-
2628
import multiprocessing
2729
if not self.options['nb_core'] or self.options['nb_core'] == 'None':
2830
self.options['nb_core'] = multiprocessing.cpu_count()
29-
3031
if args and args[0][0] == 'madevent' and hasattr(self, 'run_card'):
3132
import pathlib
3233
import os
3334
pjoin = os.path.join
34-
35-
36-
37-
3835
cudacpp_backend = self.run_card['cudacpp_backend'].upper() # the default value is defined in banner.py
3936
logger.info("Building madevent in madevent_interface.py with '%s' matrix elements"%cudacpp_backend)
4037
if cudacpp_backend == 'FORTRAN':
@@ -50,15 +47,14 @@ def compile(self, *args, **opts):
5047
return misc.compile(nb_core=self.options['nb_core'], *args, **opts)
5148

5249
class CPPRunCard(banner_mod.RunCardLO):
53-
5450
def reset_simd(self, old_value, new_value, name):
5551
if not hasattr(self, 'path'):
56-
raise Exception
57-
52+
logger.warning('WARNING! CPPRunCard instance has no attribute path')
53+
return
54+
###raise Exception('INTERNAL ERROR! CPPRunCard instance has no attribute path')
5855
if name == "vector_size" and new_value <= int(old_value):
5956
# code can handle the new size -> do not recompile
6057
return
61-
6258
Sourcedir = pjoin(os.path.dirname(os.path.dirname(self.path)), 'Source')
6359
subprocess.call(['make', 'cleanavx'], cwd=Sourcedir, stdout=subprocess.DEVNULL, stderr=subprocess.DEVNULL)
6460

@@ -68,33 +64,31 @@ def plugin_input(self, finput):
6864
def default_setup(self):
6965
super().default_setup()
7066
self.add_param('cudacpp_backend', 'CPP', include=False, hidden=False)
71-
7267

7368
def write_one_include_file(self, output_dir, incname, output_file=None):
7469
"""write one include file at the time"""
75-
7670
if incname == "vector.inc" and 'vector_size' not in self.user_set:
7771
return
7872
super().write_one_include_file(output_dir, incname, output_file)
7973

80-
8174
def check_validity(self):
8275
"""ensure that PLUGIN information are consistent"""
83-
8476
super().check_validity()
85-
8677
if self['SDE_strategy'] != 1:
8778
logger.warning('SDE_strategy different of 1 is not supported with SMD/GPU mode')
8879
self['sde_strategy'] = 1
89-
9080
if self['hel_recycling']:
9181
self['hel_recycling'] = False
9282

9383
class GPURunCard(CPPRunCard):
94-
9584
def default_setup(self):
9685
super(CPPRunCard, self).default_setup()
9786
self.add_param('cudacpp_backend', 'CUDA', include=False, hidden=False)
98-
87+
88+
#class CUDACPPRunCard(CPPRunCard):
89+
# def default_setup(self):
90+
# super(CPPRunCard, self).default_setup()
91+
# self.add_param('cudacpp_backend', 'CPP', include=False, hidden=False)
92+
9993
MEINTERFACE = CPPMEInterface
10094
RunCard = CPPRunCard

epochX/cudacpp/CODEGEN/PLUGIN/CUDACPP_SA_OUTPUT/madgraph/iolibs/template_files/gpu/MatrixElementKernels.cc

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -116,7 +116,7 @@ namespace mg5amcCpu
116116
bool known = true;
117117
bool ok = __builtin_cpu_supports( "sse4.2" );
118118
const std::string tag = "nehalem (SSE4.2)";
119-
#else
119+
#else // AV FIXME! Added by OM for Mac, should identify the correct __xxx__ flag that should be targeted
120120
bool known = false; // __builtin_cpu_supports is not supported
121121
// See https://gcc.gnu.org/onlinedocs/gcc/Basic-PowerPC-Built-in-Functions-Available-on-all-Configurations.html
122122
// See https://stackoverflow.com/q/62783908

0 commit comments

Comments
 (0)