From 23f22d74f88b9cece7d5aaecc3813aad5fc88376 Mon Sep 17 00:00:00 2001 From: JUan ESCOBAR <juan.escobar@aero.obs-mip.fr> Date: Tue, 17 Nov 2020 16:21:12 +0100 Subject: [PATCH] Juan 17/11/2020: Rules.LXpgi2004.mk, for MANAGEDO2 compile spll_modd_halo_d.o without managed memory for real GPUDIRECT usage + minor modif --- src/Rules.LXpgi2004.mk | 12 +++++++----- 1 file changed, 7 insertions(+), 5 deletions(-) diff --git a/src/Rules.LXpgi2004.mk b/src/Rules.LXpgi2004.mk index c8f6b3297..d3c5f1039 100644 --- a/src/Rules.LXpgi2004.mk +++ b/src/Rules.LXpgi2004.mk @@ -20,7 +20,7 @@ CUDALEVEL=cuda10.1 # #Compute capability of GPU # -OPT_CPTCAP=cc35,cc50,cc70 +OPT_CPTCAP=cc35,cc50,cc60,cc70 #Aeropc45: cc50 #Nuwa: cc35 #Ouessant Firestone K80: cc35 @@ -42,9 +42,9 @@ OPT_PERF1 = -O1 OPT_PERF2 = -O2 # OPT_MANAGED = -Mframe -Mnostack_arrays -Mallocatable=95 -ta=host,tesla:nofma,$(OPT_CPTCAP),$(CUDALEVEL),managed $(OPT_INFO) $(OPT_PROF) -OPT_MULTICORE = -ta=multicore $(OPT_INFO) $(OPT_PROF) -OPT_NOOPENACC = -ta=host $(OPT_INFO) $(OPT_PROF) -OPT_OPENACC = -Mnostack_arrays -Mnostack_arrays -Mallocatable=95 -ta=host,tesla:nofma,$(OPT_CPTCAP),$(CUDALEVEL) $(OPT_INFO) $(OPT_PROF) +OPT_MULTICORE = -ta=multicore $(OPT_INFO) $(OPT_PROF) +OPT_NOOPENACC = -ta=host $(OPT_INFO) $(OPT_PROF) +OPT_OPENACC = -Mframe -Mnostack_arrays -Mallocatable=95 -ta=host,tesla:nofma,$(OPT_CPTCAP),$(CUDALEVEL) $(OPT_INFO) $(OPT_PROF) # OPT_CHECK = -C #-Mchkfpstk -Mchkptr OPT_I8 = -i8 @@ -102,7 +102,9 @@ OPT0 = $(OPT_BASE) $(OPT_MANAGED) $(OPT_PERF0) OPT_NOCB = $(OPT_BASE) $(OPT_MANAGED) $(OPT_PERF2) CXXFLAGS = -acc -Kieee -Mnofma $(OPT_MANAGED) OBJS_REPROD= spll_mode_sum_ll.o -$(OBJS_REPROD) : OPT = $(OPT_BASE) $(OPT_MANAGED) $(OPT_PERF2) -Mvect=nosimd -Minfo=all +$(OBJS_REPROD) : OPT = $(OPT_BASE) $(OPT_MANAGED) $(OPT_PERF2) -Mvect=nosimd -Minfo=all +OBJS_OPENACC = spll_modd_halo_d.o +$(OBJS_OPENACC) : OPT = $(OPT_BASE) $(OPT_OPENACC) $(OPT_PERF2) endif # ifeq "$(OPTLEVEL)" "MULTICORE" -- GitLab