# Patch summary for src/Rules.LXpgi2004.mk (git unified diff, three hunks).
#
# NOTE(review): the diff below is stored on a single physical line, so the
# original line breaks and intra-line spacing are not visible here. Several
# "-"/"+" pairs (OPT_MULTICORE, OPT_NOOPENACC, the $(OBJS_REPROD) rule) carry
# identical visible text; presumably they differ only in whitespace -- confirm
# against the original commit before re-applying.
#
# Hunk 1 (@@ -20,7 +20,7 @@):
#   OPT_CPTCAP gains cc60: cc35,cc50,cc70 -> cc35,cc50,cc60,cc70.
#   OPT_CPTCAP is interpolated into the -ta=host,tesla:... option of both
#   OPT_MANAGED and OPT_OPENACC, so the extra entry reaches both flag sets.
#
# Hunk 2 (@@ -42,9 +42,9 @@):
#   OPT_OPENACC: the duplicated "-Mnostack_arrays -Mnostack_arrays" prefix is
#   replaced by "-Mframe -Mnostack_arrays", the same leading flags that
#   OPT_MANAGED uses. Unlike OPT_MANAGED, its -ta= option has no ",managed".
#   OPT_MULTICORE and OPT_NOOPENACC are re-emitted with unchanged visible text.
#
# Hunk 3 (@@ -102,7 +102,9 @@):
#   Adds OBJS_OPENACC = spll_modd_halo_d.o together with a target-specific
#   assignment  $(OBJS_OPENACC) : OPT = $(OPT_BASE) $(OPT_OPENACC) $(OPT_PERF2)
#   so that object is built with OPT_OPENACC rather than the OPT_MANAGED set
#   used by the neighbouring OPT0 / OPT_NOCB / $(OBJS_REPROD) definitions.
#   The additions sit directly before an "endif"; the opening conditional is
#   outside this diff's context, so which OPTLEVEL branch they belong to
#   cannot be determined from here.
diff --git a/src/Rules.LXpgi2004.mk b/src/Rules.LXpgi2004.mk index c8f6b3297e9635e26f67fd99eb466dc00e456714..d3c5f1039a3b326e369807bf0a590ce2adddb7b5 100644 --- a/src/Rules.LXpgi2004.mk +++ b/src/Rules.LXpgi2004.mk @@ -20,7 +20,7 @@ CUDALEVEL=cuda10.1 # #Compute capability of GPU # -OPT_CPTCAP=cc35,cc50,cc70 +OPT_CPTCAP=cc35,cc50,cc60,cc70 #Aeropc45: cc50 #Nuwa: cc35 #Ouessant Firestone K80: cc35 @@ -42,9 +42,9 @@ OPT_PERF1 = -O1 OPT_PERF2 = -O2 # OPT_MANAGED = -Mframe -Mnostack_arrays -Mallocatable=95 -ta=host,tesla:nofma,$(OPT_CPTCAP),$(CUDALEVEL),managed $(OPT_INFO) $(OPT_PROF) -OPT_MULTICORE = -ta=multicore $(OPT_INFO) $(OPT_PROF) -OPT_NOOPENACC = -ta=host $(OPT_INFO) $(OPT_PROF) -OPT_OPENACC = -Mnostack_arrays -Mnostack_arrays -Mallocatable=95 -ta=host,tesla:nofma,$(OPT_CPTCAP),$(CUDALEVEL) $(OPT_INFO) $(OPT_PROF) +OPT_MULTICORE = -ta=multicore $(OPT_INFO) $(OPT_PROF) +OPT_NOOPENACC = -ta=host $(OPT_INFO) $(OPT_PROF) +OPT_OPENACC = -Mframe -Mnostack_arrays -Mallocatable=95 -ta=host,tesla:nofma,$(OPT_CPTCAP),$(CUDALEVEL) $(OPT_INFO) $(OPT_PROF) # OPT_CHECK = -C #-Mchkfpstk -Mchkptr OPT_I8 = -i8 @@ -102,7 +102,9 @@ OPT0 = $(OPT_BASE) $(OPT_MANAGED) $(OPT_PERF0) OPT_NOCB = $(OPT_BASE) $(OPT_MANAGED) $(OPT_PERF2) CXXFLAGS = -acc -Kieee -Mnofma $(OPT_MANAGED) OBJS_REPROD= spll_mode_sum_ll.o -$(OBJS_REPROD) : OPT = $(OPT_BASE) $(OPT_MANAGED) $(OPT_PERF2) -Mvect=nosimd -Minfo=all +$(OBJS_REPROD) : OPT = $(OPT_BASE) $(OPT_MANAGED) $(OPT_PERF2) -Mvect=nosimd -Minfo=all +OBJS_OPENACC = spll_modd_halo_d.o +$(OBJS_OPENACC) : OPT = $(OPT_BASE) $(OPT_OPENACC) $(OPT_PERF2) endif # ifeq "$(OPTLEVEL)" "MULTICORE"