From 7f3db5af7739be0d763ac9f9e4b0d3fb22a1408d Mon Sep 17 00:00:00 2001 From: Juan ESCOBAR <juan.escobar@aero.obs-mip.fr> Date: Fri, 4 Nov 2022 15:33:59 +0100 Subject: [PATCH] Juan 04/11/2022: ZSOLVER/dotprod.f90, bit-reproducibility (Bitrep) problem with CCE >= 1402: move the scalar/sequential JK loop to the outermost level, otherwise cce/14.X will parallelize it --- src/ZSOLVER/dotprod.f90 | 14 ++++++++------ 1 file changed, 8 insertions(+), 6 deletions(-) diff --git a/src/ZSOLVER/dotprod.f90 b/src/ZSOLVER/dotprod.f90 index e473801b8..2c4791cc6 100644 --- a/src/ZSOLVER/dotprod.f90 +++ b/src/ZSOLVER/dotprod.f90 @@ -185,15 +185,17 @@ CALL MNH_MEM_GET(ZDOTPROD, ILBXB,ILBXE ,ILBYB,ILBYE ) #endif !$acc kernels present(ZDOTPROD) ZDOTPROD(:,:) = 0. -#ifdef MNH_COMPILER_NVHPC - !$acc loop independent collapse(2) -#endif - DO CONCURRENT (JI=ILBXB:ILBXE,JJ=ILBYB:ILBYE) - !$acc loop seq - DO JK = IKB-1,IKE+1 +!$acc loop seq +!dir nextscalar +DO JK = IKB-1,IKE+1 + !DO CONCURRENT (JI=ILBXB:ILBXE,JJ=ILBYB:ILBYE) + !$acc loop collapse(2) independent + DO JJ = ILBYB,ILBYE + DO JI = ILBXB,ILBXE ZDOTPROD(JI,JJ) = ZDOTPROD(JI,JJ) + PA(JI,JJ,JK) * PB(JI,JJ,JK) END DO END DO +END DO !$acc end kernels !$acc update host(ZDOTPROD) PDOTPROD = SUM_DD_R2_ll(ZDOTPROD) -- GitLab