Added -Mlarge_arrays to, and removed -r8 from, the F90 flags for PGI. Modified the makefile of the GPU Eigensolver accordingly.

This commit is contained in:
Pietro Bonfa 2018-04-06 10:36:59 +02:00
parent b60d563cfa
commit 466c74bd94
2 changed files with 6 additions and 6 deletions

View File

@@ -1,8 +1,8 @@
include ../../make.inc
FLAGS = -O3 -mp -pgf90libs -Mcuda=cc$(GPU_ARCH),cuda$(CUDA_RUNTIME),ptxinfo -Mlarge_arrays
FLAGS2 = -O3 -mp -pgf90libs -Mcuda=cc$(GPU_ARCH),cuda$(CUDA_RUNTIME),ptxinfo,nollvm -Mlarge_arrays
FLAGS3 = -O3 -mp -pgf90libs -Mcuda=cc$(GPU_ARCH),cuda$(CUDA_RUNTIME),ptxinfo,maxregcount:64,nollvm -Mlarge_arrays
FLAGS = -pgf90libs -Mcuda=cc$(GPU_ARCH),cuda$(CUDA_RUNTIME),ptxinfo $(F90FLAGS)
FLAGS2 = -pgf90libs -Mcuda=cc$(GPU_ARCH),cuda$(CUDA_RUNTIME),ptxinfo,nollvm $(F90FLAGS)
FLAGS3 = -pgf90libs -Mcuda=cc$(GPU_ARCH),cuda$(CUDA_RUNTIME),ptxinfo,maxregcount:64,nollvm $(F90FLAGS)
# Use this FLAGS2 if compiling on Power system
#FLAGS2 = -O1 -mp -pgf90libs -Mcuda=cc$(GPU_ARCH),cuda$(CUDA_RUNTIME),ptxinfo,maxregcount:64,nollvm -Mlarge_arrays

View File

@@ -69,9 +69,9 @@ x86_64:nagfor* )
;;
ia32:pgf* | ia64:pgf* | x86_64:pgf* )
try_fflags_nomain="-Mnomain"
try_fflags="-fast -r8"
try_fflags="-fast"
try_fflags_openmp="-mp"
try_f90flags="-fast -r8 -Mcache_align -Mpreprocess"
try_f90flags="-fast -Mcache_align -Mpreprocess -Mlarge_arrays"
try_fflags_noopt="-O0"
try_ldflags=""
try_ldflags_openmp="-mp"