-
Notifications
You must be signed in to change notification settings - Fork 108
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
- ignore temp files generated by Cray Fortran - workaround Cray not having reduce
- Loading branch information
1 parent
3a0fec6
commit 8bda56d
Showing
7 changed files
with
39 additions
and
25 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
|
@@ -20,6 +20,8 @@ src/fortran/BabelStream.* | |
*.gz | ||
*.a | ||
*.mod | ||
*.cub | ||
*.ptx | ||
|
||
KokkosCore_config.* | ||
|
||
|
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
|
@@ -101,6 +101,7 @@ subroutine copy() | |
do i=1,N | ||
C(i) = A(i) | ||
end do | ||
!$omp barrier | ||
end subroutine copy | ||
|
||
subroutine add() | ||
|
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -1,13 +1,6 @@ | ||
#!/bin/bash | ||
|
||
for compiler in oneapi ; do | ||
for implementation in DoConcurrent Array OpenMP OpenMPWorkshare OpenMPTarget OpenMPTargetLoop OpenMPTaskloop ; do | ||
make COMPILER=${compiler} IMPLEMENTATION=${implementation} | ||
done | ||
done | ||
#exit | ||
for compiler in nvhpc ; do | ||
for implementation in DoConcurrent Array OpenMP OpenMPWorkshare OpenMPTarget OpenMPTargetLoop OpenMPTaskloop OpenACC OpenACCArray CUDA CUDAKernel ; do | ||
make COMPILER=${compiler} IMPLEMENTATION=${implementation} | ||
done | ||
compiler=cray | ||
for implementation in DoConcurrent Array OpenMP OpenMPWorkshare OpenMPTarget OpenMPTargetLoop OpenMPTaskloop OpenACC OpenACCArray ; do | ||
make COMPILER=${compiler} IMPLEMENTATION=${implementation} | ||
done |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,16 @@ | ||
# Compiler settings for the Cray Fortran toolchain.
# Presumably pulled in by the main Makefile when COMPILER=cray is given
# (the include mechanism is not visible here -- confirm against the Makefile).

# Compiler driver and the flags applied to every build.
FC := ftn
FCFLAGS = -e F -O3

# One flag set per IMPLEMENTATION; the including Makefile is expected to pick
# the matching one. Empty values mean no extra flags are needed.
DOCONCURRENT_FLAG = -h thread_do_concurrent -DCRAY_THREAD_DOCONCURRENT
ARRAY_FLAG = -h autothread
OPENMP_FLAG = -h omp
OPENACC_FLAG = -h acc
CUDA_FLAG =
SEQUENTIAL_FLAG =

# Fail early for the CUDA Fortran implementations, which this compiler cannot
# build. The scripts that drive this build spell the kernel variant
# "CUDAKernel"; "CUDAKernels" is rejected as well so that either spelling
# stops with a clear message instead of a compile failure.
# $(filter ...) expands to non-empty only when IMPLEMENTATION is one of the
# listed names, so an unset IMPLEMENTATION passes through untouched.
ifneq ($(filter CUDA CUDAKernel CUDAKernels,$(IMPLEMENTATION)),)
  $(error IMPLEMENTATION=$(IMPLEMENTATION) is not supported by this compiler.)
endif
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -1,22 +1,18 @@ | ||
#!/bin/bash | ||
|
||
export KMP_HW_PLACES=1s,4c,1t | ||
export KMP_HW_SUBSET=1s,4c,1t | ||
export KMP_AFFINITY=compact,granularity=fine #,verbose | ||
M=64 | ||
|
||
compiler=cray | ||
# CPU | ||
for compiler in oneapi ; do | ||
for implementation in DoConcurrent Array OpenMP OpenMPWorkshare OpenMPTaskloop ; do | ||
if [ -f BabelStream.${compiler}.${implementation} ] ; then | ||
./BabelStream.${compiler}.${implementation} -s $((1024*1024*64)) | ||
fi | ||
done | ||
for implementation in DoConcurrent Array OpenMP OpenMPWorkshare OpenMPTaskloop ; do | ||
if [ -f BabelStream.${compiler}.${implementation} ] ; then | ||
./BabelStream.${compiler}.${implementation} -s $((1024*1024*${M})) | ||
fi | ||
done | ||
exit | ||
# GPU | ||
for compiler in nvhpc ; do | ||
for implementation in DoConcurrent OpenMPTarget OpenMPTargetLoop OpenACC OpenACCArray CUDA CUDAKernel ; do | ||
if [ -f BabelStream.${compiler}.${implementation} ] ; then | ||
./BabelStream.${compiler}.${implementation} -s $((1024*1024*64)) | ||
fi | ||
done | ||
for implementation in OpenMPTarget OpenMPTargetLoop OpenACC OpenACCArray ; do | ||
if [ -f BabelStream.${compiler}.${implementation} ] ; then | ||
./BabelStream.${compiler}.${implementation} -s $((1024*1024*${M})) | ||
fi | ||
done |