mirror of
https://github.com/paboyle/Grid.git
synced 2024-11-09 23:45:36 +00:00
Add GPU specific simd targets
This commit is contained in:
parent
eb7d34a4cc
commit
7a4c142955
21
configure.ac
21
configure.ac
@ -251,6 +251,8 @@ esac
|
||||
##################### Compiler dependent choices
|
||||
case ${CXX} in
|
||||
nvcc)
|
||||
# CXX="nvcc -keep -v -x cu "
|
||||
# CXXLD="nvcc -v -link"
|
||||
CXX="nvcc -x cu "
|
||||
CXXLD="nvcc -link"
|
||||
CXXFLAGS="$CXXFLAGS -Xcompiler -fno-strict-aliasing"
|
||||
@ -264,6 +266,12 @@ esac
|
||||
case ${ax_cv_cxx_compiler_vendor} in
|
||||
clang|gnu)
|
||||
case ${ac_SIMD} in
|
||||
GPU)
|
||||
AC_DEFINE([GPU],[1],[GPU float4 vectors])
|
||||
SIMD_FLAGS='';;
|
||||
VGPU)
|
||||
AC_DEFINE([GPU_VEC],[1],[GPU vectorised 512bit])
|
||||
SIMD_FLAGS='';;
|
||||
SSE4)
|
||||
AC_DEFINE([SSE4],[1],[SSE4 intrinsics])
|
||||
case ${ac_SFW_FP16} in
|
||||
@ -313,6 +321,12 @@ case ${ax_cv_cxx_compiler_vendor} in
|
||||
esac;;
|
||||
intel)
|
||||
case ${ac_SIMD} in
|
||||
GPU)
|
||||
AC_DEFINE([GPU],[1],[GPU float4 vectors])
|
||||
SIMD_FLAGS='';;
|
||||
VGPU)
|
||||
AC_DEFINE([GPU_VEC],[1],[GPU vectorised ])
|
||||
SIMD_FLAGS='';;
|
||||
SSE4)
|
||||
AC_DEFINE([SSE4],[1],[SSE4 intrinsics])
|
||||
SIMD_FLAGS='-msse4.2 -xsse4.2';;
|
||||
@ -351,13 +365,6 @@ esac
|
||||
AM_CXXFLAGS="$SIMD_FLAGS $AM_CXXFLAGS"
|
||||
AM_CFLAGS="$SIMD_FLAGS $AM_CFLAGS"
|
||||
|
||||
case ${ac_SIMD} in
|
||||
AVX512|KNL)
|
||||
AC_DEFINE([TEST_ZMM],[1],[compile ZMM test]);;
|
||||
*)
|
||||
;;
|
||||
esac
|
||||
|
||||
############### Precision selection
|
||||
AC_ARG_ENABLE([precision],
|
||||
[AC_HELP_STRING([--enable-precision=single|double],
|
||||
|
Loading…
Reference in New Issue
Block a user