diff options
author | Willem Jan Palenstijn <WillemJan.Palenstijn@uantwerpen.be> | 2014-04-04 10:21:05 +0000 |
---|---|---|
committer | wpalenst <WillemJan.Palenstijn@uantwerpen.be> | 2014-04-04 10:21:05 +0000 |
commit | 1eba5d772d768ce06ada5fbf2422a2bd4eae4fe0 (patch) | |
tree | e1d289ede093cb91adbca7b5b03b0f5581307865 /build/linux/acinclude.m4 | |
parent | 2895e27613dab0815e9f0f2f0ed7853d31f856b4 (diff) | |
download | astra-1eba5d772d768ce06ada5fbf2422a2bd4eae4fe0.tar.gz astra-1eba5d772d768ce06ada5fbf2422a2bd4eae4fe0.tar.bz2 astra-1eba5d772d768ce06ada5fbf2422a2bd4eae4fe0.tar.xz astra-1eba5d772d768ce06ada5fbf2422a2bd4eae4fe0.zip |
Detect arch/gencode options for nvcc
Diffstat (limited to 'build/linux/acinclude.m4')
-rw-r--r-- | build/linux/acinclude.m4 | 34 |
1 files changed, 34 insertions, 0 deletions
diff --git a/build/linux/acinclude.m4 b/build/linux/acinclude.m4 index 5027e85..b6c1b2d 100644 --- a/build/linux/acinclude.m4 +++ b/build/linux/acinclude.m4 @@ -72,3 +72,37 @@ $NVCC -c -o conftest.o conftest.cu $$2 >conftest.nvcc.out 2>&1 || { } rm -f conftest.cu conftest.o conftest.nvcc.out ]) + +dnl ASTRA_FIND_NVCC_ARCHS(archs-to-try,cppflags-to-extend,output-list) +dnl Architectures should be of the form 10, 20, 30, 35, +dnl and should be in order. The last accepted one will be used for PTX output. +dnl All accepted ones will be used for cubin output. +AC_DEFUN([ASTRA_FIND_NVCC_ARCHS],[ +cat >conftest.cu <<_ACEOF +#include <iostream> +int main() { + std::cout << "Test" << std::endl; + return 0; +} +_ACEOF +NVCC_lastarch="none" +NVCC_extra="" +NVCC_list="" +for arch in $1; do + NVCC_opt="-gencode=arch=compute_$arch,code=sm_$arch" + $NVCC -c -o conftest.o conftest.cu $$2 $NVCC_opt >conftest.nvcc.out 2>&1 && { + NVCC_lastarch=$arch + NVCC_extra="$NVCC_extra $NVCC_opt" + NVCC_list="$NVCC_list $arch" + } +done +if test $NVCC_lastarch != none; then + NVCC_extra="$NVCC_extra -gencode=arch=compute_${NVCC_lastarch},code=compute_${NVCC_lastarch}" + $3="$NVCC_list" + $2="$$2 $NVCC_extra" +else + $3="none" +fi +rm -f conftest.cu conftest.o conftest.nvcc.out +]) + |