add latest CUDA arch to fix invalid device function errors
authorEvan Shelhamer <shelhamer@imaginarynumber.net>
Fri, 27 Jun 2014 15:47:42 +0000 (08:47 -0700)
committerEvan Shelhamer <shelhamer@imaginarynumber.net>
Fri, 27 Jun 2014 15:53:15 +0000 (08:53 -0700)
...on devices of that architecture.

Makefile.config.example

index 9754129..c41bada 100644 (file)
@@ -7,11 +7,15 @@ CUDA_DIR := /usr/local/cuda
 # "sudo apt-get install nvidia-cuda-toolkit" then use this instead:
 # CUDA_DIR := /usr
 
-# CUDA architecture setting: going with all of them.
+# CUDA architecture setting: going with all of them (up to CUDA 5.5 compatible).
+# For the latest architecture, you need to install CUDA >= 6.0 and uncomment
+# the *_50 lines below.
 CUDA_ARCH := -gencode arch=compute_20,code=sm_20 \
                -gencode arch=compute_20,code=sm_21 \
                -gencode arch=compute_30,code=sm_30 \
                -gencode arch=compute_35,code=sm_35
+               #-gencode=arch=compute_50,code=sm_50 \
+               #-gencode=arch=compute_50,code=compute_50
 
 # BLAS choice:
 # atlas for ATLAS (default)