Cycles: Fixed compilation of CUDA kernels. Follow-up fix for my last commit.

This commit is contained in:
Stefan Werner
2017-11-21 10:43:40 +01:00
parent d8f80fbe72
commit 58a15b2bfe

View File

@@ -73,13 +73,14 @@
/* tunable parameters */
#  define CUDA_THREADS_BLOCK_WIDTH 16
/* CUDA 9.0 seems to cause slowdowns on high-end Pascal cards unless we
 * increase the number of registers, so a CUDA 9 build targeting
 * __CUDA_ARCH__ >= 600 gets 64 registers; every other configuration keeps 48.
 *
 * CUDA_KERNEL_MAX_REGISTERS is deliberately defined exactly once, inside this
 * conditional: an unconditional definition ahead of it would be redefined
 * with a different value whenever the first branch is taken. */
#  if __CUDACC_VER_MAJOR__ == 9 && __CUDA_ARCH__ >= 600
#    define CUDA_KERNEL_MAX_REGISTERS 64
#  else
#    define CUDA_KERNEL_MAX_REGISTERS 48
#  endif
#  define CUDA_KERNEL_BRANCHED_MAX_REGISTERS 63
/* unknown architecture */
#else