Cycles: Make kernel compilable for 3.7 compute capability

It is used by GK210 GPUs, which can be found in, e.g., the Tesla K80.
This commit is contained in:
Sergey Sharybin 2016-01-28 11:56:09 +01:00
parent 0834015b74
commit ff0dcc5d70
1 changed files with 12 additions and 0 deletions

View File

@ -65,6 +65,18 @@
#define CUDA_KERNEL_MAX_REGISTERS 63
#define CUDA_KERNEL_BRANCHED_MAX_REGISTERS 63
/* 3.7 -- per the commit message: GK210 GPUs, found in e.g. the Tesla K80. */
#elif __CUDA_ARCH__ == 370
/* Limits for this architecture.
 * NOTE(review): "MULTIPRESSOR" looks like a typo for "MULTIPROCESSOR", but
 * the neighbouring 5.x branch uses the same spelling, so it must stay as-is
 * unless every definition and use is renamed together.
 * NOTE(review): NVIDIA's compute-capability table appears to list 128K
 * 32-bit registers per multiprocessor for 3.7; 65536 may be a deliberately
 * conservative value -- confirm before changing. */
#define CUDA_MULTIPRESSOR_MAX_REGISTERS 65536
#define CUDA_MULTIPROCESSOR_MAX_BLOCKS 16
#define CUDA_BLOCK_MAX_THREADS 1024
#define CUDA_THREAD_MAX_REGISTERS 255
/* tunable parameters
 * NOTE(review): presumably a block is WIDTH x WIDTH threads and the register
 * caps feed the kernels' launch bounds -- the consumers of these macros are
 * not visible in this chunk; verify there. */
#define CUDA_THREADS_BLOCK_WIDTH 16
#define CUDA_KERNEL_MAX_REGISTERS 63
#define CUDA_KERNEL_BRANCHED_MAX_REGISTERS 63
/* 5.0, 5.2 and 5.3 */
#elif __CUDA_ARCH__ == 500 || __CUDA_ARCH__ == 520 || __CUDA_ARCH__ == 530
#define CUDA_MULTIPRESSOR_MAX_REGISTERS 65536