Welcome to mirror list, hosted at ThFree Co, Russian Federation.

github.com/marian-nmt/nccl.git - Unnamed repository; edit this file 'description' to name the repository.
summary | refs | log | tree | commit | diff
diff options
context:
space:
mode:
author: Boris Fomitchev <bfomitchev@nvidia.com>, 2017-03-24 21:58:14 +0300
committer: Boris Fomitchev <bfomitchev@nvidia.com>, 2017-03-24 21:58:14 +0300
commit: 649f04d07711440ec2699ce7ec1af4ab71d6dbf9 (patch)
tree: ec12e2bd231690350c6e6d31de909d7b552eb380
parent: 7fef264bfa3fce60907b1cd6808257c64e222604 (diff)
Added Pascal nvcc flags, bumped version (tag: v1.3.4-1)
-rw-r--r-- Makefile | 6
1 files changed, 4 insertions, 2 deletions
diff --git a/Makefile b/Makefile
index d0fe9b9..8f34fcb 100644
--- a/Makefile
+++ b/Makefile
@@ -20,7 +20,9 @@ NVCC ?= $(CUDA_HOME)/bin/nvcc
NVCC_GENCODE ?= -gencode=arch=compute_35,code=sm_35 \
-gencode=arch=compute_50,code=sm_50 \
-gencode=arch=compute_52,code=sm_52 \
- -gencode=arch=compute_52,code=compute_52
+ -gencode=arch=compute_60,code=sm_60\
+ -gencode=arch=compute_61,code=sm_61 \
+ -gencode=arch=compute_60,code=compute_60
CXXFLAGS := -I$(CUDA_INC) -fPIC -fvisibility=hidden
NVCUFLAGS := -ccbin $(CXX) $(NVCC_GENCODE) -lineinfo -std=c++11 -maxrregcount 96
@@ -52,7 +54,7 @@ endif
NCCL_MAJOR := 1
NCCL_MINOR := 3
-NCCL_PATCH := 3
+NCCL_PATCH := 4
CXXFLAGS += -DNCCL_MAJOR=$(NCCL_MAJOR) -DNCCL_MINOR=$(NCCL_MINOR) -DNCCL_PATCH=$(NCCL_PATCH)
CUDA_VERSION ?= $(shell ls $(CUDA_LIB)/libcudart.so.* | head -1 | rev | cut -d "." -f -2 | rev)