Gentoo Archives: gentoo-commits

From:	Benda XU <heroxbd@g.o>
To:	gentoo-commits@l.g.o
Subject:	[gentoo-commits] proj/sci:master commit in: sci-libs/pytorch/, sci-libs/pytorch/files/
Date:	Fri, 07 Aug 2020 12:56:07
Message-Id:	`1596804958.a788dbf0de374240b116598b7a93881509258e24.heroxbd@gentoo`

1	commit: a788dbf0de374240b116598b7a93881509258e24
2	Author: Benda Xu <heroxbd <AT> gentoo <DOT> org>
3	AuthorDate: Fri Aug 7 12:55:50 2020 +0000
4	Commit: Benda XU <heroxbd <AT> gentoo <DOT> org>
5	CommitDate: Fri Aug 7 12:55:58 2020 +0000
6	URL: https://gitweb.gentoo.org/proj/sci.git/commit/?id=a788dbf0
7
8	sci-libs/pytorch: refresh cuda nccl patch for 1.6.0.
9
10	Package-Manager: Portage-2.3.88, Repoman-2.3.18
11	Signed-off-by: Benda Xu <heroxbd <AT> gentoo.org>
12
13	.../files/pytorch-1.6.0-nccl-nvccflags.patch | 27 ++++++++++++++++++++++
14	sci-libs/pytorch/pytorch-1.6.0.ebuild | 2 +-
15	2 files changed, 28 insertions(+), 1 deletion(-)
16
17	diff --git a/sci-libs/pytorch/files/pytorch-1.6.0-nccl-nvccflags.patch b/sci-libs/pytorch/files/pytorch-1.6.0-nccl-nvccflags.patch
18	new file mode 100644
19	index 000000000..052474ee4
20	--- /dev/null
21	+++ b/sci-libs/pytorch/files/pytorch-1.6.0-nccl-nvccflags.patch
22	@@ -0,0 +1,27 @@
23	+diff -uprN nccl-5949d96f36d050e59d05872f8bbffd2549318e95/makefiles/common.mk nccl-patched/makefiles/common.mk
24	+--- nccl-5949d96f36d050e59d05872f8bbffd2549318e95/makefiles/common.mk 2020-06-09 00:31:44.000000000 +0800
25	++++ nccl-patched/makefiles/common.mk 2020-08-06 21:25:57.784279738 +0800
26	+@@ -54,7 +54,7 @@ CXXFLAGS := -DCUDA_MAJOR=$(CUDA_MAJOR)
27	+ # Maxrregcount needs to be set accordingly to NCCL_MAX_NTHREADS (otherwise it will cause kernel launch errors)
28	+ # 512 : 120, 640 : 96, 768 : 80, 1024 : 60
29	+ # We would not have to set this if we used __launch_bounds__, but this only works on kernels, not on functions.
30	+-NVCUFLAGS := -ccbin $(CXX) $(NVCC_GENCODE) -std=c++11 -Xptxas -maxrregcount=96 -Xfatbin -compress-all
31	++NVCUFLAGS := $(NVCCFLAGS) $(NVCC_GENCODE) -std=c++11 -Xptxas -maxrregcount=96 -Xfatbin -compress-all
32	+ # Use addprefix so that we can specify more than one path
33	+ NVLDFLAGS := -L${CUDA_LIB} -lcudart -lrt
34	+
35	+@@ -68,14 +68,6 @@ NVLDFLAGS += ${GCOV_FLAGS:%=-Xcompiler
36	+ # $(warning GCOV_FLAGS=${GCOV_FLAGS})
37	+ ########## GCOV ##########
38	+
39	+-ifeq ($(DEBUG), 0)
40	+-NVCUFLAGS += -O3
41	+-CXXFLAGS += -O3 -g
42	+-else
43	+-NVCUFLAGS += -O0 -G -g
44	+-CXXFLAGS += -O0 -g -ggdb3
45	+-endif
46	+-
47	+ ifneq ($(VERBOSE), 0)
48	+ NVCUFLAGS += -Xptxas -v -Xcompiler -Wall,-Wextra,-Wno-unused-parameter
49	+ CXXFLAGS += -Wall -Wextra
50
51	diff --git a/sci-libs/pytorch/pytorch-1.6.0.ebuild b/sci-libs/pytorch/pytorch-1.6.0.ebuild
52	index c59b248e2..1394bdbe3 100644
53	--- a/sci-libs/pytorch/pytorch-1.6.0.ebuild
54	+++ b/sci-libs/pytorch/pytorch-1.6.0.ebuild
55	@@ -147,7 +147,7 @@ src_prepare() {
56
57	if use cuda; then
58	cd ../nccl || die
59	- eapply "${FILESDIR}"/${PN}-1.4.0-nccl-nvccflags.patch
60	+ eapply "${FILESDIR}"/${PN}-1.6.0-nccl-nvccflags.patch
61	ln -s . nccl || die
62
63	cuda_src_prepare

Report Message

Find on MARC Find on Google Groups