Gentoo Archives: gentoo-commits

From: Andrew Ammerlaan <andrewammerlaan@g.o>
To: gentoo-commits@l.g.o
Subject: [gentoo-commits] proj/sci:master commit in: sci-libs/pytorch/, sci-libs/pytorch/files/
Date: Mon, 27 Dec 2021 11:50:48
Message-Id: 1640602864.fad64b065493a4406304cf7cb4d4aa36a7876555.andrewammerlaan@gentoo
1 commit: fad64b065493a4406304cf7cb4d4aa36a7876555
2 Author: Miezhiko <Miezhiko <AT> gmail <DOT> com>
3 AuthorDate: Mon Dec 27 10:56:29 2021 +0000
4 Commit: Andrew Ammerlaan <andrewammerlaan <AT> gentoo <DOT> org>
5 CommitDate: Mon Dec 27 11:01:04 2021 +0000
6 URL: https://gitweb.gentoo.org/proj/sci.git/commit/?id=fad64b06
7
8 sci-libs/pytorch: fixes for cuda USE flag, nccl update
9
10 Signed-off-by: Miezhiko <Miezhiko <AT> gmail.com>
11 Closes: https://github.com/gentoo/sci/pull/1132
12 Signed-off-by: Andrew Ammerlaan <andrewammerlaan <AT> gentoo.org>
13
14 .../files/pytorch-1.10.1-nccl-nvccflags.patch | 37 ++++++++++++++++++++++
15 sci-libs/pytorch/pytorch-1.10.1.ebuild | 7 ++--
16 2 files changed, 41 insertions(+), 3 deletions(-)
17
18 diff --git a/sci-libs/pytorch/files/pytorch-1.10.1-nccl-nvccflags.patch b/sci-libs/pytorch/files/pytorch-1.10.1-nccl-nvccflags.patch
19 new file mode 100644
20 index 000000000..0ac12a1e7
21 --- /dev/null
22 +++ b/sci-libs/pytorch/files/pytorch-1.10.1-nccl-nvccflags.patch
23 @@ -0,0 +1,37 @@
24 +From 7b04cd503fa1a6265893e0320ee246bcc0bd98cf Mon Sep 17 00:00:00 2001
25 +From: Miezhiko <Miezhiko@×××××.com>
26 +Date: Mon, 27 Dec 2021 14:48:12 +0400
27 +Subject: [PATCH] neutral flags
28 +
29 +---
30 + makefiles/common.mk | 10 +---------
31 + 1 file changed, 1 insertion(+), 9 deletions(-)
32 +
33 +diff --git a/makefiles/common.mk b/makefiles/common.mk
34 +index 64f8d2dc6..7a979c90f 100644
35 +--- a/makefiles/common.mk
36 ++++ b/makefiles/common.mk
37 +@@ -55,7 +55,7 @@ CXXFLAGS := -DCUDA_MAJOR=$(CUDA_MAJOR) -DCUDA_MINOR=$(CUDA_MINOR) -fPIC -fvisi
38 + # Maxrregcount needs to be set accordingly to NCCL_MAX_NTHREADS (otherwise it will cause kernel launch errors)
39 + # 512 : 120, 640 : 96, 768 : 80, 1024 : 60
40 + # We would not have to set this if we used __launch_bounds__, but this only works on kernels, not on functions.
41 +-NVCUFLAGS := -ccbin $(CXX) $(NVCC_GENCODE) -std=c++11 --expt-extended-lambda -Xptxas -maxrregcount=96 -Xfatbin -compress-all
42 ++NVCUFLAGS := $(NVCCFLAGS) $(NVCC_GENCODE) -std=c++11 --expt-extended-lambda -Xptxas -maxrregcount=96 -Xfatbin -compress-all
43 + # Use addprefix so that we can specify more than one path
44 + NVLDFLAGS := -L${CUDA_LIB} -lcudart -lrt
45 +
46 +@@ -69,14 +69,6 @@ NVLDFLAGS += ${GCOV_FLAGS:%=-Xcompiler %}
47 + # $(warning GCOV_FLAGS=${GCOV_FLAGS})
48 + ########## GCOV ##########
49 +
50 +-ifeq ($(DEBUG), 0)
51 +-NVCUFLAGS += -O3
52 +-CXXFLAGS += -O3 -g
53 +-else
54 +-NVCUFLAGS += -O0 -G -g
55 +-CXXFLAGS += -O0 -g -ggdb3
56 +-endif
57 +-
58 + ifneq ($(VERBOSE), 0)
59 + NVCUFLAGS += -Xptxas -v -Xcompiler -Wall,-Wextra,-Wno-unused-parameter
60 + CXXFLAGS += -Wall -Wextra
61
62 diff --git a/sci-libs/pytorch/pytorch-1.10.1.ebuild b/sci-libs/pytorch/pytorch-1.10.1.ebuild
63 index a7bbb62ac..948d595a7 100644
64 --- a/sci-libs/pytorch/pytorch-1.10.1.ebuild
65 +++ b/sci-libs/pytorch/pytorch-1.10.1.ebuild
66 @@ -28,7 +28,7 @@ https://github.com/facebookincubator/gloo/archive/c22a5cfba94edf8ea4f53a174d38aa
67 https://github.com/google/googletest/archive/e2239ee6043f73722e7aa812a459f54a28552929.tar.gz -> googletest-e2239ee6043f73722e7aa812a459f54a28552929.tar.gz
68 https://github.com/intel/ideep/archive/9ca27bbfd88fa1469cbf0467bd6f14cd1738fa40.tar.gz -> ideep-9ca27bbfd88fa1469cbf0467bd6f14cd1738fa40.tar.gz
69 https://github.com/intel/mkl-dnn/archive/5ef631a0.tar.gz -> mkl-dnn-5ef631a0.tar.gz
70 -cuda? ( https://github.com/NVIDIA/nccl/archive/033d7995.tar.gz -> nccl-033d7995.tar.gz )
71 +cuda? ( https://github.com/NVIDIA/nccl/archive/c5790b36722d5b41ee2a9b2bad69e364180ffd22.tar.gz -> nccl-c5790b36722d5b41ee2a9b2bad69e364180ffd22.tar.gz )
72 https://github.com/Maratyszcza/NNPACK/archive/c07e3a0400713d546e0dea2d5466dd22ea389c73.tar.gz -> NNPACK-c07e3a0400713d546e0dea2d5466dd22ea389c73.tar.gz
73 https://github.com/onnx/onnx/archive/a82c6a70.tar.gz -> onnx-a82c6a70.tar.gz
74 https://github.com/onnx/onnx-tensorrt/archive/c153211418a7c57ce071d9ce2a41f8d1c85a878f.tar.gz -> onnx-tensorrt-c153211418a7c57ce071d9ce2a41f8d1c85a878f.tar.gz
75 @@ -168,7 +168,7 @@ src_prepare() {
76 rmdir third_party/ideep/mkl-dnn || die
77 ln -sv "${WORKDIR}"/mkl-dnn-5ef631a030a6f73131c77892041042805a06064f third_party/ideep/mkl-dnn || die
78 rmdir third_party/nccl/nccl || die
79 - ln -sv "${WORKDIR}"/nccl-033d799524fb97629af5ac2f609de367472b2696 third_party/nccl/nccl || die
80 + ln -sv "${WORKDIR}"/nccl-c5790b36722d5b41ee2a9b2bad69e364180ffd22 third_party/nccl/nccl || die
81 rmdir third_party/NNPACK || die
82 ln -sv "${WORKDIR}"/NNPACK-c07e3a0400713d546e0dea2d5466dd22ea389c73 third_party/NNPACK || die
83 rmdir third_party/onnx || die
84 @@ -208,9 +208,10 @@ src_prepare() {
85
86 if use cuda; then
87 cd third_party/nccl/nccl || die
88 - eapply "${FILESDIR}"/${PN}-1.6.0-nccl-nvccflags.patch
89 + eapply "${FILESDIR}"/${PN}-1.10.1-nccl-nvccflags.patch
90 cuda_src_prepare
91 export CUDAHOSTCXX=$(cuda_gccdir)/g++
92 + cd "${S}"
93 fi
94
95 if use rocm; then