[arch-commits] Commit in nccl/trunk (PKGBUILD)

Konstantin Gizdov kgizdov at archlinux.org
Wed Jun 23 15:30:03 UTC 2021


    Date: Wednesday, June 23, 2021 @ 15:30:02
  Author: kgizdov
Revision: 967074

upgpkg: nccl 2.9.9-2: remove unneeded PTX JIT compile units

Modified:
  nccl/trunk/PKGBUILD

----------+
 PKGBUILD |   20 ++++++++------------
 1 file changed, 8 insertions(+), 12 deletions(-)

Modified: PKGBUILD
===================================================================
--- PKGBUILD	2021-06-23 14:53:19 UTC (rev 967073)
+++ PKGBUILD	2021-06-23 15:30:02 UTC (rev 967074)
@@ -4,7 +4,7 @@
 pkgname=nccl
 pkgver=2.9.9
 _upstr_pkgrel=1
-pkgrel=1
+pkgrel=2
 pkgdesc='Library for NVIDIA multi-GPU and multi-node collective communication primitives'
 arch=('x86_64')
 url='https://developer.nvidia.com/nccl/'
@@ -30,26 +30,22 @@
 build() {
   cd "$pkgname"
 
+  # https://docs.nvidia.com/cuda/turing-compatibility-guide/index.html
+  # each nvcc -gencode flag targets one of two output kinds:
+  ## PTX virtual arch: -gencode=arch=compute_XX,code=compute_XX
+  ## binary cubin arch: -gencode=arch=compute_XX,code=sm_XX
+  # every listed arch gets a native cubin (code=sm_XX), so no PTX is needed;
+  # dropping PTX improves performance and reduces linking issues
   export NVCC_GENCODE="-gencode=arch=compute_52,code=sm_52 \
-                       -gencode=arch=compute_52,code=compute_52 \
                        -gencode=arch=compute_53,code=sm_53 \
-                       -gencode=arch=compute_53,code=compute_53 \
                        -gencode=arch=compute_60,code=sm_60 \
-                       -gencode=arch=compute_60,code=compute_60 \
                        -gencode=arch=compute_61,code=sm_61 \
-                       -gencode=arch=compute_61,code=compute_61 \
                        -gencode=arch=compute_62,code=sm_62 \
-                       -gencode=arch=compute_62,code=compute_62 \
                        -gencode=arch=compute_70,code=sm_70 \
-                       -gencode=arch=compute_70,code=compute_70 \
                        -gencode=arch=compute_72,code=sm_72 \
-                       -gencode=arch=compute_72,code=compute_72 \
                        -gencode=arch=compute_75,code=sm_75 \
-                       -gencode=arch=compute_75,code=compute_75 \
                        -gencode=arch=compute_80,code=sm_80 \
-                       -gencode=arch=compute_80,code=compute_80 \
-                       -gencode=arch=compute_86,code=sm_86 \
-                       -gencode=arch=compute_86,code=compute_86"
+                       -gencode=arch=compute_86,code=sm_86"
 
   make CUDA_HOME=/opt/cuda PREFIX=/usr src.build
 }



More information about the arch-commits mailing list