From e37d28a082e5702a16c3e53e28f6daeb9bc59103 Mon Sep 17 00:00:00 2001 From: Andrea Bocci Date: Wed, 6 Mar 2024 18:40:56 +0100 Subject: [PATCH 01/10] Update CMake to version 3.28.3 Force the use of libssl and libcrypto instead of libmd. --- cmake.spec | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/cmake.spec b/cmake.spec index b814180bf82..fef389afdc4 100644 --- a/cmake.spec +++ b/cmake.spec @@ -1,4 +1,4 @@ -### RPM external cmake 3.25.2 +### RPM external cmake 3.28.3 %define downloaddir %(echo %realversion | cut -d. -f1,2) Source: http://www.cmake.org/files/v%{downloaddir}/%n-%realversion.tar.gz Requires: bz2lib curl expat zlib @@ -20,6 +20,7 @@ cat > build-flags.cmake <<- EOF SET(BUILD_CursesDialog FALSE CACHE BOOL "" FORCE) # Use system libraries, not cmake bundled ones. + SET(CMAKE_USE_OPENSSL TRUE CACHE BOOL "" FORCE) SET(CMAKE_USE_SYSTEM_LIBRARY_CURL TRUE CACHE BOOL "" FORCE) SET(CMAKE_USE_SYSTEM_LIBRARY_ZLIB TRUE CACHE BOOL "" FORCE) SET(CMAKE_USE_SYSTEM_LIBRARY_BZIP2 TRUE CACHE BOOL "" FORCE) From bc61a992005cdf5a7dbd76b999b767d91b6588ea Mon Sep 17 00:00:00 2001 From: Andrea Bocci Date: Thu, 7 Mar 2024 12:06:12 +0100 Subject: [PATCH 02/10] Backport a fix for CMake 3.27 from Geant4 v11.2.0 --- geant4.spec | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/geant4.spec b/geant4.spec index 01f3f149777..6d53449ed97 100644 --- a/geant4.spec +++ b/geant4.spec @@ -2,7 +2,7 @@ ## INCLUDE compilation_flags ## INCLUDE compilation_flags_lto ## INCLUDE cpp-standard -%define tag 2d5992376773d172321f01710a82943ead5bb435 +%define tag 0f1b33cb3d004830d88b4f9fab2c12b31ed69164 %define branch cms/v%{realversion} %define github_user cms-externals Source: git+https://github.com/%github_user/%{n}.git?obj=%{branch}/%{tag}&export=%{n}.%{realversion}&output=/%{n}.%{realversion}-%{tag}.tgz From 55f003a5fbbbc06257bc89e15be9f5f359fc9b37 Mon Sep 17 00:00:00 2001 From: Andrea Bocci Date: Wed, 6 Mar 2024 09:00:13 +0100 Subject: [PATCH 03/10] Update to CUDA 12.4.0 Update to CUDA 12.4.0: * CUDA runtime version 12.4.99 * NVIDIA drivers version 550.54.14 See https://docs.nvidia.com/cuda/archive/12.4.0/cuda-toolkit-release-notes/index.html for the full CUDA 12.4.0 release notes and change log. --- cuda.spec | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/cuda.spec b/cuda.spec index e1e033c6bd4..f890c878cf5 100644 --- a/cuda.spec +++ b/cuda.spec @@ -1,8 +1,8 @@ -### RPM external cuda 12.2.1 +### RPM external cuda 12.4.0 ## INITENV +PATH LD_LIBRARY_PATH %i/lib64 %define runpath_opts -m compute-sanitizer -m drivers -m nvvm -%define driversversion 535.86.10 +%define driversversion 550.54.14 %ifarch x86_64 Source0: https://developer.download.nvidia.com/compute/cuda/%{realversion}/local_installers/%{n}_%{realversion}_%{driversversion}_linux.run From ce0b96aa9f41ec4585c3651af196b35b664ba5f6 Mon Sep 17 00:00:00 2001 From: Andrea Bocci Date: Sat, 9 Mar 2024 17:32:44 +0100 Subject: [PATCH 04/10] Force CUDA to consider only the major/minor version of GCC Works around a problem in the GCC version checks inside cudafe++, where GCC 12.3.1 is not recognised as equivalent to GCC 12.3.0. Rename the CUDA-related flags to avoid potential problems when adding, removing or reordering them. --- cuda-compatible-runtime.spec | 4 ++-- cuda-flags.file | 27 +++++++++++++++++---------- llvm.spec | 4 ++-- scram-tools.file/tool-env.file | 2 +- 4 files changed, 22 insertions(+), 15 deletions(-) diff --git a/cuda-compatible-runtime.spec b/cuda-compatible-runtime.spec index 54c4b2f11ab..8c6b40ad960 100644 --- a/cuda-compatible-runtime.spec +++ b/cuda-compatible-runtime.spec @@ -11,11 +11,11 @@ Requires: cuda %build ## INCLUDE cuda-flags -# defines nvcc_stdcxx and cuda_flags_4 +# defines nvcc_flags_stdcxx and nvcc_flags_cuda_archs rm -rf %{_builddir}/build && mkdir %{_builddir}/build if - $CUDA_ROOT/bin/nvcc %{nvcc_stdcxx} -O2 -g %{cuda_flags_4} test.cu -I $CUDA_ROOT/include -L $CUDA_ROOT/lib64 -L $CUDA_ROOT/lib64/stubs --cudart static -ldl -lrt --compiler-options '-Wall -pthread' -o %{_builddir}/build/cuda-compatible-runtime + $CUDA_ROOT/bin/nvcc %{nvcc_flags_stdcxx} -O2 -g %{nvcc_flags_cuda_archs} test.cu -I $CUDA_ROOT/include -L $CUDA_ROOT/lib64 -L $CUDA_ROOT/lib64/stubs --cudart static -ldl -lrt --compiler-options '-Wall -pthread' -o %{_builddir}/build/cuda-compatible-runtime then true else diff --git a/cuda-flags.file b/cuda-flags.file index 8a2e4f9910f..149fc4c917f 100644 --- a/cuda-flags.file +++ b/cuda-flags.file @@ -5,32 +5,39 @@ # build support for Pascal (6.x), Volta (7.0), Turing (7.5), Ampere (8.x) and Lovelace (8.9) %define cuda_arch 60 70 75 80 89 +# LIBOMPTARGET_NVPTX_COMPUTE_CAPABILITIES style for listing the supported CUDA compute architectures +%define omptarget_cuda_archs %(echo $(for ARCH in %cuda_arch; do echo "$ARCH"; done) | sed -e"s/ /,/g") + # LLVM style for listing the supported CUDA compute architectures -%define llvm_cuda_arch %(echo $(for ARCH in %cuda_arch; do echo "$ARCH"; done) | sed -e"s/ /,/g") +%define llvm_flags_cuda_archs %(echo $(for ARCH in %cuda_arch; do echo "--offload-arch=sm_$ARCH"; done)) -Wunknown-cuda-version # C++ standard to use for building host and device code with nvcc -%define nvcc_stdcxx -std=c++%{cms_cxx_standard} +%define nvcc_flags_stdcxx -std=c++%{cms_cxx_standard} # generate optimised code -%define cuda_flags_0 -O3 +%define nvcc_flags_opt -O3 # generate debugging information for device code -%define cuda_flags_1 --generate-line-info --source-in-ptx --display-error-number +%define nvcc_flags_debug --generate-line-info --source-in-ptx --display-error-number # imply __host__, __device__ attributes in constexpr functions -%define cuda_flags_2 --expt-relaxed-constexpr +%define nvcc_flags_constexpr --expt-relaxed-constexpr # allow __host__, __device__ attributes in lambda declaration -%define cuda_flags_3 --extended-lambda +%define nvcc_flags_lambda --extended-lambda # build support for the various compute architectures -%define cuda_flags_4 %(echo $(for ARCH in %cuda_arch; do echo "-gencode arch=compute_$ARCH,code=[sm_$ARCH,compute_$ARCH]"; done)) -Wno-deprecated-gpu-targets +%define nvcc_flags_cuda_archs %(echo $(for ARCH in %cuda_arch; do echo "-gencode arch=compute_$ARCH,code=[sm_$ARCH,compute_$ARCH]"; done)) -Wno-deprecated-gpu-targets # disable warnings about attributes on defaulted methods -%define cuda_flags_5 -Xcudafe --diag_suppress=esa_on_defaulted_function_ignored +%define nvcc_flags_cudafe_diag -Xcudafe --diag_suppress=esa_on_defaulted_function_ignored + +# override the version of GCC passed to cudafe++ +%define override_gnu_version $(gcc -dumpfullversion | { IFS=.; read MAJOR MINOR PATCH; echo $(((MAJOR * 100 + MINOR) * 100)); }) +%define nvcc_flags_gnu_version -Xcudafe --gnu_version=%{override_gnu_version} # link the CUDA runtime shared library -%define cuda_flags_6 --cudart shared +%define nvcc_flags_cudart --cudart shared # collect all CUDA flags -%define nvcc_cuda_flags %{nvcc_stdcxx} %{cuda_flags_0} %{cuda_flags_1} %{cuda_flags_2} %{cuda_flags_3} %{cuda_flags_4} %{cuda_flags_5} %{cuda_flags_6} +%define nvcc_cuda_flags %{nvcc_flags_stdcxx} %{nvcc_flags_opt} %{nvcc_flags_debug} %{nvcc_flags_constexpr} %{nvcc_flags_lambda} %{nvcc_flags_cuda_archs} %{nvcc_flags_cudafe_diag} %{nvcc_flags_gnu_version} %{nvcc_flags_cudart} diff --git a/llvm.spec b/llvm.spec index ac0b0f434b2..0aa8e47c3ea 100644 --- a/llvm.spec +++ b/llvm.spec @@ -29,7 +29,7 @@ sed -ibak '/add_clang_subdirectory(libclang)/a add_subdirectory(include-what-you %build ## INCLUDE cuda-flags -# defines llvm_cuda_arch +# defines omptarget_cuda_archs rm -rf %{_builddir}/build mkdir -p %{_builddir}/build @@ -51,7 +51,7 @@ cmake %{_builddir}/llvm-%{realversion}-%{llvmCommit}/llvm \ -DLLVM_HOST_TRIPLE=$(gcc -dumpmachine) \ -DLLVM_TARGETS_TO_BUILD:STRING="X86;PowerPC;AArch64;NVPTX" \ -DLIBOMPTARGET_NVPTX_ALTERNATE_HOST_COMPILER=/usr/bin/gcc \ - -DLIBOMPTARGET_NVPTX_COMPUTE_CAPABILITIES="%llvm_cuda_arch" \ + -DLIBOMPTARGET_NVPTX_COMPUTE_CAPABILITIES="%omptarget_cuda_archs" \ -DCMAKE_REQUIRED_INCLUDES="${ZLIB_ROOT}/include" \ -DCMAKE_PREFIX_PATH="${ZLIB_ROOT}" diff --git a/scram-tools.file/tool-env.file b/scram-tools.file/tool-env.file index f0c3dbebd85..8e5deeacf44 100644 --- a/scram-tools.file/tool-env.file +++ b/scram-tools.file/tool-env.file @@ -13,7 +13,7 @@ export COMPILER_CXXFLAGS="%{arch_build_flags}" export COMPILER_WARNINGS="%{?warning_flags}" export ORACLE_ENV_ROOT="" export CUDA_FLAGS="%{nvcc_cuda_flags}" -export CUDA_HOST_CXXFLAGS="%{nvcc_stdcxx}" +export CUDA_HOST_CXXFLAGS="%{nvcc_flags_stdcxx}" export LTO_FLAGS="%{?lto_build_flags}" export PGO_FLAGS="%{?pgo_build_flags}" if [ $(echo ' %requiredtools ' | grep ' python3 ' |wc -l) -gt 0 ] ; then export PYTHON3_LIB_SITE_PACKAGES ; fi From 9ea2ee5e7a838e0ea6fb501089a8bac435900cce Mon Sep 17 00:00:00 2001 From: Andrea Bocci Date: Wed, 20 Dec 2023 10:47:53 +0100 Subject: [PATCH 05/10] Update NVIDIA gdrcopy to v2.4.1 Changes in v2.4.1: - add support for persistent mapping - fix bug in src/gdrdrv/Makefile - fix compile-time bug when check.h is not found Changes in v2.4: - various bug fixes in the test and benchmark applications - prefix all applications with "gdrcopy_" - introduce more unit tests in gdrcopy_sanity - introduce gdrcopy_pplat benchmark application - remove dependency on libcheck and libsubunit - introduce gdr_get_info_v2 - introduce new copy algorithm for device mappings - add support for NVIDIA BLUEFIELD-3 - add support for Linux kernel >= 6.3 - add support for SLES and OpenSUSE - add support for systemd service on RHEL9 - relicense gdrdrv to Dual MIT/GPL - fix bugs in gdrdrv when pinning two small buffers back-to-back - add support for coherent platforms such as Grace-Hopper - add support for Confidential Computing (CC) --- gdrcopy.spec | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/gdrcopy.spec b/gdrcopy.spec index 1828f5c4267..5776d73d80c 100644 --- a/gdrcopy.spec +++ b/gdrcopy.spec @@ -1,4 +1,4 @@ -### RPM external gdrcopy 2.3 +### RPM external gdrcopy 2.4.1 ## INITENV +PATH LD_LIBRARY_PATH %i/lib64 Source: https://github.com/NVIDIA/%{n}/archive/v%{realversion}.tar.gz Requires: cuda From 548439fd3d4afe662a30b2151ddddcd527c57342 Mon Sep 17 00:00:00 2001 From: Andrea Bocci Date: Wed, 6 Mar 2024 18:40:24 +0100 Subject: [PATCH 06/10] Update cuDNN to version 8.9 for CUDA 12 See https://docs.nvidia.com/deeplearning/cudnn/archives/cudnn-897/release-notes/index.html for the release notes and change log. --- cudnn.spec | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/cudnn.spec b/cudnn.spec index df73c079f95..801f83eeca1 100644 --- a/cudnn.spec +++ b/cudnn.spec @@ -1,4 +1,4 @@ -### RPM external cudnn 8.8.0.121 +### RPM external cudnn 8.9.7.29 ## INITENV +PATH LD_LIBRARY_PATH %i/lib64 %define cudaver 12 From 17d8a46d34218931951b3d8330e2f3575281663b Mon Sep 17 00:00:00 2001 From: Andrea Bocci Date: Wed, 6 Mar 2024 18:42:54 +0100 Subject: [PATCH 07/10] Update ONNX runtime to version 1.17.1 This version requires two more workarounds: - -Wno-error=maybe-uninitialized is needed to a void a (hopefully false positive) warning about a potentially uninitialised variable with cuDNN 8.9 and 9.0 - -Donnxruntime_NVCC_THREADS=0 is needed because the default is ON, causing nvcc to be called as "nvcc ... --threads ON ...", which causes an error. --- onnxruntime.spec | 13 ++++++++----- 1 file changed, 8 insertions(+), 5 deletions(-) diff --git a/onnxruntime.spec b/onnxruntime.spec index 686e131c0e0..d0ee91f8124 100644 --- a/onnxruntime.spec +++ b/onnxruntime.spec @@ -1,9 +1,9 @@ -### RPM external onnxruntime 1.14.1 +### RPM external onnxruntime 1.17.1 ## INITENV +PATH PYTHON3PATH %{i}/${PYTHON3_LIB_SITE_PACKAGES} ## INCLUDE cuda-flags %define github_user cms-externals %define branch cms/v%{realversion} -%define tag e4c6aa2984c7c71409f4c6d0db865117afa66932 +%define tag 5353412812a6f0409a15faff9a18640456ab1ff8 Source: git+https://github.com/%{github_user}/%{n}.git?obj=%{branch}/%{tag}&export=%{n}-%{realversion}&submodules=1&output=/%{n}-%{realversion}.tgz BuildRequires: cmake ninja @@ -35,6 +35,7 @@ cmake ../%{n}-%{realversion}/cmake -GNinja \ -Donnxruntime_USE_CUDA=${USE_CUDA} \ -Donnxruntime_CUDA_HOME="${CUDA_ROOT}" \ -Donnxruntime_CUDNN_HOME="${CUDNN_ROOT}" \ + -Donnxruntime_NVCC_THREADS=0 \ -Donnxruntime_BUILD_CSHARP=OFF \ -Donnxruntime_USE_OPENMP=OFF \ -Donnxruntime_USE_TVM=OFF \ @@ -53,10 +54,12 @@ cmake ../%{n}-%{realversion}/cmake -GNinja \ -DCMAKE_TRY_COMPILE_PLATFORM_VARIABLES="CMAKE_CUDA_RUNTIME_LIBRARY" \ -DCMAKE_PREFIX_PATH="${ZLIB_ROOT};${LIBPNG_ROOT};${PROTOBUF_ROOT};${PY3_PYBIND11_ROOT};${RE2_ROOT}" \ -DRE2_INCLUDE_DIR="${RE2_ROOT}/include" \ - -DCMAKE_CXX_FLAGS="-Wno-error=stringop-overflow" + -DCMAKE_CXX_FLAGS="-Wno-error=stringop-overflow -Wno-error=maybe-uninitialized" -# False positive string overflow -# https://github.com/google/flatbuffers/issues/7366 +# -Wno-error=stringop-overflow is needed to work around a false positive string overflow, +# see https://github.com/google/flatbuffers/issues/7366 + +# -Wno-error=maybe-uninitialized is needed for ONNX runtime 1.17.1 with cuDNN 8.9 or 9.0 ninja -v %{makeprocesses} python3 ../%{n}-%{realversion}/setup.py build From 0600b1f066f7830d0921ff0ff738a788a530f649 Mon Sep 17 00:00:00 2001 From: Andrea Bocci Date: Thu, 7 Mar 2024 12:39:12 +0100 Subject: [PATCH 08/10] Add the explicit dependency on python to Celeritas --- celeritas.spec | 1 + 1 file changed, 1 insertion(+) diff --git a/celeritas.spec b/celeritas.spec index f255e2caeba..3a97e2c2d28 100644 --- a/celeritas.spec +++ b/celeritas.spec @@ -9,6 +9,7 @@ Source: git+https://github.com/celeritas-project/celeritas?obj=develop/%{tag}&ex BuildRequires: cmake %define build_flags -Wall -Wextra -pedantic %{?arch_build_flags} %{?lto_build_flags} %{?pgo_build_flags} +Requires: python3 Requires: json Requires: geant4 Requires: vecgeom From c5a8a5fb9a17be6dad04c2f8130be7f65404a093 Mon Sep 17 00:00:00 2001 From: Andrea Bocci Date: Thu, 7 Mar 2024 17:28:50 +0100 Subject: [PATCH 09/10] Add missing thrust include in PyTorch --- pytorch.spec | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/pytorch.spec b/pytorch.spec index 5d58c9c5d42..ae2408cf8cf 100644 --- a/pytorch.spec +++ b/pytorch.spec @@ -2,10 +2,10 @@ ## INCLUDE cuda-flags %define cuda_arch_float $(echo %{cuda_arch} | tr ' ' '\\n' | sed -E 's|([0-9])$|.\\1|' | tr '\\n' ' ') -%define tag v%{realversion} -%define branch release/2.1 +%define tag bb938bbe9f53414dda1e1159795b7536dbffd041 +%define branch cms/v%{realversion} -Source: git+https://github.com/pytorch/pytorch.git?obj=%{branch}/%{tag}&export=%{n}-%{realversion}&submodules=1&output=/%{n}-%{realversion}.tgz +Source: git+https://github.com/cms-externals/pytorch.git?obj=%{branch}/%{tag}&export=%{n}-%{realversion}&submodules=1&output=/%{n}-%{realversion}.tgz Source1: FindEigen3.cmake Source2: FindFMT.cmake Patch0: pytorch-ignore-different-cuda-include-dir From fc1f061266026d4072e78857ee64930d8a296403 Mon Sep 17 00:00:00 2001 From: Andrea Bocci Date: Wed, 6 Mar 2024 09:00:13 +0100 Subject: [PATCH 10/10] Update to CUDA 12.4.1 Update to CUDA 12.4.1: * CUDA runtime version 12.4.127 * NVIDIA drivers version 550.54.15 See https://docs.nvidia.com/cuda/archive/12.4.1/cuda-toolkit-release-notes/index.html for the full CUDA 12.4.1 release notes and change log. --- cuda.spec | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/cuda.spec b/cuda.spec index f890c878cf5..33dbd2686d8 100644 --- a/cuda.spec +++ b/cuda.spec @@ -1,8 +1,8 @@ -### RPM external cuda 12.4.0 +### RPM external cuda 12.4.1 ## INITENV +PATH LD_LIBRARY_PATH %i/lib64 %define runpath_opts -m compute-sanitizer -m drivers -m nvvm -%define driversversion 550.54.14 +%define driversversion 550.54.15 %ifarch x86_64 Source0: https://developer.download.nvidia.com/compute/cuda/%{realversion}/local_installers/%{n}_%{realversion}_%{driversversion}_linux.run