File tree Expand file tree Collapse file tree 1 file changed +6
-3
lines changed Expand file tree Collapse file tree 1 file changed +6
-3
lines changed Original file line number Diff line number Diff line change 41
41
fi
42
42
43
43
# Update SPARK RAPIDS config
44
- readonly DEFAULT_SPARK_RAPIDS_VERSION="24.04.0"
44
+ readonly DEFAULT_SPARK_RAPIDS_VERSION="24.06.0"
45
45
readonly SPARK_RAPIDS_VERSION=$(get_metadata_attribute 'spark-rapids-version' ${DEFAULT_SPARK_RAPIDS_VERSION})
46
46
readonly XGBOOST_VERSION=$(get_metadata_attribute 'xgboost-version' ${DEFAULT_XGBOOST_VERSION})
47
47
@@ -237,14 +237,17 @@ function install_nvidia_gpu_driver() {
237
237
238
238
elif [[ ${OS_NAME} == "rocky" ]]; then
239
239
240
+ # Ensure the Correct Kernel Development Packages are Installed
241
+ execute_with_retries "yum install -y kernel-devel-$(uname -r) kernel-headers-$(uname -r)"
242
+
240
243
ROCKY_VERSION=$(lsb_release -r | awk '{print $2}') # 8.8 or 9.1
241
244
ROCKY_VERSION=${ROCKY_VERSION%.*} # 8 or 9
242
245
243
246
readonly NVIDIA_ROCKY_REPO_URL="https://developer.download.nvidia.com/compute/cuda/repos/rhel${ROCKY_VERSION}/x86_64/cuda-rhel${ROCKY_VERSION}.repo"
244
247
execute_with_retries "dnf config-manager --add-repo ${NVIDIA_ROCKY_REPO_URL}"
245
248
execute_with_retries "dnf clean all"
246
- execute_with_retries "dnf -y -q module install nvidia-driver:${NVIDIA_DRIVER_VERSION_PREFIX}"
247
- execute_with_retries "dnf -y -q install cuda-toolkit-${CUDA_VERSION_MAJOR//./-}"
249
+ execute_with_retries "dnf -y -q module install nvidia-driver:latest-dkms "
250
+ execute_with_retries "dnf -y -q install cuda-toolkit"
248
251
modprobe nvidia
249
252
250
253
else
You can’t perform that action at this time.
0 commit comments