зеркало из https://github.com/Azure/AgentBaker.git
Pull aks-gpu image with k8s.io namespace (#5046)
This commit is contained in:
Родитель
da67f7c655
Коммит
6a79b6a6d9
|
@ -744,14 +744,14 @@ configGPUDrivers() {
|
|||
if [[ $OS == $UBUNTU_OS_NAME ]]; then
|
||||
mkdir -p /opt/{actions,gpu}
|
||||
if [[ "${CONTAINER_RUNTIME}" == "containerd" ]]; then
|
||||
ctr image pull $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
ctr -n k8s.io image pull $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
retrycmd_if_failure 5 10 600 bash -c "$CTR_GPU_INSTALL_CMD $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG gpuinstall /entrypoint.sh install"
|
||||
ret=$?
|
||||
if [[ "$ret" != "0" ]]; then
|
||||
echo "Failed to install GPU driver, exiting..."
|
||||
exit $ERR_GPU_DRIVERS_START_FAIL
|
||||
fi
|
||||
ctr images rm --sync $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
ctr -n k8s.io images rm --sync $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
else
|
||||
bash -c "$DOCKER_GPU_INSTALL_CMD $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG install"
|
||||
ret=$?
|
||||
|
|
|
@ -151,7 +151,7 @@ NVIDIA_CONTAINER_RUNTIME_VERSION="3.6.0"
|
|||
export NVIDIA_DRIVER_IMAGE_SHA="${GPU_IMAGE_SHA:=}"
|
||||
export NVIDIA_DRIVER_IMAGE_TAG="${GPU_DV}-${NVIDIA_DRIVER_IMAGE_SHA}"
|
||||
export NVIDIA_DRIVER_IMAGE="mcr.microsoft.com/aks/aks-gpu"
|
||||
export CTR_GPU_INSTALL_CMD="ctr run --privileged --rm --net-host --with-ns pid:/proc/1/ns/pid --mount type=bind,src=/opt/gpu,dst=/mnt/gpu,options=rbind --mount type=bind,src=/opt/actions,dst=/mnt/actions,options=rbind"
|
||||
export CTR_GPU_INSTALL_CMD="ctr -n k8s.io run --privileged --rm --net-host --with-ns pid:/proc/1/ns/pid --mount type=bind,src=/opt/gpu,dst=/mnt/gpu,options=rbind --mount type=bind,src=/opt/actions,dst=/mnt/actions,options=rbind"
|
||||
export DOCKER_GPU_INSTALL_CMD="docker run --privileged --net=host --pid=host -v /opt/gpu:/mnt/gpu -v /opt/actions:/mnt/actions --rm"
|
||||
APT_CACHE_DIR=/var/cache/apt/archives/
|
||||
PERMANENT_CACHE_DIR=/root/aptcache/
|
||||
|
|
Различия файлов скрыты, потому что одна или несколько строк слишком длинны
|
@ -702,14 +702,14 @@ configGPUDrivers() {
|
|||
if [[ $OS == $UBUNTU_OS_NAME ]]; then
|
||||
mkdir -p /opt/{actions,gpu}
|
||||
if [[ "${CONTAINER_RUNTIME}" == "containerd" ]]; then
|
||||
ctr image pull $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
ctr -n k8s.io image pull $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
retrycmd_if_failure 5 10 600 bash -c "$CTR_GPU_INSTALL_CMD $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG gpuinstall /entrypoint.sh install"
|
||||
ret=$?
|
||||
if [[ "$ret" != "0" ]]; then
|
||||
echo "Failed to install GPU driver, exiting..."
|
||||
exit $ERR_GPU_DRIVERS_START_FAIL
|
||||
fi
|
||||
ctr images rm --sync $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
ctr -n k8s.io images rm --sync $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
else
|
||||
bash -c "$DOCKER_GPU_INSTALL_CMD $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG install"
|
||||
ret=$?
|
||||
|
|
|
@ -136,7 +136,7 @@ NVIDIA_CONTAINER_RUNTIME_VERSION="3.6.0"
|
|||
export NVIDIA_DRIVER_IMAGE_SHA="${GPU_IMAGE_SHA:=}"
|
||||
export NVIDIA_DRIVER_IMAGE_TAG="${GPU_DV}-${NVIDIA_DRIVER_IMAGE_SHA}"
|
||||
export NVIDIA_DRIVER_IMAGE="mcr.microsoft.com/aks/aks-gpu"
|
||||
export CTR_GPU_INSTALL_CMD="ctr run --privileged --rm --net-host --with-ns pid:/proc/1/ns/pid --mount type=bind,src=/opt/gpu,dst=/mnt/gpu,options=rbind --mount type=bind,src=/opt/actions,dst=/mnt/actions,options=rbind"
|
||||
export CTR_GPU_INSTALL_CMD="ctr -n k8s.io run --privileged --rm --net-host --with-ns pid:/proc/1/ns/pid --mount type=bind,src=/opt/gpu,dst=/mnt/gpu,options=rbind --mount type=bind,src=/opt/actions,dst=/mnt/actions,options=rbind"
|
||||
export DOCKER_GPU_INSTALL_CMD="docker run --privileged --net=host --pid=host -v /opt/gpu:/mnt/gpu -v /opt/actions:/mnt/actions --rm"
|
||||
APT_CACHE_DIR=/var/cache/apt/archives/
|
||||
PERMANENT_CACHE_DIR=/root/aptcache/
|
||||
|
|
Различия файлов скрыты, потому что одна или несколько строк слишком длинны
|
@ -702,14 +702,14 @@ configGPUDrivers() {
|
|||
if [[ $OS == $UBUNTU_OS_NAME ]]; then
|
||||
mkdir -p /opt/{actions,gpu}
|
||||
if [[ "${CONTAINER_RUNTIME}" == "containerd" ]]; then
|
||||
ctr image pull $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
ctr -n k8s.io image pull $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
retrycmd_if_failure 5 10 600 bash -c "$CTR_GPU_INSTALL_CMD $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG gpuinstall /entrypoint.sh install"
|
||||
ret=$?
|
||||
if [[ "$ret" != "0" ]]; then
|
||||
echo "Failed to install GPU driver, exiting..."
|
||||
exit $ERR_GPU_DRIVERS_START_FAIL
|
||||
fi
|
||||
ctr images rm --sync $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
ctr -n k8s.io images rm --sync $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
else
|
||||
bash -c "$DOCKER_GPU_INSTALL_CMD $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG install"
|
||||
ret=$?
|
||||
|
|
|
@ -136,7 +136,7 @@ NVIDIA_CONTAINER_RUNTIME_VERSION="3.6.0"
|
|||
export NVIDIA_DRIVER_IMAGE_SHA="${GPU_IMAGE_SHA:=}"
|
||||
export NVIDIA_DRIVER_IMAGE_TAG="${GPU_DV}-${NVIDIA_DRIVER_IMAGE_SHA}"
|
||||
export NVIDIA_DRIVER_IMAGE="mcr.microsoft.com/aks/aks-gpu"
|
||||
export CTR_GPU_INSTALL_CMD="ctr run --privileged --rm --net-host --with-ns pid:/proc/1/ns/pid --mount type=bind,src=/opt/gpu,dst=/mnt/gpu,options=rbind --mount type=bind,src=/opt/actions,dst=/mnt/actions,options=rbind"
|
||||
export CTR_GPU_INSTALL_CMD="ctr -n k8s.io run --privileged --rm --net-host --with-ns pid:/proc/1/ns/pid --mount type=bind,src=/opt/gpu,dst=/mnt/gpu,options=rbind --mount type=bind,src=/opt/actions,dst=/mnt/actions,options=rbind"
|
||||
export DOCKER_GPU_INSTALL_CMD="docker run --privileged --net=host --pid=host -v /opt/gpu:/mnt/gpu -v /opt/actions:/mnt/actions --rm"
|
||||
APT_CACHE_DIR=/var/cache/apt/archives/
|
||||
PERMANENT_CACHE_DIR=/root/aptcache/
|
||||
|
|
Различия файлов скрыты, потому что одна или несколько строк слишком длинны
|
@ -702,14 +702,14 @@ configGPUDrivers() {
|
|||
if [[ $OS == $UBUNTU_OS_NAME ]]; then
|
||||
mkdir -p /opt/{actions,gpu}
|
||||
if [[ "${CONTAINER_RUNTIME}" == "containerd" ]]; then
|
||||
ctr image pull $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
ctr -n k8s.io image pull $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
retrycmd_if_failure 5 10 600 bash -c "$CTR_GPU_INSTALL_CMD $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG gpuinstall /entrypoint.sh install"
|
||||
ret=$?
|
||||
if [[ "$ret" != "0" ]]; then
|
||||
echo "Failed to install GPU driver, exiting..."
|
||||
exit $ERR_GPU_DRIVERS_START_FAIL
|
||||
fi
|
||||
ctr images rm --sync $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
ctr -n k8s.io images rm --sync $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
else
|
||||
bash -c "$DOCKER_GPU_INSTALL_CMD $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG install"
|
||||
ret=$?
|
||||
|
|
|
@ -136,7 +136,7 @@ NVIDIA_CONTAINER_RUNTIME_VERSION="3.6.0"
|
|||
export NVIDIA_DRIVER_IMAGE_SHA="${GPU_IMAGE_SHA:=}"
|
||||
export NVIDIA_DRIVER_IMAGE_TAG="${GPU_DV}-${NVIDIA_DRIVER_IMAGE_SHA}"
|
||||
export NVIDIA_DRIVER_IMAGE="mcr.microsoft.com/aks/aks-gpu"
|
||||
export CTR_GPU_INSTALL_CMD="ctr run --privileged --rm --net-host --with-ns pid:/proc/1/ns/pid --mount type=bind,src=/opt/gpu,dst=/mnt/gpu,options=rbind --mount type=bind,src=/opt/actions,dst=/mnt/actions,options=rbind"
|
||||
export CTR_GPU_INSTALL_CMD="ctr -n k8s.io run --privileged --rm --net-host --with-ns pid:/proc/1/ns/pid --mount type=bind,src=/opt/gpu,dst=/mnt/gpu,options=rbind --mount type=bind,src=/opt/actions,dst=/mnt/actions,options=rbind"
|
||||
export DOCKER_GPU_INSTALL_CMD="docker run --privileged --net=host --pid=host -v /opt/gpu:/mnt/gpu -v /opt/actions:/mnt/actions --rm"
|
||||
APT_CACHE_DIR=/var/cache/apt/archives/
|
||||
PERMANENT_CACHE_DIR=/root/aptcache/
|
||||
|
|
Различия файлов скрыты, потому что одна или несколько строк слишком длинны
|
@ -702,14 +702,14 @@ configGPUDrivers() {
|
|||
if [[ $OS == $UBUNTU_OS_NAME ]]; then
|
||||
mkdir -p /opt/{actions,gpu}
|
||||
if [[ "${CONTAINER_RUNTIME}" == "containerd" ]]; then
|
||||
ctr image pull $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
ctr -n k8s.io image pull $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
retrycmd_if_failure 5 10 600 bash -c "$CTR_GPU_INSTALL_CMD $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG gpuinstall /entrypoint.sh install"
|
||||
ret=$?
|
||||
if [[ "$ret" != "0" ]]; then
|
||||
echo "Failed to install GPU driver, exiting..."
|
||||
exit $ERR_GPU_DRIVERS_START_FAIL
|
||||
fi
|
||||
ctr images rm --sync $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
ctr -n k8s.io images rm --sync $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
else
|
||||
bash -c "$DOCKER_GPU_INSTALL_CMD $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG install"
|
||||
ret=$?
|
||||
|
|
|
@ -136,7 +136,7 @@ NVIDIA_CONTAINER_RUNTIME_VERSION="3.6.0"
|
|||
export NVIDIA_DRIVER_IMAGE_SHA="${GPU_IMAGE_SHA:=}"
|
||||
export NVIDIA_DRIVER_IMAGE_TAG="${GPU_DV}-${NVIDIA_DRIVER_IMAGE_SHA}"
|
||||
export NVIDIA_DRIVER_IMAGE="mcr.microsoft.com/aks/aks-gpu"
|
||||
export CTR_GPU_INSTALL_CMD="ctr run --privileged --rm --net-host --with-ns pid:/proc/1/ns/pid --mount type=bind,src=/opt/gpu,dst=/mnt/gpu,options=rbind --mount type=bind,src=/opt/actions,dst=/mnt/actions,options=rbind"
|
||||
export CTR_GPU_INSTALL_CMD="ctr -n k8s.io run --privileged --rm --net-host --with-ns pid:/proc/1/ns/pid --mount type=bind,src=/opt/gpu,dst=/mnt/gpu,options=rbind --mount type=bind,src=/opt/actions,dst=/mnt/actions,options=rbind"
|
||||
export DOCKER_GPU_INSTALL_CMD="docker run --privileged --net=host --pid=host -v /opt/gpu:/mnt/gpu -v /opt/actions:/mnt/actions --rm"
|
||||
APT_CACHE_DIR=/var/cache/apt/archives/
|
||||
PERMANENT_CACHE_DIR=/root/aptcache/
|
||||
|
|
Различия файлов скрыты, потому что одна или несколько строк слишком длинны
|
@ -702,14 +702,14 @@ configGPUDrivers() {
|
|||
if [[ $OS == $UBUNTU_OS_NAME ]]; then
|
||||
mkdir -p /opt/{actions,gpu}
|
||||
if [[ "${CONTAINER_RUNTIME}" == "containerd" ]]; then
|
||||
ctr image pull $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
ctr -n k8s.io image pull $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
retrycmd_if_failure 5 10 600 bash -c "$CTR_GPU_INSTALL_CMD $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG gpuinstall /entrypoint.sh install"
|
||||
ret=$?
|
||||
if [[ "$ret" != "0" ]]; then
|
||||
echo "Failed to install GPU driver, exiting..."
|
||||
exit $ERR_GPU_DRIVERS_START_FAIL
|
||||
fi
|
||||
ctr images rm --sync $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
ctr -n k8s.io images rm --sync $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
else
|
||||
bash -c "$DOCKER_GPU_INSTALL_CMD $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG install"
|
||||
ret=$?
|
||||
|
|
|
@ -136,7 +136,7 @@ NVIDIA_CONTAINER_RUNTIME_VERSION="3.6.0"
|
|||
export NVIDIA_DRIVER_IMAGE_SHA="${GPU_IMAGE_SHA:=}"
|
||||
export NVIDIA_DRIVER_IMAGE_TAG="${GPU_DV}-${NVIDIA_DRIVER_IMAGE_SHA}"
|
||||
export NVIDIA_DRIVER_IMAGE="mcr.microsoft.com/aks/aks-gpu"
|
||||
export CTR_GPU_INSTALL_CMD="ctr run --privileged --rm --net-host --with-ns pid:/proc/1/ns/pid --mount type=bind,src=/opt/gpu,dst=/mnt/gpu,options=rbind --mount type=bind,src=/opt/actions,dst=/mnt/actions,options=rbind"
|
||||
export CTR_GPU_INSTALL_CMD="ctr -n k8s.io run --privileged --rm --net-host --with-ns pid:/proc/1/ns/pid --mount type=bind,src=/opt/gpu,dst=/mnt/gpu,options=rbind --mount type=bind,src=/opt/actions,dst=/mnt/actions,options=rbind"
|
||||
export DOCKER_GPU_INSTALL_CMD="docker run --privileged --net=host --pid=host -v /opt/gpu:/mnt/gpu -v /opt/actions:/mnt/actions --rm"
|
||||
APT_CACHE_DIR=/var/cache/apt/archives/
|
||||
PERMANENT_CACHE_DIR=/root/aptcache/
|
||||
|
|
Различия файлов скрыты, потому что одна или несколько строк слишком длинны
|
@ -702,14 +702,14 @@ configGPUDrivers() {
|
|||
if [[ $OS == $UBUNTU_OS_NAME ]]; then
|
||||
mkdir -p /opt/{actions,gpu}
|
||||
if [[ "${CONTAINER_RUNTIME}" == "containerd" ]]; then
|
||||
ctr image pull $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
ctr -n k8s.io image pull $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
retrycmd_if_failure 5 10 600 bash -c "$CTR_GPU_INSTALL_CMD $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG gpuinstall /entrypoint.sh install"
|
||||
ret=$?
|
||||
if [[ "$ret" != "0" ]]; then
|
||||
echo "Failed to install GPU driver, exiting..."
|
||||
exit $ERR_GPU_DRIVERS_START_FAIL
|
||||
fi
|
||||
ctr images rm --sync $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
ctr -n k8s.io images rm --sync $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
else
|
||||
bash -c "$DOCKER_GPU_INSTALL_CMD $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG install"
|
||||
ret=$?
|
||||
|
|
|
@ -136,7 +136,7 @@ NVIDIA_CONTAINER_RUNTIME_VERSION="3.6.0"
|
|||
export NVIDIA_DRIVER_IMAGE_SHA="${GPU_IMAGE_SHA:=}"
|
||||
export NVIDIA_DRIVER_IMAGE_TAG="${GPU_DV}-${NVIDIA_DRIVER_IMAGE_SHA}"
|
||||
export NVIDIA_DRIVER_IMAGE="mcr.microsoft.com/aks/aks-gpu"
|
||||
export CTR_GPU_INSTALL_CMD="ctr run --privileged --rm --net-host --with-ns pid:/proc/1/ns/pid --mount type=bind,src=/opt/gpu,dst=/mnt/gpu,options=rbind --mount type=bind,src=/opt/actions,dst=/mnt/actions,options=rbind"
|
||||
export CTR_GPU_INSTALL_CMD="ctr -n k8s.io run --privileged --rm --net-host --with-ns pid:/proc/1/ns/pid --mount type=bind,src=/opt/gpu,dst=/mnt/gpu,options=rbind --mount type=bind,src=/opt/actions,dst=/mnt/actions,options=rbind"
|
||||
export DOCKER_GPU_INSTALL_CMD="docker run --privileged --net=host --pid=host -v /opt/gpu:/mnt/gpu -v /opt/actions:/mnt/actions --rm"
|
||||
APT_CACHE_DIR=/var/cache/apt/archives/
|
||||
PERMANENT_CACHE_DIR=/root/aptcache/
|
||||
|
|
Различия файлов скрыты, потому что одна или несколько строк слишком длинны
|
@ -702,14 +702,14 @@ configGPUDrivers() {
|
|||
if [[ $OS == $UBUNTU_OS_NAME ]]; then
|
||||
mkdir -p /opt/{actions,gpu}
|
||||
if [[ "${CONTAINER_RUNTIME}" == "containerd" ]]; then
|
||||
ctr image pull $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
ctr -n k8s.io image pull $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
retrycmd_if_failure 5 10 600 bash -c "$CTR_GPU_INSTALL_CMD $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG gpuinstall /entrypoint.sh install"
|
||||
ret=$?
|
||||
if [[ "$ret" != "0" ]]; then
|
||||
echo "Failed to install GPU driver, exiting..."
|
||||
exit $ERR_GPU_DRIVERS_START_FAIL
|
||||
fi
|
||||
ctr images rm --sync $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
ctr -n k8s.io images rm --sync $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
else
|
||||
bash -c "$DOCKER_GPU_INSTALL_CMD $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG install"
|
||||
ret=$?
|
||||
|
|
|
@ -136,7 +136,7 @@ NVIDIA_CONTAINER_RUNTIME_VERSION="3.6.0"
|
|||
export NVIDIA_DRIVER_IMAGE_SHA="${GPU_IMAGE_SHA:=}"
|
||||
export NVIDIA_DRIVER_IMAGE_TAG="${GPU_DV}-${NVIDIA_DRIVER_IMAGE_SHA}"
|
||||
export NVIDIA_DRIVER_IMAGE="mcr.microsoft.com/aks/aks-gpu"
|
||||
export CTR_GPU_INSTALL_CMD="ctr run --privileged --rm --net-host --with-ns pid:/proc/1/ns/pid --mount type=bind,src=/opt/gpu,dst=/mnt/gpu,options=rbind --mount type=bind,src=/opt/actions,dst=/mnt/actions,options=rbind"
|
||||
export CTR_GPU_INSTALL_CMD="ctr -n k8s.io run --privileged --rm --net-host --with-ns pid:/proc/1/ns/pid --mount type=bind,src=/opt/gpu,dst=/mnt/gpu,options=rbind --mount type=bind,src=/opt/actions,dst=/mnt/actions,options=rbind"
|
||||
export DOCKER_GPU_INSTALL_CMD="docker run --privileged --net=host --pid=host -v /opt/gpu:/mnt/gpu -v /opt/actions:/mnt/actions --rm"
|
||||
APT_CACHE_DIR=/var/cache/apt/archives/
|
||||
PERMANENT_CACHE_DIR=/root/aptcache/
|
||||
|
|
Различия файлов скрыты, потому что одна или несколько строк слишком длинны
|
@ -702,14 +702,14 @@ configGPUDrivers() {
|
|||
if [[ $OS == $UBUNTU_OS_NAME ]]; then
|
||||
mkdir -p /opt/{actions,gpu}
|
||||
if [[ "${CONTAINER_RUNTIME}" == "containerd" ]]; then
|
||||
ctr image pull $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
ctr -n k8s.io image pull $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
retrycmd_if_failure 5 10 600 bash -c "$CTR_GPU_INSTALL_CMD $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG gpuinstall /entrypoint.sh install"
|
||||
ret=$?
|
||||
if [[ "$ret" != "0" ]]; then
|
||||
echo "Failed to install GPU driver, exiting..."
|
||||
exit $ERR_GPU_DRIVERS_START_FAIL
|
||||
fi
|
||||
ctr images rm --sync $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
ctr -n k8s.io images rm --sync $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
else
|
||||
bash -c "$DOCKER_GPU_INSTALL_CMD $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG install"
|
||||
ret=$?
|
||||
|
|
|
@ -136,7 +136,7 @@ NVIDIA_CONTAINER_RUNTIME_VERSION="3.6.0"
|
|||
export NVIDIA_DRIVER_IMAGE_SHA="${GPU_IMAGE_SHA:=}"
|
||||
export NVIDIA_DRIVER_IMAGE_TAG="${GPU_DV}-${NVIDIA_DRIVER_IMAGE_SHA}"
|
||||
export NVIDIA_DRIVER_IMAGE="mcr.microsoft.com/aks/aks-gpu"
|
||||
export CTR_GPU_INSTALL_CMD="ctr run --privileged --rm --net-host --with-ns pid:/proc/1/ns/pid --mount type=bind,src=/opt/gpu,dst=/mnt/gpu,options=rbind --mount type=bind,src=/opt/actions,dst=/mnt/actions,options=rbind"
|
||||
export CTR_GPU_INSTALL_CMD="ctr -n k8s.io run --privileged --rm --net-host --with-ns pid:/proc/1/ns/pid --mount type=bind,src=/opt/gpu,dst=/mnt/gpu,options=rbind --mount type=bind,src=/opt/actions,dst=/mnt/actions,options=rbind"
|
||||
export DOCKER_GPU_INSTALL_CMD="docker run --privileged --net=host --pid=host -v /opt/gpu:/mnt/gpu -v /opt/actions:/mnt/actions --rm"
|
||||
APT_CACHE_DIR=/var/cache/apt/archives/
|
||||
PERMANENT_CACHE_DIR=/root/aptcache/
|
||||
|
|
Различия файлов скрыты, потому что одна или несколько строк слишком длинны
|
@ -702,14 +702,14 @@ configGPUDrivers() {
|
|||
if [[ $OS == $UBUNTU_OS_NAME ]]; then
|
||||
mkdir -p /opt/{actions,gpu}
|
||||
if [[ "${CONTAINER_RUNTIME}" == "containerd" ]]; then
|
||||
ctr image pull $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
ctr -n k8s.io image pull $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
retrycmd_if_failure 5 10 600 bash -c "$CTR_GPU_INSTALL_CMD $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG gpuinstall /entrypoint.sh install"
|
||||
ret=$?
|
||||
if [[ "$ret" != "0" ]]; then
|
||||
echo "Failed to install GPU driver, exiting..."
|
||||
exit $ERR_GPU_DRIVERS_START_FAIL
|
||||
fi
|
||||
ctr images rm --sync $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
ctr -n k8s.io images rm --sync $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
else
|
||||
bash -c "$DOCKER_GPU_INSTALL_CMD $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG install"
|
||||
ret=$?
|
||||
|
|
|
@ -136,7 +136,7 @@ NVIDIA_CONTAINER_RUNTIME_VERSION="3.6.0"
|
|||
export NVIDIA_DRIVER_IMAGE_SHA="${GPU_IMAGE_SHA:=}"
|
||||
export NVIDIA_DRIVER_IMAGE_TAG="${GPU_DV}-${NVIDIA_DRIVER_IMAGE_SHA}"
|
||||
export NVIDIA_DRIVER_IMAGE="mcr.microsoft.com/aks/aks-gpu"
|
||||
export CTR_GPU_INSTALL_CMD="ctr run --privileged --rm --net-host --with-ns pid:/proc/1/ns/pid --mount type=bind,src=/opt/gpu,dst=/mnt/gpu,options=rbind --mount type=bind,src=/opt/actions,dst=/mnt/actions,options=rbind"
|
||||
export CTR_GPU_INSTALL_CMD="ctr -n k8s.io run --privileged --rm --net-host --with-ns pid:/proc/1/ns/pid --mount type=bind,src=/opt/gpu,dst=/mnt/gpu,options=rbind --mount type=bind,src=/opt/actions,dst=/mnt/actions,options=rbind"
|
||||
export DOCKER_GPU_INSTALL_CMD="docker run --privileged --net=host --pid=host -v /opt/gpu:/mnt/gpu -v /opt/actions:/mnt/actions --rm"
|
||||
APT_CACHE_DIR=/var/cache/apt/archives/
|
||||
PERMANENT_CACHE_DIR=/root/aptcache/
|
||||
|
|
Различия файлов скрыты, потому что одна или несколько строк слишком длинны
|
@ -702,14 +702,14 @@ configGPUDrivers() {
|
|||
if [[ $OS == $UBUNTU_OS_NAME ]]; then
|
||||
mkdir -p /opt/{actions,gpu}
|
||||
if [[ "${CONTAINER_RUNTIME}" == "containerd" ]]; then
|
||||
ctr image pull $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
ctr -n k8s.io image pull $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
retrycmd_if_failure 5 10 600 bash -c "$CTR_GPU_INSTALL_CMD $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG gpuinstall /entrypoint.sh install"
|
||||
ret=$?
|
||||
if [[ "$ret" != "0" ]]; then
|
||||
echo "Failed to install GPU driver, exiting..."
|
||||
exit $ERR_GPU_DRIVERS_START_FAIL
|
||||
fi
|
||||
ctr images rm --sync $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
ctr -n k8s.io images rm --sync $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
else
|
||||
bash -c "$DOCKER_GPU_INSTALL_CMD $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG install"
|
||||
ret=$?
|
||||
|
|
|
@ -136,7 +136,7 @@ NVIDIA_CONTAINER_RUNTIME_VERSION="3.6.0"
|
|||
export NVIDIA_DRIVER_IMAGE_SHA="${GPU_IMAGE_SHA:=}"
|
||||
export NVIDIA_DRIVER_IMAGE_TAG="${GPU_DV}-${NVIDIA_DRIVER_IMAGE_SHA}"
|
||||
export NVIDIA_DRIVER_IMAGE="mcr.microsoft.com/aks/aks-gpu"
|
||||
export CTR_GPU_INSTALL_CMD="ctr run --privileged --rm --net-host --with-ns pid:/proc/1/ns/pid --mount type=bind,src=/opt/gpu,dst=/mnt/gpu,options=rbind --mount type=bind,src=/opt/actions,dst=/mnt/actions,options=rbind"
|
||||
export CTR_GPU_INSTALL_CMD="ctr -n k8s.io run --privileged --rm --net-host --with-ns pid:/proc/1/ns/pid --mount type=bind,src=/opt/gpu,dst=/mnt/gpu,options=rbind --mount type=bind,src=/opt/actions,dst=/mnt/actions,options=rbind"
|
||||
export DOCKER_GPU_INSTALL_CMD="docker run --privileged --net=host --pid=host -v /opt/gpu:/mnt/gpu -v /opt/actions:/mnt/actions --rm"
|
||||
APT_CACHE_DIR=/var/cache/apt/archives/
|
||||
PERMANENT_CACHE_DIR=/root/aptcache/
|
||||
|
|
Различия файлов скрыты, потому что одна или несколько строк слишком длинны
|
@ -702,14 +702,14 @@ configGPUDrivers() {
|
|||
if [[ $OS == $UBUNTU_OS_NAME ]]; then
|
||||
mkdir -p /opt/{actions,gpu}
|
||||
if [[ "${CONTAINER_RUNTIME}" == "containerd" ]]; then
|
||||
ctr image pull $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
ctr -n k8s.io image pull $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
retrycmd_if_failure 5 10 600 bash -c "$CTR_GPU_INSTALL_CMD $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG gpuinstall /entrypoint.sh install"
|
||||
ret=$?
|
||||
if [[ "$ret" != "0" ]]; then
|
||||
echo "Failed to install GPU driver, exiting..."
|
||||
exit $ERR_GPU_DRIVERS_START_FAIL
|
||||
fi
|
||||
ctr images rm --sync $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
ctr -n k8s.io images rm --sync $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
else
|
||||
bash -c "$DOCKER_GPU_INSTALL_CMD $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG install"
|
||||
ret=$?
|
||||
|
|
|
@ -136,7 +136,7 @@ NVIDIA_CONTAINER_RUNTIME_VERSION="3.6.0"
|
|||
export NVIDIA_DRIVER_IMAGE_SHA="${GPU_IMAGE_SHA:=}"
|
||||
export NVIDIA_DRIVER_IMAGE_TAG="${GPU_DV}-${NVIDIA_DRIVER_IMAGE_SHA}"
|
||||
export NVIDIA_DRIVER_IMAGE="mcr.microsoft.com/aks/aks-gpu"
|
||||
export CTR_GPU_INSTALL_CMD="ctr run --privileged --rm --net-host --with-ns pid:/proc/1/ns/pid --mount type=bind,src=/opt/gpu,dst=/mnt/gpu,options=rbind --mount type=bind,src=/opt/actions,dst=/mnt/actions,options=rbind"
|
||||
export CTR_GPU_INSTALL_CMD="ctr -n k8s.io run --privileged --rm --net-host --with-ns pid:/proc/1/ns/pid --mount type=bind,src=/opt/gpu,dst=/mnt/gpu,options=rbind --mount type=bind,src=/opt/actions,dst=/mnt/actions,options=rbind"
|
||||
export DOCKER_GPU_INSTALL_CMD="docker run --privileged --net=host --pid=host -v /opt/gpu:/mnt/gpu -v /opt/actions:/mnt/actions --rm"
|
||||
APT_CACHE_DIR=/var/cache/apt/archives/
|
||||
PERMANENT_CACHE_DIR=/root/aptcache/
|
||||
|
|
Различия файлов скрыты, потому что одна или несколько строк слишком длинны
|
@ -702,14 +702,14 @@ configGPUDrivers() {
|
|||
if [[ $OS == $UBUNTU_OS_NAME ]]; then
|
||||
mkdir -p /opt/{actions,gpu}
|
||||
if [[ "${CONTAINER_RUNTIME}" == "containerd" ]]; then
|
||||
ctr image pull $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
ctr -n k8s.io image pull $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
retrycmd_if_failure 5 10 600 bash -c "$CTR_GPU_INSTALL_CMD $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG gpuinstall /entrypoint.sh install"
|
||||
ret=$?
|
||||
if [[ "$ret" != "0" ]]; then
|
||||
echo "Failed to install GPU driver, exiting..."
|
||||
exit $ERR_GPU_DRIVERS_START_FAIL
|
||||
fi
|
||||
ctr images rm --sync $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
ctr -n k8s.io images rm --sync $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
else
|
||||
bash -c "$DOCKER_GPU_INSTALL_CMD $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG install"
|
||||
ret=$?
|
||||
|
|
|
@ -136,7 +136,7 @@ NVIDIA_CONTAINER_RUNTIME_VERSION="3.6.0"
|
|||
export NVIDIA_DRIVER_IMAGE_SHA="${GPU_IMAGE_SHA:=}"
|
||||
export NVIDIA_DRIVER_IMAGE_TAG="${GPU_DV}-${NVIDIA_DRIVER_IMAGE_SHA}"
|
||||
export NVIDIA_DRIVER_IMAGE="mcr.microsoft.com/aks/aks-gpu"
|
||||
export CTR_GPU_INSTALL_CMD="ctr run --privileged --rm --net-host --with-ns pid:/proc/1/ns/pid --mount type=bind,src=/opt/gpu,dst=/mnt/gpu,options=rbind --mount type=bind,src=/opt/actions,dst=/mnt/actions,options=rbind"
|
||||
export CTR_GPU_INSTALL_CMD="ctr -n k8s.io run --privileged --rm --net-host --with-ns pid:/proc/1/ns/pid --mount type=bind,src=/opt/gpu,dst=/mnt/gpu,options=rbind --mount type=bind,src=/opt/actions,dst=/mnt/actions,options=rbind"
|
||||
export DOCKER_GPU_INSTALL_CMD="docker run --privileged --net=host --pid=host -v /opt/gpu:/mnt/gpu -v /opt/actions:/mnt/actions --rm"
|
||||
APT_CACHE_DIR=/var/cache/apt/archives/
|
||||
PERMANENT_CACHE_DIR=/root/aptcache/
|
||||
|
|
Различия файлов скрыты, потому что одна или несколько строк слишком длинны
|
@ -702,14 +702,14 @@ configGPUDrivers() {
|
|||
if [[ $OS == $UBUNTU_OS_NAME ]]; then
|
||||
mkdir -p /opt/{actions,gpu}
|
||||
if [[ "${CONTAINER_RUNTIME}" == "containerd" ]]; then
|
||||
ctr image pull $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
ctr -n k8s.io image pull $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
retrycmd_if_failure 5 10 600 bash -c "$CTR_GPU_INSTALL_CMD $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG gpuinstall /entrypoint.sh install"
|
||||
ret=$?
|
||||
if [[ "$ret" != "0" ]]; then
|
||||
echo "Failed to install GPU driver, exiting..."
|
||||
exit $ERR_GPU_DRIVERS_START_FAIL
|
||||
fi
|
||||
ctr images rm --sync $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
ctr -n k8s.io images rm --sync $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
else
|
||||
bash -c "$DOCKER_GPU_INSTALL_CMD $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG install"
|
||||
ret=$?
|
||||
|
|
|
@ -136,7 +136,7 @@ NVIDIA_CONTAINER_RUNTIME_VERSION="3.6.0"
|
|||
export NVIDIA_DRIVER_IMAGE_SHA="${GPU_IMAGE_SHA:=}"
|
||||
export NVIDIA_DRIVER_IMAGE_TAG="${GPU_DV}-${NVIDIA_DRIVER_IMAGE_SHA}"
|
||||
export NVIDIA_DRIVER_IMAGE="mcr.microsoft.com/aks/aks-gpu"
|
||||
export CTR_GPU_INSTALL_CMD="ctr run --privileged --rm --net-host --with-ns pid:/proc/1/ns/pid --mount type=bind,src=/opt/gpu,dst=/mnt/gpu,options=rbind --mount type=bind,src=/opt/actions,dst=/mnt/actions,options=rbind"
|
||||
export CTR_GPU_INSTALL_CMD="ctr -n k8s.io run --privileged --rm --net-host --with-ns pid:/proc/1/ns/pid --mount type=bind,src=/opt/gpu,dst=/mnt/gpu,options=rbind --mount type=bind,src=/opt/actions,dst=/mnt/actions,options=rbind"
|
||||
export DOCKER_GPU_INSTALL_CMD="docker run --privileged --net=host --pid=host -v /opt/gpu:/mnt/gpu -v /opt/actions:/mnt/actions --rm"
|
||||
APT_CACHE_DIR=/var/cache/apt/archives/
|
||||
PERMANENT_CACHE_DIR=/root/aptcache/
|
||||
|
|
Различия файлов скрыты, потому что одна или несколько строк слишком длинны
|
@ -702,14 +702,14 @@ configGPUDrivers() {
|
|||
if [[ $OS == $UBUNTU_OS_NAME ]]; then
|
||||
mkdir -p /opt/{actions,gpu}
|
||||
if [[ "${CONTAINER_RUNTIME}" == "containerd" ]]; then
|
||||
ctr image pull $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
ctr -n k8s.io image pull $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
retrycmd_if_failure 5 10 600 bash -c "$CTR_GPU_INSTALL_CMD $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG gpuinstall /entrypoint.sh install"
|
||||
ret=$?
|
||||
if [[ "$ret" != "0" ]]; then
|
||||
echo "Failed to install GPU driver, exiting..."
|
||||
exit $ERR_GPU_DRIVERS_START_FAIL
|
||||
fi
|
||||
ctr images rm --sync $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
ctr -n k8s.io images rm --sync $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
else
|
||||
bash -c "$DOCKER_GPU_INSTALL_CMD $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG install"
|
||||
ret=$?
|
||||
|
|
|
@ -136,7 +136,7 @@ NVIDIA_CONTAINER_RUNTIME_VERSION="3.6.0"
|
|||
export NVIDIA_DRIVER_IMAGE_SHA="${GPU_IMAGE_SHA:=}"
|
||||
export NVIDIA_DRIVER_IMAGE_TAG="${GPU_DV}-${NVIDIA_DRIVER_IMAGE_SHA}"
|
||||
export NVIDIA_DRIVER_IMAGE="mcr.microsoft.com/aks/aks-gpu"
|
||||
export CTR_GPU_INSTALL_CMD="ctr run --privileged --rm --net-host --with-ns pid:/proc/1/ns/pid --mount type=bind,src=/opt/gpu,dst=/mnt/gpu,options=rbind --mount type=bind,src=/opt/actions,dst=/mnt/actions,options=rbind"
|
||||
export CTR_GPU_INSTALL_CMD="ctr -n k8s.io run --privileged --rm --net-host --with-ns pid:/proc/1/ns/pid --mount type=bind,src=/opt/gpu,dst=/mnt/gpu,options=rbind --mount type=bind,src=/opt/actions,dst=/mnt/actions,options=rbind"
|
||||
export DOCKER_GPU_INSTALL_CMD="docker run --privileged --net=host --pid=host -v /opt/gpu:/mnt/gpu -v /opt/actions:/mnt/actions --rm"
|
||||
APT_CACHE_DIR=/var/cache/apt/archives/
|
||||
PERMANENT_CACHE_DIR=/root/aptcache/
|
||||
|
|
Различия файлов скрыты, потому что одна или несколько строк слишком длинны
|
@ -702,14 +702,14 @@ configGPUDrivers() {
|
|||
if [[ $OS == $UBUNTU_OS_NAME ]]; then
|
||||
mkdir -p /opt/{actions,gpu}
|
||||
if [[ "${CONTAINER_RUNTIME}" == "containerd" ]]; then
|
||||
ctr image pull $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
ctr -n k8s.io image pull $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
retrycmd_if_failure 5 10 600 bash -c "$CTR_GPU_INSTALL_CMD $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG gpuinstall /entrypoint.sh install"
|
||||
ret=$?
|
||||
if [[ "$ret" != "0" ]]; then
|
||||
echo "Failed to install GPU driver, exiting..."
|
||||
exit $ERR_GPU_DRIVERS_START_FAIL
|
||||
fi
|
||||
ctr images rm --sync $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
ctr -n k8s.io images rm --sync $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
else
|
||||
bash -c "$DOCKER_GPU_INSTALL_CMD $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG install"
|
||||
ret=$?
|
||||
|
|
|
@ -136,7 +136,7 @@ NVIDIA_CONTAINER_RUNTIME_VERSION="3.6.0"
|
|||
export NVIDIA_DRIVER_IMAGE_SHA="${GPU_IMAGE_SHA:=}"
|
||||
export NVIDIA_DRIVER_IMAGE_TAG="${GPU_DV}-${NVIDIA_DRIVER_IMAGE_SHA}"
|
||||
export NVIDIA_DRIVER_IMAGE="mcr.microsoft.com/aks/aks-gpu"
|
||||
export CTR_GPU_INSTALL_CMD="ctr run --privileged --rm --net-host --with-ns pid:/proc/1/ns/pid --mount type=bind,src=/opt/gpu,dst=/mnt/gpu,options=rbind --mount type=bind,src=/opt/actions,dst=/mnt/actions,options=rbind"
|
||||
export CTR_GPU_INSTALL_CMD="ctr -n k8s.io run --privileged --rm --net-host --with-ns pid:/proc/1/ns/pid --mount type=bind,src=/opt/gpu,dst=/mnt/gpu,options=rbind --mount type=bind,src=/opt/actions,dst=/mnt/actions,options=rbind"
|
||||
export DOCKER_GPU_INSTALL_CMD="docker run --privileged --net=host --pid=host -v /opt/gpu:/mnt/gpu -v /opt/actions:/mnt/actions --rm"
|
||||
APT_CACHE_DIR=/var/cache/apt/archives/
|
||||
PERMANENT_CACHE_DIR=/root/aptcache/
|
||||
|
|
Различия файлов скрыты, потому что одна или несколько строк слишком длинны
|
@ -702,14 +702,14 @@ configGPUDrivers() {
|
|||
if [[ $OS == $UBUNTU_OS_NAME ]]; then
|
||||
mkdir -p /opt/{actions,gpu}
|
||||
if [[ "${CONTAINER_RUNTIME}" == "containerd" ]]; then
|
||||
ctr image pull $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
ctr -n k8s.io image pull $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
retrycmd_if_failure 5 10 600 bash -c "$CTR_GPU_INSTALL_CMD $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG gpuinstall /entrypoint.sh install"
|
||||
ret=$?
|
||||
if [[ "$ret" != "0" ]]; then
|
||||
echo "Failed to install GPU driver, exiting..."
|
||||
exit $ERR_GPU_DRIVERS_START_FAIL
|
||||
fi
|
||||
ctr images rm --sync $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
ctr -n k8s.io images rm --sync $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
else
|
||||
bash -c "$DOCKER_GPU_INSTALL_CMD $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG install"
|
||||
ret=$?
|
||||
|
|
|
@ -136,7 +136,7 @@ NVIDIA_CONTAINER_RUNTIME_VERSION="3.6.0"
|
|||
export NVIDIA_DRIVER_IMAGE_SHA="${GPU_IMAGE_SHA:=}"
|
||||
export NVIDIA_DRIVER_IMAGE_TAG="${GPU_DV}-${NVIDIA_DRIVER_IMAGE_SHA}"
|
||||
export NVIDIA_DRIVER_IMAGE="mcr.microsoft.com/aks/aks-gpu"
|
||||
export CTR_GPU_INSTALL_CMD="ctr run --privileged --rm --net-host --with-ns pid:/proc/1/ns/pid --mount type=bind,src=/opt/gpu,dst=/mnt/gpu,options=rbind --mount type=bind,src=/opt/actions,dst=/mnt/actions,options=rbind"
|
||||
export CTR_GPU_INSTALL_CMD="ctr -n k8s.io run --privileged --rm --net-host --with-ns pid:/proc/1/ns/pid --mount type=bind,src=/opt/gpu,dst=/mnt/gpu,options=rbind --mount type=bind,src=/opt/actions,dst=/mnt/actions,options=rbind"
|
||||
export DOCKER_GPU_INSTALL_CMD="docker run --privileged --net=host --pid=host -v /opt/gpu:/mnt/gpu -v /opt/actions:/mnt/actions --rm"
|
||||
APT_CACHE_DIR=/var/cache/apt/archives/
|
||||
PERMANENT_CACHE_DIR=/root/aptcache/
|
||||
|
|
Различия файлов скрыты, потому что одна или несколько строк слишком длинны
|
@ -702,14 +702,14 @@ configGPUDrivers() {
|
|||
if [[ $OS == $UBUNTU_OS_NAME ]]; then
|
||||
mkdir -p /opt/{actions,gpu}
|
||||
if [[ "${CONTAINER_RUNTIME}" == "containerd" ]]; then
|
||||
ctr image pull $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
ctr -n k8s.io image pull $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
retrycmd_if_failure 5 10 600 bash -c "$CTR_GPU_INSTALL_CMD $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG gpuinstall /entrypoint.sh install"
|
||||
ret=$?
|
||||
if [[ "$ret" != "0" ]]; then
|
||||
echo "Failed to install GPU driver, exiting..."
|
||||
exit $ERR_GPU_DRIVERS_START_FAIL
|
||||
fi
|
||||
ctr images rm --sync $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
ctr -n k8s.io images rm --sync $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
else
|
||||
bash -c "$DOCKER_GPU_INSTALL_CMD $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG install"
|
||||
ret=$?
|
||||
|
|
|
@ -136,7 +136,7 @@ NVIDIA_CONTAINER_RUNTIME_VERSION="3.6.0"
|
|||
export NVIDIA_DRIVER_IMAGE_SHA="${GPU_IMAGE_SHA:=}"
|
||||
export NVIDIA_DRIVER_IMAGE_TAG="${GPU_DV}-${NVIDIA_DRIVER_IMAGE_SHA}"
|
||||
export NVIDIA_DRIVER_IMAGE="mcr.microsoft.com/aks/aks-gpu"
|
||||
export CTR_GPU_INSTALL_CMD="ctr run --privileged --rm --net-host --with-ns pid:/proc/1/ns/pid --mount type=bind,src=/opt/gpu,dst=/mnt/gpu,options=rbind --mount type=bind,src=/opt/actions,dst=/mnt/actions,options=rbind"
|
||||
export CTR_GPU_INSTALL_CMD="ctr -n k8s.io run --privileged --rm --net-host --with-ns pid:/proc/1/ns/pid --mount type=bind,src=/opt/gpu,dst=/mnt/gpu,options=rbind --mount type=bind,src=/opt/actions,dst=/mnt/actions,options=rbind"
|
||||
export DOCKER_GPU_INSTALL_CMD="docker run --privileged --net=host --pid=host -v /opt/gpu:/mnt/gpu -v /opt/actions:/mnt/actions --rm"
|
||||
APT_CACHE_DIR=/var/cache/apt/archives/
|
||||
PERMANENT_CACHE_DIR=/root/aptcache/
|
||||
|
|
Различия файлов скрыты, потому что одна или несколько строк слишком длинны
|
@ -702,14 +702,14 @@ configGPUDrivers() {
|
|||
if [[ $OS == $UBUNTU_OS_NAME ]]; then
|
||||
mkdir -p /opt/{actions,gpu}
|
||||
if [[ "${CONTAINER_RUNTIME}" == "containerd" ]]; then
|
||||
ctr image pull $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
ctr -n k8s.io image pull $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
retrycmd_if_failure 5 10 600 bash -c "$CTR_GPU_INSTALL_CMD $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG gpuinstall /entrypoint.sh install"
|
||||
ret=$?
|
||||
if [[ "$ret" != "0" ]]; then
|
||||
echo "Failed to install GPU driver, exiting..."
|
||||
exit $ERR_GPU_DRIVERS_START_FAIL
|
||||
fi
|
||||
ctr images rm --sync $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
ctr -n k8s.io images rm --sync $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
else
|
||||
bash -c "$DOCKER_GPU_INSTALL_CMD $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG install"
|
||||
ret=$?
|
||||
|
|
|
@ -136,7 +136,7 @@ NVIDIA_CONTAINER_RUNTIME_VERSION="3.6.0"
|
|||
export NVIDIA_DRIVER_IMAGE_SHA="${GPU_IMAGE_SHA:=}"
|
||||
export NVIDIA_DRIVER_IMAGE_TAG="${GPU_DV}-${NVIDIA_DRIVER_IMAGE_SHA}"
|
||||
export NVIDIA_DRIVER_IMAGE="mcr.microsoft.com/aks/aks-gpu"
|
||||
export CTR_GPU_INSTALL_CMD="ctr run --privileged --rm --net-host --with-ns pid:/proc/1/ns/pid --mount type=bind,src=/opt/gpu,dst=/mnt/gpu,options=rbind --mount type=bind,src=/opt/actions,dst=/mnt/actions,options=rbind"
|
||||
export CTR_GPU_INSTALL_CMD="ctr -n k8s.io run --privileged --rm --net-host --with-ns pid:/proc/1/ns/pid --mount type=bind,src=/opt/gpu,dst=/mnt/gpu,options=rbind --mount type=bind,src=/opt/actions,dst=/mnt/actions,options=rbind"
|
||||
export DOCKER_GPU_INSTALL_CMD="docker run --privileged --net=host --pid=host -v /opt/gpu:/mnt/gpu -v /opt/actions:/mnt/actions --rm"
|
||||
APT_CACHE_DIR=/var/cache/apt/archives/
|
||||
PERMANENT_CACHE_DIR=/root/aptcache/
|
||||
|
|
Различия файлов скрыты, потому что одна или несколько строк слишком длинны
|
@ -702,14 +702,14 @@ configGPUDrivers() {
|
|||
if [[ $OS == $UBUNTU_OS_NAME ]]; then
|
||||
mkdir -p /opt/{actions,gpu}
|
||||
if [[ "${CONTAINER_RUNTIME}" == "containerd" ]]; then
|
||||
ctr image pull $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
ctr -n k8s.io image pull $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
retrycmd_if_failure 5 10 600 bash -c "$CTR_GPU_INSTALL_CMD $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG gpuinstall /entrypoint.sh install"
|
||||
ret=$?
|
||||
if [[ "$ret" != "0" ]]; then
|
||||
echo "Failed to install GPU driver, exiting..."
|
||||
exit $ERR_GPU_DRIVERS_START_FAIL
|
||||
fi
|
||||
ctr images rm --sync $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
ctr -n k8s.io images rm --sync $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
else
|
||||
bash -c "$DOCKER_GPU_INSTALL_CMD $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG install"
|
||||
ret=$?
|
||||
|
|
|
@ -136,7 +136,7 @@ NVIDIA_CONTAINER_RUNTIME_VERSION="3.6.0"
|
|||
export NVIDIA_DRIVER_IMAGE_SHA="${GPU_IMAGE_SHA:=}"
|
||||
export NVIDIA_DRIVER_IMAGE_TAG="${GPU_DV}-${NVIDIA_DRIVER_IMAGE_SHA}"
|
||||
export NVIDIA_DRIVER_IMAGE="mcr.microsoft.com/aks/aks-gpu"
|
||||
export CTR_GPU_INSTALL_CMD="ctr run --privileged --rm --net-host --with-ns pid:/proc/1/ns/pid --mount type=bind,src=/opt/gpu,dst=/mnt/gpu,options=rbind --mount type=bind,src=/opt/actions,dst=/mnt/actions,options=rbind"
|
||||
export CTR_GPU_INSTALL_CMD="ctr -n k8s.io run --privileged --rm --net-host --with-ns pid:/proc/1/ns/pid --mount type=bind,src=/opt/gpu,dst=/mnt/gpu,options=rbind --mount type=bind,src=/opt/actions,dst=/mnt/actions,options=rbind"
|
||||
export DOCKER_GPU_INSTALL_CMD="docker run --privileged --net=host --pid=host -v /opt/gpu:/mnt/gpu -v /opt/actions:/mnt/actions --rm"
|
||||
APT_CACHE_DIR=/var/cache/apt/archives/
|
||||
PERMANENT_CACHE_DIR=/root/aptcache/
|
||||
|
|
Различия файлов скрыты, потому что одна или несколько строк слишком длинны
|
@ -702,14 +702,14 @@ configGPUDrivers() {
|
|||
if [[ $OS == $UBUNTU_OS_NAME ]]; then
|
||||
mkdir -p /opt/{actions,gpu}
|
||||
if [[ "${CONTAINER_RUNTIME}" == "containerd" ]]; then
|
||||
ctr image pull $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
ctr -n k8s.io image pull $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
retrycmd_if_failure 5 10 600 bash -c "$CTR_GPU_INSTALL_CMD $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG gpuinstall /entrypoint.sh install"
|
||||
ret=$?
|
||||
if [[ "$ret" != "0" ]]; then
|
||||
echo "Failed to install GPU driver, exiting..."
|
||||
exit $ERR_GPU_DRIVERS_START_FAIL
|
||||
fi
|
||||
ctr images rm --sync $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
ctr -n k8s.io images rm --sync $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
else
|
||||
bash -c "$DOCKER_GPU_INSTALL_CMD $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG install"
|
||||
ret=$?
|
||||
|
|
|
@ -136,7 +136,7 @@ NVIDIA_CONTAINER_RUNTIME_VERSION="3.6.0"
|
|||
export NVIDIA_DRIVER_IMAGE_SHA="${GPU_IMAGE_SHA:=}"
|
||||
export NVIDIA_DRIVER_IMAGE_TAG="${GPU_DV}-${NVIDIA_DRIVER_IMAGE_SHA}"
|
||||
export NVIDIA_DRIVER_IMAGE="mcr.microsoft.com/aks/aks-gpu"
|
||||
export CTR_GPU_INSTALL_CMD="ctr run --privileged --rm --net-host --with-ns pid:/proc/1/ns/pid --mount type=bind,src=/opt/gpu,dst=/mnt/gpu,options=rbind --mount type=bind,src=/opt/actions,dst=/mnt/actions,options=rbind"
|
||||
export CTR_GPU_INSTALL_CMD="ctr -n k8s.io run --privileged --rm --net-host --with-ns pid:/proc/1/ns/pid --mount type=bind,src=/opt/gpu,dst=/mnt/gpu,options=rbind --mount type=bind,src=/opt/actions,dst=/mnt/actions,options=rbind"
|
||||
export DOCKER_GPU_INSTALL_CMD="docker run --privileged --net=host --pid=host -v /opt/gpu:/mnt/gpu -v /opt/actions:/mnt/actions --rm"
|
||||
APT_CACHE_DIR=/var/cache/apt/archives/
|
||||
PERMANENT_CACHE_DIR=/root/aptcache/
|
||||
|
|
Различия файлов скрыты, потому что одна или несколько строк слишком длинны
|
@ -702,14 +702,14 @@ configGPUDrivers() {
|
|||
if [[ $OS == $UBUNTU_OS_NAME ]]; then
|
||||
mkdir -p /opt/{actions,gpu}
|
||||
if [[ "${CONTAINER_RUNTIME}" == "containerd" ]]; then
|
||||
ctr image pull $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
ctr -n k8s.io image pull $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
retrycmd_if_failure 5 10 600 bash -c "$CTR_GPU_INSTALL_CMD $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG gpuinstall /entrypoint.sh install"
|
||||
ret=$?
|
||||
if [[ "$ret" != "0" ]]; then
|
||||
echo "Failed to install GPU driver, exiting..."
|
||||
exit $ERR_GPU_DRIVERS_START_FAIL
|
||||
fi
|
||||
ctr images rm --sync $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
ctr -n k8s.io images rm --sync $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
else
|
||||
bash -c "$DOCKER_GPU_INSTALL_CMD $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG install"
|
||||
ret=$?
|
||||
|
|
|
@ -136,7 +136,7 @@ NVIDIA_CONTAINER_RUNTIME_VERSION="3.6.0"
|
|||
export NVIDIA_DRIVER_IMAGE_SHA="${GPU_IMAGE_SHA:=}"
|
||||
export NVIDIA_DRIVER_IMAGE_TAG="${GPU_DV}-${NVIDIA_DRIVER_IMAGE_SHA}"
|
||||
export NVIDIA_DRIVER_IMAGE="mcr.microsoft.com/aks/aks-gpu"
|
||||
export CTR_GPU_INSTALL_CMD="ctr run --privileged --rm --net-host --with-ns pid:/proc/1/ns/pid --mount type=bind,src=/opt/gpu,dst=/mnt/gpu,options=rbind --mount type=bind,src=/opt/actions,dst=/mnt/actions,options=rbind"
|
||||
export CTR_GPU_INSTALL_CMD="ctr -n k8s.io run --privileged --rm --net-host --with-ns pid:/proc/1/ns/pid --mount type=bind,src=/opt/gpu,dst=/mnt/gpu,options=rbind --mount type=bind,src=/opt/actions,dst=/mnt/actions,options=rbind"
|
||||
export DOCKER_GPU_INSTALL_CMD="docker run --privileged --net=host --pid=host -v /opt/gpu:/mnt/gpu -v /opt/actions:/mnt/actions --rm"
|
||||
APT_CACHE_DIR=/var/cache/apt/archives/
|
||||
PERMANENT_CACHE_DIR=/root/aptcache/
|
||||
|
|
Различия файлов скрыты, потому что одна или несколько строк слишком длинны
|
@ -702,14 +702,14 @@ configGPUDrivers() {
|
|||
if [[ $OS == $UBUNTU_OS_NAME ]]; then
|
||||
mkdir -p /opt/{actions,gpu}
|
||||
if [[ "${CONTAINER_RUNTIME}" == "containerd" ]]; then
|
||||
ctr image pull $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
ctr -n k8s.io image pull $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
retrycmd_if_failure 5 10 600 bash -c "$CTR_GPU_INSTALL_CMD $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG gpuinstall /entrypoint.sh install"
|
||||
ret=$?
|
||||
if [[ "$ret" != "0" ]]; then
|
||||
echo "Failed to install GPU driver, exiting..."
|
||||
exit $ERR_GPU_DRIVERS_START_FAIL
|
||||
fi
|
||||
ctr images rm --sync $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
ctr -n k8s.io images rm --sync $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
else
|
||||
bash -c "$DOCKER_GPU_INSTALL_CMD $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG install"
|
||||
ret=$?
|
||||
|
|
|
@ -136,7 +136,7 @@ NVIDIA_CONTAINER_RUNTIME_VERSION="3.6.0"
|
|||
export NVIDIA_DRIVER_IMAGE_SHA="${GPU_IMAGE_SHA:=}"
|
||||
export NVIDIA_DRIVER_IMAGE_TAG="${GPU_DV}-${NVIDIA_DRIVER_IMAGE_SHA}"
|
||||
export NVIDIA_DRIVER_IMAGE="mcr.microsoft.com/aks/aks-gpu"
|
||||
export CTR_GPU_INSTALL_CMD="ctr run --privileged --rm --net-host --with-ns pid:/proc/1/ns/pid --mount type=bind,src=/opt/gpu,dst=/mnt/gpu,options=rbind --mount type=bind,src=/opt/actions,dst=/mnt/actions,options=rbind"
|
||||
export CTR_GPU_INSTALL_CMD="ctr -n k8s.io run --privileged --rm --net-host --with-ns pid:/proc/1/ns/pid --mount type=bind,src=/opt/gpu,dst=/mnt/gpu,options=rbind --mount type=bind,src=/opt/actions,dst=/mnt/actions,options=rbind"
|
||||
export DOCKER_GPU_INSTALL_CMD="docker run --privileged --net=host --pid=host -v /opt/gpu:/mnt/gpu -v /opt/actions:/mnt/actions --rm"
|
||||
APT_CACHE_DIR=/var/cache/apt/archives/
|
||||
PERMANENT_CACHE_DIR=/root/aptcache/
|
||||
|
|
Различия файлов скрыты, потому что одна или несколько строк слишком длинны
|
@ -702,14 +702,14 @@ configGPUDrivers() {
|
|||
if [[ $OS == $UBUNTU_OS_NAME ]]; then
|
||||
mkdir -p /opt/{actions,gpu}
|
||||
if [[ "${CONTAINER_RUNTIME}" == "containerd" ]]; then
|
||||
ctr image pull $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
ctr -n k8s.io image pull $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
retrycmd_if_failure 5 10 600 bash -c "$CTR_GPU_INSTALL_CMD $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG gpuinstall /entrypoint.sh install"
|
||||
ret=$?
|
||||
if [[ "$ret" != "0" ]]; then
|
||||
echo "Failed to install GPU driver, exiting..."
|
||||
exit $ERR_GPU_DRIVERS_START_FAIL
|
||||
fi
|
||||
ctr images rm --sync $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
ctr -n k8s.io images rm --sync $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
else
|
||||
bash -c "$DOCKER_GPU_INSTALL_CMD $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG install"
|
||||
ret=$?
|
||||
|
|
|
@ -136,7 +136,7 @@ NVIDIA_CONTAINER_RUNTIME_VERSION="3.6.0"
|
|||
export NVIDIA_DRIVER_IMAGE_SHA="${GPU_IMAGE_SHA:=}"
|
||||
export NVIDIA_DRIVER_IMAGE_TAG="${GPU_DV}-${NVIDIA_DRIVER_IMAGE_SHA}"
|
||||
export NVIDIA_DRIVER_IMAGE="mcr.microsoft.com/aks/aks-gpu"
|
||||
export CTR_GPU_INSTALL_CMD="ctr run --privileged --rm --net-host --with-ns pid:/proc/1/ns/pid --mount type=bind,src=/opt/gpu,dst=/mnt/gpu,options=rbind --mount type=bind,src=/opt/actions,dst=/mnt/actions,options=rbind"
|
||||
export CTR_GPU_INSTALL_CMD="ctr -n k8s.io run --privileged --rm --net-host --with-ns pid:/proc/1/ns/pid --mount type=bind,src=/opt/gpu,dst=/mnt/gpu,options=rbind --mount type=bind,src=/opt/actions,dst=/mnt/actions,options=rbind"
|
||||
export DOCKER_GPU_INSTALL_CMD="docker run --privileged --net=host --pid=host -v /opt/gpu:/mnt/gpu -v /opt/actions:/mnt/actions --rm"
|
||||
APT_CACHE_DIR=/var/cache/apt/archives/
|
||||
PERMANENT_CACHE_DIR=/root/aptcache/
|
||||
|
|
Различия файлов скрыты, потому что одна или несколько строк слишком длинны
|
@ -702,14 +702,14 @@ configGPUDrivers() {
|
|||
if [[ $OS == $UBUNTU_OS_NAME ]]; then
|
||||
mkdir -p /opt/{actions,gpu}
|
||||
if [[ "${CONTAINER_RUNTIME}" == "containerd" ]]; then
|
||||
ctr image pull $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
ctr -n k8s.io image pull $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
retrycmd_if_failure 5 10 600 bash -c "$CTR_GPU_INSTALL_CMD $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG gpuinstall /entrypoint.sh install"
|
||||
ret=$?
|
||||
if [[ "$ret" != "0" ]]; then
|
||||
echo "Failed to install GPU driver, exiting..."
|
||||
exit $ERR_GPU_DRIVERS_START_FAIL
|
||||
fi
|
||||
ctr images rm --sync $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
ctr -n k8s.io images rm --sync $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
else
|
||||
bash -c "$DOCKER_GPU_INSTALL_CMD $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG install"
|
||||
ret=$?
|
||||
|
|
|
@ -136,7 +136,7 @@ NVIDIA_CONTAINER_RUNTIME_VERSION="3.6.0"
|
|||
export NVIDIA_DRIVER_IMAGE_SHA="${GPU_IMAGE_SHA:=}"
|
||||
export NVIDIA_DRIVER_IMAGE_TAG="${GPU_DV}-${NVIDIA_DRIVER_IMAGE_SHA}"
|
||||
export NVIDIA_DRIVER_IMAGE="mcr.microsoft.com/aks/aks-gpu"
|
||||
export CTR_GPU_INSTALL_CMD="ctr run --privileged --rm --net-host --with-ns pid:/proc/1/ns/pid --mount type=bind,src=/opt/gpu,dst=/mnt/gpu,options=rbind --mount type=bind,src=/opt/actions,dst=/mnt/actions,options=rbind"
|
||||
export CTR_GPU_INSTALL_CMD="ctr -n k8s.io run --privileged --rm --net-host --with-ns pid:/proc/1/ns/pid --mount type=bind,src=/opt/gpu,dst=/mnt/gpu,options=rbind --mount type=bind,src=/opt/actions,dst=/mnt/actions,options=rbind"
|
||||
export DOCKER_GPU_INSTALL_CMD="docker run --privileged --net=host --pid=host -v /opt/gpu:/mnt/gpu -v /opt/actions:/mnt/actions --rm"
|
||||
APT_CACHE_DIR=/var/cache/apt/archives/
|
||||
PERMANENT_CACHE_DIR=/root/aptcache/
|
||||
|
|
Различия файлов скрыты, потому что одна или несколько строк слишком длинны
|
@ -702,14 +702,14 @@ configGPUDrivers() {
|
|||
if [[ $OS == $UBUNTU_OS_NAME ]]; then
|
||||
mkdir -p /opt/{actions,gpu}
|
||||
if [[ "${CONTAINER_RUNTIME}" == "containerd" ]]; then
|
||||
ctr image pull $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
ctr -n k8s.io image pull $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
retrycmd_if_failure 5 10 600 bash -c "$CTR_GPU_INSTALL_CMD $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG gpuinstall /entrypoint.sh install"
|
||||
ret=$?
|
||||
if [[ "$ret" != "0" ]]; then
|
||||
echo "Failed to install GPU driver, exiting..."
|
||||
exit $ERR_GPU_DRIVERS_START_FAIL
|
||||
fi
|
||||
ctr images rm --sync $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
ctr -n k8s.io images rm --sync $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
else
|
||||
bash -c "$DOCKER_GPU_INSTALL_CMD $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG install"
|
||||
ret=$?
|
||||
|
|
|
@ -136,7 +136,7 @@ NVIDIA_CONTAINER_RUNTIME_VERSION="3.6.0"
|
|||
export NVIDIA_DRIVER_IMAGE_SHA="${GPU_IMAGE_SHA:=}"
|
||||
export NVIDIA_DRIVER_IMAGE_TAG="${GPU_DV}-${NVIDIA_DRIVER_IMAGE_SHA}"
|
||||
export NVIDIA_DRIVER_IMAGE="mcr.microsoft.com/aks/aks-gpu"
|
||||
export CTR_GPU_INSTALL_CMD="ctr run --privileged --rm --net-host --with-ns pid:/proc/1/ns/pid --mount type=bind,src=/opt/gpu,dst=/mnt/gpu,options=rbind --mount type=bind,src=/opt/actions,dst=/mnt/actions,options=rbind"
|
||||
export CTR_GPU_INSTALL_CMD="ctr -n k8s.io run --privileged --rm --net-host --with-ns pid:/proc/1/ns/pid --mount type=bind,src=/opt/gpu,dst=/mnt/gpu,options=rbind --mount type=bind,src=/opt/actions,dst=/mnt/actions,options=rbind"
|
||||
export DOCKER_GPU_INSTALL_CMD="docker run --privileged --net=host --pid=host -v /opt/gpu:/mnt/gpu -v /opt/actions:/mnt/actions --rm"
|
||||
APT_CACHE_DIR=/var/cache/apt/archives/
|
||||
PERMANENT_CACHE_DIR=/root/aptcache/
|
||||
|
|
Различия файлов скрыты, потому что одна или несколько строк слишком длинны
|
@ -702,14 +702,14 @@ configGPUDrivers() {
|
|||
if [[ $OS == $UBUNTU_OS_NAME ]]; then
|
||||
mkdir -p /opt/{actions,gpu}
|
||||
if [[ "${CONTAINER_RUNTIME}" == "containerd" ]]; then
|
||||
ctr image pull $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
ctr -n k8s.io image pull $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
retrycmd_if_failure 5 10 600 bash -c "$CTR_GPU_INSTALL_CMD $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG gpuinstall /entrypoint.sh install"
|
||||
ret=$?
|
||||
if [[ "$ret" != "0" ]]; then
|
||||
echo "Failed to install GPU driver, exiting..."
|
||||
exit $ERR_GPU_DRIVERS_START_FAIL
|
||||
fi
|
||||
ctr images rm --sync $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
ctr -n k8s.io images rm --sync $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
else
|
||||
bash -c "$DOCKER_GPU_INSTALL_CMD $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG install"
|
||||
ret=$?
|
||||
|
|
|
@ -136,7 +136,7 @@ NVIDIA_CONTAINER_RUNTIME_VERSION="3.6.0"
|
|||
export NVIDIA_DRIVER_IMAGE_SHA="${GPU_IMAGE_SHA:=}"
|
||||
export NVIDIA_DRIVER_IMAGE_TAG="${GPU_DV}-${NVIDIA_DRIVER_IMAGE_SHA}"
|
||||
export NVIDIA_DRIVER_IMAGE="mcr.microsoft.com/aks/aks-gpu"
|
||||
export CTR_GPU_INSTALL_CMD="ctr run --privileged --rm --net-host --with-ns pid:/proc/1/ns/pid --mount type=bind,src=/opt/gpu,dst=/mnt/gpu,options=rbind --mount type=bind,src=/opt/actions,dst=/mnt/actions,options=rbind"
|
||||
export CTR_GPU_INSTALL_CMD="ctr -n k8s.io run --privileged --rm --net-host --with-ns pid:/proc/1/ns/pid --mount type=bind,src=/opt/gpu,dst=/mnt/gpu,options=rbind --mount type=bind,src=/opt/actions,dst=/mnt/actions,options=rbind"
|
||||
export DOCKER_GPU_INSTALL_CMD="docker run --privileged --net=host --pid=host -v /opt/gpu:/mnt/gpu -v /opt/actions:/mnt/actions --rm"
|
||||
APT_CACHE_DIR=/var/cache/apt/archives/
|
||||
PERMANENT_CACHE_DIR=/root/aptcache/
|
||||
|
|
Различия файлов скрыты, потому что одна или несколько строк слишком длинны
|
@ -702,14 +702,14 @@ configGPUDrivers() {
|
|||
if [[ $OS == $UBUNTU_OS_NAME ]]; then
|
||||
mkdir -p /opt/{actions,gpu}
|
||||
if [[ "${CONTAINER_RUNTIME}" == "containerd" ]]; then
|
||||
ctr image pull $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
ctr -n k8s.io image pull $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
retrycmd_if_failure 5 10 600 bash -c "$CTR_GPU_INSTALL_CMD $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG gpuinstall /entrypoint.sh install"
|
||||
ret=$?
|
||||
if [[ "$ret" != "0" ]]; then
|
||||
echo "Failed to install GPU driver, exiting..."
|
||||
exit $ERR_GPU_DRIVERS_START_FAIL
|
||||
fi
|
||||
ctr images rm --sync $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
ctr -n k8s.io images rm --sync $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
else
|
||||
bash -c "$DOCKER_GPU_INSTALL_CMD $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG install"
|
||||
ret=$?
|
||||
|
|
|
@ -136,7 +136,7 @@ NVIDIA_CONTAINER_RUNTIME_VERSION="3.6.0"
|
|||
export NVIDIA_DRIVER_IMAGE_SHA="${GPU_IMAGE_SHA:=}"
|
||||
export NVIDIA_DRIVER_IMAGE_TAG="${GPU_DV}-${NVIDIA_DRIVER_IMAGE_SHA}"
|
||||
export NVIDIA_DRIVER_IMAGE="mcr.microsoft.com/aks/aks-gpu"
|
||||
export CTR_GPU_INSTALL_CMD="ctr run --privileged --rm --net-host --with-ns pid:/proc/1/ns/pid --mount type=bind,src=/opt/gpu,dst=/mnt/gpu,options=rbind --mount type=bind,src=/opt/actions,dst=/mnt/actions,options=rbind"
|
||||
export CTR_GPU_INSTALL_CMD="ctr -n k8s.io run --privileged --rm --net-host --with-ns pid:/proc/1/ns/pid --mount type=bind,src=/opt/gpu,dst=/mnt/gpu,options=rbind --mount type=bind,src=/opt/actions,dst=/mnt/actions,options=rbind"
|
||||
export DOCKER_GPU_INSTALL_CMD="docker run --privileged --net=host --pid=host -v /opt/gpu:/mnt/gpu -v /opt/actions:/mnt/actions --rm"
|
||||
APT_CACHE_DIR=/var/cache/apt/archives/
|
||||
PERMANENT_CACHE_DIR=/root/aptcache/
|
||||
|
|
Различия файлов скрыты, потому что одна или несколько строк слишком длинны
|
@ -702,14 +702,14 @@ configGPUDrivers() {
|
|||
if [[ $OS == $UBUNTU_OS_NAME ]]; then
|
||||
mkdir -p /opt/{actions,gpu}
|
||||
if [[ "${CONTAINER_RUNTIME}" == "containerd" ]]; then
|
||||
ctr image pull $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
ctr -n k8s.io image pull $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
retrycmd_if_failure 5 10 600 bash -c "$CTR_GPU_INSTALL_CMD $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG gpuinstall /entrypoint.sh install"
|
||||
ret=$?
|
||||
if [[ "$ret" != "0" ]]; then
|
||||
echo "Failed to install GPU driver, exiting..."
|
||||
exit $ERR_GPU_DRIVERS_START_FAIL
|
||||
fi
|
||||
ctr images rm --sync $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
ctr -n k8s.io images rm --sync $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
else
|
||||
bash -c "$DOCKER_GPU_INSTALL_CMD $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG install"
|
||||
ret=$?
|
||||
|
|
|
@ -136,7 +136,7 @@ NVIDIA_CONTAINER_RUNTIME_VERSION="3.6.0"
|
|||
export NVIDIA_DRIVER_IMAGE_SHA="${GPU_IMAGE_SHA:=}"
|
||||
export NVIDIA_DRIVER_IMAGE_TAG="${GPU_DV}-${NVIDIA_DRIVER_IMAGE_SHA}"
|
||||
export NVIDIA_DRIVER_IMAGE="mcr.microsoft.com/aks/aks-gpu"
|
||||
export CTR_GPU_INSTALL_CMD="ctr run --privileged --rm --net-host --with-ns pid:/proc/1/ns/pid --mount type=bind,src=/opt/gpu,dst=/mnt/gpu,options=rbind --mount type=bind,src=/opt/actions,dst=/mnt/actions,options=rbind"
|
||||
export CTR_GPU_INSTALL_CMD="ctr -n k8s.io run --privileged --rm --net-host --with-ns pid:/proc/1/ns/pid --mount type=bind,src=/opt/gpu,dst=/mnt/gpu,options=rbind --mount type=bind,src=/opt/actions,dst=/mnt/actions,options=rbind"
|
||||
export DOCKER_GPU_INSTALL_CMD="docker run --privileged --net=host --pid=host -v /opt/gpu:/mnt/gpu -v /opt/actions:/mnt/actions --rm"
|
||||
APT_CACHE_DIR=/var/cache/apt/archives/
|
||||
PERMANENT_CACHE_DIR=/root/aptcache/
|
||||
|
|
Различия файлов скрыты, потому что одна или несколько строк слишком длинны
|
@ -702,14 +702,14 @@ configGPUDrivers() {
|
|||
if [[ $OS == $UBUNTU_OS_NAME ]]; then
|
||||
mkdir -p /opt/{actions,gpu}
|
||||
if [[ "${CONTAINER_RUNTIME}" == "containerd" ]]; then
|
||||
ctr image pull $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
ctr -n k8s.io image pull $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
retrycmd_if_failure 5 10 600 bash -c "$CTR_GPU_INSTALL_CMD $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG gpuinstall /entrypoint.sh install"
|
||||
ret=$?
|
||||
if [[ "$ret" != "0" ]]; then
|
||||
echo "Failed to install GPU driver, exiting..."
|
||||
exit $ERR_GPU_DRIVERS_START_FAIL
|
||||
fi
|
||||
ctr images rm --sync $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
ctr -n k8s.io images rm --sync $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
else
|
||||
bash -c "$DOCKER_GPU_INSTALL_CMD $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG install"
|
||||
ret=$?
|
||||
|
|
|
@ -136,7 +136,7 @@ NVIDIA_CONTAINER_RUNTIME_VERSION="3.6.0"
|
|||
export NVIDIA_DRIVER_IMAGE_SHA="${GPU_IMAGE_SHA:=}"
|
||||
export NVIDIA_DRIVER_IMAGE_TAG="${GPU_DV}-${NVIDIA_DRIVER_IMAGE_SHA}"
|
||||
export NVIDIA_DRIVER_IMAGE="mcr.microsoft.com/aks/aks-gpu"
|
||||
export CTR_GPU_INSTALL_CMD="ctr run --privileged --rm --net-host --with-ns pid:/proc/1/ns/pid --mount type=bind,src=/opt/gpu,dst=/mnt/gpu,options=rbind --mount type=bind,src=/opt/actions,dst=/mnt/actions,options=rbind"
|
||||
export CTR_GPU_INSTALL_CMD="ctr -n k8s.io run --privileged --rm --net-host --with-ns pid:/proc/1/ns/pid --mount type=bind,src=/opt/gpu,dst=/mnt/gpu,options=rbind --mount type=bind,src=/opt/actions,dst=/mnt/actions,options=rbind"
|
||||
export DOCKER_GPU_INSTALL_CMD="docker run --privileged --net=host --pid=host -v /opt/gpu:/mnt/gpu -v /opt/actions:/mnt/actions --rm"
|
||||
APT_CACHE_DIR=/var/cache/apt/archives/
|
||||
PERMANENT_CACHE_DIR=/root/aptcache/
|
||||
|
|
Различия файлов скрыты, потому что одна или несколько строк слишком длинны
|
@ -702,14 +702,14 @@ configGPUDrivers() {
|
|||
if [[ $OS == $UBUNTU_OS_NAME ]]; then
|
||||
mkdir -p /opt/{actions,gpu}
|
||||
if [[ "${CONTAINER_RUNTIME}" == "containerd" ]]; then
|
||||
ctr image pull $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
ctr -n k8s.io image pull $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
retrycmd_if_failure 5 10 600 bash -c "$CTR_GPU_INSTALL_CMD $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG gpuinstall /entrypoint.sh install"
|
||||
ret=$?
|
||||
if [[ "$ret" != "0" ]]; then
|
||||
echo "Failed to install GPU driver, exiting..."
|
||||
exit $ERR_GPU_DRIVERS_START_FAIL
|
||||
fi
|
||||
ctr images rm --sync $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
ctr -n k8s.io images rm --sync $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
else
|
||||
bash -c "$DOCKER_GPU_INSTALL_CMD $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG install"
|
||||
ret=$?
|
||||
|
|
|
@ -136,7 +136,7 @@ NVIDIA_CONTAINER_RUNTIME_VERSION="3.6.0"
|
|||
export NVIDIA_DRIVER_IMAGE_SHA="${GPU_IMAGE_SHA:=}"
|
||||
export NVIDIA_DRIVER_IMAGE_TAG="${GPU_DV}-${NVIDIA_DRIVER_IMAGE_SHA}"
|
||||
export NVIDIA_DRIVER_IMAGE="mcr.microsoft.com/aks/aks-gpu"
|
||||
export CTR_GPU_INSTALL_CMD="ctr run --privileged --rm --net-host --with-ns pid:/proc/1/ns/pid --mount type=bind,src=/opt/gpu,dst=/mnt/gpu,options=rbind --mount type=bind,src=/opt/actions,dst=/mnt/actions,options=rbind"
|
||||
export CTR_GPU_INSTALL_CMD="ctr -n k8s.io run --privileged --rm --net-host --with-ns pid:/proc/1/ns/pid --mount type=bind,src=/opt/gpu,dst=/mnt/gpu,options=rbind --mount type=bind,src=/opt/actions,dst=/mnt/actions,options=rbind"
|
||||
export DOCKER_GPU_INSTALL_CMD="docker run --privileged --net=host --pid=host -v /opt/gpu:/mnt/gpu -v /opt/actions:/mnt/actions --rm"
|
||||
APT_CACHE_DIR=/var/cache/apt/archives/
|
||||
PERMANENT_CACHE_DIR=/root/aptcache/
|
||||
|
|
Различия файлов скрыты, потому что одна или несколько строк слишком длинны
|
@ -702,14 +702,14 @@ configGPUDrivers() {
|
|||
if [[ $OS == $UBUNTU_OS_NAME ]]; then
|
||||
mkdir -p /opt/{actions,gpu}
|
||||
if [[ "${CONTAINER_RUNTIME}" == "containerd" ]]; then
|
||||
ctr image pull $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
ctr -n k8s.io image pull $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
retrycmd_if_failure 5 10 600 bash -c "$CTR_GPU_INSTALL_CMD $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG gpuinstall /entrypoint.sh install"
|
||||
ret=$?
|
||||
if [[ "$ret" != "0" ]]; then
|
||||
echo "Failed to install GPU driver, exiting..."
|
||||
exit $ERR_GPU_DRIVERS_START_FAIL
|
||||
fi
|
||||
ctr images rm --sync $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
ctr -n k8s.io images rm --sync $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
else
|
||||
bash -c "$DOCKER_GPU_INSTALL_CMD $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG install"
|
||||
ret=$?
|
||||
|
|
|
@ -136,7 +136,7 @@ NVIDIA_CONTAINER_RUNTIME_VERSION="3.6.0"
|
|||
export NVIDIA_DRIVER_IMAGE_SHA="${GPU_IMAGE_SHA:=}"
|
||||
export NVIDIA_DRIVER_IMAGE_TAG="${GPU_DV}-${NVIDIA_DRIVER_IMAGE_SHA}"
|
||||
export NVIDIA_DRIVER_IMAGE="mcr.microsoft.com/aks/aks-gpu"
|
||||
export CTR_GPU_INSTALL_CMD="ctr run --privileged --rm --net-host --with-ns pid:/proc/1/ns/pid --mount type=bind,src=/opt/gpu,dst=/mnt/gpu,options=rbind --mount type=bind,src=/opt/actions,dst=/mnt/actions,options=rbind"
|
||||
export CTR_GPU_INSTALL_CMD="ctr -n k8s.io run --privileged --rm --net-host --with-ns pid:/proc/1/ns/pid --mount type=bind,src=/opt/gpu,dst=/mnt/gpu,options=rbind --mount type=bind,src=/opt/actions,dst=/mnt/actions,options=rbind"
|
||||
export DOCKER_GPU_INSTALL_CMD="docker run --privileged --net=host --pid=host -v /opt/gpu:/mnt/gpu -v /opt/actions:/mnt/actions --rm"
|
||||
APT_CACHE_DIR=/var/cache/apt/archives/
|
||||
PERMANENT_CACHE_DIR=/root/aptcache/
|
||||
|
|
Различия файлов скрыты, потому что одна или несколько строк слишком длинны
|
@ -702,14 +702,14 @@ configGPUDrivers() {
|
|||
if [[ $OS == $UBUNTU_OS_NAME ]]; then
|
||||
mkdir -p /opt/{actions,gpu}
|
||||
if [[ "${CONTAINER_RUNTIME}" == "containerd" ]]; then
|
||||
ctr image pull $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
ctr -n k8s.io image pull $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
retrycmd_if_failure 5 10 600 bash -c "$CTR_GPU_INSTALL_CMD $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG gpuinstall /entrypoint.sh install"
|
||||
ret=$?
|
||||
if [[ "$ret" != "0" ]]; then
|
||||
echo "Failed to install GPU driver, exiting..."
|
||||
exit $ERR_GPU_DRIVERS_START_FAIL
|
||||
fi
|
||||
ctr images rm --sync $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
ctr -n k8s.io images rm --sync $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
else
|
||||
bash -c "$DOCKER_GPU_INSTALL_CMD $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG install"
|
||||
ret=$?
|
||||
|
|
|
@@ -136,7 +136,7 @@ NVIDIA_CONTAINER_RUNTIME_VERSION="3.6.0"
|
|||
export NVIDIA_DRIVER_IMAGE_SHA="${GPU_IMAGE_SHA:=}"
|
||||
export NVIDIA_DRIVER_IMAGE_TAG="${GPU_DV}-${NVIDIA_DRIVER_IMAGE_SHA}"
|
||||
export NVIDIA_DRIVER_IMAGE="mcr.microsoft.com/aks/aks-gpu"
|
||||
export CTR_GPU_INSTALL_CMD="ctr run --privileged --rm --net-host --with-ns pid:/proc/1/ns/pid --mount type=bind,src=/opt/gpu,dst=/mnt/gpu,options=rbind --mount type=bind,src=/opt/actions,dst=/mnt/actions,options=rbind"
|
||||
export CTR_GPU_INSTALL_CMD="ctr -n k8s.io run --privileged --rm --net-host --with-ns pid:/proc/1/ns/pid --mount type=bind,src=/opt/gpu,dst=/mnt/gpu,options=rbind --mount type=bind,src=/opt/actions,dst=/mnt/actions,options=rbind"
|
||||
export DOCKER_GPU_INSTALL_CMD="docker run --privileged --net=host --pid=host -v /opt/gpu:/mnt/gpu -v /opt/actions:/mnt/actions --rm"
|
||||
APT_CACHE_DIR=/var/cache/apt/archives/
|
||||
PERMANENT_CACHE_DIR=/root/aptcache/
|
||||
|
|
Различия файлов скрыты, потому что одна или несколько строк слишком длинны
|
@@ -702,14 +702,14 @@ configGPUDrivers() {
|
|||
if [[ $OS == $UBUNTU_OS_NAME ]]; then
|
||||
mkdir -p /opt/{actions,gpu}
|
||||
if [[ "${CONTAINER_RUNTIME}" == "containerd" ]]; then
|
||||
ctr image pull $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
ctr -n k8s.io image pull $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
retrycmd_if_failure 5 10 600 bash -c "$CTR_GPU_INSTALL_CMD $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG gpuinstall /entrypoint.sh install"
|
||||
ret=$?
|
||||
if [[ "$ret" != "0" ]]; then
|
||||
echo "Failed to install GPU driver, exiting..."
|
||||
exit $ERR_GPU_DRIVERS_START_FAIL
|
||||
fi
|
||||
ctr images rm --sync $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
ctr -n k8s.io images rm --sync $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG
|
||||
else
|
||||
bash -c "$DOCKER_GPU_INSTALL_CMD $NVIDIA_DRIVER_IMAGE:$NVIDIA_DRIVER_IMAGE_TAG install"
|
||||
ret=$?
|
||||
|
|
Некоторые файлы не были показаны из-за слишком большого количества измененных файлов Показать больше
Загрузка…
Ссылка в новой задаче