Handle package db conflicts
- TensorFlow recipe typos
This commit is contained in:
Родитель
093cfdbc83
Коммит
01c2f89ba5
|
@ -12,6 +12,7 @@
|
|||
- CentOS 7.3 to 7.4 Nvidia driver breakage
|
||||
- Regression in `pool ssh` on Windows
|
||||
- Exception in unusable nodes with pool stats on allocation
|
||||
- Handle package manager db locks during conflicts for local package installs
|
||||
|
||||
## [2.9.4] - 2017-09-12
|
||||
### Changed
|
||||
|
|
|
@ -30,7 +30,7 @@ e.g., `gcr.io/tensorflow/tensorflow`
|
|||
* `resource_files` array should be populated if you want Azure Batch to handle
|
||||
the download of the training file from the web endpoint:
|
||||
* `file_path` is the local file path which should be set to
|
||||
`train_mnist.py`
|
||||
`convolutional.py`
|
||||
* `blob_source` is the remote URL of the file to retrieve:
|
||||
`https://raw.githubusercontent.com/tensorflow/models/master/tutorials/image/mnist/convolutional.py`
|
||||
* `command` should contain the command to pass to the Docker run invocation.
|
||||
|
|
|
@ -37,7 +37,7 @@ e.g., `gcr.io/tensorflow/tensorflow:latest-gpu`
|
|||
* `resource_files` array should be populated if you want Azure Batch to handle
|
||||
the download of the training file from the web endpoint:
|
||||
* `file_path` is the local file path which should be set to
|
||||
`train_mnist.py`
|
||||
`convolutional.py`
|
||||
* `blob_source` is the remote URL of the file to retrieve:
|
||||
`https://raw.githubusercontent.com/tensorflow/models/master/tutorials/image/mnist/convolutional.py`
|
||||
* `command` should contain the command to pass to the Docker run invocation.
|
||||
|
|
|
@ -218,11 +218,7 @@ EOF
|
|||
echo "IgnoreSP=TRUE" >> /etc/nvidia/gridd.conf
|
||||
fi
|
||||
# install nvidia-docker
|
||||
if [ $offer == "ubuntuserver" ]; then
|
||||
dpkg -i $nvdocker
|
||||
elif [[ $offer == centos* ]]; then
|
||||
rpm -Uvh $nvdocker
|
||||
fi
|
||||
install_local_packages $offer $nvdocker
|
||||
# enable and start nvidia docker service
|
||||
systemctl enable nvidia-docker.service
|
||||
systemctl start nvidia-docker.service
|
||||
|
@ -287,7 +283,7 @@ install_azurefile_docker_volume_driver() {
|
|||
refresh_package_index() {
|
||||
offer=$1
|
||||
set +e
|
||||
retries=30
|
||||
retries=120
|
||||
while [ $retries -gt 0 ]; do
|
||||
if [[ $offer == "ubuntuserver" ]] || [[ $offer == "debian" ]]; then
|
||||
apt-get update
|
||||
|
@ -313,7 +309,7 @@ install_packages() {
|
|||
offer=$1
|
||||
shift
|
||||
set +e
|
||||
retries=30
|
||||
retries=120
|
||||
while [ $retries -gt 0 ]; do
|
||||
if [[ $offer == "ubuntuserver" ]] || [[ $offer == "debian" ]]; then
|
||||
apt-get install -y -q -o Dpkg::Options::="--force-confnew" --no-install-recommends $*
|
||||
|
@ -335,6 +331,30 @@ install_packages() {
|
|||
set -e
|
||||
}
|
||||
|
||||
# Install local package files (.deb / .rpm), retrying on failure.
#
# The install is attempted up to 120 times, one second apart, so that a
# transient failure (e.g. the package manager database being locked by a
# conflicting operation) does not abort node preparation.
#
# Arguments:
#   $1   - offer name; "ubuntuserver" or "debian" selects dpkg, any other
#          value selects rpm
#   $2.. - paths of the package files to install
# Outputs:
#   Prints an ERROR line to stdout once every attempt has failed.
# Side effects:
#   errexit is switched off while retrying and is unconditionally switched
#   on again before returning. The whole script exits with status 1 when
#   the packages could not be installed.
install_local_packages() {
    local offer=$1
    shift
    local retries=120
    local rc
    # failures are expected while retrying, so errexit must be off here
    set +e
    while [ "$retries" -gt 0 ]; do
        # "$@" keeps every package path as exactly one argument, even when
        # it contains whitespace or glob characters
        if [[ $offer == "ubuntuserver" ]] || [[ $offer == "debian" ]]; then
            dpkg -i "$@"
        else
            rpm -Uvh --nodeps "$@"
        fi
        rc=$?
        if [ "$rc" -eq 0 ]; then
            break
        fi
        retries=$((retries - 1))
        if [ "$retries" -eq 0 ]; then
            echo "ERROR: Could not install local packages: $*"
            exit 1
        fi
        sleep 1
    done
    set -e
}
|
||||
|
||||
docker_pull_image() {
|
||||
image=$1
|
||||
set +e
|
||||
|
@ -793,7 +813,7 @@ elif [[ $offer == opensuse* ]] || [[ $offer == sles* ]]; then
|
|||
exit 1
|
||||
fi
|
||||
install_packages $offer lsb
|
||||
rpm -Uvh --nodeps /opt/intelMPI/intel_mpi_packages/*.rpm
|
||||
install_local_packages $offer /opt/intelMPI/intel_mpi_packages/*.rpm
|
||||
mkdir -p /opt/intel/compilers_and_libraries/linux
|
||||
ln -s /opt/intel/impi/5.0.3.048 /opt/intel/compilers_and_libraries/linux/mpi
|
||||
fi
|
||||
|
|
Загрузка…
Ссылка в новой задаче