DeepSpeech/.compute

#!/bin/bash
#
# Cluster job script: creates a Python virtualenv, installs the training
# package from the current directory together with GPU TensorFlow 1.14, and
# launches DeepSpeech.py training on the sample databases (*.sdb) found under
# "${SHARED_DIR}/data".
#
# Required environment:
#   SHARED_DIR  root of the shared storage; datasets are read from
#               "${SHARED_DIR}/data".
#
# Outputs (relative to the working directory):
#   ../keep            checkpoints
#   ../keep/summaries  training summaries
#   ../tmp             feature cache

# -x traces every command into the job log; -e aborts on the first failure.
# NOTE(review): `set -u` is intentionally not enabled here, because the sourced
# venv activate script may read unset variables — confirm before tightening.
set -xe

# Fail fast, before the lengthy package installation, when SHARED_DIR is
# unset or empty: otherwise every dataset path below would silently resolve
# under "/data" and the job would only break once training starts.
: "${SHARED_DIR:?SHARED_DIR must point to the shared storage root}"

apt-get install -y python3-venv libopus0

python3 -m venv /tmp/venv
source /tmp/venv/bin/activate

pip install -U setuptools wheel pip
pip install .
# Swap whatever `tensorflow` package is installed at this point for the
# pinned GPU build.
pip uninstall -y tensorflow
pip install tensorflow-gpu==1.14

# Create the directories the training run writes into: the summary directory
# (inside the checkpoint directory) and the parent of the feature cache file.
mkdir -p ../keep/summaries ../tmp

# Dataset locations. `fis`, `swb` and `lbs` are path *prefixes*: the set name
# is appended with a dash (e.g. "${lbs}-dev-clean.sdb"), while `cv` and `npr`
# are directories.
data="${SHARED_DIR}/data"
fis="${data}/LDC/fisher"
swb="${data}/LDC/LDC97S62/swb"
lbs="${data}/OpenSLR/LibriSpeech/librivox"
cv="${data}/mozilla/CommonVoice/en_1087h_2019-06-12/clips"
npr="${data}/NPR/WAMU/sets/v0.3"

# Training sets, one per line for readable diffs; they are joined with commas
# below because --train_files takes a single comma-separated argument.
train_sets=(
  "${npr}/best-train.sdb"
  "${npr}/good-train.sdb"
  "${cv}/train.sdb"
  "${fis}-train.sdb"
  "${swb}-train.sdb"
  "${lbs}-train-clean-100.sdb"
  "${lbs}-train-clean-360.sdb"
  "${lbs}-train-other-500.sdb"
)
# "${array[*]}" joins the elements with the first character of IFS; the
# subshell keeps the IFS change from leaking into the rest of the script.
train_files=$(IFS=,; printf '%s' "${train_sets[*]}")

# -u keeps Python's output unbuffered so the job log updates as training runs.
python -u DeepSpeech.py \
  --train_files "${train_files}" \
  --dev_files "${lbs}-dev-clean.sdb" \
  --test_files "${lbs}-test-clean.sdb" \
  --train_batch_size 24 \
  --dev_batch_size 48 \
  --test_batch_size 48 \
  --train_cudnn \
  --n_hidden 2048 \
  --learning_rate 0.0001 \
  --dropout_rate 0.40 \
  --epochs 150 \
  --noearly_stop \
  --feature_cache "../tmp/feature.cache" \
  --checkpoint_dir "../keep" \
  --summary_dir "../keep/summaries"
Fix #493; DeepSpeech part of SLURM cluster support 2017-05-16 18:20:52 +03:00			`#!/bin/bash`

Update .compute script for new cluster setup 2019-02-19 19:26:51 +03:00			`set -xe`
Default training setup for new cluster 2018-09-04 19:49:44 +03:00
Updated .compute 2020-03-27 18:18:18 +03:00			`apt-get install -y python3-venv libopus0`

Use venv module in .compute script 2019-02-22 19:38:28 +03:00			`python3 -m venv /tmp/venv`
			`source /tmp/venv/bin/activate`

Updated .compute 2020-03-27 18:18:18 +03:00			`pip install -U setuptools wheel pip`
Fix .compute for packaged training code 2020-04-01 17:24:36 +03:00			`pip install .`
			`pip uninstall -y tensorflow`
Updated .compute 2020-03-27 18:18:18 +03:00			`pip install tensorflow-gpu==1.14`
Update .compute script for new cluster setup 2019-02-19 19:26:51 +03:00
			`mkdir -p ../keep/summaries`

			`data="${SHARED_DIR}/data"`
Default training setup for new cluster 2018-09-04 19:49:44 +03:00			`fis="${data}/LDC/fisher"`
			`swb="${data}/LDC/LDC97S62/swb"`
			`lbs="${data}/OpenSLR/LibriSpeech/librivox"`
Updated .compute 2020-03-27 18:18:18 +03:00			`cv="${data}/mozilla/CommonVoice/en_1087h_2019-06-12/clips"`
			`npr="${data}/NPR/WAMU/sets/v0.3"`
Default training setup for new cluster 2018-09-04 19:49:44 +03:00
Use venv module in .compute script 2019-02-22 19:38:28 +03:00			`python -u DeepSpeech.py \`
Updated .compute 2020-03-27 18:18:18 +03:00			`--train_files "${npr}/best-train.sdb","${npr}/good-train.sdb","${cv}/train.sdb","${fis}-train.sdb","${swb}-train.sdb","${lbs}-train-clean-100.sdb","${lbs}-train-clean-360.sdb","${lbs}-train-other-500.sdb" \`
			`--dev_files "${lbs}-dev-clean.sdb" \`
			`--test_files "${lbs}-test-clean.sdb" \`
Default training setup for new cluster 2018-09-04 19:49:44 +03:00			`--train_batch_size 24 \`
			`--dev_batch_size 48 \`
			`--test_batch_size 48 \`
Updated .compute 2020-03-27 18:18:18 +03:00			`--train_cudnn \`
Default training setup for new cluster 2018-09-04 19:49:44 +03:00			`--n_hidden 2048 \`
			`--learning_rate 0.0001 \`
Updated .compute 2020-03-27 18:18:18 +03:00			`--dropout_rate 0.40 \`
			`--epochs 150 \`
			`--noearly_stop \`
			`--feature_cache "../tmp/feature.cache" \`
Default training setup for new cluster 2018-09-04 19:49:44 +03:00			`--checkpoint_dir "../keep" \`
Centralize WER report code into evaluate.py, call it from DeepSpeech.py 2018-11-08 23:24:36 +03:00			`--summary_dir "../keep/summaries"`