#!/bin/bash
#
# Job script: prepares a Python virtual environment, installs this project
# into it, and then launches a DeepSpeech.py training run.
#
# Environment:
#   SHARED_DIR  base directory; dataset paths are derived from
#               "${SHARED_DIR}/data".

# -x: trace every command as it runs; -e: abort on the first failing command.
set -xe

# System packages: the venv module for python3, and the Opus runtime library.
apt-get install -y python3-venv libopus0

# Create the virtual environment and activate it for the rest of the script.
python3 -m venv /tmp/venv
source /tmp/venv/bin/activate

# Upgrade the packaging tools first, then install the project from the
# current working directory.
pip install -U setuptools wheel pip
pip install .

# Swap the plain tensorflow package for the pinned GPU build.
# NOTE(review): presumably `pip install .` pulls in the CPU-only tensorflow
# as a dependency -- confirm against the project's setup.py.
pip uninstall -y tensorflow
pip install tensorflow-gpu==1.14

# Make sure the summaries directory exists before training starts. It is
# later passed as --summary_dir; its parent, ../keep, is used as
# --checkpoint_dir.
mkdir -p ../keep/summaries

# Root of all datasets, taken from the SHARED_DIR environment variable.
data="${SHARED_DIR}/data"

# Path *prefixes*: the training command appends suffixes such as
# "-train.sdb" or "-dev-clean.sdb" directly to these values.
fis="${data}/LDC/fisher"
swb="${data}/LDC/LDC97S62/swb"
lbs="${data}/OpenSLR/LibriSpeech/librivox"

# Directories: the training command appends "/<name>.sdb" to these values.
cv="${data}/mozilla/CommonVoice/en_1087h_2019-06-12/clips"
npr="${data}/NPR/WAMU/sets/v0.3"

# Fail fast if SHARED_DIR is unset or empty: every dataset path above is
# derived from it, and without it they would silently resolve under /data.
: "${SHARED_DIR:?SHARED_DIR must be set; the dataset paths are derived from it}"

# Training sets, one per line for readability.
train_sets=(
  "${npr}/best-train.sdb"
  "${npr}/good-train.sdb"
  "${cv}/train.sdb"
  "${fis}-train.sdb"
  "${swb}-train.sdb"
  "${lbs}-train-clean-100.sdb"
  "${lbs}-train-clean-360.sdb"
  "${lbs}-train-other-500.sdb"
)

# --train_files takes a single comma-separated argument. "${array[*]}" joins
# the elements with the first character of IFS, which is set to "," only
# inside the command-substitution subshell.
train_files=$(IFS=,; printf '%s' "${train_sets[*]}")

# Launch training. -u keeps Python's stdout/stderr unbuffered so log output
# appears immediately. Checkpoints go to ../keep and summaries to
# ../keep/summaries.
# NOTE(review): the directory ../tmp used by --feature_cache is not created
# by this script -- confirm that the job environment provides it.
python -u DeepSpeech.py \
  --train_files "${train_files}" \
  --dev_files "${lbs}-dev-clean.sdb" \
  --test_files "${lbs}-test-clean.sdb" \
  --train_batch_size 24 \
  --dev_batch_size 48 \
  --test_batch_size 48 \
  --train_cudnn \
  --n_hidden 2048 \
  --learning_rate 0.0001 \
  --dropout_rate 0.40 \
  --epochs 150 \
  --noearly_stop \
  --feature_cache "../tmp/feature.cache" \
  --checkpoint_dir "../keep" \
  --summary_dir "../keep/summaries"