update script for unispeech sat finetune and inference

This commit is contained in:
cywang 2021-10-25 06:49:05 +00:00
Родитель 94823d0b62
Коммит ec4fc4e8a4
2 изменённых файлов: 23 добавлений и 0 удалений

Просмотреть файл

@ -0,0 +1,11 @@
#:: Copyright (c) Microsoft Corporation.
#:: Licensed under the MIT License.
model_path=MODEL_PATH
train_subset=train_clean_100
valid_subset=dev_other
mkdir -p ${model_path}
python train.py --distributed-world-size 8 --distributed-port 0 --nprocs-per-node 8 MANIFEST_PATH --save-dir ${model_path} --post-process letter --train-subset ${train_subset} --valid-subset ${valid_subset} --no-epoch-checkpoints --best-checkpoint-metric wer --num-workers 4 --max-update 80000 --sentence-avg --task hubert_pretraining --fine-tuning --single-target --arch hubert_ctc --w2v-path PRETRAINED_PATH/UniSpeech-SAT-Base.pt --labels '["ltr"]' --apply-mask --mask-selection static --mask-other 0 --mask-length 10 --mask-prob 0.65 --layerdrop 0.1 --mask-channel-selection static --mask-channel-other 0 --mask-channel-length 64 --mask-channel-prob 0.5 --zero-infinity --feature-grad-mult 0 --freeze-finetune-updates 0 --optimizer adam --adam-betas '(0.9, 0.98)' --adam-eps 1e-08 --lr 0.00003 --lr-scheduler tri_stage --warmup-steps 8000 --hold-steps 32000 --decay-steps 40000 --final-lr-scale 0.05 --final-dropout 0.1 --dropout 0.1 --activation-dropout 0.1 --criterion ctc --attention-dropout 0.1 --dropout-input 0.1 --max-tokens 3200000 --seed 2337 --log-format json --log-interval 200 --ddp-backend c10d --fp16 --update-freq 1 --keep-interval-updates 1 --find-unused-parameters

Просмотреть файл

@ -0,0 +1,12 @@
#:: Copyright (c) Microsoft Corporation.
#:: Licensed under the MIT License.
model_path=MODEL_PATH
gen_subset=test_other
result_path=${model_path}/decode_ctc/${gen_subset}
mkdir -p ${result_path}
export PYTHONENCODING=UTF-8
python examples/speech_recognition/infer.py DATA_PATHmanifest/resource/ --task audio_pretraining --nbest 1 --path ${model_path}/checkpoint_best.pt --gen-subset ${gen_subset} --results-path ${result_path} --w2l-decoder viterbi --word-score -1 --sil-weight 0 --criterion ctc --max-tokens 1100000 --dict-path DICT_PATH --post-process letter --quiet