Add files via upload
This commit is contained in:
Родитель
bb9eda12c0
Коммит
295769cbf7
Разница между файлами не показана из-за своего большого размера
Загрузить разницу
|
@ -0,0 +1,137 @@
|
||||||
|
# Configuration for generating Noisy Speech Dataset
|
||||||
|
|
||||||
|
# - sampling_rate: Specify the sampling rate. Default is 16 kHz
|
||||||
|
# - audioformat: default is .wav
|
||||||
|
# - audio_length: Minimum Length of each audio clip (noisy and clean speech) in seconds that will be generated by augmenting utterances.
|
||||||
|
# - silence_length: Duration of silence introduced between clean speech utterances.
|
||||||
|
# - total_hours: Total number of hours of data required. Units are in hours.
|
||||||
|
# - snr_lower: Lower bound for SNR required (default: 0 dB)
|
||||||
|
# - snr_upper: Upper bound for SNR required (default: 40 dB)
|
||||||
|
# - target_level_lower: Lower bound for the target audio level before audiowrite (default: -35 dB)
|
||||||
|
# - target_level_upper: Upper bound for the target audio level before audiowrite (default: -15 dB)
|
||||||
|
# - total_snrlevels: Number of SNR levels required (default: 5, which means there are 5 levels between snr_lower and snr_upper)
|
||||||
|
# - clean_activity_threshold: Activity threshold for clean speech
|
||||||
|
# - noise_activity_threshold: Activity threshold for noise
|
||||||
|
# - fileindex_start: Starting file ID that will be used in filenames
|
||||||
|
# - fileindex_end: Last file ID that will be used in filenames
|
||||||
|
# - is_test_set: Set it to True if it is the test set, else False for the training set
|
||||||
|
# - noise_dir: Specify the directory path to all noise files
|
||||||
|
# - Speech_dir: Specify the directory path to all clean speech files
|
||||||
|
# - noisy_destination: Specify path to the destination directory to store noisy speech
|
||||||
|
# - clean_destination: Specify path to the destination directory to store clean speech
|
||||||
|
# - noise_destination: Specify path to the destination directory to store noise speech
|
||||||
|
# - log_dir: Specify path to the directory to store all the log files
|
||||||
|
|
||||||
|
# Configuration for unit tests
|
||||||
|
# - snr_test: Set to True if SNR test is required, else False
|
||||||
|
# - norm_test: Set to True if Normalization test is required, else False
|
||||||
|
# - sampling_rate_test: Set to True if Sampling Rate test is required, else False
|
||||||
|
# - clipping_test: Set to True if Clipping test is required, else False
|
||||||
|
# - unit_tests_log_dir: Specify path to the directory where you want to store logs
|
||||||
|
|
||||||
|
[noisy_speech]
|
||||||
|
|
||||||
|
sampling_rate: 48000
|
||||||
|
audioformat: *.wav
|
||||||
|
audio_length: 30
|
||||||
|
# 15, 12, 30
|
||||||
|
silence_length: 0.2
|
||||||
|
total_hours: 1000
|
||||||
|
# 1000
|
||||||
|
#200
|
||||||
|
# 2.5, 500, 100
|
||||||
|
snr_lower: -5
|
||||||
|
#-5, 0
|
||||||
|
snr_upper: 20
|
||||||
|
# 25, 40
|
||||||
|
randomize_snr: True
|
||||||
|
target_level_lower: -35
|
||||||
|
target_level_upper: -15
|
||||||
|
total_snrlevels: 31
|
||||||
|
# 5
|
||||||
|
clean_activity_threshold: 0.0
|
||||||
|
noise_activity_threshold: 0.2
|
||||||
|
fileindex_start: None
|
||||||
|
fileindex_end: None
|
||||||
|
is_test_set: False
|
||||||
|
# True, False
|
||||||
|
|
||||||
|
noise_dir: /mnt/f/4th_DNSChallenge/ICASSP_2022/DNS-Challenge/datasets/noise
|
||||||
|
#/mnt/f/4th_DNSChallenge/INTERSPEECH_2021/DNS-Challenge/datasets_fullband/noise
|
||||||
|
#F:\4th_DNSChallenge\INTERSPEECH_2021\DNS-Challenge\datasets_fullband\noise
|
||||||
|
#datasets\pdns_training_set\noise
|
||||||
|
#\test_set2\Test_Noise
|
||||||
|
# datasets\noise
|
||||||
|
# \datasets\noise
|
||||||
|
|
||||||
|
speech_dir: /mnt/f/4th_DNSChallenge/ICASSP_2022/DNS-Challenge/datasets/clean
|
||||||
|
# D:\kanhawin_git\primary_speakers_VCTK_16k_for_synthesizer
|
||||||
|
# datasets\test_set2\Singing_Voice\wav_16k
|
||||||
|
# dir with secondary speaker clean speech
|
||||||
|
speech_dir2: /mnt/f/4th_DNSChallenge/ICASSP_2022/DNS-Challenge/datasets/clean
|
||||||
|
#D:\kanhawin_git\secondary_speakers_voxCeleb2_16k
|
||||||
|
# datasets\test_set2\Singing_Voice\wav_16k
|
||||||
|
|
||||||
|
spkid_csv: /mnt/f/4th_DNSChallenge/ICASSP_2022/DNS-Challenge/datasets/filelists/complete_ps_split.csv
|
||||||
|
#/mnt/f/4th_DNSChallenge/ICASSP_2022/DNS-Challenge/datasets/filelists/vctk_spkid.csv
|
||||||
|
# datasets\clean
|
||||||
|
noise_types_excluded: None
|
||||||
|
|
||||||
|
rir_dir: /mnt/f/4th_DNSChallenge/ICASSP_2022/DNS-Challenge/datasets/pdns_training_set/impulse_responses
|
||||||
|
#/mnt/f/4th_DNSChallenge/ICASSP_2022/DNS-Challenge/datasets/impulse_responses
|
||||||
|
# F:\4th_DNSChallenge\ICASSP_2022\DNS-Challenge\datasets\impulse_responses
|
||||||
|
|
||||||
|
# \datasets\clean
|
||||||
|
noisy_destination: /mnt/f/4th_DNSChallenge/ICASSP_2022/DNS-Challenge/datasets/pdns_training_set/mixed/noisy
|
||||||
|
# datasets/training_data/noisy
|
||||||
|
# datasets\test_set2\synthetic_personalizeddns\noisy
|
||||||
|
#training_set2_onlyrealrir\noisy
|
||||||
|
#\noisy
|
||||||
|
clean_destination: /mnt/f/4th_DNSChallenge/ICASSP_2022/DNS-Challenge/datasets/pdns_training_set/mixed/clean
|
||||||
|
#datasets\test_set2\synthetic_personalizeddns\clean
|
||||||
|
# training_set2_onlyrealrir\clean
|
||||||
|
# \clean
|
||||||
|
noise_destination: /mnt/f/4th_DNSChallenge/ICASSP_2022/DNS-Challenge/datasets/pdns_training_set/mixed/noise
|
||||||
|
# datasets/training_data/noise
|
||||||
|
#datasets\test_set2\synthetic_personalizeddns\noise
|
||||||
|
#training_set2_onlyrealrir\noise
|
||||||
|
# \noise
|
||||||
|
log_dir: logs
|
||||||
|
# \logs
|
||||||
|
|
||||||
|
# Config: add singing voice to clean speech
|
||||||
|
clean_singing: datasets\clean_singing\VocalSet11\FULL
|
||||||
|
singing_choice: 3
|
||||||
|
# 1 for only male, 2 for only female, 3 (default) for both male and female
|
||||||
|
|
||||||
|
# Config: add reverb to clean speech
|
||||||
|
rir_choice: 1
|
||||||
|
# 1 for only real rir, 2 for only synthetic rir, 3 (default) use both real and synthetic
|
||||||
|
lower_t60: 0.3
|
||||||
|
# lower bound of t60 range in seconds
|
||||||
|
upper_t60: 1.3
|
||||||
|
# upper bound of t60 range in seconds
|
||||||
|
rir_table_csv: datasets\acoustic_params\RIR_table_simple.csv
|
||||||
|
clean_speech_t60_csv: datasets\acoustic_params\cleanspeech_table_t60_c50.csv
|
||||||
|
# percent_for_adding_reverb=0.5 # percentage of clean speech convolved with RIR
|
||||||
|
|
||||||
|
# pdns testsets
|
||||||
|
# primary_data: D:\kanhawin_git\primary_speakers_VCTK_16k
|
||||||
|
#'D:\PersonalizedDNS_dataset\synthetic_primary'
|
||||||
|
# secondary_data='D:\kanhawin_git\secondary_speakers_voxCeleb2_16k'
|
||||||
|
#'D:\PersonalizedDNS_dataset\synthetic_secondary'
|
||||||
|
# noise_data= datasets\test_set2\synthetic\noise
|
||||||
|
# pdns_testset_clean= datasets\test_set2\pdns\clean
|
||||||
|
# pdns_testset_noisy= datasets\test_set2\pdns\noisy
|
||||||
|
|
||||||
|
# adaptation_data_seconds=120
|
||||||
|
# num_primary_spk=100
|
||||||
|
# num_clips=600
|
||||||
|
|
||||||
|
# Unit tests config
|
||||||
|
snr_test: True
|
||||||
|
norm_test: True
|
||||||
|
sampling_rate_test = True
|
||||||
|
clipping_test = True
|
||||||
|
|
||||||
|
unit_tests_log_dir: unittests_logs
|
Загрузка…
Ссылка в новой задаче