Add files via upload
This commit is contained in:
Родитель
bb9eda12c0
Коммит
295769cbf7
Разница между файлами не показана из-за своего большого размера
Загрузить разницу
|
@ -0,0 +1,137 @@
|
|||
# Configuration for generating Noisy Speech Dataset
|
||||
|
||||
# - sampling_rate: Specify the sampling rate. Default is 16 kHz
|
||||
# - audioformat: Audio file format/pattern, e.g. *.wav (default is .wav)
|
||||
# - audio_length: Minimum length, in seconds, of each audio clip (noisy and clean speech) that will be generated by augmenting utterances.
|
||||
# - silence_length: Duration of silence introduced between clean speech utterances.
|
||||
# - total_hours: Total number of hours of data required. Units are in hours.
|
||||
# - snr_lower: Lower bound for SNR required (default: 0 dB)
|
||||
# - snr_upper: Upper bound for SNR required (default: 40 dB)
|
||||
# - target_level_lower: Lower bound for the target audio level before audiowrite (default: -35 dB)
|
||||
# - target_level_upper: Upper bound for the target audio level before audiowrite (default: -15 dB)
|
||||
# - total_snrlevels: Number of SNR levels required (default: 5, which means there are 5 levels between snr_lower and snr_upper)
|
||||
# - clean_activity_threshold: Activity threshold for clean speech
|
||||
# - noise_activity_threshold: Activity threshold for noise
|
||||
# - fileindex_start: Starting file ID that will be used in filenames
|
||||
# - fileindex_end: Last file ID that will be used in filenames
|
||||
# - is_test_set: Set it to True if it is the test set, else False for the training set
|
||||
# - noise_dir: Specify the directory path to all noise files
|
||||
# - speech_dir: Specify the directory path to all clean speech files
|
||||
# - noisy_destination: Specify path to the destination directory to store noisy speech
|
||||
# - clean_destination: Specify path to the destination directory to store clean speech
|
||||
# - noise_destination: Specify path to the destination directory to store noise
|
||||
# - log_dir: Specify path to the directory to store all the log files
|
||||
|
||||
# Configuration for unit tests
|
||||
# - snr_test: Set to True if SNR test is required, else False
|
||||
# - norm_test: Set to True if Normalization test is required, else False
|
||||
# - sampling_rate_test: Set to True if Sampling Rate test is required, else False
|
||||
# - clipping_test: Set to True if Clipping test is required, else False
|
||||
# - unit_tests_log_dir: Specify path to the directory where you want to store logs
|
||||
|
||||
[noisy_speech]
|
||||
|
||||
sampling_rate: 48000
|
||||
audioformat: *.wav
|
||||
audio_length: 30
|
||||
# 15, 12, 30
|
||||
silence_length: 0.2
|
||||
total_hours: 1000
|
||||
# 1000
|
||||
#200
|
||||
# 2.5, 500, 100
|
||||
snr_lower: -5
|
||||
#-5, 0
|
||||
snr_upper: 20
|
||||
# 25, 40
|
||||
# NOTE(review): not described in the header above; presumably draws the SNR at random between snr_lower and snr_upper - confirm against the consuming script
randomize_snr: True
|
||||
target_level_lower: -35
|
||||
target_level_upper: -15
|
||||
total_snrlevels: 31
|
||||
# 5
|
||||
clean_activity_threshold: 0.0
|
||||
noise_activity_threshold: 0.2
|
||||
fileindex_start: None
|
||||
fileindex_end: None
|
||||
is_test_set: False
|
||||
# True, False
|
||||
|
||||
noise_dir: /mnt/f/4th_DNSChallenge/ICASSP_2022/DNS-Challenge/datasets/noise
|
||||
#/mnt/f/4th_DNSChallenge/INTERSPEECH_2021/DNS-Challenge/datasets_fullband/noise
|
||||
#F:\4th_DNSChallenge\INTERSPEECH_2021\DNS-Challenge\datasets_fullband\noise
|
||||
#datasets\pdns_training_set\noise
|
||||
#\test_set2\Test_Noise
|
||||
# datasets\noise
|
||||
# \datasets\noise
|
||||
|
||||
speech_dir: /mnt/f/4th_DNSChallenge/ICASSP_2022/DNS-Challenge/datasets/clean
|
||||
# D:\kanhawin_git\primary_speakers_VCTK_16k_for_synthesizer
|
||||
# datasets\test_set2\Singing_Voice\wav_16k
|
||||
# Directory with secondary-speaker clean speech
|
||||
speech_dir2: /mnt/f/4th_DNSChallenge/ICASSP_2022/DNS-Challenge/datasets/clean
|
||||
#D:\kanhawin_git\secondary_speakers_voxCeleb2_16k
|
||||
# datasets\test_set2\Singing_Voice\wav_16k
|
||||
|
||||
spkid_csv: /mnt/f/4th_DNSChallenge/ICASSP_2022/DNS-Challenge/datasets/filelists/complete_ps_split.csv
|
||||
#/mnt/f/4th_DNSChallenge/ICASSP_2022/DNS-Challenge/datasets/filelists/vctk_spkid.csv
|
||||
# datasets\clean
|
||||
noise_types_excluded: None
|
||||
|
||||
rir_dir: /mnt/f/4th_DNSChallenge/ICASSP_2022/DNS-Challenge/datasets/pdns_training_set/impulse_responses
|
||||
#/mnt/f/4th_DNSChallenge/ICASSP_2022/DNS-Challenge/datasets/impulse_responses
|
||||
# F:\4th_DNSChallenge\ICASSP_2022\DNS-Challenge\datasets\impulse_responses
|
||||
|
||||
# \datasets\clean
|
||||
noisy_destination: /mnt/f/4th_DNSChallenge/ICASSP_2022/DNS-Challenge/datasets/pdns_training_set/mixed/noisy
|
||||
# datasets/training_data/noisy
|
||||
# datasets\test_set2\synthetic_personalizeddns\noisy
|
||||
#training_set2_onlyrealrir\noisy
|
||||
#\noisy
|
||||
clean_destination: /mnt/f/4th_DNSChallenge/ICASSP_2022/DNS-Challenge/datasets/pdns_training_set/mixed/clean
|
||||
#datasets\test_set2\synthetic_personalizeddns\clean
|
||||
# training_set2_onlyrealrir\clean
|
||||
# \clean
|
||||
noise_destination: /mnt/f/4th_DNSChallenge/ICASSP_2022/DNS-Challenge/datasets/pdns_training_set/mixed/noise
|
||||
# datasets/training_data/noise
|
||||
#datasets\test_set2\synthetic_personalizeddns\noise
|
||||
#training_set2_onlyrealrir\noise
|
||||
# \noise
|
||||
log_dir: logs
|
||||
# \logs
|
||||
|
||||
# Config: add singing voice to clean speech
|
||||
# Forward slashes: a backslash is not a path separator on POSIX systems (the other data paths in this file are /mnt/... style); forward slashes also work on Windows
clean_singing: datasets/clean_singing/VocalSet11/FULL
|
||||
singing_choice: 3
|
||||
# 1 for only male, 2 for only female, 3 (default) for both male and female
|
||||
|
||||
# Config: add reverb to clean speech
|
||||
rir_choice: 1
|
||||
# 1 for only real rir, 2 for only synthetic rir, 3 (default) use both real and synthetic
|
||||
lower_t60: 0.3
|
||||
# lower bound of t60 range in seconds
|
||||
upper_t60: 1.3
|
||||
# upper bound of t60 range in seconds
|
||||
# CSV paths use forward slashes so they resolve on POSIX systems as well as on Windows
rir_table_csv: datasets/acoustic_params/RIR_table_simple.csv
|
||||
clean_speech_t60_csv: datasets/acoustic_params/cleanspeech_table_t60_c50.csv
|
||||
# percent_for_adding_reverb=0.5 # percentage of clean speech convolved with RIR
|
||||
|
||||
# pdns testsets
|
||||
# primary_data: D:\kanhawin_git\primary_speakers_VCTK_16k
|
||||
#'D:\PersonalizedDNS_dataset\synthetic_primary'
|
||||
# secondary_data='D:\kanhawin_git\secondary_speakers_voxCeleb2_16k'
|
||||
#'D:\PersonalizedDNS_dataset\synthetic_secondary'
|
||||
# noise_data= datasets\test_set2\synthetic\noise
|
||||
# pdns_testset_clean= datasets\test_set2\pdns\clean
|
||||
# pdns_testset_noisy= datasets\test_set2\pdns\noisy
|
||||
|
||||
# adaptation_data_seconds=120
|
||||
# num_primary_spk=100
|
||||
# num_clips=600
|
||||
|
||||
# Unit tests config
|
||||
snr_test: True
|
||||
norm_test: True
|
||||
# ':' delimiter, matching every other key in this file
sampling_rate_test: True
|
||||
clipping_test: True
|
||||
|
||||
unit_tests_log_dir: unittests_logs
|
Загрузка…
Ссылка в новой задаче