Add files via upload

2021-12-01 21:08:08 -08:00 · 2021-12-01 21:08:08 -08:00 · 295769cbf7
--- a/pdns_noisyspeech_synthesizer_singleprocess.py
+++ b/pdns_noisyspeech_synthesizer_singleprocess.py
--- a/pdns_synthesizer_icassp2022.cfg
+++ b/pdns_synthesizer_icassp2022.cfg
@ -0,0 +1,137 @@
 # Configuration for generating Noisy Speech Dataset
 # - sampling_rate: Specify the sampling rate. Default is 16 kHz
 # - audioformat: default is .wav
 # - audio_length: Minimum Length of each audio clip (noisy and clean speech) in seconds that will be generated by augmenting utterances. 
 # - silence_length: Duration of silence introduced between clean speech utterances.
 # - total_hours: Total number of hours of data required. Units are in hours. 
 # - snr_lower: Lower bound for SNR required (default: 0 dB)
 # - snr_upper: Upper bound for SNR required (default: 40 dB)
 # - target_level_lower: Lower bound for the target audio level before audiowrite (default: -35 dB)
 # - target_level_upper: Upper bound for the target audio level before audiowrite (default: -15 dB)
 # - total_snrlevels: Number of SNR levels required (default: 5, which means there are 5 levels between snr_lower and snr_upper)
 # - clean_activity_threshold: Activity threshold for clean speech
 # - noise_activity_threshold: Activity threshold for noise
 # - fileindex_start: Starting file ID that will be used in filenames
 # - fileindex_end: Last file ID that will be used in filenames
 # - is_test_set: Set it to True if it is the test set, else False for the training set
 # - noise_dir: Specify the directory path to all noise files
 # - Speech_dir: Specify the directory path to all clean speech files
 # - noisy_destination: Specify path to the destination directory to store noisy speech
 # - clean_destination: Specify path to the destination directory to store clean speech
 # - noise_destination: Specify path to the destination directory to store noise speech
 # - log_dir: Specify path to the directory to store all the log files
 # Configuration for unit tests
 # - snr_test: Set to True if SNR test is required, else False
 # - norm_test: Set to True if Normalization test is required, else False
 # - sampling_rate_test: Set to True if Sampling Rate test is required, else False
 # - clipping_test: Set to True if Clipping test is required, else False
 # - unit_tests_log_dir: Specify path to the directory where you want to store logs
 [noisy_speech]
 sampling_rate: 48000
 audioformat: *.wav
 audio_length: 30
 # 15, 12, 30 
 silence_length: 0.2
 total_hours: 1000
 # 1000
 #200
 # 2.5, 500, 100
 snr_lower: -5
 #-5, 0
 snr_upper: 20
 # 25, 40
 randomize_snr: True
 target_level_lower: -35
 target_level_upper: -15
 total_snrlevels: 31 
 # 5 
 clean_activity_threshold: 0.0
 noise_activity_threshold: 0.2
 fileindex_start: None
 fileindex_end: None
 is_test_set: False
 # True, False
 noise_dir: /mnt/f/4th_DNSChallenge/ICASSP_2022/DNS-Challenge/datasets/noise
 #/mnt/f/4th_DNSChallenge/INTERSPEECH_2021/DNS-Challenge/datasets_fullband/noise
 #F:\4th_DNSChallenge\INTERSPEECH_2021\DNS-Challenge\datasets_fullband\noise
 #datasets\pdns_training_set\noise
 #\test_set2\Test_Noise
 # datasets\noise 
 # \datasets\noise
 speech_dir: /mnt/f/4th_DNSChallenge/ICASSP_2022/DNS-Challenge/datasets/clean
 # D:\kanhawin_git\primary_speakers_VCTK_16k_for_synthesizer
 # datasets\test_set2\Singing_Voice\wav_16k
 # dir with secondary speaker clean speech
 speech_dir2: /mnt/f/4th_DNSChallenge/ICASSP_2022/DNS-Challenge/datasets/clean
 #D:\kanhawin_git\secondary_speakers_voxCeleb2_16k
 # datasets\test_set2\Singing_Voice\wav_16k
 spkid_csv: /mnt/f/4th_DNSChallenge/ICASSP_2022/DNS-Challenge/datasets/filelists/complete_ps_split.csv
 #/mnt/f/4th_DNSChallenge/ICASSP_2022/DNS-Challenge/datasets/filelists/vctk_spkid.csv
 # datasets\clean 
 noise_types_excluded: None
 rir_dir: /mnt/f/4th_DNSChallenge/ICASSP_2022/DNS-Challenge/datasets/pdns_training_set/impulse_responses
 #/mnt/f/4th_DNSChallenge/ICASSP_2022/DNS-Challenge/datasets/impulse_responses
 # F:\4th_DNSChallenge\ICASSP_2022\DNS-Challenge\datasets\impulse_responses
 # \datasets\clean
 noisy_destination: /mnt/f/4th_DNSChallenge/ICASSP_2022/DNS-Challenge/datasets/pdns_training_set/mixed/noisy
 # datasets/training_data/noisy
 # datasets\test_set2\synthetic_personalizeddns\noisy
 #training_set2_onlyrealrir\noisy 
 #\noisy
 clean_destination: /mnt/f/4th_DNSChallenge/ICASSP_2022/DNS-Challenge/datasets/pdns_training_set/mixed/clean
 #datasets\test_set2\synthetic_personalizeddns\clean
 # training_set2_onlyrealrir\clean 
 # \clean
 noise_destination: /mnt/f/4th_DNSChallenge/ICASSP_2022/DNS-Challenge/datasets/pdns_training_set/mixed/noise
 # datasets/training_data/noise
 #datasets\test_set2\synthetic_personalizeddns\noise
 #training_set2_onlyrealrir\noise 
 # \noise
 log_dir: logs 
 # \logs
 # Config: add singing voice to clean speech
 clean_singing: datasets\clean_singing\VocalSet11\FULL
 singing_choice: 3
 # 1 for only male, 2 for only female, 3 (default) for both male and female 
 # Config: add reverb to clean speech
 rir_choice: 1
 # 1 for only real rir, 2 for only synthetic rir, 3 (default) use both real and synthetic
 lower_t60: 0.3 
 # lower bound of t60 range in seconds
 upper_t60: 1.3 
 # upper bound of t60 range in seconds
 rir_table_csv: datasets\acoustic_params\RIR_table_simple.csv
 clean_speech_t60_csv: datasets\acoustic_params\cleanspeech_table_t60_c50.csv
 # percent_for_adding_reverb=0.5 # percentage of clean speech convolved with RIR
 # pdns testsets
 # primary_data: D:\kanhawin_git\primary_speakers_VCTK_16k
 #'D:\PersonalizedDNS_dataset\synthetic_primary'
 # secondary_data='D:\kanhawin_git\secondary_speakers_voxCeleb2_16k'
 #'D:\PersonalizedDNS_dataset\synthetic_secondary'
 # noise_data= datasets\test_set2\synthetic\noise
 # pdns_testset_clean= datasets\test_set2\pdns\clean
 # pdns_testset_noisy= datasets\test_set2\pdns\noisy
 # adaptation_data_seconds=120
 # num_primary_spk=100
 # num_clips=600
 # Unit tests config
 snr_test: True
 norm_test: True
 sampling_rate_test = True
 clipping_test = True
 unit_tests_log_dir: unittests_logs