From b5e1e136858183e83d20d679f29ce2499a7354ef Mon Sep 17 00:00:00 2001 From: Hari Dubey Date: Tue, 6 Dec 2022 19:50:39 +0000 Subject: [PATCH] intial changes for V5 challenge --- .../Track1_Headset/embeddings/README.txt | 0 .../Track1_Headset/transcripts/README.txt | 0 .../Track2_Speakerphone/embeddings/README.txt | 0 .../transcripts/README.txt | 0 ...s1 => download-dns-challenge-5-headset.ps1 | 0 ....sh => download-dns-challenge-5-headset.sh | 0 download-dns-challenge-5-speakerphone.ps1 | 136 +++++++++ download-dns-challenge-5-speakerphone.sh | 134 +++++++++ ...022.cfg => pdns_synthesizer_icassp2023.cfg | 274 +++++++++--------- 9 files changed, 407 insertions(+), 137 deletions(-) create mode 100644 V5_dev_testset/Track1_Headset/embeddings/README.txt create mode 100644 V5_dev_testset/Track1_Headset/transcripts/README.txt create mode 100644 V5_dev_testset/Track2_Speakerphone/embeddings/README.txt create mode 100644 V5_dev_testset/Track2_Speakerphone/transcripts/README.txt rename download-dns-challenge-4-pdns.ps1 => download-dns-challenge-5-headset.ps1 (100%) rename download-dns-challenge-4-pdns.sh => download-dns-challenge-5-headset.sh (100%) create mode 100644 download-dns-challenge-5-speakerphone.ps1 create mode 100644 download-dns-challenge-5-speakerphone.sh rename pdns_synthesizer_icassp2022.cfg => pdns_synthesizer_icassp2023.cfg (97%) diff --git a/V5_dev_testset/Track1_Headset/embeddings/README.txt b/V5_dev_testset/Track1_Headset/embeddings/README.txt new file mode 100644 index 00000000000..e69de29bb2d diff --git a/V5_dev_testset/Track1_Headset/transcripts/README.txt b/V5_dev_testset/Track1_Headset/transcripts/README.txt new file mode 100644 index 00000000000..e69de29bb2d diff --git a/V5_dev_testset/Track2_Speakerphone/embeddings/README.txt b/V5_dev_testset/Track2_Speakerphone/embeddings/README.txt new file mode 100644 index 00000000000..e69de29bb2d diff --git a/V5_dev_testset/Track2_Speakerphone/transcripts/README.txt b/V5_dev_testset/Track2_Speakerphone/transcripts/README.txt new file mode 100644 index 00000000000..e69de29bb2d diff --git a/download-dns-challenge-4-pdns.ps1 b/download-dns-challenge-5-headset.ps1 similarity index 100% rename from download-dns-challenge-4-pdns.ps1 rename to download-dns-challenge-5-headset.ps1 diff --git a/download-dns-challenge-4-pdns.sh b/download-dns-challenge-5-headset.sh similarity index 100% rename from download-dns-challenge-4-pdns.sh rename to download-dns-challenge-5-headset.sh diff --git a/download-dns-challenge-5-speakerphone.ps1 b/download-dns-challenge-5-speakerphone.ps1 new file mode 100644 index 00000000000..6a6033ac182 --- /dev/null +++ b/download-dns-challenge-5-speakerphone.ps1 @@ -0,0 +1,136 @@ +#!/usr/bin/bash + +# ***** Datasets for ICASSP 2022 DNS Challenge 4 - Personalized DNS Track ***** + +# NOTE: Before downloading, make sure you have enough space +# on your local storage! + +# In all, you will need about 380TB to store the UNPACKED data. +# Archived, the same data takes about 200GB total. + +# Please comment out the files you don't need before launching +# the script. + +# NOTE: By default, the script *DOES NOT* DOWNLOAD ANY FILES! +# Please scroll down and edit this script to pick the +# downloading method that works best for you. + +# ------------------------------------------------------------- +# The directory structure of the unpacked data is: + +# . 362G +# +-- datasets_fullband 64G +# | +-- impulse_responses 5.9G +# | \-- noise_fullband 58G +# +-- pdns_training_set 294G +# | +-- enrollment_embeddings 115M +# | +-- enrollment_wav 42G +# | +-- raw/clean 252G +# | +-- english 168G +# | +-- french 2.1G +# | +-- german 53G +# | +-- italian 17G +# | +-- russian 6.8G +# | \-- spanish 5.4G +# \-- personalized_dev_testset 3.3G + +$BLOB_NAMES=@( + + "pdns_training_set/raw/pdns_training_set.raw.clean.english_000.tar.bz2", + "pdns_training_set/raw/pdns_training_set.raw.clean.english_001.tar.bz2", + "pdns_training_set/raw/pdns_training_set.raw.clean.english_002.tar.bz2", + "pdns_training_set/raw/pdns_training_set.raw.clean.english_003.tar.bz2", + "pdns_training_set/raw/pdns_training_set.raw.clean.english_004.tar.bz2", + "pdns_training_set/raw/pdns_training_set.raw.clean.english_005.tar.bz2", + "pdns_training_set/raw/pdns_training_set.raw.clean.english_006.tar.bz2", + "pdns_training_set/raw/pdns_training_set.raw.clean.english_007.tar.bz2", + "pdns_training_set/raw/pdns_training_set.raw.clean.english_008.tar.bz2", + "pdns_training_set/raw/pdns_training_set.raw.clean.english_009.tar.bz2", + "pdns_training_set/raw/pdns_training_set.raw.clean.english_010.tar.bz2", + "pdns_training_set/raw/pdns_training_set.raw.clean.english_011.tar.bz2", + "pdns_training_set/raw/pdns_training_set.raw.clean.english_012.tar.bz2", + "pdns_training_set/raw/pdns_training_set.raw.clean.english_013.tar.bz2", + "pdns_training_set/raw/pdns_training_set.raw.clean.english_014.tar.bz2", + "pdns_training_set/raw/pdns_training_set.raw.clean.english_015.tar.bz2", + "pdns_training_set/raw/pdns_training_set.raw.clean.english_016.tar.bz2", + "pdns_training_set/raw/pdns_training_set.raw.clean.english_017.tar.bz2", + "pdns_training_set/raw/pdns_training_set.raw.clean.english_018.tar.bz2", + "pdns_training_set/raw/pdns_training_set.raw.clean.english_019.tar.bz2", + "pdns_training_set/raw/pdns_training_set.raw.clean.english_020.tar.bz2", + "pdns_training_set/raw/pdns_training_set.raw.clean.french_000.tar.bz2", + "pdns_training_set/raw/pdns_training_set.raw.clean.german_000.tar.bz2", + "pdns_training_set/raw/pdns_training_set.raw.clean.german_001.tar.bz2", + "pdns_training_set/raw/pdns_training_set.raw.clean.german_002.tar.bz2", + "pdns_training_set/raw/pdns_training_set.raw.clean.german_003.tar.bz2", + "pdns_training_set/raw/pdns_training_set.raw.clean.german_004.tar.bz2", + "pdns_training_set/raw/pdns_training_set.raw.clean.german_005.tar.bz2", + "pdns_training_set/raw/pdns_training_set.raw.clean.german_006.tar.bz2", + "pdns_training_set/raw/pdns_training_set.raw.clean.german_007.tar.bz2", + "pdns_training_set/raw/pdns_training_set.raw.clean.german_008.tar.bz2", + "pdns_training_set/raw/pdns_training_set.raw.clean.italian_000.tar.bz2", + "pdns_training_set/raw/pdns_training_set.raw.clean.italian_001.tar.bz2", + "pdns_training_set/raw/pdns_training_set.raw.clean.italian_002.tar.bz2", + "pdns_training_set/raw/pdns_training_set.raw.clean.russian_000.tar.bz2", + "pdns_training_set/raw/pdns_training_set.raw.clean.spanish_000.tar.bz2", + "pdns_training_set/raw/pdns_training_set.raw.clean.spanish_001.tar.bz2", + "pdns_training_set/raw/pdns_training_set.raw.clean.spanish_002.tar.bz2", + + "pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.english_000.tar.bz2", + "pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.english_001.tar.bz2", + "pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.english_002.tar.bz2", + "pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.english_003.tar.bz2", + "pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.english_004.tar.bz2", + "pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.french_000.tar.bz2", + "pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.german_000.tar.bz2", + "pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.german_001.tar.bz2", + "pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.italian_000.tar.bz2", + "pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.russian_000.tar.bz2", + "pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.spanish_000.tar.bz2", + + "pdns_training_set/pdns_training_set.enrollment_embeddings_000.tar.bz2", + + "datasets_fullband/noise_fullband/datasets_fullband.noise_fullband.audioset_000.tar.bz2", + "datasets_fullband/noise_fullband/datasets_fullband.noise_fullband.audioset_001.tar.bz2", + "datasets_fullband/noise_fullband/datasets_fullband.noise_fullband.audioset_002.tar.bz2", + "datasets_fullband/noise_fullband/datasets_fullband.noise_fullband.audioset_003.tar.bz2", + "datasets_fullband/noise_fullband/datasets_fullband.noise_fullband.audioset_004.tar.bz2", + "datasets_fullband/noise_fullband/datasets_fullband.noise_fullband.audioset_005.tar.bz2", + "datasets_fullband/noise_fullband/datasets_fullband.noise_fullband.audioset_006.tar.bz2", + + "datasets_fullband/noise_fullband/datasets_fullband.noise_fullband.freesound_000.tar.bz2", + "datasets_fullband/noise_fullband/datasets_fullband.noise_fullband.freesound_001.tar.bz2", + + "datasets_fullband/datasets_fullband.impulse_responses_000.tar.bz2", + + "personalized_dev_testset/personalized_dev_testset.enrollment.tar.bz2", + "personalized_dev_testset/personalized_dev_testset.noisy_testclips.tar.bz2" +) + +############################################################### + +$AZURE_URL="https://dns4public.blob.core.windows.net/dns4archive" + +$OUTPUT_PATH="." + +mkdir -Force $OUTPUT_PATH/pdns_training_set/raw 2> $null +mkdir -Force $OUTPUT_PATH/pdns_training_set/enrollment_wav 2> $null +mkdir -Force $OUTPUT_PATH/datasets_fullband/noise_fullband 2> $null + +foreach ($BLOB in $BLOB_NAMES) { + + $URL="$AZURE_URL/$BLOB" + Write-Output "Download: $BLOB" + + # DRY RUN: print HTTP response and Content-Length + # WITHOUT downloading the files + curl -s -I "$URL" | head -n 2 + + # Actually download the files: UNCOMMENT when ready to download + # curl "$URL" -o "$OUTPUT_PATH/$BLOB" + + # Same as above, but using wget + # wget "$URL" -O "$OUTPUT_PATH/$BLOB" + + # Same, + unpack files on the fly + # curl "$URL" | tar -C "$OUTPUT_PATH" -f - -x -j +} diff --git a/download-dns-challenge-5-speakerphone.sh b/download-dns-challenge-5-speakerphone.sh new file mode 100644 index 00000000000..a346a471066 --- /dev/null +++ b/download-dns-challenge-5-speakerphone.sh @@ -0,0 +1,134 @@ +#!/usr/bin/bash + +# ***** Datasets for ICASSP 2022 DNS Challenge 4 - Personalized DNS Track ***** + +# NOTE: Before downloading, make sure you have enough space +# on your local storage! + +# In all, you will need about 380TB to store the UNPACKED data. +# Archived, the same data takes about 200GB total. + +# Please comment out the files you don't need before launching +# the script. + +# NOTE: By default, the script *DOES NOT* DOWNLOAD ANY FILES! +# Please scroll down and edit this script to pick the +# downloading method that works best for you. + +# ------------------------------------------------------------- +# The directory structure of the unpacked data is: + +# . 362G +# +-- datasets_fullband 64G +# | +-- impulse_responses 5.9G +# | \-- noise_fullband 58G +# +-- pdns_training_set 294G +# | +-- enrollment_embeddings 115M +# | +-- enrollment_wav 42G +# | +-- raw/clean 252G +# | +-- english 168G +# | +-- french 2.1G +# | +-- german 53G +# | +-- italian 17G +# | +-- russian 6.8G +# | \-- spanish 5.4G +# \-- personalized_dev_testset 3.3G + +BLOB_NAMES=( + + pdns_training_set/raw/pdns_training_set.raw.clean.english_000.tar.bz2 + pdns_training_set/raw/pdns_training_set.raw.clean.english_001.tar.bz2 + pdns_training_set/raw/pdns_training_set.raw.clean.english_002.tar.bz2 + pdns_training_set/raw/pdns_training_set.raw.clean.english_003.tar.bz2 + pdns_training_set/raw/pdns_training_set.raw.clean.english_004.tar.bz2 + pdns_training_set/raw/pdns_training_set.raw.clean.english_005.tar.bz2 + pdns_training_set/raw/pdns_training_set.raw.clean.english_006.tar.bz2 + pdns_training_set/raw/pdns_training_set.raw.clean.english_007.tar.bz2 + pdns_training_set/raw/pdns_training_set.raw.clean.english_008.tar.bz2 + pdns_training_set/raw/pdns_training_set.raw.clean.english_009.tar.bz2 + pdns_training_set/raw/pdns_training_set.raw.clean.english_010.tar.bz2 + pdns_training_set/raw/pdns_training_set.raw.clean.english_011.tar.bz2 + pdns_training_set/raw/pdns_training_set.raw.clean.english_012.tar.bz2 + pdns_training_set/raw/pdns_training_set.raw.clean.english_013.tar.bz2 + pdns_training_set/raw/pdns_training_set.raw.clean.english_014.tar.bz2 + pdns_training_set/raw/pdns_training_set.raw.clean.english_015.tar.bz2 + pdns_training_set/raw/pdns_training_set.raw.clean.english_016.tar.bz2 + pdns_training_set/raw/pdns_training_set.raw.clean.english_017.tar.bz2 + pdns_training_set/raw/pdns_training_set.raw.clean.english_018.tar.bz2 + pdns_training_set/raw/pdns_training_set.raw.clean.english_019.tar.bz2 + pdns_training_set/raw/pdns_training_set.raw.clean.english_020.tar.bz2 + pdns_training_set/raw/pdns_training_set.raw.clean.french_000.tar.bz2 + pdns_training_set/raw/pdns_training_set.raw.clean.german_000.tar.bz2 + pdns_training_set/raw/pdns_training_set.raw.clean.german_001.tar.bz2 + pdns_training_set/raw/pdns_training_set.raw.clean.german_002.tar.bz2 + pdns_training_set/raw/pdns_training_set.raw.clean.german_003.tar.bz2 + pdns_training_set/raw/pdns_training_set.raw.clean.german_004.tar.bz2 + pdns_training_set/raw/pdns_training_set.raw.clean.german_005.tar.bz2 + pdns_training_set/raw/pdns_training_set.raw.clean.german_006.tar.bz2 + pdns_training_set/raw/pdns_training_set.raw.clean.german_007.tar.bz2 + pdns_training_set/raw/pdns_training_set.raw.clean.german_008.tar.bz2 + pdns_training_set/raw/pdns_training_set.raw.clean.italian_000.tar.bz2 + pdns_training_set/raw/pdns_training_set.raw.clean.italian_001.tar.bz2 + pdns_training_set/raw/pdns_training_set.raw.clean.italian_002.tar.bz2 + pdns_training_set/raw/pdns_training_set.raw.clean.russian_000.tar.bz2 + pdns_training_set/raw/pdns_training_set.raw.clean.spanish_000.tar.bz2 + pdns_training_set/raw/pdns_training_set.raw.clean.spanish_001.tar.bz2 + pdns_training_set/raw/pdns_training_set.raw.clean.spanish_002.tar.bz2 + + pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.english_000.tar.bz2 + pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.english_001.tar.bz2 + pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.english_002.tar.bz2 + pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.english_003.tar.bz2 + pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.english_004.tar.bz2 + pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.french_000.tar.bz2 + pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.german_000.tar.bz2 + pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.german_001.tar.bz2 + pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.italian_000.tar.bz2 + pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.russian_000.tar.bz2 + pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.spanish_000.tar.bz2 + + pdns_training_set/pdns_training_set.enrollment_embeddings_000.tar.bz2 + + datasets_fullband/noise_fullband/datasets_fullband.noise_fullband.audioset_000.tar.bz2 + datasets_fullband/noise_fullband/datasets_fullband.noise_fullband.audioset_001.tar.bz2 + datasets_fullband/noise_fullband/datasets_fullband.noise_fullband.audioset_002.tar.bz2 + datasets_fullband/noise_fullband/datasets_fullband.noise_fullband.audioset_003.tar.bz2 + datasets_fullband/noise_fullband/datasets_fullband.noise_fullband.audioset_004.tar.bz2 + datasets_fullband/noise_fullband/datasets_fullband.noise_fullband.audioset_005.tar.bz2 + datasets_fullband/noise_fullband/datasets_fullband.noise_fullband.audioset_006.tar.bz2 + + datasets_fullband/noise_fullband/datasets_fullband.noise_fullband.freesound_000.tar.bz2 + datasets_fullband/noise_fullband/datasets_fullband.noise_fullband.freesound_001.tar.bz2 + + datasets_fullband/datasets_fullband.impulse_responses_000.tar.bz2 + + personalized_dev_testset/personalized_dev_testset.enrollment.tar.bz2 + personalized_dev_testset/personalized_dev_testset.noisy_testclips.tar.bz2 +) + +############################################################### + +AZURE_URL="https://dns4public.blob.core.windows.net/dns4archive" + +OUTPUT_PATH="." + +mkdir -p $OUTPUT_PATH/{pdns_training_set/{raw,enrollment_wav},datasets_fullband/noise_fullband} + +for BLOB in ${BLOB_NAMES[@]} +do + URL="$AZURE_URL/$BLOB" + echo "Download: $BLOB" + + # DRY RUN: print HTTP response and Content-Length + # WITHOUT downloading the files + curl -s -I "$URL" | head -n 2 + + # Actually download the files: UNCOMMENT when ready to download + # curl "$URL" -o "$OUTPUT_PATH/$BLOB" + + # Same as above, but using wget + # wget "$URL" -O "$OUTPUT_PATH/$BLOB" + + # Same, + unpack files on the fly + # curl "$URL" | tar -C "$OUTPUT_PATH" -f - -x -j +done diff --git a/pdns_synthesizer_icassp2022.cfg b/pdns_synthesizer_icassp2023.cfg similarity index 97% rename from pdns_synthesizer_icassp2022.cfg rename to pdns_synthesizer_icassp2023.cfg index e00474b5303..cebe1da69a7 100644 --- a/pdns_synthesizer_icassp2022.cfg +++ b/pdns_synthesizer_icassp2023.cfg @@ -1,137 +1,137 @@ -# Configuration for generating Noisy Speech Dataset - -# - sampling_rate: Specify the sampling rate. Default is 16 kHz -# - audioformat: default is .wav -# - audio_length: Minimum Length of each audio clip (noisy and clean speech) in seconds that will be generated by augmenting utterances. -# - silence_length: Duration of silence introduced between clean speech utterances. -# - total_hours: Total number of hours of data required. Units are in hours. -# - snr_lower: Lower bound for SNR required (default: 0 dB) -# - snr_upper: Upper bound for SNR required (default: 40 dB) -# - target_level_lower: Lower bound for the target audio level before audiowrite (default: -35 dB) -# - target_level_upper: Upper bound for the target audio level before audiowrite (default: -15 dB) -# - total_snrlevels: Number of SNR levels required (default: 5, which means there are 5 levels between snr_lower and snr_upper) -# - clean_activity_threshold: Activity threshold for clean speech -# - noise_activity_threshold: Activity threshold for noise -# - fileindex_start: Starting file ID that will be used in filenames -# - fileindex_end: Last file ID that will be used in filenames -# - is_test_set: Set it to True if it is the test set, else False for the training set -# - noise_dir: Specify the directory path to all noise files -# - Speech_dir: Specify the directory path to all clean speech files -# - noisy_destination: Specify path to the destination directory to store noisy speech -# - clean_destination: Specify path to the destination directory to store clean speech -# - noise_destination: Specify path to the destination directory to store noise speech -# - log_dir: Specify path to the directory to store all the log files - -# Configuration for unit tests -# - snr_test: Set to True if SNR test is required, else False -# - norm_test: Set to True if Normalization test is required, else False -# - sampling_rate_test: Set to True if Sampling Rate test is required, else False -# - clipping_test: Set to True if Clipping test is required, else False -# - unit_tests_log_dir: Specify path to the directory where you want to store logs - -[noisy_speech] - -sampling_rate: 48000 -audioformat: *.wav -audio_length: 30 -# 15, 12, 30 -silence_length: 0.2 -total_hours: 1000 -# 1000 -#200 -# 2.5, 500, 100 -snr_lower: -5 -#-5, 0 -snr_upper: 20 -# 25, 40 -randomize_snr: True -target_level_lower: -35 -target_level_upper: -15 -total_snrlevels: 31 -# 5 -clean_activity_threshold: 0.0 -noise_activity_threshold: 0.2 -fileindex_start: None -fileindex_end: None -is_test_set: False -# True, False - -noise_dir: /mnt/f/4th_DNSChallenge/ICASSP_2022/DNS-Challenge/datasets/noise -#/mnt/f/4th_DNSChallenge/INTERSPEECH_2021/DNS-Challenge/datasets_fullband/noise -#F:\4th_DNSChallenge\INTERSPEECH_2021\DNS-Challenge\datasets_fullband\noise -#datasets\pdns_training_set\noise -#\test_set2\Test_Noise -# datasets\noise -# \datasets\noise - -speech_dir: /mnt/f/4th_DNSChallenge/ICASSP_2022/DNS-Challenge/datasets/clean -# D:\kanhawin_git\primary_speakers_VCTK_16k_for_synthesizer -# datasets\test_set2\Singing_Voice\wav_16k -# dir with secondary speaker clean speech -speech_dir2: /mnt/f/4th_DNSChallenge/ICASSP_2022/DNS-Challenge/datasets/clean -#D:\kanhawin_git\secondary_speakers_voxCeleb2_16k -# datasets\test_set2\Singing_Voice\wav_16k - -spkid_csv: /mnt/f/4th_DNSChallenge/ICASSP_2022/DNS-Challenge/datasets/filelists/complete_ps_split.csv -#/mnt/f/4th_DNSChallenge/ICASSP_2022/DNS-Challenge/datasets/filelists/vctk_spkid.csv -# datasets\clean -noise_types_excluded: None - -rir_dir: /mnt/f/4th_DNSChallenge/ICASSP_2022/DNS-Challenge/datasets/pdns_training_set/impulse_responses -#/mnt/f/4th_DNSChallenge/ICASSP_2022/DNS-Challenge/datasets/impulse_responses -# F:\4th_DNSChallenge\ICASSP_2022\DNS-Challenge\datasets\impulse_responses - -# \datasets\clean -noisy_destination: /mnt/f/4th_DNSChallenge/ICASSP_2022/DNS-Challenge/datasets/pdns_training_set/mixed/noisy -# datasets/training_data/noisy -# datasets\test_set2\synthetic_personalizeddns\noisy -#training_set2_onlyrealrir\noisy -#\noisy -clean_destination: /mnt/f/4th_DNSChallenge/ICASSP_2022/DNS-Challenge/datasets/pdns_training_set/mixed/clean -#datasets\test_set2\synthetic_personalizeddns\clean -# training_set2_onlyrealrir\clean -# \clean -noise_destination: /mnt/f/4th_DNSChallenge/ICASSP_2022/DNS-Challenge/datasets/pdns_training_set/mixed/noise -# datasets/training_data/noise -#datasets\test_set2\synthetic_personalizeddns\noise -#training_set2_onlyrealrir\noise -# \noise -log_dir: logs -# \logs - -# Config: add singing voice to clean speech -clean_singing: datasets\clean_singing\VocalSet11\FULL -singing_choice: 3 -# 1 for only male, 2 for only female, 3 (default) for both male and female - -# Config: add reverb to clean speech -rir_choice: 1 -# 1 for only real rir, 2 for only synthetic rir, 3 (default) use both real and synthetic -lower_t60: 0.3 -# lower bound of t60 range in seconds -upper_t60: 1.3 -# upper bound of t60 range in seconds -rir_table_csv: datasets\acoustic_params\RIR_table_simple.csv -clean_speech_t60_csv: datasets\acoustic_params\cleanspeech_table_t60_c50.csv -# percent_for_adding_reverb=0.5 # percentage of clean speech convolved with RIR - -# pdns testsets -# primary_data: D:\kanhawin_git\primary_speakers_VCTK_16k -#'D:\PersonalizedDNS_dataset\synthetic_primary' -# secondary_data='D:\kanhawin_git\secondary_speakers_voxCeleb2_16k' -#'D:\PersonalizedDNS_dataset\synthetic_secondary' -# noise_data= datasets\test_set2\synthetic\noise -# pdns_testset_clean= datasets\test_set2\pdns\clean -# pdns_testset_noisy= datasets\test_set2\pdns\noisy - -# adaptation_data_seconds=120 -# num_primary_spk=100 -# num_clips=600 - -# Unit tests config -snr_test: True -norm_test: True -sampling_rate_test = True -clipping_test = True - -unit_tests_log_dir: unittests_logs +# Configuration for generating Noisy Speech Dataset + +# - sampling_rate: Specify the sampling rate. Default is 16 kHz +# - audioformat: default is .wav +# - audio_length: Minimum Length of each audio clip (noisy and clean speech) in seconds that will be generated by augmenting utterances. +# - silence_length: Duration of silence introduced between clean speech utterances. +# - total_hours: Total number of hours of data required. Units are in hours. +# - snr_lower: Lower bound for SNR required (default: 0 dB) +# - snr_upper: Upper bound for SNR required (default: 40 dB) +# - target_level_lower: Lower bound for the target audio level before audiowrite (default: -35 dB) +# - target_level_upper: Upper bound for the target audio level before audiowrite (default: -15 dB) +# - total_snrlevels: Number of SNR levels required (default: 5, which means there are 5 levels between snr_lower and snr_upper) +# - clean_activity_threshold: Activity threshold for clean speech +# - noise_activity_threshold: Activity threshold for noise +# - fileindex_start: Starting file ID that will be used in filenames +# - fileindex_end: Last file ID that will be used in filenames +# - is_test_set: Set it to True if it is the test set, else False for the training set +# - noise_dir: Specify the directory path to all noise files +# - Speech_dir: Specify the directory path to all clean speech files +# - noisy_destination: Specify path to the destination directory to store noisy speech +# - clean_destination: Specify path to the destination directory to store clean speech +# - noise_destination: Specify path to the destination directory to store noise speech +# - log_dir: Specify path to the directory to store all the log files + +# Configuration for unit tests +# - snr_test: Set to True if SNR test is required, else False +# - norm_test: Set to True if Normalization test is required, else False +# - sampling_rate_test: Set to True if Sampling Rate test is required, else False +# - clipping_test: Set to True if Clipping test is required, else False +# - unit_tests_log_dir: Specify path to the directory where you want to store logs + +[noisy_speech] + +sampling_rate: 48000 +audioformat: *.wav +audio_length: 30 +# 15, 12, 30 +silence_length: 0.2 +total_hours: 1000 +# 1000 +#200 +# 2.5, 500, 100 +snr_lower: -5 +#-5, 0 +snr_upper: 20 +# 25, 40 +randomize_snr: True +target_level_lower: -35 +target_level_upper: -15 +total_snrlevels: 31 +# 5 +clean_activity_threshold: 0.0 +noise_activity_threshold: 0.2 +fileindex_start: None +fileindex_end: None +is_test_set: False +# True, False + +noise_dir: /mnt/f/4th_DNSChallenge/ICASSP_2022/DNS-Challenge/datasets/noise +#/mnt/f/4th_DNSChallenge/INTERSPEECH_2021/DNS-Challenge/datasets_fullband/noise +#F:\4th_DNSChallenge\INTERSPEECH_2021\DNS-Challenge\datasets_fullband\noise +#datasets\pdns_training_set\noise +#\test_set2\Test_Noise +# datasets\noise +# \datasets\noise + +speech_dir: /mnt/f/4th_DNSChallenge/ICASSP_2022/DNS-Challenge/datasets/clean +# D:\kanhawin_git\primary_speakers_VCTK_16k_for_synthesizer +# datasets\test_set2\Singing_Voice\wav_16k +# dir with secondary speaker clean speech +speech_dir2: /mnt/f/4th_DNSChallenge/ICASSP_2022/DNS-Challenge/datasets/clean +#D:\kanhawin_git\secondary_speakers_voxCeleb2_16k +# datasets\test_set2\Singing_Voice\wav_16k + +spkid_csv: /mnt/f/4th_DNSChallenge/ICASSP_2022/DNS-Challenge/datasets/filelists/complete_ps_split.csv +#/mnt/f/4th_DNSChallenge/ICASSP_2022/DNS-Challenge/datasets/filelists/vctk_spkid.csv +# datasets\clean +noise_types_excluded: None + +rir_dir: /mnt/f/4th_DNSChallenge/ICASSP_2022/DNS-Challenge/datasets/pdns_training_set/impulse_responses +#/mnt/f/4th_DNSChallenge/ICASSP_2022/DNS-Challenge/datasets/impulse_responses +# F:\4th_DNSChallenge\ICASSP_2022\DNS-Challenge\datasets\impulse_responses + +# \datasets\clean +noisy_destination: /mnt/f/4th_DNSChallenge/ICASSP_2022/DNS-Challenge/datasets/pdns_training_set/mixed/noisy +# datasets/training_data/noisy +# datasets\test_set2\synthetic_personalizeddns\noisy +#training_set2_onlyrealrir\noisy +#\noisy +clean_destination: /mnt/f/4th_DNSChallenge/ICASSP_2022/DNS-Challenge/datasets/pdns_training_set/mixed/clean +#datasets\test_set2\synthetic_personalizeddns\clean +# training_set2_onlyrealrir\clean +# \clean +noise_destination: /mnt/f/4th_DNSChallenge/ICASSP_2022/DNS-Challenge/datasets/pdns_training_set/mixed/noise +# datasets/training_data/noise +#datasets\test_set2\synthetic_personalizeddns\noise +#training_set2_onlyrealrir\noise +# \noise +log_dir: logs +# \logs + +# Config: add singing voice to clean speech +clean_singing: datasets\clean_singing\VocalSet11\FULL +singing_choice: 3 +# 1 for only male, 2 for only female, 3 (default) for both male and female + +# Config: add reverb to clean speech +rir_choice: 1 +# 1 for only real rir, 2 for only synthetic rir, 3 (default) use both real and synthetic +lower_t60: 0.3 +# lower bound of t60 range in seconds +upper_t60: 1.3 +# upper bound of t60 range in seconds +rir_table_csv: datasets\acoustic_params\RIR_table_simple.csv +clean_speech_t60_csv: datasets\acoustic_params\cleanspeech_table_t60_c50.csv +# percent_for_adding_reverb=0.5 # percentage of clean speech convolved with RIR + +# pdns testsets +# primary_data: D:\kanhawin_git\primary_speakers_VCTK_16k +#'D:\PersonalizedDNS_dataset\synthetic_primary' +# secondary_data='D:\kanhawin_git\secondary_speakers_voxCeleb2_16k' +#'D:\PersonalizedDNS_dataset\synthetic_secondary' +# noise_data= datasets\test_set2\synthetic\noise +# pdns_testset_clean= datasets\test_set2\pdns\clean +# pdns_testset_noisy= datasets\test_set2\pdns\noisy + +# adaptation_data_seconds=120 +# num_primary_spk=100 +# num_clips=600 + +# Unit tests config +snr_test: True +norm_test: True +sampling_rate_test = True +clipping_test = True + +unit_tests_log_dir: unittests_logs