Merge pull request #142 from microsoft/ashkana/updating_download_script

updating V5 download scripts
This commit is contained in:
hdubey 2022-12-07 15:49:56 -08:00 коммит произвёл GitHub
Родитель 26827b6d9d f1528275fe
Коммит 53f90648a9
Не найден ключ, соответствующий данной подписи
Идентификатор ключа GPG: 4AEE18F83AFDEB23
6 изменённых файлов: 130 добавлений и 190 удалений

Просмотреть файл

@@ -1,6 +1,6 @@
#!/usr/bin/bash
# ***** Datasets for ICASSP 2022 DNS Challenge 4 - Personalized DNS Track *****
# ***** Datasets for ICASSP 2023 DNS Challenge 5 - Headset DNS Track *****
# NOTE: Before downloading, make sure you have enough space
# on your local storage!
@@ -16,105 +16,89 @@
# downloading method that works best for you.
# -------------------------------------------------------------
# The directory structure of the unpacked data is:
# . 362G
# +-- datasets_fullband 64G
# | +-- impulse_responses 5.9G
# | \-- noise_fullband 58G
# +-- pdns_training_set 294G
# | +-- enrollment_embeddings 115M
# | +-- enrollment_wav 42G
# | +-- raw/clean 252G
# | +-- english 168G
# | +-- french 2.1G
# | +-- german 53G
# | +-- italian 17G
# | +-- russian 6.8G
# | \-- spanish 5.4G
# \-- personalized_dev_testset 3.3G
$BLOB_NAMES=@(
"V5_training_dataset/Track1_Headset/VocalSet_48kHz_mono.tgz",
"pdns_training_set/raw/pdns_training_set.raw.clean.english_000.tar.bz2",
"pdns_training_set/raw/pdns_training_set.raw.clean.english_001.tar.bz2",
"pdns_training_set/raw/pdns_training_set.raw.clean.english_002.tar.bz2",
"pdns_training_set/raw/pdns_training_set.raw.clean.english_003.tar.bz2",
"pdns_training_set/raw/pdns_training_set.raw.clean.english_004.tar.bz2",
"pdns_training_set/raw/pdns_training_set.raw.clean.english_005.tar.bz2",
"pdns_training_set/raw/pdns_training_set.raw.clean.english_006.tar.bz2",
"pdns_training_set/raw/pdns_training_set.raw.clean.english_007.tar.bz2",
"pdns_training_set/raw/pdns_training_set.raw.clean.english_008.tar.bz2",
"pdns_training_set/raw/pdns_training_set.raw.clean.english_009.tar.bz2",
"pdns_training_set/raw/pdns_training_set.raw.clean.english_010.tar.bz2",
"pdns_training_set/raw/pdns_training_set.raw.clean.english_011.tar.bz2",
"pdns_training_set/raw/pdns_training_set.raw.clean.english_012.tar.bz2",
"pdns_training_set/raw/pdns_training_set.raw.clean.english_013.tar.bz2",
"pdns_training_set/raw/pdns_training_set.raw.clean.english_014.tar.bz2",
"pdns_training_set/raw/pdns_training_set.raw.clean.english_015.tar.bz2",
"pdns_training_set/raw/pdns_training_set.raw.clean.english_016.tar.bz2",
"pdns_training_set/raw/pdns_training_set.raw.clean.english_017.tar.bz2",
"pdns_training_set/raw/pdns_training_set.raw.clean.english_018.tar.bz2",
"pdns_training_set/raw/pdns_training_set.raw.clean.english_019.tar.bz2",
"pdns_training_set/raw/pdns_training_set.raw.clean.english_020.tar.bz2",
"pdns_training_set/raw/pdns_training_set.raw.clean.french_000.tar.bz2",
"pdns_training_set/raw/pdns_training_set.raw.clean.german_000.tar.bz2",
"pdns_training_set/raw/pdns_training_set.raw.clean.german_001.tar.bz2",
"pdns_training_set/raw/pdns_training_set.raw.clean.german_002.tar.bz2",
"pdns_training_set/raw/pdns_training_set.raw.clean.german_003.tar.bz2",
"pdns_training_set/raw/pdns_training_set.raw.clean.german_004.tar.bz2",
"pdns_training_set/raw/pdns_training_set.raw.clean.german_005.tar.bz2",
"pdns_training_set/raw/pdns_training_set.raw.clean.german_006.tar.bz2",
"pdns_training_set/raw/pdns_training_set.raw.clean.german_007.tar.bz2",
"pdns_training_set/raw/pdns_training_set.raw.clean.german_008.tar.bz2",
"pdns_training_set/raw/pdns_training_set.raw.clean.italian_000.tar.bz2",
"pdns_training_set/raw/pdns_training_set.raw.clean.italian_001.tar.bz2",
"pdns_training_set/raw/pdns_training_set.raw.clean.italian_002.tar.bz2",
"pdns_training_set/raw/pdns_training_set.raw.clean.russian_000.tar.bz2",
"pdns_training_set/raw/pdns_training_set.raw.clean.spanish_000.tar.bz2",
"pdns_training_set/raw/pdns_training_set.raw.clean.spanish_001.tar.bz2",
"pdns_training_set/raw/pdns_training_set.raw.clean.spanish_002.tar.bz2",
"V5_training_dataset/Track1_Headset/vctk_wav48_silence_trimmed.tgz.partac",
"V5_training_dataset/Track1_Headset/vctk_wav48_silence_trimmed.tgz.partab",
"V5_training_dataset/Track1_Headset/vctk_wav48_silence_trimmed.tgz.partaa",
"pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.english_000.tar.bz2",
"pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.english_001.tar.bz2",
"pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.english_002.tar.bz2",
"pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.english_003.tar.bz2",
"pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.english_004.tar.bz2",
"pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.french_000.tar.bz2",
"pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.german_000.tar.bz2",
"pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.german_001.tar.bz2",
"pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.italian_000.tar.bz2",
"pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.russian_000.tar.bz2",
"pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.spanish_000.tar.bz2",
"V5_training_dataset/Track1_Headset/russian_speech.tgz",
"pdns_training_set/pdns_training_set.enrollment_embeddings_000.tar.bz2",
"V5_training_dataset/Track1_Headset/read_speech.tgz.partau",
"V5_training_dataset/Track1_Headset/read_speech.tgz.partat",
"V5_training_dataset/Track1_Headset/read_speech.tgz.partas",
"V5_training_dataset/Track1_Headset/read_speech.tgz.partar",
"V5_training_dataset/Track1_Headset/read_speech.tgz.partaq",
"V5_training_dataset/Track1_Headset/read_speech.tgz.partap",
"V5_training_dataset/Track1_Headset/read_speech.tgz.partao",
"V5_training_dataset/Track1_Headset/read_speech.tgz.partan",
"V5_training_dataset/Track1_Headset/read_speech.tgz.partam",
"V5_training_dataset/Track1_Headset/read_speech.tgz.partal",
"V5_training_dataset/Track1_Headset/read_speech.tgz.partak",
"V5_training_dataset/Track1_Headset/read_speech.tgz.partaj",
"V5_training_dataset/Track1_Headset/read_speech.tgz.partai",
"V5_training_dataset/Track1_Headset/read_speech.tgz.partah",
"V5_training_dataset/Track1_Headset/read_speech.tgz.partag",
"V5_training_dataset/Track1_Headset/read_speech.tgz.partaf",
"V5_training_dataset/Track1_Headset/read_speech.tgz.partae",
"V5_training_dataset/Track1_Headset/read_speech.tgz.partad",
"V5_training_dataset/Track1_Headset/read_speech.tgz.partac",
"V5_training_dataset/Track1_Headset/read_speech.tgz.partab",
"V5_training_dataset/Track1_Headset/read_speech.tgz.partaa",
"datasets_fullband/noise_fullband/datasets_fullband.noise_fullband.audioset_000.tar.bz2",
"datasets_fullband/noise_fullband/datasets_fullband.noise_fullband.audioset_001.tar.bz2",
"datasets_fullband/noise_fullband/datasets_fullband.noise_fullband.audioset_002.tar.bz2",
"datasets_fullband/noise_fullband/datasets_fullband.noise_fullband.audioset_003.tar.bz2",
"datasets_fullband/noise_fullband/datasets_fullband.noise_fullband.audioset_004.tar.bz2",
"datasets_fullband/noise_fullband/datasets_fullband.noise_fullband.audioset_005.tar.bz2",
"datasets_fullband/noise_fullband/datasets_fullband.noise_fullband.audioset_006.tar.bz2",
"V5_training_dataset/Track1_Headset/italian_speech.tgz.partad",
"V5_training_dataset/Track1_Headset/italian_speech.tgz.partac",
"V5_training_dataset/Track1_Headset/italian_speech.tgz.partab",
"V5_training_dataset/Track1_Headset/italian_speech.tgz.partaa",
"datasets_fullband/noise_fullband/datasets_fullband.noise_fullband.freesound_000.tar.bz2",
"datasets_fullband/noise_fullband/datasets_fullband.noise_fullband.freesound_001.tar.bz2",
"V5_training_dataset/Track1_Headset/french_speech.tar.gz.partah",
"V5_training_dataset/Track1_Headset/french_speech.tar.gz.partae",
"V5_training_dataset/Track1_Headset/french_speech.tar.gz.partad",
"V5_training_dataset/Track1_Headset/french_speech.tar.gz.partac",
"V5_training_dataset/Track1_Headset/french_speech.tar.gz.partab",
"V5_training_dataset/Track1_Headset/french_speech.tar.gz.partaa",
"datasets_fullband/datasets_fullband.impulse_responses_000.tar.bz2",
"V5_training_dataset/Track1_Headset/emotional_speech.tgz"
"personalized_dev_testset/personalized_dev_testset.enrollment.tar.bz2",
"personalized_dev_testset/personalized_dev_testset.noisy_testclips.tar.bz2"
"V5_training_dataset/noise_fullband/datasets_fullband.noise_fullband.freesound_001.tar.bz2",
"V5_training_dataset/noise_fullband/datasets_fullband.noise_fullband.freesound_000.tar.bz2",
"V5_training_dataset/noise_fullband/datasets_fullband.noise_fullband.audioset_006.tar.bz2",
"V5_training_dataset/noise_fullband/datasets_fullband.noise_fullband.audioset_005.tar.bz2",
"V5_training_dataset/noise_fullband/datasets_fullband.noise_fullband.audioset_004.tar.bz2",
"V5_training_dataset/noise_fullband/datasets_fullband.noise_fullband.audioset_003.tar.bz2",
"V5_training_dataset/noise_fullband/datasets_fullband.noise_fullband.audioset_002.tar.bz2",
"V5_training_dataset/noise_fullband/datasets_fullband.noise_fullband.audioset_001.tar.bz2",
"V5_training_dataset/noise_fullband/datasets_fullband.noise_fullband.audioset_000.tar.bz2",
"V5_training_dataset/datasets_fullband.impulse_responses_000.tar.bz2"
# "pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.english_000.tar.bz2",
# "pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.english_001.tar.bz2",
# "pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.english_002.tar.bz2",
# "pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.english_003.tar.bz2",
# "pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.english_004.tar.bz2",
# "pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.french_000.tar.bz2",
# "pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.german_000.tar.bz2",
# "pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.german_001.tar.bz2",
# "pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.italian_000.tar.bz2",
# "pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.russian_000.tar.bz2",
# "pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.spanish_000.tar.bz2",
# "pdns_training_set/pdns_training_set.enrollment_embeddings_000.tar.bz2"
)
###############################################################
$AZURE_URL="https://dns4public.blob.core.windows.net/dns4archive"
$AZURE_URL="https://dnschallengepublic.blob.core.windows.net/dns5archive"
$OUTPUT_PATH="."
mkdir -Force $OUTPUT_PATH/pdns_training_set/raw 2> $null
mkdir -Force $OUTPUT_PATH/pdns_training_set/enrollment_wav 2> $null
mkdir -Force $OUTPUT_PATH/datasets_fullband/noise_fullband 2> $null
mkdir -Force $OUTPUT_PATH/V5_training_dataset/noise_fullband 2> $null
mkdir -Force $OUTPUT_PATH/V5_training_dataset/Track1_Headset 2> $null
foreach ($BLOB in $BLOB_NAMES) {
@@ -123,14 +107,8 @@ foreach ($BLOB in $BLOB_NAMES) {
# DRY RUN: print HTTP response and Content-Length
# WITHOUT downloading the files
curl -s -I "$URL" | head -n 2
# Invoke-WebRequest $URL -Method Head
# Actually download the files: UNCOMMENT when ready to download
# curl "$URL" -o "$OUTPUT_PATH/$BLOB"
# Same as above, but using wget
# wget "$URL" -O "$OUTPUT_PATH/$BLOB"
# Same, + unpack files on the fly
# curl "$URL" | tar -C "$OUTPUT_PATH" -f - -x -j
Invoke-WebRequest $URL -OutFile "$OUTPUT_PATH/$BLOB"
}

Просмотреть файл

@@ -1,6 +1,6 @@
#!/usr/bin/bash
# ***** Datasets for ICASSP 2022 DNS Challenge 4 - Personalized DNS Track *****
# ***** Datasets for ICASSP 2023 DNS Challenge 5 - Personalized DNS Track *****
# NOTE: Before downloading, make sure you have enough space
# on your local storage!
@@ -16,103 +16,75 @@
# downloading method that works best for you.
# -------------------------------------------------------------
# The directory structure of the unpacked data is:
# . 362G
# +-- datasets_fullband 64G
# | +-- impulse_responses 5.9G
# | \-- noise_fullband 58G
# +-- pdns_training_set 294G
# | +-- enrollment_embeddings 115M
# | +-- enrollment_wav 42G
# | +-- raw/clean 252G
# | +-- english 168G
# | +-- french 2.1G
# | +-- german 53G
# | +-- italian 17G
# | +-- russian 6.8G
# | \-- spanish 5.4G
# \-- personalized_dev_testset 3.3G
BLOB_NAMES=(
V5_training_dataset/Track1_Headset/VocalSet_48kHz_mono.tgz
pdns_training_set/raw/pdns_training_set.raw.clean.english_000.tar.bz2
pdns_training_set/raw/pdns_training_set.raw.clean.english_001.tar.bz2
pdns_training_set/raw/pdns_training_set.raw.clean.english_002.tar.bz2
pdns_training_set/raw/pdns_training_set.raw.clean.english_003.tar.bz2
pdns_training_set/raw/pdns_training_set.raw.clean.english_004.tar.bz2
pdns_training_set/raw/pdns_training_set.raw.clean.english_005.tar.bz2
pdns_training_set/raw/pdns_training_set.raw.clean.english_006.tar.bz2
pdns_training_set/raw/pdns_training_set.raw.clean.english_007.tar.bz2
pdns_training_set/raw/pdns_training_set.raw.clean.english_008.tar.bz2
pdns_training_set/raw/pdns_training_set.raw.clean.english_009.tar.bz2
pdns_training_set/raw/pdns_training_set.raw.clean.english_010.tar.bz2
pdns_training_set/raw/pdns_training_set.raw.clean.english_011.tar.bz2
pdns_training_set/raw/pdns_training_set.raw.clean.english_012.tar.bz2
pdns_training_set/raw/pdns_training_set.raw.clean.english_013.tar.bz2
pdns_training_set/raw/pdns_training_set.raw.clean.english_014.tar.bz2
pdns_training_set/raw/pdns_training_set.raw.clean.english_015.tar.bz2
pdns_training_set/raw/pdns_training_set.raw.clean.english_016.tar.bz2
pdns_training_set/raw/pdns_training_set.raw.clean.english_017.tar.bz2
pdns_training_set/raw/pdns_training_set.raw.clean.english_018.tar.bz2
pdns_training_set/raw/pdns_training_set.raw.clean.english_019.tar.bz2
pdns_training_set/raw/pdns_training_set.raw.clean.english_020.tar.bz2
pdns_training_set/raw/pdns_training_set.raw.clean.french_000.tar.bz2
pdns_training_set/raw/pdns_training_set.raw.clean.german_000.tar.bz2
pdns_training_set/raw/pdns_training_set.raw.clean.german_001.tar.bz2
pdns_training_set/raw/pdns_training_set.raw.clean.german_002.tar.bz2
pdns_training_set/raw/pdns_training_set.raw.clean.german_003.tar.bz2
pdns_training_set/raw/pdns_training_set.raw.clean.german_004.tar.bz2
pdns_training_set/raw/pdns_training_set.raw.clean.german_005.tar.bz2
pdns_training_set/raw/pdns_training_set.raw.clean.german_006.tar.bz2
pdns_training_set/raw/pdns_training_set.raw.clean.german_007.tar.bz2
pdns_training_set/raw/pdns_training_set.raw.clean.german_008.tar.bz2
pdns_training_set/raw/pdns_training_set.raw.clean.italian_000.tar.bz2
pdns_training_set/raw/pdns_training_set.raw.clean.italian_001.tar.bz2
pdns_training_set/raw/pdns_training_set.raw.clean.italian_002.tar.bz2
pdns_training_set/raw/pdns_training_set.raw.clean.russian_000.tar.bz2
pdns_training_set/raw/pdns_training_set.raw.clean.spanish_000.tar.bz2
pdns_training_set/raw/pdns_training_set.raw.clean.spanish_001.tar.bz2
pdns_training_set/raw/pdns_training_set.raw.clean.spanish_002.tar.bz2
V5_training_dataset/Track1_Headset/vctk_wav48_silence_trimmed.tgz.partac
V5_training_dataset/Track1_Headset/vctk_wav48_silence_trimmed.tgz.partab
V5_training_dataset/Track1_Headset/vctk_wav48_silence_trimmed.tgz.partaa
pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.english_000.tar.bz2
pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.english_001.tar.bz2
pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.english_002.tar.bz2
pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.english_003.tar.bz2
pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.english_004.tar.bz2
pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.french_000.tar.bz2
pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.german_000.tar.bz2
pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.german_001.tar.bz2
pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.italian_000.tar.bz2
pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.russian_000.tar.bz2
pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.spanish_000.tar.bz2
V5_training_dataset/Track1_Headset/russian_speech.tgz
pdns_training_set/pdns_training_set.enrollment_embeddings_000.tar.bz2
V5_training_dataset/Track1_Headset/read_speech.tgz.partau
V5_training_dataset/Track1_Headset/read_speech.tgz.partat
V5_training_dataset/Track1_Headset/read_speech.tgz.partas
V5_training_dataset/Track1_Headset/read_speech.tgz.partar
V5_training_dataset/Track1_Headset/read_speech.tgz.partaq
V5_training_dataset/Track1_Headset/read_speech.tgz.partap
V5_training_dataset/Track1_Headset/read_speech.tgz.partao
V5_training_dataset/Track1_Headset/read_speech.tgz.partan
V5_training_dataset/Track1_Headset/read_speech.tgz.partam
V5_training_dataset/Track1_Headset/read_speech.tgz.partal
V5_training_dataset/Track1_Headset/read_speech.tgz.partak
V5_training_dataset/Track1_Headset/read_speech.tgz.partaj
V5_training_dataset/Track1_Headset/read_speech.tgz.partai
V5_training_dataset/Track1_Headset/read_speech.tgz.partah
V5_training_dataset/Track1_Headset/read_speech.tgz.partag
V5_training_dataset/Track1_Headset/read_speech.tgz.partaf
V5_training_dataset/Track1_Headset/read_speech.tgz.partae
V5_training_dataset/Track1_Headset/read_speech.tgz.partad
V5_training_dataset/Track1_Headset/read_speech.tgz.partac
V5_training_dataset/Track1_Headset/read_speech.tgz.partab
V5_training_dataset/Track1_Headset/read_speech.tgz.partaa
datasets_fullband/noise_fullband/datasets_fullband.noise_fullband.audioset_000.tar.bz2
datasets_fullband/noise_fullband/datasets_fullband.noise_fullband.audioset_001.tar.bz2
datasets_fullband/noise_fullband/datasets_fullband.noise_fullband.audioset_002.tar.bz2
datasets_fullband/noise_fullband/datasets_fullband.noise_fullband.audioset_003.tar.bz2
datasets_fullband/noise_fullband/datasets_fullband.noise_fullband.audioset_004.tar.bz2
datasets_fullband/noise_fullband/datasets_fullband.noise_fullband.audioset_005.tar.bz2
datasets_fullband/noise_fullband/datasets_fullband.noise_fullband.audioset_006.tar.bz2
V5_training_dataset/Track1_Headset/italian_speech.tgz.partad
V5_training_dataset/Track1_Headset/italian_speech.tgz.partac
V5_training_dataset/Track1_Headset/italian_speech.tgz.partab
V5_training_dataset/Track1_Headset/italian_speech.tgz.partaa
datasets_fullband/noise_fullband/datasets_fullband.noise_fullband.freesound_000.tar.bz2
datasets_fullband/noise_fullband/datasets_fullband.noise_fullband.freesound_001.tar.bz2
V5_training_dataset/Track1_Headset/french_speech.tar.gz.partah
V5_training_dataset/Track1_Headset/french_speech.tar.gz.partae
V5_training_dataset/Track1_Headset/french_speech.tar.gz.partad
V5_training_dataset/Track1_Headset/french_speech.tar.gz.partac
V5_training_dataset/Track1_Headset/french_speech.tar.gz.partab
V5_training_dataset/Track1_Headset/french_speech.tar.gz.partaa
datasets_fullband/datasets_fullband.impulse_responses_000.tar.bz2
V5_training_dataset/Track1_Headset/emotional_speech.tgz
personalized_dev_testset/personalized_dev_testset.enrollment.tar.bz2
personalized_dev_testset/personalized_dev_testset.noisy_testclips.tar.bz2
V5_training_dataset/noise_fullband/datasets_fullband.noise_fullband.freesound_001.tar.bz2
V5_training_dataset/noise_fullband/datasets_fullband.noise_fullband.freesound_000.tar.bz2
V5_training_dataset/noise_fullband/datasets_fullband.noise_fullband.audioset_006.tar.bz2
V5_training_dataset/noise_fullband/datasets_fullband.noise_fullband.audioset_005.tar.bz2
V5_training_dataset/noise_fullband/datasets_fullband.noise_fullband.audioset_004.tar.bz2
V5_training_dataset/noise_fullband/datasets_fullband.noise_fullband.audioset_003.tar.bz2
V5_training_dataset/noise_fullband/datasets_fullband.noise_fullband.audioset_002.tar.bz2
V5_training_dataset/noise_fullband/datasets_fullband.noise_fullband.audioset_001.tar.bz2
V5_training_dataset/noise_fullband/datasets_fullband.noise_fullband.audioset_000.tar.bz2
V5_training_dataset/datasets_fullband.impulse_responses_000.tar.bz2
)
###############################################################
AZURE_URL="https://dns4public.blob.core.windows.net/dns4archive"
AZURE_URL="https://dnschallengepublic.blob.core.windows.net/dns5archive"
OUTPUT_PATH="."
mkdir -p $OUTPUT_PATH/{pdns_training_set/{raw,enrollment_wav},datasets_fullband/noise_fullband}
mkdir -p $OUTPUT_PATH/V5_training_dataset/noise_fullband
mkdir -p $OUTPUT_PATH/V5_training_dataset/Track1_Headset
for BLOB in ${BLOB_NAMES[@]}
do
@@ -125,10 +97,6 @@ do
# Actually download the files: UNCOMMENT when ready to download
# curl "$URL" -o "$OUTPUT_PATH/$BLOB"
# Same as above, but using wget
# wget "$URL" -O "$OUTPUT_PATH/$BLOB"
# Same, + unpack files on the fly
# curl "$URL" | tar -C "$OUTPUT_PATH" -f - -x -j
done
#

Просмотреть файл

@@ -1,6 +1,6 @@
#!/usr/bin/bash
# ***** Datasets for ICASSP 2022 DNS Challenge 4 - Personalized DNS Track *****
# ***** Datasets for ICASSP 2023 DNS Challenge 5 - Speakerphone DNS Track *****
# NOTE: Before downloading, make sure you have enough space
# on your local storage!

Просмотреть файл

@@ -1,6 +1,6 @@
#!/usr/bin/bash
# ***** Datasets for ICASSP 2022 DNS Challenge 4 - Personalized DNS Track *****
# ***** Datasets for ICASSP 2023 DNS Challenge 5 - Speakerphone DNS Track *****
# NOTE: Before downloading, make sure you have enough space
# on your local storage!

Просмотреть файл

@@ -15,11 +15,7 @@
# | +-- Track1_Headset ---> (enrol, noisy)
# | +-- Track2_Speakerphone ---> (enrol, noisy)
$AZURE_URL="https://dns4public.blob.core.windows.net/dns4archive"
$OUTPUT_PATH="."
URL="https://dnschallengepublic.blob.core.windows.net/dns5archive/V5_dev_testset.zip"
$URL="https://dnschallengepublic.blob.core.windows.net/dns5archive/V5_dev_testset.zip"
Write-Output "Download: $URL"

Просмотреть файл

@@ -15,8 +15,6 @@
# | +-- Track1_Headset ---> (enrol, noisy)
# | +-- Track2_Speakerphone ---> (enrol, noisy)
AZURE_URL="https://dnschallengepublic.blob.core.windows.net/dns5archive"
URL="https://dnschallengepublic.blob.core.windows.net/dns5archive/V5_dev_testset.zip"
echo "Download: $URL"
#