Merge pull request #142 from microsoft/ashkana/updating_download_script
updating V5 download scripts
This commit is contained in:
Коммит
53f90648a9
|
@ -1,6 +1,6 @@
|
|||
#!/usr/bin/bash
|
||||
|
||||
# ***** Datasets for ICASSP 2022 DNS Challenge 4 - Personalized DNS Track *****
|
||||
# ***** Datasets for ICASSP 2023 DNS Challenge 5 - Headset DNS Track *****
|
||||
|
||||
# NOTE: Before downloading, make sure you have enough space
|
||||
# on your local storage!
|
||||
|
@ -16,105 +16,89 @@
|
|||
# downloading method that works best for you.
|
||||
|
||||
# -------------------------------------------------------------
|
||||
# The directory structure of the unpacked data is:
|
||||
|
||||
# . 362G
|
||||
# +-- datasets_fullband 64G
|
||||
# | +-- impulse_responses 5.9G
|
||||
# | \-- noise_fullband 58G
|
||||
# +-- pdns_training_set 294G
|
||||
# | +-- enrollment_embeddings 115M
|
||||
# | +-- enrollment_wav 42G
|
||||
# | +-- raw/clean 252G
|
||||
# | +-- english 168G
|
||||
# | +-- french 2.1G
|
||||
# | +-- german 53G
|
||||
# | +-- italian 17G
|
||||
# | +-- russian 6.8G
|
||||
# | \-- spanish 5.4G
|
||||
# \-- personalized_dev_testset 3.3G
|
||||
|
||||
$BLOB_NAMES=@(
|
||||
"V5_training_dataset/Track1_Headset/VocalSet_48kHz_mono.tgz",
|
||||
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.english_000.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.english_001.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.english_002.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.english_003.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.english_004.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.english_005.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.english_006.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.english_007.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.english_008.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.english_009.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.english_010.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.english_011.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.english_012.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.english_013.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.english_014.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.english_015.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.english_016.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.english_017.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.english_018.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.english_019.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.english_020.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.french_000.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.german_000.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.german_001.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.german_002.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.german_003.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.german_004.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.german_005.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.german_006.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.german_007.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.german_008.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.italian_000.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.italian_001.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.italian_002.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.russian_000.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.spanish_000.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.spanish_001.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.spanish_002.tar.bz2",
|
||||
"V5_training_dataset/Track1_Headset/vctk_wav48_silence_trimmed.tgz.partac",
|
||||
"V5_training_dataset/Track1_Headset/vctk_wav48_silence_trimmed.tgz.partab",
|
||||
"V5_training_dataset/Track1_Headset/vctk_wav48_silence_trimmed.tgz.partaa",
|
||||
|
||||
"pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.english_000.tar.bz2",
|
||||
"pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.english_001.tar.bz2",
|
||||
"pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.english_002.tar.bz2",
|
||||
"pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.english_003.tar.bz2",
|
||||
"pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.english_004.tar.bz2",
|
||||
"pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.french_000.tar.bz2",
|
||||
"pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.german_000.tar.bz2",
|
||||
"pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.german_001.tar.bz2",
|
||||
"pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.italian_000.tar.bz2",
|
||||
"pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.russian_000.tar.bz2",
|
||||
"pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.spanish_000.tar.bz2",
|
||||
"V5_training_dataset/Track1_Headset/russian_speech.tgz",
|
||||
|
||||
"pdns_training_set/pdns_training_set.enrollment_embeddings_000.tar.bz2",
|
||||
"V5_training_dataset/Track1_Headset/read_speech.tgz.partau",
|
||||
"V5_training_dataset/Track1_Headset/read_speech.tgz.partat",
|
||||
"V5_training_dataset/Track1_Headset/read_speech.tgz.partas",
|
||||
"V5_training_dataset/Track1_Headset/read_speech.tgz.partar",
|
||||
"V5_training_dataset/Track1_Headset/read_speech.tgz.partaq",
|
||||
"V5_training_dataset/Track1_Headset/read_speech.tgz.partap",
|
||||
"V5_training_dataset/Track1_Headset/read_speech.tgz.partao",
|
||||
"V5_training_dataset/Track1_Headset/read_speech.tgz.partan",
|
||||
"V5_training_dataset/Track1_Headset/read_speech.tgz.partam",
|
||||
"V5_training_dataset/Track1_Headset/read_speech.tgz.partal",
|
||||
"V5_training_dataset/Track1_Headset/read_speech.tgz.partak",
|
||||
"V5_training_dataset/Track1_Headset/read_speech.tgz.partaj",
|
||||
"V5_training_dataset/Track1_Headset/read_speech.tgz.partai",
|
||||
"V5_training_dataset/Track1_Headset/read_speech.tgz.partah",
|
||||
"V5_training_dataset/Track1_Headset/read_speech.tgz.partag",
|
||||
"V5_training_dataset/Track1_Headset/read_speech.tgz.partaf",
|
||||
"V5_training_dataset/Track1_Headset/read_speech.tgz.partae",
|
||||
"V5_training_dataset/Track1_Headset/read_speech.tgz.partad",
|
||||
"V5_training_dataset/Track1_Headset/read_speech.tgz.partac",
|
||||
"V5_training_dataset/Track1_Headset/read_speech.tgz.partab",
|
||||
"V5_training_dataset/Track1_Headset/read_speech.tgz.partaa",
|
||||
|
||||
"datasets_fullband/noise_fullband/datasets_fullband.noise_fullband.audioset_000.tar.bz2",
|
||||
"datasets_fullband/noise_fullband/datasets_fullband.noise_fullband.audioset_001.tar.bz2",
|
||||
"datasets_fullband/noise_fullband/datasets_fullband.noise_fullband.audioset_002.tar.bz2",
|
||||
"datasets_fullband/noise_fullband/datasets_fullband.noise_fullband.audioset_003.tar.bz2",
|
||||
"datasets_fullband/noise_fullband/datasets_fullband.noise_fullband.audioset_004.tar.bz2",
|
||||
"datasets_fullband/noise_fullband/datasets_fullband.noise_fullband.audioset_005.tar.bz2",
|
||||
"datasets_fullband/noise_fullband/datasets_fullband.noise_fullband.audioset_006.tar.bz2",
|
||||
"V5_training_dataset/Track1_Headset/italian_speech.tgz.partad",
|
||||
"V5_training_dataset/Track1_Headset/italian_speech.tgz.partac",
|
||||
"V5_training_dataset/Track1_Headset/italian_speech.tgz.partab",
|
||||
"V5_training_dataset/Track1_Headset/italian_speech.tgz.partaa",
|
||||
|
||||
"datasets_fullband/noise_fullband/datasets_fullband.noise_fullband.freesound_000.tar.bz2",
|
||||
"datasets_fullband/noise_fullband/datasets_fullband.noise_fullband.freesound_001.tar.bz2",
|
||||
"V5_training_dataset/Track1_Headset/french_speech.tar.gz.partah",
|
||||
"V5_training_dataset/Track1_Headset/french_speech.tar.gz.partae",
|
||||
"V5_training_dataset/Track1_Headset/french_speech.tar.gz.partad",
|
||||
"V5_training_dataset/Track1_Headset/french_speech.tar.gz.partac",
|
||||
"V5_training_dataset/Track1_Headset/french_speech.tar.gz.partab",
|
||||
"V5_training_dataset/Track1_Headset/french_speech.tar.gz.partaa",
|
||||
|
||||
"datasets_fullband/datasets_fullband.impulse_responses_000.tar.bz2",
|
||||
"V5_training_dataset/Track1_Headset/emotional_speech.tgz"
|
||||
|
||||
"personalized_dev_testset/personalized_dev_testset.enrollment.tar.bz2",
|
||||
"personalized_dev_testset/personalized_dev_testset.noisy_testclips.tar.bz2"
|
||||
|
||||
|
||||
"V5_training_dataset/noise_fullband/datasets_fullband.noise_fullband.freesound_001.tar.bz2",
|
||||
"V5_training_dataset/noise_fullband/datasets_fullband.noise_fullband.freesound_000.tar.bz2",
|
||||
|
||||
"V5_training_dataset/noise_fullband/datasets_fullband.noise_fullband.audioset_006.tar.bz2",
|
||||
"V5_training_dataset/noise_fullband/datasets_fullband.noise_fullband.audioset_005.tar.bz2",
|
||||
"V5_training_dataset/noise_fullband/datasets_fullband.noise_fullband.audioset_004.tar.bz2",
|
||||
"V5_training_dataset/noise_fullband/datasets_fullband.noise_fullband.audioset_003.tar.bz2",
|
||||
"V5_training_dataset/noise_fullband/datasets_fullband.noise_fullband.audioset_002.tar.bz2",
|
||||
"V5_training_dataset/noise_fullband/datasets_fullband.noise_fullband.audioset_001.tar.bz2",
|
||||
"V5_training_dataset/noise_fullband/datasets_fullband.noise_fullband.audioset_000.tar.bz2",
|
||||
|
||||
"V5_training_dataset/datasets_fullband.impulse_responses_000.tar.bz2"
|
||||
|
||||
# "pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.english_000.tar.bz2",
|
||||
# "pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.english_001.tar.bz2",
|
||||
# "pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.english_002.tar.bz2",
|
||||
# "pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.english_003.tar.bz2",
|
||||
# "pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.english_004.tar.bz2",
|
||||
# "pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.french_000.tar.bz2",
|
||||
# "pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.german_000.tar.bz2",
|
||||
# "pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.german_001.tar.bz2",
|
||||
# "pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.italian_000.tar.bz2",
|
||||
# "pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.russian_000.tar.bz2",
|
||||
# "pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.spanish_000.tar.bz2",
|
||||
|
||||
# "pdns_training_set/pdns_training_set.enrollment_embeddings_000.tar.bz2"
|
||||
)
|
||||
|
||||
###############################################################
|
||||
|
||||
$AZURE_URL="https://dns4public.blob.core.windows.net/dns4archive"
|
||||
$AZURE_URL="https://dnschallengepublic.blob.core.windows.net/dns5archive"
|
||||
|
||||
$OUTPUT_PATH="."
|
||||
|
||||
mkdir -Force $OUTPUT_PATH/pdns_training_set/raw 2> $null
|
||||
mkdir -Force $OUTPUT_PATH/pdns_training_set/enrollment_wav 2> $null
|
||||
mkdir -Force $OUTPUT_PATH/datasets_fullband/noise_fullband 2> $null
|
||||
mkdir -Force $OUTPUT_PATH/V5_training_dataset/noise_fullband 2> $null
|
||||
mkdir -Force $OUTPUT_PATH/V5_training_dataset/Track1_Headset 2> $null
|
||||
|
||||
foreach ($BLOB in $BLOB_NAMES) {
|
||||
|
||||
|
@ -123,14 +107,8 @@ foreach ($BLOB in $BLOB_NAMES) {
|
|||
|
||||
# DRY RUN: print HTTP response and Content-Length
|
||||
# WITHOUT downloading the files
|
||||
curl -s -I "$URL" | head -n 2
|
||||
# Invoke-WebRequest $URL -Method Head
|
||||
|
||||
# Actually download the files: UNCOMMENT when ready to download
|
||||
# curl "$URL" -o "$OUTPUT_PATH/$BLOB"
|
||||
|
||||
# Same as above, but using wget
|
||||
# wget "$URL" -O "$OUTPUT_PATH/$BLOB"
|
||||
|
||||
# Same, + unpack files on the fly
|
||||
# curl "$URL" | tar -C "$OUTPUT_PATH" -f - -x -j
|
||||
Invoke-WebRequest $URL -OutFile "$OUTPUT_PATH/$BLOB"
|
||||
}
|
||||
|
|
|
@ -1,6 +1,6 @@
|
|||
#!/usr/bin/bash
|
||||
|
||||
# ***** Datasets for ICASSP 2022 DNS Challenge 4 - Personalized DNS Track *****
|
||||
# ***** Datasets for ICASSP 2023 DNS Challenge 5 - Personalized DNS Track *****
|
||||
|
||||
# NOTE: Before downloading, make sure you have enough space
|
||||
# on your local storage!
|
||||
|
@ -16,103 +16,75 @@
|
|||
# downloading method that works best for you.
|
||||
|
||||
# -------------------------------------------------------------
|
||||
# The directory structure of the unpacked data is:
|
||||
|
||||
# . 362G
|
||||
# +-- datasets_fullband 64G
|
||||
# | +-- impulse_responses 5.9G
|
||||
# | \-- noise_fullband 58G
|
||||
# +-- pdns_training_set 294G
|
||||
# | +-- enrollment_embeddings 115M
|
||||
# | +-- enrollment_wav 42G
|
||||
# | +-- raw/clean 252G
|
||||
# | +-- english 168G
|
||||
# | +-- french 2.1G
|
||||
# | +-- german 53G
|
||||
# | +-- italian 17G
|
||||
# | +-- russian 6.8G
|
||||
# | \-- spanish 5.4G
|
||||
# \-- personalized_dev_testset 3.3G
|
||||
|
||||
BLOB_NAMES=(
|
||||
V5_training_dataset/Track1_Headset/VocalSet_48kHz_mono.tgz
|
||||
|
||||
pdns_training_set/raw/pdns_training_set.raw.clean.english_000.tar.bz2
|
||||
pdns_training_set/raw/pdns_training_set.raw.clean.english_001.tar.bz2
|
||||
pdns_training_set/raw/pdns_training_set.raw.clean.english_002.tar.bz2
|
||||
pdns_training_set/raw/pdns_training_set.raw.clean.english_003.tar.bz2
|
||||
pdns_training_set/raw/pdns_training_set.raw.clean.english_004.tar.bz2
|
||||
pdns_training_set/raw/pdns_training_set.raw.clean.english_005.tar.bz2
|
||||
pdns_training_set/raw/pdns_training_set.raw.clean.english_006.tar.bz2
|
||||
pdns_training_set/raw/pdns_training_set.raw.clean.english_007.tar.bz2
|
||||
pdns_training_set/raw/pdns_training_set.raw.clean.english_008.tar.bz2
|
||||
pdns_training_set/raw/pdns_training_set.raw.clean.english_009.tar.bz2
|
||||
pdns_training_set/raw/pdns_training_set.raw.clean.english_010.tar.bz2
|
||||
pdns_training_set/raw/pdns_training_set.raw.clean.english_011.tar.bz2
|
||||
pdns_training_set/raw/pdns_training_set.raw.clean.english_012.tar.bz2
|
||||
pdns_training_set/raw/pdns_training_set.raw.clean.english_013.tar.bz2
|
||||
pdns_training_set/raw/pdns_training_set.raw.clean.english_014.tar.bz2
|
||||
pdns_training_set/raw/pdns_training_set.raw.clean.english_015.tar.bz2
|
||||
pdns_training_set/raw/pdns_training_set.raw.clean.english_016.tar.bz2
|
||||
pdns_training_set/raw/pdns_training_set.raw.clean.english_017.tar.bz2
|
||||
pdns_training_set/raw/pdns_training_set.raw.clean.english_018.tar.bz2
|
||||
pdns_training_set/raw/pdns_training_set.raw.clean.english_019.tar.bz2
|
||||
pdns_training_set/raw/pdns_training_set.raw.clean.english_020.tar.bz2
|
||||
pdns_training_set/raw/pdns_training_set.raw.clean.french_000.tar.bz2
|
||||
pdns_training_set/raw/pdns_training_set.raw.clean.german_000.tar.bz2
|
||||
pdns_training_set/raw/pdns_training_set.raw.clean.german_001.tar.bz2
|
||||
pdns_training_set/raw/pdns_training_set.raw.clean.german_002.tar.bz2
|
||||
pdns_training_set/raw/pdns_training_set.raw.clean.german_003.tar.bz2
|
||||
pdns_training_set/raw/pdns_training_set.raw.clean.german_004.tar.bz2
|
||||
pdns_training_set/raw/pdns_training_set.raw.clean.german_005.tar.bz2
|
||||
pdns_training_set/raw/pdns_training_set.raw.clean.german_006.tar.bz2
|
||||
pdns_training_set/raw/pdns_training_set.raw.clean.german_007.tar.bz2
|
||||
pdns_training_set/raw/pdns_training_set.raw.clean.german_008.tar.bz2
|
||||
pdns_training_set/raw/pdns_training_set.raw.clean.italian_000.tar.bz2
|
||||
pdns_training_set/raw/pdns_training_set.raw.clean.italian_001.tar.bz2
|
||||
pdns_training_set/raw/pdns_training_set.raw.clean.italian_002.tar.bz2
|
||||
pdns_training_set/raw/pdns_training_set.raw.clean.russian_000.tar.bz2
|
||||
pdns_training_set/raw/pdns_training_set.raw.clean.spanish_000.tar.bz2
|
||||
pdns_training_set/raw/pdns_training_set.raw.clean.spanish_001.tar.bz2
|
||||
pdns_training_set/raw/pdns_training_set.raw.clean.spanish_002.tar.bz2
|
||||
V5_training_dataset/Track1_Headset/vctk_wav48_silence_trimmed.tgz.partac
|
||||
V5_training_dataset/Track1_Headset/vctk_wav48_silence_trimmed.tgz.partab
|
||||
V5_training_dataset/Track1_Headset/vctk_wav48_silence_trimmed.tgz.partaa
|
||||
|
||||
pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.english_000.tar.bz2
|
||||
pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.english_001.tar.bz2
|
||||
pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.english_002.tar.bz2
|
||||
pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.english_003.tar.bz2
|
||||
pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.english_004.tar.bz2
|
||||
pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.french_000.tar.bz2
|
||||
pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.german_000.tar.bz2
|
||||
pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.german_001.tar.bz2
|
||||
pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.italian_000.tar.bz2
|
||||
pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.russian_000.tar.bz2
|
||||
pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.spanish_000.tar.bz2
|
||||
V5_training_dataset/Track1_Headset/russian_speech.tgz
|
||||
|
||||
pdns_training_set/pdns_training_set.enrollment_embeddings_000.tar.bz2
|
||||
V5_training_dataset/Track1_Headset/read_speech.tgz.partau
|
||||
V5_training_dataset/Track1_Headset/read_speech.tgz.partat
|
||||
V5_training_dataset/Track1_Headset/read_speech.tgz.partas
|
||||
V5_training_dataset/Track1_Headset/read_speech.tgz.partar
|
||||
V5_training_dataset/Track1_Headset/read_speech.tgz.partaq
|
||||
V5_training_dataset/Track1_Headset/read_speech.tgz.partap
|
||||
V5_training_dataset/Track1_Headset/read_speech.tgz.partao
|
||||
V5_training_dataset/Track1_Headset/read_speech.tgz.partan
|
||||
V5_training_dataset/Track1_Headset/read_speech.tgz.partam
|
||||
V5_training_dataset/Track1_Headset/read_speech.tgz.partal
|
||||
V5_training_dataset/Track1_Headset/read_speech.tgz.partak
|
||||
V5_training_dataset/Track1_Headset/read_speech.tgz.partaj
|
||||
V5_training_dataset/Track1_Headset/read_speech.tgz.partai
|
||||
V5_training_dataset/Track1_Headset/read_speech.tgz.partah
|
||||
V5_training_dataset/Track1_Headset/read_speech.tgz.partag
|
||||
V5_training_dataset/Track1_Headset/read_speech.tgz.partaf
|
||||
V5_training_dataset/Track1_Headset/read_speech.tgz.partae
|
||||
V5_training_dataset/Track1_Headset/read_speech.tgz.partad
|
||||
V5_training_dataset/Track1_Headset/read_speech.tgz.partac
|
||||
V5_training_dataset/Track1_Headset/read_speech.tgz.partab
|
||||
V5_training_dataset/Track1_Headset/read_speech.tgz.partaa
|
||||
|
||||
datasets_fullband/noise_fullband/datasets_fullband.noise_fullband.audioset_000.tar.bz2
|
||||
datasets_fullband/noise_fullband/datasets_fullband.noise_fullband.audioset_001.tar.bz2
|
||||
datasets_fullband/noise_fullband/datasets_fullband.noise_fullband.audioset_002.tar.bz2
|
||||
datasets_fullband/noise_fullband/datasets_fullband.noise_fullband.audioset_003.tar.bz2
|
||||
datasets_fullband/noise_fullband/datasets_fullband.noise_fullband.audioset_004.tar.bz2
|
||||
datasets_fullband/noise_fullband/datasets_fullband.noise_fullband.audioset_005.tar.bz2
|
||||
datasets_fullband/noise_fullband/datasets_fullband.noise_fullband.audioset_006.tar.bz2
|
||||
V5_training_dataset/Track1_Headset/italian_speech.tgz.partad
|
||||
V5_training_dataset/Track1_Headset/italian_speech.tgz.partac
|
||||
V5_training_dataset/Track1_Headset/italian_speech.tgz.partab
|
||||
V5_training_dataset/Track1_Headset/italian_speech.tgz.partaa
|
||||
|
||||
datasets_fullband/noise_fullband/datasets_fullband.noise_fullband.freesound_000.tar.bz2
|
||||
datasets_fullband/noise_fullband/datasets_fullband.noise_fullband.freesound_001.tar.bz2
|
||||
V5_training_dataset/Track1_Headset/french_speech.tar.gz.partah
|
||||
V5_training_dataset/Track1_Headset/french_speech.tar.gz.partae
|
||||
V5_training_dataset/Track1_Headset/french_speech.tar.gz.partad
|
||||
V5_training_dataset/Track1_Headset/french_speech.tar.gz.partac
|
||||
V5_training_dataset/Track1_Headset/french_speech.tar.gz.partab
|
||||
V5_training_dataset/Track1_Headset/french_speech.tar.gz.partaa
|
||||
|
||||
datasets_fullband/datasets_fullband.impulse_responses_000.tar.bz2
|
||||
V5_training_dataset/Track1_Headset/emotional_speech.tgz
|
||||
|
||||
personalized_dev_testset/personalized_dev_testset.enrollment.tar.bz2
|
||||
personalized_dev_testset/personalized_dev_testset.noisy_testclips.tar.bz2
|
||||
|
||||
V5_training_dataset/noise_fullband/datasets_fullband.noise_fullband.freesound_001.tar.bz2
|
||||
V5_training_dataset/noise_fullband/datasets_fullband.noise_fullband.freesound_000.tar.bz2
|
||||
|
||||
V5_training_dataset/noise_fullband/datasets_fullband.noise_fullband.audioset_006.tar.bz2
|
||||
V5_training_dataset/noise_fullband/datasets_fullband.noise_fullband.audioset_005.tar.bz2
|
||||
V5_training_dataset/noise_fullband/datasets_fullband.noise_fullband.audioset_004.tar.bz2
|
||||
V5_training_dataset/noise_fullband/datasets_fullband.noise_fullband.audioset_003.tar.bz2
|
||||
V5_training_dataset/noise_fullband/datasets_fullband.noise_fullband.audioset_002.tar.bz2
|
||||
V5_training_dataset/noise_fullband/datasets_fullband.noise_fullband.audioset_001.tar.bz2
|
||||
V5_training_dataset/noise_fullband/datasets_fullband.noise_fullband.audioset_000.tar.bz2
|
||||
|
||||
V5_training_dataset/datasets_fullband.impulse_responses_000.tar.bz2
|
||||
)
|
||||
|
||||
###############################################################
|
||||
|
||||
AZURE_URL="https://dns4public.blob.core.windows.net/dns4archive"
|
||||
AZURE_URL="https://dnschallengepublic.blob.core.windows.net/dns5archive"
|
||||
|
||||
OUTPUT_PATH="."
|
||||
|
||||
mkdir -p $OUTPUT_PATH/{pdns_training_set/{raw,enrollment_wav},datasets_fullband/noise_fullband}
|
||||
mkdir -p $OUTPUT_PATH/V5_training_dataset/noise_fullband
|
||||
mkdir -p $OUTPUT_PATH/V5_training_dataset/Track1_Headset
|
||||
|
||||
for BLOB in ${BLOB_NAMES[@]}
|
||||
do
|
||||
|
@ -125,10 +97,6 @@ do
|
|||
|
||||
# Actually download the files: UNCOMMENT when ready to download
|
||||
# curl "$URL" -o "$OUTPUT_PATH/$BLOB"
|
||||
|
||||
# Same as above, but using wget
|
||||
# wget "$URL" -O "$OUTPUT_PATH/$BLOB"
|
||||
|
||||
# Same, + unpack files on the fly
|
||||
# curl "$URL" | tar -C "$OUTPUT_PATH" -f - -x -j
|
||||
done
|
||||
|
||||
#
|
|
@ -1,6 +1,6 @@
|
|||
#!/usr/bin/bash
|
||||
|
||||
# ***** Datasets for ICASSP 2022 DNS Challenge 4 - Personalized DNS Track *****
|
||||
# ***** Datasets for ICASSP 2023 DNS Challenge 5 - Speakerphone DNS Track *****
|
||||
|
||||
# NOTE: Before downloading, make sure you have enough space
|
||||
# on your local storage!
|
||||
|
|
|
@ -1,6 +1,6 @@
|
|||
#!/usr/bin/bash
|
||||
|
||||
# ***** Datasets for ICASSP 2022 DNS Challenge 4 - Personalized DNS Track *****
|
||||
# ***** Datasets for ICASSP 2023 DNS Challenge 5 - Speakerphone DNS Track *****
|
||||
|
||||
# NOTE: Before downloading, make sure you have enough space
|
||||
# on your local storage!
|
||||
|
|
|
@ -15,11 +15,7 @@
|
|||
# | +-- Track1_Headset ---> (enrol, noisy)
|
||||
# | +-- Track2_Speakerphone ---> (enrol, noisy)
|
||||
|
||||
$AZURE_URL="https://dns4public.blob.core.windows.net/dns4archive"
|
||||
|
||||
$OUTPUT_PATH="."
|
||||
|
||||
URL="https://dnschallengepublic.blob.core.windows.net/dns5archive/V5_dev_testset.zip"
|
||||
$URL="https://dnschallengepublic.blob.core.windows.net/dns5archive/V5_dev_testset.zip"
|
||||
|
||||
Write-Output "Download: $URL"
|
||||
|
||||
|
|
|
@ -15,8 +15,6 @@
|
|||
# | +-- Track1_Headset ---> (enrol, noisy)
|
||||
# | +-- Track2_Speakerphone ---> (enrol, noisy)
|
||||
|
||||
AZURE_URL="https://dnschallengepublic.blob.core.windows.net/dns5archive"
|
||||
|
||||
URL="https://dnschallengepublic.blob.core.windows.net/dns5archive/V5_dev_testset.zip"
|
||||
echo "Download: $URL"
|
||||
#
|
||||
|
|
Загрузка…
Ссылка в новой задаче