removing outdated v4 transcripts files, added transcript into v5 devset, removed .ps1
This commit is contained in:
Родитель
a4f1a459cf
Коммит
18fa5e466b
Разница между файлами не показана из-за своего большого размера
Загрузить разницу
|
@ -1,136 +0,0 @@
|
|||
#!/usr/bin/bash
|
||||
|
||||
# ***** Datasets for ICASSP 2022 DNS Challenge 4 - Personalized DNS Track *****
|
||||
|
||||
# NOTE: Before downloading, make sure you have enough space
|
||||
# on your local storage!
|
||||
|
||||
# In all, you will need about 380GB to store the UNPACKED data.
|
||||
# Archived, the same data takes about 200GB total.
|
||||
|
||||
# Please comment out the files you don't need before launching
|
||||
# the script.
|
||||
|
||||
# NOTE: By default, the script *DOES NOT* DOWNLOAD ANY FILES!
|
||||
# Please scroll down and edit this script to pick the
|
||||
# downloading method that works best for you.
|
||||
|
||||
# -------------------------------------------------------------
|
||||
# The directory structure of the unpacked data is:
|
||||
|
||||
# . 362G
|
||||
# +-- datasets_fullband 64G
|
||||
# | +-- impulse_responses 5.9G
|
||||
# | \-- noise_fullband 58G
|
||||
# +-- pdns_training_set 294G
|
||||
# | +-- enrollment_embeddings 115M
|
||||
# | +-- enrollment_wav 42G
|
||||
# | +-- raw/clean 252G
|
||||
# | +-- english 168G
|
||||
# | +-- french 2.1G
|
||||
# | +-- german 53G
|
||||
# | +-- italian 17G
|
||||
# | +-- russian 6.8G
|
||||
# | \-- spanish 5.4G
|
||||
# \-- personalized_dev_testset 3.3G
|
||||
|
||||
$BLOB_NAMES=@(
|
||||
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.english_000.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.english_001.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.english_002.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.english_003.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.english_004.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.english_005.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.english_006.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.english_007.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.english_008.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.english_009.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.english_010.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.english_011.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.english_012.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.english_013.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.english_014.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.english_015.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.english_016.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.english_017.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.english_018.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.english_019.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.english_020.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.french_000.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.german_000.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.german_001.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.german_002.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.german_003.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.german_004.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.german_005.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.german_006.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.german_007.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.german_008.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.italian_000.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.italian_001.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.italian_002.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.russian_000.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.spanish_000.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.spanish_001.tar.bz2",
|
||||
"pdns_training_set/raw/pdns_training_set.raw.clean.spanish_002.tar.bz2",
|
||||
|
||||
"pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.english_000.tar.bz2",
|
||||
"pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.english_001.tar.bz2",
|
||||
"pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.english_002.tar.bz2",
|
||||
"pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.english_003.tar.bz2",
|
||||
"pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.english_004.tar.bz2",
|
||||
"pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.french_000.tar.bz2",
|
||||
"pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.german_000.tar.bz2",
|
||||
"pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.german_001.tar.bz2",
|
||||
"pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.italian_000.tar.bz2",
|
||||
"pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.russian_000.tar.bz2",
|
||||
"pdns_training_set/enrollment_wav/pdns_training_set.enrollment_wav.spanish_000.tar.bz2",
|
||||
|
||||
"pdns_training_set/pdns_training_set.enrollment_embeddings_000.tar.bz2",
|
||||
|
||||
"datasets_fullband/noise_fullband/datasets_fullband.noise_fullband.audioset_000.tar.bz2",
|
||||
"datasets_fullband/noise_fullband/datasets_fullband.noise_fullband.audioset_001.tar.bz2",
|
||||
"datasets_fullband/noise_fullband/datasets_fullband.noise_fullband.audioset_002.tar.bz2",
|
||||
"datasets_fullband/noise_fullband/datasets_fullband.noise_fullband.audioset_003.tar.bz2",
|
||||
"datasets_fullband/noise_fullband/datasets_fullband.noise_fullband.audioset_004.tar.bz2",
|
||||
"datasets_fullband/noise_fullband/datasets_fullband.noise_fullband.audioset_005.tar.bz2",
|
||||
"datasets_fullband/noise_fullband/datasets_fullband.noise_fullband.audioset_006.tar.bz2",
|
||||
|
||||
"datasets_fullband/noise_fullband/datasets_fullband.noise_fullband.freesound_000.tar.bz2",
|
||||
"datasets_fullband/noise_fullband/datasets_fullband.noise_fullband.freesound_001.tar.bz2",
|
||||
|
||||
"datasets_fullband/datasets_fullband.impulse_responses_000.tar.bz2",
|
||||
|
||||
"personalized_dev_testset/personalized_dev_testset.enrollment.tar.bz2",
|
||||
"personalized_dev_testset/personalized_dev_testset.noisy_testclips.tar.bz2"
|
||||
)
|
||||
|
||||
###############################################################
|
||||
|
||||
$AZURE_URL="https://dns4public.blob.core.windows.net/dns4archive"
|
||||
|
||||
$OUTPUT_PATH="."
|
||||
|
||||
mkdir -Force $OUTPUT_PATH/pdns_training_set/raw 2> $null
|
||||
mkdir -Force $OUTPUT_PATH/pdns_training_set/enrollment_wav 2> $null
|
||||
mkdir -Force $OUTPUT_PATH/datasets_fullband/noise_fullband 2> $null
|
||||
|
||||
foreach ($BLOB in $BLOB_NAMES) {
|
||||
|
||||
$URL="$AZURE_URL/$BLOB"
|
||||
Write-Output "Download: $BLOB"
|
||||
|
||||
# DRY RUN: print HTTP response and Content-Length
|
||||
# WITHOUT downloading the files
|
||||
curl -s -I "$URL" | head -n 2
|
||||
|
||||
# Actually download the files: UNCOMMENT when ready to download
|
||||
# curl "$URL" -o "$OUTPUT_PATH/$BLOB"
|
||||
|
||||
# Same as above, but using wget
|
||||
# wget "$URL" -O "$OUTPUT_PATH/$BLOB"
|
||||
|
||||
# Same, + unpack files on the fly
|
||||
# curl "$URL" | tar -C "$OUTPUT_PATH" -f - -x -j
|
||||
}
|
|
@ -1,204 +0,0 @@
|
|||
|
||||
# ***** Datasets for ICASSP 2022 DNS Challenge 4 *****
|
||||
|
||||
# NOTE: Before downloading, make sure you have enough space
|
||||
# on your local storage!
|
||||
|
||||
# In all, you will need about 1TB to store the UNPACKED data.
|
||||
# Archived, the same data takes about 550GB total.
|
||||
|
||||
# Please comment out the files you don't need before launching
|
||||
# the script.
|
||||
|
||||
# NOTE: By default, the script *DOES NOT* DOWNLOAD ANY FILES!
|
||||
# Please scroll down and edit this script to pick the
|
||||
# downloading method that works best for you.
|
||||
|
||||
# -------------------------------------------------------------
|
||||
# The directory structure of the unpacked data is:
|
||||
|
||||
# datasets_fullband 892G
|
||||
# +-- dev_testset 1.7G
|
||||
# +-- impulse_responses 5.9G
|
||||
# +-- noise_fullband 58G
|
||||
# \-- clean_fullband 827G
|
||||
# +-- emotional_speech 2.4G
|
||||
# +-- french_speech 62G
|
||||
# +-- german_speech 319G
|
||||
# +-- italian_speech 42G
|
||||
# +-- read_speech 299G
|
||||
# +-- russian_speech 12G
|
||||
# +-- spanish_speech 65G
|
||||
# +-- vctk_wav48_silence_trimmed 27G
|
||||
# \-- VocalSet_48kHz_mono 974M
|
||||
|
||||
$BLOB_NAMES=@(
|
||||
|
||||
"clean_fullband/datasets_fullband.clean_fullband.VocalSet_48kHz_mono_000_NA_NA.tar.bz2",
|
||||
|
||||
"clean_fullband/datasets_fullband.clean_fullband.emotional_speech_000_NA_NA.tar.bz2",
|
||||
|
||||
"clean_fullband/datasets_fullband.clean_fullband.french_speech_000_NA_NA.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.french_speech_001_NA_NA.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.french_speech_002_NA_NA.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.french_speech_003_NA_NA.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.french_speech_004_NA_NA.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.french_speech_005_NA_NA.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.french_speech_006_NA_NA.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.french_speech_007_NA_NA.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.french_speech_008_NA_NA.tar.bz2",
|
||||
|
||||
"clean_fullband/datasets_fullband.clean_fullband.german_speech_000_0.00_3.47.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.german_speech_001_3.47_3.64.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.german_speech_002_3.64_3.74.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.german_speech_003_3.74_3.81.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.german_speech_004_3.81_3.86.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.german_speech_005_3.86_3.91.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.german_speech_006_3.91_3.96.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.german_speech_007_3.96_4.00.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.german_speech_008_4.00_4.04.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.german_speech_009_4.04_4.08.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.german_speech_010_4.08_4.12.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.german_speech_011_4.12_4.16.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.german_speech_012_4.16_4.21.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.german_speech_013_4.21_4.26.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.german_speech_014_4.26_4.33.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.german_speech_015_4.33_4.43.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.german_speech_016_4.43_NA.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.german_speech_017_NA_NA.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.german_speech_018_NA_NA.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.german_speech_019_NA_NA.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.german_speech_020_NA_NA.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.german_speech_021_NA_NA.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.german_speech_022_NA_NA.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.german_speech_023_NA_NA.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.german_speech_024_NA_NA.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.german_speech_025_NA_NA.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.german_speech_026_NA_NA.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.german_speech_027_NA_NA.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.german_speech_028_NA_NA.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.german_speech_029_NA_NA.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.german_speech_030_NA_NA.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.german_speech_031_NA_NA.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.german_speech_032_NA_NA.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.german_speech_033_NA_NA.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.german_speech_034_NA_NA.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.german_speech_035_NA_NA.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.german_speech_036_NA_NA.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.german_speech_037_NA_NA.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.german_speech_038_NA_NA.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.german_speech_039_NA_NA.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.german_speech_040_NA_NA.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.german_speech_041_NA_NA.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.german_speech_042_NA_NA.tar.bz2",
|
||||
|
||||
"clean_fullband/datasets_fullband.clean_fullband.italian_speech_000_0.00_3.98.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.italian_speech_001_3.98_4.21.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.italian_speech_002_4.21_4.40.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.italian_speech_003_4.40_NA.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.italian_speech_004_NA_NA.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.italian_speech_005_NA_NA.tar.bz2",
|
||||
|
||||
"clean_fullband/datasets_fullband.clean_fullband.read_speech_000_0.00_3.75.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.read_speech_001_3.75_3.88.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.read_speech_002_3.88_3.96.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.read_speech_003_3.96_4.02.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.read_speech_004_4.02_4.06.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.read_speech_005_4.06_4.10.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.read_speech_006_4.10_4.13.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.read_speech_007_4.13_4.16.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.read_speech_008_4.16_4.19.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.read_speech_009_4.19_4.21.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.read_speech_010_4.21_4.24.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.read_speech_011_4.24_4.26.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.read_speech_012_4.26_4.29.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.read_speech_013_4.29_4.31.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.read_speech_014_4.31_4.33.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.read_speech_015_4.33_4.35.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.read_speech_016_4.35_4.38.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.read_speech_017_4.38_4.40.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.read_speech_018_4.40_4.42.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.read_speech_019_4.42_4.45.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.read_speech_020_4.45_4.48.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.read_speech_021_4.48_4.52.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.read_speech_022_4.52_4.57.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.read_speech_023_4.57_4.67.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.read_speech_024_4.67_NA.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.read_speech_025_NA_NA.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.read_speech_026_NA_NA.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.read_speech_027_NA_NA.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.read_speech_028_NA_NA.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.read_speech_029_NA_NA.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.read_speech_030_NA_NA.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.read_speech_031_NA_NA.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.read_speech_032_NA_NA.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.read_speech_033_NA_NA.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.read_speech_034_NA_NA.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.read_speech_035_NA_NA.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.read_speech_036_NA_NA.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.read_speech_037_NA_NA.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.read_speech_038_NA_NA.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.read_speech_039_NA_NA.tar.bz2",
|
||||
|
||||
"clean_fullband/datasets_fullband.clean_fullband.russian_speech_000_0.00_4.31.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.russian_speech_001_4.31_NA.tar.bz2",
|
||||
|
||||
"clean_fullband/datasets_fullband.clean_fullband.spanish_speech_000_0.00_4.09.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.spanish_speech_001_4.09_NA.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.spanish_speech_002_NA_NA.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.spanish_speech_003_NA_NA.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.spanish_speech_004_NA_NA.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.spanish_speech_005_NA_NA.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.spanish_speech_006_NA_NA.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.spanish_speech_007_NA_NA.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.spanish_speech_008_NA_NA.tar.bz2",
|
||||
|
||||
"clean_fullband/datasets_fullband.clean_fullband.vctk_wav48_silence_trimmed_000.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.vctk_wav48_silence_trimmed_001.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.vctk_wav48_silence_trimmed_002.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.vctk_wav48_silence_trimmed_003.tar.bz2",
|
||||
"clean_fullband/datasets_fullband.clean_fullband.vctk_wav48_silence_trimmed_004.tar.bz2",
|
||||
|
||||
"noise_fullband/datasets_fullband.noise_fullband.audioset_000.tar.bz2",
|
||||
"noise_fullband/datasets_fullband.noise_fullband.audioset_001.tar.bz2",
|
||||
"noise_fullband/datasets_fullband.noise_fullband.audioset_002.tar.bz2",
|
||||
"noise_fullband/datasets_fullband.noise_fullband.audioset_003.tar.bz2",
|
||||
"noise_fullband/datasets_fullband.noise_fullband.audioset_004.tar.bz2",
|
||||
"noise_fullband/datasets_fullband.noise_fullband.audioset_005.tar.bz2",
|
||||
"noise_fullband/datasets_fullband.noise_fullband.audioset_006.tar.bz2",
|
||||
|
||||
"noise_fullband/datasets_fullband.noise_fullband.freesound_000.tar.bz2",
|
||||
"noise_fullband/datasets_fullband.noise_fullband.freesound_001.tar.bz2",
|
||||
|
||||
"datasets_fullband.dev_testset_000.tar.bz2",
|
||||
|
||||
"datasets_fullband.impulse_responses_000.tar.bz2"
|
||||
)
|
||||
|
||||
###############################################################
|
||||
|
||||
$AZURE_URL="https://dns4public.blob.core.windows.net/dns4archive/datasets_fullband"
|
||||
|
||||
$OUTPUT_PATH="./datasets_fullband"
|
||||
|
||||
mkdir -Force $OUTPUT_PATH/clean_fullband 2> $null
|
||||
mkdir -Force $OUTPUT_PATH/noise_fullband 2> $null
|
||||
|
||||
foreach ($BLOB in $BLOB_NAMES) {
|
||||
|
||||
$URL="$AZURE_URL/$BLOB"
|
||||
Write-Output "Download: $BLOB"
|
||||
|
||||
# DRY RUN: print HTTP response and Content-Length
|
||||
# WITHOUT downloading the files
|
||||
curl -s -I "$URL" | head -n 2
|
||||
|
||||
# Actually download the files: UNCOMMENT when ready to download
|
||||
# curl "$URL" -o "$OUTPUT_PATH/$BLOB"
|
||||
|
||||
# Same as above, but using wget
|
||||
# wget "$URL" -O "$OUTPUT_PATH/$BLOB"
|
||||
|
||||
# Same, + unpack files on the fly
|
||||
# curl "$URL" | tar -C "$OUTPUT_PATH" -f - -x -j
|
||||
}
|
|
@ -1,33 +0,0 @@
|
|||
#!/usr/bin/bash
|
||||
|
||||
# ***** Dev Testset for 5th DNS Challenge at ICASSP 2023 *****
|
||||
|
||||
# NOTE: Before downloading, make sure you have enough space
|
||||
# on your local storage!
|
||||
|
||||
# Zip file is 2.9 GB. Unzipped data is 4GB.
|
||||
|
||||
# -------------------------------------------------------------
|
||||
# The directory structure of the unpacked data is:
|
||||
|
||||
#
|
||||
# +-- V5_dev_testset 4G
|
||||
# | +-- Track1_Headset ---> (enrol, noisy)
|
||||
# | +-- Track2_Speakerphone ---> (enrol, noisy)
|
||||
|
||||
$URL="https://dnschallengepublic.blob.core.windows.net/dns5archive/V5_dev_testset.zip"
|
||||
|
||||
Write-Output "Download: $URL"
|
||||
|
||||
# DRY RUN: print HTTP response and Content-Length
|
||||
# WITHOUT downloading the files
|
||||
curl -s -I "$URL" | head -n 2
|
||||
|
||||
# Actually download the files: UNCOMMENT when ready to download
|
||||
# curl "$URL" -o "V5_dev_testset.zip"
|
||||
|
||||
# Same as above, but using wget
|
||||
# wget "$URL" -O "V5_dev_testset.zip"
|
||||
|
||||
# Same, + unpack files on the fly
|
||||
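# curl "$URL" | tar -C "$OUTPUT_PATH" -f - -x -j   # NOTE(review): $OUTPUT_PATH is never set in this script and -j (bzip2) does not match a .zip archive; confirm before uncommenting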
|
Загрузка…
Ссылка в новой задаче