66 lines
1.7 KiB
Bash
Executable File
66 lines
1.7 KiB
Bash
Executable File
#!/bin/bash
|
|
|
|
# Copyright 2018-2020 Yiming Wang
|
|
# 2018-2020 Daniel Povey
|
|
# 2021 Binbin Zhang
|
|
|
|
[ -f ./path.sh ] && . ./path.sh
|
|
|
|
dl_dir=data/download
|
|
|
|
. tools/parse_options.sh || exit 1;
|
|
|
|
mkdir -p $dl_dir
|
|
|
|
dataset=mobvoi_hotword_dataset.tgz
|
|
resources=mobvoi_hotword_dataset_resources.tgz
|
|
|
|
# base url for downloads.
|
|
data_url=http://www.openslr.org/resources/87
|
|
|
|
if [[ $(hostname -f) == *.clsp.jhu.edu ]]; then
|
|
src_path=/export/fs04/a07/ywang/mobvoihotwords
|
|
else
|
|
src_path=$dl_dir
|
|
fi
|
|
|
|
if [ ! -f $src_path/$dataset ] || [ ! -f $src_path/$resources ]; then
|
|
if ! which wget >/dev/null; then
|
|
echo "$0: wget is not installed."
|
|
exit 1;
|
|
fi
|
|
|
|
if [ ! -f $src_path/$dataset ]; then
|
|
echo "$0: downloading data from $data_url/$dataset. This may take some time, please be patient."
|
|
if ! wget --no-check-certificate -O $dl_dir/$dataset $data_url/$dataset; then
|
|
echo "$0: error executing wget $data_url/$dataset"
|
|
exit 1;
|
|
fi
|
|
fi
|
|
|
|
if [ ! -f $src_path/$resources ]; then
|
|
if ! wget --no-check-certificate -O $dl_dir/$resources $data_url/$resources; then
|
|
echo "$0: error executing wget $data_url/$resources"
|
|
exit 1;
|
|
fi
|
|
fi
|
|
fi
|
|
|
|
if [ -d $dl_dir/$(basename "$dataset" .tgz) ]; then
|
|
echo "Not extracting $(basename "$dataset" .tgz) as it is already there."
|
|
else
|
|
echo "Extracting $dataset..."
|
|
tar -xvzf $src_path/$dataset -C $dl_dir || exit 1;
|
|
echo "Done extracting $dataset."
|
|
fi
|
|
|
|
if [ -d $dl_dir/$(basename "$resources" .tgz) ]; then
|
|
echo "Not extracting $(basename "$dataset" .tar.gz) as it is already there."
|
|
else
|
|
echo "Extracting $resources..."
|
|
tar -xvzf $src_path/$resources -C $dl_dir || exit 1;
|
|
echo "Done extracting $resources."
|
|
fi
|
|
|
|
exit 0
|