data_dir=~/.cache/paddle/dataset/speech/deep_asr_data/aishell data_url='http://deep-asr-data.gz.bcebos.com/aishell_data.tar.gz' lst_url='http://deep-asr-data.gz.bcebos.com/aishell_lst.tar.gz' aux_url='http://deep-asr-data.gz.bcebos.com/aux.tar.gz' md5=17669b8d63331c9326f4a9393d289bfb aux_md5=50e3125eba1e3a2768a6f2e499cc1749 if [ ! -e $data_dir ]; then mkdir -p $data_dir fi if [ ! -e $data_dir/aishell_data.tar.gz ]; then echo "Download $data_dir/aishell_data.tar.gz ..." wget -c -P $data_dir $data_url else echo "Skip downloading for $data_dir/aishell_data.tar.gz has already existed!" fi echo "Checking md5 sum ..." md5sum_tmp=`md5sum $data_dir/aishell_data.tar.gz | cut -d ' ' -f1` if [ $md5sum_tmp != $md5 ]; then echo "Md5sum check failed, please remove and redownload " "$data_dir/aishell_data.tar.gz" exit 1 fi echo "Untar aishell_data.tar.gz ..." tar xzf $data_dir/aishell_data.tar.gz -C $data_dir if [ ! -e data ]; then mkdir data fi echo "Download and untar lst files ..." wget -c -P data $lst_url tar xvf data/aishell_lst.tar.gz -C data ln -s $data_dir data/aishell echo "Download and untar aux files ..." wget -c $aux_url tar xvf aux.tar.gz