From 749c3d4168d96dbd30ffdfc7b7a682c0ab6d850c Mon Sep 17 00:00:00 2001
From: WuHaobo
Date: Sat, 11 Apr 2020 02:48:00 +0800
Subject: [PATCH] add dataset

---
 dataset/README.md                |  1 +
 dataset/download_imagenet2012.sh | 63 ++++++++++++++++++++++++++++++++
 2 files changed, 64 insertions(+)
 create mode 100644 dataset/README.md
 create mode 100644 dataset/download_imagenet2012.sh

diff --git a/dataset/README.md b/dataset/README.md
new file mode 100644
index 00000000..c1a50767
--- /dev/null
+++ b/dataset/README.md
@@ -0,0 +1 @@
+#mannual
diff --git a/dataset/download_imagenet2012.sh b/dataset/download_imagenet2012.sh
new file mode 100644
--- /dev/null
+++ b/dataset/download_imagenet2012.sh
@@ -0,0 +1,63 @@
+#!/bin/sh
+#
+# Download and unpack the ImageNet (ILSVRC2012) archives into the current
+# directory:
+#   train/<name>/  one directory per inner <name>.tar of the training archive
+#   val/           contents of the validation archive
+#   the label archive ImageNet_label.tgz is unpacked in place
+#
+# Written for POSIX sh so that "sh download_imagenet2012.sh" and
+# "bash download_imagenet2012.sh" behave the same.
+#
+# Environment:
+#   IMAGENET_USERNAME, IMAGENET_ACCESS_KEY
+#     Prompted for when either one is empty.
+#     NOTE(review): nothing below hands these to wget; confirm whether the
+#     download endpoint still requires them.
+set -eu
+
+if [ -z "${IMAGENET_USERNAME:-}" ] || [ -z "${IMAGENET_ACCESS_KEY:-}" ]; then
+  echo "Please create an account on image-net.org."
+  echo "It will provide you a pair of username and accesskey to download imagenet data."
+  printf 'Username: ' >&2
+  read -r IMAGENET_USERNAME
+  printf 'Accesskey: ' >&2
+  read -r IMAGENET_ACCESS_KEY
+fi
+
+root_url=http://www.image-net.org/challenges/LSVRC/2012/nnoupb
+valid_tar=ILSVRC2012_img_val.tar
+train_tar=ILSVRC2012_img_train.tar
+train_folder=train/
+valid_folder=val/
+
+echo "Download imagenet training data..."
+mkdir -p "${train_folder}"
+# -c resumes a partially downloaded archive instead of starting over.
+wget -nd -c "${root_url}/${train_tar}"
+tar xf "${train_tar}" -C "${train_folder}"
+
+# Unpack every inner archive into a directory named after it, then delete the
+# archive. The subshell keeps the caller's working directory untouched.
+(
+  cd "${train_folder}"
+  for archive in *.tar; do
+    # An unmatched glob stays literal; skip it rather than fail in tar.
+    [ -e "${archive}" ] || continue
+    out_dir=${archive%.tar}
+    mkdir -p "${out_dir}"
+    tar -xf "${archive}" -C "${out_dir}"
+    rm -f -- "${archive}"
+  done
+)
+
+echo "Download imagenet validation data..."
+mkdir -p "${valid_folder}"
+wget -nd -c "${root_url}/${valid_tar}"
+tar xf "${valid_tar}" -C "${valid_folder}"
+
+echo "Download imagenet label file: val_list.txt & train_list.txt"
+label_file=ImageNet_label.tgz
+label_url=http://paddle-imagenet-models.bj.bcebos.com/${label_file}
+wget -nd -c "${label_url}"
+tar zxf "${label_file}"
-- 
GitLab