-
Notifications
You must be signed in to change notification settings - Fork 11
/
get_data.sh
executable file
·82 lines (72 loc) · 1.67 KB
/
get_data.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
#!/usr/bin/env bash
# Print the banner, then make sure ./data (relative to the current working
# directory) exists before any dataset is fetched.
echo "=== Acquiring datasets ==="
echo "---"
if [ -d "$PWD/data/" ]; then
  echo "Directory /data/ exists."
else
  echo "Create Directory /data."
  # Stop here if the directory cannot be created (for example a regular file
  # named "data" is in the way, or the working directory is not writable):
  # the steps that follow all test for sub-directories of ./data.
  if ! mkdir -p "$PWD/data"; then
    echo "ERROR: could not create directory $PWD/data" >&2
    exit 1
  fi
fi
# GLUE datasets: SST-2, QQP and QNLI.

#######################################
# Fetch one GLUE task unless its directory is already present under ./data.
# Arguments:
#   $1 - dataset label; used in the messages and as the directory name
#        checked under "$PWD/data"
#   $2 - task name handed to utilities/download_glue.py through --tasks
# Outputs:
#   Progress messages on stdout; an error line on stderr when the
#   downloader exits with a non-zero status.
# Returns:
#   0 if the directory already exists or the downloader succeeded,
#   1 if the downloader failed.
#######################################
download_glue_task() {
  local label=$1
  local task=$2

  echo "Downloading ${label} Dataset..."
  if [ -d "$PWD/data/${label}" ]; then
    echo "Directory /data/${label} exists."
    return 0
  fi

  echo "Directory /data/${label} does not exist."
  # Surface a failed download instead of silently carrying on.
  if ! python utilities/download_glue.py --tasks "${task}"; then
    echo "ERROR: downloading ${label} failed (utilities/download_glue.py --tasks ${task})." >&2
    return 1
  fi
  return 0
}

# Number of GLUE downloads that failed. Every task is still attempted so one
# broken download does not prevent the others from being fetched.
glue_failures=0

# (1) SST-2 -- the directory is named SST-2 but the task is requested as "SST".
download_glue_task "SST-2" "SST" || glue_failures=$((glue_failures + 1))
echo "---"
# (2) QQP
download_glue_task "QQP" "QQP" || glue_failures=$((glue_failures + 1))
echo "---"
# (3) QNLI
download_glue_task "QNLI" "QNLI" || glue_failures=$((glue_failures + 1))
echo "---"

if [ "${glue_failures}" -gt 0 ]; then
  echo "WARNING: ${glue_failures} GLUE download(s) failed; see the errors above." >&2
fi
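# The datasets below are not downloaded by this script yet:
# (4) PubMed
# (5) IMDB
# (6) AG_NEWS
# (7) DBPEDIA
#echo "Downloading AG_NEWS..."
## TODO: the AG_NEWS download below is disabled because it still has to be fixed.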
#if [ -d "$PWD/data/AG_NEWS" ]
#then
# echo "Directory /data/AG_NEWS exists."
#else
# echo "Directory /data/AG_NEWS does not exist."
# cd data
# mkdir AG_NEWS
# cd AG_NEWS
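# Source: https://drive.google.com/file/d/1X8hXEEpVscCVPsQnBKZZjozoUP7QL-mI/view?usp=sharing
# NOTE: quote the URL when re-enabling this line; an unquoted "&" makes the shell
# background wget and drop the "id=..." parameter.
# wget https://drive.google.com/uc?export=download&id=0Bz8a_Dbh9QhbUDNpeUdjb0wxRms #-O "ag_news_csv.tar.gz"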
# tar -xzvf "ag_news_csv.tar.gz" -C "${DATADIR}"
# cd ../../
#fi
#echo "---"
# NOTE: this disabled block uses ./datasets, whereas the rest of the script uses ./data.
#echo "Downloading DBPedia..."
#if [ -d "$PWD/datasets/DBPEDIA" ]
#then
# echo "Directory /datasets/DBPEDIA exists."
#else
# cd datasets
# mkdir DBPEDIA
# cd DBPEDIA
# wget https://drive.google.com/file/d/0Bz8a_Dbh9QhbQ2Vic1kxMmZZQ1k
#fi
# Closing separator followed by the end-of-script message.
printf '%s\n' "---" "The End :)"