# pull_all_data.sh
#
# Downloads and unpacks the data files used by this project:
#   - SARC 2.0 "pol" and "main" subsets  -> SARC/2.0/pol/ and SARC/2.0/main/
#   - fastText wiki-news-300d-1M-subword -> ../static/
#   - GloVe 6B text vectors              -> ../static/glove/
#   - amazon_glove1600.txt               -> ../static/
#
# Requires wget, bzip2 and unzip. Paths are relative to the directory the
# script is run from.
# Download the five bzip2-compressed files of the SARC 2.0 "pol" subset and
# leave the decompressed copies in SARC/2.0/pol/.
#
# Each archive is fetched and unpacked directly inside the target directory,
# so nothing is staged in the current directory. The script stops at the first
# failed step instead of carrying on with missing files.
sarc_pol_dir=SARC/2.0/pol
sarc_pol_url=http://nlp.cs.princeton.edu/SARC/2.0/pol
mkdir -p "${sarc_pol_dir}" || exit 1
for sarc_pol_file in \
  comments.json \
  train-balanced.csv \
  train-unbalanced.csv \
  test-balanced.csv \
  test-unbalanced.csv; do
  # -O pins the output path: an archive left over from an earlier run is
  # overwritten rather than wget saving the new copy under a ".1" suffix.
  if ! wget -O "${sarc_pol_dir}/${sarc_pol_file}.bz2" \
    "${sarc_pol_url}/${sarc_pol_file}.bz2"; then
    printf 'error: could not download %s\n' \
      "${sarc_pol_url}/${sarc_pol_file}.bz2" >&2
    # wget -O creates the output file up front, so remove the partial copy.
    rm -f -- "${sarc_pol_dir}/${sarc_pol_file}.bz2"
    exit 1
  fi
  # -f lets a re-run replace a file extracted by a previous run; without it
  # bzip2 refuses to overwrite existing output.
  if ! bzip2 -d -f -- "${sarc_pol_dir}/${sarc_pol_file}.bz2"; then
    printf 'error: could not decompress %s\n' \
      "${sarc_pol_dir}/${sarc_pol_file}.bz2" >&2
    exit 1
  fi
done
# Fetch the fastText wiki-news-300d-1M-subword vectors, unpack them and move
# the extracted .vec file into ../static/. Stops at the first failed step.
# NOTE(review): the S3 URL below is kept unchanged; it may no longer be served
# - confirm against the current fastText download page.
fasttext_zip=wiki-news-300d-1M-subword.vec.zip
# -p: do not fail when ../static already exists (e.g. on a re-run).
mkdir -p ../static || exit 1
# -O pins the output name so a stale archive is overwritten instead of wget
# saving the new download under a ".1" suffix.
if ! wget -O "${fasttext_zip}" \
  "https://s3-us-west-1.amazonaws.com/fasttext-vectors/${fasttext_zip}"; then
  printf 'error: could not download %s\n' "${fasttext_zip}" >&2
  rm -f -- "${fasttext_zip}"
  exit 1
fi
# -o: overwrite previously extracted files without prompting, so a re-run
# does not block waiting for input.
unzip -o "${fasttext_zip}" || exit 1
rm -- "${fasttext_zip}"
mv -- wiki-news-300d-1M-subword.vec ../static/ || exit 1
# Fetch the GloVe 6B archive, unpack it and move every extracted glove*.txt
# file into ../static/glove/. Stops at the first failed step.
glove_zip=glove.6B.zip
# -O pins the output name so a stale archive is overwritten instead of wget
# saving the new download under a ".1" suffix.
if ! wget -O "${glove_zip}" "http://nlp.stanford.edu/data/${glove_zip}"; then
  printf 'error: could not download %s\n' "${glove_zip}" >&2
  rm -f -- "${glove_zip}"
  exit 1
fi
# -o: overwrite previously extracted files without prompting.
unzip -o "${glove_zip}" || exit 1
rm -- "${glove_zip}"
# -p: creates ../static as well if it is missing, and does not fail when the
# glove directory already exists.
mkdir -p ../static/glove || exit 1
mv -- glove*.txt ../static/glove/ || exit 1
# Download the five bzip2-compressed files of the SARC 2.0 "main" subset and
# leave the decompressed copies in SARC/2.0/main/.
#
# Each archive is fetched and unpacked directly inside the target directory,
# so nothing is staged in the current directory. The script stops at the first
# failed step instead of carrying on with missing files.
sarc_main_dir=SARC/2.0/main
sarc_main_url=http://nlp.cs.princeton.edu/SARC/2.0/main
mkdir -p "${sarc_main_dir}" || exit 1
for sarc_main_file in \
  comments.json \
  train-balanced.csv \
  test-balanced.csv \
  test-unbalanced.csv \
  train-unbalanced.csv; do
  # -O pins the output path: an archive left over from an earlier run is
  # overwritten rather than wget saving the new copy under a ".1" suffix.
  if ! wget -O "${sarc_main_dir}/${sarc_main_file}.bz2" \
    "${sarc_main_url}/${sarc_main_file}.bz2"; then
    printf 'error: could not download %s\n' \
      "${sarc_main_url}/${sarc_main_file}.bz2" >&2
    # wget -O creates the output file up front, so remove the partial copy.
    rm -f -- "${sarc_main_dir}/${sarc_main_file}.bz2"
    exit 1
  fi
  # -f lets a re-run replace a file extracted by a previous run; without it
  # bzip2 refuses to overwrite existing output.
  if ! bzip2 -d -f -- "${sarc_main_dir}/${sarc_main_file}.bz2"; then
    printf 'error: could not decompress %s\n' \
      "${sarc_main_dir}/${sarc_main_file}.bz2" >&2
    exit 1
  fi
done
# Fetch the bzip2-compressed amazon_glove1600.txt file, decompress it and move
# the result into ../static/. Stops at the first failed step.
amazon_glove_bz2=amazon_glove1600.txt.bz2
# Make sure the destination exists before anything is moved into it.
mkdir -p ../static || exit 1
# -O pins the output name so a stale archive is overwritten instead of wget
# saving the new download under a ".1" suffix.
if ! wget -O "${amazon_glove_bz2}" \
  "http://nlp.cs.princeton.edu/DisC/${amazon_glove_bz2}"; then
  printf 'error: could not download %s\n' "${amazon_glove_bz2}" >&2
  rm -f -- "${amazon_glove_bz2}"
  exit 1
fi
# -f lets a re-run replace a file extracted by a previous run.
bzip2 -d -f -- "${amazon_glove_bz2}" || exit 1
# Trailing slash: mv must treat ../static as a directory and never rename the
# file to "../static".
mv -- amazon_glove1600.txt ../static/ || exit 1