This repository has been archived by the owner on Nov 11, 2023. It is now read-only.
forked from openeventdata/eldiablo
-
Notifications
You must be signed in to change notification settings - Fork 0
/
bootstrap.sh
69 lines (59 loc) · 1.91 KB
/
bootstrap.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
#!/usr/bin/env bash
#
# Provision a machine for the Phoenix event-data pipeline.
#
# Steps, in order:
#   1. Register the MongoDB apt repository and refresh the package index.
#   2. Install the base system packages.
#   3. Clone the phoenix_pipeline, scraper and stanford_pipeline repositories
#      into the directory the script is started from.
#   4. Install their Python requirements, then PETRARCH.
#   5. Download Stanford CoreNLP and the shift-reduce parser models into
#      /home/vagrant/stanford-corenlp.
#   6. Download the NLTK "punkt" tokenizer data into /usr/lib/nltk_data.
#   7. Install MongoDB.
#   8. Install the crontab found at ~/crontab.txt.
#
# Privileged steps go through sudo, so the invoking user needs sudo rights.

# Stop at the first failing step instead of carrying on with a
# half-provisioned machine.
set -euo pipefail

readonly GITHUB_ORG_URL='https://github.com/openeventdata'
readonly STANFORD_SOFTWARE_URL='http://nlp.stanford.edu/software'
readonly CORENLP_RELEASE='stanford-corenlp-full-2014-06-16'
readonly CORENLP_DIR='/home/vagrant/stanford-corenlp'
readonly SRPARSER_JAR='stanford-srparser-2014-07-01-models.jar'
readonly NLTK_TOKENIZERS_DIR='/usr/lib/nltk_data/tokenizers'
readonly PUNKT_URL='http://www.nltk.org/nltk_data/packages/tokenizers/punkt.zip'

#######################################
# Import the MongoDB signing key, add its apt source and refresh the index.
#######################################
add_mongodb_repo() {
  sudo apt-key adv --keyserver hkp://keyserver.ubuntu.com:80 --recv 7F0CEB10
  # tee runs under sudo like every other privileged step here; a plain tee
  # cannot write below /etc/apt unless the whole script already runs as root.
  echo 'deb http://downloads-distro.mongodb.org/repo/ubuntu-upstart dist 10gen' |
    sudo tee /etc/apt/sources.list.d/mongodb-org-3.0.list
  sudo apt-get update
}

#######################################
# Install the system packages the pipeline needs.
#######################################
install_base_packages() {
  echo "Installing base packages..."
  # -y answers apt's confirmation prompt, so the install does not depend on
  # whatever happens to be on stdin during unattended provisioning.
  sudo apt-get install -y \
    zlib1g-dev git g++ default-jre zip unzip \
    libxml2-dev libxslt1-dev python-dev python-pip
}

#######################################
# Clone the pipeline repositories into the current directory.
#######################################
clone_pipeline_repos() {
  local repo
  echo "Cloning Phoenix pipeline files..."
  for repo in phoenix_pipeline scraper stanford_pipeline; do
    # An existing checkout is kept as-is so a re-run does not abort on
    # git's "destination path already exists" error.
    if [[ -d "${repo}" ]]; then
      continue
    fi
    sudo git clone "${GITHUB_ORG_URL}/${repo}.git"
  done
}

#######################################
# Install the Python requirements of the cloned repositories and PETRARCH.
# Must run from the directory that holds the clones.
#######################################
install_python_deps() {
  local repo
  echo "Installing Python dependencies..."
  for repo in scraper phoenix_pipeline stanford_pipeline; do
    sudo pip install -r "${repo}/requirements.txt"
  done
  echo "Installing PETRARCH..."
  sudo pip install "git+${GITHUB_ORG_URL}/petrarch.git"
}

#######################################
# Download and unpack CoreNLP, then fetch the shift-reduce parser models
# into the CoreNLP directory.
#######################################
install_corenlp() {
  local archive="${HOME}/${CORENLP_RELEASE}.zip"

  echo "Downloading CoreNLP..."
  # Skip when already installed: moving onto an existing directory would
  # nest the release inside it instead of replacing it.
  if [[ ! -d "${CORENLP_DIR}" ]]; then
    sudo wget -O "${archive}" "${STANFORD_SOFTWARE_URL}/${CORENLP_RELEASE}.zip"
    sudo unzip -o "${archive}" -d "${HOME}"
    sudo mv "${HOME}/${CORENLP_RELEASE}" "${CORENLP_DIR}"
  fi

  echo "Downloading shift-reduce parser..."
  sudo wget -O "${CORENLP_DIR}/${SRPARSER_JAR}" \
    "${STANFORD_SOFTWARE_URL}/${SRPARSER_JAR}"
}

#######################################
# Download the NLTK punkt tokenizer data.
#######################################
install_nltk_data() {
  echo "Downloading NLTK data..."
  # Download and unpack directly at the final location. Previously the data
  # was built below the CoreNLP directory and then moved from the home
  # directory, where it did not exist, so it never reached /usr/lib/nltk_data.
  sudo mkdir -p "${NLTK_TOKENIZERS_DIR}"
  sudo wget -O "${NLTK_TOKENIZERS_DIR}/punkt.zip" "${PUNKT_URL}"
  sudo unzip -o "${NLTK_TOKENIZERS_DIR}/punkt.zip" -d "${NLTK_TOKENIZERS_DIR}"
}

#######################################
# Install MongoDB from the repository registered by add_mongodb_repo.
#######################################
install_mongodb() {
  echo "Installing MongoDB..."
  sudo apt-get install -y mongodb-org
}

#######################################
# Install the crontab. crontab.txt is read from the home directory, which is
# where the relative path used to resolve after the script's final `cd`.
#######################################
install_crontab() {
  echo "Setting up crontab..."
  sudo crontab "${HOME}/crontab.txt"
}

main() {
  add_mongodb_repo
  install_base_packages
  clone_pipeline_repos
  install_python_deps
  install_corenlp
  install_nltk_data
  install_mongodb
  install_crontab
}

main "$@"