forked from censusreporter/census-api
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathfabfile.py
231 lines (184 loc) · 10.6 KB
/
fabfile.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
from fabric.api import *
from fabric.contrib.files import *
from fabric.context_managers import shell_env, prefix
from fabric.colors import green
# Deployment layout on the remote host. Everything lives under `root_dir`;
# the checkout and the virtualenv are both named after the public hostname.
root_dir = '/home/www-data'
host = 'api.censusreporter.org'
code_dir = '{0}/{1}_app'.format(root_dir, host)
virtualenv_name = '{0}_venv'.format(host)
virtualenv_dir = '/'.join((root_dir, virtualenv_name))
# Substituted into the generated newrelic.ini by install_newrelic().
newrelic_app_name = 'Census Reporter API'
def _download_sql_backups(data_to_load):
    """ Download the SQL backup archives for the requested releases onto the host.

    Every release name is resolved to its backup URL before any remote
    command is issued, so an unrecognized name aborts the task without
    touching the host. The archives are fetched with wget into /mnt/tmp.

    `data_to_load`: A list of releases to import into the database.

    Raises ValueError (an Exception subclass) if a release is unrecognized. """
    possible_data_sources = {
        'tiger2012': 'https://s3.amazonaws.com/census-backup/tiger/2012/tiger2012_backup.sql.gz',
        'acs2012_1yr': 'http://census-backup.s3.amazonaws.com/acs/2012/acs2012_1yr/acs2012_1yr_backup.sql.gz',
        'acs2012_3yr': 'http://census-backup.s3.amazonaws.com/acs/2012/acs2012_3yr/acs2012_3yr_backup.sql.gz',
        'acs2012_5yr': 'http://census-backup.s3.amazonaws.com/acs/2012/acs2012_5yr/acs2012_5yr_backup.sql.gz',
        'acs2011_1yr': 'http://census-backup.s3.amazonaws.com/acs/2011/acs2011_1yr/acs2011_1yr_backup.sql.gz',
        'acs2011_3yr': 'http://census-backup.s3.amazonaws.com/acs/2011/acs2011_3yr/acs2011_3yr_backup.sql.gz',
        'acs2011_5yr': 'http://census-backup.s3.amazonaws.com/acs/2011/acs2011_5yr/acs2011_5yr_backup.sql.gz',
        'acs2010_1yr': 'http://census-backup.s3.amazonaws.com/acs/2010/acs2010_1yr/acs2010_1yr_backup.sql.gz',
        'acs2010_3yr': 'http://census-backup.s3.amazonaws.com/acs/2010/acs2010_3yr/acs2010_3yr_backup.sql.gz',
        'acs2010_5yr': 'http://census-backup.s3.amazonaws.com/acs/2010/acs2010_5yr/acs2010_5yr_backup.sql.gz',
        'acs2009_1yr': 'http://census-backup.s3.amazonaws.com/acs/2009/acs2009_1yr/acs2009_1yr_backup.sql.gz',
        'acs2009_3yr': 'http://census-backup.s3.amazonaws.com/acs/2009/acs2009_3yr/acs2009_3yr_backup.sql.gz',
        'acs2008_1yr': 'http://census-backup.s3.amazonaws.com/acs/2008/acs2008_1yr/acs2008_1yr_backup.sql.gz',
        'acs2008_3yr': 'http://census-backup.s3.amazonaws.com/acs/2008/acs2008_3yr/acs2008_3yr_backup.sql.gz',
        'acs2007_1yr': 'http://census-backup.s3.amazonaws.com/acs/2007/acs2007_1yr/acs2007_1yr_backup.sql.gz',
        'acs2007_3yr': 'http://census-backup.s3.amazonaws.com/acs/2007/acs2007_3yr/acs2007_3yr_backup.sql.gz',
    }

    # Resolve (and validate) every release up front, before touching the host.
    files_to_download = []
    for release in data_to_load:
        url = possible_data_sources.get(release)
        if url is None:
            raise ValueError('The specified data \'%s\' is unrecognized.' % release)
        files_to_download.append(url)

    sudo('mkdir -p /mnt/tmp')
    sudo('chown -R ubuntu /mnt/tmp')

    # Iterate the resolved URLs, not the release names: wget needs the URL.
    for url in files_to_download:
        print(green('Downloading to host: ' + url))
        run('wget --quiet --continue --directory-prefix="/mnt/tmp" ' + url)

    print(green('Done downloading source data!'))
def _install_base():
    """ Refresh apt, upgrade installed packages, and install the base build packages (git included). """
    # Git plus the development headers/toolchain listed for the Python dev setup.
    dev_packages = 'git libpq-dev python-dev libmemcached-dev build-essential libgdal1-dev'

    sudo('apt-get update -q && sudo apt-get upgrade -q -y')
    sudo('apt-get install -q -y ' + dev_packages)
def _mount_ebs():
    """ Install the XFS tools, format /dev/xvdc as XFS, register it in fstab, and mount it at /vol. """
    device = '/dev/xvdc'
    mount_point = '/vol'

    sudo('apt-get install -q -y xfsprogs')
    # warn_only: a failing mkfs does not abort the task
    # (presumably so re-runs against an already formatted volume continue).
    sudo('mkfs.xfs %s' % device, warn_only=True)
    append('/etc/fstab', '%s %s xfs noatime 0 0' % (device, mount_point), use_sudo=True)
    sudo('mkdir -p -m 000 %s' % mount_point)
    # warn_only: likewise tolerate a failing mount.
    sudo('mount %s' % mount_point, warn_only=True)
def _install_postgres():
    """ Install PostgreSQL 9.3 with PostGIS 2.1, relocate its data directory to /vol, and create the `census` role and database. """
    pg_service = '/etc/init.d/postgresql'
    pgpass_file = '/home/ubuntu/.pgpass'

    sudo('apt-get install -q -y postgresql-9.3 postgresql-9.3-postgis-2.1')

    # The server must be stopped while its data directory is moved.
    sudo(pg_service + ' stop')
    sudo('mkdir -p /vol/postgresql')
    if not exists('/vol/postgresql/9.3'):
        sudo('mv /var/lib/postgresql/9.3 /vol/postgresql/')
    sudo('chown -R postgres:postgres /vol/postgresql')
    # Point postgresql.conf at the relocated data directory. A raw literal
    # keeps the sed `\/` escapes verbatim without Python escape processing.
    sudo(r'''sed -i "s/data_directory = '\/var\/lib\/postgresql\/9.3\/main'/data_directory = '\/vol\/postgresql\/9.3\/main'/" /etc/postgresql/9.3/main/postgresql.conf''')
    sudo(pg_service + ' start')

    # Create the PostgreSQL `census` user and database; warn_only lets the
    # task continue when either statement fails.
    sudo("psql -c \"CREATE ROLE census WITH NOSUPERUSER LOGIN UNENCRYPTED PASSWORD 'censuspassword';\"", user='postgres', warn_only=True)
    sudo('psql -c "CREATE DATABASE census WITH OWNER census;"', user='postgres', warn_only=True)

    # Make PostgreSQL login password-less for the ubuntu user.
    if not exists(pgpass_file):
        append(pgpass_file, 'localhost:5432:census:census:censuspassword')
        run('chmod 0600 %s' % pgpass_file)
def _install_libgdal():
    """ Install libgdal1-dev from the ubuntugis-unstable PPA. """
    # The package shipped with base Ubuntu doesn't appear to be new enough
    # any more, so the PPA is added before installing.
    gdal_setup_commands = (
        'apt-add-repository -y ppa:ubuntugis/ubuntugis-unstable',
        'apt-get -q update',
        'apt-get -q -y install libgdal1-dev',
    )
    for command in gdal_setup_commands:
        sudo(command)
def _install_elasticsearch():
    """ Install ElasticSearch 2.1.0 from its .deb, store its data under /vol/elasticsearch, and restart it. """
    version = '2.1.0'
    deb_file = 'elasticsearch-%s.deb' % version
    deb_url = 'https://download.elasticsearch.org/elasticsearch/release/org/elasticsearch/distribution/deb/elasticsearch/%s/%s' % (version, deb_file)
    data_dir = '/vol/elasticsearch'

    # A headless Java runtime is installed ahead of the ElasticSearch package.
    sudo('apt-get install -q -y openjdk-7-jre-headless')
    run('wget --quiet --continue ' + deb_url)
    sudo('dpkg -i ' + deb_file)

    # Keep the index data under /vol rather than the package default.
    sudo('mkdir -p ' + data_dir)
    sudo('chown elasticsearch:elasticsearch ' + data_dir)
    append('/etc/elasticsearch/elasticsearch.yml', 'path.data: ' + data_dir, use_sudo=True)
    sudo('service elasticsearch restart')
def _install_memcached():
    """ Install memcached, rewrite its `-m 64` setting, and restart it. """
    # Replaces the `-m 64` line of memcached.conf with `-m 1024 -I 10485760`.
    tune_config = 'sed -i "s/^-m 64$/-m 1024 -I 10485760/g" /etc/memcached.conf'

    sudo('apt-get install -q -y memcached')
    sudo(tune_config)
    sudo('service memcached restart')
def _install_apache():
    """ Install apache with mod_wsgi and enable the wsgi module. """
    apache_packages = 'apache2 libapache2-mod-wsgi'
    sudo('apt-get install -q -y ' + apache_packages)
    # warn_only: a failing a2enmod does not abort the task.
    sudo('a2enmod wsgi', warn_only=True)
def _install_nginx():
    """ Install the nginx package. """
    install_command = 'apt-get install -q -y nginx'
    sudo(install_command)
def install_newrelic(api_key):
    """ Generate newrelic.ini in the code directory for the given API key and set the application name in it.

    `api_key`: The New Relic license key handed to `newrelic-admin generate-config`. """
    config_file = '%s/newrelic.ini' % code_dir
    activate_venv = 'source %s/bin/activate' % virtualenv_dir

    with cd(code_dir), prefix(activate_venv):
        sudo('newrelic-admin generate-config %s %s' % (api_key, config_file), user='www-data')
        # Swap the placeholder application name for ours.
        sudo('sed -i "s/Python Application/%s/g" %s' % (newrelic_app_name, config_file), user='www-data')
def install_packages():
    """ Run each OS package installation step needed by the API, in order. """
    install_steps = (
        _install_base,
        # _mount_ebs,
        # _install_postgres,
        _install_libgdal,
        _install_elasticsearch,
        _install_memcached,
        _install_nginx,
    )
    for step in install_steps:
        step()
def flushcache():
    """ Flush the memcache by restarting the memcached service. """
    restart_command = 'service memcached restart'
    sudo(restart_command)
def initial_config():
    """ Set up the remote host to serve the Census Reporter API.

    Creates the www-data home, a virtualenv with gunicorn, the upstart job
    and nginx site (both rendered from the templates under ./server), clones
    the code if it is not already checked out, then starts gunicorn and
    restarts nginx. """
    app_user = 'www-data'
    pth_file = '%s/lib/python2.7/site-packages/censusreporter.pth' % virtualenv_dir
    upstart_conf = '/etc/init/%s.conf' % host
    nginx_available = '/etc/nginx/sites-available/%s' % host

    sudo('mkdir -p %s' % root_dir)
    sudo('chown www-data:www-data %s' % root_dir)

    # Install up to virtualenv
    sudo('apt-get install -q -y python-setuptools')
    sudo('easy_install pip')
    sudo('pip install virtualenv')

    # Create the virtualenv and put the app checkout on its path via a .pth file
    sudo('virtualenv --no-site-packages %s' % virtualenv_dir, user=app_user)
    sudo('rm -f %s' % pth_file, user=app_user)
    append(pth_file, code_dir, use_sudo=True)
    sudo('chown www-data:www-data %s' % pth_file)

    # Install gunicorn inside the virtualenv
    with prefix('source %s/bin/activate' % virtualenv_dir):
        sudo('pip install gunicorn futures', user=app_user)

    # Replace any previous upstart job with a freshly rendered one
    sudo('rm -f %s' % upstart_conf)
    upstart_context = {
        'domainname': host,
        'project_path': code_dir,
        'virtualenv_dir': virtualenv_dir,
    }
    upload_template('./server/upstart.conf.template', upstart_conf, use_sudo=True, context=upstart_context)

    # Configure nginx to proxy requests to gunicorn
    sudo('rm -f /etc/nginx/sites-enabled/default')
    sudo('rm -f /etc/nginx/sites-enabled/%s' % host)
    sudo('rm -f %s' % nginx_available)
    nginx_context = {
        'domainname': host,
        'project_path': code_dir,
    }
    upload_template('./server/nginx.site.template', nginx_available, use_sudo=True, context=nginx_context)
    sudo('ln -s %s /etc/nginx/sites-enabled' % nginx_available)

    # Clone the code only when the checkout directory is missing; warn_only
    # keeps the failing `test -d` probe from aborting the task.
    with settings(warn_only=True):
        checkout_probe = sudo('test -d %s' % code_dir, user=app_user)
        if checkout_probe.failed:
            sudo('git clone git://github.com/censusreporter/census-api.git %s' % code_dir, user=app_user)

    # Start gunicorn
    sudo('start %s' % host)

    # Restart nginx
    sudo('service nginx restart')
def deploy(branch='master'):
    """ Pull the given Census Reporter API branch on the remote host, install its requirements, and restart gunicorn.

    `branch`: The git branch pulled from `origin` (defaults to master). """
    app_user = 'www-data'
    activate_venv = 'source %s/bin/activate' % virtualenv_dir
    gdal_include = '/usr/include/gdal'

    with cd(code_dir):
        # Remove compiled bytecode before pulling the new code.
        sudo("find . -name '*.pyc' -delete", user=app_user)
        sudo('git pull origin %s' % branch, user=app_user)

        # Install pip requirements with the GDAL include directory exported
        # to the C and C++ include paths.
        with prefix(activate_venv), shell_env(CPLUS_INCLUDE_PATH=gdal_include, C_INCLUDE_PATH=gdal_include):
            sudo('pip --quiet --no-cache-dir install -r requirements.txt', user=app_user)

    # Restart gunicorn
    sudo('restart %s' % host)
def load_elasticsearch_data(releases=['acs2012_1yr', 'acs2012_3yr', 'acs2012_5yr'], delete_first=False):
    """ Loads search data into our ElasticSearch index.

    `releases`: The releases whose precomputed column and table metadata are
    bulk-inserted. A list, or a single string of release names separated by
    semicolons or whitespace (the form usable from the fab command line).
    The default list is only read, never mutated.

    `delete_first`: When true, delete the existing `census` index before
    loading. Also accepts the strings fab passes from the command line;
    only '1', 'true', 'yes', 'y' and 'on' (any case) count as true. """
    # Fabric hands command-line task arguments over as plain strings. Without
    # coercion 'False' would be truthy (and wipe the index) and a release
    # string would be iterated one character at a time.
    if isinstance(releases, str):
        releases = releases.replace(';', ' ').split()
    if isinstance(delete_first, str):
        delete_first = delete_first.strip().lower() in ('1', 'true', 'yes', 'y', 'on')

    # The table index data lives in our census-table-metadata repo
    if not exists('/home/ubuntu/census-table-metadata'):
        with cd('/home/ubuntu'):
            run('git clone https://github.com/censusreporter/census-table-metadata.git')

    if delete_first:
        # Delete any existing data
        run("curl -XDELETE 'http://localhost:9200/census/'")

    # Bulk-insert the data
    with cd('/home/ubuntu/census-table-metadata'):
        for release in releases:
            run("curl -S --output /dev/null -XPOST 'http://localhost:9200/_bulk' --data-binary @precomputed/%s/census_column_metadata.txt" % release)
            run("curl -S --output /dev/null -XPOST 'http://localhost:9200/_bulk' --data-binary @precomputed/%s/census_table_metadata.txt" % release)
def load_postgresql_data(releases=['acs2012_1yr', 'acs2012_3yr', 'acs2012_5yr', 'tiger2012'], delete_first=False):
    """ Loads the unified tabulation metadata CSV into the `census` PostgreSQL database.

    `releases` and `delete_first` are accepted but not used yet: only the
    tabulation metadata is loaded for now, as the closing message says. """
    metadata_csv = '/home/ubuntu/census-table-metadata/precomputed/unified_metadata.csv'
    copy_statement = "COPY public.census_tabulation_metadata FROM '%s' WITH csv ENCODING 'utf8' HEADER;" % metadata_csv

    sudo('psql -d census -c "%s"' % copy_statement, user='postgres')
    print("THIS IS INCOMPLETE. I'm only loading a tabulation metadata for now.")