forked from unitedstates/congress
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Dockerfile
51 lines (44 loc) · 1.47 KB
/
Dockerfile
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
# Dockerization of Congress:
#
# This Docker image will create a minimal environment to run the Congress
# scrapers in. This provides isolation from the host, and allows testing
# in an environment that's as close to production as you can.
#
#
# You can build this image by running:
#
# docker build --rm -t unitedstates/congress .
#
#
# Running the scraper should be as easy as:
#
# export CONGRESS_OUTPUT_DIR=/tmp/congres
#
# docker run \
# -t --rm \
# -v ${CONGRESS_OUTPUT_DIR}:/congress \
# unitedstates/congress \
# ...
#
#
# Where [...] is something like `bills`, or any other arguments to the
# `run` script.
#
# The data produced by the scrape will end up at ${CONGRESS_OUTPUT_DIR}
# on the host. This path may be any path on the host.
#
# One good pattern is to write this out to the /srv/ tree, for example,
# /srv/pault.ag/congress/ or /srv/io.unitedstates/congress/
FROM debian:jessie
MAINTAINER Paul R. Tagliamonte <paultag@sunlightfoundation.com>
RUN apt-get update && apt-get install -y \
git python3-dev libxml2-dev libxslt1-dev libz-dev python3-pip wget
RUN mkdir -p /opt/theunitedstates.io/
ADD . /opt/theunitedstates.io/congress/
WORKDIR /opt/theunitedstates.io/congress/
RUN pip install -r requirements.txt
RUN echo "/opt/theunitedstates.io/congress/" > /usr/lib/python3.6/dist-packages/congress.pth
RUN mkdir -p /congress
WORKDIR /congress
CMD []
ENTRYPOINT ["/opt/theunitedstates.io/congress/run"]