-
Notifications
You must be signed in to change notification settings - Fork 2
/
Copy pathDockerfile-loader
38 lines (31 loc) · 1.11 KB
/
Dockerfile-loader
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
# Base image: the official python image, tag 3.8-buster.
FROM python:3.8-buster
# Contact information for the image. MAINTAINER is deprecated, so the same
# value is recorded as the standard OCI "authors" label instead.
LABEL org.opencontainers.image.authors="TweetSets <sfm@gwu.edu>"
# Copy only the dependency manifest at this point so the install layers below
# are reused from cache until requirements.txt itself changes.
COPY requirements.txt /opt/tweetsets/
WORKDIR /opt/tweetsets
# Install all Python requirements into the image's interpreter.
# --no-cache-dir keeps pip's download cache out of the image layer.
RUN pip install --no-cache-dir -r requirements.txt
# Install every requirement line that contains "elasticsearch" a second time,
# into the ./dependencies directory (pip's -t/--target), so those packages
# exist as a standalone tree that a later step zips up.
# NOTE(review): presumably the zip is shipped to Spark workers - confirm.
RUN grep elasticsearch requirements.txt | xargs pip install --no-cache-dir -t dependencies
# OS packages: a headless Java 11 runtime, the Java CA certificate store, and
# the zip utility used by a later build step.
# update + install run in one layer so a cached package index is never reused
# with a changed package list; the index is deleted in the same layer so it
# does not add to the image size.
# NOTE(review): --no-install-recommends would shrink this further; confirm the
# JRE does not rely on recommended packages before adding it.
RUN apt-get update && \
    apt-get install -y \
        ca-certificates-java \
        openjdk-11-jre-headless \
        zip && \
    rm -rf /var/lib/apt/lists/*
# Bundle the contents of /opt/tweetsets/dependencies into
# /opt/tweetsets/dependencies.zip. The archive is built from inside the
# directory so its entries are stored relative to it.
WORKDIR /opt/tweetsets/dependencies
RUN zip -r /opt/tweetsets/dependencies.zip .
# Switch back to the application root for the remaining instructions.
WORKDIR /opt/tweetsets
# Application modules, schema/SQL resources and packaging script. These are
# plain local files, so COPY is used, and they are copied in one instruction
# so they share a single layer.
COPY models.py \
     setup.py \
     spark_utils.py \
     tweetset_cli.py \
     tweetset_loader.py \
     tweetsets_schema.json \
     tweetsets_sql_exp.sql \
     utils.py \
     /opt/tweetsets/
# Spark test suite: the contents of tests/spark/ land in /opt/tweetsets/tests.
COPY tests/spark/ /opt/tweetsets/tests
# The same test module is copied again without its leading underscore, so both
# _test_spark_loader.py and test_spark_loader.py exist in the image.
# NOTE(review): presumably the rename lets test discovery pick it up only
# inside the container - confirm.
COPY tests/spark/_test_spark_loader.py /opt/tweetsets/tests/test_spark_loader.py
# Elasticsearch Spark connector, stored under a version-independent file name.
COPY elasticsearch-spark-30_2.12-7.13.4.jar /opt/tweetsets/elasticsearch-hadoop.jar
# Build an egg distribution from setup.py in the current working directory.
RUN python setup.py bdist_egg
# Spark-related settings baked into the container environment. The port
# variables are also reused by EXPOSE below.
# NOTE(review): what reads these variables at runtime is not visible in this
# file - confirm against the loader / Spark configuration.
ENV SPARK_LOCAL_IP=0.0.0.0 \
    SPARK_DRIVER_PORT=5001 \
    SPARK_UI_PORT=5002 \
    SPARK_BLOCKMGR_PORT=5003
# Document the ports above; EXPOSE does not publish them by itself.
EXPOSE $SPARK_DRIVER_PORT $SPARK_UI_PORT $SPARK_BLOCKMGR_PORT
# Default to an interactive shell. Exec form runs bash directly instead of
# wrapping it in "/bin/sh -c".
CMD ["/bin/bash"]