Skip to content
Prev Previous commit
Next Next commit
fix(twint): thinner base and use fixed twint fork
  • Loading branch information
lmeyerov committed Sep 5, 2022
commit b15ae2b4fbd129af2f13bbec59bf8053a3bbd5a7
9 changes: 5 additions & 4 deletions infra/pipelines/docker/Dockerfile
Original file line number Diff line number Diff line change
@@ -1,18 +1,19 @@
FROM graphistry/graphistry-blazing:v2.29.3
#FROM graphistry/graphistry-blazing:v2.29.3

FROM python:3.8

# Install supervisor: the image's entrypoint script starts supervisord in the
# foreground. The apt package lists are deleted in this same layer so they do
# not add to the image size.
RUN set -e; \
    export DEBIAN_FRONTEND=noninteractive; \
    apt-get update; \
    apt-get install --yes --no-install-recommends supervisor; \
    apt-get clean; \
    rm -rf /var/lib/apt/lists/*

RUN source activate rapids \
&& pip install prefect==0.10.1 simplejson twarc neo4j boto3==1.12.39 \
RUN pip install prefect==0.10.1 simplejson twarc neo4j boto3==1.12.39 \
&& ( prefect agent install local > supervisord.conf )

COPY . .

# TODO: find a cleaner way to keep Prefect from talking to the cloud server
# (for now the backend is switched to "server" at build time).
RUN source activate rapids && prefect backend server
RUN prefect backend server

CMD ["./infra/pipelines/docker/entrypoint.sh"]
4 changes: 2 additions & 2 deletions infra/pipelines/docker/datastream-Dockerfile
Original file line number Diff line number Diff line change
@@ -1,4 +1,4 @@
FROM python:3.7
FROM python:3.8
RUN apt-get update \
&& apt-get install -y --no-install-recommends git vim tor \
&& apt-get clean \
Expand All @@ -8,7 +8,7 @@ RUN pip install prefect==0.10.1 simplejson twarc neo4j boto3==1.12.39 \
pandas pyarrow urlextract git+https://github.com/homm/yurl.git@1943161973aeb3b3cf2e1e9de6671673b8356161

#RUN echo "ok6" && pip install git+https://github.com/TheDataRideAlongs/twint.git
RUN pip install git+https://github.com/twintproject/twint.git
# Install twint from the graphistry fork. --no-cache-dir keeps pip's download
# cache out of the image layer.
RUN pip install --no-cache-dir git+https://github.com/graphistry/twint.git
#git+https://github.com/lmeyerov/twint.git@patch-1#egg=twint
#RUN pip install git+https://github.com/himanshudabas/twint.git@twint-fixes#egg=twint

Expand Down
2 changes: 1 addition & 1 deletion infra/pipelines/docker/entrypoint.sh
Original file line number Diff line number Diff line change
@@ -1,4 +1,4 @@
#!/bin/bash

echo "Starting prefect executor daemon in foreground"
source activate rapids && supervisord --nodaemon
# exec replaces this shell with supervisord, so when this script is the
# container's command supervisord becomes the main process and receives
# stop signals (e.g. from `docker stop`) directly.
exec supervisord --nodaemon
4 changes: 2 additions & 2 deletions infra/pipelines/docker/nonrapids-Dockerfile
Original file line number Diff line number Diff line change
@@ -1,12 +1,12 @@
FROM python:3.7
FROM python:3.8
# Install supervisor (a supervisord.conf is generated further down by
# `prefect agent install local`). Package lists are removed in the same layer
# to keep the image small.
RUN apt-get update && \
    apt-get install --yes --no-install-recommends \
        supervisor && \
    apt-get clean && \
    rm -rf /var/lib/apt/lists/*

COPY . .
RUN pip install prefect==0.10.1 simplejson twarc neo4j boto3==1.12.39 \
pandas git+https://github.com/twintproject/twint.git@origin/master#egg=twint \
pandas git+https://github.com/graphistry/twint.git@origin/master#egg=twint \
&& ( prefect agent install local > supervisord.conf )
RUN prefect backend server
RUN ["chmod","+x","./infra/pipelines/docker/nonrapids-entrypoint.sh"]
Expand Down