# Dockerfile
# Based on the Dockerfiles from the Jupyter Development Team which
# are Copyright (c) Jupyter Development Team and distributed under
# the terms of the Modified BSD License.
# Base image selection. ARGs declared ahead of FROM are only usable in the
# FROM line; either one can be overridden with --build-arg.
ARG OWNER=jupyter
ARG BASE_CONTAINER=${OWNER}/pyspark-notebook
# NOTE(review): no tag is given, so the default base resolves to :latest and
# builds are not reproducible -- consider pinning a tag or digest.
FROM ${BASE_CONTAINER}

# NOTE(review): the address inside the angle brackets looks like an
# e-mail-obfuscation placeholder rather than a real address -- confirm.
LABEL maintainer="Paul Deitel <[email protected]>"

# Run every following RUN instruction under bash with pipefail enabled, so a
# failure anywhere in a pipeline fails the build.
# Fix: https://github.com/hadolint/hadolint/wiki/DL4006
# Fix: https://github.com/koalaman/shellcheck/wiki/SC3014
SHELL ["/bin/bash", "-o", "pipefail", "-c"]
# Install the conda-packaged libraries, one package per line in
# alphabetical order.
# The package cache is cleaned and permissions are fixed in this same RUN:
# files deleted by a later instruction still occupy space in the layer that
# created them, so cleanup only shrinks the image when it shares the layer.
# NOTE(review): versions are unpinned, so rebuilds may pick up different
# releases -- pin them if reproducibility matters.
RUN mamba install --yes \
    'dnspython' \
    'folium' \
    'geopy' \
    'imageio' \
    'nltk' \
    'pymongo' \
    'scikit-learn' \
    'spacy' \
    'tweepy' && \
    mamba clean --all -f -y && \
    fix-permissions "${CONDA_DIR}" && \
    fix-permissions "/home/${NB_USER}"
# Install the libraries that are taken from PyPI via pip, one package per
# line in alphabetical order.
# --no-cache-dir keeps pip's download/wheel cache out of the image layer
# (hadolint DL3042); --upgrade is kept so packages already present in the
# base image are brought up to the newest release.
# NOTE(review): versions are unpinned (hadolint DL3013), so rebuilds may
# pick up different releases -- pin them if reproducibility matters.
RUN pip install --no-cache-dir --upgrade \
    'beautifulsoup4' \
    'better_profanity' \
    'deepl' \
    'dweepy' \
    'ibm-watson' \
    'mastodon.py' \
    'openai' \
    'pubnub' \
    'sounddevice' \
    'tensorflow' \
    'textblob' \
    'tweet-preprocessor' \
    'wordcloud'
# Fetch the data the NLP libraries need at runtime: the TextBlob corpora,
# then the small, medium and large English spaCy models. The steps are
# chained with && so the build stops at the first failed download.
RUN python -m textblob.download_corpora \
    && python -m spacy download en_core_web_sm \
    && python -m spacy download en_core_web_md \
    && python -m spacy download en_core_web_lg
# Final tidy-up: empty the conda/mamba caches without prompting, then run
# fix-permissions on the conda directory and the notebook user's home.
# NOTE(review): because this runs as its own layer it cannot reclaim space
# already committed by earlier layers.
RUN mamba clean --all --force-pkgs-dirs --yes \
    && fix-permissions "${CONDA_DIR}" \
    && fix-permissions "/home/${NB_USER}"