forked from nielsborie/machine-learning-environments
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Dockerfile
119 lines (103 loc) · 3.03 KB
/
Dockerfile
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
# Copyright (c) Niels Borie.
# Base image: the Jupyter TensorFlow notebook stack, pinned to a specific image tag.
FROM jupyter/tensorflow-notebook:5811dcb711ba
LABEL maintainer="Niels BORIE"
# Switch to root: the apt-get / add-apt-repository / update-alternatives steps
# below modify system locations.
# NOTE(review): no later USER instruction appears in this file, so the image's
# default user stays root — confirm that this is intended.
USER root
# --- System packages: htop, the Boost development libraries, Tk support for
# --- Python, and software-properties-common.
# The apt package index is refreshed and removed again inside this one layer.
RUN apt-get update \
 && apt-get install --yes --no-install-recommends \
        htop \
        libboost-all-dev \
        python-tk \
        software-properties-common \
 && apt-get clean \
 && rm -rf /var/lib/apt/lists/*
# --- Install gcc-7 / g++-7 from the ubuntu-toolchain-r/test PPA and register
# --- them as the default `gcc` / `g++` through update-alternatives.
# Registering the PPA, refreshing the index, installing and cleaning up all
# happen in a single RUN: the install never runs against a stale cached index
# from an earlier layer, and no layer keeps apt index files behind.
# gcc-7 is registered with priority 60; g++ is attached as a slave link so it
# always follows whichever gcc alternative is selected.
RUN add-apt-repository -y ppa:ubuntu-toolchain-r/test && \
    apt-get update && \
    apt-get install -y --no-install-recommends gcc-7 g++-7 && \
    update-alternatives --install /usr/bin/gcc gcc /usr/bin/gcc-7 60 \
        --slave /usr/bin/g++ g++ /usr/bin/g++-7 && \
    apt-get clean && \
    rm -rf /var/lib/apt/lists/*
# --- Install OpenJDK 8 (JDK) and ant
# Both packages are installed by one apt-get call, and the apt package index is
# removed in the same layer so it does not stay in the image.
# Recommended packages are deliberately still installed so that the resulting
# package set stays the same as before.
RUN apt-get update && \
    apt-get install -y openjdk-8-jdk ant && \
    apt-get clean && \
    rm -rf /var/lib/apt/lists/*
# --- Fix Java certificate issues
# `-y` is required: the build has no terminal, so an unanswered confirmation
# prompt from apt-get would abort the install.
# The apt package index is removed in the same layer that downloaded it.
RUN apt-get update && \
    apt-get install -y ca-certificates-java && \
    apt-get clean && \
    rm -rf /var/lib/apt/lists/* && \
    update-ca-certificates -f
# --- Set JAVA_HOME (useful for the docker command line)
# ENV already makes the variable available to every later build step and to
# the running container. The former `RUN export JAVA_HOME` only affected its
# own short-lived shell and produced an empty layer, so it has been dropped.
ENV JAVA_HOME=/usr/lib/jvm/java-8-openjdk-amd64/
# --- Install h2o
# The extra find-links page is fetched over HTTPS rather than plain HTTP, so
# the package index used for the install cannot be tampered with in transit.
# --no-cache-dir keeps pip's download cache out of this image layer.
RUN $CONDA_DIR/bin/python -m pip install --no-cache-dir \
        -f https://h2o-release.s3.amazonaws.com/h2o/latest_stable_Py.html \
        h2o
# --- Conda packages: boost, lightgbm, xgboost, catboost, gensim, mlxtend, tabulate.
# After the install, conda's caches are cleaned and fix-permissions is run on
# the conda directory and on the notebook user's home directory.
RUN conda install --yes --quiet \
        'boost' \
        'lightgbm' \
        'xgboost' \
        'catboost' \
        'gensim' \
        'mlxtend' \
        'tabulate' \
 && conda clean -tipsy \
 && fix-permissions $CONDA_DIR \
 && fix-permissions /home/$NB_USER
# --- Pip packages: vowpalwabbit, hyperopt, tpot, sklearn-deap, yellowbrick,
# --- spacy, gplearn, kmapper, skope-rules, shap, lime (plus deap, update_checker,
# --- tqdm, stopit, scikit-mdr and skrebate).
# --no-cache-dir keeps pip's download/wheel cache out of this layer; deleting
# the cache in a later RUN would not make this layer any smaller.
RUN $CONDA_DIR/bin/python -m pip install --no-cache-dir \
        vowpalwabbit \
        hyperopt \
        deap \
        update_checker \
        tqdm \
        stopit \
        scikit-mdr \
        skrebate \
        tpot \
        sklearn-deap \
        yellowbrick \
        spacy \
        gplearn \
        kmapper \
        skope-rules \
        shap \
        lime
###########
#
# Add some useful libraries, inspired by Kaggle's Dockerfile
# CREDITS : https://hub.docker.com/r/kaggle/python/dockerfile
#
###########
#RUN $CONDA_DIR/bin/python -m pip install --upgrade mpld3
# Extra pip packages, some of them installed straight from their git repositories.
# --no-cache-dir keeps pip's download/wheel cache out of this layer; deleting
# the cache in a later RUN would not make this layer any smaller.
# NOTE(review): the git+https requirements are not pinned to a tag or commit,
# so each rebuild installs whatever the repositories' default branches contain
# at that moment — consider pinning.
RUN $CONDA_DIR/bin/python -m pip install --no-cache-dir \
        mplleaflet \
        gpxpy \
        arrow \
        sexmachine \
        Geohash \
        haversine \
        toolz cytoolz \
        sacred \
        plotly \
        git+https://github.com/nicta/dora.git \
        git+https://github.com/hyperopt/hyperopt.git \
        # tflearn: deep learning library featuring a higher-level API for TensorFlow. http://tflearn.org
        git+https://github.com/tflearn/tflearn.git \
        fitter \
        langid \
        # Delorean: useful for dealing with datetimes
        delorean \
        trueskill \
        heamy \
        vida \
        # Useful data exploration libraries (for missing data and generating reports)
        missingno \
        pandas-profiling \
        s2sphere
###########
#
# Issue #1
# pandas.read_hdf
#
###########
# Upgrade `tables`; --no-cache-dir keeps pip's cache out of this layer.
RUN $CONDA_DIR/bin/python -m pip install --no-cache-dir --upgrade tables
# Remove any pip cache left under root's home by earlier install steps.
# This clears the files from the final filesystem, but it cannot shrink layers
# that were already written with the cache inside them.
RUN rm -rf /root/.cache/pip/*