forked from rapidsai/cudf
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Dockerfile
64 lines (58 loc) · 2.18 KB
/
Dockerfile
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
# An integration test & dev container which builds and installs libgdf & pygdf from master
ARG CUDA_VERSION=9.2
ARG LINUX_VERSION=ubuntu16.04
FROM nvidia/cuda:${CUDA_VERSION}-devel-${LINUX_VERSION}
ENV LD_LIBRARY_PATH=$LD_LIBRARY_PATH:/usr/local/cuda/lib64:/usr/local/lib
# Needed for pygdf.concat(), avoids "OSError: library nvvm not found"
ENV NUMBAPRO_NVVM=/usr/local/cuda/nvvm/lib64/libnvvm.so
ENV NUMBAPRO_LIBDEVICE=/usr/local/cuda/nvvm/libdevice/
ARG CC=5
ARG CXX=5
RUN apt update -y --fix-missing && \
apt upgrade -y && \
apt install -y \
git \
gcc-${CC} \
g++-${CXX} \
libboost-all-dev
# Install conda
ADD https://repo.continuum.io/miniconda/Miniconda3-latest-Linux-x86_64.sh /miniconda.sh
RUN sh /miniconda.sh -b -p /conda && /conda/bin/conda update -n base conda
ENV PATH=${PATH}:/conda/bin
# Enables "source activate conda"
SHELL ["/bin/bash", "-c"]
# Build combined libgdf/pygdf conda env
ARG PYTHON_VERSION=3.6
RUN conda create -n gdf python=${PYTHON_VERSION}
ARG NUMBA_VERSION=0.40.0
ARG NUMPY_VERSION=1.14.3
# Locked to Pandas 0.20.3 by https://github.com/gpuopenanalytics/pygdf/issues/118
ARG PANDAS_VERSION=0.20.3
ARG PYARROW_VERSION=0.10.0
RUN conda install -n gdf -y -c numba -c conda-forge -c defaults \
numba=${NUMBA_VERSION} \
numpy=${NUMPY_VERSION} \
pandas=${PANDAS_VERSION} \
pyarrow=${PYARROW_VERSION} \
cmake
# LibGDF build/install
ARG LIBGDF_REPO=https://github.com/gpuopenanalytics/libgdf
RUN git clone --recurse-submodules ${LIBGDF_REPO} /libgdf
ENV CC=/usr/bin/gcc-${CC}
ENV CXX=/usr/bin/g++-${CXX}
ARG HASH_JOIN=ON
RUN source activate gdf && \
mkdir -p /libgdf/build && \
cd /libgdf/build && \
cmake .. -DHASH_JOIN=${HASH_JOIN} && \
make -j install && \
make copy_python && \
python setup.py install
# PyGDF build/install
ARG PYGDF_REPO=https://github.com/gpuopenanalytics/pygdf
# To build container against https://github.com/gpuopenanalytics/pygdf/pull/138:
# docker build --build-arg PYGDF_REPO="https://github.com/dantegd/pygdf -b enh-ext-unique-value-counts" -t gdf .
RUN git clone --recurse-submodules ${PYGDF_REPO} /pygdf
RUN source activate gdf && \
cd /pygdf && \
python setup.py install