# Base image: jupyter/notebook.
# NOTE(review): no tag or digest is given, so Docker resolves this to ":latest"
# and the build is not reproducible — consider pinning a specific tag/digest.
FROM jupyter/notebook

# Image author metadata. The MAINTAINER instruction is deprecated; a LABEL
# carries the same information and is visible through `docker inspect`.
LABEL org.opencontainers.image.authors="Sawood Alam <ibnesayeed@gmail.com>"

# Install the default Java runtime (used by the Spark distribution unpacked
# into /spark further down).
# --no-install-recommends skips optional packages, and the apt package lists
# are removed in the same layer so they do not persist in the image.
RUN apt-get update \
    && apt-get install -y --no-install-recommends default-jre \
    && rm -rf /var/lib/apt/lists/*

# Download the Spark 1.6.1 (Hadoop 2.6 build) binary distribution and unpack
# it into /spark, dropping the archive's top-level directory.
# - Fetched from archive.apache.org over HTTPS: rotating Apache mirrors only
#   carry current releases, so a mirror URL for an old release stops working.
# - -f makes curl exit non-zero on an HTTP error instead of saving the error
#   page as the tarball.
# - The tarball is deleted in the same layer so it never persists in the image.
# NOTE(review): the download is not checksum-verified; consider checking it
# against the checksum published alongside the release.
RUN curl -fL -O https://archive.apache.org/dist/spark/spark-1.6.1/spark-1.6.1-bin-hadoop2.6.tgz \
    && mkdir /spark \
    && tar -xf spark-1.6.1-bin-hadoop2.6.tgz --strip-components=1 -C /spark \
    && rm spark-1.6.1-bin-hadoop2.6.tgz

# Download the ArchiveSpark kernel archive and unpack it into root's IPython
# kernels directory, then delete the archive in the same layer.
# -f makes curl exit non-zero on an HTTP error instead of saving the server's
# error page as the archive, so a broken download fails at the curl step.
# NOTE(review): fetched over plain HTTP with no checksum verification; switch
# to HTTPS and verify a checksum if the host supports it.
RUN curl -fL -O http://l3s.de/~holzmann/archivespark-kernel.tar.gz \
    && mkdir -p /root/.ipython/kernels \
    && tar -xf archivespark-kernel.tar.gz -C /root/.ipython/kernels \
    && rm archivespark-kernel.tar.gz

# Copy build-context files into the image. COPY is used instead of ADD because
# these are plain local copies; ADD would additionally auto-extract a local tar
# archive, which is not wanted here.
# NOTE(review): assumes cdx and warc are directories (or non-tar files) in the
# build context — confirm none of them relied on ADD's auto-extraction.

# Place this project's kernel spec at the archivespark kernel's kernel.json path.
COPY kernel.json /root/.ipython/kernels/archivespark/kernel.json
# Example notebook, copied into /notebooks/.
COPY example.ipynb /notebooks/
# Data copied to /cdx and /warc.
COPY cdx /cdx
COPY warc /warc

# Default command: start the Jupyter notebook server without trying to open a
# web browser. Exec (JSON-array) form, so no shell wraps the process.
CMD ["jupyter", "notebook", "--no-browser"]