2019-01-26 17:30:00 -05:00
|
|
|
# Base image: Node.js 11, "slim" variant. Later steps rely on it providing
# apt-get (OS packages) and npm (puppeteer).
FROM node:11-slim
|
2018-12-31 20:53:01 -05:00
|
|
|
# Image metadata: maintainer contact.
LABEL maintainer="Nick Sweeting <archivebox-git@sweeting.me>"
|
2018-10-13 22:47:30 -04:00
|
|
|
|
|
|
|
# Base tooling: download clients (curl, wget, youtube-dl), git, Python 3 with
# pip, gnupg2 (apt-key is used by the Chrome step further down) and
# libgconf-2-4 (presumably a Chrome runtime dependency -- TODO confirm).
# The apt package index is deleted in the same layer so it never lands in the image.
RUN apt-get update \
    && apt-get install -y -q --no-install-recommends \
        curl \
        git \
        gnupg2 \
        libgconf-2-4 \
        python3 \
        python3-pip \
        wget \
        youtube-dl \
    && rm -rf /var/lib/apt/lists/*
|
|
|
|
|
|
|
|
# Install Google Chrome (google-chrome-unstable) from Google's apt repository,
# plus fonts to support major charsets (Chinese, Japanese, Arabic, Hebrew, Thai
# and a few others).
#
# The repository signing key is downloaded to a file and then passed to apt-key,
# rather than piped into it: under the default /bin/sh a pipeline only reports
# the exit status of its last command, so a failed download could go unnoticed.
# The repo line keeps plain http, as in the original configuration.
RUN apt-get update \
    && apt-get install -y --no-install-recommends wget \
    && wget -q -O /tmp/linux_signing_key.pub https://dl-ssl.google.com/linux/linux_signing_key.pub \
    && apt-key add /tmp/linux_signing_key.pub \
    && rm -f /tmp/linux_signing_key.pub \
    && echo "deb [arch=amd64] http://dl.google.com/linux/chrome/deb/ stable main" >> /etc/apt/sources.list.d/google.list \
    && apt-get update \
    && apt-get install -y --no-install-recommends \
        fonts-ipafont-gothic \
        fonts-kacst \
        fonts-thai-tlwg \
        fonts-wqy-zenhei \
        google-chrome-unstable \
        ttf-freefont \
    && rm -rf /var/lib/apt/lists/* \
    && rm -rf /src/*.deb
|
2018-10-13 22:47:30 -04:00
|
|
|
|
2019-01-23 01:06:47 -05:00
|
|
|
# It's a good idea to use dumb-init (see ENTRYPOINT) to help prevent zombie
# chrome processes.
#
# The binary is fetched and made executable in a single RUN: a separate chmod
# instruction would add a second layer containing another copy of the file.
# wget is available from the base package install earlier in this file.
# NOTE(review): the download is not integrity-checked; consider verifying it
# against the sha256sums file published with the v1.2.0 release.
RUN wget -q -O /usr/local/bin/dumb-init https://github.com/Yelp/dumb-init/releases/download/v1.2.0/dumb-init_1.2.0_amd64 \
    && chmod +x /usr/local/bin/dumb-init
|
2018-10-13 22:47:30 -04:00
|
|
|
|
2019-01-23 01:06:47 -05:00
|
|
|
# Puppeteer is installed with npm so that it is available in the container.
# No WORKDIR is set at this point; assuming the base image's working directory
# is /, the package ends up in /node_modules (the path chown'd further down).
RUN npm install puppeteer
|
2018-10-13 22:47:30 -04:00
|
|
|
|
2019-01-23 01:06:47 -05:00
|
|
|
# Create the unprivileged system user "pptruser" (member of audio and video)
# so we don't need --no-sandbox, give it a home directory with a Downloads
# folder, and hand it ownership of its home and of /node_modules.
RUN groupadd --system pptruser \
    && useradd --system --gid pptruser --groups audio,video pptruser \
    && mkdir --parents /home/pptruser/Downloads \
    && chown --recursive pptruser:pptruser /home/pptruser /node_modules
|
|
|
|
|
|
|
|
# Install the ArchiveBox repository and wire it into the image:
#   - /data is created and owned by pptruser
#   - archivebox/output inside the checkout is a symlink to /data
#   - /bin/archive is a symlink to the checkout's bin/archivebox
#   - the archivebox/ directory of the checkout is owned by pptruser
# Installing the pip requirements is currently disabled:
#   && pip3 install -r /home/pptruser/app/archivebox/requirements.txt
RUN mkdir --parents /data \
    && chown --recursive pptruser:pptruser /data \
    && git clone https://github.com/pirate/ArchiveBox /home/pptruser/app \
    && ln --symbolic /data /home/pptruser/app/archivebox/output \
    && ln --symbolic /home/pptruser/app/bin/archivebox /bin/archive \
    && chown --recursive pptruser:pptruser /home/pptruser/app/archivebox
|
2018-10-13 22:47:30 -04:00
|
|
|
|
2019-01-16 08:05:01 -05:00
|
|
|
# Declared after /data has been created and chown'd, so that setup is kept.
VOLUME ["/data"]
|
2018-10-13 22:47:30 -04:00
|
|
|
|
2019-01-23 01:06:47 -05:00
|
|
|
# Runtime environment:
#   - UTF-8 locale settings and Python I/O encoding
#   - Chrome binary name, sandbox flag and output directory
#     (presumably read by ArchiveBox at runtime -- confirm against its config)
ENV LANG=C.UTF-8 \
    LC_ALL=C.UTF-8 \
    LANGUAGE=en_US:en \
    PYTHONIOENCODING=UTF-8 \
    CHROME_BINARY=google-chrome-unstable \
    CHROME_SANDBOX=False \
    OUTPUT_DIR=/data
|
2018-10-13 22:47:30 -04:00
|
|
|
|
|
|
|
# Start in the ArchiveBox checkout.
WORKDIR /home/pptruser/app

# Run everything from here on out as the non-privileged user.
USER pptruser

# dumb-init is the container's entrypoint and launches the command given to it;
# the default command is the /bin/archive symlink created during the build.
ENTRYPOINT ["dumb-init", "--"]
CMD ["/bin/archive"]
|