1
0
Fork 0
mirror of synced 2024-06-27 18:40:52 +12:00

working docker-compose with google chrome

This commit is contained in:
Nick Sweeting 2019-01-23 01:06:47 -05:00
parent 2c375eab49
commit e1be96e597
3 changed files with 33 additions and 27 deletions

View file

@ -1,47 +1,56 @@
FROM debian:stretch FROM node:8-slim
LABEL maintainer="Nick Sweeting <archivebox-git@sweeting.me>" LABEL maintainer="Nick Sweeting <archivebox-git@sweeting.me>"
RUN apt-get update \ RUN apt-get update \
&& apt-get install -qy git wget curl youtube-dl gnupg2 libgconf-2-4 python3 python3-pip \ && apt-get install -yq --no-install-recommends \
git wget curl youtube-dl gnupg2 libgconf-2-4 python3 python3-pip \
&& rm -rf /var/lib/apt/lists/* && rm -rf /var/lib/apt/lists/*
# Install latest chrome package and fonts to support major charsets (Chinese, Japanese, Arabic, Hebrew, Thai and a few others) # Install latest chrome package and fonts to support major charsets (Chinese, Japanese, Arabic, Hebrew, Thai and a few others)
RUN apt-get update && apt-get install -y curl --no-install-recommends \ RUN apt-get update && apt-get install -y wget --no-install-recommends \
&& wget -q -O - https://dl-ssl.google.com/linux/linux_signing_key.pub | apt-key add - \ && wget -q -O - https://dl-ssl.google.com/linux/linux_signing_key.pub | apt-key add - \
&& sh -c 'echo "deb [arch=amd64] http://dl.google.com/linux/chrome/deb/ stable main" >> /etc/apt/sources.list.d/google.list' \ && sh -c 'echo "deb [arch=amd64] http://dl.google.com/linux/chrome/deb/ stable main" >> /etc/apt/sources.list.d/google.list' \
&& apt-get update \ && apt-get update \
&& apt-get install -y chromium fonts-ipafont-gothic fonts-wqy-zenhei fonts-thai-tlwg fonts-kacst ttf-freefont \ && apt-get install -y google-chrome-unstable fonts-ipafont-gothic fonts-wqy-zenhei fonts-thai-tlwg fonts-kacst ttf-freefont \
--no-install-recommends \ --no-install-recommends \
&& rm -rf /var/lib/apt/lists/* \ && rm -rf /var/lib/apt/lists/* \
&& rm -rf /src/*.deb \ && rm -rf /src/*.deb
&& ln -s /usr/bin/chromium /usr/bin/chromium-browser
# It might be a good idea to use dumb-init to help prevent zombie chrome processes. # It's a good idea to use dumb-init to help prevent zombie chrome processes.
# ADD https://github.com/Yelp/dumb-init/releases/download/v1.2.0/dumb-init_1.2.0_amd64 /usr/local/bin/dumb-init ADD https://github.com/Yelp/dumb-init/releases/download/v1.2.0/dumb-init_1.2.0_amd64 /usr/local/bin/dumb-init
# RUN chmod +x /usr/local/bin/dumb-init RUN chmod +x /usr/local/bin/dumb-init
RUN git clone https://github.com/pirate/ArchiveBox /home/chromeuser/app \ # Install puppeteer so it's available in the container.
&& pip3 install -r /home/chromeuser/app/archivebox/requirements.txt \ RUN npm i puppeteer
&& ln -s /home/chromeuser/app/bin/archivebox /usr/bin/archive
# Add user so we area strong, independent chrome that don't need --no-sandbox. # Add user so we don't need --no-sandbox.
RUN groupadd -r chromeuser && useradd -r -g chromeuser -G audio,video chromeuser \ RUN groupadd -r pptruser && useradd -r -g pptruser -G audio,video pptruser \
&& mkdir -p /home/pptruser/Downloads \
&& chown -R pptruser:pptruser /home/pptruser \
&& chown -R pptruser:pptruser /node_modules
# Install the ArchiveBox repository and pip requirements
RUN git clone https://github.com/pirate/ArchiveBox /home/pptruser/app \
&& mkdir -p /data \ && mkdir -p /data \
&& ln -s /data /home/chromeuser/app/archivebox/output \ && chown -R pptruser:pptruser /data \
&& chown -R chromeuser:chromeuser /home/chromeuser/app/archivebox/output \ && ln -s /data /home/pptruser/app/archivebox/output \
&& chown -R chromeuser:chromeuser /home/chromeuser && ln -s /home/pptruser/app/bin/archivebox /bin/archive \
&& chown -R pptruser:pptruser /home/pptruser/app/archivebox
# && pip3 install -r /home/pptruser/app/archivebox/requirements.txt
VOLUME /data VOLUME /data
ENV LANG=en_US.UTF-8 \ ENV LANG=C.UTF-8 \
LANGUAGE=en_US:en \ LANGUAGE=en_US:en \
LC_ALL=en_US.UTF-8 \ LC_ALL=C.UTF-8 \
PYTHONIOENCODING=UTF-8 \ PYTHONIOENCODING=UTF-8 \
CHROME_SANDBOX=False \ CHROME_SANDBOX=False \
CHROME_BINARY=google-chrome-unstable \
OUTPUT_DIR=/data OUTPUT_DIR=/data
# Run everything from here on out as non-privileged user # Run everything from here on out as non-privileged user
USER chromeuser USER pptruser
WORKDIR /home/chromeuser/app WORKDIR /home/pptruser/app
CMD ["/usr/bin/archive"] ENTRYPOINT ["dumb-init", "--"]
CMD ["/bin/archive"]

View file

@ -63,6 +63,7 @@ if not CHROME_BINARY:
'google-chrome-beta', 'google-chrome-beta',
'google-chrome-canary', 'google-chrome-canary',
'google-chrome-dev', 'google-chrome-dev',
'google-chrome-unstable',
) )
for name in common_chrome_executable_names: for name in common_chrome_executable_names:
full_path_exists = shutil.which(name) full_path_exists = shutil.which(name)

View file

@ -6,15 +6,11 @@ services:
stdin_open: true stdin_open: true
tty: true tty: true
environment: environment:
- FETCH_SCREENSHOT=False
- FETCH_PDF=False
- FETCH_DOM=False
- FETCH_MEDIA=False
- USE_COLOR=False - USE_COLOR=False
- SHOW_PROGRESS=False - SHOW_PROGRESS=False
volumes: volumes:
- ./data:/data - ./data:/data
command: bash -c 'echo "https://example.com" | /usr/bin/archive; tail -f /dev/null' command: bash -c 'echo "https://example.com" | /bin/archive; tail -f /dev/null'
nginx: nginx:
image: 'nginx' image: 'nginx'