mirror of
https://github.com/webrecorder/browsertrix-crawler.git
synced 2025-10-19 06:23:16 +00:00

* pending request wait: - instead of waiting for 5s, check redis key 'pywb:{coll}:pending' to see if any pending requests are still pending - keep checking key until pending requests are at 0 - requires latest pywb 2.6.0+ - should fix #44 * fix test to no longer look for waiting for 5s message * lint settings and fixes: allow constant in loops, add lint command to script * chrome: bump default image to chrome:90 image
51 lines
1.2 KiB
Docker
51 lines
1.2 KiB
Docker
# Tag of the oldwebtoday/chrome image to take the browser packages from.
# Declared before the first FROM so it can be used in the FROM line below;
# override with `--build-arg BROWSER_VERSION=<tag>`.
ARG BROWSER_VERSION=90

# Donor stage: nothing runs here, it only provides files for the
# `COPY --from=chrome` instructions in the final stage.
FROM oldwebtoday/chrome:${BROWSER_VERSION} AS chrome
|
|
|
|
# Final image stage. Per its tag, the base image provides Python 3.8 and Node.js 14.
FROM nikolaik/python-nodejs:python3.8-nodejs14
|
|
|
|
# Download the Yarn Debian repository public key and add it to apt's trusted keys.
# NOTE(review): presumably required so a later `apt-get update` can verify a Yarn
# source list shipped in the base image — confirm against the base image.
# NOTE(review): this pipe runs without `pipefail`, so a curl failure is only
# noticed if `apt-key add` rejects what it receives on stdin.
RUN curl -sS https://dl.yarnpkg.com/debian/pubkey.gpg | apt-key add -
|
|
|
|
# OS-level packages: fonts, locales, a Redis server and the Xvfb virtual X server.
# Index refresh, install and cleanup share one layer so the apt lists and
# package cache are not persisted in the image.
RUN apt-get update -y && \
    apt-get install -qqy --no-install-recommends \
        fonts-stix \
        locales-all \
        redis-server \
        xvfb && \
    apt-get clean && \
    rm -rf /var/lib/apt/lists/*
|
|
|
|
# An ARG declared before FROM is only visible in FROM lines, so it is
# re-declared here to make its value available inside this stage.
ARG BROWSER_VERSION

# Environment baked into the image and visible to the running container.
# BROWSER_VERSION records the build-time browser tag.
# NOTE(review): DISPLAY/GEOMETRY are presumably consumed when starting Xvfb, and
# PROXY_* by the crawler's proxy setup — confirm against the scripts that read them.
ENV BROWSER_VERSION=${BROWSER_VERSION} \
    DISPLAY=:99 \
    GEOMETRY=1360x1020x16 \
    PROXY_CA_FILE=/tmp/proxy-ca.pem \
    PROXY_CA_URL=http://wsgiprox/download/pem \
    PROXY_HOST=localhost \
    PROXY_PORT=8080
|
|
|
|
# Pull the browser .deb packages and the Flash plugin out of the chrome stage.
COPY --from=chrome /tmp/*.deb /deb/
COPY --from=chrome /app/libpepflashplayer.so /app/libpepflashplayer.so

# Install the copied packages. `dpkg -i` is followed by `;` rather than `&&` on
# purpose: it may exit non-zero when dependencies are missing, and the
# subsequent `apt-get install -f` resolves them. The apt lists are then removed
# in the same layer (the path previously read /var/lib/opts/lists, which does
# not exist, so nothing was cleaned up).
RUN dpkg -i /deb/*.deb; apt-get update; apt-get install -fqqy && \
    rm -rf /var/lib/apt/lists/*
|
|
|
|
# Application home; subsequent relative paths resolve against /app.
WORKDIR /app

# Copy only the requirements manifest before installing so this layer is
# reused from cache until requirements.txt itself changes. COPY is used instead
# of ADD because this is a plain local file; --no-cache-dir keeps pip's
# download cache out of the image layer.
COPY requirements.txt /app/
RUN pip install --no-cache-dir -r requirements.txt
|
|
|
|
# Copy the Node manifest on its own (plain local file, so COPY rather than ADD)
# so the dependency install below is cached until package.json changes.
COPY package.json /app/

# to allow forcing rebuilds from this stage
# (pass a different --build-arg REBUILD=<value> to invalidate the cache from here on)
ARG REBUILD

# Install the JavaScript dependencies listed in package.json.
RUN yarn install
|
|
|
|
# Application configuration and top-level JavaScript sources. These are plain
# local files, so COPY is used instead of ADD. They are copied after the
# dependency installs so that source edits do not invalidate those layers.
COPY config.yaml /app/
COPY uwsgi.ini /app/
COPY *.js /app/
|
|
|
|
# Expose the two entry scripts as commands under /usr/bin:
# `crawl` -> /app/main.js and `create-login-profile` -> /app/create-login-profile.js
RUN ln -s /app/main.js /usr/bin/crawl && \
    ln -s /app/create-login-profile.js /usr/bin/create-login-profile
|
|
|
|
# Default working directory of the running container (created if it does not exist).
# NOTE(review): presumably where crawl output is written / a volume is mounted — confirm.
WORKDIR /crawls
|
|
|
|
# Default command, in exec (JSON-array) form; runs the `crawl` symlink
# (/usr/bin/crawl -> /app/main.js). Can be overridden at `docker run`.
CMD ["crawl"]
|
|
|