Run browsertrix in docker on the host

Install docker in the container

Add a named volume called `browsertrix`

Mount the named volume in the worker at /crawls

Expose the host docker socket

Override the `RUNNING_IN_DOCKER` environment variable from auto-archiver's
Dockerfile (set it to an empty value) so that it will call docker.

This requires adding the following settings to orchestration.yaml:

 wacz_archiver_enricher:
  browsertrix_home: auto-archiver-api_browsertrix
  wacz_collections: /crawls
This commit is contained in:
Lilia Kai
2023-09-12 16:03:11 +02:00
parent b26bac6ba4
commit 8e4801f3d3
2 changed files with 10 additions and 0 deletions

View File

@@ -1,5 +1,8 @@
# Compose file format version.
version: '3.8'
# Named volumes declared for this compose project.
volumes:
# `browsertrix` is mounted at /crawls by the service that runs the celery worker.
browsertrix:
services:
web:
@@ -23,10 +26,15 @@ services:
# Start a Celery worker for the `worker.celery` app, logging at info level
# to logs/celery.log.
command: celery worker --app=worker.celery --loglevel=info --logfile=logs/celery.log
# Mounts for this service.
volumes:
# Bind-mount the local ./src directory at /app.
- ./src:/app
# Expose the host docker socket inside the container.
# NOTE(review): this lets the container talk to the host docker daemon;
# confirm that level of access is acceptable.
- /var/run/docker.sock:/var/run/docker.sock
# Mount the named volume `browsertrix` at /crawls.
- browsertrix:/crawls
# Load additional environment variables from src/.env.
env_file: src/.env
# Environment variables set explicitly for this service.
environment:
# Celery broker and result backend both use database 0 on host `redis`,
# port 6379, authenticating with ${REDIS_PASSWORD}.
- CELERY_BROKER_URL=redis://:${REDIS_PASSWORD}@redis:6379/0
- CELERY_RESULT_BACKEND=redis://:${REDIS_PASSWORD}@redis:6379/0
# Deliberately set to an empty value.
# NOTE(review): presumably an empty value makes auto-archiver invoke docker
# rather than assume it is already inside a container — confirm against
# auto-archiver.
- RUNNING_IN_DOCKER= # Override env from auto-archiver Dockerfile
# Services this service depends on: `web` and `redis`.
depends_on:
- web
- redis