forked from openeduhub/oeh-search-etl
-
Notifications
You must be signed in to change notification settings - Fork 2
/
docker-compose.yml
52 lines (50 loc) · 1.43 KB
/
docker-compose.yml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
# Compose stack for running an oeh-search-etl crawler together with the two
# rendering backends it is configured to talk to: Splash and a headless
# Chromium (browserless). All three services share the `scrapy` network and
# address each other by service name.
version: "3.4"

networks:
  # Default-configured network; written as an explicit empty mapping instead of
  # a bare (null) value.
  scrapy: {}

services:
  # Splash rendering service, reachable by the crawler as http://splash:8050.
  splash:
    image: scrapinghub/splash:master
    # Passed to the Splash entrypoint; per the Splash docs --maxrss is the
    # memory (RSS) limit in MB -- confirm against the image version in use.
    command: --maxrss 4000
    restart: always
    ports:
      # Published on the loopback interface only, not on external interfaces.
      - "127.0.0.1:8050:8050"
    networks:
      - scrapy
    healthcheck:
      # Polls Splash's /_ping endpoint from inside the container.
      # NOTE(review): requires `curl` to exist in the image -- confirm.
      test: ["CMD", "curl", "-f", "http://localhost:8050/_ping"]
      interval: 30s
      timeout: 5s
      retries: 3
      start_period: 40s

  # Headless Chromium (browserless), reachable by the crawler as
  # ws://headless_chrome:3000.
  headless_chrome:
    image: ghcr.io/browserless/chromium:v2.14.0
    restart: always
    environment:
      # NOTE(review): presumably the browserless session timeout in
      # milliseconds -- confirm against the browserless v2 documentation.
      - TIMEOUT=120000
    ports:
      # Published on the loopback interface only, not on external interfaces.
      - "127.0.0.1:3000:3000"
    networks:
      - scrapy

  # The crawler container itself.
  scrapy:
    # extra_hosts is only required if you need to access an edu-sharing instance on the host that runs docker
    # host.docker.internal points to the ip address of the host docker network interface
    extra_hosts:
      host.docker.internal: host-gateway
    image: openeduhub/oeh-search-etl:develop
    build:
      context: .
      # Build steps run with the host's network stack.
      network: host
    networks:
      - scrapy
    # The crawler is hard-wired (see SPLASH_URL / *_WS_ENDPOINT below) to the
    # two rendering services, so make sure they are started with it, e.g. on
    # `docker compose run scrapy`. The short form only controls start order;
    # it does not wait for the splash healthcheck to pass.
    depends_on:
      - splash
      - headless_chrome
    environment:
      # Endpoints of the sibling services, addressed by service name.
      - "PYPPETEER_WS_ENDPOINT=ws://headless_chrome:3000"
      - "PLAYWRIGHT_WS_ENDPOINT=ws://headless_chrome:3000"
      - "SPLASH_URL=http://splash:8050"
      # Values below are substituted from the shell environment / .env file.
      - "CRAWLER=${CRAWLER}"
      # optional keyword args, e.g. cleanrun=true
      - "ARGS=${ARGS}"
      - "DRY_RUN=False"
      # Falls back to INFO when LOG_LEVEL is unset or empty.
      - "LOG_LEVEL=${LOG_LEVEL:-INFO}"
      - "EDU_SHARING_BASE_URL=${EDU_SHARING_BASE_URL}"
      - "EDU_SHARING_USERNAME=${EDU_SHARING_USERNAME}"
      - "EDU_SHARING_PASSWORD=${EDU_SHARING_PASSWORD}"