-
Notifications
You must be signed in to change notification settings - Fork 0
/
docker-compose.yml
102 lines (95 loc) · 2.13 KB
/
docker-compose.yml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
version: '3.8'

# Local stack: MongoDB, a Spark master plus one worker, MinIO object storage,
# and a JupyterLab container that starts after all of the others.
services:
  # MongoDB published on host port 27017; database files are bind-mounted
  # from ./data/mongo on the host.
  mongo:
    image: mongo:latest
    container_name: mongodb
    ports:
      - "27017:27017"
    volumes:
      - ./data/mongo:/data/db

  # Spark master, built from ./dockerfiles/spark and tagged custom-spark:3.5.0.
  spark:
    image: custom-spark:3.5.0
    build:
      context: .
      dockerfile: ./dockerfiles/spark
    container_name: spark
    environment:
      - SPARK_MODE=master
      - SPARK_MASTER_HOST=spark
      - SPARK_MASTER_PORT=7077
      - SPARK_RPC_AUTHENTICATION_ENABLED=no
      - SPARK_RPC_ENCRYPTION_ENABLED=no
      - SPARK_LOCAL_STORAGE_ENCRYPTION_ENABLED=no
      - SPARK_SSL_ENABLED=no
      - XDG_CACHE_HOME=/opt/bitnami/spark/.cache
    ports:
      # NOTE(review): 8080 is presumably the master web UI - confirm.
      - "8080:8080"
      # Matches SPARK_MASTER_PORT above.
      - "7077:7077"

  # Spark worker; same image as the master, registers with spark://spark:7077.
  spark-worker:
    image: custom-spark:3.5.0
    build:
      context: .
      dockerfile: ./dockerfiles/spark
    container_name: spark-worker
    environment:
      - SPARK_MODE=worker
      - SPARK_MASTER_URL=spark://spark:7077
      - SPARK_RPC_AUTHENTICATION_ENABLED=no
      - SPARK_RPC_ENCRYPTION_ENABLED=no
      - SPARK_LOCAL_STORAGE_ENCRYPTION_ENABLED=no
      - SPARK_SSL_ENABLED=no
      - XDG_CACHE_HOME=/opt/bitnami/spark/.cache
    depends_on:
      - spark

  # MinIO server storing its data under /data/minio (bind-mounted from
  # ./data/minio); the console listens on :9001.
  minio:
    image: minio/minio
    # Port mappings are quoted like every other service in this file so the
    # YAML parser can never read them as anything but strings.
    ports:
      - "9000:9000"
      - "9001:9001"
    environment:
      # Root credentials can be overridden from the shell or an .env file;
      # the defaults are the values this file previously hard-coded.
      - "MINIO_ROOT_USER=${MINIO_ROOT_USER:-minio}"
      - "MINIO_ROOT_PASSWORD=${MINIO_ROOT_PASSWORD:-miniominio}"
    container_name: minio
    command: server /data/minio --console-address ":9001"
    healthcheck:
      # NOTE(review): this probe needs a `curl` binary inside the container;
      # confirm the minio/minio image in use still ships one.
      test:
        - "CMD"
        - "curl"
        - "-f"
        - "http://localhost:9000/minio/health/live"
      interval: 30s
      timeout: 20s
      retries: 3
    volumes:
      - ./data/minio:/data/minio

  # JupyterLab built from ./dockerfiles/jupyter; the repository root is
  # mounted at /rag/ inside the container.
  jupyter:
    image: jupyter:1.0.0
    container_name: jupyter
    build:
      context: .
      dockerfile: ./dockerfiles/jupyter
    ports:
      - "8888:8888"
      - "8501:8501"  # Streamlit app port
    # The server binds to all interfaces, runs as root, and is started with an
    # empty token value, i.e. the token is explicitly blanked.
    # NOTE(review): intended for local use only - confirm before exposing.
    command:
      - "jupyter"
      - "lab"
      - "--ip=0.0.0.0"
      - "--port=8888"
      - "--no-browser"
      - "--allow-root"
      - "--NotebookApp.token=''"
    volumes:
      - ./:/rag/
    # depends_on only orders container start-up here; it does not wait for
    # the MinIO healthcheck to pass.
    depends_on:
      - mongo
      - spark
      - spark-worker
      - minio

# Named volumes declared for the project. No service in this file mounts
# them: mongo and minio bind-mount ./data/mongo and ./data/minio instead.
volumes:
  mongo-data:
  minio-data: