-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathdocker-compose.yml
More file actions
119 lines (114 loc) · 3.71 KB
/
docker-compose.yml
File metadata and controls
119 lines (114 loc) · 3.71 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
services:
  # PostgreSQL database.
  # Credentials and database name are read from the environment / .env file.
  postgres:
    image: postgres:15
    container_name: business_postgres
    environment:
      POSTGRES_USER: ${POSTGRES_USER}
      POSTGRES_PASSWORD: ${POSTGRES_PASSWORD}
      POSTGRES_DB: ${POSTGRES_DB}
    ports:
      # Host port defaults to 5432 when POSTGRES_PORT is unset, so the
      # mapping never degrades to an empty host side (":5432").
      - "${POSTGRES_PORT:-5432}:5432"
    volumes:
      # Named volume: data survives container removal.
      - postgres_data:/var/lib/postgresql/data
      # Initialization script, run on first startup. Mounted read-only
      # because the container only needs to read it.
      - ./sql/init.sql:/docker-entrypoint-initdb.d/init.sql:ro
    healthcheck:
      # Other services gate their startup on this probe via
      # `condition: service_healthy`.
      test: ["CMD-SHELL", "pg_isready -U ${POSTGRES_USER} -d ${POSTGRES_DB}"]
      interval: 10s
      timeout: 5s
      retries: 5
    networks:
      - data_engineering_network
    restart: unless-stopped

  # Airflow webserver: UI for managing DAGs.
  # Also bootstraps the metadata database and the admin account before
  # serving (see `command`).
  airflow-webserver:
    build:
      context: .
      dockerfile: Dockerfile.airflow
    container_name: airflow_webserver
    environment:
      - AIRFLOW__CORE__EXECUTOR=${AIRFLOW__CORE__EXECUTOR}
      - AIRFLOW__DATABASE__SQL_ALCHEMY_CONN=${AIRFLOW__DATABASE__SQL_ALCHEMY_CONN}
      - AIRFLOW__CORE__FERNET_KEY=${AIRFLOW__CORE__FERNET_KEY}
      - AIRFLOW__CORE__LOAD_EXAMPLES=${AIRFLOW__CORE__LOAD_EXAMPLES}
      - AIRFLOW__WEBSERVER__SECRET_KEY=${AIRFLOW__WEBSERVER__SECRET_KEY}
    ports:
      - "8080:8080"
    volumes:
      - ./airflow/dags:/opt/airflow/dags
      - ./airflow/logs:/opt/airflow/logs
      - ./airflow/plugins:/opt/airflow/plugins
      - ./data:/opt/airflow/data
      - ./scripts:/opt/airflow/scripts
    depends_on:
      postgres:
        condition: service_healthy
    # Startup sequence, folded into a single `bash -c` line:
    #   1. initialise the metadata DB; a failure aborts startup
    #   2. create the admin user, best effort (the parentheses keep
    #      `|| true` from also swallowing a failure of step 1, since
    #      `&&` and `||` have equal precedence in bash)
    #   3. `exec` the webserver so it replaces the bash wrapper and
    #      receives stop signals directly
    # Admin credentials default to admin/admin; override them with
    # AIRFLOW_ADMIN_USERNAME / AIRFLOW_ADMIN_PASSWORD outside local dev.
    # NOTE(review): `airflow db init` is deprecated in newer Airflow 2.x in
    # favour of `airflow db migrate` — confirm the version pinned in
    # Dockerfile.airflow before switching.
    command: >
      bash -c "airflow db init &&
      (airflow users create
      --username '${AIRFLOW_ADMIN_USERNAME:-admin}'
      --password '${AIRFLOW_ADMIN_PASSWORD:-admin}'
      --firstname Admin --lastname User --role Admin
      --email admin@example.com || true) &&
      exec airflow webserver"
    healthcheck:
      test: ["CMD-SHELL", "curl -f http://localhost:8080/health || exit 1"]
      interval: 30s
      timeout: 10s
      retries: 3
      # Grace period covering the bootstrap steps in `command`.
      start_period: 60s
    networks:
      - data_engineering_network
    restart: unless-stopped

  # Airflow scheduler: schedules and triggers DAGs.
  airflow-scheduler:
    build:
      context: .
      dockerfile: Dockerfile.airflow
    container_name: airflow_scheduler
    environment:
      - AIRFLOW__CORE__EXECUTOR=${AIRFLOW__CORE__EXECUTOR}
      - AIRFLOW__DATABASE__SQL_ALCHEMY_CONN=${AIRFLOW__DATABASE__SQL_ALCHEMY_CONN}
      - AIRFLOW__CORE__FERNET_KEY=${AIRFLOW__CORE__FERNET_KEY}
      - AIRFLOW__CORE__LOAD_EXAMPLES=${AIRFLOW__CORE__LOAD_EXAMPLES}
      # Same value as the webserver so both components run with one
      # configuration. NOTE(review): Airflow documents this key as also
      # signing log-fetch requests between components — confirm it is
      # needed for the executor in use.
      - AIRFLOW__WEBSERVER__SECRET_KEY=${AIRFLOW__WEBSERVER__SECRET_KEY}
    volumes:
      - ./airflow/dags:/opt/airflow/dags
      - ./airflow/logs:/opt/airflow/logs
      - ./airflow/plugins:/opt/airflow/plugins
      - ./data:/opt/airflow/data
      - ./scripts:/opt/airflow/scripts
    depends_on:
      postgres:
        condition: service_healthy
      # The webserver runs the DB initialisation, so the scheduler waits
      # until it reports healthy.
      airflow-webserver:
        condition: service_healthy
    command: airflow scheduler
    networks:
      - data_engineering_network
    restart: unless-stopped

  # pgAdmin: web-based PostgreSQL client.
  pgadmin:
    image: dpage/pgadmin4:latest
    container_name: business_pgadmin
    environment:
      PGADMIN_DEFAULT_EMAIL: ${PGADMIN_DEFAULT_EMAIL:-admin@admin.com}
      PGADMIN_DEFAULT_PASSWORD: ${PGADMIN_DEFAULT_PASSWORD:-admin}
      # Quoted so these stay the string 'False' instead of becoming YAML
      # booleans.
      PGADMIN_CONFIG_SERVER_MODE: 'False'
      PGADMIN_CONFIG_MASTER_PASSWORD_REQUIRED: 'False'
    ports:
      - "${PGADMIN_PORT:-5050}:80"
    volumes:
      - pgadmin_data:/var/lib/pgadmin
    depends_on:
      # Short form: start-order only, does not wait for the postgres
      # healthcheck.
      - postgres
    networks:
      - data_engineering_network
    restart: unless-stopped
# Named volumes: storage that outlives individual containers.
volumes:
  # Mounted by the postgres service at /var/lib/postgresql/data.
  postgres_data:
    driver: local
  # Mounted by the pgadmin service at /var/lib/pgadmin.
  pgadmin_data:
    driver: local
# Bridge network that every service in this file joins, so containers can
# talk to each other.
networks:
  data_engineering_network:
    driver: bridge