-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathDockerfile
More file actions
39 lines (31 loc) · 1014 Bytes
/
Dockerfile
File metadata and controls
39 lines (31 loc) · 1014 Bytes
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
FROM python:3.12-slim

# Install system dependencies including the PostgreSQL client:
#   gcc, libpq-dev    - C compiler and libpq development headers
#                       (presumably for building PostgreSQL bindings; confirm
#                       whether still needed given psycopg2-binary is used)
#   postgresql-client - PostgreSQL command-line client tools
#
# DEBIAN_FRONTEND is declared as a build-time ARG instead of ENV: it is still
# exported to the RUN step below, but it is not baked into the environment of
# containers started from the image.
ARG DEBIAN_FRONTEND=noninteractive
RUN apt-get update && \
    apt-get install -y --no-install-recommends \
        gcc \
        libpq-dev \
        postgresql-client \
    && rm -rf /var/lib/apt/lists/*
# Set working directory
WORKDIR /app

# Install the Python packages in a single layer, without keeping pip's
# download cache in the image. The 'great_expectations[postgresql]' requirement
# already installs great_expectations itself, so the bare package name is not
# listed separately. The extra is quoted so the shell does not treat the
# brackets as a glob pattern.
# NOTE(review): versions are unpinned, so rebuilds can pick up different
# releases; consider pinning (or using a requirements file) for reproducibility.
RUN pip install --no-cache-dir \
    'great_expectations[postgresql]' \
    ipykernel \
    jupyter \
    pandas \
    psycopg2-binary \
    pyarrow \
    sqlalchemy
# Bring every .parquet file from the build context's taxi-data/ directory
# into /app/taxi-data/ inside the image.
COPY ["taxi-data/*.parquet", "/app/taxi-data/"]

# Add the data loading script alongside it under /app.
COPY ["load_data.py", "/app/load_data.py"]
# Expose Jupyter port and data docs port
# (EXPOSE only documents the ports; they still have to be published at run time.)
EXPOSE 8888 8080

# Set working directory for Jupyter
# NOTE(review): nothing is copied into this directory during the build;
# presumably the notebooks are mounted here at run time - confirm.
WORKDIR /root/code/gxtutorial

# Default command - start Jupyter from the notebook directory.
#
# CMD uses exec (JSON) form, which does no shell processing, so quote
# characters inside an argument reach Jupyter literally. The empty token and
# password are therefore written as "--NotebookApp.token=" rather than
# "--NotebookApp.token=''", which only worked through traitlets' deprecated
# stripping of extra quotes.
#
# WARNING: with an empty token and password, --ip=0.0.0.0 and --allow-root,
# the server accepts unauthenticated connections on all interfaces and runs as
# root. Only publish port 8888 on a trusted/local network.
CMD ["jupyter", "notebook", "--ip=0.0.0.0", "--port=8888", "--no-browser", "--allow-root", "--NotebookApp.token=", "--NotebookApp.password="]