Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
11 changes: 11 additions & 0 deletions .dockerignore
Original file line number Diff line number Diff line change
@@ -0,0 +1,11 @@
# Paths excluded from the Docker build context.

# Version-control metadata
.git

# Python virtual environments
.venv
src/.venv
src/venv

# Python bytecode caches
__pycache__
*.pyc

# Editor / OS artifacts
.vscode
.DS_Store

# Markdown documentation
*.md

# Data directories under local-demo/ (Prometheus and Grafana)
local-demo/prometheus/data
local-demo/grafana/data
9 changes: 8 additions & 1 deletion .gitignore
Original file line number Diff line number Diff line change
Expand Up @@ -4,4 +4,11 @@ assets/cloudwatch-dashboard.rendered.json
samconfig.toml
.aws-sam
.env.local.json
events/my.event.json
events/my.event.json

# Local Demo
# Python virtual environment directory and bytecode caches.
local-demo/venv/
__pycache__/
*.pyc

# NOTE(review): gitignore patterns are resolved relative to the directory of
# this file and are not normally written with a leading "./"; this entry
# probably matches nothing. Confirm the intent or remove it.
./
12 changes: 12 additions & 0 deletions Dockerfile
Original file line number Diff line number Diff line change
@@ -0,0 +1,12 @@
# Image that runs the Python application in src/ via `python src/main.py`.
FROM python:3.10-slim

WORKDIR /app

# Copy only the dependency manifest first so the (slow) pip layer stays cached
# until requirements.txt itself changes.
COPY src/requirements.txt .
RUN pip install --no-cache-dir -r requirements.txt

# Dedicated unprivileged account with a fixed UID/GID so the container does not
# run as root (and so runtimes that enforce runAsNonRoot can verify the UID).
RUN groupadd --system --gid 10001 app \
    && useradd --system --uid 10001 --gid app --home-dir /app --no-create-home \
        --shell /usr/sbin/nologin app

# Application code stays root-owned and is therefore read-only for the app user.
# NOTE(review): if the application writes files below /app at runtime, grant
# access to that specific path (e.g. COPY --chown or a mounted volume).
COPY src/ /app/src/

# PYTHONPATH=/app makes the `src` directory importable as a package root.
# PYTHONUNBUFFERED=1 sends stdout/stderr straight to the container log stream
# instead of holding output in a buffer.
ENV PYTHONPATH=/app \
    PYTHONUNBUFFERED=1

# Drop privileges only after every step that needs root has completed.
USER app

# Exec form: the interpreter runs as PID 1 and receives SIGTERM on `docker stop`.
CMD ["python", "src/main.py"]
36 changes: 36 additions & 0 deletions chatgpt/config.yaml
Original file line number Diff line number Diff line change
@@ -0,0 +1,36 @@
# Example configuration: endpoint, scan intervals, catalogs, table discovery
# and thresholds.
# NOTE(review): nesting indentation is not visible in this view of the file;
# confirm the intended structure (in particular whether `discovery` is a
# top-level key or belongs to each catalog entry) against the original.

# presumably the address and port the service binds to — confirm against the code
host: 0.0.0.0
port: 9109
# Intervals and timeout are expressed in seconds, per the key names.
scrape_interval_seconds: 30
deep_scan_interval_seconds: 600
request_timeout_seconds: 30
max_partitions_per_table: 5000

# Catalog definitions; the uri below is a placeholder to replace.
catalogs:
- name: prod
uri: https://your-iceberg-rest-catalog.example.com
warehouse: s3://warehouse
# NOTE(review): looks like an environment-variable placeholder — confirm that
# the config loader actually expands ${...}.
token: ${ICEBERG_TOKEN}

# Choose exactly one discovery mode.
# 1) explicit tables (recommended to start)
discovery:
mode: explicit
tables:
- namespace: demo
table: events
- namespace: sales
table: orders

# 2) namespace scan (uncomment this block instead of the explicit one above)
# discovery:
# mode: namespace_scan
# namespaces:
# - demo
# - sales

# Threshold values; byte sizes are powers of two.
thresholds:
small_file_bytes: 33554432 # 32 MiB (32 * 1024 * 1024)
target_file_bytes: 134217728 # 128 MiB (128 * 1024 * 1024)
delete_file_ratio: 0.2
avg_files_per_partition: 20
small_file_count: 100
Loading