Skip to content

Commit 3d330cc

Browse files
gHashTag and ona-agent committed
Fix Fly.io deployment: increase memory and grace period
- 1GB RAM (was 512MB) for model + inference buffers
- 120s grace period for model loading
- Verified model URL works (139MB download)

Co-authored-by: Ona <no-reply@ona.com>
1 parent d5186d7 commit 3d330cc

1 file changed

Lines changed: 4 additions & 3 deletions

File tree

fly.toml

Lines changed: 4 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -13,9 +13,10 @@ primary_region = "iad"
1313
TOP_P = "0.9"
1414

1515
# Use shared-cpu-1x for SmolLM-135M (small model)
16+
# 1GB RAM needed for model loading + inference buffers
1617
[[vm]]
1718
size = "shared-cpu-1x"
18-
memory = "512mb"
19+
memory = "1gb"
1920
cpus = 1
2021

2122
# Persistent volume for models (optional - model is baked into image)
@@ -32,8 +33,8 @@ primary_region = "iad"
3233
min_machines_running = 0
3334

3435
[[http_service.checks]]
35-
grace_period = "60s"
36+
grace_period = "120s"
3637
interval = "30s"
3738
method = "GET"
3839
path = "/health"
39-
timeout = "10s"
40+
timeout = "15s"

0 commit comments

Comments
 (0)