Skip to content

Commit a0eae7a

Browse files
gHashTag and ona-agent committed
Fix: Run as SSH-accessible container (no HTTP)
TRINITY chat is CLI-based, not an HTTP server.
Access via: fly ssh console -a trinity-llm
Co-authored-by: Ona <no-reply@ona.com>
1 parent a05b614 commit a0eae7a

2 files changed

Lines changed: 7 additions & 17 deletions

File tree

Dockerfile

Lines changed: 2 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -50,8 +50,5 @@ ENV MODEL_PATH=/app/models/tinyllama-1.1b-chat-v1.0.Q8_0.gguf
5050
ENV TEMPERATURE=0.7
5151
ENV TOP_P=0.9
5252

53-
# Expose port (for future HTTP API)
54-
EXPOSE 8080
55-
56-
# Run chat
57-
CMD ["/app/vibee", "chat", "--model", "/app/models/tinyllama-1.1b-chat-v1.0.Q8_0.gguf", "--temperature", "0.7", "--top-p", "0.9"]
53+
# Keep container running for SSH access
54+
CMD ["/bin/sleep", "infinity"]

fly.toml

Lines changed: 5 additions & 12 deletions
Original file line numberDiff line numberDiff line change
@@ -23,16 +23,9 @@ primary_region = "iad"
2323
# source = "trinity_models"
2424
# destination = "/app/models"
2525

26-
[http_service]
27-
internal_port = 8080
28-
force_https = true
29-
auto_stop_machines = true
30-
auto_start_machines = true
31-
min_machines_running = 0
26+
# No HTTP service - this is a CLI application
27+
# Access via: fly ssh console -a trinity-llm
28+
# Then run: /app/vibee chat --model /app/models/tinyllama-1.1b-chat-v1.0.Q8_0.gguf
3229

33-
[[http_service.checks]]
34-
grace_period = "120s"
35-
interval = "30s"
36-
method = "GET"
37-
path = "/health"
38-
timeout = "10s"
30+
[processes]
31+
app = "/bin/sleep infinity"

0 commit comments

Comments
 (0)