From 47b305091fe4f3ac9ca089db46b94c962bf82eb1 Mon Sep 17 00:00:00 2001 From: Lucas Alvares Gomes Date: Wed, 24 Jun 2026 15:08:29 +0100 Subject: [PATCH] Use HTTP health check for llama-stack/ogx container Replace the TCP socket readiness probe with a proper HTTP GET on /v1/health. Also, add a startup probe and liveness probe that will start only after the startup one succeeds. Signed-off-by: Lucas Alvares Gomes --- internal/controller/lcore_deployment.go | 30 ++++++++++++++++++++++--- 1 file changed, 27 insertions(+), 3 deletions(-) diff --git a/internal/controller/lcore_deployment.go b/internal/controller/lcore_deployment.go index 69a9957..4807da7 100644 --- a/internal/controller/lcore_deployment.go +++ b/internal/controller/lcore_deployment.go @@ -72,14 +72,38 @@ func buildLCorePodTemplateSpec(h *common_helper.Helper, ctx context.Context, ins Ports: []corev1.ContainerPort{{Name: "llama-stack", ContainerPort: LlamaStackContainerPort}}, VolumeMounts: llamaStackMounts, Env: llamaEnvVars, + StartupProbe: &corev1.Probe{ + ProbeHandler: corev1.ProbeHandler{ + HTTPGet: &corev1.HTTPGetAction{ + Path: "/v1/health", + Port: intstr.FromInt32(LlamaStackContainerPort), + }, + }, + PeriodSeconds: 10, + TimeoutSeconds: 5, + FailureThreshold: 30, + }, + LivenessProbe: &corev1.Probe{ + ProbeHandler: corev1.ProbeHandler{ + HTTPGet: &corev1.HTTPGetAction{ + Path: "/v1/health", + Port: intstr.FromInt32(LlamaStackContainerPort), + }, + }, + PeriodSeconds: 10, + TimeoutSeconds: 5, + FailureThreshold: 3, + }, ReadinessProbe: &corev1.Probe{ ProbeHandler: corev1.ProbeHandler{ - TCPSocket: &corev1.TCPSocketAction{ + HTTPGet: &corev1.HTTPGetAction{ + Path: "/v1/health", Port: intstr.FromInt32(LlamaStackContainerPort), }, }, - InitialDelaySeconds: 5, - PeriodSeconds: 10, + PeriodSeconds: 10, + TimeoutSeconds: 5, + FailureThreshold: 3, }, Resources: corev1.ResourceRequirements{ Requests: corev1.ResourceList{