Skip to content

Commit 5cbeb5e

Browse files
authored
chore: Tweak prometheus/grafana config defaults (NVIDIA#319)
1 parent 3f12b57 commit 5cbeb5e

File tree

2 files changed

+8
-12
lines changed

2 files changed

+8
-12
lines changed

applications/llm/count/visualization/docker-compose.yml

Lines changed: 2 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -19,7 +19,6 @@ services:
1919
container_name: prometheus
2020
volumes:
2121
- ./prometheus.yml:/etc/prometheus/prometheus.yml
22-
- prometheus_data:/prometheus
2322
command:
2423
- '--config.file=/etc/prometheus/prometheus.yml'
2524
- '--storage.tsdb.path=/prometheus'
@@ -42,12 +41,13 @@ services:
4241
- ./grafana.json:/etc/grafana/provisioning/dashboards/llm-worker-dashboard.json
4342
- ./grafana-datasources.yml:/etc/grafana/provisioning/datasources/datasources.yml
4443
- ./grafana-dashboard-providers.yml:/etc/grafana/provisioning/dashboards/dashboard-providers.yml
45-
- grafana_data:/var/lib/grafana
4644
environment:
4745
- GF_SECURITY_ADMIN_USER=admin
4846
- GF_SECURITY_ADMIN_PASSWORD=admin
4947
- GF_USERS_ALLOW_SIGN_UP=false
5048
- GF_INSTALL_PLUGINS=grafana-piechart-panel
49+
# Grafana's default minimum dashboard refresh interval is 5s; lower it so the dashboard's 2s refresh is allowed
50+
- GF_DASHBOARDS_MIN_REFRESH_INTERVAL=2s
5151
restart: unless-stopped
5252
# TODO: Use more explicit networking setup when count is containerized
5353
#ports:
@@ -61,7 +61,3 @@ services:
6161
networks:
6262
monitoring:
6363
driver: bridge
64-
65-
volumes:
66-
prometheus_data:
67-
grafana_data:

applications/llm/count/visualization/grafana.json

Lines changed: 6 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -572,7 +572,7 @@
572572
]
573573
}
574574
],
575-
"refresh": "5s",
575+
"refresh": "2s",
576576
"schemaVersion": 38,
577577
"style": "dark",
578578
"tags": [
@@ -584,8 +584,8 @@
584584
{
585585
"current": {
586586
"selected": false,
587-
"text": "backend",
588-
"value": "backend"
587+
"text": "component",
588+
"value": "vllm"
589589
},
590590
"datasource": {
591591
"type": "prometheus",
@@ -611,8 +611,8 @@
611611
{
612612
"current": {
613613
"selected": false,
614-
"text": "generate",
615-
"value": "generate"
614+
"text": "endpoint",
615+
"value": "load_metrics"
616616
},
617617
"datasource": {
618618
"type": "prometheus",
@@ -638,7 +638,7 @@
638638
]
639639
},
640640
"time": {
641-
"from": "now-15m",
641+
"from": "now-5m",
642642
"to": "now"
643643
},
644644
"timepicker": {},

0 commit comments

Comments
 (0)