We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
2 parents d15d37d + 047091b · commit 4feeaed (Copy full SHA for 4feeaed)
1 file changed
src/metrics/__init__.py
@@ -32,7 +32,10 @@
32
# Histogram to measure response durations
33
# This will be used to track how long it takes to handle requests
34
response_duration_seconds = Histogram(
35
- "ls_response_duration_seconds", "Response durations", ["path"]
+ "ls_response_duration_seconds",
36
+ "Response durations",
37
+ ["path"],
38
+ buckets=LLM_INFERENCE_DURATION_BUCKETS,
39
)
40
41
# Metric that indicates what provider + model customers are using so we can
0 commit comments