Skip to content

Commit 4ed17fa

Browse files
latency related rules
1 parent 7e3ebf0 commit 4ed17fa

1 file changed

Lines changed: 88 additions & 0 deletions

File tree

charts/ceph-operations/alerts/customrules.yaml

Lines changed: 88 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -58,4 +58,92 @@ groups:
5858
"owner", "([a-f0-9]{32}).*"
5959
)
6060
)
61+
# Client I/O latency (GET + PUT): mean request duration over a 5m rate window.
# Computed as rate(radosgw_requests_duration_sum) / rate(radosgw_requests_duration_count),
# with numerator and denominator each summed by (bucket, project_id).
# project_id is copied from the tenant label when it matches ([a-f0-9]{32}).
# Unit is seconds per the rule name; assumes the source metric is exported in seconds (TODO confirm).
# NOTE(review): a zero request rate makes the division 0/0 (NaN); confirm consumers tolerate that.
62+
- record: objectstore_client_io_latency_seconds_avg
63+
expr: |
64+
sum by (bucket,project_id) (
65+
label_replace(
66+
rate(radosgw_requests_duration_sum{method=~"GET|PUT"}[5m]),
67+
"project_id", "$1", "tenant", "([a-f0-9]{32})"
68+
)
69+
)
70+
/
71+
sum by (bucket,project_id) (
72+
label_replace(
73+
rate(radosgw_requests_duration_count{method=~"GET|PUT"}[5m]),
74+
"project_id", "$1", "tenant", "([a-f0-9]{32})"
75+
)
76+
)
77+
# Upload object latency (PUT + POST): mean request duration over a 5m rate window.
# Computed as rate(radosgw_requests_duration_sum) / rate(radosgw_requests_duration_count),
# with numerator and denominator each summed by (bucket, project_id), then multiplied by 1000.
# project_id is copied from the tenant label when it matches ([a-f0-9]{32}).
# Unit is milliseconds per the rule name; assumes the source metric is exported in seconds (TODO confirm).
78+
- record: objectstore_upload_latency_milliseconds_avg
79+
expr: |
80+
(
81+
sum by (bucket,project_id) (
82+
label_replace(
83+
rate(radosgw_requests_duration_sum{method=~"PUT|POST"}[5m]),
84+
"project_id", "$1", "tenant", "([a-f0-9]{32})"
85+
)
86+
)
87+
/
88+
sum by (bucket,project_id) (
89+
label_replace(
90+
rate(radosgw_requests_duration_count{method=~"PUT|POST"}[5m]),
91+
"project_id", "$1", "tenant", "([a-f0-9]{32})"
92+
)
93+
)
94+
) * 1000
95+
# Download object latency (GET only): mean request duration over a 5m rate window.
# Computed as rate(radosgw_requests_duration_sum) / rate(radosgw_requests_duration_count),
# with numerator and denominator each summed by (bucket, project_id), then multiplied by 1000.
# project_id is copied from the tenant label when it matches ([a-f0-9]{32}).
# Unit is milliseconds per the rule name; assumes the source metric is exported in seconds (TODO confirm).
96+
- record: objectstore_download_latency_milliseconds_avg
97+
expr: |
98+
(
99+
sum by (bucket,project_id) (
100+
label_replace(
101+
rate(radosgw_requests_duration_sum{method="GET"}[5m]),
102+
"project_id", "$1", "tenant", "([a-f0-9]{32})"
103+
)
104+
)
105+
/
106+
sum by (bucket,project_id) (
107+
label_replace(
108+
rate(radosgw_requests_duration_count{method="GET"}[5m]),
109+
"project_id", "$1", "tenant", "([a-f0-9]{32})"
110+
)
111+
)
112+
) * 1000
113+
# Delete object latency (DELETE only): mean request duration over a 5m rate window.
# Computed as rate(radosgw_requests_duration_sum) / rate(radosgw_requests_duration_count),
# with numerator and denominator each summed by (bucket, project_id), then multiplied by 1000.
# project_id is copied from the tenant label when it matches ([a-f0-9]{32}).
# Unit is milliseconds per the rule name; assumes the source metric is exported in seconds (TODO confirm).
114+
- record: objectstore_delete_latency_milliseconds_avg
115+
expr: |
116+
(
117+
sum by (bucket,project_id) (
118+
label_replace(
119+
rate(radosgw_requests_duration_sum{method="DELETE"}[5m]),
120+
"project_id", "$1", "tenant", "([a-f0-9]{32})"
121+
)
122+
)
123+
/
124+
sum by (bucket,project_id) (
125+
label_replace(
126+
rate(radosgw_requests_duration_count{method="DELETE"}[5m]),
127+
"project_id", "$1", "tenant", "([a-f0-9]{32})"
128+
)
129+
)
130+
) * 1000
131+
# Client error rate (4xx): per-second rate of radosgw_errors_total over a 5m window,
# restricted to http_status matching "4.." and summed by (bucket, project_id, http_status).
# project_id is copied from the tenant label when it matches ([a-f0-9]{32}).
132+
- record: objectstore_client_error_rate
133+
expr: |
134+
sum by (bucket,project_id,http_status) (
135+
label_replace(
136+
rate(radosgw_errors_total{http_status=~"4.."}[5m]),
137+
"project_id", "$1", "tenant", "([a-f0-9]{32})"
138+
)
139+
)
140+
# Server / service error rate (5xx): per-second rate of radosgw_errors_total over a 5m window,
# restricted to http_status matching "5.." and summed by (bucket, project_id, http_status).
# project_id is copied from the tenant label when it matches ([a-f0-9]{32}).
141+
- record: objectstore_server_error_rate
142+
expr: |
143+
sum by (bucket,project_id,http_status) (
144+
label_replace(
145+
rate(radosgw_errors_total{http_status=~"5.."}[5m]),
146+
"project_id", "$1", "tenant", "([a-f0-9]{32})"
147+
)
148+
)
61149
{{- end }}

0 commit comments

Comments
 (0)