-
Notifications
You must be signed in to change notification settings - Fork 1
Expand file tree
/
Copy pathfskhttp_rules.yml
More file actions
57 lines (52 loc) · 1.64 KB
/
fskhttp_rules.yml
File metadata and controls
57 lines (52 loc) · 1.64 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
# Alert Rules (fskhttp_rules.yml)
#
# Prometheus alerting rules for the FSK HTTP service. One rule group,
# "fskhttp", covering request error ratio, request latency, scrape
# availability, CPU, memory, and in-flight request count.
groups:
  - name: fskhttp
    rules:
      # Fires when failed requests exceed 10% of all requests (both measured
      # as 5m rates) continuously for 2 minutes.
      - alert: FSKHTTPHighErrorRate
        expr: (rate(fskhttp_requests_failed_total[5m]) / rate(fskhttp_requests_total[5m])) > 0.1
        for: 2m
        labels:
          severity: warning
        annotations:
          summary: "High error rate detected"
          description: "Error rate is {{ $value | humanizePercentage }} for the last 5 minutes"

      # Fires when the 95th-percentile request duration, estimated from the
      # histogram buckets over 5m, stays above 10 seconds for 2 minutes.
      - alert: FSKHTTPHighLatency
        expr: histogram_quantile(0.95, rate(fskhttp_request_duration_seconds_bucket[5m])) > 10
        for: 2m
        labels:
          severity: warning
        annotations:
          summary: "High latency detected"
          description: "95th percentile latency is {{ $value }}s"

      # Fires when the scrape target for job "fskhttp" reports up == 0
      # for 1 minute.
      - alert: FSKHTTPServiceDown
        expr: up{job="fskhttp"} == 0
        for: 1m
        labels:
          severity: critical
        annotations:
          summary: "FSK HTTP service is down"
          description: "Service {{ $labels.instance }} has been down for more than 1 minute"

      # Fires when the 5m average of cpu_percent stays above 80 for 5 minutes.
      # avg_over_time is used instead of rate(): rate() is only meaningful on
      # counters and would report the per-second change of the value rather
      # than the CPU level itself.
      # NOTE(review): assumes cpu_percent is a gauge in the range 0-100, as its
      # name and the "%" in the description suggest - confirm with the exporter.
      # NOTE(review): the selector is not restricted to job="fskhttp", so any
      # target exposing cpu_percent can trigger this rule - confirm intended.
      - alert: FSKHTTPHighCPU
        expr: avg_over_time(cpu_percent[5m]) > 80
        for: 5m
        labels:
          severity: warning
        annotations:
          summary: "High CPU usage"
          description: "CPU usage is {{ $value }}% on {{ $labels.instance }}"

      # Fires when memory_percent stays above 85 for 5 minutes.
      # NOTE(review): the selector is not restricted to job="fskhttp" - confirm
      # intended.
      - alert: FSKHTTPHighMemory
        expr: memory_percent > 85
        for: 5m
        labels:
          severity: warning
        annotations:
          summary: "High memory usage"
          description: "Memory usage is {{ $value }}% on {{ $labels.instance }}"

      # Fires when more than 40 requests are reported active for 2 minutes.
      - alert: FSKHTTPTooManyActiveRequests
        expr: fskhttp_requests_active > 40
        for: 2m
        labels:
          severity: warning
        annotations:
          summary: "Too many active requests"
          description: "{{ $value }} active requests on {{ $labels.instance }}"