-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathconfig.yaml
90 lines (74 loc) · 2.59 KB
/
config.yaml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
settings:
  ## (REQUIRED) The iLert alert source API key
  # apiKey: <YOUR-API-KEY>
  ## Path to a kubeconfig. Only required if out-of-cluster.
  # kubeconfig: "~/.kube/config"
  ## The address of the Kubernetes API server. Overrides any value in kubeconfig. Only required if out-of-cluster.
  # master: ""
  ## Namespace in which the agent runs.
  namespace: kube-system
  ## The lease lock resource name
  electionID: ilert-kube-agent
  ## The metrics server port
  port: 9092
  ## The evaluation check interval, e.g. for the resources check
  checkInterval: 30s
  # NOTE(review): `log` is assumed to be nested under `settings` - confirm against the agent's config schema.
  log:
    ## Log level (debug, info, warn, error, fatal).
    level: info
    ## Enable JSON logs
    json: false
alarms:
  pods:
    ## Enables all pod alarms
    enabled: false
    terminate:
      ## Enables terminate pod alarms
      enabled: true
      ## The pod terminate alarm incident priority
      priority: HIGH
    waiting:
      ## Enables waiting pod alarms
      enabled: true
      ## The pod waiting alarm incident priority
      priority: LOW
    restarts:
      ## Enables restarts pod alarms
      enabled: true
      ## The pod restarts alarm incident priority
      priority: LOW
      ## Pod restart threshold to alarm (min 1)
      threshold: 10
    resources:
      ## Enables resources pod alarms
      enabled: true
      ## The pod resources alarm incident priority
      priority: LOW
      ## The pod resources percentage threshold from 1 to 100
      threshold: 90
  nodes:
    ## Enables all node alarms
    enabled: true
    terminate:
      ## Enables terminate node alarms
      enabled: true
      ## The node terminate alarm incident priority
      priority: HIGH
    resources:
      ## Enables resources node alarms
      enabled: true
      ## The node resources alarm incident priority
      priority: LOW
      ## The node resources percentage threshold from 1 to 100
      threshold: 90
links:
  pods:
    ## Pod URLs for the alarm-related incident. You can use the following mustache variables here: pod_namespace, pod_name, cluster_name
    # - name: Metrics
    #   href: "https://grafana.example.com/d/kubernetes/kubernetes-overview?var-Node=All&var-Pod={{pod_name}}"
    # - name: Logs
    #   href: "https://grafana.example.com/explore?left=%5B%22now-1h%22,%22now%22,%22Loki%22,%7B%22expr%22:%22%7Binstance%3D%5C%22{{pod_name}}%5C%22,namespace%3D%5C%22{{pod_namespace}}%5C%22%7D%22%7D%5D"
  nodes:
    ## Node URLs for the alarm-related incident. You can use the following mustache variables here: node_name, cluster_name
    # - name: Metrics
    #   href: "https://grafana.example.com/d/kubernetes/kubernetes-overview?var-Node={{node_name}}"