Slide 18
Slide 18 text
# Example Prometheus Alertmanager configuration: route alerts labelled
# service=sre to PagerDuty, and mute warnings that duplicate a critical alert.
global:
  # Time after which an alert is treated as resolved if it stops being updated.
  resolve_timeout: 5m

route:
  # NOTE(review): Alertmanager requires the root route to name a default
  # `receiver`; the slide omits it. Add one before loading this config.

  # Labels by which alerts are grouped into a single notification.
  group_by: ['alertname', 'instance']
  # How long to wait before the first notification for a new group, so that
  # duplicate alerts arriving together are batched.
  group_wait: 30s
  # Interval between notifications for a group that gained new alerts.
  # In effect: wait 30s, notify, then notify about new alerts every 5 minutes.
  group_interval: 5m
  # Time before an already-sent notification is re-sent (an alert that is
  # still unresolved is re-notified every hour even if nothing changed).
  repeat_interval: 1h
  # Child routes: alert routing rules.
  routes:
    # Routes can match (by regex) on the labels set in the alerting rules.
    - match_re:
        service: '^sre$'
      # Must match the `name` of an entry under `receivers`.
      receiver: 'sre-pagerduty'

# Notification targets that receive alerts.
receivers:
  # webhook, email, pagerduty, etc. integrations are available.
  - name: 'sre-pagerduty'
    pagerduty_configs:
      # Placeholder; do not commit a real integration key.
      - service_key: 'xxxxxxxxxxxxxxxxxxxxxxxx'

# Suppression of redundant alerts.
inhibit_rules:
  # When a critical alert with the same alert name and instance is already
  # firing, the matching warning alert is suppressed.
  - source_match:
      severity: 'critical'
    target_match:
      severity: 'warning'
    equal: ['alertname', 'instance']
hbstudy#79 (2017/11/20) | Yoshikawa Ryota ( @rrreeeyyy ) 18