This repository has been archived by the owner on Nov 22, 2021. It is now read-only.
-
Notifications
You must be signed in to change notification settings - Fork 3
/
Copy pathloki-values.yaml
59 lines (59 loc) · 1.81 KB
/
loki-values.yaml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
# fluent-bit is switched off in this values file.
fluent-bit:
  enabled: false
# Grafana is switched on and its image tag is pinned.
grafana:
  image:
    tag: "7.5.2"  # quoted so the version is always read as a string
  enabled: true
# Prometheus is switched on; persistent volumes are disabled for both the
# alertmanager and the server sections.
# NOTE(review): nesting was reconstructed from a flattened copy; `enabled: true`
# is taken to be `prometheus.enabled` -- confirm against the chart's values.
prometheus:
  enabled: true
  alertmanager:
    persistentVolume:
      enabled: false
  server:
    persistentVolume:
      enabled: false
# promtail is switched on.
promtail:
  enabled: true
# Loki settings: a ruler configuration plus the alerting rule groups it evaluates.
loki:
  # Needed for Alerting: https://grafana.com/docs/loki/latest/alerting/
  # This is just a simple example, for more details:
  # https://grafana.com/docs/loki/latest/configuration/#ruler_config
  # NOTE(review): confirm the chart reads `ruler` at this level rather than
  # under a nested `config:` key.
  ruler:
    storage:
      type: local
      local:
        directory: /rules
    rule_path: /tmp/scratch
    # NOTE(review): in-cluster Service DNS names normally take the form
    # <service>.<namespace>.svc; confirm this host actually resolves to
    # Alertmanager before relying on alert delivery.
    alertmanager_url: http://alertmanager.svc.logging:9093
    ring:
      kvstore:
        store: inmemory
    enable_api: true
  # Specify Loki Alerting rules based on this documentation:
  # https://grafana.com/docs/loki/latest/alerting/
  # When specified, you also need a ruler config section (see `ruler` in this
  # mapping). An example is shown in the alerting docs.
  alerting_groups:
    - name: slow
      rules:
        - alert: slow-ops
          annotations:
            message: "{{ $labels.job }} is reporting slow ops."
          # count_over_time is a range aggregation and needs a range selector;
          # the original expression had none. The 5m window is a chosen value --
          # TODO confirm it suits the 10m `for` duration.
          expr: 'sum by (cluster, job, pod) (count_over_time({app="couchbase"}|="couchbase.log.memcached"|="Slow operation"[5m]) > 0)'
          for: 10m
          labels:
            severity: critical
        - alert: slow-runtime
          annotations:
            message: "{{ $labels.job }} is reporting slow runtime."
          # Same range-selector fix as slow-ops; the 5m window is a chosen
          # value -- TODO confirm.
          expr: 'sum by (cluster, job, pod) (count_over_time({app="couchbase"}|="couchbase.log.memcached"|="Slow runtime"[5m]) > 0)'
          for: 10m
          labels:
            severity: critical
    - name: logs
      rules:
        - alert: ErrorInLogs
          # Fires when at least one line matching [Ee]rror was logged in the
          # last minute. The closing parenthesis of sum(...) was missing in the
          # original; the value is quoted because it is full of YAML indicators.
          expr: 'sum(count_over_time({app="couchbase"}|~ "[Ee]rror"[1m])) >= 1'
          for: 10s
          labels:
            severity: critical
            category: logs
          annotations:
            title: "{{$value}} Errors occurred in application logs"