2020-04-06 13:44:03 +02:00
|
|
|
package notifier
|
2020-02-16 19:59:02 +01:00
|
|
|
|
2020-03-13 11:19:31 +01:00
|
|
|
import (
|
2020-03-27 17:31:16 +01:00
|
|
|
"bytes"
|
2020-03-29 00:48:30 +01:00
|
|
|
"fmt"
|
|
|
|
"io"
|
2020-03-27 17:31:16 +01:00
|
|
|
"strings"
|
2022-05-14 11:38:44 +02:00
|
|
|
textTpl "text/template"
|
2020-03-13 11:19:31 +01:00
|
|
|
"time"
|
2020-06-29 21:21:03 +02:00
|
|
|
|
2022-05-14 11:38:44 +02:00
|
|
|
"github.com/VictoriaMetrics/VictoriaMetrics/app/vmalert/templates"
|
2020-06-29 21:21:03 +02:00
|
|
|
"github.com/VictoriaMetrics/VictoriaMetrics/app/vmalert/utils"
|
2022-04-09 08:21:16 +02:00
|
|
|
"github.com/VictoriaMetrics/VictoriaMetrics/lib/prompbmarshal"
|
|
|
|
"github.com/VictoriaMetrics/VictoriaMetrics/lib/promrelabel"
|
2020-03-13 11:19:31 +01:00
|
|
|
)
|
2020-02-16 19:59:02 +01:00
|
|
|
|
2020-03-13 11:19:31 +01:00
|
|
|
// Alert the triggered alert
|
2020-04-06 13:44:03 +02:00
|
|
|
// TODO: Looks like alert name isn't unique
|
2020-03-13 11:19:31 +01:00
|
|
|
type Alert struct {
|
2021-09-13 14:48:18 +02:00
|
|
|
// GroupID contains the ID of the parent rules group
|
|
|
|
GroupID uint64
|
|
|
|
// Name represents Alert name
|
|
|
|
Name string
|
|
|
|
// Labels is the list of label-value pairs attached to the Alert
|
|
|
|
Labels map[string]string
|
|
|
|
// Annotations is the list of annotations generated on Alert evaluation
|
2020-03-13 11:19:31 +01:00
|
|
|
Annotations map[string]string
|
2021-09-13 14:48:18 +02:00
|
|
|
// State represents the current state of the Alert
|
|
|
|
State AlertState
|
|
|
|
// Expr contains expression that was executed to generate the Alert
|
|
|
|
Expr string
|
2022-03-29 15:09:07 +02:00
|
|
|
// ActiveAt defines the moment of time when Alert has become active
|
|
|
|
ActiveAt time.Time
|
|
|
|
// Start defines the moment of time when Alert has become firing
|
2020-03-13 11:19:31 +01:00
|
|
|
Start time.Time
|
2021-09-13 14:48:18 +02:00
|
|
|
// End defines the moment of time when Alert supposed to expire
|
|
|
|
End time.Time
|
2022-03-29 15:09:07 +02:00
|
|
|
// ResolvedAt defines the moment when Alert was switched from Firing to Inactive
|
|
|
|
ResolvedAt time.Time
|
2022-03-16 16:26:33 +01:00
|
|
|
// LastSent defines the moment when Alert was sent last time
|
|
|
|
LastSent time.Time
|
2021-09-13 14:48:18 +02:00
|
|
|
// Value stores the value returned from evaluating expression from Expr field
|
2020-03-13 11:19:31 +01:00
|
|
|
Value float64
|
2021-09-13 14:48:18 +02:00
|
|
|
// ID is the unique identifer for the Alert
|
|
|
|
ID uint64
|
2021-10-22 11:30:38 +02:00
|
|
|
// Restored is true if Alert was restored after restart
|
|
|
|
Restored bool
|
2020-03-13 11:19:31 +01:00
|
|
|
}
|
|
|
|
|
2020-04-06 13:44:03 +02:00
|
|
|
// AlertState type indicates the Alert state
|
|
|
|
type AlertState int
|
|
|
|
|
|
|
|
const (
|
|
|
|
// StateInactive is the state of an alert that is neither firing nor pending.
|
|
|
|
StateInactive AlertState = iota
|
|
|
|
// StatePending is the state of an alert that has been active for less than
|
|
|
|
// the configured threshold duration.
|
|
|
|
StatePending
|
|
|
|
// StateFiring is the state of an alert that has been active for longer than
|
|
|
|
// the configured threshold duration.
|
|
|
|
StateFiring
|
|
|
|
)
|
|
|
|
|
2020-04-11 11:40:24 +02:00
|
|
|
// String stringer for AlertState
|
|
|
|
func (as AlertState) String() string {
|
|
|
|
switch as {
|
|
|
|
case StateFiring:
|
|
|
|
return "firing"
|
|
|
|
case StatePending:
|
|
|
|
return "pending"
|
|
|
|
}
|
|
|
|
return "inactive"
|
|
|
|
}
|
|
|
|
|
2020-12-19 13:10:59 +01:00
|
|
|
// AlertTplData is used to execute templating
|
|
|
|
type AlertTplData struct {
|
2020-04-06 13:44:03 +02:00
|
|
|
Labels map[string]string
|
|
|
|
Value float64
|
2020-05-18 10:55:16 +02:00
|
|
|
Expr string
|
2020-03-27 17:31:16 +01:00
|
|
|
}
|
|
|
|
|
2022-02-15 14:59:45 +01:00
|
|
|
var tplHeaders = []string{
|
|
|
|
"{{ $value := .Value }}",
|
|
|
|
"{{ $labels := .Labels }}",
|
|
|
|
"{{ $expr := .Expr }}",
|
|
|
|
"{{ $externalLabels := .ExternalLabels }}",
|
|
|
|
"{{ $externalURL := .ExternalURL }}",
|
|
|
|
}
|
2020-03-27 17:31:16 +01:00
|
|
|
|
2020-12-19 13:10:59 +01:00
|
|
|
// ExecTemplate executes the Alert template for given
|
2020-04-06 13:44:03 +02:00
|
|
|
// map of annotations.
|
2020-12-14 19:11:45 +01:00
|
|
|
// Every alert could have a different datasource, so function
|
|
|
|
// requires a queryFunction as an argument.
|
2022-05-14 11:38:44 +02:00
|
|
|
func (a *Alert) ExecTemplate(q templates.QueryFn, labels, annotations map[string]string) (map[string]string, error) {
|
vmalert: fix labels and annotations processing for alerts (#2403)
To improve compatibility with Prometheus alerting the order of
templates processing has changed.
Before, vmalert did all labels processing beforehand. It meant
all extra labels (such as `alertname`, `alertgroup` or rule labels)
were available in templating. All collisions were resolved in favour
of extra labels.
In Prometheus, only labels from the received metric are available in
templating, so no collisions are possible.
This change makes vmalert's behaviour similar to Prometheus.
For example, consider alerting rule which is triggered by time series
with `alertname` label. In vmalert, this label would be overriden
by alerting rule's name everywhere: for alert labels, for annotations, etc.
In Prometheus, it would be overriden for alert's labels only, but in annotations
the original label value would be available.
See more details here https://github.com/prometheus/compliance/issues/80
Signed-off-by: hagen1778 <roman@victoriametrics.com>
2022-04-06 20:24:45 +02:00
|
|
|
tplData := AlertTplData{Value: a.Value, Labels: labels, Expr: a.Expr}
|
2022-05-14 11:38:44 +02:00
|
|
|
tmpl, err := templates.GetWithFuncs(templates.FuncsWithQuery(q))
|
|
|
|
if err != nil {
|
|
|
|
return nil, fmt.Errorf("error getting a template: %w", err)
|
|
|
|
}
|
|
|
|
return templateAnnotations(annotations, tplData, tmpl, true)
|
2020-03-13 11:19:31 +01:00
|
|
|
}
|
|
|
|
|
2020-12-19 13:10:59 +01:00
|
|
|
// ExecTemplate executes the given template for given annotations map.
|
2022-05-14 11:38:44 +02:00
|
|
|
func ExecTemplate(q templates.QueryFn, annotations map[string]string, tplData AlertTplData) (map[string]string, error) {
|
|
|
|
tmpl, err := templates.GetWithFuncs(templates.FuncsWithQuery(q))
|
|
|
|
if err != nil {
|
|
|
|
return nil, fmt.Errorf("error cloning template: %w", err)
|
|
|
|
}
|
|
|
|
return templateAnnotations(annotations, tplData, tmpl, true)
|
2020-12-19 13:10:59 +01:00
|
|
|
}
|
|
|
|
|
2020-04-26 13:15:04 +02:00
|
|
|
// ValidateTemplates validate annotations for possible template error, uses empty data for template population
|
|
|
|
func ValidateTemplates(annotations map[string]string) error {
|
2022-05-14 11:38:44 +02:00
|
|
|
tmpl, err := templates.Get()
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
_, err = templateAnnotations(annotations, AlertTplData{
|
2020-04-06 13:44:03 +02:00
|
|
|
Labels: map[string]string{},
|
|
|
|
Value: 0,
|
2022-05-14 11:38:44 +02:00
|
|
|
}, tmpl, false)
|
2020-04-06 13:44:03 +02:00
|
|
|
return err
|
2020-03-27 17:31:16 +01:00
|
|
|
}
|
|
|
|
|
2022-05-14 11:38:44 +02:00
|
|
|
func templateAnnotations(annotations map[string]string, data AlertTplData, tmpl *textTpl.Template, execute bool) (map[string]string, error) {
|
2020-03-27 17:31:16 +01:00
|
|
|
var builder strings.Builder
|
|
|
|
var buf bytes.Buffer
|
2020-06-29 21:21:03 +02:00
|
|
|
eg := new(utils.ErrGroup)
|
2020-03-27 17:31:16 +01:00
|
|
|
r := make(map[string]string, len(annotations))
|
2022-02-15 14:59:45 +01:00
|
|
|
tData := tplData{data, externalLabels, externalURL}
|
|
|
|
header := strings.Join(tplHeaders, "")
|
2020-03-27 17:31:16 +01:00
|
|
|
for key, text := range annotations {
|
|
|
|
buf.Reset()
|
|
|
|
builder.Reset()
|
2022-02-15 14:59:45 +01:00
|
|
|
builder.Grow(len(header) + len(text))
|
|
|
|
builder.WriteString(header)
|
2020-03-27 17:31:16 +01:00
|
|
|
builder.WriteString(text)
|
2022-05-14 11:38:44 +02:00
|
|
|
if err := templateAnnotation(&buf, builder.String(), tData, tmpl, execute); err != nil {
|
2021-07-28 18:26:20 +02:00
|
|
|
r[key] = text
|
2020-06-30 21:58:18 +02:00
|
|
|
eg.Add(fmt.Errorf("key %q, template %q: %w", key, text, err))
|
2020-03-13 11:19:31 +01:00
|
|
|
continue
|
|
|
|
}
|
2020-03-27 17:31:16 +01:00
|
|
|
r[key] = buf.String()
|
2020-03-13 11:19:31 +01:00
|
|
|
}
|
2020-06-29 21:21:03 +02:00
|
|
|
return r, eg.Err()
|
2020-03-29 00:48:30 +01:00
|
|
|
}
|
|
|
|
|
2022-02-15 14:59:45 +01:00
|
|
|
type tplData struct {
|
|
|
|
AlertTplData
|
|
|
|
ExternalLabels map[string]string
|
|
|
|
ExternalURL string
|
|
|
|
}
|
|
|
|
|
2022-05-14 11:38:44 +02:00
|
|
|
func templateAnnotation(dst io.Writer, text string, data tplData, tmpl *textTpl.Template, execute bool) error {
|
|
|
|
tpl, err := tmpl.Clone()
|
2020-03-29 00:48:30 +01:00
|
|
|
if err != nil {
|
2022-05-14 11:38:44 +02:00
|
|
|
return fmt.Errorf("error cloning template before parse annotation: %w", err)
|
|
|
|
}
|
|
|
|
tpl, err = tpl.Parse(text)
|
|
|
|
if err != nil {
|
|
|
|
return fmt.Errorf("error parsing annotation template: %w", err)
|
|
|
|
}
|
|
|
|
if !execute {
|
|
|
|
return nil
|
2020-03-29 00:48:30 +01:00
|
|
|
}
|
2022-05-02 10:16:16 +02:00
|
|
|
if !execute {
|
|
|
|
return nil
|
|
|
|
}
|
2020-03-29 00:48:30 +01:00
|
|
|
if err = tpl.Execute(dst, data); err != nil {
|
2020-06-01 12:46:37 +02:00
|
|
|
return fmt.Errorf("error evaluating annotation template: %w", err)
|
2020-03-29 00:48:30 +01:00
|
|
|
}
|
|
|
|
return nil
|
|
|
|
}
|
2022-04-09 08:21:16 +02:00
|
|
|
|
|
|
|
func (a Alert) toPromLabels(relabelCfg *promrelabel.ParsedConfigs) []prompbmarshal.Label {
|
|
|
|
var labels []prompbmarshal.Label
|
|
|
|
for k, v := range a.Labels {
|
|
|
|
labels = append(labels, prompbmarshal.Label{
|
|
|
|
Name: k,
|
|
|
|
Value: v,
|
|
|
|
})
|
|
|
|
}
|
|
|
|
promrelabel.SortLabels(labels)
|
|
|
|
if relabelCfg != nil {
|
|
|
|
return relabelCfg.Apply(labels, 0, false)
|
|
|
|
}
|
|
|
|
return labels
|
|
|
|
}
|