2020-04-06 13:44:03 +02:00
|
|
|
package notifier
|
2020-02-16 19:59:02 +01:00
|
|
|
|
2020-03-13 11:19:31 +01:00
|
|
|
import (
|
2020-03-27 17:31:16 +01:00
|
|
|
"bytes"
|
2020-03-29 00:48:30 +01:00
|
|
|
"fmt"
|
|
|
|
"io"
|
2020-03-27 17:31:16 +01:00
|
|
|
"strings"
|
2022-05-14 11:38:44 +02:00
|
|
|
textTpl "text/template"
|
2020-03-13 11:19:31 +01:00
|
|
|
"time"
|
2020-06-29 21:21:03 +02:00
|
|
|
|
2022-05-14 11:38:44 +02:00
|
|
|
"github.com/VictoriaMetrics/VictoriaMetrics/app/vmalert/templates"
|
2020-06-29 21:21:03 +02:00
|
|
|
"github.com/VictoriaMetrics/VictoriaMetrics/app/vmalert/utils"
|
2022-04-09 08:21:16 +02:00
|
|
|
"github.com/VictoriaMetrics/VictoriaMetrics/lib/prompbmarshal"
|
|
|
|
"github.com/VictoriaMetrics/VictoriaMetrics/lib/promrelabel"
|
2020-03-13 11:19:31 +01:00
|
|
|
)
|
2020-02-16 19:59:02 +01:00
|
|
|
|
2020-03-13 11:19:31 +01:00
|
|
|
// Alert the triggered alert
|
2020-04-06 13:44:03 +02:00
|
|
|
// TODO: Looks like alert name isn't unique
|
2020-03-13 11:19:31 +01:00
|
|
|
type Alert struct {
|
2021-09-13 14:48:18 +02:00
|
|
|
// GroupID contains the ID of the parent rules group
|
|
|
|
GroupID uint64
|
|
|
|
// Name represents Alert name
|
|
|
|
Name string
|
|
|
|
// Labels is the list of label-value pairs attached to the Alert
|
|
|
|
Labels map[string]string
|
|
|
|
// Annotations is the list of annotations generated on Alert evaluation
|
2020-03-13 11:19:31 +01:00
|
|
|
Annotations map[string]string
|
2021-09-13 14:48:18 +02:00
|
|
|
// State represents the current state of the Alert
|
|
|
|
State AlertState
|
|
|
|
// Expr contains expression that was executed to generate the Alert
|
|
|
|
Expr string
|
2022-03-29 15:09:07 +02:00
|
|
|
// ActiveAt defines the moment of time when Alert has become active
|
|
|
|
ActiveAt time.Time
|
|
|
|
// Start defines the moment of time when Alert has become firing
|
2020-03-13 11:19:31 +01:00
|
|
|
Start time.Time
|
2021-09-13 14:48:18 +02:00
|
|
|
// End defines the moment of time when Alert supposed to expire
|
|
|
|
End time.Time
|
2022-03-29 15:09:07 +02:00
|
|
|
// ResolvedAt defines the moment when Alert was switched from Firing to Inactive
|
|
|
|
ResolvedAt time.Time
|
2022-03-16 16:26:33 +01:00
|
|
|
// LastSent defines the moment when Alert was sent last time
|
|
|
|
LastSent time.Time
|
2023-07-27 15:13:13 +02:00
|
|
|
// KeepFiringSince defines the moment when StateFiring was kept because of `keep_firing_for` instead of real alert
|
|
|
|
KeepFiringSince time.Time
|
2021-09-13 14:48:18 +02:00
|
|
|
// Value stores the value returned from evaluating expression from Expr field
|
2020-03-13 11:19:31 +01:00
|
|
|
Value float64
|
2023-02-13 13:27:13 +01:00
|
|
|
// ID is the unique identifier for the Alert
|
2021-09-13 14:48:18 +02:00
|
|
|
ID uint64
|
2021-10-22 11:30:38 +02:00
|
|
|
// Restored is true if Alert was restored after restart
|
|
|
|
Restored bool
|
2022-12-12 20:16:10 +01:00
|
|
|
// For defines for how long Alert needs to be active to become StateFiring
|
|
|
|
For time.Duration
|
2020-03-13 11:19:31 +01:00
|
|
|
}
|
|
|
|
|
2020-04-06 13:44:03 +02:00
|
|
|
// AlertState type indicates the Alert state
|
|
|
|
type AlertState int
|
|
|
|
|
|
|
|
const (
|
|
|
|
// StateInactive is the state of an alert that is neither firing nor pending.
|
|
|
|
StateInactive AlertState = iota
|
|
|
|
// StatePending is the state of an alert that has been active for less than
|
|
|
|
// the configured threshold duration.
|
|
|
|
StatePending
|
|
|
|
// StateFiring is the state of an alert that has been active for longer than
|
|
|
|
// the configured threshold duration.
|
|
|
|
StateFiring
|
|
|
|
)
|
|
|
|
|
2020-04-11 11:40:24 +02:00
|
|
|
// String stringer for AlertState
|
|
|
|
func (as AlertState) String() string {
|
|
|
|
switch as {
|
|
|
|
case StateFiring:
|
|
|
|
return "firing"
|
|
|
|
case StatePending:
|
|
|
|
return "pending"
|
|
|
|
}
|
|
|
|
return "inactive"
|
|
|
|
}
|
|
|
|
|
2020-12-19 13:10:59 +01:00
|
|
|
// AlertTplData is used to execute templating
|
|
|
|
type AlertTplData struct {
|
2022-08-22 13:32:36 +02:00
|
|
|
Labels map[string]string
|
|
|
|
Value float64
|
|
|
|
Expr string
|
|
|
|
AlertID uint64
|
|
|
|
GroupID uint64
|
|
|
|
ActiveAt time.Time
|
2022-12-12 20:16:10 +01:00
|
|
|
For time.Duration
|
2020-03-27 17:31:16 +01:00
|
|
|
}
|
|
|
|
|
2022-02-15 14:59:45 +01:00
|
|
|
var tplHeaders = []string{
|
|
|
|
"{{ $value := .Value }}",
|
|
|
|
"{{ $labels := .Labels }}",
|
|
|
|
"{{ $expr := .Expr }}",
|
|
|
|
"{{ $externalLabels := .ExternalLabels }}",
|
|
|
|
"{{ $externalURL := .ExternalURL }}",
|
2022-08-16 08:08:27 +02:00
|
|
|
"{{ $alertID := .AlertID }}",
|
|
|
|
"{{ $groupID := .GroupID }}",
|
2022-08-22 13:32:36 +02:00
|
|
|
"{{ $activeAt := .ActiveAt }}",
|
2022-12-12 20:16:10 +01:00
|
|
|
"{{ $for := .For }}",
|
2022-02-15 14:59:45 +01:00
|
|
|
}
|
2020-03-27 17:31:16 +01:00
|
|
|
|
2020-12-19 13:10:59 +01:00
|
|
|
// ExecTemplate executes the Alert template for given
|
2020-04-06 13:44:03 +02:00
|
|
|
// map of annotations.
|
2020-12-14 19:11:45 +01:00
|
|
|
// Every alert could have a different datasource, so function
|
|
|
|
// requires a queryFunction as an argument.
|
2022-05-14 11:38:44 +02:00
|
|
|
func (a *Alert) ExecTemplate(q templates.QueryFn, labels, annotations map[string]string) (map[string]string, error) {
|
2022-12-12 20:16:10 +01:00
|
|
|
tplData := AlertTplData{
|
|
|
|
Value: a.Value,
|
|
|
|
Labels: labels,
|
|
|
|
Expr: a.Expr,
|
|
|
|
AlertID: a.ID,
|
|
|
|
GroupID: a.GroupID,
|
|
|
|
ActiveAt: a.ActiveAt,
|
|
|
|
For: a.For,
|
|
|
|
}
|
2023-03-17 15:57:24 +01:00
|
|
|
return ExecTemplate(q, annotations, tplData)
|
2020-03-13 11:19:31 +01:00
|
|
|
}
|
|
|
|
|
2020-12-19 13:10:59 +01:00
|
|
|
// ExecTemplate executes the given template for given annotations map.
|
2022-05-14 11:38:44 +02:00
|
|
|
func ExecTemplate(q templates.QueryFn, annotations map[string]string, tplData AlertTplData) (map[string]string, error) {
|
|
|
|
tmpl, err := templates.GetWithFuncs(templates.FuncsWithQuery(q))
|
|
|
|
if err != nil {
|
|
|
|
return nil, fmt.Errorf("error cloning template: %w", err)
|
|
|
|
}
|
|
|
|
return templateAnnotations(annotations, tplData, tmpl, true)
|
2020-12-19 13:10:59 +01:00
|
|
|
}
|
|
|
|
|
2020-04-26 13:15:04 +02:00
|
|
|
// ValidateTemplates validate annotations for possible template error, uses empty data for template population
|
|
|
|
func ValidateTemplates(annotations map[string]string) error {
|
2022-05-14 11:38:44 +02:00
|
|
|
tmpl, err := templates.Get()
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
_, err = templateAnnotations(annotations, AlertTplData{
|
2020-04-06 13:44:03 +02:00
|
|
|
Labels: map[string]string{},
|
|
|
|
Value: 0,
|
2022-05-14 11:38:44 +02:00
|
|
|
}, tmpl, false)
|
2020-04-06 13:44:03 +02:00
|
|
|
return err
|
2020-03-27 17:31:16 +01:00
|
|
|
}
|
|
|
|
|
2022-05-14 11:38:44 +02:00
|
|
|
func templateAnnotations(annotations map[string]string, data AlertTplData, tmpl *textTpl.Template, execute bool) (map[string]string, error) {
|
2020-03-27 17:31:16 +01:00
|
|
|
var builder strings.Builder
|
|
|
|
var buf bytes.Buffer
|
2020-06-29 21:21:03 +02:00
|
|
|
eg := new(utils.ErrGroup)
|
2020-03-27 17:31:16 +01:00
|
|
|
r := make(map[string]string, len(annotations))
|
2022-02-15 14:59:45 +01:00
|
|
|
tData := tplData{data, externalLabels, externalURL}
|
|
|
|
header := strings.Join(tplHeaders, "")
|
2020-03-27 17:31:16 +01:00
|
|
|
for key, text := range annotations {
|
|
|
|
buf.Reset()
|
|
|
|
builder.Reset()
|
2022-02-15 14:59:45 +01:00
|
|
|
builder.Grow(len(header) + len(text))
|
|
|
|
builder.WriteString(header)
|
2020-03-27 17:31:16 +01:00
|
|
|
builder.WriteString(text)
|
2022-05-14 11:38:44 +02:00
|
|
|
if err := templateAnnotation(&buf, builder.String(), tData, tmpl, execute); err != nil {
|
2021-07-28 18:26:20 +02:00
|
|
|
r[key] = text
|
2020-06-30 21:58:18 +02:00
|
|
|
eg.Add(fmt.Errorf("key %q, template %q: %w", key, text, err))
|
2020-03-13 11:19:31 +01:00
|
|
|
continue
|
|
|
|
}
|
2020-03-27 17:31:16 +01:00
|
|
|
r[key] = buf.String()
|
2020-03-13 11:19:31 +01:00
|
|
|
}
|
2020-06-29 21:21:03 +02:00
|
|
|
return r, eg.Err()
|
2020-03-29 00:48:30 +01:00
|
|
|
}
|
|
|
|
|
2022-02-15 14:59:45 +01:00
|
|
|
type tplData struct {
|
|
|
|
AlertTplData
|
|
|
|
ExternalLabels map[string]string
|
|
|
|
ExternalURL string
|
|
|
|
}
|
|
|
|
|
2022-05-14 11:38:44 +02:00
|
|
|
func templateAnnotation(dst io.Writer, text string, data tplData, tmpl *textTpl.Template, execute bool) error {
|
|
|
|
tpl, err := tmpl.Clone()
|
2020-03-29 00:48:30 +01:00
|
|
|
if err != nil {
|
2022-05-14 11:38:44 +02:00
|
|
|
return fmt.Errorf("error cloning template before parse annotation: %w", err)
|
|
|
|
}
|
2023-03-30 14:57:00 +02:00
|
|
|
// Clone() doesn't copy tpl Options, so we set them manually
|
|
|
|
tpl = tpl.Option("missingkey=zero")
|
2022-05-14 11:38:44 +02:00
|
|
|
tpl, err = tpl.Parse(text)
|
|
|
|
if err != nil {
|
|
|
|
return fmt.Errorf("error parsing annotation template: %w", err)
|
|
|
|
}
|
|
|
|
if !execute {
|
|
|
|
return nil
|
2020-03-29 00:48:30 +01:00
|
|
|
}
|
|
|
|
if err = tpl.Execute(dst, data); err != nil {
|
2020-06-01 12:46:37 +02:00
|
|
|
return fmt.Errorf("error evaluating annotation template: %w", err)
|
2020-03-29 00:48:30 +01:00
|
|
|
}
|
|
|
|
return nil
|
|
|
|
}
|
2022-04-09 08:21:16 +02:00
|
|
|
|
2024-09-09 13:34:48 +02:00
|
|
|
func (a Alert) applyRelabelingIfNeeded(relabelCfg *promrelabel.ParsedConfigs) []prompbmarshal.Label {
|
2022-04-09 08:21:16 +02:00
|
|
|
var labels []prompbmarshal.Label
|
|
|
|
for k, v := range a.Labels {
|
|
|
|
labels = append(labels, prompbmarshal.Label{
|
2023-12-08 14:53:35 +01:00
|
|
|
Name: promrelabel.SanitizeMetricName(k),
|
2022-04-09 08:21:16 +02:00
|
|
|
Value: v,
|
|
|
|
})
|
|
|
|
}
|
|
|
|
if relabelCfg != nil {
|
2022-10-09 13:51:14 +02:00
|
|
|
labels = relabelCfg.Apply(labels, 0)
|
2022-04-09 08:21:16 +02:00
|
|
|
}
|
2022-10-09 13:51:14 +02:00
|
|
|
promrelabel.SortLabels(labels)
|
2022-04-09 08:21:16 +02:00
|
|
|
return labels
|
|
|
|
}
|