2020-06-01 12:46:37 +02:00
|
|
|
package config
|
|
|
|
|
|
|
|
import (
|
2020-09-11 21:14:30 +02:00
|
|
|
"crypto/md5"
|
2020-06-01 12:46:37 +02:00
|
|
|
"fmt"
|
2020-06-15 21:15:47 +02:00
|
|
|
"hash/fnv"
|
2020-06-01 12:46:37 +02:00
|
|
|
"io/ioutil"
|
|
|
|
"path/filepath"
|
2020-06-15 21:15:47 +02:00
|
|
|
"sort"
|
2020-06-01 12:46:37 +02:00
|
|
|
"strings"
|
|
|
|
"time"
|
|
|
|
|
|
|
|
"github.com/VictoriaMetrics/VictoriaMetrics/app/vmalert/notifier"
|
2020-08-13 15:43:55 +02:00
|
|
|
"github.com/VictoriaMetrics/VictoriaMetrics/lib/envtemplate"
|
2020-09-03 10:04:42 +02:00
|
|
|
"github.com/VictoriaMetrics/VictoriaMetrics/lib/logger"
|
2020-06-01 12:46:37 +02:00
|
|
|
"github.com/VictoriaMetrics/metricsql"
|
2020-06-15 21:15:47 +02:00
|
|
|
"gopkg.in/yaml.v2"
|
2020-06-01 12:46:37 +02:00
|
|
|
)
|
|
|
|
|
|
|
|
// Group contains list of Rules grouped into
|
|
|
|
// entity with one name and evaluation interval
|
|
|
|
type Group struct {
|
2020-06-09 14:21:20 +02:00
|
|
|
File string
|
|
|
|
Name string `yaml:"name"`
|
|
|
|
Interval time.Duration `yaml:"interval,omitempty"`
|
|
|
|
Rules []Rule `yaml:"rules"`
|
|
|
|
Concurrency int `yaml:"concurrency"`
|
2020-09-11 21:14:30 +02:00
|
|
|
// Checksum stores the hash of yaml definition for this group.
|
|
|
|
// May be used to detect any changes like rules re-ordering etc.
|
|
|
|
Checksum string
|
2020-06-01 12:46:37 +02:00
|
|
|
|
|
|
|
// Catches all undefined fields and must be empty after parsing.
|
|
|
|
XXX map[string]interface{} `yaml:",inline"`
|
|
|
|
}
|
|
|
|
|
2020-09-11 21:14:30 +02:00
|
|
|
// UnmarshalYAML implements the yaml.Unmarshaler interface.
|
|
|
|
func (g *Group) UnmarshalYAML(unmarshal func(interface{}) error) error {
|
|
|
|
type group Group
|
|
|
|
if err := unmarshal((*group)(g)); err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
b, err := yaml.Marshal(g)
|
|
|
|
if err != nil {
|
2020-09-23 21:46:24 +02:00
|
|
|
return fmt.Errorf("failed to marshal group configuration for checksum: %w", err)
|
2020-09-11 21:14:30 +02:00
|
|
|
}
|
|
|
|
h := md5.New()
|
|
|
|
h.Write(b)
|
|
|
|
g.Checksum = fmt.Sprintf("%x", h.Sum(nil))
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2020-06-01 12:46:37 +02:00
|
|
|
// Validate check for internal Group or Rule configuration errors
|
2020-06-06 22:27:09 +02:00
|
|
|
func (g *Group) Validate(validateAnnotations, validateExpressions bool) error {
|
2020-06-01 12:46:37 +02:00
|
|
|
if g.Name == "" {
|
|
|
|
return fmt.Errorf("group name must be set")
|
|
|
|
}
|
|
|
|
if len(g.Rules) == 0 {
|
|
|
|
return fmt.Errorf("group %q can't contain no rules", g.Name)
|
|
|
|
}
|
2020-06-15 21:15:47 +02:00
|
|
|
uniqueRules := map[uint64]struct{}{}
|
2020-06-01 12:46:37 +02:00
|
|
|
for _, r := range g.Rules {
|
|
|
|
ruleName := r.Record
|
|
|
|
if r.Alert != "" {
|
|
|
|
ruleName = r.Alert
|
|
|
|
}
|
2020-06-15 21:15:47 +02:00
|
|
|
if _, ok := uniqueRules[r.ID]; ok {
|
|
|
|
return fmt.Errorf("rule %q duplicate", ruleName)
|
2020-06-01 12:46:37 +02:00
|
|
|
}
|
2020-06-15 21:15:47 +02:00
|
|
|
uniqueRules[r.ID] = struct{}{}
|
2020-06-01 12:46:37 +02:00
|
|
|
if err := r.Validate(); err != nil {
|
2020-06-30 21:58:18 +02:00
|
|
|
return fmt.Errorf("invalid rule %q.%q: %w", g.Name, ruleName, err)
|
2020-06-01 12:46:37 +02:00
|
|
|
}
|
2020-06-06 22:27:09 +02:00
|
|
|
if validateExpressions {
|
|
|
|
if _, err := metricsql.Parse(r.Expr); err != nil {
|
2020-06-30 21:58:18 +02:00
|
|
|
return fmt.Errorf("invalid expression for rule %q.%q: %w", g.Name, ruleName, err)
|
2020-06-06 22:27:09 +02:00
|
|
|
}
|
2020-06-01 12:46:37 +02:00
|
|
|
}
|
2020-06-06 22:27:09 +02:00
|
|
|
if validateAnnotations {
|
|
|
|
if err := notifier.ValidateTemplates(r.Annotations); err != nil {
|
2020-06-30 21:58:18 +02:00
|
|
|
return fmt.Errorf("invalid annotations for rule %q.%q: %w", g.Name, ruleName, err)
|
2020-06-06 22:27:09 +02:00
|
|
|
}
|
|
|
|
if err := notifier.ValidateTemplates(r.Labels); err != nil {
|
2020-06-30 21:58:18 +02:00
|
|
|
return fmt.Errorf("invalid labels for rule %q.%q: %w", g.Name, ruleName, err)
|
2020-06-06 22:27:09 +02:00
|
|
|
}
|
2020-06-01 12:46:37 +02:00
|
|
|
}
|
|
|
|
}
|
|
|
|
return checkOverflow(g.XXX, fmt.Sprintf("group %q", g.Name))
|
|
|
|
}
|
|
|
|
|
|
|
|
// Rule describes entity that represent either
|
|
|
|
// recording rule or alerting rule.
|
|
|
|
type Rule struct {
|
2020-06-15 21:15:47 +02:00
|
|
|
ID uint64
|
2020-06-01 12:46:37 +02:00
|
|
|
Record string `yaml:"record,omitempty"`
|
|
|
|
Alert string `yaml:"alert,omitempty"`
|
|
|
|
Expr string `yaml:"expr"`
|
2020-10-08 19:12:57 +02:00
|
|
|
For PromDuration `yaml:"for,omitempty"`
|
2020-06-01 12:46:37 +02:00
|
|
|
Labels map[string]string `yaml:"labels,omitempty"`
|
|
|
|
Annotations map[string]string `yaml:"annotations,omitempty"`
|
2020-06-15 21:15:47 +02:00
|
|
|
|
|
|
|
// Catches all undefined fields and must be empty after parsing.
|
|
|
|
XXX map[string]interface{} `yaml:",inline"`
|
|
|
|
}
|
|
|
|
|
2020-10-08 19:12:57 +02:00
|
|
|
// PromDuration is a Prometheus-style duration.
type PromDuration struct {
	// milliseconds is the duration length expressed in milliseconds.
	milliseconds int64
}
|
|
|
|
|
|
|
|
// NewPromDuration returns PromDuration for given d.
|
|
|
|
func NewPromDuration(d time.Duration) PromDuration {
|
|
|
|
return PromDuration{
|
|
|
|
milliseconds: d.Milliseconds(),
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// UnmarshalYAML implements yaml.Unmarshaler interface.
|
|
|
|
func (pd *PromDuration) UnmarshalYAML(unmarshal func(interface{}) error) error {
|
|
|
|
var s string
|
|
|
|
if err := unmarshal(&s); err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
ms, err := metricsql.DurationValue(s, 0)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
pd.milliseconds = ms
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
|
|
|
// Duration returns duration for pd.
|
|
|
|
func (pd *PromDuration) Duration() time.Duration {
|
|
|
|
return time.Duration(pd.milliseconds) * time.Millisecond
|
|
|
|
}
|
|
|
|
|
2020-06-15 21:15:47 +02:00
|
|
|
// UnmarshalYAML implements the yaml.Unmarshaler interface.
|
|
|
|
func (r *Rule) UnmarshalYAML(unmarshal func(interface{}) error) error {
|
|
|
|
type rule Rule
|
|
|
|
if err := unmarshal((*rule)(r)); err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
r.ID = HashRule(*r)
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2020-07-28 13:20:31 +02:00
|
|
|
// Name returns Rule name according to its type
|
|
|
|
func (r *Rule) Name() string {
|
|
|
|
if r.Record != "" {
|
|
|
|
return r.Record
|
|
|
|
}
|
|
|
|
return r.Alert
|
|
|
|
}
|
|
|
|
|
2020-06-15 21:15:47 +02:00
|
|
|
// HashRule hashes significant Rule fields into
|
2020-09-11 21:14:30 +02:00
|
|
|
// unique hash that supposed to define Rule uniqueness
|
2020-06-15 21:15:47 +02:00
|
|
|
func HashRule(r Rule) uint64 {
|
|
|
|
h := fnv.New64a()
|
|
|
|
h.Write([]byte(r.Expr))
|
|
|
|
if r.Record != "" {
|
|
|
|
h.Write([]byte("recording"))
|
|
|
|
h.Write([]byte(r.Record))
|
|
|
|
} else {
|
|
|
|
h.Write([]byte("alerting"))
|
|
|
|
h.Write([]byte(r.Alert))
|
|
|
|
}
|
2020-09-11 21:14:30 +02:00
|
|
|
kv := sortMap(r.Labels)
|
2020-06-15 21:15:47 +02:00
|
|
|
for _, i := range kv {
|
|
|
|
h.Write([]byte(i.key))
|
|
|
|
h.Write([]byte(i.value))
|
|
|
|
h.Write([]byte("\xff"))
|
|
|
|
}
|
|
|
|
return h.Sum64()
|
2020-06-01 12:46:37 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
// Validate check for Rule configuration errors
|
|
|
|
func (r *Rule) Validate() error {
|
|
|
|
if (r.Record == "" && r.Alert == "") || (r.Record != "" && r.Alert != "") {
|
|
|
|
return fmt.Errorf("either `record` or `alert` must be set")
|
|
|
|
}
|
|
|
|
if r.Expr == "" {
|
|
|
|
return fmt.Errorf("expression can't be empty")
|
|
|
|
}
|
2020-06-15 21:15:47 +02:00
|
|
|
return checkOverflow(r.XXX, "rule")
|
2020-06-01 12:46:37 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
// Parse parses rule configs from given file patterns
|
2020-06-06 22:27:09 +02:00
|
|
|
func Parse(pathPatterns []string, validateAnnotations, validateExpressions bool) ([]Group, error) {
|
2020-06-01 12:46:37 +02:00
|
|
|
var fp []string
|
|
|
|
for _, pattern := range pathPatterns {
|
|
|
|
matches, err := filepath.Glob(pattern)
|
|
|
|
if err != nil {
|
2020-06-30 21:58:18 +02:00
|
|
|
return nil, fmt.Errorf("error reading file pattern %s: %w", pattern, err)
|
2020-06-01 12:46:37 +02:00
|
|
|
}
|
|
|
|
fp = append(fp, matches...)
|
|
|
|
}
|
|
|
|
var groups []Group
|
|
|
|
for _, file := range fp {
|
|
|
|
uniqueGroups := map[string]struct{}{}
|
|
|
|
gr, err := parseFile(file)
|
|
|
|
if err != nil {
|
|
|
|
return nil, fmt.Errorf("failed to parse file %q: %w", file, err)
|
|
|
|
}
|
|
|
|
for _, g := range gr {
|
2020-06-06 22:27:09 +02:00
|
|
|
if err := g.Validate(validateAnnotations, validateExpressions); err != nil {
|
2020-06-30 21:58:18 +02:00
|
|
|
return nil, fmt.Errorf("invalid group %q in file %q: %w", g.Name, file, err)
|
2020-06-01 12:46:37 +02:00
|
|
|
}
|
|
|
|
if _, ok := uniqueGroups[g.Name]; ok {
|
|
|
|
return nil, fmt.Errorf("group name %q duplicate in file %q", g.Name, file)
|
|
|
|
}
|
|
|
|
uniqueGroups[g.Name] = struct{}{}
|
|
|
|
g.File = file
|
|
|
|
groups = append(groups, g)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if len(groups) < 1 {
|
2020-09-03 10:04:42 +02:00
|
|
|
logger.Warnf("no groups found in %s", strings.Join(pathPatterns, ";"))
|
2020-06-01 12:46:37 +02:00
|
|
|
}
|
|
|
|
return groups, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func parseFile(path string) ([]Group, error) {
|
|
|
|
data, err := ioutil.ReadFile(path)
|
|
|
|
if err != nil {
|
|
|
|
return nil, fmt.Errorf("error reading alert rule file: %w", err)
|
|
|
|
}
|
2020-08-13 15:43:55 +02:00
|
|
|
data = envtemplate.Replace(data)
|
2020-06-01 12:46:37 +02:00
|
|
|
g := struct {
|
|
|
|
Groups []Group `yaml:"groups"`
|
|
|
|
// Catches all undefined fields and must be empty after parsing.
|
|
|
|
XXX map[string]interface{} `yaml:",inline"`
|
|
|
|
}{}
|
|
|
|
err = yaml.Unmarshal(data, &g)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
return g.Groups, checkOverflow(g.XXX, "config")
|
|
|
|
}
|
|
|
|
|
|
|
|
// checkOverflow reports an error when m, the catch-all map of yaml fields
// that matched no known key, is not empty. ctx names the entity being
// checked and is included in the error message.
//
// It returns nil for a nil or empty map.
func checkOverflow(m map[string]interface{}, ctx string) error {
	if len(m) == 0 {
		return nil
	}
	keys := make([]string, 0, len(m))
	for k := range m {
		keys = append(keys, k)
	}
	// Map iteration order is random; sort so the message is stable across runs.
	sort.Strings(keys)
	return fmt.Errorf("unknown fields in %s: %s", ctx, strings.Join(keys, ", "))
}
|
2020-09-11 21:14:30 +02:00
|
|
|
|
|
|
|
// item is a single key/value pair taken from a string map.
type item struct {
	key   string
	value string
}
|
|
|
|
|
|
|
|
func sortMap(m map[string]string) []item {
|
|
|
|
var kv []item
|
|
|
|
for k, v := range m {
|
|
|
|
kv = append(kv, item{key: k, value: v})
|
|
|
|
}
|
|
|
|
sort.Slice(kv, func(i, j int) bool {
|
|
|
|
return kv[i].key < kv[j].key
|
|
|
|
})
|
|
|
|
return kv
|
|
|
|
}
|