// VictoriaMetrics/app/vmselect/promql/exec.go

package promql

import (
	"flag"
	"fmt"
	"math"
	"sort"
	"strings"
	"sync"
	"sync/atomic"
	"time"

	"github.com/VictoriaMetrics/VictoriaMetrics/app/vmselect/netstorage"
	"github.com/VictoriaMetrics/VictoriaMetrics/lib/logger"
	"github.com/VictoriaMetrics/metrics"
	"github.com/VictoriaMetrics/metricsql"
)

// Command-line flags consulted by the query execution code in this file.
var (
	// logSlowQueryDuration is the threshold at which Exec logs a query as slow; zero or negative disables the logging.
	logSlowQueryDuration   = flag.Duration("search.logSlowQueryDuration", 5*time.Second, "Log queries with execution time exceeding this value. Zero disables slow query logging")
	// treatDotsAsIsInRegexps enables escaping of dots in regexp label filters when a query is parsed.
	treatDotsAsIsInRegexps = flag.Bool("search.treatDotsAsIsInRegexps", false, "Whether to treat dots as is in regexp label filters used in queries. "+
		`For example, foo{bar=~"a.b.c"} will be automatically converted to foo{bar=~"a\\.b\\.c"}, i.e. all the dots in regexp filters will be automatically escaped `+
		`in order to match only dot char instead of matching any char. Dots in ".+", ".*" and ".{n}" regexps aren't escaped. `+
		`Such escaping can be useful when querying Graphite data`)
)

// slowQueries counts the queries whose execution time reached -search.logSlowQueryDuration.
var slowQueries = metrics.NewCounter(`vm_slow_queries_total`)

// Exec parses the query q, evaluates it against ec and returns the resulting series.
//
// If isFirstPointOnly is set, every evaluated series is cut down to its first point
// before being converted to the output form.
//
// When -search.logSlowQueryDuration is positive, a warning is logged and
// the slow queries counter is incremented for calls lasting at least that long.
func Exec(ec *EvalConfig, q string, isFirstPointOnly bool) ([]netstorage.Result, error) {
	if *logSlowQueryDuration > 0 {
		begin := time.Now()
		defer func() {
			elapsed := time.Since(begin)
			if elapsed < *logSlowQueryDuration {
				return
			}
			logger.Warnf("slow query according to -search.logSlowQueryDuration=%s: remoteAddr=%s, duration=%.3f seconds, start=%d, end=%d, step=%d, accountID=%d, projectID=%d, query=%q",
				*logSlowQueryDuration, ec.QuotedRemoteAddr, elapsed.Seconds(), ec.Start/1000, ec.End/1000, ec.Step/1000, ec.AuthToken.AccountID, ec.AuthToken.ProjectID, q)
			slowQueries.Inc()
		}()
	}

	ec.validate()

	expr, err := parsePromQLWithCache(q)
	if err != nil {
		return nil, err
	}

	// Keep the query registered as active only for the duration of the evaluation.
	queryID := activeQueriesV.Add(ec, q)
	series, err := evalExpr(ec, expr)
	activeQueriesV.Remove(queryID)
	if err != nil {
		return nil, err
	}

	if isFirstPointOnly {
		// Keep only the leading point of each series.
		for i := range series {
			s := series[i]
			s.Values = s.Values[:1]
			s.Timestamps = s.Timestamps[:1]
		}
	}

	results, err := timeseriesToResult(series, maySortResults(expr, series))
	if err != nil {
		return nil, err
	}
	return results, nil
}

// maySortResults reports whether the results of e may be re-ordered by metric name.
//
// Sorting is skipped when there are more than 100 series, and when the top-level
// expression is one of the explicit sorting functions, since their output order
// must be preserved. The function name is compared case-insensitively, in the same
// way isScalarExpr treats function names, so that e.g. `SORT(foo)` keeps its order.
func maySortResults(e metricsql.Expr, tss []*timeseries) bool {
	if len(tss) > 100 {
		// There is no sense in sorting a lot of results
		return false
	}
	fe, ok := e.(*metricsql.FuncExpr)
	if !ok {
		return true
	}
	switch strings.ToLower(fe.Name) {
	case "sort", "sort_desc",
		"sort_by_label", "sort_by_label_desc":
		return false
	default:
		return true
	}
}

// timeseriesToResult converts tss into netstorage.Result entries.
//
// Series consisting solely of NaN values are dropped first. This filtering is done
// by removeNaNs in place, so the slice passed by the caller is modified.
// An error is returned if two remaining series marshal to the same sorted metric name.
// If maySort is set, the results are ordered by their marshaled metric name.
func timeseriesToResult(tss []*timeseries, maySort bool) ([]netstorage.Result, error) {
	tss = removeNaNs(tss)
	result := make([]netstorage.Result, len(tss))
	m := make(map[string]struct{}, len(tss))
	bb := bbPool.Get()
	// Hand the scratch buffer back to the pool on every exit path,
	// including the duplicate-series error below.
	defer bbPool.Put(bb)
	for i, ts := range tss {
		bb.B = marshalMetricNameSorted(bb.B[:0], &ts.MetricName)
		if _, ok := m[string(bb.B)]; ok {
			return nil, fmt.Errorf(`duplicate output timeseries: %s`, stringMetricName(&ts.MetricName))
		}
		m[string(bb.B)] = struct{}{}

		// Copy everything out of ts and bb, since bb is reused on the next iteration.
		rs := &result[i]
		rs.MetricNameMarshaled = append(rs.MetricNameMarshaled[:0], bb.B...)
		rs.MetricName.CopyFrom(&ts.MetricName)
		rs.Values = append(rs.Values[:0], ts.Values...)
		rs.Timestamps = append(rs.Timestamps[:0], ts.Timestamps...)
	}

	if maySort {
		sort.Slice(result, func(i, j int) bool {
			return string(result[i].MetricNameMarshaled) < string(result[j].MetricNameMarshaled)
		})
	}

	return result, nil
}

// removeNaNs filters out the series whose values are all NaN.
//
// The filtering is done in place: the kept series are compacted to the front of tss
// and the returned slice shares the backing array with tss.
func removeNaNs(tss []*timeseries) []*timeseries {
	kept := 0
scan:
	for _, series := range tss {
		for _, value := range series.Values {
			if math.IsNaN(value) {
				continue
			}
			// A non-NaN value has been found, so the series stays.
			tss[kept] = series
			kept++
			continue scan
		}
		// Every value is NaN (or there are no values at all) - drop the series.
	}
	// Clear the tail left after compaction, so GC could reclaim the dropped series.
	for idx := kept; idx < len(tss); idx++ {
		tss[idx] = nil
	}
	return tss[:kept]
}

// adjustCmpOps rewrites comparisons of the form `scalar cmpOp query` inside e
// into `query reverseCmpOp scalar` and returns e.
//
// This mirrors Prometheus behavior: `0.5 < foo` becomes `foo > 0.5`, so the values
// of `foo` that are bigger than 0.5 are returned. The expression is modified in place.
func adjustCmpOps(e metricsql.Expr) metricsql.Expr {
	swapOperands := func(node metricsql.Expr) {
		binOp, isBinary := node.(*metricsql.BinaryOpExpr)
		if !isBinary || !metricsql.IsBinaryOpCmp(binOp.Op) {
			return
		}
		// Only a scalar on the left with a non-number on the right needs swapping.
		if !isScalarExpr(binOp.Left) || isNumberExpr(binOp.Right) {
			return
		}
		binOp.Left, binOp.Right = binOp.Right, binOp.Left
		binOp.Op = getReverseCmpOp(binOp.Op)
	}
	metricsql.VisitAll(e, swapOperands)
	return e
}

// isNumberExpr reports whether e is a *metricsql.NumberExpr.
func isNumberExpr(e metricsql.Expr) bool {
	switch e.(type) {
	case *metricsql.NumberExpr:
		return true
	default:
		return false
	}
}

// isScalarExpr reports whether e is treated as a scalar:
// either a number or a call to the time() function (matched case-insensitively).
func isScalarExpr(e metricsql.Expr) bool {
	switch expr := e.(type) {
	case *metricsql.NumberExpr:
		return true
	case *metricsql.FuncExpr:
		// time() returns scalar in PromQL - see https://prometheus.io/docs/prometheus/latest/querying/functions/#time
		name := strings.ToLower(expr.Name)
		return name == "time"
	default:
		return false
	}
}

// getReverseCmpOp returns the comparison operator to use after the operands of op
// have been swapped. Any op other than `>`, `<`, `>=` and `<=` is returned unchanged.
func getReverseCmpOp(op string) string {
	mirrored := [...][2]string{
		{">", "<"},
		{"<", ">"},
		{">=", "<="},
		{"<=", ">="},
	}
	for _, pair := range mirrored {
		if pair[0] == op {
			return pair[1]
		}
	}
	// `==` and `!=` are symmetric, so they stay as is.
	return op
}

// parsePromQLWithCache returns the parsed expression for q, consulting parseCacheV first.
//
// On a cache miss the query is parsed, optimized, passed through adjustCmpOps and,
// if -search.treatDotsAsIsInRegexps is set, through escapeDotsInRegexpLabelFilters.
// The outcome is cached even when parsing fails, so the error is returned again
// for the same q without re-parsing.
func parsePromQLWithCache(q string) (metricsql.Expr, error) {
	cached := parseCacheV.Get(q)
	if cached == nil {
		expr, parseErr := metricsql.Parse(q)
		if parseErr == nil {
			expr = adjustCmpOps(metricsql.Optimize(expr))
			if *treatDotsAsIsInRegexps {
				expr = escapeDotsInRegexpLabelFilters(expr)
			}
		}
		cached = &parseCacheValue{e: expr, err: parseErr}
		parseCacheV.Put(q, cached)
	}
	if cached.err == nil {
		return cached.e, nil
	}
	return nil, cached.err
}

// escapeDotsInRegexpLabelFilters applies escapeDots to the value of every regexp
// label filter of every metric expression inside e and returns e.
// The expression is modified in place.
func escapeDotsInRegexpLabelFilters(e metricsql.Expr) metricsql.Expr {
	metricsql.VisitAll(e, func(node metricsql.Expr) {
		metricExpr, isMetric := node.(*metricsql.MetricExpr)
		if !isMetric {
			return
		}
		filters := metricExpr.LabelFilters
		for idx := range filters {
			if !filters[idx].IsRegexp {
				continue
			}
			filters[idx].Value = escapeDots(filters[idx].Value)
		}
	})
	return e
}

// escapeDots returns s with regexp dots escaped, so they match only the literal dot char.
//
// A dot is left as is in the following cases:
//   - it is already escaped, i.e. it is preceded by an odd number of `\` chars.
//     An even number of backslashes means the backslashes escape each other
//     (as in `a\\.b`), so the dot itself is unescaped and gets escaped here;
//   - it is followed by one of the '*', '+' or '{' regexp modifiers.
//
// s is returned unchanged if it contains no dots.
func escapeDots(s string) string {
	dotsCount := strings.Count(s, ".")
	if dotsCount <= 0 {
		return s
	}
	// Every escaped dot adds exactly one byte to the output.
	result := make([]byte, 0, len(s)+dotsCount)
	// backslashes is the number of consecutive `\` chars immediately before s[i].
	backslashes := 0
	for i := 0; i < len(s); i++ {
		c := s[i]
		if c == '\\' {
			backslashes++
			result = append(result, c)
			continue
		}
		isEscaped := backslashes%2 == 1
		backslashes = 0
		if c != '.' || isEscaped {
			result = append(result, c)
			continue
		}
		if i+1 < len(s) {
			switch s[i+1] {
			case '*', '+', '{':
				// Keep the `.*`, `.+` and `.{n}` constructs intact.
				result = append(result, c)
				continue
			}
		}
		result = append(result, '\\', '.')
	}
	return string(result)
}

// parseCacheV is the cache used by parsePromQLWithCache.
// Its request, miss and entry counts are exposed as gauges on creation.
var parseCacheV = func() *parseCache {
	cache := &parseCache{m: make(map[string]*parseCacheValue)}
	// expose registers a gauge that reports the uint64 returned by read as float64.
	expose := func(name string, read func() uint64) {
		metrics.NewGauge(name, func() float64 {
			return float64(read())
		})
	}
	expose(`vm_cache_requests_total{type="promql/parse"}`, cache.Requests)
	expose(`vm_cache_misses_total{type="promql/parse"}`, cache.Misses)
	expose(`vm_cache_entries{type="promql/parse"}`, cache.Len)
	return cache
}()

// parseCacheMaxLen is the number of cached entries that, once exceeded,
// makes parseCache.Put evict a part of the cache before adding a new entry.
const parseCacheMaxLen = 10e3

// parseCacheValue is the outcome of parsing a query, as stored in parseCache.
type parseCacheValue struct {
	// e is the prepared expression; it is used only when err is nil.
	e   metricsql.Expr
	// err is the parse error, if any.
	err error
}

// parseCache caches parse outcomes keyed by query string.
type parseCache struct {
	// Move atomic counters to the top of struct for 8-byte alignment on 32-bit arch.
	// See https://github.com/VictoriaMetrics/VictoriaMetrics/issues/212

	// requests is the number of Get calls; it is updated atomically.
	requests uint64
	// misses is the number of Get calls that returned nil; it is updated atomically.
	misses   uint64

	// m maps the query string to its cached parse outcome.
	m  map[string]*parseCacheValue
	// mu guards m.
	mu sync.RWMutex
}

// Requests returns the number of Get calls made on pc so far.
func (pc *parseCache) Requests() uint64 {
	total := atomic.LoadUint64(&pc.requests)
	return total
}

// Misses returns the number of Get calls on pc that found no cached value.
func (pc *parseCache) Misses() uint64 {
	total := atomic.LoadUint64(&pc.misses)
	return total
}

// Len returns the current number of entries in pc.
func (pc *parseCache) Len() uint64 {
	pc.mu.RLock()
	defer pc.mu.RUnlock()
	return uint64(len(pc.m))
}

// Get returns the cached value for q or nil if there is none.
// Every call is counted as a request; calls returning nil are also counted as misses.
func (pc *parseCache) Get(q string) *parseCacheValue {
	atomic.AddUint64(&pc.requests, 1)

	pc.mu.RLock()
	cached := pc.m[q]
	pc.mu.RUnlock()

	if cached != nil {
		return cached
	}
	atomic.AddUint64(&pc.misses, 1)
	return nil
}

// Put stores pcv under q.
// If pc holds more than parseCacheMaxLen entries, 10% of them are evicted first.
func (pc *parseCache) Put(q string, pcv *parseCacheValue) {
	pc.mu.Lock()
	defer pc.mu.Unlock()

	if len(pc.m) > parseCacheMaxLen {
		// The victims are whatever entries the map iteration yields first.
		toEvict := int(float64(len(pc.m)) * 0.1)
		for key := range pc.m {
			delete(pc.m, key)
			toEvict--
			if toEvict <= 0 {
				break
			}
		}
	}
	pc.m[q] = pcv
}
all: open-sourcing single-node version 2019-05-22 23:16:55 +02:00			`package promql`

			`import (`
app/vmselect: log slow queries if their execution time exceeds `-search.logSlowQueryDuration` 2019-05-24 15:12:31 +02:00			`"flag"`
all: open-sourcing single-node version 2019-05-22 23:16:55 +02:00			`"fmt"`
			`"math"`
			`"sort"`
app/vmselect: add `-search.treatDotsAsIsInRegexps` command-line flag for automatic escaping of dots in regexp label filters 2020-11-11 11:38:44 +01:00			`"strings"`
all: open-sourcing single-node version 2019-05-22 23:16:55 +02:00			`"sync"`
			`"sync/atomic"`
app/vmselect: log slow queries if their execution time exceeds `-search.logSlowQueryDuration` 2019-05-24 15:12:31 +02:00			`"time"`
all: open-sourcing single-node version 2019-05-22 23:16:55 +02:00
			`"github.com/VictoriaMetrics/VictoriaMetrics/app/vmselect/netstorage"`
app/vmselect: log slow queries if their execution time exceeds `-search.logSlowQueryDuration` 2019-05-24 15:12:31 +02:00			`"github.com/VictoriaMetrics/VictoriaMetrics/lib/logger"`
all: open-sourcing single-node version 2019-05-22 23:16:55 +02:00			`"github.com/VictoriaMetrics/metrics"`
lib/metricsql: move it to a separate repository - github.com/VictoriaMetrics/metrics 2020-04-28 14:28:22 +02:00			`"github.com/VictoriaMetrics/metricsql"`
all: open-sourcing single-node version 2019-05-22 23:16:55 +02:00			`)`

app/vmselect: add `-search.treatDotsAsIsInRegexps` command-line flag for automatic escaping of dots in regexp label filters 2020-11-11 11:38:44 +01:00			`var (`
			`logSlowQueryDuration = flag.Duration("search.logSlowQueryDuration", 5*time.Second, "Log queries with execution time exceeding this value. Zero disables slow query logging")`
			`treatDotsAsIsInRegexps = flag.Bool("search.treatDotsAsIsInRegexps", false, "Whether to treat dots as is in regexp label filters used in queries. "+`
			`For example, foo{bar=~"a.b.c"} will be automatically converted to foo{bar=~"a\\.b\\.c"}, i.e. all the dots in regexp filters will be automatically escaped `+
			`in order to match only dot char instead of matching any char. Dots in ".+", ".*" and ".{n}" regexps aren't escaped. `+
			`Such escaping can be useful when querying Graphite data`)
			`)`
app/vmselect: log slow queries if their execution time exceeds `-search.logSlowQueryDuration` 2019-05-24 15:12:31 +02:00
app/vmselect/promql: add `vm_slow_queries_total` metric for counting slow queries The query is slow if its execution time exceeds `-search.logSlowQueryDuration` 2019-07-31 02:35:13 +02:00			var slowQueries = metrics.NewCounter(`vm_slow_queries_total`)

app/vmselect: do not return empty time series in `/api/v1/query` result 2019-07-01 16:14:49 +02:00			`// Exec executes q for the given ec.`
			`func Exec(ec *EvalConfig, q string, isFirstPointOnly bool) ([]netstorage.Result, error) {`
app/vmselect: log slow queries if their execution time exceeds `-search.logSlowQueryDuration` 2019-05-24 15:12:31 +02:00			`if *logSlowQueryDuration > 0 {`
			`startTime := time.Now()`
			`defer func() {`
			`d := time.Since(startTime)`
			`if d >= *logSlowQueryDuration {`
app/vmselect: add remoteAddr to slow query log in order to improve debuggability This will simplify identifying the client that sends slow queries to VictoriaMetrics. 2020-11-18 19:37:54 +01:00			`logger.Warnf("slow query according to -search.logSlowQueryDuration=%s: remoteAddr=%s, duration=%.3f seconds, start=%d, end=%d, step=%d, accountID=%d, projectID=%d, query=%q",`
			`*logSlowQueryDuration, ec.QuotedRemoteAddr, d.Seconds(), ec.Start/1000, ec.End/1000, ec.Step/1000, ec.AuthToken.AccountID, ec.AuthToken.ProjectID, q)`
app/vmselect/promql: add `vm_slow_queries_total` metric for counting slow queries The query is slow if its execution time exceeds `-search.logSlowQueryDuration` 2019-07-31 02:35:13 +02:00			`slowQueries.Inc()`
app/vmselect: log slow queries if their execution time exceeds `-search.logSlowQueryDuration` 2019-05-24 15:12:31 +02:00			`}`
			`}()`
			`}`

all: open-sourcing single-node version 2019-05-22 23:16:55 +02:00			`ec.validate()`

			`e, err := parsePromQLWithCache(q)`
			`if err != nil {`
app/vmselect: add `/api/v1/status/active_queries` page with the list of currently running queries This is a follow-up for https://github.com/VictoriaMetrics/VictoriaMetrics/pull/575 Updates https://github.com/VictoriaMetrics/VictoriaMetrics/issues/528 2020-07-08 18:09:16 +02:00			`return nil, err`
all: open-sourcing single-node version 2019-05-22 23:16:55 +02:00			`}`

app/vmselect: add `/api/v1/status/active_queries` page with the list of currently running queries This is a follow-up for https://github.com/VictoriaMetrics/VictoriaMetrics/pull/575 Updates https://github.com/VictoriaMetrics/VictoriaMetrics/issues/528 2020-07-08 18:09:16 +02:00			`qid := activeQueriesV.Add(ec, q)`
all: open-sourcing single-node version 2019-05-22 23:16:55 +02:00			`rv, err := evalExpr(ec, e)`
app/vmselect: add `/api/v1/status/active_queries` page with the list of currently running queries This is a follow-up for https://github.com/VictoriaMetrics/VictoriaMetrics/pull/575 Updates https://github.com/VictoriaMetrics/VictoriaMetrics/issues/528 2020-07-08 18:09:16 +02:00			`activeQueriesV.Remove(qid)`
all: open-sourcing single-node version 2019-05-22 23:16:55 +02:00			`if err != nil {`
app/vmselect: add `/api/v1/status/active_queries` page with the list of currently running queries This is a follow-up for https://github.com/VictoriaMetrics/VictoriaMetrics/pull/575 Updates https://github.com/VictoriaMetrics/VictoriaMetrics/issues/528 2020-07-08 18:09:16 +02:00			`return nil, err`
all: open-sourcing single-node version 2019-05-22 23:16:55 +02:00			`}`

app/vmselect: do not return empty time series in `/api/v1/query` result 2019-07-01 16:14:49 +02:00			`if isFirstPointOnly {`
			`// Remove all the points except the first one from every time series.`
			`for _, ts := range rv {`
			`ts.Values = ts.Values[:1]`
			`ts.Timestamps = ts.Timestamps[:1]`
			`}`
			`}`

all: open-sourcing single-node version 2019-05-22 23:16:55 +02:00			`maySort := maySortResults(e, rv)`
			`result, err := timeseriesToResult(rv, maySort)`
			`if err != nil {`
app/vmselect: add `/api/v1/status/active_queries` page with the list of currently running queries This is a follow-up for https://github.com/VictoriaMetrics/VictoriaMetrics/pull/575 Updates https://github.com/VictoriaMetrics/VictoriaMetrics/issues/528 2020-07-08 18:09:16 +02:00			`return nil, err`
all: open-sourcing single-node version 2019-05-22 23:16:55 +02:00			`}`
app/vmselect: add `/api/v1/status/active_queries` page with the list of currently running queries This is a follow-up for https://github.com/VictoriaMetrics/VictoriaMetrics/pull/575 Updates https://github.com/VictoriaMetrics/VictoriaMetrics/issues/528 2020-07-08 18:09:16 +02:00			`return result, err`
all: open-sourcing single-node version 2019-05-22 23:16:55 +02:00			`}`

Rename lib/promql to lib/metricsql and apply small fixes 2019-12-25 20:35:47 +01:00			`func maySortResults(e metricsql.Expr, tss []*timeseries) bool {`
all: open-sourcing single-node version 2019-05-22 23:16:55 +02:00			`if len(tss) > 100 {`
			`// There is no sense in sorting a lot of results`
			`return false`
			`}`
Rename lib/promql to lib/metricsql and apply small fixes 2019-12-25 20:35:47 +01:00			`fe, ok := e.(*metricsql.FuncExpr)`
all: open-sourcing single-node version 2019-05-22 23:16:55 +02:00			`if !ok {`
			`return true`
			`}`
			`switch fe.Name {`
app/vmselect: add `sort_by_label(q, label)` and `sort_by_label_desc(q, label)` functions This is implementation of https://github.com/prometheus/prometheus/pull/1533 for VictoriaMetrics. 2020-02-13 16:00:47 +01:00			`case "sort", "sort_desc",`
			`"sort_by_label", "sort_by_label_desc":`
all: open-sourcing single-node version 2019-05-22 23:16:55 +02:00			`return false`
			`default:`
			`return true`
			`}`
			`}`

			`func timeseriesToResult(tss []*timeseries, maySort bool) ([]netstorage.Result, error) {`
			`tss = removeNaNs(tss)`
			`result := make([]netstorage.Result, len(tss))`
app/vmselect/promql: pre-allocate memory for map for checking for duplicate timeseries This should reduce memory allocations for big number of timeseries 2019-08-20 21:51:45 +02:00			`m := make(map[string]struct{}, len(tss))`
all: open-sourcing single-node version 2019-05-22 23:16:55 +02:00			`bb := bbPool.Get()`
			`for i, ts := range tss {`
			`bb.B = marshalMetricNameSorted(bb.B[:0], &ts.MetricName)`
app/vmselect/promql: pre-allocate memory for map for checking for duplicate timeseries This should reduce memory allocations for big number of timeseries 2019-08-20 21:51:45 +02:00			`if _, ok := m[string(bb.B)]; ok {`
app/vmselect/promql: add `histogram` aggregate function, which is useful for building heatmaps from multiple time series 2019-11-23 23:02:18 +01:00			return nil, fmt.Errorf(`duplicate output timeseries: %s`, stringMetricName(&ts.MetricName))
all: open-sourcing single-node version 2019-05-22 23:16:55 +02:00			`}`
app/vmselect/promql: pre-allocate memory for map for checking for duplicate timeseries This should reduce memory allocations for big number of timeseries 2019-08-20 21:51:45 +02:00			`m[string(bb.B)] = struct{}{}`
all: open-sourcing single-node version 2019-05-22 23:16:55 +02:00
			`rs := &result[i]`
			`rs.MetricNameMarshaled = append(rs.MetricNameMarshaled[:0], bb.B...)`
			`rs.MetricName.CopyFrom(&ts.MetricName)`
			`rs.Values = append(rs.Values[:0], ts.Values...)`
			`rs.Timestamps = append(rs.Timestamps[:0], ts.Timestamps...)`
			`}`
			`bbPool.Put(bb)`

			`if maySort {`
			`sort.Slice(result, func(i, j int) bool {`
			`return string(result[i].MetricNameMarshaled) < string(result[j].MetricNameMarshaled)`
			`})`
			`}`

			`return result, nil`
			`}`

			`func removeNaNs(tss []timeseries) []timeseries {`
			`rvs := tss[:0]`
			`for _, ts := range tss {`
app/vmselect/promql: remove empty time series after applying filters like `q > 0` This should reduce CPU and RAM usage for queries over high number of time series. 2019-07-12 18:56:23 +02:00			`allNans := true`
all: open-sourcing single-node version 2019-05-22 23:16:55 +02:00			`for _, v := range ts.Values {`
app/vmselect/promql: remove empty time series after applying filters like `q > 0` This should reduce CPU and RAM usage for queries over high number of time series. 2019-07-12 18:56:23 +02:00			`if !math.IsNaN(v) {`
			`allNans = false`
			`break`
all: open-sourcing single-node version 2019-05-22 23:16:55 +02:00			`}`
			`}`
app/vmselect/promql: remove empty time series after applying filters like `q > 0` This should reduce CPU and RAM usage for queries over high number of time series. 2019-07-12 18:56:23 +02:00			`if allNans {`
all: open-sourcing single-node version 2019-05-22 23:16:55 +02:00			`// Skip timeseries with all NaNs.`
			`continue`
			`}`
			`rvs = append(rvs, ts)`
			`}`
app/vmselect/promql: remove empty time series after applying filters like `q > 0` This should reduce CPU and RAM usage for queries over high number of time series. 2019-07-12 18:56:23 +02:00			`for i := len(rvs); i < len(tss); i++ {`
			`// Zero unused time series, so GC could reclaim them.`
			`tss[i] = nil`
			`}`
all: open-sourcing single-node version 2019-05-22 23:16:55 +02:00			`return rvs`
			`}`

app/vmselect: properly handle PromQL queries like `scalar1 < metric < scalar2` like Prometheus does This fixes some cases from https://promlabs.com/promql-compliance-test-results-victoriametrics/ 2020-08-06 22:18:03 +02:00			`func adjustCmpOps(e metricsql.Expr) metricsql.Expr {`
			`metricsql.VisitAll(e, func(expr metricsql.Expr) {`
			`be, ok := expr.(*metricsql.BinaryOpExpr)`
			`if !ok {`
			`return`
			`}`
			`if !metricsql.IsBinaryOpCmp(be.Op) {`
			`return`
			`}`
app/vmselect: return `metric` values from `time() cmp_op metric` query when `cmp_op` comparison is true This aligns MetricsQL behavior to Prometheus' one. The issue has been identified at https://promlabs.com/promql-compliance-test-results/2020-12-01/victoriametrics/ 2020-12-02 11:08:47 +01:00			`if isNumberExpr(be.Right) \|\| !isScalarExpr(be.Left) {`
app/vmselect: properly handle PromQL queries like `scalar1 < metric < scalar2` like Prometheus does This fixes some cases from https://promlabs.com/promql-compliance-test-results-victoriametrics/ 2020-08-06 22:18:03 +02:00			`return`
			`}`
			// Convert 'num cmpOp query' expression to `query reverseCmpOp num` expression
app/vmselect: return `metric` values from `time() cmp_op metric` query when `cmp_op` comparison is true This aligns MetricsQL behavior to Prometheus' one. The issue has been identified at https://promlabs.com/promql-compliance-test-results/2020-12-01/victoriametrics/ 2020-12-02 11:08:47 +01:00			// like Prometheus does. For instance, `0.5 < foo` must be converted to `foo > 0.5`
app/vmselect: properly handle PromQL queries like `scalar1 < metric < scalar2` like Prometheus does This fixes some cases from https://promlabs.com/promql-compliance-test-results-victoriametrics/ 2020-08-06 22:18:03 +02:00			// in order to return valid values for `foo` that are bigger than 0.5.
			`be.Right, be.Left = be.Left, be.Right`
			`be.Op = getReverseCmpOp(be.Op)`
			`})`
			`return e`
			`}`

app/vmselect: return `metric` values from `time() cmp_op metric` query when `cmp_op` comparison is true This aligns MetricsQL behavior to Prometheus' one. The issue has been identified at https://promlabs.com/promql-compliance-test-results/2020-12-01/victoriametrics/ 2020-12-02 11:08:47 +01:00			`func isNumberExpr(e metricsql.Expr) bool {`
			`_, ok := e.(*metricsql.NumberExpr)`
			`return ok`
			`}`

			`func isScalarExpr(e metricsql.Expr) bool {`
			`if isNumberExpr(e) {`
			`return true`
			`}`
			`if fe, ok := e.(*metricsql.FuncExpr); ok {`
			`// time() returns scalar in PromQL - see https://prometheus.io/docs/prometheus/latest/querying/functions/#time`
			`return strings.ToLower(fe.Name) == "time"`
			`}`
			`return false`
			`}`

app/vmselect: properly handle PromQL queries like `scalar1 < metric < scalar2` like Prometheus does This fixes some cases from https://promlabs.com/promql-compliance-test-results-victoriametrics/ 2020-08-06 22:18:03 +02:00			`func getReverseCmpOp(op string) string {`
			`switch op {`
			`case ">":`
			`return "<"`
			`case "<":`
			`return ">"`
			`case ">=":`
			`return "<="`
			`case "<=":`
			`return ">="`
			`default:`
			// there is no need in changing `==` and `!=`.
			`return op`
			`}`
			`}`

Rename lib/promql to lib/metricsql and apply small fixes 2019-12-25 20:35:47 +01:00			`func parsePromQLWithCache(q string) (metricsql.Expr, error) {`
all: open-sourcing single-node version 2019-05-22 23:16:55 +02:00			`pcv := parseCacheV.Get(q)`
			`if pcv == nil {`
Rename lib/promql to lib/metricsql and apply small fixes 2019-12-25 20:35:47 +01:00			`e, err := metricsql.Parse(q)`
app/vmselect: properly handle PromQL queries like `scalar1 < metric < scalar2` like Prometheus does This fixes some cases from https://promlabs.com/promql-compliance-test-results-victoriametrics/ 2020-08-06 22:18:03 +02:00			`if err == nil {`
app/vmselect/promql: add missing label filters to binary operands before query execution This implements the optimization described at https://utcc.utoronto.ca/~cks/space/blog/sysadmin/PrometheusLabelNonOptimization See also https://github.com/cortexproject/cortex/issues/3253 2020-10-07 20:15:06 +02:00			`e = metricsql.Optimize(e)`
app/vmselect: properly handle PromQL queries like `scalar1 < metric < scalar2` like Prometheus does This fixes some cases from https://promlabs.com/promql-compliance-test-results-victoriametrics/ 2020-08-06 22:18:03 +02:00			`e = adjustCmpOps(e)`
app/vmselect: add `-search.treatDotsAsIsInRegexps` command-line flag for automatic escaping of dots in regexp label filters 2020-11-11 11:38:44 +01:00			`if *treatDotsAsIsInRegexps {`
			`e = escapeDotsInRegexpLabelFilters(e)`
			`}`
app/vmselect: properly handle PromQL queries like `scalar1 < metric < scalar2` like Prometheus does This fixes some cases from https://promlabs.com/promql-compliance-test-results-victoriametrics/ 2020-08-06 22:18:03 +02:00			`}`
all: open-sourcing single-node version 2019-05-22 23:16:55 +02:00			`pcv = &parseCacheValue{`
			`e: e,`
			`err: err,`
			`}`
			`parseCacheV.Put(q, pcv)`
			`}`
			`if pcv.err != nil {`
			`return nil, pcv.err`
			`}`
			`return pcv.e, nil`
			`}`

app/vmselect: add `-search.treatDotsAsIsInRegexps` command-line flag for automatic escaping of dots in regexp label filters 2020-11-11 11:38:44 +01:00			`func escapeDotsInRegexpLabelFilters(e metricsql.Expr) metricsql.Expr {`
			`metricsql.VisitAll(e, func(expr metricsql.Expr) {`
			`me, ok := expr.(*metricsql.MetricExpr)`
			`if !ok {`
			`return`
			`}`
			`for i := range me.LabelFilters {`
			`f := &me.LabelFilters[i]`
			`if f.IsRegexp {`
			`f.Value = escapeDots(f.Value)`
			`}`
			`}`
			`})`
			`return e`
			`}`

			`func escapeDots(s string) string {`
			`dotsCount := strings.Count(s, ".")`
			`if dotsCount <= 0 {`
			`return s`
			`}`
			`result := make([]byte, 0, len(s)+2*dotsCount)`
			`for i := 0; i < len(s); i++ {`
			`if s[i] == '.' && (i == 0 \|\| s[i-1] != '\\') && (i+1 == len(s) \|\| i+1 < len(s) && s[i+1] != '*' && s[i+1] != '+' && s[i+1] != '{') {`
			`// Escape a dot if the following conditions are met:`
			// - if it isn't escaped already, i.e. if there is no `\` char before the dot.
			`// - if there is no regexp modifiers such as '+', '*' or '{' after the dot.`
			`result = append(result, '\\', '.')`
			`} else {`
			`result = append(result, s[i])`
			`}`
			`}`
			`return string(result)`
			`}`

all: open-sourcing single-node version 2019-05-22 23:16:55 +02:00			`var parseCacheV = func() *parseCache {`
			`pc := &parseCache{`
			`m: make(map[string]*parseCacheValue),`
			`}`
			metrics.NewGauge(`vm_cache_requests_total{type="promql/parse"}`, func() float64 {
			`return float64(pc.Requests())`
			`})`
			metrics.NewGauge(`vm_cache_misses_total{type="promql/parse"}`, func() float64 {
			`return float64(pc.Misses())`
			`})`
			metrics.NewGauge(`vm_cache_entries{type="promql/parse"}`, func() float64 {
			`return float64(pc.Len())`
			`})`
			`return pc`
			`}()`

			`const parseCacheMaxLen = 10e3`

			`type parseCacheValue struct {`
Rename lib/promql to lib/metricsql and apply small fixes 2019-12-25 20:35:47 +01:00			`e metricsql.Expr`
all: open-sourcing single-node version 2019-05-22 23:16:55 +02:00			`err error`
			`}`

			`type parseCache struct {`
all: add support for GOARCH=386 and fix all the issues related to 32-bit architectures such as GOARCH=arm Updates https://github.com/VictoriaMetrics/VictoriaMetrics/issues/212 2019-10-17 17:22:56 +02:00			`// Move atomic counters to the top of struct for 8-byte alignment on 32-bit arch.`
			`// See https://github.com/VictoriaMetrics/VictoriaMetrics/issues/212`
all: open-sourcing single-node version 2019-05-22 23:16:55 +02:00
			`requests uint64`
			`misses uint64`
all: add support for GOARCH=386 and fix all the issues related to 32-bit architectures such as GOARCH=arm Updates https://github.com/VictoriaMetrics/VictoriaMetrics/issues/212 2019-10-17 17:22:56 +02:00
			`m map[string]*parseCacheValue`
			`mu sync.RWMutex`
all: open-sourcing single-node version 2019-05-22 23:16:55 +02:00			`}`

			`func (pc *parseCache) Requests() uint64 {`
			`return atomic.LoadUint64(&pc.requests)`
			`}`

			`func (pc *parseCache) Misses() uint64 {`
			`return atomic.LoadUint64(&pc.misses)`
			`}`

			`func (pc *parseCache) Len() uint64 {`
			`pc.mu.RLock()`
			`n := len(pc.m)`
			`pc.mu.RUnlock()`
			`return uint64(n)`
			`}`

			`func (pc parseCache) Get(q string) parseCacheValue {`
			`atomic.AddUint64(&pc.requests, 1)`

			`pc.mu.RLock()`
			`pcv := pc.m[q]`
			`pc.mu.RUnlock()`

			`if pcv == nil {`
			`atomic.AddUint64(&pc.misses, 1)`
			`}`
			`return pcv`
			`}`

			`func (pc parseCache) Put(q string, pcv parseCacheValue) {`
			`pc.mu.Lock()`
			`overflow := len(pc.m) - parseCacheMaxLen`
			`if overflow > 0 {`
			`// Remove 10% of items from the cache.`
			`overflow = int(float64(len(pc.m)) * 0.1)`
			`for k := range pc.m {`
			`delete(pc.m, k)`
			`overflow--`
			`if overflow <= 0 {`
			`break`
			`}`
			`}`
			`}`
			`pc.m[q] = pcv`
			`pc.mu.Unlock()`
			`}`