VictoriaMetrics/lib/logstorage/stats_row_max.go

251 lines
5.8 KiB
Go
Raw Normal View History

2024-05-22 21:01:20 +02:00
package logstorage
import (
"fmt"
"math"
"slices"
"strings"
"unsafe"
"github.com/VictoriaMetrics/VictoriaMetrics/lib/bytesutil"
"github.com/VictoriaMetrics/VictoriaMetrics/lib/logger"
)
2024-05-30 16:19:23 +02:00
type statsRowMax struct {
2024-05-22 21:01:20 +02:00
srcField string
fetchFields []string
}
2024-05-30 16:19:23 +02:00
func (sm *statsRowMax) String() string {
s := "row_max(" + quoteTokenIfNeeded(sm.srcField)
2024-05-22 21:01:20 +02:00
if len(sm.fetchFields) > 0 {
s += ", " + fieldNamesString(sm.fetchFields)
}
s += ")"
return s
}
2024-05-30 16:19:23 +02:00
func (sm *statsRowMax) updateNeededFields(neededFields fieldsSet) {
2024-05-22 21:01:20 +02:00
if len(sm.fetchFields) == 0 {
neededFields.add("*")
} else {
neededFields.addFields(sm.fetchFields)
}
neededFields.add(sm.srcField)
}
2024-05-30 16:19:23 +02:00
func (sm *statsRowMax) newStatsProcessor() (statsProcessor, int) {
smp := &statsRowMaxProcessor{
2024-05-22 21:01:20 +02:00
sm: sm,
}
return smp, int(unsafe.Sizeof(*smp))
}
2024-05-30 16:19:23 +02:00
type statsRowMaxProcessor struct {
sm *statsRowMax
2024-05-22 21:01:20 +02:00
max string
fields []Field
}
2024-05-30 16:19:23 +02:00
func (smp *statsRowMaxProcessor) updateStatsForAllRows(br *blockResult) int {
2024-05-22 21:01:20 +02:00
stateSizeIncrease := 0
c := br.getColumnByName(smp.sm.srcField)
if c.isConst {
v := c.valuesEncoded[0]
stateSizeIncrease += smp.updateState(v, br, 0)
return stateSizeIncrease
}
if c.isTime {
timestamp, ok := TryParseTimestampRFC3339Nano(smp.max)
if !ok {
timestamp = -1 << 63
}
maxTimestamp := br.getMaxTimestamp(timestamp)
if maxTimestamp <= timestamp {
return stateSizeIncrease
}
2024-05-22 21:01:20 +02:00
bb := bbPool.Get()
bb.B = marshalTimestampRFC3339NanoString(bb.B[:0], maxTimestamp)
2024-05-22 21:01:20 +02:00
v := bytesutil.ToUnsafeString(bb.B)
stateSizeIncrease += smp.updateState(v, br, 0)
bbPool.Put(bb)
return stateSizeIncrease
}
needUpdateState := false
switch c.valueType {
case valueTypeString:
needUpdateState = true
case valueTypeDict:
c.forEachDictValue(br, func(v string) {
if !needUpdateState && smp.needUpdateStateString(v) {
2024-05-22 21:01:20 +02:00
needUpdateState = true
}
})
2024-05-22 21:01:20 +02:00
case valueTypeUint8, valueTypeUint16, valueTypeUint32, valueTypeUint64:
bb := bbPool.Get()
bb.B = marshalUint64String(bb.B[:0], c.maxValue)
needUpdateState = smp.needUpdateStateBytes(bb.B)
bbPool.Put(bb)
case valueTypeFloat64:
f := math.Float64frombits(c.maxValue)
bb := bbPool.Get()
bb.B = marshalFloat64String(bb.B[:0], f)
needUpdateState = smp.needUpdateStateBytes(bb.B)
bbPool.Put(bb)
case valueTypeIPv4:
bb := bbPool.Get()
bb.B = marshalIPv4String(bb.B[:0], uint32(c.maxValue))
needUpdateState = smp.needUpdateStateBytes(bb.B)
bbPool.Put(bb)
case valueTypeTimestampISO8601:
bb := bbPool.Get()
bb.B = marshalTimestampISO8601String(bb.B[:0], int64(c.maxValue))
needUpdateState = smp.needUpdateStateBytes(bb.B)
bbPool.Put(bb)
default:
logger.Panicf("BUG: unknown valueType=%d", c.valueType)
}
if needUpdateState {
values := c.getValues(br)
for i, v := range values {
stateSizeIncrease += smp.updateState(v, br, i)
}
}
return stateSizeIncrease
}
2024-05-30 16:19:23 +02:00
func (smp *statsRowMaxProcessor) updateStatsForRow(br *blockResult, rowIdx int) int {
2024-05-22 21:01:20 +02:00
stateSizeIncrease := 0
c := br.getColumnByName(smp.sm.srcField)
if c.isConst {
v := c.valuesEncoded[0]
stateSizeIncrease += smp.updateState(v, br, rowIdx)
return stateSizeIncrease
}
if c.isTime {
timestamps := br.getTimestamps()
2024-05-22 21:01:20 +02:00
bb := bbPool.Get()
bb.B = marshalTimestampRFC3339NanoString(bb.B[:0], timestamps[rowIdx])
2024-05-22 21:01:20 +02:00
v := bytesutil.ToUnsafeString(bb.B)
stateSizeIncrease += smp.updateState(v, br, rowIdx)
bbPool.Put(bb)
return stateSizeIncrease
}
v := c.getValueAtRow(br, rowIdx)
stateSizeIncrease += smp.updateState(v, br, rowIdx)
return stateSizeIncrease
}
2024-05-30 16:19:23 +02:00
func (smp *statsRowMaxProcessor) mergeState(sfp statsProcessor) {
src := sfp.(*statsRowMaxProcessor)
2024-05-22 21:01:20 +02:00
if smp.needUpdateStateString(src.max) {
smp.max = src.max
smp.fields = src.fields
}
}
2024-05-30 16:19:23 +02:00
func (smp *statsRowMaxProcessor) needUpdateStateBytes(b []byte) bool {
2024-05-22 21:01:20 +02:00
v := bytesutil.ToUnsafeString(b)
return smp.needUpdateStateString(v)
}
2024-05-30 16:19:23 +02:00
func (smp *statsRowMaxProcessor) needUpdateStateString(v string) bool {
2024-05-22 21:01:20 +02:00
if v == "" {
return false
}
return smp.max == "" || lessString(smp.max, v)
}
2024-05-30 16:19:23 +02:00
func (smp *statsRowMaxProcessor) updateState(v string, br *blockResult, rowIdx int) int {
2024-05-22 21:01:20 +02:00
stateSizeIncrease := 0
if !smp.needUpdateStateString(v) {
// There is no need in updating state
return stateSizeIncrease
}
stateSizeIncrease -= len(smp.max)
stateSizeIncrease += len(v)
smp.max = strings.Clone(v)
fields := smp.fields
for _, f := range fields {
stateSizeIncrease -= len(f.Name) + len(f.Value)
}
clear(fields)
fields = fields[:0]
fetchFields := smp.sm.fetchFields
if len(fetchFields) == 0 {
cs := br.getColumns()
for _, c := range cs {
v := c.getValueAtRow(br, rowIdx)
fields = append(fields, Field{
Name: strings.Clone(c.name),
Value: strings.Clone(v),
})
stateSizeIncrease += len(c.name) + len(v)
}
} else {
for _, field := range fetchFields {
c := br.getColumnByName(field)
v := c.getValueAtRow(br, rowIdx)
fields = append(fields, Field{
Name: strings.Clone(c.name),
Value: strings.Clone(v),
})
stateSizeIncrease += len(c.name) + len(v)
}
}
smp.fields = fields
return stateSizeIncrease
}
2024-05-30 16:19:23 +02:00
func (smp *statsRowMaxProcessor) finalizeStats() string {
2024-05-22 21:01:20 +02:00
bb := bbPool.Get()
2024-06-04 00:59:25 +02:00
bb.B = MarshalFieldsToJSON(bb.B, smp.fields)
2024-05-22 21:01:20 +02:00
result := string(bb.B)
bbPool.Put(bb)
return result
}
2024-05-30 16:19:23 +02:00
func parseStatsRowMax(lex *lexer) (*statsRowMax, error) {
if !lex.isKeyword("row_max") {
return nil, fmt.Errorf("unexpected func; got %q; want 'row_max'", lex.token)
2024-05-22 21:01:20 +02:00
}
lex.nextToken()
fields, err := parseFieldNamesInParens(lex)
if err != nil {
2024-05-30 16:19:23 +02:00
return nil, fmt.Errorf("cannot parse 'row_max' args: %w", err)
2024-05-22 21:01:20 +02:00
}
if len(fields) == 0 {
2024-05-30 16:19:23 +02:00
return nil, fmt.Errorf("missing first arg for 'row_max' func - source field")
2024-05-22 21:01:20 +02:00
}
srcField := fields[0]
fetchFields := fields[1:]
if slices.Contains(fetchFields, "*") {
fetchFields = nil
}
2024-05-30 16:19:23 +02:00
sm := &statsRowMax{
2024-05-22 21:01:20 +02:00
srcField: srcField,
fetchFields: fetchFields,
}
return sm, nil
}