VictoriaMetrics/lib/storage/raw_row.go

package storage

import (
	"sort"
	"sync"

	"github.com/VictoriaMetrics/VictoriaMetrics/lib/decimal"
	"github.com/VictoriaMetrics/VictoriaMetrics/lib/logger"
)

// rawRow represents a raw time series row.
type rawRow struct {
	// TSID is time series id.
	TSID TSID

	// Timestamp is unix timestamp in milliseconds.
	Timestamp int64

	// Value is time series value for the given timestamp.
	Value float64

	// PrecisionBits is the number of significant bits in the Value to store.
	// Possible values are in the range [1..64].
	// 1 means max. 50% error, 2 - 25%, 3 - 12.5%, while 64 means no error,
	// i.e. the Value is stored without information loss.
	PrecisionBits uint8
}
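
// Illustrative sketch (not part of the original source): how a rawRow may be
// constructed and how PrecisionBits maps to the maximum relative error. The
// field values below are made up for the example.
//
//	r := rawRow{
//		TSID:          TSID{MetricID: 123},
//		Timestamp:     1558559815000, // unix timestamp in milliseconds
//		Value:         42.5,
//		PrecisionBits: 64, // 64 - no precision loss; 1 - up to 50% error
//	}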

// rawRowsMarshaler converts rawRow slices into inmemoryPart blocks.
// It is reused via rrmPool in order to reduce memory allocations.
type rawRowsMarshaler struct {
	bsw blockStreamWriter

	auxTimestamps  []int64
	auxValues      []int64
	auxFloatValues []float64
}

func (rrm *rawRowsMarshaler) reset() {
	rrm.bsw.reset()
	rrm.auxTimestamps = rrm.auxTimestamps[:0]
	rrm.auxValues = rrm.auxValues[:0]
	rrm.auxFloatValues = rrm.auxFloatValues[:0]
}

// Use sort.Interface instead of sort.Slice in order to optimize rows swap.
type rawRowsSort []rawRow

func (rrs *rawRowsSort) Len() int { return len(*rrs) }

func (rrs *rawRowsSort) Less(i, j int) bool {
	x := *rrs
	a := &x[i]
	b := &x[j]
	ta := &a.TSID
	tb := &b.TSID
	if ta.MetricID == tb.MetricID {
		// Fast path - identical TSID values.
		return a.Timestamp < b.Timestamp
	}

	// Slow path - compare TSIDs.
	// Manually inline TSID.Less here, since the compiler doesn't inline it yet :(
	if ta.AccountID < tb.AccountID {
		return true
	}
	if ta.AccountID > tb.AccountID {
		return false
	}
	if ta.ProjectID < tb.ProjectID {
		return true
	}
	if ta.ProjectID > tb.ProjectID {
		return false
	}
	if ta.MetricGroupID < tb.MetricGroupID {
		return true
	}
	if ta.MetricGroupID > tb.MetricGroupID {
		return false
	}
	if ta.JobID < tb.JobID {
		return true
	}
	if ta.JobID > tb.JobID {
		return false
	}
	if ta.InstanceID < tb.InstanceID {
		return true
	}
	if ta.InstanceID > tb.InstanceID {
		return false
	}
	if ta.MetricID < tb.MetricID {
		return true
	}
	if ta.MetricID > tb.MetricID {
		return false
	}
	return false
}

func (rrs *rawRowsSort) Swap(i, j int) {
	x := *rrs
	x[i], x[j] = x[j], x[i]
}
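
// For comparison (an illustrative sketch, not part of the original file): the
// same ordering could be expressed via sort.Slice, but sort.Slice swaps
// elements through a reflection-based swapper, which is slower for large
// rawRow values than the concrete Swap above. The sketch assumes TSID.Less
// accepts a *TSID argument, as hinted by the comment in Less.
//
//	sort.Slice(rows, func(i, j int) bool {
//		if rows[i].TSID.MetricID == rows[j].TSID.MetricID {
//			return rows[i].Timestamp < rows[j].Timestamp
//		}
//		return rows[i].TSID.Less(&rows[j].TSID)
//	})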

// marshalToInmemoryPart sorts rows, groups them into blocks and writes the
// resulting block stream into mp.
func (rrm *rawRowsMarshaler) marshalToInmemoryPart(mp *inmemoryPart, rows []rawRow) {
	if len(rows) == 0 {
		return
	}
	if uint64(len(rows)) >= 1<<32 {
		logger.Panicf("BUG: rows count must be smaller than 2^32; got %d", len(rows))
	}

	rrm.bsw.InitFromInmemoryPart(mp)
	ph := &mp.ph
	ph.Reset()

	// Sort rows by (TSID, Timestamp) if they aren't sorted yet.
	rrs := rawRowsSort(rows)
	if !sort.IsSorted(&rrs) {
		sort.Sort(&rrs)
	}

	// Group rows into blocks.
	var scale int16
	var rowsMerged uint64
	r := &rows[0]
	tsid := &r.TSID
	precisionBits := r.PrecisionBits
	tmpBlock := getBlock()
	defer putBlock(tmpBlock)
	for i := range rows {
		r = &rows[i]
		if r.TSID.MetricID == tsid.MetricID && len(rrm.auxTimestamps) < maxRowsPerBlock {
			rrm.auxTimestamps = append(rrm.auxTimestamps, r.Timestamp)
			rrm.auxFloatValues = append(rrm.auxFloatValues, r.Value)
			continue
		}

		rrm.auxValues, scale = decimal.AppendFloatToDecimal(rrm.auxValues[:0], rrm.auxFloatValues)
		tmpBlock.Init(tsid, rrm.auxTimestamps, rrm.auxValues, scale, precisionBits)
		rrm.bsw.WriteExternalBlock(tmpBlock, ph, &rowsMerged)

		tsid = &r.TSID
		precisionBits = r.PrecisionBits
		rrm.auxTimestamps = append(rrm.auxTimestamps[:0], r.Timestamp)
		rrm.auxFloatValues = append(rrm.auxFloatValues[:0], r.Value)
	}
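
	// Flush the last block accumulated in auxTimestamps/auxFloatValues after the loop.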
	rrm.auxValues, scale = decimal.AppendFloatToDecimal(rrm.auxValues[:0], rrm.auxFloatValues)
	tmpBlock.Init(tsid, rrm.auxTimestamps, rrm.auxValues, scale, precisionBits)
	rrm.bsw.WriteExternalBlock(tmpBlock, ph, &rowsMerged)
	if rowsMerged != uint64(len(rows)) {
		logger.Panicf("BUG: unexpected rowsMerged; got %d; want %d", rowsMerged, len(rows))
	}
	rrm.bsw.MustClose()
}

func getRawRowsMarshaler() *rawRowsMarshaler {
	v := rrmPool.Get()
	if v == nil {
		return &rawRowsMarshaler{}
	}
	return v.(*rawRowsMarshaler)
}

func putRawRowsMarshaler(rrm *rawRowsMarshaler) {
	rrm.reset()
	rrmPool.Put(rrm)
}

var rrmPool sync.Pool
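
// Typical usage pattern (an illustrative sketch, not part of the original
// file; it assumes the caller already has an inmemoryPart mp and a slice of
// rawRow values):
//
//	rrm := getRawRowsMarshaler()
//	rrm.marshalToInmemoryPart(mp, rows)
//	putRawRowsMarshaler(rrm)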