package influx

import (
	"compress/gzip"
	"flag"
	"fmt"
	"io"
	"net/http"
	"runtime"
	"sync"
	"time"

	"github.com/VictoriaMetrics/VictoriaMetrics/app/vminsert/common"
	"github.com/VictoriaMetrics/VictoriaMetrics/app/vminsert/concurrencylimiter"
	"github.com/VictoriaMetrics/VictoriaMetrics/lib/bytesutil"
	"github.com/VictoriaMetrics/VictoriaMetrics/lib/storage"
	"github.com/VictoriaMetrics/metrics"
)

var (
	measurementFieldSeparator = flag.String("influxMeasurementFieldSeparator", "_", "Separator for `{measurement}{separator}{field_name}` metric name when inserted via Influx line protocol")
	skipSingleField           = flag.Bool("influxSkipSingleField", false, "Uses `{measurement}` instead of `{measurement}{separator}{field_name}` for metric name if Influx line contains only a single field")
)

var (
	rowsInserted  = metrics.NewCounter(`vm_rows_inserted_total{type="influx"}`)
	rowsPerInsert = metrics.NewSummary(`vm_rows_per_insert{type="influx"}`)
)

// InsertHandler processes remote write for influx line protocol.
//
// See https://github.com/influxdata/influxdb/blob/4cbdc197b8117fee648d62e2e5be75c6575352f0/tsdb/README.md
func InsertHandler(req *http.Request) error {
	return concurrencylimiter.Do(func() error {
		return insertHandlerInternal(req)
	})
}
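
// insertHandlerInternal reads the request body (transparently decompressing
// gzip-encoded payloads), converts row timestamps to milliseconds according
// to the `precision` query arg and inserts the parsed rows.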
func insertHandlerInternal(req *http.Request) error {
	influxReadCalls.Inc()

	r := req.Body
	if req.Header.Get("Content-Encoding") == "gzip" {
		zr, err := getGzipReader(r)
		if err != nil {
			return fmt.Errorf("cannot read gzipped influx line protocol data: %s", err)
		}
		defer putGzipReader(zr)
		r = zr
	}

	q := req.URL.Query()
	// tsMultiplier converts row timestamps to milliseconds: positive values divide
	// (ns, u, ms), negative values multiply (s, m, h). See pushCtx.Read.
	tsMultiplier := int64(1e6)
	switch q.Get("precision") {
	case "ns":
		tsMultiplier = 1e6
	case "u":
		tsMultiplier = 1e3
	case "ms":
		tsMultiplier = 1
	case "s":
		tsMultiplier = -1e3
	case "m":
		tsMultiplier = -1e3 * 60
	case "h":
		tsMultiplier = -1e3 * 3600
	}

	// Read db tag from https://docs.influxdata.com/influxdb/v1.7/tools/api/#write-http-endpoint
	db := q.Get("db")

	ctx := getPushCtx()
	defer putPushCtx(ctx)
	for ctx.Read(r, tsMultiplier) {
		if err := ctx.InsertRows(db); err != nil {
			return err
		}
	}
	return ctx.Error()
}
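
// InsertRows inserts the rows parsed by Read into the storage.
//
// Each Influx field becomes a separate metric named
// `{measurement}{separator}{field_name}` (or just `{measurement}` when
// -influxSkipSingleField is set and the line contains a single field),
// while Influx tags and the `db` query arg become labels. For example,
// the line `cpu,host=a usage_user=1.5,usage_system=0.5` produces the
// metrics `cpu_usage_user` and `cpu_usage_system` with labels
// {db="...", host="a"}.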
func (ctx *pushCtx) InsertRows(db string) error {
	rows := ctx.Rows.Rows
	rowsLen := 0
	for i := range rows {
		rowsLen += len(rows[i].Tags)
	}
	ic := &ctx.Common
	ic.Reset(rowsLen)
	rowsTotal := 0
	for i := range rows {
		r := &rows[i]

		// Build the common labels (db + tags) for this row and marshal them once.
		ic.Labels = ic.Labels[:0]
		ic.AddLabel("db", db)
		for j := range r.Tags {
			tag := &r.Tags[j]
			ic.AddLabel(tag.Key, tag.Value)
		}
		ctx.metricNameBuf = storage.MarshalMetricNameRaw(ctx.metricNameBuf[:0], ic.Labels)

		// The metric name is `{measurement}{separator}{field_name}`
		// unless -influxSkipSingleField applies.
		ctx.metricGroupBuf = append(ctx.metricGroupBuf[:0], r.Measurement...)
		skipFieldKey := len(r.Fields) == 1 && *skipSingleField
		if !skipFieldKey {
			ctx.metricGroupBuf = append(ctx.metricGroupBuf, *measurementFieldSeparator...)
		}
		metricGroupPrefixLen := len(ctx.metricGroupBuf)
		for j := range r.Fields {
			f := &r.Fields[j]
			if !skipFieldKey {
				ctx.metricGroupBuf = append(ctx.metricGroupBuf[:metricGroupPrefixLen], f.Key...)
			}
			metricGroup := bytesutil.ToUnsafeString(ctx.metricGroupBuf)
			// A label with an empty name denotes the metric name (MetricGroup).
			ic.Labels = ic.Labels[:0]
			ic.AddLabel("", metricGroup)
			ic.WriteDataPoint(ctx.metricNameBuf, ic.Labels[:1], r.Timestamp, f.Value)
		}
		rowsTotal += len(r.Fields)
	}
	rowsInserted.Add(rowsTotal)
	rowsPerInsert.Update(float64(rowsTotal))
	return ic.FlushBufs()
}
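
// getGzipReader returns a gzip.Reader for r, reusing a reader from
// gzipReaderPool when one is available.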
func getGzipReader(r io.Reader) (*gzip.Reader, error) {
	v := gzipReaderPool.Get()
	if v == nil {
		return gzip.NewReader(r)
	}
	zr := v.(*gzip.Reader)
	if err := zr.Reset(r); err != nil {
		return nil, err
	}
	return zr, nil
}

// putGzipReader closes zr and returns it to gzipReaderPool for reuse.
func putGzipReader(zr *gzip.Reader) {
	_ = zr.Close()
	gzipReaderPool.Put(zr)
}

var gzipReaderPool sync.Pool
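
// Read reads the next block of Influx line protocol lines from r into ctx.Rows
// and converts row timestamps to milliseconds using tsMultiplier.
// It returns false on error or when r is exhausted; check ctx.Error afterwards.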
func (ctx *pushCtx) Read(r io.Reader, tsMultiplier int64) bool {
	if ctx.err != nil {
		return false
	}
	ctx.reqBuf, ctx.tailBuf, ctx.err = common.ReadLinesBlock(r, ctx.reqBuf, ctx.tailBuf)
	if ctx.err != nil {
		if ctx.err != io.EOF {
			influxReadErrors.Inc()
			ctx.err = fmt.Errorf("cannot read influx line protocol data: %s", ctx.err)
		}
		return false
	}
	if err := ctx.Rows.Unmarshal(bytesutil.ToUnsafeString(ctx.reqBuf)); err != nil {
		influxUnmarshalErrors.Inc()
		ctx.err = fmt.Errorf("cannot unmarshal influx line protocol data with size %d: %s", len(ctx.reqBuf), err)
		return false
	}

	// Adjust timestamps according to tsMultiplier.
	currentTs := time.Now().UnixNano() / 1e6
	if tsMultiplier >= 1 {
		// Millisecond or finer precision: divide down to milliseconds.
		for i := range ctx.Rows.Rows {
			row := &ctx.Rows.Rows[i]
			if row.Timestamp == 0 {
				row.Timestamp = currentTs
			} else {
				row.Timestamp /= tsMultiplier
			}
		}
	} else if tsMultiplier < 0 {
		// Coarse precision (s, m, h): multiply up to milliseconds and round
		// the current timestamp down to the same granularity.
		tsMultiplier = -tsMultiplier
		currentTs -= currentTs % tsMultiplier
		for i := range ctx.Rows.Rows {
			row := &ctx.Rows.Rows[i]
			if row.Timestamp == 0 {
				row.Timestamp = currentTs
			} else {
				row.Timestamp *= tsMultiplier
			}
		}
	}
	return true
}

var (
	influxReadCalls       = metrics.NewCounter(`vm_read_calls_total{name="influx"}`)
	influxReadErrors      = metrics.NewCounter(`vm_read_errors_total{name="influx"}`)
	influxUnmarshalErrors = metrics.NewCounter(`vm_unmarshal_errors_total{name="influx"}`)
)
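
// pushCtx holds the per-request parsing state: the parsed Rows, the common
// insert context and reusable scratch buffers. pushCtx objects are pooled
// via getPushCtx/putPushCtx.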
type pushCtx struct {
	Rows   Rows
	Common common.InsertCtx

	reqBuf         []byte
	tailBuf        []byte
	metricNameBuf  []byte
	metricGroupBuf []byte

	err error
}
func (ctx *pushCtx) Error() error {
	if ctx.err == io.EOF {
		return nil
	}
	return ctx.err
}

func (ctx *pushCtx) reset() {
	ctx.Rows.Reset()
	ctx.Common.Reset(0)
	ctx.reqBuf = ctx.reqBuf[:0]
	ctx.tailBuf = ctx.tailBuf[:0]
	ctx.metricNameBuf = ctx.metricNameBuf[:0]
	ctx.metricGroupBuf = ctx.metricGroupBuf[:0]
	ctx.err = nil
}
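
// getPushCtx returns a pushCtx from pushCtxPoolCh or pushCtxPool,
// allocating a new one if both are empty.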
func getPushCtx() *pushCtx {
	select {
	case ctx := <-pushCtxPoolCh:
		return ctx
	default:
		if v := pushCtxPool.Get(); v != nil {
			return v.(*pushCtx)
		}
		return &pushCtx{}
	}
}

// putPushCtx resets ctx and returns it to the pool.
func putPushCtx(ctx *pushCtx) {
	ctx.reset()
	select {
	case pushCtxPoolCh <- ctx:
	default:
		pushCtxPool.Put(ctx)
	}
}
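
// pushCtx objects are cached in a channel bounded by GOMAXPROCS; overflow
// goes to the sync.Pool, where unused contexts may eventually be reclaimed
// by the garbage collector.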
var pushCtxPool sync.Pool
var pushCtxPoolCh = make(chan *pushCtx, runtime.GOMAXPROCS(-1))