mirror of
https://github.com/VictoriaMetrics/VictoriaMetrics.git
synced 2024-12-16 17:21:04 +01:00
227 lines
6.1 KiB
Go
227 lines
6.1 KiB
Go
|
package jsonline
|
||
|
|
||
|
import (
|
||
|
"bufio"
|
||
|
"errors"
|
||
|
"fmt"
|
||
|
"github.com/VictoriaMetrics/VictoriaMetrics/lib/httputils"
|
||
|
"github.com/VictoriaMetrics/VictoriaMetrics/lib/logjson"
|
||
|
"math"
|
||
|
"net/http"
|
||
|
"strconv"
|
||
|
"time"
|
||
|
|
||
|
"github.com/VictoriaMetrics/VictoriaMetrics/app/vlinsert/common"
|
||
|
"github.com/VictoriaMetrics/VictoriaMetrics/app/vlstorage"
|
||
|
"github.com/VictoriaMetrics/VictoriaMetrics/lib/bytesutil"
|
||
|
"github.com/VictoriaMetrics/VictoriaMetrics/lib/httpserver"
|
||
|
"github.com/VictoriaMetrics/VictoriaMetrics/lib/logger"
|
||
|
"github.com/VictoriaMetrics/VictoriaMetrics/lib/logstorage"
|
||
|
pc "github.com/VictoriaMetrics/VictoriaMetrics/lib/protoparser/common"
|
||
|
"github.com/VictoriaMetrics/VictoriaMetrics/lib/writeconcurrencylimiter"
|
||
|
"github.com/VictoriaMetrics/metrics"
|
||
|
)
|
||
|
|
||
|
// RequestHandler processes jsonline insert requests
|
||
|
func RequestHandler(path string, w http.ResponseWriter, r *http.Request) bool {
|
||
|
w.Header().Add("Content-Type", "application/json")
|
||
|
|
||
|
if path != "/" {
|
||
|
return false
|
||
|
}
|
||
|
if method := r.Method; method != "POST" {
|
||
|
w.WriteHeader(http.StatusMethodNotAllowed)
|
||
|
return true
|
||
|
}
|
||
|
|
||
|
requestsTotal.Inc()
|
||
|
|
||
|
// Extract tenantID
|
||
|
tenantID, err := logstorage.GetTenantIDFromRequest(r)
|
||
|
if err != nil {
|
||
|
httpserver.Errorf(w, r, "%s", err)
|
||
|
return true
|
||
|
}
|
||
|
|
||
|
// Extract time field name from _time_field query arg
|
||
|
var timeField = "_time"
|
||
|
if tf := r.FormValue("_time_field"); tf != "" {
|
||
|
timeField = tf
|
||
|
}
|
||
|
|
||
|
// Extract message field name from _msg_field query arg
|
||
|
var msgField = ""
|
||
|
if msgf := r.FormValue("_msg_field"); msgf != "" {
|
||
|
msgField = msgf
|
||
|
}
|
||
|
|
||
|
streamFields := httputils.GetArray(r, "_stream_fields")
|
||
|
ignoreFields := httputils.GetArray(r, "ignore_fields")
|
||
|
|
||
|
isDebug := httputils.GetBool(r, "debug")
|
||
|
debugRequestURI := ""
|
||
|
debugRemoteAddr := ""
|
||
|
if isDebug {
|
||
|
debugRequestURI = httpserver.GetRequestURI(r)
|
||
|
debugRemoteAddr = httpserver.GetQuotedRemoteAddr(r)
|
||
|
}
|
||
|
|
||
|
lr := logstorage.GetLogRows(streamFields, ignoreFields)
|
||
|
processLogMessage := func(timestamp int64, fields []logstorage.Field) {
|
||
|
lr.MustAdd(tenantID, timestamp, fields)
|
||
|
if isDebug {
|
||
|
s := lr.GetRowString(0)
|
||
|
lr.ResetKeepSettings()
|
||
|
logger.Infof("remoteAddr=%s; requestURI=%s; ignoring log entry because of `debug` query arg: %s", debugRemoteAddr, debugRequestURI, s)
|
||
|
rowsDroppedTotal.Inc()
|
||
|
return
|
||
|
}
|
||
|
if lr.NeedFlush() {
|
||
|
vlstorage.MustAddRows(lr)
|
||
|
lr.ResetKeepSettings()
|
||
|
}
|
||
|
}
|
||
|
|
||
|
reader := r.Body
|
||
|
if r.Header.Get("Content-Encoding") == "gzip" {
|
||
|
zr, err := pc.GetGzipReader(reader)
|
||
|
if err != nil {
|
||
|
//return 0, fmt.Errorf("cannot read gzipped _bulk request: %w", err)
|
||
|
return true
|
||
|
}
|
||
|
defer pc.PutGzipReader(zr)
|
||
|
reader = zr
|
||
|
}
|
||
|
|
||
|
wcr := writeconcurrencylimiter.GetReader(reader)
|
||
|
defer writeconcurrencylimiter.PutReader(wcr)
|
||
|
|
||
|
lb := lineBufferPool.Get()
|
||
|
defer lineBufferPool.Put(lb)
|
||
|
|
||
|
lb.B = bytesutil.ResizeNoCopyNoOverallocate(lb.B, common.MaxLineSizeBytes.IntN())
|
||
|
sc := bufio.NewScanner(wcr)
|
||
|
sc.Buffer(lb.B, len(lb.B))
|
||
|
|
||
|
n := 0
|
||
|
for {
|
||
|
ok, err := readLine(sc, timeField, msgField, processLogMessage)
|
||
|
wcr.DecConcurrency()
|
||
|
if err != nil {
|
||
|
logger.Errorf("cannot read line #%d in /jsonline request: %s", n, err)
|
||
|
}
|
||
|
if !ok {
|
||
|
break
|
||
|
}
|
||
|
n++
|
||
|
rowsIngestedTotal.Inc()
|
||
|
}
|
||
|
|
||
|
vlstorage.MustAddRows(lr)
|
||
|
logstorage.PutLogRows(lr)
|
||
|
|
||
|
return true
|
||
|
}
|
||
|
|
||
|
func readLine(sc *bufio.Scanner, timeField, msgField string, processLogMessage func(timestamp int64, fields []logstorage.Field)) (bool, error) {
|
||
|
if !sc.Scan() {
|
||
|
if err := sc.Err(); err != nil {
|
||
|
if errors.Is(err, bufio.ErrTooLong) {
|
||
|
return false, fmt.Errorf(`cannot read json line, since its size exceeds -insert.maxLineSizeBytes=%d`, common.MaxLineSizeBytes.IntN())
|
||
|
}
|
||
|
return false, err
|
||
|
}
|
||
|
return false, nil
|
||
|
}
|
||
|
|
||
|
line := sc.Bytes()
|
||
|
p := logjson.GetParser()
|
||
|
|
||
|
if err := p.ParseLogMessage(line); err != nil {
|
||
|
invalidJSONLineLogger.Warnf("cannot parse json-encoded log entry: %s", err)
|
||
|
return true, nil
|
||
|
}
|
||
|
|
||
|
timestamp, err := extractTimestampFromFields(timeField, p.Fields)
|
||
|
if err != nil {
|
||
|
invalidTimestampLogger.Warnf("skipping the log entry because cannot parse timestamp: %s", err)
|
||
|
return true, nil
|
||
|
}
|
||
|
updateMessageFieldName(msgField, p.Fields)
|
||
|
processLogMessage(timestamp, p.Fields)
|
||
|
logjson.PutParser(p)
|
||
|
return true, nil
|
||
|
}
|
||
|
|
||
|
func extractTimestampFromFields(timeField string, fields []logstorage.Field) (int64, error) {
|
||
|
for i := range fields {
|
||
|
f := &fields[i]
|
||
|
if f.Name != timeField {
|
||
|
continue
|
||
|
}
|
||
|
timestamp, err := parseTimestamp(f.Value)
|
||
|
if err != nil {
|
||
|
return 0, err
|
||
|
}
|
||
|
f.Value = ""
|
||
|
return timestamp, nil
|
||
|
}
|
||
|
return time.Now().UnixNano(), nil
|
||
|
}
|
||
|
|
||
|
func updateMessageFieldName(msgField string, fields []logstorage.Field) {
|
||
|
if msgField == "" {
|
||
|
return
|
||
|
}
|
||
|
for i := range fields {
|
||
|
f := &fields[i]
|
||
|
if f.Name == msgField {
|
||
|
f.Name = "_msg"
|
||
|
return
|
||
|
}
|
||
|
}
|
||
|
}
|
||
|
|
||
|
// parseTimestamp parses s into a Unix timestamp in nanoseconds.
//
// The following formats are supported:
//   - integer number of milliseconds since the Unix epoch, e.g. "1686026893735"
//   - date in the YYYY-MM-DD form, e.g. "2023-06-06"
//   - RFC3339 timestamp, e.g. "2023-06-06T04:48:11.735Z"
//
// An error is returned if s cannot be parsed or if the resulting timestamp
// cannot be represented as int64 nanoseconds.
func parseTimestamp(s string) (int64, error) {
	if len(s) < len("YYYY-MM-DD") || s[len("YYYY")] != '-' {
		// Try parsing timestamp in milliseconds
		n, err := strconv.ParseInt(s, 10, 64)
		if err != nil {
			return 0, fmt.Errorf("cannot parse timestamp in milliseconds from %q: %w", s, err)
		}
		// Make sure the conversion to nanoseconds below doesn't overflow int64.
		if n > int64(math.MaxInt64)/1e6 {
			return 0, fmt.Errorf("too big timestamp in milliseconds: %d; mustn't exceed %d", n, int64(math.MaxInt64)/1e6)
		}
		if n < int64(math.MinInt64)/1e6 {
			return 0, fmt.Errorf("too small timestamp in milliseconds: %d; must be bigger than %d", n, int64(math.MinInt64)/1e6)
		}
		n *= 1e6
		return n, nil
	}
	if len(s) == len("YYYY-MM-DD") {
		t, err := time.Parse("2006-01-02", s)
		if err != nil {
			return 0, fmt.Errorf("cannot parse date %q: %w", s, err)
		}
		return timeToUnixNano(t, s)
	}
	t, err := time.Parse(time.RFC3339, s)
	if err != nil {
		return 0, fmt.Errorf("cannot parse timestamp %q: %w", s, err)
	}
	return timeToUnixNano(t, s)
}

// timeToUnixNano converts t to Unix nanoseconds.
//
// It returns an error if t is outside the range representable by int64
// nanoseconds, since the result of time.Time.UnixNano is undefined there.
// s is the original timestamp string; it is used only in the error message.
func timeToUnixNano(t time.Time, s string) (int64, error) {
	minTime := time.Unix(0, math.MinInt64)
	maxTime := time.Unix(0, math.MaxInt64)
	if t.Before(minTime) || t.After(maxTime) {
		return 0, fmt.Errorf("timestamp %q is out of the supported range [%s ... %s]",
			s, minTime.UTC().Format(time.RFC3339Nano), maxTime.UTC().Format(time.RFC3339Nano))
	}
	return t.UnixNano(), nil
}
|
||
|
|
||
|
// lineBufferPool is a pool of byte buffers. RequestHandler takes a buffer from it
// for the bufio.Scanner line buffer and puts it back when the request is processed.
var lineBufferPool bytesutil.ByteBufferPool
|
||
|
|
||
|
var (
|
||
|
requestsTotal = metrics.NewCounter(`vl_http_requests_total{path="/insert/jsonline"}`)
|
||
|
rowsIngestedTotal = metrics.NewCounter(`vl_rows_ingested_total{type="jsonline"}`)
|
||
|
rowsDroppedTotal = metrics.NewCounter(`vl_rows_dropped_total{path="/insert/jsonline",reason="debug"}`)
|
||
|
)
|
||
|
|
||
|
var (
|
||
|
invalidTimestampLogger = logger.WithThrottler("invalidTimestampLogger", 5*time.Second)
|
||
|
invalidJSONLineLogger = logger.WithThrottler("invalidJSONLineLogger", 5*time.Second)
|
||
|
)
|