package logstorage import ( "fmt" "slices" "github.com/VictoriaMetrics/VictoriaMetrics/lib/bytesutil" ) // pipeUnpackJSON processes '| unpack_json ...' pipe. // // See https://docs.victoriametrics.com/victorialogs/logsql/#unpack_json-pipe type pipeUnpackJSON struct { // fromField is the field to unpack json fields from fromField string // fields is an optional list of fields to extract from json. // // if it is empty, then all the fields are extracted. fields []string // resultPrefix is prefix to add to unpacked field names resultPrefix string // iff is an optional filter for skipping unpacking json iff *ifFilter } func (pu *pipeUnpackJSON) String() string { s := "unpack_json" if pu.iff != nil { s += " " + pu.iff.String() } if !isMsgFieldName(pu.fromField) { s += " from " + quoteTokenIfNeeded(pu.fromField) } if len(pu.fields) > 0 { s += " fields (" + fieldsToString(pu.fields) + ")" } if pu.resultPrefix != "" { s += " result_prefix " + quoteTokenIfNeeded(pu.resultPrefix) } return s } func (pu *pipeUnpackJSON) updateNeededFields(neededFields, unneededFields fieldsSet) { updateNeededFieldsForUnpackPipe(pu.fromField, pu.fields, pu.iff, neededFields, unneededFields) } func updateNeededFieldsForUnpackPipe(fromField string, outFields []string, iff *ifFilter, neededFields, unneededFields fieldsSet) { if neededFields.contains("*") { unneededFieldsOrig := unneededFields.clone() unneededFieldsCount := 0 if len(outFields) > 0 { for _, f := range outFields { if unneededFieldsOrig.contains(f) { unneededFieldsCount++ } unneededFields.add(f) } } if len(outFields) == 0 || unneededFieldsCount < len(outFields) { unneededFields.remove(fromField) if iff != nil { unneededFields.removeFields(iff.neededFields) } } } else { neededFieldsOrig := neededFields.clone() needFromField := len(outFields) == 0 if len(outFields) > 0 { needFromField = false for _, f := range outFields { if neededFieldsOrig.contains(f) { needFromField = true } neededFields.remove(f) } } if needFromField { neededFields.add(fromField) if iff != nil { neededFields.addFields(iff.neededFields) } } } } func (pu *pipeUnpackJSON) newPipeProcessor(workersCount int, _ <-chan struct{}, _ func(), ppBase pipeProcessor) pipeProcessor { unpackJSON := func(uctx *fieldsUnpackerContext, s string) { if len(s) == 0 || s[0] != '{' { // This isn't a JSON object return } p := GetJSONParser() err := p.ParseLogMessage(bytesutil.ToUnsafeBytes(s)) if err != nil { for _, fieldName := range pu.fields { uctx.addField(fieldName, "") } } else { if len(pu.fields) == 0 { for _, f := range p.Fields { uctx.addField(f.Name, f.Value) } } else { for _, fieldName := range pu.fields { addedField := false for _, f := range p.Fields { if f.Name == fieldName { uctx.addField(f.Name, f.Value) addedField = true break } } if !addedField { uctx.addField(fieldName, "") } } } } PutJSONParser(p) } return newPipeUnpackProcessor(workersCount, unpackJSON, ppBase, pu.fromField, pu.resultPrefix, pu.iff) } func parsePipeUnpackJSON(lex *lexer) (*pipeUnpackJSON, error) { if !lex.isKeyword("unpack_json") { return nil, fmt.Errorf("unexpected token: %q; want %q", lex.token, "unpack_json") } lex.nextToken() var iff *ifFilter if lex.isKeyword("if") { f, err := parseIfFilter(lex) if err != nil { return nil, err } iff = f } fromField := "_msg" if lex.isKeyword("from") { lex.nextToken() f, err := parseFieldName(lex) if err != nil { return nil, fmt.Errorf("cannot parse 'from' field name: %w", err) } fromField = f } var fields []string if lex.isKeyword("fields") { lex.nextToken() fs, err := parseFieldNamesInParens(lex) if err != nil { return nil, fmt.Errorf("cannot parse 'fields': %w", err) } fields = fs if slices.Contains(fields, "*") { fields = nil } } resultPrefix := "" if lex.isKeyword("result_prefix") { lex.nextToken() p, err := getCompoundToken(lex) if err != nil { return nil, fmt.Errorf("cannot parse 'result_prefix': %w", err) } resultPrefix = p } pu := &pipeUnpackJSON{ fromField: fromField, fields: fields, resultPrefix: resultPrefix, iff: iff, } return pu, nil }