VictoriaMetrics/lib/logstorage/pipe_extract_test.go

356 lines
9.3 KiB
Go
Raw Normal View History

2024-05-20 04:08:30 +02:00
package logstorage
import (
"testing"
)
2024-05-22 21:01:20 +02:00
func TestParsePipeExtractSuccess(t *testing.T) {
f := func(pipeStr string) {
2024-05-20 04:08:30 +02:00
t.Helper()
2024-05-22 21:01:20 +02:00
expectParsePipeSuccess(t, pipeStr)
2024-05-20 04:08:30 +02:00
}
2024-05-22 21:01:20 +02:00
f(`extract "foo<bar>"`)
2024-05-25 00:30:58 +02:00
f(`extract "foo<bar>" skip_empty_results`)
f(`extract "foo<bar>" keep_original_fields`)
2024-05-22 21:01:20 +02:00
f(`extract "foo<bar>" from x`)
2024-05-25 00:30:58 +02:00
f(`extract "foo<bar>" from x skip_empty_results`)
f(`extract "foo<bar>" from x keep_original_fields`)
2024-05-22 21:01:20 +02:00
f(`extract if (x:y) "foo<bar>" from baz`)
2024-05-25 00:30:58 +02:00
f(`extract if (x:y) "foo<bar>" from baz skip_empty_results`)
f(`extract if (x:y) "foo<bar>" from baz keep_original_fields`)
2024-05-20 04:08:30 +02:00
}
2024-05-22 21:01:20 +02:00
func TestParsePipeExtractFailure(t *testing.T) {
f := func(pipeStr string) {
2024-05-20 04:08:30 +02:00
t.Helper()
2024-05-22 21:01:20 +02:00
expectParsePipeFailure(t, pipeStr)
}
f(`extract`)
2024-05-25 00:30:58 +02:00
f(`extract keep_original_fields`)
f(`extract skip_empty_results`)
2024-05-22 21:01:20 +02:00
f(`extract from`)
f(`extract from x`)
f(`extract from x "y<foo>"`)
f(`extract if (x:y)`)
f(`extract "a<b>" if (x:y)`)
f(`extract "a"`)
f(`extract "<a><b>"`)
f(`extract "<*>foo<_>bar"`)
}
2024-05-20 04:08:30 +02:00
2024-05-22 21:01:20 +02:00
func TestPipeExtract(t *testing.T) {
f := func(pipeStr string, rows, rowsExpected [][]Field) {
t.Helper()
expectPipeResults(t, pipeStr, rows, rowsExpected)
2024-05-20 04:08:30 +02:00
}
2024-05-25 00:30:58 +02:00
// skip empty results
f(`extract "baz=<abc> a=<aa>" skip_empty_results`, [][]Field{
{
{"_msg", `foo=bar baz="x y=z" `},
{"aa", "foobar"},
{"abc", "ippl"},
},
}, [][]Field{
{
{"_msg", `foo=bar baz="x y=z" `},
{"aa", "foobar"},
{"abc", "x y=z"},
},
})
// no skip empty results
f(`extract "baz=<abc> a=<aa>"`, [][]Field{
{
{"_msg", `foo=bar baz="x y=z" `},
{"aa", "foobar"},
{"abc", "ippl"},
},
}, [][]Field{
{
{"_msg", `foo=bar baz="x y=z" `},
{"aa", ""},
{"abc", "x y=z"},
},
})
// keep original fields
f(`extract "baz=<abc> a=<aa>" keep_original_fields`, [][]Field{
{
{"_msg", `foo=bar baz="x y=z" a=b`},
{"aa", "foobar"},
{"abc", ""},
},
}, [][]Field{
{
{"_msg", `foo=bar baz="x y=z" a=b`},
{"abc", "x y=z"},
{"aa", "foobar"},
},
})
// no keep original fields
f(`extract "baz=<abc> a=<aa>"`, [][]Field{
{
{"_msg", `foo=bar baz="x y=z" a=b`},
{"aa", "foobar"},
{"abc", ""},
},
}, [][]Field{
{
{"_msg", `foo=bar baz="x y=z" a=b`},
{"abc", "x y=z"},
{"aa", "b"},
},
})
2024-05-22 21:01:20 +02:00
// single row, extract from _msg
f(`extract "baz=<abc> a=<aa>"`, [][]Field{
{
{"_msg", `foo=bar baz="x y=z" a=b`},
},
}, [][]Field{
2024-05-20 04:08:30 +02:00
{
2024-05-22 21:01:20 +02:00
{"_msg", `foo=bar baz="x y=z" a=b`},
{"abc", "x y=z"},
{"aa", "b"},
2024-05-20 04:08:30 +02:00
},
})
2024-05-22 21:01:20 +02:00
// single row, extract from _msg into _msg
f(`extract "msg=<_msg>"`, [][]Field{
2024-05-20 04:08:30 +02:00
{
2024-05-22 21:01:20 +02:00
{"_msg", `msg=bar`},
2024-05-20 04:08:30 +02:00
},
2024-05-22 21:01:20 +02:00
}, [][]Field{
2024-05-20 04:08:30 +02:00
{
2024-05-22 21:01:20 +02:00
{"_msg", "bar"},
2024-05-20 04:08:30 +02:00
},
})
2024-05-22 21:01:20 +02:00
// single row, extract from non-existing field
f(`extract "foo=<bar>" from x`, [][]Field{
2024-05-20 04:08:30 +02:00
{
2024-05-22 21:01:20 +02:00
{"_msg", `foo=bar`},
2024-05-20 04:08:30 +02:00
},
2024-05-22 21:01:20 +02:00
}, [][]Field{
2024-05-20 04:08:30 +02:00
{
2024-05-22 21:01:20 +02:00
{"_msg", `foo=bar`},
{"bar", ""},
2024-05-20 04:08:30 +02:00
},
})
2024-05-22 21:01:20 +02:00
// single row, pattern mismatch
f(`extract "foo=<bar>" from x`, [][]Field{
2024-05-20 04:08:30 +02:00
{
2024-05-22 21:01:20 +02:00
{"x", `foobar`},
2024-05-20 04:08:30 +02:00
},
2024-05-22 21:01:20 +02:00
}, [][]Field{
2024-05-20 04:08:30 +02:00
{
2024-05-22 21:01:20 +02:00
{"x", `foobar`},
{"bar", ""},
2024-05-20 04:08:30 +02:00
},
})
2024-05-22 21:01:20 +02:00
// single row, partial partern match
f(`extract "foo=<bar> baz=<xx>" from x`, [][]Field{
2024-05-20 04:08:30 +02:00
{
2024-05-22 21:01:20 +02:00
{"x", `a foo="a\"b\\c" cde baz=aa`},
2024-05-20 04:08:30 +02:00
},
2024-05-22 21:01:20 +02:00
}, [][]Field{
2024-05-20 04:08:30 +02:00
{
2024-05-22 21:01:20 +02:00
{"x", `a foo="a\"b\\c" cde baz=aa`},
{"bar", `a"b\c`},
{"xx", ""},
2024-05-20 04:08:30 +02:00
},
})
2024-05-22 21:01:20 +02:00
2024-05-24 03:06:55 +02:00
// single row, disable unquoting
f(`extract 'foo=[< plain : bar >]' from x`, [][]Field{
{
{"x", `a foo=["bc","de"]`},
},
}, [][]Field{
{
{"x", `a foo=["bc","de"]`},
{"bar", `"bc","de"`},
},
})
// single row, default unquoting
f(`extract 'foo=[< bar >]' from x`, [][]Field{
{
{"x", `a foo=["bc","de"]`},
},
}, [][]Field{
{
{"x", `a foo=["bc","de"]`},
{"bar", `bc`},
},
})
2024-05-22 21:01:20 +02:00
// single row, overwirte existing column
f(`extract "foo=<bar> baz=<xx>" from x`, [][]Field{
2024-05-20 04:08:30 +02:00
{
2024-05-22 21:01:20 +02:00
{"x", `a foo=cc baz=aa b`},
{"bar", "abc"},
2024-05-20 04:08:30 +02:00
},
2024-05-22 21:01:20 +02:00
}, [][]Field{
2024-05-20 04:08:30 +02:00
{
2024-05-22 21:01:20 +02:00
{"x", `a foo=cc baz=aa b`},
{"bar", `cc`},
{"xx", `aa b`},
2024-05-20 04:08:30 +02:00
},
})
2024-05-22 21:01:20 +02:00
// single row, if match
f(`extract if (x:baz) "foo=<bar> baz=<xx>" from "x"`, [][]Field{
2024-05-20 04:08:30 +02:00
{
2024-05-22 21:01:20 +02:00
{"x", `a foo=cc baz=aa b`},
{"bar", "abc"},
2024-05-20 04:08:30 +02:00
},
2024-05-22 21:01:20 +02:00
}, [][]Field{
2024-05-20 04:08:30 +02:00
{
2024-05-22 21:01:20 +02:00
{"x", `a foo=cc baz=aa b`},
{"bar", `cc`},
{"xx", `aa b`},
2024-05-20 04:08:30 +02:00
},
})
2024-05-22 21:01:20 +02:00
// single row, if mismatch
f(`extract if (bar:"") "foo=<bar> baz=<xx>" from 'x'`, [][]Field{
2024-05-20 04:08:30 +02:00
{
2024-05-22 21:01:20 +02:00
{"x", `a foo=cc baz=aa b`},
{"bar", "abc"},
2024-05-20 04:08:30 +02:00
},
2024-05-22 21:01:20 +02:00
}, [][]Field{
2024-05-20 04:08:30 +02:00
{
2024-05-22 21:01:20 +02:00
{"x", `a foo=cc baz=aa b`},
{"bar", `abc`},
2024-05-20 04:08:30 +02:00
},
})
2024-05-22 21:01:20 +02:00
// multiple rows with distinct set of labels
f(`extract if (!ip:keep) "ip=<ip> "`, [][]Field{
{
{"foo", "bar"},
{"_msg", "request from ip=1.2.3.4 xxx"},
{"f3", "y"},
},
{
{"foo", "aaa"},
{"_msg", "ip=5.4.3.1 abcd"},
{"ip", "keep"},
{"a", "b"},
},
{
{"foo", "aaa"},
{"_msg", "ip=34.32.11.94 abcd"},
{"ip", "ppp"},
{"a", "b"},
},
{
{"foo", "klkfs"},
{"_msg", "sdfdsfds dsf fd fdsa ip=123 abcd"},
{"ip", "bbbsd"},
{"a", "klo2i"},
},
}, [][]Field{
{
{"foo", "bar"},
{"_msg", "request from ip=1.2.3.4 xxx"},
{"f3", "y"},
{"ip", "1.2.3.4"},
},
{
{"foo", "aaa"},
{"_msg", "ip=5.4.3.1 abcd"},
{"ip", "keep"},
{"a", "b"},
},
{
{"foo", "aaa"},
{"_msg", "ip=34.32.11.94 abcd"},
{"ip", "34.32.11.94"},
{"a", "b"},
},
{
{"foo", "klkfs"},
{"_msg", "sdfdsfds dsf fd fdsa ip=123 abcd"},
{"ip", "123"},
{"a", "klo2i"},
},
})
2024-05-20 04:08:30 +02:00
}
func TestPipeExtractUpdateNeededFields(t *testing.T) {
f := func(s string, neededFields, unneededFields, neededFieldsExpected, unneededFieldsExpected string) {
t.Helper()
expectPipeNeededFields(t, s, neededFields, unneededFields, neededFieldsExpected, unneededFieldsExpected)
}
// all the needed fields
2024-05-22 21:01:20 +02:00
f("extract '<foo>' from x", "*", "", "*", "foo")
f("extract if (foo:bar) '<foo>' from x", "*", "", "*", "")
2024-05-25 00:30:58 +02:00
f("extract if (foo:bar) '<foo>' from x keep_original_fields", "*", "", "*", "")
f("extract if (foo:bar) '<foo>' from x skip_empty_results", "*", "", "*", "")
2024-05-20 04:08:30 +02:00
2024-05-22 21:01:20 +02:00
// unneeded fields do not intersect with pattern and output fields
f("extract '<foo>' from x", "*", "f1,f2", "*", "f1,f2,foo")
2024-05-25 00:30:58 +02:00
f("extract '<foo>' from x keep_original_fields", "*", "f1,f2", "*", "f1,f2")
f("extract '<foo>' from x skip_empty_results", "*", "f1,f2", "*", "f1,f2")
2024-05-22 21:01:20 +02:00
f("extract if (f1:x) '<foo>' from x", "*", "f1,f2", "*", "f2,foo")
2024-05-25 00:30:58 +02:00
f("extract if (f1:x) '<foo>' from x keep_original_fields", "*", "f1,f2", "*", "f2")
f("extract if (f1:x) '<foo>' from x skip_empty_results", "*", "f1,f2", "*", "f2")
2024-05-22 21:01:20 +02:00
f("extract if (foo:bar f1:x) '<foo>' from x", "*", "f1,f2", "*", "f2")
2024-05-20 04:08:30 +02:00
2024-05-22 21:01:20 +02:00
// unneeded fields intersect with pattern
f("extract '<foo>' from x", "*", "f2,x", "*", "f2,foo")
2024-05-25 00:30:58 +02:00
f("extract '<foo>' from x keep_original_fields", "*", "f2,x", "*", "f2")
f("extract '<foo>' from x skip_empty_results", "*", "f2,x", "*", "f2")
2024-05-22 21:01:20 +02:00
f("extract if (f1:abc) '<foo>' from x", "*", "f2,x", "*", "f2,foo")
f("extract if (f2:abc) '<foo>' from x", "*", "f2,x", "*", "foo")
2024-05-20 04:08:30 +02:00
2024-05-22 21:01:20 +02:00
// unneeded fields intersect with output fields
f("extract '<foo>x<bar>' from x", "*", "f2,foo", "*", "bar,f2,foo")
2024-05-25 00:30:58 +02:00
f("extract '<foo>x<bar>' from x keep_original_fields", "*", "f2,foo", "*", "f2,foo")
f("extract '<foo>x<bar>' from x skip_empty_results", "*", "f2,foo", "*", "f2,foo")
2024-05-22 21:01:20 +02:00
f("extract if (f1:abc) '<foo>x<bar>' from x", "*", "f2,foo", "*", "bar,f2,foo")
f("extract if (f2:abc foo:w) '<foo>x<bar>' from x", "*", "f2,foo", "*", "bar")
2024-05-25 00:30:58 +02:00
f("extract if (f2:abc foo:w) '<foo>x<bar>' from x keep_original_fields", "*", "f2,foo", "*", "")
f("extract if (f2:abc foo:w) '<foo>x<bar>' from x skip_empty_results", "*", "f2,foo", "*", "")
2024-05-20 04:08:30 +02:00
2024-05-22 21:01:20 +02:00
// unneeded fields intersect with all the output fields
f("extract '<foo>x<bar>' from x", "*", "f2,foo,bar", "*", "bar,f2,foo,x")
f("extract if (a:b f2:q x:y foo:w) '<foo>x<bar>' from x", "*", "f2,foo,bar", "*", "bar,f2,foo,x")
2024-05-25 00:30:58 +02:00
f("extract if (a:b f2:q x:y foo:w) '<foo>x<bar>' from x keep_original_fields", "*", "f2,foo,bar", "*", "bar,f2,foo,x")
f("extract if (a:b f2:q x:y foo:w) '<foo>x<bar>' from x skip_empty_results", "*", "f2,foo,bar", "*", "bar,f2,foo,x")
2024-05-20 04:08:30 +02:00
2024-05-22 21:01:20 +02:00
// needed fields do not intersect with pattern and output fields
f("extract '<foo>x<bar>' from x", "f1,f2", "", "f1,f2", "")
2024-05-25 00:30:58 +02:00
f("extract '<foo>x<bar>' from x keep_original_fields", "f1,f2", "", "f1,f2", "")
f("extract '<foo>x<bar>' from x skip_empty_results", "f1,f2", "", "f1,f2", "")
2024-05-22 21:01:20 +02:00
f("extract if (a:b) '<foo>x<bar>' from x", "f1,f2", "", "f1,f2", "")
f("extract if (f1:b) '<foo>x<bar>' from x", "f1,f2", "", "f1,f2", "")
2024-05-20 04:08:30 +02:00
2024-05-22 21:01:20 +02:00
// needed fields intersect with pattern field
f("extract '<foo>x<bar>' from x", "f2,x", "", "f2,x", "")
2024-05-25 00:30:58 +02:00
f("extract '<foo>x<bar>' from x keep_original_fields", "f2,x", "", "f2,x", "")
f("extract '<foo>x<bar>' from x skip_empty_results", "f2,x", "", "f2,x", "")
2024-05-22 21:01:20 +02:00
f("extract if (a:b) '<foo>x<bar>' from x", "f2,x", "", "f2,x", "")
2024-05-20 04:08:30 +02:00
// needed fields intersect with output fields
2024-05-22 21:01:20 +02:00
f("extract '<foo>x<bar>' from x", "f2,foo", "", "f2,x", "")
2024-05-25 00:30:58 +02:00
f("extract '<foo>x<bar>' from x keep_original_fields", "f2,foo", "", "foo,f2,x", "")
f("extract '<foo>x<bar>' from x skip_empty_results", "f2,foo", "", "foo,f2,x", "")
2024-05-22 21:01:20 +02:00
f("extract if (a:b) '<foo>x<bar>' from x", "f2,foo", "", "a,f2,x", "")
// needed fields intersect with pattern and output fields
f("extract '<foo>x<bar>' from x", "f2,foo,x,y", "", "f2,x,y", "")
2024-05-25 00:30:58 +02:00
f("extract '<foo>x<bar>' from x keep_original_fields", "f2,foo,x,y", "", "foo,f2,x,y", "")
f("extract '<foo>x<bar>' from x skip_empty_results", "f2,foo,x,y", "", "foo,f2,x,y", "")
2024-05-22 21:01:20 +02:00
f("extract if (a:b foo:q) '<foo>x<bar>' from x", "f2,foo,x,y", "", "a,f2,foo,x,y", "")
}