mirror of
https://github.com/VictoriaMetrics/VictoriaMetrics.git
synced 2024-11-21 14:44:00 +00:00
lib/storage: small code adjustements after d2960a20e0
Updates https://github.com/VictoriaMetrics/VictoriaMetrics/issues/781
This commit is contained in:
parent
d2960a20e0
commit
01987f8c77
3 changed files with 29 additions and 26 deletions
|
@ -5,6 +5,8 @@
|
|||
* `rollup_func(foo{filters}[d]) op bar` -> `rollup_func(foo{filters}[d]) op bar{filters}`
|
||||
* `transform_func(foo{filters}) op bar` -> `transform_func(foo{filters}) op bar{filters}`
|
||||
* `num_or_scalar op foo{filters} op bar` -> `num_or_scalar op foo{filters} op bar{filters}`
|
||||
* FEATURE: improve time series search for queries with multiple label filters. I.e. `foo{label1="value", label2=~"regexp"}`.
|
||||
See https://github.com/VictoriaMetrics/VictoriaMetrics/issues/781
|
||||
|
||||
* BUGFIX: vmagent: properly handle OpenStack endpoint ending with `v3.0` such as `https://ostack.example.com:5000/v3.0`
|
||||
in the same way as Prometheus does. See https://github.com/VictoriaMetrics/VictoriaMetrics/issues/728#issuecomment-709914803
|
||||
|
|
|
@ -268,7 +268,7 @@ func (tf *tagFilter) Init(commonPrefix, key, value []byte, isNegative, isRegexp
|
|||
// during the search for matching metricIDs.
|
||||
tf.orSuffixes = append(tf.orSuffixes[:0], "")
|
||||
tf.isEmptyMatch = len(prefix) == 0
|
||||
tf.matchCost = defaultCost
|
||||
tf.matchCost = fullMatchCost
|
||||
return nil
|
||||
}
|
||||
rcv, err := getRegexpFromCache(expr)
|
||||
|
@ -350,7 +350,6 @@ func getRegexpFromCache(expr []byte) (regexpCacheValue, error) {
|
|||
reMatch = func(b []byte) bool {
|
||||
return string(b) == v
|
||||
}
|
||||
reCost = defaultLiteralCost
|
||||
} else {
|
||||
reMatch = func(b []byte) bool {
|
||||
for _, v := range orValues {
|
||||
|
@ -360,8 +359,8 @@ func getRegexpFromCache(expr []byte) (regexpCacheValue, error) {
|
|||
}
|
||||
return false
|
||||
}
|
||||
reCost = uint64(len(orValues)) * defaultLiteralCost
|
||||
}
|
||||
reCost = uint64(len(orValues)) * literalMatchCost
|
||||
} else {
|
||||
reMatch, literalSuffix, reCost = getOptimizedReMatchFunc(re.Match, sExpr)
|
||||
}
|
||||
|
@ -415,15 +414,17 @@ func getOptimizedReMatchFunc(reMatch func(b []byte) bool, expr string) (func(b [
|
|||
return matchFunc, suffixUnescaped, reCost
|
||||
}
|
||||
// Fall back to un-optimized reMatch.
|
||||
return reMatch, "", defaultReCost
|
||||
return reMatch, "", reMatchCost
|
||||
}
|
||||
|
||||
// The following & default cost values are returned from BenchmarkOptimizedReMatchCost
|
||||
|
||||
var (
|
||||
defaultCost uint64 = 1
|
||||
defaultLiteralCost uint64 = 3
|
||||
defaultReCost uint64 = 140
|
||||
const (
|
||||
fullMatchCost = 1
|
||||
prefixMatchCost = 2
|
||||
literalMatchCost = 3
|
||||
suffixMatchCost = 4
|
||||
middleMatchCost = 6
|
||||
reMatchCost = 100
|
||||
)
|
||||
|
||||
func getOptimizedReMatchFuncExt(reMatch func(b []byte) bool, sre *syntax.Regexp) (func(b []byte) bool, string, uint64) {
|
||||
|
@ -431,13 +432,13 @@ func getOptimizedReMatchFuncExt(reMatch func(b []byte) bool, sre *syntax.Regexp)
|
|||
// '.*'
|
||||
return func(b []byte) bool {
|
||||
return true
|
||||
}, "", 1
|
||||
}, "", fullMatchCost
|
||||
}
|
||||
if isDotPlus(sre) {
|
||||
// '.+'
|
||||
return func(b []byte) bool {
|
||||
return len(b) > 0
|
||||
}, "", 1
|
||||
}, "", fullMatchCost
|
||||
}
|
||||
switch sre.Op {
|
||||
case syntax.OpCapture:
|
||||
|
@ -451,7 +452,7 @@ func getOptimizedReMatchFuncExt(reMatch func(b []byte) bool, sre *syntax.Regexp)
|
|||
// Literal match
|
||||
return func(b []byte) bool {
|
||||
return string(b) == s
|
||||
}, s, defaultLiteralCost
|
||||
}, s, literalMatchCost
|
||||
case syntax.OpConcat:
|
||||
if len(sre.Sub) == 2 {
|
||||
if isLiteral(sre.Sub[0]) {
|
||||
|
@ -460,13 +461,13 @@ func getOptimizedReMatchFuncExt(reMatch func(b []byte) bool, sre *syntax.Regexp)
|
|||
// 'prefix.*'
|
||||
return func(b []byte) bool {
|
||||
return bytes.HasPrefix(b, prefix)
|
||||
}, "", 2
|
||||
}, "", prefixMatchCost
|
||||
}
|
||||
if isDotPlus(sre.Sub[1]) {
|
||||
// 'prefix.+'
|
||||
return func(b []byte) bool {
|
||||
return len(b) > len(prefix) && bytes.HasPrefix(b, prefix)
|
||||
}, "", 2
|
||||
}, "", prefixMatchCost
|
||||
}
|
||||
}
|
||||
if isLiteral(sre.Sub[1]) {
|
||||
|
@ -475,13 +476,13 @@ func getOptimizedReMatchFuncExt(reMatch func(b []byte) bool, sre *syntax.Regexp)
|
|||
// '.*suffix'
|
||||
return func(b []byte) bool {
|
||||
return bytes.HasSuffix(b, suffix)
|
||||
}, string(suffix), 3
|
||||
}, string(suffix), suffixMatchCost
|
||||
}
|
||||
if isDotPlus(sre.Sub[0]) {
|
||||
// '.+suffix'
|
||||
return func(b []byte) bool {
|
||||
return len(b) > len(suffix) && bytes.HasSuffix(b[1:], suffix)
|
||||
}, string(suffix), 3
|
||||
}, string(suffix), suffixMatchCost
|
||||
}
|
||||
}
|
||||
}
|
||||
|
@ -492,13 +493,13 @@ func getOptimizedReMatchFuncExt(reMatch func(b []byte) bool, sre *syntax.Regexp)
|
|||
// '.*middle.*'
|
||||
return func(b []byte) bool {
|
||||
return bytes.Contains(b, middle)
|
||||
}, "", 5
|
||||
}, "", middleMatchCost
|
||||
}
|
||||
if isDotPlus(sre.Sub[2]) {
|
||||
// '.*middle.+'
|
||||
return func(b []byte) bool {
|
||||
return len(b) > len(middle) && bytes.Contains(b[:len(b)-1], middle)
|
||||
}, "", 5
|
||||
}, "", middleMatchCost
|
||||
}
|
||||
}
|
||||
if isDotPlus(sre.Sub[0]) {
|
||||
|
@ -506,13 +507,13 @@ func getOptimizedReMatchFuncExt(reMatch func(b []byte) bool, sre *syntax.Regexp)
|
|||
// '.+middle.*'
|
||||
return func(b []byte) bool {
|
||||
return len(b) > len(middle) && bytes.Contains(b[1:], middle)
|
||||
}, "", 5
|
||||
}, "", middleMatchCost
|
||||
}
|
||||
if isDotPlus(sre.Sub[2]) {
|
||||
// '.+middle.+'
|
||||
return func(b []byte) bool {
|
||||
return len(b) > len(middle)+1 && bytes.Contains(b[1:len(b)-1], middle)
|
||||
}, "", 5
|
||||
}, "", middleMatchCost
|
||||
}
|
||||
}
|
||||
}
|
||||
|
@ -546,7 +547,7 @@ func getOptimizedReMatchFuncExt(reMatch func(b []byte) bool, sre *syntax.Regexp)
|
|||
}
|
||||
// Fall back to slow path.
|
||||
return reMatch(bOrig)
|
||||
}, string(suffix), defaultReCost
|
||||
}, string(suffix), reMatchCost
|
||||
default:
|
||||
return nil, "", 0
|
||||
}
|
||||
|
|
|
@ -312,13 +312,13 @@ func BenchmarkTagFilterMatchSuffix(b *testing.B) {
|
|||
|
||||
// Run the following command to get the execution cost of all matches
|
||||
//
|
||||
// go test -run=none -bench=BenchmarkOptimizedReMatchCost -count 20 | tee cost.txt
|
||||
// go test -run=none -bench=BenchmarkOptimizedReMatchCost -count 20 github.com/VictoriaMetrics/VictoriaMetrics/lib/storage | tee cost.txt
|
||||
// benchstat ./cost.txt
|
||||
//
|
||||
// Calculate the multiplier of default for each match overhead.
|
||||
|
||||
func BenchmarkOptimizedReMatchCost(b *testing.B) {
|
||||
b.Run("default", func(b *testing.B) {
|
||||
b.Run("fullMatchCost", func(b *testing.B) {
|
||||
reMatch := func(b []byte) bool {
|
||||
return len(b) == 0
|
||||
}
|
||||
|
@ -331,7 +331,7 @@ func BenchmarkOptimizedReMatchCost(b *testing.B) {
|
|||
}
|
||||
})
|
||||
})
|
||||
b.Run("literal match", func(b *testing.B) {
|
||||
b.Run("literalMatchCost", func(b *testing.B) {
|
||||
s := "foo1.bar.baz.sss.ddd"
|
||||
reMatch := func(b []byte) bool {
|
||||
return string(b) == s
|
||||
|
@ -345,7 +345,7 @@ func BenchmarkOptimizedReMatchCost(b *testing.B) {
|
|||
}
|
||||
})
|
||||
})
|
||||
b.Run("foo|bar|baz", func(b *testing.B) {
|
||||
b.Run("threeLiteralsMatchCost", func(b *testing.B) {
|
||||
s := []string{"foo", "bar", "baz"}
|
||||
reMatch := func(b []byte) bool {
|
||||
for _, v := range s {
|
||||
|
@ -502,7 +502,7 @@ func BenchmarkOptimizedReMatchCost(b *testing.B) {
|
|||
}
|
||||
})
|
||||
})
|
||||
b.Run("default", func(b *testing.B) {
|
||||
b.Run("reMatchCost", func(b *testing.B) {
|
||||
re := regexp.MustCompile(`foo[^.]*?\.bar\.baz\.[^.]*?\.ddd`)
|
||||
reMatch := func(b []byte) bool {
|
||||
return re.Match(b)
|
||||
|
|
Loading…
Reference in a new issue