lib/storage: add BenchmarkHeadPostingForMatchers similar to the benchmark from Prometheus

See the corresponding benchmark in Prometheus - 23c0299d85/tsdb/head_bench_test.go (L52) The benchmark allows performing apples-to-apples comparison of time series search in Prometheus and VictoriaMetrics. The following article - https://www.robustperception.io/evaluating-performance-and-correctness - contains incorrect numbers for VictoriaMetrics, since there wasn't this benchmark yet. Fix it. Benchmarks can be repeated with the following commands from Prometheus and VictoriaMetrics source code roots: - Prometheus: GOMAXPROCS=1 go test ./tsdb/ -run=111 -bench=BenchmarkHeadPostingForMatchers - VictoriaMetrics: GOMAXPROCS=1 go test ./lib/storage/ -run=111 -bench=BenchmarkHeadPostingForMatchers Benchmark results: benchmark old ns/op new ns/op delta BenchmarkHeadPostingForMatchers/n="1" 272756688 364977 -99.87% BenchmarkHeadPostingForMatchers/n="1",j="foo" 138132923 1181636 -99.14% BenchmarkHeadPostingForMatchers/j="foo",n="1" 134723762 1141578 -99.15% BenchmarkHeadPostingForMatchers/n="1",j!="foo" 195823953 1148056 -99.41% BenchmarkHeadPostingForMatchers/i=~".*" 7962582919 8716755 -99.89% BenchmarkHeadPostingForMatchers/i=~".+" 7589543864 12096587 -99.84% BenchmarkHeadPostingForMatchers/i=~"" 1142371741 16164560 -98.59% BenchmarkHeadPostingForMatchers/i!="" 9964150263 12230021 -99.88% BenchmarkHeadPostingForMatchers/n="1",i=~".*",j="foo" 216995884 1173476 -99.46% BenchmarkHeadPostingForMatchers/n="1",i=~".*",i!="2",j="foo" 202541348 1299743 -99.36% BenchmarkHeadPostingForMatchers/n="1",i!="" 486285711 11555193 -97.62% BenchmarkHeadPostingForMatchers/n="1",i!="",j="foo" 350776931 5607506 -98.40% BenchmarkHeadPostingForMatchers/n="1",i=~".+",j="foo" 380888565 6380335 -98.32% BenchmarkHeadPostingForMatchers/n="1",i=~"1.+",j="foo" 89500296 2078970 -97.68% BenchmarkHeadPostingForMatchers/n="1",i=~".+",i!="2",j="foo" 379529654 6561368 -98.27% BenchmarkHeadPostingForMatchers/n="1",i=~".+",i!~"2.*",j="foo" 424563825 6757132 -98.41% The first column (old) is for Prometheus, the second column (new) is for VictoriaMetrics. Prometheus was using 3.5GB of RAM during the benchmark, while VictoriaMetrics was using 400MB of RAM.
2025-03-11 15:34:56 +00:00 · 2019-11-18 18:21:27 +02:00 · 2019-11-18 18:21:27 +02:00 · 6f61fd367a
commit 6f61fd367a
parent 77bb66a5be
1 changed files with 183 additions and 0 deletions
--- a/lib/storage/index_db_timing_test.go
+++ b/lib/storage/index_db_timing_test.go
@ -111,6 +111,189 @@ func benchmarkIndexDBAddTSIDs(db *indexDB, tsid *TSID, mn *MetricName, startOffs
 	}
 }

+func BenchmarkHeadPostingForMatchers(b *testing.B) {
+	// This benchmark is equivalent to https://github.com/prometheus/prometheus/blob/23c0299d85bfeb5d9b59e994861553a25ca578e5/tsdb/head_bench_test.go#L52
+	// See https://www.robustperception.io/evaluating-performance-and-correctness for more details.
+	metricIDCache := workingsetcache.New(1234, time.Hour)
+	metricNameCache := workingsetcache.New(1234, time.Hour)
+	defer metricIDCache.Stop()
+	defer metricNameCache.Stop()
+
+	var hmCurr atomic.Value
+	hmCurr.Store(&hourMetricIDs{})
+	var hmPrev atomic.Value
+	hmPrev.Store(&hourMetricIDs{})
+
+	const dbName = "bench-head-posting-for-matchers"
+	db, err := openIndexDB(dbName, metricIDCache, metricNameCache, &hmCurr, &hmPrev)
+	if err != nil {
+		b.Fatalf("cannot open indexDB: %s", err)
+	}
+	defer func() {
+		db.MustClose()
+		if err := os.RemoveAll(dbName); err != nil {
+			b.Fatalf("cannot remove indexDB: %s", err)
+		}
+	}()
+
+	// Fill the db with data as in https://github.com/prometheus/prometheus/blob/23c0299d85bfeb5d9b59e994861553a25ca578e5/tsdb/head_bench_test.go#L66
+	const accountID = 34327843
+	const projectID = 893433
+	var mn MetricName
+	var metricName []byte
+	var tsid TSID
+	addSeries := func(kvs ...string) {
+		mn.Reset()
+		for i := 0; i < len(kvs); i += 2 {
+			mn.AddTag(kvs[i], kvs[i+1])
+		}
+		mn.sortTags()
+		mn.AccountID = accountID
+		mn.ProjectID = projectID
+		metricName = mn.Marshal(metricName[:0])
+		if err := db.createTSIDByName(&tsid, metricName); err != nil {
+			b.Fatalf("cannot insert record: %s", err)
+		}
+	}
+	for n := 0; n < 10; n++ {
+		for i := 0; i < 10000; i++ {
+			addSeries("i", strconv.Itoa(i), "n", strconv.Itoa(n), "j", "foo")
+			// Have some series that won't be matched, to properly test inverted matches.
+			addSeries("i", strconv.Itoa(i), "n", strconv.Itoa(n), "j", "bar")
+			addSeries("i", strconv.Itoa(i), "n", "0_"+strconv.Itoa(n), "j", "bar")
+			addSeries("i", strconv.Itoa(i), "n", "1_"+strconv.Itoa(n), "j", "bar")
+			addSeries("i", strconv.Itoa(i), "n", "2_"+strconv.Itoa(n), "j", "foo")
+		}
+	}
+
+	// Make sure all the items can be searched.
+	db.tb.DebugFlush()
+	b.ResetTimer()
+
+	benchSearch := func(b *testing.B, tfs *TagFilters) {
+		is := db.getIndexSearch()
+		defer db.putIndexSearch(is)
+		tfss := []*TagFilters{tfs}
+		tr := TimeRange{
+			MinTimestamp: 0,
+			MaxTimestamp: timestampFromTime(time.Now()),
+		}
+		for i := 0; i < b.N; i++ {
+			_, err := is.searchMetricIDs(tfss, tr, 2e9)
+			if err != nil {
+				b.Fatalf("unexpected error in searchMetricIDs: %s", err)
+			}
+		}
+	}
+	addTagFilter := func(tfs *TagFilters, key, value string, isNegative, isRegexp bool) {
+		if err := tfs.Add([]byte(key), []byte(value), isNegative, isRegexp); err != nil {
+			b.Fatalf("cannot add tag filter %q=%q, isNegative=%v, isRegexp=%v", key, value, isNegative, isRegexp)
+		}
+	}
+
+	b.Run(`n="1"`, func(b *testing.B) {
+		tfs := NewTagFilters(accountID, projectID)
+		addTagFilter(tfs, "n", "1", false, false)
+		benchSearch(b, tfs)
+	})
+	b.Run(`n="1",j="foo"`, func(b *testing.B) {
+		tfs := NewTagFilters(accountID, projectID)
+		addTagFilter(tfs, "n", "1", false, false)
+		addTagFilter(tfs, "j", "foo", false, false)
+		benchSearch(b, tfs)
+	})
+	b.Run(`j="foo",n="1"`, func(b *testing.B) {
+		tfs := NewTagFilters(accountID, projectID)
+		addTagFilter(tfs, "j", "foo", false, false)
+		addTagFilter(tfs, "n", "1", false, false)
+		benchSearch(b, tfs)
+	})
+	b.Run(`n="1",j!="foo"`, func(b *testing.B) {
+		tfs := NewTagFilters(accountID, projectID)
+		addTagFilter(tfs, "n", "1", false, false)
+		addTagFilter(tfs, "j", "foo", true, false)
+		benchSearch(b, tfs)
+	})
+	b.Run(`i=~".*"`, func(b *testing.B) {
+		tfs := NewTagFilters(accountID, projectID)
+		addTagFilter(tfs, "i", ".*", false, true)
+		benchSearch(b, tfs)
+	})
+	b.Run(`i=~".+"`, func(b *testing.B) {
+		tfs := NewTagFilters(accountID, projectID)
+		addTagFilter(tfs, "i", ".+", false, true)
+		benchSearch(b, tfs)
+	})
+	b.Run(`i=~""`, func(b *testing.B) {
+		tfs := NewTagFilters(accountID, projectID)
+		addTagFilter(tfs, "i", "", false, true)
+		benchSearch(b, tfs)
+	})
+	b.Run(`i!=""`, func(b *testing.B) {
+		tfs := NewTagFilters(accountID, projectID)
+		addTagFilter(tfs, "i", "", true, false)
+		benchSearch(b, tfs)
+	})
+	b.Run(`n="1",i=~".*",j="foo"`, func(b *testing.B) {
+		tfs := NewTagFilters(accountID, projectID)
+		addTagFilter(tfs, "n", "1", false, false)
+		addTagFilter(tfs, "i", ".*", false, true)
+		addTagFilter(tfs, "j", "foo", false, false)
+		benchSearch(b, tfs)
+	})
+	b.Run(`n="1",i=~".*",i!="2",j="foo"`, func(b *testing.B) {
+		tfs := NewTagFilters(accountID, projectID)
+		addTagFilter(tfs, "n", "1", false, false)
+		addTagFilter(tfs, "i", ".*", false, true)
+		addTagFilter(tfs, "i", "2", true, false)
+		addTagFilter(tfs, "j", "foo", false, false)
+		benchSearch(b, tfs)
+	})
+	b.Run(`n="1",i!=""`, func(b *testing.B) {
+		tfs := NewTagFilters(accountID, projectID)
+		addTagFilter(tfs, "n", "1", false, false)
+		addTagFilter(tfs, "i", "", true, false)
+		benchSearch(b, tfs)
+	})
+	b.Run(`n="1",i!="",j="foo"`, func(b *testing.B) {
+		tfs := NewTagFilters(accountID, projectID)
+		addTagFilter(tfs, "n", "1", false, false)
+		addTagFilter(tfs, "i", "", true, false)
+		addTagFilter(tfs, "j", "foo", false, false)
+		benchSearch(b, tfs)
+	})
+	b.Run(`n="1",i=~".+",j="foo"`, func(b *testing.B) {
+		tfs := NewTagFilters(accountID, projectID)
+		addTagFilter(tfs, "n", "1", false, false)
+		addTagFilter(tfs, "i", ".+", false, true)
+		addTagFilter(tfs, "j", "foo", false, false)
+		benchSearch(b, tfs)
+	})
+	b.Run(`n="1",i=~"1.+",j="foo"`, func(b *testing.B) {
+		tfs := NewTagFilters(accountID, projectID)
+		addTagFilter(tfs, "n", "1", false, false)
+		addTagFilter(tfs, "i", "1.+", false, true)
+		addTagFilter(tfs, "j", "foo", false, false)
+		benchSearch(b, tfs)
+	})
+	b.Run(`n="1",i=~".+",i!="2",j="foo"`, func(b *testing.B) {
+		tfs := NewTagFilters(accountID, projectID)
+		addTagFilter(tfs, "n", "1", false, false)
+		addTagFilter(tfs, "i", ".+", false, true)
+		addTagFilter(tfs, "i", "2", true, false)
+		addTagFilter(tfs, "j", "foo", false, false)
+		benchSearch(b, tfs)
+	})
+	b.Run(`n="1",i=~".+",i!~"2.*",j="foo"`, func(b *testing.B) {
+		tfs := NewTagFilters(accountID, projectID)
+		addTagFilter(tfs, "n", "1", false, false)
+		addTagFilter(tfs, "i", ".+", false, true)
+		addTagFilter(tfs, "i", "2.*", true, true)
+		addTagFilter(tfs, "j", "foo", false, false)
+		benchSearch(b, tfs)
+	})
+}
+
 func BenchmarkIndexDBGetTSIDs(b *testing.B) {
 	metricIDCache := workingsetcache.New(1234, time.Hour)
 	metricNameCache := workingsetcache.New(1234, time.Hour)