mirror of
https://github.com/VictoriaMetrics/VictoriaMetrics.git
synced 2025-01-10 15:14:09 +00:00
44b071296d
### Describe Your Changes Added an ability to query data across multiple tenants. See: https://github.com/VictoriaMetrics/VictoriaMetrics/issues/1434 Currently, the following endpoints work with multi-tenancy: - /prometheus/api/v1/query - /prometheus/api/v1/query_range - /prometheus/api/v1/series - /prometheus/api/v1/labels - /prometheus/api/v1/label/<label_name>/values - /prometheus/api/v1/status/active_queries - /prometheus/api/v1/status/top_queries - /prometheus/api/v1/status/tsdb - /prometheus/api/v1/export - /prometheus/api/v1/export/csv - /vmui A note regarding VMUI: endpoints such as `active_queries` and `top_queries` have been updated to indicate whether query was a single-tenant or multi-tenant, but UI needs to be updated to display this info. cc: @Loori-R --------- Signed-off-by: Zakhar Bessarab <z.bessarab@victoriametrics.com> Signed-off-by: f41gh7 <nik@victoriametrics.com> Co-authored-by: f41gh7 <nik@victoriametrics.com>
337 lines
9.4 KiB
Go
337 lines
9.4 KiB
Go
package querystats
|
|
|
|
import (
|
|
"flag"
|
|
"fmt"
|
|
"io"
|
|
"sort"
|
|
"sync"
|
|
"time"
|
|
|
|
"github.com/VictoriaMetrics/VictoriaMetrics/lib/logger"
|
|
"github.com/VictoriaMetrics/VictoriaMetrics/lib/stringsutil"
|
|
)
|
|
|
|
var (
|
|
lastQueriesCount = flag.Int("search.queryStats.lastQueriesCount", 20000, "Query stats for /api/v1/status/top_queries is tracked on this number of last queries. "+
|
|
"Zero value disables query stats tracking")
|
|
minQueryDuration = flag.Duration("search.queryStats.minQueryDuration", time.Millisecond, "The minimum duration for queries to track in query stats at /api/v1/status/top_queries. Queries with lower duration are ignored in query stats")
|
|
)
|
|
|
|
var (
|
|
qsTracker *queryStatsTracker
|
|
initOnce sync.Once
|
|
)
|
|
|
|
// Enabled returns true of query stats tracking is enabled.
|
|
func Enabled() bool {
|
|
return *lastQueriesCount > 0
|
|
}
|
|
|
|
// RegisterQuery registers the query on the given timeRangeMsecs, which has been started at startTime.
|
|
//
|
|
// RegisterQuery must be called when the query is finished.
|
|
func RegisterQuery(accountID, projectID uint32, query string, timeRangeMsecs int64, startTime time.Time) {
|
|
initOnce.Do(initQueryStats)
|
|
qsTracker.registerQuery(accountID, projectID, query, timeRangeMsecs, startTime)
|
|
}
|
|
|
|
// RegisterQueryMultiTenant registers the query on the given timeRangeMsecs, which has been started at startTime.
|
|
//
|
|
// RegisterQueryMultiTenant must be called when the query is finished.
|
|
func RegisterQueryMultiTenant(query string, timeRangeMsecs int64, startTime time.Time) {
|
|
initOnce.Do(initQueryStats)
|
|
qsTracker.registerQueryMultiTenant(query, timeRangeMsecs, startTime)
|
|
}
|
|
|
|
// WriteJSONQueryStats writes query stats to given writer in json format.
|
|
func WriteJSONQueryStats(w io.Writer, topN int, maxLifetime time.Duration) {
|
|
initOnce.Do(initQueryStats)
|
|
qsTracker.writeJSONQueryStats(w, topN, nil, maxLifetime)
|
|
}
|
|
|
|
// WriteJSONQueryStatsForAccountProject writes query stats for the given (accountID, projectID) to given writer in json format.
|
|
func WriteJSONQueryStatsForAccountProject(w io.Writer, topN int, accountID, projectID uint32, maxLifetime time.Duration) {
|
|
initOnce.Do(initQueryStats)
|
|
apFilter := &accountProjectFilter{
|
|
accountID: accountID,
|
|
projectID: projectID,
|
|
}
|
|
qsTracker.writeJSONQueryStats(w, topN, apFilter, maxLifetime)
|
|
}
|
|
|
|
// queryStatsTracker holds statistics for queries
|
|
type queryStatsTracker struct {
|
|
mu sync.Mutex
|
|
a []queryStatRecord
|
|
nextIdx uint
|
|
}
|
|
|
|
type queryStatRecord struct {
|
|
accountID uint32
|
|
projectID uint32
|
|
query string
|
|
timeRangeSecs int64
|
|
registerTime time.Time
|
|
duration time.Duration
|
|
multiTenant bool
|
|
}
|
|
|
|
type queryStatKey struct {
|
|
accountID uint32
|
|
projectID uint32
|
|
query string
|
|
timeRangeSecs int64
|
|
multiTenant bool
|
|
}
|
|
|
|
type accountProjectFilter struct {
|
|
accountID uint32
|
|
projectID uint32
|
|
}
|
|
|
|
func initQueryStats() {
|
|
recordsCount := *lastQueriesCount
|
|
if recordsCount <= 0 {
|
|
recordsCount = 1
|
|
} else {
|
|
logger.Infof("enabled query stats tracking at `/api/v1/status/top_queries` with -search.queryStats.lastQueriesCount=%d, -search.queryStats.minQueryDuration=%s",
|
|
*lastQueriesCount, *minQueryDuration)
|
|
}
|
|
qsTracker = &queryStatsTracker{
|
|
a: make([]queryStatRecord, recordsCount),
|
|
}
|
|
}
|
|
|
|
func (qst *queryStatsTracker) writeJSONQueryStats(w io.Writer, topN int, apFilter *accountProjectFilter, maxLifetime time.Duration) {
|
|
fmt.Fprintf(w, `{"topN":"%d","maxLifetime":"%s",`, topN, maxLifetime)
|
|
fmt.Fprintf(w, `"search.queryStats.lastQueriesCount":%d,`, *lastQueriesCount)
|
|
fmt.Fprintf(w, `"search.queryStats.minQueryDuration":"%s",`, *minQueryDuration)
|
|
fmt.Fprintf(w, `"topByCount":[`)
|
|
topByCount := qst.getTopByCount(topN, apFilter, maxLifetime)
|
|
for i, r := range topByCount {
|
|
fmt.Fprintf(w, `{"accountID":%d,"projectID":%d,"query":%s,"timeRangeSeconds":%d,"count":%d,"multiTenant":%v}`, r.accountID, r.projectID, stringsutil.JSONString(r.query), r.timeRangeSecs, r.count, r.multiTenant)
|
|
if i+1 < len(topByCount) {
|
|
fmt.Fprintf(w, `,`)
|
|
}
|
|
}
|
|
fmt.Fprintf(w, `],"topByAvgDuration":[`)
|
|
topByAvgDuration := qst.getTopByAvgDuration(topN, apFilter, maxLifetime)
|
|
for i, r := range topByAvgDuration {
|
|
fmt.Fprintf(w, `{"accountID":%d,"projectID":%d,"query":%s,"timeRangeSeconds":%d,"avgDurationSeconds":%.3f,"count":%d,"multiTenant": %v}`,
|
|
r.accountID, r.projectID, stringsutil.JSONString(r.query), r.timeRangeSecs, r.duration.Seconds(), r.count, r.multiTenant)
|
|
if i+1 < len(topByAvgDuration) {
|
|
fmt.Fprintf(w, `,`)
|
|
}
|
|
}
|
|
fmt.Fprintf(w, `],"topBySumDuration":[`)
|
|
topBySumDuration := qst.getTopBySumDuration(topN, apFilter, maxLifetime)
|
|
for i, r := range topBySumDuration {
|
|
fmt.Fprintf(w, `{"accountID":%d,"projectID":%d,"query":%s,"timeRangeSeconds":%d,"sumDurationSeconds":%.3f,"count":%d,"multiTenant":%v}`,
|
|
r.accountID, r.projectID, stringsutil.JSONString(r.query), r.timeRangeSecs, r.duration.Seconds(), r.count, r.multiTenant)
|
|
if i+1 < len(topBySumDuration) {
|
|
fmt.Fprintf(w, `,`)
|
|
}
|
|
}
|
|
fmt.Fprintf(w, `]}`)
|
|
}
|
|
|
|
func (qst *queryStatsTracker) registerQuery(accountID, projectID uint32, query string, timeRangeMsecs int64, startTime time.Time) {
|
|
registerTime := time.Now()
|
|
duration := registerTime.Sub(startTime)
|
|
if duration < *minQueryDuration {
|
|
return
|
|
}
|
|
|
|
qst.mu.Lock()
|
|
defer qst.mu.Unlock()
|
|
|
|
a := qst.a
|
|
idx := qst.nextIdx
|
|
if idx >= uint(len(a)) {
|
|
idx = 0
|
|
}
|
|
qst.nextIdx = idx + 1
|
|
r := &a[idx]
|
|
r.accountID = accountID
|
|
r.projectID = projectID
|
|
r.query = query
|
|
r.timeRangeSecs = timeRangeMsecs / 1000
|
|
r.registerTime = registerTime
|
|
r.duration = duration
|
|
}
|
|
|
|
func (qst *queryStatsTracker) registerQueryMultiTenant(query string, timeRangeMsecs int64, startTime time.Time) {
|
|
registerTime := time.Now()
|
|
duration := registerTime.Sub(startTime)
|
|
if duration < *minQueryDuration {
|
|
return
|
|
}
|
|
|
|
qst.mu.Lock()
|
|
defer qst.mu.Unlock()
|
|
|
|
a := qst.a
|
|
idx := qst.nextIdx
|
|
if idx >= uint(len(a)) {
|
|
idx = 0
|
|
}
|
|
qst.nextIdx = idx + 1
|
|
r := &a[idx]
|
|
r.multiTenant = true
|
|
r.query = query
|
|
r.timeRangeSecs = timeRangeMsecs / 1000
|
|
r.registerTime = registerTime
|
|
r.duration = duration
|
|
}
|
|
|
|
func (r *queryStatRecord) matches(apFilter *accountProjectFilter, currentTime time.Time, maxLifetime time.Duration) bool {
|
|
if r.query == "" || currentTime.Sub(r.registerTime) > maxLifetime {
|
|
return false
|
|
}
|
|
if apFilter != nil && (apFilter.accountID != r.accountID || apFilter.projectID != r.projectID) {
|
|
return false
|
|
}
|
|
return true
|
|
}
|
|
|
|
func (r *queryStatRecord) key() queryStatKey {
|
|
return queryStatKey{
|
|
accountID: r.accountID,
|
|
projectID: r.projectID,
|
|
query: r.query,
|
|
timeRangeSecs: r.timeRangeSecs,
|
|
multiTenant: r.multiTenant,
|
|
}
|
|
}
|
|
|
|
func (qst *queryStatsTracker) getTopByCount(topN int, apFilter *accountProjectFilter, maxLifetime time.Duration) []queryStatByCount {
|
|
currentTime := time.Now()
|
|
qst.mu.Lock()
|
|
m := make(map[queryStatKey]int)
|
|
for _, r := range qst.a {
|
|
if r.matches(apFilter, currentTime, maxLifetime) {
|
|
k := r.key()
|
|
m[k] = m[k] + 1
|
|
}
|
|
}
|
|
qst.mu.Unlock()
|
|
|
|
var a []queryStatByCount
|
|
for k, count := range m {
|
|
a = append(a, queryStatByCount{
|
|
accountID: k.accountID,
|
|
projectID: k.projectID,
|
|
query: k.query,
|
|
timeRangeSecs: k.timeRangeSecs,
|
|
count: count,
|
|
multiTenant: k.multiTenant,
|
|
})
|
|
}
|
|
sort.Slice(a, func(i, j int) bool {
|
|
return a[i].count > a[j].count
|
|
})
|
|
if len(a) > topN {
|
|
a = a[:topN]
|
|
}
|
|
return a
|
|
}
|
|
|
|
type queryStatByCount struct {
|
|
accountID uint32
|
|
projectID uint32
|
|
query string
|
|
timeRangeSecs int64
|
|
count int
|
|
multiTenant bool
|
|
}
|
|
|
|
func (qst *queryStatsTracker) getTopByAvgDuration(topN int, apFilter *accountProjectFilter, maxLifetime time.Duration) []queryStatByDuration {
|
|
currentTime := time.Now()
|
|
qst.mu.Lock()
|
|
type countSum struct {
|
|
count int
|
|
sum time.Duration
|
|
}
|
|
m := make(map[queryStatKey]countSum)
|
|
for _, r := range qst.a {
|
|
if r.matches(apFilter, currentTime, maxLifetime) {
|
|
k := r.key()
|
|
ks := m[k]
|
|
ks.count++
|
|
ks.sum += r.duration
|
|
m[k] = ks
|
|
}
|
|
}
|
|
qst.mu.Unlock()
|
|
|
|
var a []queryStatByDuration
|
|
for k, ks := range m {
|
|
a = append(a, queryStatByDuration{
|
|
accountID: k.accountID,
|
|
projectID: k.projectID,
|
|
query: k.query,
|
|
timeRangeSecs: k.timeRangeSecs,
|
|
duration: ks.sum / time.Duration(ks.count),
|
|
count: ks.count,
|
|
multiTenant: k.multiTenant,
|
|
})
|
|
}
|
|
sort.Slice(a, func(i, j int) bool {
|
|
return a[i].duration > a[j].duration
|
|
})
|
|
if len(a) > topN {
|
|
a = a[:topN]
|
|
}
|
|
return a
|
|
}
|
|
|
|
type queryStatByDuration struct {
|
|
accountID uint32
|
|
projectID uint32
|
|
query string
|
|
timeRangeSecs int64
|
|
duration time.Duration
|
|
count int
|
|
multiTenant bool
|
|
}
|
|
|
|
func (qst *queryStatsTracker) getTopBySumDuration(topN int, apFilter *accountProjectFilter, maxLifetime time.Duration) []queryStatByDuration {
|
|
currentTime := time.Now()
|
|
qst.mu.Lock()
|
|
type countDuration struct {
|
|
count int
|
|
sum time.Duration
|
|
}
|
|
m := make(map[queryStatKey]countDuration)
|
|
for _, r := range qst.a {
|
|
if r.matches(apFilter, currentTime, maxLifetime) {
|
|
k := r.key()
|
|
kd := m[k]
|
|
kd.count++
|
|
kd.sum += r.duration
|
|
m[k] = kd
|
|
}
|
|
}
|
|
qst.mu.Unlock()
|
|
|
|
var a []queryStatByDuration
|
|
for k, kd := range m {
|
|
a = append(a, queryStatByDuration{
|
|
accountID: k.accountID,
|
|
projectID: k.projectID,
|
|
query: k.query,
|
|
timeRangeSecs: k.timeRangeSecs,
|
|
duration: kd.sum,
|
|
count: kd.count,
|
|
multiTenant: k.multiTenant,
|
|
})
|
|
}
|
|
sort.Slice(a, func(i, j int) bool {
|
|
return a[i].duration > a[j].duration
|
|
})
|
|
if len(a) > topN {
|
|
a = a[:topN]
|
|
}
|
|
return a
|
|
}
|