2019-05-22 21:16:55 +00:00
package promql
import (
2019-05-24 13:12:31 +00:00
"flag"
2019-05-22 21:16:55 +00:00
"fmt"
"math"
"sort"
2020-11-11 10:38:44 +00:00
"strings"
2019-05-22 21:16:55 +00:00
"sync"
"sync/atomic"
2019-05-24 13:12:31 +00:00
"time"
2019-05-22 21:16:55 +00:00
"github.com/VictoriaMetrics/VictoriaMetrics/app/vmselect/netstorage"
2020-12-25 14:44:26 +00:00
"github.com/VictoriaMetrics/VictoriaMetrics/app/vmselect/querystats"
2021-03-15 10:35:44 +00:00
"github.com/VictoriaMetrics/VictoriaMetrics/lib/decimal"
2024-04-25 10:54:42 +00:00
"github.com/VictoriaMetrics/VictoriaMetrics/lib/logger"
2022-05-31 23:29:19 +00:00
"github.com/VictoriaMetrics/VictoriaMetrics/lib/querytracer"
2021-09-23 22:19:59 +00:00
"github.com/VictoriaMetrics/VictoriaMetrics/lib/storage"
2019-05-22 21:16:55 +00:00
"github.com/VictoriaMetrics/metrics"
2020-04-28 12:28:22 +00:00
"github.com/VictoriaMetrics/metricsql"
2019-05-22 21:16:55 +00:00
)
2020-11-11 10:38:44 +00:00
// Command-line flags which control query execution in this package.
var (
	// maxResponseSeries limits the number of series a single query may return.
	// Exec enforces the limit only when the value is bigger than zero.
	maxResponseSeries = flag.Int("search.maxResponseSeries", 0, "The maximum number of time series which can be returned from /api/v1/query and /api/v1/query_range . "+
		"The limit is disabled if it equals to 0. See also -search.maxPointsPerTimeseries and -search.maxUniqueTimeseries")

	// treatDotsAsIsInRegexps enables escaping of dots in regexp label filters
	// when a query is parsed. See escapeDotsInRegexpLabelFilters.
	treatDotsAsIsInRegexps = flag.Bool("search.treatDotsAsIsInRegexps", false, "Whether to treat dots as is in regexp label filters used in queries. "+
		` For example, foo { bar=~"a.b.c"} will be automatically converted to foo { bar=~"a\\.b\\.c"}, i.e. all the dots in regexp filters will be automatically escaped `+
		` in order to match only dot char instead of matching any char. Dots in ".+", ".*" and ". { n}" regexps aren't escaped. `+
		` This option is DEPRECATED in favor of { __graphite__="a.*.c"} syntax for selecting metrics matching the given Graphite metrics filter `)

	// disableImplicitConversion makes Exec reject queries which metricsql.IsLikelyInvalid reports.
	disableImplicitConversion = flag.Bool("search.disableImplicitConversion", false, "Whether to return an error for queries that rely on implicit subquery conversions, "+
		"see https://docs.victoriametrics.com/metricsql/#subqueries for details. "+
		"See also -search.logImplicitConversion.")

	// logImplicitConversion makes Exec log a warning for queries which metricsql.IsLikelyInvalid reports.
	logImplicitConversion = flag.Bool("search.logImplicitConversion", false, "Whether to log queries with implicit subquery conversions, "+
		"see https://docs.victoriametrics.com/metricsql/#subqueries for details. "+
		"Such conversion can be disabled using -search.disableImplicitConversion.")
)
2019-05-24 13:12:31 +00:00
2022-08-15 10:50:14 +00:00
// UserReadableError wraps an error which is supposed to be returned to the user
// as is, without any additional context.
type UserReadableError struct {
	// Err is the wrapped error, which needs to be returned to the user.
	Err error
}

// Unwrap returns the wrapped error.
//
// It is used by the standard errors package. See https://golang.org/pkg/errors
func (e *UserReadableError) Unwrap() error {
	wrapped := e.Err
	return wrapped
}

// Error implements the error interface by returning the message of the wrapped error.
func (e *UserReadableError) Error() string {
	wrapped := e.Err
	return wrapped.Error()
}
2019-07-01 14:14:49 +00:00
// Exec executes q for the given ec.
2022-05-31 23:29:19 +00:00
func Exec ( qt * querytracer . Tracer , ec * EvalConfig , q string , isFirstPointOnly bool ) ( [ ] netstorage . Result , error ) {
2020-12-25 14:44:26 +00:00
if querystats . Enabled ( ) {
startTime := time . Now ( )
2023-11-01 15:42:51 +00:00
defer func ( ) {
querystats . RegisterQuery ( q , ec . End - ec . Start , startTime )
ec . QueryStats . addExecutionTimeMsec ( startTime )
} ( )
2020-12-25 14:42:05 +00:00
}
2019-05-24 13:12:31 +00:00
2019-05-22 21:16:55 +00:00
ec . validate ( )
e , err := parsePromQLWithCache ( q )
if err != nil {
2020-07-08 15:55:25 +00:00
return nil , err
2019-05-22 21:16:55 +00:00
}
2024-04-25 10:54:42 +00:00
if * disableImplicitConversion || * logImplicitConversion {
2024-07-02 22:37:37 +00:00
isInvalid := metricsql . IsLikelyInvalid ( e )
if isInvalid && * disableImplicitConversion {
2024-06-17 12:21:16 +00:00
// we don't add query=%q to err message as it will be added by the caller
2024-07-02 22:37:37 +00:00
return nil , fmt . Errorf ( "query requires implicit conversion and is rejected according to -search.disableImplicitConversion command-line flag. " +
"See https://docs.victoriametrics.com/metricsql/#implicit-query-conversions for details" )
2024-04-25 10:54:42 +00:00
}
2024-07-02 22:37:37 +00:00
if isInvalid && * logImplicitConversion {
2024-06-17 12:21:16 +00:00
logger . Warnf ( "query=%q requires implicit conversion, see https://docs.victoriametrics.com/metricsql/#implicit-query-conversions for details" , e . AppendString ( nil ) )
2024-04-25 10:54:42 +00:00
}
}
2020-07-08 15:55:25 +00:00
qid := activeQueriesV . Add ( ec , q )
2022-05-31 23:29:19 +00:00
rv , err := evalExpr ( qt , ec , e )
2020-07-08 15:55:25 +00:00
activeQueriesV . Remove ( qid )
2019-05-22 21:16:55 +00:00
if err != nil {
2020-07-08 15:55:25 +00:00
return nil , err
2019-05-22 21:16:55 +00:00
}
2019-07-01 14:14:49 +00:00
if isFirstPointOnly {
// Remove all the points except the first one from every time series.
for _ , ts := range rv {
ts . Values = ts . Values [ : 1 ]
ts . Timestamps = ts . Timestamps [ : 1 ]
}
2022-05-31 23:29:19 +00:00
qt . Printf ( "leave only the first point in every series" )
2019-07-01 14:14:49 +00:00
}
2023-09-01 07:34:16 +00:00
maySort := maySortResults ( e )
2019-05-22 21:16:55 +00:00
result , err := timeseriesToResult ( rv , maySort )
2023-12-09 22:50:35 +00:00
if * maxResponseSeries > 0 && len ( result ) > * maxResponseSeries {
return nil , fmt . Errorf ( "the response contains more than -search.maxResponseSeries=%d time series: %d series; either increase -search.maxResponseSeries " +
"or change the query in order to return smaller number of series" , * maxResponseSeries , len ( result ) )
}
2019-05-22 21:16:55 +00:00
if err != nil {
2020-07-08 15:55:25 +00:00
return nil , err
2019-05-22 21:16:55 +00:00
}
2022-05-31 23:29:19 +00:00
if maySort {
qt . Printf ( "sort series by metric name and labels" )
} else {
qt . Printf ( "do not sort series by metric name and labels" )
}
2021-03-15 10:35:44 +00:00
if n := ec . RoundDigits ; n < 100 {
for i := range result {
values := result [ i ] . Values
for j , v := range values {
values [ j ] = decimal . RoundToDecimalDigits ( v , n )
}
}
2022-05-31 23:29:19 +00:00
qt . Printf ( "round series values to %d decimal digits after the point" , n )
2021-03-15 10:35:44 +00:00
}
2022-08-15 10:38:47 +00:00
return result , nil
2019-05-22 21:16:55 +00:00
}
2023-09-01 07:34:16 +00:00
func maySortResults ( e metricsql . Expr ) bool {
2021-04-07 21:09:34 +00:00
switch v := e . ( type ) {
case * metricsql . FuncExpr :
switch strings . ToLower ( v . Name ) {
case "sort" , "sort_desc" ,
2022-09-14 14:41:09 +00:00
"sort_by_label" , "sort_by_label_desc" ,
"sort_by_label_numeric" , "sort_by_label_numeric_desc" :
2024-01-15 23:30:07 +00:00
// Results already sorted
2021-04-07 21:09:34 +00:00
return false
}
case * metricsql . AggrFuncExpr :
switch strings . ToLower ( v . Name ) {
case "topk" , "bottomk" , "outliersk" ,
2021-09-30 10:22:52 +00:00
"topk_max" , "topk_min" , "topk_avg" , "topk_median" , "topk_last" ,
"bottomk_max" , "bottomk_min" , "bottomk_avg" , "bottomk_median" , "bottomk_last" :
2024-01-15 23:30:07 +00:00
// Results already sorted
2021-04-07 21:09:34 +00:00
return false
}
2023-09-25 14:14:14 +00:00
case * metricsql . BinaryOpExpr :
2024-05-12 08:20:39 +00:00
if strings . EqualFold ( v . Op , "or" ) {
2023-09-25 14:14:14 +00:00
// Do not sort results for `a or b` in the same way as Prometheus does.
// See https://github.com/VictoriaMetrics/VictoriaMetrics/issues/4763
return false
}
2019-05-22 21:16:55 +00:00
}
2021-04-07 21:09:34 +00:00
return true
2019-05-22 21:16:55 +00:00
}
func timeseriesToResult ( tss [ ] * timeseries , maySort bool ) ( [ ] netstorage . Result , error ) {
2022-04-20 16:53:24 +00:00
tss = removeEmptySeries ( tss )
2024-01-15 23:30:07 +00:00
if maySort {
sortSeriesByMetricName ( tss )
}
2019-05-22 21:16:55 +00:00
result := make ( [ ] netstorage . Result , len ( tss ) )
2019-08-20 19:51:45 +00:00
m := make ( map [ string ] struct { } , len ( tss ) )
2019-05-22 21:16:55 +00:00
bb := bbPool . Get ( )
for i , ts := range tss {
2021-09-23 22:19:59 +00:00
bb . B = marshalMetricNameSorted ( bb . B [ : 0 ] , & ts . MetricName )
2023-10-10 11:44:02 +00:00
k := string ( bb . B )
2023-01-10 06:19:53 +00:00
if _ , ok := m [ k ] ; ok {
2019-11-23 22:02:18 +00:00
return nil , fmt . Errorf ( ` duplicate output timeseries: %s ` , stringMetricName ( & ts . MetricName ) )
2019-05-22 21:16:55 +00:00
}
2023-01-10 06:19:53 +00:00
m [ k ] = struct { } { }
2019-05-22 21:16:55 +00:00
rs := & result [ i ]
2023-01-10 06:38:31 +00:00
rs . MetricName . MoveFrom ( & ts . MetricName )
rs . Values = ts . Values
ts . Values = nil
rs . Timestamps = ts . Timestamps
ts . Timestamps = nil
2019-05-22 21:16:55 +00:00
}
bbPool . Put ( bb )
return result , nil
}
2024-01-15 23:30:07 +00:00
// sortSeriesByMetricName sorts tss in place in the order defined by metricNameLess.
func sortSeriesByMetricName(tss []*timeseries) {
	less := func(i, j int) bool {
		left, right := &tss[i].MetricName, &tss[j].MetricName
		return metricNameLess(left, right)
	}
	sort.Slice(tss, less)
}
2021-09-23 22:19:59 +00:00
// metricNameLess reports whether a must be placed before b.
//
// Metric groups are compared first. If they match, then tags are compared pairwise
// by key and then by value. If all the compared tags match, then the name
// with fewer tags goes first.
//
// Tags must be already sorted by the caller.
func metricNameLess(a, b *storage.MetricName) bool {
	if string(a.MetricGroup) != string(b.MetricGroup) {
		return string(a.MetricGroup) < string(b.MetricGroup)
	}

	// Metric groups match. Compare the tags present in both a and b.
	tagsA, tagsB := a.Tags, b.Tags
	common := len(tagsA)
	if len(tagsB) < common {
		common = len(tagsB)
	}
	for i := 0; i < common; i++ {
		ta, tb := &tagsA[i], &tagsB[i]
		if string(ta.Key) != string(tb.Key) {
			return string(ta.Key) < string(tb.Key)
		}
		if string(ta.Value) != string(tb.Value) {
			return string(ta.Value) < string(tb.Value)
		}
	}

	// All the common tags are identical, so the name with fewer tags is considered smaller.
	return len(tagsA) < len(tagsB)
}
2022-04-20 16:53:24 +00:00
func removeEmptySeries ( tss [ ] * timeseries ) [ ] * timeseries {
2019-05-22 21:16:55 +00:00
rvs := tss [ : 0 ]
for _ , ts := range tss {
2019-07-12 16:56:23 +00:00
allNans := true
2019-05-22 21:16:55 +00:00
for _ , v := range ts . Values {
2019-07-12 16:56:23 +00:00
if ! math . IsNaN ( v ) {
allNans = false
break
2019-05-22 21:16:55 +00:00
}
}
2019-07-12 16:56:23 +00:00
if allNans {
2019-05-22 21:16:55 +00:00
// Skip timeseries with all NaNs.
continue
}
rvs = append ( rvs , ts )
}
2019-07-12 16:56:23 +00:00
for i := len ( rvs ) ; i < len ( tss ) ; i ++ {
// Zero unused time series, so GC could reclaim them.
tss [ i ] = nil
}
2019-05-22 21:16:55 +00:00
return rvs
}
2020-08-06 20:18:03 +00:00
func adjustCmpOps ( e metricsql . Expr ) metricsql . Expr {
metricsql . VisitAll ( e , func ( expr metricsql . Expr ) {
be , ok := expr . ( * metricsql . BinaryOpExpr )
if ! ok {
return
}
if ! metricsql . IsBinaryOpCmp ( be . Op ) {
return
}
2020-12-02 10:08:47 +00:00
if isNumberExpr ( be . Right ) || ! isScalarExpr ( be . Left ) {
2020-08-06 20:18:03 +00:00
return
}
// Convert 'num cmpOp query' expression to `query reverseCmpOp num` expression
2020-12-02 10:08:47 +00:00
// like Prometheus does. For instance, `0.5 < foo` must be converted to `foo > 0.5`
2020-08-06 20:18:03 +00:00
// in order to return valid values for `foo` that are bigger than 0.5.
be . Right , be . Left = be . Left , be . Right
be . Op = getReverseCmpOp ( be . Op )
} )
return e
}
2020-12-02 10:08:47 +00:00
// isNumberExpr reports whether e is a *metricsql.NumberExpr.
func isNumberExpr(e metricsql.Expr) bool {
	switch e.(type) {
	case *metricsql.NumberExpr:
		return true
	default:
		return false
	}
}
// isScalarExpr reports whether e is either a number or a call to the time() function.
func isScalarExpr(e metricsql.Expr) bool {
	switch expr := e.(type) {
	case *metricsql.NumberExpr:
		return true
	case *metricsql.FuncExpr:
		// time() returns scalar in PromQL - see https://prometheus.io/docs/prometheus/latest/querying/functions/#time
		return strings.ToLower(expr.Name) == "time"
	default:
		return false
	}
}
2020-08-06 20:18:03 +00:00
// getReverseCmpOp returns the comparison operator to use after swapping the operands of op.
//
// Any op other than `>`, `<`, `>=` and `<=` is returned unchanged.
func getReverseCmpOp(op string) string {
	reversed := op
	switch op {
	case "<":
		reversed = ">"
	case "<=":
		reversed = ">="
	case ">":
		reversed = "<"
	case ">=":
		reversed = "<="
	}
	// there is no need in changing `==` and `!=`.
	return reversed
}
2019-12-25 19:35:47 +00:00
func parsePromQLWithCache ( q string ) ( metricsql . Expr , error ) {
2019-05-22 21:16:55 +00:00
pcv := parseCacheV . Get ( q )
if pcv == nil {
2019-12-25 19:35:47 +00:00
e , err := metricsql . Parse ( q )
2020-08-06 20:18:03 +00:00
if err == nil {
2020-10-07 18:15:06 +00:00
e = metricsql . Optimize ( e )
2020-08-06 20:18:03 +00:00
e = adjustCmpOps ( e )
2020-11-11 10:38:44 +00:00
if * treatDotsAsIsInRegexps {
e = escapeDotsInRegexpLabelFilters ( e )
}
2020-08-06 20:18:03 +00:00
}
2019-05-22 21:16:55 +00:00
pcv = & parseCacheValue {
e : e ,
err : err ,
}
parseCacheV . Put ( q , pcv )
}
if pcv . err != nil {
return nil , pcv . err
}
return pcv . e , nil
}
2020-11-11 10:38:44 +00:00
func escapeDotsInRegexpLabelFilters ( e metricsql . Expr ) metricsql . Expr {
metricsql . VisitAll ( e , func ( expr metricsql . Expr ) {
me , ok := expr . ( * metricsql . MetricExpr )
if ! ok {
return
}
2023-07-16 06:48:21 +00:00
for _ , lfs := range me . LabelFilterss {
for i := range lfs {
f := & lfs [ i ]
if f . IsRegexp {
f . Value = escapeDots ( f . Value )
}
2020-11-11 10:38:44 +00:00
}
}
} )
return e
}
// escapeDots escapes dots in the regexp s, so they match only the dot char.
//
// A dot is left as is in the following cases:
//   - it is already escaped, i.e. it is preceded by an odd number of `\` chars;
//   - it is followed by a regexp modifier such as '+', '*' or '{'.
//
// A dot preceded by an even number of `\` chars (for example, `\\.`) isn't escaped yet,
// since these `\` chars escape each other, so such a dot is escaped too.
func escapeDots(s string) string {
	dotsCount := strings.Count(s, ".")
	if dotsCount <= 0 {
		return s
	}
	// At most one `\` is added per dot.
	result := make([]byte, 0, len(s)+dotsCount)
	// backslashes is the length of the run of `\` chars located right before s[i].
	backslashes := 0
	for i := 0; i < len(s); i++ {
		c := s[i]
		if c == '\\' {
			backslashes++
			result = append(result, c)
			continue
		}
		isEscaped := backslashes%2 == 1
		backslashes = 0
		if c != '.' || isEscaped {
			result = append(result, c)
			continue
		}
		hasModifier := i+1 < len(s) && (s[i+1] == '*' || s[i+1] == '+' || s[i+1] == '{')
		if hasModifier {
			result = append(result, c)
			continue
		}
		result = append(result, '\\', '.')
	}
	return string(result)
}
2019-05-22 21:16:55 +00:00
// parseCacheV is the package-wide cache for parsed queries.
//
// Its initializer also registers gauges which expose the number of cache requests,
// cache misses and cached entries.
var parseCacheV = func() *parseCache {
	pc := &parseCache{
		m: make(map[string]*parseCacheValue),
	}
	// Metric names mustn't contain whitespace around the name, the braces and the labels.
	metrics.NewGauge(`vm_cache_requests_total{type="promql/parse"}`, func() float64 {
		return float64(pc.Requests())
	})
	metrics.NewGauge(`vm_cache_misses_total{type="promql/parse"}`, func() float64 {
		return float64(pc.Misses())
	})
	metrics.NewGauge(`vm_cache_entries{type="promql/parse"}`, func() float64 {
		return float64(pc.Len())
	})
	return pc
}()
// parseCacheMaxLen is the number of entries above which parseCache.Put evicts a part of the cached items.
const parseCacheMaxLen = 10e3
type parseCacheValue struct {
2019-12-25 19:35:47 +00:00
e metricsql . Expr
2019-05-22 21:16:55 +00:00
err error
}
type parseCache struct {
2024-02-24 00:44:19 +00:00
requests atomic . Uint64
misses atomic . Uint64
2019-10-17 15:22:56 +00:00
m map [ string ] * parseCacheValue
mu sync . RWMutex
2019-05-22 21:16:55 +00:00
}
func ( pc * parseCache ) Requests ( ) uint64 {
2024-02-24 00:44:19 +00:00
return pc . requests . Load ( )
2019-05-22 21:16:55 +00:00
}
func ( pc * parseCache ) Misses ( ) uint64 {
2024-02-24 00:44:19 +00:00
return pc . misses . Load ( )
2019-05-22 21:16:55 +00:00
}
func ( pc * parseCache ) Len ( ) uint64 {
pc . mu . RLock ( )
n := len ( pc . m )
pc . mu . RUnlock ( )
return uint64 ( n )
}
func ( pc * parseCache ) Get ( q string ) * parseCacheValue {
2024-02-24 00:44:19 +00:00
pc . requests . Add ( 1 )
2019-05-22 21:16:55 +00:00
pc . mu . RLock ( )
pcv := pc . m [ q ]
pc . mu . RUnlock ( )
if pcv == nil {
2024-02-24 00:44:19 +00:00
pc . misses . Add ( 1 )
2019-05-22 21:16:55 +00:00
}
return pcv
}
func ( pc * parseCache ) Put ( q string , pcv * parseCacheValue ) {
pc . mu . Lock ( )
overflow := len ( pc . m ) - parseCacheMaxLen
if overflow > 0 {
// Remove 10% of items from the cache.
overflow = int ( float64 ( len ( pc . m ) ) * 0.1 )
for k := range pc . m {
delete ( pc . m , k )
overflow --
if overflow <= 0 {
break
}
}
}
pc . m [ q ] = pcv
pc . mu . Unlock ( )
}