VictoriaMetrics/lib/logstorage/stats_max.go

176 lines
3.9 KiB
Go
Raw Permalink Normal View History

package logstorage
import (
"math"
2024-05-20 02:08:30 +00:00
"strings"
"unsafe"
2024-05-20 02:08:30 +00:00
"github.com/VictoriaMetrics/VictoriaMetrics/lib/bytesutil"
"github.com/VictoriaMetrics/VictoriaMetrics/lib/logger"
)
// statsMax describes a `max(...)` stats function.
//
// Instances are built by parseStatsMax.
type statsMax struct {
	// fields lists the field names passed to max().
	//
	// When it is empty, the processor considers all the columns
	// of the processed block.
	fields []string
}
func (sm *statsMax) String() string {
2024-05-22 19:01:20 +00:00
return "max(" + statsFuncFieldsToString(sm.fields) + ")"
}
2024-05-20 02:08:30 +00:00
func (sm *statsMax) updateNeededFields(neededFields fieldsSet) {
2024-05-22 19:01:20 +00:00
updateNeededFieldsForStatsFunc(neededFields, sm.fields)
}
func (sm *statsMax) newStatsProcessor() (statsProcessor, int) {
smp := &statsMaxProcessor{
2024-05-20 02:08:30 +00:00
sm: sm,
}
return smp, int(unsafe.Sizeof(*smp))
}
type statsMaxProcessor struct {
sm *statsMax
2024-05-22 19:01:20 +00:00
max string
}
func (smp *statsMaxProcessor) updateStatsForAllRows(br *blockResult) int {
2024-05-20 02:08:30 +00:00
maxLen := len(smp.max)
2024-05-22 19:01:20 +00:00
if len(smp.sm.fields) == 0 {
2024-05-20 02:08:30 +00:00
// Find the minimum value across all the columns
for _, c := range br.getColumns() {
2024-05-20 02:08:30 +00:00
smp.updateStateForColumn(br, c)
}
} else {
2024-05-20 02:08:30 +00:00
// Find the minimum value across the requested columns
for _, field := range smp.sm.fields {
c := br.getColumnByName(field)
2024-05-20 02:08:30 +00:00
smp.updateStateForColumn(br, c)
}
}
2024-05-20 02:08:30 +00:00
return len(smp.max) - maxLen
}
func (smp *statsMaxProcessor) updateStatsForRow(br *blockResult, rowIdx int) int {
2024-05-20 02:08:30 +00:00
maxLen := len(smp.max)
2024-05-22 19:01:20 +00:00
if len(smp.sm.fields) == 0 {
2024-05-20 02:08:30 +00:00
// Find the minimum value across all the fields for the given row
for _, c := range br.getColumns() {
2024-05-20 02:08:30 +00:00
v := c.getValueAtRow(br, rowIdx)
smp.updateStateString(v)
}
} else {
2024-05-20 02:08:30 +00:00
// Find the minimum value across the requested fields for the given row
for _, field := range smp.sm.fields {
c := br.getColumnByName(field)
2024-05-20 02:08:30 +00:00
v := c.getValueAtRow(br, rowIdx)
smp.updateStateString(v)
}
}
2024-05-20 02:08:30 +00:00
return maxLen - len(smp.max)
}
func (smp *statsMaxProcessor) mergeState(sfp statsProcessor) {
src := sfp.(*statsMaxProcessor)
2024-05-22 19:01:20 +00:00
smp.updateStateString(src.max)
}
2024-05-20 02:08:30 +00:00
func (smp *statsMaxProcessor) updateStateForColumn(br *blockResult, c *blockResultColumn) {
if br.rowsLen == 0 {
2024-05-20 02:08:30 +00:00
return
}
if c.isTime {
timestamp, ok := TryParseTimestampRFC3339Nano(smp.max)
if !ok {
timestamp = -1 << 63
}
maxTimestamp := br.getMaxTimestamp(timestamp)
if maxTimestamp <= timestamp {
return
}
2024-05-20 02:08:30 +00:00
bb := bbPool.Get()
bb.B = marshalTimestampRFC3339NanoString(bb.B[:0], maxTimestamp)
smp.updateStateBytes(bb.B)
bbPool.Put(bb)
return
}
if c.isConst {
// Special case for const column
v := c.valuesEncoded[0]
smp.updateStateString(v)
return
}
switch c.valueType {
case valueTypeString:
for _, v := range c.getValuesEncoded(br) {
smp.updateStateString(v)
}
case valueTypeDict:
for _, v := range c.dictValues {
smp.updateStateString(v)
}
case valueTypeUint8, valueTypeUint16, valueTypeUint32, valueTypeUint64:
bb := bbPool.Get()
bb.B = marshalUint64String(bb.B[:0], c.maxValue)
smp.updateStateBytes(bb.B)
bbPool.Put(bb)
case valueTypeFloat64:
f := math.Float64frombits(c.maxValue)
bb := bbPool.Get()
bb.B = marshalFloat64String(bb.B[:0], f)
smp.updateStateBytes(bb.B)
bbPool.Put(bb)
case valueTypeIPv4:
bb := bbPool.Get()
bb.B = marshalIPv4String(bb.B[:0], uint32(c.maxValue))
smp.updateStateBytes(bb.B)
bbPool.Put(bb)
case valueTypeTimestampISO8601:
bb := bbPool.Get()
bb.B = marshalTimestampISO8601String(bb.B[:0], int64(c.maxValue))
smp.updateStateBytes(bb.B)
bbPool.Put(bb)
default:
logger.Panicf("BUG: unknown valueType=%d", c.valueType)
}
}
// updateStateBytes is the []byte flavour of updateStateString.
//
// b is viewed as a string via bytesutil.ToUnsafeString (presumably without
// copying - confirm in bytesutil). The caller may reuse b afterwards, since
// updateStateString clones the value before storing it.
func (smp *statsMaxProcessor) updateStateBytes(b []byte) {
	smp.updateStateString(bytesutil.ToUnsafeString(b))
}
func (smp *statsMaxProcessor) updateStateString(v string) {
2024-05-22 19:01:20 +00:00
if v == "" {
// Skip empty strings
return
}
if smp.max != "" && !lessString(smp.max, v) {
2024-05-20 02:08:30 +00:00
return
}
smp.max = strings.Clone(v)
}
func (smp *statsMaxProcessor) finalizeStats() string {
2024-05-20 02:08:30 +00:00
return smp.max
}
func parseStatsMax(lex *lexer) (*statsMax, error) {
2024-05-22 19:01:20 +00:00
fields, err := parseStatsFuncFields(lex, "max")
if err != nil {
return nil, err
}
sm := &statsMax{
2024-05-22 19:01:20 +00:00
fields: fields,
}
return sm, nil
}