VictoriaMetrics/lib/logstorage/stats_min.go

178 lines
3.9 KiB
Go
Raw Normal View History

2024-05-01 00:08:37 +00:00
package logstorage
import (
2024-05-15 13:46:42 +00:00
"math"
2024-05-15 11:07:15 +00:00
"strings"
2024-05-01 00:08:37 +00:00
"unsafe"
2024-05-15 11:23:51 +00:00
"github.com/VictoriaMetrics/VictoriaMetrics/lib/bytesutil"
2024-05-15 13:46:42 +00:00
"github.com/VictoriaMetrics/VictoriaMetrics/lib/logger"
2024-05-01 00:08:37 +00:00
)
// statsMin holds the configuration of the `min(...)` stats function.
type statsMin struct {
	// fields lists the names of the fields to take the minimum over.
	//
	// An empty list means that all the fields are inspected.
	fields []string
}
func (sm *statsMin) String() string {
2024-05-22 09:25:49 +00:00
return "min(" + statsFuncFieldsToString(sm.fields) + ")"
2024-05-01 00:08:37 +00:00
}
2024-05-17 02:11:10 +00:00
func (sm *statsMin) updateNeededFields(neededFields fieldsSet) {
2024-05-22 09:25:49 +00:00
updateNeededFieldsForStatsFunc(neededFields, sm.fields)
2024-05-01 00:08:37 +00:00
}
func (sm *statsMin) newStatsProcessor() (statsProcessor, int) {
smp := &statsMinProcessor{
2024-05-15 11:07:15 +00:00
sm: sm,
2024-05-01 00:08:37 +00:00
}
return smp, int(unsafe.Sizeof(*smp))
}
type statsMinProcessor struct {
sm *statsMin
2024-05-21 19:18:05 +00:00
min string
2024-05-01 00:08:37 +00:00
}
func (smp *statsMinProcessor) updateStatsForAllRows(br *blockResult) int {
2024-05-15 11:07:15 +00:00
minLen := len(smp.min)
2024-05-22 09:25:49 +00:00
fields := smp.sm.fields
if len(fields) == 0 {
2024-05-01 00:08:37 +00:00
// Find the minimum value across all the columns
for _, c := range br.getColumns() {
2024-05-15 11:23:51 +00:00
smp.updateStateForColumn(br, c)
2024-05-01 00:08:37 +00:00
}
2024-05-03 12:03:17 +00:00
} else {
// Find the minimum value across the requested columns
2024-05-22 09:25:49 +00:00
for _, field := range fields {
2024-05-03 12:03:17 +00:00
c := br.getColumnByName(field)
2024-05-15 11:23:51 +00:00
smp.updateStateForColumn(br, c)
2024-05-01 00:08:37 +00:00
}
}
2024-05-15 11:07:15 +00:00
return len(smp.min) - minLen
2024-05-01 00:08:37 +00:00
}
func (smp *statsMinProcessor) updateStatsForRow(br *blockResult, rowIdx int) int {
2024-05-15 11:07:15 +00:00
minLen := len(smp.min)
2024-05-22 09:25:49 +00:00
fields := smp.sm.fields
if len(fields) == 0 {
2024-05-01 00:08:37 +00:00
// Find the minimum value across all the fields for the given row
for _, c := range br.getColumns() {
2024-05-15 11:07:15 +00:00
v := c.getValueAtRow(br, rowIdx)
2024-05-15 13:46:42 +00:00
smp.updateStateString(v)
2024-05-01 00:08:37 +00:00
}
2024-05-03 12:03:17 +00:00
} else {
// Find the minimum value across the requested fields for the given row
2024-05-22 09:25:49 +00:00
for _, field := range fields {
2024-05-03 12:03:17 +00:00
c := br.getColumnByName(field)
2024-05-15 11:07:15 +00:00
v := c.getValueAtRow(br, rowIdx)
2024-05-15 13:46:42 +00:00
smp.updateStateString(v)
2024-05-01 00:08:37 +00:00
}
}
2024-05-15 11:07:15 +00:00
return minLen - len(smp.min)
2024-05-01 00:08:37 +00:00
}
func (smp *statsMinProcessor) mergeState(sfp statsProcessor) {
src := sfp.(*statsMinProcessor)
2024-05-21 16:56:35 +00:00
smp.updateStateString(src.min)
2024-05-01 00:08:37 +00:00
}
2024-05-15 11:23:51 +00:00
func (smp *statsMinProcessor) updateStateForColumn(br *blockResult, c *blockResultColumn) {
2024-05-15 13:46:42 +00:00
if len(br.timestamps) == 0 {
return
}
2024-05-15 11:23:51 +00:00
if c.isTime {
// Special case for time column
timestamps := br.timestamps
minTimestamp := timestamps[0]
for _, timestamp := range timestamps[1:] {
if timestamp < minTimestamp {
minTimestamp = timestamp
}
}
bb := bbPool.Get()
2024-05-15 13:46:42 +00:00
bb.B = marshalTimestampRFC3339NanoString(bb.B[:0], minTimestamp)
smp.updateStateBytes(bb.B)
2024-05-15 11:23:51 +00:00
bbPool.Put(bb)
return
}
if c.isConst {
// Special case for const column
2024-05-15 20:19:21 +00:00
v := c.valuesEncoded[0]
2024-05-15 13:46:42 +00:00
smp.updateStateString(v)
2024-05-15 11:23:51 +00:00
return
}
2024-05-15 13:46:42 +00:00
switch c.valueType {
case valueTypeString:
2024-05-15 20:19:21 +00:00
for _, v := range c.getValuesEncoded(br) {
2024-05-15 13:46:42 +00:00
smp.updateStateString(v)
}
case valueTypeDict:
for _, v := range c.dictValues {
smp.updateStateString(v)
}
2024-05-15 14:04:10 +00:00
case valueTypeUint8, valueTypeUint16, valueTypeUint32, valueTypeUint64:
2024-05-15 13:46:42 +00:00
bb := bbPool.Get()
2024-05-17 02:11:10 +00:00
bb.B = marshalUint64String(bb.B[:0], c.minValue)
2024-05-15 13:46:42 +00:00
smp.updateStateBytes(bb.B)
bbPool.Put(bb)
case valueTypeFloat64:
2024-05-17 02:11:10 +00:00
f := math.Float64frombits(c.minValue)
2024-05-15 13:46:42 +00:00
bb := bbPool.Get()
2024-05-15 14:04:10 +00:00
bb.B = marshalFloat64String(bb.B[:0], f)
2024-05-15 13:46:42 +00:00
smp.updateStateBytes(bb.B)
bbPool.Put(bb)
case valueTypeIPv4:
bb := bbPool.Get()
2024-05-17 02:11:10 +00:00
bb.B = marshalIPv4String(bb.B[:0], uint32(c.minValue))
2024-05-15 13:46:42 +00:00
smp.updateStateBytes(bb.B)
bbPool.Put(bb)
case valueTypeTimestampISO8601:
bb := bbPool.Get()
2024-05-17 02:11:10 +00:00
bb.B = marshalTimestampISO8601String(bb.B[:0], int64(c.minValue))
2024-05-15 13:46:42 +00:00
smp.updateStateBytes(bb.B)
bbPool.Put(bb)
default:
logger.Panicf("BUG: unknown valueType=%d", c.valueType)
2024-05-15 11:23:51 +00:00
}
}
2024-05-15 13:46:42 +00:00
// updateStateBytes folds the value held in b into the running minimum.
//
// b is viewed as a string via bytesutil.ToUnsafeString and handed to
// updateStateString, which clones the value before storing it.
func (smp *statsMinProcessor) updateStateBytes(b []byte) {
	smp.updateStateString(bytesutil.ToUnsafeString(b))
}
func (smp *statsMinProcessor) updateStateString(v string) {
2024-05-21 12:19:09 +00:00
if v == "" {
// Skip empty strings
return
}
2024-05-21 16:56:35 +00:00
if smp.min != "" && !lessString(v, smp.min) {
2024-05-15 11:07:15 +00:00
return
}
smp.min = strings.Clone(v)
}
2024-05-01 00:08:37 +00:00
func (smp *statsMinProcessor) finalizeStats() string {
2024-05-15 11:07:15 +00:00
return smp.min
2024-05-01 00:08:37 +00:00
}
func parseStatsMin(lex *lexer) (*statsMin, error) {
2024-05-22 09:25:49 +00:00
fields, err := parseStatsFuncFields(lex, "min")
2024-05-01 00:08:37 +00:00
if err != nil {
2024-05-03 09:15:09 +00:00
return nil, err
2024-05-01 00:08:37 +00:00
}
sm := &statsMin{
2024-05-21 21:56:03 +00:00
fields: fields,
2024-05-01 00:08:37 +00:00
}
return sm, nil
}