2024-05-22 19:01:20 +00:00
|
|
|
package logstorage
|
|
|
|
|
|
|
|
import (
|
|
|
|
"unsafe"
|
|
|
|
|
|
|
|
"github.com/VictoriaMetrics/VictoriaMetrics/lib/bytesutil"
|
|
|
|
)
|
|
|
|
|
2024-05-25 19:36:16 +00:00
|
|
|
func updateNeededFieldsForUnpackPipe(fromField string, outFields []string, keepOriginalFields, skipEmptyResults bool, iff *ifFilter, neededFields, unneededFields fieldsSet) {
|
2024-05-30 14:19:23 +00:00
|
|
|
if neededFields.isEmpty() {
|
|
|
|
if iff != nil {
|
|
|
|
neededFields.addFields(iff.neededFields)
|
|
|
|
}
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
2024-05-25 19:36:16 +00:00
|
|
|
if neededFields.contains("*") {
|
|
|
|
unneededFieldsOrig := unneededFields.clone()
|
|
|
|
unneededFieldsCount := 0
|
|
|
|
if len(outFields) > 0 {
|
|
|
|
for _, f := range outFields {
|
|
|
|
if unneededFieldsOrig.contains(f) {
|
|
|
|
unneededFieldsCount++
|
|
|
|
}
|
|
|
|
if !keepOriginalFields && !skipEmptyResults {
|
|
|
|
unneededFields.add(f)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if len(outFields) == 0 || unneededFieldsCount < len(outFields) {
|
|
|
|
unneededFields.remove(fromField)
|
|
|
|
if iff != nil {
|
|
|
|
unneededFields.removeFields(iff.neededFields)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
neededFieldsOrig := neededFields.clone()
|
|
|
|
needFromField := len(outFields) == 0
|
|
|
|
if len(outFields) > 0 {
|
|
|
|
needFromField = false
|
|
|
|
for _, f := range outFields {
|
|
|
|
if neededFieldsOrig.contains(f) {
|
|
|
|
needFromField = true
|
|
|
|
}
|
|
|
|
if !keepOriginalFields && !skipEmptyResults {
|
|
|
|
neededFields.remove(f)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if needFromField {
|
|
|
|
neededFields.add(fromField)
|
|
|
|
if iff != nil {
|
|
|
|
neededFields.addFields(iff.neededFields)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2024-05-22 19:01:20 +00:00
|
|
|
type fieldsUnpackerContext struct {
|
|
|
|
fieldPrefix string
|
|
|
|
|
|
|
|
fields []Field
|
|
|
|
a arena
|
|
|
|
}
|
|
|
|
|
|
|
|
func (uctx *fieldsUnpackerContext) reset() {
|
|
|
|
uctx.fieldPrefix = ""
|
|
|
|
uctx.resetFields()
|
|
|
|
uctx.a.reset()
|
|
|
|
}
|
|
|
|
|
|
|
|
func (uctx *fieldsUnpackerContext) resetFields() {
|
|
|
|
clear(uctx.fields)
|
|
|
|
uctx.fields = uctx.fields[:0]
|
|
|
|
}
|
|
|
|
|
2024-06-03 22:59:25 +00:00
|
|
|
func (uctx *fieldsUnpackerContext) init(fieldPrefix string) {
|
2024-05-22 19:01:20 +00:00
|
|
|
uctx.reset()
|
|
|
|
|
|
|
|
uctx.fieldPrefix = fieldPrefix
|
|
|
|
}
|
|
|
|
|
|
|
|
func (uctx *fieldsUnpackerContext) addField(name, value string) {
|
|
|
|
nameCopy := ""
|
|
|
|
fieldPrefix := uctx.fieldPrefix
|
|
|
|
if fieldPrefix != "" {
|
2024-05-28 17:29:41 +00:00
|
|
|
b := uctx.a.b
|
|
|
|
bLen := len(b)
|
|
|
|
b = append(b, fieldPrefix...)
|
|
|
|
b = append(b, name...)
|
|
|
|
uctx.a.b = b
|
|
|
|
nameCopy = bytesutil.ToUnsafeString(b[bLen:])
|
2024-05-22 19:01:20 +00:00
|
|
|
} else {
|
|
|
|
nameCopy = uctx.a.copyString(name)
|
|
|
|
}
|
|
|
|
|
|
|
|
valueCopy := uctx.a.copyString(value)
|
|
|
|
|
|
|
|
uctx.fields = append(uctx.fields, Field{
|
|
|
|
Name: nameCopy,
|
|
|
|
Value: valueCopy,
|
|
|
|
})
|
|
|
|
}
|
|
|
|
|
2024-05-25 19:36:16 +00:00
|
|
|
func newPipeUnpackProcessor(workersCount int, unpackFunc func(uctx *fieldsUnpackerContext, s string), ppNext pipeProcessor,
|
2024-05-24 22:30:58 +00:00
|
|
|
fromField string, fieldPrefix string, keepOriginalFields, skipEmptyResults bool, iff *ifFilter) *pipeUnpackProcessor {
|
2024-05-22 19:01:20 +00:00
|
|
|
|
|
|
|
return &pipeUnpackProcessor{
|
|
|
|
unpackFunc: unpackFunc,
|
2024-05-25 19:36:16 +00:00
|
|
|
ppNext: ppNext,
|
2024-05-22 19:01:20 +00:00
|
|
|
|
|
|
|
shards: make([]pipeUnpackProcessorShard, workersCount),
|
|
|
|
|
2024-05-24 22:30:58 +00:00
|
|
|
fromField: fromField,
|
|
|
|
fieldPrefix: fieldPrefix,
|
|
|
|
keepOriginalFields: keepOriginalFields,
|
|
|
|
skipEmptyResults: skipEmptyResults,
|
|
|
|
iff: iff,
|
2024-05-22 19:01:20 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
type pipeUnpackProcessor struct {
|
|
|
|
unpackFunc func(uctx *fieldsUnpackerContext, s string)
|
2024-05-25 19:36:16 +00:00
|
|
|
ppNext pipeProcessor
|
2024-05-22 19:01:20 +00:00
|
|
|
|
|
|
|
shards []pipeUnpackProcessorShard
|
|
|
|
|
2024-05-24 22:30:58 +00:00
|
|
|
fromField string
|
|
|
|
fieldPrefix string
|
|
|
|
keepOriginalFields bool
|
|
|
|
skipEmptyResults bool
|
2024-05-22 19:01:20 +00:00
|
|
|
|
|
|
|
iff *ifFilter
|
|
|
|
}
|
|
|
|
|
|
|
|
type pipeUnpackProcessorShard struct {
|
|
|
|
pipeUnpackProcessorShardNopad
|
|
|
|
|
|
|
|
// The padding prevents false sharing on widespread platforms with 128 mod (cache line size) = 0 .
|
|
|
|
_ [128 - unsafe.Sizeof(pipeUnpackProcessorShardNopad{})%128]byte
|
|
|
|
}
|
|
|
|
|
|
|
|
type pipeUnpackProcessorShardNopad struct {
|
|
|
|
bm bitmap
|
|
|
|
|
|
|
|
uctx fieldsUnpackerContext
|
|
|
|
wctx pipeUnpackWriteContext
|
|
|
|
}
|
|
|
|
|
|
|
|
func (pup *pipeUnpackProcessor) writeBlock(workerID uint, br *blockResult) {
|
2024-09-25 14:16:53 +00:00
|
|
|
if br.rowsLen == 0 {
|
2024-05-22 19:01:20 +00:00
|
|
|
return
|
|
|
|
}
|
|
|
|
|
|
|
|
shard := &pup.shards[workerID]
|
2024-05-25 19:36:16 +00:00
|
|
|
shard.wctx.init(workerID, pup.ppNext, pup.keepOriginalFields, pup.skipEmptyResults, br)
|
2024-06-03 22:59:25 +00:00
|
|
|
shard.uctx.init(pup.fieldPrefix)
|
2024-05-22 19:01:20 +00:00
|
|
|
|
|
|
|
bm := &shard.bm
|
2024-09-25 14:16:53 +00:00
|
|
|
bm.init(br.rowsLen)
|
2024-05-22 19:01:20 +00:00
|
|
|
bm.setBits()
|
|
|
|
if pup.iff != nil {
|
|
|
|
pup.iff.f.applyToBlockResult(br, bm)
|
|
|
|
if bm.isZero() {
|
2024-05-25 19:36:16 +00:00
|
|
|
pup.ppNext.writeBlock(workerID, br)
|
2024-05-22 19:01:20 +00:00
|
|
|
return
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
c := br.getColumnByName(pup.fromField)
|
|
|
|
if c.isConst {
|
|
|
|
v := c.valuesEncoded[0]
|
|
|
|
shard.uctx.resetFields()
|
|
|
|
pup.unpackFunc(&shard.uctx, v)
|
2024-09-25 14:16:53 +00:00
|
|
|
for rowIdx := 0; rowIdx < br.rowsLen; rowIdx++ {
|
2024-05-22 19:01:20 +00:00
|
|
|
if bm.isSetBit(rowIdx) {
|
|
|
|
shard.wctx.writeRow(rowIdx, shard.uctx.fields)
|
|
|
|
} else {
|
|
|
|
shard.wctx.writeRow(rowIdx, nil)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
values := c.getValues(br)
|
2024-05-25 19:36:16 +00:00
|
|
|
vPrev := ""
|
|
|
|
hadUnpacks := false
|
2024-05-22 19:01:20 +00:00
|
|
|
for i, v := range values {
|
|
|
|
if bm.isSetBit(i) {
|
2024-05-25 19:36:16 +00:00
|
|
|
if !hadUnpacks || vPrev != v {
|
|
|
|
vPrev = v
|
|
|
|
hadUnpacks = true
|
|
|
|
|
2024-05-22 19:01:20 +00:00
|
|
|
shard.uctx.resetFields()
|
|
|
|
pup.unpackFunc(&shard.uctx, v)
|
|
|
|
}
|
|
|
|
shard.wctx.writeRow(i, shard.uctx.fields)
|
|
|
|
} else {
|
|
|
|
shard.wctx.writeRow(i, nil)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
shard.wctx.flush()
|
|
|
|
shard.wctx.reset()
|
|
|
|
shard.uctx.reset()
|
|
|
|
}
|
|
|
|
|
|
|
|
func (pup *pipeUnpackProcessor) flush() error {
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
|
|
|
type pipeUnpackWriteContext struct {
|
2024-05-24 22:30:58 +00:00
|
|
|
workerID uint
|
2024-05-25 19:36:16 +00:00
|
|
|
ppNext pipeProcessor
|
2024-05-24 22:30:58 +00:00
|
|
|
keepOriginalFields bool
|
|
|
|
skipEmptyResults bool
|
2024-05-22 19:01:20 +00:00
|
|
|
|
|
|
|
brSrc *blockResult
|
|
|
|
csSrc []*blockResultColumn
|
|
|
|
|
|
|
|
rcs []resultColumn
|
|
|
|
br blockResult
|
|
|
|
|
|
|
|
// rowsCount is the number of rows in the current block
|
|
|
|
rowsCount int
|
|
|
|
|
|
|
|
// valuesLen is the total length of values in the current block
|
|
|
|
valuesLen int
|
|
|
|
}
|
|
|
|
|
|
|
|
func (wctx *pipeUnpackWriteContext) reset() {
|
|
|
|
wctx.workerID = 0
|
2024-05-25 19:36:16 +00:00
|
|
|
wctx.ppNext = nil
|
2024-05-24 22:30:58 +00:00
|
|
|
wctx.keepOriginalFields = false
|
2024-06-03 22:59:25 +00:00
|
|
|
wctx.skipEmptyResults = false
|
2024-05-22 19:01:20 +00:00
|
|
|
|
|
|
|
wctx.brSrc = nil
|
|
|
|
wctx.csSrc = nil
|
|
|
|
|
|
|
|
rcs := wctx.rcs
|
|
|
|
for i := range rcs {
|
|
|
|
rcs[i].reset()
|
|
|
|
}
|
|
|
|
wctx.rcs = rcs[:0]
|
|
|
|
|
|
|
|
wctx.rowsCount = 0
|
|
|
|
wctx.valuesLen = 0
|
|
|
|
}
|
|
|
|
|
2024-05-25 19:36:16 +00:00
|
|
|
func (wctx *pipeUnpackWriteContext) init(workerID uint, ppNext pipeProcessor, keepOriginalFields, skipEmptyResults bool, brSrc *blockResult) {
|
2024-05-22 19:01:20 +00:00
|
|
|
wctx.reset()
|
|
|
|
|
|
|
|
wctx.workerID = workerID
|
2024-05-25 19:36:16 +00:00
|
|
|
wctx.ppNext = ppNext
|
2024-05-24 22:30:58 +00:00
|
|
|
wctx.keepOriginalFields = keepOriginalFields
|
|
|
|
wctx.skipEmptyResults = skipEmptyResults
|
2024-05-22 19:01:20 +00:00
|
|
|
|
|
|
|
wctx.brSrc = brSrc
|
|
|
|
wctx.csSrc = brSrc.getColumns()
|
|
|
|
}
|
|
|
|
|
|
|
|
func (wctx *pipeUnpackWriteContext) writeRow(rowIdx int, extraFields []Field) {
|
|
|
|
csSrc := wctx.csSrc
|
|
|
|
rcs := wctx.rcs
|
|
|
|
|
|
|
|
areEqualColumns := len(rcs) == len(csSrc)+len(extraFields)
|
|
|
|
if areEqualColumns {
|
|
|
|
for i, f := range extraFields {
|
|
|
|
if rcs[len(csSrc)+i].name != f.Name {
|
|
|
|
areEqualColumns = false
|
|
|
|
break
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if !areEqualColumns {
|
2024-05-25 19:36:16 +00:00
|
|
|
// send the current block to ppNext and construct a block with new set of columns
|
2024-05-22 19:01:20 +00:00
|
|
|
wctx.flush()
|
|
|
|
|
|
|
|
rcs = wctx.rcs[:0]
|
|
|
|
for _, c := range csSrc {
|
|
|
|
rcs = appendResultColumnWithName(rcs, c.name)
|
|
|
|
}
|
|
|
|
for _, f := range extraFields {
|
|
|
|
rcs = appendResultColumnWithName(rcs, f.Name)
|
|
|
|
}
|
|
|
|
wctx.rcs = rcs
|
|
|
|
}
|
|
|
|
|
|
|
|
brSrc := wctx.brSrc
|
|
|
|
for i, c := range csSrc {
|
|
|
|
v := c.getValueAtRow(brSrc, rowIdx)
|
|
|
|
rcs[i].addValue(v)
|
|
|
|
wctx.valuesLen += len(v)
|
|
|
|
}
|
|
|
|
for i, f := range extraFields {
|
|
|
|
v := f.Value
|
2024-05-24 22:30:58 +00:00
|
|
|
if v == "" && wctx.skipEmptyResults || wctx.keepOriginalFields {
|
|
|
|
idx := getBlockResultColumnIdxByName(csSrc, f.Name)
|
|
|
|
if idx >= 0 {
|
|
|
|
vOrig := csSrc[idx].getValueAtRow(brSrc, rowIdx)
|
|
|
|
if vOrig != "" {
|
|
|
|
v = vOrig
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
2024-05-22 19:01:20 +00:00
|
|
|
rcs[len(csSrc)+i].addValue(v)
|
|
|
|
wctx.valuesLen += len(v)
|
|
|
|
}
|
|
|
|
|
|
|
|
wctx.rowsCount++
|
|
|
|
if wctx.valuesLen >= 1_000_000 {
|
|
|
|
wctx.flush()
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
func (wctx *pipeUnpackWriteContext) flush() {
|
|
|
|
rcs := wctx.rcs
|
|
|
|
|
|
|
|
wctx.valuesLen = 0
|
|
|
|
|
2024-05-25 19:36:16 +00:00
|
|
|
// Flush rcs to ppNext
|
2024-05-22 19:01:20 +00:00
|
|
|
br := &wctx.br
|
|
|
|
br.setResultColumns(rcs, wctx.rowsCount)
|
|
|
|
wctx.rowsCount = 0
|
2024-05-25 19:36:16 +00:00
|
|
|
wctx.ppNext.writeBlock(wctx.workerID, br)
|
2024-05-22 19:01:20 +00:00
|
|
|
br.reset()
|
|
|
|
for i := range rcs {
|
|
|
|
rcs[i].resetValues()
|
|
|
|
}
|
|
|
|
}
|