VictoriaMetrics/lib/logstorage/pipe_join.go

package logstorage

import (
	"fmt"
	"slices"
	"unsafe"

	"github.com/VictoriaMetrics/VictoriaMetrics/lib/slicesutil"
)

// pipeJoin processes '| join ...' pipe.
//
// See https://docs.victoriametrics.com/victorialogs/logsql/#join-pipe
type pipeJoin struct {
	// byFields contains fields to use for join on q results
	byFields []string

	// q is a query for obtaining results for joining
	q *Query

	// m contains results for joining. They are automatically initialized during query execution
	m map[string][][]Field
}

func (pj *pipeJoin) String() string {
	return fmt.Sprintf("join by (%s) (%s)", fieldNamesString(pj.byFields), pj.q.String())
}

func (pj *pipeJoin) canLiveTail() bool {
	return true
}

func (pj *pipeJoin) optimize() {
	pj.q.Optimize()
}

func (pj *pipeJoin) hasFilterInWithQuery() bool {
	return false
}

func (pj *pipeJoin) initFilterInValues(_ map[string][]string, _ getFieldValuesFunc) (pipe, error) {
	return pj, nil
}

func (pj *pipeJoin) initJoinMap(getJoinMapFunc getJoinMapFunc) (pipe, error) {
	m, err := getJoinMapFunc(pj.q, pj.byFields)
	if err != nil {
		return nil, fmt.Errorf("cannot execute query at pipe [%s]: %w", pj, err)
	}
	pjNew := *pj
	pjNew.m = m
	return &pjNew, nil
}

func (pj *pipeJoin) updateNeededFields(neededFields, unneededFields fieldsSet) {
	if neededFields.contains("*") {
		unneededFields.removeFields(pj.byFields)
	} else {
		neededFields.addFields(pj.byFields)
	}
}

func (pj *pipeJoin) newPipeProcessor(workersCount int, stopCh <-chan struct{}, _ func(), ppNext pipeProcessor) pipeProcessor {
	return &pipeJoinProcessor{
		pj:     pj,
		stopCh: stopCh,
		ppNext: ppNext,

		shards: make([]pipeJoinProcessorShard, workersCount),
	}
}

type pipeJoinProcessor struct {
	pj     *pipeJoin
	stopCh <-chan struct{}
	ppNext pipeProcessor

	shards []pipeJoinProcessorShard
}

type pipeJoinProcessorShard struct {
	pipeJoinProcessorShardNopad

	// The padding prevents false sharing on widespread platforms with 128 mod (cache line size) = 0 .
	_ [128 - unsafe.Sizeof(pipeJoinProcessorShardNopad{})%128]byte
}

type pipeJoinProcessorShardNopad struct {
	wctx pipeUnpackWriteContext

	byValues []string
	tmpBuf   []byte
}

func (pjp *pipeJoinProcessor) writeBlock(workerID uint, br *blockResult) {
	if br.rowsLen == 0 {
		return
	}

	pj := pjp.pj
	shard := &pjp.shards[workerID]
	shard.wctx.init(workerID, pjp.ppNext, true, true, br)

	shard.byValues = slicesutil.SetLength(shard.byValues, len(pj.byFields))
	byValues := shard.byValues

	cs := br.getColumns()
	for rowIdx := 0; rowIdx < br.rowsLen; rowIdx++ {
		clear(byValues)
		for i := range cs {
			name := cs[i].name
			if cIdx := slices.Index(pj.byFields, name); cIdx >= 0 {
				byValues[cIdx] = cs[i].getValueAtRow(br, rowIdx)
			}
		}

		shard.tmpBuf = marshalStrings(shard.tmpBuf[:0], byValues)
		matchingRows := pj.m[string(shard.tmpBuf)]

		if len(matchingRows) == 0 {
			shard.wctx.writeRow(rowIdx, nil)
			continue
		}
		for _, extraFields := range matchingRows {
			if needStop(pjp.stopCh) {
				return
			}
			shard.wctx.writeRow(rowIdx, extraFields)
		}
	}

	shard.wctx.flush()
	shard.wctx.reset()
}

func (pjp *pipeJoinProcessor) flush() error {
	return nil
}

func parsePipeJoin(lex *lexer) (*pipeJoin, error) {
	if !lex.isKeyword("join") {
		return nil, fmt.Errorf("unexpected token: %q; want %q", lex.token, "join")
	}
	lex.nextToken()

	// parse by (...)
	if lex.isKeyword("by", "on") {
		lex.nextToken()
	}

	byFields, err := parseFieldNamesInParens(lex)
	if err != nil {
		return nil, fmt.Errorf("cannot parse 'by(...)' at 'join': %w", err)
	}
	if len(byFields) == 0 {
		return nil, fmt.Errorf("'by(...)' at 'join' must contain at least a single field")
	}
	if slices.Contains(byFields, "*") {
		return nil, fmt.Errorf("join by '*' isn't supported")
	}

	// Parse join query
	if !lex.isKeyword("(") {
		return nil, fmt.Errorf("missing '(' in front of join query")
	}
	lex.nextToken()

	q, err := parseQuery(lex)
	if err != nil {
		return nil, fmt.Errorf("cannot parse join query: %w", err)
	}

	if !lex.isKeyword(")") {
		return nil, fmt.Errorf("missing ')' after the join query [%s]", q)
	}
	lex.nextToken()

	pj := &pipeJoin{
		byFields: byFields,
		q:        q,
	}

	return pj, nil
}
lib/logstorage: add `join` pipe for joining multiple query results (cherry picked from commit f9e23bf8e3c4a3db57a095aabbd80c57de39d652) 2024-11-06 13:22:13 +00:00			`package logstorage`

			`import (`
			`"fmt"`
			`"slices"`
			`"unsafe"`

			`"github.com/VictoriaMetrics/VictoriaMetrics/lib/slicesutil"`
			`)`

			`// pipeJoin processes '\| join ...' pipe.`
			`//`
			`// See https://docs.victoriametrics.com/victorialogs/logsql/#join-pipe`
			`type pipeJoin struct {`
			`// byFields contains fields to use for join on q results`
			`byFields []string`

			`// q is a query for obtaining results for joining`
			`q *Query`

			`// m contains results for joining. They are automatically initialized during query execution`
			`m map[string][][]Field`
			`}`

			`func (pj *pipeJoin) String() string {`
			`return fmt.Sprintf("join by (%s) (%s)", fieldNamesString(pj.byFields), pj.q.String())`
			`}`

			`func (pj *pipeJoin) canLiveTail() bool {`
			`return true`
			`}`

			`func (pj *pipeJoin) optimize() {`
			`pj.q.Optimize()`
			`}`

			`func (pj *pipeJoin) hasFilterInWithQuery() bool {`
			`return false`
			`}`

lib/logstorage: add `block_stats` pipe for analyzing per-block storage stats (cherry picked from commit 5ed54ebadfeaef23775083507999f056e7b23ef2) 2024-11-06 17:07:52 +00:00			`func (pj *pipeJoin) initFilterInValues(_ map[string][]string, _ getFieldValuesFunc) (pipe, error) {`
lib/logstorage: add `join` pipe for joining multiple query results (cherry picked from commit f9e23bf8e3c4a3db57a095aabbd80c57de39d652) 2024-11-06 13:22:13 +00:00			`return pj, nil`
			`}`

			`func (pj *pipeJoin) initJoinMap(getJoinMapFunc getJoinMapFunc) (pipe, error) {`
			`m, err := getJoinMapFunc(pj.q, pj.byFields)`
			`if err != nil {`
			`return nil, fmt.Errorf("cannot execute query at pipe [%s]: %w", pj, err)`
			`}`
			`pjNew := *pj`
			`pjNew.m = m`
			`return &pjNew, nil`
			`}`

			`func (pj *pipeJoin) updateNeededFields(neededFields, unneededFields fieldsSet) {`
			`if neededFields.contains("*") {`
			`unneededFields.removeFields(pj.byFields)`
			`} else {`
			`neededFields.addFields(pj.byFields)`
			`}`
			`}`

			`func (pj *pipeJoin) newPipeProcessor(workersCount int, stopCh <-chan struct{}, _ func(), ppNext pipeProcessor) pipeProcessor {`
			`return &pipeJoinProcessor{`
			`pj: pj,`
			`stopCh: stopCh,`
			`ppNext: ppNext,`

			`shards: make([]pipeJoinProcessorShard, workersCount),`
			`}`
			`}`

			`type pipeJoinProcessor struct {`
			`pj *pipeJoin`
			`stopCh <-chan struct{}`
			`ppNext pipeProcessor`

			`shards []pipeJoinProcessorShard`
			`}`

			`type pipeJoinProcessorShard struct {`
			`pipeJoinProcessorShardNopad`

			`// The padding prevents false sharing on widespread platforms with 128 mod (cache line size) = 0 .`
			`_ [128 - unsafe.Sizeof(pipeJoinProcessorShardNopad{})%128]byte`
			`}`

			`type pipeJoinProcessorShardNopad struct {`
			`wctx pipeUnpackWriteContext`

			`byValues []string`
			`tmpBuf []byte`
			`}`

			`func (pjp pipeJoinProcessor) writeBlock(workerID uint, br blockResult) {`
			`if br.rowsLen == 0 {`
			`return`
			`}`

			`pj := pjp.pj`
			`shard := &pjp.shards[workerID]`
			`shard.wctx.init(workerID, pjp.ppNext, true, true, br)`

			`shard.byValues = slicesutil.SetLength(shard.byValues, len(pj.byFields))`
			`byValues := shard.byValues`

			`cs := br.getColumns()`
			`for rowIdx := 0; rowIdx < br.rowsLen; rowIdx++ {`
			`clear(byValues)`
			`for i := range cs {`
			`name := cs[i].name`
			`if cIdx := slices.Index(pj.byFields, name); cIdx >= 0 {`
			`byValues[cIdx] = cs[i].getValueAtRow(br, rowIdx)`
			`}`
			`}`

			`shard.tmpBuf = marshalStrings(shard.tmpBuf[:0], byValues)`
			`matchingRows := pj.m[string(shard.tmpBuf)]`

			`if len(matchingRows) == 0 {`
			`shard.wctx.writeRow(rowIdx, nil)`
			`continue`
			`}`
			`for _, extraFields := range matchingRows {`
lib/logstorage: add `block_stats` pipe for analyzing per-block storage stats (cherry picked from commit 5ed54ebadfeaef23775083507999f056e7b23ef2) 2024-11-06 17:07:52 +00:00			`if needStop(pjp.stopCh) {`
			`return`
			`}`
lib/logstorage: add `join` pipe for joining multiple query results (cherry picked from commit f9e23bf8e3c4a3db57a095aabbd80c57de39d652) 2024-11-06 13:22:13 +00:00			`shard.wctx.writeRow(rowIdx, extraFields)`
			`}`
			`}`

			`shard.wctx.flush()`
			`shard.wctx.reset()`
			`}`

			`func (pjp *pipeJoinProcessor) flush() error {`
			`return nil`
			`}`

			`func parsePipeJoin(lex lexer) (pipeJoin, error) {`
			`if !lex.isKeyword("join") {`
			`return nil, fmt.Errorf("unexpected token: %q; want %q", lex.token, "join")`
			`}`
			`lex.nextToken()`

			`// parse by (...)`
			`if lex.isKeyword("by", "on") {`
			`lex.nextToken()`
			`}`

			`byFields, err := parseFieldNamesInParens(lex)`
			`if err != nil {`
			`return nil, fmt.Errorf("cannot parse 'by(...)' at 'join': %w", err)`
			`}`
			`if len(byFields) == 0 {`
			`return nil, fmt.Errorf("'by(...)' at 'join' must contain at least a single field")`
			`}`
			`if slices.Contains(byFields, "*") {`
			`return nil, fmt.Errorf("join by '*' isn't supported")`
			`}`

			`// Parse join query`
			`if !lex.isKeyword("(") {`
			`return nil, fmt.Errorf("missing '(' in front of join query")`
			`}`
			`lex.nextToken()`

			`q, err := parseQuery(lex)`
			`if err != nil {`
			`return nil, fmt.Errorf("cannot parse join query: %w", err)`
			`}`

			`if !lex.isKeyword(")") {`
			`return nil, fmt.Errorf("missing ')' after the join query [%s]", q)`
			`}`
			`lex.nextToken()`

			`pj := &pipeJoin{`
			`byFields: byFields,`
			`q: q,`
			`}`

			`return pj, nil`
			`}`