2024-04-25 22:19:58 +00:00
|
|
|
package logstorage
|
|
|
|
|
|
|
|
import (
|
|
|
|
"fmt"
|
|
|
|
)
|
|
|
|
|
|
|
|
type pipe interface {
|
2024-04-26 21:47:50 +00:00
|
|
|
// String returns string representation of the pipe.
|
2024-04-25 22:19:58 +00:00
|
|
|
String() string
|
2024-04-26 21:47:50 +00:00
|
|
|
|
2024-05-09 00:52:28 +00:00
|
|
|
// updateNeededFields must update neededFields and unneededFields with fields it needs and not needs at the input.
|
|
|
|
updateNeededFields(neededFields, unneededFields fieldsSet)
|
2024-05-04 22:28:01 +00:00
|
|
|
|
2024-04-26 21:47:50 +00:00
|
|
|
// newPipeProcessor must return new pipeProcessor for the given ppBase.
|
|
|
|
//
|
|
|
|
// workersCount is the number of goroutine workers, which will call writeBlock() method.
|
|
|
|
//
|
|
|
|
// If stopCh is closed, the returned pipeProcessor must stop performing CPU-intensive tasks which take more than a few milliseconds.
|
|
|
|
// It is OK to continue processing pipeProcessor calls if they take less than a few milliseconds.
|
|
|
|
//
|
2024-04-27 20:08:03 +00:00
|
|
|
// The returned pipeProcessor may call cancel() at any time in order to notify worker goroutines to stop sending new data to pipeProcessor.
|
2024-04-26 21:47:50 +00:00
|
|
|
newPipeProcessor(workersCount int, stopCh <-chan struct{}, cancel func(), ppBase pipeProcessor) pipeProcessor
|
|
|
|
}
|
|
|
|
|
|
|
|
// pipeProcessor must process a single pipe.
|
|
|
|
type pipeProcessor interface {
|
|
|
|
// writeBlock must write the given block of data to the given pipeProcessor.
|
|
|
|
//
|
2024-04-27 20:08:03 +00:00
|
|
|
// writeBlock is called concurrently from worker goroutines.
|
|
|
|
// The workerID is the id of the worker goroutine, which calls the writeBlock.
|
2024-04-26 21:47:50 +00:00
|
|
|
// It is in the range 0 ... workersCount-1 .
|
|
|
|
//
|
2024-04-30 23:19:22 +00:00
|
|
|
// It is OK to modify br contents inside writeBlock. The caller mustn't rely on br contents after writeBlock call.
|
|
|
|
// It is forbidden to hold references to br after returning from writeBlock, since the caller may re-use it.
|
2024-04-27 20:08:03 +00:00
|
|
|
//
|
|
|
|
// If any error occurs at writeBlock, then cancel() must be called by pipeProcessor in order to notify worker goroutines
|
|
|
|
// to stop sending new data. The occurred error must be returned from flush().
|
|
|
|
//
|
|
|
|
// cancel() may be called also when the pipeProcessor decides to stop accepting new data, even if there is no any error.
|
2024-04-30 21:03:34 +00:00
|
|
|
writeBlock(workerID uint, br *blockResult)
|
2024-04-26 21:47:50 +00:00
|
|
|
|
|
|
|
// flush must flush all the data accumulated in the pipeProcessor to the base pipeProcessor.
|
|
|
|
//
|
2024-04-27 20:08:03 +00:00
|
|
|
// flush is called after all the worker goroutines are stopped.
|
|
|
|
//
|
|
|
|
// It is guaranteed that flush() is called for every pipeProcessor returned from pipe.newPipeProcessor().
|
|
|
|
flush() error
|
2024-04-26 21:47:50 +00:00
|
|
|
}
|
|
|
|
|
2024-04-30 21:03:34 +00:00
|
|
|
// defaultPipeProcessor adapts a plain function to the pipeProcessor interface:
// its writeBlock method calls the function, while its flush method does nothing and returns nil.
type defaultPipeProcessor func(workerID uint, br *blockResult)
|
2024-04-26 21:47:50 +00:00
|
|
|
|
2024-04-30 21:03:34 +00:00
|
|
|
func newDefaultPipeProcessor(writeBlock func(workerID uint, br *blockResult)) pipeProcessor {
|
2024-04-26 21:47:50 +00:00
|
|
|
return defaultPipeProcessor(writeBlock)
|
|
|
|
}
|
|
|
|
|
2024-04-30 21:03:34 +00:00
|
|
|
func (dpp defaultPipeProcessor) writeBlock(workerID uint, br *blockResult) {
|
|
|
|
dpp(workerID, br)
|
2024-04-26 21:47:50 +00:00
|
|
|
}
|
|
|
|
|
2024-04-27 20:08:03 +00:00
|
|
|
func (dpp defaultPipeProcessor) flush() error {
|
|
|
|
return nil
|
2024-04-25 22:19:58 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
func parsePipes(lex *lexer) ([]pipe, error) {
|
|
|
|
var pipes []pipe
|
2024-04-26 23:53:32 +00:00
|
|
|
for !lex.isKeyword(")", "") {
|
2024-04-25 22:19:58 +00:00
|
|
|
if !lex.isKeyword("|") {
|
2024-05-15 00:45:43 +00:00
|
|
|
return nil, fmt.Errorf("expecting '|'; got %q", lex.token)
|
2024-04-25 22:19:58 +00:00
|
|
|
}
|
|
|
|
if !lex.mustNextToken() {
|
|
|
|
return nil, fmt.Errorf("missing token after '|'")
|
|
|
|
}
|
|
|
|
switch {
|
2024-05-18 10:33:34 +00:00
|
|
|
case lex.isKeyword("copy", "cp"):
|
|
|
|
pc, err := parsePipeCopy(lex)
|
2024-04-25 22:19:58 +00:00
|
|
|
if err != nil {
|
2024-05-18 10:33:34 +00:00
|
|
|
return nil, fmt.Errorf("cannot parse 'copy' pipe: %w", err)
|
2024-04-25 22:19:58 +00:00
|
|
|
}
|
2024-05-18 10:33:34 +00:00
|
|
|
pipes = append(pipes, pc)
|
|
|
|
case lex.isKeyword("delete", "del", "rm"):
|
|
|
|
pd, err := parsePipeDelete(lex)
|
2024-05-06 16:33:35 +00:00
|
|
|
if err != nil {
|
2024-05-18 10:33:34 +00:00
|
|
|
return nil, fmt.Errorf("cannot parse 'delete' pipe: %w", err)
|
2024-05-06 16:33:35 +00:00
|
|
|
}
|
2024-05-18 10:33:34 +00:00
|
|
|
pipes = append(pipes, pd)
|
2024-05-18 19:40:02 +00:00
|
|
|
case lex.isKeyword("field_names"):
|
|
|
|
pf, err := parsePipeFieldNames(lex)
|
|
|
|
if err != nil {
|
|
|
|
return nil, fmt.Errorf("cannot parse 'field_names' pipe: %w", err)
|
|
|
|
}
|
|
|
|
pipes = append(pipes, pf)
|
2024-05-18 10:33:34 +00:00
|
|
|
case lex.isKeyword("fields"):
|
|
|
|
pf, err := parsePipeFields(lex)
|
2024-05-11 06:01:31 +00:00
|
|
|
if err != nil {
|
2024-05-18 10:33:34 +00:00
|
|
|
return nil, fmt.Errorf("cannot parse 'fields' pipe: %w", err)
|
2024-05-11 06:01:31 +00:00
|
|
|
}
|
2024-05-18 10:33:34 +00:00
|
|
|
pipes = append(pipes, pf)
|
|
|
|
case lex.isKeyword("filter"):
|
|
|
|
pf, err := parsePipeFilter(lex)
|
|
|
|
if err != nil {
|
|
|
|
return nil, fmt.Errorf("cannot parse 'filter' pipe: %w", err)
|
|
|
|
}
|
|
|
|
pipes = append(pipes, pf)
|
2024-05-05 10:43:38 +00:00
|
|
|
case lex.isKeyword("limit", "head"):
|
|
|
|
pl, err := parsePipeLimit(lex)
|
2024-04-27 00:50:19 +00:00
|
|
|
if err != nil {
|
2024-05-05 10:43:38 +00:00
|
|
|
return nil, fmt.Errorf("cannot parse 'limit' pipe: %w", err)
|
2024-04-27 00:50:19 +00:00
|
|
|
}
|
2024-05-05 10:43:38 +00:00
|
|
|
pipes = append(pipes, pl)
|
|
|
|
case lex.isKeyword("offset", "skip"):
|
|
|
|
ps, err := parsePipeOffset(lex)
|
2024-04-27 01:14:00 +00:00
|
|
|
if err != nil {
|
2024-05-05 10:43:38 +00:00
|
|
|
return nil, fmt.Errorf("cannot parse 'offset' pipe: %w", err)
|
2024-04-27 01:14:00 +00:00
|
|
|
}
|
2024-04-29 01:30:25 +00:00
|
|
|
pipes = append(pipes, ps)
|
2024-05-05 10:43:38 +00:00
|
|
|
case lex.isKeyword("rename", "mv"):
|
2024-05-04 22:28:01 +00:00
|
|
|
pr, err := parsePipeRename(lex)
|
|
|
|
if err != nil {
|
|
|
|
return nil, fmt.Errorf("cannot parse 'rename' pipe: %w", err)
|
|
|
|
}
|
|
|
|
pipes = append(pipes, pr)
|
2024-05-18 10:33:34 +00:00
|
|
|
case lex.isKeyword("sort"):
|
|
|
|
ps, err := parsePipeSort(lex)
|
2024-05-04 22:28:01 +00:00
|
|
|
if err != nil {
|
2024-05-18 10:33:34 +00:00
|
|
|
return nil, fmt.Errorf("cannot parse 'sort' pipe: %w", err)
|
2024-05-04 22:28:01 +00:00
|
|
|
}
|
2024-05-18 10:33:34 +00:00
|
|
|
pipes = append(pipes, ps)
|
|
|
|
case lex.isKeyword("stats"):
|
|
|
|
ps, err := parsePipeStats(lex)
|
|
|
|
if err != nil {
|
|
|
|
return nil, fmt.Errorf("cannot parse 'stats' pipe: %w", err)
|
|
|
|
}
|
|
|
|
pipes = append(pipes, ps)
|
|
|
|
case lex.isKeyword("uniq"):
|
|
|
|
pu, err := parsePipeUniq(lex)
|
|
|
|
if err != nil {
|
|
|
|
return nil, fmt.Errorf("cannot parse 'uniq' pipe: %w", err)
|
|
|
|
}
|
|
|
|
pipes = append(pipes, pu)
|
2024-04-25 22:19:58 +00:00
|
|
|
default:
|
|
|
|
return nil, fmt.Errorf("unexpected pipe %q", lex.token)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return pipes, nil
|
|
|
|
}
|