mirror of
https://github.com/VictoriaMetrics/VictoriaMetrics.git
synced 2025-01-20 15:16:42 +00:00
wip
This commit is contained in:
parent
ff2b6fbe35
commit
12fe2b265c
4 changed files with 77 additions and 17 deletions
|
@ -1128,6 +1128,7 @@ By default rows are selected in arbitrary order because of performance reasons,
|
||||||
|
|
||||||
See also:
|
See also:
|
||||||
|
|
||||||
|
- [`sort` pipe](#sort-pipe)
|
||||||
- [`offset` pipe](#offset-pipe)
|
- [`offset` pipe](#offset-pipe)
|
||||||
|
|
||||||
### offset pipe
|
### offset pipe
|
||||||
|
@ -1147,6 +1148,7 @@ Rows can be sorted with [`sort` pipe](#sort-pipe).
|
||||||
See also:
|
See also:
|
||||||
|
|
||||||
- [`limit` pipe](#limit-pipe)
|
- [`limit` pipe](#limit-pipe)
|
||||||
|
- [`sort` pipe](#sort-pipe)
|
||||||
|
|
||||||
### rename pipe
|
### rename pipe
|
||||||
|
|
||||||
|
@ -1208,6 +1210,14 @@ for the `request_duration` [field](https://docs.victoriametrics.com/VictoriaLogs
|
||||||
_time:1h | sort by (request_duration desc) limit 10
|
_time:1h | sort by (request_duration desc) limit 10
|
||||||
```
|
```
|
||||||
|
|
||||||
|
If the first `N` sorted results must be skipped, then `offset N` can be added to `sort` pipe. For example,
|
||||||
|
the following query skips the first 10 logs with the biggest `request_duration` [field](https://docs.victoriametrics.com/VictoriaLogs/keyConcepts.html#data-model),
|
||||||
|
and then returns the next 20 sorted logs for the last 5 minutes:
|
||||||
|
|
||||||
|
```logsql
|
||||||
|
_time:1h | sort by (request_duration desc) offset 10 limit 20
|
||||||
|
```
|
||||||
|
|
||||||
Note that sorting of big number of logs can be slow and can consume a lot of additional memory.
|
Note that sorting of big number of logs can be slow and can consume a lot of additional memory.
|
||||||
It is recommended limiting the number of logs before sorting with the following approaches:
|
It is recommended limiting the number of logs before sorting with the following approaches:
|
||||||
|
|
||||||
|
|
|
@ -975,9 +975,14 @@ func TestParseQuerySuccess(t *testing.T) {
|
||||||
f(`* | sORt bY (_time, _stream DEsc, host)`, `* | sort by (_time, _stream desc, host)`)
|
f(`* | sORt bY (_time, _stream DEsc, host)`, `* | sort by (_time, _stream desc, host)`)
|
||||||
f(`* | sort bY (foo desc, bar,) desc`, `* | sort by (foo desc, bar) desc`)
|
f(`* | sort bY (foo desc, bar,) desc`, `* | sort by (foo desc, bar) desc`)
|
||||||
f(`* | sort limit 10`, `* | sort limit 10`)
|
f(`* | sort limit 10`, `* | sort limit 10`)
|
||||||
|
f(`* | sort offset 20 limit 10`, `* | sort offset 20 limit 10`)
|
||||||
f(`* | sort desc limit 10`, `* | sort desc limit 10`)
|
f(`* | sort desc limit 10`, `* | sort desc limit 10`)
|
||||||
|
f(`* | sort desc offset 20 limit 10`, `* | sort desc offset 20 limit 10`)
|
||||||
f(`* | sort by (foo desc, bar) limit 10`, `* | sort by (foo desc, bar) limit 10`)
|
f(`* | sort by (foo desc, bar) limit 10`, `* | sort by (foo desc, bar) limit 10`)
|
||||||
|
f(`* | sort by (foo desc, bar) oFFset 20 limit 10`, `* | sort by (foo desc, bar) offset 20 limit 10`)
|
||||||
f(`* | sort by (foo desc, bar) desc limit 10`, `* | sort by (foo desc, bar) desc limit 10`)
|
f(`* | sort by (foo desc, bar) desc limit 10`, `* | sort by (foo desc, bar) desc limit 10`)
|
||||||
|
f(`* | sort by (foo desc, bar) desc OFFSET 30 limit 10`, `* | sort by (foo desc, bar) desc offset 30 limit 10`)
|
||||||
|
f(`* | sort by (foo desc, bar) desc limit 10 OFFSET 30`, `* | sort by (foo desc, bar) desc offset 30 limit 10`)
|
||||||
|
|
||||||
// uniq pipe
|
// uniq pipe
|
||||||
f(`* | uniq`, `* | uniq`)
|
f(`* | uniq`, `* | uniq`)
|
||||||
|
@ -1338,6 +1343,12 @@ func TestParseQueryFailure(t *testing.T) {
|
||||||
f(`foo | sort by(bar) limit foo`)
|
f(`foo | sort by(bar) limit foo`)
|
||||||
f(`foo | sort by(bar) limit -1234`)
|
f(`foo | sort by(bar) limit -1234`)
|
||||||
f(`foo | sort by(bar) limit 12.34`)
|
f(`foo | sort by(bar) limit 12.34`)
|
||||||
|
f(`foo | sort by(bar) limit 10 limit 20`)
|
||||||
|
f(`foo | sort by(bar) offset`)
|
||||||
|
f(`foo | sort by(bar) offset limit`)
|
||||||
|
f(`foo | sort by(bar) offset -1234`)
|
||||||
|
f(`foo | sort by(bar) offset 12.34`)
|
||||||
|
f(`foo | sort by(bar) offset 10 offset 20`)
|
||||||
|
|
||||||
// invalid uniq pipe
|
// invalid uniq pipe
|
||||||
f(`foo | uniq bar`)
|
f(`foo | uniq bar`)
|
||||||
|
|
|
@ -26,6 +26,9 @@ type pipeSort struct {
|
||||||
// whether to apply descending order
|
// whether to apply descending order
|
||||||
isDesc bool
|
isDesc bool
|
||||||
|
|
||||||
|
// how many results to skip
|
||||||
|
offset uint64
|
||||||
|
|
||||||
// how many results to return
|
// how many results to return
|
||||||
//
|
//
|
||||||
// if zero, then all the results are returned
|
// if zero, then all the results are returned
|
||||||
|
@ -44,6 +47,9 @@ func (ps *pipeSort) String() string {
|
||||||
if ps.isDesc {
|
if ps.isDesc {
|
||||||
s += " desc"
|
s += " desc"
|
||||||
}
|
}
|
||||||
|
if ps.offset > 0 {
|
||||||
|
s += fmt.Sprintf(" offset %d", ps.offset)
|
||||||
|
}
|
||||||
if ps.limit > 0 {
|
if ps.limit > 0 {
|
||||||
s += fmt.Sprintf(" limit %d", ps.limit)
|
s += fmt.Sprintf(" limit %d", ps.limit)
|
||||||
}
|
}
|
||||||
|
@ -470,16 +476,25 @@ type pipeSortWriteContext struct {
|
||||||
rcs []resultColumn
|
rcs []resultColumn
|
||||||
br blockResult
|
br blockResult
|
||||||
|
|
||||||
valuesLen int
|
rowsWritten uint64
|
||||||
|
valuesLen int
|
||||||
}
|
}
|
||||||
|
|
||||||
func (wctx *pipeSortWriteContext) writeNextRow(shard *pipeSortProcessorShard) {
|
func (wctx *pipeSortWriteContext) writeNextRow(shard *pipeSortProcessorShard) {
|
||||||
|
ps := shard.ps
|
||||||
|
|
||||||
rowIdx := shard.rowRefNext
|
rowIdx := shard.rowRefNext
|
||||||
shard.rowRefNext++
|
shard.rowRefNext++
|
||||||
|
|
||||||
|
wctx.rowsWritten++
|
||||||
|
if wctx.rowsWritten <= ps.offset {
|
||||||
|
return
|
||||||
|
}
|
||||||
|
|
||||||
rr := shard.rowRefs[rowIdx]
|
rr := shard.rowRefs[rowIdx]
|
||||||
b := &shard.blocks[rr.blockIdx]
|
b := &shard.blocks[rr.blockIdx]
|
||||||
|
|
||||||
byFields := shard.ps.byFields
|
byFields := ps.byFields
|
||||||
rcs := wctx.rcs
|
rcs := wctx.rcs
|
||||||
|
|
||||||
areEqualColumns := len(rcs) == len(byFields)+len(b.otherColumns)
|
areEqualColumns := len(rcs) == len(byFields)+len(b.otherColumns)
|
||||||
|
@ -688,18 +703,36 @@ func parsePipeSort(lex *lexer) (*pipeSort, error) {
|
||||||
ps.isDesc = true
|
ps.isDesc = true
|
||||||
}
|
}
|
||||||
|
|
||||||
switch {
|
for {
|
||||||
case lex.isKeyword("limit"):
|
switch {
|
||||||
lex.nextToken()
|
case lex.isKeyword("offset"):
|
||||||
n, ok := tryParseUint64(lex.token)
|
lex.nextToken()
|
||||||
lex.nextToken()
|
s := lex.token
|
||||||
if !ok {
|
n, ok := tryParseUint64(s)
|
||||||
return nil, fmt.Errorf("cannot parse 'limit %s'", lex.token)
|
lex.nextToken()
|
||||||
|
if !ok {
|
||||||
|
return nil, fmt.Errorf("cannot parse 'offset %s'", s)
|
||||||
|
}
|
||||||
|
if ps.offset > 0 {
|
||||||
|
return nil, fmt.Errorf("duplicate 'offset'; the previous one is %d; the new one is %s", ps.offset, s)
|
||||||
|
}
|
||||||
|
ps.offset = n
|
||||||
|
case lex.isKeyword("limit"):
|
||||||
|
lex.nextToken()
|
||||||
|
s := lex.token
|
||||||
|
n, ok := tryParseUint64(s)
|
||||||
|
lex.nextToken()
|
||||||
|
if !ok {
|
||||||
|
return nil, fmt.Errorf("cannot parse 'limit %s'", s)
|
||||||
|
}
|
||||||
|
if ps.limit > 0 {
|
||||||
|
return nil, fmt.Errorf("duplicate 'limit'; the previous one is %d; the new one is %s", ps.limit, s)
|
||||||
|
}
|
||||||
|
ps.limit = n
|
||||||
|
default:
|
||||||
|
return &ps, nil
|
||||||
}
|
}
|
||||||
ps.limit = n
|
|
||||||
}
|
}
|
||||||
|
|
||||||
return &ps, nil
|
|
||||||
}
|
}
|
||||||
|
|
||||||
// bySortField represents 'by (...)' part of the pipeSort.
|
// bySortField represents 'by (...)' part of the pipeSort.
|
||||||
|
|
|
@ -410,16 +410,22 @@ type pipeTopkWriteContext struct {
|
||||||
}
|
}
|
||||||
|
|
||||||
func (wctx *pipeTopkWriteContext) writeNextRow(shard *pipeTopkProcessorShard) bool {
|
func (wctx *pipeTopkWriteContext) writeNextRow(shard *pipeTopkProcessorShard) bool {
|
||||||
if wctx.rowsWritten >= wctx.ptp.ps.limit {
|
ps := shard.ps
|
||||||
return false
|
|
||||||
}
|
|
||||||
wctx.rowsWritten++
|
|
||||||
|
|
||||||
rowIdx := shard.rowNext
|
rowIdx := shard.rowNext
|
||||||
shard.rowNext++
|
shard.rowNext++
|
||||||
|
|
||||||
|
wctx.rowsWritten++
|
||||||
|
if wctx.rowsWritten <= ps.offset {
|
||||||
|
return true
|
||||||
|
}
|
||||||
|
if wctx.rowsWritten > ps.offset+ps.limit {
|
||||||
|
return false
|
||||||
|
}
|
||||||
|
|
||||||
r := shard.rows[rowIdx]
|
r := shard.rows[rowIdx]
|
||||||
|
|
||||||
byFields := shard.ps.byFields
|
byFields := ps.byFields
|
||||||
rcs := wctx.rcs
|
rcs := wctx.rcs
|
||||||
|
|
||||||
areEqualColumns := len(rcs) == len(byFields)+len(r.otherColumns)
|
areEqualColumns := len(rcs) == len(byFields)+len(r.otherColumns)
|
||||||
|
|
Loading…
Reference in a new issue