2019-05-22 21:16:55 +00:00
|
|
|
package storage
|
|
|
|
|
|
|
|
import (
|
|
|
|
"container/heap"
|
|
|
|
"fmt"
|
|
|
|
"io"
|
|
|
|
)
|
|
|
|
|
|
|
|
// blockStreamMerger is used for merging block streams.
|
|
|
|
type blockStreamMerger struct {
|
|
|
|
// The current block to work with.
|
|
|
|
Block *Block
|
|
|
|
|
|
|
|
bsrHeap blockStreamReaderHeap
|
|
|
|
|
2022-10-23 11:30:16 +00:00
|
|
|
// Blocks with smaller timestamps are removed because of retention.
|
|
|
|
retentionDeadline int64
|
|
|
|
|
2019-05-22 21:16:55 +00:00
|
|
|
// Whether the call to NextBlock must be no-op.
|
|
|
|
nextBlockNoop bool
|
|
|
|
|
|
|
|
// The last error
|
|
|
|
err error
|
|
|
|
}
|
|
|
|
|
|
|
|
func (bsm *blockStreamMerger) reset() {
|
|
|
|
bsm.Block = nil
|
2022-10-23 22:16:23 +00:00
|
|
|
|
2019-05-22 21:16:55 +00:00
|
|
|
for i := range bsm.bsrHeap {
|
|
|
|
bsm.bsrHeap[i] = nil
|
|
|
|
}
|
|
|
|
bsm.bsrHeap = bsm.bsrHeap[:0]
|
2022-10-23 22:16:23 +00:00
|
|
|
|
2022-10-23 11:30:16 +00:00
|
|
|
bsm.retentionDeadline = 0
|
2019-05-22 21:16:55 +00:00
|
|
|
bsm.nextBlockNoop = false
|
|
|
|
bsm.err = nil
|
|
|
|
}
|
|
|
|
|
|
|
|
// Init initializes bsm with the given bsrs.
|
2022-10-23 11:30:16 +00:00
|
|
|
func (bsm *blockStreamMerger) Init(bsrs []*blockStreamReader, retentionDeadline int64) {
|
2019-05-22 21:16:55 +00:00
|
|
|
bsm.reset()
|
2022-10-23 11:30:16 +00:00
|
|
|
bsm.retentionDeadline = retentionDeadline
|
2019-05-22 21:16:55 +00:00
|
|
|
for _, bsr := range bsrs {
|
|
|
|
if bsr.NextBlock() {
|
|
|
|
bsm.bsrHeap = append(bsm.bsrHeap, bsr)
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
if err := bsr.Error(); err != nil {
|
2020-06-30 19:58:18 +00:00
|
|
|
bsm.err = fmt.Errorf("cannot obtain the next block to merge: %w", err)
|
2019-05-22 21:16:55 +00:00
|
|
|
return
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
if len(bsm.bsrHeap) == 0 {
|
|
|
|
bsm.err = io.EOF
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
|
|
|
heap.Init(&bsm.bsrHeap)
|
|
|
|
bsm.Block = &bsm.bsrHeap[0].Block
|
|
|
|
bsm.nextBlockNoop = true
|
|
|
|
}
|
|
|
|
|
2022-10-23 23:52:38 +00:00
|
|
|
func (bsm *blockStreamMerger) getRetentionDeadline(bh *blockHeader) int64 {
|
2022-10-23 11:30:16 +00:00
|
|
|
return bsm.retentionDeadline
|
|
|
|
}
|
|
|
|
|
2019-05-22 21:16:55 +00:00
|
|
|
// NextBlock stores the next block in bsm.Block.
|
|
|
|
//
|
|
|
|
// The blocks are sorted by (TDIS, MinTimestamp). Two subsequent blocks
|
|
|
|
// for the same TSID may contain overlapped time ranges.
|
|
|
|
func (bsm *blockStreamMerger) NextBlock() bool {
|
|
|
|
if bsm.err != nil {
|
|
|
|
return false
|
|
|
|
}
|
|
|
|
if bsm.nextBlockNoop {
|
|
|
|
bsm.nextBlockNoop = false
|
|
|
|
return true
|
|
|
|
}
|
|
|
|
|
|
|
|
bsm.err = bsm.nextBlock()
|
|
|
|
switch bsm.err {
|
|
|
|
case nil:
|
|
|
|
return true
|
|
|
|
case io.EOF:
|
|
|
|
return false
|
|
|
|
default:
|
2020-06-30 19:58:18 +00:00
|
|
|
bsm.err = fmt.Errorf("cannot obtain the next block to merge: %w", bsm.err)
|
2019-05-22 21:16:55 +00:00
|
|
|
return false
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
func (bsm *blockStreamMerger) nextBlock() error {
|
|
|
|
bsrMin := bsm.bsrHeap[0]
|
|
|
|
if bsrMin.NextBlock() {
|
|
|
|
heap.Fix(&bsm.bsrHeap, 0)
|
|
|
|
bsm.Block = &bsm.bsrHeap[0].Block
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
|
|
|
if err := bsrMin.Error(); err != nil {
|
2022-01-20 18:11:56 +00:00
|
|
|
bsm.Block = nil
|
2019-05-22 21:16:55 +00:00
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
heap.Pop(&bsm.bsrHeap)
|
|
|
|
|
|
|
|
if len(bsm.bsrHeap) == 0 {
|
2022-01-20 18:11:56 +00:00
|
|
|
bsm.Block = nil
|
2019-05-22 21:16:55 +00:00
|
|
|
return io.EOF
|
|
|
|
}
|
|
|
|
|
|
|
|
bsm.Block = &bsm.bsrHeap[0].Block
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func (bsm *blockStreamMerger) Error() error {
|
|
|
|
if bsm.err == io.EOF {
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
return bsm.err
|
|
|
|
}
|
|
|
|
|
|
|
|
// blockStreamReaderHeap is a slice of block stream readers, which is used
// with container/heap via the Len, Less, Swap, Push and Pop methods
// defined on its pointer type.
type blockStreamReaderHeap []*blockStreamReader
|
|
|
|
|
|
|
|
func (bsrh *blockStreamReaderHeap) Len() int {
|
|
|
|
return len(*bsrh)
|
|
|
|
}
|
|
|
|
|
|
|
|
func (bsrh *blockStreamReaderHeap) Less(i, j int) bool {
|
|
|
|
x := *bsrh
|
|
|
|
a, b := &x[i].Block.bh, &x[j].Block.bh
|
|
|
|
if a.TSID.MetricID == b.TSID.MetricID {
|
|
|
|
// Fast path for identical TSID values.
|
|
|
|
return a.MinTimestamp < b.MinTimestamp
|
|
|
|
}
|
|
|
|
// Slow path for distinct TSID values.
|
|
|
|
return a.TSID.Less(&b.TSID)
|
|
|
|
}
|
|
|
|
|
|
|
|
func (bsrh *blockStreamReaderHeap) Swap(i, j int) {
|
|
|
|
x := *bsrh
|
|
|
|
x[i], x[j] = x[j], x[i]
|
|
|
|
}
|
|
|
|
|
|
|
|
func (bsrh *blockStreamReaderHeap) Push(x interface{}) {
|
|
|
|
*bsrh = append(*bsrh, x.(*blockStreamReader))
|
|
|
|
}
|
|
|
|
|
|
|
|
func (bsrh *blockStreamReaderHeap) Pop() interface{} {
|
|
|
|
a := *bsrh
|
|
|
|
v := a[len(a)-1]
|
|
|
|
*bsrh = a[:len(a)-1]
|
|
|
|
return v
|
|
|
|
}
|