2019-05-22 21:16:55 +00:00
|
|
|
package mergeset
|
|
|
|
|
|
|
|
import (
|
|
|
|
"fmt"
|
|
|
|
"sort"
|
2021-02-21 19:18:49 +00:00
|
|
|
"unsafe"
|
2019-05-22 21:16:55 +00:00
|
|
|
|
|
|
|
"github.com/VictoriaMetrics/VictoriaMetrics/lib/encoding"
|
|
|
|
"github.com/VictoriaMetrics/VictoriaMetrics/lib/logger"
|
|
|
|
)
|
|
|
|
|
|
|
|
type blockHeader struct {
|
|
|
|
// common prefix for all the items in the block.
|
|
|
|
commonPrefix []byte
|
|
|
|
|
|
|
|
// The first item.
|
|
|
|
firstItem []byte
|
|
|
|
|
2022-11-15 14:30:51 +00:00
|
|
|
// Whether commonPrefix and firstItem point to external data.
|
|
|
|
noCopy bool
|
|
|
|
|
2019-05-22 21:16:55 +00:00
|
|
|
// Marshal type used for block compression.
|
|
|
|
marshalType marshalType
|
|
|
|
|
|
|
|
// The number of items in the block, excluding the first item.
|
|
|
|
itemsCount uint32
|
|
|
|
|
|
|
|
// The offset of the items block.
|
|
|
|
itemsBlockOffset uint64
|
|
|
|
|
|
|
|
// The offset of the lens block.
|
|
|
|
lensBlockOffset uint64
|
|
|
|
|
|
|
|
// The size of the items block.
|
|
|
|
itemsBlockSize uint32
|
|
|
|
|
|
|
|
// The size of the lens block.
|
|
|
|
lensBlockSize uint32
|
|
|
|
}
|
|
|
|
|
2021-02-21 19:18:49 +00:00
|
|
|
func (bh *blockHeader) SizeBytes() int {
|
|
|
|
return int(unsafe.Sizeof(*bh)) + cap(bh.commonPrefix) + cap(bh.firstItem)
|
|
|
|
}
|
|
|
|
|
2019-05-22 21:16:55 +00:00
|
|
|
func (bh *blockHeader) Reset() {
|
2022-11-15 14:30:51 +00:00
|
|
|
if bh.noCopy {
|
|
|
|
bh.commonPrefix = nil
|
|
|
|
bh.firstItem = nil
|
|
|
|
} else {
|
|
|
|
bh.commonPrefix = bh.commonPrefix[:0]
|
|
|
|
bh.firstItem = bh.firstItem[:0]
|
|
|
|
}
|
2019-05-22 21:16:55 +00:00
|
|
|
bh.marshalType = marshalTypePlain
|
|
|
|
bh.itemsCount = 0
|
|
|
|
bh.itemsBlockOffset = 0
|
|
|
|
bh.lensBlockOffset = 0
|
|
|
|
bh.itemsBlockSize = 0
|
|
|
|
bh.lensBlockSize = 0
|
|
|
|
}
|
|
|
|
|
|
|
|
func (bh *blockHeader) Marshal(dst []byte) []byte {
|
|
|
|
dst = encoding.MarshalBytes(dst, bh.commonPrefix)
|
|
|
|
dst = encoding.MarshalBytes(dst, bh.firstItem)
|
|
|
|
dst = append(dst, byte(bh.marshalType))
|
|
|
|
dst = encoding.MarshalUint32(dst, bh.itemsCount)
|
|
|
|
dst = encoding.MarshalUint64(dst, bh.itemsBlockOffset)
|
|
|
|
dst = encoding.MarshalUint64(dst, bh.lensBlockOffset)
|
|
|
|
dst = encoding.MarshalUint32(dst, bh.itemsBlockSize)
|
|
|
|
dst = encoding.MarshalUint32(dst, bh.lensBlockSize)
|
|
|
|
return dst
|
|
|
|
}
|
|
|
|
|
2022-11-15 14:30:51 +00:00
|
|
|
// UnmarshalNoCopy unmarshals bh from src without copying the data from src.
|
|
|
|
//
|
|
|
|
// The src must remain unchanged while bh is in use.
|
|
|
|
func (bh *blockHeader) UnmarshalNoCopy(src []byte) ([]byte, error) {
|
|
|
|
bh.noCopy = true
|
2019-05-22 21:16:55 +00:00
|
|
|
// Unmarshal commonPrefix
|
|
|
|
tail, cp, err := encoding.UnmarshalBytes(src)
|
|
|
|
if err != nil {
|
2020-06-30 19:58:18 +00:00
|
|
|
return tail, fmt.Errorf("cannot unmarshal commonPrefix: %w", err)
|
2019-05-22 21:16:55 +00:00
|
|
|
}
|
2022-11-15 14:30:51 +00:00
|
|
|
bh.commonPrefix = cp[:len(cp):len(cp)]
|
2019-05-22 21:16:55 +00:00
|
|
|
src = tail
|
|
|
|
|
|
|
|
// Unmarshal firstItem
|
|
|
|
tail, fi, err := encoding.UnmarshalBytes(src)
|
|
|
|
if err != nil {
|
2020-06-30 19:58:18 +00:00
|
|
|
return tail, fmt.Errorf("cannot unmarshal firstItem: %w", err)
|
2019-05-22 21:16:55 +00:00
|
|
|
}
|
2022-11-15 14:30:51 +00:00
|
|
|
bh.firstItem = fi[:len(fi):len(fi)]
|
2019-05-22 21:16:55 +00:00
|
|
|
src = tail
|
|
|
|
|
|
|
|
// Unmarshal marshalType
|
|
|
|
if len(src) == 0 {
|
|
|
|
return src, fmt.Errorf("cannot unmarshal marshalType from zero bytes")
|
|
|
|
}
|
|
|
|
bh.marshalType = marshalType(src[0])
|
|
|
|
src = src[1:]
|
|
|
|
if err := checkMarshalType(bh.marshalType); err != nil {
|
2020-06-30 19:58:18 +00:00
|
|
|
return src, fmt.Errorf("unexpected marshalType: %w", err)
|
2019-05-22 21:16:55 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
// Unmarshal itemsCount
|
|
|
|
if len(src) < 4 {
|
|
|
|
return src, fmt.Errorf("cannot unmarshal itemsCount from %d bytes; need at least %d bytes", len(src), 4)
|
|
|
|
}
|
|
|
|
bh.itemsCount = encoding.UnmarshalUint32(src)
|
|
|
|
src = src[4:]
|
|
|
|
|
|
|
|
// Unmarshal itemsBlockOffset
|
|
|
|
if len(src) < 8 {
|
|
|
|
return src, fmt.Errorf("cannot unmarshal itemsBlockOffset from %d bytes; neet at least %d bytes", len(src), 8)
|
|
|
|
}
|
|
|
|
bh.itemsBlockOffset = encoding.UnmarshalUint64(src)
|
|
|
|
src = src[8:]
|
|
|
|
|
|
|
|
// Unmarshal lensBlockOffset
|
|
|
|
if len(src) < 8 {
|
|
|
|
return src, fmt.Errorf("cannot unmarshal lensBlockOffset from %d bytes; need at least %d bytes", len(src), 8)
|
|
|
|
}
|
|
|
|
bh.lensBlockOffset = encoding.UnmarshalUint64(src)
|
|
|
|
src = src[8:]
|
|
|
|
|
|
|
|
// Unmarshal itemsBlockSize
|
|
|
|
if len(src) < 4 {
|
|
|
|
return src, fmt.Errorf("cannot unmarshal itemsBlockSize from %d bytes; need at least %d bytes", len(src), 4)
|
|
|
|
}
|
|
|
|
bh.itemsBlockSize = encoding.UnmarshalUint32(src)
|
|
|
|
src = src[4:]
|
|
|
|
|
|
|
|
// Unmarshal lensBlockSize
|
|
|
|
if len(src) < 4 {
|
|
|
|
return src, fmt.Errorf("cannot unmarshal lensBlockSize from %d bytes; need at least %d bytes", len(src), 4)
|
|
|
|
}
|
|
|
|
bh.lensBlockSize = encoding.UnmarshalUint32(src)
|
|
|
|
src = src[4:]
|
|
|
|
|
|
|
|
if bh.itemsCount <= 0 {
|
|
|
|
return src, fmt.Errorf("itemsCount must be bigger than 0; got %d", bh.itemsCount)
|
|
|
|
}
|
|
|
|
if bh.itemsBlockSize > 2*maxInmemoryBlockSize {
|
|
|
|
return src, fmt.Errorf("too big itemsBlockSize; got %d; cannot exceed %d", bh.itemsBlockSize, 2*maxInmemoryBlockSize)
|
|
|
|
}
|
|
|
|
if bh.lensBlockSize > 2*8*maxInmemoryBlockSize {
|
|
|
|
return src, fmt.Errorf("too big lensBlockSize; got %d; cannot exceed %d", bh.lensBlockSize, 2*8*maxInmemoryBlockSize)
|
|
|
|
}
|
|
|
|
|
|
|
|
return src, nil
|
|
|
|
}
|
|
|
|
|
2022-11-15 14:30:51 +00:00
|
|
|
// unmarshalBlockHeadersNoCopy unmarshals all the block headers from src,
|
2019-05-22 21:16:55 +00:00
|
|
|
// appends them to dst and returns the appended result.
|
|
|
|
//
|
|
|
|
// Block headers must be sorted by bh.firstItem.
|
2022-11-15 14:30:51 +00:00
|
|
|
//
|
|
|
|
// It is expected that src remains unchanged while rhe returned blocks are in use.
|
|
|
|
func unmarshalBlockHeadersNoCopy(dst []blockHeader, src []byte, blockHeadersCount int) ([]blockHeader, error) {
|
2019-05-22 21:16:55 +00:00
|
|
|
if blockHeadersCount <= 0 {
|
|
|
|
logger.Panicf("BUG: blockHeadersCount must be greater than 0; got %d", blockHeadersCount)
|
|
|
|
}
|
|
|
|
dstLen := len(dst)
|
|
|
|
if n := dstLen + blockHeadersCount - cap(dst); n > 0 {
|
|
|
|
dst = append(dst[:cap(dst)], make([]blockHeader, n)...)
|
|
|
|
}
|
|
|
|
dst = dst[:dstLen+blockHeadersCount]
|
|
|
|
for i := 0; i < blockHeadersCount; i++ {
|
2022-11-15 14:30:51 +00:00
|
|
|
tail, err := dst[dstLen+i].UnmarshalNoCopy(src)
|
2019-05-22 21:16:55 +00:00
|
|
|
if err != nil {
|
2022-11-16 19:21:46 +00:00
|
|
|
return dst, fmt.Errorf("cannot unmarshal block header #%d out of %d: %w", i, blockHeadersCount, err)
|
2019-05-22 21:16:55 +00:00
|
|
|
}
|
|
|
|
src = tail
|
|
|
|
}
|
|
|
|
if len(src) > 0 {
|
2020-05-14 12:32:07 +00:00
|
|
|
return dst, fmt.Errorf("unexpected non-zero tail left after unmarshaling %d block headers; len(tail)=%d", blockHeadersCount, len(src))
|
2019-05-22 21:16:55 +00:00
|
|
|
}
|
|
|
|
newBHS := dst[dstLen:]
|
|
|
|
|
|
|
|
// Verify that block headers are sorted by firstItem.
|
2019-09-13 18:58:26 +00:00
|
|
|
if !sort.SliceIsSorted(newBHS, func(i, j int) bool { return string(newBHS[i].firstItem) < string(newBHS[j].firstItem) }) {
|
2020-05-14 12:32:07 +00:00
|
|
|
return dst, fmt.Errorf("block headers must be sorted by firstItem; unmarshaled unsorted block headers: %#v", newBHS)
|
2019-05-22 21:16:55 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
return dst, nil
|
|
|
|
}
|