VictoriaMetrics/lib/mergeset/part_search.go

package mergeset

import (
	"fmt"
	"io"
	"sort"

	"github.com/VictoriaMetrics/VictoriaMetrics/lib/bytesutil"
	"github.com/VictoriaMetrics/VictoriaMetrics/lib/encoding"
	"github.com/VictoriaMetrics/VictoriaMetrics/lib/logger"
)

type partSearch struct {
	// Item contains the last item found after the call to NextItem.
	//
	// The Item content is valid until the next call to NextItem.
	Item []byte

	// p is a part to search.
	p *part

	// The remaining metaindex rows to scan, obtained from p.mrs.
	mrs []metaindexRow

	// The remaining block headers to scan in the current metaindexRow.
	bhs []blockHeader

	// Pointer to inmemory block, which may be reused.
	inmemoryBlockReuse *inmemoryBlock

	shouldCacheBlock func(item []byte) bool

	idxbCache *indexBlockCache
	ibCache   *inmemoryBlockCache

	// err contains the last error.
	err error

	indexBuf           []byte
	compressedIndexBuf []byte

	sb storageBlock

	ib        *inmemoryBlock
	ibItemIdx int
}

func (ps *partSearch) reset() {
	ps.Item = nil
	ps.p = nil
	ps.mrs = nil
	ps.bhs = nil
	if ps.inmemoryBlockReuse != nil {
		putInmemoryBlock(ps.inmemoryBlockReuse)
		ps.inmemoryBlockReuse = nil
	}
	ps.shouldCacheBlock = nil
	ps.idxbCache = nil
	ps.ibCache = nil
	ps.err = nil

	ps.indexBuf = ps.indexBuf[:0]
	ps.compressedIndexBuf = ps.compressedIndexBuf[:0]

	ps.sb.Reset()

	ps.ib = nil
	ps.ibItemIdx = 0
}

// Init initializes ps for search in the p.
//
// Use Seek for search in p.
func (ps *partSearch) Init(p *part, shouldCacheBlock func(item []byte) bool) {
	ps.reset()

	ps.p = p
	ps.idxbCache = p.idxbCache
	ps.ibCache = p.ibCache
}

// Seek seeks for the first item greater or equal to k in ps.
func (ps *partSearch) Seek(k []byte) {
	if err := ps.Error(); err != nil {
		// Do nothing on unrecoverable error.
		return
	}
	ps.err = nil

	if string(k) > string(ps.p.ph.lastItem) {
		// Not matching items in the part.
		ps.err = io.EOF
		return
	}

	if ps.tryFastSeek(k) {
		return
	}

	ps.Item = nil
	ps.mrs = ps.p.mrs
	ps.bhs = nil

	ps.indexBuf = ps.indexBuf[:0]
	ps.compressedIndexBuf = ps.compressedIndexBuf[:0]

	ps.sb.Reset()

	ps.ib = nil
	ps.ibItemIdx = 0

	if string(k) <= string(ps.p.ph.firstItem) {
		// The first item in the first block matches.
		ps.err = ps.nextBlock()
		return
	}

	// Locate the first metaindexRow to scan.
	if len(ps.mrs) == 0 {
		logger.Panicf("BUG: part without metaindex rows passed to partSearch")
	}
	n := sort.Search(len(ps.mrs), func(i int) bool {
		return string(k) <= string(ps.mrs[i].firstItem)
	})
	if n > 0 {
		// The given k may be located in the previous metaindexRow, so go to it.
		n--
	}
	ps.mrs = ps.mrs[n:]

	// Read block headers for the found metaindexRow.
	if err := ps.nextBHS(); err != nil {
		ps.err = err
		return
	}

	// Locate the first block to scan.
	n = sort.Search(len(ps.bhs), func(i int) bool {
		return string(k) <= string(ps.bhs[i].firstItem)
	})
	if n > 0 {
		// The given k may be located in the previous block, so go to it.
		n--
	}
	ps.bhs = ps.bhs[n:]

	// Read the block.
	if err := ps.nextBlock(); err != nil {
		ps.err = err
		return
	}

	// Locate the first item to scan in the block.
	items := ps.ib.items
	cpLen := commonPrefixLen(ps.ib.commonPrefix, k)
	if cpLen > 0 {
		keySuffix := k[cpLen:]
		ps.ibItemIdx = sort.Search(len(items), func(i int) bool {
			return string(keySuffix) <= string(items[i][cpLen:])
		})
	} else {
		ps.ibItemIdx = binarySearchKey(items, k)
	}
	if ps.ibItemIdx < len(items) {
		// The item has been found.
		return
	}

	// Nothing found in the current block. Proceed to the next block.
	// The item to search must be the first in the next block.
	if err := ps.nextBlock(); err != nil {
		ps.err = err
		return
	}
}

func (ps *partSearch) tryFastSeek(k []byte) bool {
	if ps.ib == nil {
		return false
	}
	items := ps.ib.items
	idx := ps.ibItemIdx
	if idx >= len(items) {
		// The ib is exhausted.
		return false
	}
	if string(k) > string(items[len(items)-1]) {
		// The item is located in next blocks.
		return false
	}

	// The item is located either in the current block or in previous blocks.
	if idx > 0 {
		idx--
	}
	if string(k) < string(items[idx]) {
		if string(k) < string(items[0]) {
			// The item is located in previous blocks.
			return false
		}
		idx = 0
	}

	// The item is located in the current block
	ps.ibItemIdx = idx + binarySearchKey(items[idx:], k)
	return true
}

// NextItem advances to the next Item.
//
// Returns true on success.
func (ps *partSearch) NextItem() bool {
	if ps.err != nil {
		return false
	}

	if ps.ibItemIdx < len(ps.ib.items) {
		// Fast path - the current block contains more items.
		// Proceed to the next item.
		ps.Item = ps.ib.items[ps.ibItemIdx]
		ps.ibItemIdx++
		return true
	}

	// The current block is over. Proceed to the next block.
	if err := ps.nextBlock(); err != nil {
		ps.err = err
		return false
	}

	// Invariant: len(ps.ib.items) > 0 after nextBlock.
	ps.Item = ps.ib.items[0]
	ps.ibItemIdx++
	return true
}

// Error returns the last error occurred in the ps.
func (ps *partSearch) Error() error {
	if ps.err == io.EOF {
		return nil
	}
	return ps.err
}

func (ps *partSearch) nextBlock() error {
	if ps.inmemoryBlockReuse != nil {
		putInmemoryBlock(ps.inmemoryBlockReuse)
		ps.inmemoryBlockReuse = nil
	}
	if len(ps.bhs) == 0 {
		// The current metaindexRow is over. Proceed to the next metaindexRow.
		if err := ps.nextBHS(); err != nil {
			return err
		}
	}
	bh := &ps.bhs[0]
	ps.bhs = ps.bhs[1:]
	ib, mayReuseInmemoryBlock, err := ps.getInmemoryBlock(bh)
	if err != nil {
		return err
	}
	if mayReuseInmemoryBlock {
		ps.inmemoryBlockReuse = ib
	}
	ps.ib = ib
	ps.ibItemIdx = 0
	return nil
}

func (ps *partSearch) nextBHS() error {
	if len(ps.mrs) == 0 {
		return io.EOF
	}
	mr := &ps.mrs[0]
	ps.mrs = ps.mrs[1:]
	idxbKey := mr.indexBlockOffset
	idxb := ps.idxbCache.Get(idxbKey)
	if idxb == nil {
		var err error
		idxb, err = ps.readIndexBlock(mr)
		if err != nil {
			return fmt.Errorf("cannot read index block: %s", err)
		}
		ps.idxbCache.Put(idxbKey, idxb)
	}
	ps.bhs = idxb.bhs
	return nil
}

func (ps *partSearch) readIndexBlock(mr *metaindexRow) (*indexBlock, error) {
	ps.compressedIndexBuf = bytesutil.Resize(ps.compressedIndexBuf, int(mr.indexBlockSize))
	ps.p.indexFile.MustReadAt(ps.compressedIndexBuf, int64(mr.indexBlockOffset))

	var err error
	ps.indexBuf, err = encoding.DecompressZSTD(ps.indexBuf[:0], ps.compressedIndexBuf)
	if err != nil {
		return nil, fmt.Errorf("cannot decompress index block with size %d bytes: %s", len(ps.compressedIndexBuf), err)
	}
	idxb := getIndexBlock()
	idxb.bhs, err = unmarshalBlockHeaders(idxb.bhs[:0], ps.indexBuf, int(mr.blockHeadersCount))
	if err != nil {
		return nil, fmt.Errorf("cannot unmarshal block headers from index block (offset=%d, size=%d): %s", mr.indexBlockOffset, mr.indexBlockSize, err)
	}
	return idxb, nil
}

func (ps *partSearch) getInmemoryBlock(bh *blockHeader) (*inmemoryBlock, bool, error) {
	if ps.shouldCacheBlock != nil {
		if !ps.shouldCacheBlock(bh.firstItem) {
			ib, err := ps.readInmemoryBlock(bh)
			if err != nil {
				return nil, false, err
			}
			return ib, true, nil
		}
	}

	var ibKey inmemoryBlockCacheKey
	ibKey.Init(bh)
	ib := ps.ibCache.Get(ibKey)
	if ib != nil {
		return ib, false, nil
	}
	ib, err := ps.readInmemoryBlock(bh)
	if err != nil {
		return nil, false, err
	}
	ps.ibCache.Put(ibKey, ib)
	return ib, false, nil
}

func (ps *partSearch) readInmemoryBlock(bh *blockHeader) (*inmemoryBlock, error) {
	ps.sb.Reset()

	ps.sb.itemsData = bytesutil.Resize(ps.sb.itemsData, int(bh.itemsBlockSize))
	ps.p.itemsFile.MustReadAt(ps.sb.itemsData, int64(bh.itemsBlockOffset))

	ps.sb.lensData = bytesutil.Resize(ps.sb.lensData, int(bh.lensBlockSize))
	ps.p.lensFile.MustReadAt(ps.sb.lensData, int64(bh.lensBlockOffset))

	ib := getInmemoryBlock()
	if err := ib.UnmarshalData(&ps.sb, bh.firstItem, bh.commonPrefix, bh.itemsCount, bh.marshalType); err != nil {
		return nil, fmt.Errorf("cannot unmarshal storage block with %d items: %s", bh.itemsCount, err)
	}

	return ib, nil
}

func binarySearchKey(items [][]byte, key []byte) int {
	if len(items) == 0 {
		return 0
	}
	if string(key) <= string(items[0]) {
		// Fast path - the item is the first.
		return 0
	}
	items = items[1:]
	offset := uint(1)

	// This has been copy-pasted from https://golang.org/src/sort/search.go
	n := uint(len(items))
	i, j := uint(0), n
	for i < j {
		h := uint(i+j) >> 1
		if h >= 0 && h < uint(len(items)) && string(key) > string(items[h]) {
			i = h + 1
		} else {
			j = h
		}
	}
	return int(i + offset)
}
all: open-sourcing single-node version 2019-05-22 21:16:55 +00:00			`package mergeset`

			`import (`
			`"fmt"`
			`"io"`
			`"sort"`

			`"github.com/VictoriaMetrics/VictoriaMetrics/lib/bytesutil"`
			`"github.com/VictoriaMetrics/VictoriaMetrics/lib/encoding"`
			`"github.com/VictoriaMetrics/VictoriaMetrics/lib/logger"`
			`)`

			`type partSearch struct {`
			`// Item contains the last item found after the call to NextItem.`
			`//`
app/vmselect/promql: allow negative offsets Updates https://github.com/prometheus/prometheus/issues/6282 2019-12-10 21:41:11 +00:00			`// The Item content is valid until the next call to NextItem.`
all: open-sourcing single-node version 2019-05-22 21:16:55 +00:00			`Item []byte`

			`// p is a part to search.`
			`p *part`

			`// The remaining metaindex rows to scan, obtained from p.mrs.`
			`mrs []metaindexRow`

			`// The remaining block headers to scan in the current metaindexRow.`
			`bhs []blockHeader`

			`// Pointer to inmemory block, which may be reused.`
			`inmemoryBlockReuse *inmemoryBlock`

lib/{mergeset,storage}: do not cache inverted index blocks containing `tag->metricIDs` items This should reduce the amounts of used RAM during queries with filters over big number of time series. 2019-09-25 10:47:06 +00:00			`shouldCacheBlock func(item []byte) bool`

all: open-sourcing single-node version 2019-05-22 21:16:55 +00:00			`idxbCache *indexBlockCache`
			`ibCache *inmemoryBlockCache`

			`// err contains the last error.`
			`err error`

			`indexBuf []byte`
			`compressedIndexBuf []byte`

			`sb storageBlock`

			`ib *inmemoryBlock`
			`ibItemIdx int`
			`}`

			`func (ps *partSearch) reset() {`
			`ps.Item = nil`
			`ps.p = nil`
			`ps.mrs = nil`
			`ps.bhs = nil`
			`if ps.inmemoryBlockReuse != nil {`
			`putInmemoryBlock(ps.inmemoryBlockReuse)`
			`ps.inmemoryBlockReuse = nil`
			`}`
lib/{mergeset,storage}: do not cache inverted index blocks containing `tag->metricIDs` items This should reduce the amounts of used RAM during queries with filters over big number of time series. 2019-09-25 10:47:06 +00:00			`ps.shouldCacheBlock = nil`
all: open-sourcing single-node version 2019-05-22 21:16:55 +00:00			`ps.idxbCache = nil`
			`ps.ibCache = nil`
			`ps.err = nil`

			`ps.indexBuf = ps.indexBuf[:0]`
			`ps.compressedIndexBuf = ps.compressedIndexBuf[:0]`

			`ps.sb.Reset()`

			`ps.ib = nil`
			`ps.ibItemIdx = 0`
			`}`

			`// Init initializes ps for search in the p.`
			`//`
			`// Use Seek for search in p.`
lib/{mergeset,storage}: do not cache inverted index blocks containing `tag->metricIDs` items This should reduce the amounts of used RAM during queries with filters over big number of time series. 2019-09-25 10:47:06 +00:00			`func (ps partSearch) Init(p part, shouldCacheBlock func(item []byte) bool) {`
all: open-sourcing single-node version 2019-05-22 21:16:55 +00:00			`ps.reset()`

			`ps.p = p`
lib/{mergeset,storage}: fix uint64 counters alignment for 32-bit architectures (GOARCH=386, GOARCH=arm) 2020-01-14 20:47:04 +00:00			`ps.idxbCache = p.idxbCache`
			`ps.ibCache = p.ibCache`
all: open-sourcing single-node version 2019-05-22 21:16:55 +00:00			`}`

			`// Seek seeks for the first item greater or equal to k in ps.`
			`func (ps *partSearch) Seek(k []byte) {`
			`if err := ps.Error(); err != nil {`
			`// Do nothing on unrecoverable error.`
			`return`
			`}`
			`ps.err = nil`

			`if string(k) > string(ps.p.ph.lastItem) {`
			`// Not matching items in the part.`
			`ps.err = io.EOF`
			`return`
			`}`

			`if ps.tryFastSeek(k) {`
			`return`
			`}`

			`ps.Item = nil`
			`ps.mrs = ps.p.mrs`
			`ps.bhs = nil`

			`ps.indexBuf = ps.indexBuf[:0]`
			`ps.compressedIndexBuf = ps.compressedIndexBuf[:0]`

			`ps.sb.Reset()`

			`ps.ib = nil`
			`ps.ibItemIdx = 0`

			`if string(k) <= string(ps.p.ph.firstItem) {`
			`// The first item in the first block matches.`
			`ps.err = ps.nextBlock()`
			`return`
			`}`

			`// Locate the first metaindexRow to scan.`
			`if len(ps.mrs) == 0 {`
			`logger.Panicf("BUG: part without metaindex rows passed to partSearch")`
			`}`
			`n := sort.Search(len(ps.mrs), func(i int) bool {`
			`return string(k) <= string(ps.mrs[i].firstItem)`
			`})`
			`if n > 0 {`
			`// The given k may be located in the previous metaindexRow, so go to it.`
			`n--`
			`}`
			`ps.mrs = ps.mrs[n:]`

			`// Read block headers for the found metaindexRow.`
			`if err := ps.nextBHS(); err != nil {`
			`ps.err = err`
			`return`
			`}`

			`// Locate the first block to scan.`
			`n = sort.Search(len(ps.bhs), func(i int) bool {`
			`return string(k) <= string(ps.bhs[i].firstItem)`
			`})`
			`if n > 0 {`
			`// The given k may be located in the previous block, so go to it.`
			`n--`
			`}`
			`ps.bhs = ps.bhs[n:]`

			`// Read the block.`
			`if err := ps.nextBlock(); err != nil {`
			`ps.err = err`
			`return`
			`}`

			`// Locate the first item to scan in the block.`
			`items := ps.ib.items`
			`cpLen := commonPrefixLen(ps.ib.commonPrefix, k)`
			`if cpLen > 0 {`
			`keySuffix := k[cpLen:]`
			`ps.ibItemIdx = sort.Search(len(items), func(i int) bool {`
			`return string(keySuffix) <= string(items[i][cpLen:])`
			`})`
			`} else {`
			`ps.ibItemIdx = binarySearchKey(items, k)`
			`}`
			`if ps.ibItemIdx < len(items) {`
			`// The item has been found.`
			`return`
			`}`

			`// Nothing found in the current block. Proceed to the next block.`
			`// The item to search must be the first in the next block.`
			`if err := ps.nextBlock(); err != nil {`
			`ps.err = err`
			`return`
			`}`
			`}`

			`func (ps *partSearch) tryFastSeek(k []byte) bool {`
			`if ps.ib == nil {`
			`return false`
			`}`
			`items := ps.ib.items`
			`idx := ps.ibItemIdx`
			`if idx >= len(items) {`
			`// The ib is exhausted.`
			`return false`
			`}`
			`if string(k) > string(items[len(items)-1]) {`
			`// The item is located in next blocks.`
			`return false`
			`}`

			`// The item is located either in the current block or in previous blocks.`
			`if idx > 0 {`
			`idx--`
			`}`
			`if string(k) < string(items[idx]) {`
			`if string(k) < string(items[0]) {`
			`// The item is located in previous blocks.`
			`return false`
			`}`
			`idx = 0`
			`}`

			`// The item is located in the current block`
			`ps.ibItemIdx = idx + binarySearchKey(items[idx:], k)`
			`return true`
			`}`

			`// NextItem advances to the next Item.`
			`//`
			`// Returns true on success.`
			`func (ps *partSearch) NextItem() bool {`
			`if ps.err != nil {`
			`return false`
			`}`

			`if ps.ibItemIdx < len(ps.ib.items) {`
			`// Fast path - the current block contains more items.`
			`// Proceed to the next item.`
			`ps.Item = ps.ib.items[ps.ibItemIdx]`
			`ps.ibItemIdx++`
			`return true`
			`}`

			`// The current block is over. Proceed to the next block.`
			`if err := ps.nextBlock(); err != nil {`
			`ps.err = err`
			`return false`
			`}`

			`// Invariant: len(ps.ib.items) > 0 after nextBlock.`
			`ps.Item = ps.ib.items[0]`
			`ps.ibItemIdx++`
			`return true`
			`}`

			`// Error returns the last error occurred in the ps.`
			`func (ps *partSearch) Error() error {`
			`if ps.err == io.EOF {`
			`return nil`
			`}`
			`return ps.err`
			`}`

			`func (ps *partSearch) nextBlock() error {`
			`if ps.inmemoryBlockReuse != nil {`
			`putInmemoryBlock(ps.inmemoryBlockReuse)`
			`ps.inmemoryBlockReuse = nil`
			`}`
			`if len(ps.bhs) == 0 {`
			`// The current metaindexRow is over. Proceed to the next metaindexRow.`
			`if err := ps.nextBHS(); err != nil {`
			`return err`
			`}`
			`}`
			`bh := &ps.bhs[0]`
			`ps.bhs = ps.bhs[1:]`
			`ib, mayReuseInmemoryBlock, err := ps.getInmemoryBlock(bh)`
			`if err != nil {`
			`return err`
			`}`
			`if mayReuseInmemoryBlock {`
			`ps.inmemoryBlockReuse = ib`
			`}`
			`ps.ib = ib`
			`ps.ibItemIdx = 0`
			`return nil`
			`}`

			`func (ps *partSearch) nextBHS() error {`
			`if len(ps.mrs) == 0 {`
			`return io.EOF`
			`}`
			`mr := &ps.mrs[0]`
			`ps.mrs = ps.mrs[1:]`
			`idxbKey := mr.indexBlockOffset`
			`idxb := ps.idxbCache.Get(idxbKey)`
lib/{storage,mergeset}: cleanup: remove unused partSearch.indexBlockReuse 2020-05-14 11:02:52 +00:00			`if idxb == nil {`
			`var err error`
			`idxb, err = ps.readIndexBlock(mr)`
			`if err != nil {`
			`return fmt.Errorf("cannot read index block: %s", err)`
			`}`
			`ps.idxbCache.Put(idxbKey, idxb)`
all: open-sourcing single-node version 2019-05-22 21:16:55 +00:00			`}`
lib/{storage,mergeset}: cleanup: remove unused partSearch.indexBlockReuse 2020-05-14 11:02:52 +00:00			`ps.bhs = idxb.bhs`
			`return nil`
all: open-sourcing single-node version 2019-05-22 21:16:55 +00:00			`}`

			`func (ps partSearch) readIndexBlock(mr metaindexRow) (*indexBlock, error) {`
			`ps.compressedIndexBuf = bytesutil.Resize(ps.compressedIndexBuf, int(mr.indexBlockSize))`
all: rename ReadAt* to MustReadAt* in order to dont clash with io.ReaderAt 2020-01-30 11:22:15 +00:00			`ps.p.indexFile.MustReadAt(ps.compressedIndexBuf, int64(mr.indexBlockOffset))`
all: open-sourcing single-node version 2019-05-22 21:16:55 +00:00
			`var err error`
			`ps.indexBuf, err = encoding.DecompressZSTD(ps.indexBuf[:0], ps.compressedIndexBuf)`
			`if err != nil {`
			`return nil, fmt.Errorf("cannot decompress index block with size %d bytes: %s", len(ps.compressedIndexBuf), err)`
			`}`
			`idxb := getIndexBlock()`
			`idxb.bhs, err = unmarshalBlockHeaders(idxb.bhs[:0], ps.indexBuf, int(mr.blockHeadersCount))`
			`if err != nil {`
			`return nil, fmt.Errorf("cannot unmarshal block headers from index block (offset=%d, size=%d): %s", mr.indexBlockOffset, mr.indexBlockSize, err)`
			`}`
			`return idxb, nil`
			`}`

			`func (ps partSearch) getInmemoryBlock(bh blockHeader) (*inmemoryBlock, bool, error) {`
lib/{mergeset,storage}: do not cache inverted index blocks containing `tag->metricIDs` items This should reduce the amounts of used RAM during queries with filters over big number of time series. 2019-09-25 10:47:06 +00:00			`if ps.shouldCacheBlock != nil {`
			`if !ps.shouldCacheBlock(bh.firstItem) {`
			`ib, err := ps.readInmemoryBlock(bh)`
			`if err != nil {`
			`return nil, false, err`
			`}`
			`return ib, true, nil`
			`}`
			`}`

all: open-sourcing single-node version 2019-05-22 21:16:55 +00:00			`var ibKey inmemoryBlockCacheKey`
			`ibKey.Init(bh)`
			`ib := ps.ibCache.Get(ibKey)`
			`if ib != nil {`
			`return ib, false, nil`
			`}`
			`ib, err := ps.readInmemoryBlock(bh)`
			`if err != nil {`
			`return nil, false, err`
			`}`
lib/{storage,mergeset}: cleanup: remove unused partSearch.indexBlockReuse 2020-05-14 11:02:52 +00:00			`ps.ibCache.Put(ibKey, ib)`
			`return ib, false, nil`
all: open-sourcing single-node version 2019-05-22 21:16:55 +00:00			`}`

			`func (ps partSearch) readInmemoryBlock(bh blockHeader) (*inmemoryBlock, error) {`
			`ps.sb.Reset()`

			`ps.sb.itemsData = bytesutil.Resize(ps.sb.itemsData, int(bh.itemsBlockSize))`
all: rename ReadAt* to MustReadAt* in order to dont clash with io.ReaderAt 2020-01-30 11:22:15 +00:00			`ps.p.itemsFile.MustReadAt(ps.sb.itemsData, int64(bh.itemsBlockOffset))`
all: open-sourcing single-node version 2019-05-22 21:16:55 +00:00
			`ps.sb.lensData = bytesutil.Resize(ps.sb.lensData, int(bh.lensBlockSize))`
all: rename ReadAt* to MustReadAt* in order to dont clash with io.ReaderAt 2020-01-30 11:22:15 +00:00			`ps.p.lensFile.MustReadAt(ps.sb.lensData, int64(bh.lensBlockOffset))`
all: open-sourcing single-node version 2019-05-22 21:16:55 +00:00
			`ib := getInmemoryBlock()`
			`if err := ib.UnmarshalData(&ps.sb, bh.firstItem, bh.commonPrefix, bh.itemsCount, bh.marshalType); err != nil {`
			`return nil, fmt.Errorf("cannot unmarshal storage block with %d items: %s", bh.itemsCount, err)`
			`}`

			`return ib, nil`
			`}`

			`func binarySearchKey(items [][]byte, key []byte) int {`
lib/mergeset: speed up binarySearchKey by skipping the first item during binary search 2019-06-29 10:45:49 +00:00			`if len(items) == 0 {`
			`return 0`
			`}`
			`if string(key) <= string(items[0]) {`
			`// Fast path - the item is the first.`
			`return 0`
all: open-sourcing single-node version 2019-05-22 21:16:55 +00:00			`}`
lib/mergeset: speed up binarySearchKey by skipping the first item during binary search 2019-06-29 10:45:49 +00:00			`items = items[1:]`
			`offset := uint(1)`
all: open-sourcing single-node version 2019-05-22 21:16:55 +00:00
			`// This has been copy-pasted from https://golang.org/src/sort/search.go`
			`n := uint(len(items))`
			`i, j := uint(0), n`
			`for i < j {`
			`h := uint(i+j) >> 1`
lib/storage: create and use `lib/uint64set` instead of `map[uint64]struct{}` This should improve inverted index search performance for filters matching big number of time series, since `lib/uint64set.Set` is faster than `map[uint64]struct{}` for both `Add` and `Has` calls. See the corresponding benchmarks in `lib/uint64set`. 2019-09-24 18:10:22 +00:00			`if h >= 0 && h < uint(len(items)) && string(key) > string(items[h]) {`
all: open-sourcing single-node version 2019-05-22 21:16:55 +00:00			`i = h + 1`
			`} else {`
			`j = h`
			`}`
			`}`
lib/mergeset: `make fmt` 2019-06-29 11:25:26 +00:00			`return int(i + offset)`
all: open-sourcing single-node version 2019-05-22 21:16:55 +00:00			`}`