erigon-pulse/state/state_recon.go

374 lines
9.8 KiB
Go
Raw Normal View History

/*
Copyright 2022 Erigon contributors
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
http://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
*/
package state
import (
"bytes"
"container/heap"
"encoding/binary"
"fmt"
"github.com/google/btree"
"github.com/ledgerwatch/erigon-lib/compress"
"github.com/ledgerwatch/erigon-lib/recsplit"
"github.com/ledgerwatch/erigon-lib/recsplit/eliasfano32"
)
// Algorithms for reconstituting the state from state history
// DomainContext allows accesing the same domain from multiple go-routines
type DomainContext struct {
d *Domain
files [NumberOfTypes]*btree.BTree
}
func (d *Domain) MakeContext() *DomainContext {
dc := &DomainContext{d: d}
for fType := FileType(0); fType < NumberOfTypes; fType++ {
bt := btree.New(32)
dc.files[fType] = bt
d.files[fType].Ascend(func(i btree.Item) bool {
item := i.(*filesItem)
bt.ReplaceOrInsert(&filesItem{
startTxNum: item.startTxNum,
endTxNum: item.endTxNum,
decompressor: item.decompressor,
index: item.index,
getter: item.decompressor.MakeGetter(),
indexReader: recsplit.NewIndexReader(item.index),
})
return true
})
}
return dc
}
func (dc *DomainContext) GetNoState(key []byte, txNum uint64) ([]byte, bool, uint64, error) {
var search filesItem
search.startTxNum = txNum
search.endTxNum = txNum
var foundTxNum uint64
var foundEndTxNum uint64
var foundStartTxNum uint64
var found bool
var anyItem bool
var maxTxNum uint64
dc.files[EfHistory].AscendGreaterOrEqual(&search, func(i btree.Item) bool {
item := i.(*filesItem)
if item.index.Empty() {
return true
}
anyItem = true
offset := item.indexReader.Lookup(key)
g := item.getter
g.Reset(offset)
if k, _ := g.NextUncompressed(); bytes.Equal(k, key) {
eliasVal, _ := g.NextUncompressed()
ef, _ := eliasfano32.ReadEliasFano(eliasVal)
if n, ok := ef.Search(txNum); ok {
foundTxNum = n
foundEndTxNum = item.endTxNum
foundStartTxNum = item.startTxNum
found = true
return false
} else {
maxTxNum = ef.Max()
}
}
return true
})
if found {
var txKey [8]byte
binary.BigEndian.PutUint64(txKey[:], foundTxNum)
var historyItem *filesItem
search.startTxNum = foundStartTxNum
search.endTxNum = foundEndTxNum
if i := dc.files[History].Get(&search); i != nil {
historyItem = i.(*filesItem)
} else {
return nil, false, 0, fmt.Errorf("no %s file found for [%x]", dc.d.filenameBase, key)
}
offset := historyItem.indexReader.Lookup2(txKey[:], key)
g := historyItem.getter
g.Reset(offset)
if dc.d.compressVals {
v, _ := g.Next(nil)
return v, true, 0, nil
}
v, _ := g.NextUncompressed()
return v, true, 0, nil
} else if anyItem {
return nil, false, maxTxNum, nil
} else {
return nil, true, 0, nil
}
}
func (dc *DomainContext) MaxTxNum(key []byte) (bool, uint64) {
var found bool
var foundTxNum uint64
dc.files[EfHistory].Descend(func(i btree.Item) bool {
item := i.(*filesItem)
if item.index.Empty() {
return true
}
offset := item.indexReader.Lookup(key)
g := item.getter
g.Reset(offset)
if k, _ := g.NextUncompressed(); bytes.Equal(k, key) {
eliasVal, _ := g.NextUncompressed()
ef, _ := eliasfano32.ReadEliasFano(eliasVal)
found = true
foundTxNum = ef.Max()
return false
}
return true
})
if !found {
return false, 0
}
return true, foundTxNum
}
type ReconItem struct {
key []byte
txNum uint64
startTxNum uint64
endTxNum uint64
g *compress.Getter
startOffset uint64
lastOffset uint64
}
type ReconHeap []*ReconItem
func (rh ReconHeap) Len() int {
return len(rh)
}
// Less (part of heap.Interface) compares two links. For persisted links, those with the lower block heights get evicted first. This means that more recently persisted links are preferred.
// For non-persisted links, those with the highest block heights get evicted first. This is to prevent "holes" in the block heights that may cause inability to
// insert headers in the ascending order of their block heights.
func (rh ReconHeap) Less(i, j int) bool {
c := bytes.Compare(rh[i].key, rh[j].key)
if c == 0 {
return rh[i].txNum < rh[j].txNum
}
return c < 0
}
// Swap (part of heap.Interface) moves two links in the queue into each other's places. Note that each link has idx attribute that is getting adjusted during
// the swap. The idx attribute allows the removal of links from the middle of the queue (in case if links are getting invalidated due to
// failed verification of unavailability of parent headers)
func (rh ReconHeap) Swap(i, j int) {
rh[i], rh[j] = rh[j], rh[i]
}
// Push (part of heap.Interface) places a new link onto the end of queue. Note that idx attribute is set to the correct position of the new link
func (rh *ReconHeap) Push(x interface{}) {
// Push and Pop use pointer receivers because they modify the slice's length,
// not just its contents.
l := x.(*ReconItem)
*rh = append(*rh, l)
}
// Pop (part of heap.Interface) removes the first link from the queue
func (rh *ReconHeap) Pop() interface{} {
old := *rh
n := len(old)
x := old[n-1]
*rh = old[0 : n-1]
return x
}
type ScanIterator struct {
dc *DomainContext
h ReconHeap
uptoTxNum uint64
hasNext bool
nextTxNum uint64
fromKey, toKey []byte
key []byte
progress uint64
total uint64
}
func (si *ScanIterator) advance() {
for si.h.Len() > 0 {
top := heap.Pop(&si.h).(*ReconItem)
key := top.key
val, offset := top.g.NextUncompressed()
si.progress += offset - top.lastOffset
top.lastOffset = offset
if top.g.HasNext() {
top.key, _ = top.g.NextUncompressed()
if si.toKey == nil || bytes.Compare(top.key, si.toKey) <= 0 {
heap.Push(&si.h, top)
}
}
if !bytes.Equal(key, si.key) {
si.key = key
ef, _ := eliasfano32.ReadEliasFano(val)
max := ef.Max()
if max < si.uptoTxNum {
si.nextTxNum = max
si.hasNext = true
return
}
}
}
si.hasNext = false
}
func (si *ScanIterator) HasNext() bool {
return si.hasNext
}
func (si *ScanIterator) Next() (uint64, uint64) {
n, p := si.nextTxNum, si.progress
si.advance()
return n, p
}
func (si *ScanIterator) Total() uint64 {
return si.total
}
func (dc *DomainContext) iterateReconTxs(fromKey, toKey []byte, uptoTxNum uint64) *ScanIterator {
var si ScanIterator
dc.files[EfHistory].Ascend(func(i btree.Item) bool {
item := i.(*filesItem)
g := item.getter
for g.HasNext() {
key, offset := g.NextUncompressed()
if fromKey == nil || bytes.Compare(key, fromKey) > 0 {
heap.Push(&si.h, &ReconItem{startTxNum: item.startTxNum, endTxNum: item.endTxNum, g: g, txNum: ^item.endTxNum, key: key, startOffset: offset, lastOffset: offset})
break
} else {
g.SkipUncompressed()
}
}
si.total += uint64(item.decompressor.Size())
return true
})
si.dc = dc
si.fromKey = fromKey
si.toKey = toKey
si.uptoTxNum = uptoTxNum
si.advance()
return &si
}
type HistoryIterator struct {
dc *DomainContext
h ReconHeap
txNum uint64
key, val []byte
hasNext bool
compressVals bool
fromKey, toKey []byte
progress uint64
total uint64
}
func (hi *HistoryIterator) advance() {
for hi.h.Len() > 0 {
top := heap.Pop(&hi.h).(*ReconItem)
key := top.key
val, offset := top.g.NextUncompressed()
hi.progress += offset - top.lastOffset
top.lastOffset = offset
if top.g.HasNext() {
top.key, _ = top.g.NextUncompressed()
if hi.toKey == nil || bytes.Compare(top.key, hi.toKey) <= 0 {
heap.Push(&hi.h, top)
}
}
if !bytes.Equal(hi.key, key) {
ef, _ := eliasfano32.ReadEliasFano(val)
if n, ok := ef.Search(hi.txNum); ok {
hi.key = key
var txKey [8]byte
binary.BigEndian.PutUint64(txKey[:], n)
var historyItem *filesItem
var search filesItem
search.startTxNum = top.startTxNum
search.endTxNum = top.endTxNum
if i := hi.dc.files[History].Get(&search); i != nil {
historyItem = i.(*filesItem)
} else {
panic(fmt.Errorf("no %s file found for [%x]", hi.dc.d.filenameBase, hi.key))
}
offset := historyItem.indexReader.Lookup2(txKey[:], hi.key)
g := historyItem.getter
g.Reset(offset)
if hi.compressVals {
hi.val, _ = g.Next(nil)
} else {
hi.val, _ = g.NextUncompressed()
}
hi.hasNext = true
return
}
}
}
hi.hasNext = false
}
func (hi *HistoryIterator) HasNext() bool {
return hi.hasNext
}
func (hi *HistoryIterator) Next() ([]byte, []byte, uint64) {
k, v, p := hi.key, hi.val, hi.progress
hi.advance()
return k, v, p
}
func (hi *HistoryIterator) Total() uint64 {
return hi.total
}
// Creates iterator that provides history values for the state just before transaction txNum
func (dc *DomainContext) iterateHistoryBeforeTxNum(fromKey, toKey []byte, txNum uint64) *HistoryIterator {
var hi HistoryIterator
heap.Init(&hi.h)
dc.files[EfHistory].Ascend(func(i btree.Item) bool {
item := i.(*filesItem)
g := item.getter
g.Reset(0)
for g.HasNext() {
key, offset := g.NextUncompressed()
if fromKey == nil || bytes.Compare(key, fromKey) > 0 {
heap.Push(&hi.h, &ReconItem{g: g, key: key, startTxNum: item.startTxNum, endTxNum: item.endTxNum, txNum: item.endTxNum, startOffset: offset, lastOffset: offset})
break
} else {
g.SkipUncompressed()
}
}
hi.total += uint64(item.decompressor.Size())
return true
})
hi.dc = dc
hi.compressVals = dc.d.compressVals
hi.txNum = txNum
hi.fromKey = fromKey
hi.toKey = toKey
hi.advance()
return &hi
}