mirror of
https://gitlab.com/pulsechaincom/erigon-pulse.git
synced 2025-01-11 05:20:05 +00:00
d1c8416270
Fix the sync crash due to the mis-accounting of prunable entries
239 lines
6.6 KiB
Go
239 lines
6.6 KiB
Go
// Copyright 2019 The go-ethereum Authors
|
|
// This file is part of the go-ethereum library.
|
|
//
|
|
// The go-ethereum library is free software: you can redistribute it and/or modify
|
|
// it under the terms of the GNU Lesser General Public License as published by
|
|
// the Free Software Foundation, either version 3 of the License, or
|
|
// (at your option) any later version.
|
|
//
|
|
// The go-ethereum library is distributed in the hope that it will be useful,
|
|
// but WITHOUT ANY WARRANTY; without even the implied warranty off
|
|
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
// GNU Lesser General Public License for more details.
|
|
//
|
|
// You should have received a copy of the GNU Lesser General Public License
|
|
// along with the go-ethereum library. If not, see <http://www.gnu.org/licenses/>.
|
|
|
|
// Pruning of the Merkle Patricia trees
|
|
|
|
package trie
|
|
|
|
import (
|
|
"fmt"
|
|
"sort"
|
|
"strings"
|
|
"sync"
|
|
|
|
"github.com/ledgerwatch/turbo-geth/common"
|
|
)
|
|
|
|
type TriePruning struct {
|
|
accountTimestamps map[string]uint64
|
|
accountTimestampsMutex sync.RWMutex
|
|
|
|
// Maps timestamp (uint64) to set of prefixes of nodes (string)
|
|
accounts map[uint64]map[string]struct{}
|
|
accountsMutex sync.RWMutex
|
|
|
|
// For each timestamp, keeps number of branch nodes belonging to it
|
|
generationCounts map[uint64]int
|
|
|
|
// Keeps total number of branch nodes
|
|
nodeCount int
|
|
|
|
// The oldest timestamp of all branch nodes
|
|
oldestGeneration uint64
|
|
|
|
// Current timestamp
|
|
blockNr uint64
|
|
}
|
|
|
|
func NewTriePruning(oldestGeneration uint64) *TriePruning {
|
|
return &TriePruning{
|
|
oldestGeneration: oldestGeneration,
|
|
blockNr: oldestGeneration,
|
|
accountTimestamps: make(map[string]uint64),
|
|
accounts: make(map[uint64]map[string]struct{}),
|
|
generationCounts: make(map[uint64]int),
|
|
}
|
|
}
|
|
|
|
func (tp *TriePruning) SetBlockNr(blockNr uint64) {
|
|
tp.blockNr = blockNr
|
|
}
|
|
|
|
func (tp *TriePruning) BlockNr() uint64 {
|
|
return tp.blockNr
|
|
}
|
|
|
|
// Updates a node to the current timestamp
|
|
// contract is effectively address of the smart contract
|
|
// hex is the prefix of the key
|
|
// parent is the node that needs to be modified to unload the touched node
|
|
// exists is true when the node existed before, and false if it is a new one
|
|
// prevTimestamp is the timestamp the node current has
|
|
func (tp *TriePruning) touch(hexS string, exists bool, prevTimestamp uint64, del bool, newTimestamp uint64) {
|
|
//fmt.Printf("TouchFrom %x, exists: %t, prevTimestamp %d, del %t, newTimestamp %d\n", hex, exists, prevTimestamp, del, newTimestamp)
|
|
if exists && !del && prevTimestamp == newTimestamp {
|
|
return
|
|
}
|
|
if !del {
|
|
tp.accountsMutex.Lock()
|
|
var newMap map[string]struct{}
|
|
if m, ok := tp.accounts[newTimestamp]; ok {
|
|
newMap = m
|
|
} else {
|
|
newMap = make(map[string]struct{})
|
|
tp.accounts[newTimestamp] = newMap
|
|
}
|
|
|
|
newMap[hexS] = struct{}{}
|
|
tp.accountsMutex.Unlock()
|
|
}
|
|
if exists {
|
|
tp.accountsMutex.Lock()
|
|
if m, ok := tp.accounts[prevTimestamp]; ok {
|
|
delete(m, hexS)
|
|
if len(m) == 0 {
|
|
delete(tp.accounts, prevTimestamp)
|
|
}
|
|
}
|
|
tp.accountsMutex.Unlock()
|
|
}
|
|
// Update generation count
|
|
if !del {
|
|
tp.generationCounts[newTimestamp]++
|
|
tp.nodeCount++
|
|
}
|
|
if exists {
|
|
tp.generationCounts[prevTimestamp]--
|
|
if tp.generationCounts[prevTimestamp] == 0 {
|
|
delete(tp.generationCounts, prevTimestamp)
|
|
}
|
|
tp.nodeCount--
|
|
}
|
|
}
|
|
|
|
func (tp *TriePruning) Timestamp(hex []byte) uint64 {
|
|
tp.accountTimestampsMutex.RLock()
|
|
ts := tp.accountTimestamps[string(hex)]
|
|
tp.accountTimestampsMutex.RUnlock()
|
|
return ts
|
|
}
|
|
|
|
// Updates a node to the current timestamp
|
|
// contract is effectively address of the smart contract
|
|
// hex is the prefix of the key
|
|
// parent is the node that needs to be modified to unload the touched node
|
|
func (tp *TriePruning) Touch(hex []byte, del bool) error {
|
|
var exists = false
|
|
var prevTimestamp uint64
|
|
hexS := string(common.CopyBytes(hex))
|
|
|
|
tp.accountTimestampsMutex.Lock()
|
|
if m, ok := tp.accountTimestamps[hexS]; ok {
|
|
prevTimestamp = m
|
|
exists = true
|
|
if del {
|
|
delete(tp.accountTimestamps, hexS)
|
|
}
|
|
}
|
|
if !del {
|
|
tp.accountTimestamps[hexS] = tp.blockNr
|
|
}
|
|
tp.accountTimestampsMutex.Unlock()
|
|
|
|
tp.touch(hexS, exists, prevTimestamp, del, tp.blockNr)
|
|
return nil
|
|
}
|
|
|
|
func pruneMap(t *Trie, m map[string]struct{}, h *hasher) bool {
|
|
hexes := make([]string, len(m))
|
|
i := 0
|
|
for hexS := range m {
|
|
hexes[i] = hexS
|
|
i++
|
|
}
|
|
var empty = false
|
|
sort.Strings(hexes)
|
|
for i, hex := range hexes {
|
|
if i == 0 || len(hex) == 0 || !strings.HasPrefix(hex, hexes[i-1]) { // If the parent nodes are pruned, there is no need to prune descendants
|
|
t.unload([]byte(hex), h)
|
|
if len(hex) == 0 {
|
|
empty = true
|
|
}
|
|
}
|
|
}
|
|
return empty
|
|
}
|
|
|
|
// Prunes all nodes that are older than given timestamp
|
|
func (tp *TriePruning) PruneToTimestamp(
|
|
accountsTrie *Trie,
|
|
targetTimestamp uint64,
|
|
) {
|
|
// Remove (unload) nodes from storage tries and account trie
|
|
aggregateAccounts := make(map[string]struct{})
|
|
for gen := tp.oldestGeneration; gen < targetTimestamp; gen++ {
|
|
tp.nodeCount -= tp.generationCounts[gen]
|
|
tp.accountsMutex.Lock()
|
|
if m, ok := tp.accounts[gen]; ok {
|
|
for hexS := range m {
|
|
aggregateAccounts[hexS] = struct{}{}
|
|
}
|
|
}
|
|
delete(tp.accounts, gen)
|
|
tp.accountsMutex.Unlock()
|
|
}
|
|
h := newHasher(false)
|
|
defer returnHasherToPool(h)
|
|
pruneMap(accountsTrie, aggregateAccounts, h)
|
|
// Remove fom the timestamp structure
|
|
tp.accountTimestampsMutex.Lock()
|
|
for hexS := range aggregateAccounts {
|
|
delete(tp.accountTimestamps, hexS)
|
|
}
|
|
tp.accountTimestampsMutex.Unlock()
|
|
tp.oldestGeneration = targetTimestamp
|
|
}
|
|
|
|
// Prunes mininum number of generations necessary so that the total
|
|
// number of prunable nodes is at most `targetNodeCount`
|
|
func (tp *TriePruning) PruneTo(
|
|
accountsTrie *Trie,
|
|
targetNodeCount int,
|
|
) bool {
|
|
if tp.nodeCount <= targetNodeCount {
|
|
return false
|
|
}
|
|
excess := tp.nodeCount - targetNodeCount
|
|
prunable := 0
|
|
pruneGeneration := tp.oldestGeneration
|
|
for prunable < excess && pruneGeneration < tp.blockNr {
|
|
prunable += tp.generationCounts[pruneGeneration]
|
|
pruneGeneration++
|
|
}
|
|
//fmt.Printf("Will prune to generation %d, nodes to prune: %d, excess %d\n", pruneGeneration, prunable, excess)
|
|
tp.PruneToTimestamp(accountsTrie, pruneGeneration)
|
|
return true
|
|
}
|
|
|
|
func (tp *TriePruning) NodeCount() int {
|
|
return tp.nodeCount
|
|
}
|
|
|
|
func (tp *TriePruning) GenCounts() map[uint64]int {
|
|
return tp.generationCounts
|
|
}
|
|
|
|
// DebugDump is used in the tests to ensure that there are no prunable entries (in such case, this function returns empty string)
|
|
func (tp *TriePruning) DebugDump() string {
|
|
var sb strings.Builder
|
|
for timestamp, m := range tp.accounts {
|
|
for account := range m {
|
|
sb.WriteString(fmt.Sprintf("%d %x\n", timestamp, account))
|
|
}
|
|
}
|
|
return sb.String()
|
|
}
|