mirror of
https://gitlab.com/pulsechaincom/go-pulse.git
synced 2025-01-18 08:08:47 +00:00
59ac229f87
* core/state/snapshot: check dangling storages when generating snapshot * core/state/snapshot: polish * core/state/snapshot: wipe the last part of the dangling storages * core/state/snapshot: fix and add tests * core/state/snapshot: fix comment * README: remove mentions of fast sync (#24656) Co-authored-by: Marius van der Wijden <m.vanderwijden@live.de> * core, cmd: expose dangling storage detector for wider usage * core/state/snapshot: rename variable * core, ethdb: use global iterators for snapshot generation * core/state/snapshot: polish * cmd, core/state/snapshot: polish * core/state/snapshot: polish * Update core/state/snapshot/generate.go Co-authored-by: Martin Holst Swende <martin@swende.se> * ethdb: extend db test suite and fix memorydb iterator * ethdb/dbtest: rollback changes * ethdb/memorydb: simplify iteration * core/state/snapshot: update dangling counter * core/state/snapshot: release iterators * core/state/snapshot: update metrics * core/state/snapshot: update time metrics * metrics/influxdb: temp solution to present counter meaningfully, remove it * add debug log, revert later * core/state/snapshot: fix iterator panic * all: customized snapshot iterator for backward iteration * core, ethdb: polish * core/state/snapshot: remove debug log * core/state/snapshot: address comments from peter * core/state/snapshot: reopen the iterator at the next position * ethdb, core/state/snapshot: address comment from peter * core/state/snapshot: reopen exhausted iterators Co-authored-by: Tbnoapi <63448616+nuoomnoy02@users.noreply.github.com> Co-authored-by: Marius van der Wijden <m.vanderwijden@live.de> Co-authored-by: Martin Holst Swende <martin@swende.se>
242 lines
8.1 KiB
Go
242 lines
8.1 KiB
Go
// Copyright 2022 The go-ethereum Authors
// This file is part of the go-ethereum library.
//
// The go-ethereum library is free software: you can redistribute it and/or modify
// it under the terms of the GNU Lesser General Public License as published by
// the Free Software Foundation, either version 3 of the License, or
// (at your option) any later version.
//
// The go-ethereum library is distributed in the hope that it will be useful,
// but WITHOUT ANY WARRANTY; without even the implied warranty of
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
// GNU Lesser General Public License for more details.
//
// You should have received a copy of the GNU Lesser General Public License
// along with the go-ethereum library. If not, see <http://www.gnu.org/licenses/>.
|
|
|
|
package snapshot
|
|
|
|
import (
|
|
"bytes"
|
|
"encoding/binary"
|
|
"errors"
|
|
"time"
|
|
|
|
"github.com/ethereum/go-ethereum/common"
|
|
"github.com/ethereum/go-ethereum/common/math"
|
|
"github.com/ethereum/go-ethereum/core/rawdb"
|
|
"github.com/ethereum/go-ethereum/ethdb"
|
|
"github.com/ethereum/go-ethereum/ethdb/memorydb"
|
|
"github.com/ethereum/go-ethereum/log"
|
|
)
|
|
|
|
// Identifiers naming the two kinds of snapshot generation.
const (
	// snapAccount is the identifier of account snapshot generation.
	snapAccount = "account"

	// snapStorage is the identifier of storage snapshot generation.
	snapStorage = "storage"
)
|
|
|
|
// generatorStats is a collection of statistics gathered by the snapshot generator
|
|
// for logging purposes.
|
|
type generatorStats struct {
|
|
origin uint64 // Origin prefix where generation started
|
|
start time.Time // Timestamp when generation started
|
|
accounts uint64 // Number of accounts indexed(generated or recovered)
|
|
slots uint64 // Number of storage slots indexed(generated or recovered)
|
|
dangling uint64 // Number of dangling storage slots
|
|
storage common.StorageSize // Total account and storage slot size(generation or recovery)
|
|
}
|
|
|
|
// Log creates an contextual log with the given message and the context pulled
|
|
// from the internally maintained statistics.
|
|
func (gs *generatorStats) Log(msg string, root common.Hash, marker []byte) {
|
|
var ctx []interface{}
|
|
if root != (common.Hash{}) {
|
|
ctx = append(ctx, []interface{}{"root", root}...)
|
|
}
|
|
// Figure out whether we're after or within an account
|
|
switch len(marker) {
|
|
case common.HashLength:
|
|
ctx = append(ctx, []interface{}{"at", common.BytesToHash(marker)}...)
|
|
case 2 * common.HashLength:
|
|
ctx = append(ctx, []interface{}{
|
|
"in", common.BytesToHash(marker[:common.HashLength]),
|
|
"at", common.BytesToHash(marker[common.HashLength:]),
|
|
}...)
|
|
}
|
|
// Add the usual measurements
|
|
ctx = append(ctx, []interface{}{
|
|
"accounts", gs.accounts,
|
|
"slots", gs.slots,
|
|
"storage", gs.storage,
|
|
"dangling", gs.dangling,
|
|
"elapsed", common.PrettyDuration(time.Since(gs.start)),
|
|
}...)
|
|
// Calculate the estimated indexing time based on current stats
|
|
if len(marker) > 0 {
|
|
if done := binary.BigEndian.Uint64(marker[:8]) - gs.origin; done > 0 {
|
|
left := math.MaxUint64 - binary.BigEndian.Uint64(marker[:8])
|
|
|
|
speed := done/uint64(time.Since(gs.start)/time.Millisecond+1) + 1 // +1s to avoid division by zero
|
|
ctx = append(ctx, []interface{}{
|
|
"eta", common.PrettyDuration(time.Duration(left/speed) * time.Millisecond),
|
|
}...)
|
|
}
|
|
}
|
|
log.Info(msg, ctx...)
|
|
}
|
|
|
|
// generatorContext carries a few global values to be shared by all generation functions.
|
|
type generatorContext struct {
|
|
stats *generatorStats // Generation statistic collection
|
|
db ethdb.KeyValueStore // Key-value store containing the snapshot data
|
|
account *holdableIterator // Iterator of account snapshot data
|
|
storage *holdableIterator // Iterator of storage snapshot data
|
|
batch ethdb.Batch // Database batch for writing batch data atomically
|
|
logged time.Time // The timestamp when last generation progress was displayed
|
|
}
|
|
|
|
// newGeneratorContext initializes the context for generation.
|
|
func newGeneratorContext(stats *generatorStats, db ethdb.KeyValueStore, accMarker []byte, storageMarker []byte) *generatorContext {
|
|
ctx := &generatorContext{
|
|
stats: stats,
|
|
db: db,
|
|
batch: db.NewBatch(),
|
|
logged: time.Now(),
|
|
}
|
|
ctx.openIterator(snapAccount, accMarker)
|
|
ctx.openIterator(snapStorage, storageMarker)
|
|
return ctx
|
|
}
|
|
|
|
// openIterator constructs global account and storage snapshot iterators
|
|
// at the interrupted position. These iterators should be reopened from time
|
|
// to time to avoid blocking leveldb compaction for a long time.
|
|
func (ctx *generatorContext) openIterator(kind string, start []byte) {
|
|
if kind == snapAccount {
|
|
iter := ctx.db.NewIterator(rawdb.SnapshotAccountPrefix, start)
|
|
ctx.account = newHoldableIterator(rawdb.NewKeyLengthIterator(iter, 1+common.HashLength))
|
|
return
|
|
}
|
|
iter := ctx.db.NewIterator(rawdb.SnapshotStoragePrefix, start)
|
|
ctx.storage = newHoldableIterator(rawdb.NewKeyLengthIterator(iter, 1+2*common.HashLength))
|
|
}
|
|
|
|
// reopenIterator releases the specified snapshot iterator and re-open it
|
|
// in the next position. It's aimed for not blocking leveldb compaction.
|
|
func (ctx *generatorContext) reopenIterator(kind string) {
|
|
// Shift iterator one more step, so that we can reopen
|
|
// the iterator at the right position.
|
|
var iter = ctx.account
|
|
if kind == snapStorage {
|
|
iter = ctx.storage
|
|
}
|
|
hasNext := iter.Next()
|
|
if !hasNext {
|
|
// Iterator exhausted, release forever and create an already exhausted virtual iterator
|
|
iter.Release()
|
|
if kind == snapAccount {
|
|
ctx.account = newHoldableIterator(memorydb.New().NewIterator(nil, nil))
|
|
return
|
|
}
|
|
ctx.storage = newHoldableIterator(memorydb.New().NewIterator(nil, nil))
|
|
return
|
|
}
|
|
next := iter.Key()
|
|
iter.Release()
|
|
ctx.openIterator(kind, next[1:])
|
|
}
|
|
|
|
// close releases all the held resources.
|
|
func (ctx *generatorContext) close() {
|
|
ctx.account.Release()
|
|
ctx.storage.Release()
|
|
}
|
|
|
|
// iterator returns the corresponding iterator specified by the kind.
|
|
func (ctx *generatorContext) iterator(kind string) *holdableIterator {
|
|
if kind == snapAccount {
|
|
return ctx.account
|
|
}
|
|
return ctx.storage
|
|
}
|
|
|
|
// removeStorageBefore deletes all storage entries which are located before
|
|
// the specified account. When the iterator touches the storage entry which
|
|
// is located in or outside the given account, it stops and holds the current
|
|
// iterated element locally.
|
|
func (ctx *generatorContext) removeStorageBefore(account common.Hash) {
|
|
var (
|
|
count uint64
|
|
start = time.Now()
|
|
iter = ctx.storage
|
|
)
|
|
for iter.Next() {
|
|
key := iter.Key()
|
|
if bytes.Compare(key[1:1+common.HashLength], account.Bytes()) >= 0 {
|
|
iter.Hold()
|
|
break
|
|
}
|
|
count++
|
|
ctx.batch.Delete(key)
|
|
if ctx.batch.ValueSize() > ethdb.IdealBatchSize {
|
|
ctx.batch.Write()
|
|
ctx.batch.Reset()
|
|
}
|
|
}
|
|
ctx.stats.dangling += count
|
|
snapStorageCleanCounter.Inc(time.Since(start).Nanoseconds())
|
|
}
|
|
|
|
// removeStorageAt deletes all storage entries which are located in the specified
|
|
// account. When the iterator touches the storage entry which is outside the given
|
|
// account, it stops and holds the current iterated element locally. An error will
|
|
// be returned if the initial position of iterator is not in the given account.
|
|
func (ctx *generatorContext) removeStorageAt(account common.Hash) error {
|
|
var (
|
|
count int64
|
|
start = time.Now()
|
|
iter = ctx.storage
|
|
)
|
|
for iter.Next() {
|
|
key := iter.Key()
|
|
cmp := bytes.Compare(key[1:1+common.HashLength], account.Bytes())
|
|
if cmp < 0 {
|
|
return errors.New("invalid iterator position")
|
|
}
|
|
if cmp > 0 {
|
|
iter.Hold()
|
|
break
|
|
}
|
|
count++
|
|
ctx.batch.Delete(key)
|
|
if ctx.batch.ValueSize() > ethdb.IdealBatchSize {
|
|
ctx.batch.Write()
|
|
ctx.batch.Reset()
|
|
}
|
|
}
|
|
snapWipedStorageMeter.Mark(count)
|
|
snapStorageCleanCounter.Inc(time.Since(start).Nanoseconds())
|
|
return nil
|
|
}
|
|
|
|
// removeStorageLeft deletes all storage entries which are located after
|
|
// the current iterator position.
|
|
func (ctx *generatorContext) removeStorageLeft() {
|
|
var (
|
|
count uint64
|
|
start = time.Now()
|
|
iter = ctx.storage
|
|
)
|
|
for iter.Next() {
|
|
count++
|
|
ctx.batch.Delete(iter.Key())
|
|
if ctx.batch.ValueSize() > ethdb.IdealBatchSize {
|
|
ctx.batch.Write()
|
|
ctx.batch.Reset()
|
|
}
|
|
}
|
|
ctx.stats.dangling += count
|
|
snapDanglingStorageMeter.Mark(int64(count))
|
|
snapStorageCleanCounter.Inc(time.Since(start).Nanoseconds())
|
|
}
|