erigon-pulse/cmd/state/stateless/state_snapshot.go

346 lines
8.8 KiB
Go
Raw Normal View History

package stateless
import (
"bytes"
"context"
"encoding/binary"
"fmt"
"time"
"github.com/ledgerwatch/turbo-geth/common"
"github.com/ledgerwatch/turbo-geth/common/dbutils"
"github.com/ledgerwatch/turbo-geth/core/rawdb"
"github.com/ledgerwatch/turbo-geth/core/types/accounts"
"github.com/ledgerwatch/turbo-geth/ethdb"
"github.com/ledgerwatch/turbo-geth/migrations"
"github.com/ledgerwatch/turbo-geth/turbo/trie"
)
// NOTE: This file is not the part of the Turbo-Geth binary. It i s part of the experimental utility, state
// to perform data analysis related to the state growth, state rent, and statelesss clients
type bucketWriter struct {
db ethdb.Database
2020-08-10 23:55:32 +00:00
bucket string
pending ethdb.DbWithPendingMutations
written uint64
}
func (bw *bucketWriter) printStats() {
if bw.written == 0 {
fmt.Printf(" -- nothing to copy for bucket: '%s'...", string(bw.bucket))
} else {
fmt.Printf("\r -- commited %d records for bucket: '%s'...", bw.written, string(bw.bucket))
}
}
func (bw *bucketWriter) walker(k, v []byte) (bool, error) {
if bw.pending == nil {
bw.pending = bw.db.NewBatch()
}
if err := bw.pending.Put(bw.bucket, common.CopyBytes(k), common.CopyBytes(v)); err != nil {
return false, err
}
bw.written++
if bw.pending.BatchSize() >= 100000 {
if _, err := bw.pending.Commit(); err != nil {
return false, err
}
bw.printStats()
bw.pending = bw.db.NewBatch()
}
return true, nil
}
func (bw *bucketWriter) commit() error {
defer bw.printStats()
if bw.pending != nil {
_, err := bw.pending.Commit()
return err
}
return nil
}
2020-08-10 23:55:32 +00:00
func newBucketWriter(db ethdb.Database, bucket string) *bucketWriter {
return &bucketWriter{
db: db,
bucket: bucket,
pending: nil,
written: 0,
}
}
func copyDatabase(fromDB ethdb.Database, toDB ethdb.Database) error {
2020-08-10 23:55:32 +00:00
for _, bucket := range []string{dbutils.CurrentStateBucket, dbutils.CodeBucket, dbutils.DatabaseInfoBucket} {
fmt.Printf(" - copying bucket '%s'...\n", string(bucket))
writer := newBucketWriter(toDB, bucket)
if err := fromDB.Walk(bucket, nil, 0, writer.walker); err != nil {
fmt.Println("FAIL")
return err
}
if err := writer.commit(); err != nil {
fmt.Println("FAIL")
return err
}
fmt.Println("OK")
}
return nil
}
func saveSnapshot(db ethdb.Database, filename string, createDb CreateDbFunc) {
fmt.Printf("Saving snapshot to %s\n", filename)
diskDb, err := createDb(filename)
check(err)
defer diskDb.Close()
err = copyDatabase(db, diskDb)
check(err)
}
func loadSnapshot(db ethdb.Database, filename string, createDb CreateDbFunc) {
fmt.Printf("Loading snapshot from %s\n", filename)
diskDb, err := createDb(filename)
check(err)
defer diskDb.Close()
err = copyDatabase(diskDb, db)
check(err)
err = migrations.NewMigrator().Apply(diskDb, "")
check(err)
}
//nolint
func loadCodes(db ethdb.KV, codeDb ethdb.Database) error {
var account accounts.Account
err := db.Update(context.Background(), func(tx ethdb.Tx) error {
c := tx.Cursor(dbutils.CurrentStateBucket)
cb := tx.Cursor(dbutils.CodeBucket)
for k, v, err := c.First(); k != nil; k, v, err = c.Next() {
if err != nil {
return err
}
if len(k) != 32 {
continue
}
if err := account.DecodeForStorage(v); err != nil {
return err
}
if !account.IsEmptyCodeHash() {
code, _ := codeDb.Get(dbutils.CodeBucket, account.CodeHash[:])
if code != nil {
if err := cb.Put(account.CodeHash[:], code); err != nil {
return err
}
}
}
}
return nil
})
return err
}
//nolint
func compare_snapshot(stateDb ethdb.Database, db ethdb.KV, filename string) {
fmt.Printf("Loading snapshot from %s\n", filename)
diskDb := ethdb.MustOpen(filename)
defer diskDb.Close()
if err := db.View(context.Background(), func(tx ethdb.Tx) error {
c := tx.Cursor(dbutils.CurrentStateBucket)
preimage := tx.Cursor(dbutils.PreimagePrefix)
count := 0
if err := diskDb.KV().View(context.Background(), func(txDisk ethdb.Tx) error {
cDisk := txDisk.Cursor(dbutils.CurrentStateBucket)
for k, v, err := cDisk.First(); k != nil; k, v, err = cDisk.Next() {
if err != nil {
return err
}
if len(k) != 32 {
continue
}
vv, err := c.SeekExact(k)
if err != nil {
return err
}
p, err := preimage.SeekExact(k)
if err != nil {
return err
}
if !bytes.Equal(v, vv) {
fmt.Printf("Diff for %x (%x): disk: %x, mem: %x\n", k, p, v, vv)
}
count++
if count%100000 == 0 {
fmt.Printf("Compared %d records\n", count)
}
}
count = 0
cDisk = txDisk.Cursor(dbutils.CurrentStateBucket)
for k, v, err := cDisk.First(); k != nil; k, v, err = cDisk.Next() {
if err != nil {
return err
}
if len(k) == 32 {
continue
}
vv, err := c.SeekExact(k)
if err != nil {
return err
}
if !bytes.Equal(v, vv) {
fmt.Printf("Diff for %x: disk: %x, mem: %x\n", k, v, vv)
}
count++
if count%100000 == 0 {
fmt.Printf("Committed %d records\n", count)
}
}
count = 0
c := tx.Cursor(dbutils.CurrentStateBucket)
for k, v, err := c.First(); k != nil; k, v, err = c.Next() {
if err != nil {
return err
}
if len(k) != 32 {
continue
}
vv, err := cDisk.SeekExact(k)
if err != nil {
return err
}
p, err := preimage.SeekExact(k)
if err != nil {
return err
}
if len(vv) == 0 {
fmt.Printf("Diff for %x (%x): disk: %x, mem: %x\n", k, p, vv, v)
}
count++
if count%100000 == 0 {
fmt.Printf("Compared %d records\n", count)
}
}
c = tx.Cursor(dbutils.CurrentStateBucket)
for k, v, err := c.First(); k != nil; k, v, err = c.Next() {
if err != nil {
return err
}
if len(k) == 32 {
continue
}
vv, err := cDisk.SeekExact(k)
if err != nil {
return err
}
p, err := preimage.SeekExact(k)
if err != nil {
return err
}
if len(vv) == 0 {
fmt.Printf("Diff for %x (%x): disk: %x, mem: %x\n", k, p, vv, v)
}
count++
if count%100000 == 0 {
fmt.Printf("Compared %d records\n", count)
}
}
return nil
}); err != nil {
return err
}
return nil
}); err != nil {
panic(err)
}
}
func checkRoots(stateDb ethdb.Database, rootHash common.Hash, blockNum uint64) {
startTime := time.Now()
if blockNum > 0 {
l := trie.NewSubTrieLoader(blockNum)
fmt.Printf("new resolve request for root block with hash %x\n", rootHash)
rl := trie.NewRetainList(0)
subTries, err := l.LoadSubTries(stateDb, blockNum, rl, nil /* HashCollector */, [][]byte{nil}, []int{0}, false)
if err != nil {
fmt.Printf("%v\n", err)
}
if subTries.Hashes[0] != rootHash {
fmt.Printf("State root hash mismatch, got %x, expected %x\n", subTries.Hashes[0], rootHash)
}
fmt.Printf("Trie computation took %v\n", time.Since(startTime))
} else {
fmt.Printf("block number is unknown, account trie verification skipped\n")
}
startTime = time.Now()
roots := make(map[common.Hash]*accounts.Account)
incarnationMap := make(map[uint64]int)
if err := stateDb.Walk(dbutils.CurrentStateBucket, nil, 0, func(k, v []byte) (bool, error) {
var addrHash common.Hash
copy(addrHash[:], k[:32])
if _, ok := roots[addrHash]; !ok {
account := &accounts.Account{}
if ok, err := rawdb.ReadAccount(stateDb, addrHash, account); err != nil {
return false, err
} else if !ok {
roots[addrHash] = nil
} else {
roots[addrHash] = account
incarnationMap[account.Incarnation]++
}
}
return true, nil
}); err != nil {
panic(err)
}
fmt.Printf("Incarnation map: %v\n", incarnationMap)
Merge account and storage resolvers (#504) * add_incarnation_to_acc_root_in_ih * merge cached resolver into stateful resolver * - move account root set to "post iteration" of resolver - rename "cache" to IntermediateHash * remove blockNR and bucket params from walker * fix out of range panic * calc acc.Root on the fly * remove fieldSet field from resolver, make logic of root - lazy * remove 2 parameters * working version of forward-only walk over Acc and Storage * improve test * rebase master * save progress - more tests for PrepareResolveParams, add dedicated ResolveSet for storage. Problem: See duplicates in ResolveSet hexes. Next test failing: oracle_test.go * skip old incarnations * don't rebuild when 0 requests * fix tests * start from account key when need resolve storage * Error: stateless prototype faced hashNode when extracting witness * Statless works: copy touches * Remove getAccRoot function * Remove "isAccount" parameter from resolver signature * Fix: use correct storageResolveSet in finaliseStorageRoot * Fix: when startKey changed - reset storage buffers also * Fix: if account incarnation=0 - set EmptyRoot * Fix: remove account roots by default from IntermediateHash bucket * Fix: skip abandoned storage - which appeared just after startKey * Fix: did reset acc key incorrectly * Fix: clean previous key if receive IH * Fix: IH observer - subscribe only to branch nodes (was subscribed to value nodes also) * Add DISABLE_IH and STORE_ACCOUNT_ROOT env variables for tests * Remove accNode from IH cycle * Fix flags * Fix: reset succStorage also * Fix: skip IH if it has wrong incarnation * Fix: skip IH if it has wrong incarnation * Fix: skip IH if it has wrong incarnation * Fix: use rssStorage to HashOnly check * Fix: remove termination symbol from resolveRequest * cleanup * Fix: skip abandoned storage after IH * Debug This reverts commit 9c5eb69465f25607d546b03359b2cbcb1bd46689. * Fix linters * add_incarnation_to_acc_root_in_ih * merge cached resolver into stateful resolver * - move account root set to "post iteration" of resolver - rename "cache" to IntermediateHash * remove blockNR and bucket params from walker * fix out of range panic * calc acc.Root on the fly * remove fieldSet field from resolver, make logic of root - lazy * remove 2 parameters * working version of forward-only walk over Acc and Storage * improve test * rebase master * save progress - more tests for PrepareResolveParams, add dedicated ResolveSet for storage. Problem: See duplicates in ResolveSet hexes. Next test failing: oracle_test.go * skip old incarnations * don't rebuild when 0 requests * fix tests * start from account key when need resolve storage * Error: stateless prototype faced hashNode when extracting witness * Statless works: copy touches * Remove getAccRoot function * Remove "isAccount" parameter from resolver signature * Fix: use correct storageResolveSet in finaliseStorageRoot * Fix: when startKey changed - reset storage buffers also * Fix: if account incarnation=0 - set EmptyRoot * Fix: remove account roots by default from IntermediateHash bucket * Fix: skip abandoned storage - which appeared just after startKey * Fix: did reset acc key incorrectly * Fix: clean previous key if receive IH * Fix: IH observer - subscribe only to branch nodes (was subscribed to value nodes also) * Add DISABLE_IH and STORE_ACCOUNT_ROOT env variables for tests * Remove accNode from IH cycle * Fix flags * Fix: reset succStorage also * Fix: skip IH if it has wrong incarnation * Fix: skip IH if it has wrong incarnation * Fix: skip IH if it has wrong incarnation * Fix: use rssStorage to HashOnly check * Fix: remove termination symbol from resolveRequest * cleanup * Fix: skip abandoned storage after IH * remove inc * remove inc from rss * tr.succStorage.Reset() * remove inc from rss * Remove hard-coding * succ.Reset * Enable CalcTrieRoots * Proper dumping of the trie * Debug * Fix for CalcTrieRoot * Fix another inteference bug * Temp * Fix test * Cleanup * remove STORE_ACCOUNT_ROOT=true flag * Fix linter * Fix linter * Disable getnodedata by default * Fix test * Fix test Co-authored-by: Alexey Akhunov <akhounov@gmail.com>
2020-05-02 18:00:57 +00:00
for addrHash, account := range roots {
if account != nil {
sl := trie.NewSubTrieLoader(blockNum)
contractPrefix := make([]byte, common.HashLength+common.IncarnationLength)
copy(contractPrefix, addrHash[:])
binary.BigEndian.PutUint64(contractPrefix[common.HashLength:], account.Incarnation)
rl := trie.NewRetainList(0)
subTries, err := sl.LoadSubTries(stateDb, blockNum, rl, nil /* HashCollector */, [][]byte{contractPrefix}, []int{8 * len(contractPrefix)}, false)
if err != nil {
fmt.Printf("%x: %v\n", addrHash, err)
fmt.Printf("incarnation: %d, account.Root: %x\n", account.Incarnation, account.Root)
}
if subTries.Hashes[0] != account.Root {
fmt.Printf("Storage root hash mismatch for %x, got %x, expected %x\n", addrHash, subTries.Hashes[0], account.Root)
}
}
}
fmt.Printf("Storage trie computation took %v\n", time.Since(startTime))
}
func VerifySnapshot(path string) {
ethDb := ethdb.MustOpen(path)
defer ethDb.Close()
hash := rawdb.ReadHeadBlockHash(ethDb)
number := rawdb.ReadHeaderNumber(ethDb, hash)
var currentBlockNr uint64
var preRoot common.Hash
if number != nil {
header := rawdb.ReadHeader(ethDb, hash, *number)
currentBlockNr = *number
preRoot = header.Root
}
fmt.Printf("Block number: %d\n", currentBlockNr)
fmt.Printf("Block root hash: %x\n", preRoot)
checkRoots(ethDb, preRoot, currentBlockNr)
}