erigon-pulse/cmd/evm/staterunner.go
Martin Holst Swende c042afb4af
cmd/evm: support batched statetest-mode (#7598)
This implements batched state-test exectution, similar to
https://github.com/ethereum/go-ethereum/pull/27318 .
Some speedtests, executing a state-test twice on current master takes
~4-5 seconds, and scales linerarly.
```
Doing 2 execs old style

real    0m8.185s
user    0m8.081s
sys     0m0.110s
```
Doing `100` executions on this PR -- a few seconds of ramp-up time, but
very quick execution after that :
```
Doing 100 execs v2

real    0m5.009s
user    0m4.560s
sys     0m0.508s
```
I also tested a version where I moved the db instantiation into the top
callsite, with the `MustOpen` and `.Close` only performed once, instead
of `100` times -- however, I noticed no additional speed gains from
doing so (my branch `batched_evm_v2`).

Therefore, I suspect that the slowdowns comes not from the db, but the
kzg library initialization.
2023-05-29 18:28:24 +07:00

174 lines
5.2 KiB
Go

// Copyright 2017 The go-ethereum Authors
// This file is part of go-ethereum.
//
// go-ethereum is free software: you can redistribute it and/or modify
// it under the terms of the GNU General Public License as published by
// the Free Software Foundation, either version 3 of the License, or
// (at your option) any later version.
//
// go-ethereum is distributed in the hope that it will be useful,
// but WITHOUT ANY WARRANTY; without even the implied warranty of
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
// GNU General Public License for more details.
//
// You should have received a copy of the GNU General Public License
// along with go-ethereum. If not, see <http://www.gnu.org/licenses/>.
package main
import (
"bufio"
"context"
"encoding/json"
"fmt"
"os"
"path/filepath"
"github.com/c2h5oh/datasize"
libcommon "github.com/ledgerwatch/erigon-lib/common"
"github.com/ledgerwatch/erigon-lib/kv/mdbx"
"github.com/ledgerwatch/log/v3"
mdbx2 "github.com/torquem-ch/mdbx-go/mdbx"
"github.com/urfave/cli/v2"
"github.com/ledgerwatch/erigon/core/state"
"github.com/ledgerwatch/erigon/core/vm"
"github.com/ledgerwatch/erigon/eth/tracers/logger"
"github.com/ledgerwatch/erigon/tests"
"github.com/ledgerwatch/erigon/turbo/trie"
)
var stateTestCommand = cli.Command{
Action: stateTestCmd,
Name: "statetest",
Usage: "executes the given state tests",
ArgsUsage: "<file>",
}
// StatetestResult contains the execution status after running a state test, any
// error that might have occurred and a dump of the final state if requested.
type StatetestResult struct {
Name string `json:"name"`
Pass bool `json:"pass"`
Root *libcommon.Hash `json:"stateRoot,omitempty"`
Fork string `json:"fork"`
Error string `json:"error,omitempty"`
State *state.Dump `json:"state,omitempty"`
}
func stateTestCmd(ctx *cli.Context) error {
// Configure the go-ethereum logger
log.Root().SetHandler(log.LvlFilterHandler(log.LvlDebug, log.StderrHandler))
// Configure the EVM logger
config := &logger.LogConfig{
DisableMemory: ctx.Bool(DisableMemoryFlag.Name),
DisableStack: ctx.Bool(DisableStackFlag.Name),
DisableStorage: ctx.Bool(DisableStorageFlag.Name),
DisableReturnData: ctx.Bool(DisableReturnDataFlag.Name),
}
cfg := vm.Config{
Debug: ctx.Bool(DebugFlag.Name) || ctx.Bool(MachineFlag.Name),
}
if ctx.Bool(MachineFlag.Name) {
cfg.Tracer = logger.NewJSONLogger(config, os.Stderr)
} else if ctx.Bool(DebugFlag.Name) {
cfg.Tracer = logger.NewStructLogger(config)
}
if len(ctx.Args().First()) != 0 {
return runStateTest(ctx.Args().First(), cfg, ctx.Bool(MachineFlag.Name))
}
scanner := bufio.NewScanner(os.Stdin)
for scanner.Scan() {
fname := scanner.Text()
if len(fname) == 0 {
return nil
}
if err := runStateTest(fname, cfg, ctx.Bool(MachineFlag.Name)); err != nil {
return err
}
}
return nil
}
// runStateTest loads the state-test given by fname, and executes the test.
func runStateTest(fname string, cfg vm.Config, jsonOut bool) error {
// Load the test content from the input file
src, err := os.ReadFile(fname)
if err != nil {
return err
}
var stateTests map[string]tests.StateTest
if err = json.Unmarshal(src, &stateTests); err != nil {
return err
}
// Iterate over all the stateTests, run them and aggregate the results
results, err := aggregateResultsFromStateTests(stateTests, cfg, jsonOut)
if err != nil {
return err
}
out, _ := json.MarshalIndent(results, "", " ")
fmt.Println(string(out))
return nil
}
func aggregateResultsFromStateTests(
stateTests map[string]tests.StateTest, cfg vm.Config,
jsonOut bool) ([]StatetestResult, error) {
//this DB is shared. means:
// - faster sequential tests: don't need create/delete db
// - less parallelism: multiple processes can open same DB but only 1 can create rw-transaction (other will wait when 1-st finish)
db := mdbx.NewMDBX(log.New()).
Path(filepath.Join(os.TempDir(), "erigon-statetest")).
Flags(func(u uint) uint {
return u | mdbx2.UtterlyNoSync | mdbx2.NoMetaSync | mdbx2.LifoReclaim | mdbx2.NoMemInit
}).
GrowthStep(1 * datasize.MB).
MustOpen()
defer db.Close()
tx, txErr := db.BeginRw(context.Background())
if txErr != nil {
return nil, txErr
}
defer tx.Rollback()
results := make([]StatetestResult, 0, len(stateTests))
for key, test := range stateTests {
for _, st := range test.Subtests() {
// Run the test and aggregate the result
result := &StatetestResult{Name: key, Fork: st.Fork, Pass: true}
var root libcommon.Hash
var calcRootErr error
statedb, err := test.Run(tx, st, cfg)
// print state root for evmlab tracing
root, calcRootErr = trie.CalcRoot("", tx)
if err == nil && calcRootErr != nil {
err = calcRootErr
}
if err != nil {
// Test failed, mark as so and dump any state to aid debugging
result.Pass, result.Error = false, err.Error()
}
// print state root for evmlab tracing
if statedb != nil {
result.Root = &root
if jsonOut {
_, printErr := fmt.Fprintf(os.Stderr, "{\"stateRoot\": \"%#x\"}\n", root.Bytes())
if printErr != nil {
log.Warn("Failed to write to stderr", "err", printErr)
}
}
}
results = append(results, *result)
}
}
return results, nil
}