erigon-pulse/cmd/integration/commands/refetence_db.go

461 lines
9.8 KiB
Go
Raw Normal View History

2020-07-14 01:56:29 +00:00
package commands
import (
2020-10-28 03:18:10 +00:00
"bufio"
"bytes"
"context"
"fmt"
2020-10-28 03:18:10 +00:00
"os"
"strings"
"time"
"github.com/ledgerwatch/lmdb-go/lmdb"
2020-10-28 03:18:10 +00:00
"github.com/ledgerwatch/turbo-geth/cmd/utils"
"github.com/ledgerwatch/turbo-geth/common"
"github.com/ledgerwatch/turbo-geth/common/dbutils"
"github.com/ledgerwatch/turbo-geth/ethdb"
"github.com/ledgerwatch/turbo-geth/ethdb/mdbx"
"github.com/ledgerwatch/turbo-geth/log"
"github.com/spf13/cobra"
)
2020-08-10 23:55:32 +00:00
var stateBuckets = []string{
dbutils.CurrentStateBucket,
dbutils.AccountChangeSetBucket,
dbutils.StorageChangeSetBucket,
dbutils.ContractCodeBucket,
dbutils.PlainStateBucket,
dbutils.PlainAccountChangeSetBucket,
dbutils.PlainStorageChangeSetBucket,
dbutils.PlainContractCodeBucket,
dbutils.IncarnationMapBucket,
dbutils.CodeBucket,
dbutils.IntermediateTrieHashBucket,
dbutils.AccountsHistoryBucket,
dbutils.StorageHistoryBucket,
dbutils.TxLookupPrefix,
}
var cmdCompareBucket = &cobra.Command{
Use: "compare_bucket",
Short: "compare bucket to the same bucket in '--reference_chaindata'",
RunE: func(cmd *cobra.Command, args []string) error {
ctx := utils.RootContext()
if referenceChaindata == "" {
referenceChaindata = chaindata + "-copy"
}
err := compareBucketBetweenDatabases(ctx, chaindata, referenceChaindata, bucket)
if err != nil {
log.Error(err.Error())
return err
}
return nil
},
}
var cmdCompareStates = &cobra.Command{
Use: "compare_states",
Short: "compare state buckets to buckets in '--reference_chaindata'",
RunE: func(cmd *cobra.Command, args []string) error {
ctx := utils.RootContext()
if referenceChaindata == "" {
referenceChaindata = chaindata + "-copy"
}
err := compareStates(ctx, chaindata, referenceChaindata)
if err != nil {
log.Error(err.Error())
return err
}
return nil
},
}
2020-10-28 03:18:10 +00:00
var cmdToMdbx = &cobra.Command{
Use: "to_mdbx",
Short: "copy data from '--chaindata' to '--reference_chaindata'",
RunE: func(cmd *cobra.Command, args []string) error {
ctx := utils.RootContext()
err := toMdbx(ctx, chaindata, toChaindata)
if err != nil {
log.Error(err.Error())
return err
}
return nil
},
}
var cmdFToMdbx = &cobra.Command{
Use: "f_to_mdbx",
Short: "copy data from '--chaindata' to '--reference_chaindata'",
RunE: func(cmd *cobra.Command, args []string) error {
ctx := utils.RootContext()
err := fToMdbx(ctx, toChaindata)
if err != nil {
log.Error(err.Error())
return err
}
return nil
},
}
func init() {
withChaindata(cmdCompareBucket)
withReferenceChaindata(cmdCompareBucket)
withBucket(cmdCompareBucket)
rootCmd.AddCommand(cmdCompareBucket)
withChaindata(cmdCompareStates)
withReferenceChaindata(cmdCompareStates)
withBucket(cmdCompareStates)
rootCmd.AddCommand(cmdCompareStates)
2020-10-28 03:18:10 +00:00
withChaindata(cmdToMdbx)
withToChaindata(cmdToMdbx)
withBucket(cmdToMdbx)
rootCmd.AddCommand(cmdToMdbx)
withToChaindata(cmdFToMdbx)
withFile(cmdFToMdbx)
2020-10-28 03:18:10 +00:00
withBucket(cmdFToMdbx)
rootCmd.AddCommand(cmdFToMdbx)
}
func compareStates(ctx context.Context, chaindata string, referenceChaindata string) error {
db := ethdb.MustOpen(chaindata)
defer db.Close()
refDB := ethdb.MustOpen(referenceChaindata)
defer refDB.Close()
if err := db.KV().View(context.Background(), func(tx ethdb.Tx) error {
if err := refDB.KV().View(context.Background(), func(refTX ethdb.Tx) error {
for _, bucket := range stateBuckets {
fmt.Printf("\nBucket: %s\n", bucket)
if err := compareBuckets(ctx, tx, bucket, refTX, bucket); err != nil {
return err
}
}
return nil
}); err != nil {
return err
}
return nil
}); err != nil {
return err
}
return nil
}
func compareBucketBetweenDatabases(ctx context.Context, chaindata string, referenceChaindata string, bucket string) error {
db := ethdb.MustOpen(chaindata)
defer db.Close()
refDB := ethdb.MustOpen(referenceChaindata)
defer refDB.Close()
if err := db.KV().View(context.Background(), func(tx ethdb.Tx) error {
return refDB.KV().View(context.Background(), func(refTX ethdb.Tx) error {
return compareBuckets(ctx, tx, bucket, refTX, bucket)
})
}); err != nil {
return err
}
return nil
}
func compareBuckets(ctx context.Context, tx ethdb.Tx, b string, refTx ethdb.Tx, refB string) error {
count := 0
c := tx.Cursor(b)
k, v, e := c.First()
if e != nil {
return e
}
refC := refTx.Cursor(refB)
refK, refV, revErr := refC.First()
if revErr != nil {
return revErr
}
for k != nil || refK != nil {
count++
if count%10_000_000 == 0 {
select {
case <-ctx.Done():
return ctx.Err()
default:
}
fmt.Printf("Compared %d records\n", count)
}
if k == nil {
fmt.Printf("Missing in db: %x [%x]\n", refK, refV)
refK, refV, revErr = refC.Next()
if revErr != nil {
return revErr
}
} else if refK == nil {
fmt.Printf("Missing refDB: %x [%x]\n", k, v)
k, v, e = c.Next()
if e != nil {
return e
}
} else {
switch bytes.Compare(k, refK) {
case -1:
fmt.Printf("Missing refDB: %x [%x]\n", k, v)
k, v, e = c.Next()
if e != nil {
return e
}
case 1:
fmt.Printf("Missing in db: %x [%x]\n", refK, refV)
refK, refV, revErr = refC.Next()
if revErr != nil {
return revErr
}
case 0:
if !bytes.Equal(v, refV) {
fmt.Printf("Different values for %x. db: [%x], refDB: [%x]\n", k, v, refV)
}
k, v, e = c.Next()
if e != nil {
return e
}
refK, refV, revErr = refC.Next()
if revErr != nil {
return revErr
}
default:
fmt.Printf("Unexpected result of bytes.Compare: %d\n", bytes.Compare(k, refK))
}
}
}
return nil
}
2020-10-28 03:18:10 +00:00
func fToMdbx(ctx context.Context, to string) error {
file, err := os.Open(file)
2020-10-28 03:18:10 +00:00
if err != nil {
panic(err)
2020-10-28 03:18:10 +00:00
}
defer file.Close()
dst := ethdb.NewMDBX().Path(to).MustOpen()
dstTx, err1 := dst.Begin(ctx, nil, ethdb.RW)
if err1 != nil {
return err1
}
defer func() {
dstTx.Rollback()
}()
commitEvery := time.NewTicker(30 * time.Second)
2020-10-28 03:18:10 +00:00
defer commitEvery.Stop()
fileScanner := bufio.NewScanner(file)
endData := []byte("DATA=END")
endHeader := []byte("HEADER=END")
MainLoop:
for {
bucket := ""
for { // header
if !fileScanner.Scan() {
break
}
kk := fileScanner.Bytes()
if bytes.Equal(kk, endHeader) {
break
}
parts := strings.Split(string(kk), "=")
k, v := parts[0], parts[1]
if k == "database" {
bucket = v
}
}
err = fileScanner.Err()
if err != nil {
panic(err)
}
err = fileScanner.Err()
if err != nil {
panic(err)
}
if bucket == "" {
panic("bucket not parse")
2020-10-28 03:18:10 +00:00
}
c := dstTx.Cursor(bucket)
var prevK []byte
for {
if !fileScanner.Scan() {
break MainLoop
}
k := common.CopyBytes(fileScanner.Bytes())
if bytes.Equal(k, endData) {
break
}
k = common.FromHex(string(k[1:]))
if !fileScanner.Scan() {
break MainLoop
}
v := common.CopyBytes(fileScanner.Bytes())
v = common.FromHex(string(v[1:]))
if casted, ok := c.(ethdb.CursorDupSort); ok {
if bytes.Equal(k, prevK) {
if err = casted.AppendDup(k, v); err != nil {
panic(err)
}
} else {
if err = casted.Append(k, v); err != nil {
panic(err)
}
}
prevK = k
} else {
if err = c.Append(k, v); err != nil {
panic(err)
}
}
select {
default:
case <-ctx.Done():
return ctx.Err()
case <-commitEvery.C:
log.Info("Progress", "bucket", bucket, "key", fmt.Sprintf("%x", k))
//if err2 := dstTx.Commit(ctx); err2 != nil {
// return err2
//}
//dstTx, err = dst.Begin(ctx, nil, ethdb.RW)
//if err != nil {
// return err
//}
//c = dstTx.Cursor(bucket)
}
2020-10-28 03:18:10 +00:00
}
prevK = nil
err = fileScanner.Err()
if err != nil {
panic(err)
}
}
err = dstTx.Commit(context.Background())
if err != nil {
return err
2020-10-28 03:18:10 +00:00
}
dstTx, err = dst.Begin(ctx, nil, ethdb.RW)
2020-10-28 03:18:10 +00:00
if err != nil {
return err
2020-10-28 03:18:10 +00:00
}
err = dstTx.Commit(ctx)
2020-10-28 03:18:10 +00:00
if err != nil {
return err
}
return nil
}
func toMdbx(ctx context.Context, from, to string) error {
_ = os.RemoveAll(to)
src := ethdb.NewLMDB().Path(from).Flags(func(flags uint) uint {
return (flags | lmdb.Readonly) ^ lmdb.NoReadahead
}).MustOpen()
dst := ethdb.NewMDBX().Path(to).Flags(func(flags uint) uint {
return flags | mdbx.WriteMap | mdbx.NoMemInit
}).MustOpen()
2020-10-28 03:18:10 +00:00
srcTx, err1 := src.Begin(ctx, nil, ethdb.RO)
if err1 != nil {
return err1
}
defer srcTx.Rollback()
dstTx, err1 := dst.Begin(ctx, nil, ethdb.RW)
2020-10-28 03:18:10 +00:00
if err1 != nil {
return err1
}
defer func() {
dstTx.Rollback()
}()
commitEvery := time.NewTicker(60 * time.Second)
2020-10-28 03:18:10 +00:00
defer commitEvery.Stop()
for name, b := range src.AllBuckets() {
2020-10-28 03:18:10 +00:00
if b.IsDeprecated {
continue
}
c := dstTx.Cursor(name)
srcC := srcTx.Cursor(name)
var prevK []byte
2020-10-28 03:18:10 +00:00
for k, v, err := srcC.First(); k != nil; k, v, err = srcC.Next() {
if err != nil {
return err
}
if casted, ok := c.(ethdb.CursorDupSort); ok {
if bytes.Equal(k, prevK) {
if err = casted.AppendDup(k, v); err != nil {
return err
}
} else {
if err = casted.Append(k, v); err != nil {
return err
}
}
prevK = k
} else {
if err = c.Append(k, v); err != nil {
return err
}
2020-10-28 03:18:10 +00:00
}
select {
default:
case <-ctx.Done():
return ctx.Err()
2020-10-28 03:18:10 +00:00
case <-commitEvery.C:
log.Info("Progress", "bucket", name, "key", fmt.Sprintf("%x", k))
2020-10-28 03:18:10 +00:00
if err2 := dstTx.Commit(ctx); err2 != nil {
return err2
}
dstTx, err = dst.Begin(ctx, nil, ethdb.RW)
2020-10-28 03:18:10 +00:00
if err != nil {
return err
}
c = dstTx.Cursor(name)
}
}
prevK = nil
2020-11-23 04:15:43 +00:00
// migrate bucket sequences to native mdbx implementation
currentID, err := srcTx.Sequence(name, 0)
if err != nil {
return err
}
2020-11-23 04:18:21 +00:00
_, err = dstTx.Sequence(name, currentID)
2020-11-23 04:15:43 +00:00
if err != nil {
return err
}
2020-10-28 03:18:10 +00:00
}
err := dstTx.Commit(context.Background())
if err != nil {
return err
}
dstTx, err = dst.Begin(ctx, nil, ethdb.RW)
if err != nil {
return err
}
err = dstTx.Commit(ctx)
if err != nil {
return err
}
2020-10-28 03:18:10 +00:00
srcTx.Rollback()
return nil
}