2020-04-20 10:35:33 +00:00
|
|
|
package core
|
|
|
|
|
|
|
|
import (
|
2020-05-23 09:19:56 +00:00
|
|
|
"encoding/binary"
|
|
|
|
"errors"
|
2020-05-31 06:57:47 +00:00
|
|
|
"fmt"
|
2020-06-16 13:36:16 +00:00
|
|
|
"os"
|
|
|
|
"time"
|
|
|
|
|
2020-04-20 10:35:33 +00:00
|
|
|
"github.com/ledgerwatch/turbo-geth/common"
|
2020-06-10 20:07:14 +00:00
|
|
|
"github.com/ledgerwatch/turbo-geth/common/changeset"
|
2020-04-20 10:35:33 +00:00
|
|
|
"github.com/ledgerwatch/turbo-geth/common/dbutils"
|
2020-06-10 20:07:14 +00:00
|
|
|
"github.com/ledgerwatch/turbo-geth/common/etl"
|
2020-04-20 10:35:33 +00:00
|
|
|
"github.com/ledgerwatch/turbo-geth/ethdb"
|
|
|
|
"github.com/ledgerwatch/turbo-geth/log"
|
|
|
|
)
|
|
|
|
|
2020-07-07 04:00:25 +00:00
|
|
|
func NewIndexGenerator(db ethdb.Database, quitCh <-chan struct{}) *IndexGenerator {
|
2020-04-20 10:35:33 +00:00
|
|
|
return &IndexGenerator{
|
2020-05-31 06:57:47 +00:00
|
|
|
db: db,
|
|
|
|
ChangeSetBufSize: 256 * 1024 * 1024,
|
|
|
|
TempDir: os.TempDir(),
|
2020-06-10 20:07:14 +00:00
|
|
|
quitCh: quitCh,
|
2020-04-20 10:35:33 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
type IndexGenerator struct {
|
2020-05-31 06:57:47 +00:00
|
|
|
db ethdb.Database
|
2020-06-10 20:07:14 +00:00
|
|
|
ChangeSetBufSize int
|
2020-05-31 06:57:47 +00:00
|
|
|
TempDir string
|
2020-07-07 04:00:25 +00:00
|
|
|
quitCh <-chan struct{}
|
2020-04-20 10:35:33 +00:00
|
|
|
}
|
|
|
|
|
2020-08-10 23:55:32 +00:00
|
|
|
func (ig *IndexGenerator) GenerateIndex(startBlock, endBlock uint64, changeSetBucket string, datadir string) error {
|
2020-08-15 13:49:36 +00:00
|
|
|
v, ok := changeset.Mapper[changeSetBucket]
|
2020-05-31 06:57:47 +00:00
|
|
|
if !ok {
|
|
|
|
return errors.New("unknown bucket type")
|
|
|
|
}
|
2020-08-15 13:49:36 +00:00
|
|
|
log.Debug("Index generation", "from", startBlock, "to", endBlock, "csbucket", changeSetBucket)
|
2020-06-10 20:07:14 +00:00
|
|
|
if endBlock < startBlock && endBlock != 0 {
|
2020-06-13 12:39:04 +00:00
|
|
|
return fmt.Errorf("generateIndex %s: endBlock %d smaller than startBlock %d", changeSetBucket, endBlock, startBlock)
|
2020-05-31 06:57:47 +00:00
|
|
|
}
|
2020-06-10 20:07:14 +00:00
|
|
|
t := time.Now()
|
|
|
|
err := etl.Transform(ig.db, changeSetBucket,
|
|
|
|
v.IndexBucket,
|
2020-08-02 10:32:41 +00:00
|
|
|
datadir,
|
2020-06-10 20:07:14 +00:00
|
|
|
getExtractFunc(v.WalkerAdapter),
|
|
|
|
loadFunc,
|
|
|
|
etl.TransformArgs{
|
|
|
|
ExtractStartKey: dbutils.EncodeTimestamp(startBlock),
|
2020-06-28 06:10:27 +00:00
|
|
|
ExtractEndKey: dbutils.EncodeTimestamp(endBlock),
|
2020-06-10 20:07:14 +00:00
|
|
|
FixedBits: 0,
|
|
|
|
BufferType: etl.SortableAppendBuffer,
|
|
|
|
BufferSize: ig.ChangeSetBufSize,
|
|
|
|
Quit: ig.quitCh,
|
2020-08-22 10:12:33 +00:00
|
|
|
LogDetailsExtract: func(k, v []byte) (additionalLogArguments []interface{}) {
|
2020-08-22 23:55:17 +00:00
|
|
|
blockNum, _ := dbutils.DecodeTimestamp(k)
|
|
|
|
return []interface{}{"block", blockNum}
|
2020-08-22 10:12:33 +00:00
|
|
|
},
|
2020-06-10 20:07:14 +00:00
|
|
|
},
|
|
|
|
)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
2020-04-20 10:35:33 +00:00
|
|
|
}
|
|
|
|
|
2020-08-15 13:49:36 +00:00
|
|
|
log.Debug("Index generation successfully finished", "csbucket", changeSetBucket, "it took", time.Since(t))
|
2020-04-20 10:35:33 +00:00
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2020-08-10 23:55:32 +00:00
|
|
|
func (ig *IndexGenerator) Truncate(timestampTo uint64, changeSetBucket string) error {
|
2020-08-15 13:49:36 +00:00
|
|
|
vv, ok := changeset.Mapper[changeSetBucket]
|
2020-05-31 06:57:47 +00:00
|
|
|
if !ok {
|
|
|
|
return errors.New("unknown bucket type")
|
|
|
|
}
|
|
|
|
|
2020-05-23 09:19:56 +00:00
|
|
|
currentKey := dbutils.EncodeTimestamp(timestampTo)
|
|
|
|
keys := make(map[string]struct{})
|
2020-07-10 06:03:18 +00:00
|
|
|
if err := ig.db.Walk(changeSetBucket, currentKey, 0, func(k, v []byte) (b bool, e error) {
|
2020-05-31 06:57:47 +00:00
|
|
|
if err := common.Stopped(ig.quitCh); err != nil {
|
|
|
|
return false, err
|
|
|
|
}
|
|
|
|
|
2020-05-23 09:19:56 +00:00
|
|
|
currentKey = common.CopyBytes(k)
|
2020-05-31 06:57:47 +00:00
|
|
|
err := vv.WalkerAdapter(v).Walk(func(kk []byte, _ []byte) error {
|
2020-07-06 06:34:24 +00:00
|
|
|
keys[string(common.CopyBytes(kk))] = struct{}{}
|
2020-05-23 09:19:56 +00:00
|
|
|
return nil
|
|
|
|
})
|
|
|
|
if err != nil {
|
|
|
|
return false, err
|
|
|
|
}
|
|
|
|
return true, nil
|
2020-07-10 06:03:18 +00:00
|
|
|
}); err != nil {
|
2020-05-23 09:19:56 +00:00
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
2020-05-31 06:57:47 +00:00
|
|
|
historyEffects := make(map[string][]byte)
|
|
|
|
keySize := vv.KeySize
|
2020-08-10 23:55:32 +00:00
|
|
|
if dbutils.StorageChangeSetBucket == changeSetBucket || dbutils.PlainStorageChangeSetBucket == changeSetBucket {
|
2020-05-31 06:57:47 +00:00
|
|
|
keySize -= 8
|
|
|
|
}
|
|
|
|
|
|
|
|
var startKey = make([]byte, keySize+8)
|
2020-05-23 09:19:56 +00:00
|
|
|
|
|
|
|
for key := range keys {
|
2020-07-06 06:34:24 +00:00
|
|
|
copy(startKey[:keySize], dbutils.CompositeKeyWithoutIncarnation([]byte(key)))
|
2020-06-10 20:07:14 +00:00
|
|
|
|
2020-05-31 06:57:47 +00:00
|
|
|
binary.BigEndian.PutUint64(startKey[keySize:], timestampTo)
|
|
|
|
if err := ig.db.Walk(vv.IndexBucket, startKey, 8*keySize, func(k, v []byte) (bool, error) {
|
|
|
|
timestamp := binary.BigEndian.Uint64(k[keySize:]) // the last timestamp in the chunk
|
2020-05-23 09:19:56 +00:00
|
|
|
kStr := string(common.CopyBytes(k))
|
|
|
|
if timestamp > timestampTo {
|
2020-05-31 06:57:47 +00:00
|
|
|
historyEffects[kStr] = nil
|
2020-05-23 09:19:56 +00:00
|
|
|
// truncate the chunk
|
|
|
|
index := dbutils.WrapHistoryIndex(v)
|
|
|
|
index = index.TruncateGreater(timestampTo)
|
|
|
|
if len(index) > 8 { // If the chunk is empty after truncation, it gets simply deleted
|
|
|
|
// Truncated chunk becomes "the last chunk" with the timestamp 0xffff....ffff
|
2020-05-31 06:57:47 +00:00
|
|
|
lastK := make([]byte, len(k))
|
|
|
|
copy(lastK, k[:keySize])
|
|
|
|
binary.BigEndian.PutUint64(lastK[keySize:], ^uint64(0))
|
|
|
|
historyEffects[string(lastK)] = common.CopyBytes(index)
|
2020-05-23 09:19:56 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
return true, nil
|
|
|
|
}); err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
}
|
2020-08-16 16:54:33 +00:00
|
|
|
mutation := ig.db.NewBatch()
|
2020-08-26 06:03:50 +00:00
|
|
|
defer mutation.Rollback()
|
2020-05-23 09:19:56 +00:00
|
|
|
|
2020-05-31 06:57:47 +00:00
|
|
|
for key, value := range historyEffects {
|
2020-05-23 09:19:56 +00:00
|
|
|
if value == nil {
|
2020-08-16 16:54:33 +00:00
|
|
|
if err := mutation.Delete(vv.IndexBucket, []byte(key)); err != nil {
|
2020-05-23 09:19:56 +00:00
|
|
|
return err
|
|
|
|
}
|
|
|
|
} else {
|
2020-08-16 16:54:33 +00:00
|
|
|
if err := mutation.Put(vv.IndexBucket, []byte(key), value); err != nil {
|
2020-05-23 09:19:56 +00:00
|
|
|
return err
|
|
|
|
}
|
|
|
|
}
|
2020-08-16 16:54:33 +00:00
|
|
|
if mutation.BatchSize() >= mutation.IdealBatchSize() {
|
2020-08-26 06:03:50 +00:00
|
|
|
if err := mutation.CommitAndBegin(); err != nil {
|
2020-08-16 16:54:33 +00:00
|
|
|
return err
|
|
|
|
}
|
|
|
|
}
|
2020-05-23 09:19:56 +00:00
|
|
|
}
|
2020-08-16 16:54:33 +00:00
|
|
|
_, err := mutation.Commit()
|
|
|
|
return err
|
2020-05-23 09:19:56 +00:00
|
|
|
}
|
|
|
|
|
2020-08-10 23:55:32 +00:00
|
|
|
func (ig *IndexGenerator) DropIndex(bucket string) error {
|
2020-07-27 21:59:54 +00:00
|
|
|
casted, ok := ig.db.(ethdb.NonTransactional)
|
|
|
|
if !ok {
|
|
|
|
return errors.New("imposible to drop")
|
2020-05-23 09:19:56 +00:00
|
|
|
}
|
2020-08-15 13:49:36 +00:00
|
|
|
log.Warn("Remove bucket", "bucket", bucket)
|
2020-07-27 21:59:54 +00:00
|
|
|
return casted.ClearBuckets(bucket)
|
2020-05-23 09:19:56 +00:00
|
|
|
}
|
2020-05-31 06:57:47 +00:00
|
|
|
|
2020-06-10 20:07:14 +00:00
|
|
|
func loadFunc(k []byte, value []byte, state etl.State, next etl.LoadNextFunc) error {
|
|
|
|
if len(value)%9 != 0 {
|
|
|
|
log.Error("Value must be a multiple of 9", "ln", len(value), "k", common.Bytes2Hex(k))
|
|
|
|
return errors.New("incorrect value")
|
2020-05-31 06:57:47 +00:00
|
|
|
}
|
2020-07-06 06:34:24 +00:00
|
|
|
k = common.CopyBytes(k)
|
2020-06-10 20:07:14 +00:00
|
|
|
currentChunkKey := dbutils.IndexChunkKey(k, ^uint64(0))
|
|
|
|
indexBytes, err1 := state.Get(currentChunkKey)
|
|
|
|
if err1 != nil && !errors.Is(err1, ethdb.ErrKeyNotFound) {
|
|
|
|
return fmt.Errorf("find chunk failed: %w", err1)
|
2020-05-31 06:57:47 +00:00
|
|
|
}
|
2020-06-10 20:07:14 +00:00
|
|
|
currentIndex := dbutils.WrapHistoryIndex(indexBytes)
|
2020-05-31 06:57:47 +00:00
|
|
|
|
2020-06-10 20:07:14 +00:00
|
|
|
for i := 0; i < len(value); i += 9 {
|
|
|
|
b := binary.BigEndian.Uint64(value[i:])
|
|
|
|
vzero := value[i+8] == 1
|
|
|
|
blockNr := b
|
2020-05-31 06:57:47 +00:00
|
|
|
if err1 != nil && err1 != ethdb.ErrKeyNotFound {
|
|
|
|
return fmt.Errorf("find chunk failed: %w", err1)
|
|
|
|
}
|
2020-06-10 20:07:14 +00:00
|
|
|
|
|
|
|
if dbutils.CheckNewIndexChunk(currentIndex, blockNr) {
|
2020-05-31 06:57:47 +00:00
|
|
|
// Chunk overflow, need to write the "old" current chunk under its key derived from the last element
|
2020-06-10 20:07:14 +00:00
|
|
|
indexKey, err3 := currentIndex.Key(k)
|
2020-05-31 06:57:47 +00:00
|
|
|
if err3 != nil {
|
|
|
|
return err3
|
|
|
|
}
|
|
|
|
// Flush the old chunk
|
2020-07-01 14:56:56 +00:00
|
|
|
if err4 := next(k, indexKey, currentIndex); err4 != nil {
|
2020-05-31 06:57:47 +00:00
|
|
|
return err4
|
|
|
|
}
|
|
|
|
// Start a new chunk
|
2020-06-10 20:07:14 +00:00
|
|
|
currentIndex = dbutils.NewHistoryIndex()
|
2020-05-31 06:57:47 +00:00
|
|
|
}
|
2020-06-10 20:07:14 +00:00
|
|
|
currentIndex = currentIndex.Append(blockNr, vzero)
|
|
|
|
}
|
2020-07-10 06:03:18 +00:00
|
|
|
|
|
|
|
if err := next(k, currentChunkKey, currentIndex); err != nil {
|
2020-06-10 20:07:14 +00:00
|
|
|
return err
|
2020-05-31 06:57:47 +00:00
|
|
|
}
|
2020-06-10 20:07:14 +00:00
|
|
|
|
2020-05-31 06:57:47 +00:00
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func getExtractFunc(bytes2walker func([]byte) changeset.Walker) etl.ExtractFunc { //nolint
|
|
|
|
return func(dbKey, dbValue []byte, next etl.ExtractNextFunc) error {
|
|
|
|
blockNum, _ := dbutils.DecodeTimestamp(dbKey)
|
2020-07-01 14:56:56 +00:00
|
|
|
return bytes2walker(dbValue).Walk(func(changesetKey, changesetValue []byte) error {
|
2020-07-06 06:34:24 +00:00
|
|
|
key := common.CopyBytes(changesetKey)
|
2020-06-10 20:07:14 +00:00
|
|
|
v := make([]byte, 9)
|
2020-07-01 14:56:56 +00:00
|
|
|
binary.BigEndian.PutUint64(v, blockNum)
|
2020-05-31 06:57:47 +00:00
|
|
|
if len(changesetValue) == 0 {
|
2020-06-10 20:07:14 +00:00
|
|
|
v[8] = 1
|
2020-05-31 06:57:47 +00:00
|
|
|
}
|
2020-07-06 06:34:24 +00:00
|
|
|
return next(dbKey, key, v)
|
2020-05-31 06:57:47 +00:00
|
|
|
})
|
|
|
|
}
|
|
|
|
}
|