2020-04-20 10:35:33 +00:00
|
|
|
package stats
|
|
|
|
|
|
|
|
import (
|
|
|
|
"bytes"
|
2021-07-07 16:15:49 +00:00
|
|
|
"context"
|
2020-04-20 10:35:33 +00:00
|
|
|
"encoding/csv"
|
|
|
|
"fmt"
|
|
|
|
"log"
|
|
|
|
"os"
|
|
|
|
"sort"
|
|
|
|
"strconv"
|
2020-08-10 23:55:32 +00:00
|
|
|
"strings"
|
2020-04-20 10:35:33 +00:00
|
|
|
"time"
|
2020-06-16 13:36:16 +00:00
|
|
|
|
2021-10-08 03:20:45 +00:00
|
|
|
libcommon "github.com/ledgerwatch/erigon-lib/common"
|
|
|
|
"github.com/ledgerwatch/erigon-lib/common/length"
|
2021-07-29 11:53:13 +00:00
|
|
|
"github.com/ledgerwatch/erigon-lib/kv"
|
|
|
|
"github.com/ledgerwatch/erigon-lib/kv/mdbx"
|
2021-05-20 18:25:53 +00:00
|
|
|
"github.com/ledgerwatch/erigon/common"
|
2020-04-20 10:35:33 +00:00
|
|
|
)
|
|
|
|
|
2020-08-10 23:55:32 +00:00
|
|
|
func IndexStats(chaindata string, indexBucket string, statsFile string) error {
|
2021-07-28 02:47:38 +00:00
|
|
|
db := mdbx.MustOpen(chaindata)
|
2020-04-20 10:35:33 +00:00
|
|
|
startTime := time.Now()
|
2021-10-08 03:20:45 +00:00
|
|
|
lenOfKey := length.Addr
|
2021-07-28 02:47:38 +00:00
|
|
|
if strings.HasPrefix(indexBucket, kv.StorageHistory) {
|
2021-10-08 03:20:45 +00:00
|
|
|
lenOfKey = length.Addr + length.Hash + length.Incarnation
|
2020-04-20 10:35:33 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
more1index := 0
|
|
|
|
more10index := make(map[string]uint64)
|
|
|
|
more50index := make(map[string]uint64)
|
|
|
|
more100index := make(map[string]uint64)
|
|
|
|
more200index := make(map[string]uint64)
|
|
|
|
more500index := make(map[string]uint64)
|
|
|
|
more1000index := make(map[string]uint64)
|
|
|
|
|
|
|
|
prevKey := []byte{}
|
|
|
|
count := uint64(1)
|
|
|
|
added := false
|
|
|
|
i := uint64(0)
|
2021-07-07 16:15:49 +00:00
|
|
|
tx, err := db.BeginRo(context.Background())
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
defer tx.Rollback()
|
|
|
|
if err = tx.ForEach(indexBucket, []byte{}, func(k, v []byte) error {
|
2020-04-20 10:35:33 +00:00
|
|
|
if i%100_000 == 0 {
|
|
|
|
fmt.Printf("Processed %dK, %s\n", i/1000, time.Since(startTime))
|
|
|
|
}
|
|
|
|
if bytes.Equal(k[:lenOfKey], prevKey) {
|
|
|
|
count++
|
|
|
|
if count > 1 && !added {
|
|
|
|
more1index++
|
|
|
|
added = true
|
|
|
|
}
|
|
|
|
if count > 10 {
|
2021-10-08 03:20:45 +00:00
|
|
|
more10index[string(libcommon.Copy(k[:lenOfKey]))] = count
|
2020-04-20 10:35:33 +00:00
|
|
|
}
|
|
|
|
if count > 50 {
|
2021-10-08 03:20:45 +00:00
|
|
|
more50index[string(libcommon.Copy(k[:lenOfKey]))] = count
|
2020-04-20 10:35:33 +00:00
|
|
|
}
|
|
|
|
if count > 100 {
|
2021-10-08 03:20:45 +00:00
|
|
|
more100index[string(libcommon.Copy(k[:lenOfKey]))] = count
|
2020-04-20 10:35:33 +00:00
|
|
|
}
|
|
|
|
if count > 200 {
|
2021-10-08 03:20:45 +00:00
|
|
|
more200index[string(libcommon.Copy(k[:lenOfKey]))] = count
|
2020-04-20 10:35:33 +00:00
|
|
|
}
|
|
|
|
if count > 500 {
|
2021-10-08 03:20:45 +00:00
|
|
|
more500index[string(libcommon.Copy(k[:lenOfKey]))] = count
|
2020-04-20 10:35:33 +00:00
|
|
|
}
|
|
|
|
if count > 1000 {
|
2021-10-08 03:20:45 +00:00
|
|
|
more1000index[string(libcommon.Copy(k[:lenOfKey]))] = count
|
2020-04-20 10:35:33 +00:00
|
|
|
}
|
|
|
|
} else {
|
|
|
|
added = false
|
|
|
|
count = 1
|
2021-10-08 03:20:45 +00:00
|
|
|
prevKey = libcommon.Copy(k[:length.Addr])
|
2020-04-20 10:35:33 +00:00
|
|
|
}
|
|
|
|
|
2021-07-07 16:15:49 +00:00
|
|
|
return nil
|
2020-06-16 13:36:16 +00:00
|
|
|
}); err != nil {
|
2020-04-20 10:35:33 +00:00
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
fmt.Println("more1", more1index)
|
|
|
|
fmt.Println("more10", len(more10index))
|
|
|
|
fmt.Println("more50", len(more50index))
|
|
|
|
fmt.Println("more100", len(more100index))
|
|
|
|
fmt.Println("more200", len(more200index))
|
|
|
|
fmt.Println("more500", len(more500index))
|
|
|
|
fmt.Println("more1000", len(more1000index))
|
|
|
|
|
|
|
|
if statsFile != "" {
|
|
|
|
f, err := os.Create(statsFile)
|
|
|
|
if err != nil {
|
|
|
|
log.Fatal(err)
|
|
|
|
}
|
|
|
|
defer f.Close() //nolint
|
|
|
|
save10 := make([]struct {
|
|
|
|
Address string
|
|
|
|
Hash string
|
|
|
|
NumOfIndexes uint64
|
|
|
|
}, 0, len(more10index))
|
|
|
|
for hash, v := range more10index {
|
2021-10-08 03:20:45 +00:00
|
|
|
p := []byte(hash)[:length.Addr]
|
2020-04-20 10:35:33 +00:00
|
|
|
if len(p) == 0 {
|
|
|
|
p = make([]byte, 20)
|
|
|
|
}
|
|
|
|
save10 = append(save10, struct {
|
|
|
|
Address string
|
|
|
|
Hash string
|
|
|
|
NumOfIndexes uint64
|
|
|
|
}{
|
|
|
|
Address: common.BytesToAddress(p).String(),
|
|
|
|
NumOfIndexes: v,
|
|
|
|
Hash: common.Bytes2Hex([]byte(hash)),
|
|
|
|
})
|
|
|
|
|
|
|
|
}
|
|
|
|
sort.Slice(save10, func(i, j int) bool {
|
|
|
|
return save10[i].NumOfIndexes > save10[j].NumOfIndexes
|
|
|
|
})
|
|
|
|
|
|
|
|
csvWriter := csv.NewWriter(f)
|
|
|
|
err = csvWriter.Write([]string{"hash", "address", "num"})
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
for _, v := range save10 {
|
|
|
|
err = csvWriter.Write([]string{v.Hash, v.Address, strconv.FormatUint(v.NumOfIndexes, 10)})
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return nil
|
|
|
|
}
|