erigon-pulse/ethdb/kv_bolt.go
2020-08-04 11:05:27 +01:00

554 lines
12 KiB
Go

package ethdb
import (
"bytes"
"context"
"fmt"
"os"
"path"
"strings"
"sync"
"time"
"github.com/ledgerwatch/bolt"
"github.com/ledgerwatch/turbo-geth/common"
"github.com/ledgerwatch/turbo-geth/common/dbutils"
"github.com/ledgerwatch/turbo-geth/log"
"github.com/ledgerwatch/turbo-geth/metrics"
)
// Database-wide gauges and timers. They are refreshed by collectBoltMetrics
// from the values returned by bolt.DB.Stats().
var (
// Updated from Stats().FreeAlloc.
boltPagesAllocGauge = metrics.NewRegisteredGauge("bolt/pages/alloc_bytes", nil)
boltPagesFreeGauge = metrics.NewRegisteredGauge("bolt/pages/free", nil)
boltPagesPendingGauge = metrics.NewRegisteredGauge("bolt/pages/pending", nil)
boltFreelistInuseGauge = metrics.NewRegisteredGauge("bolt/freelist/inuse", nil)
boltTxGauge = metrics.NewRegisteredGauge("bolt/tx/total", nil)
boltTxOpenGauge = metrics.NewRegisteredGauge("bolt/tx/open", nil)
boltTxCursorGauge = metrics.NewRegisteredGauge("bolt/tx/cursors_total", nil)
boltRebalanceGauge = metrics.NewRegisteredGauge("bolt/rebalance/total", nil)
boltRebalanceTimer = metrics.NewRegisteredTimer("bolt/rebalance/time", nil)
boltSplitGauge = metrics.NewRegisteredGauge("bolt/split/total", nil)
boltSpillGauge = metrics.NewRegisteredGauge("bolt/spill/total", nil)
boltSpillTimer = metrics.NewRegisteredTimer("bolt/spill/time", nil)
boltWriteGauge = metrics.NewRegisteredGauge("bolt/write/total", nil)
boltWriteTimer = metrics.NewRegisteredTimer("bolt/write/time", nil)
)
// Per-bucket write-statistics gauges. init appends one gauge per entry of
// dbutils.Buckets to each slice (only when metrics are enabled), so index i
// of every slice corresponds to dbutils.Buckets[i]. The slices stay empty when
// metrics are disabled.
var valueBytesMetrics []metrics.Gauge
var keyBytesMetrics []metrics.Gauge
var totalBytesPutMetrics []metrics.Gauge
var totalBytesDeleteMetrics []metrics.Gauge
var keyNMetrics []metrics.Gauge
// init registers the per-bucket gauges: one gauge of each kind for every
// bucket in dbutils.Buckets, appended in bucket order. When metrics are
// disabled nothing is registered and the gauge slices stay empty.
func init() {
	if !metrics.Enabled {
		return
	}
	for _, bucket := range dbutils.Buckets {
		// Metric name suffix: lower-cased bucket name with '-' replaced by '_'.
		suffix := strings.ReplaceAll(strings.ToLower(string(bucket)), "-", "_")

		valueBytesMetrics = append(valueBytesMetrics, metrics.NewRegisteredGauge("db/bucket/value_bytes/"+suffix, nil))
		keyBytesMetrics = append(keyBytesMetrics, metrics.NewRegisteredGauge("db/bucket/key_bytes/"+suffix, nil))
		totalBytesPutMetrics = append(totalBytesPutMetrics, metrics.NewRegisteredGauge("db/bucket/bytes_put_total/"+suffix, nil))
		totalBytesDeleteMetrics = append(totalBytesDeleteMetrics, metrics.NewRegisteredGauge("db/bucket/bytes_delete_total/"+suffix, nil))
		keyNMetrics = append(keyNMetrics, metrics.NewRegisteredGauge("db/bucket/keys/"+suffix, nil))
	}
}
// collectBoltMetrics publishes bolt statistics to the registered gauges and
// timers once per tick of ticker, and returns when ctx is cancelled.
//
// Database-wide values come from db.Stats(). Per-bucket write statistics come
// from db.WriteStats() and are published only when the per-bucket gauges were
// registered (valueBytesMetrics is non-empty); buckets missing from the
// write-stats map are skipped.
func collectBoltMetrics(ctx context.Context, db *bolt.DB, ticker *time.Ticker) {
	for {
		// Block until either shutdown is requested or the next tick arrives.
		select {
		case <-ctx.Done():
			return
		case <-ticker.C:
		}

		dbStats := db.Stats()
		boltPagesFreeGauge.Update(int64(dbStats.FreePageN))
		boltPagesPendingGauge.Update(int64(dbStats.PendingPageN))
		boltPagesAllocGauge.Update(int64(dbStats.FreeAlloc))
		boltFreelistInuseGauge.Update(int64(dbStats.FreelistInuse))
		boltTxGauge.Update(int64(dbStats.TxN))
		boltTxOpenGauge.Update(int64(dbStats.OpenTxN))

		txStats := dbStats.TxStats
		boltTxCursorGauge.Update(int64(txStats.CursorCount))
		boltRebalanceGauge.Update(int64(txStats.Rebalance))
		boltRebalanceTimer.Update(txStats.RebalanceTime)
		boltSplitGauge.Update(int64(txStats.Split))
		boltSpillGauge.Update(int64(txStats.Spill))
		boltSpillTimer.Update(txStats.SpillTime)
		boltWriteGauge.Update(int64(txStats.Write))
		boltWriteTimer.Update(txStats.WriteTime)

		// Per-bucket gauges exist only when metrics were enabled at init time.
		if len(valueBytesMetrics) > 0 {
			perBucket := db.WriteStats()
			for i, bucket := range dbutils.Buckets {
				if ws, found := perBucket[string(bucket)]; found {
					valueBytesMetrics[i].Update(int64(ws.ValueBytesN))
					keyBytesMetrics[i].Update(int64(ws.KeyBytesN))
					totalBytesPutMetrics[i].Update(int64(ws.TotalBytesPut))
					totalBytesDeleteMetrics[i].Update(int64(ws.TotalBytesDelete))
					keyNMetrics[i].Update(int64(ws.KeyN))
				}
			}
		}
	}
}
// boltOpts is a builder for opening a bolt-backed KV. It is configured through
// its chainable methods and finished with Open or MustOpen.
type boltOpts struct {
// Bolt holds the options handed to bolt.Open. It is a pointer, so copies of
// a boltOpts value share the same underlying options.
Bolt *bolt.Options
// path is the database path handed to bolt.Open.
path string
}
// BoltKV is the bolt-backed database object returned by boltOpts.Open.
type BoltKV struct {
// opts are the options the database was opened with.
opts boltOpts
// bolt is the underlying bolt database handle.
bolt *bolt.DB
// log is the logger used when closing the database.
log log.Logger
// stopMetrics cancels the metrics-collection goroutine; it is nil when
// metrics are disabled.
stopMetrics context.CancelFunc
// wg tracks the metrics-collection goroutine so that Close can wait for it.
wg *sync.WaitGroup
}
// boltTx wraps a bolt transaction together with the context it was started
// with and the database it belongs to.
type boltTx struct {
// ctx is consulted for cancellation by bucket and cursor operations.
ctx context.Context
db *BoltKV
// bolt is the underlying bolt transaction; Commit and Rollback treat a nil
// value as "nothing to do".
bolt *bolt.Tx
}
// boltBucket wraps a bolt bucket opened inside a boltTx.
type boltBucket struct {
tx *boltTx
bolt *bolt.Bucket
// id is taken from dbutils.BucketsCfg for the bucket name; Clear uses it as
// an index into dbutils.Buckets.
id int
// nameLen is the length in bytes of the bucket name.
nameLen uint
}
// boltCursor wraps a bolt cursor over a single bucket.
type boltCursor struct {
// ctx is checked for cancellation before Seek, SeekTo, Next, Delete and Put.
ctx context.Context
bucket boltBucket
// prefix, when set, limits iteration: a key that does not start with it is
// reported as a nil key.
prefix []byte
bolt *bolt.Cursor
}
// noValuesBoltCursor is a view over a boltCursor whose First, Seek, Next and
// Walk report the length of each value instead of the value itself.
type noValuesBoltCursor struct {
*boltCursor
}
// InMem returns a copy of opts configured for a memory-only database.
//
// The bolt options are copied before being modified. opts.Bolt is a pointer,
// so writing through it directly would also change the receiver and every
// other boltOpts value that shares the same options.
func (opts boltOpts) InMem() boltOpts {
	boltCopy := *opts.Bolt
	boltCopy.MemOnly = true
	opts.Bolt = &boltCopy
	return opts
}
// ReadOnly returns a copy of opts configured to open the database read-only.
//
// The bolt options are copied before being modified. opts.Bolt is a pointer,
// so writing through it directly would also change the receiver and every
// other boltOpts value that shares the same options.
func (opts boltOpts) ReadOnly() boltOpts {
	boltCopy := *opts.Bolt
	boltCopy.ReadOnly = true
	opts.Bolt = &boltCopy
	return opts
}
// Path returns a copy of opts with the database path set to path.
func (opts boltOpts) Path(path string) boltOpts {
	updated := opts
	updated.path = path
	return updated
}
// Open opens the bolt database at opts.path and wraps it in a BoltKV.
//
// Unless the database is memory-only, the parent directory of opts.path is
// created first. For a writable database every bucket in dbutils.Buckets is
// created if it does not exist yet. When metrics are enabled a goroutine is
// started that samples bolt statistics every 3 seconds until Close is called.
//
// If bucket creation fails, the freshly opened bolt handle is closed before
// the error is returned so that it is not leaked.
func (opts boltOpts) Open() (KV, error) {
	if !opts.Bolt.MemOnly {
		dir := path.Dir(opts.path)
		if err := os.MkdirAll(dir, 0744); err != nil {
			// Report the directory that could not be created, not the file path.
			return nil, fmt.Errorf("could not create dir: %s, %w", dir, err)
		}
	}

	boltDB, err := bolt.Open(opts.path, 0600, opts.Bolt)
	if err != nil {
		return nil, err
	}

	if !opts.Bolt.ReadOnly {
		err = boltDB.Update(func(tx *bolt.Tx) error {
			for _, name := range dbutils.Buckets {
				if _, createErr := tx.CreateBucketIfNotExists(name, false); createErr != nil {
					return createErr
				}
			}
			return nil
		})
		if err != nil {
			// The caller never receives the handle on this path, so release it here.
			if closeErr := boltDB.Close(); closeErr != nil {
				log.Warn("failed to close bolt DB after bucket creation error", "err", closeErr)
			}
			return nil, err
		}
	}

	db := &BoltKV{
		opts: opts,
		bolt: boltDB,
		log:  log.New("bolt_db", opts.path),
		wg:   &sync.WaitGroup{},
	}

	if metrics.Enabled {
		ctx, cancel := context.WithCancel(context.Background())
		db.stopMetrics = cancel
		db.wg.Add(1)
		go func() {
			defer db.wg.Done()
			ticker := time.NewTicker(3 * time.Second)
			defer ticker.Stop()
			collectBoltMetrics(ctx, boltDB, ticker)
		}()
	}

	return db, nil
}
// MustOpen is like Open but panics with the error if the database cannot be
// opened.
func (opts boltOpts) MustOpen() KV {
	kv, openErr := opts.Open()
	if openErr != nil {
		panic(openErr)
	}
	return kv
}
// NewBolt returns bolt options initialised from a private copy of
// bolt.DefaultOptions with key-prefix compression disabled.
//
// The copy matters: bolt.DefaultOptions is a pointer to package-level state.
// Handing it out directly would make every write through the returned
// options' Bolt field modify the defaults seen by all other users in the
// process.
func NewBolt() boltOpts {
	defaults := *bolt.DefaultOptions
	defaults.KeysPrefixCompressionDisable = true
	return boltOpts{Bolt: &defaults}
}
// Close stops the metrics goroutine (if one was started), waits for it to
// finish and then closes the underlying bolt database, logging the outcome.
// All transactions must be closed before closing the database.
func (db *BoltKV) Close() {
	if cancel := db.stopMetrics; cancel != nil {
		cancel()
	}
	db.wg.Wait()

	if db.bolt == nil {
		return
	}
	err := db.bolt.Close()
	if err == nil {
		db.log.Info("bolt database closed")
		return
	}
	db.log.Warn("failed to close bolt DB", "err", err)
}
// DiskSize returns the size reported by the underlying bolt database.
// The context is unused and the returned error is always nil.
func (db *BoltKV) DiskSize(_ context.Context) (uint64, error) {
	size := db.bolt.Size()
	return uint64(size), nil
}
// BucketsStat converts bolt's per-bucket write statistics into
// common.StorageBucketWriteStats, keyed by bucket name.
// The context is unused and the returned error is always nil.
func (db *BoltKV) BucketsStat(_ context.Context) (map[string]common.StorageBucketWriteStats, error) {
	writeStats := db.bolt.WriteStats()
	out := make(map[string]common.StorageBucketWriteStats, len(writeStats))
	for bucket, ws := range writeStats {
		var converted common.StorageBucketWriteStats
		converted.KeyN = common.StorageCounter(ws.KeyN)
		converted.KeyBytesN = common.StorageSize(ws.KeyBytesN)
		converted.ValueBytesN = common.StorageSize(ws.ValueBytesN)
		converted.TotalPut = common.StorageCounter(ws.TotalPut)
		converted.TotalDelete = common.StorageCounter(ws.TotalDelete)
		converted.TotalBytesPut = common.StorageSize(ws.TotalBytesPut)
		converted.TotalBytesDelete = common.StorageSize(ws.TotalBytesDelete)
		out[bucket] = converted
	}
	return out, nil
}
// IdealBatchSize returns the suggested write-batch size in bytes (50 Mb).
func (db *BoltKV) IdealBatchSize() int {
	const megabyte = 1024 * 1024
	return 50 * megabyte
}
// Begin starts a bolt transaction (read-write when writable is true) and
// wraps it together with ctx.
//
// It returns a "db closed" error when the bolt handle is nil. If bolt itself
// fails to begin the transaction, the error is returned alongside a non-nil
// wrapper whose inner transaction is whatever bolt returned.
func (db *BoltKV) Begin(ctx context.Context, writable bool) (Tx, error) {
	if db.bolt == nil {
		return nil, fmt.Errorf("db closed")
	}
	inner, err := db.bolt.Begin(writable)
	return &boltTx{db: db, ctx: ctx, bolt: inner}, err
}
// View runs f inside a bolt View transaction wrapped together with ctx, and
// returns whatever bolt's View returns. It returns a "db closed" error when
// the bolt handle is nil.
func (db *BoltKV) View(ctx context.Context, f func(tx Tx) error) (err error) {
	if db.bolt == nil {
		return fmt.Errorf("db closed")
	}
	wrapped := &boltTx{db: db, ctx: ctx}
	run := func(inner *bolt.Tx) error {
		wrapped.bolt = inner
		return f(wrapped)
	}
	return db.bolt.View(run)
}
// Update runs f inside a bolt Update transaction wrapped together with ctx,
// and returns whatever bolt's Update returns. It returns a "db closed" error
// when the bolt handle is nil.
func (db *BoltKV) Update(ctx context.Context, f func(tx Tx) error) (err error) {
	if db.bolt == nil {
		return fmt.Errorf("db closed")
	}
	wrapped := &boltTx{db: db, ctx: ctx}
	run := func(inner *bolt.Tx) error {
		wrapped.bolt = inner
		return f(wrapped)
	}
	return db.bolt.Update(run)
}
// Commit commits the underlying bolt transaction. It returns a "db closed"
// error when there is no underlying transaction. The ctx argument is unused.
func (tx *boltTx) Commit(ctx context.Context) error {
	if tx.bolt != nil {
		return tx.bolt.Commit()
	}
	return fmt.Errorf("db closed")
}
// Rollback rolls back the underlying bolt transaction, logging a warning if
// bolt reports an error. It does nothing when there is no underlying
// transaction.
func (tx *boltTx) Rollback() {
	if tx.bolt != nil {
		if rollbackErr := tx.bolt.Rollback(); rollbackErr != nil {
			log.Warn("bolt rollback failed", "err", rollbackErr)
		}
	}
}
// Yield delegates to the underlying bolt transaction's Yield.
// Unlike Commit and Rollback it does not guard against a nil transaction.
func (tx *boltTx) Yield() {
tx.bolt.Yield()
}
// Bucket returns a wrapper for the named bucket within this transaction.
// The wrapper records the bucket ID from dbutils.BucketsCfg and the length of
// the name, and holds whatever the bolt transaction returns for that name.
func (tx *boltTx) Bucket(name []byte) Bucket {
	return boltBucket{
		tx:      tx,
		nameLen: uint(len(name)),
		id:      dbutils.BucketsCfg[string(name)].ID,
		bolt:    tx.bolt.Bucket(name),
	}
}
// Prefix restricts the cursor to keys starting with v and returns the same
// cursor for chaining.
func (c *boltCursor) Prefix(v []byte) Cursor {
c.prefix = v
return c
}
// MatchBits is not implemented for bolt cursors; calling it always panics.
func (c *boltCursor) MatchBits(n uint) Cursor {
panic("not implemented yet")
}
// Prefetch is a no-op for bolt cursors; it ignores v and returns the same
// cursor for chaining.
func (c *boltCursor) Prefetch(v uint) Cursor {
// nothing to do
return c
}
// NoValues returns a view of this cursor that reports value sizes instead of
// values. The view shares the underlying cursor state with c.
func (c *boltCursor) NoValues() NoValuesCursor {
	view := noValuesBoltCursor{boltCursor: c}
	return &view
}
// Size returns the bucket's size in bytes, computed as the number of pages
// reported by the bucket's bolt statistics multiplied by the OS page size.
// The returned error is always nil.
//
// Leaf overflow pages are counted together with branch, branch-overflow and
// leaf pages; without them, buckets holding values larger than a page would
// be under-reported.
func (b boltBucket) Size() (uint64, error) {
	st := b.bolt.Stats()
	pages := st.BranchPageN + st.BranchOverflowN + st.LeafPageN + st.LeafOverflowN
	return uint64(pages * os.Getpagesize()), nil
}
// Clear empties the bucket by deleting it and creating it again within the
// current transaction. The bucket name is looked up in dbutils.Buckets by the
// bucket's id.
//
// NOTE(review): the receiver is a value and b.bolt is not refreshed here, so
// callers presumably need to fetch the bucket again after Clear — confirm.
func (b boltBucket) Clear() error {
	name := dbutils.Buckets[b.id]
	if err := b.tx.bolt.DeleteBucket(name); err != nil {
		return err
	}
	_, err := b.tx.bolt.CreateBucket(name, false)
	return err
}
// Get returns the value stored under key. If the transaction's context has
// been cancelled it returns the context error instead. The second result of
// bolt's Get is discarded, and the returned error is nil otherwise.
func (b boltBucket) Get(key []byte) (val []byte, err error) {
	if ctxErr := b.tx.ctx.Err(); ctxErr != nil {
		return nil, ctxErr
	}
	val, _ = b.bolt.Get(key)
	return val, nil
}
// Put stores value under key in the bucket, or returns the context error if
// the transaction's context has been cancelled.
func (b boltBucket) Put(key []byte, value []byte) error {
	if ctxErr := b.tx.ctx.Err(); ctxErr != nil {
		return ctxErr
	}
	return b.bolt.Put(key, value)
}
// Delete removes key from the bucket, or returns the context error if the
// transaction's context has been cancelled.
func (b boltBucket) Delete(key []byte) error {
	if ctxErr := b.tx.ctx.Err(); ctxErr != nil {
		return ctxErr
	}
	return b.bolt.Delete(key)
}
// Cursor returns a new cursor over the bucket that shares the transaction's
// context.
func (b boltBucket) Cursor() Cursor {
	cur := &boltCursor{
		bucket: b,
		ctx:    b.tx.ctx,
		bolt:   b.bolt.Cursor(),
	}
	return cur
}
// First positions the cursor at the first entry and returns it.
//
// Without a prefix this is the first entry of the bucket. With a prefix the
// cursor seeks to the prefix and returns that entry only if its key starts
// with the prefix; otherwise a nil key and value are returned. The returned
// error is always nil, and the context is not checked here.
func (c *boltCursor) First() (k, v []byte, err error) {
	if len(c.prefix) > 0 {
		k, v = c.bolt.Seek(c.prefix)
		if bytes.HasPrefix(k, c.prefix) {
			return k, v, nil
		}
		return nil, nil, nil
	}
	k, v = c.bolt.First()
	return k, v, nil
}
// Seek moves the cursor using bolt's Seek and returns the entry found.
//
// If a prefix is set and the key found does not start with it, a nil key and
// value are returned. If the context has been cancelled, the context error is
// returned together with an empty but non-nil key.
func (c *boltCursor) Seek(seek []byte) (k, v []byte, err error) {
	if ctxErr := c.ctx.Err(); ctxErr != nil {
		// The key is deliberately non-nil so that loops testing k != nil
		// still get to see the error.
		return []byte{}, nil, ctxErr
	}
	k, v = c.bolt.Seek(seek)
	if c.prefix != nil && !bytes.HasPrefix(k, c.prefix) {
		return nil, nil, nil
	}
	return k, v, nil
}
// SeekTo moves the cursor using bolt's SeekTo and returns the entry found.
//
// If a prefix is set and the key found does not start with it, a nil key and
// value are returned. If the context has been cancelled, the context error is
// returned together with an empty but non-nil key.
func (c *boltCursor) SeekTo(seek []byte) (k, v []byte, err error) {
	if ctxErr := c.ctx.Err(); ctxErr != nil {
		// The key is deliberately non-nil so that loops testing k != nil
		// still get to see the error.
		return []byte{}, nil, ctxErr
	}
	k, v = c.bolt.SeekTo(seek)
	if c.prefix != nil && !bytes.HasPrefix(k, c.prefix) {
		return nil, nil, nil
	}
	return k, v, nil
}
// Next advances the cursor and returns the entry it lands on.
//
// If a prefix is set and the new key does not start with it, a nil key and
// value are returned. If the context has been cancelled, the context error is
// returned together with an empty but non-nil key.
func (c *boltCursor) Next() (k, v []byte, err error) {
	if ctxErr := c.ctx.Err(); ctxErr != nil {
		// The key is deliberately non-nil so that loops testing k != nil
		// still get to see the error.
		return []byte{}, nil, ctxErr
	}
	k, v = c.bolt.Next()
	if c.prefix != nil && !bytes.HasPrefix(k, c.prefix) {
		return nil, nil, nil
	}
	return k, v, nil
}
// Delete removes key through the underlying bolt cursor (Delete2), or returns
// the context error if the context has been cancelled.
func (c *boltCursor) Delete(key []byte) error {
	if ctxErr := c.ctx.Err(); ctxErr != nil {
		return ctxErr
	}
	return c.bolt.Delete2(key)
}
// Put stores value under key through the underlying bolt cursor, or returns
// the context error if the context has been cancelled.
func (c *boltCursor) Put(key []byte, value []byte) error {
	if ctxErr := c.ctx.Err(); ctxErr != nil {
		return ctxErr
	}
	return c.bolt.Put(key, value)
}
// Append stores value under key. For bolt cursors it is identical to Put.
func (c *boltCursor) Append(key []byte, value []byte) error {
return c.Put(key, value)
}
// Walk calls walker for every entry from First onwards until the cursor
// yields a nil key. It stops early, returning nil, when walker returns false.
// It stops with the error when either the cursor or walker reports one.
func (c *boltCursor) Walk(walker func(k, v []byte) (bool, error)) error {
	k, v, err := c.First()
	for k != nil {
		if err != nil {
			return err
		}
		proceed, walkErr := walker(k, v)
		if walkErr != nil {
			return walkErr
		}
		if !proceed {
			return nil
		}
		k, v, err = c.Next()
	}
	return nil
}
// Walk calls walker with the key and value size of every entry from First
// onwards until the cursor yields a nil key. It stops early, returning nil,
// when walker returns false. It stops with the error when either the cursor
// or walker reports one.
func (c *noValuesBoltCursor) Walk(walker func(k []byte, vSize uint32) (bool, error)) error {
	k, size, err := c.First()
	for k != nil {
		if err != nil {
			return err
		}
		proceed, walkErr := walker(k, size)
		if walkErr != nil {
			return walkErr
		}
		if !proceed {
			return nil
		}
		k, size, err = c.Next()
	}
	return nil
}
// First positions the cursor at the first entry and returns its key and the
// length of its value.
//
// Without a prefix this is the first entry of the bucket. With a prefix the
// cursor seeks to the prefix and returns that entry only if its key starts
// with the prefix; otherwise a nil key and zero size are returned. The
// returned error is always nil, and the context is not checked here.
func (c *noValuesBoltCursor) First() (k []byte, vSize uint32, err error) {
	var val []byte
	if len(c.prefix) > 0 {
		k, val = c.bolt.Seek(c.prefix)
		if bytes.HasPrefix(k, c.prefix) {
			return k, uint32(len(val)), nil
		}
		return nil, 0, nil
	}
	k, val = c.bolt.First()
	return k, uint32(len(val)), nil
}
// Seek moves the cursor using bolt's Seek and returns the key found and the
// length of its value.
//
// If a prefix is set and the key found does not start with it, a nil key and
// zero size are returned. If the context has been cancelled, the context
// error is returned together with an empty but non-nil key.
func (c *noValuesBoltCursor) Seek(seek []byte) (k []byte, vSize uint32, err error) {
	if ctxErr := c.ctx.Err(); ctxErr != nil {
		return []byte{}, 0, ctxErr // on error key should be != nil
	}
	k, val := c.bolt.Seek(seek)
	if c.prefix != nil && !bytes.HasPrefix(k, c.prefix) {
		return nil, 0, nil
	}
	return k, uint32(len(val)), nil
}
// Next advances the cursor and returns the key it lands on and the length of
// its value.
//
// If a prefix is set and the new key does not start with it, a nil key and
// zero size are returned. If the context has been cancelled, the context
// error is returned together with an empty but non-nil key.
func (c *noValuesBoltCursor) Next() (k []byte, vSize uint32, err error) {
	if ctxErr := c.ctx.Err(); ctxErr != nil {
		// The key is deliberately non-nil so that loops testing k != nil
		// still get to see the error.
		return []byte{}, 0, ctxErr
	}
	k, val := c.bolt.Next()
	if c.prefix != nil && !bytes.HasPrefix(k, c.prefix) {
		return nil, 0, nil
	}
	return k, uint32(len(val)), nil
}