erigon-pulse/erigon-lib/common/dbg/experiments.go
Mark Holt 79ed8cad35
E2 snapshot uploading (#9056)
This change introduces additional processes to manage snapshot uploading
for E2 snapshots:

## erigon snapshots upload

The `snapshots uploader` command starts a version of erigon customized
for uploading snapshot files to
a remote location.  

It breaks the stage execution process after the senders stage and then
uses the snapshot stage to send
uploaded headers, bodies and (in the case of polygon) bor spans and
events to snapshot files. Because
this process avoids execution, it runs significantly faster than a
standard erigon configuration.

The uploader uses rclone to send seedable snapshot files (100K or 500K blocks) to a
remote storage location specified
in the rclone config file.

The **uploader** is configured to minimize disk usage by doing the
following:

* It removes snapshots once they are loaded
* It aggressively prunes the database once entities are transferred to
snapshots

In addition to this, it has the following performance-related features:

* Maximizes the workers allocated to snapshot processing to improve
throughput
* Can be started from scratch by downloading the latest snapshots from
the remote location to seed processing

## snapshots command

A standalone command for managing remote snapshots. It has the
following subcommands:

* **cmp** - compare snapshots
* **copy** - copy snapshots
* **verify** - verify snapshots
* **manifest** - manage the manifest file in the root of remote snapshot
locations
* **torrent** - manage snapshot torrent files
2023-12-27 22:05:09 +00:00

302 lines
5.9 KiB
Go

/*
Copyright 2021 Erigon contributors
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
http://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
*/
package dbg
import (
"os"
"runtime"
"strconv"
"sync"
"time"
"github.com/ledgerwatch/log/v3"
)
// StagesOnlyBlocks holds the result of EnvBool("STAGES_ONLY_BLOCKS", false),
// evaluated once during package initialization.
// NOTE(review): EnvBool is defined outside this view; presumably it reads the
// STAGES_ONLY_BLOCKS environment variable and falls back to false — confirm.
var StagesOnlyBlocks = EnvBool("STAGES_ONLY_BLOCKS", false)
// doMemstat stays true unless NO_MEMSTAT is present in the environment when
// the package is initialized.
var doMemstat = true

func init() {
	// Only the presence of NO_MEMSTAT matters; its value is never inspected.
	if _, disabled := os.LookupEnv("NO_MEMSTAT"); disabled {
		doMemstat = false
	}
}

// DoMemStat reports whether memory statistics collection is enabled, i.e.
// whether NO_MEMSTAT was absent from the environment at startup.
func DoMemStat() bool {
	return doMemstat
}

// ReadMemStats fills m via runtime.ReadMemStats when collection is enabled.
// When it is disabled the call is a no-op and m is left untouched.
func ReadMemStats(m *runtime.MemStats) {
	if !doMemstat {
		return
	}
	runtime.ReadMemStats(m)
}
var (
	writeMap     bool
	writeMapOnce sync.Once
)

// WriteMap reports whether the WRITE_MAP environment variable equals exactly
// "true". The environment is consulted on the first call only; every later
// call returns the cached result. Enabling the flag is logged once.
func WriteMap() bool {
	writeMapOnce.Do(func() {
		if os.Getenv("WRITE_MAP") != "true" {
			return
		}
		writeMap = true
		log.Info("[Experiment]", "WRITE_MAP", writeMap)
	})
	return writeMap
}
var (
	dirtySpace     uint64
	dirtySpaceOnce sync.Once
)

// DirtySpace returns the dirty-space limit in bytes configured through the
// MDBX_DIRTY_SPACE_MB environment variable (a whole number of mebibytes), or 0
// when the variable is unset or empty. The environment is read on the first
// call only; later calls return the cached value.
//
// It panics when the value is not a decimal integer, is negative, or is too
// large for its byte count to fit in a uint64.
func DirtySpace() uint64 {
	dirtySpaceOnce.Do(func() {
		v := os.Getenv("MDBX_DIRTY_SPACE_MB")
		if v == "" {
			return
		}
		mb, err := strconv.Atoi(v)
		if err != nil {
			panic(err)
		}
		const bytesPerMB = 1024 * 1024
		// A negative or oversized value used to wrap around silently into a
		// meaningless byte count; reject it like any other invalid input.
		if mb < 0 || uint64(mb) > ^uint64(0)/bytesPerMB {
			panic("MDBX_DIRTY_SPACE_MB out of range: " + v)
		}
		// Widen before multiplying so the product is computed in 64 bits even
		// on platforms where int is 32 bits wide.
		dirtySpace = uint64(mb) * bytesPerMB
		// Log the value in the unit the key names (MB), not the byte count.
		log.Info("[Experiment]", "MDBX_DIRTY_SPACE_MB", mb)
	})
	return dirtySpace
}
var (
	noSync     bool
	noSyncOnce sync.Once
)

// NoSync reports whether the NO_SYNC environment variable equals exactly
// "true". The lookup happens once, on the first call, and the answer is cached
// for the lifetime of the process. Enabling the flag is logged once.
func NoSync() bool {
	noSyncOnce.Do(func() {
		if enabled := os.Getenv("NO_SYNC") == "true"; enabled {
			noSync = enabled
			log.Info("[Experiment]", "NO_SYNC", noSync)
		}
	})
	return noSync
}
var (
	mergeTr     int
	mergeTrOnce sync.Once
)

// MergeTr returns the integer stored in the MERGE_THRESHOLD environment
// variable, or 0 when the variable is unset or empty. The environment is read
// on the first call only.
//
// It panics with the parse error when the value is not an integer, and with
// the offending number when it lies outside the accepted range 0..4.
func MergeTr() int {
	mergeTrOnce.Do(func() {
		raw := os.Getenv("MERGE_THRESHOLD")
		if raw == "" {
			return
		}
		threshold, err := strconv.Atoi(raw)
		switch {
		case err != nil:
			panic(err)
		case threshold < 0, threshold > 4:
			panic(threshold)
		}
		mergeTr = threshold
		log.Info("[Experiment]", "MERGE_THRESHOLD", mergeTr)
	})
	return mergeTr
}
var (
	mdbxReadahead     bool
	mdbxReadaheadOnce sync.Once
)

// MdbxReadAhead reports whether the MDBX_READAHEAD environment variable equals
// exactly "true". The variable is examined on the first call only and the
// result is cached. Enabling the flag is logged once.
func MdbxReadAhead() bool {
	mdbxReadaheadOnce.Do(func() {
		switch os.Getenv("MDBX_READAHEAD") {
		case "true":
			mdbxReadahead = true
			log.Info("[Experiment]", "MDBX_READAHEAD", mdbxReadahead)
		}
	})
	return mdbxReadahead
}
var (
	discardHistory     bool
	discardHistoryOnce sync.Once
)

// DiscardHistory reports whether the DISCARD_HISTORY environment variable
// equals exactly "true". Only the first call reads the environment; the
// outcome is cached afterwards. Enabling the flag is logged once.
func DiscardHistory() bool {
	discardHistoryOnce.Do(func() {
		requested := os.Getenv("DISCARD_HISTORY")
		if requested != "true" {
			return
		}
		discardHistory = true
		log.Info("[Experiment]", "DISCARD_HISTORY", discardHistory)
	})
	return discardHistory
}
var (
	bigRoTx    uint
	getBigRoTx sync.Once
)

// BigRoTxKb returns the number stored in the DEBUG_BIG_RO_TX_KB environment
// variable, or 0 when the variable is unset or empty. According to the
// original comment the setting is used to print logs with info about large
// read-only transactions. The environment is read on the first call only.
//
// It panics with the parse error when the value is not an integer. The parsed
// int is converted with uint(...), so a negative value wraps around rather
// than being rejected.
//
// NOTE(review): the previous comment here also listed DEBUG_SLOW_COMMIT_MS;
// nothing visible in this file reads that name (SlowCommit reads SLOW_COMMIT)
// — confirm whether it still exists.
func BigRoTxKb() uint {
	getBigRoTx.Do(func() {
		raw := os.Getenv("DEBUG_BIG_RO_TX_KB")
		if raw == "" {
			return
		}
		kb, err := strconv.Atoi(raw)
		if err != nil {
			panic(err)
		}
		bigRoTx = uint(kb)
		log.Info("[Experiment]", "DEBUG_BIG_RO_TX_KB", bigRoTx)
	})
	return bigRoTx
}
var (
	bigRwTx    uint
	getBigRwTx sync.Once
)

// BigRwTxKb returns the number stored in the DEBUG_BIG_RW_TX_KB environment
// variable, or 0 when the variable is unset or empty. The environment is read
// on the first call only and the result is cached.
//
// It panics with the parse error when the value is not an integer. The parsed
// int is converted with uint(...), so a negative value wraps around rather
// than being rejected.
func BigRwTxKb() uint {
	getBigRwTx.Do(func() {
		raw := os.Getenv("DEBUG_BIG_RW_TX_KB")
		if raw == "" {
			return
		}
		kb, err := strconv.Atoi(raw)
		if err != nil {
			panic(err)
		}
		bigRwTx = uint(kb)
		log.Info("[Experiment]", "DEBUG_BIG_RW_TX_KB", bigRwTx)
	})
	return bigRwTx
}
var (
	slowCommit     time.Duration
	slowCommitOnce sync.Once
)

// SlowCommit returns the duration stored in the SLOW_COMMIT environment
// variable, parsed with time.ParseDuration (for example "500ms" or "2s"), or 0
// when the variable is unset or empty. The environment is read on the first
// call only.
//
// It panics with the parse error when the value is not a valid duration.
func SlowCommit() time.Duration {
	slowCommitOnce.Do(func() {
		raw := os.Getenv("SLOW_COMMIT")
		if raw == "" {
			return
		}
		threshold, err := time.ParseDuration(raw)
		if err != nil {
			panic(err)
		}
		slowCommit = threshold
		log.Info("[Experiment]", "SLOW_COMMIT", slowCommit.String())
	})
	return slowCommit
}
var (
	slowTx     time.Duration
	slowTxOnce sync.Once
)

// SlowTx returns the duration stored in the SLOW_TX environment variable,
// parsed with time.ParseDuration, or 0 when the variable is unset or empty.
// The environment is read on the first call only.
//
// It panics with the parse error when the value is not a valid duration.
func SlowTx() time.Duration {
	slowTxOnce.Do(func() {
		raw := os.Getenv("SLOW_TX")
		if raw == "" {
			return
		}
		threshold, err := time.ParseDuration(raw)
		if err != nil {
			panic(err)
		}
		slowTx = threshold
		log.Info("[Experiment]", "SLOW_TX", slowTx.String())
	})
	return slowTx
}
var (
	stopBeforeStage     string
	stopBeforeStageFlag sync.Once
	stopAfterStage      string
	stopAfterStageFlag  sync.Once
)

// StopBeforeStage returns the value of the STOP_BEFORE_STAGE environment
// variable, or "" when it is unset or empty. Stage names are listed in
// eth/stagedsync/stages/stages.go. The environment is read on the first call
// only; a non-empty value is logged once.
func StopBeforeStage() string {
	stopBeforeStageFlag.Do(func() {
		if name := os.Getenv("STOP_BEFORE_STAGE"); name != "" {
			stopBeforeStage = name
			log.Info("[Experiment]", "STOP_BEFORE_STAGE", stopBeforeStage)
		}
	})
	return stopBeforeStage
}

// StopAfterStage returns the value of the STOP_AFTER_STAGE environment
// variable, or "" when it is unset or empty. Stage names are listed in
// eth/stagedsync/stages/stages.go. The environment is read on the first call
// only; a non-empty value is logged once.
//
// TODO(allada) We should possibly consider removing `STOP_BEFORE_STAGE`, as
// `STOP_AFTER_STAGE` can perform all the same functionality, but for backward
// compatibility reasons we are going to leave it.
func StopAfterStage() string {
	stopAfterStageFlag.Do(func() {
		if name := os.Getenv("STOP_AFTER_STAGE"); name != "" {
			stopAfterStage = name
			log.Info("[Experiment]", "STOP_AFTER_STAGE", stopAfterStage)
		}
	})
	return stopAfterStage
}
var (
	stopAfterReconst     bool
	stopAfterReconstOnce sync.Once
)

// StopAfterReconst reports whether the STOP_AFTER_RECONSTITUTE environment
// variable equals exactly "true". The variable is examined on the first call
// only and the result is cached. Enabling the flag is logged once.
func StopAfterReconst() bool {
	stopAfterReconstOnce.Do(func() {
		if os.Getenv("STOP_AFTER_RECONSTITUTE") != "true" {
			return
		}
		stopAfterReconst = true
		log.Info("[Experiment]", "STOP_AFTER_RECONSTITUTE", stopAfterReconst)
	})
	return stopAfterReconst
}
var (
	snapshotVersion     uint8
	snapshotVersionOnce sync.Once
)

// SnapshotVersion returns the version number stored in the SNAPSHOT_VERSION
// environment variable, or 0 when the variable is unset, empty, zero, or not a
// valid decimal number in the range 0..255. The environment is read on the
// first call only and the result is cached.
//
// Invalid values are ignored with a warning instead of being applied.
func SnapshotVersion() uint8 {
	snapshotVersionOnce.Do(func() {
		v := os.Getenv("SNAPSHOT_VERSION")
		if v == "" {
			return
		}
		parsed, err := strconv.ParseUint(v, 10, 8)
		if err != nil {
			// On a range error ParseUint returns the largest value for the bit
			// size (255 here) together with the error, so the result must not
			// be used: "300" would otherwise silently select version 255.
			log.Warn("[Experiment] ignoring invalid SNAPSHOT_VERSION", "value", v, "err", err)
			return
		}
		if parsed > 0 {
			snapshotVersion = uint8(parsed)
			log.Info("[Experiment]", "SNAPSHOT_VERSION", snapshotVersion)
		}
	})
	return snapshotVersion
}