mirror of
https://gitlab.com/pulsechaincom/erigon-pulse.git
synced 2025-01-08 12:01:20 +00:00
79ed8cad35
This change introduces additional processes to manage snapshot uploading for E2 snapshots: ## erigon snapshots upload The `snapshots uploader` command starts a version of erigon customized for uploading snapshot files to a remote location. It breaks the stage execution process after the senders stage and then uses the snapshot stage to send uploaded headers, bodies and (in the case of polygon) bor spans and events to snapshot files. Because this process avoids execution, it runs significantly faster than a standard erigon configuration. The uploader uses rclone to send seedable (100K or 500K blocks) files to a remote storage location specified in the rclone config file. The **uploader** is configured to minimize disk usage by doing the following: * It removes snapshots once they are loaded * It aggressively prunes the database once entities are transferred to snapshots. In addition to this, it has the following performance-related features: * Maximizes the workers allocated to snapshot processing to improve throughput * Can be started from scratch by downloading the latest snapshots from the remote location to seed processing ## snapshots command Is a standalone command for managing remote snapshots; it has the following sub commands: * **cmp** - compare snapshots * **copy** - copy snapshots * **verify** - verify snapshots * **manifest** - manage the manifest file in the root of remote snapshot locations * **torrent** - manage snapshot torrent files
214 lines
7.5 KiB
Go
214 lines
7.5 KiB
Go
/*
|
|
Copyright 2021 Erigon contributors
|
|
|
|
Licensed under the Apache License, Version 2.0 (the "License");
|
|
you may not use this file except in compliance with the License.
|
|
You may obtain a copy of the License at
|
|
|
|
http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
Unless required by applicable law or agreed to in writing, software
|
|
distributed under the License is distributed on an "AS IS" BASIS,
|
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
See the License for the specific language governing permissions and
|
|
limitations under the License.
|
|
*/
|
|
|
|
package downloadercfg
|
|
|
|
import (
|
|
"net"
|
|
"net/url"
|
|
"os"
|
|
"path/filepath"
|
|
"runtime"
|
|
"strings"
|
|
"time"
|
|
|
|
"github.com/anacrolix/dht/v2"
|
|
lg "github.com/anacrolix/log"
|
|
"github.com/anacrolix/torrent"
|
|
"github.com/c2h5oh/datasize"
|
|
"github.com/ledgerwatch/erigon-lib/chain/snapcfg"
|
|
"github.com/ledgerwatch/erigon-lib/common/datadir"
|
|
"github.com/ledgerwatch/erigon-lib/common/dir"
|
|
"github.com/ledgerwatch/log/v3"
|
|
"golang.org/x/time/rate"
|
|
)
|
|
|
|
// DefaultPieceSize is the torrent piece size, in bytes (2 MiB).
// Erigon serves many big files; larger pieces mean fewer network
// announcements, but a piece can't go over 2Mb.
// See https://wiki.theory.org/BitTorrentSpecification#Metainfo_File_Structure
const DefaultPieceSize = 2 << 20
|
|
|
|
// DefaultNetworkChunkSize is how much data is requested from a peer per
// network call, in bytes (256 KiB).
// NOTE(review): the previous comment said "default: 16Kb"; presumably that is
// the torrent library's own default rather than this value - confirm.
const DefaultNetworkChunkSize = 256 << 10
|
|
|
|
type Cfg struct {
|
|
ClientConfig *torrent.ClientConfig
|
|
DownloadSlots int
|
|
|
|
WebSeedUrls []*url.URL
|
|
WebSeedFiles []string
|
|
WebSeedS3Tokens []string
|
|
ExpectedTorrentFilesHashes snapcfg.Preverified
|
|
DownloadTorrentFilesFromWebseed bool
|
|
AddTorrentsFromDisk bool
|
|
ChainName string
|
|
|
|
Dirs datadir.Dirs
|
|
}
|
|
|
|
func Default() *torrent.ClientConfig {
|
|
torrentConfig := torrent.NewDefaultClientConfig()
|
|
// better don't increase because erigon periodically producing "new seedable files" - and adding them to downloader.
|
|
// it must not impact chain tip sync - so, limit resources to minimum by default.
|
|
// but when downloader is started as a separated process - rise it to max
|
|
//torrentConfig.PieceHashersPerTorrent = cmp.Max(1, runtime.NumCPU()-1)
|
|
|
|
torrentConfig.MinDialTimeout = 6 * time.Second //default: 3s
|
|
torrentConfig.HandshakesTimeout = 8 * time.Second //default: 4s
|
|
|
|
// enable dht
|
|
torrentConfig.NoDHT = true
|
|
//torrentConfig.DisableTrackers = true
|
|
//torrentConfig.DisableWebtorrent = true
|
|
|
|
// Reduce defaults - to avoid peers with very bad geography
|
|
//torrentConfig.MinDialTimeout = 1 * time.Second // default: 3sec
|
|
//torrentConfig.NominalDialTimeout = 10 * time.Second // default: 20sec
|
|
//torrentConfig.HandshakesTimeout = 1 * time.Second // default: 4sec
|
|
|
|
// see: https://en.wikipedia.org/wiki/TCP_half-open
|
|
//torrentConfig.TotalHalfOpenConns = 100 // default: 100
|
|
//torrentConfig.HalfOpenConnsPerTorrent = 25 // default: 25
|
|
//torrentConfig.TorrentPeersHighWater = 500 // default: 500
|
|
//torrentConfig.TorrentPeersLowWater = 50 // default: 50
|
|
|
|
torrentConfig.Seed = true
|
|
torrentConfig.UpnpID = torrentConfig.UpnpID + "leecher"
|
|
|
|
return torrentConfig
|
|
}
|
|
|
|
func New(dirs datadir.Dirs, version string, verbosity lg.Level, downloadRate, uploadRate datasize.ByteSize, port, connsPerFile, downloadSlots int, staticPeers, webseeds []string, chainName string) (*Cfg, error) {
|
|
torrentConfig := Default()
|
|
torrentConfig.DataDir = dirs.Snap // `DataDir` of torrent-client-lib is different from Erigon's `DataDir`. Just same naming.
|
|
|
|
torrentConfig.ExtendedHandshakeClientVersion = version
|
|
|
|
// We would-like to reduce amount of goroutines in Erigon, so reducing next params
|
|
torrentConfig.EstablishedConnsPerTorrent = connsPerFile // default: 50
|
|
|
|
torrentConfig.ListenPort = port
|
|
// check if ipv6 is enabled
|
|
torrentConfig.DisableIPv6 = !getIpv6Enabled()
|
|
|
|
torrentConfig.UploadRateLimiter = rate.NewLimiter(rate.Limit(uploadRate.Bytes()), DefaultNetworkChunkSize) // default: unlimited
|
|
if downloadRate.Bytes() < 500_000_000 {
|
|
torrentConfig.DownloadRateLimiter = rate.NewLimiter(rate.Limit(downloadRate.Bytes()), DefaultNetworkChunkSize) // default: unlimited
|
|
}
|
|
|
|
// debug
|
|
//torrentConfig.Debug = true
|
|
torrentConfig.Logger = torrentConfig.Logger.WithFilterLevel(verbosity)
|
|
torrentConfig.Logger.SetHandlers(adapterHandler{})
|
|
|
|
if len(staticPeers) > 0 {
|
|
torrentConfig.NoDHT = false
|
|
//defaultNodes := torrentConfig.DhtStartingNodes
|
|
torrentConfig.DhtStartingNodes = func(network string) dht.StartingNodesGetter {
|
|
return func() ([]dht.Addr, error) {
|
|
addrs, err := dht.GlobalBootstrapAddrs(network)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
for _, seed := range staticPeers {
|
|
if network == "udp" {
|
|
var addr *net.UDPAddr
|
|
addr, err := net.ResolveUDPAddr(network, seed+":80")
|
|
if err != nil {
|
|
log.Warn("[downloader] Cannot UDP resolve address", "network", network, "addr", seed)
|
|
continue
|
|
}
|
|
addrs = append(addrs, dht.NewAddr(addr))
|
|
}
|
|
if network == "tcp" {
|
|
var addr *net.TCPAddr
|
|
addr, err := net.ResolveTCPAddr(network, seed+":80")
|
|
if err != nil {
|
|
log.Warn("[downloader] Cannot TCP resolve address", "network", network, "addr", seed)
|
|
continue
|
|
}
|
|
addrs = append(addrs, dht.NewAddr(addr))
|
|
}
|
|
}
|
|
return addrs, nil
|
|
}
|
|
}
|
|
//staticPeers
|
|
}
|
|
|
|
webseedUrlsOrFiles := webseeds
|
|
webseedHttpProviders := make([]*url.URL, 0, len(webseedUrlsOrFiles))
|
|
webseedFileProviders := make([]string, 0, len(webseedUrlsOrFiles))
|
|
webseedS3Providers := make([]string, 0, len(webseedUrlsOrFiles))
|
|
for _, webseed := range webseedUrlsOrFiles {
|
|
if !strings.HasPrefix(webseed, "v") { // has marker v1/v2/...
|
|
uri, err := url.ParseRequestURI(webseed)
|
|
if err != nil {
|
|
if strings.HasSuffix(webseed, ".toml") && dir.FileExist(webseed) {
|
|
webseedFileProviders = append(webseedFileProviders, webseed)
|
|
}
|
|
continue
|
|
}
|
|
webseedHttpProviders = append(webseedHttpProviders, uri)
|
|
continue
|
|
}
|
|
|
|
if strings.HasPrefix(webseed, "v1:") {
|
|
withoutVerisonPrefix := webseed[3:]
|
|
if !strings.HasPrefix(withoutVerisonPrefix, "https:") {
|
|
webseedS3Providers = append(webseedS3Providers, webseed)
|
|
continue
|
|
}
|
|
uri, err := url.ParseRequestURI(withoutVerisonPrefix)
|
|
if err != nil {
|
|
log.Warn("[webseed] can't parse url", "err", err, "url", withoutVerisonPrefix)
|
|
continue
|
|
}
|
|
webseedHttpProviders = append(webseedHttpProviders, uri)
|
|
} else {
|
|
continue
|
|
}
|
|
}
|
|
localCfgFile := filepath.Join(dirs.DataDir, "webseed.toml") // datadir/webseed.toml allowed
|
|
if dir.FileExist(localCfgFile) {
|
|
webseedFileProviders = append(webseedFileProviders, localCfgFile)
|
|
}
|
|
//TODO: if don't pass "downloaded files list here" (which we store in db) - synced erigon will download new .torrent files. And erigon can't work with "unfinished" files.
|
|
snapCfg := snapcfg.KnownCfg(chainName, 0)
|
|
return &Cfg{Dirs: dirs, ChainName: chainName,
|
|
ClientConfig: torrentConfig, DownloadSlots: downloadSlots,
|
|
WebSeedUrls: webseedHttpProviders, WebSeedFiles: webseedFileProviders, WebSeedS3Tokens: webseedS3Providers,
|
|
DownloadTorrentFilesFromWebseed: true, AddTorrentsFromDisk: true, ExpectedTorrentFilesHashes: snapCfg.Preverified,
|
|
}, nil
|
|
}
|
|
|
|
func getIpv6Enabled() bool {
|
|
if runtime.GOOS == "linux" {
|
|
file, err := os.ReadFile("/sys/module/ipv6/parameters/disable")
|
|
if err != nil {
|
|
log.Warn("could not read /sys/module/ipv6/parameters/disable for ipv6 detection")
|
|
return false
|
|
}
|
|
fileContent := strings.TrimSpace(string(file))
|
|
return fileContent != "0"
|
|
}
|
|
|
|
// TODO hotfix: for platforms other than linux disable ipv6
|
|
return false
|
|
}
|