mirror of
https://gitlab.com/pulsechaincom/erigon-pulse.git
synced 2025-01-06 19:12:19 +00:00
509a7af26a
This fixes an issue where mumbai testnet nodes struggle to find peers. Before this fix, peer numbers in general testing are typically around 20 in total between eth66, eth67 and eth68. Some new nodes can struggle to find even a single peer after days of operation. These are the numbers after 12 hours of running on a node which previously could not find any peers: eth66=13, eth67=76, eth68=91. The root cause of this issue is the following: - A significant number of mumbai peers around the boot node return network ids which are different from those currently available in the DHT. - The available nodes are all consequently busy and return 'too many peers' for long periods. These issues cause a significant number of discovery timeouts, and some of the queries will never receive a response. This causes the discovery read loop to enter a channel deadlock, which means that no responses are processed and no timeouts are fired. This causes the discovery process in the node to stop. From then on it just re-requests handshakes from a relatively small number of peers. This check-in fixes this situation with the following changes: - Remove the deadlock by running the timer in a separate goroutine so it can run independently of the main request processing. - Allow the discovery process matcher to match on port if no id match can be established on the initial ping. This allows subsequent node validation to proceed, and if the node proves to be valid via the remainder of the look-up and handshake process it is used as a valid peer. - Completely unsolicited responses, i.e. those which come from a completely unknown ip:port combination, continue to be ignored.
270 lines
6.9 KiB
Go
270 lines
6.9 KiB
Go
// Copyright 2018 The go-ethereum Authors
|
|
// This file is part of the go-ethereum library.
|
|
//
|
|
// The go-ethereum library is free software: you can redistribute it and/or modify
|
|
// it under the terms of the GNU Lesser General Public License as published by
|
|
// the Free Software Foundation, either version 3 of the License, or
|
|
// (at your option) any later version.
|
|
//
|
|
// The go-ethereum library is distributed in the hope that it will be useful,
|
|
// but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
// GNU Lesser General Public License for more details.
|
|
//
|
|
// You should have received a copy of the GNU Lesser General Public License
|
|
// along with the go-ethereum library. If not, see <http://www.gnu.org/licenses/>.
|
|
|
|
package discover
|
|
|
|
import (
|
|
"bytes"
|
|
"context"
|
|
"crypto/ecdsa"
|
|
"encoding/hex"
|
|
"errors"
|
|
"fmt"
|
|
"math/rand"
|
|
"net"
|
|
"sort"
|
|
"sync"
|
|
"time"
|
|
|
|
"github.com/ledgerwatch/erigon/crypto"
|
|
"github.com/ledgerwatch/erigon/p2p/enode"
|
|
"github.com/ledgerwatch/erigon/p2p/enr"
|
|
"github.com/ledgerwatch/log/v3"
|
|
)
|
|
|
|
// nullNode is a placeholder node shared by the test helpers in this file.
// It is assigned once in init and handed out by pingRecorder.Self.
var nullNode *enode.Node
|
|
|
|
func init() {
|
|
var r enr.Record
|
|
r.Set(enr.IP{0, 0, 0, 0})
|
|
nullNode = enode.SignNull(&r, enode.ID{})
|
|
}
|
|
|
|
func newTestTable(t transport, tmpDir string) (*Table, *enode.DB) {
|
|
db, err := enode.OpenDB(context.Background(), "", tmpDir)
|
|
if err != nil {
|
|
panic(err)
|
|
}
|
|
tab, _ := newTable(t, "test", db, nil, time.Hour, log.Root())
|
|
go tab.loop()
|
|
return tab, db
|
|
}
|
|
|
|
// nodeAtDistance creates a node for which enode.LogDist(base, n.id) == ld.
|
|
func nodeAtDistance(base enode.ID, ld int, ip net.IP) *node {
|
|
var r enr.Record
|
|
r.Set(enr.IP(ip))
|
|
return wrapNode(enode.SignNull(&r, idAtDistance(base, ld)))
|
|
}
|
|
|
|
// nodesAtDistance creates n nodes for which enode.LogDist(base, node.ID()) == ld.
|
|
func nodesAtDistance(base enode.ID, ld int, n int) []*enode.Node {
|
|
results := make([]*enode.Node, 0, n)
|
|
nodeSet := make(map[enode.ID]bool, n)
|
|
for len(results) < n {
|
|
node := unwrapNode(nodeAtDistance(base, ld, intIP(len(results)+1)))
|
|
// idAtDistance might return an ID that's already generated
|
|
// make sure that the node has a unique ID, otherwise regenerate
|
|
if !nodeSet[node.ID()] {
|
|
nodeSet[node.ID()] = true
|
|
results = append(results, node)
|
|
}
|
|
}
|
|
return results
|
|
}
|
|
|
|
func nodesToRecords(nodes []*enode.Node) []*enr.Record {
|
|
records := make([]*enr.Record, len(nodes))
|
|
for i := range nodes {
|
|
records[i] = nodes[i].Record()
|
|
}
|
|
return records
|
|
}
|
|
|
|
// idAtDistance returns a random hash such that enode.LogDist(a, b) == n
|
|
func idAtDistance(a enode.ID, n int) (b enode.ID) {
|
|
if n == 0 {
|
|
return a
|
|
}
|
|
// flip bit at position n, fill the rest with random bits
|
|
b = a
|
|
pos := len(a) - n/8 - 1
|
|
bit := byte(0x01) << (byte(n%8) - 1)
|
|
if bit == 0 {
|
|
pos++
|
|
bit = 0x80
|
|
}
|
|
b[pos] = a[pos]&^bit | ^a[pos]&bit // TODO: randomize end bits
|
|
for i := pos + 1; i < len(a); i++ {
|
|
b[i] = byte(rand.Intn(255))
|
|
}
|
|
return b
|
|
}
|
|
|
|
// intIP maps i to the four-byte IP address b.0.2.b, where b is i truncated
// to a single byte.
func intIP(i int) net.IP {
	b := byte(i)
	ip := make(net.IP, net.IPv4len)
	ip[0], ip[1], ip[2], ip[3] = b, 0, 2, b
	return ip
}
|
|
|
|
// fillBucket inserts nodes into the given bucket until it is full.
|
|
func fillBucket(tab *Table, n *node) (last *node) {
|
|
ld := enode.LogDist(tab.self().ID(), n.ID())
|
|
b := tab.bucket(n.ID())
|
|
for len(b.entries) < bucketSize {
|
|
b.entries = append(b.entries, nodeAtDistance(tab.self().ID(), ld, intIP(ld)))
|
|
}
|
|
return b.entries[bucketSize-1]
|
|
}
|
|
|
|
// fillTable adds nodes the table to the end of their corresponding bucket
|
|
// if the bucket is not full. The caller must not hold tab.mutex.
|
|
func fillTable(tab *Table, nodes []*node) {
|
|
for _, n := range nodes {
|
|
tab.addSeenNode(n)
|
|
}
|
|
}
|
|
|
|
type pingRecorder struct {
|
|
mu sync.Mutex
|
|
dead, pinged map[enode.ID]bool
|
|
records map[enode.ID]*enode.Node
|
|
n *enode.Node
|
|
}
|
|
|
|
func newPingRecorder() *pingRecorder {
|
|
var r enr.Record
|
|
r.Set(enr.IP{0, 0, 0, 0})
|
|
n := enode.SignNull(&r, enode.ID{})
|
|
|
|
return &pingRecorder{
|
|
dead: make(map[enode.ID]bool),
|
|
pinged: make(map[enode.ID]bool),
|
|
records: make(map[enode.ID]*enode.Node),
|
|
n: n,
|
|
}
|
|
}
|
|
|
|
// setRecord updates a node record. Future calls to ping and
|
|
// requestENR will return this record.
|
|
func (t *pingRecorder) updateRecord(n *enode.Node) {
|
|
t.mu.Lock()
|
|
defer t.mu.Unlock()
|
|
t.records[n.ID()] = n
|
|
}
|
|
|
|
// Stubs to satisfy the transport interface.
|
|
func (t *pingRecorder) Self() *enode.Node { return nullNode }
|
|
func (t *pingRecorder) Version() string { return "none" }
|
|
func (t *pingRecorder) Errors() map[string]uint { return nil }
|
|
func (t *pingRecorder) LenUnsolicited() int { return 0 }
|
|
func (t *pingRecorder) lookupSelf() []*enode.Node { return nil }
|
|
func (t *pingRecorder) lookupRandom() []*enode.Node { return nil }
|
|
|
|
// ping simulates a ping request.
|
|
func (t *pingRecorder) ping(n *enode.Node) (seq uint64, err error) {
|
|
t.mu.Lock()
|
|
defer t.mu.Unlock()
|
|
|
|
t.pinged[n.ID()] = true
|
|
if t.dead[n.ID()] {
|
|
return 0, errTimeout
|
|
}
|
|
if t.records[n.ID()] != nil {
|
|
seq = t.records[n.ID()].Seq()
|
|
}
|
|
return seq, nil
|
|
}
|
|
|
|
// requestENR simulates an ENR request.
|
|
func (t *pingRecorder) RequestENR(n *enode.Node) (*enode.Node, error) {
|
|
t.mu.Lock()
|
|
defer t.mu.Unlock()
|
|
|
|
if t.dead[n.ID()] || t.records[n.ID()] == nil {
|
|
return nil, errTimeout
|
|
}
|
|
return t.records[n.ID()], nil
|
|
}
|
|
|
|
func hasDuplicates(slice []*node) bool {
|
|
seen := make(map[enode.ID]bool)
|
|
for i, e := range slice {
|
|
if e == nil {
|
|
panic(fmt.Sprintf("nil *Node at %d", i))
|
|
}
|
|
if seen[e.ID()] {
|
|
return true
|
|
}
|
|
seen[e.ID()] = true
|
|
}
|
|
return false
|
|
}
|
|
|
|
// checkNodesEqual checks whether the two given node lists contain the same nodes.
|
|
func checkNodesEqual(got, want []*enode.Node) error {
|
|
if len(got) == len(want) {
|
|
for i := range got {
|
|
if !nodeEqual(got[i], want[i]) {
|
|
goto NotEqual
|
|
}
|
|
}
|
|
}
|
|
return nil
|
|
|
|
NotEqual:
|
|
output := new(bytes.Buffer)
|
|
fmt.Fprintf(output, "got %d nodes:\n", len(got))
|
|
for _, n := range got {
|
|
fmt.Fprintf(output, " %v %v\n", n.ID(), n)
|
|
}
|
|
fmt.Fprintf(output, "want %d:\n", len(want))
|
|
for _, n := range want {
|
|
fmt.Fprintf(output, " %v %v\n", n.ID(), n)
|
|
}
|
|
return errors.New(output.String())
|
|
}
|
|
|
|
func nodeEqual(n1 *enode.Node, n2 *enode.Node) bool {
|
|
return n1.ID() == n2.ID() && n1.IP().Equal(n2.IP())
|
|
}
|
|
|
|
func sortByID(nodes []*enode.Node) {
|
|
sort.Slice(nodes, func(i, j int) bool {
|
|
return string(nodes[i].ID().Bytes()) < string(nodes[j].ID().Bytes())
|
|
})
|
|
}
|
|
|
|
func sortedByDistanceTo(distbase enode.ID, slice []*node) bool {
|
|
return sort.SliceIsSorted(slice, func(i, j int) bool {
|
|
return enode.DistCmp(distbase, slice[i].ID(), slice[j].ID()) < 0
|
|
})
|
|
}
|
|
|
|
// hexEncPrivkey decodes h as a private key.
|
|
func hexEncPrivkey(h string) *ecdsa.PrivateKey {
|
|
b, err := hex.DecodeString(h)
|
|
if err != nil {
|
|
panic(err)
|
|
}
|
|
key, err := crypto.ToECDSA(b)
|
|
if err != nil {
|
|
panic(err)
|
|
}
|
|
return key
|
|
}
|
|
|
|
// hexEncPubkey decodes h as a public key.
|
|
func hexEncPubkey(h string) (ret enode.PubkeyEncoded) {
|
|
b, err := hex.DecodeString(h)
|
|
if err != nil {
|
|
panic(err)
|
|
}
|
|
if len(b) != len(ret) {
|
|
panic("invalid length")
|
|
}
|
|
copy(ret[:], b)
|
|
return ret
|
|
}
|