prysm-pulse/shared/deprecated-p2p/monitoring.go
2019-08-24 10:07:03 -06:00

76 lines
1.9 KiB
Go

package p2p
import (
"context"
"time"
host "github.com/libp2p/go-libp2p-host"
"github.com/prometheus/client_golang/prometheus"
"github.com/prometheus/client_golang/prometheus/promauto"
)
// propagationTimeMetric is the "p2p_propagation_time_sec" histogram. Its
// buckets are the Prometheus default buckets extended with 20, 30, 60 and 90
// so that slower propagation times still land in a finite bucket.
var propagationTimeMetric = promauto.NewHistogram(prometheus.HistogramOpts{
	Name:    "p2p_propagation_time_sec",
	Help:    "The time between message sent/received from peer",
	Buckets: append(prometheus.DefBuckets, 20, 30, 60, 90),
})
// startPeerWatcher launches a background goroutine that, until ctx is
// cancelled, repeatedly updates the "p2p_peer_count" gauge with the current
// peer count and calls ensurePeerConnections to reconnect any VIP peers such
// as the bootnode peer, the relay node peer or the static peers.
//
// The function itself returns immediately; the goroutine exits once ctx is
// done. Between two refreshes the goroutine waits 5 seconds, and that wait is
// interrupted right away when ctx is cancelled.
//
// NOTE(review): the gauge is created through promauto on every call, so
// invoking this function more than once per process is expected to panic on
// duplicate metric registration — confirm callers start only one watcher.
func startPeerWatcher(ctx context.Context, h host.Host, reconnectPeers ...string) {
	// Pause between the end of one refresh and the start of the next.
	const refreshInterval = 5 * time.Second

	peerCountMetric := promauto.NewGauge(prometheus.GaugeOpts{
		Name: "p2p_peer_count",
		Help: "The number of currently connected peers",
	})

	go func() {
		for {
			// Do no work at all if the context has already been cancelled.
			if ctx.Err() != nil {
				return
			}

			peerCountMetric.Set(float64(peerCount(h)))
			ensurePeerConnections(ctx, h, reconnectPeers...)

			// Wait for the next refresh, but wake up immediately on
			// cancellation instead of sleeping through it.
			wait := time.NewTimer(refreshInterval)
			select {
			case <-ctx.Done():
				wait.Stop()
				return
			case <-wait.C:
			}
		}
	}()
}
// peerCount reports how many peers the host's network currently lists.
func peerCount(h host.Host) int {
	connected := h.Network().Peers()
	return len(connected)
}
// ensurePeerConnections will attempt to reestablish connection to the peers
// if there are currently no connections to that peer.
//
// Each entry of peers is parsed with MakePeer. Empty entries are skipped, and
// entries that fail to parse are logged and skipped. Every reconnection
// attempt is bounded by a 30 second timeout derived from ctx. Failures are
// only logged; nothing is returned to the caller.
func ensurePeerConnections(ctx context.Context, h host.Host, peers ...string) {
	// Upper bound for a single reconnection attempt.
	const connectTimeout = 30 * time.Second

	for _, p := range peers {
		if p == "" {
			continue
		}
		info, err := MakePeer(p)
		if err != nil {
			log.Errorf("Could not make peer: %v", err)
			continue
		}
		// Nothing to do when at least one connection to the peer exists.
		if len(h.Network().ConnsToPeer(info.ID)) != 0 {
			continue
		}

		log.WithField("peer", info.ID).Debug("No connections to peer, reconnecting")

		// Release the timeout context as soon as the attempt finishes. A
		// defer inside the loop would keep every context (and its timer)
		// alive until the whole function returns.
		connectCtx, cancel := context.WithTimeout(ctx, connectTimeout)
		err = h.Connect(connectCtx, *info)
		cancel()
		if err != nil {
			log.WithField("peer", info.ID).WithField("addrs", info.Addrs).Errorf("Failed to reconnect to peer %v", err)
		}
	}
}