2021-05-03 14:57:26 +00:00
|
|
|
package clientstats
|
|
|
|
|
|
|
|
import (
|
|
|
|
"bytes"
|
|
|
|
"encoding/json"
|
|
|
|
"fmt"
|
|
|
|
"io"
|
|
|
|
"net/http"
|
|
|
|
"strconv"
|
|
|
|
"time"
|
|
|
|
|
|
|
|
dto "github.com/prometheus/client_model/go"
|
|
|
|
"github.com/prometheus/prom2json"
|
2024-02-15 05:46:47 +00:00
|
|
|
eth "github.com/prysmaticlabs/prysm/v5/proto/prysm/v1alpha1"
|
2021-05-03 14:57:26 +00:00
|
|
|
log "github.com/sirupsen/logrus"
|
|
|
|
)
|
|
|
|
|
|
|
|
type beaconNodeScraper struct {
|
|
|
|
url string
|
|
|
|
tripper http.RoundTripper
|
|
|
|
}
|
|
|
|
|
|
|
|
func (bc *beaconNodeScraper) Scrape() (io.Reader, error) {
|
|
|
|
log.Infof("Scraping beacon-node at %s", bc.url)
|
|
|
|
pf, err := scrapeProm(bc.url, bc.tripper)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
2021-06-07 20:37:14 +00:00
|
|
|
bs := populateBeaconNodeStats(pf)
|
|
|
|
|
2021-05-03 14:57:26 +00:00
|
|
|
b, err := json.Marshal(bs)
|
|
|
|
return bytes.NewBuffer(b), err
|
|
|
|
}
|
|
|
|
|
|
|
|
// NewBeaconNodeScraper constructs a Scaper capable of scraping
|
|
|
|
// the prometheus endpoint of a beacon-node process and producing
|
|
|
|
// the json body for the beaconnode client-stats process type.
|
|
|
|
func NewBeaconNodeScraper(promExpoURL string) Scraper {
|
|
|
|
return &beaconNodeScraper{
|
|
|
|
url: promExpoURL,
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
type validatorScraper struct {
|
|
|
|
url string
|
|
|
|
tripper http.RoundTripper
|
|
|
|
}
|
|
|
|
|
|
|
|
func (vc *validatorScraper) Scrape() (io.Reader, error) {
|
|
|
|
log.Infof("Scraping validator at %s", vc.url)
|
|
|
|
pf, err := scrapeProm(vc.url, vc.tripper)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
2021-06-07 20:37:14 +00:00
|
|
|
vs := populateValidatorStats(pf)
|
|
|
|
|
2021-05-03 14:57:26 +00:00
|
|
|
b, err := json.Marshal(vs)
|
|
|
|
return bytes.NewBuffer(b), err
|
|
|
|
}
|
|
|
|
|
|
|
|
// NewValidatorScraper constructs a Scaper capable of scraping
|
|
|
|
// the prometheus endpoint of a validator process and producing
|
|
|
|
// the json body for the validator client-stats process type.
|
|
|
|
func NewValidatorScraper(promExpoURL string) Scraper {
|
|
|
|
return &validatorScraper{
|
|
|
|
url: promExpoURL,
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// note on tripper -- under the hood FetchMetricFamilies constructs an http.Client,
|
|
|
|
// which, if transport is nil, will just use the DefaultTransport, so we
|
|
|
|
// really only bother specifying the transport in tests, otherwise we let
|
|
|
|
// the zero-value (which is nil) flow through so that the default transport
|
|
|
|
// will be used.
|
|
|
|
func scrapeProm(url string, tripper http.RoundTripper) (map[string]*dto.MetricFamily, error) {
|
|
|
|
mfChan := make(chan *dto.MetricFamily)
|
2021-11-15 15:13:52 +00:00
|
|
|
errChan := make(chan error, 1)
|
2021-05-03 14:57:26 +00:00
|
|
|
go func() {
|
|
|
|
// FetchMetricFamilies handles grpc flavored prometheus ez
|
|
|
|
// but at the cost of the awkward channel select loop below
|
|
|
|
err := prom2json.FetchMetricFamilies(url, mfChan, tripper)
|
|
|
|
if err != nil {
|
|
|
|
errChan <- err
|
|
|
|
}
|
|
|
|
}()
|
|
|
|
result := make(map[string]*dto.MetricFamily)
|
|
|
|
// channel select accumulates results from FetchMetricFamilies
|
|
|
|
// unless there is an error.
|
|
|
|
for {
|
|
|
|
select {
|
|
|
|
case fam, chanOpen := <-mfChan:
|
2024-02-06 10:18:21 +00:00
|
|
|
// FetchMetricFamilies will close the channel when done
|
2021-05-03 14:57:26 +00:00
|
|
|
// at which point we want to stop the goroutine
|
|
|
|
if fam == nil && !chanOpen {
|
|
|
|
return result, nil
|
|
|
|
}
|
|
|
|
ptr := fam
|
|
|
|
result[fam.GetName()] = ptr
|
|
|
|
case err := <-errChan:
|
|
|
|
return result, err
|
|
|
|
}
|
|
|
|
if errChan == nil && mfChan == nil {
|
|
|
|
return result, nil
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
type metricMap map[string]*dto.MetricFamily
|
|
|
|
|
|
|
|
func (mm metricMap) getFamily(name string) (*dto.MetricFamily, error) {
|
|
|
|
f, ok := mm[name]
|
|
|
|
if !ok {
|
2021-05-13 06:29:14 +00:00
|
|
|
return nil, fmt.Errorf("scraper did not find metric family %s", name)
|
2021-05-03 14:57:26 +00:00
|
|
|
}
|
|
|
|
return f, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
var now = time.Now // var hook for tests to overwrite
|
2021-05-13 06:29:14 +00:00
|
|
|
var nanosPerMilli = int64(time.Millisecond) / int64(time.Nanosecond)
|
2021-05-03 14:57:26 +00:00
|
|
|
|
|
|
|
func populateAPIMessage(processName string) APIMessage {
|
|
|
|
return APIMessage{
|
|
|
|
Timestamp: now().UnixNano() / nanosPerMilli,
|
|
|
|
APIVersion: APIVersion,
|
|
|
|
ProcessName: processName,
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2021-06-07 20:37:14 +00:00
|
|
|
func populateCommonStats(pf metricMap) CommonStats {
|
2021-05-03 14:57:26 +00:00
|
|
|
cs := CommonStats{}
|
|
|
|
cs.ClientName = ClientName
|
|
|
|
var f *dto.MetricFamily
|
|
|
|
var m *dto.Metric
|
|
|
|
var err error
|
|
|
|
|
|
|
|
f, err = pf.getFamily("process_cpu_seconds_total")
|
|
|
|
if err != nil {
|
2021-06-07 20:37:14 +00:00
|
|
|
log.WithError(err).Debug("Failed to get process_cpu_seconds_total")
|
|
|
|
} else {
|
|
|
|
m = f.Metric[0]
|
|
|
|
// float64->int64: truncates fractional seconds
|
|
|
|
cs.CPUProcessSecondsTotal = int64(m.Counter.GetValue())
|
2021-05-03 14:57:26 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
f, err = pf.getFamily("process_resident_memory_bytes")
|
|
|
|
if err != nil {
|
2021-06-07 20:37:14 +00:00
|
|
|
log.WithError(err).Debug("Failed to get process_resident_memory_bytes")
|
|
|
|
} else {
|
|
|
|
m = f.Metric[0]
|
|
|
|
cs.MemoryProcessBytes = int64(m.Gauge.GetValue())
|
2021-05-03 14:57:26 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
f, err = pf.getFamily("prysm_version")
|
|
|
|
if err != nil {
|
2021-06-07 20:37:14 +00:00
|
|
|
log.WithError(err).Debug("Failed to get prysm_version")
|
|
|
|
} else {
|
|
|
|
m = f.Metric[0]
|
|
|
|
for _, l := range m.GetLabel() {
|
|
|
|
switch l.GetName() {
|
|
|
|
case "version":
|
|
|
|
cs.ClientVersion = l.GetValue()
|
|
|
|
case "buildDate":
|
|
|
|
buildDate, err := strconv.Atoi(l.GetValue())
|
|
|
|
if err != nil {
|
|
|
|
log.WithError(err).Debug("Failed to retrieve buildDate label from the prysm_version metric")
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
cs.ClientBuild = int64(buildDate)
|
2021-05-03 14:57:26 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2021-06-07 20:37:14 +00:00
|
|
|
return cs
|
2021-05-03 14:57:26 +00:00
|
|
|
}
|
|
|
|
|
2021-06-07 20:37:14 +00:00
|
|
|
func populateBeaconNodeStats(pf metricMap) BeaconNodeStats {
|
2021-05-03 14:57:26 +00:00
|
|
|
var err error
|
|
|
|
bs := BeaconNodeStats{}
|
2021-06-07 20:37:14 +00:00
|
|
|
bs.CommonStats = populateCommonStats(pf)
|
2021-05-03 14:57:26 +00:00
|
|
|
bs.APIMessage = populateAPIMessage(BeaconNodeProcessName)
|
|
|
|
|
|
|
|
var f *dto.MetricFamily
|
|
|
|
var m *dto.Metric
|
|
|
|
|
|
|
|
f, err = pf.getFamily("beacon_head_slot")
|
|
|
|
if err != nil {
|
2021-06-07 20:37:14 +00:00
|
|
|
log.WithError(err).Debug("Failed to get beacon_head_slot")
|
|
|
|
} else {
|
|
|
|
m = f.Metric[0]
|
|
|
|
bs.SyncBeaconHeadSlot = int64(m.Gauge.GetValue())
|
2021-05-03 14:57:26 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
f, err = pf.getFamily("beacon_clock_time_slot")
|
|
|
|
if err != nil {
|
2021-06-07 20:37:14 +00:00
|
|
|
log.WithError(err).Debug("Failed to get beacon_clock_time_slot")
|
|
|
|
} else {
|
|
|
|
m = f.Metric[0]
|
|
|
|
if int64(m.Gauge.GetValue()) == bs.SyncBeaconHeadSlot {
|
|
|
|
bs.SyncEth2Synced = true
|
|
|
|
}
|
2021-05-03 14:57:26 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
f, err = pf.getFamily("bcnode_disk_beaconchain_bytes_total")
|
|
|
|
if err != nil {
|
2021-06-07 20:37:14 +00:00
|
|
|
log.WithError(err).Debug("Failed to get bcnode_disk_beaconchain_bytes_total")
|
|
|
|
} else {
|
|
|
|
m = f.Metric[0]
|
|
|
|
bs.DiskBeaconchainBytesTotal = int64(m.Gauge.GetValue())
|
2021-05-03 14:57:26 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
f, err = pf.getFamily("p2p_peer_count")
|
|
|
|
if err != nil {
|
2021-06-07 20:37:14 +00:00
|
|
|
log.WithError(err).Debug("Failed to get p2p_peer_count")
|
|
|
|
} else {
|
|
|
|
for _, m := range f.Metric {
|
|
|
|
for _, l := range m.GetLabel() {
|
|
|
|
if l.GetName() == "state" {
|
|
|
|
if l.GetValue() == "Connected" {
|
|
|
|
bs.NetworkPeersConnected = int64(m.Gauge.GetValue())
|
|
|
|
}
|
2021-05-03 14:57:26 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2021-06-14 23:59:15 +00:00
|
|
|
f, err = pf.getFamily("powchain_sync_eth1_connected")
|
|
|
|
if err != nil {
|
|
|
|
log.WithError(err).Debug("Failed to get powchain_sync_eth1_connected")
|
|
|
|
} else {
|
|
|
|
m = f.Metric[0]
|
|
|
|
bs.SyncEth1Connected = false
|
|
|
|
if int64(m.Gauge.GetValue()) == 1 {
|
|
|
|
bs.SyncEth1Connected = true
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2021-06-07 20:37:14 +00:00
|
|
|
return bs
|
2021-05-03 14:57:26 +00:00
|
|
|
}
|
|
|
|
|
2021-05-03 22:24:27 +00:00
|
|
|
func statusIsActive(statusCode int64) bool {
|
|
|
|
s := eth.ValidatorStatus(statusCode)
|
|
|
|
return s.String() == "ACTIVE"
|
|
|
|
}
|
|
|
|
|
2021-06-07 20:37:14 +00:00
|
|
|
func populateValidatorStats(pf metricMap) ValidatorStats {
|
2021-05-03 14:57:26 +00:00
|
|
|
var err error
|
|
|
|
vs := ValidatorStats{}
|
2021-06-07 20:37:14 +00:00
|
|
|
vs.CommonStats = populateCommonStats(pf)
|
2021-05-03 14:57:26 +00:00
|
|
|
vs.APIMessage = populateAPIMessage(ValidatorProcessName)
|
2021-05-03 22:24:27 +00:00
|
|
|
|
|
|
|
f, err := pf.getFamily("validator_statuses")
|
|
|
|
if err != nil {
|
2021-06-07 20:37:14 +00:00
|
|
|
log.WithError(err).Debug("Failed to get validator_statuses")
|
|
|
|
} else {
|
|
|
|
for _, m := range f.Metric {
|
|
|
|
if statusIsActive(int64(m.Gauge.GetValue())) {
|
|
|
|
vs.ValidatorActive += 1
|
|
|
|
}
|
|
|
|
vs.ValidatorTotal += 1
|
2021-05-03 22:24:27 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2021-06-07 20:37:14 +00:00
|
|
|
return vs
|
2021-05-03 14:57:26 +00:00
|
|
|
}
|