erigon-pulse/erigon-lib/diagnostics/provider_test.go


package diagnostics_test

import (
	"context"
	"testing"
	"time"

	"github.com/ledgerwatch/erigon-lib/diagnostics"
	"github.com/ledgerwatch/log/v3"
)
// testInfo is a minimal diagnostics message carrying a counter, used by the tests below.
type testInfo struct {
	count int
}

func (ti testInfo) Type() diagnostics.Type {
	return diagnostics.TypeOf(ti)
}
// testProvider sends a testInfo message roughly once per second until its context is cancelled.
type testProvider struct{}

func (t *testProvider) StartDiagnostics(ctx context.Context) error {
	timer := time.NewTicker(1 * time.Second)
	defer timer.Stop()

	var count int

	for {
		select {
		case <-ctx.Done():
			return nil
		case <-timer.C:
			diagnostics.Send(testInfo{count})
			count++
		}
	}
}
func TestProviderRegistration(t *testing.T) {
	// diagnostics provider
	provider := &testProvider{}
	diagnostics.RegisterProvider(provider, diagnostics.TypeOf(testInfo{}), log.Root())

	// diagnostics receiver
	ctx, ch, cancel := diagnostics.Context[testInfo](context.Background(), 1)
	diagnostics.StartProviders(ctx, diagnostics.TypeOf(testInfo{}), log.Root())

	for info := range ch {
		if info.count == 3 {
			cancel()
		}
	}
}
func TestDelayedProviderRegistration(t *testing.T) {
	time.AfterFunc(1*time.Second, func() {
		// diagnostics provider
		provider := &testProvider{}
		diagnostics.RegisterProvider(provider, diagnostics.TypeOf(testInfo{}), log.Root())
	})

	// diagnostics receiver
	ctx, ch, cancel := diagnostics.Context[testInfo](context.Background(), 1)
	diagnostics.StartProviders(ctx, diagnostics.TypeOf(testInfo{}), log.Root())

	for info := range ch {
		if info.count == 3 {
			cancel()
		}
	}
}
func TestProviderFuncRegistration(t *testing.T) {
	// diagnostics provider
	diagnostics.RegisterProvider(diagnostics.ProviderFunc(func(ctx context.Context) error {
		timer := time.NewTicker(1 * time.Second)
		defer timer.Stop()

		var count int

		for {
			select {
			case <-ctx.Done():
				return nil
			case <-timer.C:
				diagnostics.Send(testInfo{count})
				count++
			}
		}
	}), diagnostics.TypeOf(testInfo{}), log.Root())

	// diagnostics receiver
	ctx, ch, cancel := diagnostics.Context[testInfo](context.Background(), 1)
	diagnostics.StartProviders(ctx, diagnostics.TypeOf(testInfo{}), log.Root())

	for info := range ch {
		if info.count == 3 {
			cancel()
		}
	}
}