mirror of
https://gitlab.com/pulsechaincom/prysm-pulse.git
synced 2025-01-08 02:31:19 +00:00
9fcb9b86af
* fix 1-worker underflow; lower default batch size * adding test for single item in batcher --------- Co-authored-by: Kasey Kirkham <kasey@users.noreply.github.com>
202 lines
6.8 KiB
Go
202 lines
6.8 KiB
Go
package backfill
|
|
|
|
import (
|
|
"github.com/pkg/errors"
|
|
"github.com/prysmaticlabs/prysm/v5/consensus-types/primitives"
|
|
)
|
|
|
|
var errMaxBatches = errors.New("backfill batch requested in excess of max outstanding batches")
|
|
var errEndSequence = errors.New("sequence has terminated, no more backfill batches will be produced")
|
|
var errCannotDecreaseMinimum = errors.New("the minimum backfill slot can only be increased, not decreased")
|
|
|
|
type batchSequencer struct {
|
|
batcher batcher
|
|
seq []batch
|
|
}
|
|
|
|
// sequence() is meant as a verb "arrange in a particular order".
|
|
// sequence determines the next set of batches that should be worked on based on the state of the batches
|
|
// in its internal view. sequence relies on update() for updates to its view of the
|
|
// batches it has previously sequenced.
|
|
func (c *batchSequencer) sequence() ([]batch, error) {
|
|
s := make([]batch, 0)
|
|
// batch start slots are in descending order, c.seq[n].begin == c.seq[n+1].end
|
|
for i := range c.seq {
|
|
switch c.seq[i].state {
|
|
case batchInit, batchErrRetryable:
|
|
c.seq[i] = c.seq[i].withState(batchSequenced)
|
|
s = append(s, c.seq[i])
|
|
case batchNil:
|
|
// batchNil is the zero value of the batch type.
|
|
// This case means that we are initializing a batch that was created by the
|
|
// initial allocation of the seq slice, so batcher need to compute its bounds.
|
|
var b batch
|
|
if i == 0 {
|
|
// The first item in the list is a special case, subsequent items are initialized
|
|
// relative to the preceding batches.
|
|
b = c.batcher.before(c.batcher.max)
|
|
} else {
|
|
b = c.batcher.beforeBatch(c.seq[i-1])
|
|
}
|
|
c.seq[i] = b.withState(batchSequenced)
|
|
s = append(s, c.seq[i])
|
|
case batchEndSequence:
|
|
if len(s) == 0 {
|
|
s = append(s, c.seq[i])
|
|
}
|
|
default:
|
|
continue
|
|
}
|
|
}
|
|
if len(s) == 0 {
|
|
return nil, errMaxBatches
|
|
}
|
|
|
|
return s, nil
|
|
}
|
|
|
|
// update serves 2 roles.
|
|
// - updating batchSequencer's copy of the given batch.
|
|
// - removing batches that are completely imported from the sequence,
|
|
// so that they are not returned the next time import() is called, and populating
|
|
// seq with new batches that are ready to be worked on.
|
|
func (c *batchSequencer) update(b batch) {
|
|
done := 0
|
|
for i := 0; i < len(c.seq); i++ {
|
|
if b.replaces(c.seq[i]) {
|
|
c.seq[i] = b
|
|
}
|
|
// Assumes invariant that batches complete and update is called in order.
|
|
// This should be true because the code using the sequencer doesn't know the expected parent
|
|
// for a batch until it imports the previous batch.
|
|
if c.seq[i].state == batchImportComplete {
|
|
done += 1
|
|
continue
|
|
}
|
|
// Move the unfinished batches to overwrite the finished ones.
|
|
// eg consider [a,b,c,d,e] where a,b are done
|
|
// when i==2, done==2 (since done was incremented for a and b)
|
|
// so we want to copy c to a, then on i=3, d to b, then on i=4 e to c.
|
|
c.seq[i-done] = c.seq[i]
|
|
}
|
|
if done == 1 && len(c.seq) == 1 {
|
|
c.seq[0] = c.batcher.beforeBatch(c.seq[0])
|
|
return
|
|
}
|
|
// Overwrite the moved batches with the next ones in the sequence.
|
|
// Continuing the example in the comment above, len(c.seq)==5, done=2, so i=3.
|
|
// We want to replace index 3 with the batch that should be processed after index 2,
|
|
// which was previously the earliest known batch, and index 4 with the batch that should
|
|
// be processed after index 3, the new earliest batch.
|
|
for i := len(c.seq) - done; i < len(c.seq); i++ {
|
|
c.seq[i] = c.batcher.beforeBatch(c.seq[i-1])
|
|
}
|
|
}
|
|
|
|
// importable returns all batches that are ready to be imported. This means they satisfy 2 conditions:
|
|
// - They are in state batchImportable, which means their data has been downloaded and proposer signatures have been verified.
|
|
// - There are no batches that are not in state batchImportable between them and the start of the slice. This ensures that they
|
|
// can be connected to the canonical chain, either because the root of the last block in the batch matches the parent_root of
|
|
// the oldest block in the canonical chain, or because the root of the last block in the batch matches the parent_root of the
|
|
// new block preceding them in the slice (which must connect to the batch before it, or to the canonical chain if it is first).
|
|
func (c *batchSequencer) importable() []batch {
|
|
imp := make([]batch, 0)
|
|
for i := range c.seq {
|
|
if c.seq[i].state == batchImportable {
|
|
imp = append(imp, c.seq[i])
|
|
continue
|
|
}
|
|
// as soon as we hit a batch with a different state, we return everything leading to it.
|
|
// If the first element isn't importable, we'll return an empty slice.
|
|
break
|
|
}
|
|
return imp
|
|
}
|
|
|
|
// moveMinimum enables the backfill service to change the slot where the batcher will start replying with
|
|
// batch state batchEndSequence (signaling that no new batches will be produced). This is done in response to
|
|
// epochs advancing, which shrinks the gap between <checkpoint slot> and <current slot>-MIN_EPOCHS_FOR_BLOCK_REQUESTS,
|
|
// allowing the node to download a smaller number of blocks.
|
|
func (c *batchSequencer) moveMinimum(min primitives.Slot) error {
|
|
if min < c.batcher.min {
|
|
return errCannotDecreaseMinimum
|
|
}
|
|
c.batcher.min = min
|
|
return nil
|
|
}
|
|
|
|
// countWithState provides a view into how many batches are in a particular state
|
|
// to be used for logging or metrics purposes.
|
|
func (c *batchSequencer) countWithState(s batchState) int {
|
|
n := 0
|
|
for i := 0; i < len(c.seq); i++ {
|
|
if c.seq[i].state == s {
|
|
n += 1
|
|
}
|
|
}
|
|
return n
|
|
}
|
|
|
|
// numTodo computes the number of remaining batches for metrics and logging purposes.
|
|
func (c *batchSequencer) numTodo() int {
|
|
if len(c.seq) == 0 {
|
|
return 0
|
|
}
|
|
lowest := c.seq[len(c.seq)-1]
|
|
todo := 0
|
|
if lowest.state != batchEndSequence {
|
|
todo = c.batcher.remaining(lowest.begin)
|
|
}
|
|
for _, b := range c.seq {
|
|
switch b.state {
|
|
case batchEndSequence, batchImportComplete, batchNil:
|
|
continue
|
|
default:
|
|
todo += 1
|
|
}
|
|
}
|
|
return todo
|
|
}
|
|
|
|
func newBatchSequencer(seqLen int, min, max, size primitives.Slot) *batchSequencer {
|
|
b := batcher{min: min, max: max, size: size}
|
|
seq := make([]batch, seqLen)
|
|
return &batchSequencer{batcher: b, seq: seq}
|
|
}
|
|
|
|
type batcher struct {
|
|
min primitives.Slot
|
|
max primitives.Slot
|
|
size primitives.Slot
|
|
}
|
|
|
|
func (r batcher) remaining(upTo primitives.Slot) int {
|
|
if r.min >= upTo {
|
|
return 0
|
|
}
|
|
delta := upTo - r.min
|
|
if delta%r.size != 0 {
|
|
return int(delta/r.size) + 1
|
|
}
|
|
return int(delta / r.size)
|
|
}
|
|
|
|
func (r batcher) beforeBatch(upTo batch) batch {
|
|
return r.before(upTo.begin)
|
|
}
|
|
|
|
func (r batcher) before(upTo primitives.Slot) batch {
|
|
// upTo is an exclusive upper bound. Requesting a batch before the lower bound of backfill signals the end of the
|
|
// backfill process.
|
|
if upTo <= r.min {
|
|
return batch{begin: upTo, end: upTo, state: batchEndSequence}
|
|
}
|
|
begin := r.min
|
|
if upTo > r.size+r.min {
|
|
begin = upTo - r.size
|
|
}
|
|
|
|
// batch.end is exclusive, .begin is inclusive, so the prev.end = next.begin
|
|
return batch{begin: begin, end: upTo, state: batchInit}
|
|
}
|