erigon-pulse/kv/stream/stream_test.go

160 lines
5.8 KiB
Go

package stream_test
import (
"context"
"testing"
"github.com/ledgerwatch/erigon-lib/kv"
"github.com/ledgerwatch/erigon-lib/kv/memdb"
"github.com/ledgerwatch/erigon-lib/kv/stream"
"github.com/stretchr/testify/require"
)
// TestIntersect verifies that intersecting the array-backed streams
// {1, 3, 4, 5, 6, 7} and {2, 3, 7} produces exactly {3, 7}.
func TestIntersect(t *testing.T) {
	left := stream.Array[uint64]([]uint64{1, 3, 4, 5, 6, 7})
	right := stream.Array[uint64]([]uint64{2, 3, 7})

	// Drain the intersection into a slice so it can be compared in one shot.
	got, err := stream.ToArr[uint64](stream.Intersect[uint64](left, right))
	require.NoError(t, err)

	want := []uint64{3, 7}
	require.Equal(t, want, got)
}
// Controversial use-cases:
// - peek merge unlimited iterators until result>=PageSize. It requires a "Stop" primitive and it is better to be less eager.
// - get precise range/limit, maybe big
// Then we have 2 API's: Dual (rename Dual to Dual in kv_interface.go) and Cursor.
// But we want to have a Cursor+requestBatch operation - to avoid too much network ping-pong.
// invIdx.Dual() and invIdx.Paginate() (c.NextPage())
//
// Cockroach:
// 1. Iterate performs a paginated scan and applying the function f to every page.
// The semantics of retrieval and ordering are the same as for Scan. Note that
// Txn auto-retries the transaction if necessary. Hence, the paginated data
// must not be used for side-effects before the txn has committed.
// 2. []Pair; where Pair{k,v []byte}
// Vitess:
// 1. Exec/Dual methods
// But it has a separate class for each RelationalAlgebra operator: InMemSort.run()/Intersect.run()
// then the operator implementation uses the hardcoded Exec/Dual method.
// 2. Pairs has struct:
// // A length of -1 means that the field is NULL. While
// // reading values, you have to accumulate the length
// // to know the offset where the next value begins in values.
// repeated sint64 lengths = 1;
// // values contains a concatenation of all values in the row.
// bytes values = 2;
// Request(from, limit) -> (N, nextFrom), Request(nextFrom, limit) -> (N, nil)
// Request(from, limit) -> (N, hasNext=true), Request(nextFrom, limit) -> (N, hasNext=false): server just needs to internally read Limit+1
//
// Request(from, limit) -> InteractiveStream(N, nextFrom), Request(nextFrom, limit) -> (N, nil)
// TODO: remotedbserver - txs leak... when to close them? insider rollback check non-locked tx.ttl? When do we renew?
// stream will not help
// no Limit in request
// request (from, N) - merge on client
// stream (all) - push from server - merge on client
// TestUnion verifies stream.Union over array-backed uint64 streams. Each case
// feeds two input slices through Union, drains the result with ToArr and
// compares it against the expected merged, de-duplicated output.
func TestUnion(t *testing.T) {
	cases := []struct {
		name  string
		left  []uint64
		right []uint64
		want  []uint64
	}{
		{
			name:  "arrays",
			left:  []uint64{1, 3, 4, 5, 6, 7},
			right: []uint64{2, 3, 7, 8},
			want:  []uint64{1, 2, 3, 4, 5, 6, 7, 8},
		},
		{
			name:  "empty left",
			left:  []uint64{},
			right: []uint64{2, 3, 7, 8},
			want:  []uint64{2, 3, 7, 8},
		},
		{
			name:  "empty right",
			left:  []uint64{1, 3, 4, 5, 6, 7},
			right: []uint64{},
			want:  []uint64{1, 3, 4, 5, 6, 7},
		},
		{
			// The expected value is a non-nil empty slice on purpose:
			// require.Equal distinguishes it from nil.
			name:  "empty",
			left:  []uint64{},
			right: []uint64{},
			want:  []uint64{},
		},
	}

	for _, tc := range cases {
		// Subtests run synchronously, so capturing tc in the closure is safe.
		t.Run(tc.name, func(t *testing.T) {
			merged := stream.Union[uint64](
				stream.Array[uint64](tc.left),
				stream.Array[uint64](tc.right),
			)
			got, err := stream.ToArr[uint64](merged)
			require.NoError(t, err)
			require.Equal(t, tc.want, got)
		})
	}
}
// TestUnionPairs verifies stream.UnionPairs over key/value streams.
//
// The table-backed subtests write into kv.AccountsHistory and/or kv.PlainState
// inside a read-write transaction that is rolled back when the subtest ends,
// so no data leaks from one subtest into the next. Every setup step (BeginRw,
// Put, Stream) is checked: a failure there aborts the subtest immediately
// instead of surfacing later as a nil dereference or a misleading mismatch.
func TestUnionPairs(t *testing.T) {
	db := memdb.NewTestDB(t)
	ctx := context.Background()

	t.Run("simple", func(t *testing.T) {
		require := require.New(t)
		tx, err := db.BeginRw(ctx)
		require.NoError(err)
		defer tx.Rollback()

		require.NoError(tx.Put(kv.AccountsHistory, []byte{1}, []byte{1}))
		require.NoError(tx.Put(kv.AccountsHistory, []byte{3}, []byte{1}))
		require.NoError(tx.Put(kv.AccountsHistory, []byte{4}, []byte{1}))
		require.NoError(tx.Put(kv.PlainState, []byte{2}, []byte{9}))
		require.NoError(tx.Put(kv.PlainState, []byte{3}, []byte{9}))

		it, err := tx.Stream(kv.AccountsHistory, nil, nil)
		require.NoError(err)
		it2, err := tx.Stream(kv.PlainState, nil, nil)
		require.NoError(err)

		keys, values, err := stream.UnionPairs(it, it2).ToArray()
		require.NoError(err)
		require.Equal([][]byte{{1}, {2}, {3}, {4}}, keys)
		// Key {3} exists in both tables; the expected value {1} is the one
		// stored under kv.AccountsHistory (the first stream).
		require.Equal([][]byte{{1}, {9}, {1}, {1}}, values)
	})

	t.Run("empty 1st", func(t *testing.T) {
		require := require.New(t)
		tx, err := db.BeginRw(ctx)
		require.NoError(err)
		defer tx.Rollback()

		require.NoError(tx.Put(kv.PlainState, []byte{2}, []byte{9}))
		require.NoError(tx.Put(kv.PlainState, []byte{3}, []byte{9}))

		it, err := tx.Stream(kv.AccountsHistory, nil, nil)
		require.NoError(err)
		it2, err := tx.Stream(kv.PlainState, nil, nil)
		require.NoError(err)

		keys, _, err := stream.UnionPairs(it, it2).ToArray()
		require.NoError(err)
		require.Equal([][]byte{{2}, {3}}, keys)
	})

	t.Run("empty 2nd", func(t *testing.T) {
		require := require.New(t)
		tx, err := db.BeginRw(ctx)
		require.NoError(err)
		defer tx.Rollback()

		require.NoError(tx.Put(kv.AccountsHistory, []byte{1}, []byte{1}))
		require.NoError(tx.Put(kv.AccountsHistory, []byte{3}, []byte{1}))
		require.NoError(tx.Put(kv.AccountsHistory, []byte{4}, []byte{1}))

		it, err := tx.Stream(kv.AccountsHistory, nil, nil)
		require.NoError(err)
		it2, err := tx.Stream(kv.PlainState, nil, nil)
		require.NoError(err)

		keys, _, err := stream.UnionPairs(it, it2).ToArray()
		require.NoError(err)
		require.Equal([][]byte{{1}, {3}, {4}}, keys)
	})

	t.Run("empty both", func(t *testing.T) {
		require := require.New(t)
		tx, err := db.BeginRw(ctx)
		require.NoError(err)
		defer tx.Rollback()

		it, err := tx.Stream(kv.AccountsHistory, nil, nil)
		require.NoError(err)
		it2, err := tx.Stream(kv.PlainState, nil, nil)
		require.NoError(err)

		m := stream.UnionPairs(it, it2)
		require.False(m.HasNext())
	})

	t.Run("error handling", func(t *testing.T) {
		require := require.New(t)

		// These streams are synthetic, so no database transaction is needed.
		it := stream.PairsWithError(10)
		it2 := stream.PairsWithError(12)

		keys, _, err := stream.UnionPairs(it, it2).ToArray()
		// EqualError fails cleanly when err is nil, whereas calling
		// err.Error() directly would panic.
		require.EqualError(err, "expected error at iteration: 10")
		require.Len(keys, 10)
	})
}