mirror of
https://gitlab.com/pulsechaincom/erigon-pulse.git
synced 2025-01-07 03:22:18 +00:00
967937151d
* Fixes for compress, and first test * Add decompressor and memory mapping * Add decompressor and memory mapping * Fix for windows * Fix lint * Fix compile for windows * More on decompressor * Fix lint * Decompress * Fix lint * Use decompressor in tests, fixes * Introduce Index for RecSplit * Fix compilation on Windows * close index file on failure * Fixes to the tests * Add single Elias Fano, fix recsplit fuzz test * Fix elias fano * Add two layer index * Add two level index to the tests Co-authored-by: Alexey Sharp <alexeysharp@Alexeys-iMac.local> Co-authored-by: Alex Sharp <alexsharp@Alexs-MacBook-Pro.local>
186 lines
6.0 KiB
Go
186 lines
6.0 KiB
Go
/*
   Copyright 2021 Erigon contributors

   Licensed under the Apache License, Version 2.0 (the "License");
   you may not use this file except in compliance with the License.
   You may obtain a copy of the License at

       http://www.apache.org/licenses/LICENSE-2.0

   Unless required by applicable law or agreed to in writing, software
   distributed under the License is distributed on an "AS IS" BASIS,
   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
   See the License for the specific language governing permissions and
   limitations under the License.
*/
|
|
|
|
package recsplit
|
|
|
|
import (
|
|
"fmt"
|
|
"path"
|
|
"testing"
|
|
)
|
|
|
|
func TestRecSplit2(t *testing.T) {
|
|
tmpDir := t.TempDir()
|
|
rs, err := NewRecSplit(RecSplitArgs{
|
|
KeyCount: 2,
|
|
BucketSize: 10,
|
|
Salt: 0,
|
|
TmpDir: tmpDir,
|
|
IndexFile: path.Join(tmpDir, "index"),
|
|
LeafSize: 8,
|
|
StartSeed: []uint64{0x106393c187cae21a, 0x6453cec3f7376937, 0x643e521ddbd2be98, 0x3740c6412f6572cb, 0x717d47562f1ce470, 0x4cd6eb4c63befb7c, 0x9bfd8c5e18c8da73,
|
|
0x082f20e10092a9a3, 0x2ada2ce68d21defc, 0xe33cb4f3e7c6466b, 0x3980be458c509c59, 0xc466fd9584828e8c, 0x45f0aabe1a61ede6, 0xf6e7b8b33ad9b98d,
|
|
0x4ef95e25f4b4983d, 0x81175195173b92d3, 0x4e50927d8dd15978, 0x1ea2099d1fafae7f, 0x425c8a06fbaaa815, 0xcd4216006c74052a},
|
|
})
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
if err = rs.AddKey([]byte("first_key"), 0); err != nil {
|
|
t.Error(err)
|
|
}
|
|
if err = rs.Build(); err == nil {
|
|
t.Errorf("test is expected to fail, too few keys added")
|
|
}
|
|
if err = rs.AddKey([]byte("second_key"), 0); err != nil {
|
|
t.Error(err)
|
|
}
|
|
if err = rs.Build(); err != nil {
|
|
t.Error(err)
|
|
}
|
|
if err = rs.Build(); err == nil {
|
|
t.Errorf("test is expected to fail, hash gunction was built already")
|
|
}
|
|
if err = rs.AddKey([]byte("key_to_fail"), 0); err == nil {
|
|
t.Errorf("test is expected to fail, hash function was built")
|
|
}
|
|
}
|
|
|
|
func TestRecSplitDuplicate(t *testing.T) {
|
|
tmpDir := t.TempDir()
|
|
rs, err := NewRecSplit(RecSplitArgs{
|
|
KeyCount: 2,
|
|
BucketSize: 10,
|
|
Salt: 0,
|
|
TmpDir: tmpDir,
|
|
IndexFile: path.Join(tmpDir, "index"),
|
|
LeafSize: 8,
|
|
StartSeed: []uint64{0x106393c187cae21a, 0x6453cec3f7376937, 0x643e521ddbd2be98, 0x3740c6412f6572cb, 0x717d47562f1ce470, 0x4cd6eb4c63befb7c, 0x9bfd8c5e18c8da73,
|
|
0x082f20e10092a9a3, 0x2ada2ce68d21defc, 0xe33cb4f3e7c6466b, 0x3980be458c509c59, 0xc466fd9584828e8c, 0x45f0aabe1a61ede6, 0xf6e7b8b33ad9b98d,
|
|
0x4ef95e25f4b4983d, 0x81175195173b92d3, 0x4e50927d8dd15978, 0x1ea2099d1fafae7f, 0x425c8a06fbaaa815, 0xcd4216006c74052a},
|
|
})
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
if err := rs.AddKey([]byte("first_key"), 0); err != nil {
|
|
t.Error(err)
|
|
}
|
|
if err := rs.AddKey([]byte("first_key"), 0); err != nil {
|
|
t.Error(err)
|
|
}
|
|
if err := rs.Build(); err == nil {
|
|
t.Errorf("test is expected to fail, duplicate key")
|
|
}
|
|
}
|
|
|
|
func TestRecSplitLeafSizeTooLarge(t *testing.T) {
|
|
tmpDir := t.TempDir()
|
|
_, err := NewRecSplit(RecSplitArgs{
|
|
KeyCount: 2,
|
|
BucketSize: 10,
|
|
Salt: 0,
|
|
TmpDir: tmpDir,
|
|
IndexFile: path.Join(tmpDir, "index"),
|
|
LeafSize: 64,
|
|
StartSeed: []uint64{0x106393c187cae21a, 0x6453cec3f7376937, 0x643e521ddbd2be98, 0x3740c6412f6572cb, 0x717d47562f1ce470, 0x4cd6eb4c63befb7c, 0x9bfd8c5e18c8da73,
|
|
0x082f20e10092a9a3, 0x2ada2ce68d21defc, 0xe33cb4f3e7c6466b, 0x3980be458c509c59, 0xc466fd9584828e8c, 0x45f0aabe1a61ede6, 0xf6e7b8b33ad9b98d,
|
|
0x4ef95e25f4b4983d, 0x81175195173b92d3, 0x4e50927d8dd15978, 0x1ea2099d1fafae7f, 0x425c8a06fbaaa815, 0xcd4216006c74052a},
|
|
})
|
|
if err == nil {
|
|
t.Errorf("test is expected to fail, leaf size too large")
|
|
}
|
|
}
|
|
|
|
func TestIndexLookup(t *testing.T) {
|
|
tmpDir := t.TempDir()
|
|
indexFile := path.Join(tmpDir, "index")
|
|
rs, err := NewRecSplit(RecSplitArgs{
|
|
KeyCount: 100,
|
|
BucketSize: 10,
|
|
Salt: 0,
|
|
TmpDir: tmpDir,
|
|
IndexFile: indexFile,
|
|
LeafSize: 8,
|
|
StartSeed: []uint64{0x106393c187cae21a, 0x6453cec3f7376937, 0x643e521ddbd2be98, 0x3740c6412f6572cb, 0x717d47562f1ce470, 0x4cd6eb4c63befb7c, 0x9bfd8c5e18c8da73,
|
|
0x082f20e10092a9a3, 0x2ada2ce68d21defc, 0xe33cb4f3e7c6466b, 0x3980be458c509c59, 0xc466fd9584828e8c, 0x45f0aabe1a61ede6, 0xf6e7b8b33ad9b98d,
|
|
0x4ef95e25f4b4983d, 0x81175195173b92d3, 0x4e50927d8dd15978, 0x1ea2099d1fafae7f, 0x425c8a06fbaaa815, 0xcd4216006c74052a},
|
|
})
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
for i := 0; i < 100; i++ {
|
|
if err = rs.AddKey([]byte(fmt.Sprintf("key %d", i)), uint64(i*17)); err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
}
|
|
if err := rs.Build(); err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
var idx *Index
|
|
if idx, err = NewIndex(indexFile); err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
defer idx.Close()
|
|
for i := 0; i < 100; i++ {
|
|
offset := idx.Lookup([]byte(fmt.Sprintf("key %d", i)))
|
|
if offset != uint64(i*17) {
|
|
t.Errorf("expected offset: %d, looked up: %d", i*17, offset)
|
|
}
|
|
}
|
|
}
|
|
|
|
func TestTwoLayerIndex(t *testing.T) {
|
|
tmpDir := t.TempDir()
|
|
indexFile := path.Join(tmpDir, "index")
|
|
rs, err := NewRecSplit(RecSplitArgs{
|
|
KeyCount: 100,
|
|
BucketSize: 10,
|
|
Salt: 0,
|
|
TmpDir: tmpDir,
|
|
IndexFile: indexFile,
|
|
LeafSize: 8,
|
|
StartSeed: []uint64{0x106393c187cae21a, 0x6453cec3f7376937, 0x643e521ddbd2be98, 0x3740c6412f6572cb, 0x717d47562f1ce470, 0x4cd6eb4c63befb7c, 0x9bfd8c5e18c8da73,
|
|
0x082f20e10092a9a3, 0x2ada2ce68d21defc, 0xe33cb4f3e7c6466b, 0x3980be458c509c59, 0xc466fd9584828e8c, 0x45f0aabe1a61ede6, 0xf6e7b8b33ad9b98d,
|
|
0x4ef95e25f4b4983d, 0x81175195173b92d3, 0x4e50927d8dd15978, 0x1ea2099d1fafae7f, 0x425c8a06fbaaa815, 0xcd4216006c74052a},
|
|
Enums: true,
|
|
})
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
for i := 0; i < 100; i++ {
|
|
if err = rs.AddKey([]byte(fmt.Sprintf("key %d", i)), uint64(i*17)); err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
}
|
|
if err := rs.Build(); err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
var idx *Index
|
|
if idx, err = NewIndex(indexFile); err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
defer idx.Close()
|
|
for i := 0; i < 100; i++ {
|
|
e := idx.Lookup([]byte(fmt.Sprintf("key %d", i)))
|
|
if e != uint64(i) {
|
|
t.Errorf("expected enumeration: %d, lookup up: %d", i, e)
|
|
}
|
|
offset := idx.Lookup2(e)
|
|
if offset != uint64(i*17) {
|
|
t.Errorf("expected offset: %d, looked up: %d", i*17, offset)
|
|
}
|
|
}
|
|
}
|