2021-09-13 17:31:09 +00:00
|
|
|
/*
|
|
|
|
Copyright 2021 Erigon contributors
|
|
|
|
|
|
|
|
Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
you may not use this file except in compliance with the License.
|
|
|
|
You may obtain a copy of the License at
|
|
|
|
|
|
|
|
http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
|
|
|
|
Unless required by applicable law or agreed to in writing, software
|
|
|
|
distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
See the License for the specific language governing permissions and
|
|
|
|
limitations under the License.
|
|
|
|
*/
|
|
|
|
|
|
|
|
package recsplit
|
|
|
|
|
|
|
|
import (
|
2021-10-16 09:43:41 +00:00
|
|
|
"fmt"
|
2022-02-12 13:11:30 +00:00
|
|
|
"path/filepath"
|
2021-09-13 17:31:09 +00:00
|
|
|
"testing"
|
|
|
|
)
|
|
|
|
|
2021-09-18 21:59:27 +00:00
|
|
|
func TestRecSplit2(t *testing.T) {
|
2021-10-16 09:43:41 +00:00
|
|
|
tmpDir := t.TempDir()
|
2021-09-13 17:31:09 +00:00
|
|
|
rs, err := NewRecSplit(RecSplitArgs{
|
|
|
|
KeyCount: 2,
|
|
|
|
BucketSize: 10,
|
|
|
|
Salt: 0,
|
2021-10-16 09:43:41 +00:00
|
|
|
TmpDir: tmpDir,
|
2022-02-12 13:11:30 +00:00
|
|
|
IndexFile: filepath.Join(tmpDir, "index"),
|
2021-09-13 17:31:09 +00:00
|
|
|
LeafSize: 8,
|
2021-09-20 11:14:49 +00:00
|
|
|
StartSeed: []uint64{0x106393c187cae21a, 0x6453cec3f7376937, 0x643e521ddbd2be98, 0x3740c6412f6572cb, 0x717d47562f1ce470, 0x4cd6eb4c63befb7c, 0x9bfd8c5e18c8da73,
|
|
|
|
0x082f20e10092a9a3, 0x2ada2ce68d21defc, 0xe33cb4f3e7c6466b, 0x3980be458c509c59, 0xc466fd9584828e8c, 0x45f0aabe1a61ede6, 0xf6e7b8b33ad9b98d,
|
|
|
|
0x4ef95e25f4b4983d, 0x81175195173b92d3, 0x4e50927d8dd15978, 0x1ea2099d1fafae7f, 0x425c8a06fbaaa815, 0xcd4216006c74052a},
|
2021-09-13 17:31:09 +00:00
|
|
|
})
|
|
|
|
if err != nil {
|
|
|
|
t.Fatal(err)
|
|
|
|
}
|
2021-10-16 09:43:41 +00:00
|
|
|
if err = rs.AddKey([]byte("first_key"), 0); err != nil {
|
2021-09-13 17:31:09 +00:00
|
|
|
t.Error(err)
|
|
|
|
}
|
|
|
|
if err = rs.Build(); err == nil {
|
|
|
|
t.Errorf("test is expected to fail, too few keys added")
|
|
|
|
}
|
2021-10-16 09:43:41 +00:00
|
|
|
if err = rs.AddKey([]byte("second_key"), 0); err != nil {
|
2021-09-13 17:31:09 +00:00
|
|
|
t.Error(err)
|
|
|
|
}
|
|
|
|
if err = rs.Build(); err != nil {
|
|
|
|
t.Error(err)
|
|
|
|
}
|
|
|
|
if err = rs.Build(); err == nil {
|
|
|
|
t.Errorf("test is expected to fail, hash gunction was built already")
|
|
|
|
}
|
2021-10-16 09:43:41 +00:00
|
|
|
if err = rs.AddKey([]byte("key_to_fail"), 0); err == nil {
|
2021-09-13 17:31:09 +00:00
|
|
|
t.Errorf("test is expected to fail, hash function was built")
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
func TestRecSplitDuplicate(t *testing.T) {
|
2021-10-16 09:43:41 +00:00
|
|
|
tmpDir := t.TempDir()
|
2021-09-13 17:31:09 +00:00
|
|
|
rs, err := NewRecSplit(RecSplitArgs{
|
|
|
|
KeyCount: 2,
|
|
|
|
BucketSize: 10,
|
|
|
|
Salt: 0,
|
2021-10-16 09:43:41 +00:00
|
|
|
TmpDir: tmpDir,
|
2022-02-12 13:11:30 +00:00
|
|
|
IndexFile: filepath.Join(tmpDir, "index"),
|
2021-09-13 17:31:09 +00:00
|
|
|
LeafSize: 8,
|
2021-09-20 11:14:49 +00:00
|
|
|
StartSeed: []uint64{0x106393c187cae21a, 0x6453cec3f7376937, 0x643e521ddbd2be98, 0x3740c6412f6572cb, 0x717d47562f1ce470, 0x4cd6eb4c63befb7c, 0x9bfd8c5e18c8da73,
|
|
|
|
0x082f20e10092a9a3, 0x2ada2ce68d21defc, 0xe33cb4f3e7c6466b, 0x3980be458c509c59, 0xc466fd9584828e8c, 0x45f0aabe1a61ede6, 0xf6e7b8b33ad9b98d,
|
|
|
|
0x4ef95e25f4b4983d, 0x81175195173b92d3, 0x4e50927d8dd15978, 0x1ea2099d1fafae7f, 0x425c8a06fbaaa815, 0xcd4216006c74052a},
|
2021-09-13 17:31:09 +00:00
|
|
|
})
|
|
|
|
if err != nil {
|
|
|
|
t.Fatal(err)
|
|
|
|
}
|
2021-10-16 09:43:41 +00:00
|
|
|
if err := rs.AddKey([]byte("first_key"), 0); err != nil {
|
2021-09-13 17:31:09 +00:00
|
|
|
t.Error(err)
|
|
|
|
}
|
2021-10-16 09:43:41 +00:00
|
|
|
if err := rs.AddKey([]byte("first_key"), 0); err != nil {
|
2021-09-13 17:31:09 +00:00
|
|
|
t.Error(err)
|
|
|
|
}
|
|
|
|
if err := rs.Build(); err == nil {
|
|
|
|
t.Errorf("test is expected to fail, duplicate key")
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
func TestRecSplitLeafSizeTooLarge(t *testing.T) {
|
2021-10-16 09:43:41 +00:00
|
|
|
tmpDir := t.TempDir()
|
2021-09-13 17:31:09 +00:00
|
|
|
_, err := NewRecSplit(RecSplitArgs{
|
|
|
|
KeyCount: 2,
|
|
|
|
BucketSize: 10,
|
|
|
|
Salt: 0,
|
2021-10-16 09:43:41 +00:00
|
|
|
TmpDir: tmpDir,
|
2022-02-12 13:11:30 +00:00
|
|
|
IndexFile: filepath.Join(tmpDir, "index"),
|
2021-09-13 17:31:09 +00:00
|
|
|
LeafSize: 64,
|
2021-09-20 11:14:49 +00:00
|
|
|
StartSeed: []uint64{0x106393c187cae21a, 0x6453cec3f7376937, 0x643e521ddbd2be98, 0x3740c6412f6572cb, 0x717d47562f1ce470, 0x4cd6eb4c63befb7c, 0x9bfd8c5e18c8da73,
|
|
|
|
0x082f20e10092a9a3, 0x2ada2ce68d21defc, 0xe33cb4f3e7c6466b, 0x3980be458c509c59, 0xc466fd9584828e8c, 0x45f0aabe1a61ede6, 0xf6e7b8b33ad9b98d,
|
|
|
|
0x4ef95e25f4b4983d, 0x81175195173b92d3, 0x4e50927d8dd15978, 0x1ea2099d1fafae7f, 0x425c8a06fbaaa815, 0xcd4216006c74052a},
|
2021-09-13 17:31:09 +00:00
|
|
|
})
|
|
|
|
if err == nil {
|
|
|
|
t.Errorf("test is expected to fail, leaf size too large")
|
|
|
|
}
|
|
|
|
}
|
2021-10-16 09:43:41 +00:00
|
|
|
|
|
|
|
func TestIndexLookup(t *testing.T) {
|
|
|
|
tmpDir := t.TempDir()
|
2022-02-12 13:11:30 +00:00
|
|
|
indexFile := filepath.Join(tmpDir, "index")
|
2021-10-16 09:43:41 +00:00
|
|
|
rs, err := NewRecSplit(RecSplitArgs{
|
|
|
|
KeyCount: 100,
|
|
|
|
BucketSize: 10,
|
|
|
|
Salt: 0,
|
|
|
|
TmpDir: tmpDir,
|
|
|
|
IndexFile: indexFile,
|
|
|
|
LeafSize: 8,
|
|
|
|
StartSeed: []uint64{0x106393c187cae21a, 0x6453cec3f7376937, 0x643e521ddbd2be98, 0x3740c6412f6572cb, 0x717d47562f1ce470, 0x4cd6eb4c63befb7c, 0x9bfd8c5e18c8da73,
|
|
|
|
0x082f20e10092a9a3, 0x2ada2ce68d21defc, 0xe33cb4f3e7c6466b, 0x3980be458c509c59, 0xc466fd9584828e8c, 0x45f0aabe1a61ede6, 0xf6e7b8b33ad9b98d,
|
|
|
|
0x4ef95e25f4b4983d, 0x81175195173b92d3, 0x4e50927d8dd15978, 0x1ea2099d1fafae7f, 0x425c8a06fbaaa815, 0xcd4216006c74052a},
|
|
|
|
})
|
|
|
|
if err != nil {
|
|
|
|
t.Fatal(err)
|
|
|
|
}
|
|
|
|
for i := 0; i < 100; i++ {
|
|
|
|
if err = rs.AddKey([]byte(fmt.Sprintf("key %d", i)), uint64(i*17)); err != nil {
|
|
|
|
t.Fatal(err)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if err := rs.Build(); err != nil {
|
|
|
|
t.Fatal(err)
|
|
|
|
}
|
2021-10-31 02:38:10 +00:00
|
|
|
idx := MustOpen(indexFile)
|
2021-10-16 09:43:41 +00:00
|
|
|
defer idx.Close()
|
|
|
|
for i := 0; i < 100; i++ {
|
2022-01-24 20:39:04 +00:00
|
|
|
reader := NewIndexReader(idx)
|
|
|
|
offset := reader.Lookup([]byte(fmt.Sprintf("key %d", i)))
|
2021-10-16 09:43:41 +00:00
|
|
|
if offset != uint64(i*17) {
|
|
|
|
t.Errorf("expected offset: %d, looked up: %d", i*17, offset)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
func TestTwoLayerIndex(t *testing.T) {
|
|
|
|
tmpDir := t.TempDir()
|
2022-02-12 13:11:30 +00:00
|
|
|
indexFile := filepath.Join(tmpDir, "index")
|
2021-10-16 09:43:41 +00:00
|
|
|
rs, err := NewRecSplit(RecSplitArgs{
|
|
|
|
KeyCount: 100,
|
|
|
|
BucketSize: 10,
|
|
|
|
Salt: 0,
|
|
|
|
TmpDir: tmpDir,
|
|
|
|
IndexFile: indexFile,
|
|
|
|
LeafSize: 8,
|
|
|
|
StartSeed: []uint64{0x106393c187cae21a, 0x6453cec3f7376937, 0x643e521ddbd2be98, 0x3740c6412f6572cb, 0x717d47562f1ce470, 0x4cd6eb4c63befb7c, 0x9bfd8c5e18c8da73,
|
|
|
|
0x082f20e10092a9a3, 0x2ada2ce68d21defc, 0xe33cb4f3e7c6466b, 0x3980be458c509c59, 0xc466fd9584828e8c, 0x45f0aabe1a61ede6, 0xf6e7b8b33ad9b98d,
|
|
|
|
0x4ef95e25f4b4983d, 0x81175195173b92d3, 0x4e50927d8dd15978, 0x1ea2099d1fafae7f, 0x425c8a06fbaaa815, 0xcd4216006c74052a},
|
|
|
|
Enums: true,
|
|
|
|
})
|
|
|
|
if err != nil {
|
|
|
|
t.Fatal(err)
|
|
|
|
}
|
|
|
|
for i := 0; i < 100; i++ {
|
|
|
|
if err = rs.AddKey([]byte(fmt.Sprintf("key %d", i)), uint64(i*17)); err != nil {
|
|
|
|
t.Fatal(err)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if err := rs.Build(); err != nil {
|
|
|
|
t.Fatal(err)
|
|
|
|
}
|
2021-10-31 02:38:10 +00:00
|
|
|
|
|
|
|
idx := MustOpen(indexFile)
|
2021-10-16 09:43:41 +00:00
|
|
|
defer idx.Close()
|
|
|
|
for i := 0; i < 100; i++ {
|
2022-01-24 20:39:04 +00:00
|
|
|
reader := NewIndexReader(idx)
|
|
|
|
e := reader.Lookup([]byte(fmt.Sprintf("key %d", i)))
|
2021-10-16 09:43:41 +00:00
|
|
|
if e != uint64(i) {
|
|
|
|
t.Errorf("expected enumeration: %d, lookup up: %d", i, e)
|
|
|
|
}
|
2022-06-17 11:39:49 +00:00
|
|
|
offset := idx.OrdinalLookup(e)
|
2021-10-16 09:43:41 +00:00
|
|
|
if offset != uint64(i*17) {
|
|
|
|
t.Errorf("expected offset: %d, looked up: %d", i*17, offset)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|