Files
syncthing/internal/db/sqlite/db_local_test.go
Jakob Borg 86ac4e5017 feat: make block indexing configurable (#10608)
This adds a new folder-level configuration `FullBlockIndex`. It controls
whether we maintain the block index for a given folder -- currently
that's always true, now it becomes possible to turn off. The block index
is used for lookup of blocks across files and folders. Effectively, when
syncing a change, for each block, we check:

1. Is the block already present in the old version of the file? If so,
we can reuse (copy) it without network transfer. **This check is always
possible.**
2. Is the block already present in any other file in this folder or
other folders? If so we can copy it. **This check is only possible with
the full block index.**
3. We must transfer the block over the network.

Maintaining the full block index is costly in time, I/O and database
size. With this PR, maintaining the full block index becomes the default
for send-receive and receive-only folders only, with it disabled for
send-only and receive-encrypted folders. The block index is never useful
for encrypted folders, as blocks are encrypted separate for each file.
It is also not useful for send-only folders by themselves, though the
data in the send-only folder could be reused by other receive-type
folders if it were enabled.

For very large folders it may make sense to disable the full block index
regardless of folder type and just accept the resulting decrease in data
reuse.

Disabling or enabling the option in the GUI causes the index to be
destroyed or rebuilt accordingly.

https://github.com/syncthing/docs/pull/1005

---------

Signed-off-by: Jakob Borg <jakob@kastelo.net>
2026-04-26 11:58:09 +02:00

398 lines
9.4 KiB
Go

// Copyright (C) 2025 The Syncthing Authors.
//
// This Source Code Form is subject to the terms of the Mozilla Public
// License, v. 2.0. If a copy of the MPL was not distributed with this file,
// You can obtain one at https://mozilla.org/MPL/2.0/.
package sqlite
import (
"testing"
"github.com/syncthing/syncthing/internal/db"
"github.com/syncthing/syncthing/internal/itererr"
"github.com/syncthing/syncthing/lib/protocol"
)
func TestBlocks(t *testing.T) {
t.Parallel()
db, err := Open(t.TempDir())
if err != nil {
t.Fatal()
}
t.Cleanup(func() {
if err := db.Close(); err != nil {
t.Fatal(err)
}
})
files := []protocol.FileInfo{
{
Name: "file1",
Blocks: []protocol.BlockInfo{
{Hash: []byte{1, 2, 3}, Offset: 0, Size: 42},
{Hash: []byte{2, 3, 4}, Offset: 42, Size: 42},
{Hash: []byte{3, 4, 5}, Offset: 84, Size: 42},
},
},
{
Name: "file2",
Blocks: []protocol.BlockInfo{
{Hash: []byte{2, 3, 4}, Offset: 0, Size: 42},
{Hash: []byte{3, 4, 5}, Offset: 42, Size: 42},
{Hash: []byte{4, 5, 6}, Offset: 84, Size: 42},
},
},
}
if err := db.Update("test", protocol.LocalDeviceID, files); err != nil {
t.Fatal(err)
}
// Search for blocks
vals, err := itererr.Collect(db.AllLocalBlocksWithHash(folderID, []byte{1, 2, 3}))
if err != nil {
t.Fatal(err)
}
if len(vals) != 1 {
t.Log(vals)
t.Fatal("expected one hit")
} else if vals[0].BlockIndex != 0 || vals[0].Offset != 0 || vals[0].Size != 42 {
t.Log(vals[0])
t.Fatal("bad entry")
}
if vals[0].FileName != "file1" {
t.Fatal("should be file1")
}
// Get the other blocks
vals, err = itererr.Collect(db.AllLocalBlocksWithHash(folderID, []byte{3, 4, 5}))
if err != nil {
t.Fatal(err)
}
if len(vals) != 2 {
t.Log(vals)
t.Fatal("expected two hits")
}
// if vals[0].Index != 2 || vals[0].Offset != 84 || vals[0].Size != 42 {
// t.Log(vals[0])
// t.Fatal("bad entry 1")
// }
// if vals[1].Index != 1 || vals[1].Offset != 42 || vals[1].Size != 42 {
// t.Log(vals[1])
// t.Fatal("bad entry 2")
// }
}
func TestBlocksDeleted(t *testing.T) {
t.Parallel()
sdb, err := Open(t.TempDir())
if err != nil {
t.Fatal()
}
t.Cleanup(func() {
if err := sdb.Close(); err != nil {
t.Fatal(err)
}
})
// Insert a file
file := genFile("foo", 1, 0)
if err := sdb.Update(folderID, protocol.LocalDeviceID, []protocol.FileInfo{file}); err != nil {
t.Fatal()
}
// We should find one entry for the block hash
search := file.Blocks[0].Hash
es, err := itererr.Collect(sdb.AllLocalBlocksWithHash(folderID, search))
if err != nil {
t.Fatal(err)
}
if len(es) != 1 {
t.Fatal("expected one hit")
}
// Update the file with a new block hash
file.Blocks = genBlocks("foo", 42, 1)
if err := sdb.Update(folderID, protocol.LocalDeviceID, []protocol.FileInfo{file}); err != nil {
t.Fatal()
}
// Searching for the old hash should yield no hits
if hits, err := itererr.Collect(sdb.AllLocalBlocksWithHash(folderID, search)); err != nil {
t.Fatal(err)
} else if len(hits) != 0 {
t.Log(hits)
t.Error("expected no hits")
}
// Searching for the new hash should yield one hits
if hits, err := itererr.Collect(sdb.AllLocalBlocksWithHash(folderID, file.Blocks[0].Hash)); err != nil {
t.Fatal(err)
} else if len(hits) != 1 {
t.Log(hits)
t.Error("expected one hit")
}
}
func TestDropBlockIndex(t *testing.T) {
t.Parallel()
sdb, err := Open(t.TempDir())
if err != nil {
t.Fatal(err)
}
t.Cleanup(func() { sdb.Close() })
// Insert files with blocks
files := []protocol.FileInfo{
genFile("a", 3, 0),
genFile("b", 2, 0),
}
if err := sdb.Update(folderID, protocol.LocalDeviceID, files); err != nil {
t.Fatal(err)
}
// Verify blocks exist
hits, err := itererr.Collect(sdb.AllLocalBlocksWithHash(folderID, files[0].Blocks[0].Hash))
if err != nil {
t.Fatal(err)
}
if len(hits) == 0 {
t.Fatal("expected block hits before drop")
}
// Drop the block index
if err := sdb.DropBlockIndex(folderID); err != nil {
t.Fatal(err)
}
// Verify blocks are gone
hits, err = itererr.Collect(sdb.AllLocalBlocksWithHash(folderID, files[0].Blocks[0].Hash))
if err != nil {
t.Fatal(err)
}
if len(hits) != 0 {
t.Fatal("expected no block hits after drop")
}
// Dropping again should be a no-op (already empty)
if err := sdb.DropBlockIndex(folderID); err != nil {
t.Fatal(err)
}
// Dropping a nonexistent folder should be fine
if err := sdb.DropBlockIndex("nonexistent"); err != nil {
t.Fatal(err)
}
}
func TestPopulateBlockIndex(t *testing.T) {
t.Parallel()
sdb, err := Open(t.TempDir())
if err != nil {
t.Fatal(err)
}
t.Cleanup(func() { sdb.Close() })
// Insert files with blocks
files := []protocol.FileInfo{
genFile("a", 3, 0),
genFile("b", 2, 0),
}
if err := sdb.Update(folderID, protocol.LocalDeviceID, files); err != nil {
t.Fatal(err)
}
// Collect the original block entries for comparison
origHitsA, err := itererr.Collect(sdb.AllLocalBlocksWithHash(folderID, files[0].Blocks[0].Hash))
if err != nil {
t.Fatal(err)
}
if len(origHitsA) != 1 {
t.Fatal("expected one hit for block a[0]")
}
// Drop the block index
if err := sdb.DropBlockIndex(folderID); err != nil {
t.Fatal(err)
}
// Populate it back from existing blocklists
if err := sdb.PopulateBlockIndex(folderID); err != nil {
t.Fatal(err)
}
// Verify all blocks are back
for i, f := range files {
for j, b := range f.Blocks {
hits, err := itererr.Collect(sdb.AllLocalBlocksWithHash(folderID, b.Hash))
if err != nil {
t.Fatal(err)
}
if len(hits) == 0 {
t.Errorf("file %d block %d: expected hits after populate", i, j)
}
}
}
// Populating again should be a no-op (not empty)
if err := sdb.PopulateBlockIndex(folderID); err != nil {
t.Fatal(err)
}
}
func TestPopulateBlockIndexSkipsRemoteFiles(t *testing.T) {
t.Parallel()
sdb, err := Open(t.TempDir())
if err != nil {
t.Fatal(err)
}
t.Cleanup(func() { sdb.Close() })
// Insert a local file (blocks indexed) and a remote file (blocks not indexed)
localFile := genFile("local", 2, 0)
if err := sdb.Update(folderID, protocol.LocalDeviceID, []protocol.FileInfo{localFile}); err != nil {
t.Fatal(err)
}
remoteFile := genFile("remote", 2, 1)
if err := sdb.Update(folderID, protocol.DeviceID{42}, []protocol.FileInfo{remoteFile}); err != nil {
t.Fatal(err)
}
// Drop and repopulate
if err := sdb.DropBlockIndex(folderID); err != nil {
t.Fatal(err)
}
if err := sdb.PopulateBlockIndex(folderID); err != nil {
t.Fatal(err)
}
// Local file blocks should be present
hits, err := itererr.Collect(sdb.AllLocalBlocksWithHash(folderID, localFile.Blocks[0].Hash))
if err != nil {
t.Fatal(err)
}
if len(hits) == 0 {
t.Error("expected hits for local file blocks")
}
// Remote file blocks should not be present (blocks are only
// indexed for local files)
hits, err = itererr.Collect(sdb.AllLocalBlocksWithHash(folderID, remoteFile.Blocks[0].Hash))
if err != nil {
t.Fatal(err)
}
if len(hits) != 0 {
t.Error("expected no hits for remote file blocks")
}
}
func TestSkipBlockIndexOnUpdate(t *testing.T) {
t.Parallel()
sdb, err := Open(t.TempDir())
if err != nil {
t.Fatal(err)
}
t.Cleanup(func() { sdb.Close() })
// Insert a file with SkipBlockIndex
file := genFile("a", 3, 0)
if err := sdb.Update(folderID, protocol.LocalDeviceID, []protocol.FileInfo{file}, db.WithSkipBlockIndex()); err != nil {
t.Fatal(err)
}
// Blocks should not be indexed
hits, err := itererr.Collect(sdb.AllLocalBlocksWithHash(folderID, file.Blocks[0].Hash))
if err != nil {
t.Fatal(err)
}
if len(hits) != 0 {
t.Fatal("expected no block hits with SkipBlockIndex")
}
// The blocklist should still be stored (file info is retrievable with blocks)
fi, ok, err := sdb.GetDeviceFile(folderID, protocol.LocalDeviceID, "a")
if err != nil {
t.Fatal(err)
}
if !ok {
t.Fatal("file not found")
}
if len(fi.Blocks) != 3 {
t.Fatalf("expected 3 blocks in file info, got %d", len(fi.Blocks))
}
// Populate should fill in the blocks
if err := sdb.PopulateBlockIndex(folderID); err != nil {
t.Fatal(err)
}
hits, err = itererr.Collect(sdb.AllLocalBlocksWithHash(folderID, file.Blocks[0].Hash))
if err != nil {
t.Fatal(err)
}
if len(hits) != 1 {
t.Fatal("expected one hit after populate")
}
}
func TestRemoteSequence(t *testing.T) {
t.Parallel()
sdb, err := Open(t.TempDir())
if err != nil {
t.Fatal()
}
t.Cleanup(func() {
if err := sdb.Close(); err != nil {
t.Fatal(err)
}
})
// Insert a local file
file := genFile("foo", 1, 0)
if err := sdb.Update(folderID, protocol.LocalDeviceID, []protocol.FileInfo{file}); err != nil {
t.Fatal()
}
// Insert several remote files
file = genFile("foo1", 1, 42)
if err := sdb.Update(folderID, protocol.DeviceID{42}, []protocol.FileInfo{file}); err != nil {
t.Fatal()
}
if err := sdb.Update(folderID, protocol.DeviceID{43}, []protocol.FileInfo{file}); err != nil {
t.Fatal()
}
file = genFile("foo2", 1, 43)
if err := sdb.Update(folderID, protocol.DeviceID{43}, []protocol.FileInfo{file}); err != nil {
t.Fatal()
}
if err := sdb.Update(folderID, protocol.DeviceID{44}, []protocol.FileInfo{file}); err != nil {
t.Fatal()
}
file = genFile("foo3", 1, 44)
if err := sdb.Update(folderID, protocol.DeviceID{44}, []protocol.FileInfo{file}); err != nil {
t.Fatal()
}
// Verify remote sequences
seqs, err := sdb.RemoteSequences(folderID)
if err != nil {
t.Fatal(err)
}
if len(seqs) != 3 || seqs[protocol.DeviceID{42}] != 42 ||
seqs[protocol.DeviceID{43}] != 43 ||
seqs[protocol.DeviceID{44}] != 44 {
t.Log(seqs)
t.Error("bad seqs")
}
}