Fix disk cache not reading inode

Also use a faster atomic update mechanism
This commit is contained in:
Kovid Goyal
2025-10-08 08:35:35 +05:30
parent 16cdcf8cf8
commit c2e75ba466
2 changed files with 62 additions and 28 deletions

View File

@@ -1,7 +1,6 @@
package disk_cache package disk_cache
import ( import (
"bytes"
"crypto/sha256" "crypto/sha256"
"encoding/hex" "encoding/hex"
"encoding/json" "encoding/json"
@@ -11,10 +10,9 @@ import (
"os" "os"
"path/filepath" "path/filepath"
"slices" "slices"
"syscall"
"time" "time"
"golang.org/x/sys/unix"
"github.com/kovidgoyal/kitty/tools/utils" "github.com/kovidgoyal/kitty/tools/utils"
) )
@@ -26,6 +24,10 @@ type file_state struct {
Inode uint64 Inode uint64
} }
func (s file_state) String() string {
return fmt.Sprintf("fs{Size: %d, Inode: %d, ModTime: %s}", s.Size, s.Inode, s.ModTime)
}
func (s *file_state) equal(o *file_state) bool { func (s *file_state) equal(o *file_state) bool {
return o != nil && s.Size == o.Size && s.ModTime.Equal(o.ModTime) && s.Inode == o.Inode return o != nil && s.Size == o.Size && s.ModTime.Equal(o.ModTime) && s.Inode == o.Inode
} }
@@ -33,7 +35,7 @@ func (s *file_state) equal(o *file_state) bool {
func get_file_state(fi fs.FileInfo) *file_state { func get_file_state(fi fs.FileInfo) *file_state {
// The Sys() method returns the underlying data source (can be nil). // The Sys() method returns the underlying data source (can be nil).
// For Unix-like systems, it's a *syscall.Stat_t. // For Unix-like systems, it's a *syscall.Stat_t.
stat, ok := fi.Sys().(*unix.Stat_t) stat, ok := fi.Sys().(*syscall.Stat_t)
if !ok { if !ok {
// For non-Unix systems, you might not have an inode. // For non-Unix systems, you might not have an inode.
// In that case, you can fall back to using only size and mod time. // In that case, you can fall back to using only size and mod time.
@@ -145,8 +147,23 @@ func (dc *DiskCache) write_entries_if_dirty() (err error) {
if d, err := json.Marshal(dc.entries); err != nil { if d, err := json.Marshal(dc.entries); err != nil {
return err return err
} else { } else {
// use an atomic write so that the inode number changes // use a rename so that the inode number changes
return utils.AtomicWriteFile(path, bytes.NewReader(d), 0o600) // dont bother with full utils.AtomicWriteFile() as it is slower
temp := path + ".temp"
removed := false
defer func() {
if !removed {
_ = os.Remove(temp)
removed = true
}
}()
if err := os.WriteFile(temp, d, 0o600); err != nil {
return err
}
if err = os.Rename(temp, path); err == nil {
removed = true
}
return err
} }
} }

View File

@@ -24,10 +24,29 @@ func TestDiskCache(t *testing.T) {
if err != nil { if err != nil {
t.Fatal(err) t.Fatal(err)
} }
arc := func(dc *DiskCache, expected int) { ensure_entries := func() {
if expected != dc.read_count { for _, x := range []*DiskCache{dc, dc2} {
t.Fatalf("disk cache has unexpected read count: %d != %d\n%s", expected, dc.read_count, debug.Stack()) if err = x.ensure_entries(); err != nil {
t.Fatal(err)
}
} }
}
arc := func(counts ...int) {
ensure_entries()
if diff := cmp.Diff(counts, []int{dc.read_count, dc2.read_count}); diff != "" {
t.Fatalf("disk cache has unexpected read count\n%s\n%s", diff, debug.Stack())
}
}
add := func(dc *DiskCache, key string, data map[string]string) {
d := make(map[string][]byte, len(data))
for k, v := range data {
d[k] = []byte(v)
}
if _, err := dc.Add(key, d); err != nil {
t.Fatal(err)
}
ensure_entries()
} }
m, err := dc.Get("missing", "one", "two") m, err := dc.Get("missing", "one", "two")
@@ -37,8 +56,6 @@ func TestDiskCache(t *testing.T) {
if len(m) > 0 { if len(m) > 0 {
t.Fatalf("Unexpected return from missing: %s", m) t.Fatalf("Unexpected return from missing: %s", m)
} }
dc.Add("k1", map[string][]byte{"1": []byte("abcd"), "2": []byte("efgh")})
arc(dc, 0)
ad := func(key string, expected map[string]string) { ad := func(key string, expected map[string]string) {
for _, x := range []*DiskCache{dc, dc2} { for _, x := range []*DiskCache{dc, dc2} {
@@ -57,6 +74,7 @@ func TestDiskCache(t *testing.T) {
if diff := cmp.Diff(expected, actual); diff != "" { if diff := cmp.Diff(expected, actual); diff != "" {
t.Fatalf("Data for %s not equal: %s", key, diff) t.Fatalf("Data for %s not equal: %s", key, diff)
} }
ensure_entries()
} }
} }
ak := func(keys ...string) { ak := func(keys ...string) {
@@ -69,32 +87,31 @@ func TestDiskCache(t *testing.T) {
t.Fatalf("wrong keys in %d: %s", i+1, diff) t.Fatalf("wrong keys in %d: %s", i+1, diff)
} }
} }
ensure_entries()
} }
add(dc, "k1", map[string]string{"1": "abcd", "2": "efgh"})
arc(0, 1)
ad("k1", map[string]string{"1": "abcd", "2": "efgh"}) ad("k1", map[string]string{"1": "abcd", "2": "efgh"})
arc(dc, 0) arc(1, 2) // the two gets cause two updates
arc(dc2, 1) add(dc, "k1", map[string]string{"3": "ijk", "4": "lmo"})
dc.Add("k1", map[string][]byte{"3": []byte("ijk"), "4": []byte("lmo")}) arc(1, 3) // dc.Add() causes re-read in dc2
arc(dc, 1) // because dc2.Get() will have updated the file
arc(dc2, 1)
ak("k1") ak("k1")
arc(dc2, 2) // because dc.Add() will have updated the file arc(1, 3)
dc2.Add("k2", map[string][]byte{"1": []byte("123456789")}) add(dc2, "k2", map[string]string{"1": "123456789"})
arc(dc, 1) arc(2, 3) // dc2.Add() causes re-read in dc
arc(dc2, 2)
ak("k1", "k2") ak("k1", "k2")
arc(2, 3)
ad("k1", map[string]string{"1": "abcd", "2": "efgh", "3": "ijk"}) ad("k1", map[string]string{"1": "abcd", "2": "efgh", "3": "ijk"})
if dc.entries.TotalSize != 14+9 { if dc.entries.TotalSize != 14+9 {
t.Fatalf("TotalSize: %d != %d", dc.entries.TotalSize, 14+9) t.Fatalf("TotalSize: %d != %d", dc.entries.TotalSize, 14+9)
} }
arc(dc, 2) // dc2.Add() arc(3, 4) // the two gets cause two updates
arc(dc2, 3) // dc.Get()
ak("k2", "k1") ak("k2", "k1")
dc.Get("k2") dc.Get("k2")
arc(dc, 3) // dc2.Get() arc(3, 5) // dc.Get() causes dc2 to read
arc(dc2, 3)
ak("k1", "k2") ak("k1", "k2")
dc.Add("k3", map[string][]byte{"1": []byte(strings.Repeat("a", int(dc.MaxSize)-10))}) add(dc, "k3", map[string]string{"1": strings.Repeat("a", int(dc.MaxSize)-10)})
arc(dc, 3) arc(3, 6) // dc.Add() causes dc2 to read
ak("k2", "k3") ak("k2", "k3")
// check that creating a new disk cache prunes // check that creating a new disk cache prunes
_, err = NewDiskCache(tdir, dc.MaxSize-8) _, err = NewDiskCache(tdir, dc.MaxSize-8)
@@ -102,7 +119,7 @@ func TestDiskCache(t *testing.T) {
t.Fatal(err) t.Fatal(err)
} }
ak("k3") ak("k3")
arc(dc, 4) // NewDiskCache() arc(4, 7) // NewDiskCache()
// test the path api // test the path api
path := filepath.Join(tdir, "source") path := filepath.Join(tdir, "source")
@@ -130,5 +147,5 @@ func TestDiskCache(t *testing.T) {
if len(entries_before) != len(entries_after) { if len(entries_before) != len(entries_after) {
t.Fatalf("unexpected entries: %s", entries_after) t.Fatalf("unexpected entries: %s", entries_after)
} }
arc(dc, 4) arc(4, 8) // dc.AddPath() causes dc2 to read
} }