From 5b09ebfb0c1bb3f6397655ad87cc8da6b2644569 Mon Sep 17 00:00:00 2001 From: Steven Allen Date: Tue, 31 Mar 2020 15:45:22 -0700 Subject: [PATCH] feat: put all temporary files in the same directory and clean them up on start Otherwise, if we repeatedly stop the same node, we'll collect a bunch of temporary files and NEVER DELETE them. This will: 1. Waste space. 2. Slow down queries/GC. This patch: 1. Moves all temporary files to a single `.temp` directory. The leading `.` means it can't conflict with any keys and queries (even on older flatfs versions) will skip it. 2. Adds an "rm -rf flatfs-dir/.temp" call on start. --- flatfs.go | 27 ++++++++++++++++++++++----- flatfs_test.go | 7 +++---- 2 files changed, 25 insertions(+), 9 deletions(-) diff --git a/flatfs.go b/flatfs.go index 9dbf108..06d3ef0 100644 --- a/flatfs.go +++ b/flatfs.go @@ -112,7 +112,8 @@ type Datastore struct { // (see https://golang.org/pkg/sync/atomic/#pkg-note-BUG) diskUsage int64 - path string + path string + tempPath string shardStr string getDir ShardFunc @@ -196,7 +197,6 @@ func (o *opResult) Finish(ok bool) { } func Create(path string, fun *ShardIdV1) error { - err := os.Mkdir(path, 0755) if err != nil && !os.IsExist(err) { return err @@ -238,6 +238,17 @@ func Open(path string, syncFiles bool) (*Datastore, error) { return nil, err } + tempPath := filepath.Join(path, ".temp") + err = os.RemoveAll(tempPath) + if err != nil && !os.IsNotExist(err) { + return nil, fmt.Errorf("failed to remove temporary directory: %w", err) + } + + err = os.Mkdir(tempPath, 0755) + if err != nil { + return nil, fmt.Errorf("failed to create temporary directory: %w", err) + } + shardId, err := ReadShardFunc(path) if err != nil { return nil, err @@ -245,6 +256,7 @@ func Open(path string, syncFiles bool) (*Datastore, error) { fs := &Datastore{ path: path, + tempPath: tempPath, shardStr: shardId.String(), getDir: shardId.Func(), sync: syncFiles, @@ -452,7 +464,7 @@ func (fs *Datastore) doPut(key datastore.Key, val []byte) error { return err } - tmp, err := ioutil.TempFile(dir, "put-") + tmp, err := fs.tempFile() if err != nil { return err } @@ -528,7 +540,7 @@ func (fs *Datastore) putMany(data map[datastore.Key][]byte) error { } dirsToSync = append(dirsToSync, dir) - tmp, err := ioutil.TempFile(dir, "put-") + tmp, err := fs.tempFile() if err != nil { return err } @@ -954,7 +966,7 @@ func (fs *Datastore) checkpointLoop() { } func (fs *Datastore) writeDiskUsageFile(du int64, doSync bool) { - tmp, err := ioutil.TempFile(fs.path, "du-") + tmp, err := fs.tempFile() if err != nil { log.Warnw("could not write disk usage", "error", err) return @@ -1037,6 +1049,11 @@ func (fs *Datastore) Accuracy() string { return string(fs.storedValue.Accuracy) } +func (fs *Datastore) tempFile() (*os.File, error) { + file, err := ioutil.TempFile(fs.tempPath, "temp-") + return file, err +} + func (fs *Datastore) walk(path string, qrb *query.ResultBuilder) error { dir, err := os.Open(path) if err != nil { diff --git a/flatfs_test.go b/flatfs_test.go index 8cf2743..9d490f6 100644 --- a/flatfs_test.go +++ b/flatfs_test.go @@ -187,7 +187,7 @@ func testStorage(p *params, t *testing.T) { return err } switch path { - case ".", "..", "SHARDING", flatfs.DiskUsageFile: + case ".", "..", "SHARDING", flatfs.DiskUsageFile, ".temp": // ignore case "_README": _, err := ioutil.ReadFile(absPath) @@ -950,9 +950,8 @@ func TestNoCluster(t *testing.T) { tolerance := math.Floor(idealFilesPerDir * 0.25) count := 0 for _, dir := range dirs { - if dir.Name() == flatfs.SHARDING_FN || - dir.Name() == flatfs.README_FN || - dir.Name() == flatfs.DiskUsageFile { + switch dir.Name() { + case flatfs.SHARDING_FN, flatfs.README_FN, flatfs.DiskUsageFile, ".temp": continue } count += 1