Skip to content

Commit

Permalink
Add central LRU cache that adjusts to available memory
Browse files Browse the repository at this point in the history
Hugo has always been an active user of in-memory caches, but before this commit we did nothing to control the memory usage.

One failing example would be loading lots of big JSON data files and unmarshaling them via `transform.Unmarshal`.

This commit consolidates all these caches into one single LRU cache with an eviction strategy that also considers used vs. available memory.

Hugo will try to limit its memory usage to 1/4 of total system memory, but this can be controlled with the `HUGO_MEMORYLIMIT` environment variable (a float value representing gigabytes).

A natural next step after this would be to use this cache for `.Content`.

Fixes #7425
Fixes #7437
Fixes #7436
Fixes #7882
Updates #7544
  • Loading branch information
bep committed Dec 23, 2020
1 parent f802bb2 commit 7360eb8
Show file tree
Hide file tree
Showing 70 changed files with 2,447 additions and 1,091 deletions.
499 changes: 499 additions & 0 deletions cache/memcache/memcache.go

Large diffs are not rendered by default.

178 changes: 178 additions & 0 deletions cache/memcache/memcache_test.go
Original file line number Diff line number Diff line change
@@ -0,0 +1,178 @@
// Copyright 2020 The Hugo Authors. All rights reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

package memcache

import (
"fmt"
"path/filepath"
"sync"
"testing"
"time"

qt "github.com/frankban/quicktest"
)

// TestCache checks that a partition invokes the create function only once per
// key while the entry is cached, and invokes it again after the cache has been
// cleared.
func TestCache(t *testing.T) {
	t.Parallel()
	c := qt.New(t)

	memCache := New(Config{})

	// Each call to newEntry yields the next integer, so the asserted values
	// reveal exactly how many times the cache asked for a fresh entry.
	var created int
	newEntry := func() Entry {
		created++
		return Entry{Value: created}
	}

	partition := memCache.GetOrCreatePartition("a", ClearNever)

	for round := 0; round < 5; round++ {
		first, err := partition.GetOrCreate("a1", newEntry)
		c.Assert(err, qt.IsNil)
		c.Assert(first, qt.Equals, 1)

		second, err := partition.GetOrCreate("a2", newEntry)
		c.Assert(err, qt.IsNil)
		c.Assert(second, qt.Equals, 2)
	}

	memCache.Clear()

	// With the cache emptied, "a2" must be created anew: the third creation.
	recreated, err := partition.GetOrCreate("a2", newEntry)
	c.Assert(err, qt.IsNil)
	c.Assert(recreated, qt.Equals, 3)
}

// TestCacheConcurrent hammers the cache from several goroutines that all ask
// for the same set of keys and verifies that every lookup returns the value
// belonging to its key.
func TestCacheConcurrent(t *testing.T) {
	t.Parallel()

	c := qt.New(t)

	var wg sync.WaitGroup

	cache := New(Config{})

	// create returns a create function producing an Entry that holds i.
	create := func(i int) func() Entry {
		return func() Entry {
			return Entry{Value: i}
		}
	}

	for i := 0; i < 10; i++ {
		wg.Add(1)
		go func() {
			defer wg.Done()
			for j := 0; j < 100; j++ {
				id := fmt.Sprintf("id%d", j)
				v, err := cache.getOrCreate("a", id, create(j))
				// Use Check rather than Assert here: Assert ends in
				// t.FailNow, which must only be called from the goroutine
				// running the test function, not from goroutines it spawns.
				if !c.Check(err, qt.IsNil) {
					return
				}
				c.Check(v, qt.Equals, j)
			}
		}()
	}
	wg.Wait()
}

// TestCacheMemStats inspects the cache's statistics right after construction,
// fills the cache with 20 items, then lowers the maximum size and expects the
// item count to have dropped to 10 after waiting.
func TestCacheMemStats(t *testing.T) {
	t.Parallel()
	c := qt.New(t)

	cfg := Config{
		ItemsToPrune:  10,
		CheckInterval: 500 * time.Millisecond,
	}
	memCache := New(cfg)

	stats := memCache.stats

	// Initial state: a start snapshot has been taken, no current snapshot
	// yet, some memory is available, and nothing has been stored.
	c.Assert(stats.memstatsStart.Alloc > 0, qt.Equals, true)
	c.Assert(stats.memstatsCurrent.Alloc, qt.Equals, uint64(0))
	c.Assert(stats.availableMemory > 0, qt.Equals, true)
	c.Assert(stats.numItems, qt.Equals, uint64(0))

	var created int
	newEntry := func() Entry {
		created++
		return Entry{Value: created}
	}

	for n := 1; n <= 20; n++ {
		key := fmt.Sprintf("b%d", n)
		_, err := memCache.getOrCreate("a", key, newEntry)
		c.Assert(err, qt.IsNil)
	}

	c.Assert(stats.getNumItems(), qt.Equals, uint64(20))

	memCache.cache.SetMaxSize(10)
	// Wait slightly longer than the configured CheckInterval; presumably
	// this lets the periodic check observe the new size (TODO confirm).
	time.Sleep(600 * time.Millisecond)
	c.Assert(int(stats.getNumItems()), qt.Equals, 10)
}

// TestSplitBasePathAndExt checks the two values returned by
// splitBasePathAndExt: for the paths below, the first path element and the
// file extension without its leading dot.
func TestSplitBasePathAndExt(t *testing.T) {
	t.Parallel()
	c := qt.New(t)

	cases := []struct {
		path     string
		wantBase string
		wantExt  string
	}{
		{path: "a/b.json", wantBase: "a", wantExt: "json"},
		{path: "a/b/c/d.json", wantBase: "a", wantExt: "json"},
	}

	for idx, tc := range cases {
		comment := qt.Commentf("test %d", idx)
		gotBase, gotExt := splitBasePathAndExt(tc.path)

		c.Assert(gotBase, qt.Equals, tc.wantBase, comment)
		c.Assert(gotExt, qt.Equals, tc.wantExt, comment)
	}
}

// TestCleanKey pins the normalized form CleanKey produces for OS-specific
// separators, repeated slashes, a key without a directory and a key without
// an extension.
func TestCleanKey(t *testing.T) {
	c := qt.New(t)

	cases := []struct {
		in   string
		want string
	}{
		{in: filepath.FromSlash("a/b/c.js"), want: "a/b/c.js"},
		{in: "a//b////c.js", want: "a/b/c.js"},
		{in: "a.js", want: "_root/a.js"},
		{in: "b/a", want: "b/a.unkn"},
	}

	for _, tc := range cases {
		c.Assert(CleanKey(tc.in), qt.Equals, tc.want)
	}
}

// TestKeyValid pins which keys keyValid accepts. Of the keys below, only the
// relative, slash-separated one with a non-empty extension is valid.
func TestKeyValid(t *testing.T) {
	c := qt.New(t)

	cases := []struct {
		key   string
		valid bool
	}{
		{key: "a/b.j", valid: true},
		{key: "a/b.", valid: false},
		{key: "a/b", valid: false},
		{key: "/a/b.txt", valid: false},
		{key: "a\\b.js", valid: false},
	}

	for _, tc := range cases {
		c.Assert(keyValid(tc.key), qt.Equals, tc.valid)
	}
}

// TestInsertKeyPathElement verifies that InsertKeyPathElements places the
// given elements, in order, before the last path element of the key, and that
// an empty element is left out.
func TestInsertKeyPathElement(t *testing.T) {
	c := qt.New(t)

	const key = "a/b.j"

	oneElement := InsertKeyPathElements(key, "en")
	c.Assert(oneElement, qt.Equals, "a/en/b.j")

	twoElements := InsertKeyPathElements(key, "en", "foo")
	c.Assert(twoElements, qt.Equals, "a/en/foo/b.j")

	// The empty first element does not show up in the result.
	emptyFirst := InsertKeyPathElements(key, "", "foo")
	c.Assert(emptyFirst, qt.Equals, "a/foo/b.j")
}

// TestShouldEvict is currently a placeholder: its only assertion is commented
// out, so the test passes without exercising anything.
func TestShouldEvict(t *testing.T) {
	// TODO1 remove?
	// The disabled check below called shouldEvict with an empty Entry, the
	// ClearNever policy and a path identity in the assets component folder,
	// and expected it to return true.
	//c := qt.New(t)

	//fmt.Println("=>", CleanKey("kkk"))
	//c.Assert(shouldEvict("key", Entry{}, ClearNever, identity.NewPathIdentity(files.ComponentFolderAssets, "a/b/c.js")), qt.Equals, true)
}
78 changes: 0 additions & 78 deletions cache/namedmemcache/named_cache.go

This file was deleted.

80 changes: 0 additions & 80 deletions cache/namedmemcache/named_cache_test.go

This file was deleted.

2 changes: 1 addition & 1 deletion commands/commands.go
Original file line number Diff line number Diff line change
Expand Up @@ -301,7 +301,7 @@ func (cc *hugoBuilderCommon) handleFlags(cmd *cobra.Command) {
cmd.Flags().BoolP("path-warnings", "", false, "print warnings on duplicate target paths etc.")
cmd.Flags().StringVarP(&cc.cpuprofile, "profile-cpu", "", "", "write cpu profile to `file`")
cmd.Flags().StringVarP(&cc.memprofile, "profile-mem", "", "", "write memory profile to `file`")
cmd.Flags().BoolVarP(&cc.printm, "print-mem", "", false, "print memory usage to screen at intervals")
cmd.Flags().BoolVarP(&cc.printm, "printMem", "", false, "print memory usage to screen at intervals")
cmd.Flags().StringVarP(&cc.mutexprofile, "profile-mutex", "", "", "write Mutex profile to `file`")
cmd.Flags().StringVarP(&cc.traceprofile, "trace", "", "", "write trace to `file` (not useful in general)")

Expand Down
22 changes: 7 additions & 15 deletions commands/hugo.go
Original file line number Diff line number Diff line change
Expand Up @@ -417,8 +417,14 @@ func (c *commandeer) initMemTicker() func() {
quit := make(chan struct{})
printMem := func() {
var m runtime.MemStats
var cacheDropped int
h := c.hugo()
if h != nil && h.MemCache != nil {
cacheDropped = h.MemCache.GetDropped()
}

runtime.ReadMemStats(&m)
fmt.Printf("\n\nAlloc = %v\nTotalAlloc = %v\nSys = %v\nNumGC = %v\n\n", formatByteCount(m.Alloc), formatByteCount(m.TotalAlloc), formatByteCount(m.Sys), m.NumGC)
fmt.Printf("\n\nAlloc = %v\nTotalAlloc = %v\nSys = %v\nNumGC = %v\nMemCacheDropped = %d\nConfiguredMemoryLimit = %v\n\n", helpers.FormatByteCount(m.Alloc), helpers.FormatByteCount(m.TotalAlloc), helpers.FormatByteCount(m.Sys), m.NumGC, cacheDropped, helpers.FormatByteCount(config.GetMemoryLimit()))
}

go func() {
Expand Down Expand Up @@ -1188,17 +1194,3 @@ func pickOneWriteOrCreatePath(events []fsnotify.Event) string {

return name
}

// formatByteCount renders b as a human-readable size using decimal units
// (powers of 1000). Values below 1000 are printed as whole bytes, e.g.
// "999 B"; larger values are scaled to the biggest fitting unit and printed
// with one decimal, e.g. "1.5 kB" or "1.2 GB".
func formatByteCount(b uint64) string {
	const (
		unit     = 1000
		prefixes = "kMGTPE"
	)

	if b < unit {
		return fmt.Sprintf("%d B", b)
	}

	// Find the largest power of 1000 that does not exceed b, keeping track of
	// which prefix letter belongs to it.
	divisor := int64(unit)
	prefixIdx := 0
	remaining := b / unit
	for remaining >= unit {
		divisor *= unit
		prefixIdx++
		remaining /= unit
	}

	scaled := float64(b) / float64(divisor)
	return fmt.Sprintf("%.1f %cB", scaled, prefixes[prefixIdx])
}
4 changes: 2 additions & 2 deletions commands/static_syncer.go
Original file line number Diff line number Diff line change
Expand Up @@ -79,9 +79,9 @@ func (s *staticSyncer) syncsStaticEvents(staticEvents []fsnotify.Event) error {

fromPath := ev.Name

relPath, found := sourceFs.MakePathRelative(fromPath)
relPath := sourceFs.MakePathRelative(fromPath)

if !found {
if relPath == "" {
// Not member of this virtual host.
continue
}
Expand Down
Loading

0 comments on commit 7360eb8

Please sign in to comment.