-
Notifications
You must be signed in to change notification settings - Fork 1.2k
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
- Loading branch information
1 parent
fe5ce80
commit 52bd24a
Showing
1 changed file
with
286 additions
and
0 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,286 @@ | ||
// +build integration | ||
|
||
/* | ||
* Copyright 2018 Dgraph Labs, Inc. and Contributors | ||
* | ||
* Licensed under the Apache License, Version 2.0 (the "License"); | ||
* you may not use this file except in compliance with the License. | ||
* You may obtain a copy of the License at | ||
* | ||
* http://www.apache.org/licenses/LICENSE-2.0 | ||
* | ||
* Unless required by applicable law or agreed to in writing, software | ||
* distributed under the License is distributed on an "AS IS" BASIS, | ||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | ||
* See the License for the specific language governing permissions and | ||
* limitations under the License. | ||
*/ | ||
package badger | ||
|
||
import ( | ||
"bytes" | ||
"context" | ||
"flag" | ||
"fmt" | ||
"log" | ||
"math/rand" | ||
"net/http" | ||
"os" | ||
"sync" | ||
"sync/atomic" | ||
"testing" | ||
"time" | ||
|
||
"github.com/dgraph-io/badger/options" | ||
"github.com/dgraph-io/badger/y" | ||
"github.com/paulbellamy/ratecounter" | ||
) | ||
|
||
var ( | ||
numKeys = flag.Float64("keys_mil", 10.0, "How many million keys to write.") | ||
valueSize = flag.Int("valsz", 128, "Value size in bytes.") | ||
dir = flag.String("dir", "", "Base dir for writes.") | ||
skipLoad = flag.Bool("skipLoad", false, "Flag to skip loading and run delete/compaction only") | ||
loadOnly = flag.Bool("loadOnly", false, "Load the data and stop") | ||
bdb *DB | ||
) | ||
|
||
const mil float64 = 1000000 | ||
|
||
func TestOfflineCompaction(t *testing.T) { | ||
go http.ListenAndServe(":8080", nil) | ||
if *skipLoad { | ||
fmt.Printf("Using existing db at: %s\n", *dir) | ||
} else { | ||
openDB(true, 2) | ||
fmt.Printf("TOTAL KEYS TO WRITE: %s\n", humanize(int64(*numKeys*mil))) | ||
loadData() | ||
// TODO print some stats (maybe run badger_info) | ||
} | ||
|
||
if *loadOnly { | ||
fmt.Println("Skipping Deletion, GC and compaction") | ||
return | ||
} | ||
|
||
openDB(false, 2) | ||
fmt.Print("Deleting some keys\n") | ||
deleteData() | ||
|
||
fmt.Println("Purging Older Versions") | ||
y.Check(bdb.PurgeOlderVersions()) | ||
fmt.Println("Running Value Log GC") | ||
y.Check(bdb.RunValueLogGCOffline()) | ||
y.Check(bdb.Close()) | ||
openDB(false, 0) | ||
fmt.Println("Running offline compaction") | ||
y.Check(bdb.CompactLSMTreeOffline()) | ||
fmt.Println("Closing DB") | ||
// TODO print some stats (maybe run badger_info) | ||
y.Check(bdb.Close()) | ||
fmt.Println("Checking DB") | ||
checkData() | ||
} | ||
|
||
func openDB(remove bool, numCompactors int) { | ||
opt := DefaultOptions | ||
opt.TableLoadingMode = options.MemoryMap | ||
opt.Dir = *dir + "/badger" | ||
opt.ValueDir = opt.Dir | ||
opt.SyncWrites = true | ||
opt.NumCompactors = numCompactors | ||
|
||
// Open DB. | ||
if remove { // Remove existing DB if flag set | ||
fmt.Println("Removing existing Badger DB") | ||
y.Check(os.RemoveAll(*dir + "/badger")) | ||
} | ||
fmt.Println("Opening Badger DB") | ||
os.MkdirAll(*dir+"/badger", 0777) | ||
var err error | ||
bdb, err = Open(opt) | ||
if err != nil { | ||
log.Fatalf("while opening badger: %v", err) | ||
} | ||
} | ||
|
||
func loadData() { | ||
rc := ratecounter.NewRateCounter(time.Minute) | ||
var counter int64 | ||
ctx, cancel := context.WithCancel(context.Background()) | ||
go func() { | ||
var count int64 | ||
t := time.NewTicker(time.Second) | ||
defer t.Stop() | ||
for { | ||
select { | ||
case <-t.C: | ||
fmt.Printf("[%04d] Write key rate per minute: %s. Total: %s\n", | ||
count, | ||
humanize(rc.Rate()), | ||
humanize(atomic.LoadInt64(&counter))) | ||
count++ | ||
case <-ctx.Done(): | ||
return | ||
} | ||
} | ||
}() | ||
|
||
N := 12 | ||
var wg sync.WaitGroup | ||
for i := 0; i < N; i++ { | ||
wg.Add(1) | ||
go func(proc int) { | ||
entries := make([]*entry, 1000) | ||
for i := 0; i < len(entries); i++ { | ||
e := new(entry) | ||
e.Key = make([]byte, 22) | ||
e.Value = make([]byte, *valueSize) | ||
entries[i] = e | ||
} | ||
|
||
var written float64 | ||
for written < (*numKeys*mil)/float64(N) { | ||
wrote := float64(writeBatch(entries)) | ||
|
||
wi := int64(wrote) | ||
atomic.AddInt64(&counter, wi) | ||
rc.Incr(wi) | ||
|
||
written += wrote | ||
} | ||
wg.Done() | ||
}(i) | ||
} | ||
// wg.Add(1) // Block | ||
wg.Wait() | ||
cancel() | ||
bdb.Close() | ||
} | ||
|
||
func deleteData() { | ||
rc := ratecounter.NewRateCounter(time.Minute) | ||
var counter int64 | ||
ctx, cancel := context.WithCancel(context.Background()) | ||
go func() { | ||
var count int64 | ||
t := time.NewTicker(time.Second) | ||
defer t.Stop() | ||
for { | ||
select { | ||
case <-t.C: | ||
fmt.Printf("[%04d] Delete key rate per minute: %s. Total: %s\n", | ||
count, | ||
humanize(rc.Rate()), | ||
humanize(atomic.LoadInt64(&counter))) | ||
count++ | ||
case <-ctx.Done(): | ||
return | ||
} | ||
} | ||
}() | ||
|
||
N := 12 | ||
var wg sync.WaitGroup | ||
for i := 0; i < N; i++ { | ||
wg.Add(1) | ||
go func(proc int) { | ||
var deleted float64 | ||
for deleted < (*numKeys*mil/3)/float64(N) { | ||
del := float64(deleteBatch(1000)) | ||
|
||
di := int64(del) | ||
atomic.AddInt64(&counter, di) | ||
rc.Incr(di) | ||
|
||
deleted += del | ||
} | ||
wg.Done() | ||
}(i) | ||
} | ||
// wg.Add(1) // Block | ||
wg.Wait() | ||
cancel() | ||
} | ||
|
||
// entry is a reusable key/value buffer pair used when building write batches.
type entry struct {
	Key, Value []byte // raw key and value bytes
	Meta       byte   // reset to 0 by fillEntry
}
|
||
func fillEntry(e *entry) { | ||
k := rand.Int() % int(*numKeys*mil) | ||
key := fmt.Sprintf("vsz=%05d-k=%010d", *valueSize, k) // 22 bytes. | ||
if cap(e.Key) < len(key) { | ||
e.Key = make([]byte, 2*len(key)) | ||
} | ||
e.Key = e.Key[:len(key)] | ||
copy(e.Key, key) | ||
|
||
rand.Read(e.Value) | ||
e.Meta = 0 | ||
} | ||
|
||
func writeBatch(entries []*entry) int { | ||
for _, e := range entries { | ||
fillEntry(e) | ||
} | ||
|
||
txn := bdb.NewTransaction(true) | ||
|
||
for _, e := range entries { | ||
y.Check(txn.Set(e.Key, e.Value)) | ||
} | ||
y.Check(txn.Commit(nil)) | ||
|
||
return len(entries) | ||
} | ||
|
||
func deleteBatch(batchSize int) (count int) { | ||
txn := bdb.NewTransaction(true) | ||
for i := 0; i < batchSize; i++ { | ||
k := rand.Int() % int(*numKeys*mil) | ||
key := fmt.Sprintf("vsz=%05d-k=%010d", *valueSize, k) // 22 bytes. | ||
err := txn.Delete([]byte(key)) | ||
if err != ErrKeyNotFound { | ||
y.Check(err) | ||
} | ||
count++ | ||
} | ||
y.Check(txn.Commit(nil)) | ||
return | ||
} | ||
|
||
func checkData() { | ||
openDB(false, 2) | ||
txn := bdb.NewTransaction(false) | ||
opts := DefaultIteratorOptions | ||
opts.PrefetchValues = false | ||
opts.AllVersions = true | ||
it := txn.NewIterator(opts) | ||
var ( | ||
prev []byte | ||
count int64 | ||
) | ||
for it.Rewind(); it.Valid(); it.Next() { | ||
item := it.Item() | ||
if bytes.Compare(prev, item.Key()) == 0 { | ||
log.Fatalf("Multiple key versions found %s\n", item.Key()) | ||
} | ||
y.SafeCopy(prev, item.Key()) | ||
count++ | ||
} | ||
fmt.Printf("%d keys successfully traversed\n", count) | ||
y.Check(bdb.Close()) | ||
} | ||
|
||
// humanize renders n with two decimals, scaled to millions ("M" suffix) or
// thousands ("K" suffix) once it reaches those magnitudes; smaller values,
// including negative ones, are printed unscaled with no suffix.
func humanize(n int64) string {
	const (
		thousand = 1000
		million  = 1000000
	)

	v := float64(n)
	switch {
	case n >= million:
		return fmt.Sprintf("%6.2fM", v/1000000.0)
	case n >= thousand:
		return fmt.Sprintf("%6.2fK", v/1000.0)
	default:
		return fmt.Sprintf("%5.2f", v)
	}
}