This repository was archived by the owner on Aug 23, 2023. It is now read-only.

update idx handling #574

Merged: 5 commits on Mar 22, 2017
4 changes: 1 addition & 3 deletions docker/docker-cluster/metrictank.ini
@@ -248,10 +248,8 @@ max-stale = 0
prune-interval = 3h
# synchronize index changes to cassandra. not all your nodes need to do this.
update-cassandra-index = true
#frequency at which we should update the metricDef lastUpdate field, use 0s for instant updates
#frequency at which we should update flush changes to cassandra. only relevant if update-cassandra-index is true.
update-interval = 4h
#fuzzyness factor for update-interval. should be in the range 0 > fuzzyness <= 1. With an updateInterval of 4hours and fuzzyness of 0.5, metricDefs will be updated every 4-6hours.
update-fuzzyness = 0.5
# enable SSL connection to cassandra
ssl = false
# cassandra CA certficate path when using SSL
4 changes: 1 addition & 3 deletions docker/docker-dev-custom-cfg-kafka/metrictank.ini
@@ -248,10 +248,8 @@ max-stale = 0
prune-interval = 3h
# synchronize index changes to cassandra. not all your nodes need to do this.
update-cassandra-index = true
#frequency at which we should update the metricDef lastUpdate field, use 0s for instant updates
#frequency at which we should update flush changes to cassandra. only relevant if update-cassandra-index is true.
update-interval = 4h
#fuzzyness factor for update-interval. should be in the range 0 > fuzzyness <= 1. With an updateInterval of 4hours and fuzzyness of 0.5, metricDefs will be updated every 4-6hours.
update-fuzzyness = 0.5
# enable SSL connection to cassandra
ssl = false
# cassandra CA certficate path when using SSL
4 changes: 1 addition & 3 deletions docs/config.md
@@ -297,10 +297,8 @@ max-stale = 0
prune-interval = 3h
# synchronize index changes to cassandra. not all your nodes need to do this.
update-cassandra-index = true
#frequency at which we should update the metricDef lastUpdate field, use 0s for instant updates
#frequency at which we should update flush changes to cassandra. only relevant if update-cassandra-index is true.
update-interval = 4h
#fuzzyness factor for update-interval. should be in the range 0 > fuzzyness <= 1. With an updateInterval of 4hours and fuzzyness of 0.5, metricDefs will be updated every 4-6hours.
update-fuzzyness = 0.5
# enable SSL connection to cassandra
ssl = false
# cassandra CA certficate path when using SSL
11 changes: 4 additions & 7 deletions docs/metadata.md
@@ -25,7 +25,7 @@ enabled = true
This is the recommended option because it persists.

* type: Memory-Idx for search queries, backed by Cassandra for persistence
* persistence: persists new metricDefinitions as they are seen. At startup, the internal memory index is rebuilt from all metricDefinitions that have been stored in Cassandra. Metrictank won’t be considered ready (be able to ingest metrics or handle searches) until the index has been completely rebuilt.
* persistence: persists new metricDefinitions as they are seen and every update-interval. At startup, the internal memory index is rebuilt from all metricDefinitions that have been stored in Cassandra. Metrictank won’t be considered ready (be able to ingest metrics or handle searches) until the index has been completely rebuilt.
* efficiency: On low end hardware the index rebuilds at about 70000 metricDefinitions per second. Saving new metrics works pretty fast.

Metrictank will initialize Cassandra with the needed keyspace and table. However, if you are running a Cassandra cluster then you should tune the keyspace to suit your deployment.
@@ -51,8 +51,6 @@ num-conns = 10
write-queue-size = 100000
```

Note:
* All metrictanks write to Cassandra. this is not very efficient.

## The anatomy of a metricdef

@@ -65,16 +63,15 @@ The schema is as follows:
```
type MetricDefinition struct {
Id string
OrgId int
OrgId int
Partition int
Name string // graphite format
Metric string // kairosdb format (like graphite, but not including some tags)
Interval int
Unit string
Mtype string
Tags []string
LastUpdate int64
Nodes map[string]string
NodeCount int
LastUpdate int64
}
```

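As an illustrative back-of-the-envelope figure (the numbers below are not from this PR): at the roughly 70000 metricDefinitions per second rebuild rate quoted in the efficiency note above, an index of 10 million definitions would take about 10,000,000 / 70,000 ≈ 143 seconds, i.e. around two and a half minutes at startup before the node reports ready.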
2 changes: 2 additions & 0 deletions docs/metrics.md
@@ -132,6 +132,8 @@ how many insert queries for a metric failed (triggered by an add or an update)
time inserts spent in queue before being executed
* `idx.cassandra.update`:
the duration of an update of one metric to the cassandra idx, including the update to the in-memory index, excluding any insert/delete queries
* `idx.cassandra.save.skipped`:
how many saves have been skipped due to the writeQueue being full
* `idx.memory.add`:
the duration of an add of a metric to the memory idx
* `idx.memory.ops.add`:
95 changes: 59 additions & 36 deletions idx/cassandra/cassandra.go
@@ -3,7 +3,6 @@ package cassandra
import (
"flag"
"fmt"
"math/rand"
"strings"
"sync"
"time"
@@ -60,7 +59,9 @@ var (
statPruneDuration = stats.NewLatencyHistogram15s32("idx.cassandra.prune")
// metric idx.cassandra.delete is the duration of a delete of one or more metrics from the cassandra idx, including the delete from the in-memory index and the delete query
statDeleteDuration = stats.NewLatencyHistogram15s32("idx.cassandra.delete")
errmetrics = cassandra.NewErrMetrics("idx.cassandra")
// metric idx.cassandra.save.skipped is how many saves have been skipped due to the writeQueue being full
statSaveSkipped = stats.NewCounter32("idx.cassandra.save.skipped")
errmetrics = cassandra.NewErrMetrics("idx.cassandra")

Enabled bool
ssl bool
@@ -80,7 +81,7 @@ var (
pruneInterval time.Duration
updateCassIdx bool
updateInterval time.Duration
updateFuzzyness float64
updateInterval32 uint32
)

func ConfigSetup() *flag.FlagSet {
@@ -95,7 +96,6 @@ func ConfigSetup() *flag.FlagSet {
casIdx.IntVar(&writeQueueSize, "write-queue-size", 100000, "Max number of metricDefs allowed to be unwritten to cassandra")
casIdx.BoolVar(&updateCassIdx, "update-cassandra-index", true, "synchronize index changes to cassandra. not all your nodes need to do this.")
casIdx.DurationVar(&updateInterval, "update-interval", time.Hour*3, "frequency at which we should update the metricDef lastUpdate field, use 0s for instant updates")
casIdx.Float64Var(&updateFuzzyness, "update-fuzzyness", 0.5, "fuzzyness factor for update-interval. should be in the range 0 > fuzzyness <= 1. With an updateInterval of 4hours and fuzzyness of 0.5, metricDefs will be updated every 4-6hours.")
casIdx.DurationVar(&maxStale, "max-stale", 0, "clear series from the index if they have not been seen for this much time.")
casIdx.DurationVar(&pruneInterval, "prune-interval", time.Hour*3, "Interval at which the index should be checked for stale series.")
casIdx.IntVar(&protoVer, "protocol-version", 4, "cql protocol version to use")
@@ -154,6 +154,7 @@ func New() *CasIdx {
if updateCassIdx {
idx.writeQueue = make(chan writeReq, writeQueueSize)
}
updateInterval32 = uint32(updateInterval.Nanoseconds() / int64(time.Second))
return idx
}

@@ -236,46 +237,68 @@ func (c *CasIdx) Stop() {
func (c *CasIdx) AddOrUpdate(data *schema.MetricData, partition int32) idx.Archive {
pre := time.Now()
existing, inMemory := c.MemoryIdx.Get(data.Id)
updateIdx := false
archive := c.MemoryIdx.AddOrUpdate(data, partition)
stat := statUpdateDuration
if !inMemory {
stat = statAddDuration
}
if !updateCassIdx {
stat.Value(time.Since(pre))
return archive
}

if inMemory {
if existing.Partition == partition {
var oldest time.Time
if updateInterval > 0 {
oldest = time.Now().Add(-1 * updateInterval).Add(-1 * time.Duration(rand.Int63n(updateInterval.Nanoseconds()*int64(updateFuzzyness*100)/100)))
} else {
oldest = time.Now()
}
updateIdx = (existing.LastUpdate < oldest.Unix())
} else {
if updateCassIdx {
// the partition of the metric has changed. So we need to delete
// the current metricDef from cassandra. We do this in a separate
// goroutine as we dont want to block waiting for the delete to succeed.
go func() {
if err := c.deleteDef(&existing); err != nil {
log.Error(3, err.Error())
}
}()
now := uint32(time.Now().Unix())

// Cassandra uses partition id as the partitioning key, so an "update" that changes the partition for
// an existing metricDef will just create a new row in the table and wont remove the old row.
// So we need to explicitly delete the old entry.
if inMemory && existing.Partition != partition {
go func() {
if err := c.deleteDef(&existing); err != nil {
log.Error(3, err.Error())
}
updateIdx = true
}
} else {
updateIdx = true
stat = statAddDuration
}()
}

if updateIdx {
archive := c.MemoryIdx.AddOrUpdate(data, partition)
if updateCassIdx {
log.Debug("cassandra-idx updating def in index.")
c.writeQueue <- writeReq{recvTime: time.Now(), def: &archive.MetricDefinition}
}
// check if we need to save to cassandra.
if archive.LastSave >= (now - updateInterval32) {
stat.Value(time.Since(pre))
return archive
}
return existing

// This is just a safety precaution to prevent corrupt index entries.
// This ensures that the index entry always contains the correct metricDefinition data.
if inMemory {
archive.MetricDefinition = *schema.MetricDefinitionFromMetricData(data)
@Dieterbe (Contributor) commented on Mar 21, 2017:

note that the id is generated from (almost) all the properties. properties not included in the name are Partition, Lastupdate (and Name but Name should always be same as Metric so it's not relevant here, that's still something we have to clean up at some point btw). MemoryIdx.AddOrUpdate already made sure to update Partition and LastUpdate, so i see no need for this.

Contributor:

aha ok. so after this has run for a while, at some point we'll be able to take out these lines again?

Member Author:

yes. Unless we introduce metadata fields in future that do not contribute to the generated id.

archive.MetricDefinition.Partition = partition
Contributor:

MemoryIdx.AddOrUpdate already made sure to update/set Partition field correctly?

}

// if the entry has not been saved for 1.5x updateInterval
Contributor:

why do we use 1.5x the interval? wouldn't it make more sense (and be easier to reason about) to start doing blocking writes at exactly the 1 updateInterval mark?

BTW the compiler should optimize uint divisions by factors of two, i don't think we need to do it manually?

Member Author:

No. Writes aren't tried until exactly the updateInterval or greater has passed. If you forced a blocking write at exactly the 1 updateInterval then you would only ever try the non-blocking write once, forcing all saves to be completed within 2x your metric interval. That is way too aggressive.

Member Author:

as for why 1.5X, because that is what we have been using in hosted-metrics. ie updateFuzziness of 0.5 leading to updates to happen between updateInterval and updateInterval x 1.5

// then perform a blocking save. (bit shifting to the right 1 bit, divides by 2)
if archive.LastSave < (now - updateInterval32 - (updateInterval32 >> 1)) {
log.Debug("cassandra-idx updating def in index.")
c.writeQueue <- writeReq{recvTime: time.Now(), def: &archive.MetricDefinition}
archive.LastSave = now
c.MemoryIdx.Update(archive)
Contributor:

Should we maybe collect some statistics that track how many % of the updates happen due to the if condition being met and how many happen via the non-blocking writes? That might be a good indicator to look at if we seem to hit a writes-per-time limitation.

Member Author:

That is a good idea.

Member Author:

i added a counter idx.cassandra.save.skipped to keep track of how many saves are being skipped due to the writeQ being full. Spikes in this counter would be normal, but continued growth over an extended time would indicate a performance problem.

} else {
// perform a non-blocking write to the writeQueue. If the queue is full, then
// this will fail and we wont update the LastSave timestamp. The next time
// the metric is seen, the previous lastSave timestamp will still be in place and so
// we will try and save again. This will continue until we are successful or the
// lastSave timestamp become more then 1.5 x UpdateInterval, in which case we will
// do a blocking write to the queue.
select {
case c.writeQueue <- writeReq{recvTime: time.Now(), def: &archive.MetricDefinition}:
@replay (Contributor) commented on Mar 21, 2017:

shouldn't time.Unix(now, 0) be faster than time.Now()?

Member Author:

faster? yes. But as we use this for measuring how long items are spending in the queue, time.Unix(now, 0) does not provide the required precision.

archive.LastSave = now
c.MemoryIdx.Update(archive)
default:
statSaveSkipped.Inc()
log.Debug("writeQueue is full, update not saved.")
}
}

stat.Value(time.Since(pre))
return archive
}

func (c *CasIdx) rebuildIndex() {
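To make the new save logic in AddOrUpdate easier to follow, here is a minimal standalone sketch of the thresholds discussed in the review above. The `saveDecision` helper and its parameters are hypothetical (not part of metrictank); it only mirrors the LastSave comparisons in the diff: within update-interval of the last successful save nothing is written, between 1x and 1.5x the interval a non-blocking queue write is attempted (a full queue skips the save and increments `idx.cassandra.save.skipped`), and beyond 1.5x the write blocks until it is queued.

```
// Illustrative sketch only: saveDecision is a hypothetical helper mirroring
// the LastSave checks in CasIdx.AddOrUpdate above.
package main

import (
	"fmt"
	"time"
)

// saveDecision reports, for a given age of the last successful save (seconds)
// and the update interval (seconds), whether a save should be attempted and
// whether the write to the queue should block.
func saveDecision(sinceLastSave, updateInterval uint32) (attempt, blocking bool) {
	switch {
	case sinceLastSave <= updateInterval:
		// saved recently enough: skip, like the early return on LastSave
		return false, false
	case sinceLastSave <= updateInterval+(updateInterval>>1):
		// between 1x and 1.5x: non-blocking write; if the queue is full the
		// save is skipped and idx.cassandra.save.skipped is incremented
		return true, false
	default:
		// overdue by more than 1.5x the interval: blocking write to the queue
		return true, true
	}
}

func main() {
	interval := uint32(4 * time.Hour / time.Second) // update-interval = 4h as in the config diff
	for _, since := range []uint32{interval / 2, interval + 60, 2 * interval} {
		attempt, blocking := saveDecision(since, interval)
		fmt.Printf("since=%6ds attempt=%-5v blocking=%v\n", since, attempt, blocking)
	}
}
```

With the 4h default this means a given metricDef is flushed to Cassandra at most roughly once per 4 hours, and the code only falls back to a blocking queue write once the definition has gone unsaved for more than 6 hours.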