Skip to content
This repository was archived by the owner on Aug 23, 2023. It is now read-only.

Commit 63b34a5

Browse files
authored
Merge pull request #1303 from bloomberg/fix_overpruning
fix index corruption: make sure defBy{Id,TagSet} use same pointers
2 parents 7b57297 + 2bcfbc4 commit 63b34a5

File tree

1 file changed

+24
-19
lines changed

1 file changed

+24
-19
lines changed

idx/memory/memory.go

+24-19
Original file line numberDiff line numberDiff line change
@@ -346,10 +346,6 @@ func (m *UnpartitionedMemoryIdx) AddOrUpdate(mkey schema.MKey, data *schema.Metr
346346
statMetricsActive.Inc()
347347
statAddDuration.Value(time.Since(pre))
348348

349-
if TagSupport {
350-
m.indexTags(def)
351-
}
352-
353349
return archive, 0, false
354350
}
355351

@@ -441,10 +437,6 @@ func (m *UnpartitionedMemoryIdx) Load(defs []schema.MetricDefinition) int {
441437

442438
m.add(def)
443439

444-
if TagSupport {
445-
m.indexTags(def)
446-
}
447-
448440
// as we are loading the metricDefs from a persistent store, set the lastSave
449441
// to the lastUpdate timestamp. This won't exactly match the true lastSave Timstamp,
450442
// but it will be close enough and it will always be true that the lastSave was at
@@ -471,13 +463,20 @@ func (m *UnpartitionedMemoryIdx) add(def *schema.MetricDefinition) idx.Archive {
471463
IrId: irId,
472464
}
473465

474-
if TagSupport && len(def.Tags) > 0 {
475-
if _, ok := m.defById[def.Id]; !ok {
476-
m.defById[def.Id] = archive
477-
statAdd.Inc()
478-
log.Debugf("memory-idx: adding %s to DefById", path)
466+
if TagSupport {
467+
// Even if there are no tags, index at least "name". It's important to use the definition
468+
// in the archive pointer that we add to defById, because the pointers must reference the
469+
// same underlying object in m.defById and m.defByTagSet
470+
m.indexTags(&archive.MetricDefinition)
471+
472+
if len(def.Tags) > 0 {
473+
if _, ok := m.defById[def.Id]; !ok {
474+
m.defById[def.Id] = archive
475+
statAdd.Inc()
476+
log.Debugf("memory-idx: adding %s to DefById", path)
477+
}
478+
return *archive
479479
}
480-
return *archive
481480
}
482481

483482
if m.findCache != nil {
@@ -1433,17 +1432,23 @@ DEFS:
14331432

14341433
toPruneUntagged[def.OrgId][n.Path] = struct{}{}
14351434
} else {
1436-
defs := m.defByTagSet.defs(def.OrgId, def.NameWithTags())
1435+
defName := def.NameWithTags()
1436+
defs := m.defByTagSet.defs(def.OrgId, defName)
14371437
// if any other MetricDef with the same tag set is not expired yet,
14381438
// then we do not want to prune any of them
1439-
for def := range defs {
1440-
if atomic.LoadInt64(&def.LastUpdate) >= cutoff {
1439+
for sdef := range defs {
1440+
if atomic.LoadInt64(&sdef.LastUpdate) >= cutoff {
14411441
continue DEFS
14421442
}
14431443
}
14441444

1445-
for def := range defs {
1446-
toPruneTagged[def.OrgId][def.Id] = struct{}{}
1445+
for sdef := range defs {
1446+
if defName != sdef.NameWithTags() {
1447+
corruptIndex.Inc()
1448+
log.Errorf("Almost added bad def to prune list: def=%v, sdef=%v", def, sdef)
1449+
} else {
1450+
toPruneTagged[sdef.OrgId][sdef.Id] = struct{}{}
1451+
}
14471452
}
14481453
}
14491454
}

0 commit comments

Comments
 (0)