Skip to content

Commit

Permalink
Add ForceFlush method to TracerProvider (#1608)
Browse files Browse the repository at this point in the history
* Add ForceFlush method to TracerProvider

The specification requires that a TracerProvider have a ForceFlush
method that can be set with a timeout, return any error to the caller,
and have all the registered span processors export their spans. This
updates the SpanProcessor.ForceFlush method to accept a context and
return an error and plumbs this method into a new ForceFlush method of
the SDK TracerProvider.

Additionally, this corrects the TracerProvider Shutdown method. This
method as well needs to return to the caller any failure it encounters
according to the specification. This returns an error if it cannot type
assert the spanProcessorStates or if shutting down a span processor
results in an error.

Resolves #1606

* Add changes to changelog

* Apply suggestions from code review

Co-authored-by: Steven E. Harris <seh@panix.com>

* Cancel export context when BSP stops

* Defer cancel call in BSP span processor funcs

Co-authored-by: Steven E. Harris <seh@panix.com>
  • Loading branch information
MrAlias and seh authored Mar 8, 2021
1 parent bd0bba4 commit 3dc91f2
Show file tree
Hide file tree
Showing 9 changed files with 92 additions and 34 deletions.
3 changes: 3 additions & 0 deletions CHANGELOG.md
Original file line number Diff line number Diff line change
Expand Up @@ -11,9 +11,12 @@ This project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0.htm
## Added

- Added `Marshler` config option to `otlphttp` to enable otlp over json or protobufs. (#1586)
- A `ForceFlush` method to the `"go.opentelemetry.io/otel/sdk/trace".TracerProvider` to flush all registered `SpanProcessor`s. (#1608)

### Changed

- Update the `ForceFlush` method signature to the `"go.opentelemetry.io/otel/sdk/trace".SpanProcessor` to accept a `context.Context` and return an error. (#1608)
- Update the `Shutdown` method to the `"go.opentelemetry.io/otel/sdk/trace".TracerProvider` return an error on shutdown failure. (#1608)
- The SimpleSpanProcessor will now shut down the enclosed `SpanExporter` and gracefully ignore subsequent calls to `OnEnd` after `Shutdown` is called. (#1612)
- `"go.opentelemetry.io/sdk/metric/controller.basic".WithPusher` is replaced with `WithExporter` to provide consistent naming across project. (#1656)
- Added non-empty string check for trace `Attribute` keys. (#1659)
Expand Down
31 changes: 22 additions & 9 deletions sdk/trace/batch_span_processor.go
Original file line number Diff line number Diff line change
Expand Up @@ -147,8 +147,8 @@ func (bsp *batchSpanProcessor) Shutdown(ctx context.Context) error {
}

// ForceFlush exports all ended spans that have not yet been exported.
func (bsp *batchSpanProcessor) ForceFlush() {
bsp.exportSpans()
func (bsp *batchSpanProcessor) ForceFlush(ctx context.Context) error {
return bsp.exportSpans(ctx)
}

func WithMaxQueueSize(size int) BatchSpanProcessorOption {
Expand Down Expand Up @@ -176,18 +176,19 @@ func WithBlocking() BatchSpanProcessorOption {
}

// exportSpans is a subroutine of processing and draining the queue.
func (bsp *batchSpanProcessor) exportSpans() {
func (bsp *batchSpanProcessor) exportSpans(ctx context.Context) error {
bsp.timer.Reset(bsp.o.BatchTimeout)

bsp.batchMutex.Lock()
defer bsp.batchMutex.Unlock()

if len(bsp.batch) > 0 {
if err := bsp.e.ExportSpans(context.Background(), bsp.batch); err != nil {
otel.Handle(err)
if err := bsp.e.ExportSpans(ctx, bsp.batch); err != nil {
return err
}
bsp.batch = bsp.batch[:0]
}
return nil
}

// processQueue removes spans from the `queue` channel until processor
Expand All @@ -196,12 +197,16 @@ func (bsp *batchSpanProcessor) exportSpans() {
func (bsp *batchSpanProcessor) processQueue() {
defer bsp.timer.Stop()

ctx, cancel := context.WithCancel(context.Background())
defer cancel()
for {
select {
case <-bsp.stopCh:
return
case <-bsp.timer.C:
bsp.exportSpans()
if err := bsp.exportSpans(ctx); err != nil {
otel.Handle(err)
}
case sd := <-bsp.queue:
bsp.batchMutex.Lock()
bsp.batch = append(bsp.batch, sd)
Expand All @@ -211,7 +216,9 @@ func (bsp *batchSpanProcessor) processQueue() {
if !bsp.timer.Stop() {
<-bsp.timer.C
}
bsp.exportSpans()
if err := bsp.exportSpans(ctx); err != nil {
otel.Handle(err)
}
}
}
}
Expand All @@ -220,11 +227,15 @@ func (bsp *batchSpanProcessor) processQueue() {
// drainQueue awaits the any caller that had added to bsp.stopWait
// to finish the enqueue, then exports the final batch.
func (bsp *batchSpanProcessor) drainQueue() {
ctx, cancel := context.WithCancel(context.Background())
defer cancel()
for {
select {
case sd := <-bsp.queue:
if sd == nil {
bsp.exportSpans()
if err := bsp.exportSpans(ctx); err != nil {
otel.Handle(err)
}
return
}

Expand All @@ -234,7 +245,9 @@ func (bsp *batchSpanProcessor) drainQueue() {
bsp.batchMutex.Unlock()

if shouldExport {
bsp.exportSpans()
if err := bsp.exportSpans(ctx); err != nil {
otel.Handle(err)
}
}
default:
close(bsp.queue)
Expand Down
9 changes: 5 additions & 4 deletions sdk/trace/batch_span_processor_test.go
Original file line number Diff line number Diff line change
Expand Up @@ -78,10 +78,11 @@ func TestNewBatchSpanProcessorWithNilExporter(t *testing.T) {
// These should not panic.
bsp.OnStart(context.Background(), span.(sdktrace.ReadWriteSpan))
bsp.OnEnd(span.(sdktrace.ReadOnlySpan))
bsp.ForceFlush()
err := bsp.Shutdown(context.Background())
if err != nil {
t.Error("Error shutting the BatchSpanProcessor down\n")
if err := bsp.ForceFlush(context.Background()); err != nil {
t.Errorf("failed to ForceFlush the BatchSpanProcessor: %v", err)
}
if err := bsp.Shutdown(context.Background()); err != nil {
t.Errorf("failed to Shutdown the BatchSpanProcessor: %v", err)
}
}

Expand Down
47 changes: 42 additions & 5 deletions sdk/trace/provider.go
Original file line number Diff line number Diff line change
Expand Up @@ -16,6 +16,7 @@ package trace // import "go.opentelemetry.io/otel/sdk/trace"

import (
"context"
"fmt"
"sync"
"sync/atomic"

Expand Down Expand Up @@ -201,19 +202,55 @@ func (p *TracerProvider) ApplyConfig(cfg Config) {
p.config.Store(&c)
}

// Shutdown shuts down the span processors in the order they were registered
// ForceFlush immediately exports all spans that have not yet been exported for
// all the registered span processors.
func (p *TracerProvider) ForceFlush(ctx context.Context) error {
spss, ok := p.spanProcessors.Load().(spanProcessorStates)
if !ok {
return fmt.Errorf("failed to load span processors")
}
if len(spss) == 0 {
return nil
}

for _, sps := range spss {
select {
case <-ctx.Done():
return ctx.Err()
default:
}

if err := sps.sp.ForceFlush(ctx); err != nil {
return err
}
}
return nil
}

// Shutdown shuts down the span processors in the order they were registered.
func (p *TracerProvider) Shutdown(ctx context.Context) error {
spss, ok := p.spanProcessors.Load().(spanProcessorStates)
if !ok || len(spss) == 0 {
if !ok {
return fmt.Errorf("failed to load span processors")
}
if len(spss) == 0 {
return nil
}

for _, sps := range spss {
select {
case <-ctx.Done():
return ctx.Err()
default:
}

var err error
sps.state.Do(func() {
if err := sps.sp.Shutdown(ctx); err != nil {
otel.Handle(err)
}
err = sps.sp.Shutdown(ctx)
})
if err != nil {
return err
}
}
return nil
}
Expand Down
20 changes: 10 additions & 10 deletions sdk/trace/provider_test.go
Original file line number Diff line number Diff line change
Expand Up @@ -32,9 +32,11 @@ func (t *basicSpanProcesor) Shutdown(context.Context) error {
return t.injectShutdownError
}

func (t *basicSpanProcesor) OnStart(parent context.Context, s ReadWriteSpan) {}
func (t *basicSpanProcesor) OnEnd(s ReadOnlySpan) {}
func (t *basicSpanProcesor) ForceFlush() {}
func (t *basicSpanProcesor) OnStart(context.Context, ReadWriteSpan) {}
func (t *basicSpanProcesor) OnEnd(ReadOnlySpan) {}
func (t *basicSpanProcesor) ForceFlush(context.Context) error {
return nil
}

func TestShutdownTraceProvider(t *testing.T) {
stp := NewTracerProvider()
Expand All @@ -51,7 +53,6 @@ func TestShutdownTraceProvider(t *testing.T) {
}

func TestFailedProcessorShutdown(t *testing.T) {
handler.Reset()
stp := NewTracerProvider()
spErr := errors.New("basic span processor shutdown failure")
sp := &basicSpanProcesor{
Expand All @@ -60,9 +61,9 @@ func TestFailedProcessorShutdown(t *testing.T) {
}
stp.RegisterSpanProcessor(sp)

_ = stp.Shutdown(context.Background())

assert.Contains(t, handler.errs, spErr)
err := stp.Shutdown(context.Background())
assert.Error(t, err)
assert.Equal(t, err, spErr)
}

func TestFailedProcessorShutdownInUnregister(t *testing.T) {
Expand All @@ -78,7 +79,6 @@ func TestFailedProcessorShutdownInUnregister(t *testing.T) {

assert.Contains(t, handler.errs, spErr)

handler.errs = nil
_ = stp.Shutdown(context.Background())
assert.Empty(t, handler.errs)
err := stp.Shutdown(context.Background())
assert.NoError(t, err)
}
3 changes: 2 additions & 1 deletion sdk/trace/simple_span_processor.go
Original file line number Diff line number Diff line change
Expand Up @@ -76,5 +76,6 @@ func (ssp *simpleSpanProcessor) Shutdown(ctx context.Context) error {
}

// ForceFlush does nothing as there is no data to flush.
func (ssp *simpleSpanProcessor) ForceFlush() {
func (ssp *simpleSpanProcessor) ForceFlush(context.Context) error {
return nil
}
2 changes: 1 addition & 1 deletion sdk/trace/span_processor.go
Original file line number Diff line number Diff line change
Expand Up @@ -46,7 +46,7 @@ type SpanProcessor interface {
// been exported. It should only be called when absolutely necessary, such as when
// using a FaaS provider that may suspend the process after an invocation, but before
// the Processor can export the completed spans.
ForceFlush()
ForceFlush(ctx context.Context) error
}

type spanProcessorState struct {
Expand Down
8 changes: 5 additions & 3 deletions sdk/trace/span_processor_example_test.go
Original file line number Diff line number Diff line change
Expand Up @@ -36,8 +36,8 @@ type DurationFilter struct {
func (f DurationFilter) OnStart(parent context.Context, s ReadWriteSpan) {
f.Next.OnStart(parent, s)
}
func (f DurationFilter) Shutdown(ctx context.Context) error { return f.Next.Shutdown(ctx) }
func (f DurationFilter) ForceFlush() { f.Next.ForceFlush() }
func (f DurationFilter) Shutdown(ctx context.Context) error { return f.Next.Shutdown(ctx) }
func (f DurationFilter) ForceFlush(ctx context.Context) error { return f.Next.ForceFlush(ctx) }
func (f DurationFilter) OnEnd(s ReadOnlySpan) {
if f.Min > 0 && s.EndTime().Sub(s.StartTime()) < f.Min {
// Drop short lived spans.
Expand Down Expand Up @@ -65,7 +65,9 @@ func (f InstrumentationBlacklist) OnStart(parent context.Context, s ReadWriteSpa
f.Next.OnStart(parent, s)
}
func (f InstrumentationBlacklist) Shutdown(ctx context.Context) error { return f.Next.Shutdown(ctx) }
func (f InstrumentationBlacklist) ForceFlush() { f.Next.ForceFlush() }
func (f InstrumentationBlacklist) ForceFlush(ctx context.Context) error {
return f.Next.ForceFlush(ctx)
}
func (f InstrumentationBlacklist) OnEnd(s ReadOnlySpan) {
if f.Blacklist != nil && f.Blacklist[s.InstrumentationLibrary().Name] {
// Drop spans from this instrumentation
Expand Down
3 changes: 2 additions & 1 deletion sdk/trace/span_processor_test.go
Original file line number Diff line number Diff line change
Expand Up @@ -63,7 +63,8 @@ func (t *testSpanProcessor) Shutdown(_ context.Context) error {
return nil
}

func (t *testSpanProcessor) ForceFlush() {
func (t *testSpanProcessor) ForceFlush(context.Context) error {
return nil
}

func TestRegisterSpanProcessor(t *testing.T) {
Expand Down

0 comments on commit 3dc91f2

Please sign in to comment.