Skip to content

Fix tracing.NewRandomRatioBased panic #5044

New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Merged
merged 5 commits into from
Dec 15, 2022
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
1 change: 1 addition & 0 deletions CHANGELOG.md
Original file line number Diff line number Diff line change
Expand Up @@ -16,6 +16,7 @@
* [FEATURE] Query Frontend/Scheduler: Add a new counter metric `cortex_request_queue_requests_total` for total requests going to queue. #5030
* [FEATURE] Build ARM docker images. #5041
* [BUGFIX] Updated `golang.org/x/net` dependency to fix CVE-2022-27664. #5008
* [BUGFIX] Fix panic when otel and xray tracing is enabled. #5044

## 1.14.0 2022-12-02

Expand Down
32 changes: 18 additions & 14 deletions pkg/tracing/sampler/sampling.go
Original file line number Diff line number Diff line change
@@ -1,39 +1,43 @@
package sampler

import (
"encoding/binary"
"fmt"
"math"

sdktrace "go.opentelemetry.io/otel/sdk/trace"
"go.opentelemetry.io/otel/trace"
)

type randGenerator interface {
Float64() float64
}

type RandomRatioBased struct {
type xrayTraceIDRatioBased struct {
sdktrace.Sampler
rnd randGenerator
fraction float64
max uint64
}

// NewRandomRatioBased creates a sampler based on random number.
// NewXrayTraceIDRatioBased creates a sampler based on random number.
// fraction parameter should be between 0 and 1 where:
// fraction >= 1 it will always sample
// fraction <= 0 it will never sample
func NewRandomRatioBased(fraction float64, rnd randGenerator) sdktrace.Sampler {
func NewXrayTraceIDRatioBased(fraction float64) sdktrace.Sampler {
if fraction >= 1 {
return sdktrace.AlwaysSample()
} else if fraction <= 0 {
return sdktrace.NeverSample()
}

return &RandomRatioBased{rnd: rnd, fraction: fraction}
return &xrayTraceIDRatioBased{max: uint64(fraction * math.MaxUint64)}
}

func (s *RandomRatioBased) ShouldSample(p sdktrace.SamplingParameters) sdktrace.SamplingResult {
func (s *xrayTraceIDRatioBased) ShouldSample(p sdktrace.SamplingParameters) sdktrace.SamplingResult {
// The default otel sampler pick the first 8 bytes to make the sampling decision and this is a problem to
// xray case as the first 4 bytes on the xray traceId is the time of the original request and the random part are
// the 12 last bytes, and so, this sampler pick the last 8 bytes to make the sampling decision.
// Xray Trace format: https://docs.aws.amazon.com/xray/latest/devguide/xray-api-sendingdata.html
// Xray Id Generator: https://github.com/open-telemetry/opentelemetry-go-contrib/blob/54f0bc5c0fd347cd6db9b7bc14c9f0c00dfcb36b/propagators/aws/xray/idgenerator.go#L58-L63
// Ref: https://github.com/open-telemetry/opentelemetry-go/blob/7a60bc785d669fa6ad26ba70e88151d4df631d90/sdk/trace/sampling.go#L82-L95
val := binary.BigEndian.Uint64(p.TraceID[8:16])
psc := trace.SpanContextFromContext(p.ParentContext)
shouldSample := s.rnd.Float64() < s.fraction
shouldSample := val < s.max
if shouldSample {
return sdktrace.SamplingResult{
Decision: sdktrace.RecordAndSample,
Expand All @@ -46,6 +50,6 @@ func (s *RandomRatioBased) ShouldSample(p sdktrace.SamplingParameters) sdktrace.
}
}

func (s *RandomRatioBased) Description() string {
return fmt.Sprintf("RandomRatioBased{%g}", s.fraction)
func (s *xrayTraceIDRatioBased) Description() string {
return fmt.Sprintf("xrayTraceIDRatioBased{%v}", s.max)
}
64 changes: 29 additions & 35 deletions pkg/tracing/sampler/sampling_test.go
Original file line number Diff line number Diff line change
Expand Up @@ -2,78 +2,72 @@ package sampler

import (
"context"
"math/rand"
"testing"

"github.com/stretchr/testify/require"
"go.opentelemetry.io/contrib/propagators/aws/xray"
sdktrace "go.opentelemetry.io/otel/sdk/trace"
"go.opentelemetry.io/otel/trace"
)

type mockGenerator struct {
mockedValue float64
}

func (g *mockGenerator) Float64() float64 {
return g.mockedValue
}

func Test_ShouldSample(t *testing.T) {
traceID, _ := trace.TraceIDFromHex("4bf92f3577b34da6a3ce929d0e0e4736")
parentCtx := trace.ContextWithSpanContext(
context.Background(),
trace.NewSpanContext(trace.SpanContextConfig{
TraceState: trace.TraceState{},
}),
)

generator := xray.NewIDGenerator()

tests := []struct {
name string
samplingDecision sdktrace.SamplingDecision
fraction float64
generator randGenerator
name string
fraction float64
}{
{
name: "should always sample",
samplingDecision: sdktrace.RecordAndSample,
fraction: 1,
generator: rand.New(rand.NewSource(rand.Int63())),
name: "should always sample",
fraction: 1,
},
{
name: "should nerver sample",
samplingDecision: sdktrace.Drop,
fraction: 0,
generator: rand.New(rand.NewSource(rand.Int63())),
name: "should nerver sample",
fraction: 0,
},
{
name: "should sample when fraction is above generated",
samplingDecision: sdktrace.RecordAndSample,
fraction: 0.5,
generator: &mockGenerator{0.2},
name: "should sample 50%",
fraction: 0.5,
},
{
name: "should not sample when fraction is not above generated",
samplingDecision: sdktrace.Drop,
fraction: 0.5,
generator: &mockGenerator{0.8},
name: "should sample 10%",
fraction: 0.1,
},
{
name: "should sample 1%",
fraction: 0.01,
},
}

totalIterations := 10000
for _, tt := range tests {
t.Run(tt.name, func(t *testing.T) {
s := NewRandomRatioBased(tt.fraction, tt.generator)
for i := 0; i < 100; i++ {

totalSampled := 0
s := NewXrayTraceIDRatioBased(tt.fraction)
for i := 0; i < totalIterations; i++ {
traceID, _ := generator.NewIDs(context.Background())
r := s.ShouldSample(
sdktrace.SamplingParameters{
ParentContext: parentCtx,
TraceID: traceID,
Name: "test",
Kind: trace.SpanKindServer,
})

require.Equal(t, tt.samplingDecision, r.Decision)
if r.Decision == sdktrace.RecordAndSample {
totalSampled++
}
}

tolerance := 0.1
expected := tt.fraction * float64(totalIterations)
require.InDelta(t, expected, totalSampled, expected*tolerance)
})
}
}
17 changes: 8 additions & 9 deletions pkg/tracing/tracing.go
Original file line number Diff line number Diff line change
Expand Up @@ -4,17 +4,15 @@ import (
"context"
"flag"
"fmt"
"math/rand"
"strings"
"time"

"github.com/go-kit/log/level"
"github.com/pkg/errors"
"github.com/weaveworks/common/tracing"
"go.opentelemetry.io/contrib/propagators/aws/xray"
"google.golang.org/grpc/credentials"

"github.com/opentracing/opentracing-go"
"go.opentelemetry.io/contrib/propagators/aws/xray"
"go.opentelemetry.io/otel"
"go.opentelemetry.io/otel/exporters/otlp/otlptrace"
"go.opentelemetry.io/otel/exporters/otlp/otlptrace/otlptracegrpc"
Expand Down Expand Up @@ -110,10 +108,10 @@ func SetupTracing(ctx context.Context, name string, c Config) (func(context.Cont
return nil, fmt.Errorf("creating tracing resource: %w", err)
}

tracerProvider := newTraceProvider(r, c, exporter)
propagator, tracerProvider := newTraceProvider(r, c, exporter)

bridge, wrappedProvider := migration.NewCortexBridgeTracerWrapper(tracerProvider.Tracer("github.com/cortexproject/cortex/cmd/cortex"))
bridge.SetTextMapPropagator(propagation.TraceContext{})
bridge.SetTextMapPropagator(propagator)
opentracing.SetGlobalTracer(bridge)
otel.SetTracerProvider(wrappedProvider)

Expand All @@ -125,21 +123,22 @@ func SetupTracing(ctx context.Context, name string, c Config) (func(context.Cont
}, nil
}

func newTraceProvider(r *resource.Resource, c Config, exporter *otlptrace.Exporter) *sdktrace.TracerProvider {
func newTraceProvider(r *resource.Resource, c Config, exporter *otlptrace.Exporter) (propagation.TextMapPropagator, *sdktrace.TracerProvider) {
options := []sdktrace.TracerProviderOption{
sdktrace.WithBatcher(exporter),
sdktrace.WithResource(r),
}

var propagator propagation.TextMapPropagator = propagation.TraceContext{}
switch strings.ToLower(c.Otel.ExporterType) {
case "awsxray":
options = append(options, sdktrace.WithIDGenerator(xray.NewIDGenerator()))
options = append(options, sdktrace.WithSampler(sdktrace.ParentBased(sampler.NewRandomRatioBased(c.Otel.SampleRatio, rand.New(rand.NewSource(time.Now().Unix()))))))
options = append(options, sdktrace.WithSampler(sdktrace.ParentBased(sampler.NewXrayTraceIDRatioBased(c.Otel.SampleRatio))))
propagator = xray.Propagator{}
default:
options = append(options, sdktrace.WithSampler(sdktrace.ParentBased(sdktrace.TraceIDRatioBased(c.Otel.SampleRatio))))
}

return sdktrace.NewTracerProvider(options...)
return propagator, sdktrace.NewTracerProvider(options...)
}

func newResource(ctx context.Context, target string, detectors []resource.Detector) (*resource.Resource, error) {
Expand Down