From 5aea9be7e5047f7e4fe2ced934c3624509d2553e Mon Sep 17 00:00:00 2001 From: Stanley Liu Date: Thu, 2 May 2024 16:31:38 -0400 Subject: [PATCH 1/7] Add new config option --- .chloggen/stanley.liu_top-level-change.yaml | 28 +++++++++++++++++++ connector/datadogconnector/config.go | 8 ++++++ connector/datadogconnector/connector.go | 3 ++ .../datadogconnector/examples/config.yaml | 9 ++++++ exporter/datadogexporter/config.go | 8 ++++++ .../datadogexporter/examples/collector.yaml | 10 +++++++ exporter/datadogexporter/traces_exporter.go | 3 ++ 7 files changed, 69 insertions(+) create mode 100644 .chloggen/stanley.liu_top-level-change.yaml diff --git a/.chloggen/stanley.liu_top-level-change.yaml b/.chloggen/stanley.liu_top-level-change.yaml new file mode 100644 index 000000000000..48e3dc33f01c --- /dev/null +++ b/.chloggen/stanley.liu_top-level-change.yaml @@ -0,0 +1,28 @@ +# Use this changelog template to create an entry for release notes. + +# One of 'breaking', 'deprecation', 'new_component', 'enhancement', 'bug_fix' +change_type: enhancement + +# The name of the component, or a single word describing the area of concern, (e.g. filelogreceiver) +component: exporter/datadog + +# A brief description of the change. Surround your text with quotes ("") if it needs to start with a backtick (`). +note: The Datadog exporter now has a config option to identify top-level spans by span kind. This new logic can be enabled by setting `traces.compute_top_level_by_span_kind` to true in the Datadog exporter config. + +# Mandatory: One or more tracking issues related to the change. You can use the PR number here if no issue exists. +issues: [32005] + +# (Optional) One or more lines of additional information to render under the primary note. +# These lines will be padded with 2 spaces and then inserted directly into the document. +# Use pipe (|) for multiline entries. +subtext: | + With this new logic, root spans and spans with a server or consumer `span.kind` will be marked as top-level. Additionally, spans with a client or producer `span.kind` will have stats computed. + Enabling this feature flag may increase the number of spans that generate trace metrics, and may change which spans appear as top-level in Datadog. +# If your change doesn't affect end users or the exported elements of any package, +# you should instead start your pull request title with [chore] or use the "Skip Changelog" label. +# Optional: The change log or logs in which this entry should be included. +# e.g. '[user]' or '[user, api]' +# Include 'user' if the change is relevant to end users. +# Include 'api' if there is a change to a library API. +# Default: '[user]' +change_logs: [] \ No newline at end of file diff --git a/connector/datadogconnector/config.go b/connector/datadogconnector/config.go index 1382f09c5740..d66961bbf1d0 100644 --- a/connector/datadogconnector/config.go +++ b/connector/datadogconnector/config.go @@ -42,8 +42,16 @@ type TracesConfig struct { // If set to true, enables an additional stats computation check on spans to see they have an eligible `span.kind` (server, consumer, client, producer). // If enabled, a span with an eligible `span.kind` will have stats computed. If disabled, only top-level and measured spans will have stats computed. // NOTE: For stats computed from OTel traces, only top-level spans are considered when this option is off. + // If you are sending OTel traces and want stats on non-top-level spans, this flag will need to be enabled. + // If you are sending OTel traces and do not want stats computed by span kind, you need to disable this flag and disable `compute_top_level_by_span_kind`. ComputeStatsBySpanKind bool `mapstructure:"compute_stats_by_span_kind"` + // If set to true, root spans and spans with a server or consumer `span.kind` will be marked as top-level. + // Additionally, spans with a client or producer `span.kind` will have stats computed. + // Enabling this config option may increase the number of spans that generate trace metrics, and may change which spans appear as top-level in Datadog. + // The default value is `false`. + ComputeTopLevelBySpanKind bool `mapstructure:"compute_top_level_by_span_kind"` + // If set to true, enables aggregation of peer related tags (e.g., `peer.service`, `db.instance`, etc.) in the datadog connector. // If disabled, aggregated trace stats will not include these tags as dimensions on trace metrics. // For the best experience with peer tags, Datadog also recommends enabling `compute_stats_by_span_kind`. diff --git a/connector/datadogconnector/connector.go b/connector/datadogconnector/connector.go index 22f412e8856a..68fc807cb494 100644 --- a/connector/datadogconnector/connector.go +++ b/connector/datadogconnector/connector.go @@ -114,6 +114,9 @@ func getTraceAgentCfg(cfg TracesConfig, attributesTranslator *attributes.Transla if v := cfg.TraceBuffer; v > 0 { acfg.TraceBuffer = v } + if cfg.ComputeTopLevelBySpanKind { + acfg.Features["enable_otlp_compute_top_level_by_span_kind"] = struct{}{} + } return acfg } diff --git a/connector/datadogconnector/examples/config.yaml b/connector/datadogconnector/examples/config.yaml index 5d6f03374b67..d01c9b65ce25 100644 --- a/connector/datadogconnector/examples/config.yaml +++ b/connector/datadogconnector/examples/config.yaml @@ -41,7 +41,16 @@ connectors: ## If enabled, a span with an eligible `span.kind` will have stats computed. If disabled, only top-level and measured spans will have stats computed. ## NOTE: For stats computed from OTel traces, only top-level spans are considered when this option is off. # + ## If you are sending OTel traces and want stats on non-top-level spans, this flag will need to be enabled. + ## If you are sending OTel traces and do not want stats computed by span kind, you need to disable this flag and disable `compute_top_level_by_span_kind`. + # compute_stats_by_span_kind: true + ## @param compute_top_level_by_span_kind - enables top-level span identification based on `span.kind` - optional + ## If set to true, root spans and spans with a server or consumer `span.kind` will be marked as top-level. + ## Additionally, spans with a client or producer `span.kind` will have stats computed. + ## Enabling this config option may increase the number of spans that generate trace metrics, and may change which spans appear as top-level in Datadog. + # + compute_top_level_by_span_kind: false ## @param peer_tags_aggregation - enables aggregation of peer related tags in Datadog exporter - optional ## If set to true, enables aggregation of peer related tags (e.g., `peer.service`, `db.instance`, etc.) in Datadog exporter. ## If disabled, aggregated trace stats will not include these tags as dimensions on trace metrics. diff --git a/exporter/datadogexporter/config.go b/exporter/datadogexporter/config.go index 9ebd11698016..0e9a28803646 100644 --- a/exporter/datadogexporter/config.go +++ b/exporter/datadogexporter/config.go @@ -273,8 +273,16 @@ type TracesConfig struct { // If set to true, enables an additional stats computation check on spans to see they have an eligible `span.kind` (server, consumer, client, producer). // If enabled, a span with an eligible `span.kind` will have stats computed. If disabled, only top-level and measured spans will have stats computed. // NOTE: For stats computed from OTel traces, only top-level spans are considered when this option is off. + // If you are sending OTel traces and want stats on non-top-level spans, this flag will need to be enabled. + // If you are sending OTel traces and do not want stats computed by span kind, you need to disable this flag and disable `compute_top_level_by_span_kind`. ComputeStatsBySpanKind bool `mapstructure:"compute_stats_by_span_kind"` + // If set to true, root spans and spans with a server or consumer `span.kind` will be marked as top-level. + // Additionally, spans with a client or producer `span.kind` will have stats computed. + // Enabling this config option may increase the number of spans that generate trace metrics, and may change which spans appear as top-level in Datadog. + // The default value is `false`. + ComputeTopLevelBySpanKind bool `mapstructure:"compute_top_level_by_span_kind"` + // If set to true, enables `peer.service` aggregation in the exporter. If disabled, aggregated trace stats will not include `peer.service` as a dimension. // For the best experience with `peer.service`, it is recommended to also enable `compute_stats_by_span_kind`. // If enabling both causes the datadog exporter to consume too many resources, try disabling `compute_stats_by_span_kind` first. diff --git a/exporter/datadogexporter/examples/collector.yaml b/exporter/datadogexporter/examples/collector.yaml index ec0ae11ae1bb..e1410d479b6b 100644 --- a/exporter/datadogexporter/examples/collector.yaml +++ b/exporter/datadogexporter/examples/collector.yaml @@ -357,7 +357,17 @@ exporters: ## If enabled, a span with an eligible `span.kind` will have stats computed. If disabled, only top-level and measured spans will have stats computed. ## NOTE: For stats computed from OTel traces, only top-level spans are considered when this option is off. # + ## If you are sending OTel traces and want stats on non-top-level spans, this flag will need to be enabled. + ## If you are sending OTel traces and do not want stats computed by span kind, you need to disable this flag and disable `compute_top_level_by_span_kind`. + # # compute_stats_by_span_kind: true + + ## @param compute_top_level_by_span_kind - enables top-level span identification based on `span.kind` - optional + ## If set to true, root spans and spans with a server or consumer `span.kind` will be marked as top-level. + ## Additionally, spans with a client or producer `span.kind` will have stats computed. + ## Enabling this config option may increase the number of spans that generate trace metrics, and may change which spans appear as top-level in Datadog. + # + # compute_top_level_by_span_kind: false ## @param peer_service_aggregation - enables `peer.service` aggregation on trace stats in Datadog exporter - optional ## If set to true, enables `peer.service` aggregation in the exporter. If disabled, aggregated trace stats will not include `peer.service` as a dimension. diff --git a/exporter/datadogexporter/traces_exporter.go b/exporter/datadogexporter/traces_exporter.go index 8b0e4dc4cb91..640e22b0b1be 100644 --- a/exporter/datadogexporter/traces_exporter.go +++ b/exporter/datadogexporter/traces_exporter.go @@ -219,6 +219,9 @@ func newTraceAgentConfig(ctx context.Context, params exporter.CreateSettings, cf if addr := cfg.Traces.Endpoint; addr != "" { acfg.Endpoints[0].Host = addr } + if cfg.Traces.ComputeTopLevelBySpanKind { + acfg.Features["enable_otlp_compute_top_level_by_span_kind"] = struct{}{} + } tracelog.SetLogger(&zaplogger{params.Logger}) //TODO: This shouldn't be a singleton return acfg, nil } From da5e594e32cc766d5cfeb84da581231db5978367 Mon Sep 17 00:00:00 2001 From: Stanley Liu Date: Thu, 2 May 2024 17:01:52 -0400 Subject: [PATCH 2/7] Add integration test --- .../integrationtest/integration_test.go | 265 ++++++++++++++++++ 1 file changed, 265 insertions(+) diff --git a/exporter/datadogexporter/integrationtest/integration_test.go b/exporter/datadogexporter/integrationtest/integration_test.go index ab51f52f7e01..a5bcbf2994ac 100644 --- a/exporter/datadogexporter/integrationtest/integration_test.go +++ b/exporter/datadogexporter/integrationtest/integration_test.go @@ -304,3 +304,268 @@ func getGzipReader(t *testing.T, reqBytes []byte) io.Reader { require.NoError(t, err) return reader } + +func getIntegrationComputeTopLevelBySpanKindTestCollector(t *testing.T, url string, factories otelcol.Factories) (*otelcol.Collector, string) { + cfg := fmt.Sprintf(` +receivers: + otlp: + protocols: + http: + endpoint: "localhost:4318" + grpc: + endpoint: "localhost:4317" + +processors: + batch: + send_batch_size: 10 + timeout: 5s + tail_sampling: + decision_wait: 1s + policies: [ + { + name: sample_flag, + type: boolean_attribute, + boolean_attribute: { key: sampled, value: true }, + } + ] + +connectors: + datadog/connector: + traces: + compute_top_level_by_span_kind: true + peer_tags_aggregation: true + peer_tags: ["extra_peer_tag"] + +exporters: + debug: + verbosity: detailed + datadog: + api: + key: "key" + tls: + insecure_skip_verify: true + host_metadata: + enabled: false + traces: + endpoint: %q + trace_buffer: 10 + compute_top_level_by_span_kind: true + metrics: + endpoint: %q + +service: + telemetry: + metrics: + level: none + pipelines: + traces: + receivers: [otlp] + processors: [batch] + exporters: [datadog/connector] + traces/2: # this pipeline uses sampling + receivers: [datadog/connector] + processors: [tail_sampling, batch] + exporters: [datadog, debug] + metrics: + receivers: [datadog/connector] + processors: [batch] + exporters: [datadog, debug]`, url, url) + + confFile, err := os.CreateTemp(os.TempDir(), "conf-") + require.NoError(t, err) + _, err = confFile.Write([]byte(cfg)) + require.NoError(t, err) + _, err = otelcoltest.LoadConfigAndValidate(confFile.Name(), factories) + require.NoError(t, err, "All yaml config must be valid.") + + fmp := fileprovider.NewFactory().Create(confmap.ProviderSettings{}) + configProvider, err := otelcol.NewConfigProvider( + otelcol.ConfigProviderSettings{ + ResolverSettings: confmap.ResolverSettings{ + URIs: []string{confFile.Name()}, + Providers: map[string]confmap.Provider{fmp.Scheme(): fmp}, + }, + }) + require.NoError(t, err) + + appSettings := otelcol.CollectorSettings{ + Factories: func() (otelcol.Factories, error) { return factories, nil }, + ConfigProvider: configProvider, + BuildInfo: component.BuildInfo{ + Command: "otelcol", + Description: "OpenTelemetry Collector", + Version: "tests", + }, + } + + app, err := otelcol.NewCollector(appSettings) + require.NoError(t, err) + return app, confFile.Name() +} + +func TestIntegrationComputeTopLevelBySpanKind(t *testing.T) { + // 1. Set up mock Datadog server + // See also https://github.com/DataDog/datadog-agent/blob/49c16e0d4deab396626238fa1d572b684475a53f/cmd/trace-agent/test/backend.go + apmstatsRec := &testutil.HTTPRequestRecorderWithChan{Pattern: testutil.APMStatsEndpoint, ReqChan: make(chan []byte)} + tracesRec := &testutil.HTTPRequestRecorderWithChan{Pattern: testutil.TraceEndpoint, ReqChan: make(chan []byte)} + server := testutil.DatadogServerMock(apmstatsRec.HandlerFunc, tracesRec.HandlerFunc) + defer server.Close() + + // 2. Start in-process collector + factories := getIntegrationTestComponents(t) + app, confFilePath := getIntegrationComputeTopLevelBySpanKindTestCollector(t, server.URL, factories) + go func() { + assert.NoError(t, app.Run(context.Background())) + }() + defer app.Shutdown() + defer os.Remove(confFilePath) + waitForReadiness(app) + + // 3. Generate and send traces + sendTracesComputeTopLevelBySpanKind(t) + + // 4. Validate traces and APM stats from the mock server + var spans []*pb.Span + var stats []*pb.ClientGroupedStats + var serverSpans, clientSpans, childClientSpans, consumerSpans, producerSpans, internalSpans int + + // 7 sampled spans + APM stats on 11 spans are sent to datadog exporter + for len(spans) < 7 || len(stats) < 11 { + select { + case tracesBytes := <-tracesRec.ReqChan: + gz := getGzipReader(t, tracesBytes) + slurp, err := io.ReadAll(gz) + require.NoError(t, err) + var traces pb.AgentPayload + require.NoError(t, proto.Unmarshal(slurp, &traces)) + for _, tps := range traces.TracerPayloads { + for _, chunks := range tps.Chunks { + spans = append(spans, chunks.Spans...) + } + } + + case apmstatsBytes := <-apmstatsRec.ReqChan: + gz := getGzipReader(t, apmstatsBytes) + var spl pb.StatsPayload + require.NoError(t, msgp.Decode(gz, &spl)) + for _, csps := range spl.Stats { + assert.Equal(t, "datadogexporter-otelcol-tests", spl.AgentVersion) + for _, csbs := range csps.Stats { + stats = append(stats, csbs.Stats...) + for i, stat := range csbs.Stats { + fmt.Printf("i: %v, stat.SpanKind: %v, stat.Hits: %v, stat.TopLevelHits: %v\n", i, stat.SpanKind, stat.Hits, stat.TopLevelHits) + switch stat.SpanKind { + case apitrace.SpanKindInternal.String(): + assert.True(t, strings.HasPrefix(stat.Resource, "TestSpan") || strings.HasPrefix(stat.Resource, "TestChildSpan")) + internalSpans++ + case apitrace.SpanKindServer.String(): + assert.True(t, strings.HasPrefix(stat.Resource, "TestSpan")) + serverSpans++ + case apitrace.SpanKindClient.String(): + assert.True(t, strings.HasPrefix(stat.Resource, "TestSpan") || strings.HasPrefix(stat.Resource, "TestChildSpan")) + if strings.HasPrefix(stat.Resource, "TestSpan") { + clientSpans++ + } + if strings.HasPrefix(stat.Resource, "TestChildSpan") { + childClientSpans++ + assert.Equal(t, uint64(1), stat.Hits) + assert.Equal(t, uint64(0), stat.TopLevelHits) + } + case apitrace.SpanKindProducer.String(): + assert.True(t, strings.HasPrefix(stat.Resource, "TestSpan")) + producerSpans++ + case apitrace.SpanKindConsumer.String(): + assert.True(t, strings.HasPrefix(stat.Resource, "TestSpan")) + consumerSpans++ + } + if !strings.HasPrefix(stat.Resource, "TestChildSpan") { + assert.Equal(t, uint64(1), stat.Hits) + assert.Equal(t, uint64(1), stat.TopLevelHits) + } + } + } + } + } + } + + // Verify we don't receive more than the expected numbers + assert.Equal(t, 2, serverSpans) + assert.Equal(t, 2, clientSpans) + assert.Equal(t, 1, childClientSpans) + assert.Equal(t, 2, consumerSpans) + assert.Equal(t, 2, producerSpans) + assert.Equal(t, 2, internalSpans) + assert.Len(t, spans, 7) + assert.Len(t, stats, 11) + + for _, span := range spans { + fmt.Printf("span.Name: %v, span.Meta: %v\n", span.Name, span.Meta) + } +} + +func sendTracesComputeTopLevelBySpanKind(t *testing.T) { + ctx := context.Background() + + // Set up OTel-Go SDK and exporter + traceExporter, err := otlptracegrpc.New(ctx, otlptracegrpc.WithInsecure()) + require.NoError(t, err) + bsp := sdktrace.NewBatchSpanProcessor(traceExporter) + r1, _ := resource.New(ctx, resource.WithAttributes(attribute.String("k8s.node.name", "aaaa"))) + r2, _ := resource.New(ctx, resource.WithAttributes(attribute.String("k8s.node.name", "bbbb"))) + tracerProvider := sdktrace.NewTracerProvider( + sdktrace.WithSampler(sdktrace.AlwaysSample()), + sdktrace.WithSpanProcessor(bsp), + sdktrace.WithResource(r1), + ) + tracerProvider2 := sdktrace.NewTracerProvider( + sdktrace.WithSampler(sdktrace.AlwaysSample()), + sdktrace.WithSpanProcessor(bsp), + sdktrace.WithResource(r2), + ) + otel.SetTracerProvider(tracerProvider) + defer func() { + require.NoError(t, tracerProvider.Shutdown(ctx)) + require.NoError(t, tracerProvider2.Shutdown(ctx)) + }() + + tracer := otel.Tracer("test-tracer") + for i := 0; i < 10; i++ { + var spanKind apitrace.SpanKind + switch i { + case 0, 1: + spanKind = apitrace.SpanKindConsumer + case 2, 3: + spanKind = apitrace.SpanKindServer + case 4, 5: + spanKind = apitrace.SpanKindClient + case 6, 7: + spanKind = apitrace.SpanKindProducer + case 8, 9: + spanKind = apitrace.SpanKindInternal + } + ctx, span := tracer.Start(ctx, fmt.Sprintf("TestSpan%d", i), apitrace.WithSpanKind(spanKind)) + + if i == 3 { + // Send some traces from a different resource + // This verifies that stats from different hosts don't accidentally create extraneous empty stats buckets + otel.SetTracerProvider(tracerProvider2) + tracer = otel.Tracer("test-tracer2") + } + if i == 4 { + _, childInternalSpan := tracer.Start(ctx, fmt.Sprintf("TestChildSpan%d", i), apitrace.WithSpanKind(apitrace.SpanKindInternal)) + _, childClientSpan := tracer.Start(ctx, fmt.Sprintf("TestChildSpan%d", i), apitrace.WithSpanKind(apitrace.SpanKindClient)) + childInternalSpan.SetAttributes(attribute.String("peer.service", "svc")) + childInternalSpan.SetAttributes(attribute.String("extra_peer_tag", "tag_val")) + childClientSpan.SetAttributes(attribute.String("peer.service", "svc")) + childClientSpan.SetAttributes(attribute.String("extra_peer_tag", "tag_val")) + childInternalSpan.End() + childClientSpan.End() + } + // Only sample 5 out of the 10 spans + if i < 5 { + span.SetAttributes(attribute.Bool("sampled", true)) + } + span.End() + } + time.Sleep(1 * time.Second) +} From d7d84eabb92f49f046f53a2b9c19ddf8df4aabda Mon Sep 17 00:00:00 2001 From: Stanley Liu Date: Thu, 2 May 2024 17:04:51 -0400 Subject: [PATCH 3/7] Update changelog --- ...tanley.liu_top-level-change-connector.yaml | 28 +++++++++++++++++++ .chloggen/stanley.liu_top-level-change.yaml | 2 +- 2 files changed, 29 insertions(+), 1 deletion(-) create mode 100644 .chloggen/stanley.liu_top-level-change-connector.yaml diff --git a/.chloggen/stanley.liu_top-level-change-connector.yaml b/.chloggen/stanley.liu_top-level-change-connector.yaml new file mode 100644 index 000000000000..2f27444f21d0 --- /dev/null +++ b/.chloggen/stanley.liu_top-level-change-connector.yaml @@ -0,0 +1,28 @@ +# Use this changelog template to create an entry for release notes. + +# One of 'breaking', 'deprecation', 'new_component', 'enhancement', 'bug_fix' +change_type: enhancement + +# The name of the component, or a single word describing the area of concern, (e.g. filelogreceiver) +component: connector/datadog + +# A brief description of the change. Surround your text with quotes ("") if it needs to start with a backtick (`). +note: The Datadog connector now has a config option to identify top-level spans by span kind. This new logic can be enabled by setting `traces::compute_top_level_by_span_kind` to true in the Datadog connector config. + +# Mandatory: One or more tracking issues related to the change. You can use the PR number here if no issue exists. +issues: [32005] + +# (Optional) One or more lines of additional information to render under the primary note. +# These lines will be padded with 2 spaces and then inserted directly into the document. +# Use pipe (|) for multiline entries. +subtext: | + With this new logic, root spans and spans with a server or consumer `span.kind` will be marked as top-level. Additionally, spans with a client or producer `span.kind` will have stats computed. + Enabling this feature flag may increase the number of spans that generate trace metrics, and may change which spans appear as top-level in Datadog. +# If your change doesn't affect end users or the exported elements of any package, +# you should instead start your pull request title with [chore] or use the "Skip Changelog" label. +# Optional: The change log or logs in which this entry should be included. +# e.g. '[user]' or '[user, api]' +# Include 'user' if the change is relevant to end users. +# Include 'api' if there is a change to a library API. +# Default: '[user]' +change_logs: [] \ No newline at end of file diff --git a/.chloggen/stanley.liu_top-level-change.yaml b/.chloggen/stanley.liu_top-level-change.yaml index 48e3dc33f01c..4bf2ec146aa3 100644 --- a/.chloggen/stanley.liu_top-level-change.yaml +++ b/.chloggen/stanley.liu_top-level-change.yaml @@ -7,7 +7,7 @@ change_type: enhancement component: exporter/datadog # A brief description of the change. Surround your text with quotes ("") if it needs to start with a backtick (`). -note: The Datadog exporter now has a config option to identify top-level spans by span kind. This new logic can be enabled by setting `traces.compute_top_level_by_span_kind` to true in the Datadog exporter config. +note: The Datadog exporter now has a config option to identify top-level spans by span kind. This new logic can be enabled by setting `traces::compute_top_level_by_span_kind` to true in the Datadog exporter config. # Mandatory: One or more tracking issues related to the change. You can use the PR number here if no issue exists. issues: [32005] From 8963a0f4e2139af63e6421906b0e87c152cd6f2e Mon Sep 17 00:00:00 2001 From: Stanley Liu Date: Thu, 2 May 2024 17:11:28 -0400 Subject: [PATCH 4/7] Fix lint --- exporter/datadogexporter/integrationtest/integration_test.go | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/exporter/datadogexporter/integrationtest/integration_test.go b/exporter/datadogexporter/integrationtest/integration_test.go index a5bcbf2994ac..11857d79c763 100644 --- a/exporter/datadogexporter/integrationtest/integration_test.go +++ b/exporter/datadogexporter/integrationtest/integration_test.go @@ -543,7 +543,8 @@ func sendTracesComputeTopLevelBySpanKind(t *testing.T) { case 8, 9: spanKind = apitrace.SpanKindInternal } - ctx, span := tracer.Start(ctx, fmt.Sprintf("TestSpan%d", i), apitrace.WithSpanKind(spanKind)) + var span apitrace.Span + ctx, span = tracer.Start(ctx, fmt.Sprintf("TestSpan%d", i), apitrace.WithSpanKind(spanKind)) if i == 3 { // Send some traces from a different resource From 3bb323582402c8841d8fcbf97f20804be1b67e5c Mon Sep 17 00:00:00 2001 From: Stanley Liu Date: Fri, 3 May 2024 14:54:56 -0400 Subject: [PATCH 5/7] PR feedback --- ...tanley.liu_top-level-change-connector.yaml | 4 +- .chloggen/stanley.liu_top-level-change.yaml | 4 +- .../integrationtest/integration_test.go | 367 ++++++++---------- 3 files changed, 174 insertions(+), 201 deletions(-) diff --git a/.chloggen/stanley.liu_top-level-change-connector.yaml b/.chloggen/stanley.liu_top-level-change-connector.yaml index 2f27444f21d0..b0b5137ac6a3 100644 --- a/.chloggen/stanley.liu_top-level-change-connector.yaml +++ b/.chloggen/stanley.liu_top-level-change-connector.yaml @@ -7,7 +7,7 @@ change_type: enhancement component: connector/datadog # A brief description of the change. Surround your text with quotes ("") if it needs to start with a backtick (`). -note: The Datadog connector now has a config option to identify top-level spans by span kind. This new logic can be enabled by setting `traces::compute_top_level_by_span_kind` to true in the Datadog connector config. +note: The Datadog connector now has a config option to identify top-level spans by span kind. This new logic can be enabled by setting `traces::compute_top_level_by_span_kind` to true in the Datadog connector config. Default is false. # Mandatory: One or more tracking issues related to the change. You can use the PR number here if no issue exists. issues: [32005] @@ -17,7 +17,7 @@ issues: [32005] # Use pipe (|) for multiline entries. subtext: | With this new logic, root spans and spans with a server or consumer `span.kind` will be marked as top-level. Additionally, spans with a client or producer `span.kind` will have stats computed. - Enabling this feature flag may increase the number of spans that generate trace metrics, and may change which spans appear as top-level in Datadog. + Enabling this config option may increase the number of spans that generate trace metrics, and may change which spans appear as top-level in Datadog. # If your change doesn't affect end users or the exported elements of any package, # you should instead start your pull request title with [chore] or use the "Skip Changelog" label. # Optional: The change log or logs in which this entry should be included. diff --git a/.chloggen/stanley.liu_top-level-change.yaml b/.chloggen/stanley.liu_top-level-change.yaml index 4bf2ec146aa3..3a6a2c570107 100644 --- a/.chloggen/stanley.liu_top-level-change.yaml +++ b/.chloggen/stanley.liu_top-level-change.yaml @@ -7,7 +7,7 @@ change_type: enhancement component: exporter/datadog # A brief description of the change. Surround your text with quotes ("") if it needs to start with a backtick (`). -note: The Datadog exporter now has a config option to identify top-level spans by span kind. This new logic can be enabled by setting `traces::compute_top_level_by_span_kind` to true in the Datadog exporter config. +note: The Datadog exporter now has a config option to identify top-level spans by span kind. This new logic can be enabled by setting `traces::compute_top_level_by_span_kind` to true in the Datadog exporter config. Default is false. # Mandatory: One or more tracking issues related to the change. You can use the PR number here if no issue exists. issues: [32005] @@ -17,7 +17,7 @@ issues: [32005] # Use pipe (|) for multiline entries. subtext: | With this new logic, root spans and spans with a server or consumer `span.kind` will be marked as top-level. Additionally, spans with a client or producer `span.kind` will have stats computed. - Enabling this feature flag may increase the number of spans that generate trace metrics, and may change which spans appear as top-level in Datadog. + Enabling this config option may increase the number of spans that generate trace metrics, and may change which spans appear as top-level in Datadog. # If your change doesn't affect end users or the exported elements of any package, # you should instead start your pull request title with [chore] or use the "Skip Changelog" label. # Optional: The change log or logs in which this entry should be included. diff --git a/exporter/datadogexporter/integrationtest/integration_test.go b/exporter/datadogexporter/integrationtest/integration_test.go index 11857d79c763..3bb5ecaa44c9 100644 --- a/exporter/datadogexporter/integrationtest/integration_test.go +++ b/exporter/datadogexporter/integrationtest/integration_test.go @@ -44,6 +44,135 @@ import ( "github.com/open-telemetry/opentelemetry-collector-contrib/processor/tailsamplingprocessor" ) +const collectorConfig = ` +receivers: + otlp: + protocols: + http: + endpoint: "localhost:4318" + grpc: + endpoint: "localhost:4317" + +processors: + batch: + send_batch_size: 10 + timeout: 5s + tail_sampling: + decision_wait: 1s + policies: [ + { + name: sample_flag, + type: boolean_attribute, + boolean_attribute: { key: sampled, value: true }, + } + ] + +connectors: + datadog/connector: + traces: + compute_stats_by_span_kind: true + peer_tags_aggregation: true + peer_tags: ["extra_peer_tag"] + +exporters: + debug: + verbosity: detailed + datadog: + api: + key: "key" + tls: + insecure_skip_verify: true + host_metadata: + enabled: false + traces: + endpoint: %q + trace_buffer: 10 + metrics: + endpoint: %q + +service: + telemetry: + metrics: + level: none + pipelines: + traces: + receivers: [otlp] + processors: [batch] + exporters: [datadog/connector] + traces/2: # this pipeline uses sampling + receivers: [datadog/connector] + processors: [tail_sampling, batch] + exporters: [datadog, debug] + metrics: + receivers: [datadog/connector] + processors: [batch] + exporters: [datadog, debug]` + +const collectorConfigComputeTopLevelBySpanKind = ` +receivers: + otlp: + protocols: + http: + endpoint: "localhost:4318" + grpc: + endpoint: "localhost:4317" + +processors: + batch: + send_batch_size: 10 + timeout: 5s + tail_sampling: + decision_wait: 1s + policies: [ + { + name: sample_flag, + type: boolean_attribute, + boolean_attribute: { key: sampled, value: true }, + } + ] + +connectors: + datadog/connector: + traces: + compute_top_level_by_span_kind: true + peer_tags_aggregation: true + peer_tags: ["extra_peer_tag"] + +exporters: + debug: + verbosity: detailed + datadog: + api: + key: "key" + tls: + insecure_skip_verify: true + host_metadata: + enabled: false + traces: + endpoint: %q + trace_buffer: 10 + compute_top_level_by_span_kind: true + metrics: + endpoint: %q + +service: + telemetry: + metrics: + level: none + pipelines: + traces: + receivers: [otlp] + processors: [batch] + exporters: [datadog/connector] + traces/2: # this pipeline uses sampling + receivers: [datadog/connector] + processors: [tail_sampling, batch] + exporters: [datadog, debug] + metrics: + receivers: [datadog/connector] + processors: [batch] + exporters: [datadog, debug]` + func TestIntegration(t *testing.T) { // 1. Set up mock Datadog server // See also https://github.com/DataDog/datadog-agent/blob/49c16e0d4deab396626238fa1d572b684475a53f/cmd/trace-agent/test/backend.go @@ -54,7 +183,7 @@ func TestIntegration(t *testing.T) { // 2. Start in-process collector factories := getIntegrationTestComponents(t) - app, confFilePath := getIntegrationTestCollector(t, server.URL, factories) + app, confFilePath := getIntegrationTestCollector(t, collectorConfig, server.URL, factories) go func() { assert.NoError(t, app.Run(context.Background())) }() @@ -143,70 +272,8 @@ func getIntegrationTestComponents(t *testing.T) otelcol.Factories { return factories } -func getIntegrationTestCollector(t *testing.T, url string, factories otelcol.Factories) (*otelcol.Collector, string) { - cfg := fmt.Sprintf(` -receivers: - otlp: - protocols: - http: - endpoint: "localhost:4318" - grpc: - endpoint: "localhost:4317" - -processors: - batch: - send_batch_size: 10 - timeout: 5s - tail_sampling: - decision_wait: 1s - policies: [ - { - name: sample_flag, - type: boolean_attribute, - boolean_attribute: { key: sampled, value: true }, - } - ] - -connectors: - datadog/connector: - traces: - compute_stats_by_span_kind: true - peer_tags_aggregation: true - peer_tags: ["extra_peer_tag"] - -exporters: - debug: - verbosity: detailed - datadog: - api: - key: "key" - tls: - insecure_skip_verify: true - host_metadata: - enabled: false - traces: - endpoint: %q - trace_buffer: 10 - metrics: - endpoint: %q - -service: - telemetry: - metrics: - level: none - pipelines: - traces: - receivers: [otlp] - processors: [batch] - exporters: [datadog/connector] - traces/2: # this pipeline uses sampling - receivers: [datadog/connector] - processors: [tail_sampling, batch] - exporters: [datadog, debug] - metrics: - receivers: [datadog/connector] - processors: [batch] - exporters: [datadog, debug]`, url, url) +func getIntegrationTestCollector(t *testing.T, cfgStr string, url string, factories otelcol.Factories) (*otelcol.Collector, string) { + cfg := fmt.Sprintf(cfgStr, url, url) confFile, err := os.CreateTemp(os.TempDir(), "conf-") require.NoError(t, err) @@ -305,104 +372,6 @@ func getGzipReader(t *testing.T, reqBytes []byte) io.Reader { return reader } -func getIntegrationComputeTopLevelBySpanKindTestCollector(t *testing.T, url string, factories otelcol.Factories) (*otelcol.Collector, string) { - cfg := fmt.Sprintf(` -receivers: - otlp: - protocols: - http: - endpoint: "localhost:4318" - grpc: - endpoint: "localhost:4317" - -processors: - batch: - send_batch_size: 10 - timeout: 5s - tail_sampling: - decision_wait: 1s - policies: [ - { - name: sample_flag, - type: boolean_attribute, - boolean_attribute: { key: sampled, value: true }, - } - ] - -connectors: - datadog/connector: - traces: - compute_top_level_by_span_kind: true - peer_tags_aggregation: true - peer_tags: ["extra_peer_tag"] - -exporters: - debug: - verbosity: detailed - datadog: - api: - key: "key" - tls: - insecure_skip_verify: true - host_metadata: - enabled: false - traces: - endpoint: %q - trace_buffer: 10 - compute_top_level_by_span_kind: true - metrics: - endpoint: %q - -service: - telemetry: - metrics: - level: none - pipelines: - traces: - receivers: [otlp] - processors: [batch] - exporters: [datadog/connector] - traces/2: # this pipeline uses sampling - receivers: [datadog/connector] - processors: [tail_sampling, batch] - exporters: [datadog, debug] - metrics: - receivers: [datadog/connector] - processors: [batch] - exporters: [datadog, debug]`, url, url) - - confFile, err := os.CreateTemp(os.TempDir(), "conf-") - require.NoError(t, err) - _, err = confFile.Write([]byte(cfg)) - require.NoError(t, err) - _, err = otelcoltest.LoadConfigAndValidate(confFile.Name(), factories) - require.NoError(t, err, "All yaml config must be valid.") - - fmp := fileprovider.NewFactory().Create(confmap.ProviderSettings{}) - configProvider, err := otelcol.NewConfigProvider( - otelcol.ConfigProviderSettings{ - ResolverSettings: confmap.ResolverSettings{ - URIs: []string{confFile.Name()}, - Providers: map[string]confmap.Provider{fmp.Scheme(): fmp}, - }, - }) - require.NoError(t, err) - - appSettings := otelcol.CollectorSettings{ - Factories: func() (otelcol.Factories, error) { return factories, nil }, - ConfigProvider: configProvider, - BuildInfo: component.BuildInfo{ - Command: "otelcol", - Description: "OpenTelemetry Collector", - Version: "tests", - }, - } - - app, err := otelcol.NewCollector(appSettings) - require.NoError(t, err) - return app, confFile.Name() -} - func TestIntegrationComputeTopLevelBySpanKind(t *testing.T) { // 1. Set up mock Datadog server // See also https://github.com/DataDog/datadog-agent/blob/49c16e0d4deab396626238fa1d572b684475a53f/cmd/trace-agent/test/backend.go @@ -413,7 +382,7 @@ func TestIntegrationComputeTopLevelBySpanKind(t *testing.T) { // 2. Start in-process collector factories := getIntegrationTestComponents(t) - app, confFilePath := getIntegrationComputeTopLevelBySpanKindTestCollector(t, server.URL, factories) + app, confFilePath := getIntegrationTestCollector(t, collectorConfigComputeTopLevelBySpanKind, server.URL, factories) go func() { assert.NoError(t, app.Run(context.Background())) }() @@ -427,10 +396,10 @@ func TestIntegrationComputeTopLevelBySpanKind(t *testing.T) { // 4. Validate traces and APM stats from the mock server var spans []*pb.Span var stats []*pb.ClientGroupedStats - var serverSpans, clientSpans, childClientSpans, consumerSpans, producerSpans, internalSpans int + var serverSpans, clientSpans, consumerSpans, producerSpans, internalSpans int - // 7 sampled spans + APM stats on 11 spans are sent to datadog exporter - for len(spans) < 7 || len(stats) < 11 { + // 5 sampled spans + APM stats on 8 spans are sent to datadog exporter + for len(spans) < 5 || len(stats) < 8 { select { case tracesBytes := <-tracesRec.ReqChan: gz := getGzipReader(t, tracesBytes) @@ -453,35 +422,29 @@ func TestIntegrationComputeTopLevelBySpanKind(t *testing.T) { for _, csbs := range csps.Stats { stats = append(stats, csbs.Stats...) for i, stat := range csbs.Stats { + // TODO: remove fmt line fmt.Printf("i: %v, stat.SpanKind: %v, stat.Hits: %v, stat.TopLevelHits: %v\n", i, stat.SpanKind, stat.Hits, stat.TopLevelHits) switch stat.SpanKind { case apitrace.SpanKindInternal.String(): - assert.True(t, strings.HasPrefix(stat.Resource, "TestSpan") || strings.HasPrefix(stat.Resource, "TestChildSpan")) internalSpans++ case apitrace.SpanKindServer.String(): - assert.True(t, strings.HasPrefix(stat.Resource, "TestSpan")) + assert.Equal(t, uint64(1), stat.Hits) + assert.Equal(t, uint64(1), stat.TopLevelHits) serverSpans++ case apitrace.SpanKindClient.String(): - assert.True(t, strings.HasPrefix(stat.Resource, "TestSpan") || strings.HasPrefix(stat.Resource, "TestChildSpan")) - if strings.HasPrefix(stat.Resource, "TestSpan") { - clientSpans++ - } - if strings.HasPrefix(stat.Resource, "TestChildSpan") { - childClientSpans++ - assert.Equal(t, uint64(1), stat.Hits) - assert.Equal(t, uint64(0), stat.TopLevelHits) - } + assert.Equal(t, uint64(1), stat.Hits) + assert.Equal(t, uint64(0), stat.TopLevelHits) + clientSpans++ case apitrace.SpanKindProducer.String(): - assert.True(t, strings.HasPrefix(stat.Resource, "TestSpan")) + assert.Equal(t, uint64(1), stat.Hits) + assert.Equal(t, uint64(0), stat.TopLevelHits) producerSpans++ case apitrace.SpanKindConsumer.String(): - assert.True(t, strings.HasPrefix(stat.Resource, "TestSpan")) - consumerSpans++ - } - if !strings.HasPrefix(stat.Resource, "TestChildSpan") { assert.Equal(t, uint64(1), stat.Hits) assert.Equal(t, uint64(1), stat.TopLevelHits) + consumerSpans++ } + assert.True(t, strings.HasPrefix(stat.Resource, "TestSpan")) } } } @@ -491,15 +454,32 @@ func TestIntegrationComputeTopLevelBySpanKind(t *testing.T) { // Verify we don't receive more than the expected numbers assert.Equal(t, 2, serverSpans) assert.Equal(t, 2, clientSpans) - assert.Equal(t, 1, childClientSpans) assert.Equal(t, 2, consumerSpans) assert.Equal(t, 2, producerSpans) - assert.Equal(t, 2, internalSpans) + assert.Equal(t, 0, internalSpans) assert.Len(t, spans, 7) - assert.Len(t, stats, 11) + assert.Len(t, stats, 8) for _, span := range spans { - fmt.Printf("span.Name: %v, span.Meta: %v\n", span.Name, span.Meta) + // TODO: remove fmt line + fmt.Printf("span.Name: %v, span.Meta: %v, span.Resource: %v, span.Metrics: %v, span.ParentID: %v\n", span.Name, span.Meta, span.Resource, span.Metrics, span.ParentID) + switch { + case span.Meta["span.kind"] == apitrace.SpanKindInternal.String(): + assert.EqualValues(t, 0, span.Metrics["_top_level"]) + assert.EqualValues(t, 0, span.Metrics["_dd.measured"]) + case span.Meta["span.kind"] == apitrace.SpanKindServer.String(): + assert.EqualValues(t, 1, span.Metrics["_top_level"]) + assert.EqualValues(t, 0, span.Metrics["_dd.measured"]) + case span.Meta["span.kind"] == apitrace.SpanKindClient.String(): + assert.EqualValues(t, 0, span.Metrics["_top_level"]) + assert.EqualValues(t, 1, span.Metrics["_dd.measured"]) + case span.Meta["span.kind"] == apitrace.SpanKindProducer.String(): + assert.EqualValues(t, 0, span.Metrics["_top_level"]) + assert.EqualValues(t, 1, span.Metrics["_dd.measured"]) + case span.Meta["span.kind"] == apitrace.SpanKindConsumer.String(): + assert.EqualValues(t, 1, span.Metrics["_top_level"]) + assert.EqualValues(t, 0, span.Metrics["_dd.measured"]) + } } } @@ -552,20 +532,13 @@ func sendTracesComputeTopLevelBySpanKind(t *testing.T) { otel.SetTracerProvider(tracerProvider2) tracer = otel.Tracer("test-tracer2") } - if i == 4 { - _, childInternalSpan := tracer.Start(ctx, fmt.Sprintf("TestChildSpan%d", i), apitrace.WithSpanKind(apitrace.SpanKindInternal)) - _, childClientSpan := tracer.Start(ctx, fmt.Sprintf("TestChildSpan%d", i), apitrace.WithSpanKind(apitrace.SpanKindClient)) - childInternalSpan.SetAttributes(attribute.String("peer.service", "svc")) - childInternalSpan.SetAttributes(attribute.String("extra_peer_tag", "tag_val")) - childClientSpan.SetAttributes(attribute.String("peer.service", "svc")) - childClientSpan.SetAttributes(attribute.String("extra_peer_tag", "tag_val")) - childInternalSpan.End() - childClientSpan.End() - } + // Only sample 5 out of the 10 spans if i < 5 { span.SetAttributes(attribute.Bool("sampled", true)) } + span.SetAttributes(attribute.String("peer.service", "svc")) + span.SetAttributes(attribute.String("extra_peer_tag", "tag_val")) span.End() } time.Sleep(1 * time.Second) From 73cc41763464f80374b4e5382db81c2d387e325a Mon Sep 17 00:00:00 2001 From: Stanley Liu Date: Fri, 3 May 2024 16:01:52 -0400 Subject: [PATCH 6/7] Fix integration test --- .../integrationtest/integration_test.go | 33 ++++--------------- 1 file changed, 6 insertions(+), 27 deletions(-) diff --git a/exporter/datadogexporter/integrationtest/integration_test.go b/exporter/datadogexporter/integrationtest/integration_test.go index 3bb5ecaa44c9..fc85bd4ed38d 100644 --- a/exporter/datadogexporter/integrationtest/integration_test.go +++ b/exporter/datadogexporter/integrationtest/integration_test.go @@ -121,22 +121,11 @@ processors: batch: send_batch_size: 10 timeout: 5s - tail_sampling: - decision_wait: 1s - policies: [ - { - name: sample_flag, - type: boolean_attribute, - boolean_attribute: { key: sampled, value: true }, - } - ] connectors: datadog/connector: traces: compute_top_level_by_span_kind: true - peer_tags_aggregation: true - peer_tags: ["extra_peer_tag"] exporters: debug: @@ -164,9 +153,9 @@ service: receivers: [otlp] processors: [batch] exporters: [datadog/connector] - traces/2: # this pipeline uses sampling + traces/2: receivers: [datadog/connector] - processors: [tail_sampling, batch] + processors: [batch] exporters: [datadog, debug] metrics: receivers: [datadog/connector] @@ -398,8 +387,8 @@ func TestIntegrationComputeTopLevelBySpanKind(t *testing.T) { var stats []*pb.ClientGroupedStats var serverSpans, clientSpans, consumerSpans, producerSpans, internalSpans int - // 5 sampled spans + APM stats on 8 spans are sent to datadog exporter - for len(spans) < 5 || len(stats) < 8 { + // 10 total spans + APM stats on 8 spans are sent to datadog exporter + for len(spans) < 10 || len(stats) < 8 { select { case tracesBytes := <-tracesRec.ReqChan: gz := getGzipReader(t, tracesBytes) @@ -421,9 +410,7 @@ func TestIntegrationComputeTopLevelBySpanKind(t *testing.T) { assert.Equal(t, "datadogexporter-otelcol-tests", spl.AgentVersion) for _, csbs := range csps.Stats { stats = append(stats, csbs.Stats...) - for i, stat := range csbs.Stats { - // TODO: remove fmt line - fmt.Printf("i: %v, stat.SpanKind: %v, stat.Hits: %v, stat.TopLevelHits: %v\n", i, stat.SpanKind, stat.Hits, stat.TopLevelHits) + for _, stat := range csbs.Stats { switch stat.SpanKind { case apitrace.SpanKindInternal.String(): internalSpans++ @@ -457,12 +444,10 @@ func TestIntegrationComputeTopLevelBySpanKind(t *testing.T) { assert.Equal(t, 2, consumerSpans) assert.Equal(t, 2, producerSpans) assert.Equal(t, 0, internalSpans) - assert.Len(t, spans, 7) + assert.Len(t, spans, 10) assert.Len(t, stats, 8) for _, span := range spans { - // TODO: remove fmt line - fmt.Printf("span.Name: %v, span.Meta: %v, span.Resource: %v, span.Metrics: %v, span.ParentID: %v\n", span.Name, span.Meta, span.Resource, span.Metrics, span.ParentID) switch { case span.Meta["span.kind"] == apitrace.SpanKindInternal.String(): assert.EqualValues(t, 0, span.Metrics["_top_level"]) @@ -533,12 +518,6 @@ func sendTracesComputeTopLevelBySpanKind(t *testing.T) { tracer = otel.Tracer("test-tracer2") } - // Only sample 5 out of the 10 spans - if i < 5 { - span.SetAttributes(attribute.Bool("sampled", true)) - } - span.SetAttributes(attribute.String("peer.service", "svc")) - span.SetAttributes(attribute.String("extra_peer_tag", "tag_val")) span.End() } time.Sleep(1 * time.Second) From 2c0bf7572c46307d80524c886d17d8324e04bcb4 Mon Sep 17 00:00:00 2001 From: Stanley Liu Date: Mon, 6 May 2024 10:53:57 -0400 Subject: [PATCH 7/7] PR feedback --- .chloggen/stanley.liu_top-level-change-connector.yaml | 1 + .chloggen/stanley.liu_top-level-change.yaml | 1 + connector/datadogconnector/config.go | 1 + connector/datadogconnector/connector.go | 5 +++-- exporter/datadogexporter/config.go | 1 + 5 files changed, 7 insertions(+), 2 deletions(-) diff --git a/.chloggen/stanley.liu_top-level-change-connector.yaml b/.chloggen/stanley.liu_top-level-change-connector.yaml index b0b5137ac6a3..b49d9b7ff328 100644 --- a/.chloggen/stanley.liu_top-level-change-connector.yaml +++ b/.chloggen/stanley.liu_top-level-change-connector.yaml @@ -16,6 +16,7 @@ issues: [32005] # These lines will be padded with 2 spaces and then inserted directly into the document. # Use pipe (|) for multiline entries. subtext: | + `traces::compute_top_level_by_span_kind` needs to be enabled in both the Datadog connector and Datadog exporter configs if both components are being used. With this new logic, root spans and spans with a server or consumer `span.kind` will be marked as top-level. Additionally, spans with a client or producer `span.kind` will have stats computed. Enabling this config option may increase the number of spans that generate trace metrics, and may change which spans appear as top-level in Datadog. # If your change doesn't affect end users or the exported elements of any package, diff --git a/.chloggen/stanley.liu_top-level-change.yaml b/.chloggen/stanley.liu_top-level-change.yaml index 3a6a2c570107..b780ecbb502a 100644 --- a/.chloggen/stanley.liu_top-level-change.yaml +++ b/.chloggen/stanley.liu_top-level-change.yaml @@ -16,6 +16,7 @@ issues: [32005] # These lines will be padded with 2 spaces and then inserted directly into the document. # Use pipe (|) for multiline entries. subtext: | + `traces::compute_top_level_by_span_kind` needs to be enabled in both the Datadog connector and Datadog exporter configs if both components are being used. With this new logic, root spans and spans with a server or consumer `span.kind` will be marked as top-level. Additionally, spans with a client or producer `span.kind` will have stats computed. Enabling this config option may increase the number of spans that generate trace metrics, and may change which spans appear as top-level in Datadog. # If your change doesn't affect end users or the exported elements of any package, diff --git a/connector/datadogconnector/config.go b/connector/datadogconnector/config.go index d66961bbf1d0..bebece6aeb8c 100644 --- a/connector/datadogconnector/config.go +++ b/connector/datadogconnector/config.go @@ -49,6 +49,7 @@ type TracesConfig struct { // If set to true, root spans and spans with a server or consumer `span.kind` will be marked as top-level. // Additionally, spans with a client or producer `span.kind` will have stats computed. // Enabling this config option may increase the number of spans that generate trace metrics, and may change which spans appear as top-level in Datadog. + // ComputeTopLevelBySpanKind needs to be enabled in both the Datadog connector and Datadog exporter configs if both components are being used. // The default value is `false`. ComputeTopLevelBySpanKind bool `mapstructure:"compute_top_level_by_span_kind"` diff --git a/connector/datadogconnector/connector.go b/connector/datadogconnector/connector.go index 68fc807cb494..03e83667d97d 100644 --- a/connector/datadogconnector/connector.go +++ b/connector/datadogconnector/connector.go @@ -88,7 +88,7 @@ func newTraceToMetricConnector(set component.TelemetrySettings, cfg component.Co ctx := context.Background() return &traceToMetricConnector{ logger: set.Logger, - agent: datadog.NewAgentWithConfig(ctx, getTraceAgentCfg(cfg.(*Config).Traces, attributesTranslator), in, metricsClient, timingReporter), + agent: datadog.NewAgentWithConfig(ctx, getTraceAgentCfg(set.Logger, cfg.(*Config).Traces, attributesTranslator), in, metricsClient, timingReporter), translator: trans, in: in, metricsConsumer: metricsConsumer, @@ -98,7 +98,7 @@ func newTraceToMetricConnector(set component.TelemetrySettings, cfg component.Co }, nil } -func getTraceAgentCfg(cfg TracesConfig, attributesTranslator *attributes.Translator) *traceconfig.AgentConfig { +func getTraceAgentCfg(logger *zap.Logger, cfg TracesConfig, attributesTranslator *attributes.Translator) *traceconfig.AgentConfig { acfg := traceconfig.New() acfg.OTLPReceiver.AttributesTranslator = attributesTranslator acfg.OTLPReceiver.SpanNameRemappings = cfg.SpanNameRemappings @@ -115,6 +115,7 @@ func getTraceAgentCfg(cfg TracesConfig, attributesTranslator *attributes.Transla acfg.TraceBuffer = v } if cfg.ComputeTopLevelBySpanKind { + logger.Info("traces::compute_top_level_by_span_kind needs to be enabled in both the Datadog connector and Datadog exporter configs if both components are being used") acfg.Features["enable_otlp_compute_top_level_by_span_kind"] = struct{}{} } return acfg diff --git a/exporter/datadogexporter/config.go b/exporter/datadogexporter/config.go index 0158ec9a8495..631af88b4d67 100644 --- a/exporter/datadogexporter/config.go +++ b/exporter/datadogexporter/config.go @@ -280,6 +280,7 @@ type TracesConfig struct { // If set to true, root spans and spans with a server or consumer `span.kind` will be marked as top-level. // Additionally, spans with a client or producer `span.kind` will have stats computed. // Enabling this config option may increase the number of spans that generate trace metrics, and may change which spans appear as top-level in Datadog. + // ComputeTopLevelBySpanKind needs to be enabled in both the Datadog connector and Datadog exporter configs if both components are being used. // The default value is `false`. ComputeTopLevelBySpanKind bool `mapstructure:"compute_top_level_by_span_kind"`