From bf0a3f4ca94a86475f92d8a82a1831f4dbcabb91 Mon Sep 17 00:00:00 2001
From: Dmitrii Anoshin <anoshindx@gmail.com>
Date: Wed, 18 Oct 2023 10:24:59 -0700
Subject: [PATCH 01/11] [chore] Send readonly data to immutable exporters in
 lifecycle tests (#27825)

This should help to catch exporters that are incorrectly claimed as not
mutating.
---
 cmd/otelcontribcol/exporters_test.go | 18 +++++++++++++++---
 1 file changed, 15 insertions(+), 3 deletions(-)

diff --git a/cmd/otelcontribcol/exporters_test.go b/cmd/otelcontribcol/exporters_test.go
index 8ab6de82c640..949e7e41048d 100644
--- a/cmd/otelcontribcol/exporters_test.go
+++ b/cmd/otelcontribcol/exporters_test.go
@@ -606,11 +606,23 @@ func verifyExporterLifecycle(t *testing.T, factory exporter.Factory, getConfigFn
 			assert.NotPanics(t, func() {
 				switch e := exp.(type) {
 				case exporter.Logs:
-					err = e.ConsumeLogs(ctx, testdata.GenerateLogsManyLogRecordsSameResource(2))
+					logs := testdata.GenerateLogsManyLogRecordsSameResource(2)
+					if !e.Capabilities().MutatesData {
+						logs.MarkReadOnly()
+					}
+					err = e.ConsumeLogs(ctx, logs)
 				case exporter.Metrics:
-					err = e.ConsumeMetrics(ctx, testdata.GenerateMetricsTwoMetrics())
+					metrics := testdata.GenerateMetricsTwoMetrics()
+					if !e.Capabilities().MutatesData {
+						metrics.MarkReadOnly()
+					}
+					err = e.ConsumeMetrics(ctx, metrics)
 				case exporter.Traces:
-					err = e.ConsumeTraces(ctx, testdata.GenerateTracesTwoSpansSameResource())
+					traces := testdata.GenerateTracesTwoSpansSameResource()
+					if !e.Capabilities().MutatesData {
+						traces.MarkReadOnly()
+					}
+					err = e.ConsumeTraces(ctx, traces)
 				}
 			})
 			if !expectErr {

From c2f343b392058e8bdc86cd191451bac994e69dfb Mon Sep 17 00:00:00 2001
From: hovavza <147598197+hovavza@users.noreply.github.com>
Date: Wed, 18 Oct 2023 20:55:22 +0300
Subject: [PATCH 02/11] UDP input operator - async mode - separate between
 readers & processors (#27805)

**Description:** adding a feature - when async mode is enabled in the
UDP receiver (udp input operator), separating reading from processing
operations.
This is important to reduce data-loss in high scale UDP scenarios. See
original issue for more details.
The async config block is changed now. Instead of only a readers field
(determining the concurrency level of how many threads the udp receiver
is running, all reading from the UDP port, processing, and sending
downstream), it will now have 3 fields:
- readers - determines the concurrency level of threads only reading
from UDP port and pushing the packets to a channel.
- processors - determines the concurrency level of threads reading from
the channel, processing the packets, and sending downstream.
- max_queue_length - determines the max size of the channel between the
readers & the processors. Setting it high enough helps prevent
data-loss in cases of temporary downstream latency. Once the channel is
full, the reader threads will block until there's room in the queue (so
as to prevent unlimited memory usage).
This improves performance and reduces UDP packet loss in high-scale
scenarios.
Note that async mode only supports this separation of readers from
processors. If async config block isn't included, the default state
remains a single thread that reads & processes messages synchronously.

**Link to tracking Issue:** 27613

**Testing:** Local stress tests ran all types of async config (no
'async', with 'async', etc.). Updating existing udp test accordingly.
Also, ran scale tests and saw improvement in data-loss.

**Documentation:** Updated md file for both udplogreceiver & stanza
udp_input operator with the new flags.

---------

Co-authored-by: Daniel Jaglowski <jaglows3@gmail.com>
---
 ...er-to-reader-and-processor-with-async.yaml |  27 +++
 pkg/stanza/docs/operators/udp_input.md        |   6 +-
 pkg/stanza/operator/input/udp/config_test.go  |   7 +-
 .../operator/input/udp/testdata/config.yaml   |   4 +-
 pkg/stanza/operator/input/udp/udp.go          | 156 +++++++++++++-----
 pkg/stanza/operator/input/udp/udp_test.go     |   7 +-
 receiver/udplogreceiver/README.md             |   6 +-
 receiver/udplogreceiver/udp_test.go           |   7 +-
 8 files changed, 171 insertions(+), 49 deletions(-)
 create mode 100644 .chloggen/separate-udp-receiver-to-reader-and-processor-with-async.yaml

diff --git a/.chloggen/separate-udp-receiver-to-reader-and-processor-with-async.yaml b/.chloggen/separate-udp-receiver-to-reader-and-processor-with-async.yaml
new file mode 100644
index 000000000000..bd33138b4325
--- /dev/null
+++ b/.chloggen/separate-udp-receiver-to-reader-and-processor-with-async.yaml
@@ -0,0 +1,27 @@
+# Use this changelog template to create an entry for release notes.
+
+# One of 'breaking', 'deprecation', 'new_component', 'enhancement', 'bug_fix'
+change_type: enhancement
+
+# The name of the component, or a single word describing the area of concern, (e.g. filelogreceiver)
+component: pkg/stanza
+
+# A brief description of the change.  Surround your text with quotes ("") if it needs to start with a backtick (`).
+note: When async is enabled for udp receiver, separate logic into readers (only read logs from udp port and push to channel), and processors (read logs from channel and process; decode, split, add attributes, and push downstream), allowing to change concurrency level for both readers and processors separately.
+
+# Mandatory: One or more tracking issues related to the change. You can use the PR number here if no issue exists.
+issues: [27613]
+
+# (Optional) One or more lines of additional information to render under the primary note.
+# These lines will be padded with 2 spaces and then inserted directly into the document.
+# Use pipe (|) for multiline entries.
+subtext:
+
+# If your change doesn't affect end users or the exported elements of any package,
+# you should instead start your pull request title with [chore] or use the "Skip Changelog" label.
+# Optional: The change log or logs in which this entry should be included.
+# e.g. '[user]' or '[user, api]'
+# Include 'user' if the change is relevant to end users.
+# Include 'api' if there is a change to a library API.
+# Default: '[user]'
+change_logs: []
\ No newline at end of file
diff --git a/pkg/stanza/docs/operators/udp_input.md b/pkg/stanza/docs/operators/udp_input.md
index 2a08d16716bb..555ddc97faba 100644
--- a/pkg/stanza/docs/operators/udp_input.md
+++ b/pkg/stanza/docs/operators/udp_input.md
@@ -50,11 +50,13 @@ for other encodings available.
 
 If set, the `async` configuration block instructs the `udp_input` operator to read and process logs asynchronsouly and concurrently.
 
-**note** If `async` is not set at all, a single thread will read lines synchronously.
+**note** If `async` is not set at all, a single thread will read & process lines synchronously.
 
 | Field                                   | Default              | Description |
 | ---                                     | ---                  | ---         |
-| `readers`                               | 1                    | Concurrency level - Determines how many go routines read from UDP port (and process logs before sending downstream). |
+| `readers`                               | 1                    | Concurrency level - Determines how many go routines read from UDP port and push to channel (to be handled by processors). |
+| `processors`                            | 1                    | Concurrency level - Determines how many go routines read from channel (pushed by readers) and process logs before sending downstream. |
+| `max_queue_length`                      | 100                  | Determines max number of messages which may be waiting for a processor. While the queue is full, the readers will wait until there's room (readers will not drop messages, but they will not read additional incoming messages during that period). |
 
 ### Example Configurations
 
diff --git a/pkg/stanza/operator/input/udp/config_test.go b/pkg/stanza/operator/input/udp/config_test.go
index 7b806ed61985..a65f8ea6cc3d 100644
--- a/pkg/stanza/operator/input/udp/config_test.go
+++ b/pkg/stanza/operator/input/udp/config_test.go
@@ -43,8 +43,11 @@ func TestUnmarshal(t *testing.T) {
 					cfg.Encoding = "utf-8"
 					cfg.SplitConfig.LineStartPattern = "ABC"
 					cfg.SplitConfig.LineEndPattern = ""
-					cfg.AsyncConfig = NewAsyncConfig()
-					cfg.AsyncConfig.Readers = 2
+					cfg.AsyncConfig = &AsyncConfig{
+						Readers:        2,
+						Processors:     2,
+						MaxQueueLength: 100,
+					}
 					return cfg
 				}(),
 			},
diff --git a/pkg/stanza/operator/input/udp/testdata/config.yaml b/pkg/stanza/operator/input/udp/testdata/config.yaml
index 4acbf3621df8..4353dd894ee4 100644
--- a/pkg/stanza/operator/input/udp/testdata/config.yaml
+++ b/pkg/stanza/operator/input/udp/testdata/config.yaml
@@ -17,4 +17,6 @@ all_with_async:
     line_start_pattern: ABC
     line_end_pattern: ""
   async:
-    readers: 2
\ No newline at end of file
+    readers: 2
+    processors: 2
+    max_queue_length: 100
diff --git a/pkg/stanza/operator/input/udp/udp.go b/pkg/stanza/operator/input/udp/udp.go
index cc2b69952df3..4593f9ead5e5 100644
--- a/pkg/stanza/operator/input/udp/udp.go
+++ b/pkg/stanza/operator/input/udp/udp.go
@@ -27,6 +27,10 @@ const (
 
 	// Maximum UDP packet size
 	MaxUDPSize = 64 * 1024
+
+	defaultReaders        = 1
+	defaultProcessors     = 1
+	defaultMaxQueueLength = 100
 )
 
 func init() {
@@ -59,14 +63,9 @@ type Config struct {
 }
 
 type AsyncConfig struct {
-	Readers int `mapstructure:"readers,omitempty"`
-}
-
-// NewAsyncConfig creates a new AsyncConfig with default values.
-func NewAsyncConfig() *AsyncConfig {
-	return &AsyncConfig{
-		Readers: 1,
-	}
+	Readers        int `mapstructure:"readers,omitempty"`
+	Processors     int `mapstructure:"processors,omitempty"`
+	MaxQueueLength int `mapstructure:"max_queue_length,omitempty"`
 }
 
 // BaseConfig is the details configuration of a udp input operator.
@@ -113,12 +112,16 @@ func (c Config) Build(logger *zap.SugaredLogger) (operator.Operator, error) {
 		resolver = helper.NewIPResolver()
 	}
 
-	if c.AsyncConfig == nil {
-		c.AsyncConfig = NewAsyncConfig()
-	}
-
-	if c.AsyncConfig.Readers <= 0 {
-		return nil, fmt.Errorf("async readers must be greater than 0")
+	if c.AsyncConfig != nil {
+		if c.AsyncConfig.Readers <= 0 {
+			c.AsyncConfig.Readers = defaultReaders
+		}
+		if c.AsyncConfig.Processors <= 0 {
+			c.AsyncConfig.Processors = defaultProcessors
+		}
+		if c.AsyncConfig.MaxQueueLength <= 0 {
+			c.AsyncConfig.MaxQueueLength = defaultMaxQueueLength
+		}
 	}
 
 	udpInput := &Input{
@@ -132,6 +135,10 @@ func (c Config) Build(logger *zap.SugaredLogger) (operator.Operator, error) {
 		OneLogPerPacket: c.OneLogPerPacket,
 		AsyncConfig:     c.AsyncConfig,
 	}
+
+	if c.AsyncConfig != nil {
+		udpInput.messageQueue = make(chan messageAndAddress, c.AsyncConfig.MaxQueueLength)
+	}
 	return udpInput, nil
 }
 
@@ -151,6 +158,14 @@ type Input struct {
 	encoding  encoding.Encoding
 	splitFunc bufio.SplitFunc
 	resolver  *helper.IPResolver
+
+	messageQueue chan messageAndAddress
+	stopOnce     sync.Once
+}
+
+type messageAndAddress struct {
+	Message    []byte
+	RemoteAddr net.Addr
 }
 
 // Start will start listening for messages on a socket.
@@ -170,9 +185,20 @@ func (u *Input) Start(_ operator.Persister) error {
 
 // goHandleMessages will handle messages from a udp connection.
 func (u *Input) goHandleMessages(ctx context.Context) {
-	for i := 0; i < u.AsyncConfig.Readers; i++ {
+	if u.AsyncConfig == nil {
 		u.wg.Add(1)
 		go u.readAndProcessMessages(ctx)
+		return
+	}
+
+	for i := 0; i < u.AsyncConfig.Readers; i++ {
+		u.wg.Add(1)
+		go u.readMessagesAsync(ctx)
+	}
+
+	for i := 0; i < u.AsyncConfig.Processors; i++ {
+		u.wg.Add(1)
+		go u.processMessagesAsync(ctx)
 	}
 }
 
@@ -193,23 +219,69 @@ func (u *Input) readAndProcessMessages(ctx context.Context) {
 			break
 		}
 
-		if u.OneLogPerPacket {
-			log := truncateMaxLog(message)
-			u.handleMessage(ctx, remoteAddr, dec, log)
-			continue
-		}
+		u.processMessage(ctx, message, remoteAddr, dec, buf)
+	}
+}
 
-		scanner := bufio.NewScanner(bytes.NewReader(message))
-		scanner.Buffer(buf, MaxUDPSize)
+func (u *Input) processMessage(ctx context.Context, message []byte, remoteAddr net.Addr, dec *decode.Decoder, buf []byte) {
+	if u.OneLogPerPacket {
+		log := truncateMaxLog(message)
+		u.handleMessage(ctx, remoteAddr, dec, log)
+		return
+	}
+
+	scanner := bufio.NewScanner(bytes.NewReader(message))
+	scanner.Buffer(buf, MaxUDPSize)
+
+	scanner.Split(u.splitFunc)
 
-		scanner.Split(u.splitFunc)
+	for scanner.Scan() {
+		u.handleMessage(ctx, remoteAddr, dec, scanner.Bytes())
+	}
+	if err := scanner.Err(); err != nil {
+		u.Errorw("Scanner error", zap.Error(err))
+	}
+}
 
-		for scanner.Scan() {
-			u.handleMessage(ctx, remoteAddr, dec, scanner.Bytes())
+func (u *Input) readMessagesAsync(ctx context.Context) {
+	defer u.wg.Done()
+
+	for {
+		message, remoteAddr, err := u.readMessage()
+		if err != nil {
+			select {
+			case <-ctx.Done():
+				return
+			default:
+				u.Errorw("Failed reading messages", zap.Error(err))
+			}
+			break
 		}
-		if err := scanner.Err(); err != nil {
-			u.Errorw("Scanner error", zap.Error(err))
+
+		messageAndAddr := messageAndAddress{
+			Message:    message,
+			RemoteAddr: remoteAddr,
 		}
+
+		// Send the message to the message queue for processing
+		u.messageQueue <- messageAndAddr
+	}
+}
+
+func (u *Input) processMessagesAsync(ctx context.Context) {
+	defer u.wg.Done()
+
+	dec := decode.New(u.encoding)
+	buf := make([]byte, 0, MaxUDPSize)
+
+	for {
+		// Read a message from the message queue.
+		messageAndAddr, ok := <-u.messageQueue
+		if !ok {
+			return // Channel closed, exit the goroutine.
+		}
+
+		u.processMessage(ctx, messageAndAddr.Message, messageAndAddr.RemoteAddr, dec, buf)
 	}
 }
 
@@ -274,18 +346,24 @@ func (u *Input) readMessage() ([]byte, net.Addr, error) {
 
 // Stop will stop listening for udp messages.
 func (u *Input) Stop() error {
-	if u.cancel == nil {
-		return nil
-	}
-	u.cancel()
-	if u.connection != nil {
-		if err := u.connection.Close(); err != nil {
-			u.Errorf("failed to close UDP connection: %s", err)
+	u.stopOnce.Do(func() {
+		if u.AsyncConfig != nil {
+			close(u.messageQueue)
 		}
-	}
-	u.wg.Wait()
-	if u.resolver != nil {
-		u.resolver.Stop()
-	}
+
+		if u.cancel == nil {
+			return
+		}
+		u.cancel()
+		if u.connection != nil {
+			if err := u.connection.Close(); err != nil {
+				u.Errorf("failed to close UDP connection: %s", err)
+			}
+		}
+		u.wg.Wait()
+		if u.resolver != nil {
+			u.resolver.Stop()
+		}
+	})
 	return nil
 }
diff --git a/pkg/stanza/operator/input/udp/udp_test.go b/pkg/stanza/operator/input/udp/udp_test.go
index aba8eeb28e59..7695b734af90 100644
--- a/pkg/stanza/operator/input/udp/udp_test.go
+++ b/pkg/stanza/operator/input/udp/udp_test.go
@@ -143,8 +143,11 @@ func TestInput(t *testing.T) {
 	t.Run("TrailingCRNewlines", udpInputTest([]byte("message1\r\n"), []string{"message1"}, cfg))
 	t.Run("NewlineInMessage", udpInputTest([]byte("message1\nmessage2\n"), []string{"message1\nmessage2"}, cfg))
 
-	cfg.AsyncConfig = NewAsyncConfig()
-	cfg.AsyncConfig.Readers = 2
+	cfg.AsyncConfig = &AsyncConfig{
+		Readers:        2,
+		Processors:     2,
+		MaxQueueLength: 100,
+	}
 	t.Run("SimpleAsync", udpInputTest([]byte("message1"), []string{"message1"}, cfg))
 }
 
diff --git a/receiver/udplogreceiver/README.md b/receiver/udplogreceiver/README.md
index 4d6c9ed85751..8be89e306df1 100644
--- a/receiver/udplogreceiver/README.md
+++ b/receiver/udplogreceiver/README.md
@@ -24,7 +24,7 @@ Receives logs over UDP.
 | `attributes`              | {}                   | A map of `key: value` pairs to add to the entry's attributes                                                       |
 | `one_log_per_packet`      | false                | Skip log tokenization, set to true if logs contains one log per record and multiline is not used.  This will improve performance.                                                 |
 | `resource`                | {}                   | A map of `key: value` pairs to add to the entry's resource                                                         |
-| `add_attributes`          | false                | Adds `net.*` attributes according to [semantic convention][hhttps://github.com/open-telemetry/semantic-conventions/blob/cee22ec91448808ebcfa53df689c800c7171c9e1/docs/general/attributes.md#other-network-attributes] |
+| `add_attributes`          | false                | Adds `net.*` attributes according to [semantic convention](https://github.com/open-telemetry/semantic-conventions/blob/cee22ec91448808ebcfa53df689c800c7171c9e1/docs/general/attributes.md#other-network-attributes) |
 | `multiline`               |                      | A `multiline` configuration block. See below for details                                                           |
 | `encoding`                | `utf-8`              | The encoding of the file being read. See the list of supported encodings below for available options               |
 | `operators`               | []                   | An array of [operators](../../pkg/stanza/docs/operators/README.md#what-operators-are-available). See below for more details |
@@ -78,7 +78,9 @@ If set, the `async` configuration block instructs the `udp_input` operator to re
 
 | Field                                   | Default              | Description |
 | ---                                     | ---                  | ---         |
-| `readers`                               | 1                    | Concurrency level - Determines how many go routines read from UDP port (and process logs before sending downstream). |
+| `readers`                               | 1                    | Concurrency level - Determines how many go routines read from UDP port and push to channel (to be handled by processors). |
+| `processors`                            | 1                    | Concurrency level - Determines how many go routines read from channel (pushed by readers) and process logs before sending downstream. |
+| `max_queue_length`                      | 100                  | Determines max length of channel being used by async reader routines. When channel reaches max number, reader routine will block until channel has room. |
 
 ## Example Configurations
 
diff --git a/receiver/udplogreceiver/udp_test.go b/receiver/udplogreceiver/udp_test.go
index b3cbe39d7b58..e632100a127f 100644
--- a/receiver/udplogreceiver/udp_test.go
+++ b/receiver/udplogreceiver/udp_test.go
@@ -32,7 +32,12 @@ func TestUdp(t *testing.T) {
 func TestUdpAsync(t *testing.T) {
 	listenAddress := "127.0.0.1:29019"
 	cfg := testdataConfigYaml(listenAddress)
-	cfg.InputConfig.AsyncConfig = udp.NewAsyncConfig()
+	cfg.InputConfig.AsyncConfig = &udp.AsyncConfig{
+		Readers:        2,
+		Processors:     2,
+		MaxQueueLength: 100,
+	}
+
 	cfg.InputConfig.AsyncConfig.Readers = 2
 	testUDP(t, testdataConfigYaml(listenAddress), listenAddress)
 }

From c44ad3c81b7670b19edae3abef8a9416f04eecd7 Mon Sep 17 00:00:00 2001
From: Brandon Johnson <brandon.johnson@bluemedora.com>
Date: Wed, 18 Oct 2023 17:11:00 -0400
Subject: [PATCH 03/11] [receiver/filelog] Implement specifying top n files to
 track when ordering (#27844)

**Description:**
* Add a new `ordering_criteria.top_n` option, which allows a user to
specify the number of files to track after ordering.
  * Default is 1, which was the existing behavior.

**Link to tracking Issue:** #23788

**Testing:**
Unit tests added.

**Documentation:**
Added new parameter to existing documentation.
---
 .chloggen/feat_top_n_file_sorting.yaml        |  22 ++++
 pkg/stanza/fileconsumer/config_test.go        |  10 ++
 pkg/stanza/fileconsumer/matcher/matcher.go    |  23 +++-
 .../fileconsumer/matcher/matcher_test.go      | 114 ++++++++++++++++++
 pkg/stanza/fileconsumer/testdata/config.yaml  |   4 +
 receiver/filelogreceiver/README.md            |   1 +
 6 files changed, 171 insertions(+), 3 deletions(-)
 create mode 100755 .chloggen/feat_top_n_file_sorting.yaml

diff --git a/.chloggen/feat_top_n_file_sorting.yaml b/.chloggen/feat_top_n_file_sorting.yaml
new file mode 100755
index 000000000000..1a4e678bae36
--- /dev/null
+++ b/.chloggen/feat_top_n_file_sorting.yaml
@@ -0,0 +1,22 @@
+# Use this changelog template to create an entry for release notes.
+
+# One of 'breaking', 'deprecation', 'new_component', 'enhancement', 'bug_fix'
+change_type: "enhancement"
+
+# The name of the component, or a single word describing the area of concern, (e.g. filelogreceiver)
+component: filelogreceiver
+
+# A brief description of the change.  Surround your text with quotes ("") if it needs to start with a backtick (`).
+note: Add a new "top_n" option to specify the number of files to track when using ordering criteria
+
+# Mandatory: One or more tracking issues related to the change. You can use the PR number here if no issue exists.
+issues: [23788]
+
+# If your change doesn't affect end users or the exported elements of any package,
+# you should instead start your pull request title with [chore] or use the "Skip Changelog" label.
+# Optional: The change log or logs in which this entry should be included.
+# e.g. '[user]' or '[user, api]'
+# Include 'user' if the change is relevant to end users.
+# Include 'api' if there is a change to a library API.
+# Default: '[user]'
+change_logs: ["user"]
diff --git a/pkg/stanza/fileconsumer/config_test.go b/pkg/stanza/fileconsumer/config_test.go
index 9d83118aa4bd..43171be5c96c 100644
--- a/pkg/stanza/fileconsumer/config_test.go
+++ b/pkg/stanza/fileconsumer/config_test.go
@@ -412,6 +412,16 @@ func TestUnmarshal(t *testing.T) {
 					return newMockOperatorConfig(cfg)
 				}(),
 			},
+			{
+				Name: "ordering_criteria_top_n",
+				Expect: func() *mockOperatorConfig {
+					cfg := NewConfig()
+					cfg.OrderingCriteria = matcher.OrderingCriteria{
+						TopN: 10,
+					}
+					return newMockOperatorConfig(cfg)
+				}(),
+			},
 		},
 	}.Run(t)
 }
diff --git a/pkg/stanza/fileconsumer/matcher/matcher.go b/pkg/stanza/fileconsumer/matcher/matcher.go
index 0a7a0628edac..76cdd1bd4feb 100644
--- a/pkg/stanza/fileconsumer/matcher/matcher.go
+++ b/pkg/stanza/fileconsumer/matcher/matcher.go
@@ -18,6 +18,10 @@ const (
 	sortTypeAlphabetical = "alphabetical"
 )
 
+const (
+	defaultOrderingCriteriaTopN = 1
+)
+
 type Criteria struct {
 	Include          []string         `mapstructure:"include,omitempty"`
 	Exclude          []string         `mapstructure:"exclude,omitempty"`
@@ -26,6 +30,7 @@ type Criteria struct {
 
 type OrderingCriteria struct {
 	Regex  string `mapstructure:"regex,omitempty"`
+	TopN   int    `mapstructure:"top_n,omitempty"`
 	SortBy []Sort `mapstructure:"sort_by,omitempty"`
 }
 
@@ -62,6 +67,14 @@ func New(c Criteria) (*Matcher, error) {
 		return nil, fmt.Errorf("'regex' must be specified when 'sort_by' is specified")
 	}
 
+	if c.OrderingCriteria.TopN < 0 {
+		return nil, fmt.Errorf("'top_n' must be a positive integer")
+	}
+
+	if c.OrderingCriteria.TopN == 0 {
+		c.OrderingCriteria.TopN = defaultOrderingCriteriaTopN
+	}
+
 	regex, err := regexp.Compile(c.OrderingCriteria.Regex)
 	if err != nil {
 		return nil, fmt.Errorf("compile regex: %w", err)
@@ -97,6 +110,7 @@ func New(c Criteria) (*Matcher, error) {
 		include:    c.Include,
 		exclude:    c.Exclude,
 		regex:      regex,
+		topN:       c.OrderingCriteria.TopN,
 		filterOpts: filterOpts,
 	}, nil
 }
@@ -105,6 +119,7 @@ type Matcher struct {
 	include    []string
 	exclude    []string
 	regex      *regexp.Regexp
+	topN       int
 	filterOpts []filter.Option
 }
 
@@ -127,7 +142,9 @@ func (m Matcher) MatchFiles() ([]string, error) {
 		return result, errors.Join(err, errs)
 	}
 
-	// Return only the first item.
-	// See https://github.com/open-telemetry/opentelemetry-collector-contrib/issues/23788
-	return result[:1], errors.Join(err, errs)
+	if len(result) <= m.topN {
+		return result, errors.Join(err, errs)
+	}
+
+	return result[:m.topN], errors.Join(err, errs)
 }
diff --git a/pkg/stanza/fileconsumer/matcher/matcher_test.go b/pkg/stanza/fileconsumer/matcher/matcher_test.go
index c838962a4699..1d9de6f17f87 100644
--- a/pkg/stanza/fileconsumer/matcher/matcher_test.go
+++ b/pkg/stanza/fileconsumer/matcher/matcher_test.go
@@ -98,6 +98,23 @@ func TestNew(t *testing.T) {
 			},
 			expectedErr: "compile regex: error parsing regexp: missing closing ]: `[a-z`",
 		},
+		{
+			name: "TopN is negative",
+			criteria: Criteria{
+				Include: []string{"*.log"},
+				OrderingCriteria: OrderingCriteria{
+					Regex: "[a-z]",
+					TopN:  -1,
+					SortBy: []Sort{
+						{
+							SortType: "numeric",
+							RegexKey: "key",
+						},
+					},
+				},
+			},
+			expectedErr: "'top_n' must be a positive integer",
+		},
 		{
 			name: "SortTypeEmpty",
 			criteria: Criteria{
@@ -249,6 +266,46 @@ func TestMatcher(t *testing.T) {
 			},
 			expected: []string{"err.2023020612.log"},
 		},
+		{
+			name:    "TopN > number of files",
+			files:   []string{"err.2023020611.log", "err.2023020612.log"},
+			include: []string{"err.*.log"},
+			exclude: []string{},
+			filterCriteria: OrderingCriteria{
+				Regex: `err\.(?P<value>\d{4}\d{2}\d{2}\d{2}).*log`,
+				TopN:  3,
+				SortBy: []Sort{
+					{
+						SortType:  sortTypeTimestamp,
+						RegexKey:  "value",
+						Ascending: false,
+						Location:  "UTC",
+						Layout:    `%Y%m%d%H`,
+					},
+				},
+			},
+			expected: []string{"err.2023020612.log", "err.2023020611.log"},
+		},
+		{
+			name:    "TopN == number of files",
+			files:   []string{"err.2023020611.log", "err.2023020612.log"},
+			include: []string{"err.*.log"},
+			exclude: []string{},
+			filterCriteria: OrderingCriteria{
+				Regex: `err\.(?P<value>\d{4}\d{2}\d{2}\d{2}).*log`,
+				TopN:  2,
+				SortBy: []Sort{
+					{
+						SortType:  sortTypeTimestamp,
+						RegexKey:  "value",
+						Ascending: false,
+						Location:  "UTC",
+						Layout:    `%Y%m%d%H`,
+					},
+				},
+			},
+			expected: []string{"err.2023020612.log", "err.2023020611.log"},
+		},
 		{
 			name:    "Timestamp Sorting Ascending",
 			files:   []string{"err.2023020612.log", "err.2023020611.log", "err.2023020609.log", "err.2023020610.log"},
@@ -319,6 +376,24 @@ func TestMatcher(t *testing.T) {
 			},
 			expected: []string{"err.d.log"},
 		},
+		{
+			name:    "Alphabetical Sorting - Top 2",
+			files:   []string{"err.a.log", "err.d.log", "err.b.log", "err.c.log"},
+			include: []string{"err.*.log"},
+			exclude: []string{},
+			filterCriteria: OrderingCriteria{
+				Regex: `err\.(?P<value>[a-zA-Z]+).*log`,
+				TopN:  2,
+				SortBy: []Sort{
+					{
+						SortType:  sortTypeAlphabetical,
+						RegexKey:  "value",
+						Ascending: false,
+					},
+				},
+			},
+			expected: []string{"err.d.log", "err.c.log"},
+		},
 		{
 			name:    "Alphabetical Sorting Ascending",
 			files:   []string{"err.b.log", "err.a.log", "err.c.log", "err.d.log"},
@@ -336,6 +411,45 @@ func TestMatcher(t *testing.T) {
 			},
 			expected: []string{"err.a.log"},
 		},
+		{
+			name: "Multiple Sorting - timestamp priority sort - Top 4",
+			files: []string{
+				"err.b.1.2023020601.log",
+				"err.b.2.2023020601.log",
+				"err.a.1.2023020601.log",
+				"err.a.2.2023020601.log",
+				"err.b.1.2023020602.log",
+				"err.a.2.2023020602.log",
+				"err.b.2.2023020602.log",
+				"err.a.1.2023020602.log",
+			},
+			include: []string{"err.*.log"},
+			exclude: []string{},
+			filterCriteria: OrderingCriteria{
+				Regex: `err\.(?P<alpha>[a-zA-Z])\.(?P<number>\d+)\.(?P<time>\d{10})\.log`,
+				TopN:  4,
+				SortBy: []Sort{
+					{
+						SortType:  sortTypeAlphabetical,
+						RegexKey:  "alpha",
+						Ascending: false,
+					},
+					{
+						SortType:  sortTypeNumeric,
+						RegexKey:  "number",
+						Ascending: false,
+					},
+					{
+						SortType:  sortTypeTimestamp,
+						RegexKey:  "time",
+						Ascending: false,
+						Location:  "UTC",
+						Layout:    `%Y%m%d%H`,
+					},
+				},
+			},
+			expected: []string{"err.b.2.2023020602.log", "err.a.2.2023020602.log", "err.b.1.2023020602.log", "err.a.1.2023020602.log"},
+		},
 		{
 			name: "Multiple Sorting - timestamp priority sort",
 			files: []string{
diff --git a/pkg/stanza/fileconsumer/testdata/config.yaml b/pkg/stanza/fileconsumer/testdata/config.yaml
index 69f4c2eee5b2..aa973d609612 100644
--- a/pkg/stanza/fileconsumer/testdata/config.yaml
+++ b/pkg/stanza/fileconsumer/testdata/config.yaml
@@ -180,3 +180,7 @@ header_config:
     pattern: "^#"
     metadata_operators:
       - type: "regex_parser"
+ordering_criteria_top_n:
+  type: mock
+  ordering_criteria:
+    top_n: 10
diff --git a/receiver/filelogreceiver/README.md b/receiver/filelogreceiver/README.md
index f4f730876ef2..2b23516953af 100644
--- a/receiver/filelogreceiver/README.md
+++ b/receiver/filelogreceiver/README.md
@@ -51,6 +51,7 @@ Tails and parses logs from files.
 | `retry_on_failure.max_interval`     | `30s`                                | Upper bound on retry backoff [interval](#time-parameters). Once this value is reached the delay between consecutive retries will remain constant at the specified value.                                                                                        |
 | `retry_on_failure.max_elapsed_time` | `5m`                                 | Maximum amount of [time](#time-parameters) (including retries) spent trying to send a logs batch to a downstream consumer. Once this value is reached, the data is discarded. Retrying never stops if set to `0`.     
 | `ordering_criteria.regex`     |                                      | Regular expression used for sorting, should contain a named capture groups that are to be used in `regex_key`.                                                                                                                               |
+| `ordering_criteria.top_n`     | 1 | The number of files to track when using file ordering. The top N files are tracked after applying the ordering criteria. |
 | `ordering_criteria.sort_by.sort_type` |                                      | Type of sorting to be performed (e.g., `numeric`, `alphabetical`, `timestamp`)                                                                                                                                                                                  |
 | `ordering_criteria.sort_by.location`  |                                      | Relevant if `sort_type` is set to `timestamp`. Defines the location of the timestamp of the file.                                                                                                                                                               |
 | `ordering_criteria.sort_by.format`    |                                      | Relevant if `sort_type` is set to `timestamp`. Defines the strptime format of the timestamp being sorted.                                                                                                                                                       |

From 762f843f556a6da818f7ec0f9f528f5a2f08d277 Mon Sep 17 00:00:00 2001
From: Miel Donkers <miel.donkers@gmail.com>
Date: Thu, 19 Oct 2023 02:53:40 +0200
Subject: [PATCH 04/11] [pkg/pdatautil] Optimize the hashing function for
 `pcommon.Map` (#27840)

**Description:**

Improve the performance of the `MapHash` function, mostly by using the
xxhash architecture optimized version.

`hash.Sum` is a 'Go-code' only implementation
`xxhash.Sum64` has optimized versions for different architectures
Both result in the exact same hash though.


For the given benchmarks, the gain is > 10%

From `main`:
```
goos: linux
goarch: amd64
pkg: github.com/open-telemetry/opentelemetry-collector-contrib/pkg/pdatautil
cpu: 11th Gen Intel(R) Core(TM) i7-11800H @ 2.30GHz
BenchmarkMapHashFourItems-16                  	47676003	       236.0 ns/op	      24 B/op	       1 allocs/op
BenchmarkMapHashEightItems-16                 	22551222	       532.3 ns/op	      32 B/op	       2 allocs/op
BenchmarkMapHashWithEmbeddedSliceAndMap-16    	14098969	       893.1 ns/op	      56 B/op	       3 allocs/op
```

The PR:
```
goos: linux
goarch: amd64
pkg: github.com/open-telemetry/opentelemetry-collector-contrib/pkg/pdatautil
cpu: 11th Gen Intel(R) Core(TM) i7-11800H @ 2.30GHz
BenchmarkMapHashFourItems-16                  	59854737	       203.4 ns/op	      24 B/op	       1 allocs/op
BenchmarkMapHashEightItems-16                 	25609375	       475.0 ns/op	      32 B/op	       2 allocs/op
BenchmarkMapHashWithEmbeddedSliceAndMap-16    	15950144	       753.8 ns/op	      56 B/op	       3 allocs/op
```

**Testing:**
(Re-)using the same tests and benchmarks to prove semantics didn't
change.
---
 pkg/pdatautil/hash.go | 92 +++++++++++++++++++++----------------------
 1 file changed, 44 insertions(+), 48 deletions(-)

diff --git a/pkg/pdatautil/hash.go b/pkg/pdatautil/hash.go
index 043e308e9d0a..7900120cd6c3 100644
--- a/pkg/pdatautil/hash.go
+++ b/pkg/pdatautil/hash.go
@@ -5,7 +5,6 @@ package pdatautil // import "github.com/open-telemetry/opentelemetry-collector-c
 
 import (
 	"encoding/binary"
-	"hash"
 	"math"
 	"sort"
 	"sync"
@@ -28,23 +27,19 @@ var (
 	valMapSuffix    = []byte{'\xfd'}
 	valSlicePrefix  = []byte{'\xfe'}
 	valSliceSuffix  = []byte{'\xff'}
+
+	emptyHash = [16]byte{0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00}
 )
 
 type hashWriter struct {
-	h       hash.Hash
-	strBuf  []byte
+	byteBuf []byte
 	keysBuf []string
-	sumHash []byte
-	numBuf  []byte
 }
 
 func newHashWriter() *hashWriter {
 	return &hashWriter{
-		h:       xxhash.New(),
-		strBuf:  make([]byte, 0, 128),
+		byteBuf: make([]byte, 0, 512),
 		keysBuf: make([]string, 0, 16),
-		sumHash: make([]byte, 0, 16),
-		numBuf:  make([]byte, 8),
 	}
 }
 
@@ -55,10 +50,16 @@ var hashWriterPool = &sync.Pool{
 // MapHash return a hash for the provided map.
 // Maps with the same underlying key/value pairs in different order produce the same deterministic hash value.
 func MapHash(m pcommon.Map) [16]byte {
+	if m.Len() == 0 {
+		return emptyHash
+	}
+
 	hw := hashWriterPool.Get().(*hashWriter)
 	defer hashWriterPool.Put(hw)
-	hw.h.Reset()
+	hw.byteBuf = hw.byteBuf[:0]
+
 	hw.writeMapHash(m)
+
 	return hw.hashSum128()
 }
 
@@ -66,8 +67,10 @@ func MapHash(m pcommon.Map) [16]byte {
 func ValueHash(v pcommon.Value) [16]byte {
 	hw := hashWriterPool.Get().(*hashWriter)
 	defer hashWriterPool.Put(hw)
-	hw.h.Reset()
+	hw.byteBuf = hw.byteBuf[:0]
+
 	hw.writeValueHash(v)
+
 	return hw.hashSum128()
 }
 
@@ -90,10 +93,8 @@ func (hw *hashWriter) writeMapHash(m pcommon.Map) {
 	sort.Strings(workingKeySet)
 	for _, k := range workingKeySet {
 		v, _ := m.Get(k)
-		hw.strBuf = hw.strBuf[:0]
-		hw.strBuf = append(hw.strBuf, keyPrefix...)
-		hw.strBuf = append(hw.strBuf, k...)
-		hw.h.Write(hw.strBuf)
+		hw.byteBuf = append(hw.byteBuf, keyPrefix...)
+		hw.byteBuf = append(hw.byteBuf, k...)
 		hw.writeValueHash(v)
 	}
 
@@ -101,59 +102,54 @@ func (hw *hashWriter) writeMapHash(m pcommon.Map) {
 	hw.keysBuf = hw.keysBuf[:nextIndex]
 }
 
-func (hw *hashWriter) writeSliceHash(sl pcommon.Slice) {
-	for i := 0; i < sl.Len(); i++ {
-		hw.writeValueHash(sl.At(i))
-	}
-}
-
 func (hw *hashWriter) writeValueHash(v pcommon.Value) {
 	switch v.Type() {
 	case pcommon.ValueTypeStr:
-		hw.strBuf = hw.strBuf[:0]
-		hw.strBuf = append(hw.strBuf, valStrPrefix...)
-		hw.strBuf = append(hw.strBuf, v.Str()...)
-		hw.h.Write(hw.strBuf)
+		hw.byteBuf = append(hw.byteBuf, valStrPrefix...)
+		hw.byteBuf = append(hw.byteBuf, v.Str()...)
 	case pcommon.ValueTypeBool:
 		if v.Bool() {
-			hw.h.Write(valBoolTrue)
+			hw.byteBuf = append(hw.byteBuf, valBoolTrue...)
 		} else {
-			hw.h.Write(valBoolFalse)
+			hw.byteBuf = append(hw.byteBuf, valBoolFalse...)
 		}
 	case pcommon.ValueTypeInt:
-		hw.h.Write(valIntPrefix)
-		binary.LittleEndian.PutUint64(hw.numBuf, uint64(v.Int()))
-		hw.h.Write(hw.numBuf)
+		hw.byteBuf = append(hw.byteBuf, valIntPrefix...)
+		hw.byteBuf = binary.LittleEndian.AppendUint64(hw.byteBuf, uint64(v.Int()))
 	case pcommon.ValueTypeDouble:
-		hw.h.Write(valDoublePrefix)
-		binary.LittleEndian.PutUint64(hw.numBuf, math.Float64bits(v.Double()))
-		hw.h.Write(hw.numBuf)
+		hw.byteBuf = append(hw.byteBuf, valDoublePrefix...)
+		hw.byteBuf = binary.LittleEndian.AppendUint64(hw.byteBuf, math.Float64bits(v.Double()))
 	case pcommon.ValueTypeMap:
-		hw.h.Write(valMapPrefix)
+		hw.byteBuf = append(hw.byteBuf, valMapPrefix...)
 		hw.writeMapHash(v.Map())
-		hw.h.Write(valMapSuffix)
+		hw.byteBuf = append(hw.byteBuf, valMapSuffix...)
 	case pcommon.ValueTypeSlice:
-		hw.h.Write(valSlicePrefix)
-		hw.writeSliceHash(v.Slice())
-		hw.h.Write(valSliceSuffix)
+		sl := v.Slice()
+		hw.byteBuf = append(hw.byteBuf, valSlicePrefix...)
+		for i := 0; i < sl.Len(); i++ {
+			hw.writeValueHash(sl.At(i))
+		}
+		hw.byteBuf = append(hw.byteBuf, valSliceSuffix...)
 	case pcommon.ValueTypeBytes:
-		hw.h.Write(valBytesPrefix)
-		hw.h.Write(v.Bytes().AsRaw())
+		hw.byteBuf = append(hw.byteBuf, valBytesPrefix...)
+		hw.byteBuf = append(hw.byteBuf, v.Bytes().AsRaw()...)
 	case pcommon.ValueTypeEmpty:
-		hw.h.Write(valEmpty)
+		hw.byteBuf = append(hw.byteBuf, valEmpty...)
 	}
 }
 
 // hashSum128 returns a [16]byte hash sum.
 func (hw *hashWriter) hashSum128() [16]byte {
-	b := hw.sumHash[:0]
-	b = hw.h.Sum(b)
+	r := [16]byte{}
+	res := r[:]
+
+	h := xxhash.Sum64(hw.byteBuf)
+	res = binary.LittleEndian.AppendUint64(res[:0], h)
 
 	// Append an extra byte to generate another part of the hash sum
-	_, _ = hw.h.Write(extraByte)
-	b = hw.h.Sum(b)
+	hw.byteBuf = append(hw.byteBuf, extraByte...)
+	h = xxhash.Sum64(hw.byteBuf)
+	_ = binary.LittleEndian.AppendUint64(res[8:], h)
 
-	res := [16]byte{}
-	copy(res[:], b)
-	return res
+	return r
 }

From 8ab993cb65bb21de3aea46ecd9dcbf096cd44723 Mon Sep 17 00:00:00 2001
From: bryan-aguilar <46550959+bryan-aguilar@users.noreply.github.com>
Date: Wed, 18 Oct 2023 17:54:23 -0700
Subject: [PATCH 05/11] [aws/cwlogs] Reduce noisy logger in CloudWatch logs
 pusher (#27774)

**Description:** Log at the debug level instead of info level. Existing
behavior would cause excessive log lines on each successful push.
---
 .chloggen/awscwl_noisypusher.yaml | 27 +++++++++++++++++++++++++++
 internal/aws/cwlogs/pusher.go     |  2 +-
 2 files changed, 28 insertions(+), 1 deletion(-)
 create mode 100755 .chloggen/awscwl_noisypusher.yaml

diff --git a/.chloggen/awscwl_noisypusher.yaml b/.chloggen/awscwl_noisypusher.yaml
new file mode 100755
index 000000000000..7d991bae8f63
--- /dev/null
+++ b/.chloggen/awscwl_noisypusher.yaml
@@ -0,0 +1,27 @@
+# Use this changelog template to create an entry for release notes.
+
+# One of 'breaking', 'deprecation', 'new_component', 'enhancement', 'bug_fix'
+change_type: enhancement
+
+# The name of the component, or a single word describing the area of concern, (e.g. filelogreceiver)
+component: awscloudwatchlogsexporter/awsemfexporter
+
+# A brief description of the change.  Surround your text with quotes ("") if it needs to start with a backtick (`).
+note: Reduce noisy logs emitted by CloudWatch Logs Pusher.
+
+# Mandatory: One or more tracking issues related to the change. You can use the PR number here if no issue exists.
+issues: [27774]
+
+# (Optional) One or more lines of additional information to render under the primary note.
+# These lines will be padded with 2 spaces and then inserted directly into the document.
+# Use pipe (|) for multiline entries.
+subtext: The Collector logger will now write successful CloudWatch API writes at the Debug level instead of Info level.
+
+# If your change doesn't affect end users or the exported elements of any package,
+# you should instead start your pull request title with [chore] or use the "Skip Changelog" label.
+# Optional: The change log or logs in which this entry should be included.
+# e.g. '[user]' or '[user, api]'
+# Include 'user' if the change is relevant to end users.
+# Include 'api' if there is a change to a library API.
+# Default: '[user]'
+change_logs: [user]
diff --git a/internal/aws/cwlogs/pusher.go b/internal/aws/cwlogs/pusher.go
index d0f940730278..08ff8f549de2 100644
--- a/internal/aws/cwlogs/pusher.go
+++ b/internal/aws/cwlogs/pusher.go
@@ -267,7 +267,7 @@ func (p *logPusher) pushEventBatch(req interface{}) error {
 		return err
 	}
 
-	p.logger.Info("logpusher: publish log events successfully.",
+	p.logger.Debug("logpusher: publish log events successfully.",
 		zap.Int("NumOfLogEvents", len(putLogEventsInput.LogEvents)),
 		zap.Float64("LogEventsSize", float64(logEventBatch.byteTotal)/float64(1024)),
 		zap.Int64("Time", time.Since(startTime).Nanoseconds()/int64(time.Millisecond)))

From 51b80812b9425bacba3d493a841e61ddee944cc5 Mon Sep 17 00:00:00 2001
From: sakulali <sakulali@126.com>
Date: Thu, 19 Oct 2023 08:54:58 +0800
Subject: [PATCH 06/11] [pkg/pdatatest] Ignore trace ID for ptracetest (#27829)

**Description:**
Support ignoring the trace ID in span comparisons for ptracetest.

**Link to tracking Issue:**

https://github.com/open-telemetry/opentelemetry-collector-contrib/issues/27687
---
 .chloggen/ptracetest-ignore-traceid.yaml      | 27 +++++++++++++++++++
 pkg/pdatatest/ptracetest/options.go           | 22 +++++++++++++++
 .../testdata/ignore-traceid/actual.yaml       | 21 +++++++++++++++
 .../testdata/ignore-traceid/expected.yaml     | 19 +++++++++++++
 pkg/pdatatest/ptracetest/traces_test.go       | 10 +++++++
 5 files changed, 99 insertions(+)
 create mode 100755 .chloggen/ptracetest-ignore-traceid.yaml
 create mode 100644 pkg/pdatatest/ptracetest/testdata/ignore-traceid/actual.yaml
 create mode 100644 pkg/pdatatest/ptracetest/testdata/ignore-traceid/expected.yaml

diff --git a/.chloggen/ptracetest-ignore-traceid.yaml b/.chloggen/ptracetest-ignore-traceid.yaml
new file mode 100755
index 000000000000..4e9b7449b45e
--- /dev/null
+++ b/.chloggen/ptracetest-ignore-traceid.yaml
@@ -0,0 +1,27 @@
+# Use this changelog template to create an entry for release notes.
+
+# One of 'breaking', 'deprecation', 'new_component', 'enhancement', 'bug_fix'
+change_type: enhancement
+
+# The name of the component, or a single word describing the area of concern, (e.g. filelogreceiver)
+component: pkg/pdatatest
+
+# A brief description of the change.  Surround your text with quotes ("") if it needs to start with a backtick (`).
+note: "support ignore trace ID in span comparisons for ptracetest"
+
+# Mandatory: One or more tracking issues related to the change. You can use the PR number here if no issue exists.
+issues: [27687]
+
+# (Optional) One or more lines of additional information to render under the primary note.
+# These lines will be padded with 2 spaces and then inserted directly into the document.
+# Use pipe (|) for multiline entries.
+subtext:
+
+# If your change doesn't affect end users or the exported elements of any package,
+# you should instead start your pull request title with [chore] or use the "Skip Changelog" label.
+# Optional: The change log or logs in which this entry should be included.
+# e.g. '[user]' or '[user, api]'
+# Include 'user' if the change is relevant to end users.
+# Include 'api' if there is a change to a library API.
+# Default: '[user]'
+change_logs: []
diff --git a/pkg/pdatatest/ptracetest/options.go b/pkg/pdatatest/ptracetest/options.go
index 57a278ec4dda..5a6c318dbcdb 100644
--- a/pkg/pdatatest/ptracetest/options.go
+++ b/pkg/pdatatest/ptracetest/options.go
@@ -172,3 +172,25 @@ func maskEndTimestamp(traces ptrace.Traces, ts pcommon.Timestamp) {
 		}
 	}
 }
+
+// IgnoreTraceID is a CompareTracesOption that clears TraceID fields on all spans.
+func IgnoreTraceID() CompareTracesOption {
+	return compareTracesOptionFunc(func(expected, actual ptrace.Traces) {
+		traceID := pcommon.NewTraceIDEmpty()
+		maskTraceID(expected, traceID)
+		maskTraceID(actual, traceID)
+	})
+}
+
+func maskTraceID(traces ptrace.Traces, traceID pcommon.TraceID) {
+	for i := 0; i < traces.ResourceSpans().Len(); i++ {
+		rs := traces.ResourceSpans().At(i)
+		for j := 0; j < rs.ScopeSpans().Len(); j++ {
+			ss := rs.ScopeSpans().At(j)
+			for k := 0; k < ss.Spans().Len(); k++ {
+				span := ss.Spans().At(k)
+				span.SetTraceID(traceID)
+			}
+		}
+	}
+}
diff --git a/pkg/pdatatest/ptracetest/testdata/ignore-traceid/actual.yaml b/pkg/pdatatest/ptracetest/testdata/ignore-traceid/actual.yaml
new file mode 100644
index 000000000000..817c4fc938d1
--- /dev/null
+++ b/pkg/pdatatest/ptracetest/testdata/ignore-traceid/actual.yaml
@@ -0,0 +1,21 @@
+resourceSpans:
+  - resource:
+      attributes:
+        - key: host.name
+          value:
+            stringValue: node1
+    scopeSpans:
+      - scope:
+          name: collector
+          version: v0.1.0
+        spans:
+          - attributes:
+              - key: key1
+                value:
+                  stringValue: value1
+            name: span1
+            parentSpanId: ""
+            spanId: fd0da883bb27cd6b
+            status: {}
+            traceId: 8c8b1765a7b0acf0b66aa4623fcb7bd5
+
diff --git a/pkg/pdatatest/ptracetest/testdata/ignore-traceid/expected.yaml b/pkg/pdatatest/ptracetest/testdata/ignore-traceid/expected.yaml
new file mode 100644
index 000000000000..f01f0307bac4
--- /dev/null
+++ b/pkg/pdatatest/ptracetest/testdata/ignore-traceid/expected.yaml
@@ -0,0 +1,19 @@
+resourceSpans:
+  - resource:
+      attributes:
+        - key: host.name
+          value:
+            stringValue: node1
+    scopeSpans:
+      - scope:
+          name: collector
+          version: v0.1.0
+        spans:
+          - attributes:
+              - key: key1
+                value:
+                  stringValue: value1
+            name: span1
+            parentSpanId: ""
+            spanId: fd0da883bb27cd6b
+            status: {}
diff --git a/pkg/pdatatest/ptracetest/traces_test.go b/pkg/pdatatest/ptracetest/traces_test.go
index f088d8889bbe..ca8b8d128a3b 100644
--- a/pkg/pdatatest/ptracetest/traces_test.go
+++ b/pkg/pdatatest/ptracetest/traces_test.go
@@ -68,6 +68,16 @@ func TestCompareTraces(t *testing.T) {
 			),
 			withOptions: nil,
 		},
+		{
+			name: "ignore-traceid",
+			compareOptions: []CompareTracesOption{
+				IgnoreTraceID(),
+			},
+			withoutOptions: multierr.Combine(
+				errors.New("resource \"map[host.name:node1]\": scope \"collector\": span \"span1\": trace ID doesn't match expected: 8c8b1765a7b0acf0b66aa4623fcb7bd5, actual: "),
+			),
+			withOptions: nil,
+		},
 		{
 			name: "resourcespans-amount-unequal",
 			withoutOptions: multierr.Combine(

From 4b41ec63d7b331a5dda306c7c4397493ecfe1418 Mon Sep 17 00:00:00 2001
From: sakulali <sakulali@126.com>
Date: Thu, 19 Oct 2023 08:55:52 +0800
Subject: [PATCH 07/11] [pkg/pdatatest] Ignore span ID for ptracetest (#27833)

**Description:**
Support ignoring the span ID in span comparisons for ptracetest.

**Link to tracking Issue:**

https://github.com/open-telemetry/opentelemetry-collector-contrib/issues/27685

**Testing:**
make chlog-validate
go test for pdatatest

**Documentation:**
---
 .chloggen/ptracetest-ignore-spanid.yaml       | 27 +++++++++++++++++++
 pkg/pdatatest/ptracetest/options.go           | 22 +++++++++++++++
 .../testdata/ignore-spanid/actual.yaml        | 21 +++++++++++++++
 .../testdata/ignore-spanid/expected.yaml      | 19 +++++++++++++
 pkg/pdatatest/ptracetest/traces_test.go       | 10 +++++++
 5 files changed, 99 insertions(+)
 create mode 100755 .chloggen/ptracetest-ignore-spanid.yaml
 create mode 100644 pkg/pdatatest/ptracetest/testdata/ignore-spanid/actual.yaml
 create mode 100644 pkg/pdatatest/ptracetest/testdata/ignore-spanid/expected.yaml

diff --git a/.chloggen/ptracetest-ignore-spanid.yaml b/.chloggen/ptracetest-ignore-spanid.yaml
new file mode 100755
index 000000000000..72f99b9c9322
--- /dev/null
+++ b/.chloggen/ptracetest-ignore-spanid.yaml
@@ -0,0 +1,27 @@
+# Use this changelog template to create an entry for release notes.
+
+# One of 'breaking', 'deprecation', 'new_component', 'enhancement', 'bug_fix'
+change_type: enhancement
+
+# The name of the component, or a single word describing the area of concern, (e.g. filelogreceiver)
+component: pkg/pdatatest
+
+# A brief description of the change.  Surround your text with quotes ("") if it needs to start with a backtick (`).
+note: "support ignore span ID in span comparisons for ptracetest"
+
+# Mandatory: One or more tracking issues related to the change. You can use the PR number here if no issue exists.
+issues: [27685]
+
+# (Optional) One or more lines of additional information to render under the primary note.
+# These lines will be padded with 2 spaces and then inserted directly into the document.
+# Use pipe (|) for multiline entries.
+subtext:
+
+# If your change doesn't affect end users or the exported elements of any package,
+# you should instead start your pull request title with [chore] or use the "Skip Changelog" label.
+# Optional: The change log or logs in which this entry should be included.
+# e.g. '[user]' or '[user, api]'
+# Include 'user' if the change is relevant to end users.
+# Include 'api' if there is a change to a library API.
+# Default: '[user]'
+change_logs: []
diff --git a/pkg/pdatatest/ptracetest/options.go b/pkg/pdatatest/ptracetest/options.go
index 5a6c318dbcdb..3a6886eb0019 100644
--- a/pkg/pdatatest/ptracetest/options.go
+++ b/pkg/pdatatest/ptracetest/options.go
@@ -129,6 +129,28 @@ func sortSpanSlices(ts ptrace.Traces) {
 	}
 }
 
+// IgnoreSpanID is a CompareTracesOption that clears SpanID fields on all spans.
+func IgnoreSpanID() CompareTracesOption {
+	return compareTracesOptionFunc(func(expected, actual ptrace.Traces) {
+		spanID := pcommon.NewSpanIDEmpty()
+		maskSpanID(expected, spanID)
+		maskSpanID(actual, spanID)
+	})
+}
+
+func maskSpanID(traces ptrace.Traces, spanID pcommon.SpanID) {
+	for i := 0; i < traces.ResourceSpans().Len(); i++ {
+		rs := traces.ResourceSpans().At(i)
+		for j := 0; j < rs.ScopeSpans().Len(); j++ {
+			ss := rs.ScopeSpans().At(j)
+			for k := 0; k < ss.Spans().Len(); k++ {
+				span := ss.Spans().At(k)
+				span.SetSpanID(spanID)
+			}
+		}
+	}
+}
+
 // IgnoreStartTimestamp is a CompareTracesOption that clears StartTimestamp fields on all spans.
 func IgnoreStartTimestamp() CompareTracesOption {
 	return compareTracesOptionFunc(func(expected, actual ptrace.Traces) {
diff --git a/pkg/pdatatest/ptracetest/testdata/ignore-spanid/actual.yaml b/pkg/pdatatest/ptracetest/testdata/ignore-spanid/actual.yaml
new file mode 100644
index 000000000000..817c4fc938d1
--- /dev/null
+++ b/pkg/pdatatest/ptracetest/testdata/ignore-spanid/actual.yaml
@@ -0,0 +1,21 @@
+resourceSpans:
+  - resource:
+      attributes:
+        - key: host.name
+          value:
+            stringValue: node1
+    scopeSpans:
+      - scope:
+          name: collector
+          version: v0.1.0
+        spans:
+          - attributes:
+              - key: key1
+                value:
+                  stringValue: value1
+            name: span1
+            parentSpanId: ""
+            spanId: fd0da883bb27cd6b
+            status: {}
+            traceId: 8c8b1765a7b0acf0b66aa4623fcb7bd5
+
diff --git a/pkg/pdatatest/ptracetest/testdata/ignore-spanid/expected.yaml b/pkg/pdatatest/ptracetest/testdata/ignore-spanid/expected.yaml
new file mode 100644
index 000000000000..3b3954599639
--- /dev/null
+++ b/pkg/pdatatest/ptracetest/testdata/ignore-spanid/expected.yaml
@@ -0,0 +1,19 @@
+resourceSpans:
+  - resource:
+      attributes:
+        - key: host.name
+          value:
+            stringValue: node1
+    scopeSpans:
+      - scope:
+          name: collector
+          version: v0.1.0
+        spans:
+          - attributes:
+              - key: key1
+                value:
+                  stringValue: value1
+            name: span1
+            parentSpanId: ""
+            status: {}
+            traceId: 8c8b1765a7b0acf0b66aa4623fcb7bd5
diff --git a/pkg/pdatatest/ptracetest/traces_test.go b/pkg/pdatatest/ptracetest/traces_test.go
index ca8b8d128a3b..ef07930a7311 100644
--- a/pkg/pdatatest/ptracetest/traces_test.go
+++ b/pkg/pdatatest/ptracetest/traces_test.go
@@ -48,6 +48,16 @@ func TestCompareTraces(t *testing.T) {
 			),
 			withOptions: nil,
 		},
+		{
+			name: "ignore-spanid",
+			compareOptions: []CompareTracesOption{
+				IgnoreSpanID(),
+			},
+			withoutOptions: multierr.Combine(
+				errors.New("resource \"map[host.name:node1]\": scope \"collector\": span \"span1\": span ID doesn't match expected: fd0da883bb27cd6b, actual: "),
+			),
+			withOptions: nil,
+		},
 		{
 			name: "ignore-start-timestamp",
 			compareOptions: []CompareTracesOption{

From b0f0dda517e88ccd44ffe7962e68dd15de34a8df Mon Sep 17 00:00:00 2001
From: Christian Kruse <ctkruse99@gmail.com>
Date: Wed, 18 Oct 2023 21:24:24 -0700
Subject: [PATCH 08/11] [processor/k8sattributes] Handle all resource deletion
 event types (#27847)

**Description:**

The k8s go client's cache expects OnDelete handlers to handle objects of
type DeletedFinalStateUnknown when the cache's watch mechanism misses a
delete and notices later. This changes the processor to handle such
deletes as if they were normal, rather than logging an error and
dropping the change.

**Link to tracking Issue:**
https://github.com/open-telemetry/opentelemetry-collector-contrib/issues/27632

**Testing:**

Only what you see in the unit tests. I am open to suggestions, but I
don't see this being a code path we can reasonably cover in the e2e test
suite.

Verified manually locally on a kind cluster.
* Stood up two deployments loosely based off e2e testing resources, one
w/ a collector built from this branch and the other
docker.io/otel/opentelemetry-collector-contrib:latest.
* Both included an additional container in the collector pod I used to
fiddle with iptables rules.
* Added rules to reject traffic to/from the kube api server
* Deleted some namespaces containing deployments generating telemetry.
* Restored connectivity by removing the iptables rules.
* Observed the collector built from this branch was silent (aside from
the junk the k8s client logs due to the broken connection)
* Observed the latest
([0.87.0](https://hub.docker.com/layers/otel/opentelemetry-collector-contrib/0.87.0/images/sha256-77cdd395b828b09cb920c671966f09a87a40611aa6107443146086f2046f4a9a?context=explore))
collector logged a handful of errors for the deleted resources
(api_v1.Pod, and apps_v1.ReplicaSet. I probably just didn't wait long
enough for Namespace.)

```
2023-10-19T02:18:37.781Z        error   kube/client.go:236      object received was not of type api_v1.Pod      {"kind": "processor", "name": "k8sattributes", "pipeline": "metrics", "received": {"Key":"src1/telemetrygen-patched-766d55cbcb-8zktr","Obj":{"metadata":{"name":"telemetrygen-patched-766d55cbcb-8zktr","namespace":"src1","uid":"be5d2268-c8b0-434d-b3b8-8b18083c7a8b","creat
ionTimestamp":"2023-10-19T02:01:08Z","labels":{"app":"telemetrygen-patched","pod-template-hash":"766d55cbcb"},"ownerReferences":[{"apiVersion":"apps/v1","kind":"ReplicaSet","name":"telemetrygen-patched-766d55cbcb","uid":"a887d67a-d5d6-4269-b520-45dbb4f1cd82","controller":true,"blockOwnerDeletion":true}]},"spec":{"containers":[{"name":"telemetrygen","image":"localhost/telemetrygen
:latest","resources":{}}],"nodeName":"manual-e2e-testing-control-plane"},"status":{"podIP":"10.244.0.56","startTime":"2023-10-19T02:01:08Z","containerStatuses":[{"name":"telemetrygen","state":{},"lastState":{},"ready":false,"restartCount":0,"image":"","imageID":"","containerID":"containerd://2821ef32cd8bf93a13414504c0f8f0c016c84be49d6ffdbd475d7e4681e90c51"}]}}}}
github.com/open-telemetry/opentelemetry-collector-contrib/processor/k8sattributesprocessor/internal/kube.(*WatchClient).handlePodDelete
        github.com/open-telemetry/opentelemetry-collector-contrib/processor/k8sattributesprocessor@v0.87.0/internal/kube/client.go:236
k8s.io/client-go/tools/cache.ResourceEventHandlerFuncs.OnDelete
        k8s.io/client-go@v0.28.2/tools/cache/controller.go:253
...

2023-10-19T02:19:03.970Z        error   kube/client.go:868      object received was not of type apps_v1.ReplicaSet      {"kind": "processor", "name": "k8sattributes", "pipeline": "metrics", "received": {"Key":"src1/telemetrygen-stable-5c444bb8b8","Obj":{"metadata":{"name":"telemetrygen-stable-5c444bb8b8","namespace":"src1","uid":"d37707ff-b308-4339-8543-a1caf5705ea8","creationTimestamp":null,"ownerReferences":[{"apiVersion":"apps/v1","kind":"Deployment","name":"telemetrygen-stable","uid":"c421276e-e1bf-40c5-85e1-e92e30363da5","controller":true,"blockOwnerDeletion":true}]},"spec":{"selector":null,"template":{"metadata":{"creationTimestamp":null},"spec":{"containers":null}}},"status":{"replicas":0}}}}
github.com/open-telemetry/opentelemetry-collector-contrib/processor/k8sattributesprocessor/internal/kube.(*WatchClient).handleReplicaSetDelete
        github.com/open-telemetry/opentelemetry-collector-contrib/processor/k8sattributesprocessor@v0.87.0/internal/kube/client.go:868
k8s.io/client-go/tools/cache.ResourceEventHandlerFuncs.OnDelete
        k8s.io/client-go@v0.28.2/tools/cache/controller.go:253
k8s.io/client-go/tools/cache.(*processorListener).run.func1
        k8s.io/client-go@v0.28.2/tools/cache/shared_informer.go:979
k8s.io/apimachinery/pkg/util/wait.BackoffUntil.func1
...
```
**Documentation:** N/A - it is not clear to me whether or not this
should land on the changelog. Its impact on users is marginal.

Signed-off-by: Christian Kruse <ctkruse99@gmail.com>
---
 .../internal/kube/client.go                   | 16 ++++++++--
 .../internal/kube/client_test.go              | 29 ++++++++++++++++++-
 2 files changed, 41 insertions(+), 4 deletions(-)

diff --git a/processor/k8sattributesprocessor/internal/kube/client.go b/processor/k8sattributesprocessor/internal/kube/client.go
index 019105eb2a0e..47ab6255848e 100644
--- a/processor/k8sattributesprocessor/internal/kube/client.go
+++ b/processor/k8sattributesprocessor/internal/kube/client.go
@@ -230,7 +230,7 @@ func (c *WatchClient) handlePodUpdate(_, newPod interface{}) {
 
 func (c *WatchClient) handlePodDelete(obj interface{}) {
 	observability.RecordPodDeleted()
-	if pod, ok := obj.(*api_v1.Pod); ok {
+	if pod, ok := ignoreDeletedFinalStateUnknown(obj).(*api_v1.Pod); ok {
 		c.forgetPod(pod)
 	} else {
 		c.logger.Error("object received was not of type api_v1.Pod", zap.Any("received", obj))
@@ -259,7 +259,7 @@ func (c *WatchClient) handleNamespaceUpdate(_, newNamespace interface{}) {
 
 func (c *WatchClient) handleNamespaceDelete(obj interface{}) {
 	observability.RecordNamespaceDeleted()
-	if namespace, ok := obj.(*api_v1.Namespace); ok {
+	if namespace, ok := ignoreDeletedFinalStateUnknown(obj).(*api_v1.Namespace); ok {
 		c.m.Lock()
 		if ns, ok := c.Namespaces[namespace.Name]; ok {
 			// When a namespace is deleted all the pods(and other k8s objects in that namespace) in that namespace are deleted before it.
@@ -859,7 +859,7 @@ func (c *WatchClient) handleReplicaSetUpdate(_, newRS interface{}) {
 
 func (c *WatchClient) handleReplicaSetDelete(obj interface{}) {
 	observability.RecordReplicaSetDeleted()
-	if replicaset, ok := obj.(*apps_v1.ReplicaSet); ok {
+	if replicaset, ok := ignoreDeletedFinalStateUnknown(obj).(*apps_v1.ReplicaSet); ok {
 		c.m.Lock()
 		key := string(replicaset.UID)
 		delete(c.ReplicaSets, key)
@@ -915,3 +915,13 @@ func (c *WatchClient) getReplicaSet(uid string) (*ReplicaSet, bool) {
 	}
 	return nil, false
 }
+
+// ignoreDeletedFinalStateUnknown unwraps a cache.DeletedFinalStateUnknown and
+// returns its Obj; any other value is returned unchanged. Useful in OnDelete
+// resource event handlers that do not need the additional context.
+func ignoreDeletedFinalStateUnknown(obj interface{}) interface{} {
+	if obj, ok := obj.(cache.DeletedFinalStateUnknown); ok {
+		return obj.Obj
+	}
+	return obj
+}
diff --git a/processor/k8sattributesprocessor/internal/kube/client_test.go b/processor/k8sattributesprocessor/internal/kube/client_test.go
index fdaf1d5e5c3f..aa31c9f31423 100644
--- a/processor/k8sattributesprocessor/internal/kube/client_test.go
+++ b/processor/k8sattributesprocessor/internal/kube/client_test.go
@@ -21,6 +21,7 @@ import (
 	"k8s.io/apimachinery/pkg/selection"
 	"k8s.io/client-go/kubernetes"
 	"k8s.io/client-go/kubernetes/fake"
+	"k8s.io/client-go/tools/cache"
 
 	"github.com/open-telemetry/opentelemetry-collector-contrib/internal/k8sconfig"
 )
@@ -250,6 +251,14 @@ func TestReplicaSetHandler(t *testing.T) {
 	// test delete replicaset
 	c.handleReplicaSetDelete(updatedReplicaset)
 	assert.Equal(t, len(c.ReplicaSets), 0)
+	// test delete replicaset when DeletedFinalStateUnknown
+	c.handleReplicaSetAdd(replicaset)
+	require.Equal(t, len(c.ReplicaSets), 1)
+	c.handleReplicaSetDelete(cache.DeletedFinalStateUnknown{
+		Obj: replicaset,
+	})
+	assert.Equal(t, len(c.ReplicaSets), 0)
+
 }
 
 func TestPodHostNetwork(t *testing.T) {
@@ -427,13 +436,14 @@ func TestPodDelete(t *testing.T) {
 	assert.False(t, deleteRequest.ts.Before(tsBeforeDelete))
 	assert.False(t, deleteRequest.ts.After(time.Now()))
 
+	// delete when DeletedFinalStateUnknown
 	c.deleteQueue = c.deleteQueue[:0]
 	pod = &api_v1.Pod{}
 	pod.Name = "podC"
 	pod.Status.PodIP = "2.2.2.2"
 	pod.UID = "aaaaaaaa-bbbb-cccc-dddd-eeeeeeeeeeee"
 	tsBeforeDelete = time.Now()
-	c.handlePodDelete(pod)
+	c.handlePodDelete(cache.DeletedFinalStateUnknown{Obj: pod})
 	assert.Equal(t, 5, len(c.Pods))
 	assert.Equal(t, 5, len(c.deleteQueue))
 	deleteRequest = c.deleteQueue[0]
@@ -464,6 +474,23 @@ func TestNamespaceDelete(t *testing.T) {
 	assert.Equal(t, 2, len(c.Namespaces))
 	got := c.Namespaces["namespaceA"]
 	assert.Equal(t, "namespaceA", got.Name)
+	// delete non-existent namespace when DeletedFinalStateUnknown
+	c.handleNamespaceDelete(cache.DeletedFinalStateUnknown{Obj: namespace})
+	assert.Equal(t, 2, len(c.Namespaces))
+	got = c.Namespaces["namespaceA"]
+	assert.Equal(t, "namespaceA", got.Name)
+
+	// delete namespace A
+	namespace.Name = "namespaceA"
+	c.handleNamespaceDelete(namespace)
+	assert.Equal(t, 1, len(c.Namespaces))
+	got = c.Namespaces["namespaceB"]
+	assert.Equal(t, "namespaceB", got.Name)
+
+	// delete namespace B when DeletedFinalStateUnknown
+	namespace.Name = "namespaceB"
+	c.handleNamespaceDelete(cache.DeletedFinalStateUnknown{Obj: namespace})
+	assert.Equal(t, 0, len(c.Namespaces))
 }
 
 func TestDeleteQueue(t *testing.T) {

From c482aa70237ad873e85f093ea443014f2a3401da Mon Sep 17 00:00:00 2001
From: gord02 <53834349+gord02@users.noreply.github.com>
Date: Thu, 19 Oct 2023 00:29:09 -0400
Subject: [PATCH 09/11] [pkg/ottl] Add Double converter (#27457)

**Description:** Adding a Double converter to pkg/ottl

**Link to tracking Issue:** closes #22056
---
 .chloggen/double-converter.yaml        | 27 ++++++++
 pkg/ottl/ottlfuncs/README.md           | 24 +++++++
 pkg/ottl/ottlfuncs/func_double.go      | 42 ++++++++++++
 pkg/ottl/ottlfuncs/func_double_test.go | 93 ++++++++++++++++++++++++++
 pkg/ottl/ottlfuncs/functions.go        |  1 +
 5 files changed, 187 insertions(+)
 create mode 100755 .chloggen/double-converter.yaml
 create mode 100644 pkg/ottl/ottlfuncs/func_double.go
 create mode 100644 pkg/ottl/ottlfuncs/func_double_test.go

diff --git a/.chloggen/double-converter.yaml b/.chloggen/double-converter.yaml
new file mode 100755
index 000000000000..bec559474677
--- /dev/null
+++ b/.chloggen/double-converter.yaml
@@ -0,0 +1,27 @@
+# Use this changelog template to create an entry for release notes.
+
+# One of 'breaking', 'deprecation', 'new_component', 'enhancement', 'bug_fix'
+change_type: 'enhancement'
+
+# The name of the component, or a single word describing the area of concern, (e.g. filelogreceiver)
+component: doubleconverter
+
+# A brief description of the change.  Surround your text with quotes ("") if it needs to start with a backtick (`).
+note: "Adding a double converter into pkg/ottl"
+
+# Mandatory: One or more tracking issues related to the change. You can use the PR number here if no issue exists.
+issues: [22056]
+
+# (Optional) One or more lines of additional information to render under the primary note.
+# These lines will be padded with 2 spaces and then inserted directly into the document.
+# Use pipe (|) for multiline entries.
+subtext:
+
+# If your change doesn't affect end users or the exported elements of any package,
+# you should instead start your pull request title with [chore] or use the "Skip Changelog" label.
+# Optional: The change log or logs in which this entry should be included.
+# e.g. '[user]' or '[user, api]'
+# Include 'user' if the change is relevant to end users.
+# Include 'api' if there is a change to a library API.
+# Default: '[user]'
+change_logs: [user]
diff --git a/pkg/ottl/ottlfuncs/README.md b/pkg/ottl/ottlfuncs/README.md
index 47c7fc7460de..ac5d7dff851f 100644
--- a/pkg/ottl/ottlfuncs/README.md
+++ b/pkg/ottl/ottlfuncs/README.md
@@ -294,6 +294,7 @@ Available Converters:
 - [ExtractPatterns](#extractpatterns)
 - [FNV](#fnv)
 - [Hours](#hours)
+- [Double](#double)
 - [Duration](#duration)
 - [Int](#int)
 - [IsMap](#ismap)
@@ -365,6 +366,29 @@ Examples:
 
 - `ConvertCase(metric.name, "snake")`
 
+### Double
+
+The `Double` Converter converts an inputted `value` into a double.
+
+The returned type is float64.
+
+The input `value` types:
+* float64. Returns the `value` without changes.
+* string. Tries to parse a double from the string. If parsing fails, an error is returned.
+* bool. If `value` is true, the function returns 1; otherwise it returns 0.
+* int64. The function converts the integer to a double.
+
+If `value` is nil, nil is returned. If `value` is any other type, an error is returned.
+
+The `value` is either a path expression to a telemetry field to retrieve or a literal.
+
+Examples:
+
+- `Double(attributes["http.status_code"])`
+
+
+- `Double("2.0")`
+
 ### Duration
 
 `Duration(duration)`
diff --git a/pkg/ottl/ottlfuncs/func_double.go b/pkg/ottl/ottlfuncs/func_double.go
new file mode 100644
index 000000000000..c454a6363e5d
--- /dev/null
+++ b/pkg/ottl/ottlfuncs/func_double.go
@@ -0,0 +1,42 @@
+// Copyright The OpenTelemetry Authors
+// SPDX-License-Identifier: Apache-2.0
+
+package ottlfuncs // import "github.com/open-telemetry/opentelemetry-collector-contrib/pkg/ottl/ottlfuncs"
+
+import (
+	"context"
+	"fmt"
+
+	"github.com/open-telemetry/opentelemetry-collector-contrib/pkg/ottl"
+)
+
+type DoubleArguments[K any] struct {
+	Target ottl.FloatLikeGetter[K]
+}
+
+func NewDoubleFactory[K any]() ottl.Factory[K] {
+	return ottl.NewFactory("Double", &DoubleArguments[K]{}, createDoubleFunction[K])
+}
+
+func createDoubleFunction[K any](_ ottl.FunctionContext, oArgs ottl.Arguments) (ottl.ExprFunc[K], error) {
+	args, ok := oArgs.(*DoubleArguments[K])
+
+	if !ok {
+		return nil, fmt.Errorf("DoubleFactory args must be of type *DoubleArguments[K]")
+	}
+
+	return doubleFunc(args.Target), nil
+}
+
+func doubleFunc[K any](target ottl.FloatLikeGetter[K]) ottl.ExprFunc[K] {
+	return func(ctx context.Context, tCtx K) (interface{}, error) {
+		value, err := target.Get(ctx, tCtx)
+		if err != nil {
+			return nil, err
+		}
+		if value == nil {
+			return nil, nil
+		}
+		return *value, nil
+	}
+}
diff --git a/pkg/ottl/ottlfuncs/func_double_test.go b/pkg/ottl/ottlfuncs/func_double_test.go
new file mode 100644
index 000000000000..0e81df0e6681
--- /dev/null
+++ b/pkg/ottl/ottlfuncs/func_double_test.go
@@ -0,0 +1,93 @@
+// Copyright The OpenTelemetry Authors
+// SPDX-License-Identifier: Apache-2.0
+
+package ottlfuncs
+
+import (
+	"context"
+	"testing"
+
+	"github.com/stretchr/testify/assert"
+
+	"github.com/open-telemetry/opentelemetry-collector-contrib/pkg/ottl"
+)
+
+func Test_Double(t *testing.T) {
+	tests := []struct {
+		name     string
+		value    interface{}
+		expected interface{}
+		err      bool
+	}{
+		{
+			name:     "string",
+			value:    "50",
+			expected: float64(50),
+		},
+		{
+			name:     "empty string",
+			value:    "",
+			expected: nil,
+			err:      true,
+		},
+		{
+			name:     "not a number string",
+			value:    "test",
+			expected: nil,
+			err:      true,
+		},
+		{
+			name:     "int64",
+			value:    int64(333),
+			expected: float64(333),
+		},
+		{
+			name:     "float64",
+			value:    float64(2.7),
+			expected: float64(2.7),
+		},
+		{
+			name:     "float64 without decimal",
+			value:    float64(55),
+			expected: float64(55),
+		},
+		{
+			name:     "true",
+			value:    true,
+			expected: float64(1),
+		},
+		{
+			name:     "false",
+			value:    false,
+			expected: float64(0),
+		},
+		{
+			name:     "nil",
+			value:    nil,
+			expected: nil,
+		},
+		{
+			name:     "some struct",
+			value:    struct{}{},
+			expected: nil,
+			err:      true,
+		},
+	}
+	for _, test := range tests {
+		t.Run(test.name, func(t *testing.T) {
+			exprFunc := doubleFunc[interface{}](&ottl.StandardFloatLikeGetter[interface{}]{
+
+				Getter: func(context.Context, interface{}) (interface{}, error) {
+					return test.value, nil
+				},
+			})
+			result, err := exprFunc(context.Background(), nil) // never pass a nil Context
+			if test.err {
+				assert.Error(t, err)
+			} else {
+				assert.NoError(t, err)
+			}
+			assert.Equal(t, test.expected, result)
+		})
+	}
+}
diff --git a/pkg/ottl/ottlfuncs/functions.go b/pkg/ottl/ottlfuncs/functions.go
index 736a49313605..e43507192392 100644
--- a/pkg/ottl/ottlfuncs/functions.go
+++ b/pkg/ottl/ottlfuncs/functions.go
@@ -36,6 +36,7 @@ func converters[K any]() []ottl.Factory[K] {
 		// Converters
 		NewConcatFactory[K](),
 		NewConvertCaseFactory[K](),
+		NewDoubleFactory[K](),
 		NewDurationFactory[K](),
 		NewExtractPatternsFactory[K](),
 		NewFnvFactory[K](),

From be81ae7675a3d7fb92ed16ff1574a46ceb233db2 Mon Sep 17 00:00:00 2001
From: bagmeg <joonsoo181005@gmail.com>
Date: Thu, 19 Oct 2023 14:56:22 +0900
Subject: [PATCH 10/11] [chore][exporter/fileexporter] use errors.Join instead
 of go.uber.org/multierr (#27835)

**Description:** fileexporter: use errors.Join instead of go.uber.org/multierr

**Link to tracking Issue:** #25121
---
 exporter/fileexporter/buffered_writer.go      | 5 ++---
 exporter/fileexporter/buffered_writer_test.go | 4 ++--
 exporter/fileexporter/go.mod                  | 2 +-
 3 files changed, 5 insertions(+), 6 deletions(-)

diff --git a/exporter/fileexporter/buffered_writer.go b/exporter/fileexporter/buffered_writer.go
index 64ee151fa217..6e50b6519296 100644
--- a/exporter/fileexporter/buffered_writer.go
+++ b/exporter/fileexporter/buffered_writer.go
@@ -5,9 +5,8 @@ package fileexporter // import "github.com/open-telemetry/opentelemetry-collecto
 
 import (
 	"bufio"
+	"errors"
 	"io"
-
-	"go.uber.org/multierr"
 )
 
 // bufferedWriteCloser is intended to use more memory
@@ -33,7 +32,7 @@ func (bwc *bufferedWriteCloser) Write(p []byte) (n int, err error) {
 }
 
 func (bwc *bufferedWriteCloser) Close() error {
-	return multierr.Combine(
+	return errors.Join(
 		bwc.buffered.Flush(),
 		bwc.wrapped.Close(),
 	)
diff --git a/exporter/fileexporter/buffered_writer_test.go b/exporter/fileexporter/buffered_writer_test.go
index a6512258d2fa..60f79a08a76b 100644
--- a/exporter/fileexporter/buffered_writer_test.go
+++ b/exporter/fileexporter/buffered_writer_test.go
@@ -5,6 +5,7 @@ package fileexporter
 
 import (
 	"bytes"
+	"errors"
 	"fmt"
 	"io"
 	"os"
@@ -13,7 +14,6 @@ import (
 
 	"github.com/stretchr/testify/assert"
 	"github.com/stretchr/testify/require"
-	"go.uber.org/multierr"
 )
 
 const (
@@ -83,7 +83,7 @@ func BenchmarkWriter(b *testing.B) {
 				for i := 0; i < b.N; i++ {
 					_, err = w.Write(payload)
 				}
-				errBenchmark = multierr.Combine(err, w.Close())
+				errBenchmark = errors.Join(err, w.Close())
 			})
 		}
 	}
diff --git a/exporter/fileexporter/go.mod b/exporter/fileexporter/go.mod
index 11be5ffcb8db..6eba04c79ac8 100644
--- a/exporter/fileexporter/go.mod
+++ b/exporter/fileexporter/go.mod
@@ -12,7 +12,6 @@ require (
 	go.opentelemetry.io/collector/consumer v0.87.1-0.20231017160804-ec0725874313
 	go.opentelemetry.io/collector/exporter v0.87.1-0.20231017160804-ec0725874313
 	go.opentelemetry.io/collector/pdata v1.0.0-rcv0016.0.20231017160804-ec0725874313
-	go.uber.org/multierr v1.11.0
 	gopkg.in/natefinch/lumberjack.v2 v2.2.1
 )
 
@@ -39,6 +38,7 @@ require (
 	go.opentelemetry.io/otel v1.19.0 // indirect
 	go.opentelemetry.io/otel/metric v1.19.0 // indirect
 	go.opentelemetry.io/otel/trace v1.19.0 // indirect
+	go.uber.org/multierr v1.11.0 // indirect
 	go.uber.org/zap v1.26.0 // indirect
 	golang.org/x/net v0.17.0 // indirect
 	golang.org/x/sys v0.13.0 // indirect

From 1842e1356889d1d35d007838f4f74edb2315d974 Mon Sep 17 00:00:00 2001
From: Yang Song <songy23@users.noreply.github.com>
Date: Thu, 19 Oct 2023 09:38:55 -0400
Subject: [PATCH 11/11] [connector/datadog] Allow export to traces pipelines
 (#27846)

**Description:** <Describe what has changed.>
Allow datadogconnector to export to traces pipelines

**Link to tracking Issue:** <Issue number if applicable>

**Testing:** <Describe what testing was performed and which tests were
added.>

**Documentation:** <Describe the documentation added.>

---------

Co-authored-by: Pablo Baeyens <pbaeyens31+github@gmail.com>
---
 .chloggen/datadog-connector-traces.yaml       | 27 +++++++++++++++++++
 connector/datadogconnector/README.md          |  3 ++-
 connector/datadogconnector/connector.go       | 15 ++++++++---
 connector/datadogconnector/connector_test.go  | 10 +++++--
 connector/datadogconnector/factory.go         | 13 +++++++--
 .../internal/metadata/generated_status.go     |  1 +
 connector/datadogconnector/metadata.yaml      |  2 +-
 7 files changed, 61 insertions(+), 10 deletions(-)
 create mode 100644 .chloggen/datadog-connector-traces.yaml

diff --git a/.chloggen/datadog-connector-traces.yaml b/.chloggen/datadog-connector-traces.yaml
new file mode 100644
index 000000000000..808b388eb57a
--- /dev/null
+++ b/.chloggen/datadog-connector-traces.yaml
@@ -0,0 +1,27 @@
+# Use this changelog template to create an entry for release notes.
+
+# One of 'breaking', 'deprecation', 'new_component', 'enhancement', 'bug_fix'
+change_type: enhancement
+
+# The name of the component, or a single word describing the area of concern, (e.g. filelogreceiver)
+component: datadogconnector
+
+# A brief description of the change.  Surround your text with quotes ("") if it needs to start with a backtick (`).
+note: Allow datadogconnector to be used as a traces-to-traces connector
+
+# Mandatory: One or more tracking issues related to the change. You can use the PR number here if no issue exists.
+issues: [27846]
+
+# (Optional) One or more lines of additional information to render under the primary note.
+# These lines will be padded with 2 spaces and then inserted directly into the document.
+# Use pipe (|) for multiline entries.
+subtext:
+
+# If your change doesn't affect end users or the exported elements of any package,
+# you should instead start your pull request title with [chore] or use the "Skip Changelog" label.
+# Optional: The change log or logs in which this entry should be included.
+# e.g. '[user]' or '[user, api]'
+# Include 'user' if the change is relevant to end users.
+# Include 'api' if there is a change to a library API.
+# Default: '[user]'
+change_logs: []
diff --git a/connector/datadogconnector/README.md b/connector/datadogconnector/README.md
index ba6c82f892a7..457382cd830c 100644
--- a/connector/datadogconnector/README.md
+++ b/connector/datadogconnector/README.md
@@ -15,6 +15,7 @@
 | [Exporter Pipeline Type] | [Receiver Pipeline Type] | [Stability Level] |
 | ------------------------ | ------------------------ | ----------------- |
 | traces | metrics | [beta] |
+| traces | traces | [beta] |
 
 [Exporter Pipeline Type]: https://github.com/open-telemetry/opentelemetry-collector/blob/main/connector/README.md#exporter-pipeline-type
 [Receiver Pipeline Type]: https://github.com/open-telemetry/opentelemetry-collector/blob/main/connector/README.md#receiver-pipeline-type
@@ -91,7 +92,7 @@ service:
      exporters: [datadog/connector]
 
    traces/2: # this pipeline uses sampling
-     receivers: [otlp]
+     receivers: [datadog/connector]
      processors: [batch, probabilistic_sampler]
      exporters: [datadog]
 
diff --git a/connector/datadogconnector/connector.go b/connector/datadogconnector/connector.go
index 1c089f254490..582e45712825 100644
--- a/connector/datadogconnector/connector.go
+++ b/connector/datadogconnector/connector.go
@@ -18,7 +18,8 @@ import (
 
 // connectorImp is the schema for connector
 type connectorImp struct {
-	metricsConsumer consumer.Metrics // the next component in the pipeline to ingest data after connector
+	metricsConsumer consumer.Metrics // the next component in the pipeline to ingest metrics after connector
+	tracesConsumer  consumer.Traces  // the next component in the pipeline to ingest traces after connector
 	logger          *zap.Logger
 
 	// agent specifies the agent used to ingest traces and output APM Stats.
@@ -40,7 +41,7 @@ type connectorImp struct {
 var _ component.Component = (*connectorImp)(nil) // testing that the connectorImp properly implements the type Component interface
 
 // function to create a new connector
-func newConnector(logger *zap.Logger, _ component.Config, nextConsumer consumer.Metrics) (*connectorImp, error) {
+func newConnector(logger *zap.Logger, _ component.Config, metricsConsumer consumer.Metrics, tracesConsumer consumer.Traces) (*connectorImp, error) {
 	logger.Info("Building datadog connector")
 
 	in := make(chan *pb.StatsPayload, 100)
@@ -55,7 +56,8 @@ func newConnector(logger *zap.Logger, _ component.Config, nextConsumer consumer.
 		agent:           datadog.NewAgent(ctx, in),
 		translator:      trans,
 		in:              in,
-		metricsConsumer: nextConsumer,
+		metricsConsumer: metricsConsumer,
+		tracesConsumer:  tracesConsumer,
 		exit:            make(chan struct{}),
 	}, nil
 }
@@ -64,7 +66,9 @@ func newConnector(logger *zap.Logger, _ component.Config, nextConsumer consumer.
 func (c *connectorImp) Start(_ context.Context, _ component.Host) error {
 	c.logger.Info("Starting datadogconnector")
 	c.agent.Start()
-	go c.run()
+	if c.metricsConsumer != nil {
+		go c.run()
+	}
 	return nil
 }
 
@@ -85,6 +89,9 @@ func (c *connectorImp) Capabilities() consumer.Capabilities {
 
 func (c *connectorImp) ConsumeTraces(ctx context.Context, traces ptrace.Traces) error {
 	c.agent.Ingest(ctx, traces)
+	if c.tracesConsumer != nil {
+		return c.tracesConsumer.ConsumeTraces(ctx, traces)
+	}
 	return nil
 }
 
diff --git a/connector/datadogconnector/connector_test.go b/connector/datadogconnector/connector_test.go
index 7f016b6776a4..d5410720be71 100644
--- a/connector/datadogconnector/connector_test.go
+++ b/connector/datadogconnector/connector_test.go
@@ -23,9 +23,15 @@ func TestNewConnector(t *testing.T) {
 	creationParams := connectortest.NewNopCreateSettings()
 	cfg := factory.CreateDefaultConfig().(*Config)
 
-	traceConnector, err := factory.CreateTracesToMetrics(context.Background(), creationParams, cfg, consumertest.NewNop())
+	traceToMetricsConnector, err := factory.CreateTracesToMetrics(context.Background(), creationParams, cfg, consumertest.NewNop())
 	assert.NoError(t, err)
 
-	_, ok := traceConnector.(*connectorImp)
+	_, ok := traceToMetricsConnector.(*connectorImp)
+	assert.True(t, ok) // checks if the created connector implements the connectorImp struct
+
+	traceToTracesConnector, err := factory.CreateTracesToTraces(context.Background(), creationParams, cfg, consumertest.NewNop())
+	assert.NoError(t, err)
+
+	_, ok = traceToTracesConnector.(*connectorImp)
 	assert.True(t, ok) // checks if the created connector implements the connectorImp struct
 }
diff --git a/connector/datadogconnector/factory.go b/connector/datadogconnector/factory.go
index fc61ebfeff1f..5d1d6673426c 100644
--- a/connector/datadogconnector/factory.go
+++ b/connector/datadogconnector/factory.go
@@ -21,7 +21,8 @@ func NewFactory() connector.Factory {
 	return connector.NewFactory(
 		metadata.Type,
 		createDefaultConfig,
-		connector.WithTracesToMetrics(createTracesToMetricsConnector, metadata.TracesToMetricsStability))
+		connector.WithTracesToMetrics(createTracesToMetricsConnector, metadata.TracesToMetricsStability),
+		connector.WithTracesToTraces(createTracesToTracesConnector, metadata.TracesToTracesStability))
 }
 
 var _ component.Config = (*Config)(nil)
@@ -35,7 +36,15 @@ func createDefaultConfig() component.Config {
 // defines the consumer type of the connector
 // we want to consume traces and export metrics therefore define nextConsumer as metrics, consumer is the next component in the pipeline
 func createTracesToMetricsConnector(_ context.Context, params connector.CreateSettings, cfg component.Config, nextConsumer consumer.Metrics) (connector.Traces, error) {
-	c, err := newConnector(params.Logger, cfg, nextConsumer)
+	c, err := newConnector(params.Logger, cfg, nextConsumer, nil)
+	if err != nil {
+		return nil, err
+	}
+	return c, nil
+}
+
+func createTracesToTracesConnector(_ context.Context, params connector.CreateSettings, cfg component.Config, nextConsumer consumer.Traces) (connector.Traces, error) {
+	c, err := newConnector(params.Logger, cfg, nil, nextConsumer)
 	if err != nil {
 		return nil, err
 	}
diff --git a/connector/datadogconnector/internal/metadata/generated_status.go b/connector/datadogconnector/internal/metadata/generated_status.go
index 6ff2f2e5baa3..1e601630c741 100644
--- a/connector/datadogconnector/internal/metadata/generated_status.go
+++ b/connector/datadogconnector/internal/metadata/generated_status.go
@@ -9,4 +9,5 @@ import (
 const (
 	Type                     = "datadog"
 	TracesToMetricsStability = component.StabilityLevelBeta
+	TracesToTracesStability  = component.StabilityLevelBeta
 )
diff --git a/connector/datadogconnector/metadata.yaml b/connector/datadogconnector/metadata.yaml
index 9de47b0382df..f6b1f32221ef 100644
--- a/connector/datadogconnector/metadata.yaml
+++ b/connector/datadogconnector/metadata.yaml
@@ -3,7 +3,7 @@ type: datadog
 status:
   class: connector
   stability:
-    beta: [traces_to_metrics]
+    beta: [traces_to_metrics, traces_to_traces]
   distributions: [contrib]
   codeowners:
     active: [mx-psi, gbbr, dineshg13]