Disk buffers #109

Merged: 4 commits, Sep 9, 2020
7 changes: 7 additions & 0 deletions CHANGELOG.md
@@ -4,6 +4,13 @@ All notable changes to this project will be documented in this file.
The format is based on [Keep a Changelog](https://keepachangelog.com/en/1.0.0/),
and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0.html).

## Unreleased
### Added
- Disk buffer for output operators
### Changed
- Split buffers into buffers and flushers for better modularity
- New memory buffer design for a uniform interface between disk and memory buffers

## [0.9.14] - 2020-08-31
### Fixed
- Rendering issue with the `kubernetes_events` plugin
1 change: 1 addition & 0 deletions commands/graph.go
@@ -49,6 +49,7 @@ func runGraph(_ *cobra.Command, _ []string, flags *RootFlags) {
}

buildContext := pg.BuildContext{
Database: operator.NewStubDatabase(),
PluginRegistry: pluginRegistry,
Logger: logger,
}
8 changes: 5 additions & 3 deletions commands/offsets.go
@@ -42,7 +42,7 @@ func NewOffsetsClearCmd(rootFlags *RootFlags) *cobra.Command {
db, err := agent.OpenDatabase(rootFlags.DatabaseFile)
exitOnErr("Failed to open database", err)
defer db.Close()
- defer db.Sync()
+ defer func() { _ = db.Sync() }()

if all {
if len(args) != 0 {
@@ -94,7 +94,7 @@ func NewOffsetsListCmd(rootFlags *RootFlags) *cobra.Command {
exitOnErr("Failed to open database", err)
defer db.Close()

- db.View(func(tx *bbolt.Tx) error {
+ err = db.View(func(tx *bbolt.Tx) error {
offsetBucket := tx.Bucket(helper.OffsetsBucket)
if offsetBucket == nil {
return nil
@@ -105,7 +105,9 @@
return nil
})
})

+ if err != nil {
+ exitOnErr("Failed to read database", err)
+ }
},
}

1 change: 0 additions & 1 deletion commands/offsets_test.go
@@ -70,5 +70,4 @@ func TestOffsets(t *testing.T) {
err = offsetsList.Execute()
require.NoError(t, err)
require.Equal(t, "$.testoperatorid1\n", buf.String())

}
17 changes: 17 additions & 0 deletions docs/operators/elastic_output.md
@@ -14,6 +14,8 @@ The `elastic_output` operator will send entries to an Elasticsearch instance
| `api_key` | | Base64-encoded token for authorization. If set, overrides username and password |
| `index_field` | default | A [field](/docs/types/field.md) that indicates which index to send the log entry to |
| `id_field` | | A [field](/docs/types/field.md) that contains an id for the entry. If unset, a unique id is generated |
| `buffer` | | A [buffer](/docs/types/buffer.md) block indicating how to buffer entries before flushing |
| `flusher` | | A [flusher](/docs/types/flusher.md) block configuring flushing behavior |


### Example Configurations
@@ -27,3 +29,18 @@ Configuration:
    - "http://localhost:9200"
  api_key: <my_api_key>
```

#### Configuration with non-default buffer and flusher params

Configuration:
```yaml
- type: elastic_output
  addresses:
    - "http://localhost:9200"
  api_key: <my_api_key>
  buffer:
    type: disk
    path: /tmp/stanza_buffer
  flusher:
    max_concurrent: 8
```
16 changes: 16 additions & 0 deletions docs/operators/google_cloud_output.md
@@ -16,6 +16,8 @@ The `google_cloud_output` operator will send entries to Google Cloud Logging.
| `span_id_field` | | A [field](/docs/types/field.md) for the span_id on the log entry |
| `use_compression` | `true` | Whether to compress the log entry payloads with gzip before sending to Google Cloud |
| `timeout` | 10s | A [duration](/docs/types/duration.md) indicating how long to wait for the API to respond before timing out |
| `buffer` | | A [buffer](/docs/types/buffer.md) block indicating how to buffer entries before flushing |
| `flusher` | | A [flusher](/docs/types/flusher.md) block configuring flushing behavior |

If both `credentials` and `credentials_file` are left empty, the agent will attempt to find
[Application Default Credentials](https://cloud.google.com/docs/authentication/production) from the environment.
@@ -30,3 +32,17 @@ Configuration:
  project_id: sample_project
  credentials_file: /tmp/credentials.json
```

#### Configuration with non-default buffer and flusher params

Configuration:
```yaml
- type: google_cloud_output
  project_id: sample_project
  credentials_file: /tmp/credentials.json
  buffer:
    type: disk
    path: /tmp/stanza_buffer
  flusher:
    max_concurrent: 8
```
61 changes: 61 additions & 0 deletions docs/types/buffer.md
@@ -0,0 +1,61 @@
# Buffers

Buffers are used to temporarily store log entries until they can be flushed to their final destination.

There are two types of buffers: `memory` buffers and `disk` buffers.

## Memory Buffers

Memory buffers keep log entries in memory until they are flushed, which makes them very fast. However, because
entries are only stored in memory, they will be lost if the agent is shut down uncleanly. If the agent is shut down
cleanly, they will be saved to the agent's database.

### Memory Buffer Configuration

Memory buffers are configured by setting the `type` field of the `buffer` block on an output to `memory`. The only other
configurable field is `max_entries`, which is the maximum number of entries that will be held in memory before blocking and
waiting for some entries to be flushed. The default value of `max_entries` is `1048576` (2^20).

Example:
```yaml
- type: google_cloud_output
  project_id: my_project_id
  buffer:
    type: memory
    max_entries: 10000
```


## Disk Buffers

Disk buffers store all log entries on disk until they have been successfully flushed to their destination. This means
that, even in the case of an unclean shutdown (kill signal or power loss), no entries will be lost. However, this comes at the cost of
some performance.

By default, a disk buffer can handle roughly 10,000 logs per second. This number depends heavily on the specs of the
machine running the agent, so if exact numbers are important, we'd advise running your own tests.

If you'd like better performance and power loss is not a concern, disabling sync writes improves performance to
(roughly) 100,000 entries per second. The tradeoff is that, in the event of a power failure, logs may be lost or the
database may be corrupted.
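
For instance, a throughput-oriented disk buffer with sync writes disabled might look like the following sketch (the output type and path are illustrative):

```yaml
- type: google_cloud_output
  project_id: my_project_id
  buffer:
    type: disk
    path: /tmp/stanza_buffer
    sync: false # faster writes, but entries may be lost on power failure
```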

### Disk Buffer Configuration

Disk buffers are configured by setting the `type` field of the `buffer` block on an output to `disk`. Other fields are described below:

| Field | Default | Description |
| --- | --- | --- |
| `max_size` | `4294967296` (4GiB) | The maximum size of the disk buffer file in bytes |
| `path` | required | The path to the directory which will contain the disk buffer data |
| `sync` | `true` | Whether to open the database files with the O_SYNC flag. Disabling this improves performance, but relaxes guarantees about log delivery. |

> **Review thread on `max_size`:**
>
> **Member:** Although this is documented well here, it might be slightly clearer to call this `max_bytes`, since many users will only encounter this in a config file and would either have to make assumptions about the units, or dig up the docs.
>
> **Contributor (author):** I initially thought the same thing, but I would love to implement something like this as a future feature. Would it still make sense to do `max_bytes` if the value is 8GB?
>
> **Member:** That's a good point. I guess it comes down to how likely we are to implement that feature and how soon it would happen. If we're going to end up living with the current implementation for a while, then I think we should consider using the more explicit term now and deprecating it later. We could pretty easily support both and just require at most one of the two be specified.
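
A minimal sketch of that last suggestion, assuming a hypothetical config struct (names and defaults here are illustrative, not the actual stanza implementation):

```go
package buffer

import "errors"

// DiskBufferConfig is a hypothetical config struct showing how a legacy
// max_size field and a more explicit max_bytes alias could coexist.
type DiskBufferConfig struct {
	MaxSize  int64  `yaml:"max_size,omitempty"`  // legacy name
	MaxBytes int64  `yaml:"max_bytes,omitempty"` // explicit alias
	Path     string `yaml:"path"`
	Sync     bool   `yaml:"sync"`
}

// maxBytes resolves the two aliases, requiring at most one to be set.
func (c DiskBufferConfig) maxBytes() (int64, error) {
	if c.MaxSize != 0 && c.MaxBytes != 0 {
		return 0, errors.New("only one of max_size or max_bytes may be set")
	}
	if c.MaxBytes != 0 {
		return c.MaxBytes, nil
	}
	if c.MaxSize != 0 {
		return c.MaxSize, nil
	}
	return 1 << 32, nil // default: 4294967296 bytes (4GiB)
}
```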

Example:
```yaml
- type: google_cloud_output
  project_id: my_project_id
  buffer:
    type: disk
    max_size: 10000000 # 10MB
    path: /tmp/stanza_buffer
    sync: true
```
23 changes: 23 additions & 0 deletions docs/types/flusher.md
@@ -0,0 +1,23 @@
# Flushers

Flushers handle reading entries from buffers in chunks, flushing them to their final destination, and retrying on failure.

In most cases, the default options will work well, but they may need tuning for optimal performance or to reduce load
on the destination API.

For example, if you hit an API limit on the number of requests per second, consider decreasing `max_concurrent` and
increasing `max_chunk_entries`. This will make fewer, larger requests which should increase efficiency at the cost of
some latency.

Or, if you have low load and can tolerate higher latency, consider increasing `max_wait` so that entries are sent
less often in larger requests.

## Flusher configuration

Flushers are configured with the `flusher` block on output plugins.

| Field | Default | Description |
| --- | --- | --- |
| `max_concurrent` | `16` | The maximum number of goroutines flushing entries concurrently |
| `max_wait` | 1s | The maximum amount of time to wait for a chunk to fill before flushing it. Higher values can reduce load, but also increase delivery latency. |
| `max_chunk_entries` | 1000 | The maximum number of entries to flush in a single chunk. |
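
For example, to reduce pressure on a rate-limited API as described above, a flusher block might be tuned like the following sketch (the output type and values are illustrative, not recommendations):

```yaml
- type: elastic_output
  addresses:
    - "http://localhost:9200"
  flusher:
    max_concurrent: 4       # fewer simultaneous requests
    max_chunk_entries: 5000 # larger chunks per request
    max_wait: 5s            # wait longer for chunks to fill
```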
19 changes: 13 additions & 6 deletions entry/field.go
@@ -5,6 +5,12 @@ import (
"fmt"
)

const (
labelsPrefix = "$labels"
resourcePrefix = "$resource"
recordPrefix = "$record"
)

// Field represents a potential field on an entry.
// It is used to get, set, and delete values at this field.
// It is deserialized from JSON dot notation.
@@ -49,17 +55,17 @@ func fieldFromString(s string) (Field, error) {
}

switch split[0] {
case "$labels":
case labelsPrefix:
if len(split) != 2 {
return Field{}, fmt.Errorf("labels cannot be nested")
}
return Field{LabelField{split[1]}}, nil
case "$resource":
case resourcePrefix:
if len(split) != 2 {
return Field{}, fmt.Errorf("resource fields cannot be nested")
}
return Field{ResourceField{split[1]}}, nil
case "$record", "$":
case recordPrefix, "$":
return Field{RecordField{split[1:]}}, nil
default:
return Field{RecordField{split}}, nil
@@ -127,12 +133,13 @@ func splitField(s string) ([]string, error) {
}
state = OUT_BRACKET
case OUT_BRACKET:
- if c == '.' {
+ switch c {
+ case '.':
state = IN_UNBRACKETED_TOKEN
tokenStart = i + 1
- } else if c == '[' {
+ case '[':
state = IN_BRACKET
- } else {
+ default:
return nil, fmt.Errorf("bracketed access must be followed by a dot or another bracketed access")
}
case IN_UNBRACKETED_TOKEN:
4 changes: 0 additions & 4 deletions entry/label_field_test.go
@@ -50,7 +50,6 @@ func TestLabelFieldGet(t *testing.T) {
require.Equal(t, tc.expected, val)
})
}

}

func TestLabelFieldDelete(t *testing.T) {
@@ -103,7 +102,6 @@ func TestLabelFieldDelete(t *testing.T) {
require.Equal(t, tc.expected, val)
})
}

}

func TestLabelFieldSet(t *testing.T) {
@@ -172,7 +170,6 @@ func TestLabelFieldSet(t *testing.T) {
require.Equal(t, tc.expected, entry.Labels)
})
}

}

func TestLabelFieldString(t *testing.T) {
@@ -198,5 +195,4 @@
require.Equal(t, tc.expected, tc.field.String())
})
}

}
7 changes: 3 additions & 4 deletions entry/record_field.go
@@ -197,7 +197,7 @@ func (f RecordField) MarshalYAML() (interface{}, error) {
func fromJSONDot(value string) RecordField {
keys := strings.Split(value, ".")

if keys[0] == "$" || keys[0] == "$record" {
if keys[0] == "$" || keys[0] == recordPrefix {
keys = keys[1:]
}

@@ -207,7 +207,7 @@ func fromJSONDot(value string) RecordField {
// toJSONDot returns the JSON dot notation for a field.
func toJSONDot(field RecordField) string {
if field.isRoot() {
return "$record"
return recordPrefix
}

containsDots := false
Expand All @@ -219,7 +219,7 @@ func toJSONDot(field RecordField) string {

var b strings.Builder
if containsDots {
b.WriteString("$record")
b.WriteString(recordPrefix)
for _, key := range field.Keys {
b.WriteString(`['`)
b.WriteString(key)
@@ -232,7 +232,6 @@
}
b.WriteString(key)
}

}

return b.String()
2 changes: 1 addition & 1 deletion entry/record_field_test.go
@@ -250,7 +250,7 @@ func TestRecordFieldSet(t *testing.T) {
t.Run(tc.name, func(t *testing.T) {
entry := New()
entry.Record = tc.record
- entry.Set(tc.field, tc.setTo)
+ require.NoError(t, entry.Set(tc.field, tc.setTo))
assert.Equal(t, tc.expectedVal, entry.Record)
})
}
4 changes: 0 additions & 4 deletions entry/resource_field_test.go
@@ -50,7 +50,6 @@ func TestResourceFieldGet(t *testing.T) {
require.Equal(t, tc.expected, val)
})
}

}

func TestResourceFieldDelete(t *testing.T) {
@@ -103,7 +102,6 @@ func TestResourceFieldDelete(t *testing.T) {
require.Equal(t, tc.expected, val)
})
}

}

func TestResourceFieldSet(t *testing.T) {
@@ -172,7 +170,6 @@ func TestResourceFieldSet(t *testing.T) {
require.Equal(t, tc.expected, entry.Resource)
})
}

}

func TestResourceFieldString(t *testing.T) {
@@ -198,5 +195,4 @@
require.Equal(t, tc.expected, tc.field.String())
})
}

}
16 changes: 10 additions & 6 deletions go.mod
@@ -3,36 +3,40 @@ module github.com/observiq/stanza
go 1.14

require (
cloud.google.com/go v0.46.3 // indirect
cloud.google.com/go/logging v1.0.0
github.com/antonmedv/expr v1.8.2
github.com/cenkalti/backoff/v4 v4.0.2
github.com/elastic/go-elasticsearch/v7 v7.7.0
github.com/golang/protobuf v1.4.2
github.com/golangci/golangci-lint v1.30.0 // indirect
github.com/googleapis/gax-go v1.0.3
github.com/google/go-cmp v0.5.0 // indirect
github.com/hashicorp/go-uuid v1.0.2
github.com/influxdata/go-syslog/v3 v3.0.0 // indirect
github.com/json-iterator/go v1.1.9
github.com/kardianos/service v1.0.0
github.com/kr/pretty v0.2.0 // indirect
github.com/kr/text v0.2.0 // indirect
github.com/niemeyer/pretty v0.0.0-20200227124842-a10e7caefd8e // indirect
github.com/observiq/ctimefmt v1.0.0
github.com/observiq/go-syslog/v3 v3.0.2
github.com/onsi/ginkgo v1.13.0 // indirect
github.com/pkg/errors v0.9.1 // indirect
github.com/spf13/cobra v1.0.0
github.com/stretchr/testify v1.6.1
github.com/vektra/mockery v1.1.2 // indirect
go.etcd.io/bbolt v1.3.4
go.uber.org/zap v1.15.0
golang.org/x/exp v0.0.0-20191030013958-a1ab85dbe136 // indirect
golang.org/x/lint v0.0.0-20200302205851-738671d3881b // indirect
golang.org/x/net v0.0.0-20200625001655-4c5254603344
golang.org/x/oauth2 v0.0.0-20190604053449-0f29369cfe45
golang.org/x/sync v0.0.0-20200625203802-6e8e738ad208
golang.org/x/sys v0.0.0-20200625212154-ddb9806d33ae
golang.org/x/text v0.3.3
golang.org/x/tools v0.0.0-20200724022722-7017fd6b1305 // indirect
gonum.org/v1/gonum v0.6.2
google.golang.org/api v0.20.0
google.golang.org/genproto v0.0.0-20200304201815-d429ff31ee6c
google.golang.org/grpc v1.27.1
gopkg.in/check.v1 v1.0.0-20200227125254-8fa46927fb4f // indirect
gopkg.in/yaml.v2 v2.3.0
honnef.co/go/tools v0.0.1-2020.1.4 // indirect
k8s.io/api v0.18.6
k8s.io/apimachinery v0.18.6
k8s.io/client-go v0.18.6