Skip to content

Commit

Permalink
dotenv: fix parse error on files with UTF-8 BOM
Browse files Browse the repository at this point in the history
Some Windows editors tend to add UTF-8 BOM markers to files,
which breaks parsing of `.env` files.

Now, when the file is read, if it starts with a UTF-8 BOM,
we'll skip it. (`.env` files are always processed as UTF-8.)

See docker/compose#9799.

Signed-off-by: Milas Bowman <[email protected]>
  • Loading branch information
milas committed Sep 2, 2022
1 parent 7aed131 commit f4d0f7d
Show file tree
Hide file tree
Showing 3 changed files with 43 additions and 3 deletions.
9 changes: 9 additions & 0 deletions dotenv/fixtures/utf8-bom.env
Original file line number Diff line number Diff line change
@@ -0,0 +1,9 @@
OPTION_A=1
OPTION_B=2
OPTION_C= 3
OPTION_D =4
OPTION_E = 5
456 = ABC
OPTION_F =
OPTION_G=
OPTION_H = my string # Inline comment
7 changes: 7 additions & 0 deletions dotenv/godotenv.go
Original file line number Diff line number Diff line change
Expand Up @@ -14,6 +14,7 @@
package dotenv

import (
"bytes"
"errors"
"fmt"
"io"
Expand All @@ -29,6 +30,8 @@ import (

const doubleQuoteSpecialChars = "\\\n\r\"!$`"

var utf8BOM = []byte("\uFEFF")

// LookupFn represents a lookup function to resolve variables from
type LookupFn func(string) (string, bool)

Expand All @@ -48,6 +51,10 @@ func ParseWithLookup(r io.Reader, lookupFn LookupFn) (map[string]string, error)
return nil, err
}

// seek past the UTF-8 BOM if it exists (particularly on Windows, some
// editors tend to add it, and it'll cause parsing to fail)
data = bytes.TrimPrefix(data, utf8BOM)

return UnmarshalBytesWithLookup(data, lookupFn)
}

Expand Down
30 changes: 27 additions & 3 deletions dotenv/godotenv_test.go
Original file line number Diff line number Diff line change
Expand Up @@ -7,6 +7,8 @@ import (
"reflect"
"strings"
"testing"

"github.com/stretchr/testify/require"
)

var noopPresets = make(map[string]string)
Expand Down Expand Up @@ -131,7 +133,7 @@ func TestLoadDoesNotOverride(t *testing.T) {
loadEnvAndCompareValues(t, Load, envFileName, expectedValues, presets)
}

func TestOveroadDoesOverride(t *testing.T) {
func TestOverloadDoesOverride(t *testing.T) {
envFileName := "fixtures/plain.env"

// ensure NO overload
Expand Down Expand Up @@ -525,7 +527,7 @@ func TestRoundtrip(t *testing.T) {
}
}

func TestInheritedEnvVariablSameSize(t *testing.T) {
func TestInheritedEnvVariableSameSize(t *testing.T) {
const envKey = "VAR_TO_BE_LOADED_FROM_OS_ENV"
const envVal = "SOME_RANDOM_VALUE"
os.Setenv(envKey, envVal)
Expand All @@ -551,7 +553,7 @@ func TestInheritedEnvVariablSameSize(t *testing.T) {
}
}

func TestInheritedEnvVariablSingleVar(t *testing.T) {
func TestInheritedEnvVariableSingleVar(t *testing.T) {
const envKey = "VAR_TO_BE_LOADED_FROM_OS_ENV"
const envVal = "SOME_RANDOM_VALUE"
os.Setenv(envKey, envVal)
Expand Down Expand Up @@ -702,3 +704,25 @@ func TestSubstitutionsWithUnsetVarEnvFileDefaultValuePrecedence(t *testing.T) {
}
}
}

func TestUTF8BOM(t *testing.T) {
envFileName := "fixtures/utf8-bom.env"

// sanity check the fixture, since the UTF-8 BOM is invisible, it'd be
// easy for it to get removed by accident, which would invalidate this
// test
envFileData, err := os.ReadFile(envFileName)
require.NoError(t, err)
require.True(t, bytes.HasPrefix(envFileData, []byte("\uFEFF")),
"Test fixture file is missing UTF-8 BOM")

expectedValues := map[string]string{
"OPTION_A": "1",
"OPTION_B": "2",
"OPTION_C": "3",
"OPTION_D": "4",
"OPTION_E": "5",
}

loadEnvAndCompareValues(t, Load, envFileName, expectedValues, noopPresets)
}

0 comments on commit f4d0f7d

Please sign in to comment.