From ee2a744c963d27bac48c5882c9b68563d17fc225 Mon Sep 17 00:00:00 2001 From: Cristian Velazquez Date: Mon, 24 Jul 2023 18:49:47 +0000 Subject: [PATCH] Improve Any stack usage By doing this unsafe approach we are able to save one call to morestack. Stack usage SUBQ $0x118, SP // 280 bytes Benchmark before goos: linux goarch: amd64 pkg: go.uber.org/zap cpu: AMD EPYC 7B13 BenchmarkAny/normal 18570822 61.33 ns/op 24 B/op 1 allocs/op BenchmarkAny/normal-2 20671512 59.85 ns/op 24 B/op 1 allocs/op BenchmarkAny/normal-4 20064495 58.73 ns/op 24 B/op 1 allocs/op BenchmarkAny/normal-8 19763770 60.18 ns/op 24 B/op 1 allocs/op BenchmarkAny/normal_with_logger 7673887 157.4 ns/op 112 B/op 3 allocs/op BenchmarkAny/normal_with_logger-2 8318539 143.0 ns/op 112 B/op 3 allocs/op BenchmarkAny/normal_with_logger-4 8584477 139.0 ns/op 112 B/op 3 allocs/op BenchmarkAny/normal_with_logger-8 8203886 147.7 ns/op 112 B/op 3 allocs/op BenchmarkAny/normal_new_goroutine 273378 3873 ns/op 137 B/op 2 allocs/op BenchmarkAny/normal_new_goroutine-2 496189 2141 ns/op 72 B/op 2 allocs/op BenchmarkAny/normal_new_goroutine-4 1000000 1088 ns/op 72 B/op 2 allocs/op BenchmarkAny/normal_new_goroutine-8 1743856 678.5 ns/op 72 B/op 2 allocs/op PASS ok go.uber.org/zap 15.922s Benchmark after goos: linux goarch: amd64 pkg: go.uber.org/zap cpu: AMD EPYC 7B13 BenchmarkAny/normal 15874744 75.15 ns/op 24 B/op 1 allocs/op BenchmarkAny/normal-2 16086948 71.64 ns/op 24 B/op 1 allocs/op BenchmarkAny/normal-4 16595194 71.02 ns/op 24 B/op 1 allocs/op BenchmarkAny/normal-8 16130025 72.98 ns/op 24 B/op 1 allocs/op BenchmarkAny/normal_with_logger 9092430 130.0 ns/op 88 B/op 2 allocs/op BenchmarkAny/normal_with_logger-2 10157986 122.6 ns/op 88 B/op 2 allocs/op BenchmarkAny/normal_with_logger-4 9523335 123.1 ns/op 88 B/op 2 allocs/op BenchmarkAny/normal_with_logger-8 9183698 128.2 ns/op 88 B/op 2 allocs/op BenchmarkAny/normal_new_goroutine 1250547 883.7 ns/op 73 B/op 2 allocs/op BenchmarkAny/normal_new_goroutine-2 2108619 659.3 ns/op 72 B/op 2 allocs/op BenchmarkAny/normal_new_goroutine-4 2919674 407.9 ns/op 72 B/op 2 allocs/op BenchmarkAny/normal_new_goroutine-8 4778667 320.5 ns/op 72 B/op 2 allocs/op PASS ok go.uber.org/zap 18.898s --- field.go | 476 +++++++++++++++++++++++++++++++++++++++++++------- field_test.go | 38 ++++ 2 files changed, 450 insertions(+), 64 deletions(-) diff --git a/field.go b/field.go index bbb745db5..18baaab9f 100644 --- a/field.go +++ b/field.go @@ -24,6 +24,7 @@ import ( "fmt" "math" "time" + "unsafe" "go.uber.org/zap/zapcore" ) @@ -410,6 +411,13 @@ func Inline(val zapcore.ObjectMarshaler) Field { } } +type anyParams struct { + f *Field + k *string + p unsafe.Pointer + anyP [16]byte +} + // Any takes a key and an arbitrary value and chooses the best way to represent // them as a field, falling back to a reflection-based approach only if // necessary. @@ -417,133 +425,473 @@ func Inline(val zapcore.ObjectMarshaler) Field { // Since byte/uint8 and rune/int32 are aliases, Any can't differentiate between // them. To minimize surprises, []byte values are treated as binary blobs, byte // values are treated as uint8, and runes are always treated as integers. -func Any(key string, value interface{}) Field { +func Any(key string, value interface{}) (f Field) { + params := anyParams{ + f: &f, + k: &key, + // most common case + p: (*(*[2]unsafe.Pointer)(unsafe.Pointer(&value)))[1], + // interface case + anyP: *(*[16]byte)(unsafe.Pointer(&value)), + } switch val := value.(type) { case zapcore.ObjectMarshaler: - return Object(key, val) + _fixInterface(¶ms, unsafe.Pointer(&val)) + _object(¶ms) case zapcore.ArrayMarshaler: - return Array(key, val) + _fixInterface(¶ms, unsafe.Pointer(&val)) + _array(¶ms) case bool: - return Bool(key, val) + _bool(¶ms) case *bool: - return Boolp(key, val) + _boolp(¶ms) case []bool: - return Bools(key, val) + _bools(¶ms) case complex128: - return Complex128(key, val) + _complex128(¶ms) case *complex128: - return Complex128p(key, val) + _complex128p(¶ms) case []complex128: - return Complex128s(key, val) + _complex128s(¶ms) case complex64: - return Complex64(key, val) + _complex64(¶ms) case *complex64: - return Complex64p(key, val) + _complex64p(¶ms) case []complex64: - return Complex64s(key, val) + _complex64s(¶ms) case float64: - return Float64(key, val) + _float64(¶ms) case *float64: - return Float64p(key, val) + _float64p(¶ms) case []float64: - return Float64s(key, val) + _float64s(¶ms) case float32: - return Float32(key, val) + _float32(¶ms) case *float32: - return Float32p(key, val) + _float32p(¶ms) case []float32: - return Float32s(key, val) + _float32s(¶ms) case int: - return Int(key, val) + _int(¶ms) case *int: - return Intp(key, val) + _intp(¶ms) case []int: - return Ints(key, val) + _ints(¶ms) case int64: - return Int64(key, val) + _int64(¶ms) case *int64: - return Int64p(key, val) + _int64p(¶ms) case []int64: - return Int64s(key, val) + _int64s(¶ms) case int32: - return Int32(key, val) + _int32(¶ms) case *int32: - return Int32p(key, val) + _int32p(¶ms) case []int32: - return Int32s(key, val) + _int32s(¶ms) case int16: - return Int16(key, val) + _int16(¶ms) case *int16: - return Int16p(key, val) + _int16p(¶ms) case []int16: - return Int16s(key, val) + _int16s(¶ms) case int8: - return Int8(key, val) + _int8(¶ms) case *int8: - return Int8p(key, val) + _int8p(¶ms) case []int8: - return Int8s(key, val) + _int8s(¶ms) case string: - return String(key, val) + _string(¶ms) case *string: - return Stringp(key, val) + _stringp(¶ms) case []string: - return Strings(key, val) + _strings(¶ms) case uint: - return Uint(key, val) + _uint(¶ms) case *uint: - return Uintp(key, val) + _uintp(¶ms) case []uint: - return Uints(key, val) + _uints(¶ms) case uint64: - return Uint64(key, val) + _uint64(¶ms) case *uint64: - return Uint64p(key, val) + _uint64p(¶ms) case []uint64: - return Uint64s(key, val) + _uint64s(¶ms) case uint32: - return Uint32(key, val) + _uint32(¶ms) case *uint32: - return Uint32p(key, val) + _uint32p(¶ms) case []uint32: - return Uint32s(key, val) + _uint32s(¶ms) case uint16: - return Uint16(key, val) + _uint16(¶ms) case *uint16: - return Uint16p(key, val) + _uint16p(¶ms) case []uint16: - return Uint16s(key, val) + _uint16s(¶ms) case uint8: - return Uint8(key, val) + _uint8(¶ms) case *uint8: - return Uint8p(key, val) + _uint8p(¶ms) case []byte: - return Binary(key, val) + _binary(¶ms) case uintptr: - return Uintptr(key, val) + _uintptr(¶ms) case *uintptr: - return Uintptrp(key, val) + _uintptrp(¶ms) case []uintptr: - return Uintptrs(key, val) + _uintptrs(¶ms) case time.Time: - return Time(key, val) + _time(¶ms) case *time.Time: - return Timep(key, val) + _timep(¶ms) case []time.Time: - return Times(key, val) + _times(¶ms) case time.Duration: - return Duration(key, val) + _duration(¶ms) case *time.Duration: - return Durationp(key, val) + _durationp(¶ms) case []time.Duration: - return Durations(key, val) + _durations(¶ms) case error: - return NamedError(key, val) + _fixInterface(¶ms, unsafe.Pointer(&val)) + _namedError(¶ms) case []error: - return Errors(key, val) + _errors(¶ms) case fmt.Stringer: - return Stringer(key, val) + _fixInterface(¶ms, unsafe.Pointer(&val)) + _stringer(¶ms) default: - return Reflect(key, val) + _reflect(¶ms) } + + return +} + +// _fixInterface makes sure that first 8 bytes are the correct object type. This happens because when we do any(10), the +// interface would look like: +// [ , ] +// but what if the object is an interface, so when we do a := any(errors.New("some error")) and then we do type +// assertion a.(error), this actually changes the first 8 bytes. +func _fixInterface(p *anyParams, valPtr unsafe.Pointer) { + copy(p.anyP[:], (*(*[8]byte)(valPtr))[:]) +} + +//go:noinline +func _object(p *anyParams) { + *p.f = Object(*p.k, *(*zapcore.ObjectMarshaler)(unsafe.Pointer(&p.anyP))) +} + +//go:noinline +func _array(p *anyParams) { + *p.f = Array(*p.k, *(*zapcore.ArrayMarshaler)(unsafe.Pointer(&p.anyP))) +} + +//go:noinline +func _bool(p *anyParams) { + *p.f = Bool(*p.k, *(*bool)(p.p)) +} + +//go:noinline +func _boolp(p *anyParams) { + *p.f = Boolp(*p.k, (*bool)(p.p)) +} + +//go:noinline +func _bools(p *anyParams) { + *p.f = Bools(*p.k, *(*[]bool)(p.p)) +} + +//go:noinline +func _complex128(p *anyParams) { + *p.f = Complex128(*p.k, *(*complex128)(p.p)) +} + +//go:noinline +func _complex128p(p *anyParams) { + *p.f = Complex128p(*p.k, (*complex128)(p.p)) +} + +//go:noinline +func _complex128s(p *anyParams) { + *p.f = Complex128s(*p.k, *(*[]complex128)(p.p)) +} + +//go:noinline +func _complex64(p *anyParams) { + *p.f = Complex64(*p.k, *(*complex64)(p.p)) +} + +//go:noinline +func _complex64p(p *anyParams) { + *p.f = Complex64p(*p.k, (*complex64)(p.p)) +} + +//go:noinline +func _complex64s(p *anyParams) { + *p.f = Complex64s(*p.k, *(*[]complex64)(p.p)) +} + +//go:noinline +func _float64(p *anyParams) { + *p.f = Float64(*p.k, *(*float64)(p.p)) +} + +//go:noinline +func _float64p(p *anyParams) { + *p.f = Float64p(*p.k, (*float64)(p.p)) +} + +//go:noinline +func _float64s(p *anyParams) { + *p.f = Float64s(*p.k, *(*[]float64)(p.p)) +} + +//go:noinline +func _float32(p *anyParams) { + *p.f = Float32(*p.k, *(*float32)(p.p)) +} + +//go:noinline +func _float32p(p *anyParams) { + *p.f = Float32p(*p.k, (*float32)(p.p)) +} + +//go:noinline +func _float32s(p *anyParams) { + *p.f = Float32s(*p.k, *(*[]float32)(p.p)) +} + +//go:noinline +func _int(p *anyParams) { + *p.f = Int(*p.k, *(*int)(p.p)) +} + +//go:noinline +func _intp(p *anyParams) { + *p.f = Intp(*p.k, (*int)(p.p)) +} + +//go:noinline +func _ints(p *anyParams) { + *p.f = Ints(*p.k, *(*[]int)(p.p)) +} + +//go:noinline +func _int64(p *anyParams) { + *p.f = Int64(*p.k, *(*int64)(p.p)) +} + +//go:noinline +func _int64p(p *anyParams) { + *p.f = Int64p(*p.k, (*int64)(p.p)) +} + +//go:noinline +func _int64s(p *anyParams) { + *p.f = Int64s(*p.k, *(*[]int64)(p.p)) +} + +//go:noinline +func _int32(p *anyParams) { + *p.f = Int32(*p.k, *(*int32)(p.p)) +} + +//go:noinline +func _int32p(p *anyParams) { + *p.f = Int32p(*p.k, (*int32)(p.p)) +} + +//go:noinline +func _int32s(p *anyParams) { + *p.f = Int32s(*p.k, *(*[]int32)(p.p)) +} + +//go:noinline +func _int16(p *anyParams) { + *p.f = Int16(*p.k, *(*int16)(p.p)) +} + +//go:noinline +func _int16p(p *anyParams) { + *p.f = Int16p(*p.k, (*int16)(p.p)) +} + +//go:noinline +func _int16s(p *anyParams) { + *p.f = Int16s(*p.k, *(*[]int16)(p.p)) +} + +//go:noinline +func _int8(p *anyParams) { + *p.f = Int8(*p.k, *(*int8)(p.p)) +} + +//go:noinline + +func _int8p(p *anyParams) { + *p.f = Int8p(*p.k, (*int8)(p.p)) +} + +//go:noinline +func _int8s(p *anyParams) { + *p.f = Int8s(*p.k, *(*[]int8)(p.p)) +} + +//go:noinline +func _string(p *anyParams) { + *p.f = String(*p.k, *(*string)(p.p)) +} + +//go:noinline + +func _stringp(p *anyParams) { + *p.f = Stringp(*p.k, (*string)(p.p)) +} + +//go:noinline +func _strings(p *anyParams) { + *p.f = Strings(*p.k, *(*[]string)(p.p)) +} + +//go:noinline +func _uint(p *anyParams) { + *p.f = Uint(*p.k, *(*uint)(p.p)) +} + +//go:noinline +func _uintp(p *anyParams) { + *p.f = Uintp(*p.k, (*uint)(p.p)) +} + +//go:noinline +func _uints(p *anyParams) { + *p.f = Uints(*p.k, *(*[]uint)(p.p)) +} + +//go:noinline +func _uint64(p *anyParams) { + *p.f = Uint64(*p.k, *(*uint64)(p.p)) +} + +//go:noinline +func _uint64p(p *anyParams) { + *p.f = Uint64p(*p.k, (*uint64)(p.p)) +} + +//go:noinline +func _uint64s(p *anyParams) { + *p.f = Uint64s(*p.k, *(*[]uint64)(p.p)) +} + +//go:noinline +func _uint32(p *anyParams) { + *p.f = Uint32(*p.k, *(*uint32)(p.p)) +} + +//go:noinline +func _uint32p(p *anyParams) { + *p.f = Uint32p(*p.k, (*uint32)(p.p)) +} + +//go:noinline +func _uint32s(p *anyParams) { + *p.f = Uint32s(*p.k, *(*[]uint32)(p.p)) +} + +//go:noinline +func _uint16(p *anyParams) { + *p.f = Uint16(*p.k, *(*uint16)(p.p)) +} + +//go:noinline +func _uint16p(p *anyParams) { + *p.f = Uint16p(*p.k, (*uint16)(p.p)) +} + +//go:noinline +func _uint16s(p *anyParams) { + *p.f = Uint16s(*p.k, *(*[]uint16)(p.p)) +} + +//go:noinline +func _uint8(p *anyParams) { + *p.f = Uint8(*p.k, *(*uint8)(p.p)) +} + +//go:noinline +func _uint8p(p *anyParams) { + *p.f = Uint8p(*p.k, (*uint8)(p.p)) +} + +//go:noinline +func _binary(p *anyParams) { + *p.f = Binary(*p.k, *(*[]byte)(p.p)) +} + +//go:noinline +func _uintptr(p *anyParams) { + *p.f = Uintptr(*p.k, *(*uintptr)(p.p)) +} + +//go:noinline +func _uintptrp(p *anyParams) { + *p.f = Uintptrp(*p.k, (*uintptr)(p.p)) +} + +//go:noinline +func _uintptrs(p *anyParams) { + *p.f = Uintptrs(*p.k, *(*[]uintptr)(p.p)) +} + +//go:noinline +func _time(p *anyParams) { + *p.f = Time(*p.k, *(*time.Time)(p.p)) +} + +//go:noinline +func _timep(p *anyParams) { + *p.f = Timep(*p.k, (*time.Time)(p.p)) +} + +//go:noinline +func _times(p *anyParams) { + *p.f = Times(*p.k, *(*[]time.Time)(p.p)) +} + +//go:noinline +func _duration(p *anyParams) { + *p.f = Duration(*p.k, *(*time.Duration)(p.p)) +} + +//go:noinline +func _durationp(p *anyParams) { + *p.f = Durationp(*p.k, (*time.Duration)(p.p)) +} + +//go:noinline +func _durations(p *anyParams) { + *p.f = Durations(*p.k, *(*[]time.Duration)(p.p)) +} + +//go:noinline +func _namedError(p *anyParams) { + *p.f = NamedError(*p.k, *(*error)(unsafe.Pointer(&p.anyP))) +} + +//go:noinline +func _errors(p *anyParams) { + *p.f = Errors(*p.k, *(*[]error)(p.p)) +} + +//go:noinline +func _stringer(p *anyParams) { + *p.f = Stringer(*p.k, *(*fmt.Stringer)(unsafe.Pointer(&p.anyP))) +} + +//go:noinline +func _reflect(p *anyParams) { + *p.f = Reflect(*p.k, *(*any)(unsafe.Pointer(&p.anyP))) } diff --git a/field_test.go b/field_test.go index 5b49eb2f0..75296fd0f 100644 --- a/field_test.go +++ b/field_test.go @@ -21,9 +21,11 @@ package zap import ( + "errors" "math" "net" "regexp" + "runtime" "sync" "testing" "time" @@ -282,3 +284,39 @@ func TestStackSkipFieldWithSkip(t *testing.T) { assert.Equal(t, takeStacktrace(1), f.String, "Unexpected stack trace") assertCanBeReused(t, f) } + +func BenchmarkAny(b *testing.B) { + b.Run("normal", func(b *testing.B) { + errs := []error{errors.New("this error")} + b.ResetTimer() + for i := 0; i < b.N; i++ { + field := Any("error", errs) + runtime.KeepAlive(field) + } + }) + + b.Run("normal with logger", func(b *testing.B) { + errs := []error{errors.New("this error")} + b.ResetTimer() + for i := 0; i < b.N; i++ { + field := Any("error", errs) + L().Error("", field) + } + }) + + b.Run("normal new goroutine", func(b *testing.B) { + errs := []error{errors.New("this error")} + wg := sync.WaitGroup{} + wg.Add(b.N) + b.ResetTimer() + for i := 0; i < b.N; i++ { + go func() { + field := Any("error", errs) + runtime.KeepAlive(field) + wg.Done() + }() + } + + wg.Wait() + }) +}