diff --git a/apis/grpc/v1/payload/payload.pb.go b/apis/grpc/v1/payload/payload.pb.go index bf541cb5cd..6ea1603db4 100644 --- a/apis/grpc/v1/payload/payload.pb.go +++ b/apis/grpc/v1/payload/payload.pb.go @@ -6960,6 +6960,7 @@ var ( (*anypb.Any)(nil), // 105: google.protobuf.Any } ) + var file_v1_payload_payload_proto_depIdxs = []int32{ 22, // 0: payload.v1.Search.Request.config:type_name -> payload.v1.Search.Config 16, // 1: payload.v1.Search.MultiRequest.requests:type_name -> payload.v1.Search.Request diff --git a/apis/grpc/v1/rpc/errdetails/error_details.pb.go b/apis/grpc/v1/rpc/errdetails/error_details.pb.go index 1ca92f9554..ff9e1c42cf 100644 --- a/apis/grpc/v1/rpc/errdetails/error_details.pb.go +++ b/apis/grpc/v1/rpc/errdetails/error_details.pb.go @@ -1108,6 +1108,7 @@ var ( (*durationpb.Duration)(nil), // 15: google.protobuf.Duration } ) + var file_v1_rpc_errdetails_error_details_proto_depIdxs = []int32{ 10, // 0: rpc.v1.ErrorInfo.metadata:type_name -> rpc.v1.ErrorInfo.MetadataEntry 15, // 1: rpc.v1.RetryInfo.retry_delay:type_name -> google.protobuf.Duration diff --git a/internal/net/grpc/client.go b/internal/net/grpc/client.go index b6a4f3eceb..de6b1ab285 100644 --- a/internal/net/grpc/client.go +++ b/internal/net/grpc/client.go @@ -87,30 +87,32 @@ type Client interface { GetDialOption() []DialOption GetCallOption() []CallOption GetBackoff() backoff.Backoff + SetDisableResolveDNSAddr(addr string, disabled bool) ConnectedAddrs() []string Close(ctx context.Context) error } type gRPCClient struct { - addrs map[string]struct{} - poolSize uint64 - clientCount uint64 - conns sync.Map[string, pool.Conn] - hcDur time.Duration - prDur time.Duration - dialer net.Dialer - enablePoolRebalance bool - resolveDNS bool - dopts []DialOption - copts []CallOption - roccd string // reconnection old connection closing duration - eg errgroup.Group - bo backoff.Backoff - cb circuitbreaker.CircuitBreaker - gbo gbackoff.Config // grpc's original backoff configuration - mcd time.Duration // minimum connection timeout duration - group singleflight.Group[pool.Conn] - crl sync.Map[string, bool] // connection request list + addrs map[string]struct{} + poolSize uint64 + clientCount uint64 + conns sync.Map[string, pool.Conn] + hcDur time.Duration + prDur time.Duration + dialer net.Dialer + enablePoolRebalance bool + disableResolveDNSAddrs sync.Map[string, bool] + resolveDNS bool + dopts []DialOption + copts []CallOption + roccd string // reconnection old connection closing duration + eg errgroup.Group + bo backoff.Backoff + cb circuitbreaker.CircuitBreaker + gbo gbackoff.Config // grpc's original backoff configuration + mcd time.Duration // minimum connection timeout duration + group singleflight.Group[pool.Conn] + crl sync.Map[string, bool] // connection request list ech <-chan error monitorRunning atomic.Bool @@ -946,6 +948,12 @@ func (g *gRPCClient) GetBackoff() backoff.Backoff { return g.bo } +func (g *gRPCClient) SetDisableResolveDNSAddr(addr string, disabled bool) { + // NOTE: When connecting to multiple locations, it was necessary to switch dynamically, so implementation was added. + // There is no setting for disable on the helm chart side, so I used this implementation. + g.disableResolveDNSAddrs.Store(addr, disabled) +} + func (g *gRPCClient) Connect( ctx context.Context, addr string, dopts ...DialOption, ) (conn pool.Conn, err error) { @@ -975,7 +983,13 @@ func (g *gRPCClient) Connect( pool.WithAddr(addr), pool.WithSize(g.poolSize), pool.WithDialOptions(append(g.dopts, dopts...)...), - pool.WithResolveDNS(g.resolveDNS), + pool.WithResolveDNS(func() bool { + disabled, ok := g.disableResolveDNSAddrs.Load(addr) + if ok && disabled { + return false + } + return g.resolveDNS + }()), } if g.bo != nil { opts = append(opts, pool.WithBackoff(g.bo)) diff --git a/pkg/gateway/mirror/service/gateway.go b/pkg/gateway/mirror/service/gateway.go index 674f7b93aa..2e4ed97974 100644 --- a/pkg/gateway/mirror/service/gateway.go +++ b/pkg/gateway/mirror/service/gateway.go @@ -16,6 +16,7 @@ package service import ( "context" "reflect" + "strings" "github.com/vdaas/vald/internal/client/v1/client/mirror" "github.com/vdaas/vald/internal/errors" @@ -143,11 +144,21 @@ func (g *gateway) Do( if target == "" { return nil, errors.ErrTargetNotFound } - return g.client.GRPCClient().Do(g.ForwardedContext(ctx, g.podName), target, + fctx := g.ForwardedContext(ctx, g.podName) + res, err = g.client.GRPCClient().Do(fctx, target, func(ictx context.Context, conn *grpc.ClientConn, copts ...grpc.CallOption) (any, error) { return f(ictx, target, NewMirrorClient(conn), copts...) }, ) + if err != nil { + return g.client.GRPCClient().RoundRobin(fctx, func(ictx context.Context, conn *grpc.ClientConn, copts ...grpc.CallOption) (any, error) { + if strings.EqualFold(conn.Target(), target) { + return nil, errors.ErrTargetNotFound + } + return f(ictx, conn.Target(), NewMirrorClient(conn), copts...) + }) + } + return res, nil } // DoMulti performs a gRPC operation on multiple targets using the provided function. diff --git a/pkg/gateway/mirror/service/mirror.go b/pkg/gateway/mirror/service/mirror.go index 5a2e68c920..ce4309b972 100644 --- a/pkg/gateway/mirror/service/mirror.go +++ b/pkg/gateway/mirror/service/mirror.go @@ -319,6 +319,7 @@ func (m *mirr) Connect(ctx context.Context, targets ...*payload.Mirror_Target) e if !m.isSelfMirrorAddr(addr) && !m.isGatewayAddr(addr) { _, ok := m.addrs.Load(addr) if !ok || !m.IsConnected(ctx, addr) { + m.gateway.GRPCClient().SetDisableResolveDNSAddr(addr, true) _, err := m.gateway.GRPCClient().Connect(ctx, addr) if err != nil { m.addrs.Delete(addr)