2017-04-17 18:08:24 -04:00
/*
 *
 * Copyright 2014 gRPC authors.
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 *
 */
package grpc
import (
2019-04-12 14:36:17 -04:00
"context"
2017-04-17 18:08:24 -04:00
"errors"
"fmt"
2017-07-02 03:02:24 -04:00
"math"
2022-03-24 08:21:41 -04:00
"net/url"
2018-06-08 05:26:10 -04:00
"strings"
2017-04-17 18:08:24 -04:00
"sync"
2019-04-12 14:36:17 -04:00
"sync/atomic"
2017-04-17 18:08:24 -04:00
"time"
2018-06-08 05:26:10 -04:00
"google.golang.org/grpc/balancer"
2020-04-16 10:34:35 -04:00
"google.golang.org/grpc/balancer/base"
2018-06-08 05:26:10 -04:00
"google.golang.org/grpc/codes"
"google.golang.org/grpc/connectivity"
2023-11-01 11:03:44 -04:00
"google.golang.org/grpc/internal"
2019-04-12 14:36:17 -04:00
"google.golang.org/grpc/internal/channelz"
"google.golang.org/grpc/internal/grpcsync"
2023-11-01 11:03:44 -04:00
"google.golang.org/grpc/internal/idle"
"google.golang.org/grpc/internal/pretty"
2021-08-12 11:11:44 -04:00
iresolver "google.golang.org/grpc/internal/resolver"
2019-04-12 14:36:17 -04:00
"google.golang.org/grpc/internal/transport"
2017-07-02 03:02:24 -04:00
"google.golang.org/grpc/keepalive"
2018-06-08 05:26:10 -04:00
"google.golang.org/grpc/resolver"
2019-10-02 13:42:55 -04:00
"google.golang.org/grpc/serviceconfig"
2018-06-08 05:26:10 -04:00
"google.golang.org/grpc/status"
2020-04-16 10:34:35 -04:00
_ "google.golang.org/grpc/balancer/roundrobin" // To register roundrobin.
_ "google.golang.org/grpc/internal/resolver/passthrough" // To register passthrough resolver.
2021-08-12 11:11:44 -04:00
_ "google.golang.org/grpc/internal/resolver/unix" // To register unix resolver.
2024-02-20 10:42:33 -05:00
_ "google.golang.org/grpc/resolver/dns" // To register dns resolver.
2017-04-17 18:08:24 -04:00
)
2018-06-08 05:26:10 -04:00
// minConnectTimeout is the minimum time to give a connection to complete.
const minConnectTimeout = 20 * time.Second
2017-04-17 18:08:24 -04:00
var (
// ErrClientConnClosing indicates that the operation is illegal because
// the ClientConn is closing.
2018-06-08 05:26:10 -04:00
//
// Deprecated: this error should not be relied upon by users; use the status
// code of Canceled instead.
ErrClientConnClosing = status . Error ( codes . Canceled , "grpc: the client connection is closing" )
// errConnDrain indicates that the connection starts to be drained and does not accept any new RPCs.
errConnDrain = errors . New ( "grpc: the connection is drained" )
// errConnClosing indicates that the connection is closing.
errConnClosing = errors . New ( "grpc: the connection is closing" )
2023-09-19 10:37:37 -04:00
// errConnIdling indicates the the connection is being closed as the channel
// is moving to an idle mode due to inactivity.
errConnIdling = errors . New ( "grpc: the connection is closing due to channel idleness" )
2019-04-12 14:36:17 -04:00
// invalidDefaultServiceConfigErrPrefix is used to prefix the json parsing error for the default
// service config.
invalidDefaultServiceConfigErrPrefix = "grpc: the provided default service config is invalid"
2018-06-08 05:26:10 -04:00
)
2017-04-17 18:08:24 -04:00
2018-06-08 05:26:10 -04:00
// Errors returned from Dial and DialContext when the configured credentials
// are missing or inconsistent.
var (
	// errNoTransportSecurity reports that no transport security was set for
	// the ClientConn. Users must either configure credentials or opt out
	// explicitly with WithTransportCredentials(insecure.NewCredentials()).
	errNoTransportSecurity = errors.New("grpc: no transport security set (use grpc.WithTransportCredentials(insecure.NewCredentials()) explicitly or set credentials)")

	// errTransportCredsAndBundle reports that a credentials bundle was
	// configured together with individual transport credentials.
	errTransportCredsAndBundle = errors.New("grpc: credentials.Bundle may not be used with individual TransportCredentials")

	// errNoTransportCredsInBundle reports that the configured credentials
	// bundle returned nil transport credentials.
	errNoTransportCredsInBundle = errors.New("grpc: credentials.Bundle must return non-nil transport credentials")

	// errTransportCredentialsMissing reports that security information which
	// requires a secure connection (e.g., an OAuth2 token) was configured for
	// transmission over an insecure connection.
	errTransportCredentialsMissing = errors.New("grpc: the credentials require transport level security (use grpc.WithTransportCredentials() to set)")
)
2018-06-08 05:26:10 -04:00
// Default client-side size limits and buffer sizes.
const (
	// defaultClientMaxReceiveMessageSize is the default limit on the size of a
	// message received by the client: 4 MiB.
	defaultClientMaxReceiveMessageSize = 1024 * 1024 * 4
	// defaultClientMaxSendMessageSize is the default limit on the size of a
	// message sent by the client: math.MaxInt32.
	defaultClientMaxSendMessageSize = math.MaxInt32
	// defaultWriteBufSize is the default write buffer size, used for sending
	// frames: 32 KiB.
	defaultWriteBufSize = 32 * 1024
	// defaultReadBufSize is the default read buffer size: 32 KiB.
	defaultReadBufSize = 32 * 1024
)
2017-04-17 18:08:24 -04:00
// Dial creates a client connection to the given target. It is equivalent to
// calling DialContext with a background context.
func Dial(target string, opts ...DialOption) (*ClientConn, error) {
	ctx := context.Background()
	return DialContext(ctx, target, opts...)
}
2021-08-12 11:11:44 -04:00
// defaultConfigSelector selects per-RPC configuration by looking the method up
// in a single, fixed service config.
type defaultConfigSelector struct {
	// sc is the service config consulted by SelectConfig. It may be nil.
	sc *ServiceConfig
}
// SelectConfig returns an RPCConfig that carries the RPC's own context and the
// method config found for rpcInfo.Method in dcs.sc. The returned error is
// always nil.
func (dcs *defaultConfigSelector) SelectConfig(rpcInfo iresolver.RPCInfo) (*iresolver.RPCConfig, error) {
	rpcCfg := new(iresolver.RPCConfig)
	rpcCfg.Context = rpcInfo.Context
	rpcCfg.MethodConfig = getMethodConfig(dcs.sc, rpcInfo.Method)
	return rpcCfg, nil
}
2024-02-20 10:42:33 -05:00
// newClient returns a new client in idle mode.
func newClient ( target string , opts ... DialOption ) ( conn * ClientConn , err error ) {
2017-04-17 18:08:24 -04:00
cc := & ClientConn {
2023-09-19 10:37:37 -04:00
target : target ,
conns : make ( map [ * addrConn ] struct { } ) ,
dopts : defaultDialOptions ( ) ,
czData : new ( channelzData ) ,
}
2019-04-12 14:36:17 -04:00
cc . retryThrottler . Store ( ( * retryThrottler ) ( nil ) )
2021-08-12 11:11:44 -04:00
cc . safeConfigSelector . UpdateConfigSelector ( & defaultConfigSelector { nil } )
2017-04-17 18:08:24 -04:00
cc . ctx , cc . cancel = context . WithCancel ( context . Background ( ) )
2018-06-08 05:26:10 -04:00
2024-02-20 10:42:33 -05:00
// Apply dial options.
2023-09-19 10:37:37 -04:00
disableGlobalOpts := false
for _ , opt := range opts {
if _ , ok := opt . ( * disableGlobalDialOptions ) ; ok {
disableGlobalOpts = true
break
}
}
if ! disableGlobalOpts {
for _ , opt := range globalDialOptions {
opt . apply ( & cc . dopts )
}
2022-11-21 10:03:02 -05:00
}
2017-07-02 03:02:24 -04:00
for _ , opt := range opts {
2019-04-12 14:36:17 -04:00
opt . apply ( & cc . dopts )
2017-07-02 03:02:24 -04:00
}
2019-10-02 13:42:55 -04:00
chainUnaryClientInterceptors ( cc )
chainStreamClientInterceptors ( cc )
2023-09-19 10:37:37 -04:00
if err := cc . validateTransportCredentials ( ) ; err != nil {
return nil , err
2018-06-08 05:26:10 -04:00
}
2019-04-12 14:36:17 -04:00
if cc . dopts . defaultServiceConfigRawJSON != nil {
2020-04-16 10:34:35 -04:00
scpr := parseServiceConfig ( * cc . dopts . defaultServiceConfigRawJSON )
if scpr . Err != nil {
return nil , fmt . Errorf ( "%s: %v" , invalidDefaultServiceConfigErrPrefix , scpr . Err )
2019-04-12 14:36:17 -04:00
}
2020-04-16 10:34:35 -04:00
cc . dopts . defaultServiceConfig , _ = scpr . Config . ( * ServiceConfig )
2019-04-12 14:36:17 -04:00
}
2017-07-02 03:02:24 -04:00
cc . mkp = cc . dopts . copts . KeepaliveParams
2024-02-20 10:42:33 -05:00
// Register ClientConn with channelz.
cc . channelzRegistration ( target )
// TODO: Ideally it should be impossible to error from this function after
// channelz registration. This will require removing some channelz logs
// from the following functions that can error. Errors can be returned to
// the user, and successful logs can be emitted here, after the checks have
// passed and channelz is subsequently registered.
// Determine the resolver to use.
if err := cc . parseTargetAndFindResolver ( ) ; err != nil {
channelz . RemoveEntry ( cc . channelzID )
return nil , err
}
if err = cc . determineAuthority ( ) ; err != nil {
channelz . RemoveEntry ( cc . channelzID )
return nil , err
}
cc . csMgr = newConnectivityStateManager ( cc . ctx , cc . channelzID )
cc . pickerWrapper = newPickerWrapper ( cc . dopts . copts . StatsHandlers )
cc . initIdleStateLocked ( ) // Safe to call without the lock, since nothing else has a reference to cc.
cc . idlenessMgr = idle . NewManager ( ( * idler ) ( cc ) , cc . dopts . idleTimeout )
return cc , nil
}
// DialContext creates a client connection to the given target. By default, it's
// a non-blocking dial (the function won't wait for connections to be
// established, and connecting happens in the background). To make it a blocking
// dial, use WithBlock() dial option.
//
// In the non-blocking case, the ctx does not act against the connection. It
// only controls the setup steps.
//
// In the blocking case, ctx can be used to cancel or expire the pending
// connection. Once this function returns, the cancellation and expiration of
// ctx will be noop. Users should call ClientConn.Close to terminate all the
// pending operations after this function returns.
//
// The target name syntax is defined in
// https://github.com/grpc/grpc/blob/master/doc/naming.md.
// e.g. to use dns resolver, a "dns:///" prefix should be applied to the target.
func DialContext ( ctx context . Context , target string , opts ... DialOption ) ( conn * ClientConn , err error ) {
cc , err := newClient ( target , opts ... )
if err != nil {
return nil , err
}
// We start the channel off in idle mode, but kick it out of idle now,
// instead of waiting for the first RPC. Other gRPC implementations do wait
// for the first RPC to kick the channel out of idle. But doing so would be
// a major behavior change for our users who are used to seeing the channel
// active after Dial.
//
// Taking this approach of kicking it out of idle at the end of this method
// allows us to share the code between channel creation and exiting idle
// mode. This will also make it easy for us to switch to starting the
// channel off in idle, i.e. by making newClient exported.
defer func ( ) {
if err != nil {
cc . Close ( )
}
} ( )
// This creates the name resolver, load balancer, etc.
if err := cc . idlenessMgr . ExitIdleMode ( ) ; err != nil {
return nil , err
}
// Return now for non-blocking dials.
if ! cc . dopts . block {
return cc , nil
2017-07-02 03:02:24 -04:00
}
if cc . dopts . timeout > 0 {
var cancel context . CancelFunc
ctx , cancel = context . WithTimeout ( ctx , cc . dopts . timeout )
defer cancel ( )
}
2017-04-17 18:08:24 -04:00
defer func ( ) {
select {
case <- ctx . Done ( ) :
2021-08-12 11:11:44 -04:00
switch {
case ctx . Err ( ) == err :
conn = nil
case err == nil || ! cc . dopts . returnLastError :
conn , err = nil , ctx . Err ( )
default :
conn , err = nil , fmt . Errorf ( "%v: %v" , ctx . Err ( ) , err )
}
2017-04-17 18:08:24 -04:00
default :
}
} ( )
2023-09-19 10:37:37 -04:00
// A blocking dial blocks until the clientConn is ready.
for {
s := cc . GetState ( )
if s == connectivity . Idle {
cc . Connect ( )
}
if s == connectivity . Ready {
return cc , nil
} else if cc . dopts . copts . FailOnNonTempDialError && s == connectivity . TransientFailure {
if err = cc . connectionError ( ) ; err != nil {
terr , ok := err . ( interface {
Temporary ( ) bool
} )
if ok && ! terr . Temporary ( ) {
return nil , err
}
}
}
if ! cc . WaitForStateChange ( ctx , s ) {
// ctx got timeout or canceled.
if err = cc . connectionError ( ) ; err != nil && cc . dopts . returnLastError {
return nil , err
}
return nil , ctx . Err ( )
}
}
}
// addTraceEvent records an informational channelz trace event for this
// channel. When the channel has a channelz parent ID (i.e. it is a nested
// channel), a corresponding event is attached for the parent as well.
func (cc *ClientConn) addTraceEvent(msg string) {
	event := &channelz.TraceEventDesc{
		Severity: channelz.CtInfo,
		Desc:     fmt.Sprintf("Channel %s", msg),
	}
	if nested := cc.dopts.channelzParentID != nil; nested {
		event.Parent = &channelz.TraceEventDesc{
			Severity: channelz.CtInfo,
			Desc:     fmt.Sprintf("Nested channel(id:%d) %s", cc.channelzID.Int(), msg),
		}
	}
	channelz.AddTraceEvent(logger, cc.channelzID, 0, event)
}
2023-11-01 11:03:44 -04:00
// idler is ClientConn under a distinct type name. Its EnterIdleMode and
// ExitIdleMode methods forward to the ClientConn's unexported enterIdleMode
// and exitIdleMode; newClient hands (*idler)(cc) to idle.NewManager.
type idler ClientConn
2024-02-20 10:42:33 -05:00
func ( i * idler ) EnterIdleMode ( ) {
( * ClientConn ) ( i ) . enterIdleMode ( )
2023-11-01 11:03:44 -04:00
}
// ExitIdleMode forwards to the underlying ClientConn's exitIdleMode and
// returns its error.
func (i *idler) ExitIdleMode() error {
	cc := (*ClientConn)(i)
	return cc.exitIdleMode()
}
2023-09-19 10:37:37 -04:00
// exitIdleMode moves the channel out of idle mode by recreating the name
2024-02-20 10:42:33 -05:00
// resolver and load balancer. This should never be called directly; use
// cc.idlenessMgr.ExitIdleMode instead.
func ( cc * ClientConn ) exitIdleMode ( ) ( err error ) {
2023-09-19 10:37:37 -04:00
cc . mu . Lock ( )
if cc . conns == nil {
cc . mu . Unlock ( )
return errConnClosing
}
cc . mu . Unlock ( )
2018-06-08 05:26:10 -04:00
2023-09-19 10:37:37 -04:00
// This needs to be called without cc.mu because this builds a new resolver
2024-02-20 10:42:33 -05:00
// which might update state or report error inline, which would then need to
// acquire cc.mu.
if err := cc . resolverWrapper . start ( ) ; err != nil {
2023-09-19 10:37:37 -04:00
return err
2018-06-08 05:26:10 -04:00
}
2023-09-19 10:37:37 -04:00
2024-02-20 10:42:33 -05:00
cc . addTraceEvent ( "exiting idle mode" )
2023-09-19 10:37:37 -04:00
return nil
}
2024-02-20 10:42:33 -05:00
// initIdleStateLocked resets the state shared by "freshly created" and "just
// entered idle" channels: new resolver and balancer wrappers, a new
// first-resolve event, and an empty connection set.
func (cc *ClientConn) initIdleStateLocked() {
	cc.resolverWrapper = newCCResolverWrapper(cc)
	cc.balancerWrapper = newCCBalancerWrapper(cc)
	cc.firstResolveEvent = grpcsync.NewEvent()

	// A nil cc.conns stands for "the ClientConn is closed", so the map is
	// recreated here rather than set to nil. As a consequence nothing needs
	// to be done about it when exiting idle mode.
	cc.conns = make(map[*addrConn]struct{})
}
2023-09-19 10:37:37 -04:00
// enterIdleMode puts the channel in idle mode, and as part of it shuts down the
2024-02-20 10:42:33 -05:00
// name resolver, load balancer, and any subchannels. This should never be
// called directly; use cc.idlenessMgr.EnterIdleMode instead.
func ( cc * ClientConn ) enterIdleMode ( ) {
2019-04-12 14:36:17 -04:00
cc . mu . Lock ( )
2024-02-26 11:53:12 -05:00
2023-09-19 10:37:37 -04:00
if cc . conns == nil {
2024-02-20 10:42:33 -05:00
cc . mu . Unlock ( )
return
2023-09-19 10:37:37 -04:00
}
conns := cc . conns
2024-02-20 10:42:33 -05:00
rWrapper := cc . resolverWrapper
rWrapper . close ( )
cc . pickerWrapper . reset ( )
bWrapper := cc . balancerWrapper
bWrapper . close ( )
2023-09-19 10:37:37 -04:00
cc . csMgr . updateState ( connectivity . Idle )
2024-02-26 11:53:12 -05:00
cc . addTraceEvent ( "entering idle mode" )
2020-04-16 10:34:35 -04:00
2024-02-20 10:42:33 -05:00
cc . initIdleStateLocked ( )
2024-02-26 11:53:12 -05:00
2024-02-20 10:42:33 -05:00
cc . mu . Unlock ( )
// Block until the name resolver and LB policy are closed.
<- rWrapper . serializer . Done ( )
<- bWrapper . serializer . Done ( )
// Close all subchannels after the LB policy is closed.
for ac := range conns {
ac . tearDown ( errConnIdling )
}
2023-09-19 10:37:37 -04:00
}
// validateTransportCredentials performs a series of checks on the configured
// transport credentials. It returns a non-nil error if any of these conditions
// are met:
// - no transport creds and no creds bundle is configured
// - both transport creds and creds bundle are configured
// - creds bundle is configured, but it lacks a transport credentials
// - insecure transport creds configured alongside call creds that require
// transport level security
//
// If none of the above conditions are met, the configured credentials are
// deemed valid and a nil error is returned.
func ( cc * ClientConn ) validateTransportCredentials ( ) error {
if cc . dopts . copts . TransportCredentials == nil && cc . dopts . copts . CredsBundle == nil {
return errNoTransportSecurity
}
if cc . dopts . copts . TransportCredentials != nil && cc . dopts . copts . CredsBundle != nil {
return errTransportCredsAndBundle
}
if cc . dopts . copts . CredsBundle != nil && cc . dopts . copts . CredsBundle . TransportCredentials ( ) == nil {
return errNoTransportCredsInBundle
}
transportCreds := cc . dopts . copts . TransportCredentials
if transportCreds == nil {
transportCreds = cc . dopts . copts . CredsBundle . TransportCredentials ( )
}
if transportCreds . Info ( ) . SecurityProtocol == "insecure" {
for _ , cd := range cc . dopts . copts . PerRPCCredentials {
if cd . RequireTransportSecurity ( ) {
return errTransportCredentialsMissing
2018-06-08 05:26:10 -04:00
}
}
}
2023-09-19 10:37:37 -04:00
return nil
}
2018-06-08 05:26:10 -04:00
2023-09-19 10:37:37 -04:00
// channelzRegistration registers the newly created ClientConn with channelz and
// stores the returned identifier in `cc.channelzID` and `cc.csMgr.channelzID`.
// A channelz trace event is emitted for ClientConn creation. If the newly
// created ClientConn is a nested one, i.e a valid parent ClientConn ID is
// specified via a dial option, the trace event is also added to the parent.
//
// Doesn't grab cc.mu as this method is expected to be called only at Dial time.
func ( cc * ClientConn ) channelzRegistration ( target string ) {
cc . channelzID = channelz . RegisterChannel ( & channelzChannel { cc } , cc . dopts . channelzParentID , target )
cc . addTraceEvent ( "created" )
2017-04-17 18:08:24 -04:00
}
2019-10-02 13:42:55 -04:00
// chainUnaryClientInterceptors chains all unary client interceptors into one.
func chainUnaryClientInterceptors ( cc * ClientConn ) {
interceptors := cc . dopts . chainUnaryInts
// Prepend dopts.unaryInt to the chaining interceptors if it exists, since unaryInt will
// be executed before any other chained interceptors.
if cc . dopts . unaryInt != nil {
interceptors = append ( [ ] UnaryClientInterceptor { cc . dopts . unaryInt } , interceptors ... )
}
var chainedInt UnaryClientInterceptor
if len ( interceptors ) == 0 {
chainedInt = nil
} else if len ( interceptors ) == 1 {
chainedInt = interceptors [ 0 ]
} else {
2023-11-01 11:03:44 -04:00
chainedInt = func ( ctx context . Context , method string , req , reply any , cc * ClientConn , invoker UnaryInvoker , opts ... CallOption ) error {
2019-10-02 13:42:55 -04:00
return interceptors [ 0 ] ( ctx , method , req , reply , cc , getChainUnaryInvoker ( interceptors , 0 , invoker ) , opts ... )
}
}
cc . dopts . unaryInt = chainedInt
}
// getChainUnaryInvoker recursively generate the chained unary invoker.
func getChainUnaryInvoker ( interceptors [ ] UnaryClientInterceptor , curr int , finalInvoker UnaryInvoker ) UnaryInvoker {
if curr == len ( interceptors ) - 1 {
return finalInvoker
}
2023-11-01 11:03:44 -04:00
return func ( ctx context . Context , method string , req , reply any , cc * ClientConn , opts ... CallOption ) error {
2019-10-02 13:42:55 -04:00
return interceptors [ curr + 1 ] ( ctx , method , req , reply , cc , getChainUnaryInvoker ( interceptors , curr + 1 , finalInvoker ) , opts ... )
}
}
// chainStreamClientInterceptors collapses all configured stream client
// interceptors into one and stores it in cc.dopts.streamInt (nil when there
// are none).
func chainStreamClientInterceptors(cc *ClientConn) {
	chain := cc.dopts.chainStreamInts
	// dopts.streamInt, when set, goes to the front of the chain so that it
	// runs before any of the chained interceptors.
	if first := cc.dopts.streamInt; first != nil {
		chain = append([]StreamClientInterceptor{first}, chain...)
	}

	switch len(chain) {
	case 0:
		cc.dopts.streamInt = nil
	case 1:
		cc.dopts.streamInt = chain[0]
	default:
		cc.dopts.streamInt = func(ctx context.Context, desc *StreamDesc, conn *ClientConn, method string, streamer Streamer, opts ...CallOption) (ClientStream, error) {
			next := getChainStreamer(chain, 0, streamer)
			return chain[0](ctx, desc, conn, method, next, opts...)
		}
	}
}
// getChainStreamer recursively builds the streamer handed to
// interceptors[curr]: calling it runs interceptors[curr+1], which in turn
// receives the streamer for the position after it. For the last interceptor
// the streamer is finalStreamer itself.
func getChainStreamer(interceptors []StreamClientInterceptor, curr int, finalStreamer Streamer) Streamer {
	next := curr + 1
	if next == len(interceptors) {
		return finalStreamer
	}
	return func(ctx context.Context, desc *StreamDesc, cc *ClientConn, method string, opts ...CallOption) (ClientStream, error) {
		rest := getChainStreamer(interceptors, next, finalStreamer)
		return interceptors[next](ctx, desc, cc, method, rest, opts...)
	}
}
2023-11-01 11:03:44 -04:00
// newConnectivityStateManager creates a connectivityStateManager with the
// specified channelz id and a PubSub created from ctx.
func newConnectivityStateManager(ctx context.Context, id *channelz.Identifier) *connectivityStateManager {
	csm := new(connectivityStateManager)
	csm.channelzID = id
	csm.pubSub = grpcsync.NewPubSub(ctx)
	return csm
}
2018-06-08 05:26:10 -04:00
// connectivityStateManager keeps the connectivity.State of ClientConn.
// This struct will eventually be exported so the balancers can access it.
2023-11-01 11:03:44 -04:00
//
// TODO: If possible, get rid of the `connectivityStateManager` type, and
// provide this functionality using the `PubSub`, to avoid keeping track of
// the connectivity state at two places.
2018-06-08 05:26:10 -04:00
type connectivityStateManager struct {
mu sync . Mutex
state connectivity . State
notifyChan chan struct { }
2022-11-16 10:32:17 -05:00
channelzID * channelz . Identifier
2023-11-01 11:03:44 -04:00
pubSub * grpcsync . PubSub
2018-06-08 05:26:10 -04:00
}
2017-04-17 18:08:24 -04:00
2018-06-08 05:26:10 -04:00
// updateState updates the connectivity.State of ClientConn.
// If there's a change it notifies goroutines waiting on state change to
// happen.
func ( csm * connectivityStateManager ) updateState ( state connectivity . State ) {
csm . mu . Lock ( )
defer csm . mu . Unlock ( )
if csm . state == connectivity . Shutdown {
return
}
if csm . state == state {
return
}
csm . state = state
2023-11-01 11:03:44 -04:00
csm . pubSub . Publish ( state )
2021-08-12 11:11:44 -04:00
channelz . Infof ( logger , csm . channelzID , "Channel Connectivity change to %v" , state )
2018-06-08 05:26:10 -04:00
if csm . notifyChan != nil {
// There are other goroutines waiting on this channel.
close ( csm . notifyChan )
csm . notifyChan = nil
}
}
2017-04-17 18:08:24 -04:00
2018-06-08 05:26:10 -04:00
// getState returns the currently recorded connectivity state.
func (csm *connectivityStateManager) getState() connectivity.State {
	csm.mu.Lock()
	current := csm.state
	csm.mu.Unlock()
	return current
}
func ( csm * connectivityStateManager ) getNotifyChan ( ) <- chan struct { } {
csm . mu . Lock ( )
defer csm . mu . Unlock ( )
if csm . notifyChan == nil {
csm . notifyChan = make ( chan struct { } )
2017-04-17 18:08:24 -04:00
}
2018-06-08 05:26:10 -04:00
return csm . notifyChan
2017-04-17 18:08:24 -04:00
}
2020-04-16 10:34:35 -04:00
// ClientConnInterface defines the functions clients need to perform unary and
// streaming RPCs. It is implemented by *ClientConn, and is only intended to
// be referenced by generated code.
type ClientConnInterface interface {
// Invoke performs a unary RPC and returns after the response is received
// into reply.
2023-11-01 11:03:44 -04:00
Invoke ( ctx context . Context , method string , args any , reply any , opts ... CallOption ) error
2020-04-16 10:34:35 -04:00
// NewStream begins a streaming RPC.
NewStream ( ctx context . Context , desc * StreamDesc , method string , opts ... CallOption ) ( ClientStream , error )
}
// Compile-time assertion that *ClientConn implements ClientConnInterface.
var _ ClientConnInterface = ( * ClientConn ) ( nil )
// ClientConn represents a virtual connection to a conceptual endpoint, to
// perform RPCs.
//
// A ClientConn is free to have zero or more actual connections to the endpoint
// based on configuration, load, etc. It is also free to determine which actual
// endpoints to use and may change it every RPC, permitting client-side load
// balancing.
//
// A ClientConn encapsulates a range of functionality including name
// resolution, TCP connection establishment (with retries and backoff) and TLS
// handshakes. It also handles errors on established connections by
// re-resolving the name and reconnecting.
2017-04-17 18:08:24 -04:00
type ClientConn struct {
2022-11-16 10:32:17 -05:00
ctx context . Context // Initialized using the background context at dial time.
cancel context . CancelFunc // Cancelled on close.
// The following are initialized at dial time, and are read-only after that.
target string // User's dial target.
parsedTarget resolver . Target // See parseTargetAndFindResolver().
authority string // See determineAuthority().
dopts dialOptions // Default and user specified dial options.
channelzID * channelz . Identifier // Channelz identifier for the channel.
2023-09-19 10:37:37 -04:00
resolverBuilder resolver . Builder // See parseTargetAndFindResolver().
2024-02-20 10:42:33 -05:00
idlenessMgr * idle . Manager
2022-11-16 10:32:17 -05:00
// The following provide their own synchronization, and therefore don't
// require cc.mu to be held to access them.
csMgr * connectivityStateManager
2024-02-20 10:42:33 -05:00
pickerWrapper * pickerWrapper
2021-08-12 11:11:44 -04:00
safeConfigSelector iresolver . SafeConfigSelector
2022-11-16 10:32:17 -05:00
czData * channelzData
retryThrottler atomic . Value // Updated from service config.
2021-08-12 11:11:44 -04:00
2022-11-16 10:32:17 -05:00
// mu protects the following fields.
// TODO: split mu so the same mutex isn't used for everything.
mu sync . RWMutex
2024-02-20 10:42:33 -05:00
resolverWrapper * ccResolverWrapper // Always recreated whenever entering idle to simplify Close.
balancerWrapper * ccBalancerWrapper // Always recreated whenever entering idle to simplify Close.
2022-11-16 10:32:17 -05:00
sc * ServiceConfig // Latest service config received from the resolver.
conns map [ * addrConn ] struct { } // Set to nil on close.
mkp keepalive . ClientParameters // May be updated upon receipt of a GoAway.
2024-02-20 10:42:33 -05:00
// firstResolveEvent is used to track whether the name resolver sent us at
// least one update. RPCs block on this event. May be accessed without mu
// if we know we cannot be asked to enter idle mode while accessing it (e.g.
// when the idle manager has already been closed, or if we are already
// entering idle mode).
firstResolveEvent * grpcsync . Event
2021-08-12 11:11:44 -04:00
lceMu sync . Mutex // protects lastConnectionError
lastConnectionError error
2018-06-08 05:26:10 -04:00
}
// WaitForStateChange waits until the connectivity.State of ClientConn changes from sourceState or
// ctx expires. A true value is returned in former case and false in latter.
2021-08-12 11:11:44 -04:00
//
2023-07-19 18:26:26 -04:00
// # Experimental
2021-08-12 11:11:44 -04:00
//
// Notice: This API is EXPERIMENTAL and may be changed or removed in a
// later release.
2018-06-08 05:26:10 -04:00
func ( cc * ClientConn ) WaitForStateChange ( ctx context . Context , sourceState connectivity . State ) bool {
ch := cc . csMgr . getNotifyChan ( )
if cc . csMgr . getState ( ) != sourceState {
return true
2017-04-17 18:08:24 -04:00
}
2018-06-08 05:26:10 -04:00
select {
case <- ctx . Done ( ) :
return false
case <- ch :
return true
}
}
// GetState returns the connectivity.State of ClientConn.
2021-08-12 11:11:44 -04:00
//
2023-07-19 18:26:26 -04:00
// # Experimental
2021-08-12 11:11:44 -04:00
//
2022-03-24 08:21:41 -04:00
// Notice: This API is EXPERIMENTAL and may be changed or removed in a later
// release.
2018-06-08 05:26:10 -04:00
func ( cc * ClientConn ) GetState ( ) connectivity . State {
return cc . csMgr . getState ( )
2017-04-17 18:08:24 -04:00
}
2022-03-24 08:21:41 -04:00
// Connect causes all subchannels in the ClientConn to attempt to connect if
// the channel is idle. Does not wait for the connection attempts to begin
// before returning.
//
2023-07-19 18:26:26 -04:00
// # Experimental
2022-03-24 08:21:41 -04:00
//
// Notice: This API is EXPERIMENTAL and may be changed or removed in a later
// release.
func ( cc * ClientConn ) Connect ( ) {
2024-02-20 10:42:33 -05:00
if err := cc . idlenessMgr . ExitIdleMode ( ) ; err != nil {
cc . addTraceEvent ( err . Error ( ) )
return
}
2023-09-19 10:37:37 -04:00
// If the ClientConn was not in idle mode, we need to call ExitIdle on the
// LB policy so that connections can be created.
2024-02-20 10:42:33 -05:00
cc . mu . Lock ( )
cc . balancerWrapper . exitIdle ( )
cc . mu . Unlock ( )
2017-07-02 03:02:24 -04:00
}
2019-04-12 14:36:17 -04:00
// waitForResolvedAddrs blocks until firstResolveEvent has fired, i.e. until
// the first update from the name resolver has been handled. It returns nil in
// that case. If ctx is done first it returns a status error derived from
// ctx.Err(); if the ClientConn's own context is done first it returns
// ErrClientConnClosing.
func (cc *ClientConn) waitForResolvedAddrs(ctx context.Context) error {
	// This is on the RPC path: checking HasFired first avoids the
	// more-expensive "select" below once the resolver has returned once.
	if cc.firstResolveEvent.HasFired() {
		return nil
	}

	select {
	case <-cc.ctx.Done():
		return ErrClientConnClosing
	case <-ctx.Done():
		return status.FromContextError(ctx.Err()).Err()
	case <-cc.firstResolveEvent.Done():
		return nil
	}
}
2020-04-16 10:34:35 -04:00
var emptyServiceConfig * ServiceConfig
func init ( ) {
cfg := parseServiceConfig ( "{}" )
if cfg . Err != nil {
panic ( fmt . Sprintf ( "impossible error parsing empty service config: %v" , cfg . Err ) )
}
emptyServiceConfig = cfg . Config . ( * ServiceConfig )
2023-11-01 11:03:44 -04:00
internal . SubscribeToConnectivityStateChanges = func ( cc * ClientConn , s grpcsync . Subscriber ) func ( ) {
return cc . csMgr . pubSub . Subscribe ( s )
}
2024-02-20 10:42:33 -05:00
internal . EnterIdleModeForTesting = func ( cc * ClientConn ) {
cc . idlenessMgr . EnterIdleModeForTesting ( )
2024-02-26 11:53:12 -05:00
}
internal . ExitIdleModeForTesting = func ( cc * ClientConn ) error {
2024-02-20 10:42:33 -05:00
return cc . idlenessMgr . ExitIdleMode ( )
2024-02-26 11:53:12 -05:00
}
2020-04-16 10:34:35 -04:00
}
func ( cc * ClientConn ) maybeApplyDefaultServiceConfig ( addrs [ ] resolver . Address ) {
if cc . sc != nil {
2021-08-12 11:11:44 -04:00
cc . applyServiceConfigAndBalancer ( cc . sc , nil , addrs )
2020-04-16 10:34:35 -04:00
return
}
if cc . dopts . defaultServiceConfig != nil {
2021-08-12 11:11:44 -04:00
cc . applyServiceConfigAndBalancer ( cc . dopts . defaultServiceConfig , & defaultConfigSelector { cc . dopts . defaultServiceConfig } , addrs )
2020-04-16 10:34:35 -04:00
} else {
2021-08-12 11:11:44 -04:00
cc . applyServiceConfigAndBalancer ( emptyServiceConfig , & defaultConfigSelector { emptyServiceConfig } , addrs )
2020-04-16 10:34:35 -04:00
}
}
2024-02-20 10:42:33 -05:00
func ( cc * ClientConn ) updateResolverStateAndUnlock ( s resolver . State , err error ) error {
2020-04-16 10:34:35 -04:00
defer cc . firstResolveEvent . Fire ( )
2019-04-12 14:36:17 -04:00
// Check if the ClientConn is already closed. Some fields (e.g.
// balancerWrapper) are set to nil when closing the ClientConn, and could
// cause nil pointer panic if we don't have this check.
2018-06-08 05:26:10 -04:00
if cc . conns == nil {
2020-04-16 10:34:35 -04:00
cc . mu . Unlock ( )
2019-04-12 14:36:17 -04:00
return nil
2017-04-17 18:08:24 -04:00
}
2018-06-08 05:26:10 -04:00
2020-04-16 10:34:35 -04:00
if err != nil {
// May need to apply the initial service config in case the resolver
// doesn't support service configs, or doesn't provide a service config
// with the new addresses.
cc . maybeApplyDefaultServiceConfig ( nil )
2022-11-16 10:32:17 -05:00
cc . balancerWrapper . resolverError ( err )
2020-04-16 10:34:35 -04:00
// No addresses are valid with err set; return early.
cc . mu . Unlock ( )
return balancer . ErrBadResolverState
2019-04-12 14:36:17 -04:00
}
2018-06-08 05:26:10 -04:00
2020-04-16 10:34:35 -04:00
var ret error
2022-03-24 08:21:41 -04:00
if cc . dopts . disableServiceConfig {
channelz . Infof ( logger , cc . channelzID , "ignoring service config from resolver (%v) and applying the default because service config is disabled" , s . ServiceConfig )
cc . maybeApplyDefaultServiceConfig ( s . Addresses )
} else if s . ServiceConfig == nil {
2020-04-16 10:34:35 -04:00
cc . maybeApplyDefaultServiceConfig ( s . Addresses )
// TODO: do we need to apply a failing LB policy if there is no
// default, per the error handling design?
} else {
if sc , ok := s . ServiceConfig . Config . ( * ServiceConfig ) ; s . ServiceConfig . Err == nil && ok {
2021-08-12 11:11:44 -04:00
configSelector := iresolver . GetConfigSelector ( s )
if configSelector != nil {
if len ( s . ServiceConfig . Config . ( * ServiceConfig ) . Methods ) != 0 {
channelz . Infof ( logger , cc . channelzID , "method configs in service config will be ignored due to presence of config selector" )
}
} else {
configSelector = & defaultConfigSelector { sc }
}
cc . applyServiceConfigAndBalancer ( sc , configSelector , s . Addresses )
2018-06-08 05:26:10 -04:00
} else {
2020-04-16 10:34:35 -04:00
ret = balancer . ErrBadResolverState
2022-11-16 10:32:17 -05:00
if cc . sc == nil {
// Apply the failing LB only if we haven't received valid service config
// from the name resolver in the past.
2024-02-20 10:42:33 -05:00
cc . applyFailingLBLocked ( s . ServiceConfig )
2020-04-16 10:34:35 -04:00
cc . mu . Unlock ( )
return ret
2019-10-02 13:42:55 -04:00
}
2017-04-17 18:08:24 -04:00
}
}
2018-06-08 05:26:10 -04:00
2020-04-16 10:34:35 -04:00
var balCfg serviceconfig . LoadBalancingConfig
2022-11-16 10:32:17 -05:00
if cc . sc != nil && cc . sc . lbConfig != nil {
2020-04-16 10:34:35 -04:00
balCfg = cc . sc . lbConfig . cfg
}
bw := cc . balancerWrapper
cc . mu . Unlock ( )
2022-11-16 10:32:17 -05:00
2020-04-16 10:34:35 -04:00
uccsErr := bw . updateClientConnState ( & balancer . ClientConnState { ResolverState : s , BalancerConfig : balCfg } )
if ret == nil {
ret = uccsErr // prefer ErrBadResolver state since any other error is
// currently meaningless to the caller.
}
return ret
2018-06-08 05:26:10 -04:00
}
2024-02-20 10:42:33 -05:00
// applyFailingLBLocked is akin to configuring an LB policy on the channel which
2022-11-16 10:32:17 -05:00
// always fails RPCs. Here, an actual LB policy is not configured, but an always
// erroring picker is configured, which returns errors with information about
// what was invalid in the received service config. A config selector with no
// service config is configured, and the connectivity state of the channel is
// set to TransientFailure.
2024-02-20 10:42:33 -05:00
func ( cc * ClientConn ) applyFailingLBLocked ( sc * serviceconfig . ParseResult ) {
2022-11-16 10:32:17 -05:00
var err error
if sc . Err != nil {
err = status . Errorf ( codes . Unavailable , "error parsing service config: %v" , sc . Err )
2021-08-12 11:11:44 -04:00
} else {
2022-11-16 10:32:17 -05:00
err = status . Errorf ( codes . Unavailable , "illegal service config type: %T" , sc . Config )
2018-06-08 05:26:10 -04:00
}
2022-11-16 10:32:17 -05:00
cc . safeConfigSelector . UpdateConfigSelector ( & defaultConfigSelector { nil } )
2024-02-20 10:42:33 -05:00
cc . pickerWrapper . updatePicker ( base . NewErrPicker ( err ) )
2022-11-16 10:32:17 -05:00
cc . csMgr . updateState ( connectivity . TransientFailure )
2018-06-08 05:26:10 -04:00
}
2023-11-01 11:03:44 -04:00
// copyAddressesWithoutBalancerAttributes returns a new slice holding a copy of
// every address in in, with the BalancerAttributes field of each copy set to
// nil. The input slice is left untouched.
//
// Addresses are passed during subconn creation and address update operations.
// Clearing the balancer attributes in both cases is what allows the Equal
// method provided by resolver.Address to be used for comparison.
func copyAddressesWithoutBalancerAttributes(in []resolver.Address) []resolver.Address {
	out := make([]resolver.Address, len(in))
	copy(out, in)
	for i := range out {
		out[i].BalancerAttributes = nil
	}
	return out
}
2024-02-20 10:42:33 -05:00
// newAddrConnLocked creates an addrConn for addrs and adds it to cc.conns.
2018-06-08 05:26:10 -04:00
//
// Caller needs to make sure len(addrs) > 0.
2024-02-20 10:42:33 -05:00
func ( cc * ClientConn ) newAddrConnLocked ( addrs [ ] resolver . Address , opts balancer . NewSubConnOptions ) ( * addrConn , error ) {
if cc . conns == nil {
return nil , ErrClientConnClosing
}
2018-06-08 05:26:10 -04:00
ac := & addrConn {
2021-08-12 11:11:44 -04:00
state : connectivity . Idle ,
2019-04-12 14:36:17 -04:00
cc : cc ,
2023-11-01 11:03:44 -04:00
addrs : copyAddressesWithoutBalancerAttributes ( addrs ) ,
2019-04-12 14:36:17 -04:00
scopts : opts ,
dopts : cc . dopts ,
czData : new ( channelzData ) ,
resetBackoff : make ( chan struct { } ) ,
2023-09-19 10:37:37 -04:00
stateChan : make ( chan struct { } ) ,
2018-06-08 05:26:10 -04:00
}
ac . ctx , ac . cancel = context . WithCancel ( cc . ctx )
2022-11-16 10:32:17 -05:00
var err error
ac . channelzID , err = channelz . RegisterSubChannel ( ac , cc . channelzID , "" )
if err != nil {
return nil , err
2017-04-17 18:08:24 -04:00
}
2022-11-16 10:32:17 -05:00
channelz . AddTraceEvent ( logger , ac . channelzID , 0 , & channelz . TraceEventDesc {
Desc : "Subchannel created" ,
Severity : channelz . CtInfo ,
Parent : & channelz . TraceEventDesc {
Desc : fmt . Sprintf ( "Subchannel(id:%d) created" , ac . channelzID . Int ( ) ) ,
Severity : channelz . CtInfo ,
} ,
} )
2024-02-20 10:42:33 -05:00
// Track ac in cc. This needs to be done before any getTransport(...) is called.
2018-06-08 05:26:10 -04:00
cc . conns [ ac ] = struct { } { }
return ac , nil
}
// removeAddrConn stops tracking ac in cc.conns and then tears ac down with the
// given error. The teardown happens after cc.mu has been released.
//
// It is a no-op (ac is not torn down) when the ClientConn has already been
// closed, i.e. cc.conns is nil.
func (cc *ClientConn) removeAddrConn(ac *addrConn, err error) {
	cc.mu.Lock()
	closed := cc.conns == nil
	if !closed {
		delete(cc.conns, ac)
	}
	cc.mu.Unlock()

	if closed {
		return
	}
	ac.tearDown(err)
}
2019-04-12 14:36:17 -04:00
func ( cc * ClientConn ) channelzMetric ( ) * channelz . ChannelInternalMetric {
2018-06-08 05:26:10 -04:00
return & channelz . ChannelInternalMetric {
2019-04-12 14:36:17 -04:00
State : cc . GetState ( ) ,
2018-06-08 05:26:10 -04:00
Target : cc . target ,
2019-04-12 14:36:17 -04:00
CallsStarted : atomic . LoadInt64 ( & cc . czData . callsStarted ) ,
CallsSucceeded : atomic . LoadInt64 ( & cc . czData . callsSucceeded ) ,
CallsFailed : atomic . LoadInt64 ( & cc . czData . callsFailed ) ,
LastCallStartedTimestamp : time . Unix ( 0 , atomic . LoadInt64 ( & cc . czData . lastCallStartedTime ) ) ,
2018-06-08 05:26:10 -04:00
}
}
2019-04-12 14:36:17 -04:00
// Target returns the target string of the ClientConn.
2021-08-12 11:11:44 -04:00
//
2023-07-19 18:26:26 -04:00
// # Experimental
2021-08-12 11:11:44 -04:00
//
// Notice: This API is EXPERIMENTAL and may be changed or removed in a
// later release.
2019-04-12 14:36:17 -04:00
func ( cc * ClientConn ) Target ( ) string {
return cc . target
}
2018-06-08 05:26:10 -04:00
func ( cc * ClientConn ) incrCallsStarted ( ) {
2019-04-12 14:36:17 -04:00
atomic . AddInt64 ( & cc . czData . callsStarted , 1 )
atomic . StoreInt64 ( & cc . czData . lastCallStartedTime , time . Now ( ) . UnixNano ( ) )
2018-06-08 05:26:10 -04:00
}
func ( cc * ClientConn ) incrCallsSucceeded ( ) {
2019-04-12 14:36:17 -04:00
atomic . AddInt64 ( & cc . czData . callsSucceeded , 1 )
2018-06-08 05:26:10 -04:00
}
func ( cc * ClientConn ) incrCallsFailed ( ) {
2019-04-12 14:36:17 -04:00
atomic . AddInt64 ( & cc . czData . callsFailed , 1 )
2018-06-08 05:26:10 -04:00
}
2019-04-12 14:36:17 -04:00
// connect starts creating a transport.
2018-06-08 05:26:10 -04:00
// It does nothing if the ac is not IDLE.
// TODO(bar) Move this to the addrConn section.
func ( ac * addrConn ) connect ( ) error {
ac . mu . Lock ( )
if ac . state == connectivity . Shutdown {
2023-07-19 18:26:26 -04:00
if logger . V ( 2 ) {
logger . Infof ( "connect called on shutdown addrConn; ignoring." )
}
2018-06-08 05:26:10 -04:00
ac . mu . Unlock ( )
return errConnClosing
2017-04-17 18:08:24 -04:00
}
2018-06-08 05:26:10 -04:00
if ac . state != connectivity . Idle {
2023-07-19 18:26:26 -04:00
if logger . V ( 2 ) {
logger . Infof ( "connect called on addrConn in non-idle state (%v); ignoring." , ac . state )
}
2018-06-08 05:26:10 -04:00
ac . mu . Unlock ( )
return nil
}
ac . mu . Unlock ( )
2022-03-24 08:21:41 -04:00
ac . resetTransport ( )
2017-04-17 18:08:24 -04:00
return nil
}
2022-11-16 10:32:17 -05:00
// equalAddresses reports whether a and b have the same length and every
// address in a is Equal to the address at the same index in b. Order matters.
func equalAddresses(a, b []resolver.Address) bool {
	if len(a) != len(b) {
		return false
	}
	for i := range a {
		if !a[i].Equal(b[i]) {
			return false
		}
	}
	return true
}
2023-09-19 10:37:37 -04:00
// updateAddrs updates ac.addrs with the new addresses list and handles active
// connections or connection attempts.
func ( ac * addrConn ) updateAddrs ( addrs [ ] resolver . Address ) {
2018-06-08 05:26:10 -04:00
ac . mu . Lock ( )
2023-11-01 11:03:44 -04:00
channelz . Infof ( logger , ac . channelzID , "addrConn: updateAddrs curAddr: %v, addrs: %v" , pretty . ToJSON ( ac . curAddr ) , pretty . ToJSON ( addrs ) )
2023-09-19 10:37:37 -04:00
2023-11-01 11:03:44 -04:00
addrs = copyAddressesWithoutBalancerAttributes ( addrs )
2023-09-19 10:37:37 -04:00
if equalAddresses ( ac . addrs , addrs ) {
ac . mu . Unlock ( )
return
}
ac . addrs = addrs
2019-10-02 13:42:55 -04:00
if ac . state == connectivity . Shutdown ||
ac . state == connectivity . TransientFailure ||
ac . state == connectivity . Idle {
2023-09-19 10:37:37 -04:00
// We were not connecting, so do nothing but update the addresses.
ac . mu . Unlock ( )
return
2018-06-08 05:26:10 -04:00
}
2017-07-02 03:02:24 -04:00
2023-09-19 10:37:37 -04:00
if ac . state == connectivity . Ready {
// Try to find the connected address.
for _ , a := range addrs {
a . ServerName = ac . cc . getServerName ( a )
if a . Equal ( ac . curAddr ) {
// We are connected to a valid address, so do nothing but
// update the addresses.
ac . mu . Unlock ( )
return
}
}
2022-11-16 10:32:17 -05:00
}
2023-09-19 10:37:37 -04:00
// We are either connected to the wrong address or currently connecting.
// Stop the current iteration and restart.
2019-04-12 14:36:17 -04:00
2023-09-19 10:37:37 -04:00
ac . cancel ( )
ac . ctx , ac . cancel = context . WithCancel ( ac . cc . ctx )
2023-11-01 11:03:44 -04:00
// We have to defer here because GracefulClose => onClose, which requires
// locking ac.mu.
2023-09-19 10:37:37 -04:00
if ac . transport != nil {
defer ac . transport . GracefulClose ( )
ac . transport = nil
2017-04-17 18:08:24 -04:00
}
2023-09-19 10:37:37 -04:00
if len ( addrs ) == 0 {
ac . updateConnectivityState ( connectivity . Idle , nil )
2018-06-08 05:26:10 -04:00
}
2023-09-19 10:37:37 -04:00
ac . mu . Unlock ( )
// Since we were connecting/connected, we should start a new connection
// attempt.
go ac . resetTransport ( )
2018-06-08 05:26:10 -04:00
}
2022-03-24 08:21:41 -04:00
// getServerName determines the serverName to be used in the connection
// handshake for addr. Precedence, highest first:
//  1. the authority override given through the WithAuthority dial option;
//  2. the per-address override in resolver.Address.ServerName, set by the
//     name resolver;
//  3. the authority of the ClientConn.
//
// The user-specified override wins over the resolver's because per-address
// authority overrides coming from a name resolver can represent a security
// risk, while an override specified by the user is more dependable since they
// probably know what they are doing.
func (cc *ClientConn) getServerName(addr resolver.Address) string {
	switch {
	case cc.dopts.authority != "":
		return cc.dopts.authority
	case addr.ServerName != "":
		return addr.ServerName
	default:
		return cc.authority
	}
}
2021-08-12 11:11:44 -04:00
// getMethodConfig looks up the MethodConfig for method in sc. Keys are tried
// in this order and the first one present wins:
//  1. the full method name;
//  2. the method name truncated just after its last "/" (the empty string
//     when method contains no "/");
//  3. the empty string.
//
// A nil sc, or no match at all, yields the zero MethodConfig.
func getMethodConfig(sc *ServiceConfig, method string) MethodConfig {
	if sc == nil {
		return MethodConfig{}
	}
	servicePrefix := method[:strings.LastIndex(method, "/")+1]
	for _, key := range [...]string{method, servicePrefix} {
		if mc, found := sc.Methods[key]; found {
			return mc
		}
	}
	return sc.Methods[""]
}
2018-06-08 05:26:10 -04:00
// GetMethodConfig gets the method config of the input method.
// If there's an exact match for input method (i.e. /service/method), we return
// the corresponding MethodConfig.
2021-08-12 11:11:44 -04:00
// If there isn't an exact match for the input method, we look for the service's default
// config under the service (i.e /service/) and then for the default for all services (empty string).
//
// If there is a default MethodConfig for the service, we return it.
2018-06-08 05:26:10 -04:00
// Otherwise, we return an empty MethodConfig.
func ( cc * ClientConn ) GetMethodConfig ( method string ) MethodConfig {
// TODO: Avoid the locking here.
cc . mu . RLock ( )
defer cc . mu . RUnlock ( )
2021-08-12 11:11:44 -04:00
return getMethodConfig ( cc . sc , method )
2018-06-08 05:26:10 -04:00
}
2019-04-12 14:36:17 -04:00
// healthCheckConfig returns the health check config of the service config
// currently applied to cc, or nil when no service config has been applied.
// cc.mu is held for reading while the config is fetched.
func (cc *ClientConn) healthCheckConfig() *healthCheckConfig {
	cc.mu.RLock()
	defer cc.mu.RUnlock()
	if sc := cc.sc; sc != nil {
		return sc.healthCheckConfig
	}
	return nil
}
2023-07-19 18:26:26 -04:00
func ( cc * ClientConn ) getTransport ( ctx context . Context , failfast bool , method string ) ( transport . ClientTransport , balancer . PickResult , error ) {
2024-02-20 10:42:33 -05:00
return cc . pickerWrapper . pick ( ctx , failfast , balancer . PickInfo {
2020-04-16 10:34:35 -04:00
Ctx : ctx ,
2019-04-12 14:36:17 -04:00
FullMethodName : method ,
} )
2018-06-08 05:26:10 -04:00
}
2021-08-12 11:11:44 -04:00
func ( cc * ClientConn ) applyServiceConfigAndBalancer ( sc * ServiceConfig , configSelector iresolver . ConfigSelector , addrs [ ] resolver . Address ) {
2019-04-12 14:36:17 -04:00
if sc == nil {
// should never reach here.
2020-04-16 10:34:35 -04:00
return
2017-04-17 18:08:24 -04:00
}
2018-06-08 05:26:10 -04:00
cc . sc = sc
2021-08-12 11:11:44 -04:00
if configSelector != nil {
cc . safeConfigSelector . UpdateConfigSelector ( configSelector )
}
2018-06-08 05:26:10 -04:00
2019-04-12 14:36:17 -04:00
if cc . sc . retryThrottling != nil {
newThrottler := & retryThrottler {
tokens : cc . sc . retryThrottling . MaxTokens ,
max : cc . sc . retryThrottling . MaxTokens ,
thresh : cc . sc . retryThrottling . MaxTokens / 2 ,
ratio : cc . sc . retryThrottling . TokenRatio ,
2017-04-17 18:08:24 -04:00
}
2019-04-12 14:36:17 -04:00
cc . retryThrottler . Store ( newThrottler )
} else {
cc . retryThrottler . Store ( ( * retryThrottler ) ( nil ) )
2018-06-08 05:26:10 -04:00
}
2022-11-16 10:32:17 -05:00
var newBalancerName string
2023-11-01 11:03:44 -04:00
if cc . sc == nil || ( cc . sc . lbConfig == nil && cc . sc . LB == nil ) {
// No service config or no LB policy specified in config.
newBalancerName = PickFirstBalancerName
} else if cc . sc . lbConfig != nil {
2022-11-16 10:32:17 -05:00
newBalancerName = cc . sc . lbConfig . name
2023-11-01 11:03:44 -04:00
} else { // cc.sc.LB != nil
newBalancerName = * cc . sc . LB
2020-04-16 10:34:35 -04:00
}
2022-11-16 10:32:17 -05:00
cc . balancerWrapper . switchTo ( newBalancerName )
2018-06-08 05:26:10 -04:00
}
2020-04-16 10:34:35 -04:00
func ( cc * ClientConn ) resolveNow ( o resolver . ResolveNowOptions ) {
2019-04-12 14:36:17 -04:00
cc . mu . RLock ( )
2024-02-20 10:42:33 -05:00
cc . resolverWrapper . resolveNow ( o )
2019-04-12 14:36:17 -04:00
cc . mu . RUnlock ( )
2024-02-20 10:42:33 -05:00
}
func ( cc * ClientConn ) resolveNowLocked ( o resolver . ResolveNowOptions ) {
cc . resolverWrapper . resolveNow ( o )
2017-04-17 18:08:24 -04:00
}
2019-04-12 14:36:17 -04:00
// ResetConnectBackoff wakes up all subchannels in transient failure and causes
// them to attempt another connection immediately. It also resets the backoff
// times used for subsequent attempts regardless of the current state.
//
// In general, this function should not be used. Typical service or network
// outages result in a reasonable client reconnection strategy by default.
// However, if a previously unavailable network becomes available, this may be
// used to trigger an immediate reconnect.
//
2023-07-19 18:26:26 -04:00
// # Experimental
2021-08-12 11:11:44 -04:00
//
// Notice: This API is EXPERIMENTAL and may be changed or removed in a
// later release.
2019-04-12 14:36:17 -04:00
func ( cc * ClientConn ) ResetConnectBackoff ( ) {
cc . mu . Lock ( )
2020-04-16 10:34:35 -04:00
conns := cc . conns
cc . mu . Unlock ( )
for ac := range conns {
2019-04-12 14:36:17 -04:00
ac . resetConnectBackoff ( )
}
}
2017-04-17 18:08:24 -04:00
// Close tears down the ClientConn and all underlying connections.
func ( cc * ClientConn ) Close ( ) error {
2023-11-01 11:03:44 -04:00
defer func ( ) {
cc . cancel ( )
<- cc . csMgr . pubSub . Done ( )
} ( )
2017-04-17 18:08:24 -04:00
2024-02-20 10:42:33 -05:00
// Prevent calls to enter/exit idle immediately, and ensure we are not
// currently entering/exiting idle mode.
cc . idlenessMgr . Close ( )
2017-04-17 18:08:24 -04:00
cc . mu . Lock ( )
if cc . conns == nil {
cc . mu . Unlock ( )
return ErrClientConnClosing
}
2023-09-19 10:37:37 -04:00
2017-04-17 18:08:24 -04:00
conns := cc . conns
cc . conns = nil
2018-06-08 05:26:10 -04:00
cc . csMgr . updateState ( connectivity . Shutdown )
2024-02-20 10:42:33 -05:00
// We can safely unlock and continue to access all fields now as
// cc.conns==nil, preventing any further operations on cc.
2017-04-17 18:08:24 -04:00
cc . mu . Unlock ( )
2018-06-08 05:26:10 -04:00
2024-02-20 10:42:33 -05:00
cc . resolverWrapper . close ( )
2022-11-16 10:32:17 -05:00
// The order of closing matters here since the balancer wrapper assumes the
// picker is closed before it is closed.
2024-02-20 10:42:33 -05:00
cc . pickerWrapper . close ( )
cc . balancerWrapper . close ( )
<- cc . resolverWrapper . serializer . Done ( )
<- cc . balancerWrapper . serializer . Done ( )
2018-06-08 05:26:10 -04:00
for ac := range conns {
2017-04-17 18:08:24 -04:00
ac . tearDown ( ErrClientConnClosing )
}
2023-09-19 10:37:37 -04:00
cc . addTraceEvent ( "deleted" )
2022-11-16 10:32:17 -05:00
// TraceEvent needs to be called before RemoveEntry, as TraceEvent may add
// trace reference to the entity being deleted, and thus prevent it from being
// deleted right away.
channelz . RemoveEntry ( cc . channelzID )
2017-04-17 18:08:24 -04:00
return nil
}
// addrConn is a network connection to a given address.
type addrConn struct {
ctx context . Context
cancel context . CancelFunc
cc * ClientConn
dopts dialOptions
2024-02-20 10:42:33 -05:00
acbw * acBalancerWrapper
2019-04-12 14:36:17 -04:00
scopts balancer . NewSubConnOptions
// transport is set when there's a viable transport (note: ac state may not be READY as LB channel
// health checking may require server to report healthy to set ac to READY), and is reset
// to nil when the current transport should no longer be used to create a stream (e.g. after GoAway
// is received, transport is closed, ac has been torn down).
transport transport . ClientTransport // The current transport.
mu sync . Mutex
curAddr resolver . Address // The current address.
addrs [ ] resolver . Address // All addresses that the resolver resolved to.
// Use updateConnectivityState for updating addrConn's connectivity state.
2023-09-19 10:37:37 -04:00
state connectivity . State
stateChan chan struct { } // closed and recreated on every state change.
2019-04-12 14:36:17 -04:00
backoffIdx int // Needs to be stateful for resetConnectBackoff.
resetBackoff chan struct { }
2017-04-17 18:08:24 -04:00
2022-11-16 10:32:17 -05:00
channelzID * channelz . Identifier
2019-04-12 14:36:17 -04:00
czData * channelzData
}
// Note: this requires a lock on ac.mu.
2020-04-16 10:34:35 -04:00
func ( ac * addrConn ) updateConnectivityState ( s connectivity . State , lastErr error ) {
2019-04-12 14:36:17 -04:00
if ac . state == s {
return
}
2023-09-19 10:37:37 -04:00
// When changing states, reset the state change channel.
close ( ac . stateChan )
ac . stateChan = make ( chan struct { } )
2019-04-12 14:36:17 -04:00
ac . state = s
2023-09-19 10:37:37 -04:00
if lastErr == nil {
channelz . Infof ( logger , ac . channelzID , "Subchannel Connectivity change to %v" , s )
} else {
channelz . Infof ( logger , ac . channelzID , "Subchannel Connectivity change to %v, last error: %s" , s , lastErr )
}
2024-02-20 10:42:33 -05:00
ac . acbw . updateState ( s , lastErr )
2017-04-17 18:08:24 -04:00
}
2017-07-02 03:02:24 -04:00
// adjustParams updates parameters used to create transports upon
// receiving a GoAway.
func ( ac * addrConn ) adjustParams ( r transport . GoAwayReason ) {
switch r {
2018-06-08 05:26:10 -04:00
case transport . GoAwayTooManyPings :
2017-07-02 03:02:24 -04:00
v := 2 * ac . dopts . copts . KeepaliveParams . Time
ac . cc . mu . Lock ( )
if v > ac . cc . mkp . Time {
ac . cc . mkp . Time = v
}
ac . cc . mu . Unlock ( )
}
}
2019-04-12 14:36:17 -04:00
func ( ac * addrConn ) resetTransport ( ) {
2022-03-24 08:21:41 -04:00
ac . mu . Lock ( )
2023-09-19 10:37:37 -04:00
acCtx := ac . ctx
if acCtx . Err ( ) != nil {
2022-03-24 08:21:41 -04:00
ac . mu . Unlock ( )
return
}
addrs := ac . addrs
backoffFor := ac . dopts . bs . Backoff ( ac . backoffIdx )
// This will be the duration that dial gets to finish.
dialDuration := minConnectTimeout
if ac . dopts . minConnectTimeout != nil {
dialDuration = ac . dopts . minConnectTimeout ( )
}
2017-04-17 18:08:24 -04:00
2022-03-24 08:21:41 -04:00
if dialDuration < backoffFor {
// Give dial more time as we keep failing to connect.
dialDuration = backoffFor
}
// We can potentially spend all the time trying the first address, and
// if the server accepts the connection and then hangs, the following
// addresses will never be tried.
//
// The spec doesn't mention what should be done for multiple addresses.
// https://github.com/grpc/grpc/blob/master/doc/connection-backoff.md#proposed-backoff-algorithm
connectDeadline := time . Now ( ) . Add ( dialDuration )
ac . updateConnectivityState ( connectivity . Connecting , nil )
ac . mu . Unlock ( )
2023-09-19 10:37:37 -04:00
if err := ac . tryAllAddrs ( acCtx , addrs , connectDeadline ) ; err != nil {
2022-03-24 08:21:41 -04:00
ac . cc . resolveNow ( resolver . ResolveNowOptions { } )
2023-11-01 11:03:44 -04:00
ac . mu . Lock ( )
2023-09-19 10:37:37 -04:00
if acCtx . Err ( ) != nil {
2023-11-01 11:03:44 -04:00
// addrConn was torn down.
ac . mu . Unlock ( )
2019-04-12 14:36:17 -04:00
return
2017-04-17 18:08:24 -04:00
}
2023-11-01 11:03:44 -04:00
// After exhausting all addresses, the addrConn enters
// TRANSIENT_FAILURE.
2022-03-24 08:21:41 -04:00
ac . updateConnectivityState ( connectivity . TransientFailure , err )
2018-06-08 05:26:10 -04:00
2022-03-24 08:21:41 -04:00
// Backoff.
b := ac . resetBackoff
2019-04-12 14:36:17 -04:00
ac . mu . Unlock ( )
2022-03-24 08:21:41 -04:00
timer := time . NewTimer ( backoffFor )
select {
case <- timer . C :
2017-04-17 18:08:24 -04:00
ac . mu . Lock ( )
2022-03-24 08:21:41 -04:00
ac . backoffIdx ++
2017-04-17 18:08:24 -04:00
ac . mu . Unlock ( )
2022-03-24 08:21:41 -04:00
case <- b :
timer . Stop ( )
2023-09-19 10:37:37 -04:00
case <- acCtx . Done ( ) :
2022-03-24 08:21:41 -04:00
timer . Stop ( )
return
2017-04-17 18:08:24 -04:00
}
2019-04-12 14:36:17 -04:00
2017-04-17 18:08:24 -04:00
ac . mu . Lock ( )
2023-09-19 10:37:37 -04:00
if acCtx . Err ( ) == nil {
2022-03-24 08:21:41 -04:00
ac . updateConnectivityState ( connectivity . Idle , err )
2017-04-17 18:08:24 -04:00
}
ac . mu . Unlock ( )
2022-03-24 08:21:41 -04:00
return
2017-04-17 18:08:24 -04:00
}
2022-03-24 08:21:41 -04:00
// Success; reset backoff.
ac . mu . Lock ( )
ac . backoffIdx = 0
ac . mu . Unlock ( )
2017-04-17 18:08:24 -04:00
}
2022-03-24 08:21:41 -04:00
// tryAllAddrs tries to creates a connection to the addresses, and stop when at
// the first successful one. It returns an error if no address was successfully
// connected, or updates ac appropriately with the new transport.
2023-09-19 10:37:37 -04:00
func ( ac * addrConn ) tryAllAddrs ( ctx context . Context , addrs [ ] resolver . Address , connectDeadline time . Time ) error {
2020-04-16 10:34:35 -04:00
var firstConnErr error
2019-04-12 14:36:17 -04:00
for _ , addr := range addrs {
2023-09-19 10:37:37 -04:00
if ctx . Err ( ) != nil {
2022-03-24 08:21:41 -04:00
return errConnClosing
2018-06-08 05:26:10 -04:00
}
2023-09-19 10:37:37 -04:00
ac . mu . Lock ( )
2019-04-12 14:36:17 -04:00
ac . cc . mu . RLock ( )
ac . dopts . copts . KeepaliveParams = ac . cc . mkp
ac . cc . mu . RUnlock ( )
copts := ac . dopts . copts
if ac . scopts . CredsBundle != nil {
copts . CredsBundle = ac . scopts . CredsBundle
2018-06-08 05:26:10 -04:00
}
2019-04-12 14:36:17 -04:00
ac . mu . Unlock ( )
2021-08-12 11:11:44 -04:00
channelz . Infof ( logger , ac . channelzID , "Subchannel picks a new address %q to connect" , addr . Addr )
2019-04-12 14:36:17 -04:00
2023-09-19 10:37:37 -04:00
err := ac . createTransport ( ctx , addr , copts , connectDeadline )
2019-04-12 14:36:17 -04:00
if err == nil {
2022-03-24 08:21:41 -04:00
return nil
2018-06-08 05:26:10 -04:00
}
2020-04-16 10:34:35 -04:00
if firstConnErr == nil {
firstConnErr = err
}
2021-08-12 11:11:44 -04:00
ac . cc . updateConnectionError ( err )
2019-04-12 14:36:17 -04:00
}
// Couldn't connect to any address.
2022-03-24 08:21:41 -04:00
return firstConnErr
2019-04-12 14:36:17 -04:00
}
2022-03-24 08:21:41 -04:00
// createTransport creates a connection to addr. It returns an error if the
// address was not successfully connected, or updates ac appropriately with the
// new transport.
2023-09-19 10:37:37 -04:00
func ( ac * addrConn ) createTransport ( ctx context . Context , addr resolver . Address , copts transport . ConnectOptions , connectDeadline time . Time ) error {
2022-03-24 08:21:41 -04:00
addr . ServerName = ac . cc . getServerName ( addr )
2023-09-19 10:37:37 -04:00
hctx , hcancel := context . WithCancel ( ctx )
2019-04-12 14:36:17 -04:00
2023-07-19 18:26:26 -04:00
onClose := func ( r transport . GoAwayReason ) {
2019-04-12 14:36:17 -04:00
ac . mu . Lock ( )
2022-03-24 08:21:41 -04:00
defer ac . mu . Unlock ( )
2023-07-19 18:26:26 -04:00
// adjust params based on GoAwayReason
ac . adjustParams ( r )
2023-09-19 10:37:37 -04:00
if ctx . Err ( ) != nil {
// Already shut down or connection attempt canceled. tearDown() or
// updateAddrs() already cleared the transport and canceled hctx
// via ac.ctx, and we expected this connection to be closed, so do
// nothing here.
2023-07-19 18:26:26 -04:00
return
}
hcancel ( )
if ac . transport == nil {
// We're still connecting to this address, which could error. Do
// not update the connectivity state or resolve; these will happen
// at the end of the tryAllAddrs connection loop in the event of an
// error.
2022-03-24 08:21:41 -04:00
return
}
ac . transport = nil
2023-07-19 18:26:26 -04:00
// Refresh the name resolver on any connection loss.
2022-03-24 08:21:41 -04:00
ac . cc . resolveNow ( resolver . ResolveNowOptions { } )
2023-07-19 18:26:26 -04:00
// Always go idle and wait for the LB policy to initiate a new
// connection attempt.
ac . updateConnectivityState ( connectivity . Idle , nil )
2019-04-12 14:36:17 -04:00
}
2023-09-19 10:37:37 -04:00
connectCtx , cancel := context . WithDeadline ( ctx , connectDeadline )
2019-04-12 14:36:17 -04:00
defer cancel ( )
2022-11-16 10:32:17 -05:00
copts . ChannelzParentID = ac . channelzID
2019-04-12 14:36:17 -04:00
2023-07-19 18:26:26 -04:00
newTr , err := transport . NewClientTransport ( connectCtx , ac . cc . ctx , addr , copts , onClose )
2019-04-12 14:36:17 -04:00
if err != nil {
2023-07-19 18:26:26 -04:00
if logger . V ( 2 ) {
logger . Infof ( "Creating new client transport to %q: %v" , addr , err )
}
2019-04-12 14:36:17 -04:00
// newTr is either nil, or closed.
2022-11-16 10:32:17 -05:00
hcancel ( )
channelz . Warningf ( logger , ac . channelzID , "grpc: addrConn.createTransport failed to connect to %s. Err: %v" , addr , err )
2022-03-24 08:21:41 -04:00
return err
2019-04-12 14:36:17 -04:00
}
2023-07-19 18:26:26 -04:00
ac . mu . Lock ( )
defer ac . mu . Unlock ( )
2023-09-19 10:37:37 -04:00
if ctx . Err ( ) != nil {
2023-07-19 18:26:26 -04:00
// This can happen if the subConn was removed while in `Connecting`
// state. tearDown() would have set the state to `Shutdown`, but
// would not have closed the transport since ac.transport would not
// have been set at that point.
//
// We run this in a goroutine because newTr.Close() calls onClose()
// inline, which requires locking ac.mu.
//
2022-03-24 08:21:41 -04:00
// The error we pass to Close() is immaterial since there are no open
// streams at this point, so no trailers with error details will be sent
// out. We just need to pass a non-nil error.
2023-09-19 10:37:37 -04:00
//
// This can also happen when updateAddrs is called during a connection
// attempt.
2023-07-19 18:26:26 -04:00
go newTr . Close ( transport . ErrConnClosing )
2022-03-24 08:21:41 -04:00
return nil
2023-07-19 18:26:26 -04:00
}
if hctx . Err ( ) != nil {
// onClose was already called for this connection, but the connection
// was successfully established first. Consider it a success and set
// the new state to Idle.
ac . updateConnectivityState ( connectivity . Idle , nil )
2022-03-24 08:21:41 -04:00
return nil
2017-04-17 18:08:24 -04:00
}
2023-07-19 18:26:26 -04:00
ac . curAddr = addr
ac . transport = newTr
ac . startHealthCheck ( hctx ) // Will set state to READY if appropriate.
return nil
2017-04-17 18:08:24 -04:00
}
2019-10-02 13:42:55 -04:00
// startHealthCheck starts the health checking stream (RPC) to watch the health
// stats of this connection if health checking is requested and configured.
//
// LB channel health checking is enabled when all requirements below are met:
// 1. it is not disabled by the user with the WithDisableHealthCheck DialOption
2021-08-12 11:11:44 -04:00
// 2. internal.HealthCheckFunc is set by importing the grpc/health package
2019-10-02 13:42:55 -04:00
// 3. a service config with non-empty healthCheckConfig field is provided
// 4. the load balancer requests it
//
// It sets addrConn to READY if the health checking stream is not started.
//
// Caller must hold ac.mu.
func ( ac * addrConn ) startHealthCheck ( ctx context . Context ) {
var healthcheckManagingState bool
defer func ( ) {
if ! healthcheckManagingState {
2020-04-16 10:34:35 -04:00
ac . updateConnectivityState ( connectivity . Ready , nil )
2019-10-02 13:42:55 -04:00
}
} ( )
if ac . cc . dopts . disableHealthCheck {
return
}
healthCheckConfig := ac . cc . healthCheckConfig ( )
if healthCheckConfig == nil {
return
}
if ! ac . scopts . HealthCheckEnabled {
return
}
healthCheckFunc := ac . cc . dopts . healthCheckFunc
if healthCheckFunc == nil {
// The health package is not imported to set health check function.
//
// TODO: add a link to the health check doc in the error message.
2021-08-12 11:11:44 -04:00
channelz . Error ( logger , ac . channelzID , "Health check is requested but health check function is not set." )
2019-10-02 13:42:55 -04:00
return
}
healthcheckManagingState = true
// Set up the health check helper functions.
currentTr := ac . transport
2023-11-01 11:03:44 -04:00
newStream := func ( method string ) ( any , error ) {
2019-10-02 13:42:55 -04:00
ac . mu . Lock ( )
if ac . transport != currentTr {
ac . mu . Unlock ( )
return nil , status . Error ( codes . Canceled , "the provided transport is no longer valid to use" )
}
ac . mu . Unlock ( )
return newNonRetryClientStream ( ctx , & StreamDesc { ServerStreams : true } , method , currentTr , ac )
2019-04-12 14:36:17 -04:00
}
2020-04-16 10:34:35 -04:00
setConnectivityState := func ( s connectivity . State , lastErr error ) {
2017-04-17 18:08:24 -04:00
ac . mu . Lock ( )
2019-04-12 14:36:17 -04:00
defer ac . mu . Unlock ( )
2019-10-02 13:42:55 -04:00
if ac . transport != currentTr {
2019-04-12 14:36:17 -04:00
return
2017-04-17 18:08:24 -04:00
}
2020-04-16 10:34:35 -04:00
ac . updateConnectivityState ( s , lastErr )
2019-04-12 14:36:17 -04:00
}
2019-10-02 13:42:55 -04:00
// Start the health checking stream.
go func ( ) {
err := ac . cc . dopts . healthCheckFunc ( ctx , newStream , setConnectivityState , healthCheckConfig . ServiceName )
if err != nil {
if status . Code ( err ) == codes . Unimplemented {
2021-08-12 11:11:44 -04:00
channelz . Error ( logger , ac . channelzID , "Subchannel health check is unimplemented at server side, thus health check is disabled" )
2019-10-02 13:42:55 -04:00
} else {
2023-07-19 18:26:26 -04:00
channelz . Errorf ( logger , ac . channelzID , "Health checking failed: %v" , err )
2019-04-12 14:36:17 -04:00
}
2017-04-17 18:08:24 -04:00
}
2019-10-02 13:42:55 -04:00
} ( )
2017-04-17 18:08:24 -04:00
}
2019-04-12 14:36:17 -04:00
// resetConnectBackoff closes the current resetBackoff channel, resets the
// backoff index to zero and installs a fresh resetBackoff channel, all while
// holding ac.mu.
func (ac *addrConn) resetConnectBackoff() {
	ac.mu.Lock()
	defer ac.mu.Unlock()

	close(ac.resetBackoff)
	ac.backoffIdx = 0
	ac.resetBackoff = make(chan struct{})
}
2022-03-24 08:21:41 -04:00
// getReadyTransport returns the transport if ac's state is READY or nil if not.
func ( ac * addrConn ) getReadyTransport ( ) transport . ClientTransport {
2018-06-08 05:26:10 -04:00
ac . mu . Lock ( )
2022-03-24 08:21:41 -04:00
defer ac . mu . Unlock ( )
if ac . state == connectivity . Ready {
return ac . transport
2018-06-08 05:26:10 -04:00
}
2022-03-24 08:21:41 -04:00
return nil
2018-06-08 05:26:10 -04:00
}
2023-09-19 10:37:37 -04:00
// getTransport blocks until the addrConn becomes READY and then returns its
// transport. If ctx is done first, the returned error is the status derived
// from the context error. If the addrConn reaches Shutdown first, an
// Unavailable status error is returned.
func (ac *addrConn) getTransport(ctx context.Context) (transport.ClientTransport, error) {
	for {
		if ctxErr := ctx.Err(); ctxErr != nil {
			return nil, status.FromContextError(ctxErr).Err()
		}

		// Take a consistent snapshot, then inspect it without the lock.
		ac.mu.Lock()
		tr, cur, changed := ac.transport, ac.state, ac.stateChan
		ac.mu.Unlock()

		switch cur {
		case connectivity.Ready:
			return tr, nil
		case connectivity.Shutdown:
			return nil, status.Errorf(codes.Unavailable, "SubConn shutting down")
		}

		// Wait for either the context to end or the state channel captured
		// above to fire, then re-evaluate from the top.
		select {
		case <-ctx.Done():
		case <-changed:
		}
	}
}
2017-04-17 18:08:24 -04:00
// tearDown starts to tear down the addrConn.
2021-08-12 11:11:44 -04:00
//
// Note that tearDown doesn't remove ac from ac.cc.conns, so the addrConn struct
// will leak. In most cases, call cc.removeAddrConn() instead.
2017-04-17 18:08:24 -04:00
func ( ac * addrConn ) tearDown ( err error ) {
ac . mu . Lock ( )
2018-06-08 05:26:10 -04:00
if ac . state == connectivity . Shutdown {
2019-04-12 14:36:17 -04:00
ac . mu . Unlock ( )
2018-06-08 05:26:10 -04:00
return
2017-04-17 18:08:24 -04:00
}
2019-04-12 14:36:17 -04:00
curTr := ac . transport
ac . transport = nil
// We have to set the state to Shutdown before anything else to prevent races
2020-04-16 10:34:35 -04:00
// between setting the state and logic that waits on context cancellation / etc.
ac . updateConnectivityState ( connectivity . Shutdown , nil )
2019-04-12 14:36:17 -04:00
ac . cancel ( )
2018-06-08 05:26:10 -04:00
ac . curAddr = resolver . Address { }
2023-11-01 11:03:44 -04:00
2022-11-16 10:32:17 -05:00
channelz . AddTraceEvent ( logger , ac . channelzID , 0 , & channelz . TraceEventDesc {
Desc : "Subchannel deleted" ,
Severity : channelz . CtInfo ,
Parent : & channelz . TraceEventDesc {
Desc : fmt . Sprintf ( "Subchannel(id:%d) deleted" , ac . channelzID . Int ( ) ) ,
2021-08-12 11:11:44 -04:00
Severity : channelz . CtInfo ,
2022-11-16 10:32:17 -05:00
} ,
} )
// TraceEvent needs to be called before RemoveEntry, as TraceEvent may add
// trace reference to the entity being deleted, and thus prevent it from
// being deleted right away.
channelz . RemoveEntry ( ac . channelzID )
2019-04-12 14:36:17 -04:00
ac . mu . Unlock ( )
2023-11-01 11:03:44 -04:00
// We have to release the lock before the call to GracefulClose/Close here
// because both of them call onClose(), which requires locking ac.mu.
if curTr != nil {
if err == errConnDrain {
// Close the transport gracefully when the subConn is being shutdown.
//
// GracefulClose() may be executed multiple times if:
// - multiple GoAway frames are received from the server
// - there are concurrent name resolver or balancer triggered
// address removal and GoAway
curTr . GracefulClose ( )
} else {
// Hard close the transport when the channel is entering idle or is
// being shutdown. In the case where the channel is being shutdown,
// closing of transports is also taken care of by cancelation of cc.ctx.
// But in the case where the channel is entering idle, we need to
// explicitly close the transports here. Instead of distinguishing
// between these two cases, it is simpler to close the transport
// unconditionally here.
curTr . Close ( err )
}
}
2018-06-08 05:26:10 -04:00
}
// getState returns ac's current connectivity state, read under ac.mu.
func (ac *addrConn) getState() connectivity.State {
	ac.mu.Lock()
	current := ac.state
	ac.mu.Unlock()
	return current
}
func ( ac * addrConn ) ChannelzMetric ( ) * channelz . ChannelInternalMetric {
ac . mu . Lock ( )
addr := ac . curAddr . Addr
ac . mu . Unlock ( )
return & channelz . ChannelInternalMetric {
2019-04-12 14:36:17 -04:00
State : ac . getState ( ) ,
2018-06-08 05:26:10 -04:00
Target : addr ,
2019-04-12 14:36:17 -04:00
CallsStarted : atomic . LoadInt64 ( & ac . czData . callsStarted ) ,
CallsSucceeded : atomic . LoadInt64 ( & ac . czData . callsSucceeded ) ,
CallsFailed : atomic . LoadInt64 ( & ac . czData . callsFailed ) ,
LastCallStartedTimestamp : time . Unix ( 0 , atomic . LoadInt64 ( & ac . czData . lastCallStartedTime ) ) ,
2018-06-08 05:26:10 -04:00
}
}
func ( ac * addrConn ) incrCallsStarted ( ) {
2019-04-12 14:36:17 -04:00
atomic . AddInt64 ( & ac . czData . callsStarted , 1 )
atomic . StoreInt64 ( & ac . czData . lastCallStartedTime , time . Now ( ) . UnixNano ( ) )
2018-06-08 05:26:10 -04:00
}
func ( ac * addrConn ) incrCallsSucceeded ( ) {
2019-04-12 14:36:17 -04:00
atomic . AddInt64 ( & ac . czData . callsSucceeded , 1 )
2018-06-08 05:26:10 -04:00
}
func ( ac * addrConn ) incrCallsFailed ( ) {
2019-04-12 14:36:17 -04:00
atomic . AddInt64 ( & ac . czData . callsFailed , 1 )
}
// retryThrottler is a token pool used to decide whether retries are allowed.
// tokens is kept within [0, max] by the methods below; a retry is throttled
// while tokens is at or below thresh, and every successful RPC adds ratio
// tokens back.
type retryThrottler struct {
	max    float64
	thresh float64
	ratio  float64

	mu     sync.Mutex
	tokens float64 // TODO(dfawley): replace with atomic and remove lock.
}

// throttle takes one retry token out of the pool (never going below zero) and
// reports whether a retry should be throttled (disallowed) according to the
// retry throttling policy in the service config. A nil throttler never
// throttles.
func (rt *retryThrottler) throttle() bool {
	if rt == nil {
		return false
	}
	rt.mu.Lock()
	defer rt.mu.Unlock()

	remaining := rt.tokens - 1
	if remaining < 0 {
		remaining = 0
	}
	rt.tokens = remaining
	return remaining <= rt.thresh
}

// successfulRPC credits the pool with ratio tokens, capping the total at max.
// It is a no-op on a nil throttler.
func (rt *retryThrottler) successfulRPC() {
	if rt == nil {
		return
	}
	rt.mu.Lock()
	defer rt.mu.Unlock()

	refilled := rt.tokens + rt.ratio
	if refilled > rt.max {
		refilled = rt.max
	}
	rt.tokens = refilled
}
type channelzChannel struct {
cc * ClientConn
}
func ( c * channelzChannel ) ChannelzMetric ( ) * channelz . ChannelInternalMetric {
return c . cc . channelzMetric ( )
2018-06-08 05:26:10 -04:00
}
// ErrClientConnTimeout indicates that the ClientConn could not establish the
// underlying connections within the specified timeout.
//
// Deprecated: grpc never returns this error, and users should not reference
// it.
var ErrClientConnTimeout = errors . New ( "grpc: timed out when dialing" )
2020-04-16 10:34:35 -04:00
2023-09-19 10:37:37 -04:00
// getResolver finds the scheme in the cc's resolvers or the global registry.
// scheme should always be lowercase (typically by virtue of url.Parse()
// performing proper RFC3986 behavior).
2020-04-16 10:34:35 -04:00
func ( cc * ClientConn ) getResolver ( scheme string ) resolver . Builder {
for _ , rb := range cc . dopts . resolvers {
2021-08-12 11:11:44 -04:00
if scheme == rb . Scheme ( ) {
2020-04-16 10:34:35 -04:00
return rb
}
}
2021-08-12 11:11:44 -04:00
return resolver . Get ( scheme )
}
// updateConnectionError records err as the channel's last connection error,
// guarded by cc.lceMu.
func (cc *ClientConn) updateConnectionError(err error) {
	cc.lceMu.Lock()
	defer cc.lceMu.Unlock()
	cc.lastConnectionError = err
}
func ( cc * ClientConn ) connectionError ( ) error {
cc . lceMu . Lock ( )
defer cc . lceMu . Unlock ( )
return cc . lastConnectionError
2020-04-16 10:34:35 -04:00
}
2022-03-24 08:21:41 -04:00
2023-09-19 10:37:37 -04:00
// parseTargetAndFindResolver parses the user's dial target and stores the
// parsed target in `cc.parsedTarget`.
//
// The resolver to use is determined based on the scheme in the parsed target
// and the same is stored in `cc.resolverBuilder`.
//
// Doesn't grab cc.mu as this method is expected to be called only at Dial time.
func ( cc * ClientConn ) parseTargetAndFindResolver ( ) error {
2022-03-24 08:21:41 -04:00
channelz . Infof ( logger , cc . channelzID , "original dial target is: %q" , cc . target )
var rb resolver . Builder
parsedTarget , err := parseTarget ( cc . target )
if err != nil {
channelz . Infof ( logger , cc . channelzID , "dial target %q parse failed: %v" , cc . target , err )
} else {
2024-02-20 10:42:33 -05:00
channelz . Infof ( logger , cc . channelzID , "parsed dial target is: %#v" , parsedTarget )
2023-07-19 18:26:26 -04:00
rb = cc . getResolver ( parsedTarget . URL . Scheme )
2022-03-24 08:21:41 -04:00
if rb != nil {
cc . parsedTarget = parsedTarget
2023-09-19 10:37:37 -04:00
cc . resolverBuilder = rb
return nil
2022-03-24 08:21:41 -04:00
}
}
// We are here because the user's dial target did not contain a scheme or
// specified an unregistered scheme. We should fallback to the default
// scheme, except when a custom dialer is specified in which case, we should
// always use passthrough scheme.
defScheme := resolver . GetDefaultScheme ( )
channelz . Infof ( logger , cc . channelzID , "fallback to scheme %q" , defScheme )
canonicalTarget := defScheme + ":///" + cc . target
parsedTarget , err = parseTarget ( canonicalTarget )
if err != nil {
channelz . Infof ( logger , cc . channelzID , "dial target %q parse failed: %v" , canonicalTarget , err )
2023-09-19 10:37:37 -04:00
return err
2022-03-24 08:21:41 -04:00
}
channelz . Infof ( logger , cc . channelzID , "parsed dial target is: %+v" , parsedTarget )
2023-07-19 18:26:26 -04:00
rb = cc . getResolver ( parsedTarget . URL . Scheme )
2022-03-24 08:21:41 -04:00
if rb == nil {
2023-09-19 10:37:37 -04:00
return fmt . Errorf ( "could not get resolver for default scheme: %q" , parsedTarget . URL . Scheme )
2022-03-24 08:21:41 -04:00
}
cc . parsedTarget = parsedTarget
2023-09-19 10:37:37 -04:00
cc . resolverBuilder = rb
return nil
2022-03-24 08:21:41 -04:00
}
// parseTarget uses RFC 3986 semantics to parse the given target into a
2023-11-01 11:03:44 -04:00
// resolver.Target struct containing url. Query params are stripped from the
// endpoint.
2022-03-24 08:21:41 -04:00
func parseTarget ( target string ) ( resolver . Target , error ) {
u , err := url . Parse ( target )
if err != nil {
return resolver . Target { } , err
}
2023-07-19 18:26:26 -04:00
2023-11-01 11:03:44 -04:00
return resolver . Target { URL : * u } , nil
}
// encodeAuthority percent-encodes every byte of authority that is not
// permitted in a URI authority component and returns the result. Escapes use
// upper-case hex digits ("%2F"). When nothing needs escaping, authority is
// returned unchanged.
//
// The set of permitted characters follows
// https://datatracker.ietf.org/doc/html/rfc3986#section-3.2
func encodeAuthority(authority string) string {
	const hexDigits = "0123456789ABCDEF"

	// needsEscape reports whether b falls outside the permitted set.
	needsEscape := func(b byte) bool {
		switch {
		case 'a' <= b && b <= 'z', 'A' <= b && b <= 'Z', '0' <= b && b <= '9':
			// Alphanumerics are always allowed.
			return false
		}
		switch b {
		case '-', '_', '.', '~', // unreserved characters
			'!', '$', '&', '\'', '(', ')', '*', '+', ',', ';', '=', // sub-delimiters
			':', '[', ']', '@': // authority-related delimiters
			return false
		}
		return true
	}

	// First pass: count the escapes so the output can be sized exactly, and
	// so the common no-escape case returns without allocating.
	escapes := 0
	for i := 0; i < len(authority); i++ {
		if needsEscape(authority[i]) {
			escapes++
		}
	}
	if escapes == 0 {
		return authority
	}

	// Second pass: every escaped byte grows from one to three output bytes.
	// This is a pared-down version of escape in the go net/url library.
	encoded := make([]byte, 0, len(authority)+2*escapes)
	for i := 0; i < len(authority); i++ {
		b := authority[i]
		if needsEscape(b) {
			encoded = append(encoded, '%', hexDigits[b>>4], hexDigits[b&0x0F])
			continue
		}
		encoded = append(encoded, b)
	}
	return string(encoded)
}
// Determine channel authority. The order of precedence is as follows:
// - user specified authority override using `WithAuthority` dial option
// - creds' notion of server name for the authentication handshake
// - endpoint from dial target of the form "scheme://[authority]/endpoint"
2023-09-19 10:37:37 -04:00
//
// Stores the determined authority in `cc.authority`.
//
// Returns a non-nil error if the authority returned by the transport
// credentials do not match the authority configured through the dial option.
//
// Doesn't grab cc.mu as this method is expected to be called only at Dial time.
func ( cc * ClientConn ) determineAuthority ( ) error {
dopts := cc . dopts
2022-03-24 08:21:41 -04:00
// Historically, we had two options for users to specify the serverName or
// authority for a channel. One was through the transport credentials
// (either in its constructor, or through the OverrideServerName() method).
// The other option (for cases where WithInsecure() dial option was used)
// was to use the WithAuthority() dial option.
//
// A few things have changed since:
// - `insecure` package with an implementation of the `TransportCredentials`
// interface for the insecure case
// - WithAuthority() dial option support for secure credentials
authorityFromCreds := ""
if creds := dopts . copts . TransportCredentials ; creds != nil && creds . Info ( ) . ServerName != "" {
authorityFromCreds = creds . Info ( ) . ServerName
}
authorityFromDialOption := dopts . authority
if ( authorityFromCreds != "" && authorityFromDialOption != "" ) && authorityFromCreds != authorityFromDialOption {
2023-09-19 10:37:37 -04:00
return fmt . Errorf ( "ClientConn's authority from transport creds %q and dial option %q don't match" , authorityFromCreds , authorityFromDialOption )
2022-03-24 08:21:41 -04:00
}
2023-09-19 10:37:37 -04:00
endpoint := cc . parsedTarget . Endpoint ( )
target := cc . target
2022-03-24 08:21:41 -04:00
switch {
case authorityFromDialOption != "" :
2023-09-19 10:37:37 -04:00
cc . authority = authorityFromDialOption
2022-03-24 08:21:41 -04:00
case authorityFromCreds != "" :
2023-09-19 10:37:37 -04:00
cc . authority = authorityFromCreds
2022-03-24 08:21:41 -04:00
case strings . HasPrefix ( target , "unix:" ) || strings . HasPrefix ( target , "unix-abstract:" ) :
// TODO: remove when the unix resolver implements optional interface to
// return channel authority.
2023-09-19 10:37:37 -04:00
cc . authority = "localhost"
2022-03-24 08:21:41 -04:00
case strings . HasPrefix ( endpoint , ":" ) :
2023-09-19 10:37:37 -04:00
cc . authority = "localhost" + endpoint
2022-03-24 08:21:41 -04:00
default :
// TODO: Define an optional interface on the resolver builder to return
// the channel authority given the user's dial target. For resolvers
// which don't implement this interface, we will use the endpoint from
// "scheme://authority/endpoint" as the default authority.
2023-11-01 11:03:44 -04:00
// Escape the endpoint to handle use cases where the endpoint
// might not be a valid authority by default.
// For example an endpoint which has multiple paths like
// 'a/b/c', which is not a valid authority by default.
cc . authority = encodeAuthority ( endpoint )
2022-03-24 08:21:41 -04:00
}
2023-09-19 10:37:37 -04:00
channelz . Infof ( logger , cc . channelzID , "Channel authority set to %q" , cc . authority )
return nil
}