/*
 *
 * Copyright 2017 gRPC authors.
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 *
 */

// Package balancer defines APIs for load balancing in gRPC.
// All APIs in this package are experimental.
package balancer
import (
	"context"
	"encoding/json"
	"errors"
	"net"
	"strings"

	"google.golang.org/grpc/channelz"
	"google.golang.org/grpc/connectivity"
	"google.golang.org/grpc/credentials"
	"google.golang.org/grpc/internal"
	"google.golang.org/grpc/metadata"
	"google.golang.org/grpc/resolver"
	"google.golang.org/grpc/serviceconfig"
)
  35. var (
  36. // m is a map from name to balancer builder.
  37. m = make(map[string]Builder)
  38. )
  39. // Register registers the balancer builder to the balancer map. b.Name
  40. // (lowercased) will be used as the name registered with this builder. If the
  41. // Builder implements ConfigParser, ParseConfig will be called when new service
  42. // configs are received by the resolver, and the result will be provided to the
  43. // Balancer in UpdateClientConnState.
  44. //
  45. // NOTE: this function must only be called during initialization time (i.e. in
  46. // an init() function), and is not thread-safe. If multiple Balancers are
  47. // registered with the same name, the one registered last will take effect.
  48. func Register(b Builder) {
  49. m[strings.ToLower(b.Name())] = b
  50. }
  51. // unregisterForTesting deletes the balancer with the given name from the
  52. // balancer map.
  53. //
  54. // This function is not thread-safe.
  55. func unregisterForTesting(name string) {
  56. delete(m, name)
  57. }
  58. func init() {
  59. internal.BalancerUnregister = unregisterForTesting
  60. }
  61. // Get returns the resolver builder registered with the given name.
  62. // Note that the compare is done in a case-insensitive fashion.
  63. // If no builder is register with the name, nil will be returned.
  64. func Get(name string) Builder {
  65. if b, ok := m[strings.ToLower(name)]; ok {
  66. return b
  67. }
  68. return nil
  69. }
  70. // A SubConn represents a single connection to a gRPC backend service.
  71. //
  72. // Each SubConn contains a list of addresses.
  73. //
  74. // All SubConns start in IDLE, and will not try to connect. To trigger the
  75. // connecting, Balancers must call Connect. If a connection re-enters IDLE,
  76. // Balancers must call Connect again to trigger a new connection attempt.
  77. //
  78. // gRPC will try to connect to the addresses in sequence, and stop trying the
  79. // remainder once the first connection is successful. If an attempt to connect
  80. // to all addresses encounters an error, the SubConn will enter
  81. // TRANSIENT_FAILURE for a backoff period, and then transition to IDLE.
  82. //
  83. // Once established, if a connection is lost, the SubConn will transition
  84. // directly to IDLE.
  85. //
  86. // This interface is to be implemented by gRPC. Users should not need their own
  87. // implementation of this interface. For situations like testing, any
  88. // implementations should embed this interface. This allows gRPC to add new
  89. // methods to this interface.
  90. type SubConn interface {
  91. // UpdateAddresses updates the addresses used in this SubConn.
  92. // gRPC checks if currently-connected address is still in the new list.
  93. // If it's in the list, the connection will be kept.
  94. // If it's not in the list, the connection will gracefully closed, and
  95. // a new connection will be created.
  96. //
  97. // This will trigger a state transition for the SubConn.
  98. //
  99. // Deprecated: This method is now part of the ClientConn interface and will
  100. // eventually be removed from here.
  101. UpdateAddresses([]resolver.Address)
  102. // Connect starts the connecting for this SubConn.
  103. Connect()
  104. }
  105. // NewSubConnOptions contains options to create new SubConn.
  106. type NewSubConnOptions struct {
  107. // CredsBundle is the credentials bundle that will be used in the created
  108. // SubConn. If it's nil, the original creds from grpc DialOptions will be
  109. // used.
  110. //
  111. // Deprecated: Use the Attributes field in resolver.Address to pass
  112. // arbitrary data to the credential handshaker.
  113. CredsBundle credentials.Bundle
  114. // HealthCheckEnabled indicates whether health check service should be
  115. // enabled on this SubConn
  116. HealthCheckEnabled bool
  117. }
  118. // State contains the balancer's state relevant to the gRPC ClientConn.
  119. type State struct {
  120. // State contains the connectivity state of the balancer, which is used to
  121. // determine the state of the ClientConn.
  122. ConnectivityState connectivity.State
  123. // Picker is used to choose connections (SubConns) for RPCs.
  124. Picker Picker
  125. }
  126. // ClientConn represents a gRPC ClientConn.
  127. //
  128. // This interface is to be implemented by gRPC. Users should not need a
  129. // brand new implementation of this interface. For the situations like
  130. // testing, the new implementation should embed this interface. This allows
  131. // gRPC to add new methods to this interface.
  132. type ClientConn interface {
  133. // NewSubConn is called by balancer to create a new SubConn.
  134. // It doesn't block and wait for the connections to be established.
  135. // Behaviors of the SubConn can be controlled by options.
  136. NewSubConn([]resolver.Address, NewSubConnOptions) (SubConn, error)
  137. // RemoveSubConn removes the SubConn from ClientConn.
  138. // The SubConn will be shutdown.
  139. RemoveSubConn(SubConn)
  140. // UpdateAddresses updates the addresses used in the passed in SubConn.
  141. // gRPC checks if the currently connected address is still in the new list.
  142. // If so, the connection will be kept. Else, the connection will be
  143. // gracefully closed, and a new connection will be created.
  144. //
  145. // This will trigger a state transition for the SubConn.
  146. UpdateAddresses(SubConn, []resolver.Address)
  147. // UpdateState notifies gRPC that the balancer's internal state has
  148. // changed.
  149. //
  150. // gRPC will update the connectivity state of the ClientConn, and will call
  151. // Pick on the new Picker to pick new SubConns.
  152. UpdateState(State)
  153. // ResolveNow is called by balancer to notify gRPC to do a name resolving.
  154. ResolveNow(resolver.ResolveNowOptions)
  155. // Target returns the dial target for this ClientConn.
  156. //
  157. // Deprecated: Use the Target field in the BuildOptions instead.
  158. Target() string
  159. }
  160. // BuildOptions contains additional information for Build.
  161. type BuildOptions struct {
  162. // DialCreds is the transport credentials to use when communicating with a
  163. // remote load balancer server. Balancer implementations which do not
  164. // communicate with a remote load balancer server can ignore this field.
  165. DialCreds credentials.TransportCredentials
  166. // CredsBundle is the credentials bundle to use when communicating with a
  167. // remote load balancer server. Balancer implementations which do not
  168. // communicate with a remote load balancer server can ignore this field.
  169. CredsBundle credentials.Bundle
  170. // Dialer is the custom dialer to use when communicating with a remote load
  171. // balancer server. Balancer implementations which do not communicate with a
  172. // remote load balancer server can ignore this field.
  173. Dialer func(context.Context, string) (net.Conn, error)
  174. // Authority is the server name to use as part of the authentication
  175. // handshake when communicating with a remote load balancer server. Balancer
  176. // implementations which do not communicate with a remote load balancer
  177. // server can ignore this field.
  178. Authority string
  179. // ChannelzParentID is the parent ClientConn's channelz ID.
  180. ChannelzParentID *channelz.Identifier
  181. // CustomUserAgent is the custom user agent set on the parent ClientConn.
  182. // The balancer should set the same custom user agent if it creates a
  183. // ClientConn.
  184. CustomUserAgent string
  185. // Target contains the parsed address info of the dial target. It is the
  186. // same resolver.Target as passed to the resolver. See the documentation for
  187. // the resolver.Target type for details about what it contains.
  188. Target resolver.Target
  189. }
  190. // Builder creates a balancer.
  191. type Builder interface {
  192. // Build creates a new balancer with the ClientConn.
  193. Build(cc ClientConn, opts BuildOptions) Balancer
  194. // Name returns the name of balancers built by this builder.
  195. // It will be used to pick balancers (for example in service config).
  196. Name() string
  197. }
  198. // ConfigParser parses load balancer configs.
  199. type ConfigParser interface {
  200. // ParseConfig parses the JSON load balancer config provided into an
  201. // internal form or returns an error if the config is invalid. For future
  202. // compatibility reasons, unknown fields in the config should be ignored.
  203. ParseConfig(LoadBalancingConfigJSON json.RawMessage) (serviceconfig.LoadBalancingConfig, error)
  204. }
  205. // PickInfo contains additional information for the Pick operation.
  206. type PickInfo struct {
  207. // FullMethodName is the method name that NewClientStream() is called
  208. // with. The canonical format is /service/Method.
  209. FullMethodName string
  210. // Ctx is the RPC's context, and may contain relevant RPC-level information
  211. // like the outgoing header metadata.
  212. Ctx context.Context
  213. }
  214. // DoneInfo contains additional information for done.
  215. type DoneInfo struct {
  216. // Err is the rpc error the RPC finished with. It could be nil.
  217. Err error
  218. // Trailer contains the metadata from the RPC's trailer, if present.
  219. Trailer metadata.MD
  220. // BytesSent indicates if any bytes have been sent to the server.
  221. BytesSent bool
  222. // BytesReceived indicates if any byte has been received from the server.
  223. BytesReceived bool
  224. // ServerLoad is the load received from server. It's usually sent as part of
  225. // trailing metadata.
  226. //
  227. // The only supported type now is *orca_v1.LoadReport.
  228. ServerLoad interface{}
  229. }
  230. var (
  231. // ErrNoSubConnAvailable indicates no SubConn is available for pick().
  232. // gRPC will block the RPC until a new picker is available via UpdateState().
  233. ErrNoSubConnAvailable = errors.New("no SubConn is available")
  234. // ErrTransientFailure indicates all SubConns are in TransientFailure.
  235. // WaitForReady RPCs will block, non-WaitForReady RPCs will fail.
  236. //
  237. // Deprecated: return an appropriate error based on the last resolution or
  238. // connection attempt instead. The behavior is the same for any non-gRPC
  239. // status error.
  240. ErrTransientFailure = errors.New("all SubConns are in TransientFailure")
  241. )
  242. // PickResult contains information related to a connection chosen for an RPC.
  243. type PickResult struct {
  244. // SubConn is the connection to use for this pick, if its state is Ready.
  245. // If the state is not Ready, gRPC will block the RPC until a new Picker is
  246. // provided by the balancer (using ClientConn.UpdateState). The SubConn
  247. // must be one returned by ClientConn.NewSubConn.
  248. SubConn SubConn
  249. // Done is called when the RPC is completed. If the SubConn is not ready,
  250. // this will be called with a nil parameter. If the SubConn is not a valid
  251. // type, Done may not be called. May be nil if the balancer does not wish
  252. // to be notified when the RPC completes.
  253. Done func(DoneInfo)
  254. }
  255. // TransientFailureError returns e. It exists for backward compatibility and
  256. // will be deleted soon.
  257. //
  258. // Deprecated: no longer necessary, picker errors are treated this way by
  259. // default.
  260. func TransientFailureError(e error) error { return e }
  261. // Picker is used by gRPC to pick a SubConn to send an RPC.
  262. // Balancer is expected to generate a new picker from its snapshot every time its
  263. // internal state has changed.
  264. //
  265. // The pickers used by gRPC can be updated by ClientConn.UpdateState().
  266. type Picker interface {
  267. // Pick returns the connection to use for this RPC and related information.
  268. //
  269. // Pick should not block. If the balancer needs to do I/O or any blocking
  270. // or time-consuming work to service this call, it should return
  271. // ErrNoSubConnAvailable, and the Pick call will be repeated by gRPC when
  272. // the Picker is updated (using ClientConn.UpdateState).
  273. //
  274. // If an error is returned:
  275. //
  276. // - If the error is ErrNoSubConnAvailable, gRPC will block until a new
  277. // Picker is provided by the balancer (using ClientConn.UpdateState).
  278. //
  279. // - If the error is a status error (implemented by the grpc/status
  280. // package), gRPC will terminate the RPC with the code and message
  281. // provided.
  282. //
  283. // - For all other errors, wait for ready RPCs will wait, but non-wait for
  284. // ready RPCs will be terminated with this error's Error() string and
  285. // status code Unavailable.
  286. Pick(info PickInfo) (PickResult, error)
  287. }
  288. // Balancer takes input from gRPC, manages SubConns, and collects and aggregates
  289. // the connectivity states.
  290. //
  291. // It also generates and updates the Picker used by gRPC to pick SubConns for RPCs.
  292. //
  293. // UpdateClientConnState, ResolverError, UpdateSubConnState, and Close are
  294. // guaranteed to be called synchronously from the same goroutine. There's no
  295. // guarantee on picker.Pick, it may be called anytime.
  296. type Balancer interface {
  297. // UpdateClientConnState is called by gRPC when the state of the ClientConn
  298. // changes. If the error returned is ErrBadResolverState, the ClientConn
  299. // will begin calling ResolveNow on the active name resolver with
  300. // exponential backoff until a subsequent call to UpdateClientConnState
  301. // returns a nil error. Any other errors are currently ignored.
  302. UpdateClientConnState(ClientConnState) error
  303. // ResolverError is called by gRPC when the name resolver reports an error.
  304. ResolverError(error)
  305. // UpdateSubConnState is called by gRPC when the state of a SubConn
  306. // changes.
  307. UpdateSubConnState(SubConn, SubConnState)
  308. // Close closes the balancer. The balancer is not required to call
  309. // ClientConn.RemoveSubConn for its existing SubConns.
  310. Close()
  311. }
  312. // ExitIdler is an optional interface for balancers to implement. If
  313. // implemented, ExitIdle will be called when ClientConn.Connect is called, if
  314. // the ClientConn is idle. If unimplemented, ClientConn.Connect will cause
  315. // all SubConns to connect.
  316. //
  317. // Notice: it will be required for all balancers to implement this in a future
  318. // release.
  319. type ExitIdler interface {
  320. // ExitIdle instructs the LB policy to reconnect to backends / exit the
  321. // IDLE state, if appropriate and possible. Note that SubConns that enter
  322. // the IDLE state will not reconnect until SubConn.Connect is called.
  323. ExitIdle()
  324. }
  325. // SubConnState describes the state of a SubConn.
  326. type SubConnState struct {
  327. // ConnectivityState is the connectivity state of the SubConn.
  328. ConnectivityState connectivity.State
  329. // ConnectionError is set if the ConnectivityState is TransientFailure,
  330. // describing the reason the SubConn failed. Otherwise, it is nil.
  331. ConnectionError error
  332. }
  333. // ClientConnState describes the state of a ClientConn relevant to the
  334. // balancer.
  335. type ClientConnState struct {
  336. ResolverState resolver.State
  337. // The parsed load balancing configuration returned by the builder's
  338. // ParseConfig method, if implemented.
  339. BalancerConfig serviceconfig.LoadBalancingConfig
  340. }
  341. // ErrBadResolverState may be returned by UpdateClientConnState to indicate a
  342. // problem with the provided name resolver data.
  343. var ErrBadResolverState = errors.New("bad resolver state")
  344. // ConnectivityStateEvaluator takes the connectivity states of multiple SubConns
  345. // and returns one aggregated connectivity state.
  346. //
  347. // It's not thread safe.
  348. type ConnectivityStateEvaluator struct {
  349. numReady uint64 // Number of addrConns in ready state.
  350. numConnecting uint64 // Number of addrConns in connecting state.
  351. numTransientFailure uint64 // Number of addrConns in transient failure state.
  352. numIdle uint64 // Number of addrConns in idle state.
  353. }
  354. // RecordTransition records state change happening in subConn and based on that
  355. // it evaluates what aggregated state should be.
  356. //
  357. // - If at least one SubConn in Ready, the aggregated state is Ready;
  358. // - Else if at least one SubConn in Connecting, the aggregated state is Connecting;
  359. // - Else if at least one SubConn is TransientFailure, the aggregated state is Transient Failure;
  360. // - Else if at least one SubConn is Idle, the aggregated state is Idle;
  361. // - Else there are no subconns and the aggregated state is Transient Failure
  362. //
  363. // Shutdown is not considered.
  364. func (cse *ConnectivityStateEvaluator) RecordTransition(oldState, newState connectivity.State) connectivity.State {
  365. // Update counters.
  366. for idx, state := range []connectivity.State{oldState, newState} {
  367. updateVal := 2*uint64(idx) - 1 // -1 for oldState and +1 for new.
  368. switch state {
  369. case connectivity.Ready:
  370. cse.numReady += updateVal
  371. case connectivity.Connecting:
  372. cse.numConnecting += updateVal
  373. case connectivity.TransientFailure:
  374. cse.numTransientFailure += updateVal
  375. case connectivity.Idle:
  376. cse.numIdle += updateVal
  377. }
  378. }
  379. // Evaluate.
  380. if cse.numReady > 0 {
  381. return connectivity.Ready
  382. }
  383. if cse.numConnecting > 0 {
  384. return connectivity.Connecting
  385. }
  386. if cse.numTransientFailure > 0 {
  387. return connectivity.TransientFailure
  388. }
  389. if cse.numIdle > 0 {
  390. return connectivity.Idle
  391. }
  392. return connectivity.TransientFailure
  393. }