balancer.go 16 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404
  1. /*
  2. *
  3. * Copyright 2017 gRPC authors.
  4. *
  5. * Licensed under the Apache License, Version 2.0 (the "License");
  6. * you may not use this file except in compliance with the License.
  7. * You may obtain a copy of the License at
  8. *
  9. * http://www.apache.org/licenses/LICENSE-2.0
  10. *
  11. * Unless required by applicable law or agreed to in writing, software
  12. * distributed under the License is distributed on an "AS IS" BASIS,
  13. * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  14. * See the License for the specific language governing permissions and
  15. * limitations under the License.
  16. *
  17. */
  18. // Package balancer defines APIs for load balancing in gRPC.
  19. // All APIs in this package are experimental.
  20. package balancer
  21. import (
  22. "context"
  23. "encoding/json"
  24. "errors"
  25. "net"
  26. "strings"
  27. "google.golang.org/grpc/channelz"
  28. "google.golang.org/grpc/connectivity"
  29. "google.golang.org/grpc/credentials"
  30. "google.golang.org/grpc/internal"
  31. "google.golang.org/grpc/metadata"
  32. "google.golang.org/grpc/resolver"
  33. "google.golang.org/grpc/serviceconfig"
  34. )
  35. var (
  36. // m is a map from name to balancer builder.
  37. m = make(map[string]Builder)
  38. )
  39. // Register registers the balancer builder to the balancer map. b.Name
  40. // (lowercased) will be used as the name registered with this builder. If the
  41. // Builder implements ConfigParser, ParseConfig will be called when new service
  42. // configs are received by the resolver, and the result will be provided to the
  43. // Balancer in UpdateClientConnState.
  44. //
  45. // NOTE: this function must only be called during initialization time (i.e. in
  46. // an init() function), and is not thread-safe. If multiple Balancers are
  47. // registered with the same name, the one registered last will take effect.
  48. func Register(b Builder) {
  49. m[strings.ToLower(b.Name())] = b
  50. }
  51. // unregisterForTesting deletes the balancer with the given name from the
  52. // balancer map.
  53. //
  54. // This function is not thread-safe.
  55. func unregisterForTesting(name string) {
  56. delete(m, name)
  57. }
  58. func init() {
  59. internal.BalancerUnregister = unregisterForTesting
  60. }
  61. // Get returns the resolver builder registered with the given name.
  62. // Note that the compare is done in a case-insensitive fashion.
  63. // If no builder is register with the name, nil will be returned.
  64. func Get(name string) Builder {
  65. if b, ok := m[strings.ToLower(name)]; ok {
  66. return b
  67. }
  68. return nil
  69. }
  70. // A SubConn represents a single connection to a gRPC backend service.
  71. //
  72. // Each SubConn contains a list of addresses.
  73. //
  74. // All SubConns start in IDLE, and will not try to connect. To trigger the
  75. // connecting, Balancers must call Connect. If a connection re-enters IDLE,
  76. // Balancers must call Connect again to trigger a new connection attempt.
  77. //
  78. // gRPC will try to connect to the addresses in sequence, and stop trying the
  79. // remainder once the first connection is successful. If an attempt to connect
  80. // to all addresses encounters an error, the SubConn will enter
  81. // TRANSIENT_FAILURE for a backoff period, and then transition to IDLE.
  82. //
  83. // Once established, if a connection is lost, the SubConn will transition
  84. // directly to IDLE.
  85. //
  86. // This interface is to be implemented by gRPC. Users should not need their own
  87. // implementation of this interface. For situations like testing, any
  88. // implementations should embed this interface. This allows gRPC to add new
  89. // methods to this interface.
  90. type SubConn interface {
  91. // UpdateAddresses updates the addresses used in this SubConn.
  92. // gRPC checks if currently-connected address is still in the new list.
  93. // If it's in the list, the connection will be kept.
  94. // If it's not in the list, the connection will gracefully closed, and
  95. // a new connection will be created.
  96. //
  97. // This will trigger a state transition for the SubConn.
  98. //
  99. // Deprecated: This method is now part of the ClientConn interface and will
  100. // eventually be removed from here.
  101. UpdateAddresses([]resolver.Address)
  102. // Connect starts the connecting for this SubConn.
  103. Connect()
  104. // GetOrBuildProducer returns a reference to the existing Producer for this
  105. // ProducerBuilder in this SubConn, or, if one does not currently exist,
  106. // creates a new one and returns it. Returns a close function which must
  107. // be called when the Producer is no longer needed.
  108. GetOrBuildProducer(ProducerBuilder) (p Producer, close func())
  109. }
  110. // NewSubConnOptions contains options to create new SubConn.
  111. type NewSubConnOptions struct {
  112. // CredsBundle is the credentials bundle that will be used in the created
  113. // SubConn. If it's nil, the original creds from grpc DialOptions will be
  114. // used.
  115. //
  116. // Deprecated: Use the Attributes field in resolver.Address to pass
  117. // arbitrary data to the credential handshaker.
  118. CredsBundle credentials.Bundle
  119. // HealthCheckEnabled indicates whether health check service should be
  120. // enabled on this SubConn
  121. HealthCheckEnabled bool
  122. }
  123. // State contains the balancer's state relevant to the gRPC ClientConn.
  124. type State struct {
  125. // State contains the connectivity state of the balancer, which is used to
  126. // determine the state of the ClientConn.
  127. ConnectivityState connectivity.State
  128. // Picker is used to choose connections (SubConns) for RPCs.
  129. Picker Picker
  130. }
  131. // ClientConn represents a gRPC ClientConn.
  132. //
  133. // This interface is to be implemented by gRPC. Users should not need a
  134. // brand new implementation of this interface. For the situations like
  135. // testing, the new implementation should embed this interface. This allows
  136. // gRPC to add new methods to this interface.
  137. type ClientConn interface {
  138. // NewSubConn is called by balancer to create a new SubConn.
  139. // It doesn't block and wait for the connections to be established.
  140. // Behaviors of the SubConn can be controlled by options.
  141. NewSubConn([]resolver.Address, NewSubConnOptions) (SubConn, error)
  142. // RemoveSubConn removes the SubConn from ClientConn.
  143. // The SubConn will be shutdown.
  144. RemoveSubConn(SubConn)
  145. // UpdateAddresses updates the addresses used in the passed in SubConn.
  146. // gRPC checks if the currently connected address is still in the new list.
  147. // If so, the connection will be kept. Else, the connection will be
  148. // gracefully closed, and a new connection will be created.
  149. //
  150. // This will trigger a state transition for the SubConn.
  151. UpdateAddresses(SubConn, []resolver.Address)
  152. // UpdateState notifies gRPC that the balancer's internal state has
  153. // changed.
  154. //
  155. // gRPC will update the connectivity state of the ClientConn, and will call
  156. // Pick on the new Picker to pick new SubConns.
  157. UpdateState(State)
  158. // ResolveNow is called by balancer to notify gRPC to do a name resolving.
  159. ResolveNow(resolver.ResolveNowOptions)
  160. // Target returns the dial target for this ClientConn.
  161. //
  162. // Deprecated: Use the Target field in the BuildOptions instead.
  163. Target() string
  164. }
  165. // BuildOptions contains additional information for Build.
  166. type BuildOptions struct {
  167. // DialCreds is the transport credentials to use when communicating with a
  168. // remote load balancer server. Balancer implementations which do not
  169. // communicate with a remote load balancer server can ignore this field.
  170. DialCreds credentials.TransportCredentials
  171. // CredsBundle is the credentials bundle to use when communicating with a
  172. // remote load balancer server. Balancer implementations which do not
  173. // communicate with a remote load balancer server can ignore this field.
  174. CredsBundle credentials.Bundle
  175. // Dialer is the custom dialer to use when communicating with a remote load
  176. // balancer server. Balancer implementations which do not communicate with a
  177. // remote load balancer server can ignore this field.
  178. Dialer func(context.Context, string) (net.Conn, error)
  179. // Authority is the server name to use as part of the authentication
  180. // handshake when communicating with a remote load balancer server. Balancer
  181. // implementations which do not communicate with a remote load balancer
  182. // server can ignore this field.
  183. Authority string
  184. // ChannelzParentID is the parent ClientConn's channelz ID.
  185. ChannelzParentID *channelz.Identifier
  186. // CustomUserAgent is the custom user agent set on the parent ClientConn.
  187. // The balancer should set the same custom user agent if it creates a
  188. // ClientConn.
  189. CustomUserAgent string
  190. // Target contains the parsed address info of the dial target. It is the
  191. // same resolver.Target as passed to the resolver. See the documentation for
  192. // the resolver.Target type for details about what it contains.
  193. Target resolver.Target
  194. }
  195. // Builder creates a balancer.
  196. type Builder interface {
  197. // Build creates a new balancer with the ClientConn.
  198. Build(cc ClientConn, opts BuildOptions) Balancer
  199. // Name returns the name of balancers built by this builder.
  200. // It will be used to pick balancers (for example in service config).
  201. Name() string
  202. }
  203. // ConfigParser parses load balancer configs.
  204. type ConfigParser interface {
  205. // ParseConfig parses the JSON load balancer config provided into an
  206. // internal form or returns an error if the config is invalid. For future
  207. // compatibility reasons, unknown fields in the config should be ignored.
  208. ParseConfig(LoadBalancingConfigJSON json.RawMessage) (serviceconfig.LoadBalancingConfig, error)
  209. }
  210. // PickInfo contains additional information for the Pick operation.
  211. type PickInfo struct {
  212. // FullMethodName is the method name that NewClientStream() is called
  213. // with. The canonical format is /service/Method.
  214. FullMethodName string
  215. // Ctx is the RPC's context, and may contain relevant RPC-level information
  216. // like the outgoing header metadata.
  217. Ctx context.Context
  218. }
  219. // DoneInfo contains additional information for done.
  220. type DoneInfo struct {
  221. // Err is the rpc error the RPC finished with. It could be nil.
  222. Err error
  223. // Trailer contains the metadata from the RPC's trailer, if present.
  224. Trailer metadata.MD
  225. // BytesSent indicates if any bytes have been sent to the server.
  226. BytesSent bool
  227. // BytesReceived indicates if any byte has been received from the server.
  228. BytesReceived bool
  229. // ServerLoad is the load received from server. It's usually sent as part of
  230. // trailing metadata.
  231. //
  232. // The only supported type now is *orca_v3.LoadReport.
  233. ServerLoad interface{}
  234. }
  235. var (
  236. // ErrNoSubConnAvailable indicates no SubConn is available for pick().
  237. // gRPC will block the RPC until a new picker is available via UpdateState().
  238. ErrNoSubConnAvailable = errors.New("no SubConn is available")
  239. // ErrTransientFailure indicates all SubConns are in TransientFailure.
  240. // WaitForReady RPCs will block, non-WaitForReady RPCs will fail.
  241. //
  242. // Deprecated: return an appropriate error based on the last resolution or
  243. // connection attempt instead. The behavior is the same for any non-gRPC
  244. // status error.
  245. ErrTransientFailure = errors.New("all SubConns are in TransientFailure")
  246. )
  247. // PickResult contains information related to a connection chosen for an RPC.
  248. type PickResult struct {
  249. // SubConn is the connection to use for this pick, if its state is Ready.
  250. // If the state is not Ready, gRPC will block the RPC until a new Picker is
  251. // provided by the balancer (using ClientConn.UpdateState). The SubConn
  252. // must be one returned by ClientConn.NewSubConn.
  253. SubConn SubConn
  254. // Done is called when the RPC is completed. If the SubConn is not ready,
  255. // this will be called with a nil parameter. If the SubConn is not a valid
  256. // type, Done may not be called. May be nil if the balancer does not wish
  257. // to be notified when the RPC completes.
  258. Done func(DoneInfo)
  259. // Metadata provides a way for LB policies to inject arbitrary per-call
  260. // metadata. Any metadata returned here will be merged with existing
  261. // metadata added by the client application.
  262. //
  263. // LB policies with child policies are responsible for propagating metadata
  264. // injected by their children to the ClientConn, as part of Pick().
  265. Metadata metadata.MD
  266. }
  267. // TransientFailureError returns e. It exists for backward compatibility and
  268. // will be deleted soon.
  269. //
  270. // Deprecated: no longer necessary, picker errors are treated this way by
  271. // default.
  272. func TransientFailureError(e error) error { return e }
  273. // Picker is used by gRPC to pick a SubConn to send an RPC.
  274. // Balancer is expected to generate a new picker from its snapshot every time its
  275. // internal state has changed.
  276. //
  277. // The pickers used by gRPC can be updated by ClientConn.UpdateState().
  278. type Picker interface {
  279. // Pick returns the connection to use for this RPC and related information.
  280. //
  281. // Pick should not block. If the balancer needs to do I/O or any blocking
  282. // or time-consuming work to service this call, it should return
  283. // ErrNoSubConnAvailable, and the Pick call will be repeated by gRPC when
  284. // the Picker is updated (using ClientConn.UpdateState).
  285. //
  286. // If an error is returned:
  287. //
  288. // - If the error is ErrNoSubConnAvailable, gRPC will block until a new
  289. // Picker is provided by the balancer (using ClientConn.UpdateState).
  290. //
  291. // - If the error is a status error (implemented by the grpc/status
  292. // package), gRPC will terminate the RPC with the code and message
  293. // provided.
  294. //
  295. // - For all other errors, wait for ready RPCs will wait, but non-wait for
  296. // ready RPCs will be terminated with this error's Error() string and
  297. // status code Unavailable.
  298. Pick(info PickInfo) (PickResult, error)
  299. }
  300. // Balancer takes input from gRPC, manages SubConns, and collects and aggregates
  301. // the connectivity states.
  302. //
  303. // It also generates and updates the Picker used by gRPC to pick SubConns for RPCs.
  304. //
  305. // UpdateClientConnState, ResolverError, UpdateSubConnState, and Close are
  306. // guaranteed to be called synchronously from the same goroutine. There's no
  307. // guarantee on picker.Pick, it may be called anytime.
  308. type Balancer interface {
  309. // UpdateClientConnState is called by gRPC when the state of the ClientConn
  310. // changes. If the error returned is ErrBadResolverState, the ClientConn
  311. // will begin calling ResolveNow on the active name resolver with
  312. // exponential backoff until a subsequent call to UpdateClientConnState
  313. // returns a nil error. Any other errors are currently ignored.
  314. UpdateClientConnState(ClientConnState) error
  315. // ResolverError is called by gRPC when the name resolver reports an error.
  316. ResolverError(error)
  317. // UpdateSubConnState is called by gRPC when the state of a SubConn
  318. // changes.
  319. UpdateSubConnState(SubConn, SubConnState)
  320. // Close closes the balancer. The balancer is not required to call
  321. // ClientConn.RemoveSubConn for its existing SubConns.
  322. Close()
  323. }
  324. // ExitIdler is an optional interface for balancers to implement. If
  325. // implemented, ExitIdle will be called when ClientConn.Connect is called, if
  326. // the ClientConn is idle. If unimplemented, ClientConn.Connect will cause
  327. // all SubConns to connect.
  328. //
  329. // Notice: it will be required for all balancers to implement this in a future
  330. // release.
  331. type ExitIdler interface {
  332. // ExitIdle instructs the LB policy to reconnect to backends / exit the
  333. // IDLE state, if appropriate and possible. Note that SubConns that enter
  334. // the IDLE state will not reconnect until SubConn.Connect is called.
  335. ExitIdle()
  336. }
  337. // SubConnState describes the state of a SubConn.
  338. type SubConnState struct {
  339. // ConnectivityState is the connectivity state of the SubConn.
  340. ConnectivityState connectivity.State
  341. // ConnectionError is set if the ConnectivityState is TransientFailure,
  342. // describing the reason the SubConn failed. Otherwise, it is nil.
  343. ConnectionError error
  344. }
  345. // ClientConnState describes the state of a ClientConn relevant to the
  346. // balancer.
  347. type ClientConnState struct {
  348. ResolverState resolver.State
  349. // The parsed load balancing configuration returned by the builder's
  350. // ParseConfig method, if implemented.
  351. BalancerConfig serviceconfig.LoadBalancingConfig
  352. }
  353. // ErrBadResolverState may be returned by UpdateClientConnState to indicate a
  354. // problem with the provided name resolver data.
  355. var ErrBadResolverState = errors.New("bad resolver state")
  356. // A ProducerBuilder is a simple constructor for a Producer. It is used by the
  357. // SubConn to create producers when needed.
  358. type ProducerBuilder interface {
  359. // Build creates a Producer. The first parameter is always a
  360. // grpc.ClientConnInterface (a type to allow creating RPCs/streams on the
  361. // associated SubConn), but is declared as interface{} to avoid a
  362. // dependency cycle. Should also return a close function that will be
  363. // called when all references to the Producer have been given up.
  364. Build(grpcClientConnInterface interface{}) (p Producer, close func())
  365. }
  366. // A Producer is a type shared among potentially many consumers. It is
  367. // associated with a SubConn, and an implementation will typically contain
  368. // other methods to provide additional functionality, e.g. configuration or
  369. // subscription registration.
  370. type Producer interface {
  371. }