retry.go 12 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351
  1. // Copyright 2016 The etcd Authors
  2. //
  3. // Licensed under the Apache License, Version 2.0 (the "License");
  4. // you may not use this file except in compliance with the License.
  5. // You may obtain a copy of the License at
  6. //
  7. // http://www.apache.org/licenses/LICENSE-2.0
  8. //
  9. // Unless required by applicable law or agreed to in writing, software
  10. // distributed under the License is distributed on an "AS IS" BASIS,
  11. // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  12. // See the License for the specific language governing permissions and
  13. // limitations under the License.
  14. package clientv3
  15. import (
  16. "context"
  17. "github.com/coreos/etcd/etcdserver/api/v3rpc/rpctypes"
  18. pb "github.com/coreos/etcd/etcdserver/etcdserverpb"
  19. "google.golang.org/grpc"
  20. "google.golang.org/grpc/codes"
  21. "google.golang.org/grpc/status"
  22. )
  23. type rpcFunc func(ctx context.Context) error
  24. type retryRPCFunc func(context.Context, rpcFunc) error
  25. type retryStopErrFunc func(error) bool
  26. func isReadStopError(err error) bool {
  27. eErr := rpctypes.Error(err)
  28. // always stop retry on etcd errors
  29. if _, ok := eErr.(rpctypes.EtcdError); ok {
  30. return true
  31. }
  32. // only retry if unavailable
  33. ev, _ := status.FromError(err)
  34. return ev.Code() != codes.Unavailable
  35. }
  36. func isWriteStopError(err error) bool {
  37. ev, _ := status.FromError(err)
  38. if ev.Code() != codes.Unavailable {
  39. return true
  40. }
  41. return rpctypes.ErrorDesc(err) != "there is no address available"
  42. }
  43. func (c *Client) newRetryWrapper(isStop retryStopErrFunc) retryRPCFunc {
  44. return func(rpcCtx context.Context, f rpcFunc) error {
  45. for {
  46. if err := readyWait(rpcCtx, c.ctx, c.balancer.ConnectNotify()); err != nil {
  47. return err
  48. }
  49. pinned := c.balancer.pinned()
  50. err := f(rpcCtx)
  51. if err == nil {
  52. return nil
  53. }
  54. if logger.V(4) {
  55. logger.Infof("clientv3/retry: error %q on pinned endpoint %q", err.Error(), pinned)
  56. }
  57. // mark this before endpoint switch is triggered
  58. c.balancer.hostPortError(pinned, err)
  59. if s, ok := status.FromError(err); ok && s.Code() == codes.Unavailable {
  60. c.balancer.next()
  61. }
  62. if isStop(err) {
  63. return err
  64. }
  65. }
  66. }
  67. }
  68. func (c *Client) newAuthRetryWrapper() retryRPCFunc {
  69. return func(rpcCtx context.Context, f rpcFunc) error {
  70. for {
  71. pinned := c.balancer.pinned()
  72. err := f(rpcCtx)
  73. if err == nil {
  74. return nil
  75. }
  76. if logger.V(4) {
  77. logger.Infof("clientv3/auth-retry: error %q on pinned endpoint %q", err.Error(), pinned)
  78. }
  79. // always stop retry on etcd errors other than invalid auth token
  80. if rpctypes.Error(err) == rpctypes.ErrInvalidAuthToken {
  81. gterr := c.getToken(rpcCtx)
  82. if gterr != nil {
  83. if logger.V(4) {
  84. logger.Infof("clientv3/auth-retry: cannot retry due to error %q(%q) on pinned endpoint %q", err.Error(), gterr.Error(), pinned)
  85. }
  86. return err // return the original error for simplicity
  87. }
  88. continue
  89. }
  90. return err
  91. }
  92. }
  93. }
  94. // RetryKVClient implements a KVClient that uses the client's FailFast retry policy.
  95. func RetryKVClient(c *Client) pb.KVClient {
  96. readRetry := c.newRetryWrapper(isReadStopError)
  97. writeRetry := c.newRetryWrapper(isWriteStopError)
  98. conn := pb.NewKVClient(c.conn)
  99. retryBasic := &retryKVClient{&retryWriteKVClient{conn, writeRetry}, readRetry}
  100. retryAuthWrapper := c.newAuthRetryWrapper()
  101. return &retryKVClient{
  102. &retryWriteKVClient{retryBasic, retryAuthWrapper},
  103. retryAuthWrapper}
  104. }
  105. type retryKVClient struct {
  106. *retryWriteKVClient
  107. readRetry retryRPCFunc
  108. }
  109. func (rkv *retryKVClient) Range(ctx context.Context, in *pb.RangeRequest, opts ...grpc.CallOption) (resp *pb.RangeResponse, err error) {
  110. err = rkv.readRetry(ctx, func(rctx context.Context) error {
  111. resp, err = rkv.KVClient.Range(rctx, in, opts...)
  112. return err
  113. })
  114. return resp, err
  115. }
  116. type retryWriteKVClient struct {
  117. pb.KVClient
  118. writeRetry retryRPCFunc
  119. }
  120. func (rkv *retryWriteKVClient) Put(ctx context.Context, in *pb.PutRequest, opts ...grpc.CallOption) (resp *pb.PutResponse, err error) {
  121. err = rkv.writeRetry(ctx, func(rctx context.Context) error {
  122. resp, err = rkv.KVClient.Put(rctx, in, opts...)
  123. return err
  124. })
  125. return resp, err
  126. }
  127. func (rkv *retryWriteKVClient) DeleteRange(ctx context.Context, in *pb.DeleteRangeRequest, opts ...grpc.CallOption) (resp *pb.DeleteRangeResponse, err error) {
  128. err = rkv.writeRetry(ctx, func(rctx context.Context) error {
  129. resp, err = rkv.KVClient.DeleteRange(rctx, in, opts...)
  130. return err
  131. })
  132. return resp, err
  133. }
  134. func (rkv *retryWriteKVClient) Txn(ctx context.Context, in *pb.TxnRequest, opts ...grpc.CallOption) (resp *pb.TxnResponse, err error) {
  135. err = rkv.writeRetry(ctx, func(rctx context.Context) error {
  136. resp, err = rkv.KVClient.Txn(rctx, in, opts...)
  137. return err
  138. })
  139. return resp, err
  140. }
  141. func (rkv *retryWriteKVClient) Compact(ctx context.Context, in *pb.CompactionRequest, opts ...grpc.CallOption) (resp *pb.CompactionResponse, err error) {
  142. err = rkv.writeRetry(ctx, func(rctx context.Context) error {
  143. resp, err = rkv.KVClient.Compact(rctx, in, opts...)
  144. return err
  145. })
  146. return resp, err
  147. }
  148. type retryLeaseClient struct {
  149. lc pb.LeaseClient
  150. repeatableRetry retryRPCFunc
  151. }
  152. // RetryLeaseClient implements a LeaseClient.
  153. func RetryLeaseClient(c *Client) pb.LeaseClient {
  154. retry := &retryLeaseClient{
  155. pb.NewLeaseClient(c.conn),
  156. c.newRetryWrapper(isReadStopError),
  157. }
  158. return &retryLeaseClient{retry, c.newAuthRetryWrapper()}
  159. }
  160. func (rlc *retryLeaseClient) LeaseTimeToLive(ctx context.Context, in *pb.LeaseTimeToLiveRequest, opts ...grpc.CallOption) (resp *pb.LeaseTimeToLiveResponse, err error) {
  161. err = rlc.repeatableRetry(ctx, func(rctx context.Context) error {
  162. resp, err = rlc.lc.LeaseTimeToLive(rctx, in, opts...)
  163. return err
  164. })
  165. return resp, err
  166. }
  167. func (rlc *retryLeaseClient) LeaseLeases(ctx context.Context, in *pb.LeaseLeasesRequest, opts ...grpc.CallOption) (resp *pb.LeaseLeasesResponse, err error) {
  168. err = rlc.repeatableRetry(ctx, func(rctx context.Context) error {
  169. resp, err = rlc.lc.LeaseLeases(rctx, in, opts...)
  170. return err
  171. })
  172. return resp, err
  173. }
  174. func (rlc *retryLeaseClient) LeaseGrant(ctx context.Context, in *pb.LeaseGrantRequest, opts ...grpc.CallOption) (resp *pb.LeaseGrantResponse, err error) {
  175. err = rlc.repeatableRetry(ctx, func(rctx context.Context) error {
  176. resp, err = rlc.lc.LeaseGrant(rctx, in, opts...)
  177. return err
  178. })
  179. return resp, err
  180. }
  181. func (rlc *retryLeaseClient) LeaseRevoke(ctx context.Context, in *pb.LeaseRevokeRequest, opts ...grpc.CallOption) (resp *pb.LeaseRevokeResponse, err error) {
  182. err = rlc.repeatableRetry(ctx, func(rctx context.Context) error {
  183. resp, err = rlc.lc.LeaseRevoke(rctx, in, opts...)
  184. return err
  185. })
  186. return resp, err
  187. }
  188. func (rlc *retryLeaseClient) LeaseKeepAlive(ctx context.Context, opts ...grpc.CallOption) (stream pb.Lease_LeaseKeepAliveClient, err error) {
  189. err = rlc.repeatableRetry(ctx, func(rctx context.Context) error {
  190. stream, err = rlc.lc.LeaseKeepAlive(rctx, opts...)
  191. return err
  192. })
  193. return stream, err
  194. }
  195. type retryClusterClient struct {
  196. pb.ClusterClient
  197. writeRetry retryRPCFunc
  198. }
  199. // RetryClusterClient implements a ClusterClient that uses the client's FailFast retry policy.
  200. func RetryClusterClient(c *Client) pb.ClusterClient {
  201. return &retryClusterClient{pb.NewClusterClient(c.conn), c.newRetryWrapper(isWriteStopError)}
  202. }
  203. func (rcc *retryClusterClient) MemberAdd(ctx context.Context, in *pb.MemberAddRequest, opts ...grpc.CallOption) (resp *pb.MemberAddResponse, err error) {
  204. err = rcc.writeRetry(ctx, func(rctx context.Context) error {
  205. resp, err = rcc.ClusterClient.MemberAdd(rctx, in, opts...)
  206. return err
  207. })
  208. return resp, err
  209. }
  210. func (rcc *retryClusterClient) MemberRemove(ctx context.Context, in *pb.MemberRemoveRequest, opts ...grpc.CallOption) (resp *pb.MemberRemoveResponse, err error) {
  211. err = rcc.writeRetry(ctx, func(rctx context.Context) error {
  212. resp, err = rcc.ClusterClient.MemberRemove(rctx, in, opts...)
  213. return err
  214. })
  215. return resp, err
  216. }
  217. func (rcc *retryClusterClient) MemberUpdate(ctx context.Context, in *pb.MemberUpdateRequest, opts ...grpc.CallOption) (resp *pb.MemberUpdateResponse, err error) {
  218. err = rcc.writeRetry(ctx, func(rctx context.Context) error {
  219. resp, err = rcc.ClusterClient.MemberUpdate(rctx, in, opts...)
  220. return err
  221. })
  222. return resp, err
  223. }
  224. type retryAuthClient struct {
  225. pb.AuthClient
  226. writeRetry retryRPCFunc
  227. }
  228. // RetryAuthClient implements a AuthClient that uses the client's FailFast retry policy.
  229. func RetryAuthClient(c *Client) pb.AuthClient {
  230. return &retryAuthClient{pb.NewAuthClient(c.conn), c.newRetryWrapper(isWriteStopError)}
  231. }
  232. func (rac *retryAuthClient) AuthEnable(ctx context.Context, in *pb.AuthEnableRequest, opts ...grpc.CallOption) (resp *pb.AuthEnableResponse, err error) {
  233. err = rac.writeRetry(ctx, func(rctx context.Context) error {
  234. resp, err = rac.AuthClient.AuthEnable(rctx, in, opts...)
  235. return err
  236. })
  237. return resp, err
  238. }
  239. func (rac *retryAuthClient) AuthDisable(ctx context.Context, in *pb.AuthDisableRequest, opts ...grpc.CallOption) (resp *pb.AuthDisableResponse, err error) {
  240. err = rac.writeRetry(ctx, func(rctx context.Context) error {
  241. resp, err = rac.AuthClient.AuthDisable(rctx, in, opts...)
  242. return err
  243. })
  244. return resp, err
  245. }
  246. func (rac *retryAuthClient) UserAdd(ctx context.Context, in *pb.AuthUserAddRequest, opts ...grpc.CallOption) (resp *pb.AuthUserAddResponse, err error) {
  247. err = rac.writeRetry(ctx, func(rctx context.Context) error {
  248. resp, err = rac.AuthClient.UserAdd(rctx, in, opts...)
  249. return err
  250. })
  251. return resp, err
  252. }
  253. func (rac *retryAuthClient) UserDelete(ctx context.Context, in *pb.AuthUserDeleteRequest, opts ...grpc.CallOption) (resp *pb.AuthUserDeleteResponse, err error) {
  254. err = rac.writeRetry(ctx, func(rctx context.Context) error {
  255. resp, err = rac.AuthClient.UserDelete(rctx, in, opts...)
  256. return err
  257. })
  258. return resp, err
  259. }
  260. func (rac *retryAuthClient) UserChangePassword(ctx context.Context, in *pb.AuthUserChangePasswordRequest, opts ...grpc.CallOption) (resp *pb.AuthUserChangePasswordResponse, err error) {
  261. err = rac.writeRetry(ctx, func(rctx context.Context) error {
  262. resp, err = rac.AuthClient.UserChangePassword(rctx, in, opts...)
  263. return err
  264. })
  265. return resp, err
  266. }
  267. func (rac *retryAuthClient) UserGrantRole(ctx context.Context, in *pb.AuthUserGrantRoleRequest, opts ...grpc.CallOption) (resp *pb.AuthUserGrantRoleResponse, err error) {
  268. err = rac.writeRetry(ctx, func(rctx context.Context) error {
  269. resp, err = rac.AuthClient.UserGrantRole(rctx, in, opts...)
  270. return err
  271. })
  272. return resp, err
  273. }
  274. func (rac *retryAuthClient) UserRevokeRole(ctx context.Context, in *pb.AuthUserRevokeRoleRequest, opts ...grpc.CallOption) (resp *pb.AuthUserRevokeRoleResponse, err error) {
  275. err = rac.writeRetry(ctx, func(rctx context.Context) error {
  276. resp, err = rac.AuthClient.UserRevokeRole(rctx, in, opts...)
  277. return err
  278. })
  279. return resp, err
  280. }
  281. func (rac *retryAuthClient) RoleAdd(ctx context.Context, in *pb.AuthRoleAddRequest, opts ...grpc.CallOption) (resp *pb.AuthRoleAddResponse, err error) {
  282. err = rac.writeRetry(ctx, func(rctx context.Context) error {
  283. resp, err = rac.AuthClient.RoleAdd(rctx, in, opts...)
  284. return err
  285. })
  286. return resp, err
  287. }
  288. func (rac *retryAuthClient) RoleDelete(ctx context.Context, in *pb.AuthRoleDeleteRequest, opts ...grpc.CallOption) (resp *pb.AuthRoleDeleteResponse, err error) {
  289. err = rac.writeRetry(ctx, func(rctx context.Context) error {
  290. resp, err = rac.AuthClient.RoleDelete(rctx, in, opts...)
  291. return err
  292. })
  293. return resp, err
  294. }
  295. func (rac *retryAuthClient) RoleGrantPermission(ctx context.Context, in *pb.AuthRoleGrantPermissionRequest, opts ...grpc.CallOption) (resp *pb.AuthRoleGrantPermissionResponse, err error) {
  296. err = rac.writeRetry(ctx, func(rctx context.Context) error {
  297. resp, err = rac.AuthClient.RoleGrantPermission(rctx, in, opts...)
  298. return err
  299. })
  300. return resp, err
  301. }
  302. func (rac *retryAuthClient) RoleRevokePermission(ctx context.Context, in *pb.AuthRoleRevokePermissionRequest, opts ...grpc.CallOption) (resp *pb.AuthRoleRevokePermissionResponse, err error) {
  303. err = rac.writeRetry(ctx, func(rctx context.Context) error {
  304. resp, err = rac.AuthClient.RoleRevokePermission(rctx, in, opts...)
  305. return err
  306. })
  307. return resp, err
  308. }