retry.go 13 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368
  1. // Copyright 2016 The etcd Authors
  2. //
  3. // Licensed under the Apache License, Version 2.0 (the "License");
  4. // you may not use this file except in compliance with the License.
  5. // You may obtain a copy of the License at
  6. //
  7. // http://www.apache.org/licenses/LICENSE-2.0
  8. //
  9. // Unless required by applicable law or agreed to in writing, software
  10. // distributed under the License is distributed on an "AS IS" BASIS,
  11. // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  12. // See the License for the specific language governing permissions and
  13. // limitations under the License.
  14. package clientv3
  15. import (
  16. "context"
  17. "github.com/coreos/etcd/etcdserver/api/v3rpc/rpctypes"
  18. pb "github.com/coreos/etcd/etcdserver/etcdserverpb"
  19. "google.golang.org/grpc"
  20. "google.golang.org/grpc/codes"
  21. "google.golang.org/grpc/status"
  22. )
  23. type rpcFunc func(ctx context.Context) error
  24. type retryRPCFunc func(context.Context, rpcFunc) error
  25. type retryStopErrFunc func(error) bool
  26. func isRepeatableStopError(err error) bool {
  27. eErr := rpctypes.Error(err)
  28. // always stop retry on etcd errors
  29. if _, ok := eErr.(rpctypes.EtcdError); ok {
  30. return true
  31. }
  32. // only retry if unavailable
  33. ev, _ := status.FromError(err)
  34. return ev.Code() != codes.Unavailable
  35. }
  36. func isNonRepeatableStopError(err error) bool {
  37. ev, _ := status.FromError(err)
  38. if ev.Code() != codes.Unavailable {
  39. return true
  40. }
  41. return rpctypes.ErrorDesc(err) != "there is no address available"
  42. }
  43. func (c *Client) newRetryWrapper(isStop retryStopErrFunc) retryRPCFunc {
  44. return func(rpcCtx context.Context, f rpcFunc) error {
  45. for {
  46. if err := readyWait(rpcCtx, c.ctx, c.balancer.ConnectNotify()); err != nil {
  47. return err
  48. }
  49. pinned := c.balancer.pinned()
  50. err := f(rpcCtx)
  51. if err == nil {
  52. return nil
  53. }
  54. if logger.V(4) {
  55. logger.Infof("clientv3/retry: error %q on pinned endpoint %q", err.Error(), pinned)
  56. }
  57. // mark this before endpoint switch is triggered
  58. c.balancer.hostPortError(pinned, err)
  59. if s, ok := status.FromError(err); ok && s.Code() == codes.Unavailable {
  60. c.balancer.next()
  61. }
  62. if isStop(err) {
  63. return err
  64. }
  65. }
  66. }
  67. }
  68. func (c *Client) newAuthRetryWrapper() retryRPCFunc {
  69. return func(rpcCtx context.Context, f rpcFunc) error {
  70. for {
  71. pinned := c.balancer.pinned()
  72. err := f(rpcCtx)
  73. if err == nil {
  74. return nil
  75. }
  76. if logger.V(4) {
  77. logger.Infof("clientv3/auth-retry: error %q on pinned endpoint %q", err.Error(), pinned)
  78. }
  79. // always stop retry on etcd errors other than invalid auth token
  80. if rpctypes.Error(err) == rpctypes.ErrInvalidAuthToken {
  81. gterr := c.getToken(rpcCtx)
  82. if gterr != nil {
  83. if logger.V(4) {
  84. logger.Infof("clientv3/auth-retry: cannot retry due to error %q(%q) on pinned endpoint %q", err.Error(), gterr.Error(), pinned)
  85. }
  86. return err // return the original error for simplicity
  87. }
  88. continue
  89. }
  90. return err
  91. }
  92. }
  93. }
  94. // RetryKVClient implements a KVClient.
  95. func RetryKVClient(c *Client) pb.KVClient {
  96. repeatableRetry := c.newRetryWrapper(isRepeatableStopError)
  97. nonRepeatableRetry := c.newRetryWrapper(isNonRepeatableStopError)
  98. conn := pb.NewKVClient(c.conn)
  99. retryBasic := &retryKVClient{&nonRepeatableKVClient{conn, nonRepeatableRetry}, repeatableRetry}
  100. retryAuthWrapper := c.newAuthRetryWrapper()
  101. return &retryKVClient{
  102. &nonRepeatableKVClient{retryBasic, retryAuthWrapper},
  103. retryAuthWrapper}
  104. }
  105. type retryKVClient struct {
  106. *nonRepeatableKVClient
  107. repeatableRetry retryRPCFunc
  108. }
  109. func (rkv *retryKVClient) Range(ctx context.Context, in *pb.RangeRequest, opts ...grpc.CallOption) (resp *pb.RangeResponse, err error) {
  110. err = rkv.repeatableRetry(ctx, func(rctx context.Context) error {
  111. resp, err = rkv.kc.Range(rctx, in, opts...)
  112. return err
  113. })
  114. return resp, err
  115. }
  116. type nonRepeatableKVClient struct {
  117. kc pb.KVClient
  118. nonRepeatableRetry retryRPCFunc
  119. }
  120. func (rkv *nonRepeatableKVClient) Put(ctx context.Context, in *pb.PutRequest, opts ...grpc.CallOption) (resp *pb.PutResponse, err error) {
  121. err = rkv.nonRepeatableRetry(ctx, func(rctx context.Context) error {
  122. resp, err = rkv.kc.Put(rctx, in, opts...)
  123. return err
  124. })
  125. return resp, err
  126. }
  127. func (rkv *nonRepeatableKVClient) DeleteRange(ctx context.Context, in *pb.DeleteRangeRequest, opts ...grpc.CallOption) (resp *pb.DeleteRangeResponse, err error) {
  128. err = rkv.nonRepeatableRetry(ctx, func(rctx context.Context) error {
  129. resp, err = rkv.kc.DeleteRange(rctx, in, opts...)
  130. return err
  131. })
  132. return resp, err
  133. }
  134. func (rkv *nonRepeatableKVClient) Txn(ctx context.Context, in *pb.TxnRequest, opts ...grpc.CallOption) (resp *pb.TxnResponse, err error) {
  135. // TODO: repeatableRetry if read-only txn
  136. err = rkv.nonRepeatableRetry(ctx, func(rctx context.Context) error {
  137. resp, err = rkv.kc.Txn(rctx, in, opts...)
  138. return err
  139. })
  140. return resp, err
  141. }
  142. func (rkv *nonRepeatableKVClient) Compact(ctx context.Context, in *pb.CompactionRequest, opts ...grpc.CallOption) (resp *pb.CompactionResponse, err error) {
  143. err = rkv.nonRepeatableRetry(ctx, func(rctx context.Context) error {
  144. resp, err = rkv.kc.Compact(rctx, in, opts...)
  145. return err
  146. })
  147. return resp, err
  148. }
  149. type retryLeaseClient struct {
  150. lc pb.LeaseClient
  151. repeatableRetry retryRPCFunc
  152. }
  153. // RetryLeaseClient implements a LeaseClient.
  154. func RetryLeaseClient(c *Client) pb.LeaseClient {
  155. retry := &retryLeaseClient{
  156. pb.NewLeaseClient(c.conn),
  157. c.newRetryWrapper(isRepeatableStopError),
  158. }
  159. return &retryLeaseClient{retry, c.newAuthRetryWrapper()}
  160. }
  161. func (rlc *retryLeaseClient) LeaseTimeToLive(ctx context.Context, in *pb.LeaseTimeToLiveRequest, opts ...grpc.CallOption) (resp *pb.LeaseTimeToLiveResponse, err error) {
  162. err = rlc.repeatableRetry(ctx, func(rctx context.Context) error {
  163. resp, err = rlc.lc.LeaseTimeToLive(rctx, in, opts...)
  164. return err
  165. })
  166. return resp, err
  167. }
  168. func (rlc *retryLeaseClient) LeaseLeases(ctx context.Context, in *pb.LeaseLeasesRequest, opts ...grpc.CallOption) (resp *pb.LeaseLeasesResponse, err error) {
  169. err = rlc.repeatableRetry(ctx, func(rctx context.Context) error {
  170. resp, err = rlc.lc.LeaseLeases(rctx, in, opts...)
  171. return err
  172. })
  173. return resp, err
  174. }
  175. func (rlc *retryLeaseClient) LeaseGrant(ctx context.Context, in *pb.LeaseGrantRequest, opts ...grpc.CallOption) (resp *pb.LeaseGrantResponse, err error) {
  176. err = rlc.repeatableRetry(ctx, func(rctx context.Context) error {
  177. resp, err = rlc.lc.LeaseGrant(rctx, in, opts...)
  178. return err
  179. })
  180. return resp, err
  181. }
  182. func (rlc *retryLeaseClient) LeaseRevoke(ctx context.Context, in *pb.LeaseRevokeRequest, opts ...grpc.CallOption) (resp *pb.LeaseRevokeResponse, err error) {
  183. err = rlc.repeatableRetry(ctx, func(rctx context.Context) error {
  184. resp, err = rlc.lc.LeaseRevoke(rctx, in, opts...)
  185. return err
  186. })
  187. return resp, err
  188. }
  189. func (rlc *retryLeaseClient) LeaseKeepAlive(ctx context.Context, opts ...grpc.CallOption) (stream pb.Lease_LeaseKeepAliveClient, err error) {
  190. err = rlc.repeatableRetry(ctx, func(rctx context.Context) error {
  191. stream, err = rlc.lc.LeaseKeepAlive(rctx, opts...)
  192. return err
  193. })
  194. return stream, err
  195. }
  196. type retryClusterClient struct {
  197. *nonRepeatableClusterClient
  198. repeatableRetry retryRPCFunc
  199. }
  200. // RetryClusterClient implements a ClusterClient.
  201. func RetryClusterClient(c *Client) pb.ClusterClient {
  202. repeatableRetry := c.newRetryWrapper(isRepeatableStopError)
  203. nonRepeatableRetry := c.newRetryWrapper(isNonRepeatableStopError)
  204. cc := pb.NewClusterClient(c.conn)
  205. return &retryClusterClient{&nonRepeatableClusterClient{cc, nonRepeatableRetry}, repeatableRetry}
  206. }
  207. func (rcc *retryClusterClient) MemberList(ctx context.Context, in *pb.MemberListRequest, opts ...grpc.CallOption) (resp *pb.MemberListResponse, err error) {
  208. err = rcc.repeatableRetry(ctx, func(rctx context.Context) error {
  209. resp, err = rcc.cc.MemberList(rctx, in, opts...)
  210. return err
  211. })
  212. return resp, err
  213. }
  214. type nonRepeatableClusterClient struct {
  215. cc pb.ClusterClient
  216. nonRepeatableRetry retryRPCFunc
  217. }
  218. func (rcc *nonRepeatableClusterClient) MemberAdd(ctx context.Context, in *pb.MemberAddRequest, opts ...grpc.CallOption) (resp *pb.MemberAddResponse, err error) {
  219. err = rcc.nonRepeatableRetry(ctx, func(rctx context.Context) error {
  220. resp, err = rcc.cc.MemberAdd(rctx, in, opts...)
  221. return err
  222. })
  223. return resp, err
  224. }
  225. func (rcc *nonRepeatableClusterClient) MemberRemove(ctx context.Context, in *pb.MemberRemoveRequest, opts ...grpc.CallOption) (resp *pb.MemberRemoveResponse, err error) {
  226. err = rcc.nonRepeatableRetry(ctx, func(rctx context.Context) error {
  227. resp, err = rcc.cc.MemberRemove(rctx, in, opts...)
  228. return err
  229. })
  230. return resp, err
  231. }
  232. func (rcc *nonRepeatableClusterClient) MemberUpdate(ctx context.Context, in *pb.MemberUpdateRequest, opts ...grpc.CallOption) (resp *pb.MemberUpdateResponse, err error) {
  233. err = rcc.nonRepeatableRetry(ctx, func(rctx context.Context) error {
  234. resp, err = rcc.cc.MemberUpdate(rctx, in, opts...)
  235. return err
  236. })
  237. return resp, err
  238. }
  239. type retryAuthClient struct {
  240. pb.AuthClient
  241. writeRetry retryRPCFunc
  242. }
  243. // RetryAuthClient implements a AuthClient that uses the client's FailFast retry policy.
  244. func RetryAuthClient(c *Client) pb.AuthClient {
  245. return &retryAuthClient{pb.NewAuthClient(c.conn), c.newRetryWrapper(isNonRepeatableStopError)}
  246. }
  247. func (rac *retryAuthClient) AuthEnable(ctx context.Context, in *pb.AuthEnableRequest, opts ...grpc.CallOption) (resp *pb.AuthEnableResponse, err error) {
  248. err = rac.writeRetry(ctx, func(rctx context.Context) error {
  249. resp, err = rac.AuthClient.AuthEnable(rctx, in, opts...)
  250. return err
  251. })
  252. return resp, err
  253. }
  254. func (rac *retryAuthClient) AuthDisable(ctx context.Context, in *pb.AuthDisableRequest, opts ...grpc.CallOption) (resp *pb.AuthDisableResponse, err error) {
  255. err = rac.writeRetry(ctx, func(rctx context.Context) error {
  256. resp, err = rac.AuthClient.AuthDisable(rctx, in, opts...)
  257. return err
  258. })
  259. return resp, err
  260. }
  261. func (rac *retryAuthClient) UserAdd(ctx context.Context, in *pb.AuthUserAddRequest, opts ...grpc.CallOption) (resp *pb.AuthUserAddResponse, err error) {
  262. err = rac.writeRetry(ctx, func(rctx context.Context) error {
  263. resp, err = rac.AuthClient.UserAdd(rctx, in, opts...)
  264. return err
  265. })
  266. return resp, err
  267. }
  268. func (rac *retryAuthClient) UserDelete(ctx context.Context, in *pb.AuthUserDeleteRequest, opts ...grpc.CallOption) (resp *pb.AuthUserDeleteResponse, err error) {
  269. err = rac.writeRetry(ctx, func(rctx context.Context) error {
  270. resp, err = rac.AuthClient.UserDelete(rctx, in, opts...)
  271. return err
  272. })
  273. return resp, err
  274. }
  275. func (rac *retryAuthClient) UserChangePassword(ctx context.Context, in *pb.AuthUserChangePasswordRequest, opts ...grpc.CallOption) (resp *pb.AuthUserChangePasswordResponse, err error) {
  276. err = rac.writeRetry(ctx, func(rctx context.Context) error {
  277. resp, err = rac.AuthClient.UserChangePassword(rctx, in, opts...)
  278. return err
  279. })
  280. return resp, err
  281. }
  282. func (rac *retryAuthClient) UserGrantRole(ctx context.Context, in *pb.AuthUserGrantRoleRequest, opts ...grpc.CallOption) (resp *pb.AuthUserGrantRoleResponse, err error) {
  283. err = rac.writeRetry(ctx, func(rctx context.Context) error {
  284. resp, err = rac.AuthClient.UserGrantRole(rctx, in, opts...)
  285. return err
  286. })
  287. return resp, err
  288. }
  289. func (rac *retryAuthClient) UserRevokeRole(ctx context.Context, in *pb.AuthUserRevokeRoleRequest, opts ...grpc.CallOption) (resp *pb.AuthUserRevokeRoleResponse, err error) {
  290. err = rac.writeRetry(ctx, func(rctx context.Context) error {
  291. resp, err = rac.AuthClient.UserRevokeRole(rctx, in, opts...)
  292. return err
  293. })
  294. return resp, err
  295. }
  296. func (rac *retryAuthClient) RoleAdd(ctx context.Context, in *pb.AuthRoleAddRequest, opts ...grpc.CallOption) (resp *pb.AuthRoleAddResponse, err error) {
  297. err = rac.writeRetry(ctx, func(rctx context.Context) error {
  298. resp, err = rac.AuthClient.RoleAdd(rctx, in, opts...)
  299. return err
  300. })
  301. return resp, err
  302. }
  303. func (rac *retryAuthClient) RoleDelete(ctx context.Context, in *pb.AuthRoleDeleteRequest, opts ...grpc.CallOption) (resp *pb.AuthRoleDeleteResponse, err error) {
  304. err = rac.writeRetry(ctx, func(rctx context.Context) error {
  305. resp, err = rac.AuthClient.RoleDelete(rctx, in, opts...)
  306. return err
  307. })
  308. return resp, err
  309. }
  310. func (rac *retryAuthClient) RoleGrantPermission(ctx context.Context, in *pb.AuthRoleGrantPermissionRequest, opts ...grpc.CallOption) (resp *pb.AuthRoleGrantPermissionResponse, err error) {
  311. err = rac.writeRetry(ctx, func(rctx context.Context) error {
  312. resp, err = rac.AuthClient.RoleGrantPermission(rctx, in, opts...)
  313. return err
  314. })
  315. return resp, err
  316. }
  317. func (rac *retryAuthClient) RoleRevokePermission(ctx context.Context, in *pb.AuthRoleRevokePermissionRequest, opts ...grpc.CallOption) (resp *pb.AuthRoleRevokePermissionResponse, err error) {
  318. err = rac.writeRetry(ctx, func(rctx context.Context) error {
  319. resp, err = rac.AuthClient.RoleRevokePermission(rctx, in, opts...)
  320. return err
  321. })
  322. return resp, err
  323. }