maintenance.go 5.0 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196
  1. // Copyright 2016 CoreOS, Inc.
  2. //
  3. // Licensed under the Apache License, Version 2.0 (the "License");
  4. // you may not use this file except in compliance with the License.
  5. // You may obtain a copy of the License at
  6. //
  7. // http://www.apache.org/licenses/LICENSE-2.0
  8. //
  9. // Unless required by applicable law or agreed to in writing, software
  10. // distributed under the License is distributed on an "AS IS" BASIS,
  11. // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  12. // See the License for the specific language governing permissions and
  13. // limitations under the License.
  14. package clientv3
  15. import (
  16. "io"
  17. "sync"
  18. "github.com/coreos/etcd/etcdserver/api/v3rpc/rpctypes"
  19. pb "github.com/coreos/etcd/etcdserver/etcdserverpb"
  20. "golang.org/x/net/context"
  21. "google.golang.org/grpc"
  22. )
  23. type (
  24. DefragmentResponse pb.DefragmentResponse
  25. AlarmResponse pb.AlarmResponse
  26. AlarmMember pb.AlarmMember
  27. StatusResponse pb.StatusResponse
  28. )
  29. type Maintenance interface {
  30. // AlarmList gets all active alarms.
  31. AlarmList(ctx context.Context) (*AlarmResponse, error)
  32. // AlarmDisarm disarms a given alarm.
  33. AlarmDisarm(ctx context.Context, m *AlarmMember) (*AlarmResponse, error)
  34. // Defragment defragments storage backend of the etcd member with given endpoint.
  35. // Defragment is only needed when deleting a large number of keys and want to reclaim
  36. // the resources.
  37. // Defragment is an expensive operation. User should avoid defragmenting multiple members
  38. // at the same time.
  39. // To defragment multiple members in the cluster, user need to call defragment multiple
  40. // times with different endpoints.
  41. Defragment(ctx context.Context, endpoint string) (*DefragmentResponse, error)
  42. // Status gets the status of the endpoint.
  43. Status(ctx context.Context, endpoint string) (*StatusResponse, error)
  44. // Snapshot provides a reader for a snapshot of a backend.
  45. Snapshot(ctx context.Context) (io.ReadCloser, error)
  46. }
  47. type maintenance struct {
  48. c *Client
  49. mu sync.Mutex
  50. conn *grpc.ClientConn // conn in-use
  51. remote pb.MaintenanceClient
  52. }
  53. func NewMaintenance(c *Client) Maintenance {
  54. conn := c.ActiveConnection()
  55. return &maintenance{
  56. c: c,
  57. conn: conn,
  58. remote: pb.NewMaintenanceClient(conn),
  59. }
  60. }
  61. func (m *maintenance) AlarmList(ctx context.Context) (*AlarmResponse, error) {
  62. req := &pb.AlarmRequest{
  63. Action: pb.AlarmRequest_GET,
  64. MemberID: 0, // all
  65. Alarm: pb.AlarmType_NONE, // all
  66. }
  67. for {
  68. resp, err := m.getRemote().Alarm(ctx, req)
  69. if err == nil {
  70. return (*AlarmResponse)(resp), nil
  71. }
  72. if isHaltErr(ctx, err) {
  73. return nil, rpctypes.Error(err)
  74. }
  75. if err = m.switchRemote(err); err != nil {
  76. return nil, err
  77. }
  78. }
  79. }
  80. func (m *maintenance) AlarmDisarm(ctx context.Context, am *AlarmMember) (*AlarmResponse, error) {
  81. req := &pb.AlarmRequest{
  82. Action: pb.AlarmRequest_DEACTIVATE,
  83. MemberID: am.MemberID,
  84. Alarm: am.Alarm,
  85. }
  86. if req.MemberID == 0 && req.Alarm == pb.AlarmType_NONE {
  87. ar, err := m.AlarmList(ctx)
  88. if err != nil {
  89. return nil, rpctypes.Error(err)
  90. }
  91. ret := AlarmResponse{}
  92. for _, am := range ar.Alarms {
  93. dresp, derr := m.AlarmDisarm(ctx, (*AlarmMember)(am))
  94. if derr != nil {
  95. return nil, rpctypes.Error(derr)
  96. }
  97. ret.Alarms = append(ret.Alarms, dresp.Alarms...)
  98. }
  99. return &ret, nil
  100. }
  101. resp, err := m.getRemote().Alarm(ctx, req)
  102. if err == nil {
  103. return (*AlarmResponse)(resp), nil
  104. }
  105. if isHaltErr(ctx, err) {
  106. go m.switchRemote(err)
  107. }
  108. return nil, rpctypes.Error(err)
  109. }
  110. func (m *maintenance) Defragment(ctx context.Context, endpoint string) (*DefragmentResponse, error) {
  111. conn, err := m.c.Dial(endpoint)
  112. if err != nil {
  113. return nil, rpctypes.Error(err)
  114. }
  115. remote := pb.NewMaintenanceClient(conn)
  116. resp, err := remote.Defragment(ctx, &pb.DefragmentRequest{})
  117. if err != nil {
  118. return nil, rpctypes.Error(err)
  119. }
  120. return (*DefragmentResponse)(resp), nil
  121. }
  122. func (m *maintenance) Status(ctx context.Context, endpoint string) (*StatusResponse, error) {
  123. conn, err := m.c.Dial(endpoint)
  124. if err != nil {
  125. return nil, rpctypes.Error(err)
  126. }
  127. remote := pb.NewMaintenanceClient(conn)
  128. resp, err := remote.Status(ctx, &pb.StatusRequest{})
  129. if err != nil {
  130. return nil, rpctypes.Error(err)
  131. }
  132. return (*StatusResponse)(resp), nil
  133. }
  134. func (m *maintenance) Snapshot(ctx context.Context) (io.ReadCloser, error) {
  135. ss, err := m.getRemote().Snapshot(ctx, &pb.SnapshotRequest{})
  136. if err != nil {
  137. return nil, rpctypes.Error(err)
  138. }
  139. pr, pw := io.Pipe()
  140. go func() {
  141. for {
  142. resp, err := ss.Recv()
  143. if err != nil {
  144. pw.CloseWithError(err)
  145. return
  146. }
  147. if resp == nil && err == nil {
  148. break
  149. }
  150. if _, werr := pw.Write(resp.Blob); werr != nil {
  151. pw.CloseWithError(werr)
  152. return
  153. }
  154. }
  155. pw.Close()
  156. }()
  157. return pr, nil
  158. }
  159. func (m *maintenance) getRemote() pb.MaintenanceClient {
  160. m.mu.Lock()
  161. defer m.mu.Unlock()
  162. return m.remote
  163. }
  164. func (m *maintenance) switchRemote(prevErr error) error {
  165. m.mu.Lock()
  166. defer m.mu.Unlock()
  167. newConn, err := m.c.retryConnection(m.conn, prevErr)
  168. if err != nil {
  169. return rpctypes.Error(err)
  170. }
  171. m.conn = newConn
  172. m.remote = pb.NewMaintenanceClient(m.conn)
  173. return nil
  174. }