maintenance.go 4.8 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195
  1. // Copyright 2016 CoreOS, Inc.
  2. //
  3. // Licensed under the Apache License, Version 2.0 (the "License");
  4. // you may not use this file except in compliance with the License.
  5. // You may obtain a copy of the License at
  6. //
  7. // http://www.apache.org/licenses/LICENSE-2.0
  8. //
  9. // Unless required by applicable law or agreed to in writing, software
  10. // distributed under the License is distributed on an "AS IS" BASIS,
  11. // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  12. // See the License for the specific language governing permissions and
  13. // limitations under the License.
  14. package clientv3
  15. import (
  16. "io"
  17. "sync"
  18. pb "github.com/coreos/etcd/etcdserver/etcdserverpb"
  19. "golang.org/x/net/context"
  20. "google.golang.org/grpc"
  21. )
  22. type (
  23. DefragmentResponse pb.DefragmentResponse
  24. AlarmResponse pb.AlarmResponse
  25. AlarmMember pb.AlarmMember
  26. StatusResponse pb.StatusResponse
  27. )
  28. type Maintenance interface {
  29. // AlarmList gets all active alarms.
  30. AlarmList(ctx context.Context) (*AlarmResponse, error)
  31. // AlarmDisarm disarms a given alarm.
  32. AlarmDisarm(ctx context.Context, m *AlarmMember) (*AlarmResponse, error)
  33. // Defragment defragments storage backend of the etcd member with given endpoint.
  34. // Defragment is only needed when deleting a large number of keys and want to reclaim
  35. // the resources.
  36. // Defragment is an expensive operation. User should avoid defragmenting multiple members
  37. // at the same time.
  38. // To defragment multiple members in the cluster, user need to call defragment multiple
  39. // times with different endpoints.
  40. Defragment(ctx context.Context, endpoint string) (*DefragmentResponse, error)
  41. // Status gets the status of the member.
  42. Status(ctx context.Context, endpoint string) (*StatusResponse, error)
  43. // Snapshot provides a reader for a snapshot of a backend.
  44. Snapshot(ctx context.Context) (io.ReadCloser, error)
  45. }
  46. type maintenance struct {
  47. c *Client
  48. mu sync.Mutex
  49. conn *grpc.ClientConn // conn in-use
  50. remote pb.MaintenanceClient
  51. }
  52. func NewMaintenance(c *Client) Maintenance {
  53. conn := c.ActiveConnection()
  54. return &maintenance{
  55. c: c,
  56. conn: conn,
  57. remote: pb.NewMaintenanceClient(conn),
  58. }
  59. }
  60. func (m *maintenance) AlarmList(ctx context.Context) (*AlarmResponse, error) {
  61. req := &pb.AlarmRequest{
  62. Action: pb.AlarmRequest_GET,
  63. MemberID: 0, // all
  64. Alarm: pb.AlarmType_NONE, // all
  65. }
  66. for {
  67. resp, err := m.getRemote().Alarm(ctx, req)
  68. if err == nil {
  69. return (*AlarmResponse)(resp), nil
  70. }
  71. if isHalted(ctx, err) {
  72. return nil, err
  73. }
  74. if err = m.switchRemote(err); err != nil {
  75. return nil, err
  76. }
  77. }
  78. }
  79. func (m *maintenance) AlarmDisarm(ctx context.Context, am *AlarmMember) (*AlarmResponse, error) {
  80. req := &pb.AlarmRequest{
  81. Action: pb.AlarmRequest_DEACTIVATE,
  82. MemberID: am.MemberID,
  83. Alarm: am.Alarm,
  84. }
  85. if req.MemberID == 0 && req.Alarm == pb.AlarmType_NONE {
  86. ar, err := m.AlarmList(ctx)
  87. if err != nil {
  88. return nil, err
  89. }
  90. ret := AlarmResponse{}
  91. for _, am := range ar.Alarms {
  92. dresp, derr := m.AlarmDisarm(ctx, (*AlarmMember)(am))
  93. if derr != nil {
  94. return nil, derr
  95. }
  96. ret.Alarms = append(ret.Alarms, dresp.Alarms...)
  97. }
  98. return &ret, nil
  99. }
  100. resp, err := m.getRemote().Alarm(ctx, req)
  101. if err == nil {
  102. return (*AlarmResponse)(resp), nil
  103. }
  104. if !isHalted(ctx, err) {
  105. go m.switchRemote(err)
  106. }
  107. return nil, err
  108. }
  109. func (m *maintenance) Defragment(ctx context.Context, endpoint string) (*DefragmentResponse, error) {
  110. conn, err := m.c.Dial(endpoint)
  111. if err != nil {
  112. return nil, err
  113. }
  114. remote := pb.NewMaintenanceClient(conn)
  115. resp, err := remote.Defragment(ctx, &pb.DefragmentRequest{})
  116. if err != nil {
  117. return nil, err
  118. }
  119. return (*DefragmentResponse)(resp), nil
  120. }
  121. func (m *maintenance) Status(ctx context.Context, endpoint string) (*StatusResponse, error) {
  122. conn, err := m.c.Dial(endpoint)
  123. if err != nil {
  124. return nil, err
  125. }
  126. remote := pb.NewMaintenanceClient(conn)
  127. resp, err := remote.Status(ctx, &pb.StatusRequest{})
  128. if err != nil {
  129. return nil, err
  130. }
  131. return (*StatusResponse)(resp), nil
  132. }
  133. func (m *maintenance) Snapshot(ctx context.Context) (io.ReadCloser, error) {
  134. ss, err := m.getRemote().Snapshot(ctx, &pb.SnapshotRequest{})
  135. if err != nil {
  136. return nil, err
  137. }
  138. pr, pw := io.Pipe()
  139. go func() {
  140. for {
  141. resp, err := ss.Recv()
  142. if err != nil {
  143. pw.CloseWithError(err)
  144. return
  145. }
  146. if resp == nil && err == nil {
  147. break
  148. }
  149. if _, werr := pw.Write(resp.Blob); werr != nil {
  150. pw.CloseWithError(werr)
  151. return
  152. }
  153. }
  154. pw.Close()
  155. }()
  156. return pr, nil
  157. }
  158. func (m *maintenance) getRemote() pb.MaintenanceClient {
  159. m.mu.Lock()
  160. defer m.mu.Unlock()
  161. return m.remote
  162. }
  163. func (m *maintenance) switchRemote(prevErr error) error {
  164. m.mu.Lock()
  165. defer m.mu.Unlock()
  166. newConn, err := m.c.retryConnection(m.conn, prevErr)
  167. if err != nil {
  168. return err
  169. }
  170. m.conn = newConn
  171. m.remote = pb.NewMaintenanceClient(m.conn)
  172. return nil
  173. }