maintenance.go 4.2 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164
  1. // Copyright 2016 CoreOS, Inc.
  2. //
  3. // Licensed under the Apache License, Version 2.0 (the "License");
  4. // you may not use this file except in compliance with the License.
  5. // You may obtain a copy of the License at
  6. //
  7. // http://www.apache.org/licenses/LICENSE-2.0
  8. //
  9. // Unless required by applicable law or agreed to in writing, software
  10. // distributed under the License is distributed on an "AS IS" BASIS,
  11. // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  12. // See the License for the specific language governing permissions and
  13. // limitations under the License.
  14. package clientv3
  15. import (
  16. "sync"
  17. pb "github.com/coreos/etcd/etcdserver/etcdserverpb"
  18. "golang.org/x/net/context"
  19. "google.golang.org/grpc"
  20. )
  21. type (
  22. DefragmentResponse pb.DefragmentResponse
  23. AlarmResponse pb.AlarmResponse
  24. AlarmMember pb.AlarmMember
  25. StatusResponse pb.StatusResponse
  26. )
  27. type Maintenance interface {
  28. // AlarmList gets all active alarms.
  29. AlarmList(ctx context.Context) (*AlarmResponse, error)
  30. // AlarmDisarm disarms a given alarm.
  31. AlarmDisarm(ctx context.Context, m *AlarmMember) (*AlarmResponse, error)
  32. // Defragment defragments storage backend of the etcd member with given endpoint.
  33. // Defragment is only needed when deleting a large number of keys and want to reclaim
  34. // the resources.
  35. // Defragment is an expensive operation. User should avoid defragmenting multiple members
  36. // at the same time.
  37. // To defragment multiple members in the cluster, user need to call defragment multiple
  38. // times with different endpoints.
  39. Defragment(ctx context.Context, endpoint string) (*DefragmentResponse, error)
  40. // Status gets the status of the member.
  41. Status(ctx context.Context, endpoint string) (*StatusResponse, error)
  42. }
  43. type maintenance struct {
  44. c *Client
  45. mu sync.Mutex
  46. conn *grpc.ClientConn // conn in-use
  47. remote pb.MaintenanceClient
  48. }
  49. func NewMaintenance(c *Client) Maintenance {
  50. conn := c.ActiveConnection()
  51. return &maintenance{
  52. c: c,
  53. conn: conn,
  54. remote: pb.NewMaintenanceClient(conn),
  55. }
  56. }
  57. func (m *maintenance) AlarmList(ctx context.Context) (*AlarmResponse, error) {
  58. req := &pb.AlarmRequest{
  59. Action: pb.AlarmRequest_GET,
  60. MemberID: 0, // all
  61. Alarm: pb.AlarmType_NONE, // all
  62. }
  63. for {
  64. resp, err := m.getRemote().Alarm(ctx, req)
  65. if err == nil {
  66. return (*AlarmResponse)(resp), nil
  67. }
  68. if isHalted(ctx, err) {
  69. return nil, err
  70. }
  71. if err = m.switchRemote(err); err != nil {
  72. return nil, err
  73. }
  74. }
  75. }
  76. func (m *maintenance) AlarmDisarm(ctx context.Context, am *AlarmMember) (*AlarmResponse, error) {
  77. req := &pb.AlarmRequest{
  78. Action: pb.AlarmRequest_DEACTIVATE,
  79. MemberID: am.MemberID,
  80. Alarm: am.Alarm,
  81. }
  82. if req.MemberID == 0 && req.Alarm == pb.AlarmType_NONE {
  83. ar, err := m.AlarmList(ctx)
  84. if err != nil {
  85. return nil, err
  86. }
  87. ret := AlarmResponse{}
  88. for _, am := range ar.Alarms {
  89. dresp, derr := m.AlarmDisarm(ctx, (*AlarmMember)(am))
  90. if derr != nil {
  91. return nil, derr
  92. }
  93. ret.Alarms = append(ret.Alarms, dresp.Alarms...)
  94. }
  95. return &ret, nil
  96. }
  97. resp, err := m.getRemote().Alarm(ctx, req)
  98. if err == nil {
  99. return (*AlarmResponse)(resp), nil
  100. }
  101. if !isHalted(ctx, err) {
  102. go m.switchRemote(err)
  103. }
  104. return nil, err
  105. }
  106. func (m *maintenance) Defragment(ctx context.Context, endpoint string) (*DefragmentResponse, error) {
  107. conn, err := m.c.Dial(endpoint)
  108. if err != nil {
  109. return nil, err
  110. }
  111. remote := pb.NewMaintenanceClient(conn)
  112. resp, err := remote.Defragment(ctx, &pb.DefragmentRequest{})
  113. if err != nil {
  114. return nil, err
  115. }
  116. return (*DefragmentResponse)(resp), nil
  117. }
  118. func (m *maintenance) Status(ctx context.Context, endpoint string) (*StatusResponse, error) {
  119. conn, err := m.c.Dial(endpoint)
  120. if err != nil {
  121. return nil, err
  122. }
  123. remote := pb.NewMaintenanceClient(conn)
  124. resp, err := remote.Status(ctx, &pb.StatusRequest{})
  125. if err != nil {
  126. return nil, err
  127. }
  128. return (*StatusResponse)(resp), nil
  129. }
  130. func (m *maintenance) getRemote() pb.MaintenanceClient {
  131. m.mu.Lock()
  132. defer m.mu.Unlock()
  133. return m.remote
  134. }
  135. func (m *maintenance) switchRemote(prevErr error) error {
  136. m.mu.Lock()
  137. defer m.mu.Unlock()
  138. newConn, err := m.c.retryConnection(m.conn, prevErr)
  139. if err != nil {
  140. return err
  141. }
  142. m.conn = newConn
  143. m.remote = pb.NewMaintenanceClient(m.conn)
  144. return nil
  145. }