util.go 5.3 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172
  1. // Copyright 2015 The etcd Authors
  2. //
  3. // Licensed under the Apache License, Version 2.0 (the "License");
  4. // you may not use this file except in compliance with the License.
  5. // You may obtain a copy of the License at
  6. //
  7. // http://www.apache.org/licenses/LICENSE-2.0
  8. //
  9. // Unless required by applicable law or agreed to in writing, software
  10. // distributed under the License is distributed on an "AS IS" BASIS,
  11. // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  12. // See the License for the specific language governing permissions and
  13. // limitations under the License.
  14. package etcdserver
  15. import (
  16. "fmt"
  17. "reflect"
  18. "strings"
  19. "time"
  20. "github.com/golang/protobuf/proto"
  21. "go.etcd.io/etcd/etcdserver/api/membership"
  22. "go.etcd.io/etcd/etcdserver/api/rafthttp"
  23. pb "go.etcd.io/etcd/etcdserver/etcdserverpb"
  24. "go.etcd.io/etcd/pkg/traceutil"
  25. "go.etcd.io/etcd/pkg/types"
  26. "go.uber.org/zap"
  27. )
  28. // isConnectedToQuorumSince checks whether the local member is connected to the
  29. // quorum of the cluster since the given time.
  30. func isConnectedToQuorumSince(transport rafthttp.Transporter, since time.Time, self types.ID, members []*membership.Member) bool {
  31. return numConnectedSince(transport, since, self, members) >= (len(members)/2)+1
  32. }
  33. // isConnectedSince checks whether the local member is connected to the
  34. // remote member since the given time.
  35. func isConnectedSince(transport rafthttp.Transporter, since time.Time, remote types.ID) bool {
  36. t := transport.ActiveSince(remote)
  37. return !t.IsZero() && t.Before(since)
  38. }
  39. // isConnectedFullySince checks whether the local member is connected to all
  40. // members in the cluster since the given time.
  41. func isConnectedFullySince(transport rafthttp.Transporter, since time.Time, self types.ID, members []*membership.Member) bool {
  42. return numConnectedSince(transport, since, self, members) == len(members)
  43. }
  44. // numConnectedSince counts how many members are connected to the local member
  45. // since the given time.
  46. func numConnectedSince(transport rafthttp.Transporter, since time.Time, self types.ID, members []*membership.Member) int {
  47. connectedNum := 0
  48. for _, m := range members {
  49. if m.ID == self || isConnectedSince(transport, since, m.ID) {
  50. connectedNum++
  51. }
  52. }
  53. return connectedNum
  54. }
  55. // longestConnected chooses the member with longest active-since-time.
  56. // It returns false, if nothing is active.
  57. func longestConnected(tp rafthttp.Transporter, membs []types.ID) (types.ID, bool) {
  58. var longest types.ID
  59. var oldest time.Time
  60. for _, id := range membs {
  61. tm := tp.ActiveSince(id)
  62. if tm.IsZero() { // inactive
  63. continue
  64. }
  65. if oldest.IsZero() { // first longest candidate
  66. oldest = tm
  67. longest = id
  68. }
  69. if tm.Before(oldest) {
  70. oldest = tm
  71. longest = id
  72. }
  73. }
  74. if uint64(longest) == 0 {
  75. return longest, false
  76. }
  77. return longest, true
  78. }
  79. type notifier struct {
  80. c chan struct{}
  81. err error
  82. }
  83. func newNotifier() *notifier {
  84. return &notifier{
  85. c: make(chan struct{}),
  86. }
  87. }
  88. func (nc *notifier) notify(err error) {
  89. nc.err = err
  90. close(nc.c)
  91. }
  92. func warnOfExpensiveRequest(lg *zap.Logger, now time.Time, reqStringer fmt.Stringer, respMsg proto.Message, err error) {
  93. var resp string
  94. if !isNil(respMsg) {
  95. resp = fmt.Sprintf("size:%d", proto.Size(respMsg))
  96. }
  97. warnOfExpensiveGenericRequest(lg, nil, now, reqStringer, "", resp, err)
  98. }
  99. func warnOfExpensiveReadOnlyTxnRequest(lg *zap.Logger, now time.Time, r *pb.TxnRequest, txnResponse *pb.TxnResponse, err error) {
  100. reqStringer := pb.NewLoggableTxnRequest(r)
  101. var resp string
  102. if !isNil(txnResponse) {
  103. var resps []string
  104. for _, r := range txnResponse.Responses {
  105. switch op := r.Response.(type) {
  106. case *pb.ResponseOp_ResponseRange:
  107. resps = append(resps, fmt.Sprintf("range_response_count:%d", len(op.ResponseRange.Kvs)))
  108. default:
  109. // only range responses should be in a read only txn request
  110. }
  111. }
  112. resp = fmt.Sprintf("responses:<%s> size:%d", strings.Join(resps, " "), proto.Size(txnResponse))
  113. }
  114. warnOfExpensiveGenericRequest(lg, nil, now, reqStringer, "read-only range ", resp, err)
  115. }
  116. func warnOfExpensiveReadOnlyRangeRequest(lg *zap.Logger, trace *traceutil.Trace, now time.Time, reqStringer fmt.Stringer, rangeResponse *pb.RangeResponse, err error) {
  117. var resp string
  118. if !isNil(rangeResponse) {
  119. resp = fmt.Sprintf("range_response_count:%d size:%d", len(rangeResponse.Kvs), proto.Size(rangeResponse))
  120. }
  121. warnOfExpensiveGenericRequest(lg, trace, now, reqStringer, "read-only range ", resp, err)
  122. }
  123. func warnOfExpensiveGenericRequest(lg *zap.Logger, trace *traceutil.Trace, now time.Time, reqStringer fmt.Stringer, prefix string, resp string, err error) {
  124. d := time.Since(now)
  125. if d > warnApplyDuration {
  126. if lg != nil {
  127. lg.Warn(
  128. "apply request took too long",
  129. zap.Duration("took", d),
  130. zap.Duration("expected-duration", warnApplyDuration),
  131. zap.String("prefix", prefix),
  132. zap.String("request", reqStringer.String()),
  133. zap.String("response", resp),
  134. zap.Error(err),
  135. )
  136. } else {
  137. var result string
  138. if err != nil {
  139. result = fmt.Sprintf("error:%v", err)
  140. } else {
  141. result = resp
  142. }
  143. plog.Warningf("%srequest %q with result %q took too long (%v) to execute", prefix, reqStringer.String(), result, d)
  144. }
  145. if trace != nil {
  146. trace.Log(lg)
  147. }
  148. slowApplies.Inc()
  149. }
  150. }
  151. func isNil(msg proto.Message) bool {
  152. return msg == nil || reflect.ValueOf(msg).IsNil()
  153. }