|
|
@@ -14,57 +14,41 @@
|
|
|
|
|
|
package rafthttp
|
|
|
|
|
|
-import (
|
|
|
- "time"
|
|
|
-
|
|
|
- "github.com/coreos/etcd/pkg/types"
|
|
|
- "github.com/coreos/etcd/raft/raftpb"
|
|
|
- "github.com/prometheus/client_golang/prometheus"
|
|
|
-)
|
|
|
+import "github.com/prometheus/client_golang/prometheus"
|
|
|
|
|
|
+// TODO: record write and receive failures.
|
|
|
var (
|
|
|
- // TODO: create a separate histogram for recording
|
|
|
- // snapshot sending metric. snapshot can be large and
|
|
|
- // take a long time to send. So it needs a different
|
|
|
- // time range than other type of messages.
|
|
|
- msgSentDuration = prometheus.NewHistogramVec(
|
|
|
- prometheus.HistogramOpts{
|
|
|
- Namespace: "etcd_debugging",
|
|
|
- Subsystem: "rafthttp",
|
|
|
- Name: "message_sent_latency_seconds",
|
|
|
- Help: "message sent latency distributions.",
|
|
|
- Buckets: prometheus.ExponentialBuckets(0.0005, 2, 13),
|
|
|
- },
|
|
|
- []string{"sendingType", "remoteID", "msgType"},
|
|
|
+ sentBytes = prometheus.NewCounterVec(prometheus.CounterOpts{
|
|
|
+ Namespace: "etcd",
|
|
|
+ Subsystem: "network",
|
|
|
+ Name: "sent_bytes_total",
|
|
|
+ Help: "The total number of bytes sent.",
|
|
|
+ },
|
|
|
+ []string{"To"},
|
|
|
+ )
|
|
|
+
|
|
|
+ receivedBytes = prometheus.NewCounterVec(prometheus.CounterOpts{
|
|
|
+ Namespace: "etcd",
|
|
|
+ Subsystem: "network",
|
|
|
+ Name: "received_bytes_total",
|
|
|
+ Help: "The total number of bytes received.",
|
|
|
+ },
|
|
|
+ []string{"From"},
|
|
|
)
|
|
|
|
|
|
- msgSentFailed = prometheus.NewCounterVec(prometheus.CounterOpts{
|
|
|
- Namespace: "etcd_debugging",
|
|
|
- Subsystem: "rafthttp",
|
|
|
- Name: "message_sent_failed_total",
|
|
|
- Help: "The total number of failed messages sent.",
|
|
|
+ rtts = prometheus.NewHistogramVec(prometheus.HistogramOpts{
|
|
|
+ Namespace: "etcd",
|
|
|
+ Subsystem: "network",
|
|
|
+ Name: "round_trip_time_seconds",
|
|
|
+ Help: "Round-Trip-Time histogram between members.",
|
|
|
+ Buckets: prometheus.ExponentialBuckets(0.0001, 2, 14),
|
|
|
},
|
|
|
- []string{"sendingType", "remoteID", "msgType"},
|
|
|
+ []string{"To"},
|
|
|
)
|
|
|
)
|
|
|
|
|
|
func init() {
|
|
|
- prometheus.MustRegister(msgSentDuration)
|
|
|
- prometheus.MustRegister(msgSentFailed)
|
|
|
-}
|
|
|
-
|
|
|
-func reportSentDuration(sendingType string, m raftpb.Message, duration time.Duration) {
|
|
|
- typ := m.Type.String()
|
|
|
- if isLinkHeartbeatMessage(m) {
|
|
|
- typ = "MsgLinkHeartbeat"
|
|
|
- }
|
|
|
- msgSentDuration.WithLabelValues(sendingType, types.ID(m.To).String(), typ).Observe(float64(duration) / float64(time.Second))
|
|
|
-}
|
|
|
-
|
|
|
-func reportSentFailure(sendingType string, m raftpb.Message) {
|
|
|
- typ := m.Type.String()
|
|
|
- if isLinkHeartbeatMessage(m) {
|
|
|
- typ = "MsgLinkHeartbeat"
|
|
|
- }
|
|
|
- msgSentFailed.WithLabelValues(sendingType, types.ID(m.To).String(), typ).Inc()
|
|
|
+ prometheus.MustRegister(sentBytes)
|
|
|
+ prometheus.MustRegister(receivedBytes)
|
|
|
+ prometheus.MustRegister(rtts)
|
|
|
}
|