123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541 |
- package origin
- import (
- "sync"
- "time"
- "github.com/cloudflare/cloudflared/h2mux"
- "github.com/prometheus/client_golang/prometheus"
- )
- const (
- metricsNamespace = "cloudflared"
- tunnelSubsystem = "tunnel"
- muxerSubsystem = "muxer"
- )
- type muxerMetrics struct {
- rtt *prometheus.GaugeVec
- rttMin *prometheus.GaugeVec
- rttMax *prometheus.GaugeVec
- receiveWindowAve *prometheus.GaugeVec
- sendWindowAve *prometheus.GaugeVec
- receiveWindowMin *prometheus.GaugeVec
- receiveWindowMax *prometheus.GaugeVec
- sendWindowMin *prometheus.GaugeVec
- sendWindowMax *prometheus.GaugeVec
- inBoundRateCurr *prometheus.GaugeVec
- inBoundRateMin *prometheus.GaugeVec
- inBoundRateMax *prometheus.GaugeVec
- outBoundRateCurr *prometheus.GaugeVec
- outBoundRateMin *prometheus.GaugeVec
- outBoundRateMax *prometheus.GaugeVec
- compBytesBefore *prometheus.GaugeVec
- compBytesAfter *prometheus.GaugeVec
- compRateAve *prometheus.GaugeVec
- }
- type TunnelMetrics struct {
- haConnections prometheus.Gauge
- activeStreams prometheus.Gauge
- totalRequests prometheus.Counter
- requestsPerTunnel *prometheus.CounterVec
- // concurrentRequestsLock is a mutex for concurrentRequests and maxConcurrentRequests
- concurrentRequestsLock sync.Mutex
- concurrentRequestsPerTunnel *prometheus.GaugeVec
- // concurrentRequests records count of concurrent requests for each tunnel
- concurrentRequests map[string]uint64
- maxConcurrentRequestsPerTunnel *prometheus.GaugeVec
- // concurrentRequests records max count of concurrent requests for each tunnel
- maxConcurrentRequests map[string]uint64
- timerRetries prometheus.Gauge
- responseByCode *prometheus.CounterVec
- responseCodePerTunnel *prometheus.CounterVec
- serverLocations *prometheus.GaugeVec
- // locationLock is a mutex for oldServerLocations
- locationLock sync.Mutex
- // oldServerLocations stores the last server the tunnel was connected to
- oldServerLocations map[string]string
- regSuccess *prometheus.CounterVec
- regFail *prometheus.CounterVec
- rpcFail *prometheus.CounterVec
- muxerMetrics *muxerMetrics
- tunnelsHA tunnelsForHA
- userHostnamesCounts *prometheus.CounterVec
- }
- func newMuxerMetrics() *muxerMetrics {
- rtt := prometheus.NewGaugeVec(
- prometheus.GaugeOpts{
- Namespace: metricsNamespace,
- Subsystem: muxerSubsystem,
- Name: "rtt",
- Help: "Round-trip time in millisecond",
- },
- []string{"connection_id"},
- )
- prometheus.MustRegister(rtt)
- rttMin := prometheus.NewGaugeVec(
- prometheus.GaugeOpts{
- Namespace: metricsNamespace,
- Subsystem: muxerSubsystem,
- Name: "rtt_min",
- Help: "Shortest round-trip time in millisecond",
- },
- []string{"connection_id"},
- )
- prometheus.MustRegister(rttMin)
- rttMax := prometheus.NewGaugeVec(
- prometheus.GaugeOpts{
- Namespace: metricsNamespace,
- Subsystem: muxerSubsystem,
- Name: "rtt_max",
- Help: "Longest round-trip time in millisecond",
- },
- []string{"connection_id"},
- )
- prometheus.MustRegister(rttMax)
- receiveWindowAve := prometheus.NewGaugeVec(
- prometheus.GaugeOpts{
- Namespace: metricsNamespace,
- Subsystem: muxerSubsystem,
- Name: "receive_window_ave",
- Help: "Average receive window size in bytes",
- },
- []string{"connection_id"},
- )
- prometheus.MustRegister(receiveWindowAve)
- sendWindowAve := prometheus.NewGaugeVec(
- prometheus.GaugeOpts{
- Namespace: metricsNamespace,
- Subsystem: muxerSubsystem,
- Name: "send_window_ave",
- Help: "Average send window size in bytes",
- },
- []string{"connection_id"},
- )
- prometheus.MustRegister(sendWindowAve)
- receiveWindowMin := prometheus.NewGaugeVec(
- prometheus.GaugeOpts{
- Namespace: metricsNamespace,
- Subsystem: muxerSubsystem,
- Name: "receive_window_min",
- Help: "Smallest receive window size in bytes",
- },
- []string{"connection_id"},
- )
- prometheus.MustRegister(receiveWindowMin)
- receiveWindowMax := prometheus.NewGaugeVec(
- prometheus.GaugeOpts{
- Namespace: metricsNamespace,
- Subsystem: muxerSubsystem,
- Name: "receive_window_max",
- Help: "Largest receive window size in bytes",
- },
- []string{"connection_id"},
- )
- prometheus.MustRegister(receiveWindowMax)
- sendWindowMin := prometheus.NewGaugeVec(
- prometheus.GaugeOpts{
- Namespace: metricsNamespace,
- Subsystem: muxerSubsystem,
- Name: "send_window_min",
- Help: "Smallest send window size in bytes",
- },
- []string{"connection_id"},
- )
- prometheus.MustRegister(sendWindowMin)
- sendWindowMax := prometheus.NewGaugeVec(
- prometheus.GaugeOpts{
- Namespace: metricsNamespace,
- Subsystem: muxerSubsystem,
- Name: "send_window_max",
- Help: "Largest send window size in bytes",
- },
- []string{"connection_id"},
- )
- prometheus.MustRegister(sendWindowMax)
- inBoundRateCurr := prometheus.NewGaugeVec(
- prometheus.GaugeOpts{
- Namespace: metricsNamespace,
- Subsystem: muxerSubsystem,
- Name: "inbound_bytes_per_sec_curr",
- Help: "Current inbounding bytes per second, 0 if there is no incoming connection",
- },
- []string{"connection_id"},
- )
- prometheus.MustRegister(inBoundRateCurr)
- inBoundRateMin := prometheus.NewGaugeVec(
- prometheus.GaugeOpts{
- Namespace: metricsNamespace,
- Subsystem: muxerSubsystem,
- Name: "inbound_bytes_per_sec_min",
- Help: "Minimum non-zero inbounding bytes per second",
- },
- []string{"connection_id"},
- )
- prometheus.MustRegister(inBoundRateMin)
- inBoundRateMax := prometheus.NewGaugeVec(
- prometheus.GaugeOpts{
- Namespace: metricsNamespace,
- Subsystem: muxerSubsystem,
- Name: "inbound_bytes_per_sec_max",
- Help: "Maximum inbounding bytes per second",
- },
- []string{"connection_id"},
- )
- prometheus.MustRegister(inBoundRateMax)
- outBoundRateCurr := prometheus.NewGaugeVec(
- prometheus.GaugeOpts{
- Namespace: metricsNamespace,
- Subsystem: muxerSubsystem,
- Name: "outbound_bytes_per_sec_curr",
- Help: "Current outbounding bytes per second, 0 if there is no outgoing traffic",
- },
- []string{"connection_id"},
- )
- prometheus.MustRegister(outBoundRateCurr)
- outBoundRateMin := prometheus.NewGaugeVec(
- prometheus.GaugeOpts{
- Namespace: metricsNamespace,
- Subsystem: muxerSubsystem,
- Name: "outbound_bytes_per_sec_min",
- Help: "Minimum non-zero outbounding bytes per second",
- },
- []string{"connection_id"},
- )
- prometheus.MustRegister(outBoundRateMin)
- outBoundRateMax := prometheus.NewGaugeVec(
- prometheus.GaugeOpts{
- Namespace: metricsNamespace,
- Subsystem: muxerSubsystem,
- Name: "outbound_bytes_per_sec_max",
- Help: "Maximum outbounding bytes per second",
- },
- []string{"connection_id"},
- )
- prometheus.MustRegister(outBoundRateMax)
- compBytesBefore := prometheus.NewGaugeVec(
- prometheus.GaugeOpts{
- Namespace: metricsNamespace,
- Subsystem: muxerSubsystem,
- Name: "comp_bytes_before",
- Help: "Bytes sent via cross-stream compression, pre compression",
- },
- []string{"connection_id"},
- )
- prometheus.MustRegister(compBytesBefore)
- compBytesAfter := prometheus.NewGaugeVec(
- prometheus.GaugeOpts{
- Namespace: metricsNamespace,
- Subsystem: muxerSubsystem,
- Name: "comp_bytes_after",
- Help: "Bytes sent via cross-stream compression, post compression",
- },
- []string{"connection_id"},
- )
- prometheus.MustRegister(compBytesAfter)
- compRateAve := prometheus.NewGaugeVec(
- prometheus.GaugeOpts{
- Namespace: metricsNamespace,
- Subsystem: muxerSubsystem,
- Name: "comp_rate_ave",
- Help: "Average outbound cross-stream compression ratio",
- },
- []string{"connection_id"},
- )
- prometheus.MustRegister(compRateAve)
- return &muxerMetrics{
- rtt: rtt,
- rttMin: rttMin,
- rttMax: rttMax,
- receiveWindowAve: receiveWindowAve,
- sendWindowAve: sendWindowAve,
- receiveWindowMin: receiveWindowMin,
- receiveWindowMax: receiveWindowMax,
- sendWindowMin: sendWindowMin,
- sendWindowMax: sendWindowMax,
- inBoundRateCurr: inBoundRateCurr,
- inBoundRateMin: inBoundRateMin,
- inBoundRateMax: inBoundRateMax,
- outBoundRateCurr: outBoundRateCurr,
- outBoundRateMin: outBoundRateMin,
- outBoundRateMax: outBoundRateMax,
- compBytesBefore: compBytesBefore,
- compBytesAfter: compBytesAfter,
- compRateAve: compRateAve,
- }
- }
- func (m *muxerMetrics) update(connectionID string, metrics *h2mux.MuxerMetrics) {
- m.rtt.WithLabelValues(connectionID).Set(convertRTTMilliSec(metrics.RTT))
- m.rttMin.WithLabelValues(connectionID).Set(convertRTTMilliSec(metrics.RTTMin))
- m.rttMax.WithLabelValues(connectionID).Set(convertRTTMilliSec(metrics.RTTMax))
- m.receiveWindowAve.WithLabelValues(connectionID).Set(metrics.ReceiveWindowAve)
- m.sendWindowAve.WithLabelValues(connectionID).Set(metrics.SendWindowAve)
- m.receiveWindowMin.WithLabelValues(connectionID).Set(float64(metrics.ReceiveWindowMin))
- m.receiveWindowMax.WithLabelValues(connectionID).Set(float64(metrics.ReceiveWindowMax))
- m.sendWindowMin.WithLabelValues(connectionID).Set(float64(metrics.SendWindowMin))
- m.sendWindowMax.WithLabelValues(connectionID).Set(float64(metrics.SendWindowMax))
- m.inBoundRateCurr.WithLabelValues(connectionID).Set(float64(metrics.InBoundRateCurr))
- m.inBoundRateMin.WithLabelValues(connectionID).Set(float64(metrics.InBoundRateMin))
- m.inBoundRateMax.WithLabelValues(connectionID).Set(float64(metrics.InBoundRateMax))
- m.outBoundRateCurr.WithLabelValues(connectionID).Set(float64(metrics.OutBoundRateCurr))
- m.outBoundRateMin.WithLabelValues(connectionID).Set(float64(metrics.OutBoundRateMin))
- m.outBoundRateMax.WithLabelValues(connectionID).Set(float64(metrics.OutBoundRateMax))
- m.compBytesBefore.WithLabelValues(connectionID).Set(float64(metrics.CompBytesBefore.Value()))
- m.compBytesAfter.WithLabelValues(connectionID).Set(float64(metrics.CompBytesAfter.Value()))
- m.compRateAve.WithLabelValues(connectionID).Set(float64(metrics.CompRateAve()))
- }
- func convertRTTMilliSec(t time.Duration) float64 {
- return float64(t / time.Millisecond)
- }
- // Metrics that can be collected without asking the edge
- func NewTunnelMetrics() *TunnelMetrics {
- haConnections := prometheus.NewGauge(
- prometheus.GaugeOpts{
- Namespace: metricsNamespace,
- Subsystem: tunnelSubsystem,
- Name: "ha_connections",
- Help: "Number of active ha connections",
- })
- prometheus.MustRegister(haConnections)
- activeStreams := h2mux.NewActiveStreamsMetrics(metricsNamespace, tunnelSubsystem)
- totalRequests := prometheus.NewCounter(
- prometheus.CounterOpts{
- Namespace: metricsNamespace,
- Subsystem: tunnelSubsystem,
- Name: "total_requests",
- Help: "Amount of requests proxied through all the tunnels",
- })
- prometheus.MustRegister(totalRequests)
- requestsPerTunnel := prometheus.NewCounterVec(
- prometheus.CounterOpts{
- Namespace: metricsNamespace,
- Subsystem: tunnelSubsystem,
- Name: "requests_per_tunnel",
- Help: "Amount of requests proxied through each tunnel",
- },
- []string{"connection_id"},
- )
- prometheus.MustRegister(requestsPerTunnel)
- concurrentRequestsPerTunnel := prometheus.NewGaugeVec(
- prometheus.GaugeOpts{
- Namespace: metricsNamespace,
- Subsystem: tunnelSubsystem,
- Name: "concurrent_requests_per_tunnel",
- Help: "Concurrent requests proxied through each tunnel",
- },
- []string{"connection_id"},
- )
- prometheus.MustRegister(concurrentRequestsPerTunnel)
- maxConcurrentRequestsPerTunnel := prometheus.NewGaugeVec(
- prometheus.GaugeOpts{
- Namespace: metricsNamespace,
- Subsystem: tunnelSubsystem,
- Name: "max_concurrent_requests_per_tunnel",
- Help: "Largest number of concurrent requests proxied through each tunnel so far",
- },
- []string{"connection_id"},
- )
- prometheus.MustRegister(maxConcurrentRequestsPerTunnel)
- timerRetries := prometheus.NewGauge(
- prometheus.GaugeOpts{
- Namespace: metricsNamespace,
- Subsystem: tunnelSubsystem,
- Name: "timer_retries",
- Help: "Unacknowledged heart beats count",
- })
- prometheus.MustRegister(timerRetries)
- responseByCode := prometheus.NewCounterVec(
- prometheus.CounterOpts{
- Namespace: metricsNamespace,
- Subsystem: tunnelSubsystem,
- Name: "response_by_code",
- Help: "Count of responses by HTTP status code",
- },
- []string{"status_code"},
- )
- prometheus.MustRegister(responseByCode)
- responseCodePerTunnel := prometheus.NewCounterVec(
- prometheus.CounterOpts{
- Namespace: metricsNamespace,
- Subsystem: tunnelSubsystem,
- Name: "response_code_per_tunnel",
- Help: "Count of responses by HTTP status code fore each tunnel",
- },
- []string{"connection_id", "status_code"},
- )
- prometheus.MustRegister(responseCodePerTunnel)
- serverLocations := prometheus.NewGaugeVec(
- prometheus.GaugeOpts{
- Namespace: metricsNamespace,
- Subsystem: tunnelSubsystem,
- Name: "server_locations",
- Help: "Where each tunnel is connected to. 1 means current location, 0 means previous locations.",
- },
- []string{"connection_id", "location"},
- )
- prometheus.MustRegister(serverLocations)
- rpcFail := prometheus.NewCounterVec(
- prometheus.CounterOpts{
- Namespace: metricsNamespace,
- Subsystem: tunnelSubsystem,
- Name: "tunnel_rpc_fail",
- Help: "Count of RPC connection errors by type",
- },
- []string{"error", "rpcName"},
- )
- prometheus.MustRegister(rpcFail)
- registerFail := prometheus.NewCounterVec(
- prometheus.CounterOpts{
- Namespace: metricsNamespace,
- Subsystem: tunnelSubsystem,
- Name: "tunnel_register_fail",
- Help: "Count of tunnel registration errors by type",
- },
- []string{"error", "rpcName"},
- )
- prometheus.MustRegister(registerFail)
- userHostnamesCounts := prometheus.NewCounterVec(
- prometheus.CounterOpts{
- Namespace: metricsNamespace,
- Subsystem: tunnelSubsystem,
- Name: "user_hostnames_counts",
- Help: "Which user hostnames cloudflared is serving",
- },
- []string{"userHostname"},
- )
- prometheus.MustRegister(userHostnamesCounts)
- registerSuccess := prometheus.NewCounterVec(
- prometheus.CounterOpts{
- Namespace: metricsNamespace,
- Subsystem: tunnelSubsystem,
- Name: "tunnel_register_success",
- Help: "Count of successful tunnel registrations",
- },
- []string{"rpcName"},
- )
- prometheus.MustRegister(registerSuccess)
- return &TunnelMetrics{
- haConnections: haConnections,
- activeStreams: activeStreams,
- totalRequests: totalRequests,
- requestsPerTunnel: requestsPerTunnel,
- concurrentRequestsPerTunnel: concurrentRequestsPerTunnel,
- concurrentRequests: make(map[string]uint64),
- maxConcurrentRequestsPerTunnel: maxConcurrentRequestsPerTunnel,
- maxConcurrentRequests: make(map[string]uint64),
- timerRetries: timerRetries,
- responseByCode: responseByCode,
- responseCodePerTunnel: responseCodePerTunnel,
- serverLocations: serverLocations,
- oldServerLocations: make(map[string]string),
- muxerMetrics: newMuxerMetrics(),
- tunnelsHA: NewTunnelsForHA(),
- regSuccess: registerSuccess,
- regFail: registerFail,
- rpcFail: rpcFail,
- userHostnamesCounts: userHostnamesCounts,
- }
- }
- func (t *TunnelMetrics) incrementHaConnections() {
- t.haConnections.Inc()
- }
- func (t *TunnelMetrics) decrementHaConnections() {
- t.haConnections.Dec()
- }
- func (t *TunnelMetrics) updateMuxerMetrics(connectionID string, metrics *h2mux.MuxerMetrics) {
- t.muxerMetrics.update(connectionID, metrics)
- }
- func (t *TunnelMetrics) incrementRequests(connectionID string) {
- t.concurrentRequestsLock.Lock()
- var concurrentRequests uint64
- var ok bool
- if concurrentRequests, ok = t.concurrentRequests[connectionID]; ok {
- t.concurrentRequests[connectionID]++
- concurrentRequests++
- } else {
- t.concurrentRequests[connectionID] = 1
- concurrentRequests = 1
- }
- if maxConcurrentRequests, ok := t.maxConcurrentRequests[connectionID]; (ok && maxConcurrentRequests < concurrentRequests) || !ok {
- t.maxConcurrentRequests[connectionID] = concurrentRequests
- t.maxConcurrentRequestsPerTunnel.WithLabelValues(connectionID).Set(float64(concurrentRequests))
- }
- t.concurrentRequestsLock.Unlock()
- t.totalRequests.Inc()
- t.requestsPerTunnel.WithLabelValues(connectionID).Inc()
- t.concurrentRequestsPerTunnel.WithLabelValues(connectionID).Inc()
- }
- func (t *TunnelMetrics) decrementConcurrentRequests(connectionID string) {
- t.concurrentRequestsLock.Lock()
- if _, ok := t.concurrentRequests[connectionID]; ok {
- t.concurrentRequests[connectionID]--
- }
- t.concurrentRequestsLock.Unlock()
- t.concurrentRequestsPerTunnel.WithLabelValues(connectionID).Dec()
- }
- func (t *TunnelMetrics) incrementResponses(connectionID, code string) {
- t.responseByCode.WithLabelValues(code).Inc()
- t.responseCodePerTunnel.WithLabelValues(connectionID, code).Inc()
- }
- func (t *TunnelMetrics) registerServerLocation(connectionID, loc string) {
- t.locationLock.Lock()
- defer t.locationLock.Unlock()
- if oldLoc, ok := t.oldServerLocations[connectionID]; ok && oldLoc == loc {
- return
- } else if ok {
- t.serverLocations.WithLabelValues(connectionID, oldLoc).Dec()
- }
- t.serverLocations.WithLabelValues(connectionID, loc).Inc()
- t.oldServerLocations[connectionID] = loc
- }
|