netdata/netdata

View on GitHub
src/go/collectors/go.d.plugin/modules/consul/collect_autopilot.go

Summary

Maintainability
A
0 mins
Test Coverage
// SPDX-License-Identifier: GPL-3.0-or-later

package consul

import (
    "net/http"
    "time"
)

const (
    // https://developer.hashicorp.com/consul/api-docs/operator/autopilot#read-health
    urlPathOperationAutopilotHealth = "/v1/operator/autopilot/health"
)

type autopilotHealth struct {
    Servers []struct {
        ID          string
        SerfStatus  string
        Leader      bool
        LastContact string
        Healthy     bool
        Voter       bool
        StableSince time.Time
    }
}

func (c *Consul) collectAutopilotHealth(mx map[string]int64) error {
    var health autopilotHealth

    // The HTTP status code will indicate the health of the cluster: 200 is healthy, 429 is unhealthy.
    // https://github.com/hashicorp/consul/blob/c7ef04c5979dbc311ff3c67b7bf3028a93e8b0f1/agent/operator_endpoint.go#L325
    if err := c.doOKDecode(urlPathOperationAutopilotHealth, &health, http.StatusTooManyRequests); err != nil {
        return err
    }

    for _, srv := range health.Servers {
        if srv.ID == c.cfg.Config.NodeID {
            // SerfStatus: alive, left, failed or none:
            // https://github.com/hashicorp/consul/blob/c7ef04c5979dbc311ff3c67b7bf3028a93e8b0f1/agent/consul/operator_autopilot_endpoint.go#L124-L133
            mx["autopilot_server_sefStatus_alive"] = boolToInt(srv.SerfStatus == "alive")
            mx["autopilot_server_sefStatus_left"] = boolToInt(srv.SerfStatus == "left")
            mx["autopilot_server_sefStatus_failed"] = boolToInt(srv.SerfStatus == "failed")
            mx["autopilot_server_sefStatus_none"] = boolToInt(srv.SerfStatus == "none")
            // https://github.com/hashicorp/raft-autopilot/blob/d936f51c374c3b7902d5e4fdafe9f7d8d199ea53/types.go#L110
            mx["autopilot_server_healthy_yes"] = boolToInt(srv.Healthy)
            mx["autopilot_server_healthy_no"] = boolToInt(!srv.Healthy)
            mx["autopilot_server_voter_yes"] = boolToInt(srv.Voter)
            mx["autopilot_server_voter_no"] = boolToInt(!srv.Voter)
            mx["autopilot_server_stable_time"] = int64(time.Since(srv.StableSince).Seconds())
            mx["autopilot_server_stable_time"] = int64(time.Since(srv.StableSince).Seconds())
            if !srv.Leader {
                if v, err := time.ParseDuration(srv.LastContact); err == nil {
                    mx["autopilot_server_lastContact_leader"] = v.Milliseconds()
                }
            }

            break
        }
    }

    return nil
}