Prometheus Exporter - Direct Instrumentation vs. Custom Collector

I am currently writing a Prometheus exporter for a telemetry network application.

I have read the "Writing Exporters" documentation, and while I understand the use case for implementing a custom collector to avoid race conditions, I am not sure whether my use case is actually a fit for direct instrumentation.

Basically, the network metrics are streamed over gRPC by the network devices themselves, so my exporter simply receives them rather than having to scrape them.

I have used direct instrumentation with the following code:

  • I declare my metrics using the promauto package to keep the code compact:

package metrics

import (
    "github.com/lucabrasi83/prom-high-obs/proto/telemetry"

    "github.com/prometheus/client_golang/prometheus"
    "github.com/prometheus/client_golang/prometheus/promauto"
)

var (
    cpu5Sec = promauto.NewGaugeVec(
        prometheus.GaugeOpts{
            Name: "cisco_iosxe_iosd_cpu_busy_5_sec_percentage",
            Help: "The IOSd daemon CPU busy percentage over the last 5 seconds",
        },
        []string{"node"},
    )
)
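For reference, promauto registers these collectors with prometheus.DefaultRegisterer, so exposing them over HTTP is typically just a matter of serving the default promhttp handler somewhere in main. A minimal sketch, assuming a plain net/http server (the listen address is arbitrary):

package main

import (
    "log"
    "net/http"

    "github.com/prometheus/client_golang/prometheus/promhttp"
)

func main() {
    // promauto-created metrics such as cpu5Sec are already registered with the
    // default registry, so the stock handler picks them up automatically.
    http.Handle("/metrics", promhttp.Handler())
    log.Fatal(http.ListenAndServe(":2112", nil))
}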

Below is how I simply set the metric value from the decoded gRPC protocol buffer message:

cpu5Sec.WithLabelValues(msg.GetNodeIdStr()).Set(float64(val))

Finally, here is my main loop, which basically handles the telemetry gRPC streams for the metrics I am interested in:

for {
    req, err := stream.Recv()
    if err == io.EOF {
        return nil
    }
    if err != nil {
        logging.PeppaMonLog(
            "error",
            fmt.Sprintf("Error while reading client %v stream: %v", clientIPSocket, err))

        return err
    }

    data := req.GetData()

    msg := &telemetry.Telemetry{}

    err = proto.Unmarshal(data, msg)
    if err != nil {
        log.Fatalln(err)
    }

    if !logFlag {
        logging.PeppaMonLog(
            "info",
            fmt.Sprintf(
                "Telemetry Subscription Request Received - Client %v - Node %v - YANG Model Path %v",
                clientIPSocket, msg.GetNodeIdStr(), msg.GetEncodingPath(),
            ),
        )
    }
}
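For completeness, the gauge update shown earlier sits inside this loop right after proto.Unmarshal succeeds, guarded by the YANG encoding path of the message. A rough sketch, where cpuYANGEncodingPath and parseCPUBusyPercent are simplified placeholders for my actual constant and extraction code:

// Hypothetical placement inside the for loop, after a successful Unmarshal:
if msg.GetEncodingPath() == cpuYANGEncodingPath { // placeholder constant for the CPU YANG path
    val := parseCPUBusyPercent(msg) // placeholder helper returning the 5-second CPU value as float64
    cpu5Sec.WithLabelValues(msg.GetNodeIdStr()).Set(val)
}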


I use Grafana as the frontend and, so far, have not seen any particular discrepancy when correlating the metrics exposed by Prometheus with the metrics checked directly on the device.


So I would like to understand whether this follows Prometheus best practices, or whether I should still go down the custom collector route.



1 Answer


You are not following best practice, because you are using global metrics, which is exactly what the article you linked to warns against. With your current implementation, your dashboard will show some arbitrary, constant value for a device's CPU metric forever after the device disconnects (or, more precisely, until your exporter is restarted).

Instead, the RPC method should maintain a set of local metrics and remove them once the method returns. That way, a device's metrics disappear from the scrape output when the device disconnects.

Here is one way to do this. It uses a map holding the currently active metrics. Each map element is the set of metrics for one particular stream (which, as I understand it, corresponds to one device); once the stream ends, that entry is removed.

package main

import (
    "sync"

    "github.com/prometheus/client_golang/prometheus"
)

// Exporter is a prometheus.Collector implementation.
type Exporter struct {
    // We need some way to map gRPC streams to their metrics. Using the stream
    // itself as a map key is simple enough, but anything works as long as we
    // can remove metrics once the stream ends.
    sync.Mutex
    Metrics map[StreamServer]*DeviceMetrics
}

type DeviceMetrics struct {
    sync.Mutex

    CPU prometheus.Metric
}

// Globally defined descriptions are fine.
var cpu5SecDesc = prometheus.NewDesc(
    "cisco_iosxe_iosd_cpu_busy_5_sec_percentage",
    "The IOSd daemon CPU busy percentage over the last 5 seconds",
    []string{"node"},
    nil, // constant labels
)

// Collect implements prometheus.Collector.
func (e *Exporter) Collect(ch chan<- prometheus.Metric) {
    // Copy the current metrics so we don't hold the lock for long if ch's
    // consumer is slow.
    var metrics []prometheus.Metric

    e.Lock()
    for _, deviceMetrics := range e.Metrics {
        deviceMetrics.Lock()
        metrics = append(metrics,
            deviceMetrics.CPU,
        )
        deviceMetrics.Unlock()
    }
    e.Unlock()

    for _, m := range metrics {
        if m != nil {
            ch <- m
        }
    }
}

// Describe implements prometheus.Collector.
func (e *Exporter) Describe(ch chan<- *prometheus.Desc) {
    ch <- cpu5SecDesc
}

// Service is the gRPC service implementation.
type Service struct {
    exp *Exporter
}

func (s *Service) RPCMethod(stream StreamServer) (*Response, error) {
    deviceMetrics := new(DeviceMetrics)

    s.exp.Lock()
    s.exp.Metrics[stream] = deviceMetrics
    s.exp.Unlock()

    defer func() {
        // Stop emitting metrics for this stream.
        s.exp.Lock()
        delete(s.exp.Metrics, stream)
        s.exp.Unlock()
    }()

    for {
        req, err := stream.Recv()
        if err != nil {
            return nil, err // TODO: handle io.EOF and other errors separately
        }

        var msg *Telemetry = parseRequest(req) // Your existing code that unmarshals the nested message.

        var (
            metricField *prometheus.Metric
            metric      prometheus.Metric
        )

        switch msg.GetEncodingPath() {
        case CpuYANGEncodingPath:
            metricField = &deviceMetrics.CPU
            metric = prometheus.MustNewConstMetric(
                cpu5SecDesc,
                prometheus.GaugeValue,
                ParsePBMsgCpuBusyPercent(msg), // func(*Telemetry) float64
                msg.GetNodeIdStr(),            // value for the "node" label
            )
        default:
            continue
        }

        deviceMetrics.Lock()
        *metricField = metric
        deviceMetrics.Unlock()
    }
}
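One wiring detail the sketch above leaves out is initializing the Metrics map and registering the Exporter so its Collect method is actually scraped. A minimal sketch, assuming the same placeholder types and a dedicated (non-default) registry:

// Wiring sketch: share one Exporter between the gRPC service and the registry.
exp := &Exporter{Metrics: make(map[StreamServer]*DeviceMetrics)}

reg := prometheus.NewRegistry()
reg.MustRegister(exp)

// Expose the custom registry instead of the default one.
http.Handle("/metrics", promhttp.HandlerFor(reg, promhttp.HandlerOpts{}))

// The gRPC service updates the same Exporter instance from its stream handlers.
svc := &Service{exp: exp}
_ = svc // register svc with your gRPC server as usual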