mirror of
https://github.com/prometheus/prometheus.git
synced 2025-10-24 14:01:02 +02:00
SD Managers take over responsibility for SD metrics registration --------- Signed-off-by: Paulin Todev <paulin.todev@gmail.com> Signed-off-by: Björn Rabenstein <github@rabenste.in> Co-authored-by: Björn Rabenstein <github@rabenste.in>
292 lines
9.7 KiB
Go
292 lines
9.7 KiB
Go
// Copyright 2018 The Prometheus Authors
|
|
// Licensed under the Apache License, Version 2.0 (the "License");
|
|
// you may not use this file except in compliance with the License.
|
|
// You may obtain a copy of the License at
|
|
//
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
//
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
// See the License for the specific language governing permissions and
|
|
// limitations under the License.
|
|
|
|
package main
|
|
|
|
import (
|
|
"context"
|
|
"encoding/json"
|
|
"fmt"
|
|
"io"
|
|
"net"
|
|
"net/http"
|
|
"os"
|
|
"strconv"
|
|
"strings"
|
|
"time"
|
|
|
|
"github.com/alecthomas/kingpin/v2"
|
|
"github.com/go-kit/log"
|
|
"github.com/go-kit/log/level"
|
|
"github.com/prometheus/client_golang/prometheus"
|
|
"github.com/prometheus/common/model"
|
|
|
|
prom_discovery "github.com/prometheus/prometheus/discovery"
|
|
"github.com/prometheus/prometheus/discovery/targetgroup"
|
|
"github.com/prometheus/prometheus/documentation/examples/custom-sd/adapter"
|
|
"github.com/prometheus/prometheus/util/strutil"
|
|
)
|
|
|
|
var (
|
|
a = kingpin.New("sd adapter usage", "Tool to generate file_sd target files for unimplemented SD mechanisms.")
|
|
outputFile = a.Flag("output.file", "Output file for file_sd compatible file.").Default("custom_sd.json").String()
|
|
listenAddress = a.Flag("listen.address", "The address the Consul HTTP API is listening on for requests.").Default("localhost:8500").String()
|
|
logger log.Logger
|
|
|
|
// addressLabel is the name for the label containing a target's address.
|
|
addressLabel = model.MetaLabelPrefix + "consul_address"
|
|
// nodeLabel is the name for the label containing a target's node name.
|
|
nodeLabel = model.MetaLabelPrefix + "consul_node"
|
|
// tagsLabel is the name of the label containing the tags assigned to the target.
|
|
tagsLabel = model.MetaLabelPrefix + "consul_tags"
|
|
// serviceAddressLabel is the name of the label containing the (optional) service address.
|
|
serviceAddressLabel = model.MetaLabelPrefix + "consul_service_address"
|
|
// servicePortLabel is the name of the label containing the service port.
|
|
servicePortLabel = model.MetaLabelPrefix + "consul_service_port"
|
|
// serviceIDLabel is the name of the label containing the service ID.
|
|
serviceIDLabel = model.MetaLabelPrefix + "consul_service_id"
|
|
)
|
|
|
|
// CatalogService is copied from https://github.com/hashicorp/consul/blob/master/api/catalog.go
|
|
// this struct represents the response from a /service/<service-name> request.
|
|
// Consul License: https://github.com/hashicorp/consul/blob/master/LICENSE
|
|
type CatalogService struct {
|
|
ID string
|
|
Node string
|
|
Address string
|
|
Datacenter string
|
|
TaggedAddresses map[string]string
|
|
NodeMeta map[string]string
|
|
ServiceID string
|
|
ServiceName string
|
|
ServiceAddress string
|
|
ServiceTags []string
|
|
ServicePort int
|
|
ServiceEnableTagOverride bool
|
|
CreateIndex uint64
|
|
ModifyIndex uint64
|
|
}
|
|
|
|
// Note: create a config struct for your custom SD type here.
|
|
type sdConfig struct {
|
|
Address string
|
|
TagSeparator string
|
|
RefreshInterval int
|
|
}
|
|
|
|
// Note: This is the struct with your implementation of the Discoverer interface (see Run function).
|
|
// Discovery retrieves target information from a Consul server and updates them via watches.
|
|
type discovery struct {
|
|
address string
|
|
refreshInterval int
|
|
tagSeparator string
|
|
logger log.Logger
|
|
oldSourceList map[string]bool
|
|
}
|
|
|
|
func (d *discovery) parseServiceNodes(resp *http.Response, name string) (*targetgroup.Group, error) {
|
|
var nodes []*CatalogService
|
|
tgroup := targetgroup.Group{
|
|
Source: name,
|
|
Labels: make(model.LabelSet),
|
|
}
|
|
|
|
defer func() {
|
|
io.Copy(io.Discard, resp.Body)
|
|
resp.Body.Close()
|
|
}()
|
|
|
|
b, err := io.ReadAll(resp.Body)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
err = json.Unmarshal(b, &nodes)
|
|
if err != nil {
|
|
return &tgroup, err
|
|
}
|
|
|
|
tgroup.Targets = make([]model.LabelSet, 0, len(nodes))
|
|
|
|
for _, node := range nodes {
|
|
// We surround the separated list with the separator as well. This way regular expressions
|
|
// in relabeling rules don't have to consider tag positions.
|
|
tags := "," + strings.Join(node.ServiceTags, ",") + ","
|
|
|
|
// If the service address is not empty it should be used instead of the node address
|
|
// since the service may be registered remotely through a different node.
|
|
var addr string
|
|
if node.ServiceAddress != "" {
|
|
addr = net.JoinHostPort(node.ServiceAddress, fmt.Sprintf("%d", node.ServicePort))
|
|
} else {
|
|
addr = net.JoinHostPort(node.Address, fmt.Sprintf("%d", node.ServicePort))
|
|
}
|
|
|
|
target := model.LabelSet{model.AddressLabel: model.LabelValue(addr)}
|
|
labels := model.LabelSet{
|
|
model.AddressLabel: model.LabelValue(addr),
|
|
model.LabelName(addressLabel): model.LabelValue(node.Address),
|
|
model.LabelName(nodeLabel): model.LabelValue(node.Node),
|
|
model.LabelName(tagsLabel): model.LabelValue(tags),
|
|
model.LabelName(serviceAddressLabel): model.LabelValue(node.ServiceAddress),
|
|
model.LabelName(servicePortLabel): model.LabelValue(strconv.Itoa(node.ServicePort)),
|
|
model.LabelName(serviceIDLabel): model.LabelValue(node.ServiceID),
|
|
}
|
|
tgroup.Labels = labels
|
|
|
|
// Add all key/value pairs from the node's metadata as their own labels.
|
|
for k, v := range node.NodeMeta {
|
|
name := strutil.SanitizeLabelName(k)
|
|
tgroup.Labels[model.LabelName(model.MetaLabelPrefix+name)] = model.LabelValue(v)
|
|
}
|
|
|
|
tgroup.Targets = append(tgroup.Targets, target)
|
|
}
|
|
return &tgroup, nil
|
|
}
|
|
|
|
// Note: you must implement this function for your discovery implementation as part of the
|
|
// Discoverer interface. Here you should query your SD for it's list of known targets, determine
|
|
// which of those targets you care about (for example, which of Consuls known services do you want
|
|
// to scrape for metrics), and then send those targets as a target.TargetGroup to the ch channel.
|
|
func (d *discovery) Run(ctx context.Context, ch chan<- []*targetgroup.Group) {
|
|
for c := time.Tick(time.Duration(d.refreshInterval) * time.Second); ; {
|
|
var srvs map[string][]string
|
|
resp, err := http.Get(fmt.Sprintf("http://%s/v1/catalog/services", d.address))
|
|
if err != nil {
|
|
level.Error(d.logger).Log("msg", "Error getting services list", "err", err)
|
|
time.Sleep(time.Duration(d.refreshInterval) * time.Second)
|
|
continue
|
|
}
|
|
|
|
b, err := io.ReadAll(resp.Body)
|
|
io.Copy(io.Discard, resp.Body)
|
|
resp.Body.Close()
|
|
if err != nil {
|
|
level.Error(d.logger).Log("msg", "Error reading services list", "err", err)
|
|
time.Sleep(time.Duration(d.refreshInterval) * time.Second)
|
|
continue
|
|
}
|
|
|
|
err = json.Unmarshal(b, &srvs)
|
|
resp.Body.Close()
|
|
if err != nil {
|
|
level.Error(d.logger).Log("msg", "Error parsing services list", "err", err)
|
|
time.Sleep(time.Duration(d.refreshInterval) * time.Second)
|
|
continue
|
|
}
|
|
|
|
var tgs []*targetgroup.Group
|
|
// Note that we treat errors when querying specific consul services as fatal for this
|
|
// iteration of the time.Tick loop. It's better to have some stale targets than an incomplete
|
|
// list of targets simply because there may have been a timeout. If the service is actually
|
|
// gone as far as consul is concerned, that will be picked up during the next iteration of
|
|
// the outer loop.
|
|
|
|
newSourceList := make(map[string]bool)
|
|
for name := range srvs {
|
|
if name == "consul" {
|
|
continue
|
|
}
|
|
resp, err := http.Get(fmt.Sprintf("http://%s/v1/catalog/service/%s", d.address, name))
|
|
if err != nil {
|
|
level.Error(d.logger).Log("msg", "Error getting services nodes", "service", name, "err", err)
|
|
break
|
|
}
|
|
|
|
tg, err := d.parseServiceNodes(resp, name)
|
|
if err != nil {
|
|
level.Error(d.logger).Log("msg", "Error parsing services nodes", "service", name, "err", err)
|
|
break
|
|
}
|
|
tgs = append(tgs, tg)
|
|
newSourceList[tg.Source] = true
|
|
}
|
|
// When targetGroup disappear, send an update with empty targetList.
|
|
for key := range d.oldSourceList {
|
|
if !newSourceList[key] {
|
|
tgs = append(tgs, &targetgroup.Group{
|
|
Source: key,
|
|
})
|
|
}
|
|
}
|
|
d.oldSourceList = newSourceList
|
|
if err == nil {
|
|
// We're returning all Consul services as a single targetgroup.
|
|
ch <- tgs
|
|
}
|
|
// Wait for ticker or exit when ctx is closed.
|
|
select {
|
|
case <-c:
|
|
continue
|
|
case <-ctx.Done():
|
|
return
|
|
}
|
|
}
|
|
}
|
|
|
|
func newDiscovery(conf sdConfig) (*discovery, error) {
|
|
cd := &discovery{
|
|
address: conf.Address,
|
|
refreshInterval: conf.RefreshInterval,
|
|
tagSeparator: conf.TagSeparator,
|
|
logger: logger,
|
|
oldSourceList: make(map[string]bool),
|
|
}
|
|
return cd, nil
|
|
}
|
|
|
|
func main() {
|
|
a.HelpFlag.Short('h')
|
|
|
|
_, err := a.Parse(os.Args[1:])
|
|
if err != nil {
|
|
fmt.Println("err: ", err)
|
|
return
|
|
}
|
|
logger = log.NewSyncLogger(log.NewLogfmtLogger(os.Stdout))
|
|
logger = log.With(logger, "ts", log.DefaultTimestampUTC, "caller", log.DefaultCaller)
|
|
|
|
ctx := context.Background()
|
|
|
|
// NOTE: create an instance of your new SD implementation here.
|
|
cfg := sdConfig{
|
|
TagSeparator: ",",
|
|
Address: *listenAddress,
|
|
RefreshInterval: 30,
|
|
}
|
|
|
|
disc, err := newDiscovery(cfg)
|
|
if err != nil {
|
|
fmt.Println("err: ", err)
|
|
}
|
|
|
|
if err != nil {
|
|
level.Error(logger).Log("msg", "failed to create discovery metrics", "err", err)
|
|
os.Exit(1)
|
|
}
|
|
|
|
reg := prometheus.NewRegistry()
|
|
refreshMetrics := prom_discovery.NewRefreshMetrics(reg)
|
|
metrics, err := prom_discovery.RegisterSDMetrics(reg, refreshMetrics)
|
|
if err != nil {
|
|
level.Error(logger).Log("msg", "failed to register service discovery metrics", "err", err)
|
|
os.Exit(1)
|
|
}
|
|
|
|
sdAdapter := adapter.NewAdapter(ctx, *outputFile, "exampleSD", disc, logger, metrics, reg)
|
|
sdAdapter.Run()
|
|
|
|
<-ctx.Done()
|
|
}
|