mirror of
https://github.com/VictoriaMetrics/VictoriaMetrics.git
synced 2025-01-20 23:39:48 +01:00
54410bf51b
- Document the bugfix at docs/CHANGELOG.md - Wait until all the worker goroutines are done in consulWatcher.mustStop() - Do not log `context canceled` errors when discovering consul serviceNames - Removed explicit handling of gzipped responses at lib/promscrape/discoveryutils.Client, since this handling is automatically performed by net/http.Transport. See DisableCompression option at https://pkg.go.dev/net/http#Transport . - Remove explicit handling of the proxyURL, since it is automatically handled by net/http.Transport. See Proxy option at https://pkg.go.dev/net/http#Transport . - Expliticly set MaxIdleConnsPerHost, since its default value equals to 2. Such a small value may result in excess tcp connection churn when more than 2 concurrent requests are processed by lib/promscrape/discoveryutils.Client. - Do not set explicitly the `Host` request header, since it is automatically set by net/http.Client. - Backport the bugfix to the recently added nomad_sd_configs - see https://github.com/VictoriaMetrics/VictoriaMetrics/issues/3367 Updates https://github.com/VictoriaMetrics/VictoriaMetrics/issues/3468
170 lines
4.9 KiB
Go
170 lines
4.9 KiB
Go
package nomad
|
|
|
|
import (
|
|
"flag"
|
|
"fmt"
|
|
"net/http"
|
|
"os"
|
|
"strconv"
|
|
"strings"
|
|
"time"
|
|
|
|
"github.com/VictoriaMetrics/VictoriaMetrics/lib/logger"
|
|
"github.com/VictoriaMetrics/VictoriaMetrics/lib/promauth"
|
|
"github.com/VictoriaMetrics/VictoriaMetrics/lib/promscrape/discoveryutils"
|
|
)
|
|
|
|
var waitTime = flag.Duration("promscrape.nomad.waitTime", 0, "Wait time used by Nomad service discovery. Default value is used if not set")
|
|
|
|
// apiConfig contains config for API server.
|
|
type apiConfig struct {
|
|
tagSeparator string
|
|
nomadWatcher *nomadWatcher
|
|
}
|
|
|
|
func (ac *apiConfig) mustStop() {
|
|
ac.nomadWatcher.mustStop()
|
|
}
|
|
|
|
var configMap = discoveryutils.NewConfigMap()
|
|
|
|
func getAPIConfig(sdc *SDConfig, baseDir string) (*apiConfig, error) {
|
|
v, err := configMap.Get(sdc, func() (interface{}, error) { return newAPIConfig(sdc, baseDir) })
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
return v.(*apiConfig), nil
|
|
}
|
|
|
|
func newAPIConfig(sdc *SDConfig, baseDir string) (*apiConfig, error) {
|
|
hcc := sdc.HTTPClientConfig
|
|
token := getToken(sdc.Token)
|
|
if token != "" {
|
|
if hcc.BearerToken != nil {
|
|
return nil, fmt.Errorf("cannot set both token and bearer_token configs")
|
|
}
|
|
hcc.BearerToken = promauth.NewSecret(token)
|
|
}
|
|
ac, err := hcc.NewConfig(baseDir)
|
|
if err != nil {
|
|
return nil, fmt.Errorf("cannot parse auth config: %w", err)
|
|
}
|
|
apiServer := sdc.Server
|
|
if apiServer == "" {
|
|
apiServer = "localhost:4646"
|
|
}
|
|
if !strings.Contains(apiServer, "://") {
|
|
scheme := sdc.Scheme
|
|
if scheme == "" {
|
|
scheme = "http"
|
|
}
|
|
apiServer = scheme + "://" + apiServer
|
|
}
|
|
proxyAC, err := sdc.ProxyClientConfig.NewConfig(baseDir)
|
|
if err != nil {
|
|
return nil, fmt.Errorf("cannot parse proxy auth config: %w", err)
|
|
}
|
|
client, err := discoveryutils.NewClient(apiServer, ac, sdc.ProxyURL, proxyAC)
|
|
if err != nil {
|
|
return nil, fmt.Errorf("cannot create HTTP client for %q: %w", apiServer, err)
|
|
}
|
|
tagSeparator := ","
|
|
if sdc.TagSeparator != nil {
|
|
tagSeparator = *sdc.TagSeparator
|
|
}
|
|
dc, err := getDatacenter(client, sdc.Datacenter)
|
|
if err != nil {
|
|
return nil, fmt.Errorf("cannot obtain Nomad datacenter: %w", err)
|
|
}
|
|
|
|
namespace := sdc.Namespace
|
|
// default namespace can be detected from env var.
|
|
if namespace == "" {
|
|
namespace = os.Getenv("NOMAD_NAMESPACE")
|
|
}
|
|
|
|
nw := newNomadWatcher(client, sdc, dc, namespace)
|
|
cfg := &apiConfig{
|
|
tagSeparator: tagSeparator,
|
|
nomadWatcher: nw,
|
|
}
|
|
return cfg, nil
|
|
}
|
|
|
|
func getToken(token *promauth.Secret) string {
|
|
if token != nil {
|
|
return token.String()
|
|
}
|
|
t := os.Getenv("NOMAD_TOKEN")
|
|
// Allow empty token - it should work if ACL is disabled in Nomad.
|
|
return t
|
|
}
|
|
|
|
func getDatacenter(client *discoveryutils.Client, dc string) (string, error) {
|
|
if dc != "" {
|
|
return dc, nil
|
|
}
|
|
// See https://developer.hashicorp.com/nomad/api-docs/agent#query-self
|
|
data, err := client.GetAPIResponse("/v1/agent/self")
|
|
if err != nil {
|
|
return "", fmt.Errorf("cannot query nomad agent info: %w", err)
|
|
}
|
|
a, err := parseAgent(data)
|
|
if err != nil {
|
|
return "", err
|
|
}
|
|
return a.Config.Datacenter, nil
|
|
}
|
|
|
|
// maxWaitTime is duration for Nomad blocking request.
|
|
func maxWaitTime() time.Duration {
|
|
d := discoveryutils.BlockingClientReadTimeout
|
|
// Nomad adds random delay up to wait/16, so reduce the timeout in order to keep it below BlockingClientReadTimeout.
|
|
// See https://developer.hashicorp.com/nomad/api-docs#blocking-queries
|
|
d -= d / 16
|
|
// The timeout cannot exceed 10 minuntes. See https://developer.hashicorp.com/nomad/api-docs#blocking-queries
|
|
|
|
if d > 10*time.Minute {
|
|
d = 10 * time.Minute
|
|
}
|
|
if *waitTime > time.Second && *waitTime < d {
|
|
d = *waitTime
|
|
}
|
|
return d
|
|
}
|
|
|
|
// getBlockingAPIResponse perfoms blocking request to Nomad via client and returns response.
|
|
// See https://developer.hashicorp.com/nomad/api-docs#blocking-queries .
|
|
func getBlockingAPIResponse(client *discoveryutils.Client, path string, index int64) ([]byte, int64, error) {
|
|
path += "&index=" + strconv.FormatInt(index, 10)
|
|
path += "&wait=" + fmt.Sprintf("%ds", int(maxWaitTime().Seconds()))
|
|
getMeta := func(resp *http.Response) {
|
|
ind := resp.Header.Get("X-Nomad-Index")
|
|
if len(ind) == 0 {
|
|
logger.Errorf("cannot find X-Nomad-Index header in response from %q", path)
|
|
return
|
|
}
|
|
newIndex, err := strconv.ParseInt(ind, 10, 64)
|
|
if err != nil {
|
|
logger.Errorf("cannot parse X-Nomad-Index header value in response from %q: %s", path, err)
|
|
return
|
|
}
|
|
// Properly handle the returned newIndex according to https://developer.hashicorp.com/nomad/api-docs#blocking-queries.
|
|
// Index implementation details are the same for Consul and Nomad: https://developer.hashicorp.com/consul/api-docs/features/blocking#implementation-details
|
|
if newIndex < 1 {
|
|
index = 1
|
|
return
|
|
}
|
|
if index > newIndex {
|
|
index = 0
|
|
return
|
|
}
|
|
index = newIndex
|
|
}
|
|
data, err := client.GetBlockingAPIResponse(path, getMeta)
|
|
if err != nil {
|
|
return nil, index, fmt.Errorf("cannot perform blocking Nomad API request at %q: %w", path, err)
|
|
}
|
|
return data, index, nil
|
|
}
|