2015-01-21 19:07:45 +00:00
|
|
|
// Copyright 2013 The Prometheus Authors
|
2013-08-09 17:32:55 +00:00
|
|
|
// Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
// you may not use this file except in compliance with the License.
|
|
|
|
// You may obtain a copy of the License at
|
|
|
|
//
|
|
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
//
|
|
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
|
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
// See the License for the specific language governing permissions and
|
|
|
|
// limitations under the License.
|
|
|
|
|
2016-03-01 11:37:22 +00:00
|
|
|
package notifier
|
2013-08-09 17:32:55 +00:00
|
|
|
|
|
|
|
import (
|
2019-04-18 08:50:37 +00:00
|
|
|
"bytes"
|
2017-10-25 04:21:42 +00:00
|
|
|
"context"
|
2015-12-10 15:31:50 +00:00
|
|
|
"encoding/json"
|
|
|
|
"fmt"
|
2022-04-27 09:24:36 +00:00
|
|
|
"io"
|
2013-08-09 17:32:55 +00:00
|
|
|
"net/http"
|
2015-12-10 15:31:50 +00:00
|
|
|
"net/http/httptest"
|
2017-04-25 05:42:33 +00:00
|
|
|
"net/url"
|
2022-07-01 12:23:23 +00:00
|
|
|
"strconv"
|
2013-08-09 17:32:55 +00:00
|
|
|
"testing"
|
|
|
|
"time"
|
|
|
|
|
2020-07-01 07:51:32 +00:00
|
|
|
"github.com/prometheus/alertmanager/api/v2/models"
|
2018-01-11 15:10:25 +00:00
|
|
|
config_util "github.com/prometheus/common/config"
|
2015-08-20 15:18:46 +00:00
|
|
|
"github.com/prometheus/common/model"
|
2020-10-29 09:43:23 +00:00
|
|
|
"github.com/stretchr/testify/require"
|
2020-07-30 07:45:42 +00:00
|
|
|
"go.uber.org/atomic"
|
2022-08-31 13:50:38 +00:00
|
|
|
"gopkg.in/yaml.v2"
|
2019-09-02 14:05:02 +00:00
|
|
|
|
2016-08-09 08:08:15 +00:00
|
|
|
"github.com/prometheus/prometheus/config"
|
Refactor SD configuration to remove `config` dependency (#3629)
* refactor: move targetGroup struct and CheckOverflow() to their own package
* refactor: move auth and security related structs to a utility package, fix import error in utility package
* refactor: Azure SD, remove SD struct from config
* refactor: DNS SD, remove SD struct from config into dns package
* refactor: ec2 SD, move SD struct from config into the ec2 package
* refactor: file SD, move SD struct from config to file discovery package
* refactor: gce, move SD struct from config to gce discovery package
* refactor: move HTTPClientConfig and URL into util/config, fix import error in httputil
* refactor: consul, move SD struct from config into consul discovery package
* refactor: marathon, move SD struct from config into marathon discovery package
* refactor: triton, move SD struct from config to triton discovery package, fix test
* refactor: zookeeper, move SD structs from config to zookeeper discovery package
* refactor: openstack, remove SD struct from config, move into openstack discovery package
* refactor: kubernetes, move SD struct from config into kubernetes discovery package
* refactor: notifier, use targetgroup package instead of config
* refactor: tests for file, marathon, triton SD - use targetgroup package instead of config.TargetGroup
* refactor: retrieval, use targetgroup package instead of config.TargetGroup
* refactor: storage, use config util package
* refactor: discovery manager, use targetgroup package instead of config.TargetGroup
* refactor: use HTTPClient and TLS config from configUtil instead of config
* refactor: tests, use targetgroup package instead of config.TargetGroup
* refactor: fix tagetgroup.Group pointers that were removed by mistake
* refactor: openstack, kubernetes: drop prefixes
* refactor: remove import aliases forced due to vscode bug
* refactor: move main SD struct out of config into discovery/config
* refactor: rename configUtil to config_util
* refactor: rename yamlUtil to yaml_config
* refactor: kubernetes, remove prefixes
* refactor: move the TargetGroup package to discovery/
* refactor: fix order of imports
2017-12-29 20:01:34 +00:00
|
|
|
"github.com/prometheus/prometheus/discovery/targetgroup"
|
2021-11-08 14:23:17 +00:00
|
|
|
"github.com/prometheus/prometheus/model/labels"
|
|
|
|
"github.com/prometheus/prometheus/model/relabel"
|
2013-08-09 17:32:55 +00:00
|
|
|
)
|
|
|
|
|
2016-11-23 16:03:22 +00:00
|
|
|
func TestPostPath(t *testing.T) {
|
2021-10-22 08:06:44 +00:00
|
|
|
cases := []struct {
|
2016-02-04 10:56:14 +00:00
|
|
|
in, out string
|
|
|
|
}{
|
|
|
|
{
|
2016-11-23 16:03:22 +00:00
|
|
|
in: "",
|
|
|
|
out: "/api/v1/alerts",
|
2016-02-04 10:56:14 +00:00
|
|
|
},
|
|
|
|
{
|
2016-11-23 16:03:22 +00:00
|
|
|
in: "/",
|
|
|
|
out: "/api/v1/alerts",
|
2016-02-04 10:56:14 +00:00
|
|
|
},
|
|
|
|
{
|
2016-11-23 16:03:22 +00:00
|
|
|
in: "/prefix",
|
|
|
|
out: "/prefix/api/v1/alerts",
|
2016-02-04 10:56:14 +00:00
|
|
|
},
|
|
|
|
{
|
2016-11-23 16:03:22 +00:00
|
|
|
in: "/prefix//",
|
|
|
|
out: "/prefix/api/v1/alerts",
|
2016-02-04 10:56:14 +00:00
|
|
|
},
|
|
|
|
{
|
2016-11-23 16:03:22 +00:00
|
|
|
in: "prefix//",
|
|
|
|
out: "/prefix/api/v1/alerts",
|
2016-02-04 10:56:14 +00:00
|
|
|
},
|
|
|
|
}
|
|
|
|
for _, c := range cases {
|
2020-10-29 09:43:23 +00:00
|
|
|
require.Equal(t, c.out, postPath(c.in, config.AlertmanagerAPIVersionV1))
|
2016-02-04 10:56:14 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2015-12-10 15:31:50 +00:00
|
|
|
func TestHandlerNextBatch(t *testing.T) {
|
2018-01-30 17:45:37 +00:00
|
|
|
h := NewManager(&Options{}, nil)
|
2015-12-10 15:31:50 +00:00
|
|
|
|
|
|
|
for i := range make([]struct{}, 2*maxBatchSize+1) {
|
2016-12-29 15:53:11 +00:00
|
|
|
h.queue = append(h.queue, &Alert{
|
|
|
|
Labels: labels.FromStrings("alertname", fmt.Sprintf("%d", i)),
|
2015-12-10 15:31:50 +00:00
|
|
|
})
|
|
|
|
}
|
|
|
|
|
2016-12-29 15:53:11 +00:00
|
|
|
expected := append([]*Alert{}, h.queue...)
|
2015-12-10 15:31:50 +00:00
|
|
|
|
2020-10-29 09:43:23 +00:00
|
|
|
require.NoError(t, alertsEqual(expected[0:maxBatchSize], h.nextBatch()))
|
|
|
|
require.NoError(t, alertsEqual(expected[maxBatchSize:2*maxBatchSize], h.nextBatch()))
|
|
|
|
require.NoError(t, alertsEqual(expected[2*maxBatchSize:], h.nextBatch()))
|
2023-12-07 11:35:01 +00:00
|
|
|
require.Empty(t, h.queue, "Expected queue to be empty but got %d alerts", len(h.queue))
|
2013-08-09 17:32:55 +00:00
|
|
|
}
|
|
|
|
|
2019-09-02 14:05:02 +00:00
|
|
|
func alertsEqual(a, b []*Alert) error {
|
2015-12-10 15:31:50 +00:00
|
|
|
if len(a) != len(b) {
|
2022-06-16 08:38:27 +00:00
|
|
|
return fmt.Errorf("length mismatch: %v != %v", a, b)
|
2015-12-10 15:31:50 +00:00
|
|
|
}
|
|
|
|
for i, alert := range a {
|
2016-12-29 15:53:11 +00:00
|
|
|
if !labels.Equal(alert.Labels, b[i].Labels) {
|
2022-06-16 08:38:27 +00:00
|
|
|
return fmt.Errorf("label mismatch at index %d: %s != %s", i, alert.Labels, b[i].Labels)
|
2015-12-10 15:31:50 +00:00
|
|
|
}
|
|
|
|
}
|
2019-09-02 14:05:02 +00:00
|
|
|
return nil
|
2013-08-09 17:32:55 +00:00
|
|
|
}
|
|
|
|
|
2016-06-02 12:25:19 +00:00
|
|
|
func TestHandlerSendAll(t *testing.T) {
|
2015-12-10 15:31:50 +00:00
|
|
|
var (
|
2019-09-02 14:05:02 +00:00
|
|
|
errc = make(chan error, 1)
|
|
|
|
expected = make([]*Alert, 0, maxBatchSize)
|
2020-07-30 07:45:42 +00:00
|
|
|
status1, status2 atomic.Int32
|
2015-12-10 15:31:50 +00:00
|
|
|
)
|
2020-07-30 07:45:42 +00:00
|
|
|
status1.Store(int32(http.StatusOK))
|
|
|
|
status2.Store(int32(http.StatusOK))
|
2013-08-09 17:32:55 +00:00
|
|
|
|
2020-07-30 07:45:42 +00:00
|
|
|
newHTTPServer := func(u, p string, status *atomic.Int32) *httptest.Server {
|
2019-09-02 14:05:02 +00:00
|
|
|
return httptest.NewServer(http.HandlerFunc(func(w http.ResponseWriter, r *http.Request) {
|
|
|
|
var err error
|
|
|
|
defer func() {
|
|
|
|
if err == nil {
|
|
|
|
return
|
|
|
|
}
|
|
|
|
select {
|
|
|
|
case errc <- err:
|
|
|
|
default:
|
|
|
|
}
|
|
|
|
}()
|
|
|
|
user, pass, _ := r.BasicAuth()
|
|
|
|
if user != u || pass != p {
|
2022-06-16 08:38:27 +00:00
|
|
|
err = fmt.Errorf("unexpected user/password: %s/%s != %s/%s", user, pass, u, p)
|
2019-09-02 14:05:02 +00:00
|
|
|
w.WriteHeader(http.StatusInternalServerError)
|
|
|
|
return
|
|
|
|
}
|
2021-07-02 08:38:14 +00:00
|
|
|
|
2022-04-27 09:24:36 +00:00
|
|
|
b, err := io.ReadAll(r.Body)
|
2021-07-02 08:38:14 +00:00
|
|
|
if err != nil {
|
2022-06-16 08:38:27 +00:00
|
|
|
err = fmt.Errorf("error reading body: %w", err)
|
2021-07-02 08:38:14 +00:00
|
|
|
w.WriteHeader(http.StatusInternalServerError)
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
2019-09-02 14:05:02 +00:00
|
|
|
var alerts []*Alert
|
2021-07-02 08:38:14 +00:00
|
|
|
err = json.Unmarshal(b, &alerts)
|
2019-09-02 14:05:02 +00:00
|
|
|
if err == nil {
|
|
|
|
err = alertsEqual(expected, alerts)
|
|
|
|
}
|
2020-07-30 07:45:42 +00:00
|
|
|
w.WriteHeader(int(status.Load()))
|
2019-09-02 14:05:02 +00:00
|
|
|
}))
|
2016-06-02 12:25:19 +00:00
|
|
|
}
|
2019-09-02 14:05:02 +00:00
|
|
|
server1 := newHTTPServer("prometheus", "testing_password", &status1)
|
|
|
|
server2 := newHTTPServer("", "", &status2)
|
2016-06-02 12:25:19 +00:00
|
|
|
defer server1.Close()
|
|
|
|
defer server2.Close()
|
2015-12-10 15:31:50 +00:00
|
|
|
|
2018-01-30 17:45:37 +00:00
|
|
|
h := NewManager(&Options{}, nil)
|
2017-12-12 13:40:00 +00:00
|
|
|
|
2019-09-02 14:05:02 +00:00
|
|
|
authClient, _ := config_util.NewClientFromConfig(
|
|
|
|
config_util.HTTPClientConfig{
|
|
|
|
BasicAuth: &config_util.BasicAuth{
|
|
|
|
Username: "prometheus",
|
|
|
|
Password: "testing_password",
|
|
|
|
},
|
2021-09-26 21:16:12 +00:00
|
|
|
}, "auth_alertmanager")
|
2017-12-30 17:47:18 +00:00
|
|
|
|
|
|
|
h.alertmanagers = make(map[string]*alertmanagerSet)
|
|
|
|
|
2019-04-18 12:17:03 +00:00
|
|
|
am1Cfg := config.DefaultAlertmanagerConfig
|
|
|
|
am1Cfg.Timeout = model.Duration(time.Second)
|
|
|
|
|
|
|
|
am2Cfg := config.DefaultAlertmanagerConfig
|
|
|
|
am2Cfg.Timeout = model.Duration(time.Second)
|
|
|
|
|
2017-12-30 17:47:18 +00:00
|
|
|
h.alertmanagers["1"] = &alertmanagerSet{
|
2016-11-23 16:03:22 +00:00
|
|
|
ams: []alertmanager{
|
2016-11-25 10:11:28 +00:00
|
|
|
alertmanagerMock{
|
|
|
|
urlf: func() string { return server1.URL },
|
|
|
|
},
|
2017-12-12 13:40:00 +00:00
|
|
|
},
|
2019-04-18 12:17:03 +00:00
|
|
|
cfg: &am1Cfg,
|
2017-12-12 13:40:00 +00:00
|
|
|
client: authClient,
|
2017-12-30 17:47:18 +00:00
|
|
|
}
|
2017-12-12 13:40:00 +00:00
|
|
|
|
2017-12-30 17:47:18 +00:00
|
|
|
h.alertmanagers["2"] = &alertmanagerSet{
|
2017-12-12 13:40:00 +00:00
|
|
|
ams: []alertmanager{
|
2016-11-25 10:11:28 +00:00
|
|
|
alertmanagerMock{
|
|
|
|
urlf: func() string { return server2.URL },
|
|
|
|
},
|
2016-11-23 16:03:22 +00:00
|
|
|
},
|
2019-04-18 12:17:03 +00:00
|
|
|
cfg: &am2Cfg,
|
2017-12-30 17:47:18 +00:00
|
|
|
}
|
2013-08-09 17:32:55 +00:00
|
|
|
|
2015-12-10 15:31:50 +00:00
|
|
|
for i := range make([]struct{}, maxBatchSize) {
|
2016-12-29 15:53:11 +00:00
|
|
|
h.queue = append(h.queue, &Alert{
|
|
|
|
Labels: labels.FromStrings("alertname", fmt.Sprintf("%d", i)),
|
2015-12-10 15:31:50 +00:00
|
|
|
})
|
2016-12-29 15:53:11 +00:00
|
|
|
expected = append(expected, &Alert{
|
|
|
|
Labels: labels.FromStrings("alertname", fmt.Sprintf("%d", i)),
|
2015-12-10 15:31:50 +00:00
|
|
|
})
|
|
|
|
}
|
|
|
|
|
2019-09-02 14:05:02 +00:00
|
|
|
checkNoErr := func() {
|
|
|
|
t.Helper()
|
|
|
|
select {
|
|
|
|
case err := <-errc:
|
2020-10-29 09:43:23 +00:00
|
|
|
require.NoError(t, err)
|
2019-09-02 14:05:02 +00:00
|
|
|
default:
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-10-29 09:43:23 +00:00
|
|
|
require.True(t, h.sendAll(h.queue...), "all sends failed unexpectedly")
|
2019-09-02 14:05:02 +00:00
|
|
|
checkNoErr()
|
2015-12-10 15:31:50 +00:00
|
|
|
|
2020-07-30 07:45:42 +00:00
|
|
|
status1.Store(int32(http.StatusNotFound))
|
2020-10-29 09:43:23 +00:00
|
|
|
require.True(t, h.sendAll(h.queue...), "all sends failed unexpectedly")
|
2019-09-02 14:05:02 +00:00
|
|
|
checkNoErr()
|
2013-08-09 17:32:55 +00:00
|
|
|
|
2020-07-30 07:45:42 +00:00
|
|
|
status2.Store(int32(http.StatusInternalServerError))
|
2020-10-29 09:43:23 +00:00
|
|
|
require.False(t, h.sendAll(h.queue...), "all sends succeeded unexpectedly")
|
2019-09-02 14:05:02 +00:00
|
|
|
checkNoErr()
|
2013-08-09 17:32:55 +00:00
|
|
|
}
|
|
|
|
|
2017-02-27 19:31:16 +00:00
|
|
|
func TestCustomDo(t *testing.T) {
|
|
|
|
const testURL = "http://testurl.com/"
|
|
|
|
const testBody = "testbody"
|
|
|
|
|
|
|
|
var received bool
|
2018-01-30 17:45:37 +00:00
|
|
|
h := NewManager(&Options{
|
2018-11-19 11:31:16 +00:00
|
|
|
Do: func(_ context.Context, client *http.Client, req *http.Request) (*http.Response, error) {
|
2017-02-27 19:31:16 +00:00
|
|
|
received = true
|
2022-04-27 09:24:36 +00:00
|
|
|
body, err := io.ReadAll(req.Body)
|
2018-03-29 15:07:26 +00:00
|
|
|
|
2020-10-29 09:43:23 +00:00
|
|
|
require.NoError(t, err)
|
2018-03-29 15:07:26 +00:00
|
|
|
|
2020-10-29 09:43:23 +00:00
|
|
|
require.Equal(t, testBody, string(body))
|
2018-03-29 15:07:26 +00:00
|
|
|
|
2020-10-29 09:43:23 +00:00
|
|
|
require.Equal(t, testURL, req.URL.String())
|
2018-03-29 15:07:26 +00:00
|
|
|
|
2017-02-27 19:31:16 +00:00
|
|
|
return &http.Response{
|
2022-04-27 09:24:36 +00:00
|
|
|
Body: io.NopCloser(bytes.NewBuffer(nil)),
|
2017-02-27 19:31:16 +00:00
|
|
|
}, nil
|
|
|
|
},
|
2017-08-11 18:45:52 +00:00
|
|
|
}, nil)
|
2017-02-27 19:31:16 +00:00
|
|
|
|
|
|
|
h.sendOne(context.Background(), nil, testURL, []byte(testBody))
|
|
|
|
|
2020-10-29 09:43:23 +00:00
|
|
|
require.True(t, received, "Expected to receive an alert, but didn't")
|
2017-02-27 19:31:16 +00:00
|
|
|
}
|
|
|
|
|
2016-09-27 12:34:56 +00:00
|
|
|
func TestExternalLabels(t *testing.T) {
|
2018-01-30 17:45:37 +00:00
|
|
|
h := NewManager(&Options{
|
2016-09-27 12:34:56 +00:00
|
|
|
QueueCapacity: 3 * maxBatchSize,
|
2022-03-09 22:21:29 +00:00
|
|
|
ExternalLabels: labels.FromStrings("a", "b"),
|
2018-12-18 11:26:36 +00:00
|
|
|
RelabelConfigs: []*relabel.Config{
|
2016-09-27 12:34:56 +00:00
|
|
|
{
|
|
|
|
SourceLabels: model.LabelNames{"alertname"},
|
|
|
|
TargetLabel: "a",
|
|
|
|
Action: "replace",
|
2018-12-18 11:26:36 +00:00
|
|
|
Regex: relabel.MustNewRegexp("externalrelabelthis"),
|
2016-09-27 12:34:56 +00:00
|
|
|
Replacement: "c",
|
|
|
|
},
|
|
|
|
},
|
2017-08-11 18:45:52 +00:00
|
|
|
}, nil)
|
2016-09-27 12:34:56 +00:00
|
|
|
|
|
|
|
// This alert should get the external label attached.
|
2016-12-29 15:53:11 +00:00
|
|
|
h.Send(&Alert{
|
|
|
|
Labels: labels.FromStrings("alertname", "test"),
|
2016-09-27 12:34:56 +00:00
|
|
|
})
|
|
|
|
|
|
|
|
// This alert should get the external label attached, but then set to "c"
|
|
|
|
// through relabelling.
|
2016-12-29 15:53:11 +00:00
|
|
|
h.Send(&Alert{
|
|
|
|
Labels: labels.FromStrings("alertname", "externalrelabelthis"),
|
2016-09-27 12:34:56 +00:00
|
|
|
})
|
|
|
|
|
2016-12-29 15:53:11 +00:00
|
|
|
expected := []*Alert{
|
|
|
|
{Labels: labels.FromStrings("alertname", "test", "a", "b")},
|
|
|
|
{Labels: labels.FromStrings("alertname", "externalrelabelthis", "a", "c")},
|
2016-09-27 12:34:56 +00:00
|
|
|
}
|
|
|
|
|
2020-10-29 09:43:23 +00:00
|
|
|
require.NoError(t, alertsEqual(expected, h.queue))
|
2016-09-27 12:34:56 +00:00
|
|
|
}
|
|
|
|
|
2016-08-09 08:08:15 +00:00
|
|
|
func TestHandlerRelabel(t *testing.T) {
|
2018-01-30 17:45:37 +00:00
|
|
|
h := NewManager(&Options{
|
2016-08-09 08:08:15 +00:00
|
|
|
QueueCapacity: 3 * maxBatchSize,
|
2018-12-18 11:26:36 +00:00
|
|
|
RelabelConfigs: []*relabel.Config{
|
2016-09-15 03:13:27 +00:00
|
|
|
{
|
2016-08-09 08:08:15 +00:00
|
|
|
SourceLabels: model.LabelNames{"alertname"},
|
|
|
|
Action: "drop",
|
2018-12-18 11:26:36 +00:00
|
|
|
Regex: relabel.MustNewRegexp("drop"),
|
2016-08-09 08:08:15 +00:00
|
|
|
},
|
2016-09-15 03:13:27 +00:00
|
|
|
{
|
2016-08-09 08:08:15 +00:00
|
|
|
SourceLabels: model.LabelNames{"alertname"},
|
|
|
|
TargetLabel: "alertname",
|
|
|
|
Action: "replace",
|
2018-12-18 11:26:36 +00:00
|
|
|
Regex: relabel.MustNewRegexp("rename"),
|
2016-08-09 08:08:15 +00:00
|
|
|
Replacement: "renamed",
|
|
|
|
},
|
|
|
|
},
|
2017-08-11 18:45:52 +00:00
|
|
|
}, nil)
|
2016-08-09 08:08:15 +00:00
|
|
|
|
|
|
|
// This alert should be dropped due to the configuration
|
2016-12-29 15:53:11 +00:00
|
|
|
h.Send(&Alert{
|
|
|
|
Labels: labels.FromStrings("alertname", "drop"),
|
2016-08-09 08:08:15 +00:00
|
|
|
})
|
|
|
|
|
|
|
|
// This alert should be replaced due to the configuration
|
2016-12-29 15:53:11 +00:00
|
|
|
h.Send(&Alert{
|
|
|
|
Labels: labels.FromStrings("alertname", "rename"),
|
2016-08-09 08:08:15 +00:00
|
|
|
})
|
|
|
|
|
2016-12-29 15:53:11 +00:00
|
|
|
expected := []*Alert{
|
|
|
|
{Labels: labels.FromStrings("alertname", "renamed")},
|
2016-08-09 08:08:15 +00:00
|
|
|
}
|
|
|
|
|
2020-10-29 09:43:23 +00:00
|
|
|
require.NoError(t, alertsEqual(expected, h.queue))
|
2016-08-09 08:08:15 +00:00
|
|
|
}
|
|
|
|
|
2020-01-02 14:54:09 +00:00
|
|
|
func TestHandlerQueuing(t *testing.T) {
|
2015-12-10 15:31:50 +00:00
|
|
|
var (
|
2019-09-02 14:05:02 +00:00
|
|
|
expectedc = make(chan []*Alert)
|
|
|
|
called = make(chan struct{})
|
|
|
|
done = make(chan struct{})
|
|
|
|
errc = make(chan error, 1)
|
2015-12-10 15:31:50 +00:00
|
|
|
)
|
|
|
|
|
|
|
|
server := httptest.NewServer(http.HandlerFunc(func(w http.ResponseWriter, r *http.Request) {
|
2019-09-02 14:05:02 +00:00
|
|
|
// Notify the test function that we have received something.
|
|
|
|
select {
|
|
|
|
case called <- struct{}{}:
|
|
|
|
case <-done:
|
|
|
|
return
|
|
|
|
}
|
2015-12-10 15:31:50 +00:00
|
|
|
|
2019-09-02 14:05:02 +00:00
|
|
|
// Wait for the test function to unblock us.
|
|
|
|
select {
|
|
|
|
case expected := <-expectedc:
|
|
|
|
var alerts []*Alert
|
2021-07-02 08:38:14 +00:00
|
|
|
|
2022-04-27 09:24:36 +00:00
|
|
|
b, err := io.ReadAll(r.Body)
|
2021-07-02 08:38:14 +00:00
|
|
|
if err != nil {
|
|
|
|
panic(err)
|
|
|
|
}
|
|
|
|
|
|
|
|
err = json.Unmarshal(b, &alerts)
|
2019-09-02 14:05:02 +00:00
|
|
|
if err == nil {
|
|
|
|
err = alertsEqual(expected, alerts)
|
|
|
|
}
|
|
|
|
select {
|
|
|
|
case errc <- err:
|
|
|
|
default:
|
|
|
|
}
|
|
|
|
case <-done:
|
|
|
|
}
|
2015-12-10 15:31:50 +00:00
|
|
|
}))
|
2019-09-02 14:05:02 +00:00
|
|
|
defer func() {
|
|
|
|
close(done)
|
|
|
|
server.Close()
|
|
|
|
}()
|
|
|
|
|
|
|
|
h := NewManager(
|
|
|
|
&Options{
|
|
|
|
QueueCapacity: 3 * maxBatchSize,
|
|
|
|
},
|
2017-08-11 18:45:52 +00:00
|
|
|
nil,
|
2017-04-28 15:12:38 +00:00
|
|
|
)
|
2017-12-30 17:47:18 +00:00
|
|
|
|
|
|
|
h.alertmanagers = make(map[string]*alertmanagerSet)
|
|
|
|
|
2019-04-18 12:17:03 +00:00
|
|
|
am1Cfg := config.DefaultAlertmanagerConfig
|
|
|
|
am1Cfg.Timeout = model.Duration(time.Second)
|
|
|
|
|
2017-12-30 17:47:18 +00:00
|
|
|
h.alertmanagers["1"] = &alertmanagerSet{
|
2016-11-23 16:03:22 +00:00
|
|
|
ams: []alertmanager{
|
2016-11-25 10:11:28 +00:00
|
|
|
alertmanagerMock{
|
|
|
|
urlf: func() string { return server.URL },
|
|
|
|
},
|
2016-11-23 16:03:22 +00:00
|
|
|
},
|
2019-04-18 12:17:03 +00:00
|
|
|
cfg: &am1Cfg,
|
2017-12-30 17:47:18 +00:00
|
|
|
}
|
2019-09-02 14:05:02 +00:00
|
|
|
go h.Run(nil)
|
|
|
|
defer h.Stop()
|
2015-12-10 15:31:50 +00:00
|
|
|
|
2016-12-29 15:53:11 +00:00
|
|
|
var alerts []*Alert
|
2015-12-10 15:31:50 +00:00
|
|
|
for i := range make([]struct{}, 20*maxBatchSize) {
|
2016-12-29 15:53:11 +00:00
|
|
|
alerts = append(alerts, &Alert{
|
|
|
|
Labels: labels.FromStrings("alertname", fmt.Sprintf("%d", i)),
|
2015-12-10 15:31:50 +00:00
|
|
|
})
|
|
|
|
}
|
|
|
|
|
2019-09-02 14:05:02 +00:00
|
|
|
assertAlerts := func(expected []*Alert) {
|
|
|
|
t.Helper()
|
|
|
|
for {
|
|
|
|
select {
|
|
|
|
case <-called:
|
|
|
|
expectedc <- expected
|
|
|
|
case err := <-errc:
|
2020-10-29 09:43:23 +00:00
|
|
|
require.NoError(t, err)
|
2019-09-02 14:05:02 +00:00
|
|
|
return
|
|
|
|
case <-time.After(5 * time.Second):
|
2021-09-13 19:19:20 +00:00
|
|
|
require.FailNow(t, "Alerts were not pushed.")
|
2019-09-02 14:05:02 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
2015-12-10 15:31:50 +00:00
|
|
|
|
2019-09-02 14:05:02 +00:00
|
|
|
// If the batch is larger than the queue capacity, it should be truncated
|
|
|
|
// from the front.
|
2015-12-10 15:31:50 +00:00
|
|
|
h.Send(alerts[:4*maxBatchSize]...)
|
|
|
|
for i := 1; i < 4; i++ {
|
2019-09-02 14:05:02 +00:00
|
|
|
assertAlerts(alerts[i*maxBatchSize : (i+1)*maxBatchSize])
|
2013-08-09 17:32:55 +00:00
|
|
|
}
|
|
|
|
|
2019-09-02 14:05:02 +00:00
|
|
|
// Send one batch, wait for it to arrive and block the server so the queue fills up.
|
2015-12-10 15:31:50 +00:00
|
|
|
h.Send(alerts[:maxBatchSize]...)
|
|
|
|
<-called
|
|
|
|
|
2019-09-02 14:05:02 +00:00
|
|
|
// Send several batches while the server is still blocked so the queue
|
|
|
|
// fills up to its maximum capacity (3*maxBatchSize). Then check that the
|
|
|
|
// queue is truncated in the front.
|
|
|
|
h.Send(alerts[1*maxBatchSize : 2*maxBatchSize]...) // this batch should be dropped.
|
2015-12-10 15:31:50 +00:00
|
|
|
h.Send(alerts[2*maxBatchSize : 3*maxBatchSize]...)
|
|
|
|
h.Send(alerts[3*maxBatchSize : 4*maxBatchSize]...)
|
|
|
|
|
|
|
|
// Send the batch that drops the first one.
|
|
|
|
h.Send(alerts[4*maxBatchSize : 5*maxBatchSize]...)
|
|
|
|
|
2019-09-02 14:05:02 +00:00
|
|
|
// Unblock the server.
|
|
|
|
expectedc <- alerts[:maxBatchSize]
|
|
|
|
select {
|
|
|
|
case err := <-errc:
|
2020-10-29 09:43:23 +00:00
|
|
|
require.NoError(t, err)
|
2019-09-02 14:05:02 +00:00
|
|
|
case <-time.After(5 * time.Second):
|
2021-09-13 19:19:20 +00:00
|
|
|
require.FailNow(t, "Alerts were not pushed.")
|
2019-09-02 14:05:02 +00:00
|
|
|
}
|
2015-12-10 15:31:50 +00:00
|
|
|
|
2019-09-02 14:05:02 +00:00
|
|
|
// Verify that we receive the last 3 batches.
|
2019-05-06 07:02:40 +00:00
|
|
|
for i := 2; i < 5; i++ {
|
2019-09-02 14:05:02 +00:00
|
|
|
assertAlerts(alerts[i*maxBatchSize : (i+1)*maxBatchSize])
|
2013-08-09 17:32:55 +00:00
|
|
|
}
|
|
|
|
}
|
2016-11-25 10:11:28 +00:00
|
|
|
|
|
|
|
// alertmanagerMock is a test double whose URL is produced on demand by urlf,
// so tests can point it at a server created after the mock itself.
type alertmanagerMock struct {
	urlf func() string
}

// url parses the string returned by urlf and returns the result. It panics if
// that string is not a valid URL.
func (a alertmanagerMock) url() *url.URL {
	raw := a.urlf()
	parsed, err := url.Parse(raw)
	if err == nil {
		return parsed
	}
	panic(err)
}
|
2017-05-17 14:24:22 +00:00
|
|
|
|
|
|
|
func TestLabelSetNotReused(t *testing.T) {
|
|
|
|
tg := makeInputTargetGroup()
|
2021-10-28 00:01:28 +00:00
|
|
|
_, _, err := AlertmanagerFromGroup(tg, &config.AlertmanagerConfig{})
|
2017-05-17 14:24:22 +00:00
|
|
|
|
2020-10-29 09:43:23 +00:00
|
|
|
require.NoError(t, err)
|
2018-03-29 15:07:26 +00:00
|
|
|
|
|
|
|
// Target modified during alertmanager extraction
|
2020-10-29 09:43:23 +00:00
|
|
|
require.Equal(t, tg, makeInputTargetGroup())
|
2017-05-17 14:24:22 +00:00
|
|
|
}
|
|
|
|
|
2017-12-30 20:28:34 +00:00
|
|
|
func TestReload(t *testing.T) {
|
2021-10-22 08:06:44 +00:00
|
|
|
tests := []struct {
|
2017-12-30 20:28:34 +00:00
|
|
|
in *targetgroup.Group
|
|
|
|
out string
|
|
|
|
}{
|
|
|
|
{
|
|
|
|
in: &targetgroup.Group{
|
|
|
|
Targets: []model.LabelSet{
|
|
|
|
{
|
|
|
|
"__address__": "alertmanager:9093",
|
|
|
|
},
|
|
|
|
},
|
|
|
|
},
|
2021-03-19 17:19:12 +00:00
|
|
|
out: "http://alertmanager:9093/api/v2/alerts",
|
2017-12-30 20:28:34 +00:00
|
|
|
},
|
|
|
|
}
|
|
|
|
|
2018-01-30 17:45:37 +00:00
|
|
|
n := NewManager(&Options{}, nil)
|
2017-12-30 20:28:34 +00:00
|
|
|
|
|
|
|
cfg := &config.Config{}
|
|
|
|
s := `
|
|
|
|
alerting:
|
|
|
|
alertmanagers:
|
|
|
|
- static_configs:
|
|
|
|
`
|
2021-09-13 19:19:20 +00:00
|
|
|
err := yaml.UnmarshalStrict([]byte(s), cfg)
|
|
|
|
require.NoError(t, err, "Unable to load YAML config.")
|
2023-12-07 11:35:01 +00:00
|
|
|
require.Len(t, cfg.AlertingConfig.AlertmanagerConfigs, 1)
|
2017-12-30 20:28:34 +00:00
|
|
|
|
2021-09-13 19:19:20 +00:00
|
|
|
err = n.ApplyConfig(cfg)
|
|
|
|
require.NoError(t, err, "Error applying the config.")
|
2017-12-30 20:28:34 +00:00
|
|
|
|
|
|
|
tgs := make(map[string][]*targetgroup.Group)
|
|
|
|
for _, tt := range tests {
|
2019-12-12 16:00:19 +00:00
|
|
|
for k := range cfg.AlertingConfig.AlertmanagerConfigs.ToMap() {
|
|
|
|
tgs[k] = []*targetgroup.Group{
|
|
|
|
tt.in,
|
|
|
|
}
|
|
|
|
break
|
2017-12-30 20:28:34 +00:00
|
|
|
}
|
|
|
|
n.reload(tgs)
|
|
|
|
res := n.Alertmanagers()[0].String()
|
|
|
|
|
2020-10-29 09:43:23 +00:00
|
|
|
require.Equal(t, tt.out, res)
|
2017-12-30 20:28:34 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2018-02-21 09:00:07 +00:00
|
|
|
func TestDroppedAlertmanagers(t *testing.T) {
|
2021-10-22 08:06:44 +00:00
|
|
|
tests := []struct {
|
2018-02-21 09:00:07 +00:00
|
|
|
in *targetgroup.Group
|
|
|
|
out string
|
|
|
|
}{
|
|
|
|
{
|
|
|
|
in: &targetgroup.Group{
|
|
|
|
Targets: []model.LabelSet{
|
|
|
|
{
|
|
|
|
"__address__": "alertmanager:9093",
|
|
|
|
},
|
|
|
|
},
|
|
|
|
},
|
2021-03-19 17:19:12 +00:00
|
|
|
out: "http://alertmanager:9093/api/v2/alerts",
|
2018-02-21 09:00:07 +00:00
|
|
|
},
|
|
|
|
}
|
|
|
|
|
|
|
|
n := NewManager(&Options{}, nil)
|
|
|
|
|
|
|
|
cfg := &config.Config{}
|
|
|
|
s := `
|
|
|
|
alerting:
|
|
|
|
alertmanagers:
|
|
|
|
- static_configs:
|
|
|
|
relabel_configs:
|
|
|
|
- source_labels: ['__address__']
|
|
|
|
regex: 'alertmanager:9093'
|
|
|
|
action: drop
|
|
|
|
`
|
2021-09-13 19:19:20 +00:00
|
|
|
err := yaml.UnmarshalStrict([]byte(s), cfg)
|
|
|
|
require.NoError(t, err, "Unable to load YAML config.")
|
2023-12-07 11:35:01 +00:00
|
|
|
require.Len(t, cfg.AlertingConfig.AlertmanagerConfigs, 1)
|
2018-02-21 09:00:07 +00:00
|
|
|
|
2021-09-13 19:19:20 +00:00
|
|
|
err = n.ApplyConfig(cfg)
|
|
|
|
require.NoError(t, err, "Error applying the config.")
|
2018-02-21 09:00:07 +00:00
|
|
|
|
|
|
|
tgs := make(map[string][]*targetgroup.Group)
|
|
|
|
for _, tt := range tests {
|
2019-12-12 16:00:19 +00:00
|
|
|
for k := range cfg.AlertingConfig.AlertmanagerConfigs.ToMap() {
|
|
|
|
tgs[k] = []*targetgroup.Group{
|
|
|
|
tt.in,
|
|
|
|
}
|
|
|
|
break
|
2018-02-21 09:00:07 +00:00
|
|
|
}
|
2019-12-12 16:00:19 +00:00
|
|
|
|
2018-02-21 09:00:07 +00:00
|
|
|
n.reload(tgs)
|
|
|
|
res := n.DroppedAlertmanagers()[0].String()
|
|
|
|
|
2020-10-29 09:43:23 +00:00
|
|
|
require.Equal(t, res, tt.out)
|
2018-02-21 09:00:07 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
Refactor SD configuration to remove `config` dependency (#3629)
* refactor: move targetGroup struct and CheckOverflow() to their own package
* refactor: move auth and security related structs to a utility package, fix import error in utility package
* refactor: Azure SD, remove SD struct from config
* refactor: DNS SD, remove SD struct from config into dns package
* refactor: ec2 SD, move SD struct from config into the ec2 package
* refactor: file SD, move SD struct from config to file discovery package
* refactor: gce, move SD struct from config to gce discovery package
* refactor: move HTTPClientConfig and URL into util/config, fix import error in httputil
* refactor: consul, move SD struct from config into consul discovery package
* refactor: marathon, move SD struct from config into marathon discovery package
* refactor: triton, move SD struct from config to triton discovery package, fix test
* refactor: zookeeper, move SD structs from config to zookeeper discovery package
* refactor: openstack, remove SD struct from config, move into openstack discovery package
* refactor: kubernetes, move SD struct from config into kubernetes discovery package
* refactor: notifier, use targetgroup package instead of config
* refactor: tests for file, marathon, triton SD - use targetgroup package instead of config.TargetGroup
* refactor: retrieval, use targetgroup package instead of config.TargetGroup
* refactor: storage, use config util package
* refactor: discovery manager, use targetgroup package instead of config.TargetGroup
* refactor: use HTTPClient and TLS config from configUtil instead of config
* refactor: tests, use targetgroup package instead of config.TargetGroup
* refactor: fix tagetgroup.Group pointers that were removed by mistake
* refactor: openstack, kubernetes: drop prefixes
* refactor: remove import aliases forced due to vscode bug
* refactor: move main SD struct out of config into discovery/config
* refactor: rename configUtil to config_util
* refactor: rename yamlUtil to yaml_config
* refactor: kubernetes, remove prefixes
* refactor: move the TargetGroup package to discovery/
* refactor: fix order of imports
2017-12-29 20:01:34 +00:00
|
|
|
func makeInputTargetGroup() *targetgroup.Group {
|
|
|
|
return &targetgroup.Group{
|
2017-05-17 14:24:22 +00:00
|
|
|
Targets: []model.LabelSet{
|
2017-08-29 08:00:11 +00:00
|
|
|
{
|
2017-05-17 14:24:22 +00:00
|
|
|
model.AddressLabel: model.LabelValue("1.1.1.1:9090"),
|
|
|
|
model.LabelName("notcommon1"): model.LabelValue("label"),
|
|
|
|
},
|
|
|
|
},
|
|
|
|
Labels: model.LabelSet{
|
|
|
|
model.LabelName("common"): model.LabelValue("label"),
|
|
|
|
},
|
|
|
|
Source: "testsource",
|
|
|
|
}
|
|
|
|
}
|
2020-07-01 07:51:32 +00:00
|
|
|
|
|
|
|
func TestLabelsToOpenAPILabelSet(t *testing.T) {
|
2022-03-09 22:21:29 +00:00
|
|
|
require.Equal(t, models.LabelSet{"aaa": "111", "bbb": "222"}, labelsToOpenAPILabelSet(labels.FromStrings("aaa", "111", "bbb", "222")))
|
2020-07-01 07:51:32 +00:00
|
|
|
}
|
2022-07-01 12:23:23 +00:00
|
|
|
|
|
|
|
// TestHangingNotifier validates that targets updates happen even when there are
|
|
|
|
// queued alerts.
|
|
|
|
func TestHangingNotifier(t *testing.T) {
|
|
|
|
// Note: When targets are not updated in time, this test is flaky because go
|
|
|
|
// selects are not deterministic. Therefore we run 10 subtests to run into the issue.
|
|
|
|
for i := 0; i < 10; i++ {
|
|
|
|
t.Run(strconv.Itoa(i), func(t *testing.T) {
|
|
|
|
var (
|
|
|
|
done = make(chan struct{})
|
|
|
|
changed = make(chan struct{})
|
|
|
|
syncCh = make(chan map[string][]*targetgroup.Group)
|
|
|
|
)
|
|
|
|
|
|
|
|
defer func() {
|
|
|
|
close(done)
|
|
|
|
}()
|
|
|
|
|
2022-07-05 13:27:26 +00:00
|
|
|
var calledOnce bool
|
2022-07-01 12:23:23 +00:00
|
|
|
// Setting up a bad server. This server hangs for 2 seconds.
|
|
|
|
badServer := httptest.NewServer(http.HandlerFunc(func(w http.ResponseWriter, r *http.Request) {
|
2022-07-05 13:27:26 +00:00
|
|
|
if calledOnce {
|
|
|
|
t.Fatal("hanging server called multiple times")
|
|
|
|
}
|
|
|
|
calledOnce = true
|
2022-07-01 12:23:23 +00:00
|
|
|
select {
|
|
|
|
case <-done:
|
|
|
|
case <-time.After(2 * time.Second):
|
|
|
|
}
|
|
|
|
}))
|
|
|
|
badURL, err := url.Parse(badServer.URL)
|
|
|
|
require.NoError(t, err)
|
|
|
|
badAddress := badURL.Host // Used for __name__ label in targets.
|
|
|
|
|
|
|
|
// Setting up a bad server. This server returns fast, signaling requests on
|
|
|
|
// by closing the changed channel.
|
|
|
|
goodServer := httptest.NewServer(http.HandlerFunc(func(w http.ResponseWriter, r *http.Request) {
|
|
|
|
close(changed)
|
|
|
|
}))
|
|
|
|
goodURL, err := url.Parse(goodServer.URL)
|
|
|
|
require.NoError(t, err)
|
|
|
|
goodAddress := goodURL.Host // Used for __name__ label in targets.
|
|
|
|
|
|
|
|
h := NewManager(
|
|
|
|
&Options{
|
|
|
|
QueueCapacity: 20 * maxBatchSize,
|
|
|
|
},
|
|
|
|
nil,
|
|
|
|
)
|
|
|
|
|
|
|
|
h.alertmanagers = make(map[string]*alertmanagerSet)
|
|
|
|
|
|
|
|
am1Cfg := config.DefaultAlertmanagerConfig
|
|
|
|
am1Cfg.Timeout = model.Duration(200 * time.Millisecond)
|
|
|
|
|
|
|
|
h.alertmanagers["config-0"] = &alertmanagerSet{
|
|
|
|
ams: []alertmanager{},
|
|
|
|
cfg: &am1Cfg,
|
|
|
|
metrics: h.metrics,
|
|
|
|
}
|
|
|
|
go h.Run(syncCh)
|
|
|
|
defer h.Stop()
|
|
|
|
|
|
|
|
var alerts []*Alert
|
|
|
|
for i := range make([]struct{}, 20*maxBatchSize) {
|
|
|
|
alerts = append(alerts, &Alert{
|
|
|
|
Labels: labels.FromStrings("alertname", fmt.Sprintf("%d", i)),
|
|
|
|
})
|
|
|
|
}
|
|
|
|
|
|
|
|
// Injecting the hanging server URL.
|
|
|
|
syncCh <- map[string][]*targetgroup.Group{
|
|
|
|
"config-0": {
|
|
|
|
{
|
|
|
|
Targets: []model.LabelSet{
|
|
|
|
{
|
|
|
|
model.AddressLabel: model.LabelValue(badAddress),
|
|
|
|
},
|
|
|
|
},
|
|
|
|
},
|
|
|
|
},
|
|
|
|
}
|
|
|
|
|
|
|
|
// Queing alerts.
|
|
|
|
h.Send(alerts...)
|
|
|
|
|
|
|
|
// Updating with a working alertmanager target.
|
|
|
|
go func() {
|
|
|
|
select {
|
|
|
|
case syncCh <- map[string][]*targetgroup.Group{
|
|
|
|
"config-0": {
|
|
|
|
{
|
|
|
|
Targets: []model.LabelSet{
|
|
|
|
{
|
|
|
|
model.AddressLabel: model.LabelValue(goodAddress),
|
|
|
|
},
|
|
|
|
},
|
|
|
|
},
|
|
|
|
},
|
|
|
|
}:
|
|
|
|
case <-done:
|
|
|
|
}
|
|
|
|
}()
|
|
|
|
|
|
|
|
select {
|
2022-07-05 13:27:26 +00:00
|
|
|
case <-time.After(1 * time.Second):
|
|
|
|
t.Fatalf("Timeout after 1 second, targets not synced in time.")
|
2022-07-01 12:23:23 +00:00
|
|
|
case <-changed:
|
|
|
|
// The good server has been hit in less than 3 seconds, therefore
|
|
|
|
// targets have been updated before a second call could be made to the
|
|
|
|
// bad server.
|
|
|
|
}
|
|
|
|
})
|
|
|
|
}
|
|
|
|
}
|