Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Add filtering option for prometheus collector #16420

Merged
merged 14 commits into from
Feb 24, 2020
3 changes: 2 additions & 1 deletion CHANGELOG.next.asciidoc
Original file line number Diff line number Diff line change
Expand Up @@ -125,7 +125,7 @@ https://github.com/elastic/beats/compare/v7.0.0-alpha2...master[Check the HEAD d
- Add MQTT input. {issue}15602[15602] {pull}16204[16204]
- Add ECS categorization fields to activemq module. {issue}16151[16151] {pull}16201[16201]
- Add a TLS test and more debug output to httpjson input {pull}16315[16315]
- Add an SSL config example in config.yml for filebeat MISP module. {pull}16320[16320]
- Add an SSL config example in config.yml for filebeat MISP module. {pull}16320[16320]
- Improve ECS categorization, container & process field mappings in auditd module. {issue}16153[16153] {pull}16280[16280]

*Heartbeat*
Expand Down Expand Up @@ -164,6 +164,7 @@ https://github.com/elastic/beats/compare/v7.0.0-alpha2...master[Check the HEAD d
- Add Load Balancing metricset to GCP {pull}15559[15559]
- Add support for Dropwizard metrics 4.1. {pull}16332[16332]
- Improve the `haproxy` module to support metrics exposed via HTTPS. {issue}14579[14579] {pull}16333[16333]
- Add filtering option for prometheus collector. {pull}16420[16420]

*Packetbeat*

Expand Down
3 changes: 3 additions & 0 deletions metricbeat/docs/modules/prometheus.asciidoc
Original file line number Diff line number Diff line change
Expand Up @@ -32,6 +32,9 @@ metricbeat.modules:
period: 10s
hosts: ["localhost:9090"]
metrics_path: /metrics
#metrics_filters:
# include: []
# exclude: []
#username: "user"
#password: "secret"
Expand Down
3 changes: 3 additions & 0 deletions metricbeat/metricbeat.reference.yml
Original file line number Diff line number Diff line change
Expand Up @@ -699,6 +699,9 @@ metricbeat.modules:
period: 10s
hosts: ["localhost:9090"]
metrics_path: /metrics
#metrics_filters:
# include: []
# exclude: []
#username: "user"
#password: "secret"

Expand Down
3 changes: 3 additions & 0 deletions metricbeat/module/prometheus/_meta/config.yml
Original file line number Diff line number Diff line change
Expand Up @@ -2,6 +2,9 @@
period: 10s
hosts: ["localhost:9090"]
metrics_path: /metrics
#metrics_filters:
# include: []
# exclude: []
#username: "user"
#password: "secret"

Expand Down
21 changes: 20 additions & 1 deletion metricbeat/module/prometheus/collector/_meta/docs.asciidoc
Original file line number Diff line number Diff line change
Expand Up @@ -40,4 +40,23 @@ metricbeat.modules:
metrics_path: '/federate'
query:
'match[]': '{__name__!=""}'
-------------------------------------------------------------------------------------
-------------------------------------------------------------------------------------

[float]
=== Filtering metrics

In order to filter out/in metrics one can make use of `metrics_filters.include` `metrics_filters.exclude` settings:

[source,yaml]
-------------------------------------------------------------------------------------
- module: prometheus
period: 10s
hosts: ["localhost:9092"]
metrics_path: /metrics
metrics_filters:
include: ["node_filesystem_*"]
exclude: ["node_filesystem_device_*", "node_filesystem_readonly"]
-------------------------------------------------------------------------------------

The configuration above will include only metrics that match `node_filesystem_*` pattern and do not match `node_filesystem_device_*`
and are not `node_filesystem_readonly` metric.
83 changes: 80 additions & 3 deletions metricbeat/module/prometheus/collector/collector.go
Original file line number Diff line number Diff line change
Expand Up @@ -18,7 +18,10 @@
package collector

import (
"regexp"

"github.com/pkg/errors"
dto "github.com/prometheus/client_model/go"

"github.com/elastic/beats/libbeat/common"
p "github.com/elastic/beats/metricbeat/helper/prometheus"
Expand Down Expand Up @@ -49,20 +52,36 @@ func init() {
// MetricSet for fetching prometheus data
type MetricSet struct {
mb.BaseMetricSet
prometheus p.Prometheus
prometheus p.Prometheus
includeMetrics []*regexp.Regexp
excludeMetrics []*regexp.Regexp
}

// New creates a new metricset
func New(base mb.BaseMetricSet) (mb.MetricSet, error) {
config := defaultConfig
if err := base.Module().UnpackConfig(&config); err != nil {
return nil, err
}
prometheus, err := p.NewPrometheusClient(base)
if err != nil {
return nil, err
}

return &MetricSet{
ms := &MetricSet{
BaseMetricSet: base,
prometheus: prometheus,
}, nil
}
ms.excludeMetrics, err = compilePatternList(config.MetricsFilters.ExcludeMetrics)
if err != nil {
return nil, errors.Wrapf(err, "unable to compile exclude patterns")
}
ms.includeMetrics, err = compilePatternList(config.MetricsFilters.IncludeMetrics)
if err != nil {
return nil, errors.Wrapf(err, "unable to compile include patterns")
}

return ms, nil
}

// Fetch fetches data and reports it
Expand All @@ -81,6 +100,9 @@ func (m *MetricSet) Fetch(reporter mb.ReporterV2) error {
}

for _, family := range families {
if m.skipFamily(family) {
continue
}
promEvents := getPromEventsFromMetricFamily(family)

for _, promEvent := range promEvents {
Expand Down Expand Up @@ -140,3 +162,58 @@ func (m *MetricSet) addUpEvent(eventList map[string]common.MapStr, up int) {
}

}

func (m *MetricSet) skipFamily(family *dto.MetricFamily) bool {
// example:
// include_metrics:
// - node_*
// exclude_metrics:
// - node_disk_*
//
// This would mean that we want to keep only the metrics that start with node_ prefix but
// are not related to disk so we exclude node_disk_* metrics from them.

if family == nil {
return true
}

// if include_metrics are defined, check if this metric should be included
if len(m.includeMetrics) > 0 {
if !matchMetricFamily(*family.Name, m.includeMetrics) {
return true
}
}
// now exclude the metric if it matches any of the given patterns
if len(m.excludeMetrics) > 0 {
if matchMetricFamily(*family.Name, m.excludeMetrics) {
return true
}
}
return false
}

func compilePatternList(patterns *[]string) ([]*regexp.Regexp, error) {
var compiledPatterns []*regexp.Regexp
compiledPatterns = []*regexp.Regexp{}
if patterns != nil {
for _, pattern := range *patterns {
r, err := regexp.Compile(pattern)
if err != nil {
return nil, errors.Wrapf(err, "compiling pattern '%s'", pattern)
}
compiledPatterns = append(compiledPatterns, r)
}
return compiledPatterns, nil
}
return []*regexp.Regexp{}, nil
}

func matchMetricFamily(family string, matchMetrics []*regexp.Regexp) bool {
for _, checkMetric := range matchMetrics {
matched := checkMetric.MatchString(family)
if matched {
return true
}
}
return false
}
160 changes: 160 additions & 0 deletions metricbeat/module/prometheus/collector/collector_test.go
Original file line number Diff line number Diff line change
Expand Up @@ -22,6 +22,8 @@ package collector
import (
"testing"

"github.com/elastic/beats/metricbeat/mb"

"github.com/golang/protobuf/proto"
dto "github.com/prometheus/client_model/go"
"github.com/stretchr/testify/assert"
Expand Down Expand Up @@ -200,6 +202,164 @@ func TestGetPromEventsFromMetricFamily(t *testing.T) {
}
}

func TestSkipMetricFamily(t *testing.T) {
testFamilies := []*dto.MetricFamily{
{
Name: proto.String("http_request_duration_microseconds_a_a_in"),
Help: proto.String("foo"),
Type: dto.MetricType_COUNTER.Enum(),
Metric: []*dto.Metric{
{
Label: []*dto.LabelPair{
{
Name: proto.String("handler"),
Value: proto.String("query"),
},
},
Counter: &dto.Counter{
Value: proto.Float64(10),
},
},
},
},
{
Name: proto.String("http_request_duration_microseconds_a_b_in"),
Help: proto.String("foo"),
Type: dto.MetricType_COUNTER.Enum(),
Metric: []*dto.Metric{
{
Label: []*dto.LabelPair{
{
Name: proto.String("handler"),
Value: proto.String("query"),
},
},
Counter: &dto.Counter{
Value: proto.Float64(10),
},
},
},
},
{
Name: proto.String("http_request_duration_microseconds_b_in"),
Help: proto.String("foo"),
Type: dto.MetricType_GAUGE.Enum(),
Metric: []*dto.Metric{
{
Gauge: &dto.Gauge{
Value: proto.Float64(10),
},
},
},
},
{
Name: proto.String("http_request_duration_microseconds_c_in"),
Help: proto.String("foo"),
Type: dto.MetricType_SUMMARY.Enum(),
Metric: []*dto.Metric{
{
Summary: &dto.Summary{
SampleCount: proto.Uint64(10),
SampleSum: proto.Float64(10),
Quantile: []*dto.Quantile{
{
Quantile: proto.Float64(0.99),
Value: proto.Float64(10),
},
},
},
},
},
},
{
Name: proto.String("http_request_duration_microseconds_d_in"),
Help: proto.String("foo"),
Type: dto.MetricType_HISTOGRAM.Enum(),
Metric: []*dto.Metric{
{
Histogram: &dto.Histogram{
SampleCount: proto.Uint64(10),
SampleSum: proto.Float64(10),
Bucket: []*dto.Bucket{
{
UpperBound: proto.Float64(0.99),
CumulativeCount: proto.Uint64(10),
},
},
},
},
},
},
{
Name: proto.String("http_request_duration_microseconds_e_in"),
Help: proto.String("foo"),
Type: dto.MetricType_UNTYPED.Enum(),
Metric: []*dto.Metric{
{
Label: []*dto.LabelPair{
{
Name: proto.String("handler"),
Value: proto.String("query"),
},
},
Untyped: &dto.Untyped{
Value: proto.Float64(10),
},
},
},
},
}

ms := &MetricSet{
BaseMetricSet: mb.BaseMetricSet{},
}

// test with no filters
ms.includeMetrics, _ = compilePatternList(&[]string{})
ms.excludeMetrics, _ = compilePatternList(&[]string{})
metricsToKeep := 0
for _, testFamily := range testFamilies {
if !ms.skipFamily(testFamily) {
metricsToKeep += 1
}
}
assert.Equal(t, metricsToKeep, len(testFamilies))

// test with only one include filter
ms.includeMetrics, _ = compilePatternList(&[]string{"http_request_duration_microseconds_a_*"})
ms.excludeMetrics, _ = compilePatternList(&[]string{})
metricsToKeep = 0
for _, testFamily := range testFamilies {
if !ms.skipFamily(testFamily) {
metricsToKeep += 1
}
}
assert.Equal(t, metricsToKeep, 2)

// test with only one exclude filter
ms.includeMetrics, _ = compilePatternList(&[]string{""})
ms.excludeMetrics, _ = compilePatternList(&[]string{"http_request_duration_microseconds_a_*"})
metricsToKeep = 0
for _, testFamily := range testFamilies {
if !ms.skipFamily(testFamily) {
metricsToKeep += 1
}
}
assert.Equal(t, len(testFamilies)-2, metricsToKeep)

// test with ine include and one exclude
ms.includeMetrics, _ = compilePatternList(&[]string{"http_request_duration_microseconds_a_*"})
ms.excludeMetrics, _ = compilePatternList(&[]string{"http_request_duration_microseconds_a_b_*"})
metricsToKeep = 0
for _, testFamily := range testFamilies {
if !ms.skipFamily(testFamily) {
metricsToKeep += 1
}
}
assert.Equal(t, 1, metricsToKeep)

}

func TestData(t *testing.T) {
mbtest.TestDataFiles(t, "prometheus", "collector")
}
Loading