mirror of https://github.com/prometheus/prometheus
You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
375 lines
11 KiB
375 lines
11 KiB
// Copyright 2024 The Prometheus Authors
|
|
// Licensed under the Apache License, Version 2.0 (the "License");
|
|
// you may not use this file except in compliance with the License.
|
|
// You may obtain a copy of the License at
|
|
//
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
//
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
// See the License for the specific language governing permissions and
|
|
// limitations under the License.
|
|
|
|
package textparse
|
|
|
|
import (
|
|
"errors"
|
|
"io"
|
|
"math"
|
|
"strconv"
|
|
"strings"
|
|
|
|
"github.com/prometheus/common/model"
|
|
|
|
"github.com/prometheus/prometheus/model/exemplar"
|
|
"github.com/prometheus/prometheus/model/histogram"
|
|
"github.com/prometheus/prometheus/model/labels"
|
|
"github.com/prometheus/prometheus/util/convertnhcb"
|
|
)
|
|
|
|
type collectionState int
|
|
|
|
const (
|
|
stateStart collectionState = iota
|
|
stateCollecting
|
|
stateEmitting
|
|
)
|
|
|
|
// The NHCBParser wraps a Parser and converts classic histograms to native
|
|
// histograms with custom buckets.
|
|
//
|
|
// Since Parser interface is line based, this parser needs to keep track
|
|
// of the last classic histogram series it saw to collate them into a
|
|
// single native histogram.
|
|
//
|
|
// Note:
|
|
// - Only series that have the histogram metadata type are considered for
|
|
// conversion.
|
|
// - The classic series are also returned if keepClassicHistograms is true.
|
|
type NHCBParser struct {
|
|
// The parser we're wrapping.
|
|
parser Parser
|
|
// Option to keep classic histograms along with converted histograms.
|
|
keepClassicHistograms bool
|
|
|
|
// Labels builder.
|
|
builder labels.ScratchBuilder
|
|
|
|
// State of the parser.
|
|
state collectionState
|
|
|
|
// Caches the values from the underlying parser.
|
|
// For Series and Histogram.
|
|
bytes []byte
|
|
ts *int64
|
|
value float64
|
|
h *histogram.Histogram
|
|
fh *histogram.FloatHistogram
|
|
// For Metric.
|
|
lset labels.Labels
|
|
metricString string
|
|
// For Type.
|
|
bName []byte
|
|
typ model.MetricType
|
|
|
|
// Caches the entry itself if we are inserting a converted NHCB
|
|
// halfway through.
|
|
entry Entry
|
|
err error
|
|
|
|
// Caches the values and metric for the inserted converted NHCB.
|
|
bytesNHCB []byte
|
|
hNHCB *histogram.Histogram
|
|
fhNHCB *histogram.FloatHistogram
|
|
lsetNHCB labels.Labels
|
|
exemplars []exemplar.Exemplar
|
|
ctNHCB *int64
|
|
metricStringNHCB string
|
|
|
|
// Collates values from the classic histogram series to build
|
|
// the converted histogram later.
|
|
tempLsetNHCB labels.Labels
|
|
tempNHCB convertnhcb.TempHistogram
|
|
tempExemplars []exemplar.Exemplar
|
|
tempExemplarCount int
|
|
tempCT *int64
|
|
|
|
// Remembers the last base histogram metric name (assuming it's
|
|
// a classic histogram) so we can tell if the next float series
|
|
// is part of the same classic histogram.
|
|
lastHistogramName string
|
|
lastHistogramLabelsHash uint64
|
|
lastHistogramExponential bool
|
|
// Reused buffer for hashing labels.
|
|
hBuffer []byte
|
|
}
|
|
|
|
func NewNHCBParser(p Parser, st *labels.SymbolTable, keepClassicHistograms bool) Parser {
|
|
return &NHCBParser{
|
|
parser: p,
|
|
keepClassicHistograms: keepClassicHistograms,
|
|
builder: labels.NewScratchBuilderWithSymbolTable(st, 16),
|
|
tempNHCB: convertnhcb.NewTempHistogram(),
|
|
}
|
|
}
|
|
|
|
func (p *NHCBParser) Series() ([]byte, *int64, float64) {
|
|
return p.bytes, p.ts, p.value
|
|
}
|
|
|
|
func (p *NHCBParser) Histogram() ([]byte, *int64, *histogram.Histogram, *histogram.FloatHistogram) {
|
|
if p.state == stateEmitting {
|
|
return p.bytesNHCB, p.ts, p.hNHCB, p.fhNHCB
|
|
}
|
|
return p.bytes, p.ts, p.h, p.fh
|
|
}
|
|
|
|
func (p *NHCBParser) Help() ([]byte, []byte) {
|
|
return p.parser.Help()
|
|
}
|
|
|
|
func (p *NHCBParser) Type() ([]byte, model.MetricType) {
|
|
return p.bName, p.typ
|
|
}
|
|
|
|
func (p *NHCBParser) Unit() ([]byte, []byte) {
|
|
return p.parser.Unit()
|
|
}
|
|
|
|
func (p *NHCBParser) Comment() []byte {
|
|
return p.parser.Comment()
|
|
}
|
|
|
|
func (p *NHCBParser) Metric(l *labels.Labels) string {
|
|
if p.state == stateEmitting {
|
|
*l = p.lsetNHCB
|
|
return p.metricStringNHCB
|
|
}
|
|
*l = p.lset
|
|
return p.metricString
|
|
}
|
|
|
|
func (p *NHCBParser) Exemplar(ex *exemplar.Exemplar) bool {
|
|
if p.state == stateEmitting {
|
|
if len(p.exemplars) == 0 {
|
|
return false
|
|
}
|
|
*ex = p.exemplars[0]
|
|
p.exemplars = p.exemplars[1:]
|
|
return true
|
|
}
|
|
return p.parser.Exemplar(ex)
|
|
}
|
|
|
|
func (p *NHCBParser) CreatedTimestamp() *int64 {
|
|
switch p.state {
|
|
case stateStart:
|
|
if p.entry == EntrySeries || p.entry == EntryHistogram {
|
|
return p.parser.CreatedTimestamp()
|
|
}
|
|
case stateCollecting:
|
|
return p.tempCT
|
|
case stateEmitting:
|
|
return p.ctNHCB
|
|
}
|
|
return nil
|
|
}
|
|
|
|
func (p *NHCBParser) Next() (Entry, error) {
|
|
if p.state == stateEmitting {
|
|
p.state = stateStart
|
|
if p.entry == EntrySeries {
|
|
isNHCB := p.handleClassicHistogramSeries(p.lset)
|
|
if isNHCB && !p.keepClassicHistograms {
|
|
// Do not return the classic histogram series if it was converted to NHCB and we are not keeping classic histograms.
|
|
return p.Next()
|
|
}
|
|
}
|
|
return p.entry, p.err
|
|
}
|
|
|
|
p.entry, p.err = p.parser.Next()
|
|
if p.err != nil {
|
|
if errors.Is(p.err, io.EOF) && p.processNHCB() {
|
|
return EntryHistogram, nil
|
|
}
|
|
return EntryInvalid, p.err
|
|
}
|
|
switch p.entry {
|
|
case EntrySeries:
|
|
p.bytes, p.ts, p.value = p.parser.Series()
|
|
p.metricString = p.parser.Metric(&p.lset)
|
|
// Check the label set to see if we can continue or need to emit the NHCB.
|
|
var isNHCB bool
|
|
if p.compareLabels() {
|
|
// Labels differ. Check if we can emit the NHCB.
|
|
if p.processNHCB() {
|
|
return EntryHistogram, nil
|
|
}
|
|
isNHCB = p.handleClassicHistogramSeries(p.lset)
|
|
} else {
|
|
// Labels are the same. Check if after an exponential histogram.
|
|
if p.lastHistogramExponential {
|
|
isNHCB = false
|
|
} else {
|
|
isNHCB = p.handleClassicHistogramSeries(p.lset)
|
|
}
|
|
}
|
|
if isNHCB && !p.keepClassicHistograms {
|
|
// Do not return the classic histogram series if it was converted to NHCB and we are not keeping classic histograms.
|
|
return p.Next()
|
|
}
|
|
return p.entry, p.err
|
|
case EntryHistogram:
|
|
p.bytes, p.ts, p.h, p.fh = p.parser.Histogram()
|
|
p.metricString = p.parser.Metric(&p.lset)
|
|
p.storeExponentialLabels()
|
|
case EntryType:
|
|
p.bName, p.typ = p.parser.Type()
|
|
}
|
|
if p.processNHCB() {
|
|
return EntryHistogram, nil
|
|
}
|
|
return p.entry, p.err
|
|
}
|
|
|
|
// Return true if labels have changed and we should emit the NHCB.
|
|
func (p *NHCBParser) compareLabels() bool {
|
|
if p.state != stateCollecting {
|
|
return false
|
|
}
|
|
if p.typ != model.MetricTypeHistogram {
|
|
// Different metric type.
|
|
return true
|
|
}
|
|
if p.lastHistogramName != convertnhcb.GetHistogramMetricBaseName(p.lset.Get(labels.MetricName)) {
|
|
// Different metric name.
|
|
return true
|
|
}
|
|
nextHash, _ := p.lset.HashWithoutLabels(p.hBuffer, labels.BucketLabel)
|
|
// Different label values.
|
|
return p.lastHistogramLabelsHash != nextHash
|
|
}
|
|
|
|
// Save the label set of the classic histogram without suffix and bucket `le` label.
|
|
func (p *NHCBParser) storeClassicLabels() {
|
|
p.lastHistogramName = convertnhcb.GetHistogramMetricBaseName(p.lset.Get(labels.MetricName))
|
|
p.lastHistogramLabelsHash, _ = p.lset.HashWithoutLabels(p.hBuffer, labels.BucketLabel)
|
|
p.lastHistogramExponential = false
|
|
}
|
|
|
|
func (p *NHCBParser) storeExponentialLabels() {
|
|
p.lastHistogramName = p.lset.Get(labels.MetricName)
|
|
p.lastHistogramLabelsHash, _ = p.lset.HashWithoutLabels(p.hBuffer)
|
|
p.lastHistogramExponential = true
|
|
}
|
|
|
|
// handleClassicHistogramSeries collates the classic histogram series to be converted to NHCB
|
|
// if it is actually a classic histogram series (and not a normal float series) and if there
|
|
// isn't already a native histogram with the same name (assuming it is always processed
|
|
// right before the classic histograms) and returns true if the collation was done.
|
|
func (p *NHCBParser) handleClassicHistogramSeries(lset labels.Labels) bool {
|
|
if p.typ != model.MetricTypeHistogram {
|
|
return false
|
|
}
|
|
mName := lset.Get(labels.MetricName)
|
|
// Sanity check to ensure that the TYPE metadata entry name is the same as the base name.
|
|
if convertnhcb.GetHistogramMetricBaseName(mName) != string(p.bName) {
|
|
return false
|
|
}
|
|
switch {
|
|
case strings.HasSuffix(mName, "_bucket") && lset.Has(labels.BucketLabel):
|
|
le, err := strconv.ParseFloat(lset.Get(labels.BucketLabel), 64)
|
|
if err == nil && !math.IsNaN(le) {
|
|
p.processClassicHistogramSeries(lset, "_bucket", func(hist *convertnhcb.TempHistogram) {
|
|
_ = hist.SetBucketCount(le, p.value)
|
|
})
|
|
return true
|
|
}
|
|
case strings.HasSuffix(mName, "_count"):
|
|
p.processClassicHistogramSeries(lset, "_count", func(hist *convertnhcb.TempHistogram) {
|
|
_ = hist.SetCount(p.value)
|
|
})
|
|
return true
|
|
case strings.HasSuffix(mName, "_sum"):
|
|
p.processClassicHistogramSeries(lset, "_sum", func(hist *convertnhcb.TempHistogram) {
|
|
_ = hist.SetSum(p.value)
|
|
})
|
|
return true
|
|
}
|
|
return false
|
|
}
|
|
|
|
func (p *NHCBParser) processClassicHistogramSeries(lset labels.Labels, suffix string, updateHist func(*convertnhcb.TempHistogram)) {
|
|
if p.state != stateCollecting {
|
|
p.storeClassicLabels()
|
|
p.tempCT = p.parser.CreatedTimestamp()
|
|
p.state = stateCollecting
|
|
p.tempLsetNHCB = convertnhcb.GetHistogramMetricBase(lset, suffix)
|
|
}
|
|
p.storeExemplars()
|
|
updateHist(&p.tempNHCB)
|
|
}
|
|
|
|
func (p *NHCBParser) storeExemplars() {
|
|
for ex := p.nextExemplarPtr(); p.parser.Exemplar(ex); ex = p.nextExemplarPtr() {
|
|
p.tempExemplarCount++
|
|
}
|
|
}
|
|
|
|
func (p *NHCBParser) nextExemplarPtr() *exemplar.Exemplar {
|
|
switch {
|
|
case p.tempExemplarCount == len(p.tempExemplars)-1:
|
|
// Reuse the previously allocated exemplar, it was not filled up.
|
|
case len(p.tempExemplars) == cap(p.tempExemplars):
|
|
// Let the runtime grow the slice.
|
|
p.tempExemplars = append(p.tempExemplars, exemplar.Exemplar{})
|
|
default:
|
|
// Take the next element into use.
|
|
p.tempExemplars = p.tempExemplars[:len(p.tempExemplars)+1]
|
|
}
|
|
return &p.tempExemplars[len(p.tempExemplars)-1]
|
|
}
|
|
|
|
func (p *NHCBParser) swapExemplars() {
|
|
p.exemplars = p.tempExemplars[:p.tempExemplarCount]
|
|
p.tempExemplars = p.tempExemplars[:0]
|
|
}
|
|
|
|
// processNHCB converts the collated classic histogram series to NHCB and caches the info
|
|
// to be returned to callers. Retruns true if the conversion was successful.
|
|
func (p *NHCBParser) processNHCB() bool {
|
|
if p.state != stateCollecting {
|
|
return false
|
|
}
|
|
h, fh, err := p.tempNHCB.Convert()
|
|
if err == nil {
|
|
if h != nil {
|
|
if err := h.Validate(); err != nil {
|
|
return false
|
|
}
|
|
p.hNHCB = h
|
|
p.fhNHCB = nil
|
|
} else if fh != nil {
|
|
if err := fh.Validate(); err != nil {
|
|
return false
|
|
}
|
|
p.hNHCB = nil
|
|
p.fhNHCB = fh
|
|
}
|
|
p.metricStringNHCB = p.tempLsetNHCB.Get(labels.MetricName) + strings.ReplaceAll(p.tempLsetNHCB.DropMetricName().String(), ", ", ",")
|
|
p.bytesNHCB = []byte(p.metricStringNHCB)
|
|
p.lsetNHCB = p.tempLsetNHCB
|
|
p.swapExemplars()
|
|
p.ctNHCB = p.tempCT
|
|
p.state = stateEmitting
|
|
} else {
|
|
p.state = stateStart
|
|
}
|
|
p.tempNHCB.Reset()
|
|
p.tempExemplarCount = 0
|
|
p.tempCT = nil
|
|
return err == nil
|
|
}
|