mirror of https://github.com/prometheus/prometheus
You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
376 lines
11 KiB
376 lines
11 KiB
// Copyright 2024 The Prometheus Authors
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
|
|
|
package textparse |
|
|
|
import ( |
|
"errors" |
|
"io" |
|
"math" |
|
"strconv" |
|
"strings" |
|
|
|
"github.com/prometheus/common/model" |
|
|
|
"github.com/prometheus/prometheus/model/exemplar" |
|
"github.com/prometheus/prometheus/model/histogram" |
|
"github.com/prometheus/prometheus/model/labels" |
|
"github.com/prometheus/prometheus/util/convertnhcb" |
|
) |
|
|
|
// collectionState is the phase the NHCBParser is in with respect to collating
// classic histogram series into a converted histogram.
type collectionState int

const (
	// stateStart means no classic histogram series are being collated.
	// It is the zero value and the state Next returns to after emitting.
	stateStart collectionState = iota
	// stateCollecting means series of a classic histogram are being
	// accumulated for a later conversion.
	stateCollecting
	// stateEmitting means a converted histogram has been produced and is
	// what the accessor methods currently expose.
	stateEmitting
)
|
|
|
// The NHCBParser wraps a Parser and converts classic histograms to native |
|
// histograms with custom buckets. |
|
// |
|
// Since Parser interface is line based, this parser needs to keep track |
|
// of the last classic histogram series it saw to collate them into a |
|
// single native histogram. |
|
// |
|
// Note: |
|
// - Only series that have the histogram metadata type are considered for |
|
// conversion. |
|
// - The classic series are also returned if keepClassicHistograms is true. |
|
type NHCBParser struct { |
|
// The parser we're wrapping. |
|
parser Parser |
|
// Option to keep classic histograms along with converted histograms. |
|
keepClassicHistograms bool |
|
|
|
// Labels builder. |
|
builder labels.ScratchBuilder |
|
|
|
// State of the parser. |
|
state collectionState |
|
|
|
// Caches the values from the underlying parser. |
|
// For Series and Histogram. |
|
bytes []byte |
|
ts *int64 |
|
value float64 |
|
h *histogram.Histogram |
|
fh *histogram.FloatHistogram |
|
// For Metric. |
|
lset labels.Labels |
|
metricString string |
|
// For Type. |
|
bName []byte |
|
typ model.MetricType |
|
|
|
// Caches the entry itself if we are inserting a converted NHCB |
|
// halfway through. |
|
entry Entry |
|
err error |
|
|
|
// Caches the values and metric for the inserted converted NHCB. |
|
bytesNHCB []byte |
|
hNHCB *histogram.Histogram |
|
fhNHCB *histogram.FloatHistogram |
|
lsetNHCB labels.Labels |
|
exemplars []exemplar.Exemplar |
|
ctNHCB *int64 |
|
metricStringNHCB string |
|
|
|
// Collates values from the classic histogram series to build |
|
// the converted histogram later. |
|
tempLsetNHCB labels.Labels |
|
tempNHCB convertnhcb.TempHistogram |
|
tempExemplars []exemplar.Exemplar |
|
tempExemplarCount int |
|
tempCT *int64 |
|
|
|
// Remembers the last base histogram metric name (assuming it's |
|
// a classic histogram) so we can tell if the next float series |
|
// is part of the same classic histogram. |
|
lastHistogramName string |
|
lastHistogramLabelsHash uint64 |
|
lastHistogramExponential bool |
|
// Reused buffer for hashing labels. |
|
hBuffer []byte |
|
} |
|
|
|
func NewNHCBParser(p Parser, st *labels.SymbolTable, keepClassicHistograms bool) Parser { |
|
return &NHCBParser{ |
|
parser: p, |
|
keepClassicHistograms: keepClassicHistograms, |
|
builder: labels.NewScratchBuilderWithSymbolTable(st, 16), |
|
tempNHCB: convertnhcb.NewTempHistogram(), |
|
} |
|
} |
|
|
|
func (p *NHCBParser) Series() ([]byte, *int64, float64) { |
|
return p.bytes, p.ts, p.value |
|
} |
|
|
|
func (p *NHCBParser) Histogram() ([]byte, *int64, *histogram.Histogram, *histogram.FloatHistogram) { |
|
if p.state == stateEmitting { |
|
return p.bytesNHCB, p.ts, p.hNHCB, p.fhNHCB |
|
} |
|
return p.bytes, p.ts, p.h, p.fh |
|
} |
|
|
|
func (p *NHCBParser) Help() ([]byte, []byte) { |
|
return p.parser.Help() |
|
} |
|
|
|
func (p *NHCBParser) Type() ([]byte, model.MetricType) { |
|
return p.bName, p.typ |
|
} |
|
|
|
func (p *NHCBParser) Unit() ([]byte, []byte) { |
|
return p.parser.Unit() |
|
} |
|
|
|
func (p *NHCBParser) Comment() []byte { |
|
return p.parser.Comment() |
|
} |
|
|
|
func (p *NHCBParser) Metric(l *labels.Labels) string { |
|
if p.state == stateEmitting { |
|
*l = p.lsetNHCB |
|
return p.metricStringNHCB |
|
} |
|
*l = p.lset |
|
return p.metricString |
|
} |
|
|
|
func (p *NHCBParser) Exemplar(ex *exemplar.Exemplar) bool { |
|
if p.state == stateEmitting { |
|
if len(p.exemplars) == 0 { |
|
return false |
|
} |
|
*ex = p.exemplars[0] |
|
p.exemplars = p.exemplars[1:] |
|
return true |
|
} |
|
return p.parser.Exemplar(ex) |
|
} |
|
|
|
func (p *NHCBParser) CreatedTimestamp() *int64 { |
|
switch p.state { |
|
case stateStart: |
|
if p.entry == EntrySeries || p.entry == EntryHistogram { |
|
return p.parser.CreatedTimestamp() |
|
} |
|
case stateCollecting: |
|
return p.tempCT |
|
case stateEmitting: |
|
return p.ctNHCB |
|
} |
|
return nil |
|
} |
|
|
|
func (p *NHCBParser) Next() (Entry, error) { |
|
if p.state == stateEmitting { |
|
p.state = stateStart |
|
if p.entry == EntrySeries { |
|
isNHCB := p.handleClassicHistogramSeries(p.lset) |
|
if isNHCB && !p.keepClassicHistograms { |
|
// Do not return the classic histogram series if it was converted to NHCB and we are not keeping classic histograms. |
|
return p.Next() |
|
} |
|
} |
|
return p.entry, p.err |
|
} |
|
|
|
p.entry, p.err = p.parser.Next() |
|
if p.err != nil { |
|
if errors.Is(p.err, io.EOF) && p.processNHCB() { |
|
return EntryHistogram, nil |
|
} |
|
return EntryInvalid, p.err |
|
} |
|
switch p.entry { |
|
case EntrySeries: |
|
p.bytes, p.ts, p.value = p.parser.Series() |
|
p.metricString = p.parser.Metric(&p.lset) |
|
// Check the label set to see if we can continue or need to emit the NHCB. |
|
var isNHCB bool |
|
if p.compareLabels() { |
|
// Labels differ. Check if we can emit the NHCB. |
|
if p.processNHCB() { |
|
return EntryHistogram, nil |
|
} |
|
isNHCB = p.handleClassicHistogramSeries(p.lset) |
|
} else { |
|
// Labels are the same. Check if after an exponential histogram. |
|
if p.lastHistogramExponential { |
|
isNHCB = false |
|
} else { |
|
isNHCB = p.handleClassicHistogramSeries(p.lset) |
|
} |
|
} |
|
if isNHCB && !p.keepClassicHistograms { |
|
// Do not return the classic histogram series if it was converted to NHCB and we are not keeping classic histograms. |
|
return p.Next() |
|
} |
|
return p.entry, p.err |
|
case EntryHistogram: |
|
p.bytes, p.ts, p.h, p.fh = p.parser.Histogram() |
|
p.metricString = p.parser.Metric(&p.lset) |
|
p.storeExponentialLabels() |
|
case EntryType: |
|
p.bName, p.typ = p.parser.Type() |
|
} |
|
if p.processNHCB() { |
|
return EntryHistogram, nil |
|
} |
|
return p.entry, p.err |
|
} |
|
|
|
// Return true if labels have changed and we should emit the NHCB. |
|
func (p *NHCBParser) compareLabels() bool { |
|
if p.state != stateCollecting { |
|
return false |
|
} |
|
if p.typ != model.MetricTypeHistogram { |
|
// Different metric type. |
|
return true |
|
} |
|
if p.lastHistogramName != convertnhcb.GetHistogramMetricBaseName(p.lset.Get(labels.MetricName)) { |
|
// Different metric name. |
|
return true |
|
} |
|
nextHash, _ := p.lset.HashWithoutLabels(p.hBuffer, labels.BucketLabel) |
|
// Different label values. |
|
return p.lastHistogramLabelsHash != nextHash |
|
} |
|
|
|
// Save the label set of the classic histogram without suffix and bucket `le` label. |
|
func (p *NHCBParser) storeClassicLabels() { |
|
p.lastHistogramName = convertnhcb.GetHistogramMetricBaseName(p.lset.Get(labels.MetricName)) |
|
p.lastHistogramLabelsHash, _ = p.lset.HashWithoutLabels(p.hBuffer, labels.BucketLabel) |
|
p.lastHistogramExponential = false |
|
} |
|
|
|
func (p *NHCBParser) storeExponentialLabels() { |
|
p.lastHistogramName = p.lset.Get(labels.MetricName) |
|
p.lastHistogramLabelsHash, _ = p.lset.HashWithoutLabels(p.hBuffer) |
|
p.lastHistogramExponential = true |
|
} |
|
|
|
// handleClassicHistogramSeries collates the classic histogram series to be converted to NHCB |
|
// if it is actually a classic histogram series (and not a normal float series) and if there |
|
// isn't already a native histogram with the same name (assuming it is always processed |
|
// right before the classic histograms) and returns true if the collation was done. |
|
func (p *NHCBParser) handleClassicHistogramSeries(lset labels.Labels) bool { |
|
if p.typ != model.MetricTypeHistogram { |
|
return false |
|
} |
|
mName := lset.Get(labels.MetricName) |
|
// Sanity check to ensure that the TYPE metadata entry name is the same as the base name. |
|
if convertnhcb.GetHistogramMetricBaseName(mName) != string(p.bName) { |
|
return false |
|
} |
|
switch { |
|
case strings.HasSuffix(mName, "_bucket") && lset.Has(labels.BucketLabel): |
|
le, err := strconv.ParseFloat(lset.Get(labels.BucketLabel), 64) |
|
if err == nil && !math.IsNaN(le) { |
|
p.processClassicHistogramSeries(lset, "_bucket", func(hist *convertnhcb.TempHistogram) { |
|
hist.BucketCounts[le] = p.value |
|
}) |
|
return true |
|
} |
|
case strings.HasSuffix(mName, "_count"): |
|
p.processClassicHistogramSeries(lset, "_count", func(hist *convertnhcb.TempHistogram) { |
|
hist.Count = p.value |
|
}) |
|
return true |
|
case strings.HasSuffix(mName, "_sum"): |
|
p.processClassicHistogramSeries(lset, "_sum", func(hist *convertnhcb.TempHistogram) { |
|
hist.Sum = p.value |
|
}) |
|
return true |
|
} |
|
return false |
|
} |
|
|
|
func (p *NHCBParser) processClassicHistogramSeries(lset labels.Labels, suffix string, updateHist func(*convertnhcb.TempHistogram)) { |
|
if p.state != stateCollecting { |
|
p.storeClassicLabels() |
|
p.tempCT = p.parser.CreatedTimestamp() |
|
p.state = stateCollecting |
|
} |
|
p.tempLsetNHCB = convertnhcb.GetHistogramMetricBase(lset, suffix) |
|
p.storeExemplars() |
|
updateHist(&p.tempNHCB) |
|
} |
|
|
|
func (p *NHCBParser) storeExemplars() { |
|
for ex := p.nextExemplarPtr(); p.parser.Exemplar(ex); ex = p.nextExemplarPtr() { |
|
p.tempExemplarCount++ |
|
} |
|
} |
|
|
|
func (p *NHCBParser) nextExemplarPtr() *exemplar.Exemplar { |
|
switch { |
|
case p.tempExemplarCount == len(p.tempExemplars)-1: |
|
// Reuse the previously allocated exemplar, it was not filled up. |
|
case len(p.tempExemplars) == cap(p.tempExemplars): |
|
// Let the runtime grow the slice. |
|
p.tempExemplars = append(p.tempExemplars, exemplar.Exemplar{}) |
|
default: |
|
// Take the next element into use. |
|
p.tempExemplars = p.tempExemplars[:len(p.tempExemplars)+1] |
|
} |
|
return &p.tempExemplars[len(p.tempExemplars)-1] |
|
} |
|
|
|
func (p *NHCBParser) swapExemplars() { |
|
p.exemplars = p.tempExemplars[:p.tempExemplarCount] |
|
p.tempExemplars = p.tempExemplars[:0] |
|
p.tempExemplarCount = 0 |
|
} |
|
|
|
// processNHCB converts the collated classic histogram series to NHCB and caches the info |
|
// to be returned to callers. Retruns true if the conversion was successful. |
|
func (p *NHCBParser) processNHCB() bool { |
|
if p.state != stateCollecting { |
|
return false |
|
} |
|
ub := make([]float64, 0, len(p.tempNHCB.BucketCounts)) |
|
for b := range p.tempNHCB.BucketCounts { |
|
ub = append(ub, b) |
|
} |
|
upperBounds, hBase := convertnhcb.ProcessUpperBoundsAndCreateBaseHistogram(ub, false) |
|
fhBase := hBase.ToFloat(nil) |
|
h, fh := convertnhcb.NewHistogram(p.tempNHCB, upperBounds, hBase, fhBase) |
|
if h != nil { |
|
if err := h.Validate(); err != nil { |
|
return false |
|
} |
|
p.hNHCB = h |
|
p.fhNHCB = nil |
|
} else if fh != nil { |
|
if err := fh.Validate(); err != nil { |
|
return false |
|
} |
|
p.hNHCB = nil |
|
p.fhNHCB = fh |
|
} |
|
p.metricStringNHCB = p.tempLsetNHCB.Get(labels.MetricName) + strings.ReplaceAll(p.tempLsetNHCB.DropMetricName().String(), ", ", ",") |
|
p.bytesNHCB = []byte(p.metricStringNHCB) |
|
p.lsetNHCB = p.tempLsetNHCB |
|
p.swapExemplars() |
|
p.ctNHCB = p.tempCT |
|
p.tempNHCB = convertnhcb.NewTempHistogram() |
|
p.state = stateEmitting |
|
p.tempCT = nil |
|
return true |
|
}
|
|
|