mirror of
				https://github.com/prometheus/prometheus.git
				synced 2025-10-25 22:41:00 +02:00 
			
		
		
		
	The wrong source was used to return the created timestamp, leading to index out of bound panic. One line fix. Refactor the requirement test to be generic and be able to test OpenMetrics and Prom parsers as well. There are some differencies in what the parsers support, the Prom parser doesn't have created timestamp. The protobuf parser uses different formatting to identify the metric for the scrape loop. Each parser represents the sample timestamp differently. Signed-off-by: György Krajcsovits <gyorgy.krajcsovits@grafana.com>
		
			
				
	
	
		
			377 lines
		
	
	
		
			11 KiB
		
	
	
	
		
			Go
		
	
	
	
	
	
			
		
		
	
	
			377 lines
		
	
	
		
			11 KiB
		
	
	
	
		
			Go
		
	
	
	
	
	
| // Copyright 2024 The Prometheus Authors
 | |
| // Licensed under the Apache License, Version 2.0 (the "License");
 | |
| // you may not use this file except in compliance with the License.
 | |
| // You may obtain a copy of the License at
 | |
| //
 | |
| // http://www.apache.org/licenses/LICENSE-2.0
 | |
| //
 | |
| // Unless required by applicable law or agreed to in writing, software
 | |
| // distributed under the License is distributed on an "AS IS" BASIS,
 | |
| // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 | |
| // See the License for the specific language governing permissions and
 | |
| // limitations under the License.
 | |
| 
 | |
| package textparse
 | |
| 
 | |
| import (
 | |
| 	"errors"
 | |
| 	"io"
 | |
| 	"math"
 | |
| 	"strconv"
 | |
| 	"strings"
 | |
| 
 | |
| 	"github.com/prometheus/common/model"
 | |
| 
 | |
| 	"github.com/prometheus/prometheus/model/exemplar"
 | |
| 	"github.com/prometheus/prometheus/model/histogram"
 | |
| 	"github.com/prometheus/prometheus/model/labels"
 | |
| 	"github.com/prometheus/prometheus/util/convertnhcb"
 | |
| )
 | |
| 
 | |
| type collectionState int
 | |
| 
 | |
| const (
 | |
| 	stateStart collectionState = iota
 | |
| 	stateCollecting
 | |
| 	stateEmitting
 | |
| )
 | |
| 
 | |
| // The NHCBParser wraps a Parser and converts classic histograms to native
 | |
| // histograms with custom buckets.
 | |
| //
 | |
| // Since Parser interface is line based, this parser needs to keep track
 | |
| // of the last classic histogram series it saw to collate them into a
 | |
| // single native histogram.
 | |
| //
 | |
| // Note:
 | |
| //   - Only series that have the histogram metadata type are considered for
 | |
| //     conversion.
 | |
| //   - The classic series are also returned if keepClassicHistograms is true.
 | |
| type NHCBParser struct {
 | |
| 	// The parser we're wrapping.
 | |
| 	parser Parser
 | |
| 	// Option to keep classic histograms along with converted histograms.
 | |
| 	keepClassicHistograms bool
 | |
| 
 | |
| 	// Labels builder.
 | |
| 	builder labels.ScratchBuilder
 | |
| 
 | |
| 	// State of the parser.
 | |
| 	state collectionState
 | |
| 
 | |
| 	// Caches the values from the underlying parser.
 | |
| 	// For Series and Histogram.
 | |
| 	bytes []byte
 | |
| 	ts    *int64
 | |
| 	value float64
 | |
| 	h     *histogram.Histogram
 | |
| 	fh    *histogram.FloatHistogram
 | |
| 	// For Metric.
 | |
| 	lset         labels.Labels
 | |
| 	metricString string
 | |
| 	// For Type.
 | |
| 	bName []byte
 | |
| 	typ   model.MetricType
 | |
| 
 | |
| 	// Caches the entry itself if we are inserting a converted NHCB
 | |
| 	// halfway through.
 | |
| 	entry Entry
 | |
| 	err   error
 | |
| 
 | |
| 	// Caches the values and metric for the inserted converted NHCB.
 | |
| 	bytesNHCB        []byte
 | |
| 	hNHCB            *histogram.Histogram
 | |
| 	fhNHCB           *histogram.FloatHistogram
 | |
| 	lsetNHCB         labels.Labels
 | |
| 	exemplars        []exemplar.Exemplar
 | |
| 	ctNHCB           *int64
 | |
| 	metricStringNHCB string
 | |
| 
 | |
| 	// Collates values from the classic histogram series to build
 | |
| 	// the converted histogram later.
 | |
| 	tempLsetNHCB      labels.Labels
 | |
| 	tempNHCB          convertnhcb.TempHistogram
 | |
| 	tempExemplars     []exemplar.Exemplar
 | |
| 	tempExemplarCount int
 | |
| 	tempCT            *int64
 | |
| 
 | |
| 	// Remembers the last base histogram metric name (assuming it's
 | |
| 	// a classic histogram) so we can tell if the next float series
 | |
| 	// is part of the same classic histogram.
 | |
| 	lastHistogramName        string
 | |
| 	lastHistogramLabelsHash  uint64
 | |
| 	lastHistogramExponential bool
 | |
| 	// Reused buffer for hashing labels.
 | |
| 	hBuffer []byte
 | |
| }
 | |
| 
 | |
| func NewNHCBParser(p Parser, st *labels.SymbolTable, keepClassicHistograms bool) Parser {
 | |
| 	return &NHCBParser{
 | |
| 		parser:                p,
 | |
| 		keepClassicHistograms: keepClassicHistograms,
 | |
| 		builder:               labels.NewScratchBuilderWithSymbolTable(st, 16),
 | |
| 		tempNHCB:              convertnhcb.NewTempHistogram(),
 | |
| 	}
 | |
| }
 | |
| 
 | |
| func (p *NHCBParser) Series() ([]byte, *int64, float64) {
 | |
| 	return p.bytes, p.ts, p.value
 | |
| }
 | |
| 
 | |
| func (p *NHCBParser) Histogram() ([]byte, *int64, *histogram.Histogram, *histogram.FloatHistogram) {
 | |
| 	if p.state == stateEmitting {
 | |
| 		return p.bytesNHCB, p.ts, p.hNHCB, p.fhNHCB
 | |
| 	}
 | |
| 	return p.bytes, p.ts, p.h, p.fh
 | |
| }
 | |
| 
 | |
| func (p *NHCBParser) Help() ([]byte, []byte) {
 | |
| 	return p.parser.Help()
 | |
| }
 | |
| 
 | |
| func (p *NHCBParser) Type() ([]byte, model.MetricType) {
 | |
| 	return p.bName, p.typ
 | |
| }
 | |
| 
 | |
| func (p *NHCBParser) Unit() ([]byte, []byte) {
 | |
| 	return p.parser.Unit()
 | |
| }
 | |
| 
 | |
| func (p *NHCBParser) Comment() []byte {
 | |
| 	return p.parser.Comment()
 | |
| }
 | |
| 
 | |
| func (p *NHCBParser) Metric(l *labels.Labels) string {
 | |
| 	if p.state == stateEmitting {
 | |
| 		*l = p.lsetNHCB
 | |
| 		return p.metricStringNHCB
 | |
| 	}
 | |
| 	*l = p.lset
 | |
| 	return p.metricString
 | |
| }
 | |
| 
 | |
| func (p *NHCBParser) Exemplar(ex *exemplar.Exemplar) bool {
 | |
| 	if p.state == stateEmitting {
 | |
| 		if len(p.exemplars) == 0 {
 | |
| 			return false
 | |
| 		}
 | |
| 		*ex = p.exemplars[0]
 | |
| 		p.exemplars = p.exemplars[1:]
 | |
| 		return true
 | |
| 	}
 | |
| 	return p.parser.Exemplar(ex)
 | |
| }
 | |
| 
 | |
| func (p *NHCBParser) CreatedTimestamp() *int64 {
 | |
| 	switch p.state {
 | |
| 	case stateStart:
 | |
| 		if p.entry == EntrySeries || p.entry == EntryHistogram {
 | |
| 			return p.parser.CreatedTimestamp()
 | |
| 		}
 | |
| 	case stateCollecting:
 | |
| 		return p.tempCT
 | |
| 	case stateEmitting:
 | |
| 		return p.ctNHCB
 | |
| 	}
 | |
| 	return nil
 | |
| }
 | |
| 
 | |
| func (p *NHCBParser) Next() (Entry, error) {
 | |
| 	if p.state == stateEmitting {
 | |
| 		p.state = stateStart
 | |
| 		if p.entry == EntrySeries {
 | |
| 			isNHCB := p.handleClassicHistogramSeries(p.lset)
 | |
| 			if isNHCB && !p.keepClassicHistograms {
 | |
| 				// Do not return the classic histogram series if it was converted to NHCB and we are not keeping classic histograms.
 | |
| 				return p.Next()
 | |
| 			}
 | |
| 		}
 | |
| 		return p.entry, p.err
 | |
| 	}
 | |
| 
 | |
| 	p.entry, p.err = p.parser.Next()
 | |
| 	if p.err != nil {
 | |
| 		if errors.Is(p.err, io.EOF) && p.processNHCB() {
 | |
| 			return EntryHistogram, nil
 | |
| 		}
 | |
| 		return EntryInvalid, p.err
 | |
| 	}
 | |
| 	switch p.entry {
 | |
| 	case EntrySeries:
 | |
| 		p.bytes, p.ts, p.value = p.parser.Series()
 | |
| 		p.metricString = p.parser.Metric(&p.lset)
 | |
| 		// Check the label set to see if we can continue or need to emit the NHCB.
 | |
| 		var isNHCB bool
 | |
| 		if p.compareLabels() {
 | |
| 			// Labels differ. Check if we can emit the NHCB.
 | |
| 			if p.processNHCB() {
 | |
| 				return EntryHistogram, nil
 | |
| 			}
 | |
| 			isNHCB = p.handleClassicHistogramSeries(p.lset)
 | |
| 		} else {
 | |
| 			// Labels are the same. Check if after an exponential histogram.
 | |
| 			if p.lastHistogramExponential {
 | |
| 				isNHCB = false
 | |
| 			} else {
 | |
| 				isNHCB = p.handleClassicHistogramSeries(p.lset)
 | |
| 			}
 | |
| 		}
 | |
| 		if isNHCB && !p.keepClassicHistograms {
 | |
| 			// Do not return the classic histogram series if it was converted to NHCB and we are not keeping classic histograms.
 | |
| 			return p.Next()
 | |
| 		}
 | |
| 		return p.entry, p.err
 | |
| 	case EntryHistogram:
 | |
| 		p.bytes, p.ts, p.h, p.fh = p.parser.Histogram()
 | |
| 		p.metricString = p.parser.Metric(&p.lset)
 | |
| 		p.storeExponentialLabels()
 | |
| 	case EntryType:
 | |
| 		p.bName, p.typ = p.parser.Type()
 | |
| 	}
 | |
| 	if p.processNHCB() {
 | |
| 		return EntryHistogram, nil
 | |
| 	}
 | |
| 	return p.entry, p.err
 | |
| }
 | |
| 
 | |
| // Return true if labels have changed and we should emit the NHCB.
 | |
| func (p *NHCBParser) compareLabels() bool {
 | |
| 	if p.state != stateCollecting {
 | |
| 		return false
 | |
| 	}
 | |
| 	if p.typ != model.MetricTypeHistogram {
 | |
| 		// Different metric type.
 | |
| 		return true
 | |
| 	}
 | |
| 	if p.lastHistogramName != convertnhcb.GetHistogramMetricBaseName(p.lset.Get(labels.MetricName)) {
 | |
| 		// Different metric name.
 | |
| 		return true
 | |
| 	}
 | |
| 	nextHash, _ := p.lset.HashWithoutLabels(p.hBuffer, labels.BucketLabel)
 | |
| 	// Different label values.
 | |
| 	return p.lastHistogramLabelsHash != nextHash
 | |
| }
 | |
| 
 | |
| // Save the label set of the classic histogram without suffix and bucket `le` label.
 | |
| func (p *NHCBParser) storeClassicLabels() {
 | |
| 	p.lastHistogramName = convertnhcb.GetHistogramMetricBaseName(p.lset.Get(labels.MetricName))
 | |
| 	p.lastHistogramLabelsHash, _ = p.lset.HashWithoutLabels(p.hBuffer, labels.BucketLabel)
 | |
| 	p.lastHistogramExponential = false
 | |
| }
 | |
| 
 | |
| func (p *NHCBParser) storeExponentialLabels() {
 | |
| 	p.lastHistogramName = p.lset.Get(labels.MetricName)
 | |
| 	p.lastHistogramLabelsHash, _ = p.lset.HashWithoutLabels(p.hBuffer)
 | |
| 	p.lastHistogramExponential = true
 | |
| }
 | |
| 
 | |
| // handleClassicHistogramSeries collates the classic histogram series to be converted to NHCB
 | |
| // if it is actually a classic histogram series (and not a normal float series) and if there
 | |
| // isn't already a native histogram with the same name (assuming it is always processed
 | |
| // right before the classic histograms) and returns true if the collation was done.
 | |
| func (p *NHCBParser) handleClassicHistogramSeries(lset labels.Labels) bool {
 | |
| 	if p.typ != model.MetricTypeHistogram {
 | |
| 		return false
 | |
| 	}
 | |
| 	mName := lset.Get(labels.MetricName)
 | |
| 	// Sanity check to ensure that the TYPE metadata entry name is the same as the base name.
 | |
| 	if convertnhcb.GetHistogramMetricBaseName(mName) != string(p.bName) {
 | |
| 		return false
 | |
| 	}
 | |
| 	switch {
 | |
| 	case strings.HasSuffix(mName, "_bucket") && lset.Has(labels.BucketLabel):
 | |
| 		le, err := strconv.ParseFloat(lset.Get(labels.BucketLabel), 64)
 | |
| 		if err == nil && !math.IsNaN(le) {
 | |
| 			p.processClassicHistogramSeries(lset, "_bucket", func(hist *convertnhcb.TempHistogram) {
 | |
| 				hist.BucketCounts[le] = p.value
 | |
| 			})
 | |
| 			return true
 | |
| 		}
 | |
| 	case strings.HasSuffix(mName, "_count"):
 | |
| 		p.processClassicHistogramSeries(lset, "_count", func(hist *convertnhcb.TempHistogram) {
 | |
| 			hist.Count = p.value
 | |
| 		})
 | |
| 		return true
 | |
| 	case strings.HasSuffix(mName, "_sum"):
 | |
| 		p.processClassicHistogramSeries(lset, "_sum", func(hist *convertnhcb.TempHistogram) {
 | |
| 			hist.Sum = p.value
 | |
| 		})
 | |
| 		return true
 | |
| 	}
 | |
| 	return false
 | |
| }
 | |
| 
 | |
| func (p *NHCBParser) processClassicHistogramSeries(lset labels.Labels, suffix string, updateHist func(*convertnhcb.TempHistogram)) {
 | |
| 	if p.state != stateCollecting {
 | |
| 		p.storeClassicLabels()
 | |
| 		p.tempCT = p.parser.CreatedTimestamp()
 | |
| 		p.state = stateCollecting
 | |
| 	}
 | |
| 	p.tempLsetNHCB = convertnhcb.GetHistogramMetricBase(lset, suffix)
 | |
| 	p.storeExemplars()
 | |
| 	updateHist(&p.tempNHCB)
 | |
| }
 | |
| 
 | |
| func (p *NHCBParser) storeExemplars() {
 | |
| 	for ex := p.nextExemplarPtr(); p.parser.Exemplar(ex); ex = p.nextExemplarPtr() {
 | |
| 		p.tempExemplarCount++
 | |
| 	}
 | |
| }
 | |
| 
 | |
| func (p *NHCBParser) nextExemplarPtr() *exemplar.Exemplar {
 | |
| 	switch {
 | |
| 	case p.tempExemplarCount == len(p.tempExemplars)-1:
 | |
| 		// Reuse the previously allocated exemplar, it was not filled up.
 | |
| 	case len(p.tempExemplars) == cap(p.tempExemplars):
 | |
| 		// Let the runtime grow the slice.
 | |
| 		p.tempExemplars = append(p.tempExemplars, exemplar.Exemplar{})
 | |
| 	default:
 | |
| 		// Take the next element into use.
 | |
| 		p.tempExemplars = p.tempExemplars[:len(p.tempExemplars)+1]
 | |
| 	}
 | |
| 	return &p.tempExemplars[len(p.tempExemplars)-1]
 | |
| }
 | |
| 
 | |
| func (p *NHCBParser) swapExemplars() {
 | |
| 	p.exemplars = p.tempExemplars[:p.tempExemplarCount]
 | |
| 	p.tempExemplars = p.tempExemplars[:0]
 | |
| 	p.tempExemplarCount = 0
 | |
| }
 | |
| 
 | |
| // processNHCB converts the collated classic histogram series to NHCB and caches the info
 | |
| // to be returned to callers. Retruns true if the conversion was successful.
 | |
| func (p *NHCBParser) processNHCB() bool {
 | |
| 	if p.state != stateCollecting {
 | |
| 		return false
 | |
| 	}
 | |
| 	ub := make([]float64, 0, len(p.tempNHCB.BucketCounts))
 | |
| 	for b := range p.tempNHCB.BucketCounts {
 | |
| 		ub = append(ub, b)
 | |
| 	}
 | |
| 	upperBounds, hBase := convertnhcb.ProcessUpperBoundsAndCreateBaseHistogram(ub, false)
 | |
| 	fhBase := hBase.ToFloat(nil)
 | |
| 	h, fh := convertnhcb.NewHistogram(p.tempNHCB, upperBounds, hBase, fhBase)
 | |
| 	if h != nil {
 | |
| 		if err := h.Validate(); err != nil {
 | |
| 			return false
 | |
| 		}
 | |
| 		p.hNHCB = h
 | |
| 		p.fhNHCB = nil
 | |
| 	} else if fh != nil {
 | |
| 		if err := fh.Validate(); err != nil {
 | |
| 			return false
 | |
| 		}
 | |
| 		p.hNHCB = nil
 | |
| 		p.fhNHCB = fh
 | |
| 	}
 | |
| 	p.metricStringNHCB = p.tempLsetNHCB.Get(labels.MetricName) + strings.ReplaceAll(p.tempLsetNHCB.DropMetricName().String(), ", ", ",")
 | |
| 	p.bytesNHCB = []byte(p.metricStringNHCB)
 | |
| 	p.lsetNHCB = p.tempLsetNHCB
 | |
| 	p.swapExemplars()
 | |
| 	p.ctNHCB = p.tempCT
 | |
| 	p.tempNHCB = convertnhcb.NewTempHistogram()
 | |
| 	p.state = stateEmitting
 | |
| 	p.tempCT = nil
 | |
| 	return true
 | |
| }
 |