mirror of https://github.com/prometheus/prometheus
Backfill: Use mmap to reuse parser code
Signed-off-by: Julien Pivotto <roidelapluie@inuits.eu>pull/8232/head
parent
b317b6ab9c
commit
82b5f1d8b1
|
@ -14,51 +14,18 @@
|
|||
package main
|
||||
|
||||
import (
|
||||
"bufio"
|
||||
"context"
|
||||
"io"
|
||||
"math"
|
||||
"os"
|
||||
|
||||
"github.com/go-kit/kit/log"
|
||||
"github.com/pkg/errors"
|
||||
"github.com/prometheus/common/expfmt"
|
||||
"github.com/prometheus/prometheus/pkg/labels"
|
||||
"github.com/prometheus/prometheus/pkg/textparse"
|
||||
"github.com/prometheus/prometheus/tsdb"
|
||||
tsdb_errors "github.com/prometheus/prometheus/tsdb/errors"
|
||||
)
|
||||
|
||||
// OpenMetricsParser implements textparse.Parser.
|
||||
type OpenMetricsParser struct {
|
||||
textparse.Parser
|
||||
s *bufio.Scanner
|
||||
}
|
||||
|
||||
// NewOpenMetricsParser returns an OpenMetricsParser reading from the provided reader.
|
||||
func NewOpenMetricsParser(r io.Reader) *OpenMetricsParser {
|
||||
return &OpenMetricsParser{s: bufio.NewScanner(r)}
|
||||
}
|
||||
|
||||
// Next advances the parser to the next sample. It returns io.EOF if no
|
||||
// more samples were read.
|
||||
func (p *OpenMetricsParser) Next() (textparse.Entry, error) {
|
||||
for p.s.Scan() {
|
||||
line := p.s.Bytes()
|
||||
line = append(line, '\n')
|
||||
|
||||
p.Parser = textparse.New(line, string(expfmt.FmtOpenMetrics))
|
||||
if et, err := p.Parser.Next(); err != io.EOF {
|
||||
return et, err
|
||||
}
|
||||
}
|
||||
|
||||
if err := p.s.Err(); err != nil {
|
||||
return 0, err
|
||||
}
|
||||
return 0, io.EOF
|
||||
}
|
||||
|
||||
func getMinAndMaxTimestamps(p textparse.Parser) (int64, int64, error) {
|
||||
var maxt, mint int64 = math.MinInt64, math.MaxInt64
|
||||
|
||||
|
@ -98,7 +65,7 @@ func getMinAndMaxTimestamps(p textparse.Parser) (int64, int64, error) {
|
|||
return maxt, mint, nil
|
||||
}
|
||||
|
||||
func createBlocks(input *os.File, mint, maxt int64, maxSamplesInAppender int, outputDir string) (returnErr error) {
|
||||
func createBlocks(input []byte, mint, maxt int64, maxSamplesInAppender int, outputDir string) (returnErr error) {
|
||||
blockDuration := tsdb.DefaultBlockDuration
|
||||
mint = blockDuration * (mint / blockDuration)
|
||||
|
||||
|
@ -120,12 +87,9 @@ func createBlocks(input *os.File, mint, maxt int64, maxSamplesInAppender int, ou
|
|||
err = tsdb_errors.NewMulti(err, w.Close()).Err()
|
||||
}()
|
||||
|
||||
if _, err := input.Seek(0, 0); err != nil {
|
||||
return errors.Wrap(err, "seek file")
|
||||
}
|
||||
ctx := context.Background()
|
||||
app := w.Appender(ctx)
|
||||
p := NewOpenMetricsParser(input)
|
||||
p := textparse.NewOpenMetricsParser(input)
|
||||
tsUpper := t + blockDuration
|
||||
samplesCount := 0
|
||||
for {
|
||||
|
@ -194,8 +158,8 @@ func createBlocks(input *os.File, mint, maxt int64, maxSamplesInAppender int, ou
|
|||
return nil
|
||||
}
|
||||
|
||||
func backfill(maxSamplesInAppender int, input *os.File, outputDir string) (err error) {
|
||||
p := NewOpenMetricsParser(input)
|
||||
func backfill(maxSamplesInAppender int, input []byte, outputDir string) (err error) {
|
||||
p := textparse.NewOpenMetricsParser(input)
|
||||
maxt, mint, err := getMinAndMaxTimestamps(p)
|
||||
if err != nil {
|
||||
return errors.Wrap(err, "getting min and max timestamp")
|
||||
|
|
|
@ -33,17 +33,6 @@ type backfillSample struct {
|
|||
Labels labels.Labels
|
||||
}
|
||||
|
||||
func createTemporaryOpenMetricsFile(t *testing.T, text string) string {
|
||||
newf, err := ioutil.TempFile("", "")
|
||||
require.NoError(t, err)
|
||||
|
||||
_, err = newf.WriteString(text)
|
||||
require.NoError(t, err)
|
||||
require.NoError(t, newf.Close())
|
||||
|
||||
return newf.Name()
|
||||
}
|
||||
|
||||
func sortSamples(samples []backfillSample) {
|
||||
sort.Slice(samples, func(x, y int) bool {
|
||||
sx, sy := samples[x], samples[y]
|
||||
|
@ -329,6 +318,30 @@ http_requests_total{code="400"} 1 1565166113.989
|
|||
},
|
||||
},
|
||||
},
|
||||
{
|
||||
ToParse: `no_newline_after_eof 42 6900
|
||||
# EOF`,
|
||||
IsOk: true,
|
||||
Description: "Sample without newline after # EOF.",
|
||||
MaxSamplesInAppender: 5000,
|
||||
Expected: struct {
|
||||
MinTime int64
|
||||
MaxTime int64
|
||||
NumBlocks int
|
||||
Samples []backfillSample
|
||||
}{
|
||||
MinTime: 6900000,
|
||||
MaxTime: 6900000,
|
||||
NumBlocks: 1,
|
||||
Samples: []backfillSample{
|
||||
{
|
||||
Timestamp: 6900000,
|
||||
Value: 42,
|
||||
Labels: labels.FromStrings("__name__", "no_newline_after_eof"),
|
||||
},
|
||||
},
|
||||
},
|
||||
},
|
||||
{
|
||||
ToParse: `bare_metric 42.24 1001
|
||||
# EOF
|
||||
|
@ -382,24 +395,35 @@ no_nl{type="no newline"}
|
|||
IsOk: false,
|
||||
Description: "No newline.",
|
||||
},
|
||||
{
|
||||
ToParse: `# HELP no_eof This test has no EOF so will fail
|
||||
# TYPE no_eof gauge
|
||||
no_eof 1 1
|
||||
`,
|
||||
IsOk: false,
|
||||
Description: "No EOF.",
|
||||
},
|
||||
{
|
||||
ToParse: `# HELP after_eof There is data after EOF.
|
||||
# TYPE after_eof gauge
|
||||
after_eof 1 1
|
||||
# EOF
|
||||
after_eof 1 2
|
||||
`,
|
||||
IsOk: false,
|
||||
Description: "Data after EOF.",
|
||||
},
|
||||
}
|
||||
for _, test := range tests {
|
||||
t.Logf("Test:%s", test.Description)
|
||||
|
||||
openMetricsFile := createTemporaryOpenMetricsFile(t, test.ToParse)
|
||||
input, err := os.Open(openMetricsFile)
|
||||
require.NoError(t, err)
|
||||
defer func() {
|
||||
require.NoError(t, input.Close())
|
||||
}()
|
||||
|
||||
outputDir, err := ioutil.TempDir("", "myDir")
|
||||
require.NoError(t, err)
|
||||
defer func() {
|
||||
require.NoError(t, os.RemoveAll(outputDir))
|
||||
}()
|
||||
|
||||
err = backfill(test.MaxSamplesInAppender, input, outputDir)
|
||||
err = backfill(test.MaxSamplesInAppender, []byte(test.ToParse), outputDir)
|
||||
|
||||
if !test.IsOk {
|
||||
require.Error(t, err, test.Description)
|
||||
|
|
|
@ -39,6 +39,7 @@ import (
|
|||
"github.com/prometheus/prometheus/tsdb"
|
||||
"github.com/prometheus/prometheus/tsdb/chunks"
|
||||
tsdb_errors "github.com/prometheus/prometheus/tsdb/errors"
|
||||
"github.com/prometheus/prometheus/tsdb/fileutil"
|
||||
)
|
||||
|
||||
const timeDelta = 30000
|
||||
|
@ -615,12 +616,12 @@ func checkErr(err error) int {
|
|||
}
|
||||
|
||||
func backfillOpenMetrics(path string, outputDir string) (err error) {
|
||||
input, err := os.Open(path)
|
||||
inputFile, err := fileutil.OpenMmapFile(path)
|
||||
if err != nil {
|
||||
return err
|
||||
}
|
||||
defer func() {
|
||||
input.Close()
|
||||
inputFile.Close()
|
||||
}()
|
||||
return backfill(5000, input, outputDir)
|
||||
return backfill(5000, inputFile.Bytes(), outputDir)
|
||||
}
|
||||
|
|
Loading…
Reference in New Issue