prometheus/head.go

package tsdb

import (
	"errors"
	"math"
	"sort"
	"sync"
	"time"

	"github.com/bradfitz/slice"
	"github.com/fabxc/tsdb/chunks"
	"github.com/fabxc/tsdb/labels"
	"github.com/go-kit/kit/log"
)

// HeadBlock handles reads and writes of time series data within a time window.
// It keeps one chunk per series in memory, indexes series by label hash,
// label values and postings, and logs appended data to a write-ahead log.
type HeadBlock struct {
	// mtx guards descs, hashes, values and postings. Readers take it shared;
	// appendBatch takes it exclusively while creating new series.
	mtx sync.RWMutex
	// d is the directory the block was opened with. It is also the directory
	// handed to OpenWAL.
	d   string

	// descs holds all chunk descs for the head block. Each chunk implicitly
	// is assigned the index as its ID.
	descs []*chunkDesc
	// mapper maps a series ID to its position in a list of all series
	// ordered by label set. It is only refreshed by updateMapping, which
	// rebuilds it when its length no longer matches len(descs).
	mapper *positionMapper
	// hashes contains a collision map of label set hashes of chunks
	// to their chunk descs.
	hashes map[uint64][]*chunkDesc

	values   map[string]stringset // label names to possible values
	postings *memPostings         // postings lists for terms

	// wal is the write-ahead log that appendBatch writes to before applying
	// a batch in memory and that OpenHeadBlock replays.
	wal *WAL

	// bstats holds the block's aggregate statistics. It carries its own
	// mutex (bstats.mtx), separate from mtx above.
	bstats *BlockStats
}

// OpenHeadBlock opens the head block stored in dir.
//
// It opens the write-ahead log in dir and replays every series and sample
// found in it, rebuilding the in-memory chunks, the index structures and the
// block statistics. For a directory without WAL content the returned block is
// empty. The position mapping is computed once after the replay.
//
// An error is returned if the WAL cannot be opened or replayed. In the latter
// case the WAL is closed again before returning so its resources do not leak.
func OpenHeadBlock(dir string, l log.Logger) (*HeadBlock, error) {
	// NOTE(review): the 15s argument is presumably the WAL's periodic flush
	// interval — confirm against OpenWAL.
	wal, err := OpenWAL(dir, log.NewContext(l).With("component", "wal"), 15*time.Second)
	if err != nil {
		return nil, err
	}

	b := &HeadBlock{
		d:        dir,
		descs:    []*chunkDesc{},
		hashes:   map[uint64][]*chunkDesc{},
		values:   map[string]stringset{},
		postings: &memPostings{m: make(map[term][]uint32)},
		wal:      wal,
		mapper:   newPositionMapper(nil),
	}
	// Start with an inverted interval so that the first replayed or appended
	// sample sets both bounds.
	b.bstats = &BlockStats{
		MinTime: math.MaxInt64,
		MaxTime: math.MinInt64,
	}

	err = wal.ReadAll(&walHandler{
		series: func(lset labels.Labels) {
			b.create(lset.Hash(), lset)

			// Mirror the accounting appendBatch does for new series so
			// that a reopened block reports the same counts as before.
			b.bstats.SeriesCount++
			b.bstats.ChunkCount++ // head block has one chunk/series
		},
		sample: func(s hashedSample) {
			// s.ref indexes descs directly; a reference to a series that
			// was not replayed before panics here.
			cd := b.descs[s.ref]

			// Duplicated from appendBatch – TODO(fabxc): deduplicate?
			if cd.lastTimestamp == s.t && cd.lastValue != s.v {
				return
			}
			cd.append(s.t, s.v)

			if s.t > b.bstats.MaxTime {
				b.bstats.MaxTime = s.t
			}
			if s.t < b.bstats.MinTime {
				b.bstats.MinTime = s.t
			}
			b.bstats.SampleCount++
		},
	})
	if err != nil {
		// The replay error is the one worth reporting; closing is only done
		// to release the WAL's resources, so its own error is dropped.
		_ = wal.Close()
		return nil, err
	}

	b.updateMapping()

	return b, nil
}

// Close releases the head block's underlying resources by closing its
// write-ahead log. The error of that close, if any, is returned.
func (h *HeadBlock) Close() error {
	err := h.wal.Close()
	return err
}

// dir returns the directory the head block was opened with.
func (h *HeadBlock) dir() string {
	return h.d
}

// persisted reports whether the block is persisted; a head block never is.
func (h *HeadBlock) persisted() bool {
	return false
}

// index returns the head block itself as the reader for its index.
func (h *HeadBlock) index() IndexReader {
	return h
}

// series returns the head block itself as the reader for its series data.
func (h *HeadBlock) series() SeriesReader {
	return h
}

// stats returns a copy of the block statistics, taken while holding the
// statistics' read lock.
func (h *HeadBlock) stats() BlockStats {
	st := h.bstats

	st.mtx.RLock()
	defer st.mtx.RUnlock()

	return *st
}

// Chunk looks up the chunk of the series with the given reference.
// It returns errNotFound if no series with that reference exists.
func (h *HeadBlock) Chunk(ref uint32) (chunks.Chunk, error) {
	h.mtx.RLock()
	defer h.mtx.RUnlock()

	idx := int(ref)
	if idx < len(h.descs) {
		return h.descs[idx].chunk, nil
	}
	return nil, errNotFound
}

// interval returns the minimum and maximum sample timestamp recorded in the
// block statistics.
//
// The values are read under the statistics' read lock because appendBatch
// updates them concurrently under the corresponding write lock.
func (h *HeadBlock) interval() (int64, int64) {
	h.bstats.mtx.RLock()
	defer h.bstats.mtx.RUnlock()

	return h.bstats.MinTime, h.bstats.MaxTime
}

// Stats returns statistics about the indexed data.
//
// The copy is taken under the statistics' read lock because appendBatch
// updates the counters concurrently under the corresponding write lock.
// The returned error is always nil.
func (h *HeadBlock) Stats() (BlockStats, error) {
	h.bstats.mtx.RLock()
	defer h.bstats.mtx.RUnlock()

	return *h.bstats, nil
}

// LabelValues returns the known values of a label name as sorted
// one-element tuples. Exactly one name must be given; any other number of
// names yields errInvalidSize.
func (h *HeadBlock) LabelValues(names ...string) (StringTuples, error) {
	h.mtx.RLock()
	defer h.mtx.RUnlock()

	if n := len(names); n != 1 {
		return nil, errInvalidSize
	}
	name := names[0]

	// Collect the value set into a slice; it stays nil if the name is unknown.
	var vals []string
	for v := range h.values[name] {
		vals = append(vals, v)
	}
	sort.Strings(vals)

	tuples := &stringTuples{l: len(names), s: vals}
	return tuples, nil
}

// Postings returns the postings list for the term made up of the given
// label name and value. The returned error is always nil.
func (h *HeadBlock) Postings(name, value string) (Postings, error) {
	h.mtx.RLock()
	defer h.mtx.RUnlock()

	t := term{name: name, value: value}
	return h.postings.get(t), nil
}

// Series returns the label set of the series with the given reference along
// with the meta data of its single head chunk. The chunk meta carries the
// series' first and last timestamp and the reference itself.
// It returns errNotFound if no series with that reference exists.
func (h *HeadBlock) Series(ref uint32) (labels.Labels, []ChunkMeta, error) {
	h.mtx.RLock()
	defer h.mtx.RUnlock()

	idx := int(ref)
	if idx >= len(h.descs) {
		return nil, nil, errNotFound
	}
	desc := h.descs[idx]

	metas := []ChunkMeta{{
		MinTime: desc.firstTimestamp,
		MaxTime: desc.lastTimestamp,
		Ref:     ref,
	}}
	return desc.lset, metas, nil
}

// LabelIndices returns one single-element name list per label name that has
// values recorded in the head block. The result follows map iteration order
// and is therefore not sorted. The returned error is always nil.
func (h *HeadBlock) LabelIndices() ([][]string, error) {
	h.mtx.RLock()
	defer h.mtx.RUnlock()

	indices := make([][]string, 0, len(h.values))
	for name := range h.values {
		indices = append(indices, []string{name})
	}
	return indices, nil
}

// get looks up the chunk desc of the series with the given label set.
// The hash selects the bucket of candidates; the label sets are compared to
// tell apart series whose hashes collide. It returns nil if the series does
// not exist. The method takes no lock itself.
func (h *HeadBlock) get(hash uint64, lset labels.Labels) *chunkDesc {
	candidates := h.hashes[hash]

	for i := range candidates {
		if c := candidates[i]; c.lset.Equals(lset) {
			return c
		}
	}
	return nil
}

// create adds a new series with the given label set to the head block and
// returns its chunk desc. The series gets a fresh XOR chunk, the next free
// index in descs as its reference, and is registered in the hash map, the
// label value sets and the postings lists. It does not check whether the
// series already exists and takes no lock itself.
func (h *HeadBlock) create(hash uint64, lset labels.Labels) *chunkDesc {
	desc := &chunkDesc{
		lset:          lset,
		chunk:         chunks.NewXORChunk(),
		lastTimestamp: math.MinInt64,
	}

	app, err := desc.chunk.Appender()
	if err != nil {
		// Getting an Appender for a new chunk must not fail.
		panic(err)
	}
	desc.app = app

	// The position in descs doubles as the series reference.
	desc.ref = uint32(len(h.descs))
	h.descs = append(h.descs, desc)

	bucket := h.hashes[hash]
	h.hashes[hash] = append(bucket, desc)

	// Index every label pair: record the value under its name and add the
	// series to the pair's postings list.
	for _, lbl := range lset {
		vals, found := h.values[lbl.Name]
		if !found {
			vals = stringset{}
			h.values[lbl.Name] = vals
		}
		vals.set(lbl.Value)

		h.postings.add(desc.ref, term{name: lbl.Name, value: lbl.Value})
	}

	// The empty term's postings list receives every series.
	h.postings.add(desc.ref, term{})

	return desc
}

var (
	// ErrOutOfOrderSample is returned if an appended sample has a
	// timestamp smaller than the most recent sample of its series.
	ErrOutOfOrderSample = errors.New("out of order sample")

	// ErrAmendSample is returned if an appended sample has the same timestamp
	// as the most recent sample but a different value.
	ErrAmendSample = errors.New("amending sample")
)

// appendBatch appends a batch of samples to the head block.
//
// It proceeds in four steps:
//
//  1. Resolve every sample to its series. Samples of known series get the
//     series' reference; samples of unknown series get a batch-relative
//     reference into newSeries.
//  2. Log the new series and all samples to the WAL.
//  3. Create the new series under the write lock and rebase the
//     batch-relative references onto their final position in descs.
//  4. Append the samples to their chunks and update the block statistics.
//
// The ref field of the passed samples is overwritten in the process. That
// also holds for the samples visited before an error is returned.
//
// It returns ErrOutOfOrderSample or ErrAmendSample if a sample conflicts with
// the most recent sample of an existing series, and the WAL's error if
// logging fails. In all of these cases nothing is appended in memory.
func (h *HeadBlock) appendBatch(samples []hashedSample) error {
	// Find head chunks for all samples and allocate new IDs/refs for
	// ones we haven't seen before.
	var (
		newSeries    []labels.Labels
		newSamples   []*hashedSample
		newHashes    []uint64
		uniqueHashes = map[uint64]uint32{}
	)
	h.mtx.RLock()
	defer h.mtx.RUnlock()

	for i := range samples {
		s := &samples[i]

		cd := h.get(s.hash, s.labels)
		if cd != nil {
			// Samples must only occur in order.
			if s.t < cd.lastTimestamp {
				return ErrOutOfOrderSample
			}
			if cd.lastTimestamp == s.t && cd.lastValue != s.v {
				return ErrAmendSample
			}
			// TODO(fabxc): sample refs are only scoped within a block for
			// now and we ignore any previously set value
			s.ref = cd.ref
			continue
		}

		// There may be several samples for a new series in a batch.
		// We don't want to reserve a new space for each.
		if ref, ok := uniqueHashes[s.hash]; ok {
			s.ref = ref
			// The ref is still relative to this batch. Track the sample so
			// it is rebased together with the first one of its series;
			// otherwise it would be appended to an unrelated series.
			newSamples = append(newSamples, s)
			continue
		}
		s.ref = uint32(len(newSeries))
		uniqueHashes[s.hash] = s.ref

		newSeries = append(newSeries, s.labels)
		newHashes = append(newHashes, s.hash)
		newSamples = append(newSamples, s)
	}

	// Write all new series and samples to the WAL and add it to the
	// in-mem database on success.
	if err := h.wal.Log(newSeries, samples); err != nil {
		return err
	}

	// After the samples were successfully written to the WAL, there may
	// be no further failures.
	if len(newSeries) > 0 {
		// RWMutex cannot be upgraded in place: give up the read lock, take
		// the write lock, and re-take the read lock afterwards so that the
		// deferred RUnlock above stays balanced.
		h.mtx.RUnlock()
		h.mtx.Lock()

		base := len(h.descs)

		for i, s := range newSeries {
			h.create(newHashes[i], s)
		}
		// Turn the batch-relative refs into positions in descs.
		for _, s := range newSamples {
			s.ref = uint32(base) + s.ref
		}

		h.mtx.Unlock()
		h.mtx.RLock()
	}

	var (
		total = uint64(len(samples))
		mint  = int64(math.MaxInt64)
		maxt  = int64(math.MinInt64)
	)
	for _, s := range samples {
		cd := h.descs[s.ref]
		// Drop a sample that carries the timestamp of the series' latest
		// sample but a different value.
		if cd.lastTimestamp == s.t && cd.lastValue != s.v {
			total--
			continue
		}
		cd.append(s.t, s.v)

		if mint > s.t {
			mint = s.t
		}
		if maxt < s.t {
			maxt = s.t
		}
	}

	h.bstats.mtx.Lock()
	defer h.bstats.mtx.Unlock()

	h.bstats.SampleCount += total
	h.bstats.SeriesCount += uint64(len(newSeries))
	h.bstats.ChunkCount += uint64(len(newSeries)) // head block has one chunk/series

	if mint < h.bstats.MinTime {
		h.bstats.MinTime = mint
	}
	if maxt > h.bstats.MaxTime {
		h.bstats.MaxTime = maxt
	}

	return nil
}

// fullness relates the number of samples per series to a target of 250:
// it returns SampleCount / (SeriesCount + 1) / 250, read under the
// statistics' read lock. The +1 keeps the division defined for a block
// without series.
func (h *HeadBlock) fullness() float64 {
	st := h.bstats

	st.mtx.RLock()
	defer st.mtx.RUnlock()

	samples := float64(st.SampleCount)
	series := float64(st.SeriesCount + 1)

	return samples / series / 250
}

// updateMapping rebuilds the position mapper from the current series.
// It is a no-op if the mapper was built before and still covers as many
// entries as there are series. Otherwise a copy of descs is sorted by label
// set through the mapper, which records the resulting positions.
// The mapper's write lock is held throughout; h.mtx is not taken here.
func (h *HeadBlock) updateMapping() {
	pm := h.mapper

	pm.mtx.Lock()
	defer pm.mtx.Unlock()

	n := len(h.descs)
	if pm.sortable != nil && pm.Len() == n {
		return
	}

	// Sort a copy so that descs itself keeps its reference order.
	sorted := make([]*chunkDesc, n)
	copy(sorted, h.descs)

	byLabels := func(i, j int) bool {
		return labels.Compare(sorted[i].lset, sorted[j].lset) < 0
	}
	pm.update(slice.SortInterface(sorted, byLabels))
}

// remapPostings changes the order of the postings from their ID to the ordering
// of the series they reference.
// Returned postings have no longer monotonic IDs and MUST NOT be used for regular
// postings set operations, i.e. intersect and merge.
//
// The input is expanded into a list first; if that fails, postings carrying
// the error are returned. The list is then ordered by the mapper's forward
// positions while holding the mapper's read lock. Every ID in the list is
// used as an index into the mapping, so an ID the mapping does not cover
// panics.
func (h *HeadBlock) remapPostings(p Postings) Postings {
	list, err := expandPostings(p)
	if err != nil {
		return errPostings{err: err}
	}

	h.mapper.mtx.RLock()
	defer h.mapper.mtx.RUnlock()

	// A single pass suffices: positionMapper.Sort already orders the list by
	// forward position, so sorting again by the same key changes nothing.
	h.mapper.Sort(list)

	return newListPostings(list)
}

// positionMapper stores a position mapping from unsorted to
// sorted indices of a sortable collection.
//
// It implements sort.Interface on top of the wrapped collection: sorting the
// mapper sorts the collection and tracks where each element ends up.
type positionMapper struct {
	// mtx is taken by the users of the mapper (HeadBlock.updateMapping and
	// HeadBlock.remapPostings); the mapper's own methods do not lock.
	mtx      sync.RWMutex
	// sortable is the wrapped collection. It is nil until update is called.
	sortable sort.Interface
	// After update, iv[i] is the original index of the element at sorted
	// position i, and fw[k] is the sorted position of the element that was
	// originally at index k.
	iv, fw   []int
}

// newPositionMapper returns a position mapper for s. If s is nil the mapper
// is returned without any mapping and has to be filled through update later.
func newPositionMapper(s sort.Interface) *positionMapper {
	m := new(positionMapper)
	if s == nil {
		return m
	}
	m.update(s)
	return m
}

// Len returns the length of the wrapped collection.
func (m *positionMapper) Len() int {
	return m.sortable.Len()
}

// Less reports the wrapped collection's ordering of elements i and j.
func (m *positionMapper) Less(i, j int) bool {
	return m.sortable.Less(i, j)
}

// Swap exchanges elements i and j of the wrapped collection and applies the
// same exchange to iv, so that iv keeps tracking each element's original
// index.
func (m *positionMapper) Swap(i, j int) {
	m.sortable.Swap(i, j)

	iv := m.iv
	iv[i], iv[j] = iv[j], iv[i]
}

// Sort orders l in place by the forward (sorted) position of its entries.
// Every entry of l is used as an index into fw.
func (m *positionMapper) Sort(l []uint32) {
	pos := m.fw

	byPosition := func(a, b int) bool {
		return pos[l[a]] < pos[l[b]]
	}
	slice.Sort(l, byPosition)
}

// update replaces the wrapped collection with s, sorts it, and recomputes
// both mappings: iv from sorted position to original index, and fw from
// original index to sorted position.
func (m *positionMapper) update(s sort.Interface) {
	n := s.Len()

	m.sortable = s
	m.iv = make([]int, n)
	m.fw = make([]int, n)

	// Start from the identity; Swap permutes iv along with the collection.
	for i := 0; i < n; i++ {
		m.iv[i] = i
	}
	sort.Sort(m)

	// Invert iv to obtain the forward mapping.
	for pos, orig := range m.iv {
		m.fw[orig] = pos
	}
}
-												Add new interfaces and skeleton

											
										
										
											8 years ago
+								package tsdb
 								import (
-												Modify IndexReader API to accommodate compaction

This changes the IndexReader API to expose plain labels
and chunk meta information instead of a Series interface.
Dropping of irrelevant chunks is moved into the querier.

A LabelIndices method is added to query for existing label
value indices.

											
										
										
											8 years ago
+									"errors"
-												Fix last timestamp initialization

This initializes the chunkDesc's last timestamp to the minimum
value so initial samples with a timestamp of 0 (e.g. in tests)
are not accidentally dropped.

											
										
										
											8 years ago
+									"math"
-												Misc fixes for initial Prometheus integration

											
										
										
											8 years ago
+									"sort"
-												Add new interfaces and skeleton

											
										
										
											8 years ago
+									"sync"
-												Periodically fsync WAL, make head cut async

											
										
										
											8 years ago
+									"time"
-												Add new interfaces and skeleton

											
										
										
											8 years ago
-												Add postings wrapper that emits head postings in label set order

This adds a position mapper that takes series from a head block
in the order they were appended and creates a mapping representing
them in order of their label sets.

Write-repair of the postings list would cause very expensive writing.
Hence, we keep them as they are and only apply the position mapping
at the very end, after a postings list has been sufficiently reduced
through intersections etc.

											
										
										
											8 years ago
+									"github.com/bradfitz/slice"
-												Add new interfaces and skeleton

											
										
										
											8 years ago
+									"github.com/fabxc/tsdb/chunks"
-												Extract labels package

											
										
										
											8 years ago
+									"github.com/fabxc/tsdb/labels"
-												Periodically fsync WAL, make head cut async

											
										
										
											8 years ago
+									"github.com/go-kit/kit/log"
-												Add new interfaces and skeleton

											
										
										
											8 years ago
+								)
 								// HeadBlock handles reads and writes of time series data within a time window.
 								type HeadBlock struct {
-												Consolidate mem index into HeadBlock

											
										
										
											8 years ago
+									mtx sync.RWMutex
-												Lock mmapped files

											
										
										
											8 years ago
+									d   string
-												Consolidate mem index into HeadBlock

											
										
										
											8 years ago
 									// descs holds all chunk descs for the head block. Each chunk implicitly
 									// is assigned the index as its ID.
 									descs []*chunkDesc
-												Add postings wrapper that emits head postings in label set order

This adds a position mapper that takes series from a head block
in the order they were appended and creates a mapping representing
them in order of their label sets.

Write-repair of the postings list would cause very expensive writing.
Hence, we keep them as they are and only apply the position mapping
at the very end, after a postings list has been sufficiently reduced
through intersections etc.

											
										
										
											8 years ago
+									// mapping maps a series ID to its position in an ordered list
 									// of all series. The orderDirty flag indicates that it has gone stale.
 									mapper *positionMapper
-												Consolidate mem index into HeadBlock

											
										
										
											8 years ago
+									// hashes contains a collision map of label set hashes of chunks
-												Remove double-reference in chunk hashmap

											
										
										
											8 years ago
+									// to their chunk descs.
 									hashes map[uint64][]*chunkDesc
-												Consolidate mem index into HeadBlock

											
										
										
											8 years ago
 									values   map[string]stringset // label names to possible values
 									postings *memPostings         // postings lists for terms
-												Bucket samples before appending.

This pre-sorts samples into buckets before appending them to reduce
locking of shards.

											
										
										
											8 years ago
-												Add initial WAL writing

											
										
										
											8 years ago
+									wal *WAL
-												Fix races

											
										
										
											8 years ago
+									bstats *BlockStats
-												Add new interfaces and skeleton

											
										
										
											8 years ago
+								}
-												Rename to OpenHeadBlock

											
										
										
											8 years ago
+								// OpenHeadBlock creates a new empty head block.
-												Periodically fsync WAL, make head cut async

											
										
										
											8 years ago
+								func OpenHeadBlock(dir string, l log.Logger) (*HeadBlock, error) {
 									wal, err := OpenWAL(dir, log.NewContext(l).With("component", "wal"), 15*time.Second)
-												Add initial WAL writing

											
										
										
											8 years ago
+									if err != nil {
 										return nil, err
 									}
-												Add stats serialization, load querier of all blocks

											
										
										
											8 years ago
+									b := &HeadBlock{
-												Lock mmapped files

											
										
										
											8 years ago
+										d:        dir,
-												Consolidate mem index into HeadBlock

											
										
										
											8 years ago
+										descs:    []*chunkDesc{},
-												Remove double-reference in chunk hashmap

											
										
										
											8 years ago
+										hashes:   map[uint64][]*chunkDesc{},
-												Consolidate mem index into HeadBlock

											
										
										
											8 years ago
+										values:   map[string]stringset{},
 										postings: &memPostings{m: make(map[term][]uint32)},
-												Add initial WAL writing

											
										
										
											8 years ago
+										wal:      wal,
-												Don't update head postings mapper on every append

											
										
										
											8 years ago
+										mapper:   newPositionMapper(nil),
-												Move sub-indexes into single index structure

											
										
										
											8 years ago
+									}
-												Fix races

											
										
										
											8 years ago
+									b.bstats = &BlockStats{
 										MinTime: math.MaxInt64,
 										MaxTime: math.MinInt64,
 									}
-												Handle compaction trigger and reinitializing in DB

											
										
										
											8 years ago
-												Add WAL decoder+loading and benchmarks

											
										
										
											8 years ago
+									err = wal.ReadAll(&walHandler{
 										series: func(lset labels.Labels) {
 											b.create(lset.Hash(), lset)
 										},
 										sample: func(s hashedSample) {
-												Switch to sequential block names

This changes block directory names from the int64 timestamp
to sequential numbering.

											
										
										
											8 years ago
+											cd := b.descs[s.ref]
 											// Duplicated from appendBatch – TODO(fabxc): deduplicate?
 											if cd.lastTimestamp == s.t && cd.lastValue != s.v {
 												return
 											}
 											cd.append(s.t, s.v)
 											if s.t > b.bstats.MaxTime {
 												b.bstats.MaxTime = s.t
 											}
 											if s.t < b.bstats.MinTime {
 												b.bstats.MinTime = s.t
 											}
-												Consolidate persistence and compaction

											
										
										
											8 years ago
+											b.bstats.SampleCount++
-												Add WAL decoder+loading and benchmarks

											
										
										
											8 years ago
+										},
 									})
 									if err != nil {
 										return nil, err
 									}
-												Don't update head postings mapper on every append

											
										
										
											8 years ago
+									b.updateMapping()
-												Add postings wrapper that emits head postings in label set order

This adds a position mapper that takes series from a head block
in the order they were appended and creates a mapping representing
them in order of their label sets.

Write-repair of the postings list would cause very expensive writing.
Hence, we keep them as they are and only apply the postition mapping
at the very end, after a postings list has been sufficienctly reduced
through intersections etc.

											
										
										
											8 years ago
-												Add initial WAL writing

											
										
										
											8 years ago
+									return b, nil
 								}
 								// Close syncs all data and closes underlying resources of the head block.
 								func (h *HeadBlock) Close() error {
 									return h.wal.Close()
-												Move sub-indexes into single index structure

											
										
										
											8 years ago
+								}
-												Lock mmapped files

											
										
										
											8 years ago
+								func (h *HeadBlock) dir() string          { return h.d }
-												Consolidate persistence and compaction

											
										
										
											8 years ago
+								func (h *HeadBlock) persisted() bool      { return false }
-												Lock mmapped files

											
										
										
											8 years ago
+								func (h *HeadBlock) index() IndexReader   { return h }
 								func (h *HeadBlock) series() SeriesReader { return h }
-												Fix head block stats races

											
										
										
											8 years ago
 								func (h *HeadBlock) stats() BlockStats {
 									h.bstats.mtx.RLock()
 									defer h.bstats.mtx.RUnlock()
 									return *h.bstats
 								}
-												Misc fixes for initial Prometheus integration

											
										
										
											8 years ago
-												Add stats serialization, load querier of all blocks

											
										
										
											8 years ago
+								// Chunk returns the chunk for the reference number.
-												Misc fixes for initial Prometheus integration

											
										
										
											8 years ago
+								func (h *HeadBlock) Chunk(ref uint32) (chunks.Chunk, error) {
-												Use separate lock for series creation

This uses the head block's own lock to only lock if new series were
encountered.
In the general append case we just need to hold a

											
										
										
											8 years ago
+									h.mtx.RLock()
 									defer h.mtx.RUnlock()
-												Consolidate mem index into HeadBlock

											
										
										
											8 years ago
+									if int(ref) >= len(h.descs) {
-												Misc fixes for initial Prometheus integration

											
										
										
											8 years ago
+										return nil, errNotFound
 									}
-												Consolidate mem index into HeadBlock

											
										
										
											8 years ago
+									return h.descs[int(ref)].chunk, nil
-												Misc fixes for initial Prometheus integration

											
										
										
											8 years ago
+								}
-												Add stats serialization, load querier of all blocks

											
										
										
											8 years ago
+								func (h *HeadBlock) interval() (int64, int64) {
-												Consolidate persistence and compaction

											
										
										
											8 years ago
+									return h.bstats.MinTime, h.bstats.MaxTime
-												Add stats serialization, load querier of all blocks

											
										
										
											8 years ago
+								}
-												Misc fixes for initial Prometheus integration

											
										
										
											8 years ago
+								// Stats returns statistics about the indexed data.
-												Add stats serialization, load querier of all blocks

											
										
										
											8 years ago
+								func (h *HeadBlock) Stats() (BlockStats, error) {
-												Fix races

											
										
										
											8 years ago
+									return *h.bstats, nil
-												Misc fixes for initial Prometheus integration

											
										
										
											8 years ago
+								}
 								// LabelValues returns the possible label values
 								func (h *HeadBlock) LabelValues(names ...string) (StringTuples, error) {
-												Use separate lock for series creation

This uses the head block's own lock to only lock if new series were
encountered.
In the general append case we just need to hold a

											
										
										
											8 years ago
+									h.mtx.RLock()
 									defer h.mtx.RUnlock()
-												Misc fixes for initial Prometheus integration

											
										
										
											8 years ago
+									if len(names) != 1 {
 										return nil, errInvalidSize
 									}
 									var sl []string
-												Consolidate mem index into HeadBlock

											
										
										
											8 years ago
+									for s := range h.values[names[0]] {
-												Misc fixes for initial Prometheus integration

											
										
										
											8 years ago
+										sl = append(sl, s)
 									}
 									sort.Strings(sl)
-												Add postings wrapper that emits head postings in label set order

This adds a position mapper that takes series from a head block
in the order they were appended and creates a mapping representing
them in order of their label sets.

Write-repair of the postings list would cause very expensive writing.
Hence, we keep them as they are and only apply the position mapping
at the very end, after a postings list has been sufficiently reduced
through intersections etc.

											
										
										
											8 years ago
+									return &stringTuples{l: len(names), s: sl}, nil
-												Misc fixes for initial Prometheus integration

											
										
										
											8 years ago
+								}
 								// Postings returns the postings list iterator for the label pair.
-												Rename Iterator to Postings

											
										
										
											8 years ago
+								func (h *HeadBlock) Postings(name, value string) (Postings, error) {
-												Use separate lock for series creation

This uses the head block's own lock to only lock if new series were
encountered.
In the general append case we just need to hold a

											
										
										
											8 years ago
+									h.mtx.RLock()
 									defer h.mtx.RUnlock()
-												Consolidate mem index into HeadBlock

											
										
										
											8 years ago
+									return h.postings.get(term{name: name, value: value}), nil
-												Misc fixes for initial Prometheus integration

											
										
										
											8 years ago
+								}
 								// Series returns the series for the given reference.
-												Modify IndexReader API to accommodate compaction

This changes the IndexReader API to expose plain labels
and chunk meta information instead of a Series interface.
Dropping of irrelevant chunks is moved into the querier.

A LabelIndices method is added to query for existing label
value indices.

											
										
										
											8 years ago
+								func (h *HeadBlock) Series(ref uint32) (labels.Labels, []ChunkMeta, error) {
-												Use separate lock for series creation

This uses the head block's own lock to only lock if new series were
encountered.
In the general append case we just need to hold a

											
										
										
											8 years ago
+									h.mtx.RLock()
 									defer h.mtx.RUnlock()
-												Consolidate mem index into HeadBlock

											
										
										
											8 years ago
+									if int(ref) >= len(h.descs) {
-												Modify IndexReader API to accommodate compaction

This changes the IndexReader API to expose plain labels
and chunk meta information instead of a Series interface.
Dropping of irrelevant chunks is moved into the querier.

A LabelIndices method is added to query for existing label
value indices.

											
										
										
											8 years ago
+										return nil, nil, errNotFound
-												Misc fixes for initial Prometheus integration

											
										
										
											8 years ago
+									}
-												Consolidate mem index into HeadBlock

											
										
										
											8 years ago
+									cd := h.descs[ref]
-												Consolidate persistence and compaction

											
										
										
											8 years ago
+									meta := ChunkMeta{
-												Fix last timestamp initialization

This initializes the chunkDesc's last timestamp to the minimum
value so initial samples with a timestamp of 0 (e.g. in tests)
are not accidentally dropped.

											
										
										
											8 years ago
+										MinTime: cd.firstTimestamp,
-												Consolidate persistence and compaction

											
										
										
											8 years ago
+										MaxTime: cd.lastTimestamp,
 										Ref:     ref,
 									}
 									return cd.lset, []ChunkMeta{meta}, nil
-												Modify IndexReader API to accommodate compaction

This changes the IndexReader API to expose plain labels
and chunk meta information instead of a Series interface.
Dropping of irrelevant chunks is moved into the querier.

A LabelIndices method is added to query for existing label
value indices.

											
										
										
											8 years ago
+								}
 								func (h *HeadBlock) LabelIndices() ([][]string, error) {
-												Use separate lock for series creation

This uses the head block's own lock to only lock if new series were
encountered.
In the general append case we just need to hold a

											
										
										
											8 years ago
+									h.mtx.RLock()
 									defer h.mtx.RUnlock()
-												Modify IndexReader API to accommodate compaction

This changes the IndexReader API to expose plain labels
and chunk meta information instead of a Series interface.
Dropping of irrelevant chunks is moved into the querier.

A LabelIndices method is added to query for existing label
value indices.

											
										
										
											8 years ago
+									res := [][]string{}
 									for s := range h.values {
 										res = append(res, []string{s})
-												Misc fixes for initial Prometheus integration

											
										
										
											8 years ago
+									}
-												Modify IndexReader API to accommodate compaction

This changes the IndexReader API to expose plain labels
and chunk meta information instead of a Series interface.
Dropping of irrelevant chunks is moved into the querier.

A LabelIndices method is added to query for existing label
value indices.

											
										
										
											8 years ago
+									return res, nil
-												Misc fixes for initial Prometheus integration

											
										
										
											8 years ago
+								}
-												Add new interfaces and skeleton

											
										
										
											8 years ago
+								// get retrieves the chunk with the hash and label set and creates
 								// a new one if it doesn't exist yet.
-												Remove double-reference in chunk hashmap

											
										
										
											8 years ago
+								func (h *HeadBlock) get(hash uint64, lset labels.Labels) *chunkDesc {
 									cds := h.hashes[hash]
-												Consolidate mem index into HeadBlock

											
										
										
											8 years ago
-												Remove double-reference in chunk hashmap

											
										
										
											8 years ago
+									for _, cd := range cds {
 										if cd.lset.Equals(lset) {
 											return cd
-												Add new interfaces and skeleton

											
										
										
											8 years ago
+										}
 									}
-												Remove double-reference in chunk hashmap

											
										
										
											8 years ago
+									return nil
-												Add initial WAL writing

											
										
										
											8 years ago
+								}
 								func (h *HeadBlock) create(hash uint64, lset labels.Labels) *chunkDesc {
-												Add new interfaces and skeleton

											
										
										
											8 years ago
+									cd := &chunkDesc{
-												Fix last timestamp initialization

This initializes the chunkDesc's last timestamp to the minimum
value so initial samples with a timestamp of 0 (e.g. in tests)
are not accidentally dropped.

											
										
										
											8 years ago
+										lset:          lset,
 										chunk:         chunks.NewXORChunk(),
 										lastTimestamp: math.MinInt64,
-												Append to chunks cannot error

											
										
										
											8 years ago
+									}
-												Fix last timestamp initialization

This initializes the chunkDesc's last timestamp to the minimum
value so initial samples with a timestamp of 0 (e.g. in tests)
are not accidentally dropped.

											
										
										
											8 years ago
-												Switch to sequential block names

This changes block directory names from the int64 timestamp
to sequential numbering.

											
										
										
											8 years ago
+									var err error
-												Append to chunks cannot error

											
										
										
											8 years ago
+									cd.app, err = cd.chunk.Appender()
 									if err != nil {
 										// Getting an Appender for a new chunk must not panic.
 										panic(err)
-												Add new interfaces and skeleton

											
										
										
											8 years ago
+									}
-												Consolidate mem index into HeadBlock

											
										
										
											8 years ago
+									// Index the new chunk.
-												Remove double-reference in chunk hashmap

											
										
										
											8 years ago
+									cd.ref = uint32(len(h.descs))
-												Consolidate mem index into HeadBlock

											
										
										
											8 years ago
 									h.descs = append(h.descs, cd)
-												Remove double-reference in chunk hashmap

											
										
										
											8 years ago
+									h.hashes[hash] = append(h.hashes[hash], cd)
-												Consolidate mem index into HeadBlock

											
										
										
											8 years ago
 									for _, l := range lset {
 										valset, ok := h.values[l.Name]
 										if !ok {
 											valset = stringset{}
 											h.values[l.Name] = valset
 										}
 										valset.set(l.Value)
-												Consolidate persistence and compaction

											
										
										
											8 years ago
 										h.postings.add(cd.ref, term{name: l.Name, value: l.Value})
-												Consolidate mem index into HeadBlock

											
										
										
											8 years ago
+									}
-												Consolidate persistence and compaction

											
										
										
											8 years ago
 									h.postings.add(cd.ref, term{})
-												Add new interfaces and skeleton

											
										
										
											8 years ago
-												misc

											
										
										
											8 years ago
+									return cd
-												Add new interfaces and skeleton

											
										
										
											8 years ago
+								}
-												Modify IndexReader API to accomodate compaction

This changes the IndexReader API to expose plain labels
and chunk meta information instead of a Series interface.
Dropping of irrelevant chunks is moved into the querier.

A LabelIndices method is added to query for existing label
value indices.

											
										
										
											8 years ago
+								var (
-												Run persistence in separate goroutine

											
										
										
											8 years ago
+									// ErrOutOfOrderSample is returned if an appended sample has a
 									// timestamp larger than the most recent sample.
-												Modify IndexReader API to accomodate compaction

This changes the IndexReader API to expose plain labels
and chunk meta information instead of a Series interface.
Dropping of irrelevant chunks is moved into the querier.

A LabelIndices method is added to query for existing label
value indices.

											
										
										
											8 years ago
+									ErrOutOfOrderSample = errors.New("out of order sample")
-												Run persistence in separate goroutine

											
										
										
											8 years ago
 									// ErrAmendSample is returned if an appended sample has the same timestamp
 									// as the most recent sample but a different value.
 									ErrAmendSample = errors.New("amending sample")
-												Modify IndexReader API to accomodate compaction

This changes the IndexReader API to expose plain labels
and chunk meta information instead of a Series interface.
Dropping of irrelevant chunks is moved into the querier.

A LabelIndices method is added to query for existing label
value indices.

											
										
										
											8 years ago
+								)
-												Remove double-reference in chunk hashmap

											
										
										
											8 years ago
+								func (h *HeadBlock) appendBatch(samples []hashedSample) error {
-												Add initial WAL writing

											
										
										
											8 years ago
+									// Find head chunks for all samples and allocate new IDs/refs for
 									// ones we haven't seen before.
 									var (
-												Fix uniqueness of new series

											
										
										
											8 years ago
+										newSeries    []labels.Labels
-												Use separate lock for series creation

This uses the head block's own lock to only lock if new series were
encountered.
In the general append case we just need to hold a

											
										
										
											8 years ago
+										newSamples   []*hashedSample
-												Fix uniqueness of new series

											
										
										
											8 years ago
+										newHashes    []uint64
 										uniqueHashes = map[uint64]uint32{}
-												Add initial WAL writing

											
										
										
											8 years ago
+									)
-												Use separate lock for series creation

This uses the head block's own lock to only lock if new series were
encountered.
In the general append case we just need to hold a

											
										
										
											8 years ago
+									h.mtx.RLock()
-												Fix races

											
										
										
											8 years ago
+									defer h.mtx.RUnlock()
-												Consolidate mem index into HeadBlock

											
										
										
											8 years ago
-												Fix erroneous value assignments

											
										
										
											8 years ago
+									for i := range samples {
 										s := &samples[i]
-												Remove double-reference in chunk hashmap

											
										
										
											8 years ago
+										cd := h.get(s.hash, s.labels)
-												Add initial WAL writing

											
										
										
											8 years ago
+										if cd != nil {
-												Modify IndexReader API to accomodate compaction

This changes the IndexReader API to expose plain labels
and chunk meta information instead of a Series interface.
Dropping of irrelevant chunks is moved into the querier.

A LabelIndices method is added to query for existing label
value indices.

											
										
										
											8 years ago
+											// Samples must only occur in order.
 											if s.t < cd.lastTimestamp {
 												return ErrOutOfOrderSample
 											}
 											if cd.lastTimestamp == s.t && cd.lastValue != s.v {
 												return ErrAmendSample
 											}
-												Add initial WAL writing

											
										
										
											8 years ago
+											// TODO(fabxc): sample refs are only scoped within a block for
 											// now and we ignore any previously set value
-												Remove double-reference in chunk hashmap

											
										
										
											8 years ago
+											s.ref = cd.ref
-												Add initial WAL writing

											
										
										
											8 years ago
+											continue
 										}
-												Fix uniqueness of new series

											
										
										
											8 years ago
 										// There may be several samples for a new series in a batch.
 										// We don't want to reserve a new space for each.
 										if ref, ok := uniqueHashes[s.hash]; ok {
 											s.ref = ref
 											continue
 										}
-												Use separate lock for series creation

This uses the head block's own lock to only lock if new series were
encountered.
In the general append case we just need to hold a

											
										
										
											8 years ago
+										s.ref = uint32(len(newSeries))
-												Fix uniqueness of new series

											
										
										
											8 years ago
+										uniqueHashes[s.hash] = s.ref
-												Fix erroneous value assignments

											
										
										
											8 years ago
-												Add initial WAL writing

											
										
										
											8 years ago
+										newSeries = append(newSeries, s.labels)
 										newHashes = append(newHashes, s.hash)
-												Use separate lock for series creation

This uses the head block's own lock to only lock if new series were
encountered.
In the general append case we just need to hold a

											
										
										
											8 years ago
+										newSamples = append(newSamples, s)
-												Add initial WAL writing

											
										
										
											8 years ago
+									}
-												Consolidate mem index into HeadBlock

											
										
										
											8 years ago
-												Add initial WAL writing

											
										
										
											8 years ago
+									// Write all new series and samples to the WAL and add it to the
 									// in-mem database on success.
 									if err := h.wal.Log(newSeries, samples); err != nil {
-												Bucket samples before appending.

This pre-sorts samples into buckets before appending them to reduce
locking of shards.

											
										
										
											8 years ago
+										return err
 									}
-												Add initial seriailization of block data

											
										
										
											8 years ago
-												Remove double-reference in chunk hashmap

											
										
										
											8 years ago
+									// After the samples were successfully written to the WAL, there may
 									// be no further failures.
-												Use separate lock for series creation

This uses the head block's own lock to only lock if new series were
encountered.
In the general append case we just need to hold a

											
										
										
											8 years ago
+									if len(newSeries) > 0 {
-												Fix races

											
										
										
											8 years ago
+										h.mtx.RUnlock()
-												Use separate lock for series creation

This uses the head block's own lock to only lock if new series were
encountered.
In the general append case we just need to hold a

											
										
										
											8 years ago
+										h.mtx.Lock()
 										base := len(h.descs)
 										for i, s := range newSeries {
 											h.create(newHashes[i], s)
 										}
 										for _, s := range newSamples {
 											s.ref = uint32(base) + s.ref
 										}
 										h.mtx.Unlock()
 										h.mtx.RLock()
-												Add initial WAL writing

											
										
										
											8 years ago
+									}
-												cleanup and switching removal of unsafe calls.

											
										
										
											8 years ago
-												Fix head block stats races

											
										
										
											8 years ago
+									var (
 										total = uint64(len(samples))
 										mint  = int64(math.MaxInt64)
 										maxt  = int64(math.MinInt64)
 									)
-												Add initial WAL writing

											
										
										
											8 years ago
+									for _, s := range samples {
-												Modify IndexReader API to accomodate compaction

This changes the IndexReader API to expose plain labels
and chunk meta information instead of a Series interface.
Dropping of irrelevant chunks is moved into the querier.

A LabelIndices method is added to query for existing label
value indices.

											
										
										
											8 years ago
+										cd := h.descs[s.ref]
 										// Skip duplicate samples.
 										if cd.lastTimestamp == s.t && cd.lastValue != s.v {
-												Use separate lock for series creation

This uses the head block's own lock to only lock if new series were
encountered.
In the general append case we just need to hold a

											
										
										
											8 years ago
+											total--
-												Modify IndexReader API to accomodate compaction

This changes the IndexReader API to expose plain labels
and chunk meta information instead of a Series interface.
Dropping of irrelevant chunks is moved into the querier.

A LabelIndices method is added to query for existing label
value indices.

											
										
										
											8 years ago
+											continue
 										}
 										cd.append(s.t, s.v)
-												Add initial WAL writing

											
										
										
											8 years ago
-												Fix head block stats races

											
										
										
											8 years ago
+										if mint > s.t {
 											mint = s.t
-												Add initial WAL writing

											
										
										
											8 years ago
+										}
-												Fix head block stats races

											
										
										
											8 years ago
+										if maxt < s.t {
 											maxt = s.t
-												Switch to sequential block names

This changes block directory names from the int64 timestamp
to sequential numbering.

											
										
										
											8 years ago
+										}
-												misc

											
										
										
											8 years ago
+									}
-												Add stats serialization, load querier of all blocks

											
										
										
											8 years ago
-												Fix head block stats races

											
										
										
											8 years ago
+									h.bstats.mtx.Lock()
 									defer h.bstats.mtx.Unlock()
 									h.bstats.SampleCount += total
 									h.bstats.SeriesCount += uint64(len(newSeries))
 									h.bstats.ChunkCount += uint64(len(newSeries)) // head block has one chunk/series
 									if mint < h.bstats.MinTime {
 										h.bstats.MinTime = mint
 									}
 									if maxt > h.bstats.MaxTime {
 										h.bstats.MaxTime = maxt
 									}
-												Use separate lock for series creation

This uses the head block's own lock to only lock if new series were
encountered.
In the general append case we just need to hold a

											
										
										
											8 years ago
-												Append to chunks cannot error

											
										
										
											8 years ago
+									return nil
-												Add initial seriailization of block data

											
										
										
											8 years ago
+								}
-												Add postings wrapper that emits head postings in label set order

This adds a position mapper that takes series from a head block
in the order they were appended and creates a mapping representing
them in order of their label sets.

Write-repair of the postings list would cause very expensive writing.
Hence, we keep them as they are and only apply the position mapping
at the very end, after a postings list has been sufficiently reduced
through intersections etc.

											
										
										
											8 years ago
-												Fix head block stats races

											
										
										
											8 years ago
+								func (h *HeadBlock) fullness() float64 {
 									h.bstats.mtx.RLock()
 									defer h.bstats.mtx.RUnlock()
 									return float64(h.bstats.SampleCount) / float64(h.bstats.SeriesCount+1) / 250
 								}
-												Don't update head postings mapper on every append

											
										
										
											8 years ago
+								func (h *HeadBlock) updateMapping() {
 									h.mapper.mtx.Lock()
 									defer h.mapper.mtx.Unlock()
 									if h.mapper.sortable != nil && h.mapper.Len() == len(h.descs) {
 										return
 									}
-												Add postings wrapper that emits head postings in label set order

This adds a position mapper that takes series from a head block
in the order they were appended and creates a mapping representing
them in order of their label sets.

Write-repair of the postings list would cause very expensive writing.
Hence, we keep them as they are and only apply the postition mapping
at the very end, after a postings list has been sufficienctly reduced
through intersections etc.

											
										
										
											8 years ago
+									cds := make([]*chunkDesc, len(h.descs))
 									copy(cds, h.descs)
 									s := slice.SortInterface(cds, func(i, j int) bool {
 										return labels.Compare(cds[i].lset, cds[j].lset) < 0
 									})
-												Don't update head postings mapper on every append

											
										
										
											8 years ago
+									h.mapper.update(s)
 								}
 								// remapPostings changes the order of the postings from their ID to the ordering
 								// of the series they reference.
 								// Returned postings have no longer monotonic IDs and MUST NOT be used for regular
 								// postings set operations, i.e. intersect and merge.
 								func (h *HeadBlock) remapPostings(p Postings) Postings {
 									list, err := expandPostings(p)
 									if err != nil {
 										return errPostings{err: err}
 									}
 									h.mapper.mtx.RLock()
 									defer h.mapper.mtx.RUnlock()
 									h.mapper.Sort(list)
 									slice.Sort(list, func(i, j int) bool {
 										return h.mapper.fw[list[i]] < h.mapper.fw[list[j]]
 									})
 									return newListPostings(list)
-												Add postings wrapper that emits head postings in label set order

This adds a position mapper that takes series from a head block
in the order they were appended and creates a mapping representing
them in order of their label sets.

Write-repair of the postings list would cause very expensive writing.
Hence, we keep them as they are and only apply the postition mapping
at the very end, after a postings list has been sufficienctly reduced
through intersections etc.

											
										
										
											8 years ago
+								}
 								// positionMapper stores a position mapping from unsorted to
 								// sorted indices of a sortable collection.
 								type positionMapper struct {
 									// mtx guards the mapper. The methods do not take it themselves,
 									// callers lock it around them.
 									mtx sync.RWMutex
 									// sortable is the collection that was last passed to update.
 									sortable sort.Interface
 									// After update, iv[i] is the original index of the element at
 									// sorted position i, and fw[k] is the sorted position of the
 									// element with original index k.
 									iv, fw []int
 								}
 								func newPositionMapper(s sort.Interface) *positionMapper {
-												Don't update head postings mapper on every append

											
										
										
											8 years ago
+									m := &positionMapper{}
 									if s != nil {
 										m.update(s)
-												Add postings wrapper that emits head postings in label set order

This adds a position mapper that takes series from a head block
in the order they were appended and creates a mapping representing
them in order of their label sets.

Write-repair of the postings list would cause very expensive writing.
Hence, we keep them as they are and only apply the postition mapping
at the very end, after a postings list has been sufficienctly reduced
through intersections etc.

											
										
										
											8 years ago
+									}
 									return m
 								}
 								// Len reports the length of the wrapped collection.
 								func (m *positionMapper) Len() int {
 									return m.sortable.Len()
 								}

 								// Less reports whether element i of the wrapped collection orders
 								// before element j.
 								func (m *positionMapper) Less(i, j int) bool {
 									return m.sortable.Less(i, j)
 								}

 								// Swap exchanges elements i and j of the wrapped collection and the
 								// matching entries of iv, so iv keeps following the elements around.
 								func (m *positionMapper) Swap(i, j int) {
 									m.sortable.Swap(i, j)

 									idx := m.iv
 									idx[i], idx[j] = idx[j], idx[i]
 								}
-												Don't update head postings mapper on every append

											
										
										
											8 years ago
 								// Sort reorders l in place by the fw position stored for each of its
 								// elements.
 								func (m *positionMapper) Sort(l []uint32) {
 									byPosition := func(a, b int) bool {
 										return m.fw[l[a]] < m.fw[l[b]]
 									}
 									slice.Sort(l, byPosition)
 								}
 								// update makes s the wrapped collection, sorts it in place and rebuilds
 								// both index mappings from the result.
 								func (m *positionMapper) update(s sort.Interface) {
 									m.sortable = s

 									n := s.Len()
 									m.iv = make([]int, n)
 									m.fw = make([]int, n)

 									// Start from the identity, Swap then moves the entries of iv
 									// along with the elements while sorting.
 									for pos := 0; pos < n; pos++ {
 										m.iv[pos] = pos
 									}
 									sort.Sort(m)

 									// iv now maps sorted position to original index, fw is its inverse.
 									for sortedPos, origPos := range m.iv {
 										m.fw[origPos] = sortedPos
 									}
 								}