influxdb/tsdb/index/tsi1/measurement_block.go

544 lines
14 KiB
Go
Raw Normal View History

2016-09-02 14:52:11 +00:00
package tsi1
2016-09-26 15:56:12 +00:00
import (
"bytes"
"encoding/binary"
"errors"
"io"
"sort"
2016-09-26 15:56:12 +00:00
2016-11-17 16:33:35 +00:00
"github.com/influxdata/influxdb/pkg/estimator"
"github.com/influxdata/influxdb/pkg/estimator/hll"
2016-09-26 15:56:12 +00:00
"github.com/influxdata/influxdb/pkg/rhh"
)
// MeasurementBlockVersion is the version of the measurement block.
const MeasurementBlockVersion = 1

// MeasurementTombstoneFlag is the flag bit carried by a measurement entry
// whose tombstone is set.
const MeasurementTombstoneFlag = 0x01

// Measurement field size constants, in bytes.
const (
	// MeasurementFillSize is the single padding byte written at the start of
	// the data section so that no measurement offset is ever zero.
	MeasurementFillSize = 1

	// MeasurementNSize is the width of the slot count that prefixes the hash
	// index.
	MeasurementNSize = 4

	// MeasurementOffsetSize is the width of each offset slot in the hash
	// index.
	MeasurementOffsetSize = 8

	// MeasurementTrailerSize is the fixed width of the block trailer: a
	// 2-byte version plus an 8-byte offset and an 8-byte size for each of the
	// four sections (data, hash index, measurement sketch and tombstone
	// measurement sketch).
	MeasurementTrailerSize = 2 + 4*(8+8)
)
// ErrUnsupportedMeasurementBlockVersion is the sentinel error for a
// measurement block whose encoding version is not supported.
var ErrUnsupportedMeasurementBlockVersion = errors.New("unsupported measurement block version")

// ErrMeasurementBlockSizeMismatch is the sentinel error for a measurement
// block whose size does not match what was expected.
var ErrMeasurementBlockSizeMismatch = errors.New("measurement block size mismatch")
// MeasurementBlock represents a collection of all measurements in an index.
type MeasurementBlock struct {
data []byte
hashData []byte
2016-11-17 16:33:35 +00:00
// Measurement block sketch and tombstone sketch for cardinality
// estimation.
sketch, tsketch estimator.Sketch
2016-09-26 15:56:12 +00:00
version int // block version
}
// Version returns the encoding version held in the block's version field.
// The field is zero until something populates it.
func (blk *MeasurementBlock) Version() int {
	return blk.version
}
// Elem returns an element for a measurement.
2016-10-21 15:31:40 +00:00
func (blk *MeasurementBlock) Elem(name []byte) (e MeasurementBlockElem, ok bool) {
2016-09-26 15:56:12 +00:00
n := binary.BigEndian.Uint32(blk.hashData[:MeasurementNSize])
hash := hashKey(name)
2016-10-07 17:29:22 +00:00
pos := int(hash % n)
2016-09-26 15:56:12 +00:00
// Track current distance
var d int
for {
// Find offset of measurement.
offset := binary.BigEndian.Uint64(blk.hashData[MeasurementNSize+(pos*MeasurementOffsetSize):])
// Evaluate name if offset is not empty.
if offset > 0 {
// Parse into element.
2016-10-21 15:31:40 +00:00
var e MeasurementBlockElem
2016-09-26 15:56:12 +00:00
e.UnmarshalBinary(blk.data[offset:])
// Return if name match.
2016-10-31 14:46:07 +00:00
if bytes.Equal(e.name, name) {
2016-09-26 15:56:12 +00:00
return e, true
}
// Check if we've exceeded the probe distance.
2016-10-31 14:46:07 +00:00
if d > dist(hashKey(e.name), pos, int(n)) {
2016-10-21 15:31:40 +00:00
return MeasurementBlockElem{}, false
2016-09-26 15:56:12 +00:00
}
}
// Move position forward.
pos = (pos + 1) % int(n)
d++
2016-10-25 14:36:58 +00:00
if uint32(d) > n {
2016-12-15 15:31:18 +00:00
return MeasurementBlockElem{}, false
2016-10-25 14:36:58 +00:00
}
2016-09-26 15:56:12 +00:00
}
}
// UnmarshalBinary unpacks data into the block. Block is not copied so data
// should be retained and unchanged after being passed into this function.
func (blk *MeasurementBlock) UnmarshalBinary(data []byte) error {
2016-10-03 15:08:43 +00:00
// Read trailer.
t, err := ReadMeasurementBlockTrailer(data)
if err != nil {
return err
2016-09-26 15:56:12 +00:00
}
2016-10-03 15:08:43 +00:00
// Save data section.
blk.data = data[t.Data.Offset:]
blk.data = blk.data[:t.Data.Size]
// Save hash index block.
blk.hashData = data[t.HashIndex.Offset:]
blk.hashData = blk.hashData[:t.HashIndex.Size]
2016-11-17 16:33:35 +00:00
// Initialise sketches. We're currently using HLL+.
var s, ts *hll.Plus
if err := s.UnmarshalBinary(data[t.Sketch.Offset:][:t.Sketch.Size]); err != nil {
return err
}
blk.sketch = s
if err := ts.UnmarshalBinary(data[t.TSketch.Offset:][:t.TSketch.Size]); err != nil {
return err
}
blk.tsketch = ts
2016-10-03 15:08:43 +00:00
return nil
}
// Iterator returns an iterator over all measurements.
func (blk *MeasurementBlock) Iterator() MeasurementIterator {
2016-10-21 15:31:40 +00:00
return &blockMeasurementIterator{data: blk.data[MeasurementFillSize:]}
}
2016-11-02 16:09:49 +00:00
// seriesIDIterator returns an iterator for all series ids in a measurement.
func (blk *MeasurementBlock) seriesIDIterator(name []byte) seriesIDIterator {
// Find measurement element.
e, ok := blk.Elem(name)
if !ok {
return &rawSeriesIDIterator{}
}
return &rawSeriesIDIterator{data: e.series.data}
}
2016-10-21 15:31:40 +00:00
// blockMeasurementIterator iterates over a list measurements in a block.
type blockMeasurementIterator struct {
2016-10-31 14:46:07 +00:00
elem MeasurementBlockElem
data []byte
}
2016-10-21 15:31:40 +00:00
// Next returns the next measurement. Returns nil when iterator is complete.
2016-10-31 14:46:07 +00:00
func (itr *blockMeasurementIterator) Next() MeasurementElem {
// Return nil when we run out of data.
if len(itr.data) == 0 {
return nil
}
// Unmarshal the element at the current position.
2016-10-31 14:46:07 +00:00
itr.elem.UnmarshalBinary(itr.data)
// Move the data forward past the record.
2016-10-31 14:46:07 +00:00
itr.data = itr.data[itr.elem.size:]
return &itr.elem
}
2016-11-02 16:09:49 +00:00
// rawSeriesIDIterator iterates over a list of raw series ids, each stored as
// a big-endian uint32.
type rawSeriesIDIterator struct {
	data []byte
}

// next returns the next decoded series id and advances past it. It returns 0
// once no data remains.
func (itr *rawSeriesIDIterator) next() uint32 {
	if len(itr.data) > 0 {
		id := binary.BigEndian.Uint32(itr.data)
		itr.data = itr.data[SeriesIDSize:]
		return id
	}
	return 0
}
// MeasurementBlockTrailer represents meta data at the end of a
// MeasurementBlock. Each section is described by an offset and a size.
type MeasurementBlockTrailer struct {
	Version int // Encoding version

	// Data locates the data section.
	Data struct {
		Offset, Size int64
	}

	// HashIndex locates the hash map section.
	HashIndex struct {
		Offset, Size int64
	}

	// Sketch locates the cardinality sketch for measurements.
	Sketch struct {
		Offset, Size int64
	}

	// TSketch locates the cardinality sketch for tombstoned measurements.
	TSketch struct {
		Offset, Size int64
	}
}
// ReadMeasurementBlockTrailer returns the block trailer from data.
2016-10-03 15:08:43 +00:00
func ReadMeasurementBlockTrailer(data []byte) (MeasurementBlockTrailer, error) {
var t MeasurementBlockTrailer
2016-11-17 16:33:35 +00:00
// Read version (which is located in the last two bytes of the trailer).
t.Version = int(binary.BigEndian.Uint16(data[len(data)-2:]))
2016-10-03 15:08:43 +00:00
if t.Version != MeasurementBlockVersion {
return t, ErrUnsupportedIndexFileVersion
2016-09-26 15:56:12 +00:00
}
// Slice trailer data.
2016-11-17 16:33:35 +00:00
buf := data[len(data)-MeasurementTrailerSize:]
2016-09-26 15:56:12 +00:00
// Read data section info.
t.Data.Offset, buf = int64(binary.BigEndian.Uint64(buf[0:8])), buf[8:]
t.Data.Size, buf = int64(binary.BigEndian.Uint64(buf[0:8])), buf[8:]
2016-09-26 15:56:12 +00:00
// Read measurement block info.
t.HashIndex.Offset, buf = int64(binary.BigEndian.Uint64(buf[0:8])), buf[8:]
t.HashIndex.Size, buf = int64(binary.BigEndian.Uint64(buf[0:8])), buf[8:]
2016-09-26 15:56:12 +00:00
2016-11-17 16:33:35 +00:00
// Read measurment sketch info.
t.Sketch.Offset, buf = int64(binary.BigEndian.Uint64(buf[0:8])), buf[8:]
t.Sketch.Size, buf = int64(binary.BigEndian.Uint64(buf[0:8])), buf[8:]
// Read tombstone measurment sketch info.
t.TSketch.Offset, buf = int64(binary.BigEndian.Uint64(buf[0:8])), buf[8:]
t.TSketch.Size, buf = int64(binary.BigEndian.Uint64(buf[0:8])), buf[8:]
2016-10-03 15:08:43 +00:00
return t, nil
}
// WriteTo writes the trailer to w.
func (t *MeasurementBlockTrailer) WriteTo(w io.Writer) (n int64, err error) {
// Write data section info.
if err := writeUint64To(w, uint64(t.Data.Offset), &n); err != nil {
return n, err
} else if err := writeUint64To(w, uint64(t.Data.Size), &n); err != nil {
return n, err
}
2016-10-03 15:08:43 +00:00
// Write hash index section info.
if err := writeUint64To(w, uint64(t.HashIndex.Offset), &n); err != nil {
return n, err
} else if err := writeUint64To(w, uint64(t.HashIndex.Size), &n); err != nil {
return n, err
2016-10-03 15:08:43 +00:00
}
2016-11-17 16:33:35 +00:00
// Write measurement sketch info.
if err := writeUint64To(w, uint64(t.Sketch.Offset), &n); err != nil {
return n, err
} else if err := writeUint64To(w, uint64(t.Sketch.Size), &n); err != nil {
return n, err
}
// Write tombstone measurement sketch info.
if err := writeUint64To(w, uint64(t.TSketch.Offset), &n); err != nil {
return n, err
} else if err := writeUint64To(w, uint64(t.TSketch.Size), &n); err != nil {
return n, err
}
// Write measurement block version.
if err := writeUint16To(w, MeasurementBlockVersion, &n); err != nil {
return n, err
2016-10-03 15:08:43 +00:00
}
return n, nil
2016-09-26 15:56:12 +00:00
}
2016-10-21 15:31:40 +00:00
// MeasurementBlockElem represents an internal measurement element.
type MeasurementBlockElem struct {
	flag byte   // flag
	name []byte // measurement name

	// Location of the measurement's tag block.
	tagBlock struct {
		offset, size int64
	}

	// Series belonging to the measurement.
	series struct {
		n    uint32 // series count
		data []byte // serialized series data
	}

	// size in bytes, set after unmarshaling.
	size int
}
// Name returns the measurement name.
func (e *MeasurementBlockElem) Name() []byte { return e.name }
// Deleted returns true if the tombstone flag is set.
2016-10-21 15:31:40 +00:00
func (e *MeasurementBlockElem) Deleted() bool {
2016-10-31 14:46:07 +00:00
return (e.flag & MeasurementTombstoneFlag) != 0
2016-09-26 15:56:12 +00:00
}
2016-11-02 16:09:49 +00:00
// TagBlockOffset returns the offset of the measurement's tag block.
func (e *MeasurementBlockElem) TagBlockOffset() int64 { return e.tagBlock.offset }
2016-10-31 14:46:07 +00:00
2016-11-02 16:09:49 +00:00
// TagBlockSize returns the size of the measurement's tag block.
func (e *MeasurementBlockElem) TagBlockSize() int64 { return e.tagBlock.size }
2016-10-31 14:46:07 +00:00
2016-09-26 15:56:12 +00:00
// SeriesID returns series ID at an index.
2016-10-21 15:31:40 +00:00
func (e *MeasurementBlockElem) SeriesID(i int) uint32 {
2016-10-31 14:46:07 +00:00
return binary.BigEndian.Uint32(e.series.data[i*SeriesIDSize:])
2016-09-26 15:56:12 +00:00
}
// SeriesIDs returns a list of decoded series ids.
2016-10-21 15:31:40 +00:00
func (e *MeasurementBlockElem) SeriesIDs() []uint32 {
2016-10-31 14:46:07 +00:00
a := make([]uint32, e.series.n)
for i := 0; i < int(e.series.n); i++ {
2016-09-26 15:56:12 +00:00
a[i] = e.SeriesID(i)
}
return a
}
// UnmarshalBinary unmarshals data into e.
2016-10-21 15:31:40 +00:00
func (e *MeasurementBlockElem) UnmarshalBinary(data []byte) error {
start := len(data)
2016-09-26 15:56:12 +00:00
// Parse flag data.
2016-10-31 14:46:07 +00:00
e.flag, data = data[0], data[1:]
2016-09-26 15:56:12 +00:00
2016-11-02 16:09:49 +00:00
// Parse tag block offset.
e.tagBlock.offset, data = int64(binary.BigEndian.Uint64(data)), data[8:]
e.tagBlock.size, data = int64(binary.BigEndian.Uint64(data)), data[8:]
2016-09-26 15:56:12 +00:00
// Parse name.
sz, n := binary.Uvarint(data)
2016-10-31 14:46:07 +00:00
e.name, data = data[n:n+int(sz)], data[n+int(sz):]
2016-09-26 15:56:12 +00:00
// Parse series data.
v, n := binary.Uvarint(data)
2016-10-31 14:46:07 +00:00
e.series.n, data = uint32(v), data[n:]
e.series.data, data = data[:e.series.n*SeriesIDSize], data[e.series.n*SeriesIDSize:]
// Save length of elem.
2016-10-31 14:46:07 +00:00
e.size = start - len(data)
2016-09-26 15:56:12 +00:00
return nil
}
// MeasurementBlockWriter writes a measurement block.
type MeasurementBlockWriter struct {
mms map[string]measurement
2016-11-17 16:33:35 +00:00
// Measurement sketch and tombstoned measurement sketch. These must be
// set before calling WriteTo.
sketch, tsketch estimator.Sketch
2016-09-26 15:56:12 +00:00
}
// NewMeasurementBlockWriter returns a new MeasurementBlockWriter.
func NewMeasurementBlockWriter() *MeasurementBlockWriter {
return &MeasurementBlockWriter{
mms: make(map[string]measurement),
}
}
2016-10-05 15:04:04 +00:00
// Add adds a measurement with series and tag set offset/size.
func (mw *MeasurementBlockWriter) Add(name []byte, offset, size int64, seriesIDs []uint32) {
2016-09-26 15:56:12 +00:00
mm := mw.mms[string(name)]
2016-11-02 16:09:49 +00:00
mm.tagBlock.offset = offset
mm.tagBlock.size = size
2016-09-26 15:56:12 +00:00
mm.seriesIDs = seriesIDs
mw.mms[string(name)] = mm
}
// WriteTo encodes the measurements to w.
func (mw *MeasurementBlockWriter) WriteTo(w io.Writer) (n int64, err error) {
var t MeasurementBlockTrailer
2016-09-26 15:56:12 +00:00
2016-11-17 16:33:35 +00:00
// The sketches must be set before calling WriteTo.
if mw.sketch == nil {
return 0, errors.New("measurement sketch not set")
} else if mw.tsketch == nil {
return 0, errors.New("measurement tombstone sketch not set")
}
// Sort names.
names := make([]string, 0, len(mw.mms))
2016-09-26 15:56:12 +00:00
for name := range mw.mms {
names = append(names, name)
2016-09-26 15:56:12 +00:00
}
sort.Strings(names)
2016-09-26 15:56:12 +00:00
// Begin data section.
t.Data.Offset = n
// Write padding byte so no offsets are zero.
if err := writeUint8To(w, 0, &n); err != nil {
return n, err
}
2016-09-26 15:56:12 +00:00
// Encode key list.
for _, name := range names {
// Retrieve measurement and save offset.
mm := mw.mms[name]
mm.offset = n
mw.mms[name] = mm
2016-09-26 15:56:12 +00:00
// Write measurement
if err := mw.writeMeasurementTo(w, []byte(name), &mm, &n); err != nil {
2016-09-26 15:56:12 +00:00
return n, err
}
}
t.Data.Size = n - t.Data.Offset
2016-09-26 15:56:12 +00:00
// Build key hash map
m := rhh.NewHashMap(rhh.Options{
2016-10-25 14:36:58 +00:00
Capacity: len(names),
LoadFactor: 90,
})
for name := range mw.mms {
mm := mw.mms[name]
m.Put([]byte(name), &mm)
}
t.HashIndex.Offset = n
2016-09-26 15:56:12 +00:00
// Encode hash map length.
if err := writeUint32To(w, uint32(m.Cap()), &n); err != nil {
return n, err
}
// Encode hash map offset entries.
for i := 0; i < m.Cap(); i++ {
_, v := m.Elem(i)
var offset int64
if mm, ok := v.(*measurement); ok {
offset = mm.offset
}
if err := writeUint64To(w, uint64(offset), &n); err != nil {
2016-09-26 15:56:12 +00:00
return n, err
}
}
t.HashIndex.Size = n - t.HashIndex.Offset
2016-09-26 15:56:12 +00:00
2016-11-17 16:33:35 +00:00
// Write the sketches out.
t.Sketch.Offset = n
if err := writeSketchTo(w, mw.sketch, &n); err != nil {
return n, err
}
t.Sketch.Size = n - t.Sketch.Offset
t.TSketch.Offset = n
if err := writeSketchTo(w, mw.tsketch, &n); err != nil {
return n, err
}
t.TSketch.Size = n - t.TSketch.Offset
2016-09-26 15:56:12 +00:00
// Write trailer.
nn, err := t.WriteTo(w)
n += nn
if err != nil {
2016-09-26 15:56:12 +00:00
return n, err
}
return n, nil
}
// writeMeasurementTo encodes a single measurement entry into w.
func (mw *MeasurementBlockWriter) writeMeasurementTo(w io.Writer, name []byte, mm *measurement, n *int64) error {
2016-11-02 16:09:49 +00:00
// Write flag & tag block offset.
2016-09-26 15:56:12 +00:00
if err := writeUint8To(w, mm.flag(), n); err != nil {
return err
}
2016-11-02 16:09:49 +00:00
if err := writeUint64To(w, uint64(mm.tagBlock.offset), n); err != nil {
2016-10-05 15:04:04 +00:00
return err
2016-11-02 16:09:49 +00:00
} else if err := writeUint64To(w, uint64(mm.tagBlock.size), n); err != nil {
2016-09-26 15:56:12 +00:00
return err
}
// Write measurement name.
if err := writeUvarintTo(w, uint64(len(name)), n); err != nil {
return err
}
if err := writeTo(w, name, n); err != nil {
return err
}
// Write series count & ids.
if err := writeUvarintTo(w, uint64(len(mm.seriesIDs)), n); err != nil {
return err
}
for _, seriesID := range mm.seriesIDs {
if err := writeUint32To(w, seriesID, n); err != nil {
return err
}
}
return nil
}
2016-11-17 16:33:35 +00:00
// writeSketchTo writes an estimator.Sketch into w, updating the number of bytes
// written via n.
func writeSketchTo(w io.Writer, s estimator.Sketch, n *int64) error {
// TODO(edd): implement io.WriterTo on sketches.
data, err := s.MarshalBinary()
if err != nil {
return err
}
nn, err := w.Write(data)
*n += int64(nn)
return err
}
2016-09-26 15:56:12 +00:00
type measurement struct {
2016-11-02 16:09:49 +00:00
deleted bool
tagBlock struct {
2016-10-05 15:04:04 +00:00
offset int64
size int64
}
2016-09-26 15:56:12 +00:00
seriesIDs []uint32
offset int64
2016-09-26 15:56:12 +00:00
}
func (mm measurement) flag() byte {
var flag byte
if mm.deleted {
flag |= MeasurementTombstoneFlag
}
return flag
}