influxdb/tsdb/store.go

package tsdb // import "github.com/influxdata/influxdb/tsdb"
import (
"errors"
"fmt"
"io"
"io/ioutil"
"os"
"path/filepath"
"runtime"
"sort"
"strconv"
"strings"
"sync"
"time"
"github.com/influxdata/influxdb/influxql"
"github.com/influxdata/influxdb/models"
"github.com/influxdata/influxdb/pkg/estimator"
"github.com/influxdata/influxdb/pkg/limiter"
"go.uber.org/zap"
)
var (
// ErrShardNotFound is returned when trying to get a non-existent shard.
ErrShardNotFound = fmt.Errorf("shard not found")
// ErrStoreClosed is returned when trying to use a closed Store.
ErrStoreClosed = fmt.Errorf("store is closed")
)
// Store manages shards and indexes for databases.
type Store struct {
mu sync.RWMutex
// databases keeps track of the number of databases being managed by the
// store.
databases map[string]struct{}
path string
// shards is a map of shard IDs to the associated Shard.
shards map[uint64]*Shard
EngineOptions EngineOptions
baseLogger zap.Logger
Logger zap.Logger
closing chan struct{}
wg sync.WaitGroup
opened bool
}
// NewStore returns a new store with the given path and a default configuration.
// The returned store must be initialized by calling Open before using it.
func NewStore(path string) *Store {
opts := NewEngineOptions()
logger := zap.New(zap.NullEncoder())
return &Store{
databases: make(map[string]struct{}),
path: path,
EngineOptions: opts,
Logger: logger,
baseLogger: logger,
}
}
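// Example (illustrative sketch, not part of the original source): a typical
// Store lifecycle. The paths used here are hypothetical.
//
//	s := NewStore("/var/lib/influxdb/data")
//	s.EngineOptions.Config.WALDir = "/var/lib/influxdb/wal"
//	if err := s.Open(); err != nil {
//		// handle the error; the store cannot be used until Open succeeds
//	}
//	defer s.Close()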
// WithLogger sets the logger for the store.
func (s *Store) WithLogger(log zap.Logger) {
s.baseLogger = log
s.Logger = log.With(zap.String("service", "store"))
for _, sh := range s.shards {
sh.WithLogger(s.baseLogger)
}
}
// Statistics returns statistics for periodic monitoring.
func (s *Store) Statistics(tags map[string]string) []models.Statistic {
s.mu.RLock()
shards := s.shardsSlice()
s.mu.RUnlock()
// Gather all statistics for all shards.
var statistics []models.Statistic
for _, shard := range shards {
statistics = append(statistics, shard.Statistics(tags)...)
}
return statistics
}
// Path returns the store's root path.
func (s *Store) Path() string { return s.path }
// Open initializes the store, creating all necessary directories, loading all
// shards as well as initializing periodic maintenance of them.
func (s *Store) Open() error {
s.mu.Lock()
defer s.mu.Unlock()
s.closing = make(chan struct{})
s.shards = map[uint64]*Shard{}
s.Logger.Info(fmt.Sprintf("Using data dir: %v", s.Path()))
// Create directory.
if err := os.MkdirAll(s.path, 0777); err != nil {
return err
}
if err := s.loadShards(); err != nil {
return err
}
s.opened = true
return nil
}
func (s *Store) loadShards() error {
// res holds the result from opening each shard in a goroutine
type res struct {
s *Shard
err error
}
t := limiter.NewFixed(runtime.GOMAXPROCS(0))
resC := make(chan *res)
var n int
// Determine how many shards we need to open by checking the store path.
dbDirs, err := ioutil.ReadDir(s.path)
if err != nil {
return err
}
for _, db := range dbDirs {
if !db.IsDir() {
s.Logger.Info(fmt.Sprintf("Not loading %s. Not a database directory.", db.Name()))
continue
}
// Load each retention policy within the database directory.
rpDirs, err := ioutil.ReadDir(filepath.Join(s.path, db.Name()))
if err != nil {
return err
}
for _, rp := range rpDirs {
if !rp.IsDir() {
s.Logger.Info(fmt.Sprintf("Skipping retention policy dir: %s. Not a directory", rp.Name()))
continue
}
shardDirs, err := ioutil.ReadDir(filepath.Join(s.path, db.Name(), rp.Name()))
if err != nil {
return err
}
for _, sh := range shardDirs {
n++
go func(db, rp, sh string) {
t.Take()
defer t.Release()
start := time.Now()
path := filepath.Join(s.path, db, rp, sh)
walPath := filepath.Join(s.EngineOptions.Config.WALDir, db, rp, sh)
// Shard file names are numeric shardIDs
shardID, err := strconv.ParseUint(sh, 10, 64)
if err != nil {
resC <- &res{err: fmt.Errorf("%s is not a valid ID. Skipping shard.", sh)}
return
}
shard := NewShard(shardID, path, walPath, s.EngineOptions)
shard.WithLogger(s.baseLogger)
err = shard.Open()
if err != nil {
resC <- &res{err: fmt.Errorf("Failed to open shard: %d: %s", shardID, err)}
return
}
resC <- &res{s: shard}
s.Logger.Info(fmt.Sprintf("%s opened in %s", path, time.Since(start)))
}(db, rp.Name(), sh.Name())
}
}
}
// Gather results of opening shards concurrently, keeping track of how
// many databases we are managing.
for i := 0; i < n; i++ {
res := <-resC
if res.err != nil {
s.Logger.Info(res.err.Error())
continue
}
s.shards[res.s.id] = res.s
s.databases[res.s.database] = struct{}{}
}
close(resC)
return nil
}
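// The shard-loading fan-out above bounds concurrency with a fixed limiter:
// each goroutine calls Take before doing work and Release when done, so at
// most GOMAXPROCS shards are opened at once while results are funnelled back
// over a single channel. A minimal sketch of the same pattern, with a
// hypothetical doWork helper standing in for shard.Open:
//
//	t := limiter.NewFixed(runtime.GOMAXPROCS(0))
//	errC := make(chan error)
//	for _, job := range jobs {
//		go func(job string) {
//			t.Take()
//			defer t.Release()
//			errC <- doWork(job) // doWork is a placeholder, not part of this package
//		}(job)
//	}
//	for range jobs {
//		if err := <-errC; err != nil {
//			// log and continue, as loadShards does
//		}
//	}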
// Close closes the store and all associated shards. After calling Close, accessing
// shards through the Store will result in ErrStoreClosed being returned.
func (s *Store) Close() error {
s.mu.Lock()
defer s.mu.Unlock()
if s.opened {
close(s.closing)
}
s.wg.Wait()
// Close all the shards in parallel.
if err := s.walkShards(s.shardsSlice(), func(sh *Shard) error {
return sh.Close()
}); err != nil {
return err
}
s.opened = false
s.shards = nil
return nil
}
// Shard returns a shard by id.
func (s *Store) Shard(id uint64) *Shard {
s.mu.RLock()
defer s.mu.RUnlock()
sh, ok := s.shards[id]
if !ok {
return nil
}
return sh
}
// Shards returns a list of shards by id.
func (s *Store) Shards(ids []uint64) []*Shard {
s.mu.RLock()
defer s.mu.RUnlock()
a := make([]*Shard, 0, len(ids))
for _, id := range ids {
sh, ok := s.shards[id]
if !ok {
continue
}
a = append(a, sh)
}
return a
}
// ShardN returns the number of shards in the store.
func (s *Store) ShardN() int {
s.mu.RLock()
defer s.mu.RUnlock()
return len(s.shards)
}
// CreateShard creates a shard with the given id and retention policy on a database.
func (s *Store) CreateShard(database, retentionPolicy string, shardID uint64, enabled bool) error {
s.mu.Lock()
defer s.mu.Unlock()
select {
case <-s.closing:
return ErrStoreClosed
default:
}
// Shard already exists.
if _, ok := s.shards[shardID]; ok {
return nil
}
// Create the db and retention policy directories if they don't exist.
if err := os.MkdirAll(filepath.Join(s.path, database, retentionPolicy), 0700); err != nil {
return err
}
// Create the WAL directory.
walPath := filepath.Join(s.EngineOptions.Config.WALDir, database, retentionPolicy, fmt.Sprintf("%d", shardID))
if err := os.MkdirAll(walPath, 0700); err != nil {
return err
}
path := filepath.Join(s.path, database, retentionPolicy, strconv.FormatUint(shardID, 10))
shard := NewShard(shardID, path, walPath, s.EngineOptions)
shard.WithLogger(s.baseLogger)
shard.EnableOnOpen = enabled
if err := shard.Open(); err != nil {
return err
}
s.shards[shardID] = shard
s.databases[database] = struct{}{} // Ensure we are tracking any new db.
return nil
}
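// Example (sketch, not part of the original source): creating shard 1 for a
// hypothetical database "db0" and retention policy "rp0", enabled on open.
//
//	if err := s.CreateShard("db0", "rp0", 1, true); err != nil {
//		// ErrStoreClosed if the store has been closed, otherwise a
//		// filesystem or engine error
//	}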
// CreateShardSnapshot will create a hard link to the underlying shard and return a path.
// The caller is responsible for cleaning up (removing) the file path returned.
func (s *Store) CreateShardSnapshot(id uint64) (string, error) {
sh := s.Shard(id)
if sh == nil {
return "", ErrShardNotFound
}
return sh.CreateSnapshot()
}
// SetShardEnabled enables or disables a shard for reads and writes.
func (s *Store) SetShardEnabled(shardID uint64, enabled bool) error {
sh := s.Shard(shardID)
if sh == nil {
return ErrShardNotFound
}
sh.SetEnabled(enabled)
return nil
}
// DeleteShard removes a shard from disk.
func (s *Store) DeleteShard(shardID uint64) error {
sh := s.Shard(shardID)
if sh == nil {
return nil
}
if err := sh.Close(); err != nil {
return err
}
if err := os.RemoveAll(sh.path); err != nil {
return err
}
if err := os.RemoveAll(sh.walPath); err != nil {
return err
}
s.mu.Lock()
delete(s.shards, shardID)
s.mu.Unlock()
return nil
}
// ShardIteratorCreator returns an iterator creator for a shard.
func (s *Store) ShardIteratorCreator(id uint64, opt *influxql.SelectOptions) influxql.IteratorCreator {
sh := s.Shard(id)
if sh == nil {
return nil
}
return &shardIteratorCreator{
sh: sh,
maxSeriesN: opt.MaxSeriesN,
}
}
// DeleteDatabase will close all shards associated with a database and remove the directory and files from disk.
func (s *Store) DeleteDatabase(name string) error {
s.mu.RLock()
shards := s.filterShards(byDatabase(name))
s.mu.RUnlock()
if err := s.walkShards(shards, func(sh *Shard) error {
if sh.database != name {
return nil
}
return sh.Close()
}); err != nil {
return err
}
if err := os.RemoveAll(filepath.Join(s.path, name)); err != nil {
return err
}
if err := os.RemoveAll(filepath.Join(s.EngineOptions.Config.WALDir, name)); err != nil {
return err
}
s.mu.Lock()
for _, sh := range shards {
delete(s.shards, sh.id)
}
// Remove the database from the store's list of databases.
delete(s.databases, name)
s.mu.Unlock()
return nil
}
// DeleteRetentionPolicy will close all shards associated with the
// provided retention policy, remove the retention policy directories on
// both the DB and WAL, and remove all shard files from disk.
func (s *Store) DeleteRetentionPolicy(database, name string) error {
s.mu.RLock()
shards := s.filterShards(func(sh *Shard) bool {
return sh.database == database && sh.retentionPolicy == name
})
s.mu.RUnlock()
// Close and delete all shards under the retention policy on the
// database.
if err := s.walkShards(shards, func(sh *Shard) error {
if sh.database != database || sh.retentionPolicy != name {
return nil
}
return sh.Close()
}); err != nil {
return err
}
// Remove the retention policy folder.
if err := os.RemoveAll(filepath.Join(s.path, database, name)); err != nil {
return err
}
// Remove the retention policy folder from the WAL.
if err := os.RemoveAll(filepath.Join(s.EngineOptions.Config.WALDir, database, name)); err != nil {
return err
}
s.mu.Lock()
for _, sh := range shards {
delete(s.shards, sh.id)
}
s.mu.Unlock()
return nil
}
// DeleteMeasurement removes a measurement and all associated series from a database.
func (s *Store) DeleteMeasurement(database, name string) error {
s.mu.RLock()
shards := s.filterShards(byDatabase(database))
s.mu.RUnlock()
return s.walkShards(shards, func(sh *Shard) error {
if err := sh.DeleteMeasurement(name); err != nil {
return err
}
return nil
})
}
// filterShards returns a slice of shards where fn returns true
// for the shard. If the provided predicate is nil then all shards are returned.
func (s *Store) filterShards(fn func(sh *Shard) bool) []*Shard {
var shards []*Shard
if fn == nil {
shards = make([]*Shard, 0, len(s.shards))
fn = func(*Shard) bool { return true }
} else {
shards = make([]*Shard, 0)
}
for _, sh := range s.shards {
if fn(sh) {
shards = append(shards, sh)
}
}
return shards
}
// byDatabase provides a predicate for filterShards that matches on the name of
// the database passed in.
var byDatabase = func(name string) func(sh *Shard) bool {
return func(sh *Shard) bool {
return sh.database == name
}
}
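// Usage sketch (mirrors the callers above): filterShards reads s.shards, so
// the store's read lock must be held around the call. "db0" is a hypothetical
// database name.
//
//	s.mu.RLock()
//	shards := s.filterShards(byDatabase("db0"))
//	s.mu.RUnlock()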
// walkShards applies a function to each shard in parallel. If any of the
// functions return an error, the first error is returned.
func (s *Store) walkShards(shards []*Shard, fn func(sh *Shard) error) error {
// res holds the result of applying fn to a single shard in a goroutine.
type res struct {
err error
}
resC := make(chan res)
var n int
for _, sh := range shards {
n++
go func(sh *Shard) {
if err := fn(sh); err != nil {
resC <- res{err: fmt.Errorf("shard %d: %s", sh.id, err)}
return
}
resC <- res{}
}(sh)
}
var err error
for i := 0; i < n; i++ {
res := <-resC
if res.err != nil {
err = res.err
}
}
close(resC)
return err
}
// shardsSlice returns an ordered list of shards.
func (s *Store) shardsSlice() []*Shard {
a := make([]*Shard, 0, len(s.shards))
for _, sh := range s.shards {
a = append(a, sh)
}
sort.Sort(Shards(a))
return a
}
// Databases returns the names of all databases managed by the store.
func (s *Store) Databases() []string {
s.mu.RLock()
defer s.mu.RUnlock()
databases := make([]string, 0, len(s.databases))
for k := range s.databases {
databases = append(databases, k)
}
return databases
}
// DiskSize returns the size of all the shard files in bytes.
// This size does not include the WAL size.
func (s *Store) DiskSize() (int64, error) {
var size int64
s.mu.RLock()
allShards := s.filterShards(nil)
s.mu.RUnlock()
for _, sh := range allShards {
sz, err := sh.DiskSize()
if err != nil {
return 0, err
}
size += sz
}
return size, nil
}
// SeriesCardinality returns the series cardinality for the provided database.
func (s *Store) SeriesCardinality(database string) (int64, error) {
s.mu.RLock()
shards := s.filterShards(byDatabase(database))
s.mu.RUnlock()
var sketch estimator.Sketch
// Iterate over all shards for the database and combine all of the series
// sketches.
for _, shard := range shards {
other, err := shard.engine.SeriesSketch()
if err != nil {
return 0, err
}
if sketch == nil {
sketch = other
} else if err = sketch.Merge(other); err != nil {
return 0, err
}
}
if sketch != nil {
cnt, err := sketch.Count()
return int64(cnt), err
}
return 0, nil
}
// MeasurementsCardinality returns the measurement cardinality for the provided
// database.
func (s *Store) MeasurementsCardinality(database string) (int64, error) {
panic("TODO: edd")
}
// BackupShard will get the shard and have the engine back up all data modified
// since the passed-in time to the writer.
func (s *Store) BackupShard(id uint64, since time.Time, w io.Writer) error {
shard := s.Shard(id)
if shard == nil {
return fmt.Errorf("shard %d doesn't exist on this server", id)
}
path, err := relativePath(s.path, shard.path)
if err != nil {
return err
}
return shard.engine.Backup(w, path, since)
}
// RestoreShard restores a backup from r to a given shard.
// This will only overwrite files included in the backup.
func (s *Store) RestoreShard(id uint64, r io.Reader) error {
shard := s.Shard(id)
if shard == nil {
return fmt.Errorf("shard %d doesn't exist on this server", id)
}
path, err := relativePath(s.path, shard.path)
if err != nil {
return err
}
return shard.Restore(r, path)
}
// ShardRelativePath will return the relative path to the shard, i.e.,
// <database>/<retention>/<id>.
func (s *Store) ShardRelativePath(id uint64) (string, error) {
shard := s.Shard(id)
if shard == nil {
return "", fmt.Errorf("shard %d doesn't exist on this server", id)
}
return relativePath(s.path, shard.path)
}
// DeleteSeries loops through the local shards and deletes the series data for
// the passed in series keys.
func (s *Store) DeleteSeries(database string, sources []influxql.Source, condition influxql.Expr) error {
// Expand regex expressions in the FROM clause.
a, err := s.ExpandSources(sources)
if err != nil {
return err
} else if sources != nil && len(sources) != 0 && len(a) == 0 {
return nil
}
sources = a
// Determine deletion time range.
min, max, err := influxql.TimeRangeAsEpochNano(condition)
if err != nil {
return err
}
s.mu.RLock()
shards := s.filterShards(byDatabase(database))
s.mu.RUnlock()
mMap := make(map[string]*Measurement)
for _, shard := range shards {
shardMeasures := shard.Measurements()
for _, m := range shardMeasures {
mMap[m.Name] = m
}
}
s.mu.RLock()
defer s.mu.RUnlock()
measurements, err := measurementsFromSourcesOrDB(mMap, sources...)
if err != nil {
return err
}
var seriesKeys []string
for _, m := range measurements {
var ids SeriesIDs
var filters FilterExprs
if condition != nil {
// Get series IDs that match the WHERE clause.
ids, filters, err = m.walkWhereForSeriesIds(condition)
if err != nil {
return err
}
// Delete boolean literal true filter expressions.
// These are returned for `WHERE tagKey = 'tagVal'` type expressions and are okay.
filters.DeleteBoolLiteralTrues()
// Check for unsupported field filters.
// Any remaining filters means there were fields (e.g., `WHERE value = 1.2`).
if filters.Len() > 0 {
return errors.New("fields not supported in WHERE clause during deletion")
}
} else {
// No WHERE clause so get all series IDs for this measurement.
ids = m.seriesIDs
}
for _, id := range ids {
seriesKeys = append(seriesKeys, m.seriesByID[id].Key)
}
}
// delete the raw series data.
return s.walkShards(shards, func(sh *Shard) error {
if err := sh.DeleteSeriesRange(seriesKeys, min, max); err != nil {
return err
}
return nil
})
}
// ExpandSources expands sources against all local shards.
func (s *Store) ExpandSources(sources influxql.Sources) (influxql.Sources, error) {
return s.IteratorCreators().ExpandSources(sources)
}
// IteratorCreators returns a set of all local shards as iterator creators.
func (s *Store) IteratorCreators() influxql.IteratorCreators {
s.mu.RLock()
defer s.mu.RUnlock()
a := make(influxql.IteratorCreators, 0, len(s.shards))
for _, sh := range s.shards {
a = append(a, sh)
}
return a
}
// IteratorCreator returns a single iterator creator covering all of the given shard IDs.
func (s *Store) IteratorCreator(shards []uint64, opt *influxql.SelectOptions) (influxql.IteratorCreator, error) {
// Gather the iterator creator for each shard.
ics := make([]influxql.IteratorCreator, 0)
if err := func() error {
for _, id := range shards {
ic := s.ShardIteratorCreator(id, opt)
if ic == nil {
continue
}
ics = append(ics, ic)
}
return nil
}(); err != nil {
influxql.IteratorCreators(ics).Close()
return nil, err
}
return influxql.IteratorCreators(ics), nil
}
// WriteToShard writes a list of points to a shard identified by its ID.
func (s *Store) WriteToShard(shardID uint64, points []models.Point) error {
s.mu.RLock()
select {
case <-s.closing:
s.mu.RUnlock()
return ErrStoreClosed
default:
}
sh := s.shards[shardID]
if sh == nil {
s.mu.RUnlock()
return ErrShardNotFound
}
s.mu.RUnlock()
return sh.WritePoints(points)
}
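// Example (sketch, not part of the original source): writing a single
// line-protocol point to shard 1. It assumes models.ParsePointsString is
// available in the models package; error handling is abbreviated.
//
//	points, err := models.ParsePointsString(`cpu,host=server01 value=0.5`)
//	if err != nil {
//		// invalid line protocol
//	}
//	if err := s.WriteToShard(1, points); err != nil {
//		// e.g. ErrShardNotFound if shard 1 does not exist on this store
//	}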
// Measurements returns a slice of all measurements. Measurements accepts an
// optional condition expression. If cond is nil, then all measurements for the
// database will be returned.
func (s *Store) Measurements(database string, cond influxql.Expr) ([]string, error) {
s.mu.RLock()
shards := s.filterShards(byDatabase(database))
s.mu.RUnlock()
var m Measurements
for _, sh := range shards {
var mms Measurements
// Retrieve measurements from database index. Filter if condition specified.
if cond == nil {
mms = sh.Measurements()
} else {
var err error
mms, _, err = sh.MeasurementsByExpr(cond)
if err != nil {
return nil, err
}
}
m = append(m, mms...)
}
// Sort measurements by name.
sort.Sort(m)
measurements := make([]string, 0, len(m))
for _, mm := range m {
measurements = append(measurements, mm.Name)
}
return measurements, nil
}
// MeasurementSeriesCounts returns the number of measurements and series in all
// the shards' indices.
func (s *Store) MeasurementSeriesCounts(database string) (measurements int, series int) {
// TODO: implement me
return 0, 0
}
// TagValues holds the tag values found for a single measurement.
type TagValues struct {
Measurement string
Values []KeyValue
}
// TagValues returns the tag keys and values in the given database, matching the condition.
func (s *Store) TagValues(database string, cond influxql.Expr) ([]TagValues, error) {
if cond == nil {
return nil, errors.New("a condition is required")
}
measurementExpr := influxql.CloneExpr(cond)
measurementExpr = influxql.Reduce(influxql.RewriteExpr(measurementExpr, func(e influxql.Expr) influxql.Expr {
switch e := e.(type) {
case *influxql.BinaryExpr:
switch e.Op {
case influxql.EQ, influxql.NEQ, influxql.EQREGEX, influxql.NEQREGEX:
tag, ok := e.LHS.(*influxql.VarRef)
if !ok || tag.Val != "_name" {
return nil
}
}
}
return e
}), nil)
// Get all measurements for the shards we're interested in.
s.mu.RLock()
shards := s.filterShards(byDatabase(database))
s.mu.RUnlock()
var measures Measurements
for _, sh := range shards {
mms, ok, err := sh.MeasurementsByExpr(measurementExpr)
if err != nil {
return nil, err
} else if !ok {
// TODO(edd): can we simplify this so we don't have to check the
// ok value, and we can call sh.measurements with a shard filter
// instead?
mms = sh.Measurements()
}
measures = append(measures, mms...)
}
// If there are no measurements, return immediately.
if len(measures) == 0 {
return nil, nil
}
sort.Sort(measures)
filterExpr := influxql.CloneExpr(cond)
filterExpr = influxql.Reduce(influxql.RewriteExpr(filterExpr, func(e influxql.Expr) influxql.Expr {
switch e := e.(type) {
case *influxql.BinaryExpr:
switch e.Op {
case influxql.EQ, influxql.NEQ, influxql.EQREGEX, influxql.NEQREGEX:
tag, ok := e.LHS.(*influxql.VarRef)
if !ok || strings.HasPrefix(tag.Val, "_") {
return nil
}
}
}
return e
}), nil)
tagValues := make([]TagValues, len(measures))
for i, mm := range measures {
tagValues[i].Measurement = mm.Name
ids, err := mm.SeriesIDsAllOrByExpr(filterExpr)
if err != nil {
return nil, err
}
ss := mm.SeriesByIDSlice(ids)
// Determine a list of keys from condition.
keySet, ok, err := mm.TagKeysByExpr(cond)
if err != nil {
return nil, err
}
// Loop over all keys for each series.
m := make(map[KeyValue]struct{}, len(ss))
for _, series := range ss {
for _, t := range series.Tags {
if !ok {
// nop
} else if _, exists := keySet[string(t.Key)]; !exists {
continue
}
m[KeyValue{string(t.Key), string(t.Value)}] = struct{}{}
}
}
// Return an empty slice if there are no key/value matches.
if len(m) == 0 {
continue
}
// Sort key/value set.
a := make([]KeyValue, 0, len(m))
for kv := range m {
a = append(a, kv)
}
sort.Sort(KeyValues(a))
tagValues[i].Values = a
}
return tagValues, nil
}
// KeyValue holds a string key and a string value.
type KeyValue struct {
Key, Value string
}
// KeyValues is a sortable slice of KeyValue.
type KeyValues []KeyValue
// Len implements sort.Interface.
func (a KeyValues) Len() int { return len(a) }
// Swap implements sort.Interface.
func (a KeyValues) Swap(i, j int) { a[i], a[j] = a[j], a[i] }
// Less implements sort.Interface. Keys are compared before values.
func (a KeyValues) Less(i, j int) bool {
ki, kj := a[i].Key, a[j].Key
if ki == kj {
return a[i].Value < a[j].Value
}
return ki < kj
}
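// Example (sketch): KeyValues sorts by key first and then by value, so
//
//	a := KeyValues{{"region", "west"}, {"host", "b"}, {"host", "a"}}
//	sort.Sort(a)
//
// leaves a ordered as {host a}, {host b}, {region west}.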
// filterShowSeriesResult will limit the number of series returned based on the limit and the offset.
// Unlike limit and offset on SELECT statements, the limit and offset don't apply to the number of Rows, but
// to the number of total Values returned, since each Value represents a unique series.
func (s *Store) filterShowSeriesResult(limit, offset int, rows models.Rows) models.Rows {
var filteredSeries models.Rows
seriesCount := 0
for _, r := range rows {
var currentSeries [][]interface{}
// filter the values
for _, v := range r.Values {
if seriesCount >= offset && seriesCount-offset < limit {
currentSeries = append(currentSeries, v)
}
seriesCount++
}
// only add the row back in if there are some values in it
if len(currentSeries) > 0 {
r.Values = currentSeries
filteredSeries = append(filteredSeries, r)
if seriesCount > limit+offset {
return filteredSeries
}
}
}
return filteredSeries
}
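// Worked example (not in the original source): with offset=1 and limit=2, a
// first row holding values [v0 v1 v2] and a second row holding [v3 v4] filter
// down to a single row holding [v1 v2]; v0 is skipped by the offset and v3, v4
// fall outside the limit. The limit and offset count individual values
// (series) across all rows, not the rows themselves.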
// decodeStorePath extracts the database and retention policy names
// from a given shard or WAL path.
func decodeStorePath(shardOrWALPath string) (database, retentionPolicy string) {
// shardOrWALPath format: /maybe/absolute/base/then/:database/:retentionPolicy/:nameOfShardOrWAL
// Discard the last part of the path (the shard name or the wal name).
path, _ := filepath.Split(filepath.Clean(shardOrWALPath))
// Extract the database and retention policy.
path, rp := filepath.Split(filepath.Clean(path))
_, db := filepath.Split(filepath.Clean(path))
return db, rp
}
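// Example (sketch, hypothetical path): for a shard directory such as
// "/var/lib/influxdb/data/db0/rp0/1", decodeStorePath returns ("db0", "rp0");
// the trailing shard (or WAL) directory name is discarded.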
// relativePath will expand out the full paths passed in and return
// the relative shard path from the store
func relativePath(storePath, shardPath string) (string, error) {
path, err := filepath.Abs(storePath)
if err != nil {
return "", fmt.Errorf("store abs path: %s", err)
}
fp, err := filepath.Abs(shardPath)
if err != nil {
return "", fmt.Errorf("file abs path: %s", err)
}
name, err := filepath.Rel(path, fp)
if err != nil {
return "", fmt.Errorf("file rel path: %s", err)
}
return name, nil
}
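// Example (sketch, hypothetical paths):
//
//	relativePath("/var/lib/influxdb/data", "/var/lib/influxdb/data/db0/rp0/1")
//
// returns "db0/rp0/1", the <database>/<retention>/<id> form used by
// BackupShard, RestoreShard and ShardRelativePath above.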
// measurementsFromSourcesOrDB returns a list of measurements from the
// sources passed in or, if sources is empty, a list of all
// measurements from the measurement map passed in that have at least one series.
func measurementsFromSourcesOrDB(measurements map[string]*Measurement, sources ...influxql.Source) (Measurements, error) {
var all Measurements
if len(sources) > 0 {
for _, source := range sources {
if m, ok := source.(*influxql.Measurement); ok {
measurement := measurements[m.Name]
if measurement == nil {
continue
}
all = append(all, measurement)
} else {
return nil, errors.New("identifiers in FROM clause must be measurement names")
}
}
} else {
// No measurements specified in FROM clause so get all measurements that have series.
for _, m := range measurements {
if m.HasSeries() {
all = append(all, m)
}
}
}
sort.Sort(all)
return all, nil
}