2021-04-19 05:50:12 +00:00
|
|
|
// Copyright (C) 2019-2020 Zilliz. All rights reserved.
|
|
|
|
//
|
|
|
|
// Licensed under the Apache License, Version 2.0 (the "License"); you may not use this file except in compliance
|
|
|
|
// with the License. You may obtain a copy of the License at
|
|
|
|
//
|
|
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
//
|
|
|
|
// Unless required by applicable law or agreed to in writing, software distributed under the License
|
|
|
|
// is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express
|
|
|
|
// or implied. See the License for the specific language governing permissions and limitations under the License.
|
|
|
|
|
2021-01-15 06:38:36 +00:00
|
|
|
package indexnode
|
2020-12-10 09:55:55 +00:00
|
|
|
|
|
|
|
import (
|
|
|
|
"container/list"
|
|
|
|
"context"
|
2021-03-08 02:09:48 +00:00
|
|
|
"errors"
|
2020-12-10 09:55:55 +00:00
|
|
|
"sync"
|
|
|
|
|
2021-03-10 01:56:09 +00:00
|
|
|
"go.uber.org/zap"
|
|
|
|
|
2021-04-22 06:45:57 +00:00
|
|
|
"github.com/milvus-io/milvus/internal/kv"
|
|
|
|
"github.com/milvus-io/milvus/internal/log"
|
|
|
|
"github.com/milvus-io/milvus/internal/util/trace"
|
2021-02-23 01:58:06 +00:00
|
|
|
"github.com/opentracing/opentracing-go"
|
|
|
|
oplog "github.com/opentracing/opentracing-go/log"
|
2020-12-10 09:55:55 +00:00
|
|
|
)
|
|
|
|
|
2021-10-03 02:15:56 +00:00
|
|
|
// TaskQueue is a queue used to store tasks.
|
2020-12-10 09:55:55 +00:00
|
|
|
type TaskQueue interface {
|
|
|
|
utChan() <-chan int
|
|
|
|
utEmpty() bool
|
|
|
|
utFull() bool
|
|
|
|
addUnissuedTask(t task) error
|
2021-07-23 02:44:12 +00:00
|
|
|
//FrontUnissuedTask() task
|
2020-12-10 09:55:55 +00:00
|
|
|
PopUnissuedTask() task
|
|
|
|
AddActiveTask(t task)
|
|
|
|
PopActiveTask(tID UniqueID) task
|
|
|
|
Enqueue(t task) error
|
2021-07-23 02:44:12 +00:00
|
|
|
//tryToRemoveUselessIndexBuildTask(indexID UniqueID) []UniqueID
|
2020-12-10 09:55:55 +00:00
|
|
|
}
|
|
|
|
|
2021-10-03 02:15:56 +00:00
|
|
|
// BaseTaskQueue is a basic instance of TaskQueue.
|
2020-12-10 09:55:55 +00:00
|
|
|
type BaseTaskQueue struct {
|
|
|
|
unissuedTasks *list.List
|
|
|
|
activeTasks map[UniqueID]task
|
|
|
|
utLock sync.Mutex
|
|
|
|
atLock sync.Mutex
|
|
|
|
|
|
|
|
// maxTaskNum should keep still
|
|
|
|
maxTaskNum int64
|
|
|
|
|
|
|
|
utBufChan chan int // to block scheduler
|
|
|
|
|
|
|
|
sched *TaskScheduler
|
|
|
|
}
|
|
|
|
|
|
|
|
func (queue *BaseTaskQueue) utChan() <-chan int {
|
|
|
|
return queue.utBufChan
|
|
|
|
}
|
|
|
|
|
|
|
|
func (queue *BaseTaskQueue) utEmpty() bool {
|
|
|
|
return queue.unissuedTasks.Len() == 0
|
|
|
|
}
|
|
|
|
|
|
|
|
func (queue *BaseTaskQueue) utFull() bool {
|
|
|
|
return int64(queue.unissuedTasks.Len()) >= queue.maxTaskNum
|
|
|
|
}
|
|
|
|
|
|
|
|
func (queue *BaseTaskQueue) addUnissuedTask(t task) error {
|
|
|
|
queue.utLock.Lock()
|
|
|
|
defer queue.utLock.Unlock()
|
|
|
|
|
|
|
|
if queue.utFull() {
|
2021-06-06 01:41:35 +00:00
|
|
|
return errors.New("IndexNode task queue is full")
|
2020-12-10 09:55:55 +00:00
|
|
|
}
|
|
|
|
queue.unissuedTasks.PushBack(t)
|
|
|
|
queue.utBufChan <- 1
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2021-07-23 02:44:12 +00:00
|
|
|
//func (queue *BaseTaskQueue) FrontUnissuedTask() task {
|
|
|
|
// queue.utLock.Lock()
|
|
|
|
// defer queue.utLock.Unlock()
|
|
|
|
//
|
|
|
|
// if queue.unissuedTasks.Len() <= 0 {
|
|
|
|
// log.Debug("IndexNode FrontUnissuedTask sorry, but the unissued task list is empty!")
|
|
|
|
// return nil
|
|
|
|
// }
|
|
|
|
//
|
|
|
|
// return queue.unissuedTasks.Front().Value.(task)
|
|
|
|
//}
|
2020-12-10 09:55:55 +00:00
|
|
|
|
2021-10-03 02:15:56 +00:00
|
|
|
// PopUnissuedTask pops a task from tasks queue.
|
2020-12-10 09:55:55 +00:00
|
|
|
func (queue *BaseTaskQueue) PopUnissuedTask() task {
|
|
|
|
queue.utLock.Lock()
|
|
|
|
defer queue.utLock.Unlock()
|
|
|
|
|
|
|
|
if queue.unissuedTasks.Len() <= 0 {
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
|
|
|
ft := queue.unissuedTasks.Front()
|
|
|
|
queue.unissuedTasks.Remove(ft)
|
|
|
|
|
|
|
|
return ft.Value.(task)
|
|
|
|
}
|
|
|
|
|
2021-10-03 02:15:56 +00:00
|
|
|
// AddActiveTask adds a task to activeTasks.
|
2020-12-10 09:55:55 +00:00
|
|
|
func (queue *BaseTaskQueue) AddActiveTask(t task) {
|
|
|
|
queue.atLock.Lock()
|
|
|
|
defer queue.atLock.Unlock()
|
|
|
|
|
|
|
|
tID := t.ID()
|
|
|
|
_, ok := queue.activeTasks[tID]
|
|
|
|
if ok {
|
2021-10-13 02:54:33 +00:00
|
|
|
log.Debug("IndexNode task already in active task list", zap.Any("TaskID", tID))
|
2020-12-10 09:55:55 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
queue.activeTasks[tID] = t
|
|
|
|
}
|
|
|
|
|
2021-10-03 02:15:56 +00:00
|
|
|
// PopActiveTask tasks out a task from activateTask and the task will be executed.
|
2020-12-10 09:55:55 +00:00
|
|
|
func (queue *BaseTaskQueue) PopActiveTask(tID UniqueID) task {
|
|
|
|
queue.atLock.Lock()
|
|
|
|
defer queue.atLock.Unlock()
|
|
|
|
|
|
|
|
t, ok := queue.activeTasks[tID]
|
|
|
|
if ok {
|
|
|
|
delete(queue.activeTasks, tID)
|
|
|
|
return t
|
|
|
|
}
|
2021-10-13 02:54:33 +00:00
|
|
|
log.Debug("IndexNode task was not found in the active task list", zap.Any("TaskID", tID))
|
2020-12-10 09:55:55 +00:00
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2021-07-23 02:44:12 +00:00
|
|
|
//func (queue *BaseTaskQueue) tryToRemoveUselessIndexBuildTask(indexID UniqueID) []UniqueID {
|
|
|
|
// queue.utLock.Lock()
|
|
|
|
// defer queue.utLock.Unlock()
|
|
|
|
//
|
|
|
|
// var next *list.Element
|
|
|
|
// var indexBuildIDs []UniqueID
|
|
|
|
// for e := queue.unissuedTasks.Front(); e != nil; e = next {
|
|
|
|
// next = e.Next()
|
|
|
|
// indexBuildTask, ok := e.Value.(*IndexBuildTask)
|
|
|
|
// if !ok {
|
|
|
|
// continue
|
|
|
|
// }
|
|
|
|
// if indexBuildTask.req.IndexID == indexID {
|
|
|
|
// indexBuildIDs = append(indexBuildIDs, indexBuildTask.req.IndexBuildID)
|
|
|
|
// queue.unissuedTasks.Remove(e)
|
|
|
|
// indexBuildTask.Notify(nil)
|
|
|
|
// }
|
|
|
|
// }
|
|
|
|
// return indexBuildIDs
|
|
|
|
//}
|
2021-02-23 03:57:18 +00:00
|
|
|
|
2021-10-03 02:15:56 +00:00
|
|
|
// Enqueue adds a task to TaskQueue.
|
2020-12-10 09:55:55 +00:00
|
|
|
func (queue *BaseTaskQueue) Enqueue(t task) error {
|
2020-12-12 22:48:05 +00:00
|
|
|
err := t.OnEnqueue()
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
2020-12-10 09:55:55 +00:00
|
|
|
return queue.addUnissuedTask(t)
|
|
|
|
}
|
|
|
|
|
2021-10-03 02:15:56 +00:00
|
|
|
// IndexBuildTaskQueue is a task queue used to store building index tasks.
|
2020-12-10 09:55:55 +00:00
|
|
|
type IndexBuildTaskQueue struct {
|
|
|
|
BaseTaskQueue
|
|
|
|
}
|
|
|
|
|
2021-10-03 02:15:56 +00:00
|
|
|
// NewIndexBuildTaskQueue creates a new IndexBuildTaskQueue.
|
2020-12-10 09:55:55 +00:00
|
|
|
func NewIndexBuildTaskQueue(sched *TaskScheduler) *IndexBuildTaskQueue {
|
|
|
|
return &IndexBuildTaskQueue{
|
|
|
|
BaseTaskQueue: BaseTaskQueue{
|
|
|
|
unissuedTasks: list.New(),
|
|
|
|
activeTasks: make(map[UniqueID]task),
|
|
|
|
maxTaskNum: 1024,
|
|
|
|
utBufChan: make(chan int, 1024),
|
|
|
|
sched: sched,
|
|
|
|
},
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2021-10-03 02:15:56 +00:00
|
|
|
// TaskScheduler is a scheduler of indexing tasks.
|
2020-12-10 09:55:55 +00:00
|
|
|
type TaskScheduler struct {
|
|
|
|
IndexBuildQueue TaskQueue
|
|
|
|
|
2021-01-26 01:38:40 +00:00
|
|
|
buildParallel int
|
2021-04-12 10:09:28 +00:00
|
|
|
kv kv.BaseKV
|
2021-01-26 01:38:40 +00:00
|
|
|
wg sync.WaitGroup
|
|
|
|
ctx context.Context
|
|
|
|
cancel context.CancelFunc
|
2020-12-10 09:55:55 +00:00
|
|
|
}
|
|
|
|
|
2021-10-03 02:15:56 +00:00
|
|
|
// NewTaskScheduler creates a new task scheduler of indexing tasks.
|
2020-12-10 09:55:55 +00:00
|
|
|
func NewTaskScheduler(ctx context.Context,
|
2021-04-12 10:09:28 +00:00
|
|
|
kv kv.BaseKV) (*TaskScheduler, error) {
|
2020-12-10 09:55:55 +00:00
|
|
|
ctx1, cancel := context.WithCancel(ctx)
|
|
|
|
s := &TaskScheduler{
|
2021-01-26 01:38:40 +00:00
|
|
|
kv: kv,
|
|
|
|
ctx: ctx1,
|
|
|
|
cancel: cancel,
|
|
|
|
buildParallel: 1, // default value
|
2020-12-10 09:55:55 +00:00
|
|
|
}
|
|
|
|
s.IndexBuildQueue = NewIndexBuildTaskQueue(s)
|
|
|
|
|
|
|
|
return s, nil
|
|
|
|
}
|
|
|
|
|
2021-09-09 09:09:08 +00:00
|
|
|
//func (sched *TaskScheduler) setParallelism(parallel int) {
|
|
|
|
// if parallel <= 0 {
|
|
|
|
// log.Debug("IndexNode can not set parallelism to less than zero!")
|
|
|
|
// return
|
|
|
|
// }
|
|
|
|
// sched.buildParallel = parallel
|
|
|
|
//}
|
2020-12-10 09:55:55 +00:00
|
|
|
|
2021-01-26 01:38:40 +00:00
|
|
|
func (sched *TaskScheduler) scheduleIndexBuildTask() []task {
|
|
|
|
ret := make([]task, 0)
|
|
|
|
for i := 0; i < sched.buildParallel; i++ {
|
|
|
|
t := sched.IndexBuildQueue.PopUnissuedTask()
|
|
|
|
if t == nil {
|
|
|
|
return ret
|
|
|
|
}
|
|
|
|
ret = append(ret, t)
|
|
|
|
}
|
|
|
|
return ret
|
2020-12-10 09:55:55 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
func (sched *TaskScheduler) processTask(t task, q TaskQueue) {
|
2021-02-23 01:58:06 +00:00
|
|
|
span, ctx := trace.StartSpanFromContext(t.Ctx(),
|
|
|
|
opentracing.Tags{
|
|
|
|
"Type": t.Name(),
|
|
|
|
"ID": t.ID(),
|
|
|
|
})
|
2021-02-27 02:45:03 +00:00
|
|
|
|
2021-02-23 01:58:06 +00:00
|
|
|
defer span.Finish()
|
|
|
|
span.LogFields(oplog.Int64("scheduler process PreExecute", t.ID()))
|
|
|
|
err := t.PreExecute(ctx)
|
2021-02-27 02:45:03 +00:00
|
|
|
t.SetError(err)
|
2020-12-10 09:55:55 +00:00
|
|
|
|
|
|
|
defer func() {
|
2021-02-27 02:45:03 +00:00
|
|
|
span.LogFields(oplog.Int64("scheduler process PostExecute", t.ID()))
|
|
|
|
err := t.PostExecute(ctx)
|
|
|
|
t.SetError(err)
|
2020-12-10 09:55:55 +00:00
|
|
|
}()
|
2021-02-27 02:45:03 +00:00
|
|
|
|
2020-12-10 09:55:55 +00:00
|
|
|
if err != nil {
|
2021-02-23 01:58:06 +00:00
|
|
|
trace.LogError(span, err)
|
2020-12-10 09:55:55 +00:00
|
|
|
return
|
|
|
|
}
|
|
|
|
|
2021-02-23 01:58:06 +00:00
|
|
|
span.LogFields(oplog.Int64("scheduler process AddActiveTask", t.ID()))
|
2020-12-10 09:55:55 +00:00
|
|
|
q.AddActiveTask(t)
|
2021-02-27 02:45:03 +00:00
|
|
|
|
2021-01-23 12:58:46 +00:00
|
|
|
// log.Printf("task add to active list ...")
|
2020-12-10 09:55:55 +00:00
|
|
|
defer func() {
|
2021-02-23 01:58:06 +00:00
|
|
|
span.LogFields(oplog.Int64("scheduler process PopActiveTask", t.ID()))
|
2020-12-10 09:55:55 +00:00
|
|
|
q.PopActiveTask(t.ID())
|
2021-01-23 12:58:46 +00:00
|
|
|
// log.Printf("pop from active list ...")
|
2020-12-10 09:55:55 +00:00
|
|
|
}()
|
|
|
|
|
2021-02-23 01:58:06 +00:00
|
|
|
span.LogFields(oplog.Int64("scheduler process Execute", t.ID()))
|
|
|
|
err = t.Execute(ctx)
|
2021-02-27 02:45:03 +00:00
|
|
|
t.SetError(err)
|
2020-12-10 09:55:55 +00:00
|
|
|
}
|
|
|
|
|
2020-12-12 22:48:05 +00:00
|
|
|
func (sched *TaskScheduler) indexBuildLoop() {
|
2021-06-06 01:41:35 +00:00
|
|
|
log.Debug("IndexNode TaskScheduler start build loop ...")
|
2020-12-10 09:55:55 +00:00
|
|
|
defer sched.wg.Done()
|
|
|
|
for {
|
|
|
|
select {
|
|
|
|
case <-sched.ctx.Done():
|
|
|
|
return
|
|
|
|
case <-sched.IndexBuildQueue.utChan():
|
|
|
|
if !sched.IndexBuildQueue.utEmpty() {
|
2021-01-26 01:38:40 +00:00
|
|
|
tasks := sched.scheduleIndexBuildTask()
|
|
|
|
var wg sync.WaitGroup
|
|
|
|
for _, t := range tasks {
|
|
|
|
wg.Add(1)
|
|
|
|
go func(group *sync.WaitGroup, t task) {
|
|
|
|
defer group.Done()
|
|
|
|
sched.processTask(t, sched.IndexBuildQueue)
|
|
|
|
}(&wg, t)
|
|
|
|
}
|
|
|
|
wg.Wait()
|
2020-12-10 09:55:55 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2021-10-03 02:15:56 +00:00
|
|
|
// Start stats the task scheduler of indexing tasks.
|
2020-12-10 09:55:55 +00:00
|
|
|
func (sched *TaskScheduler) Start() error {
|
|
|
|
|
2020-12-12 22:48:05 +00:00
|
|
|
sched.wg.Add(1)
|
|
|
|
go sched.indexBuildLoop()
|
2020-12-10 09:55:55 +00:00
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2021-10-03 02:15:56 +00:00
|
|
|
// Close closes the task scheduler of indexing tasks.
|
2020-12-10 09:55:55 +00:00
|
|
|
func (sched *TaskScheduler) Close() {
|
|
|
|
sched.cancel()
|
|
|
|
sched.wg.Wait()
|
|
|
|
}
|