// Copyright 2023 PingCAP, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

package scheduler

import (
	"context"
	"sync"
	"sync/atomic"
	"time"

	"github.com/pingcap/errors"
	"github.com/pingcap/failpoint"
	"github.com/pingcap/tidb/config"
	"github.com/pingcap/tidb/disttask/framework/proto"
	"github.com/pingcap/tidb/domain/infosync"
	"github.com/pingcap/tidb/resourcemanager/pool/spool"
	"github.com/pingcap/tidb/resourcemanager/util"
	"github.com/pingcap/tidb/util/logutil"
	"go.uber.org/zap"
)

var (
	schedulerPoolSize       int32 = 4
	subtaskExecutorPoolSize int32 = 10
	// same as dispatcher
	checkTime        = 300 * time.Millisecond
	retrySQLTimes    = 3
	retrySQLInterval = 500 * time.Millisecond
)
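
// Note: subtaskExecutorPoolSize is only the default; a task type registered
// with a positive PoolSize option gets an executor pool of that size instead
// (see BuildManager below).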

// ManagerBuilder is used to build a Manager.
type ManagerBuilder struct {
	newPool func(name string, size int32, component util.Component, options ...spool.Option) (Pool, error)
}

// NewManagerBuilder creates a new ManagerBuilder.
func NewManagerBuilder() *ManagerBuilder {
	return &ManagerBuilder{
		newPool: func(name string, size int32, component util.Component, options ...spool.Option) (Pool, error) {
			return spool.NewPool(name, size, component, options...)
		},
	}
}

// setPoolFactory sets the poolFactory to mock the Pool in unit tests.
func (b *ManagerBuilder) setPoolFactory(poolFactory func(name string, size int32, component util.Component, options ...spool.Option) (Pool, error)) {
	b.newPool = poolFactory
}

// Manager monitors the global task table and manages the schedulers.
type Manager struct {
	taskTable     TaskTable
	schedulerPool Pool
	// taskType -> subtaskExecutorPool
	// shared by subtasks of all task steps
	subtaskExecutorPools map[string]Pool
	mu                   struct {
		sync.RWMutex
		// taskID -> cancelFunc.
		// cancelFunc is used to fast cancel the scheduler.Run.
		handlingTasks map[int64]context.CancelFunc
	}
	// id is currently the same as the server id, i.e. host:port.
	id      string
	wg      sync.WaitGroup
	ctx     context.Context
	cancel  context.CancelFunc
	logCtx  context.Context
	newPool func(name string, size int32, component util.Component, options ...spool.Option) (Pool, error)
}
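
// Concurrency model, as wired in BuildManager and onRunnableTasks below:
// schedulerPool runs one onRunnableTask goroutine per task this node has
// claimed, while each registered task type gets its own subtask executor pool
// that is shared by the subtasks of every step of tasks of that type.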

// BuildManager builds a Manager.
func (b *ManagerBuilder) BuildManager(ctx context.Context, id string, taskTable TaskTable) (*Manager, error) {
	m := &Manager{
		id:                   id,
		taskTable:            taskTable,
		subtaskExecutorPools: make(map[string]Pool),
		logCtx:               logutil.WithKeyValue(context.Background(), "dist_task_manager", id),
		newPool:              b.newPool,
	}
	m.ctx, m.cancel = context.WithCancel(ctx)
	m.mu.handlingTasks = make(map[int64]context.CancelFunc)

	schedulerPool, err := m.newPool("scheduler_pool", schedulerPoolSize, util.DistTask)
	if err != nil {
		return nil, err
	}
	m.schedulerPool = schedulerPool

	for taskType, opt := range taskTypes {
		poolSize := subtaskExecutorPoolSize
		if opt.PoolSize > 0 {
			poolSize = opt.PoolSize
		}
		subtaskExecutorPool, err := m.newPool(taskType+"_pool", poolSize, util.DistTask)
		if err != nil {
			return nil, err
		}
		m.subtaskExecutorPools[taskType] = subtaskExecutorPool
	}
	return m, nil
}
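
// A minimal usage sketch (hypothetical caller code, for illustration only;
// serverID and taskTable are assumed to be supplied by whatever owns the
// manager's lifecycle):
//
//	m, err := NewManagerBuilder().BuildManager(ctx, serverID, taskTable)
//	if err != nil {
//		return err
//	}
//	if err := m.Start(); err != nil {
//		return err
//	}
//	defer m.Stop()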

// Start starts the Manager.
func (m *Manager) Start() error {
	logutil.Logger(m.logCtx).Debug("manager start")
	var err error
	for i := 0; i < retrySQLTimes; i++ {
		err = m.taskTable.StartManager(m.id, config.GetGlobalConfig().Instance.TiDBServiceScope)
		if err == nil {
			break
		}
		if i%10 == 0 {
			logutil.Logger(m.logCtx).Warn("start manager failed",
				zap.String("scope", config.GetGlobalConfig().Instance.TiDBServiceScope),
				zap.Int("retry times", retrySQLTimes),
				zap.Error(err))
		}
		time.Sleep(retrySQLInterval)
	}
	if err != nil {
		return err
	}

	m.wg.Add(1)
	go func() {
		defer m.wg.Done()
		m.fetchAndHandleRunnableTasks(m.ctx)
	}()

	m.wg.Add(1)
	go func() {
		defer m.wg.Done()
		m.fetchAndFastCancelTasks(m.ctx)
	}()
	return nil
}

// Stop stops the Manager.
func (m *Manager) Stop() {
	m.cancel()
	for _, pool := range m.subtaskExecutorPools {
		pool.ReleaseAndWait()
	}
	m.schedulerPool.ReleaseAndWait()
	m.wg.Wait()
}
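
// Shutdown sequence, as coded in Stop above: canceling the manager context
// makes both fetch loops return (and cancelAllRunningTasks fire), then the
// subtask executor pools and the scheduler pool are drained, and finally the
// two fetch goroutines are waited for.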

// fetchAndHandleRunnableTasks fetches the runnable tasks from the global task table and handles them.
func (m *Manager) fetchAndHandleRunnableTasks(ctx context.Context) {
	ticker := time.NewTicker(checkTime)
	defer ticker.Stop()
	for {
		select {
		case <-ctx.Done():
			logutil.Logger(m.logCtx).Info("fetchAndHandleRunnableTasks done")
			return
		case <-ticker.C:
			tasks, err := m.taskTable.GetGlobalTasksInStates(proto.TaskStateRunning, proto.TaskStateReverting)
			if err != nil {
				m.onError(err)
				continue
			}
			m.onRunnableTasks(ctx, tasks)
		}
	}
}

// fetchAndFastCancelTasks fetches the reverting tasks from the global task table and fast-cancels them.
func (m *Manager) fetchAndFastCancelTasks(ctx context.Context) {
	ticker := time.NewTicker(checkTime)
	defer ticker.Stop()
	for {
		select {
		case <-ctx.Done():
			m.cancelAllRunningTasks()
			logutil.Logger(m.logCtx).Info("fetchAndFastCancelTasks done")
			return
		case <-ticker.C:
			tasks, err := m.taskTable.GetGlobalTasksInStates(proto.TaskStateReverting)
			if err != nil {
				m.onError(err)
				continue
			}
			m.onCanceledTasks(ctx, tasks)
		}
	}
}
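
// Note that both polling loops above run at checkTime, and that a reverting
// task is seen by both of them: onRunnableTasks (re)dispatches a scheduler
// that will eventually call Rollback, while onCanceledTasks only cancels a
// scheduler.Run that is still in flight for that task.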

// onRunnableTasks handles runnable tasks.
func (m *Manager) onRunnableTasks(ctx context.Context, tasks []*proto.Task) {
	tasks = m.filterAlreadyHandlingTasks(tasks)
	for _, task := range tasks {
		if _, ok := m.subtaskExecutorPools[task.Type]; !ok {
			logutil.Logger(m.logCtx).Error("unknown task type", zap.String("type", task.Type))
			continue
		}
		exist, err := m.taskTable.HasSubtasksInStates(m.id, task.ID, task.Step, proto.TaskStatePending, proto.TaskStateRevertPending)
		if err != nil {
			logutil.Logger(m.logCtx).Error("check subtask exist failed", zap.Error(err))
			m.onError(err)
			continue
		}
		if !exist {
			continue
		}
		logutil.Logger(m.logCtx).Info("detect new subtask", zap.Any("task_id", task.ID))
		m.addHandlingTask(task.ID)
		// copy the loop variable so the asynchronously executed closure below
		// does not observe a later iteration's task.
		t := task
		err = m.schedulerPool.Run(func() {
			m.onRunnableTask(ctx, t.ID, t.Type)
			m.removeHandlingTask(t.ID)
		})
		// pool closed.
		if err != nil {
			m.removeHandlingTask(task.ID)
			m.onError(err)
			return
		}
	}
}

// onCanceledTasks fast-cancels the running schedulers of the given (reverting) tasks.
func (m *Manager) onCanceledTasks(_ context.Context, tasks []*proto.Task) {
	m.mu.RLock()
	defer m.mu.RUnlock()
	for _, task := range tasks {
		logutil.Logger(m.logCtx).Info("onCanceledTasks", zap.Any("task_id", task.ID))
		if cancel, ok := m.mu.handlingTasks[task.ID]; ok && cancel != nil {
			cancel()
		}
	}
}

// cancelAllRunningTasks cancels all running tasks.
func (m *Manager) cancelAllRunningTasks() {
	m.mu.RLock()
	defer m.mu.RUnlock()
	for id, cancel := range m.mu.handlingTasks {
		logutil.Logger(m.logCtx).Info("cancelAllRunningTasks", zap.Any("task_id", id))
		if cancel != nil {
			cancel()
		}
	}
}

// filterAlreadyHandlingTasks filters out the tasks that are already being
// handled by this manager and returns the remaining ones, reusing the backing
// array of the input slice.
func (m *Manager) filterAlreadyHandlingTasks(tasks []*proto.Task) []*proto.Task {
	m.mu.RLock()
	defer m.mu.RUnlock()
	var i int
	for _, task := range tasks {
		if _, ok := m.mu.handlingTasks[task.ID]; !ok {
			tasks[i] = task
			i++
		}
	}
	return tasks[:i]
}

// TestContext is only used in tests.
type TestContext struct {
	TestSyncSubtaskRun chan struct{}
	mockDown           atomic.Bool
}

var testContexts sync.Map

// onRunnableTask handles a runnable task.
func (m *Manager) onRunnableTask(ctx context.Context, taskID int64, taskType string) {
	logutil.Logger(m.logCtx).Info("onRunnableTask", zap.Any("task_id", taskID), zap.Any("type", taskType))
	if _, ok := m.subtaskExecutorPools[taskType]; !ok {
		m.onError(errors.Errorf("task type %s not found", taskType))
		return
	}
	factory := getSchedulerFactory(taskType)
	if factory == nil {
		m.onError(errors.Errorf("task type %s not found", taskType))
		return
	}
	scheduler := factory(ctx, m.id, taskID, m.taskTable, m.subtaskExecutorPools[taskType])

	for {
		select {
		case <-ctx.Done():
			return
		case <-time.After(checkTime):
		}
		failpoint.Inject("mockStopManager", func() {
			testContexts.Store(m.id, &TestContext{make(chan struct{}), atomic.Bool{}})
			go func() {
				v, ok := testContexts.Load(m.id)
				if ok {
					<-v.(*TestContext).TestSyncSubtaskRun
					_ = infosync.MockGlobalServerInfoManagerEntry.DeleteByID(m.id)
					m.Stop()
				}
			}()
		})
		task, err := m.taskTable.GetGlobalTaskByID(taskID)
		if err != nil {
			m.onError(err)
			return
		}
		if task.State != proto.TaskStateRunning && task.State != proto.TaskStateReverting {
			logutil.Logger(m.logCtx).Info("onRunnableTask exit",
				zap.Any("task_id", taskID), zap.Int64("step", task.Step), zap.Any("state", task.State))
			return
		}
		if exist, err := m.taskTable.HasSubtasksInStates(m.id, task.ID, task.Step, proto.TaskStatePending, proto.TaskStateRevertPending); err != nil {
			m.onError(err)
			return
		} else if !exist {
			continue
		}
		switch task.State {
		case proto.TaskStateRunning:
			// runCtx is only used in scheduler.Run; it is canceled by the fast-cancel
			// path (onCanceledTasks, driven by fetchAndFastCancelTasks).
			runCtx, runCancel := context.WithCancel(ctx)
			m.registerCancelFunc(task.ID, runCancel)
			err = scheduler.Run(runCtx, task)
			runCancel()
		case proto.TaskStateReverting:
			err = scheduler.Rollback(ctx, task)
		}
		if err != nil {
			logutil.Logger(m.logCtx).Error("failed to handle task", zap.Error(err))
		}
	}
}
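
// The three helpers below maintain m.mu.handlingTasks: addHandlingTask marks a
// task as claimed with a nil cancel func, registerCancelFunc swaps in the real
// cancel func once scheduler.Run starts, and removeHandlingTask drops the entry
// when the scheduler goroutine finishes (or fails to be submitted).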

// addHandlingTask adds a task to the handling task set.
func (m *Manager) addHandlingTask(id int64) {
	m.mu.Lock()
	defer m.mu.Unlock()
	m.mu.handlingTasks[id] = nil
}

// registerCancelFunc registers a cancel function for a task.
func (m *Manager) registerCancelFunc(id int64, cancel context.CancelFunc) {
	m.mu.Lock()
	defer m.mu.Unlock()
	m.mu.handlingTasks[id] = cancel
}

// removeHandlingTask removes a task from the handling task set.
func (m *Manager) removeHandlingTask(id int64) {
	m.mu.Lock()
	defer m.mu.Unlock()
	delete(m.mu.handlingTasks, id)
}

// onError handles the error.
func (m *Manager) onError(err error) {
	if err == nil {
		return
	}
	logutil.Logger(m.logCtx).Error("task manager error", zap.Error(err))
}