279 lines
12 KiB
Go
279 lines
12 KiB
Go
// Copyright 2015 PingCAP, Inc.
|
|
//
|
|
// Licensed under the Apache License, Version 2.0 (the "License");
|
|
// you may not use this file except in compliance with the License.
|
|
// You may obtain a copy of the License at
|
|
//
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
//
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
// See the License for the specific language governing permissions and
|
|
// limitations under the License.
|
|
|
|
// Copyright 2013 The ql Authors. All rights reserved.
|
|
// Use of this source code is governed by a BSD-style
|
|
// license that can be found in the LICENSES/QL-LICENSE file.
|
|
|
|
package table
|
|
|
|
import (
|
|
"context"
|
|
"time"
|
|
|
|
"github.com/opentracing/opentracing-go"
|
|
mysql "github.com/pingcap/tidb/errno"
|
|
"github.com/pingcap/tidb/kv"
|
|
"github.com/pingcap/tidb/meta/autoid"
|
|
"github.com/pingcap/tidb/parser/model"
|
|
"github.com/pingcap/tidb/sessionctx"
|
|
"github.com/pingcap/tidb/types"
|
|
"github.com/pingcap/tidb/util/dbterror"
|
|
"github.com/pingcap/tidb/util/sqlexec"
|
|
)
|
|
|
|
// Type is used to distinguish between different tables that store data in different ways.
|
|
type Type int16
|
|
|
|
const (
|
|
// NormalTable stores data in tikv, mocktikv and so on.
|
|
NormalTable Type = iota
|
|
// VirtualTable stores no data, just extract data from the memory struct.
|
|
VirtualTable
|
|
// ClusterTable contains the `VirtualTable` in the all cluster tidb nodes.
|
|
ClusterTable
|
|
)
|
|
|
|
// IsNormalTable checks whether the table is a normal table type.
|
|
func (tp Type) IsNormalTable() bool {
|
|
return tp == NormalTable
|
|
}
|
|
|
|
// IsVirtualTable checks whether the table is a virtual table type.
|
|
func (tp Type) IsVirtualTable() bool {
|
|
return tp == VirtualTable
|
|
}
|
|
|
|
// IsClusterTable checks whether the table is a cluster table type.
|
|
func (tp Type) IsClusterTable() bool {
|
|
return tp == ClusterTable
|
|
}
|
|
|
|
var (
|
|
// ErrColumnCantNull is used for inserting null to a not null column.
|
|
ErrColumnCantNull = dbterror.ClassTable.NewStd(mysql.ErrBadNull)
|
|
// ErrUnknownColumn is returned when accessing an unknown column.
|
|
ErrUnknownColumn = dbterror.ClassTable.NewStd(mysql.ErrBadField)
|
|
errDuplicateColumn = dbterror.ClassTable.NewStd(mysql.ErrFieldSpecifiedTwice)
|
|
|
|
errGetDefaultFailed = dbterror.ClassTable.NewStd(mysql.ErrFieldGetDefaultFailed)
|
|
|
|
// ErrNoDefaultValue is used when insert a row, the column value is not given, and the column has not null flag
|
|
// and it doesn't have a default value.
|
|
ErrNoDefaultValue = dbterror.ClassTable.NewStd(mysql.ErrNoDefaultForField)
|
|
// ErrIndexOutBound returns for index column offset out of bound.
|
|
ErrIndexOutBound = dbterror.ClassTable.NewStd(mysql.ErrIndexOutBound)
|
|
// ErrUnsupportedOp returns for unsupported operation.
|
|
ErrUnsupportedOp = dbterror.ClassTable.NewStd(mysql.ErrUnsupportedOp)
|
|
// ErrRowNotFound returns for row not found.
|
|
ErrRowNotFound = dbterror.ClassTable.NewStd(mysql.ErrRowNotFound)
|
|
// ErrTableStateCantNone returns for table none state.
|
|
ErrTableStateCantNone = dbterror.ClassTable.NewStd(mysql.ErrTableStateCantNone)
|
|
// ErrColumnStateCantNone returns for column none state.
|
|
ErrColumnStateCantNone = dbterror.ClassTable.NewStd(mysql.ErrColumnStateCantNone)
|
|
// ErrColumnStateNonPublic returns for column non-public state.
|
|
ErrColumnStateNonPublic = dbterror.ClassTable.NewStd(mysql.ErrColumnStateNonPublic)
|
|
// ErrIndexStateCantNone returns for index none state.
|
|
ErrIndexStateCantNone = dbterror.ClassTable.NewStd(mysql.ErrIndexStateCantNone)
|
|
// ErrInvalidRecordKey returns for invalid record key.
|
|
ErrInvalidRecordKey = dbterror.ClassTable.NewStd(mysql.ErrInvalidRecordKey)
|
|
// ErrTruncatedWrongValueForField returns for truncate wrong value for field.
|
|
ErrTruncatedWrongValueForField = dbterror.ClassTable.NewStd(mysql.ErrTruncatedWrongValueForField)
|
|
// ErrUnknownPartition returns unknown partition error.
|
|
ErrUnknownPartition = dbterror.ClassTable.NewStd(mysql.ErrUnknownPartition)
|
|
// ErrNoPartitionForGivenValue returns table has no partition for value.
|
|
ErrNoPartitionForGivenValue = dbterror.ClassTable.NewStd(mysql.ErrNoPartitionForGivenValue)
|
|
// ErrLockOrActiveTransaction returns when execute unsupported statement in a lock session or an active transaction.
|
|
ErrLockOrActiveTransaction = dbterror.ClassTable.NewStd(mysql.ErrLockOrActiveTransaction)
|
|
// ErrSequenceHasRunOut returns when sequence has run out.
|
|
ErrSequenceHasRunOut = dbterror.ClassTable.NewStd(mysql.ErrSequenceRunOut)
|
|
// ErrRowDoesNotMatchGivenPartitionSet returns when the destination partition conflict with the partition selection.
|
|
ErrRowDoesNotMatchGivenPartitionSet = dbterror.ClassTable.NewStd(mysql.ErrRowDoesNotMatchGivenPartitionSet)
|
|
// ErrTempTableFull returns a table is full error, it's used by temporary table now.
|
|
ErrTempTableFull = dbterror.ClassTable.NewStd(mysql.ErrRecordFileFull)
|
|
// ErrOptOnCacheTable returns when exec unsupported opt at cache mode
|
|
ErrOptOnCacheTable = dbterror.ClassDDL.NewStd(mysql.ErrOptOnCacheTable)
|
|
)
|
|
|
|
// RecordIterFunc is used for low-level record iteration.
|
|
type RecordIterFunc func(h kv.Handle, rec []types.Datum, cols []*Column) (more bool, err error)
|
|
|
|
// AddRecordOpt contains the options will be used when adding a record.
|
|
type AddRecordOpt struct {
|
|
CreateIdxOpt
|
|
IsUpdate bool
|
|
ReserveAutoID int
|
|
}
|
|
|
|
// AddRecordOption is defined for the AddRecord() method of the Table interface.
|
|
type AddRecordOption interface {
|
|
ApplyOn(*AddRecordOpt)
|
|
}
|
|
|
|
// WithReserveAutoIDHint tells the AddRecord operation to reserve a batch of auto ID in the stmtctx.
|
|
type WithReserveAutoIDHint int
|
|
|
|
// ApplyOn implements the AddRecordOption interface.
|
|
func (n WithReserveAutoIDHint) ApplyOn(opt *AddRecordOpt) {
|
|
opt.ReserveAutoID = int(n)
|
|
}
|
|
|
|
// ApplyOn implements the AddRecordOption interface, so any CreateIdxOptFunc
|
|
// can be passed as the optional argument to the table.AddRecord method.
|
|
func (f CreateIdxOptFunc) ApplyOn(opt *AddRecordOpt) {
|
|
f(&opt.CreateIdxOpt)
|
|
}
|
|
|
|
// IsUpdate is a defined value for AddRecordOptFunc.
|
|
var IsUpdate AddRecordOption = isUpdate{}
|
|
|
|
type isUpdate struct{}
|
|
|
|
func (i isUpdate) ApplyOn(opt *AddRecordOpt) {
|
|
opt.IsUpdate = true
|
|
}
|
|
|
|
type columnAPI interface {
|
|
// Cols returns the columns of the table which is used in select, including hidden columns.
|
|
Cols() []*Column
|
|
|
|
// VisibleCols returns the columns of the table which is used in select, excluding hidden columns.
|
|
VisibleCols() []*Column
|
|
|
|
// HiddenCols returns the hidden columns of the table.
|
|
HiddenCols() []*Column
|
|
|
|
// WritableCols returns columns of the table in writable states.
|
|
// Writable states includes Public, WriteOnly, WriteOnlyReorganization.
|
|
WritableCols() []*Column
|
|
|
|
// DeletableCols returns columns of the table in deletable states.
|
|
// Deletable states includes Public, WriteOnly, WriteOnlyReorganization, DeleteOnly, DeleteReorganization.
|
|
DeletableCols() []*Column
|
|
|
|
// FullHiddenColsAndVisibleCols returns hidden columns in all states and unhidden columns in public states.
|
|
FullHiddenColsAndVisibleCols() []*Column
|
|
}
|
|
|
|
// Table is used to retrieve and modify rows in table.
|
|
type Table interface {
|
|
columnAPI
|
|
|
|
// Indices returns the indices of the table.
|
|
// The caller must be aware of that not all the returned indices are public.
|
|
Indices() []Index
|
|
|
|
// RecordPrefix returns the record key prefix.
|
|
RecordPrefix() kv.Key
|
|
// IndexPrefix returns the index key prefix.
|
|
IndexPrefix() kv.Key
|
|
|
|
// AddRecord inserts a row which should contain only public columns
|
|
AddRecord(ctx sessionctx.Context, r []types.Datum, opts ...AddRecordOption) (recordID kv.Handle, err error)
|
|
|
|
// UpdateRecord updates a row which should contain only writable columns.
|
|
UpdateRecord(ctx context.Context, sctx sessionctx.Context, h kv.Handle, currData, newData []types.Datum, touched []bool) error
|
|
|
|
// RemoveRecord removes a row in the table.
|
|
RemoveRecord(ctx sessionctx.Context, h kv.Handle, r []types.Datum) error
|
|
|
|
// Allocators returns all allocators.
|
|
Allocators(ctx sessionctx.Context) autoid.Allocators
|
|
|
|
// Meta returns TableInfo.
|
|
Meta() *model.TableInfo
|
|
|
|
// Type returns the type of table
|
|
Type() Type
|
|
}
|
|
|
|
// AllocAutoIncrementValue allocates an auto_increment value for a new row.
|
|
func AllocAutoIncrementValue(ctx context.Context, t Table, sctx sessionctx.Context) (int64, error) {
|
|
if span := opentracing.SpanFromContext(ctx); span != nil && span.Tracer() != nil {
|
|
span1 := span.Tracer().StartSpan("table.AllocAutoIncrementValue", opentracing.ChildOf(span.Context()))
|
|
defer span1.Finish()
|
|
}
|
|
increment := sctx.GetSessionVars().AutoIncrementIncrement
|
|
offset := sctx.GetSessionVars().AutoIncrementOffset
|
|
alloc := t.Allocators(sctx).Get(autoid.AutoIncrementType)
|
|
_, max, err := alloc.Alloc(ctx, uint64(1), int64(increment), int64(offset))
|
|
if err != nil {
|
|
return 0, err
|
|
}
|
|
return max, err
|
|
}
|
|
|
|
// AllocBatchAutoIncrementValue allocates batch auto_increment value for rows, returning firstID, increment and err.
|
|
// The caller can derive the autoID by adding increment to firstID for N-1 times.
|
|
func AllocBatchAutoIncrementValue(ctx context.Context, t Table, sctx sessionctx.Context, N int) (firstID int64, increment int64, err error) {
|
|
increment = int64(sctx.GetSessionVars().AutoIncrementIncrement)
|
|
offset := int64(sctx.GetSessionVars().AutoIncrementOffset)
|
|
alloc := t.Allocators(sctx).Get(autoid.AutoIncrementType)
|
|
min, max, err := alloc.Alloc(ctx, uint64(N), increment, offset)
|
|
if err != nil {
|
|
return min, max, err
|
|
}
|
|
// SeekToFirstAutoIDUnSigned seeks to first autoID. Because AutoIncrement always allocate from 1,
|
|
// signed and unsigned value can be unified as the unsigned handle.
|
|
nr := int64(autoid.SeekToFirstAutoIDUnSigned(uint64(min), uint64(increment), uint64(offset)))
|
|
return nr, increment, nil
|
|
}
|
|
|
|
// PhysicalTable is an abstraction for two kinds of table representation: partition or non-partitioned table.
|
|
// PhysicalID is a ID that can be used to construct a key ranges, all the data in the key range belongs to the corresponding PhysicalTable.
|
|
// For a non-partitioned table, its PhysicalID equals to its TableID; For a partition of a partitioned table, its PhysicalID is the partition's ID.
|
|
type PhysicalTable interface {
|
|
Table
|
|
GetPhysicalID() int64
|
|
}
|
|
|
|
// PartitionedTable is a Table, and it has a GetPartition() method.
|
|
// GetPartition() gets the partition from a partition table by a physical table ID,
|
|
type PartitionedTable interface {
|
|
Table
|
|
GetPartition(physicalID int64) PhysicalTable
|
|
GetPartitionByRow(sessionctx.Context, []types.Datum) (PhysicalTable, error)
|
|
GetAllPartitionIDs() []int64
|
|
GetPartitionColumnNames() []model.CIStr
|
|
CheckForExchangePartition(ctx sessionctx.Context, pi *model.PartitionInfo, r []types.Datum, pid int64) error
|
|
}
|
|
|
|
// TableFromMeta builds a table.Table from *model.TableInfo.
|
|
// Currently, it is assigned to tables.TableFromMeta in tidb package's init function.
|
|
var TableFromMeta func(allocators autoid.Allocators, tblInfo *model.TableInfo) (Table, error)
|
|
|
|
// MockTableFromMeta only serves for test.
|
|
var MockTableFromMeta func(tableInfo *model.TableInfo) Table
|
|
|
|
// CachedTable is a Table, and it has a UpdateLockForRead() method
|
|
// UpdateLockForRead() according to the reasons for not meeting the read conditions, update the lock information,
|
|
// And at the same time reload data from the original table.
|
|
type CachedTable interface {
|
|
Table
|
|
|
|
Init(exec sqlexec.SQLExecutor) error
|
|
|
|
// TryReadFromCache checks if the cache table is readable.
|
|
TryReadFromCache(ts uint64, leaseDuration time.Duration) (kv.MemBuffer, bool)
|
|
|
|
// UpdateLockForRead If you cannot meet the conditions of the read buffer,
|
|
// you need to update the lock information and read the data from the original table
|
|
UpdateLockForRead(ctx context.Context, store kv.Storage, ts uint64, leaseDuration time.Duration)
|
|
|
|
// WriteLockAndKeepAlive first obtain the write lock, then it renew the lease to keep the lock alive.
|
|
// 'exit' is a channel to tell the keep alive goroutine to exit.
|
|
// The result is sent to the 'wg' channel.
|
|
WriteLockAndKeepAlive(ctx context.Context, exit chan struct{}, leasePtr *uint64, wg chan error)
|
|
}
|