// Copyright 2016 PingCAP, Inc. // // Licensed under the Apache License, Version 2.0 (the "License"); // you may not use this file except in compliance with the License. // You may obtain a copy of the License at // // http://www.apache.org/licenses/LICENSE-2.0 // // Unless required by applicable law or agreed to in writing, software // distributed under the License is distributed on an "AS IS" BASIS, // See the License for the specific language governing permissions and // limitations under the License. package tablecodec import ( "bytes" "encoding/binary" "math" "time" "github.com/pingcap/errors" "github.com/pingcap/parser/mysql" "github.com/pingcap/parser/terror" "github.com/pingcap/tidb/kv" "github.com/pingcap/tidb/sessionctx/stmtctx" "github.com/pingcap/tidb/types" "github.com/pingcap/tidb/util/codec" ) var ( errInvalidKey = terror.ClassXEval.New(codeInvalidKey, "invalid key") errInvalidRecordKey = terror.ClassXEval.New(codeInvalidRecordKey, "invalid record key") errInvalidIndexKey = terror.ClassXEval.New(codeInvalidIndexKey, "invalid index key") errInvalidColumnCount = terror.ClassXEval.New(codeInvalidColumnCount, "invalid column count") ) var ( tablePrefix = []byte{'t'} recordPrefixSep = []byte("_r") indexPrefixSep = []byte("_i") ) const ( idLen = 8 prefixLen = 1 + idLen /*tableID*/ + 2 recordRowKeyLen = prefixLen + idLen /*handle*/ tablePrefixLength = 1 recordPrefixSepLength = 2 ) // TableSplitKeyLen is the length of key 't{table_id}' which is used for table split. const TableSplitKeyLen = 1 + idLen // TablePrefix returns table's prefix 't'. func TablePrefix() []byte { return tablePrefix } // EncodeRowKey encodes the table id and record handle into a kv.Key func EncodeRowKey(tableID int64, encodedHandle []byte) kv.Key { buf := make([]byte, 0, recordRowKeyLen) buf = appendTableRecordPrefix(buf, tableID) buf = append(buf, encodedHandle...) return buf } // EncodeRowKeyWithHandle encodes the table id, row handle into a kv.Key func EncodeRowKeyWithHandle(tableID int64, handle int64) kv.Key { buf := make([]byte, 0, recordRowKeyLen) buf = appendTableRecordPrefix(buf, tableID) buf = codec.EncodeInt(buf, handle) return buf } // CutRowKeyPrefix cuts the row key prefix. func CutRowKeyPrefix(key kv.Key) []byte { return key[prefixLen:] } // EncodeRecordKey encodes the recordPrefix, row handle into a kv.Key. func EncodeRecordKey(recordPrefix kv.Key, h int64) kv.Key { buf := make([]byte, 0, len(recordPrefix)+idLen) buf = append(buf, recordPrefix...) buf = codec.EncodeInt(buf, h) return buf } func hasTablePrefix(key kv.Key) bool { return key[0] == tablePrefix[0] } func hasRecordPrefixSep(key kv.Key) bool { return key[0] == recordPrefixSep[0] && key[1] == recordPrefixSep[1] } // DecodeRecordKey decodes the key and gets the tableID, handle. func DecodeRecordKey(key kv.Key) (tableID int64, handle int64, err error) { if len(key) <= prefixLen { return 0, 0, errInvalidRecordKey.GenWithStack("invalid record key - %q", key) } k := key if !hasTablePrefix(key) { return 0, 0, errInvalidRecordKey.GenWithStack("invalid record key - %q", k) } key = key[tablePrefixLength:] key, tableID, err = codec.DecodeInt(key) if err != nil { return 0, 0, errors.Trace(err) } if !hasRecordPrefixSep(key) { return 0, 0, errInvalidRecordKey.GenWithStack("invalid record key - %q", k) } key = key[recordPrefixSepLength:] key, handle, err = codec.DecodeInt(key) if err != nil { return 0, 0, errors.Trace(err) } return } // DecodeIndexKey decodes the key and gets the tableID, indexID, indexValues. func DecodeIndexKey(key kv.Key) (tableID int64, indexID int64, indexValues []string, err error) { k := key tableID, indexID, isRecord, err := DecodeKeyHead(key) if err != nil { return 0, 0, nil, errors.Trace(err) } if isRecord { return 0, 0, nil, errInvalidIndexKey.GenWithStack("invalid index key - %q", k) } key = key[prefixLen+idLen:] for len(key) > 0 { // FIXME: Without the schema information, we can only decode the raw kind of // the column. For instance, MysqlTime is internally saved as uint64. remain, d, e := codec.DecodeOne(key) if e != nil { return 0, 0, nil, errInvalidIndexKey.GenWithStack("invalid index key - %q %v", k, e) } str, e1 := d.ToString() if e1 != nil { return 0, 0, nil, errInvalidIndexKey.GenWithStack("invalid index key - %q %v", k, e1) } indexValues = append(indexValues, str) key = remain } return } // DecodeKeyHead decodes the key's head and gets the tableID, indexID. isRecordKey is true when is a record key. func DecodeKeyHead(key kv.Key) (tableID int64, indexID int64, isRecordKey bool, err error) { isRecordKey = false k := key if !key.HasPrefix(tablePrefix) { err = errInvalidKey.GenWithStack("invalid key - %q", k) return } key = key[len(tablePrefix):] key, tableID, err = codec.DecodeInt(key) if err != nil { err = errors.Trace(err) return } if key.HasPrefix(recordPrefixSep) { isRecordKey = true return } if !key.HasPrefix(indexPrefixSep) { err = errInvalidKey.GenWithStack("invalid key - %q", k) return } key = key[len(indexPrefixSep):] key, indexID, err = codec.DecodeInt(key) if err != nil { err = errors.Trace(err) return } return } // DecodeTableID decodes the table ID of the key, if the key is not table key, returns 0. func DecodeTableID(key kv.Key) int64 { if !key.HasPrefix(tablePrefix) { return 0 } key = key[len(tablePrefix):] _, tableID, err := codec.DecodeInt(key) // TODO: return error. terror.Log(errors.Trace(err)) return tableID } // DecodeRowKey decodes the key and gets the handle. func DecodeRowKey(key kv.Key) (int64, error) { if len(key) != recordRowKeyLen || !hasTablePrefix(key) || !hasRecordPrefixSep(key[prefixLen-2:]) { return 0, errInvalidKey.GenWithStack("invalid key - %q", key) } u := binary.BigEndian.Uint64(key[prefixLen:]) return codec.DecodeCmpUintToInt(u), nil } // EncodeValue encodes a go value to bytes. func EncodeValue(sc *stmtctx.StatementContext, b []byte, raw types.Datum) ([]byte, error) { var v types.Datum err := flatten(sc, raw, &v) if err != nil { return nil, err } return codec.EncodeValue(sc, b, v) } // EncodeRow encode row data and column ids into a slice of byte. // Row layout: colID1, value1, colID2, value2, ..... // valBuf and values pass by caller, for reducing EncodeRow allocates temporary bufs. If you pass valBuf and values as nil, // EncodeRow will allocate it. func EncodeRow(sc *stmtctx.StatementContext, row []types.Datum, colIDs []int64, valBuf []byte, values []types.Datum) ([]byte, error) { if len(row) != len(colIDs) { return nil, errors.Errorf("EncodeRow error: data and columnID count not match %d vs %d", len(row), len(colIDs)) } valBuf = valBuf[:0] if values == nil { values = make([]types.Datum, len(row)*2) } for i, c := range row { id := colIDs[i] values[2*i].SetInt64(id) err := flatten(sc, c, &values[2*i+1]) if err != nil { return valBuf, errors.Trace(err) } } if len(values) == 0 { // We could not set nil value into kv. return append(valBuf, codec.NilFlag), nil } return codec.EncodeValue(sc, valBuf, values...) } func flatten(sc *stmtctx.StatementContext, data types.Datum, ret *types.Datum) error { switch data.Kind() { case types.KindMysqlTime: // for mysql datetime, timestamp and date type t := data.GetMysqlTime() if t.Type == mysql.TypeTimestamp && sc.TimeZone != time.UTC { err := t.ConvertTimeZone(sc.TimeZone, time.UTC) if err != nil { return errors.Trace(err) } } v, err := t.ToPackedUint() ret.SetUint64(v) return errors.Trace(err) case types.KindMysqlDuration: // for mysql time type ret.SetInt64(int64(data.GetMysqlDuration().Duration)) return nil case types.KindMysqlEnum: ret.SetUint64(data.GetMysqlEnum().Value) return nil case types.KindMysqlSet: ret.SetUint64(data.GetMysqlSet().Value) return nil case types.KindBinaryLiteral, types.KindMysqlBit: // We don't need to handle errors here since the literal is ensured to be able to store in uint64 in convertToMysqlBit. val, err := data.GetBinaryLiteral().ToInt(sc) if err != nil { return errors.Trace(err) } ret.SetUint64(val) return nil default: *ret = data return nil } } // DecodeColumnValue decodes data to a Datum according to the column info. func DecodeColumnValue(data []byte, ft *types.FieldType, loc *time.Location) (types.Datum, error) { _, d, err := codec.DecodeOne(data) if err != nil { return types.Datum{}, errors.Trace(err) } colDatum, err := unflatten(d, ft, loc) if err != nil { return types.Datum{}, errors.Trace(err) } return colDatum, nil } // DecodeRowWithMap decodes a byte slice into datums with a existing row map. // Row layout: colID1, value1, colID2, value2, ..... func DecodeRowWithMap(b []byte, cols map[int64]*types.FieldType, loc *time.Location, row map[int64]types.Datum) (map[int64]types.Datum, error) { if row == nil { row = make(map[int64]types.Datum, len(cols)) } if b == nil { return row, nil } if len(b) == 1 && b[0] == codec.NilFlag { return row, nil } cnt := 0 var ( data []byte err error ) for len(b) > 0 { // Get col id. data, b, err = codec.CutOne(b) if err != nil { return nil, errors.Trace(err) } _, cid, err := codec.DecodeOne(data) if err != nil { return nil, errors.Trace(err) } // Get col value. data, b, err = codec.CutOne(b) if err != nil { return nil, errors.Trace(err) } id := cid.GetInt64() ft, ok := cols[id] if ok { _, v, err := codec.DecodeOne(data) if err != nil { return nil, errors.Trace(err) } v, err = unflatten(v, ft, loc) if err != nil { return nil, errors.Trace(err) } row[id] = v cnt++ if cnt == len(cols) { // Get enough data. break } } } return row, nil } // DecodeRow decodes a byte slice into datums. // Row layout: colID1, value1, colID2, value2, ..... func DecodeRow(b []byte, cols map[int64]*types.FieldType, loc *time.Location) (map[int64]types.Datum, error) { return DecodeRowWithMap(b, cols, loc, nil) } // CutRowNew cuts encoded row into byte slices and return columns' byte slice. // Row layout: colID1, value1, colID2, value2, ..... func CutRowNew(data []byte, colIDs map[int64]int) ([][]byte, error) { if data == nil { return nil, nil } if len(data) == 1 && data[0] == codec.NilFlag { return nil, nil } var ( cnt int b []byte err error cid int64 ) row := make([][]byte, len(colIDs)) for len(data) > 0 && cnt < len(colIDs) { // Get col id. data, cid, err = codec.CutColumnID(data) if err != nil { return nil, errors.Trace(err) } // Get col value. b, data, err = codec.CutOne(data) if err != nil { return nil, errors.Trace(err) } offset, ok := colIDs[cid] if ok { row[offset] = b cnt++ } } return row, nil } // UnflattenDatums converts raw datums to column datums. func UnflattenDatums(datums []types.Datum, fts []*types.FieldType, loc *time.Location) ([]types.Datum, error) { for i, datum := range datums { ft := fts[i] uDatum, err := unflatten(datum, ft, loc) if err != nil { return datums, errors.Trace(err) } datums[i] = uDatum } return datums, nil } // unflatten converts a raw datum to a column datum. func unflatten(datum types.Datum, ft *types.FieldType, loc *time.Location) (types.Datum, error) { if datum.IsNull() { return datum, nil } switch ft.Tp { case mysql.TypeFloat: datum.SetFloat32(float32(datum.GetFloat64())) return datum, nil case mysql.TypeTiny, mysql.TypeShort, mysql.TypeYear, mysql.TypeInt24, mysql.TypeLong, mysql.TypeLonglong, mysql.TypeDouble, mysql.TypeTinyBlob, mysql.TypeMediumBlob, mysql.TypeBlob, mysql.TypeLongBlob, mysql.TypeVarchar, mysql.TypeString: return datum, nil case mysql.TypeDate, mysql.TypeDatetime, mysql.TypeTimestamp: var t types.Time t.Type = ft.Tp t.Fsp = int8(ft.Decimal) var err error err = t.FromPackedUint(datum.GetUint64()) if err != nil { return datum, errors.Trace(err) } if ft.Tp == mysql.TypeTimestamp && !t.IsZero() { err = t.ConvertTimeZone(time.UTC, loc) if err != nil { return datum, errors.Trace(err) } } datum.SetUint64(0) datum.SetMysqlTime(t) return datum, nil case mysql.TypeDuration: //duration should read fsp from column meta data dur := types.Duration{Duration: time.Duration(datum.GetInt64()), Fsp: int8(ft.Decimal)} datum.SetValue(dur) return datum, nil case mysql.TypeEnum: // ignore error deliberately, to read empty enum value. enum, err := types.ParseEnumValue(ft.Elems, datum.GetUint64()) if err != nil { enum = types.Enum{} } datum.SetValue(enum) return datum, nil case mysql.TypeSet: set, err := types.ParseSetValue(ft.Elems, datum.GetUint64()) if err != nil { return datum, errors.Trace(err) } datum.SetValue(set) return datum, nil case mysql.TypeBit: val := datum.GetUint64() byteSize := (ft.Flen + 7) >> 3 datum.SetUint64(0) datum.SetMysqlBit(types.NewBinaryLiteralFromUint(val, byteSize)) } return datum, nil } // EncodeIndexSeekKey encodes an index value to kv.Key. func EncodeIndexSeekKey(tableID int64, idxID int64, encodedValue []byte) kv.Key { key := make([]byte, 0, prefixLen+len(encodedValue)) key = appendTableIndexPrefix(key, tableID) key = codec.EncodeInt(key, idxID) key = append(key, encodedValue...) return key } // CutIndexKey cuts encoded index key into colIDs to bytes slices map. // The returned value b is the remaining bytes of the key which would be empty if it is unique index or handle data // if it is non-unique index. func CutIndexKey(key kv.Key, colIDs []int64) (values map[int64][]byte, b []byte, err error) { b = key[prefixLen+idLen:] values = make(map[int64][]byte) for _, id := range colIDs { var val []byte val, b, err = codec.CutOne(b) if err != nil { return nil, nil, errors.Trace(err) } values[id] = val } return } // CutIndexPrefix cuts the index prefix. func CutIndexPrefix(key kv.Key) []byte { return key[prefixLen+idLen:] } // CutIndexKeyNew cuts encoded index key into colIDs to bytes slices. // The returned value b is the remaining bytes of the key which would be empty if it is unique index or handle data // if it is non-unique index. func CutIndexKeyNew(key kv.Key, length int) (values [][]byte, b []byte, err error) { b = key[prefixLen+idLen:] values = make([][]byte, 0, length) for i := 0; i < length; i++ { var val []byte val, b, err = codec.CutOne(b) if err != nil { return nil, nil, errors.Trace(err) } values = append(values, val) } return } // PrimaryKeyStatus is the primary key column status. type PrimaryKeyStatus int const ( // PrimaryKeyNotExists means no need to decode primary key column value when DecodeIndexKV. PrimaryKeyNotExists PrimaryKeyStatus = iota // PrimaryKeyIsSigned means decode primary key column value as int64 when DecodeIndexKV. PrimaryKeyIsSigned // PrimaryKeyIsUnsigned means decode primary key column value as uint64 when DecodeIndexKV. PrimaryKeyIsUnsigned ) // DecodeIndexKV uses to decode index key values. func DecodeIndexKV(key, value []byte, colsLen int, pkStatus PrimaryKeyStatus) ([][]byte, error) { values, b, err := CutIndexKeyNew(key, colsLen) if err != nil { return nil, errors.Trace(err) } if len(b) > 0 { if pkStatus != PrimaryKeyNotExists { values = append(values, b) } } else if pkStatus != PrimaryKeyNotExists { handle, err := DecodeIndexValueAsHandle(value) if err != nil { return nil, errors.Trace(err) } var handleDatum types.Datum if pkStatus == PrimaryKeyIsUnsigned { handleDatum = types.NewUintDatum(uint64(handle)) } else { handleDatum = types.NewIntDatum(handle) } handleBytes := make([]byte, 0, 8) handleBytes, err = codec.EncodeValue(nil, handleBytes, handleDatum) if err != nil { return nil, errors.Trace(err) } values = append(values, handleBytes) } return values, nil } // DecodeIndexValueAsHandle uses to decode index value as handle id. func DecodeIndexValueAsHandle(data []byte) (int64, error) { var h int64 buf := bytes.NewBuffer(data) err := binary.Read(buf, binary.BigEndian, &h) return h, errors.Trace(err) } // EncodeTableIndexPrefix encodes index prefix with tableID and idxID. func EncodeTableIndexPrefix(tableID, idxID int64) kv.Key { key := make([]byte, 0, prefixLen) key = appendTableIndexPrefix(key, tableID) key = codec.EncodeInt(key, idxID) return key } // EncodeTablePrefix encodes table prefix with table ID. func EncodeTablePrefix(tableID int64) kv.Key { var key kv.Key key = append(key, tablePrefix...) key = codec.EncodeInt(key, tableID) return key } // appendTableRecordPrefix appends table record prefix "t[tableID]_r". func appendTableRecordPrefix(buf []byte, tableID int64) []byte { buf = append(buf, tablePrefix...) buf = codec.EncodeInt(buf, tableID) buf = append(buf, recordPrefixSep...) return buf } // appendTableIndexPrefix appends table index prefix "t[tableID]_i". func appendTableIndexPrefix(buf []byte, tableID int64) []byte { buf = append(buf, tablePrefix...) buf = codec.EncodeInt(buf, tableID) buf = append(buf, indexPrefixSep...) return buf } // ReplaceRecordKeyTableID replace the tableID in the recordKey buf. func ReplaceRecordKeyTableID(buf []byte, tableID int64) []byte { if len(buf) < len(tablePrefix)+8 { return buf } u := codec.EncodeIntToCmpUint(tableID) binary.BigEndian.PutUint64(buf[len(tablePrefix):], u) return buf } // GenTableRecordPrefix composes record prefix with tableID: "t[tableID]_r". func GenTableRecordPrefix(tableID int64) kv.Key { buf := make([]byte, 0, len(tablePrefix)+8+len(recordPrefixSep)) return appendTableRecordPrefix(buf, tableID) } // GenTableIndexPrefix composes index prefix with tableID: "t[tableID]_i". func GenTableIndexPrefix(tableID int64) kv.Key { buf := make([]byte, 0, len(tablePrefix)+8+len(indexPrefixSep)) return appendTableIndexPrefix(buf, tableID) } // GenTablePrefix composes table record and index prefix: "t[tableID]". func GenTablePrefix(tableID int64) kv.Key { buf := make([]byte, 0, len(tablePrefix)+8) buf = append(buf, tablePrefix...) buf = codec.EncodeInt(buf, tableID) return buf } // TruncateToRowKeyLen truncates the key to row key length if the key is longer than row key. func TruncateToRowKeyLen(key kv.Key) kv.Key { if len(key) > recordRowKeyLen { return key[:recordRowKeyLen] } return key } // GetTableHandleKeyRange returns table handle's key range with tableID. func GetTableHandleKeyRange(tableID int64) (startKey, endKey []byte) { startKey = EncodeRowKeyWithHandle(tableID, math.MinInt64) endKey = EncodeRowKeyWithHandle(tableID, math.MaxInt64) return } // GetTableIndexKeyRange returns table index's key range with tableID and indexID. func GetTableIndexKeyRange(tableID, indexID int64) (startKey, endKey []byte) { startKey = EncodeIndexSeekKey(tableID, indexID, nil) endKey = EncodeIndexSeekKey(tableID, indexID, []byte{255}) return } const ( codeInvalidRecordKey = 4 codeInvalidColumnCount = 5 codeInvalidKey = 6 codeInvalidIndexKey = 7 )