Files
tidb/pkg/expression/builtin_ilike_test.go

173 lines
6.6 KiB
Go

// Copyright 2023 PingCAP, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
package expression
import (
"fmt"
"testing"
"github.com/pingcap/tidb/pkg/parser/ast"
"github.com/pingcap/tidb/pkg/parser/charset"
"github.com/pingcap/tidb/pkg/parser/mysql"
"github.com/pingcap/tidb/pkg/testkit/testutil"
"github.com/pingcap/tidb/pkg/types"
"github.com/pingcap/tidb/pkg/util/chunk"
"github.com/pingcap/tidb/pkg/util/collate"
"github.com/stretchr/testify/require"
)
func TestIlike(t *testing.T) {
ctx := createContext(t)
tests := []struct {
input string
pattern string
escape int
generalMatch int
unicodeMatch int
}{
{"a", "", 0, 0, 0},
{"a", "a", 0, 1, 1},
{"ü", "Ü", 0, 0, 0},
{"a", "á", 0, 0, 0},
{"a", "b", 0, 0, 0},
{"aA", "Aa", 0, 1, 1},
{"áAb", `Aa%`, 0, 0, 0},
{"áAb", `%ab%`, 0, 1, 1},
{"", "", 0, 1, 1},
{"ß", "s%", 0, 0, 0},
{"ß", "%s", 0, 0, 0},
{"ß", "ss", 0, 0, 0},
{"ß", "s", 0, 0, 0},
{"ss", "%ß%", 0, 0, 0},
{"ß", "_", 0, 1, 1},
{"ß", "__", 0, 0, 0},
{"啊aaa啊啊啊aa", "啊aaa啊啊啊aa", 0, 1, 1},
// escape tests
{"abc", "ABC", int('a'), 1, 1},
{"abc", "ABC", int('A'), 0, 0},
{"aaz", "Aaaz", int('a'), 1, 1},
{"AAz", "AAAAz", int('a'), 0, 0},
{"a", "Aa", int('A'), 1, 1},
{"a", "AA", int('A'), 1, 1},
{"Aa", "AAAA", int('A'), 1, 1},
{"gTp", "AGTAp", int('A'), 1, 1},
{"gTAp", "AGTAap", int('A'), 1, 1},
{"A", "aA", int('a'), 1, 1},
{"a", "aA", int('a'), 1, 1},
{"aaa", "AAaA", int('a'), 1, 1},
{"a啊啊a", "a啊啊A", int('A'), 0, 0},
{"啊aaa啊啊啊aa", "啊aaa啊啊啊aa", int('A'), 1, 1},
{"啊aAa啊啊啊aA", "啊AAA啊啊啊AA", int('a'), 1, 1},
{"啊aaa啊啊啊aa", "啊aaa啊啊啊aa", int('a'), 0, 0},
}
var charsetAndCollationGeneral = [][]string{{"utf8mb4", "utf8mb4_general_ci"}, {"utf8", "utf8_general_ci"}}
for _, charsetAndCollation := range charsetAndCollationGeneral {
for _, tt := range tests {
comment := fmt.Sprintf(`for input = "%s", pattern = "%s", escape = "%s", collation = "%s"`, tt.input, tt.pattern, string(rune(tt.escape)), charsetAndCollation[1])
fc := funcs[ast.Ilike]
inputs := datumsToConstants(types.MakeDatums(tt.input, tt.pattern, tt.escape))
f, err := fc.getFunction(ctx, inputs)
require.NoError(t, err, comment)
f.SetCharsetAndCollation(charsetAndCollation[0], charsetAndCollation[1])
f.setCollator(collate.GetCollator(charsetAndCollation[1]))
r, err := evalBuiltinFunc(f, ctx, chunk.Row{})
require.NoError(t, err, comment)
testutil.DatumEqual(t, types.NewDatum(tt.generalMatch), r, comment)
}
}
var charsetAndCollationUnicode = [][]string{
{"utf8mb4", "utf8mb4_bin"},
{"utf8mb4", "utf8mb4_unicode_ci"},
{"utf8", "utf8_bin"},
{"utf8", "utf8_unicode_ci"}}
for _, charsetAndCollation := range charsetAndCollationUnicode {
for _, tt := range tests {
comment := fmt.Sprintf(`for input = "%s", pattern = "%s", escape = "%s", collation = "%s"`, tt.input, tt.pattern, string(rune(tt.escape)), charsetAndCollation[1])
fc := funcs[ast.Ilike]
inputs := datumsToConstants(types.MakeDatums(tt.input, tt.pattern, tt.escape))
f, err := fc.getFunction(ctx, inputs)
require.NoError(t, err, comment)
f.SetCharsetAndCollation(charsetAndCollation[0], charsetAndCollation[1])
f.setCollator(collate.GetCollator(charsetAndCollation[1]))
r, err := evalBuiltinFunc(f, ctx, chunk.Row{})
require.NoError(t, err, comment)
testutil.DatumEqual(t, types.NewDatum(tt.unicodeMatch), r, comment)
}
}
}
var vecBuiltinIlikeCases = map[string][]vecExprBenchCase{
ast.Ilike: {
{
retEvalType: types.ETInt,
childrenTypes: []types.EvalType{types.ETString, types.ETString, types.ETInt},
geners: []dataGenerator{
&selectStringGener{
candidates: []string{"aaa", "abc", "aAa", "AaA", "a啊啊Aa啊", "啊啊啊啊", "üÜ", "Ü", "a", "A"},
randGen: newDefaultRandGen(),
},
&selectStringGener{
candidates: []string{"aaa", "ABC", "啊啊啊啊", "üÜ", "ü", "a", "A"},
randGen: newDefaultRandGen(),
}},
childrenFieldTypes: []*types.FieldType{types.NewFieldTypeBuilder().SetType(mysql.TypeString).SetFlag(mysql.BinaryFlag).SetCharset(charset.CharsetBin).SetCollate(charset.CollationBin).BuildP()},
},
{
retEvalType: types.ETInt,
childrenTypes: []types.EvalType{types.ETString, types.ETString, types.ETInt},
geners: []dataGenerator{
&selectStringGener{
candidates: []string{"aaa", "abc", "aAa", "AaA", "a啊啊Aa啊", "啊啊啊啊", "üÜ", "Ü", "a", "A"},
// candidates: []string{"abc"},
randGen: newDefaultRandGen(),
},
&selectStringGener{
candidates: []string{"aaa", "ABC", "啊啊啊啊", "üÜ", "ü", "a", "A"},
// candidates: []string{"ABC"},
randGen: newDefaultRandGen(),
}},
childrenFieldTypes: []*types.FieldType{types.NewFieldTypeBuilder().SetType(mysql.TypeString).SetFlag(mysql.BinaryFlag).SetCharset(charset.CharsetBin).SetCollate(charset.CollationBin).BuildP()},
},
{
retEvalType: types.ETInt,
childrenTypes: []types.EvalType{types.ETString, types.ETString, types.ETInt},
geners: []dataGenerator{
&selectStringGener{
candidates: []string{"aaa", "abc", "aAa", "AaA", "a啊啊Aa啊", "啊啊啊啊", "üÜ", "Ü", "a", "A"},
randGen: newDefaultRandGen(),
},
&selectStringGener{
candidates: []string{"aaa", "ABC", "啊啊啊啊", "üÜ", "ü", "a", "A"},
randGen: newDefaultRandGen(),
}},
childrenFieldTypes: []*types.FieldType{types.NewFieldTypeBuilder().SetType(mysql.TypeString).SetFlag(mysql.BinaryFlag).SetCharset(charset.CharsetBin).SetCollate(charset.CollationBin).BuildP()},
},
},
}
func TestVectorizedBuiltinIlikeFunc(t *testing.T) {
vecBuiltinIlikeCases[ast.Ilike][0].constants = make([]*Constant, 3)
vecBuiltinIlikeCases[ast.Ilike][1].constants = make([]*Constant, 3)
vecBuiltinIlikeCases[ast.Ilike][2].constants = make([]*Constant, 3)
vecBuiltinIlikeCases[ast.Ilike][0].constants[2] = getIntConstant(int64(byte('A')))
vecBuiltinIlikeCases[ast.Ilike][1].constants[2] = getIntConstant(int64(byte('a')))
vecBuiltinIlikeCases[ast.Ilike][2].constants[2] = getIntConstant(int64(byte('\\')))
testVectorizedBuiltinFunc(t, vecBuiltinIlikeCases)
}