1. upgrade gutil code from imapla to new verison, include `cpuinfo`, `spinlock` and `linux_syscall_support ` 2. impliments arm version utf8 check code 3. remove incompatible code from stopwatch
125 lines
4.0 KiB
C++
125 lines
4.0 KiB
C++
// Licensed to the Apache Software Foundation (ASF) under one
|
|
// or more contributor license agreements. See the NOTICE file
|
|
// distributed with this work for additional information
|
|
// regarding copyright ownership. The ASF licenses this file
|
|
// to you under the Apache License, Version 2.0 (the
|
|
// "License"); you may not use this file except in compliance
|
|
// with the License. You may obtain a copy of the License at
|
|
//
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
//
|
|
// Unless required by applicable law or agreed to in writing,
|
|
// software distributed under the License is distributed on an
|
|
// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
|
|
// KIND, either express or implied. See the License for the
|
|
// specific language governing permissions and limitations
|
|
// under the License.
|
|
|
|
#include "util/utf8_check.h"
|
|
|
|
#include <gtest/gtest.h>
|
|
|
|
namespace doris {
|
|
|
|
struct test {
|
|
const char *data;
|
|
int len;
|
|
};
|
|
|
|
class Utf8CheckTest : public testing::Test {
|
|
public:
|
|
Utf8CheckTest() { }
|
|
virtual ~Utf8CheckTest() { }
|
|
private:
|
|
/* positive tests */
|
|
std::vector<test> pos = {
|
|
{"", 0},
|
|
{"\x00", 1},
|
|
{"\x66", 1},
|
|
{"\x7F", 1},
|
|
{"\x00\x7F", 2},
|
|
{"\x7F\x00", 2},
|
|
{"\xC2\x80", 2},
|
|
{"\xDF\xBF", 2},
|
|
{"\xE0\xA0\x80", 3},
|
|
{"\xE0\xA0\xBF", 3},
|
|
{"\xED\x9F\x80", 3},
|
|
{"\xEF\x80\xBF", 3},
|
|
{"\xF0\x90\xBF\x80", 4},
|
|
{"\xF2\x81\xBE\x99", 4},
|
|
{"\xF4\x8F\x88\xAA", 4}
|
|
};
|
|
|
|
/* negative tests */
|
|
std::vector<test> neg = {
|
|
{"\x80", 1},
|
|
{"\xBF", 1},
|
|
{"\xC0\x80", 2},
|
|
{"\xC1\x00", 2},
|
|
{"\xC2\x7F", 2},
|
|
{"\xDF\xC0", 2},
|
|
{"\xE0\x9F\x80", 3},
|
|
{"\xE0\xC2\x80", 3},
|
|
{"\xED\xA0\x80", 3},
|
|
{"\xED\x7F\x80", 3},
|
|
{"\xEF\x80\x00", 3},
|
|
{"\xF0\x8F\x80\x80", 4},
|
|
{"\xF0\xEE\x80\x80", 4},
|
|
{"\xF2\x90\x91\x7F", 4},
|
|
{"\xF4\x90\x88\xAA", 4},
|
|
{"\xF4\x00\xBF\xBF", 4},
|
|
{"\x00\x00\x00\x00\x00\xC2\x80\x00\x00\x00\xE1\x80\x80\x00\x00\xC2" \
|
|
"\xC2\x80\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00",
|
|
32},
|
|
{"\x00\x00\x00\x00\x00\xC2\xC2\x80\x00\x00\xE1\x80\x80\x00\x00\x00",
|
|
16},
|
|
{"\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00" \
|
|
"\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\xF1\x80",
|
|
32},
|
|
{"\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00" \
|
|
"\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\xF1",
|
|
32},
|
|
{"\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00" \
|
|
"\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\xF1\x80" \
|
|
"\x80", 33},
|
|
{"\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00" \
|
|
"\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\xF1\x80" \
|
|
"\xC2\x80", 34},
|
|
{"\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00" \
|
|
"\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\xF0" \
|
|
"\x80\x80\x80", 35}
|
|
};
|
|
};
|
|
TEST_F(Utf8CheckTest, empty) {
|
|
ASSERT_TRUE(validate_utf8(pos[0].data, pos[0].len));
|
|
}
|
|
|
|
TEST_F(Utf8CheckTest, normal) {
|
|
for (int i = 0; i < sizeof(pos)/sizeof(pos[0]); ++i) {
|
|
ASSERT_TRUE(validate_utf8(pos[i].data, pos[i].len));
|
|
}
|
|
}
|
|
|
|
TEST_F(Utf8CheckTest, abnormal) {
|
|
for (int i = 0; i < sizeof(neg)/sizeof(neg[0]); ++i) {
|
|
ASSERT_FALSE(validate_utf8(neg[i].data, neg[i].len));
|
|
}
|
|
}
|
|
|
|
TEST_F(Utf8CheckTest, naive) {
|
|
for (int i = 0; i < sizeof(pos)/sizeof(pos[0]); ++i) {
|
|
ASSERT_TRUE(validate_utf8_naive(pos[i].data, pos[i].len));
|
|
}
|
|
for (int i = 0; i < sizeof(neg)/sizeof(neg[0]); ++i) {
|
|
std::cout << validate_utf8_naive(neg[i].data, neg[i].len) << std::endl;
|
|
ASSERT_FALSE(validate_utf8_naive(neg[i].data, neg[i].len));
|
|
}
|
|
}
|
|
|
|
}
|
|
|
|
int main(int argc, char* argv[]) {
|
|
::testing::InitGoogleTest(&argc, argv);
|
|
return RUN_ALL_TESTS();
|
|
}
|