204 lines
		
	
	
		
			4.9 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
			
		
		
	
	
			204 lines
		
	
	
		
			4.9 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
| /**
 | |
|  * Copyright (c) 2021 OceanBase
 | |
|  * OceanBase CE is licensed under Mulan PubL v2.
 | |
|  * You can use this software according to the terms and conditions of the Mulan PubL v2.
 | |
|  * You may obtain a copy of Mulan PubL v2 at:
 | |
|  *          http://license.coscl.org.cn/MulanPubL-2.0
 | |
|  * THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND,
 | |
|  * EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT,
 | |
|  * MERCHANTABILITY OR FIT FOR A PARTICULAR PURPOSE.
 | |
|  * See the Mulan PubL v2 for more details.
 | |
|  */
 | |
| 
 | |
| #define USING_LOG_PREFIX STORAGE
 | |
| 
 | |
| #include "mysql_dump_data_reader.h"
 | |
| #include "share/ob_define.h"
 | |
| 
 | |
| namespace oceanbase
 | |
| {
 | |
| using namespace common;
 | |
| 
 | |
| MysqlDumpDataReader::MysqlDumpDataReader() : value_cnt_(0), data_index_(0)
 | |
| {
 | |
| }
 | |
| 
 | |
| int MysqlDumpDataReader::init(const char *file)
 | |
| {
 | |
|   int ret = OB_SUCCESS;
 | |
|   stream_.open(file);
 | |
|   if (stream_.fail()) {
 | |
|     ret = OB_ERROR;
 | |
|     LOG_WARN("open file error", K(ret), K(file), K(errno));
 | |
|     return ret;
 | |
|   }
 | |
|   bool is_insert = false;
 | |
|   while (OB_SUCC(next_sql())) {
 | |
|     if (cur_sql_.size() > 6 && strncmp(cur_sql_.data(), "INSERT", 6) == 0) {
 | |
|       is_insert = true;
 | |
|       break;
 | |
|     } else {
 | |
|       schema_sqls_.push_back(cur_sql_);
 | |
|     }
 | |
|   }
 | |
|   if (OB_ITER_END == ret) {
 | |
|     ret = OB_SUCCESS;
 | |
|   } else if (OB_FAIL(ret)) {
 | |
|     LOG_WARN("init failed", K(ret));
 | |
|   } else {
 | |
|     if (is_insert) {
 | |
|       if (OB_FAIL(parse_insert_sql())) {
 | |
|         LOG_WARN("parse insert sql failed", K(ret));
 | |
|       }
 | |
|     }
 | |
|   }
 | |
|   return ret;
 | |
| }
 | |
| 
 | |
| int MysqlDumpDataReader::reset()
 | |
| {
 | |
|   int ret = OB_SUCCESS;
 | |
|   stream_.clear();
 | |
|   stream_.seekg(0, std::ios::beg);
 | |
|   bool is_insert = false;
 | |
|   while (OB_SUCC(next_sql())) {
 | |
|     if (cur_sql_.size() > 6 && strncmp(cur_sql_.data(), "INSERT", 6) == 0) {
 | |
|       is_insert = true;
 | |
|       break;
 | |
|     }
 | |
|   }
 | |
|   if (is_insert) {
 | |
|     if (OB_FAIL(parse_insert_sql())) {
 | |
|       LOG_WARN("parse insert sql failed", K(ret));
 | |
|     }
 | |
|   }
 | |
|   return ret;
 | |
| }
 | |
| 
 | |
| int MysqlDumpDataReader::next_sql()
 | |
| {
 | |
|   int ret = OB_SUCCESS;
 | |
|   cur_sql_.clear();
 | |
|   cur_line_.clear();
 | |
|   while (std::getline(stream_, cur_line_)) {
 | |
|     if (cur_line_.empty()) { // skip empty line
 | |
|     } else if (cur_line_.size() >= 2
 | |
|         && (strncmp(cur_line_.data(), "/*", 2) == 0
 | |
|             || strncmp(cur_line_.data(), "--", 2) == 0)) { // skip comment line
 | |
|     } else {
 | |
|       if (!cur_sql_.empty()) {
 | |
|         cur_sql_.push_back('\n');
 | |
|       }
 | |
|       cur_sql_.append(cur_line_);
 | |
|       if (cur_sql_[cur_sql_.size() - 1] == ';') {
 | |
|         break;
 | |
|       }
 | |
|     }
 | |
|     cur_line_.clear();
 | |
|   }
 | |
|   if (cur_sql_.empty()) {
 | |
|     ret = OB_ITER_END;
 | |
|   }
 | |
|   return ret;
 | |
| }
 | |
| 
 | |
| int MysqlDumpDataReader::next_data(std::vector<ObString> &data)
 | |
| {
 | |
|   int ret = OB_SUCCESS;
 | |
|   while (data_index_ >= datas_.size() && OB_SUCC(ret)) {
 | |
|     if (OB_FAIL(next_sql())) {
 | |
|     } else if (OB_FAIL(parse_insert_sql())) {
 | |
|       LOG_WARN("parse insert sql failed", K(ret));
 | |
|     }
 | |
|   }
 | |
|   if (OB_SUCC(ret)) {
 | |
|     data.clear();
 | |
|     data.reserve(value_cnt_);
 | |
|     for (int64_t i = 0; i < value_cnt_; ++i) {
 | |
|       data.push_back(datas_.at(data_index_));
 | |
|       data_index_++;
 | |
|     }
 | |
|   }
 | |
|   return ret;
 | |
| }
 | |
| 
 | |
| int MysqlDumpDataReader::parse_insert_sql()
 | |
| {
 | |
|   int ret = OB_SUCCESS;
 | |
|   if (cur_sql_.size() < 6 || strncmp(cur_sql_.c_str(), "INSERT", 6) != 0) {
 | |
|     LOG_INFO("not insert sql, ignore", K(ret), K(cur_sql_.c_str()));
 | |
|   } else {
 | |
|     char *sql = const_cast<char *>(cur_sql_.c_str());
 | |
|     value_cnt_ = 0;
 | |
|     data_index_ = 0;
 | |
|     datas_.clear();
 | |
|     const char *begin_str = " VALUES (";
 | |
|     char *p = strstr(sql, begin_str);
 | |
|     if (NULL == sql) {
 | |
|       ret = OB_ERROR;
 | |
|       LOG_WARN("value begin mark not found", K(ret), K(begin_str), K(sql));
 | |
|       return ret;
 | |
|     }
 | |
|     p += strlen(begin_str);
 | |
|     bool quote = false;
 | |
|     char *begin = NULL;
 | |
|     p = sql;
 | |
|     while (*p) {
 | |
|       if (quote) {
 | |
|         switch (*p) {
 | |
|           case '\\':
 | |
|             p++;
 | |
|             if (!*p) {
 | |
|               ret = OB_ERROR;
 | |
|               LOG_WARN("unterminated string", K(ret));
 | |
|               return ret;
 | |
|             }
 | |
|             p++;
 | |
|             break;
 | |
|           case '\'':
 | |
|             quote = false;
 | |
|             p++;
 | |
|             datas_.push_back(ObString(p - begin, begin));
 | |
|             begin = NULL;
 | |
|             break;
 | |
|           default:
 | |
|             p++;
 | |
|         }
 | |
|       } else {
 | |
|         switch (*p) {
 | |
|           case '(':
 | |
|           case ';':
 | |
|             begin = NULL;
 | |
|             *p = '\0';
 | |
|             p++;
 | |
|             break;
 | |
|           case ')':
 | |
|           case ',':
 | |
|             if (NULL != begin) {
 | |
|               datas_.push_back(ObString(p - begin, begin));
 | |
|               begin = NULL;
 | |
|             }
 | |
|             if (value_cnt_ == 0 && *p == ')') {
 | |
|               value_cnt_ = datas_.size();
 | |
|             }
 | |
|             *p = '\0';
 | |
|             p++;
 | |
|             break;
 | |
|           case '\'':
 | |
|             quote = true;
 | |
|             // intentionally no break
 | |
|           default:
 | |
|             if (NULL == begin) {
 | |
|               begin = p;
 | |
|             }
 | |
|             p++;
 | |
|         }
 | |
|       }
 | |
|     }
 | |
|     LOG_DEBUG("parsed data", K(value_cnt_), K(datas_.size()));
 | |
|   }
 | |
|   return ret;
 | |
| }
 | |
| 
 | |
| } // end namespace oceanbase
 | 
