## Proposed changes

Add transaction support for the insert operation. When you want to insert a large number of rows, inserting them inside a transaction costs far less time than inserting them without one (about 1/1000 of the time).

### Syntax

```
BEGIN [ WITH LABEL label];
INSERT INTO table_name ...
[COMMIT | ROLLBACK];
```

### Example

Commit a transaction:

```
begin;
insert into Tbl values(11, 22, 33);
commit;
```

Roll back a transaction:

```
begin;
insert into Tbl values(11, 22, 33);
rollback;
```

Commit a transaction with a label:

```
begin with label test_label;
insert into Tbl values(11, 22, 33);
commit;
```

### Description

```
begin: begin a transaction; subsequent inserts execute in the transaction until commit/rollback;
commit: commit the transaction; the data in the transaction will be inserted into the table;
rollback: abort the transaction; nothing will be inserted into the table;
```

### The main realization principle:

```
1. begin a transaction in the session; the next sql is executed in the transaction;
2. the insert sql is parsed to get the database name and table name, which are used to select a be and create a pipe to accept data;
3. all inserted values are sent to the be and written into the pipe;
4. a thread gets the data from the pipe, then writes it to disk;
5. commit completes this transaction and makes the data visible;
6. rollback aborts this transaction
```

### Some restrictions on the use of the updated syntax.

1. Only `insert` can be called in a transaction.
2. If an error occurs, `commit` will not succeed; the transaction will be rolled back directly (`rollback`).
3. By default, if some of the inserts in the transaction are invalid, `commit` will insert only the remaining correct data into the table.
4. If you need `commit` to fail when any insert in the transaction is invalid, execute `set enable_insert_strict = true` before `begin`.
126 lines
3.8 KiB
C++
126 lines
3.8 KiB
C++
// Licensed to the Apache Software Foundation (ASF) under one
|
|
// or more contributor license agreements. See the NOTICE file
|
|
// distributed with this work for additional information
|
|
// regarding copyright ownership. The ASF licenses this file
|
|
// to you under the Apache License, Version 2.0 (the
|
|
// "License"); you may not use this file except in compliance
|
|
// with the License. You may obtain a copy of the License at
|
|
//
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
//
|
|
// Unless required by applicable law or agreed to in writing,
|
|
// software distributed under the License is distributed on an
|
|
// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
|
|
// KIND, either express or implied. See the License for the
|
|
// specific language governing permissions and limitations
|
|
// under the License.
|
|
|
|
#pragma once
|
|
|
|
#include <map>
|
|
#include <memory>
|
|
#include <sstream>
|
|
#include <string>
|
|
#include <vector>
|
|
|
|
#include "common/status.h"
|
|
#include "exec/base_scanner.h"
|
|
#include "gen_cpp/PlanNodes_types.h"
|
|
#include "gen_cpp/Types_types.h"
|
|
#include "gen_cpp/internal_service.pb.h"
|
|
#include "runtime/mem_pool.h"
|
|
#include "util/runtime_profile.h"
|
|
#include "util/slice.h"
|
|
|
|
namespace doris {
|
|
|
|
// Forward declarations of types that this header only refers to by pointer,
// reference or smart pointer, so their full definitions are not needed here.
// NOTE(review): Slice and RuntimeProfile are presumably already declared by
// "util/slice.h" and "util/runtime_profile.h", which this header includes;
// confirm the class-key (class vs. struct) used here matches their definitions.
class Tuple;
class SlotDescriptor;
class Slice;
class TextConverter;
class FileReader;
class LineReader;
class Decompressor;
class RuntimeState;
class ExprContext;
class TupleDescriptor;
class TupleRow;
class RowDescriptor;
class MemTracker;
class RuntimeProfile;
class StreamLoadPipe;
|
|
|
|
// Broker scanner convert the data read from broker to doris's tuple.
|
|
class BrokerScanner : public BaseScanner {
|
|
public:
|
|
BrokerScanner(RuntimeState* state, RuntimeProfile* profile,
|
|
const TBrokerScanRangeParams& params, const std::vector<TBrokerRangeDesc>& ranges,
|
|
const std::vector<TNetworkAddress>& broker_addresses,
|
|
const std::vector<ExprContext*>& pre_filter_ctxs, ScannerCounter* counter);
|
|
~BrokerScanner();
|
|
|
|
// Open this scanner, will initialize information need to
|
|
Status open() override;
|
|
|
|
// Get next tuple
|
|
Status get_next(Tuple* tuple, MemPool* tuple_pool, bool* eof) override;
|
|
|
|
// Close this scanner
|
|
void close() override;
|
|
|
|
private:
|
|
Status open_file_reader();
|
|
Status create_decompressor(TFileFormatType::type type);
|
|
Status open_line_reader();
|
|
// Read next buffer from reader
|
|
Status open_next_reader();
|
|
|
|
// Split one text line to values
|
|
void split_line(const Slice& line);
|
|
|
|
void fill_fix_length_string(const Slice& value, MemPool* pool, char** new_value_p,
|
|
int new_value_length);
|
|
|
|
bool check_decimal_input(const Slice& value, int precision, int scale,
|
|
std::stringstream* error_msg);
|
|
|
|
// Convert one row to one tuple
|
|
// 'ptr' and 'len' is csv text line
|
|
// output is tuple
|
|
bool convert_one_row(const Slice& line, Tuple* tuple, MemPool* tuple_pool);
|
|
|
|
Status line_to_src_tuple();
|
|
bool line_to_src_tuple(const Slice& line);
|
|
|
|
private:
|
|
const std::vector<TBrokerRangeDesc>& _ranges;
|
|
const std::vector<TNetworkAddress>& _broker_addresses;
|
|
|
|
std::unique_ptr<TextConverter> _text_converter;
|
|
|
|
std::string _value_separator;
|
|
std::string _line_delimiter;
|
|
TFileFormatType::type _file_format_type;
|
|
int _value_separator_length;
|
|
int _line_delimiter_length;
|
|
|
|
// Reader
|
|
FileReader* _cur_file_reader;
|
|
LineReader* _cur_line_reader;
|
|
Decompressor* _cur_decompressor;
|
|
int _next_range;
|
|
bool _cur_line_reader_eof;
|
|
|
|
bool _scanner_eof;
|
|
|
|
// When we fetch range doesn't start from 0,
|
|
// we will read to one ahead, and skip the first line
|
|
bool _skip_next_line;
|
|
|
|
// used to hold current StreamLoadPipe
|
|
std::shared_ptr<StreamLoadPipe> _stream_load_pipe;
|
|
std::vector<Slice> _split_values;
|
|
};
|
|
|
|
} // namespace doris
|