baidu palo

This commit is contained in:
cyongli
2017-08-11 17:51:21 +08:00
commit e2311f656e
1988 changed files with 586941 additions and 0 deletions

207
be/src/runtime/tuple.cpp Normal file
View File

@ -0,0 +1,207 @@
// Modifications copyright (C) 2017, Baidu.com, Inc.
// Copyright 2017 The Apache Software Foundation
// Licensed to the Apache Software Foundation (ASF) under one
// or more contributor license agreements. See the NOTICE file
// distributed with this work for additional information
// regarding copyright ownership. The ASF licenses this file
// to you under the Apache License, Version 2.0 (the
// "License"); you may not use this file except in compliance
// with the License. You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing,
// software distributed under the License is distributed on an
// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
// KIND, either express or implied. See the License for the
// specific language governing permissions and limitations
// under the License.
#include "runtime/tuple.h"
#include <vector>
#include "exprs/expr.h"
#include "util/mem_util.hpp"
#include "runtime/descriptors.h"
#include "runtime/mem_pool.h"
#include "runtime/raw_value.h"
#include "runtime/tuple_row.h"
#include "runtime/string_value.h"
#include "util/debug_util.h"
namespace palo {
const char* Tuple::_s_llvm_class_name = "class.palo::Tuple";
int64_t Tuple::total_byte_size(const TupleDescriptor& desc) const {
int64_t result = desc.byte_size();
if (!desc.has_varlen_slots()) {
return result;
}
result += varlen_byte_size(desc);
return result;
}
int64_t Tuple::varlen_byte_size(const TupleDescriptor& desc) const {
int64_t result = 0;
std::vector<SlotDescriptor*>::const_iterator slot = desc.string_slots().begin();
for (; slot != desc.string_slots().end(); ++slot) {
DCHECK((*slot)->type().is_string_type());
if (is_null((*slot)->null_indicator_offset())) {
continue;
}
const StringValue* string_val = get_string_slot((*slot)->tuple_offset());
result += string_val->len;
}
return result;
}
Tuple* Tuple::deep_copy(const TupleDescriptor& desc, MemPool* pool, bool convert_ptrs) {
Tuple* result = reinterpret_cast<Tuple*>(pool->allocate(desc.byte_size()));
deep_copy(result, desc, pool, convert_ptrs);
return result;
}
void Tuple::deep_copy(Tuple* dst, const TupleDescriptor& desc, MemPool* pool,
bool convert_ptrs) {
memory_copy(dst, this, desc.byte_size());
// allocate in the same pool and then copy all non-null string slots
for (std::vector<SlotDescriptor*>::const_iterator i = desc.string_slots().begin();
i != desc.string_slots().end(); ++i) {
DCHECK((*i)->type().is_string_type());
if (!dst->is_null((*i)->null_indicator_offset())) {
StringValue* string_v = dst->get_string_slot((*i)->tuple_offset());
if (string_v->len != 0) {
int offset = pool->total_allocated_bytes();
char* string_copy = reinterpret_cast<char*>(pool->allocate(string_v->len));
memory_copy(string_copy, string_v->ptr, string_v->len);
string_v->ptr = (convert_ptrs ? reinterpret_cast<char*>(offset) : string_copy);
}
}
}
}
Tuple* Tuple::dcopy_with_new(const TupleDescriptor& desc, MemPool* pool, int64_t* bytes) {
Tuple* result = reinterpret_cast<Tuple*>(pool->allocate(desc.byte_size()));
*bytes = dcopy_with_new(result, desc);
return result;
}
int64_t Tuple::dcopy_with_new(Tuple* dst, const TupleDescriptor& desc) {
memory_copy(dst, this, desc.byte_size());
int64_t bytes = 0;
// allocate in the same pool and then copy all non-null string slots
for (auto slot : desc.string_slots()) {
DCHECK(slot->type().is_string_type());
if (!dst->is_null(slot->null_indicator_offset())) {
StringValue* string_v = dst->get_string_slot(slot->tuple_offset());
bytes += string_v->len;
if (string_v->len != 0) {
char* string_copy = new char[string_v->len];
memory_copy(string_copy, string_v->ptr, string_v->len);
string_v->ptr = string_copy;
} else {
string_v->ptr = nullptr;
}
}
}
return bytes;
}
int64_t Tuple::release_string(const TupleDescriptor& desc) {
int64_t bytes = 0;
for (auto slot : desc.string_slots()) {
if (!is_null(slot->null_indicator_offset())) {
StringValue* string_v = get_string_slot(slot->tuple_offset());
delete[] string_v->ptr;
bytes += string_v->len;
}
}
return bytes;
}
void Tuple::deep_copy(const TupleDescriptor& desc, char** data, int* offset,
bool convert_ptrs) {
Tuple* dst = reinterpret_cast<Tuple*>(*data);
memory_copy(dst, this, desc.byte_size());
*data += desc.byte_size();
*offset += desc.byte_size();
for (std::vector<SlotDescriptor*>::const_iterator i = desc.string_slots().begin();
i != desc.string_slots().end(); ++i) {
DCHECK((*i)->type().is_string_type());
if (!dst->is_null((*i)->null_indicator_offset())) {
StringValue* string_v = dst->get_string_slot((*i)->tuple_offset());
memory_copy(*data, string_v->ptr, string_v->len);
string_v->ptr = (convert_ptrs ? reinterpret_cast<char*>(*offset) : *data);
*data += string_v->len;
*offset += string_v->len;
}
}
}
template <bool collect_string_vals>
void Tuple::materialize_exprs(
TupleRow* row, const TupleDescriptor& desc,
const std::vector<ExprContext*>& materialize_expr_ctxs, MemPool* pool,
std::vector<StringValue*>* non_null_var_len_values, int* total_var_len) {
if (collect_string_vals) {
non_null_var_len_values->clear();
*total_var_len = 0;
}
memset(this, 0, desc.num_null_bytes());
// Evaluate the output_slot_exprs and place the results in the tuples.
int mat_expr_index = 0;
for (int i = 0; i < desc.slots().size(); ++i) {
SlotDescriptor* slot_desc = desc.slots()[i];
if (!slot_desc->is_materialized()) {
continue;
}
// The FE ensures we don't get any TYPE_NULL expressions by picking an arbitrary type
// when necessary, but does not do this for slot descs.
// TODO: revisit this logic in the FE
PrimitiveType slot_type = slot_desc->type().type;
PrimitiveType expr_type = materialize_expr_ctxs[mat_expr_index]->root()->type().type;
if ((slot_type == TYPE_CHAR) || (slot_type == TYPE_VARCHAR) || (slot_type == TYPE_HLL)) {
DCHECK((expr_type == TYPE_CHAR) || (expr_type == TYPE_VARCHAR) || (expr_type == TYPE_HLL));
} else if ((slot_type == TYPE_DATE) || (slot_type == TYPE_DATETIME)) {
DCHECK((expr_type == TYPE_DATE) || (expr_type == TYPE_DATETIME));
} else {
DCHECK(slot_type == TYPE_NULL || slot_type == expr_type);
}
void* src = materialize_expr_ctxs[mat_expr_index]->get_value(row);
if (src != NULL) {
void* dst = get_slot(slot_desc->tuple_offset());
RawValue::write(src, dst, slot_desc->type(), pool);
if (collect_string_vals) {
if (slot_desc->type().is_string_type()) {
StringValue* string_val = reinterpret_cast<StringValue*>(dst);
non_null_var_len_values->push_back(string_val);
*total_var_len += string_val->len;
}
}
} else {
set_null(slot_desc->null_indicator_offset());
}
++mat_expr_index;
}
DCHECK_EQ(mat_expr_index, materialize_expr_ctxs.size());
}
template void Tuple::materialize_exprs<false>(TupleRow* row, const TupleDescriptor& desc,
const std::vector<ExprContext*>& materialize_expr_ctxs, MemPool* pool,
std::vector<StringValue*>* non_null_var_values, int* total_var_len);
template void Tuple::materialize_exprs<true>(TupleRow* row, const TupleDescriptor& desc,
const std::vector<ExprContext*>& materialize_expr_ctxs, MemPool* pool,
std::vector<StringValue*>* non_null_var_values, int* total_var_len);
}