Files
doris/be/src/util/path_util.cpp
Mingyu Chen 2678afd2db [fix][improvement](fs) add HdfsIO profile and modification time (#21638)
Refactor the interface of create_file_reader

the file_size and mtime are merged into FileDescription, not in FileReaderOptions anymore.
Now the file handle cache can get correct file's modification time from FileDescription.
Add HdfsIO for hdfs file reader
pick from [Enhancement](multi-catalog) Add hdfs read statistics profile. #21442
2023-07-08 14:49:44 +08:00

95 lines
2.8 KiB
C++

// Licensed to the Apache Software Foundation (ASF) under one
// or more contributor license agreements. See the NOTICE file
// distributed with this work for additional information
// regarding copyright ownership. The ASF licenses this file
// to you under the Apache License, Version 2.0 (the
// "License"); you may not use this file except in compliance
// with the License. You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing,
// software distributed under the License is distributed on an
// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
// KIND, either express or implied. See the License for the
// specific language governing permissions and limitations
// under the License.
#include "util/path_util.h"
// Use the POSIX version of dirname(3). See `man 3 dirname`
#include <libgen.h>
#include "gutil/strings/split.h"
#include "gutil/strings/stringpiece.h"
#include "gutil/strings/strip.h"
using std::string;
using std::vector;
using strings::SkipEmpty;
using strings::Split;
namespace doris {
namespace path_util {
const string kTmpInfix = ".doristmp";
std::string join_path_segments(const string& a, const string& b) {
if (a.empty()) {
return b;
} else if (b.empty()) {
return a;
} else {
return StripSuffixString(a, "/") + "/" + StripPrefixString(b, "/");
}
}
std::vector<string> join_path_segments_v(const std::vector<string>& v, const string& s) {
std::vector<string> out;
for (const string& path : v) {
out.emplace_back(join_path_segments(path, s));
}
return out;
}
std::vector<string> split_path(const string& path) {
if (path.empty()) {
return {};
}
std::vector<string> segments;
if (path[0] == '/') {
segments.emplace_back("/");
}
std::vector<StringPiece> pieces = Split(path, "/", SkipEmpty());
for (const StringPiece& piece : pieces) {
segments.emplace_back(piece.data(), piece.size());
}
return segments;
}
// strdup use malloc to obtain memory for the new string, it should be freed with free.
// but std::unique_ptr use delete to free memory by default, so it should specify free memory using free
std::string dir_name(const string& path) {
std::vector<char> path_copy(path.c_str(), path.c_str() + path.size() + 1);
return dirname(&path_copy[0]);
}
std::string base_name(const string& path) {
std::vector<char> path_copy(path.c_str(), path.c_str() + path.size() + 1);
return basename(&path_copy[0]);
}
std::string file_extension(const string& path) {
string file_name = base_name(path);
if (file_name == "." || file_name == "..") {
return "";
}
string::size_type pos = file_name.rfind(".");
return pos == string::npos ? "" : file_name.substr(pos);
}
} // namespace path_util
} // namespace doris