238 lines
6.7 KiB
C++
238 lines
6.7 KiB
C++
// Licensed to the Apache Software Foundation (ASF) under one
|
|
// or more contributor license agreements. See the NOTICE file
|
|
// distributed with this work for additional information
|
|
// regarding copyright ownership. The ASF licenses this file
|
|
// to you under the Apache License, Version 2.0 (the
|
|
// "License"); you may not use this file except in compliance
|
|
// with the License. You may obtain a copy of the License at
|
|
//
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
//
|
|
// Unless required by applicable law or agreed to in writing,
|
|
// software distributed under the License is distributed on an
|
|
// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
|
|
// KIND, either express or implied. See the License for the
|
|
// specific language governing permissions and limitations
|
|
// under the License.
|
|
|
|
#include "util/file_utils.h"
|
|
|
|
#include <dirent.h>
|
|
#include <openssl/md5.h>
|
|
#include <sys/mman.h>
|
|
#include <sys/stat.h>
|
|
#include <sys/types.h>
|
|
|
|
#include <algorithm>
|
|
#include <filesystem>
|
|
#include <iomanip>
|
|
#include <memory>
|
|
#include <sstream>
|
|
|
|
#include "env/env.h"
|
|
#include "gutil/strings/split.h"
|
|
#include "gutil/strings/strip.h"
|
|
#include "gutil/strings/substitute.h"
|
|
#include "olap/file_helper.h"
|
|
#include "runtime/thread_context.h"
|
|
#include "util/defer_op.h"
|
|
|
|
namespace doris {
|
|
|
|
using strings::Substitute;
|
|
|
|
// Creates the directory `path` through the supplied `env`.
// Delegates to Env::create_dirs and returns its status unchanged.
Status FileUtils::create_dir(const std::string& path, Env* env) {
    Status create_status = env->create_dirs(path);
    return create_status;
}
|
|
|
|
// Convenience overload: creates `dir_path` using the Env returned by Env::Default().
Status FileUtils::create_dir(const std::string& dir_path) {
    Env* default_env = Env::Default();
    return create_dir(dir_path, default_env);
}
|
|
|
|
// Deletes `file_path` by handing it to Env::delete_dir on the default Env.
// The status of that call is returned as-is.
Status FileUtils::remove_all(const std::string& file_path) {
    Env* default_env = Env::Default();
    return default_env->delete_dir(file_path);
}
|
|
|
|
// Removes `path`, dispatching to delete_dir or delete_file depending on its type.
//
// Any non-OK result from Env::path_exists is treated as "nothing to remove": a warning
// is logged and Status::OK() is returned, so removing a missing path is not an error.
// Returns the error from Env::is_directory if the path type cannot be determined,
// otherwise the status of the underlying delete call.
Status FileUtils::remove(const std::string& path) {
    Env* env = Env::Default();

    if (!env->path_exists(path).ok()) {
        LOG(WARNING) << "path does not exist: " << path;
        return Status::OK();
    }

    // Initialized so the value is well-defined even if is_directory leaves it untouched.
    bool is_directory = false;
    RETURN_IF_ERROR(env->is_directory(path, &is_directory));

    return is_directory ? env->delete_dir(path) : env->delete_file(path);
}
|
|
|
|
// Removes every entry of `paths` in order via FileUtils::remove.
// Stops at the first failure and returns that status; entries after it are not processed.
// Returns Status::OK() when all removals succeed (including for an empty list).
Status FileUtils::remove_paths(const std::vector<std::string>& paths) {
    for (const auto& target : paths) {
        RETURN_IF_ERROR(remove(target));
    }
    return Status::OK();
}
|
|
|
|
// Appends the name of every entry of `dir` (except "." and "..") to `files`.
// `files` is not cleared first; names are pushed in the order Env::iterate_dir reports them.
// Returns the status of Env::iterate_dir.
Status FileUtils::list_files(Env* env, const std::string& dir, std::vector<std::string>* files) {
    auto collect_entry = [files](const char* entry) -> bool {
        if (is_dot_or_dotdot(entry)) {
            return true;
        }
        files->emplace_back(entry);
        // Always true: presumably this tells iterate_dir to keep going -- confirm against Env.
        return true;
    };
    return env->iterate_dir(dir, collect_entry);
}
|
|
|
|
// Lists the direct children of `path`, sorting their names into `dirs` and `files`.
//
// path:  directory to iterate.
// dirs:  receives names of children that are directories; may be nullptr to skip them.
// files: receives names of all other children; may be nullptr to skip them.
// env:   environment used for iteration and type checks.
//
// "." and ".." are ignored. A child whose type cannot be determined is logged and skipped
// rather than failing the whole listing. Returns the status of Env::iterate_dir.
Status FileUtils::list_dirs_files(const std::string& path, std::set<std::string>* dirs,
                                  std::set<std::string>* files, Env* env) {
    auto classify_entry = [path, dirs, files, env](const char* name) -> bool {
        if (is_dot_or_dotdot(name)) {
            return true;
        }

        const std::string child_path = path + "/" + name;
        bool child_is_dir = false;
        auto st = env->is_directory(child_path, &child_is_dir);
        if (!st.ok()) {
            // Report the child that actually failed, not the parent directory.
            LOG(WARNING) << "check path " << child_path
                         << " is directory error: " << st.to_string();
            return true;
        }

        if (child_is_dir) {
            if (dirs != nullptr) {
                dirs->insert(name);
            }
        } else if (files != nullptr) {
            files->insert(name);
        }
        return true;
    };

    return env->iterate_dir(path, classify_entry);
}
|
|
|
|
// Adds the number of entries in `dir` (excluding "." and "..") to `*count`.
// NOTE: `*count` is incremented, never reset, so the caller is responsible for
// initializing it before the call.
// Returns the status of Env::iterate_dir.
Status FileUtils::get_children_count(Env* env, const std::string& dir, int64_t* count) {
    auto tally_entry = [count](const char* entry) -> bool {
        if (is_dot_or_dotdot(entry)) {
            return true;
        }
        ++(*count);
        return true;
    };
    return env->iterate_dir(dir, tally_entry);
}
|
|
|
|
bool FileUtils::is_dir(const std::string& file_path, Env* env) {
|
|
bool ret;
|
|
if (env->is_directory(file_path, &ret).ok()) {
|
|
return ret;
|
|
}
|
|
|
|
return false;
|
|
}
|
|
|
|
bool FileUtils::is_dir(const std::string& path) {
|
|
return is_dir(path, Env::Default());
|
|
}
|
|
|
|
// Through proc filesystem
|
|
std::string FileUtils::path_of_fd(int fd) {
|
|
const int PATH_SIZE = 256;
|
|
char proc_path[PATH_SIZE];
|
|
snprintf(proc_path, PATH_SIZE, "/proc/self/fd/%d", fd);
|
|
char path[PATH_SIZE];
|
|
if (readlink(proc_path, path, PATH_SIZE) < 0) {
|
|
path[0] = '\0';
|
|
}
|
|
return path;
|
|
}
|
|
|
|
// Splits the ';'-separated list `path` into individual paths stored in `path_vec`.
//
// Any previous content of `path_vec` is replaced. Each piece is whitespace-stripped and
// has its trailing '/' characters removed; pieces that end up empty are dropped.
// On success the paths are left sorted.
//
// Returns InternalError if the same path appears more than once or if no path remains
// after splitting; Status::OK() otherwise.
Status FileUtils::split_paths(const char* path, std::vector<std::string>* path_vec) {
    *path_vec = strings::Split(path, ";", strings::SkipWhitespace());

    for (auto it = path_vec->begin(); it != path_vec->end();) {
        StripWhiteSpace(&(*it));

        // Drop trailing slashes. For an entry made only of '/', find_last_not_of returns
        // npos and npos + 1 wraps to 0, so the entry is erased completely.
        it->erase(it->find_last_not_of('/') + 1);
        if (it->empty()) {
            it = path_vec->erase(it);
        } else {
            ++it;
        }
    }

    // Check if the same path is listed more than once: after sorting, duplicates are
    // adjacent. adjacent_find only inspects the range, so the vector is left intact
    // (std::unique would shuffle it and leave unspecified elements at the tail).
    std::sort(path_vec->begin(), path_vec->end());
    if (std::adjacent_find(path_vec->begin(), path_vec->end()) != path_vec->end()) {
        return Status::InternalError("Same path in path.[path={}]", path);
    }

    if (path_vec->empty()) {
        return Status::InternalError("Size of vector after split is zero.[path={}]", path);
    }

    return Status::OK();
}
|
|
|
|
// Copies `src_path` to `dest_path` via Env::copy_path on the default Env.
// The status of that call is returned unchanged.
Status FileUtils::copy_file(const std::string& src_path, const std::string& dest_path) {
    Env* default_env = Env::Default();
    return default_env->copy_path(src_path, dest_path);
}
|
|
|
|
// Computes the MD5 digest of the whole content of `file` and stores it in `*md5sum`
// as a lowercase hex string (two digits per digest byte).
//
// The file is mapped read-only with mmap and hashed in one pass; the mapped size is
// reported to the thread memory tracker for the duration of the mapping.
//
// Returns InternalError if the file cannot be opened, stat'ed or mapped.
Status FileUtils::md5sum(const std::string& file, std::string* md5sum) {
    int fd = open(file.c_str(), O_RDONLY);
    if (fd < 0) {
        return Status::InternalError("failed to open file");
    }
    // Close the descriptor on every exit path, same pattern as FileUtils::mtime.
    Defer close_fd {[&]() { close(fd); }};

    struct stat statbuf;
    if (fstat(fd, &statbuf) < 0) {
        return Status::InternalError("failed to stat file");
    }
    size_t file_len = statbuf.st_size;

    unsigned char result[MD5_DIGEST_LENGTH];
    if (file_len == 0) {
        // mmap() rejects a zero-length mapping, so hash the empty input directly.
        const unsigned char empty = 0;
        MD5(&empty, 0, result);
    } else {
        CONSUME_THREAD_MEM_TRACKER(file_len);
        void* buf = mmap(nullptr, file_len, PROT_READ, MAP_SHARED, fd, 0);
        if (buf == MAP_FAILED) {
            // Never hand MAP_FAILED to MD5(); undo the tracker accounting and bail out.
            RELEASE_THREAD_MEM_TRACKER(file_len);
            return Status::InternalError("failed to mmap file");
        }
        MD5(static_cast<const unsigned char*>(buf), file_len, result);
        munmap(buf, file_len);
        RELEASE_THREAD_MEM_TRACKER(file_len);
    }

    std::stringstream ss;
    for (int32_t i = 0; i < MD5_DIGEST_LENGTH; i++) {
        ss << std::setfill('0') << std::setw(2) << std::hex << static_cast<int>(result[i]);
    }
    *md5sum = ss.str();

    return Status::OK();
}
|
|
|
|
// Stores the last-modification time of `file` in `*m_time`.
// The file is opened read-only and queried with fstat; the descriptor is closed on
// every exit path by the Defer guard.
// Returns InternalError if the file cannot be opened or stat'ed.
Status FileUtils::mtime(const std::string& file, time_t* m_time) {
    const int fd = open(file.c_str(), O_RDONLY);
    if (fd < 0) {
        return Status::InternalError("failed to open file");
    }
    Defer close_fd {[&]() { close(fd); }};

    struct stat file_stat;
    const int rc = fstat(fd, &file_stat);
    if (rc < 0) {
        return Status::InternalError("failed to stat file");
    }

    *m_time = file_stat.st_mtime;
    return Status::OK();
}
|
|
|
|
bool FileUtils::check_exist(const std::string& path) {
|
|
return Env::Default()->path_exists(path).ok();
|
|
}
|
|
|
|
// Canonicalizes `path` into `*real_path` by delegating to Env::canonicalize on the
// default Env. The status of that call is returned unchanged.
Status FileUtils::canonicalize(const std::string& path, std::string* real_path) {
    Env* default_env = Env::Default();
    return default_env->canonicalize(path, real_path);
}
|
|
|
|
} // namespace doris
|