// Licensed to the Apache Software Foundation (ASF) under one // or more contributor license agreements. See the NOTICE file // distributed with this work for additional information // regarding copyright ownership. The ASF licenses this file // to you under the Apache License, Version 2.0 (the // "License"); you may not use this file except in compliance // with the License. You may obtain a copy of the License at // // http://www.apache.org/licenses/LICENSE-2.0 // // Unless required by applicable law or agreed to in writing, // software distributed under the License is distributed on an // "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY // KIND, either express or implied. See the License for the // specific language governing permissions and limitations // under the License. #include "util/file_utils.h" #include #include #include #include #include #include #include #include #include #include #include "env/env.h" #include "gutil/strings/split.h" #include "gutil/strings/strip.h" #include "gutil/strings/substitute.h" #include "olap/file_helper.h" #include "runtime/thread_context.h" #include "util/defer_op.h" namespace doris { using strings::Substitute; Status FileUtils::create_dir(const std::string& path, Env* env) { return env->create_dirs(path); } Status FileUtils::create_dir(const std::string& dir_path) { return create_dir(dir_path, Env::Default()); } Status FileUtils::remove_all(const std::string& file_path) { return Env::Default()->delete_dir(file_path); } Status FileUtils::remove(const std::string& path) { if (!Env::Default()->path_exists(path).ok()) { LOG(WARNING) << "path does exist: " << path; return Status::OK(); } bool is_dir; RETURN_IF_ERROR(Env::Default()->is_directory(path, &is_dir)); if (is_dir) { return Env::Default()->delete_dir(path); } else { return Env::Default()->delete_file(path); } } Status FileUtils::remove_paths(const std::vector& paths) { for (const std::string& p : paths) { RETURN_IF_ERROR(remove(p)); } return Status::OK(); } Status FileUtils::list_files(Env* env, const std::string& dir, std::vector* files) { auto cb = [files](const char* name) -> bool { if (!is_dot_or_dotdot(name)) { files->push_back(name); } return true; }; return env->iterate_dir(dir, cb); } Status FileUtils::list_dirs_files(const std::string& path, std::set* dirs, std::set* files, Env* env) { auto cb = [path, dirs, files, env](const char* name) -> bool { if (is_dot_or_dotdot(name)) { return true; } std::string temp_path = path + "/" + name; bool is_dir; auto st = env->is_directory(temp_path, &is_dir); if (st.ok()) { if (is_dir) { if (dirs != nullptr) { dirs->insert(name); } } else if (files != nullptr) { files->insert(name); } } else { LOG(WARNING) << "check path " << path << "is directory error: " << st.to_string(); } return true; }; return env->iterate_dir(path, cb); } Status FileUtils::get_children_count(Env* env, const std::string& dir, int64_t* count) { auto cb = [count](const char* name) -> bool { if (!is_dot_or_dotdot(name)) { *count += 1; } return true; }; return env->iterate_dir(dir, cb); } bool FileUtils::is_dir(const std::string& file_path, Env* env) { bool ret; if (env->is_directory(file_path, &ret).ok()) { return ret; } return false; } bool FileUtils::is_dir(const std::string& path) { return is_dir(path, Env::Default()); } // Through proc filesystem std::string FileUtils::path_of_fd(int fd) { const int PATH_SIZE = 256; char proc_path[PATH_SIZE]; snprintf(proc_path, PATH_SIZE, "/proc/self/fd/%d", fd); char path[PATH_SIZE]; if (readlink(proc_path, path, PATH_SIZE) < 0) { path[0] = '\0'; } return path; } Status FileUtils::split_paths(const char* path, std::vector* path_vec) { path_vec->clear(); *path_vec = strings::Split(path, ";", strings::SkipWhitespace()); for (std::vector::iterator it = path_vec->begin(); it != path_vec->end();) { StripWhiteSpace(&(*it)); it->erase(it->find_last_not_of("/") + 1); if (it->size() == 0) { it = path_vec->erase(it); } else { ++it; } } // Check if std::sort(path_vec->begin(), path_vec->end()); if (std::unique(path_vec->begin(), path_vec->end()) != path_vec->end()) { return Status::InternalError("Same path in path.[path={}]", path); } if (path_vec->size() == 0) { return Status::InternalError("Size of vector after split is zero.[path={}]", path); } return Status::OK(); } Status FileUtils::copy_file(const std::string& src_path, const std::string& dest_path) { return Env::Default()->copy_path(src_path, dest_path); } Status FileUtils::md5sum(const std::string& file, std::string* md5sum) { int fd = open(file.c_str(), O_RDONLY); if (fd < 0) { return Status::InternalError("failed to open file"); } struct stat statbuf; if (fstat(fd, &statbuf) < 0) { close(fd); return Status::InternalError("failed to stat file"); } size_t file_len = statbuf.st_size; CONSUME_THREAD_MEM_TRACKER(file_len); void* buf = mmap(0, file_len, PROT_READ, MAP_SHARED, fd, 0); unsigned char result[MD5_DIGEST_LENGTH]; MD5((unsigned char*)buf, file_len, result); munmap(buf, file_len); RELEASE_THREAD_MEM_TRACKER(file_len); std::stringstream ss; for (int32_t i = 0; i < MD5_DIGEST_LENGTH; i++) { ss << std::setfill('0') << std::setw(2) << std::hex << (int)result[i]; } ss >> *md5sum; close(fd); return Status::OK(); } Status FileUtils::mtime(const std::string& file, time_t* m_time) { int fd = open(file.c_str(), O_RDONLY); if (fd < 0) { return Status::InternalError("failed to open file"); } Defer defer {[&]() { close(fd); }}; struct stat statbuf; if (fstat(fd, &statbuf) < 0) { return Status::InternalError("failed to stat file"); } *m_time = statbuf.st_mtime; return Status::OK(); } bool FileUtils::check_exist(const std::string& path) { return Env::Default()->path_exists(path).ok(); } Status FileUtils::canonicalize(const std::string& path, std::string* real_path) { return Env::Default()->canonicalize(path, real_path); } } // namespace doris