osquery-1/osquery/filesystem/globbing.cpp
2015-04-10 18:04:26 -07:00

358 lines
12 KiB
C++

/*
* Copyright (c) 2014, Facebook, Inc.
* All rights reserved.
*
* This source code is licensed under the BSD-style license found in the
* LICENSE file in the root directory of this source tree. An additional grant
* of patent rights can be found in the PATENTS file in the same directory.
*
*/
#include <boost/algorithm/string/join.hpp>
#include <boost/filesystem/operations.hpp>
#include <osquery/core.h>
#include <osquery/filesystem.h>
namespace fs = boost::filesystem;
namespace osquery {
/**
* @brief Drill down recursively and list all sub files
*
* This functions purpose is to take a path with no wildcards
* and it will recursively go through all files and and return
* them in the results vector.
*
* @param fs_path The entire resolved path
* @param results The vector where results will be returned
* @param rec_depth How many recursions deep the current execution is at
*
* @return An instance of osquery::Status indicating the success of failure of
* the operation
*/
Status doubleStarTraversal(const fs::path& fs_path,
std::vector<std::string>& results,
ReturnSetting setting,
unsigned int rec_depth) {
if (rec_depth >= kMaxDirectoryTraversalDepth) {
return Status(2, fs_path.string().c_str());
}
// List files first
if (setting & REC_LIST_FILES) {
Status stat = listFilesInDirectory(fs_path, results);
if (!stat.ok()) {
return Status(0, "OK");
}
}
std::vector<std::string> folders;
Status stat = listDirectoriesInDirectory(fs_path, folders);
if (!stat.ok()) {
return Status(0, "OK");
}
if (setting & REC_LIST_FOLDERS) {
results.push_back(fs_path.string());
}
for (const auto& folder : folders) {
if (fs::is_symlink(folder)) {
continue;
}
stat = doubleStarTraversal(folder, results, setting, rec_depth + 1);
if (!stat.ok() && stat.getCode() == 2) {
return stat;
}
}
return Status(0, "OK");
}
/**
* @brief Resolve the last component of a file path
*
* This function exists because unlike the other parts of of a file
* path, which should only resolve to folder, a wildcard at the end
* means to list all files in that directory, as does just listing
* folder. Also, a double means to drill down recursively into that
* that folder and list all sub file.
*
* @param fs_path The entire resolved path (except last component)
* @param results The vector where results will be returned
* @param components A path, split by forward slashes
* @param rec_depth How many recursions deep the current execution is at
*
* @return An instance of osquery::Status indicating the success of failure of
* the operation
*/
Status resolveLastPathComponent(const fs::path& fs_path,
std::vector<std::string>& results,
ReturnSetting setting,
const std::vector<std::string>& components,
unsigned int rec_depth) {
// Is the last component a double star?
if (components[components.size() - 1] == kWildcardCharacterRecursive) {
if (setting & REC_EVENT_OPT) {
results.push_back(fs_path.parent_path().string());
return Status(0, "OK");
} else {
Status stat = doubleStarTraversal(
fs_path.parent_path(), results, setting, rec_depth);
return stat;
}
}
try {
// Is the path a file
if ((setting & (REC_EVENT_OPT | REC_LIST_FILES)) > 0 &&
fs::is_regular_file(fs_path)) {
results.push_back(fs_path.string());
return Status(0, "OK");
}
} catch (const fs::filesystem_error& e) {
return Status(0, "OK");
}
std::vector<std::string> files;
std::vector<std::string> folders;
Status stat_file = listFilesInDirectory(fs_path.parent_path(), files);
Status stat_fold = listDirectoriesInDirectory(fs_path.parent_path(), folders);
// Is the last component a wildcard?
if (components[components.size() - 1] == kWildcardCharacter) {
if (setting & REC_EVENT_OPT) {
results.push_back(fs_path.parent_path().string());
return Status(0, "OK");
}
if (setting & REC_LIST_FOLDERS) {
results.push_back(fs_path.parent_path().string());
for (const auto& fold : folders) {
results.push_back(fold);
}
}
if (setting & REC_LIST_FILES) {
for (const auto& file : files) {
results.push_back(file);
}
}
return Status(0, "OK");
}
std::string processed_path =
"/" +
boost::algorithm::join(
std::vector<std::string>(components.begin(), components.end() - 1),
"/");
// Is this a (.*)% type file match
if (components[components.size() - 1].find(kWildcardCharacter, 1) !=
std::string::npos &&
components[components.size() - 1][0] != kWildcardCharacter[0]) {
std::string prefix =
processed_path + "/" +
components[components.size() - 1].substr(
0, components[components.size() - 1].find(kWildcardCharacter, 1));
if (setting & REC_LIST_FOLDERS) {
for (const auto& fold : folders) {
if (fold.find(prefix, 0) != 0) {
continue;
}
results.push_back(fold);
}
}
if (setting & REC_LIST_FILES || setting & REC_EVENT_OPT) {
for (const auto& file : files) {
if (file.find(prefix, 0) != 0) {
continue;
}
results.push_back(file);
}
}
// Should be a return here?
return Status(0, "OK");
}
// Is this a %(.*) type file match
if (components[components.size() - 1][0] == kWildcardCharacter[0]) {
std::string suffix = components[components.size() - 1].substr(1);
if (setting & REC_LIST_FOLDERS) {
for (const auto& fold : folders) {
std::string file_name =
boost::filesystem::path(fold).filename().string();
size_t pos = file_name.find(suffix);
if (pos != std::string::npos &&
pos + suffix.length() == file_name.length()) {
results.push_back(fold);
}
}
}
if (setting & REC_LIST_FILES || setting & REC_EVENT_OPT) {
for (const auto& file : files) {
boost::filesystem::path p(file);
std::string file_name = p.filename().string();
size_t pos = file_name.find(suffix);
if (pos != std::string::npos &&
pos + suffix.length() == file_name.length()) {
results.push_back(file);
}
}
}
return Status(0, "OK");
}
// Back out if this path doesn't exist due to invalid path
if (!(pathExists(fs_path).ok())) {
return Status(0, "OK");
}
// Is the path a directory
if (fs::is_directory(fs_path)) {
results.push_back(fs_path.string());
return Status(0, "OK");
}
return Status(1, "UNKNOWN FILE TYPE");
}
/**
* @brief List all files in a directory recursively
*
* This is an overloaded version of the exported `resolveFilePattern`. This
* version is used internally to facilitate the tracking of the recursion
* depth.
*
* @param results The vector where results will be returned
* @param components A path, split by forward slashes
* @param processed_index What index of components has been resolved so far
* @param rec_depth How many recursions deep the current execution is at
*
* @return An instance of osquery::Status indicating the success of failure of
* the operation
*/
Status resolveFilePattern(std::vector<std::string> components,
std::vector<std::string>& results,
ReturnSetting setting = REC_LIST_FILES,
unsigned int processed_index = 0,
unsigned int rec_depth = 0) {
// Stop recursing here if we've reached out max depth
if (rec_depth >= kMaxDirectoryTraversalDepth) {
return Status(2, "MAX_DEPTH");
}
// Handle all parts of the path except last because then we want to get files,
// not directories
for (auto i = processed_index; i < components.size() - 1; i++) {
// If we encounter a full recursion, that is invalid because it is not
// the last component. So return.
if (components[i] == kWildcardCharacterRecursive) {
return Status(1, kWildcardCharacterRecursive + " NOT LAST COMPONENT");
}
// Create a vector to hold all the folders in the current folder
// Build the path we're at out of components
std::vector<std::string> folders;
std::string processed_path =
"/" +
boost::algorithm::join(std::vector<std::string>(components.begin(),
components.begin() + i),
"/");
Status stat = listDirectoriesInDirectory(processed_path, folders);
// If we couldn't list the directories it's probably because
// the path is invalid (or we don't have permission). Return
// here because this branch is no good. This is not an error
if (!stat.ok()) {
return Status(0, "OK");
}
// If we just have a wildcard character then we will recurse though
// all folders we find
if (components[i] == kWildcardCharacter) {
for (const auto& dir : folders) {
boost::filesystem::path p(dir);
components[i] = p.filename().string();
Status stat = resolveFilePattern(
components, results, setting, i + 1, rec_depth + 1);
if (!stat.ok() && stat.getCode() == 2) {
return stat;
}
}
// Our subcalls that handle processing are now complete, return
return Status(0, "OK");
// The case of (.*)%
} else if (components[i].find(kWildcardCharacter, 1) != std::string::npos &&
components[i][0] != kWildcardCharacter[0]) {
std::string prefix =
processed_path + "/" +
components[i].substr(0, components[i].find(kWildcardCharacter, 1));
for (const auto& dir : folders) {
if (dir.find(prefix, 0) != 0) {
continue;
}
boost::filesystem::path p(dir);
components[i] = p.filename().string();
Status stat = resolveFilePattern(
components, results, setting, i + 1, rec_depth + 1);
if (!stat.ok() && stat.getCode() == 2) {
return stat;
}
}
return Status(0, "OK");
// The case of %(.*)
} else if (components[i][0] == kWildcardCharacter[0]) {
std::string suffix = components[i].substr(1);
for (const auto& dir : folders) {
boost::filesystem::path p(dir);
std::string folder_name = p.filename().string();
size_t pos = folder_name.find(suffix);
if (pos != std::string::npos &&
pos + suffix.length() == folder_name.length()) {
components[i] = p.filename().string();
Status stat = resolveFilePattern(
components, results, setting, i + 1, rec_depth + 1);
if (!stat.ok() && stat.getCode() == 2) {
return stat;
}
}
}
return Status(0, "OK");
} else {
}
}
// At this point, all of our call paths have been resolved, so know we want to
// list the files at this point or do our ** traversal
return resolveLastPathComponent("/" + boost::algorithm::join(components, "/"),
results,
setting,
components,
rec_depth);
}
Status resolveFilePattern(const fs::path& fs_path,
std::vector<std::string>& results) {
if (fs_path.string()[0] != '/') {
return resolveFilePattern(
split(fs::current_path().string() + "/" + fs_path.string(), "/"),
results);
}
return resolveFilePattern(split(fs_path.string(), "/"), results);
}
Status resolveFilePattern(const fs::path& fs_path,
std::vector<std::string>& results,
ReturnSetting setting) {
if (fs_path.string()[0] != '/') {
return resolveFilePattern(
split(fs::current_path().string() + "/" + fs_path.string(), "/"),
results,
setting);
}
return resolveFilePattern(split(fs_path.string(), "/"), results, setting);
}
}