serenity/Userland/Utilities/du.cpp

239 lines
8.3 KiB
C++
Raw Normal View History

2020-02-26 02:43:55 +00:00
/*
* Copyright (c) 2020, Fei Wu <f.eiwu@yahoo.com>
*
* SPDX-License-Identifier: BSD-2-Clause
2020-02-26 02:43:55 +00:00
*/
#include <AK/DeprecatedString.h>
#include <AK/LexicalPath.h>
#include <AK/NumberFormat.h>
2020-02-26 02:43:55 +00:00
#include <AK/Vector.h>
#include <LibCore/ArgsParser.h>
#include <LibCore/DateTime.h>
#include <LibCore/DirIterator.h>
#include <LibCore/File.h>
#include <LibCore/System.h>
#include <LibMain/Main.h>
2020-02-26 02:43:55 +00:00
#include <limits.h>
#include <string.h>
// Settings gathered from the command line that control how sizes are computed and reported.
struct DuOption {
    // Which stat timestamp, if any, is printed next to each reported entry.
    enum class TimeType {
        NotUsed,
        Modification,
        Access,
        Status
    };

    // Print sizes via human_readable_size() instead of as a block count.
    bool human_readable { false };
    // Same as above but Base10; only consulted when human_readable is false.
    bool human_readable_si { false };
    // Also report non-directory entries encountered while walking a directory.
    bool all { false };
    // Sum st_size instead of st_blocks * 512.
    bool apparent_size { false };
    // Positive: entries smaller than this are not reported.
    // Negative: entries larger than the magnitude are not reported.
    // Zero: no filtering.
    i64 threshold { 0 };
    TimeType time_type { TimeType::NotUsed };
    // Glob patterns matched (case-sensitively) against each entry's basename.
    Vector<DeprecatedString> excluded_patterns;
    // Divisor applied to the byte count when printing non-human-readable sizes.
    u64 block_size { 1024 };
    // Entries deeper than this below a command line argument are not reported.
    size_t max_depth { SIZE_MAX };
};
// Identity of a file system object as a (device, inode) pair; used as the key of s_visited_files.
struct VisitedFile {
dev_t device;
ino_t inode;
};
// Hashing and equality for VisitedFile so it can be stored in an AK::HashTable.
template<>
struct AK::Traits<VisitedFile> : public GenericTraits<VisitedFile> {
    // Combines the individual hashes of the device and inode numbers.
    static unsigned hash(VisitedFile const& visited_file)
    {
        auto const device_hash = u64_hash(visited_file.device);
        auto const inode_hash = u64_hash(visited_file.inode);
        return pair_int_hash(device_hash, inode_hash);
    }

    // Two entries are equal only when both the device and the inode match.
    static bool equals(VisitedFile const& a, VisitedFile const& b)
    {
        if (a.device != b.device)
            return false;
        return a.inode == b.inode;
    }
};
// (device, inode) pairs that print_space_usage() has already processed; a repeated visit contributes 0.
static HashTable<VisitedFile> s_visited_files;
// Fills `files` and `du_option` from the command line; `files` falls back to "." when no operand is given.
static ErrorOr<void> parse_args(Main::Arguments arguments, Vector<DeprecatedString>& files, DuOption& du_option);
// Walks `path`, prints the entries that qualify for reporting, and returns the byte total accumulated for `path`.
static u64 print_space_usage(DeprecatedString const& path, DuOption const& du_option, size_t current_depth, bool inside_dir = false);
2020-02-26 02:43:55 +00:00
// Entry point: parses the command line, then reports usage for every requested path in order.
ErrorOr<int> serenity_main(Main::Arguments arguments)
{
    DuOption du_option;
    Vector<DeprecatedString> files;
    TRY(parse_args(arguments, files, du_option));

    // Each command line operand is the root of its own walk and therefore starts at depth 0.
    for (size_t index = 0; index < files.size(); ++index)
        print_space_usage(files[index], du_option, 0);

    return 0;
}
// Parses the command line.
//
// On success `du_option` holds the selected options and `files` holds the paths to examine
// ("." when no file operand was given). Returns an error when the --exclude-from file cannot
// be opened or read, or when a block size of zero was requested.
ErrorOr<void> parse_args(Main::Arguments arguments, Vector<DeprecatedString>& files, DuOption& du_option)
{
    bool summarize = false;
    StringView pattern;
    StringView exclude_from;
    Vector<StringView> files_to_process;

    Core::ArgsParser::Option time_option {
        Core::ArgsParser::OptionArgumentMode::Required,
        "Show time of type time-type of any file in the directory, or any of its subdirectories. "
        "Available choices: mtime, modification, ctime, status, atime, access, use",
        "time",
        0,
        "time-type",
        [&du_option](StringView option) {
            if (option == "mtime"sv || option == "modification"sv)
                du_option.time_type = DuOption::TimeType::Modification;
            else if (option == "ctime"sv || option == "status"sv)
                du_option.time_type = DuOption::TimeType::Status;
            // "use" is a synonym for the access time (as in GNU du), not for the status change time.
            else if (option == "atime"sv || option == "access"sv || option == "use"sv)
                du_option.time_type = DuOption::TimeType::Access;
            else
                return false;
            return true;
        }
    };

    Core::ArgsParser::Option block_size_1k_option {
        Core::ArgsParser::OptionArgumentMode::None,
        "Equivalent to `--block-size 1024`",
        nullptr,
        'k',
        nullptr,
        [&du_option](StringView) {
            du_option.block_size = 1024;
            return true;
        }
    };

    Core::ArgsParser args_parser;
    args_parser.set_general_help("Display actual or apparent disk usage of files or directories.");
    args_parser.add_option(du_option.all, "Write counts for all files, not just directories", "all", 'a');
    args_parser.add_option(du_option.apparent_size, "Print apparent sizes, rather than disk usage", "apparent-size", 0);
    args_parser.add_option(du_option.human_readable, "Print human-readable sizes", "human-readable", 'h');
    args_parser.add_option(du_option.human_readable_si, "Print human-readable sizes in SI units", "si", 0);
    args_parser.add_option(du_option.max_depth, "Print the total for a directory or file only if it is N or fewer levels below the command line argument", "max-depth", 'd', "N");
    args_parser.add_option(summarize, "Display only a total for each argument", "summarize", 's');
    args_parser.add_option(du_option.threshold, "Exclude entries smaller than size if positive, or entries greater than size if negative", "threshold", 't', "size");
    args_parser.add_option(move(time_option));
    args_parser.add_option(pattern, "Exclude files that match pattern", "exclude", 0, "pattern");
    args_parser.add_option(exclude_from, "Exclude files that match any pattern in file", "exclude-from", 'X', "file");
    args_parser.add_option(du_option.block_size, "Outputs file sizes as the required blocks with the given size (defaults to 1024)", "block-size", 'B', "size");
    args_parser.add_option(move(block_size_1k_option));
    args_parser.add_positional_argument(files_to_process, "File to process", "file", Core::ArgsParser::Required::No);
    args_parser.parse(arguments);

    // Sizes are later divided by the block size, so a value of zero must be rejected up front.
    if (du_option.block_size == 0)
        return Error::from_string_literal("Block size must be greater than zero");

    // Summarizing is the same as reporting only the command line arguments themselves.
    if (summarize)
        du_option.max_depth = 0;

    if (!pattern.is_empty())
        du_option.excluded_patterns.append(pattern);

    // The exclusion file holds one pattern per line.
    if (!exclude_from.is_empty()) {
        auto file = TRY(Core::File::open(exclude_from, Core::File::OpenMode::Read));
        auto const buff = TRY(file->read_until_eof());
        if (!buff.is_empty()) {
            DeprecatedString patterns = DeprecatedString::copy(buff, Chomp);
            du_option.excluded_patterns.extend(patterns.split('\n'));
        }
    }

    for (auto const& file : files_to_process)
        files.append(file);

    // Without any file operand, report on the current directory.
    if (files.is_empty())
        files.append(".");

    return {};
}
// Recursively computes the space used by `path` and prints one line for each entry that
// qualifies for reporting.
//
// path:          file or directory to examine (symbolic links are not followed, lstat is used).
// du_option:     options selected on the command line.
// current_depth: number of directory levels between `path` and the command line argument.
// inside_dir:    true when `path` was discovered while iterating a directory.
//
// Returns the number of bytes attributed to `path`, including everything below it. Returns 0
// when the entry cannot be stat'ed, matches an exclusion pattern, was already counted under
// another name, or is a directory that cannot be read.
u64 print_space_usage(DeprecatedString const& path, DuOption const& du_option, size_t current_depth, bool inside_dir)
{
    auto path_stat_or_error = Core::System::lstat(path);
    if (path_stat_or_error.is_error()) {
        warnln("du: cannot stat '{}': {}", path, path_stat_or_error.release_error());
        return 0;
    }
    auto path_stat = path_stat_or_error.release_value();

    // Apply the exclusion patterns before doing anything else with the entry: an excluded
    // directory must not be descended into (its children would otherwise still be printed),
    // and an excluded name must not be recorded as visited, since that would hide a
    // non-excluded hard link to the same inode.
    auto const basename = LexicalPath::basename(path);
    for (auto const& pattern : du_option.excluded_patterns) {
        if (basename.matches(pattern, CaseSensitivity::CaseSensitive))
            return 0;
    }

    // Count every (device, inode) pair only once, so hard links are not counted twice.
    VisitedFile visited_file { path_stat.st_dev, path_stat.st_ino };
    if (s_visited_files.contains(visited_file))
        return 0;
    s_visited_files.set(visited_file);

    u64 size = 0;
    bool const is_directory = S_ISDIR(path_stat.st_mode);
    if (is_directory) {
        auto di = Core::DirIterator(path, Core::DirIterator::SkipParentAndBaseDir);
        if (di.has_error()) {
            auto error = di.error();
            warnln("du: cannot read directory '{}': {}", path, error);
            return 0;
        }

        while (di.has_next()) {
            auto const child_path = di.next_full_path();
            size += print_space_usage(child_path, du_option, current_depth + 1, true);
        }
    }

    if (!du_option.apparent_size) {
        // st_blocks is treated as a count of 512-byte units. Widen before multiplying so the
        // product is computed in 64 bits regardless of how wide blkcnt_t is.
        constexpr u64 block_size = 512;
        size += static_cast<u64>(path_stat.st_blocks) * block_size;
    } else {
        size += path_stat.st_size;
    }

    bool const is_beyond_depth = current_depth > du_option.max_depth;
    bool const is_inner_file = inside_dir && !is_directory;

    bool is_outside_threshold = false;
    if (du_option.threshold > 0) {
        is_outside_threshold = size < static_cast<u64>(du_option.threshold);
    } else if (du_option.threshold < 0) {
        // Take the magnitude in unsigned arithmetic; negating the most negative i64 would overflow.
        auto const magnitude = static_cast<u64>(0) - static_cast<u64>(du_option.threshold);
        is_outside_threshold = size > magnitude;
    }

    // All of these still count towards the full size, they are just not reported on individually.
    if (is_beyond_depth || (is_inner_file && !du_option.all) || is_outside_threshold)
        return size;

    if (du_option.human_readable) {
        out("{}", human_readable_size(size));
    } else if (du_option.human_readable_si) {
        out("{}", human_readable_size(size, AK::HumanReadableBasedOn::Base10));
    } else {
        out("{}", ceil_div(size, du_option.block_size));
    }

    if (du_option.time_type == DuOption::TimeType::NotUsed) {
        outln("\t{}", path);
    } else {
        // Modification time is the fallback for any time type not handled explicitly below.
        auto time = path_stat.st_mtime;
        switch (du_option.time_type) {
        case DuOption::TimeType::Access:
            time = path_stat.st_atime;
            break;
        case DuOption::TimeType::Status:
            time = path_stat.st_ctime;
            break;
        default:
            break;
        }

        auto const formatted_time = Core::DateTime::from_timestamp(time).to_deprecated_string();
        outln("\t{}\t{}", formatted_time, path);
    }

    return size;
}