2020-11-27 20:44:25 +03:30
|
|
|
/*
 * Copyright (c) 2020, Emanuel Sprung <emanuel.sprung@gmail.com>
 *
 * SPDX-License-Identifier: BSD-2-Clause
 */
|
|
|
|
|
2021-05-15 12:34:40 +02:00
|
|
|
#include <AK/Assertions.h>
|
2020-11-27 20:44:25 +03:30
|
|
|
#include <AK/ByteBuffer.h>
|
2021-01-23 21:58:14 -07:00
|
|
|
#include <AK/ScopeGuard.h>
|
2020-11-27 20:44:25 +03:30
|
|
|
#include <AK/String.h>
|
|
|
|
#include <AK/Utf8View.h>
|
|
|
|
#include <AK/Vector.h>
|
|
|
|
#include <LibCore/ArgsParser.h>
|
|
|
|
#include <LibCore/DirIterator.h>
|
|
|
|
#include <LibCore/File.h>
|
|
|
|
#include <LibRegex/Regex.h>
|
|
|
|
#include <stdio.h>
|
|
|
|
#include <unistd.h>
|
|
|
|
|
2020-11-28 18:10:56 +03:30
|
|
|
// How input that contains a NUL byte ("binary" input) is treated.
enum class BinaryFileMode {
    // Only report that the binary input matched; do not print the line itself.
    Binary,
    // Handle binary input exactly like text and print matching lines.
    Text,
    // Never report matches for binary input.
    Skip,
};
|
|
|
|
|
|
|
|
template<typename... Ts>
|
|
|
|
void fail(StringView format, Ts... args)
|
|
|
|
{
|
2021-05-31 15:43:25 +01:00
|
|
|
warn("\x1b[31m");
|
2020-11-28 18:10:56 +03:30
|
|
|
warnln(format, forward<Ts>(args)...);
|
2021-05-31 15:43:25 +01:00
|
|
|
warn("\x1b[0m");
|
2020-11-28 18:10:56 +03:30
|
|
|
abort();
|
|
|
|
}
|
|
|
|
|
2020-11-27 20:44:25 +03:30
|
|
|
int main(int argc, char** argv)
|
|
|
|
{
|
|
|
|
if (pledge("stdio rpath", nullptr) < 0) {
|
|
|
|
perror("pledge");
|
|
|
|
return 1;
|
|
|
|
}
|
|
|
|
|
|
|
|
Vector<const char*> files;
|
|
|
|
|
|
|
|
bool recursive { false };
|
|
|
|
bool use_ere { true };
|
|
|
|
const char* pattern = nullptr;
|
2020-11-28 18:10:56 +03:30
|
|
|
BinaryFileMode binary_mode { BinaryFileMode::Binary };
|
|
|
|
bool case_insensitive = false;
|
2021-01-23 22:11:19 -07:00
|
|
|
bool invert_match = false;
|
2020-11-27 20:44:25 +03:30
|
|
|
|
|
|
|
Core::ArgsParser args_parser;
|
|
|
|
args_parser.add_option(recursive, "Recursively scan files starting in working directory", "recursive", 'r');
|
|
|
|
args_parser.add_option(use_ere, "Extended regular expressions (default)", "extended-regexp", 'E');
|
|
|
|
args_parser.add_option(pattern, "Pattern", "regexp", 'e', "Pattern");
|
2020-11-28 18:10:56 +03:30
|
|
|
args_parser.add_option(case_insensitive, "Make matches case-insensitive", nullptr, 'i');
|
2021-01-23 22:11:19 -07:00
|
|
|
args_parser.add_option(invert_match, "Select non-matching lines", "invert-match", 'v');
|
2020-11-28 18:10:56 +03:30
|
|
|
args_parser.add_option(Core::ArgsParser::Option {
|
|
|
|
.requires_argument = true,
|
|
|
|
.help_string = "Action to take for binary files ([binary], text, skip)",
|
|
|
|
.long_name = "binary-mode",
|
|
|
|
.accept_value = [&](auto* str) {
|
2021-07-04 11:08:46 +02:00
|
|
|
if ("text"sv == str)
|
2020-11-28 18:10:56 +03:30
|
|
|
binary_mode = BinaryFileMode::Text;
|
2021-07-04 11:08:46 +02:00
|
|
|
else if ("binary"sv == str)
|
2020-11-28 18:10:56 +03:30
|
|
|
binary_mode = BinaryFileMode::Binary;
|
2021-07-04 11:08:46 +02:00
|
|
|
else if ("skip"sv == str)
|
2020-11-28 18:10:56 +03:30
|
|
|
binary_mode = BinaryFileMode::Skip;
|
|
|
|
else
|
|
|
|
return false;
|
|
|
|
return true;
|
|
|
|
},
|
|
|
|
});
|
|
|
|
args_parser.add_option(Core::ArgsParser::Option {
|
|
|
|
.requires_argument = false,
|
|
|
|
.help_string = "Treat binary files as text (same as --binary-mode text)",
|
|
|
|
.long_name = "text",
|
|
|
|
.short_name = 'a',
|
|
|
|
.accept_value = [&](auto) {
|
|
|
|
binary_mode = BinaryFileMode::Text;
|
|
|
|
return true;
|
|
|
|
},
|
|
|
|
});
|
|
|
|
args_parser.add_option(Core::ArgsParser::Option {
|
|
|
|
.requires_argument = false,
|
|
|
|
.help_string = "Ignore binary files (same as --binary-mode skip)",
|
|
|
|
.long_name = nullptr,
|
|
|
|
.short_name = 'I',
|
|
|
|
.accept_value = [&](auto) {
|
|
|
|
binary_mode = BinaryFileMode::Skip;
|
|
|
|
return true;
|
|
|
|
},
|
|
|
|
});
|
2020-11-27 20:44:25 +03:30
|
|
|
args_parser.add_positional_argument(files, "File(s) to process", "file", Core::ArgsParser::Required::No);
|
|
|
|
args_parser.parse(argc, argv);
|
|
|
|
|
|
|
|
if (!use_ere)
|
|
|
|
return 0;
|
|
|
|
|
|
|
|
// mock grep behaviour: if -e is omitted, use first positional argument as pattern
|
|
|
|
if (pattern == nullptr && files.size())
|
|
|
|
pattern = files.take_first();
|
|
|
|
|
2020-11-28 18:10:56 +03:30
|
|
|
PosixOptions options {};
|
|
|
|
if (case_insensitive)
|
|
|
|
options |= PosixFlags::Insensitive;
|
|
|
|
|
|
|
|
Regex<PosixExtended> re(pattern, options);
|
2020-11-27 20:44:25 +03:30
|
|
|
if (re.parser_result.error != Error::NoError) {
|
|
|
|
return 1;
|
|
|
|
}
|
|
|
|
|
2020-11-28 18:10:56 +03:30
|
|
|
auto matches = [&](StringView str, StringView filename = "", bool print_filename = false, bool is_binary = false) {
|
2020-11-27 20:44:25 +03:30
|
|
|
size_t last_printed_char_pos { 0 };
|
2020-11-28 18:10:56 +03:30
|
|
|
if (is_binary && binary_mode == BinaryFileMode::Skip)
|
|
|
|
return false;
|
|
|
|
|
2020-11-27 20:44:25 +03:30
|
|
|
auto result = re.match(str, PosixFlags::Global);
|
2021-01-23 22:11:19 -07:00
|
|
|
if (result.success ^ invert_match) {
|
2020-11-28 18:10:56 +03:30
|
|
|
if (is_binary && binary_mode == BinaryFileMode::Binary) {
|
|
|
|
outln("binary file \x1B[34m{}\x1B[0m matches", filename);
|
|
|
|
} else {
|
2021-01-23 22:11:19 -07:00
|
|
|
if ((result.matches.size() || invert_match) && print_filename) {
|
2020-11-28 18:10:56 +03:30
|
|
|
out("\x1B[34m{}:\x1B[0m", filename);
|
|
|
|
}
|
|
|
|
|
|
|
|
for (auto& match : result.matches) {
|
|
|
|
|
|
|
|
out("{}\x1B[32m{}\x1B[0m",
|
|
|
|
StringView(&str[last_printed_char_pos], match.global_offset - last_printed_char_pos),
|
|
|
|
match.view.to_string());
|
|
|
|
last_printed_char_pos = match.global_offset + match.view.length();
|
|
|
|
}
|
2020-12-13 11:44:53 +01:00
|
|
|
outln("{}", StringView(&str[last_printed_char_pos], str.length() - last_printed_char_pos));
|
2020-11-27 20:44:25 +03:30
|
|
|
}
|
|
|
|
|
2020-11-28 18:10:56 +03:30
|
|
|
return true;
|
2020-11-27 20:44:25 +03:30
|
|
|
}
|
|
|
|
|
|
|
|
return false;
|
|
|
|
};
|
2020-11-28 18:10:56 +03:30
|
|
|
|
|
|
|
auto handle_file = [&matches, binary_mode](StringView filename, bool print_filename) -> bool {
|
2020-11-27 20:44:25 +03:30
|
|
|
auto file = Core::File::construct(filename);
|
2021-05-12 13:56:43 +04:30
|
|
|
if (!file->open(Core::OpenMode::ReadOnly)) {
|
2020-11-28 18:10:56 +03:30
|
|
|
warnln("Failed to open {}: {}", filename, file->error_string());
|
2020-11-27 20:44:25 +03:30
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
|
|
|
while (file->can_read_line()) {
|
2020-12-13 11:44:53 +01:00
|
|
|
auto line = file->read_line();
|
|
|
|
auto is_binary = memchr(line.characters(), 0, line.length()) != nullptr;
|
2020-11-28 18:10:56 +03:30
|
|
|
|
2020-12-13 11:44:53 +01:00
|
|
|
if (matches(line, filename, print_filename, is_binary) && is_binary && binary_mode == BinaryFileMode::Binary)
|
2020-11-28 18:10:56 +03:30
|
|
|
return true;
|
2020-11-27 20:44:25 +03:30
|
|
|
}
|
|
|
|
return true;
|
|
|
|
};
|
|
|
|
|
|
|
|
auto add_directory = [&handle_file](String base, Optional<String> recursive, auto handle_directory) -> void {
|
|
|
|
Core::DirIterator it(recursive.value_or(base), Core::DirIterator::Flags::SkipDots);
|
|
|
|
while (it.has_next()) {
|
|
|
|
auto path = it.next_full_path();
|
|
|
|
if (!Core::File::is_directory(path)) {
|
2020-11-28 18:10:56 +03:30
|
|
|
auto key = path.substring_view(base.length() + 1, path.length() - base.length() - 1);
|
|
|
|
handle_file(key, true);
|
2020-11-27 20:44:25 +03:30
|
|
|
} else {
|
|
|
|
handle_directory(base, path, handle_directory);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
};
|
|
|
|
|
2021-02-11 21:55:58 +03:30
|
|
|
bool did_match_something = false;
|
2020-11-27 20:44:25 +03:30
|
|
|
if (!files.size() && !recursive) {
|
2021-01-23 21:58:14 -07:00
|
|
|
char* line = nullptr;
|
|
|
|
size_t line_len = 0;
|
|
|
|
ssize_t nread = 0;
|
|
|
|
ScopeGuard free_line = [line] { free(line); };
|
|
|
|
while ((nread = getline(&line, &line_len, stdin)) != -1) {
|
2021-02-23 20:42:32 +01:00
|
|
|
VERIFY(nread > 0);
|
2021-06-14 23:36:53 +10:00
|
|
|
if (line[nread - 1] == '\n')
|
|
|
|
--nread;
|
2021-04-29 16:07:17 +01:00
|
|
|
StringView line_view(line, nread);
|
2021-01-23 21:58:14 -07:00
|
|
|
bool is_binary = line_view.contains(0);
|
2020-11-27 20:44:25 +03:30
|
|
|
|
2020-11-28 18:10:56 +03:30
|
|
|
if (is_binary && binary_mode == BinaryFileMode::Skip)
|
|
|
|
return 1;
|
2020-11-27 20:44:25 +03:30
|
|
|
|
2021-02-11 21:55:58 +03:30
|
|
|
auto matched = matches(line_view, "stdin", false, is_binary);
|
|
|
|
did_match_something = did_match_something || matched;
|
|
|
|
if (matched && is_binary && binary_mode == BinaryFileMode::Binary)
|
2020-11-27 20:44:25 +03:30
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
if (recursive) {
|
|
|
|
add_directory(".", {}, add_directory);
|
|
|
|
|
|
|
|
} else {
|
|
|
|
bool print_filename { files.size() > 1 };
|
|
|
|
for (auto& filename : files) {
|
|
|
|
if (!handle_file(filename, print_filename))
|
|
|
|
return 1;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2021-02-11 21:55:58 +03:30
|
|
|
return did_match_something ? 0 : 1;
|
2020-11-27 20:44:25 +03:30
|
|
|
}
|