2022-12-17 01:06:26 -08:00
|
|
|
/*
|
|
|
|
* Copyright (c) 2022, Eli Youngs <eli.m.youngs@gmail.com>
|
|
|
|
*
|
|
|
|
* SPDX-License-Identifier: BSD-2-Clause
|
|
|
|
*/
|
|
|
|
|
2022-12-18 22:29:10 -08:00
|
|
|
#include <AK/CharacterTypes.h>
|
2022-12-17 01:06:26 -08:00
|
|
|
#include <AK/GenericLexer.h>
|
|
|
|
#include <AK/Vector.h>
|
|
|
|
#include <LibCore/ArgsParser.h>
|
2023-02-09 03:02:46 +01:00
|
|
|
#include <LibCore/File.h>
|
2022-12-17 01:06:26 -08:00
|
|
|
#include <LibCore/System.h>
|
|
|
|
#include <LibMain/Main.h>
|
|
|
|
#include <LibRegex/RegexMatcher.h>
|
|
|
|
#include <LibRegex/RegexOptions.h>
|
|
|
|
|
|
|
|
struct SubstitutionCommand {
|
|
|
|
Regex<PosixExtended> regex;
|
|
|
|
StringView replacement;
|
|
|
|
PosixOptions options;
|
2022-12-18 22:29:10 -08:00
|
|
|
Optional<StringView> output_filepath;
|
2022-12-17 01:06:26 -08:00
|
|
|
};
|
|
|
|
|
2022-12-18 22:29:10 -08:00
|
|
|
// Splits the text that follows the final delimiter of a substitution command
// into its individual flags:
//   - a run of ASCII digits becomes one flag,
//   - a 'w' swallows everything up to the end of the input (the 'w' itself included),
//   - any other character becomes a flag of its own.
static Vector<StringView> split_flags(StringView const& input)
{
    Vector<StringView> flags;
    GenericLexer lexer(input);

    while (!lexer.is_eof()) {
        if (lexer.next_is(is_ascii_digit)) {
            flags.append(lexer.consume_while(is_ascii_digit));
            continue;
        }

        if (lexer.peek() == 'w') {
            // Nothing is left to lex after this, so the loop ends on the next check.
            flags.append(lexer.consume_all());
            continue;
        }

        flags.append(lexer.consume(1));
    }

    return flags;
}
|
|
|
|
|
2022-12-17 01:06:26 -08:00
|
|
|
// Parses a substitution command of the form "s<d>pattern<d>replacement<d>[flags]",
// where <d> is a single delimiter character other than a newline or a backslash.
//
// Flags handled here:
//   g        un-sets SingleMatch so that several matches per line are allowed
//   i / I    enables case-insensitive matching
//   w<path>  stores <path> (whitespace-trimmed) as the command's output_filepath
// Any other flag only produces a warning.
//
// Returns the parsed command, or an error when the command is incomplete, uses
// a forbidden delimiter, has an empty pattern, lacks the closing delimiter,
// gives 'w' without a path, or has a pattern that fails to compile.
static ErrorOr<SubstitutionCommand> parse_command(StringView command)
{
    auto generic_error_message = "Incomplete substitution command"sv;

    auto lexer = GenericLexer(command);

    // Whatever precedes the first 's' is treated as an address.
    auto address = lexer.consume_until('s');

    if (!lexer.consume_specific('s'))
        return Error::from_string_view(generic_error_message);

    // Only warn once an 's' command has actually been found; otherwise the whole
    // (invalid) input would be reported as an ignored address.
    if (!address.is_empty())
        warnln("sed: Addresses are currently ignored");

    if (lexer.is_eof())
        return Error::from_string_view(generic_error_message);

    auto delimiter = lexer.consume();
    if (delimiter == '\n' || delimiter == '\\')
        return Error::from_string_literal("\\n and \\ cannot be used as delimiters.");

    auto pattern = lexer.consume_until(delimiter);
    if (pattern.is_empty())
        return Error::from_string_literal("Substitution patterns cannot be empty.");

    if (!lexer.consume_specific(delimiter))
        return Error::from_string_view(generic_error_message);

    auto replacement = lexer.consume_until(delimiter);

    // According to Posix, "s/x/y" is an invalid substitution command.
    // It must have a closing delimiter: "s/x/y/"
    if (!lexer.consume_specific(delimiter))
        return Error::from_string_literal("The substitution command was not properly terminated.");

    PosixOptions options = PosixOptions(PosixFlags::Global | PosixFlags::SingleMatch);
    Optional<StringView> output_filepath;

    auto flags = split_flags(lexer.consume_all());
    for (auto const& flag : flags) {
        if (flag.starts_with('w')) {
            auto flag_filepath = flag.substring_view(1).trim_whitespace();
            if (flag_filepath.is_empty())
                return Error::from_string_literal("No filepath was provided for the 'w' flag.");
            output_filepath = flag_filepath;
        } else if (flag == "g"sv) {
            // Allow multiple matches per line by un-setting the SingleMatch flag
            options &= ~PosixFlags::SingleMatch;
        } else if (flag == "i"sv || flag == "I"sv) {
            options |= PosixFlags::Insensitive;
        } else {
            warnln("sed: Unsupported flag: {}", flag);
        }
    }

    // Compile the pattern up front and reject it if the parser reported a problem,
    // instead of handing back a command whose regex was never successfully parsed.
    Regex<PosixExtended> compiled_pattern { pattern };
    if (compiled_pattern.parser_result.error != regex::Error::NoError)
        return Error::from_string_literal("The substitution pattern is not a valid regular expression.");

    return SubstitutionCommand { move(compiled_pattern), replacement, options, output_filepath };
}
|
|
|
|
|
|
|
|
// Entry point: parses the substitution command given as the first positional
// argument, applies it to every line of each listed file, and prints the
// resulting lines. If the command carries an output path ('w' flag), every
// resulting line is additionally written to that file.
ErrorOr<int> serenity_main(Main::Arguments args)
{
    TRY(Core::System::pledge("stdio cpath rpath wpath"));

    StringView command_input;
    Vector<StringView> filepaths;

    Core::ArgsParser args_parser;
    args_parser.add_positional_argument(command_input, "Command", "command_input", Core::ArgsParser::Required::Yes);
    args_parser.add_positional_argument(filepaths, "File", "file", Core::ArgsParser::Required::No);
    args_parser.parse(args);

    auto command = TRY(parse_command(command_input));

    // Open the 'w' target (if any) once, before any input is processed.
    Optional<NonnullOwnPtr<Core::File>> maybe_output_file;
    if (command.output_filepath.has_value()) {
        auto output_path = command.output_filepath.release_value();
        maybe_output_file = TRY(Core::File::open_file_or_standard_stream(output_path, Core::File::OpenMode::Write));
    }

    // Without file operands, fall back to "-", which is handed to
    // open_file_or_standard_stream() like any other path below.
    if (filepaths.is_empty())
        filepaths = { "-"sv };

    // Scratch space for one line at a time; shared by all input files.
    Array<u8, PAGE_SIZE> line_buffer {};

    for (auto const& filepath : filepaths) {
        auto raw_input = TRY(Core::File::open_file_or_standard_stream(filepath, Core::File::OpenMode::Read));
        auto input = TRY(Core::BufferedFile::create(move(raw_input)));

        while (!input->is_eof()) {
            auto line = TRY(input->read_line(line_buffer));

            // An empty read that coincides with end-of-file is the file's trailing
            // newline rather than a blank line, so nothing is substituted or printed
            // for it. Blank lines in the middle of a file are still processed.
            if (line.is_empty() && input->is_eof())
                break;

            auto substituted = command.regex.replace(line, command.replacement, command.options);
            outln(substituted);

            if (maybe_output_file.has_value()) {
                auto const& sink = maybe_output_file.value();
                TRY(sink->write_until_depleted(substituted.bytes()));
                TRY(sink->write_until_depleted("\n"sv.bytes()));
            }
        }
    }

    return 0;
}
|