serenity/Userland/Utilities/tr.cpp
Timothy Flynn 02e3633b7f AK: Move FormatParser definition from header to implementation file
This is primarily to be able to remove the GenericLexer include out of
Format.h as well. A subsequent commit will add AK::Result to
GenericLexer, which will cause naming conflicts with other structures
named Result. This can be avoided (for now) by preventing nearly every
file in the system from implicitly including GenericLexer.

Other changes in this commit are to add the GenericLexer include to
files where it is missing.
2021-08-19 23:49:25 +02:00

144 lines
4.8 KiB
C++

/*
* Copyright (c) 2018-2020, Andreas Kling <kling@serenityos.org>
*
* SPDX-License-Identifier: BSD-2-Clause
*/
#include <AK/GenericLexer.h>
#include <AK/Optional.h>
#include <AK/String.h>
#include <LibCore/ArgsParser.h>
#include <ctype.h>
#include <stdio.h>
static bool is_octal(int c)
{
return c == '0' || c == '1' || c == '2' || c == '3' || c == '4' || c == '5' || c == '6' || c == '7';
}
static void generate_character_class(Function<int(int)> oracle, StringBuilder& out)
{
for (int i = 0; i < 128; i++) {
if (oracle(i))
out.append(static_cast<char>(i));
}
}
static String build_set(StringView specification)
{
StringBuilder out;
GenericLexer lexer(specification);
while (!lexer.is_eof()) {
if (lexer.consume_specific("[:alnum:]"sv))
generate_character_class(isalnum, out);
else if (lexer.consume_specific("[:blank:]"sv))
generate_character_class(isblank, out);
else if (lexer.consume_specific("[:digit:]"sv))
generate_character_class(isdigit, out);
else if (lexer.consume_specific("[:lower:]"sv))
generate_character_class(islower, out);
else if (lexer.consume_specific("[:punct:]"sv))
generate_character_class(ispunct, out);
else if (lexer.consume_specific("[:upper:]"sv))
generate_character_class(isupper, out);
else if (lexer.consume_specific("[:alpha:]"sv))
generate_character_class(isalpha, out);
else if (lexer.consume_specific("[:cntrl:]"sv))
generate_character_class(iscntrl, out);
else if (lexer.consume_specific("[:graph:]"sv))
generate_character_class(isgraph, out);
else if (lexer.consume_specific("[:print:]"sv))
generate_character_class(isprint, out);
else if (lexer.consume_specific("[:space:]"sv))
generate_character_class(isspace, out);
else if (lexer.consume_specific("[:xdigit:]"sv))
generate_character_class(isxdigit, out);
else if (lexer.consume_specific("\\\\"sv))
out.append('\\');
else if (lexer.consume_specific("\\a"sv))
out.append('\a');
else if (lexer.consume_specific("\\b"sv))
out.append('\b');
else if (lexer.consume_specific("\\f"sv))
out.append('\f');
else if (lexer.consume_specific("\\n"sv))
out.append('\n');
else if (lexer.consume_specific("\\r"sv))
out.append('\r');
else if (lexer.consume_specific("\\t"sv))
out.append('\t');
else if (lexer.consume_specific("\\v"sv))
out.append('\v');
else if (lexer.next_is('\\') && is_octal(lexer.peek(1))) {
lexer.consume_specific('\\');
int max_left_over = 3;
auto octal_digits = lexer.consume_while([&](char i) -> bool {
return is_octal(i) && max_left_over--;
});
int value = 0;
for (char ch : octal_digits)
value = value * 8 + (ch - '0');
out.append(static_cast<char>(value));
} else
out.append(lexer.consume(1));
}
return out.to_string();
}
int main(int argc, char** argv)
{
bool complement_flag = false;
bool delete_flag = false;
const char* from_chars = nullptr;
const char* to_chars = nullptr;
Core::ArgsParser args_parser;
args_parser.add_option(complement_flag, "Take the complement of the first set", "complement", 'c');
args_parser.add_option(delete_flag, "Delete characters instead of replacing", "delete", 'd');
args_parser.add_positional_argument(from_chars, "Set of characters to translate from", "from");
args_parser.add_positional_argument(to_chars, "Set of characters to translate to", "to", Core::ArgsParser::Required::No);
args_parser.parse(argc, argv);
if (!to_chars && !delete_flag) {
args_parser.print_usage(stderr, argv[0]);
return 1;
}
String from_str = build_set(from_chars);
if (complement_flag) {
StringBuilder complement_set;
for (int ch = 0; ch < 256; ch++) {
if (!from_str.contains(static_cast<char>(ch)))
complement_set.append(static_cast<char>(ch));
}
from_str = complement_set.to_string();
}
if (delete_flag) {
for (;;) {
char ch = fgetc(stdin);
if (feof(stdin))
break;
if (!from_str.contains(ch))
putchar(ch);
}
} else {
auto to_str = build_set(to_chars);
for (;;) {
char ch = fgetc(stdin);
if (feof(stdin))
break;
auto match = from_str.find_last(ch);
if (match.has_value())
putchar(to_str[min(match.value(), to_str.length() - 1)]);
else
putchar(ch);
}
}
return 0;
}