2020-01-18 09:38:21 +01:00
|
|
|
/*
 * Copyright (c) 2018-2020, Andreas Kling <kling@serenityos.org>
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions are met:
 *
 * 1. Redistributions of source code must retain the above copyright notice, this
 *    list of conditions and the following disclaimer.
 *
 * 2. Redistributions in binary form must reproduce the above copyright notice,
 *    this list of conditions and the following disclaimer in the documentation
 *    and/or other materials provided with the distribution.
 *
 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
 * DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
 * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
 * CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
 * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 */
|
|
|
|
|
2020-08-29 15:38:36 +04:30
|
|
|
#include <AK/GenericLexer.h>
|
|
|
|
#include <AK/LexicalPath.h>
|
2020-05-03 09:01:06 +04:30
|
|
|
#include <AK/NumberFormat.h>
|
2020-01-01 18:53:34 +01:00
|
|
|
#include <AK/SharedBuffer.h>
|
2020-05-03 09:01:06 +04:30
|
|
|
#include <AK/URL.h>
|
2020-08-05 20:53:16 +02:00
|
|
|
#include <LibCore/ArgsParser.h>
|
2020-02-06 15:04:03 +01:00
|
|
|
#include <LibCore/EventLoop.h>
|
2020-08-29 15:38:36 +04:30
|
|
|
#include <LibCore/File.h>
|
2019-11-23 21:48:39 +01:00
|
|
|
#include <LibProtocol/Client.h>
|
2019-11-24 13:20:44 +01:00
|
|
|
#include <LibProtocol/Download.h>
|
2020-09-27 12:44:03 +02:00
|
|
|
#include <ctype.h>
|
2019-11-23 21:48:39 +01:00
|
|
|
#include <stdio.h>
|
|
|
|
|
2020-08-29 15:38:36 +04:30
|
|
|
// FIXME: Move this somewhere else when it's needed (e.g. in the Browser)
|
|
|
|
class ContentDispositionParser {
|
|
|
|
public:
|
|
|
|
ContentDispositionParser(const StringView& value)
|
|
|
|
{
|
|
|
|
GenericLexer lexer(value);
|
|
|
|
|
2020-09-27 12:44:03 +02:00
|
|
|
lexer.ignore_while(isspace);
|
2020-08-29 15:38:36 +04:30
|
|
|
|
|
|
|
if (lexer.consume_specific("inline")) {
|
|
|
|
m_kind = Kind::Inline;
|
|
|
|
if (!lexer.is_eof())
|
|
|
|
m_might_be_wrong = true;
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (lexer.consume_specific("attachment")) {
|
|
|
|
m_kind = Kind::Attachment;
|
|
|
|
if (lexer.consume_specific(";")) {
|
2020-09-27 12:44:03 +02:00
|
|
|
lexer.ignore_while(isspace);
|
2020-08-29 15:38:36 +04:30
|
|
|
if (lexer.consume_specific("filename=")) {
|
2020-08-31 19:24:46 +04:30
|
|
|
// RFC 2183: "A short (length <= 78 characters)
|
|
|
|
// parameter value containing only non-`tspecials' characters SHOULD be
|
|
|
|
// represented as a single `token'."
|
|
|
|
// Some people seem to take this as generic advice of "if it doesn't have special characters,
|
|
|
|
// it's safe to specify as a single token"
|
|
|
|
// So let's just be as lenient as possible.
|
|
|
|
if (lexer.next_is('"'))
|
|
|
|
m_filename = lexer.consume_quoted_string();
|
|
|
|
else
|
|
|
|
m_filename = lexer.consume_until(is_any_of("()<>@,;:\\\"/[]?= "));
|
2020-08-29 15:38:36 +04:30
|
|
|
} else {
|
|
|
|
m_might_be_wrong = true;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (lexer.consume_specific("form-data")) {
|
|
|
|
m_kind = Kind::FormData;
|
|
|
|
while (lexer.consume_specific(";")) {
|
2020-09-27 12:44:03 +02:00
|
|
|
lexer.ignore_while(isspace);
|
2020-08-29 15:38:36 +04:30
|
|
|
if (lexer.consume_specific("name=")) {
|
|
|
|
m_name = lexer.consume_quoted_string();
|
|
|
|
} else if (lexer.consume_specific("filename=")) {
|
2020-08-31 19:24:46 +04:30
|
|
|
if (lexer.next_is('"'))
|
|
|
|
m_filename = lexer.consume_quoted_string();
|
|
|
|
else
|
|
|
|
m_filename = lexer.consume_until(is_any_of("()<>@,;:\\\"/[]?= "));
|
2020-08-29 15:38:36 +04:30
|
|
|
} else {
|
|
|
|
m_might_be_wrong = true;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
// FIXME: Support 'filename*'
|
|
|
|
m_might_be_wrong = true;
|
|
|
|
}
|
|
|
|
|
|
|
|
enum class Kind {
|
|
|
|
Inline,
|
|
|
|
Attachment,
|
|
|
|
FormData,
|
|
|
|
};
|
|
|
|
|
|
|
|
const StringView& filename() const { return m_filename; }
|
|
|
|
const StringView& name() const { return m_name; }
|
|
|
|
Kind kind() const { return m_kind; }
|
|
|
|
bool might_be_wrong() const { return m_might_be_wrong; }
|
|
|
|
|
|
|
|
private:
|
|
|
|
StringView m_filename;
|
|
|
|
StringView m_name;
|
|
|
|
Kind m_kind { Kind::Inline };
|
|
|
|
bool m_might_be_wrong { false };
|
|
|
|
};
|
|
|
|
|
2020-12-19 13:09:02 +01:00
|
|
|
// Writes the whole of `payload` to stdout, retrying after short writes.
// On a stream EOF or error condition a diagnostic is printed to stderr and the
// remaining bytes are dropped; the caller is not informed of the failure.
static void do_write(ReadonlyBytes payload)
{
    auto* cursor = payload.data();

    for (size_t bytes_left = payload.size(); bytes_left != 0;) {
        const size_t chunk = fwrite(cursor, sizeof(char), bytes_left, stdout);

        if (chunk == 0) {
            // No progress was made: find out why before trying again.
            if (feof(stdout)) {
                fprintf(stderr, "pro: unexpected eof while writing\n");
                return;
            }
            if (ferror(stdout)) {
                fprintf(stderr, "pro: error while writing\n");
                return;
            }
            continue;
        }

        // Skip past what has been written and go around for the rest.
        cursor += chunk;
        bytes_left -= chunk;
    }
}
|
|
|
|
|
2019-11-23 21:48:39 +01:00
|
|
|
int main(int argc, char** argv)
|
|
|
|
{
|
2020-08-05 20:53:16 +02:00
|
|
|
const char* url_str = nullptr;
|
2020-08-29 15:38:36 +04:30
|
|
|
bool save_at_provided_name = false;
|
2020-08-05 20:53:16 +02:00
|
|
|
|
|
|
|
Core::ArgsParser args_parser;
|
2020-12-06 14:18:25 +01:00
|
|
|
args_parser.set_general_help(
|
|
|
|
"Download a file from an arbitrary URL. This command uses ProtocolServer, "
|
|
|
|
"and thus supports at least http, https, and gemini.");
|
2020-08-29 15:38:36 +04:30
|
|
|
args_parser.add_option(save_at_provided_name, "Write to a file named as the remote file", nullptr, 'O');
|
2020-08-05 20:53:16 +02:00
|
|
|
args_parser.add_positional_argument(url_str, "URL to download from", "url");
|
|
|
|
args_parser.parse(argc, argv);
|
2019-11-23 22:16:23 +01:00
|
|
|
|
2020-08-05 20:53:16 +02:00
|
|
|
URL url(url_str);
|
2019-11-23 22:16:23 +01:00
|
|
|
if (!url.is_valid()) {
|
2020-08-05 20:53:16 +02:00
|
|
|
fprintf(stderr, "'%s' is not a valid URL\n", url_str);
|
2019-11-23 22:16:23 +01:00
|
|
|
return 1;
|
|
|
|
}
|
|
|
|
|
2020-02-02 12:34:39 +01:00
|
|
|
Core::EventLoop loop;
|
2020-02-05 18:21:30 +01:00
|
|
|
auto protocol_client = Protocol::Client::construct();
|
2019-11-23 21:48:39 +01:00
|
|
|
|
2020-09-28 11:55:26 +02:00
|
|
|
auto download = protocol_client->start_download("GET", url.to_string());
|
2020-04-04 20:00:07 +02:00
|
|
|
if (!download) {
|
2020-08-05 20:53:16 +02:00
|
|
|
fprintf(stderr, "Failed to start download for '%s'\n", url_str);
|
2020-04-04 20:00:07 +02:00
|
|
|
return 1;
|
|
|
|
}
|
2020-08-29 15:38:36 +04:30
|
|
|
|
2020-05-03 09:01:06 +04:30
|
|
|
u32 previous_downloaded_size { 0 };
|
|
|
|
timeval prev_time, current_time, time_diff;
|
|
|
|
gettimeofday(&prev_time, nullptr);
|
|
|
|
|
|
|
|
download->on_progress = [&](Optional<u32> maybe_total_size, u32 downloaded_size) {
|
|
|
|
fprintf(stderr, "\r\033[2K");
|
2020-05-30 22:17:46 +02:00
|
|
|
if (maybe_total_size.has_value()) {
|
|
|
|
fprintf(stderr, "\033]9;%d;%d;\033\\", downloaded_size, maybe_total_size.value());
|
2020-05-03 09:01:06 +04:30
|
|
|
fprintf(stderr, "Download progress: %s / %s", human_readable_size(downloaded_size).characters(), human_readable_size(maybe_total_size.value()).characters());
|
2020-05-30 22:17:46 +02:00
|
|
|
} else {
|
2020-05-03 09:01:06 +04:30
|
|
|
fprintf(stderr, "Download progress: %s / ???", human_readable_size(downloaded_size).characters());
|
2020-05-30 22:17:46 +02:00
|
|
|
}
|
2020-05-03 09:01:06 +04:30
|
|
|
|
|
|
|
gettimeofday(¤t_time, nullptr);
|
|
|
|
timersub(¤t_time, &prev_time, &time_diff);
|
|
|
|
|
|
|
|
auto time_diff_ms = time_diff.tv_sec * 1000 + time_diff.tv_usec / 1000;
|
|
|
|
auto size_diff = downloaded_size - previous_downloaded_size;
|
|
|
|
|
|
|
|
fprintf(stderr, " at %s/s", human_readable_size(((float)size_diff / (float)time_diff_ms) * 1000).characters());
|
|
|
|
|
|
|
|
previous_downloaded_size = downloaded_size;
|
|
|
|
prev_time = current_time;
|
2019-11-23 21:48:39 +01:00
|
|
|
};
|
2020-12-19 13:09:02 +01:00
|
|
|
download->on_finish = [&](bool success, auto payload, auto, auto& response_headers, auto) {
|
2020-05-30 22:17:46 +02:00
|
|
|
fprintf(stderr, "\033]9;-1;\033\\");
|
2020-05-03 09:01:06 +04:30
|
|
|
fprintf(stderr, "\n");
|
2020-08-29 15:38:36 +04:30
|
|
|
if (success && save_at_provided_name) {
|
|
|
|
String output_name;
|
|
|
|
if (auto content_disposition = response_headers.get("Content-Disposition"); content_disposition.has_value()) {
|
|
|
|
auto& value = content_disposition.value();
|
|
|
|
ContentDispositionParser parser(value);
|
|
|
|
output_name = parser.filename();
|
|
|
|
}
|
|
|
|
|
|
|
|
if (output_name.is_empty())
|
|
|
|
output_name = url.path();
|
|
|
|
|
|
|
|
LexicalPath path { output_name };
|
|
|
|
output_name = path.basename();
|
|
|
|
|
|
|
|
// The URL didn't have a name component, e.g. 'serenityos.org'
|
|
|
|
if (output_name.is_empty() || output_name == "/") {
|
|
|
|
int i = -1;
|
|
|
|
do {
|
|
|
|
output_name = url.host();
|
|
|
|
if (i > -1)
|
|
|
|
output_name = String::format("%s.%d", output_name.characters(), i);
|
|
|
|
++i;
|
|
|
|
} while (Core::File::exists(output_name));
|
|
|
|
}
|
|
|
|
|
|
|
|
if (freopen(output_name.characters(), "w", stdout) == nullptr) {
|
|
|
|
perror("freopen");
|
|
|
|
success = false; // oops!
|
|
|
|
loop.quit(1);
|
|
|
|
}
|
|
|
|
}
|
2019-11-24 13:20:44 +01:00
|
|
|
if (success)
|
2020-08-29 15:38:36 +04:30
|
|
|
do_write(payload);
|
2019-11-24 13:20:44 +01:00
|
|
|
else
|
|
|
|
fprintf(stderr, "Download failed :(\n");
|
|
|
|
loop.quit(0);
|
2019-11-23 21:48:39 +01:00
|
|
|
};
|
2019-11-24 13:20:44 +01:00
|
|
|
dbgprintf("started download with id %d\n", download->id());
|
2019-11-23 21:48:39 +01:00
|
|
|
|
|
|
|
return loop.exec();
|
|
|
|
}
|