123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296 |
- /*
- * Copyright (c) 2018-2020, Andreas Kling <kling@serenityos.org>
- * All rights reserved.
- *
- * Redistribution and use in source and binary forms, with or without
- * modification, are permitted provided that the following conditions are met:
- *
- * 1. Redistributions of source code must retain the above copyright notice, this
- * list of conditions and the following disclaimer.
- *
- * 2. Redistributions in binary form must reproduce the above copyright notice,
- * this list of conditions and the following disclaimer in the documentation
- * and/or other materials provided with the distribution.
- *
- * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
- * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
- * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
- * DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE
- * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
- * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
- * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
- * CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
- * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
- * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
- */
- #include <AK/FileStream.h>
- #include <AK/GenericLexer.h>
- #include <AK/LexicalPath.h>
- #include <AK/NumberFormat.h>
- #include <AK/URL.h>
- #include <LibCore/ArgsParser.h>
- #include <LibCore/EventLoop.h>
- #include <LibCore/File.h>
- #include <LibProtocol/Client.h>
- #include <LibProtocol/Download.h>
- #include <ctype.h>
- #include <stdio.h>
- // FIXME: Move this somewhere else when it's needed (e.g. in the Browser)
- class ContentDispositionParser {
- public:
- ContentDispositionParser(const StringView& value)
- {
- GenericLexer lexer(value);
- lexer.ignore_while(isspace);
- if (lexer.consume_specific("inline")) {
- m_kind = Kind::Inline;
- if (!lexer.is_eof())
- m_might_be_wrong = true;
- return;
- }
- if (lexer.consume_specific("attachment")) {
- m_kind = Kind::Attachment;
- if (lexer.consume_specific(";")) {
- lexer.ignore_while(isspace);
- if (lexer.consume_specific("filename=")) {
- // RFC 2183: "A short (length <= 78 characters)
- // parameter value containing only non-`tspecials' characters SHOULD be
- // represented as a single `token'."
- // Some people seem to take this as generic advice of "if it doesn't have special characters,
- // it's safe to specify as a single token"
- // So let's just be as lenient as possible.
- if (lexer.next_is('"'))
- m_filename = lexer.consume_quoted_string();
- else
- m_filename = lexer.consume_until(is_any_of("()<>@,;:\\\"/[]?= "));
- } else {
- m_might_be_wrong = true;
- }
- }
- return;
- }
- if (lexer.consume_specific("form-data")) {
- m_kind = Kind::FormData;
- while (lexer.consume_specific(";")) {
- lexer.ignore_while(isspace);
- if (lexer.consume_specific("name=")) {
- m_name = lexer.consume_quoted_string();
- } else if (lexer.consume_specific("filename=")) {
- if (lexer.next_is('"'))
- m_filename = lexer.consume_quoted_string();
- else
- m_filename = lexer.consume_until(is_any_of("()<>@,;:\\\"/[]?= "));
- } else {
- m_might_be_wrong = true;
- }
- }
- return;
- }
- // FIXME: Support 'filename*'
- m_might_be_wrong = true;
- }
- enum class Kind {
- Inline,
- Attachment,
- FormData,
- };
- const StringView& filename() const { return m_filename; }
- const StringView& name() const { return m_name; }
- Kind kind() const { return m_kind; }
- bool might_be_wrong() const { return m_might_be_wrong; }
- private:
- StringView m_filename;
- StringView m_name;
- Kind m_kind { Kind::Inline };
- bool m_might_be_wrong { false };
- };
- template<typename ConditionT>
- class ConditionalOutputFileStream final : public OutputFileStream {
- public:
- template<typename... Args>
- ConditionalOutputFileStream(ConditionT&& condition, Args... args)
- : OutputFileStream(args...)
- , m_condition(condition)
- {
- }
- ~ConditionalOutputFileStream()
- {
- if (!m_condition())
- return;
- if (!m_buffer.is_empty()) {
- OutputFileStream::write(m_buffer);
- m_buffer.clear();
- }
- }
- private:
- size_t write(ReadonlyBytes bytes) override
- {
- if (!m_condition()) {
- write_to_buffer:;
- m_buffer.append(bytes.data(), bytes.size());
- return bytes.size();
- }
- if (!m_buffer.is_empty()) {
- auto size = OutputFileStream::write(m_buffer);
- m_buffer = m_buffer.slice(size, m_buffer.size() - size);
- }
- if (!m_buffer.is_empty())
- goto write_to_buffer;
- return OutputFileStream::write(bytes);
- }
- ConditionT m_condition;
- ByteBuffer m_buffer;
- };
- int main(int argc, char** argv)
- {
- const char* url_str = nullptr;
- bool save_at_provided_name = false;
- const char* data = nullptr;
- String method = "GET";
- HashMap<String, String, CaseInsensitiveStringTraits> request_headers;
- Core::ArgsParser args_parser;
- args_parser.set_general_help(
- "Download a file from an arbitrary URL. This command uses ProtocolServer, "
- "and thus supports at least http, https, and gemini.");
- args_parser.add_option(save_at_provided_name, "Write to a file named as the remote file", nullptr, 'O');
- args_parser.add_option(data, "(HTTP only) Send the provided data via an HTTP POST request", "data", 'd', "data");
- args_parser.add_option(Core::ArgsParser::Option {
- .requires_argument = true,
- .help_string = "Add a header entry to the request",
- .long_name = "header",
- .short_name = 'H',
- .value_name = "header-value",
- .accept_value = [&](auto* s) {
- StringView header { s };
- auto split = header.find_first_of(':');
- if (!split.has_value())
- return false;
- request_headers.set(header.substring_view(0, split.value()), header.substring_view(split.value() + 1));
- return true;
- } });
- args_parser.add_positional_argument(url_str, "URL to download from", "url");
- args_parser.parse(argc, argv);
- if (data) {
- method = "POST";
- // FIXME: Content-Type?
- }
- URL url(url_str);
- if (!url.is_valid()) {
- fprintf(stderr, "'%s' is not a valid URL\n", url_str);
- return 1;
- }
- Core::EventLoop loop;
- auto protocol_client = Protocol::Client::construct();
- auto download = protocol_client->start_download(method, url.to_string(), request_headers, data ? StringView { data }.bytes() : ReadonlyBytes {});
- if (!download) {
- fprintf(stderr, "Failed to start download for '%s'\n", url_str);
- return 1;
- }
- u32 previous_downloaded_size { 0 };
- timeval prev_time, current_time, time_diff;
- gettimeofday(&prev_time, nullptr);
- bool received_actual_headers = false;
- download->on_progress = [&](Optional<u32> maybe_total_size, u32 downloaded_size) {
- fprintf(stderr, "\r\033[2K");
- if (maybe_total_size.has_value()) {
- fprintf(stderr, "\033]9;%d;%d;\033\\", downloaded_size, maybe_total_size.value());
- fprintf(stderr, "Download progress: %s / %s", human_readable_size(downloaded_size).characters(), human_readable_size(maybe_total_size.value()).characters());
- } else {
- fprintf(stderr, "Download progress: %s / ???", human_readable_size(downloaded_size).characters());
- }
- gettimeofday(¤t_time, nullptr);
- timersub(¤t_time, &prev_time, &time_diff);
- auto time_diff_ms = time_diff.tv_sec * 1000 + time_diff.tv_usec / 1000;
- auto size_diff = downloaded_size - previous_downloaded_size;
- fprintf(stderr, " at %s/s", human_readable_size(((float)size_diff / (float)time_diff_ms) * 1000).characters());
- previous_downloaded_size = downloaded_size;
- prev_time = current_time;
- };
- if (save_at_provided_name) {
- download->on_headers_received = [&](auto& response_headers, auto status_code) {
- if (received_actual_headers)
- return;
- dbgln("Received headers! response code = {}", status_code.value_or(0));
- received_actual_headers = true; // And not trailers!
- String output_name;
- if (auto content_disposition = response_headers.get("Content-Disposition"); content_disposition.has_value()) {
- auto& value = content_disposition.value();
- ContentDispositionParser parser(value);
- output_name = parser.filename();
- }
- if (output_name.is_empty())
- output_name = url.path();
- LexicalPath path { output_name };
- output_name = path.basename();
- // The URL didn't have a name component, e.g. 'serenityos.org'
- if (output_name.is_empty() || output_name == "/") {
- int i = -1;
- do {
- output_name = url.host();
- if (i > -1)
- output_name = String::formatted("{}.{}", output_name, i);
- ++i;
- } while (Core::File::exists(output_name));
- }
- if (freopen(output_name.characters(), "w", stdout) == nullptr) {
- perror("freopen");
- loop.quit(1);
- return;
- }
- };
- }
- download->on_finish = [&](bool success, auto) {
- fprintf(stderr, "\033]9;-1;\033\\");
- fprintf(stderr, "\n");
- if (!success)
- fprintf(stderr, "Download failed :(\n");
- loop.quit(0);
- };
- auto output_stream = ConditionalOutputFileStream { [&] { return save_at_provided_name ? received_actual_headers : true; }, stdout };
- download->stream_into(output_stream);
- dbgln("started download with id {}", download->id());
- auto rc = loop.exec();
- // FIXME: This shouldn't be needed.
- fclose(stdout);
- return rc;
- }
|