mirror of
				https://github.com/RGBCube/serenity
				synced 2025-10-31 21:12:43 +00:00 
			
		
		
		
	
		
			
				
	
	
		
			400 lines
		
	
	
	
		
			15 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
			
		
		
	
	
			400 lines
		
	
	
	
		
			15 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
| /*
 | |
|  * Copyright (c) 2018-2020, Andreas Kling <kling@serenityos.org>
 | |
|  * Copyright (c) 2022, Thomas Keppler <serenity@tkeppler.de>
 | |
|  *
 | |
|  * SPDX-License-Identifier: BSD-2-Clause
 | |
|  */
 | |
| 
 | |
| #include <AK/Base64.h>
 | |
| #include <AK/FileStream.h>
 | |
| #include <AK/GenericLexer.h>
 | |
| #include <AK/LexicalPath.h>
 | |
| #include <AK/NumberFormat.h>
 | |
| #include <AK/String.h>
 | |
| #include <AK/URL.h>
 | |
| #include <LibCore/ArgsParser.h>
 | |
| #include <LibCore/EventLoop.h>
 | |
| #include <LibCore/File.h>
 | |
| #include <LibCore/System.h>
 | |
| #include <LibHTTP/HttpResponse.h>
 | |
| #include <LibMain/Main.h>
 | |
| #include <LibProtocol/Request.h>
 | |
| #include <LibProtocol/RequestClient.h>
 | |
| #include <ctype.h>
 | |
| #include <stdio.h>
 | |
| 
 | |
| // FIXME: Move this somewhere else when it's needed (e.g. in the Browser)
 | |
| class ContentDispositionParser {
 | |
| public:
 | |
|     ContentDispositionParser(StringView value)
 | |
|     {
 | |
|         GenericLexer lexer(value);
 | |
| 
 | |
|         lexer.ignore_while(isspace);
 | |
| 
 | |
|         if (lexer.consume_specific("inline")) {
 | |
|             m_kind = Kind::Inline;
 | |
|             if (!lexer.is_eof())
 | |
|                 m_might_be_wrong = true;
 | |
|             return;
 | |
|         }
 | |
| 
 | |
|         if (lexer.consume_specific("attachment")) {
 | |
|             m_kind = Kind::Attachment;
 | |
|             if (lexer.consume_specific(";")) {
 | |
|                 lexer.ignore_while(isspace);
 | |
|                 if (lexer.consume_specific("filename=")) {
 | |
|                     // RFC 2183: "A short (length <= 78 characters)
 | |
|                     //            parameter value containing only non-`tspecials' characters SHOULD be
 | |
|                     //            represented as a single `token'."
 | |
|                     // Some people seem to take this as generic advice of "if it doesn't have special characters,
 | |
|                     // it's safe to specify as a single token"
 | |
|                     // So let's just be as lenient as possible.
 | |
|                     if (lexer.next_is('"'))
 | |
|                         m_filename = lexer.consume_quoted_string();
 | |
|                     else
 | |
|                         m_filename = lexer.consume_until(is_any_of("()<>@,;:\\\"/[]?= "sv));
 | |
|                 } else {
 | |
|                     m_might_be_wrong = true;
 | |
|                 }
 | |
|             }
 | |
|             return;
 | |
|         }
 | |
| 
 | |
|         if (lexer.consume_specific("form-data")) {
 | |
|             m_kind = Kind::FormData;
 | |
|             while (lexer.consume_specific(";")) {
 | |
|                 lexer.ignore_while(isspace);
 | |
|                 if (lexer.consume_specific("name=")) {
 | |
|                     m_name = lexer.consume_quoted_string();
 | |
|                 } else if (lexer.consume_specific("filename=")) {
 | |
|                     if (lexer.next_is('"'))
 | |
|                         m_filename = lexer.consume_quoted_string();
 | |
|                     else
 | |
|                         m_filename = lexer.consume_until(is_any_of("()<>@,;:\\\"/[]?= "sv));
 | |
|                 } else {
 | |
|                     m_might_be_wrong = true;
 | |
|                 }
 | |
|             }
 | |
| 
 | |
|             return;
 | |
|         }
 | |
| 
 | |
|         // FIXME: Support 'filename*'
 | |
|         m_might_be_wrong = true;
 | |
|     }
 | |
| 
 | |
|     enum class Kind {
 | |
|         Inline,
 | |
|         Attachment,
 | |
|         FormData,
 | |
|     };
 | |
| 
 | |
|     StringView filename() const { return m_filename; }
 | |
|     StringView name() const { return m_name; }
 | |
|     Kind kind() const { return m_kind; }
 | |
|     bool might_be_wrong() const { return m_might_be_wrong; }
 | |
| 
 | |
| private:
 | |
|     StringView m_filename;
 | |
|     StringView m_name;
 | |
|     Kind m_kind { Kind::Inline };
 | |
|     bool m_might_be_wrong { false };
 | |
| };
 | |
| 
 | |
| template<typename ConditionT>
 | |
| class ConditionalOutputFileStream final : public OutputFileStream {
 | |
| public:
 | |
|     template<typename... Args>
 | |
|     ConditionalOutputFileStream(ConditionT&& condition, Args... args)
 | |
|         : OutputFileStream(args...)
 | |
|         , m_condition(condition)
 | |
|     {
 | |
|     }
 | |
| 
 | |
|     ~ConditionalOutputFileStream()
 | |
|     {
 | |
|         if (!m_condition())
 | |
|             return;
 | |
| 
 | |
|         if (!m_buffer.is_empty()) {
 | |
|             OutputFileStream::write(m_buffer);
 | |
|             m_buffer.clear();
 | |
|         }
 | |
|     }
 | |
| 
 | |
| private:
 | |
|     size_t write(ReadonlyBytes bytes) override
 | |
|     {
 | |
|         if (!m_condition()) {
 | |
|         write_to_buffer:;
 | |
|             // FIXME: Propagate errors.
 | |
|             if (m_buffer.try_append(bytes.data(), bytes.size()).is_error())
 | |
|                 return 0;
 | |
|             return bytes.size();
 | |
|         }
 | |
| 
 | |
|         if (!m_buffer.is_empty()) {
 | |
|             auto size = OutputFileStream::write(m_buffer);
 | |
|             // FIXME: Propagate errors.
 | |
|             m_buffer = MUST(m_buffer.slice(size, m_buffer.size() - size));
 | |
|         }
 | |
| 
 | |
|         if (!m_buffer.is_empty())
 | |
|             goto write_to_buffer;
 | |
| 
 | |
|         return OutputFileStream::write(bytes);
 | |
|     }
 | |
| 
 | |
|     ConditionT m_condition;
 | |
|     ByteBuffer m_buffer;
 | |
| };
 | |
| 
 | |
| ErrorOr<int> serenity_main(Main::Arguments arguments)
 | |
| {
 | |
|     StringView url_str;
 | |
|     bool save_at_provided_name = false;
 | |
|     bool should_follow_url = false;
 | |
|     bool verbose_output = false;
 | |
|     char const* data = nullptr;
 | |
|     StringView proxy_spec;
 | |
|     DeprecatedString method = "GET";
 | |
|     StringView method_override;
 | |
|     HashMap<DeprecatedString, DeprecatedString, CaseInsensitiveStringTraits> request_headers;
 | |
|     String credentials;
 | |
| 
 | |
|     Core::ArgsParser args_parser;
 | |
|     args_parser.set_general_help(
 | |
|         "Request a file from an arbitrary URL. This command uses RequestServer, "
 | |
|         "and thus supports at least http, https, and gemini.");
 | |
|     args_parser.add_option(save_at_provided_name, "Write to a file named as the remote file", nullptr, 'O');
 | |
|     args_parser.add_option(data, "(HTTP only) Send the provided data via an HTTP POST request", "data", 'd', "data");
 | |
|     args_parser.add_option(method_override, "(HTTP only) HTTP method to use for the request (eg, GET, POST, etc)", "method", 'm', "method");
 | |
|     args_parser.add_option(should_follow_url, "(HTTP only) Follow the Location header if a 3xx status is encountered", "follow", 'l');
 | |
|     args_parser.add_option(Core::ArgsParser::Option {
 | |
|         .argument_mode = Core::ArgsParser::OptionArgumentMode::Required,
 | |
|         .help_string = "Add a header entry to the request",
 | |
|         .long_name = "header",
 | |
|         .short_name = 'H',
 | |
|         .value_name = "key:value",
 | |
|         .accept_value = [&](auto* s) {
 | |
|             StringView header { s, strlen(s) };
 | |
|             auto split = header.find(':');
 | |
|             if (!split.has_value())
 | |
|                 return false;
 | |
|             request_headers.set(header.substring_view(0, split.value()), header.substring_view(split.value() + 1));
 | |
|             return true;
 | |
|         } });
 | |
|     args_parser.add_option(Core::ArgsParser::Option {
 | |
|         .argument_mode = Core::ArgsParser::OptionArgumentMode::Required,
 | |
|         .help_string = "(HTTP only) Provide basic authentication credentials",
 | |
|         .long_name = "auth",
 | |
|         .short_name = 'u',
 | |
|         .value_name = "username:password",
 | |
|         .accept_value = [&](auto* s) {
 | |
|             StringView input { s, strlen(s) };
 | |
|             if (!input.contains(':'))
 | |
|                 return false;
 | |
| 
 | |
|             // NOTE: Input is explicitly not trimmed, but instead taken in raw;
 | |
|             //       Space prepended usernames and appended passwords might be legal in the user's context.
 | |
|             auto maybe_credentials = String::from_utf8(input);
 | |
|             if (maybe_credentials.is_error())
 | |
|                 return false;
 | |
| 
 | |
|             credentials = maybe_credentials.release_value();
 | |
|             return true;
 | |
|         } });
 | |
|     args_parser.add_option(proxy_spec, "Specify a proxy server to use for this request (proto://ip:port)", "proxy", 'p', "proxy");
 | |
|     args_parser.add_option(verbose_output, "(HTTP only) Log request and response metadata", "verbose", 'v');
 | |
|     args_parser.add_positional_argument(url_str, "URL to download from", "url");
 | |
|     args_parser.parse(arguments);
 | |
| 
 | |
|     if (!method_override.is_empty()) {
 | |
|         method = method_override;
 | |
|     } else if (data) {
 | |
|         method = "POST";
 | |
|         // FIXME: Content-Type?
 | |
|     }
 | |
| 
 | |
|     URL url(url_str);
 | |
|     if (!url.is_valid()) {
 | |
|         warnln("'{}' is not a valid URL", url_str);
 | |
|         return 1;
 | |
|     }
 | |
| 
 | |
|     bool const is_http_url = url.scheme().is_one_of("http"sv, "https"sv);
 | |
| 
 | |
|     Core::ProxyData proxy_data {};
 | |
|     if (!proxy_spec.is_empty())
 | |
|         proxy_data = TRY(Core::ProxyData::parse_url(proxy_spec));
 | |
| 
 | |
|     Core::EventLoop loop;
 | |
|     bool received_actual_headers = false;
 | |
|     bool should_save_stream_data = false;
 | |
|     bool following_url = false;
 | |
| 
 | |
|     u32 previous_downloaded_size = 0;
 | |
|     u32 const report_time_in_ms = 100;
 | |
|     u32 const speed_update_time_in_ms = 4000;
 | |
| 
 | |
|     timeval previous_time, current_time, time_diff;
 | |
|     gettimeofday(&previous_time, nullptr);
 | |
| 
 | |
|     RefPtr<Protocol::Request> request;
 | |
|     auto protocol_client = TRY(Protocol::RequestClient::try_create());
 | |
|     auto output_stream = ConditionalOutputFileStream { [&] { return should_save_stream_data; }, stdout };
 | |
| 
 | |
|     // https://httpwg.org/specs/rfc9110.html#authentication
 | |
|     auto const has_credentials = !credentials.is_empty();
 | |
|     auto const has_manual_authorization_header = request_headers.contains("Authorization");
 | |
|     if (is_http_url && has_credentials && !has_manual_authorization_header) {
 | |
|         // 11.2. Authentication Parameters
 | |
|         // The authentication scheme is followed by additional information necessary for achieving authentication via
 | |
|         // that scheme as (...) or a single sequence of characters capable of holding base64-encoded information.
 | |
|         auto const encoded_credentials = TRY(encode_base64(credentials.bytes()));
 | |
|         auto const authorization = TRY(String::formatted("Basic {}", encoded_credentials));
 | |
|         request_headers.set("Authorization", authorization.to_deprecated_string());
 | |
|     } else {
 | |
|         if (is_http_url && has_credentials && has_manual_authorization_header)
 | |
|             warnln("* Skipping encoding provided authorization, manual header present.");
 | |
|         if (!is_http_url && has_credentials)
 | |
|             warnln("* Skipping adding Authorization header, request was not for the HTTP protocol.");
 | |
|     }
 | |
| 
 | |
|     Function<void()> setup_request = [&] {
 | |
|         if (!request) {
 | |
|             warnln("Failed to start request for '{}'", url_str);
 | |
|             exit(1);
 | |
|         }
 | |
| 
 | |
|         if (verbose_output && is_http_url) {
 | |
|             warnln("* Setting up request");
 | |
|             warnln("> Method={}, URL={}", method, url);
 | |
|             for (auto const& header : request_headers) {
 | |
|                 warnln("> {}: {}", header.key, header.value);
 | |
|             }
 | |
|         }
 | |
| 
 | |
|         request->on_progress = [&](Optional<u32> maybe_total_size, u32 downloaded_size) {
 | |
|             gettimeofday(¤t_time, nullptr);
 | |
|             timersub(¤t_time, &previous_time, &time_diff);
 | |
|             auto time_diff_ms = time_diff.tv_sec * 1000 + time_diff.tv_usec / 1000;
 | |
|             if (time_diff_ms < report_time_in_ms)
 | |
|                 return;
 | |
| 
 | |
|             warn("\r\033[2K");
 | |
|             if (maybe_total_size.has_value()) {
 | |
|                 warn("\033]9;{};{};\033\\", downloaded_size, maybe_total_size.value());
 | |
|                 warn("Download progress: {} / {}", human_readable_size(downloaded_size), human_readable_size(maybe_total_size.value()));
 | |
|             } else {
 | |
|                 warn("Download progress: {} / ???", human_readable_size(downloaded_size));
 | |
|             }
 | |
| 
 | |
|             auto size_diff = downloaded_size - previous_downloaded_size;
 | |
|             if (time_diff_ms > speed_update_time_in_ms) {
 | |
|                 previous_time = current_time;
 | |
|                 previous_downloaded_size = downloaded_size;
 | |
|             }
 | |
| 
 | |
|             warn(" at {}/s", human_readable_size(((float)size_diff / (float)time_diff_ms) * 1000));
 | |
|         };
 | |
|         request->on_headers_received = [&](auto& response_headers, auto status_code) {
 | |
|             if (received_actual_headers)
 | |
|                 return;
 | |
|             dbgln("Received headers! response code = {}", status_code.value_or(0));
 | |
|             received_actual_headers = true; // And not trailers!
 | |
|             should_save_stream_data = true;
 | |
| 
 | |
|             if (verbose_output && is_http_url) {
 | |
|                 warnln("* Received headers");
 | |
|                 auto const value = status_code.value_or(0);
 | |
|                 auto const reason_phrase = (value != 0)
 | |
|                     ? HTTP::HttpResponse::reason_phrase_for_code(value)
 | |
|                     : "UNKNOWN"sv;
 | |
|                 warnln("< Code={}, Reason={}", value, reason_phrase);
 | |
|                 for (auto const& header : response_headers) {
 | |
|                     warnln("< {}: {}", header.key, header.value);
 | |
|                 }
 | |
|             }
 | |
| 
 | |
|             if (!following_url && save_at_provided_name) {
 | |
|                 DeprecatedString output_name;
 | |
|                 if (auto content_disposition = response_headers.get("Content-Disposition"); content_disposition.has_value()) {
 | |
|                     auto& value = content_disposition.value();
 | |
|                     ContentDispositionParser parser(value);
 | |
|                     output_name = parser.filename();
 | |
|                 }
 | |
| 
 | |
|                 if (output_name.is_empty())
 | |
|                     output_name = url.path();
 | |
| 
 | |
|                 LexicalPath path { output_name };
 | |
|                 output_name = path.basename();
 | |
| 
 | |
|                 // The URL didn't have a name component, e.g. 'serenityos.org'
 | |
|                 if (output_name.is_empty() || output_name == "/") {
 | |
|                     int i = -1;
 | |
|                     do {
 | |
|                         output_name = url.host();
 | |
|                         if (i > -1)
 | |
|                             output_name = DeprecatedString::formatted("{}.{}", output_name, i);
 | |
|                         ++i;
 | |
|                     } while (Core::File::exists(output_name));
 | |
|                 }
 | |
| 
 | |
|                 if (freopen(output_name.characters(), "w", stdout) == nullptr) {
 | |
|                     perror("freopen");
 | |
|                     loop.quit(1);
 | |
|                     return;
 | |
|                 }
 | |
|             }
 | |
| 
 | |
|             auto status_code_value = status_code.value_or(0);
 | |
|             if (should_follow_url && status_code_value >= 300 && status_code_value < 400) {
 | |
|                 if (auto location = response_headers.get("Location"); location.has_value()) {
 | |
|                     auto was_following_url = following_url;
 | |
|                     following_url = true;
 | |
|                     received_actual_headers = false;
 | |
|                     should_save_stream_data = false;
 | |
|                     request->on_finish = nullptr;
 | |
|                     request->on_headers_received = nullptr;
 | |
|                     request->on_progress = nullptr;
 | |
|                     request->stop();
 | |
| 
 | |
|                     Core::deferred_invoke([&, was_following_url, url = location.value()] {
 | |
|                         warnln("{}Following to {}", was_following_url ? "" : "\n", url);
 | |
|                         request = protocol_client->start_request(method, url, request_headers, ReadonlyBytes {}, proxy_data);
 | |
|                         setup_request();
 | |
|                     });
 | |
|                 }
 | |
|             } else {
 | |
|                 following_url = false;
 | |
| 
 | |
|                 if (status_code_value >= 400)
 | |
|                     warnln("Request returned error {}", status_code_value);
 | |
|             }
 | |
|         };
 | |
|         request->on_finish = [&](bool success, auto) {
 | |
|             if (following_url)
 | |
|                 return;
 | |
| 
 | |
|             warn("\033]9;-1;\033\\");
 | |
|             warnln();
 | |
|             if (!success)
 | |
|                 warnln("Request failed :(");
 | |
|             loop.quit(0);
 | |
|         };
 | |
| 
 | |
|         request->stream_into(output_stream);
 | |
|     };
 | |
| 
 | |
|     request = protocol_client->start_request(method, url, request_headers, data ? StringView { data, strlen(data) }.bytes() : ReadonlyBytes {}, proxy_data);
 | |
|     setup_request();
 | |
| 
 | |
|     dbgln("started request with id {}", request->id());
 | |
| 
 | |
|     auto rc = loop.exec();
 | |
|     fflush(stdout);
 | |
|     return rc;
 | |
| }
 | 
