2018-12-31 22:04:05 +03:00
|
|
|
//
|
2019-01-01 01:02:34 +03:00
|
|
|
// Copyright Aliaksei Levin (levlam@telegram.org), Arseny Smirnov (arseny30@gmail.com) 2014-2019
|
2018-12-31 22:04:05 +03:00
|
|
|
//
|
|
|
|
// Distributed under the Boost Software License, Version 1.0. (See accompanying
|
|
|
|
// file LICENSE_1_0.txt or copy at http://www.boost.org/LICENSE_1_0.txt)
|
|
|
|
//
|
|
|
|
#include "td/net/Wget.h"
|
|
|
|
|
|
|
|
#include "td/net/HttpHeaderCreator.h"
|
|
|
|
#include "td/net/HttpOutboundConnection.h"
|
2018-08-15 15:41:42 +03:00
|
|
|
#include "td/net/SslStream.h"
|
2018-12-31 22:04:05 +03:00
|
|
|
|
|
|
|
#include "td/utils/buffer.h"
|
|
|
|
#include "td/utils/HttpUrl.h"
|
|
|
|
#include "td/utils/logging.h"
|
2018-04-28 11:56:10 +03:00
|
|
|
#include "td/utils/misc.h"
|
2018-12-31 22:04:05 +03:00
|
|
|
#include "td/utils/port/IPAddress.h"
|
|
|
|
#include "td/utils/port/SocketFd.h"
|
|
|
|
#include "td/utils/Slice.h"
|
|
|
|
|
|
|
|
#include <limits>
|
|
|
|
|
|
|
|
namespace td {
|
2018-05-18 16:15:01 +03:00
|
|
|
|
2019-06-17 19:12:54 +03:00
|
|
|
Wget::Wget(Promise<unique_ptr<HttpQuery>> promise, string url, std::vector<std::pair<string, string>> headers,
|
|
|
|
int32 timeout_in, int32 ttl, bool prefer_ipv6, SslStream::VerifyPeer verify_peer)
|
2018-12-31 22:04:05 +03:00
|
|
|
: promise_(std::move(promise))
|
|
|
|
, input_url_(std::move(url))
|
|
|
|
, headers_(std::move(headers))
|
|
|
|
, timeout_in_(timeout_in)
|
|
|
|
, ttl_(ttl)
|
2018-07-01 04:45:25 +03:00
|
|
|
, prefer_ipv6_(prefer_ipv6)
|
2018-12-31 22:04:05 +03:00
|
|
|
, verify_peer_(verify_peer) {
|
|
|
|
}
|
|
|
|
|
|
|
|
Status Wget::try_init() {
|
|
|
|
string input_url = input_url_;
|
|
|
|
TRY_RESULT(url, parse_url(MutableSlice(input_url)));
|
2018-05-18 16:15:01 +03:00
|
|
|
TRY_RESULT(ascii_host, idn_to_ascii(url.host_));
|
|
|
|
url.host_ = std::move(ascii_host);
|
2018-12-31 22:04:05 +03:00
|
|
|
|
|
|
|
HttpHeaderCreator hc;
|
|
|
|
hc.init_get(url.query_);
|
2018-03-13 22:31:37 +03:00
|
|
|
bool was_host = false;
|
2018-04-19 15:23:54 +03:00
|
|
|
bool was_accept_encoding = false;
|
2018-12-31 22:04:05 +03:00
|
|
|
for (auto &header : headers_) {
|
2018-04-19 15:23:54 +03:00
|
|
|
auto header_lower = to_lower(header.first);
|
|
|
|
if (header_lower == "host") {
|
2018-03-13 22:31:37 +03:00
|
|
|
was_host = true;
|
|
|
|
}
|
2018-04-19 15:23:54 +03:00
|
|
|
if (header_lower == "accept-encoding") {
|
|
|
|
was_accept_encoding = true;
|
|
|
|
}
|
2018-12-31 22:04:05 +03:00
|
|
|
hc.add_header(header.first, header.second);
|
|
|
|
}
|
2018-03-13 22:31:37 +03:00
|
|
|
if (!was_host) {
|
|
|
|
hc.add_header("Host", url.host_);
|
|
|
|
}
|
2018-04-19 15:23:54 +03:00
|
|
|
if (!was_accept_encoding) {
|
|
|
|
hc.add_header("Accept-Encoding", "gzip, deflate");
|
|
|
|
}
|
2018-06-01 23:45:34 +03:00
|
|
|
TRY_RESULT(header, hc.finish());
|
|
|
|
|
|
|
|
IPAddress addr;
|
2018-07-01 04:45:25 +03:00
|
|
|
TRY_STATUS(addr.init_host_port(url.host_, url.port_, prefer_ipv6_));
|
2018-06-01 23:45:34 +03:00
|
|
|
|
|
|
|
TRY_RESULT(fd, SocketFd::open(addr));
|
|
|
|
if (url.protocol_ == HttpUrl::Protocol::HTTP) {
|
2018-08-15 15:41:42 +03:00
|
|
|
connection_ = create_actor<HttpOutboundConnection>("Connect", std::move(fd), SslStream{},
|
|
|
|
std::numeric_limits<std::size_t>::max(), 0, 0,
|
|
|
|
ActorOwn<HttpOutboundConnection::Callback>(actor_id(this)));
|
2018-06-01 23:45:34 +03:00
|
|
|
} else {
|
2018-08-15 15:41:42 +03:00
|
|
|
TRY_RESULT(ssl_stream, SslStream::create(url.host_, CSlice() /* certificate */, verify_peer_));
|
|
|
|
connection_ = create_actor<HttpOutboundConnection>("Connect", std::move(fd), std::move(ssl_stream),
|
|
|
|
std::numeric_limits<std::size_t>::max(), 0, 0,
|
|
|
|
ActorOwn<HttpOutboundConnection::Callback>(actor_id(this)));
|
2018-06-01 23:45:34 +03:00
|
|
|
}
|
2018-12-31 22:04:05 +03:00
|
|
|
|
2018-06-01 23:45:34 +03:00
|
|
|
send_closure(connection_, &HttpOutboundConnection::write_next, BufferSlice(header));
|
2018-12-31 22:04:05 +03:00
|
|
|
send_closure(connection_, &HttpOutboundConnection::write_ok);
|
|
|
|
return Status::OK();
|
|
|
|
}
|
|
|
|
|
|
|
|
void Wget::loop() {
|
|
|
|
if (connection_.empty()) {
|
|
|
|
auto status = try_init();
|
|
|
|
if (status.is_error()) {
|
|
|
|
return on_error(std::move(status));
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2019-06-17 19:12:54 +03:00
|
|
|
void Wget::handle(unique_ptr<HttpQuery> result) {
|
2018-12-31 22:04:05 +03:00
|
|
|
on_ok(std::move(result));
|
|
|
|
}
|
|
|
|
|
|
|
|
void Wget::on_connection_error(Status error) {
|
|
|
|
on_error(std::move(error));
|
|
|
|
}
|
|
|
|
|
2019-06-17 19:12:54 +03:00
|
|
|
void Wget::on_ok(unique_ptr<HttpQuery> http_query_ptr) {
|
2018-12-31 22:04:05 +03:00
|
|
|
CHECK(promise_);
|
2019-06-17 19:12:54 +03:00
|
|
|
CHECK(http_query_ptr);
|
2018-05-18 02:03:21 +03:00
|
|
|
if ((http_query_ptr->code_ == 301 || http_query_ptr->code_ == 302 || http_query_ptr->code_ == 307 ||
|
|
|
|
http_query_ptr->code_ == 308) &&
|
|
|
|
ttl_ > 0) {
|
2018-12-31 22:04:05 +03:00
|
|
|
LOG(DEBUG) << *http_query_ptr;
|
2018-04-19 15:23:54 +03:00
|
|
|
input_url_ = http_query_ptr->get_header("location").str();
|
2018-12-31 22:04:05 +03:00
|
|
|
LOG(DEBUG) << input_url_;
|
|
|
|
ttl_--;
|
|
|
|
connection_.reset();
|
|
|
|
yield();
|
|
|
|
} else if (http_query_ptr->code_ >= 200 && http_query_ptr->code_ < 300) {
|
|
|
|
promise_.set_value(std::move(http_query_ptr));
|
|
|
|
stop();
|
|
|
|
} else {
|
2018-04-19 15:23:54 +03:00
|
|
|
on_error(Status::Error(PSLICE() << "HTTP error: " << http_query_ptr->code_));
|
2018-12-31 22:04:05 +03:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
void Wget::on_error(Status error) {
|
|
|
|
CHECK(error.is_error());
|
|
|
|
CHECK(promise_);
|
|
|
|
promise_.set_error(std::move(error));
|
|
|
|
stop();
|
|
|
|
}
|
|
|
|
|
|
|
|
void Wget::start_up() {
|
|
|
|
set_timeout_in(timeout_in_);
|
|
|
|
loop();
|
|
|
|
}
|
|
|
|
|
|
|
|
void Wget::timeout_expired() {
|
|
|
|
on_error(Status::Error("Timeout expired"));
|
|
|
|
}
|
|
|
|
|
|
|
|
void Wget::tear_down() {
|
|
|
|
if (promise_) {
|
|
|
|
on_error(Status::Error("Cancelled"));
|
|
|
|
}
|
|
|
|
}
|
2018-05-18 16:15:01 +03:00
|
|
|
|
2018-12-31 22:04:05 +03:00
|
|
|
} // namespace td
|