ppsspp/Common/Net/HTTPClient.cpp

634 lines
17 KiB
C++
Raw Normal View History

#include "Common/Net/HTTPClient.h"
#include "Common/TimeUtil.h"
#include "Common/StringUtils.h"
#include "Common/System/OSD.h"
#ifndef _WIN32
#include <netinet/in.h>
#include <arpa/inet.h>
#include <sys/select.h>
#include <sys/socket.h>
#include <sys/types.h>
#include <netdb.h>
#include <unistd.h>
#define closesocket close
#else
#ifndef NOMINMAX
#define NOMINMAX
#endif
#include <winsock2.h>
#include <ws2tcpip.h>
#include <io.h>
#endif
#include <cmath>
2020-09-29 11:02:02 +00:00
#include <cstdio>
#include <cstdlib>
#include "Common/Net/Resolve.h"
#include "Common/Net/URL.h"
#include "Common/File/FileDescriptor.h"
2023-09-23 18:10:45 +00:00
#include "Common/SysError.h"
#include "Common/Thread/ThreadUtil.h"
#include "Common/Data/Encoding/Compression.h"
#include "Common/Net/NetBuffer.h"
#include "Common/Log.h"
namespace net {
// Tears the connection down: closes the socket via Disconnect() and then
// releases the address list obtained from DNSResolve(), if there is one.
Connection::~Connection() {
	Disconnect();
	if (resolved_) {
		DNSResolveFree(resolved_);
	}
}
// Local stand-in for htons(), which was reported missing on the android x86 build server.
// Unconditionally swaps the two bytes of a 16-bit value, so it is only correct on
// little-endian hosts.
// TODO: Fix for big-endian
inline unsigned short myhtons(unsigned short x) {
	const unsigned int value = x;
	const unsigned int lowToHigh = (value & 0xFFu) << 8;
	const unsigned int highToLow = (value >> 8) & 0xFFu;
	return static_cast<unsigned short>(lowToHigh | highToLow);
}
2020-12-19 18:34:43 +00:00
// Returns a static, human-readable label for a DNSType, for use in log messages.
// Values other than IPV4, IPV6 and ANY yield "N/A".
const char *DNSTypeAsString(DNSType type) {
	if (type == DNSType::IPV4) {
		return "IPV4";
	}
	if (type == DNSType::IPV6) {
		return "IPV6";
	}
	if (type == DNSType::ANY) {
		return "ANY";
	}
	return "N/A";
}
bool Connection::Resolve(const char *host, int port, DNSType type) {
if ((intptr_t)sock_ != -1) {
ERROR_LOG(Log::IO, "Resolve: Already have a socket");
return false;
}
if (!host || port < 1 || port > 65535) {
ERROR_LOG(Log::IO, "Resolve: Invalid host or port (%d)", port);
return false;
}
2012-10-30 12:20:55 +00:00
host_ = host;
port_ = port;
char port_str[16];
snprintf(port_str, sizeof(port_str), "%d", port);
2013-11-18 15:27:39 +00:00
std::string err;
if (!net::DNSResolve(host, port_str, &resolved_, err, type)) {
WARN_LOG(Log::IO, "Failed to resolve host '%s': '%s' (%s)", host, err.c_str(), DNSTypeAsString(type));
2020-12-19 18:34:43 +00:00
// Zero port so that future calls fail.
port_ = 0;
return false;
}
2012-10-30 12:20:55 +00:00
return true;
}
2023-09-17 15:37:45 +00:00
// Writes a printable form of the address in `info` into `addrbuf` (capacity `bufsize`).
//
// IPv4 and IPv6 addresses are rendered with inet_ntop(). The address field is taken from the
// structure that matches the family: sockaddr_in::sin_addr for AF_INET and
// sockaddr_in6::sin6_addr for AF_INET6. The two structures place the address at different
// offsets, so reading an IPv6 address through sockaddr_in would format the wrong bytes.
// Any other family produces "(Unknown AF <n>)". If inet_ntop() fails, the buffer is set to an
// empty string so callers never log uninitialized data.
static void FormatAddr(char *addrbuf, size_t bufsize, const addrinfo *info) {
	// Non-const pointer on purpose: some platform headers declare inet_ntop's source as void *.
	void *rawAddr = nullptr;
	switch (info->ai_family) {
	case AF_INET:
		rawAddr = &reinterpret_cast<sockaddr_in *>(info->ai_addr)->sin_addr;
		break;
	case AF_INET6:
		rawAddr = &reinterpret_cast<sockaddr_in6 *>(info->ai_addr)->sin6_addr;
		break;
	default:
		snprintf(addrbuf, bufsize, "(Unknown AF %d)", info->ai_family);
		return;
	}

	if (!inet_ntop(info->ai_family, rawAddr, addrbuf, bufsize) && bufsize > 0) {
		addrbuf[0] = '\0';
	}
}
bool Connection::Connect(int maxTries, double timeout, bool *cancelConnect) {
if (port_ <= 0) {
ERROR_LOG(Log::IO, "Bad port");
return false;
}
sock_ = -1;
2012-10-30 12:20:55 +00:00
for (int tries = maxTries; tries > 0; --tries) {
std::vector<uintptr_t> sockets;
fd_set fds;
int maxfd = 1;
FD_ZERO(&fds);
for (addrinfo *possible = resolved_; possible != nullptr; possible = possible->ai_next) {
if (possible->ai_family != AF_INET && possible->ai_family != AF_INET6)
continue;
int sock = socket(possible->ai_family, SOCK_STREAM, IPPROTO_TCP);
if ((intptr_t)sock == -1) {
ERROR_LOG(Log::IO, "Bad socket");
continue;
}
// Windows sockets aren't limited by socket number, just by count, so checking FD_SETSIZE there is wrong.
#if !PPSSPP_PLATFORM(WINDOWS)
if (sock >= FD_SETSIZE) {
ERROR_LOG(Log::IO, "Socket doesn't fit in FD_SET: %d We probably have a leak.", sock);
closesocket(sock);
continue;
}
#endif
fd_util::SetNonBlocking(sock, true);
// Start trying to connect (async with timeout.)
errno = 0;
if (connect(sock, possible->ai_addr, (int)possible->ai_addrlen) < 0) {
2023-09-23 18:10:45 +00:00
#if PPSSPP_PLATFORM(WINDOWS)
int errorCode = WSAGetLastError();
std::string errorString = GetStringErrorMsg(errorCode);
bool unreachable = errorCode == WSAENETUNREACH;
bool inProgress = errorCode == WSAEINPROGRESS || errorCode == WSAEWOULDBLOCK;
#else
int errorCode = errno;
std::string errorString = strerror(errno);
bool unreachable = errorCode == ENETUNREACH;
bool inProgress = errorCode == EINPROGRESS || errorCode == EWOULDBLOCK;
#endif
if (!inProgress) {
char addrStr[128]{};
2023-09-17 15:37:45 +00:00
FormatAddr(addrStr, sizeof(addrStr), possible);
2023-09-23 18:10:45 +00:00
if (!unreachable) {
ERROR_LOG(Log::HTTP, "connect(%d) call to %s failed (%d: %s)", sock, addrStr, errorCode, errorString.c_str());
2023-09-17 15:37:45 +00:00
} else {
INFO_LOG(Log::HTTP, "connect(%d): Ignoring unreachable resolved address %s", sock, addrStr);
2023-09-17 15:37:45 +00:00
}
closesocket(sock);
continue;
}
}
sockets.push_back(sock);
FD_SET(sock, &fds);
if (maxfd < sock + 1) {
maxfd = sock + 1;
}
}
int selectResult = 0;
long timeoutHalfSeconds = floor(2 * timeout);
while (timeoutHalfSeconds >= 0 && selectResult == 0) {
2024-10-10 09:55:07 +00:00
struct timeval tv{};
tv.tv_sec = 0;
if (timeoutHalfSeconds > 0) {
// Wait up to 0.5 seconds between cancel checks.
tv.tv_usec = 500000;
} else {
// Wait the remaining <= 0.5 seconds. Possibly 0, but that's okay.
tv.tv_usec = (timeout - floor(2 * timeout) / 2) * 1000000.0;
}
--timeoutHalfSeconds;
selectResult = select(maxfd, nullptr, &fds, nullptr, &tv);
if (cancelConnect && *cancelConnect) {
WARN_LOG(Log::HTTP, "connect: cancelled (1)");
break;
}
}
if (selectResult > 0) {
// Something connected. Pick the first one that did (if multiple.)
for (int sock : sockets) {
if ((intptr_t)sock_ == -1 && FD_ISSET(sock, &fds)) {
sock_ = sock;
} else {
closesocket(sock);
}
}
// Great, now we're good to go.
return true;
} else {
// Fail. Close all the sockets.
for (int sock : sockets) {
closesocket(sock);
}
}
if (cancelConnect && *cancelConnect) {
WARN_LOG(Log::HTTP, "connect: cancelled (2)");
break;
}
sleep_ms(1, "connect");
2012-10-30 12:20:55 +00:00
}
// Nothing connected, unfortunately.
return false;
}
void Connection::Disconnect() {
2012-10-30 12:20:55 +00:00
if ((intptr_t)sock_ != -1) {
closesocket(sock_);
sock_ = -1;
}
}
2012-10-30 12:20:55 +00:00
} // net
namespace http {
// TODO: do something sane here
2023-07-14 13:24:34 +00:00
// User-Agent value that the Client constructor stores in userAgent_.
constexpr const char *DEFAULT_USERAGENT = "PPSSPP";
// Protocol version inserted after "HTTP/" in the request line built by SendRequestWithData().
constexpr const char *HTTP_VERSION = "1.1";
2013-06-04 20:05:17 +00:00
// Creates a client whose User-Agent header starts out as DEFAULT_USERAGENT.
Client::Client() {
	this->userAgent_ = DEFAULT_USERAGENT;
}
2013-06-04 20:05:17 +00:00
// Calls Disconnect() when the client is destroyed.
Client::~Client() {
Disconnect();
}
// Looks up `header` (matched case-insensitively, without the trailing colon) in the raw
// response header lines and stores its value in `*value`.
//
// If the header occurs more than once, the values are joined with "," in order of appearance
// (field combining). Line folding (deprecated) is ignored.
// Don't use for Set-Cookie, which is a special header per RFC 7230.
//
// Returns true if at least one matching line was found; `*value` is cleared otherwise.
bool GetHeaderValue(const std::vector<std::string> &responseHeaders, const std::string &header, std::string *value) {
	const std::string prefix = header + ":";
	value->clear();

	bool matched = false;
	for (const std::string &rawLine : responseHeaders) {
		const auto trimmed = StripSpaces(rawLine);
		if (!startsWithNoCase(trimmed, prefix))
			continue;

		// The value begins at the first non-blank character after the colon; if there is
		// none, the (empty) remainder after the colon is used.
		size_t start = trimmed.find_first_not_of(" \t", prefix.length());
		if (start == trimmed.npos)
			start = prefix.length();

		if (matched)
			*value += ",";
		*value += trimmed.substr(start);
		matched = true;
	}
	return matched;
}
2013-06-04 20:05:17 +00:00
// Decodes an HTTP "chunked" transfer-encoded body from `inbuffer` into `outbuffer`.
//
// Repeatedly reads a chunk-size line (hexadecimal), moves that many bytes to `outbuffer` and
// skips the two bytes that follow each chunk. A chunk size of zero ends the body; whatever is
// left in `inbuffer` is then discarded.
//
// outbuffer: expected to be empty on entry (checked by a debug assert).
// contentLength: currently unused.
//
// Returns true when the terminating zero-size chunk was found, false if a chunk-size line is
// missing, empty or not parseable as hexadecimal.
static bool DeChunk(Buffer *inbuffer, Buffer *outbuffer, int contentLength) {
	_dbg_assert_(outbuffer->empty());
	for (;;) {
		std::string line;
		inbuffer->TakeLineCRLF(&line);
		if (line.empty())
			return false;

		unsigned int chunkSize = 0;
		if (sscanf(line.c_str(), "%x", &chunkSize) != 1) {
			return false;
		}

		if (chunkSize == 0) {
			// a zero size chunk should mean the end.
			inbuffer->clear();
			return true;
		}

		std::string data;
		inbuffer->Take(chunkSize, &data);
		outbuffer->Append(data);
		// Skip the two bytes that trail the chunk data.
		inbuffer->Skip(2);
	}
}
// Performs a GET for `req` on the already connected socket.
//
// Sends the request (advertising gzip support), reads the status line and headers into
// `responseHeaders`, then reads the body into `output`.
//
// Returns the HTTP status code, or a negative value if sending, header reading or body
// reading failed.
int Client::GET(const RequestParams &req, Buffer *output, std::vector<std::string> &responseHeaders, net::RequestProgress *progress) {
	const char *const extraHeaders = "Accept-Encoding: gzip\r\n";

	const int sendResult = SendRequest("GET", req, extraHeaders, progress);
	if (sendResult < 0) {
		return sendResult;
	}

	net::Buffer readbuf;
	const int statusCode = ReadResponseHeaders(&readbuf, responseHeaders, progress);
	if (statusCode < 0) {
		return statusCode;
	}

	const int entityResult = ReadResponseEntity(&readbuf, responseHeaders, output, progress);
	return entityResult < 0 ? entityResult : statusCode;
}
// Convenience overload of GET for callers that do not need the response headers.
// Returns whatever the header-returning overload returns.
int Client::GET(const RequestParams &req, Buffer *output, net::RequestProgress *progress) {
	std::vector<std::string> discardedHeaders;
	return GET(req, output, discardedHeaders, progress);
}
int Client::POST(const RequestParams &req, const std::string &data, const std::string &mime, Buffer *output, net::RequestProgress *progress) {
2014-11-25 16:49:05 +00:00
char otherHeaders[2048];
if (mime.empty()) {
snprintf(otherHeaders, sizeof(otherHeaders), "Content-Length: %lld\r\n", (long long)data.size());
} else {
snprintf(otherHeaders, sizeof(otherHeaders), "Content-Length: %lld\r\nContent-Type: %s\r\n", (long long)data.size(), mime.c_str());
}
int err = SendRequestWithData("POST", req, data, otherHeaders, progress);
2014-11-25 16:49:05 +00:00
if (err < 0) {
return err;
}
net::Buffer readbuf;
2014-11-25 16:49:05 +00:00
std::vector<std::string> responseHeaders;
int code = ReadResponseHeaders(&readbuf, responseHeaders, progress);
if (code < 0) {
return code;
}
2014-11-25 16:49:05 +00:00
err = ReadResponseEntity(&readbuf, responseHeaders, output, progress);
if (err < 0) {
return err;
}
return code;
}
// Convenience overload of POST that passes an empty MIME type to the full overload.
int Client::POST(const RequestParams &req, const std::string &data, Buffer *output, net::RequestProgress *progress) {
	const std::string noMime;
	return POST(req, data, noMime, output, progress);
}
// Sends a request that has no body: forwards to SendRequestWithData() with empty data.
int Client::SendRequest(const char *method, const RequestParams &req, const char *otherHeaders, net::RequestProgress *progress) {
	const std::string noBody;
	return SendRequestWithData(method, req, noBody, otherHeaders, progress);
}
int Client::SendRequestWithData(const char *method, const RequestParams &req, const std::string &data, const char *otherHeaders, net::RequestProgress *progress) {
2023-07-18 13:52:14 +00:00
progress->Update(0, 0, false);
2013-11-18 15:27:39 +00:00
net::Buffer buffer;
2013-06-04 20:05:17 +00:00
const char *tpl =
"%s %s HTTP/%s\r\n"
2013-06-04 20:05:17 +00:00
"Host: %s\r\n"
"User-Agent: %s\r\n"
"Accept: %s\r\n"
2013-06-04 20:05:17 +00:00
"Connection: close\r\n"
"%s"
2013-06-04 20:05:17 +00:00
"\r\n";
buffer.Printf(tpl,
method, req.resource.c_str(), HTTP_VERSION,
host_.c_str(),
2021-05-01 06:12:42 +00:00
userAgent_.c_str(),
req.acceptMime,
otherHeaders ? otherHeaders : "");
2014-11-25 16:49:05 +00:00
buffer.Append(data);
bool flushed = buffer.FlushSocket(sock(), dataTimeout_, progress->cancelled);
if (!flushed) {
return -1; // TODO error code.
}
return 0;
}
// Waits for the response to arrive, then parses the status line and the header lines.
//
// The socket is polled in CANCEL_INTERVAL slices so that cancellation (progress->cancelled)
// and the overall dataTimeout_ can be honoured. A single read of up to 4096 bytes is then
// made into `readbuf`, and header lines are taken from it until an empty line (or a failed
// line read) is hit. Anything left in `readbuf` afterwards stays there for the caller.
//
// Returns the numeric status code from the status line, or -1 on cancellation, timeout, read
// failure, an unparseable status line, or when no header lines were found.
int Client::ReadResponseHeaders(net::Buffer *readbuf, std::vector<std::string> &responseHeaders, net::RequestProgress *progress) {
	// Snarf all the data we can into RAM. A little unsafe but hey.
	static constexpr float CANCEL_INTERVAL = 0.25f;
	const double deadline = time_now_d() + dataTimeout_;
	for (;;) {
		if (progress->cancelled && *progress->cancelled)
			return -1;
		if (fd_util::WaitUntilReady(sock(), CANCEL_INTERVAL, false))
			break;
		if (time_now_d() > deadline) {
			ERROR_LOG(Log::HTTP, "HTTP headers timed out");
			return -1;
		}
	}

	// Let's hope all the headers are available in a single packet...
	if (readbuf->Read(sock(), 4096) < 0) {
		ERROR_LOG(Log::HTTP, "Failed to read HTTP headers :(");
		return -1;
	}

	// Grab the first header line that contains the http code.
	std::string line;
	readbuf->TakeLineCRLF(&line);

	// The code is the first non-space token after the first space of the status line.
	size_t codePos = line.find(' ');
	if (codePos != line.npos) {
		codePos = line.find_first_not_of(' ', codePos);
	}
	if (codePos == line.npos) {
		ERROR_LOG(Log::HTTP, "Could not parse HTTP status code: %s", line.c_str());
		return -1;
	}
	const int code = atoi(&line[codePos]);

	for (;;) {
		const int lineSize = readbuf->TakeLineCRLF(&line);
		if (lineSize <= 0)
			break;
		responseHeaders.push_back(line);
	}

	if (responseHeaders.empty()) {
		ERROR_LOG(Log::HTTP, "No HTTP response headers");
		return -1;
	}

	return code;
}
// Reads the response body and stores the decoded result in `output`.
//
// The headers are scanned for Content-Length, Content-Encoding (gzip) and Transfer-Encoding
// (chunked). The rest of the body is then read from the socket into `readbuf`, and, unless
// `output` is a void buffer, it is de-chunked and/or decompressed as required.
//
// readbuf: may already hold body bytes that arrived together with the headers.
// progress: must have a non-null `cancelled` pointer (debug-asserted); it is marked done on
//           both success and decode failure.
//
// Returns 0 on success, -1 if reading, de-chunking or decompression failed.
int Client::ReadResponseEntity(net::Buffer *readbuf, const std::vector<std::string> &responseHeaders, Buffer *output, net::RequestProgress *progress) {
	_dbg_assert_(progress->cancelled);

	bool gzip = false;
	bool chunked = false;
	int contentLength = 0;
	// Iterate by reference: the header lines are only inspected, never modified.
	for (const std::string &line : responseHeaders) {
		if (startsWithNoCase(line, "Content-Length:")) {
			// The value starts after the colon. Whitespace there is optional, so skip
			// blanks instead of requiring a space to be present.
			size_t size_pos = line.find(':');
			if (size_pos != line.npos) {
				size_pos = line.find_first_not_of(" \t", size_pos + 1);
			}
			if (size_pos != line.npos) {
				contentLength = atoi(&line[size_pos]);
				chunked = false;
			}
		} else if (startsWithNoCase(line, "Content-Encoding:")) {
			// TODO: Case folding...
			if (line.find("gzip") != std::string::npos) {
				gzip = true;
			}
		} else if (startsWithNoCase(line, "Transfer-Encoding:")) {
			// TODO: Case folding...
			if (line.find("chunked") != std::string::npos) {
				chunked = true;
			}
		}
	}

	if (contentLength < 0) {
		WARN_LOG(Log::HTTP, "Negative content length %d", contentLength);
		// Just sanity checking...
		contentLength = 0;
	}

	if (!readbuf->ReadAllWithProgress(sock(), contentLength, progress))
		return -1;

	// readbuf now contains the rest of the reply.  Dechunk it.
	if (!output->IsVoid()) {
		if (chunked) {
			if (!DeChunk(readbuf, output, contentLength)) {
				ERROR_LOG(Log::HTTP, "Bad chunked data, couldn't read chunk size");
				progress->Update(0, 0, true);
				return -1;
			}
		} else {
			output->Append(*readbuf);
		}

		// If it's gzipped, we decompress it and put it back in the buffer.
		if (gzip) {
			std::string compressed, decompressed;
			output->TakeAll(&compressed);
			bool result = decompress_string(compressed, &decompressed);
			if (!result) {
				ERROR_LOG(Log::HTTP, "Error decompressing using zlib");
				progress->Update(0, 0, true);
				return -1;
			}
			output->Append(decompressed);
		}
	}

	progress->Update(contentLength, contentLength, true);
	return 0;
}
// Constructs a request without starting it.
// method, url, name and progressBarMode are forwarded to the Request base class together with
// the address of this object's cancelled_ flag. postData, postMime and outfile are copied into
// the corresponding members.
HTTPRequest::HTTPRequest(RequestMethod method, const std::string &url, const std::string &postData, const std::string &postMime, const Path &outfile, ProgressBarMode progressBarMode, std::string_view name)
: Request(method, url, name, &cancelled_, progressBarMode), postData_(postData), postMime_(postMime), outfile_(outfile) {
}
// Removes this request's progress bar from the OSD (reporting success unless the request
// failed) and asserts that Join() was called before destruction.
HTTPRequest::~HTTPRequest() {
	const bool succeeded = !failed_;
	g_OSD.RemoveProgressBar(url_, succeeded, 0.5f);

	_assert_msg_(joined_, "Download destructed without join");
}
void HTTPRequest::Start() {
2024-10-10 08:46:52 +00:00
thread_ = std::thread([this] { Do(); });
}
void HTTPRequest::Join() {
2020-06-28 16:34:00 +00:00
if (joined_) {
ERROR_LOG(Log::HTTP, "Already joined thread!");
2020-06-28 16:34:00 +00:00
}
thread_.join();
joined_ = true;
}
void HTTPRequest::SetFailed(int code) {
failed_ = true;
2023-07-18 13:52:14 +00:00
progress_.Update(0, 0, true);
completed_ = true;
}
int HTTPRequest::Perform(const std::string &url) {
2019-06-23 19:04:59 +00:00
Url fileUrl(url);
if (!fileUrl.Valid()) {
2019-06-23 19:04:59 +00:00
return -1;
}
http::Client client;
2023-07-14 13:24:34 +00:00
if (!userAgent_.empty()) {
client.SetUserAgent(userAgent_);
}
2014-12-31 17:36:51 +00:00
if (!client.Resolve(fileUrl.Host().c_str(), fileUrl.Port())) {
ERROR_LOG(Log::HTTP, "Failed resolving %s", url.c_str());
2019-06-23 19:04:59 +00:00
return -1;
}
if (cancelled_) {
2019-06-23 19:04:59 +00:00
return -1;
}
2019-06-23 19:04:59 +00:00
if (!client.Connect(2, 20.0, &cancelled_)) {
ERROR_LOG(Log::HTTP, "Failed connecting to server or cancelled.");
2019-06-23 19:04:59 +00:00
return -1;
}
if (cancelled_) {
2019-06-23 19:04:59 +00:00
return -1;
}
RequestParams req(fileUrl.Resource(), acceptMime_);
if (method_ == RequestMethod::GET) {
return client.GET(req, &buffer_, responseHeaders_, &progress_);
} else {
return client.POST(req, postData_, postMime_, &buffer_, &progress_);
}
2019-06-23 19:04:59 +00:00
}
std::string HTTPRequest::RedirectLocation(const std::string &baseUrl) const {
std::string redirectUrl;
if (GetHeaderValue(responseHeaders_, "Location", &redirectUrl)) {
Url url(baseUrl);
url = url.Relative(redirectUrl);
redirectUrl = url.ToString();
}
2019-06-23 19:04:59 +00:00
return redirectUrl;
}
void HTTPRequest::Do() {
SetCurrentThreadName("HTTPDownload::Do");
AndroidJNIThreadContext jniContext;
2019-06-23 19:04:59 +00:00
resultCode_ = 0;
std::string downloadURL = url_;
while (resultCode_ == 0) {
// This is where the new request is performed.
int resultCode = Perform(downloadURL);
2019-06-23 19:04:59 +00:00
if (resultCode == -1) {
SetFailed(resultCode);
return;
}
if (resultCode == 301 || resultCode == 302 || resultCode == 303 || resultCode == 307 || resultCode == 308) {
std::string redirectURL = RedirectLocation(downloadURL);
if (redirectURL.empty()) {
ERROR_LOG(Log::HTTP, "Could not find Location header for redirect");
2019-06-23 19:04:59 +00:00
resultCode_ = resultCode;
} else if (redirectURL == downloadURL || redirectURL == url_) {
// Simple loop detected, bail out.
resultCode_ = resultCode;
}
// Perform the next GET.
if (resultCode_ == 0) {
INFO_LOG(Log::HTTP, "Download of %s redirected to %s", downloadURL.c_str(), redirectURL.c_str());
buffer_.clear();
responseHeaders_.clear();
}
2019-06-23 19:04:59 +00:00
downloadURL = redirectURL;
continue;
}
if (resultCode == 200) {
INFO_LOG(Log::HTTP, "Completed requesting %s (storing result to %s)", url_.c_str(), outfile_.empty() ? "memory" : outfile_.c_str());
2021-05-15 05:46:03 +00:00
if (!outfile_.empty() && !buffer_.FlushToFile(outfile_)) {
ERROR_LOG(Log::HTTP, "Failed writing download to '%s'", outfile_.c_str());
2019-06-23 19:04:59 +00:00
}
} else {
ERROR_LOG(Log::HTTP, "Error requesting '%s' (storing result to '%s'): %i", url_.c_str(), outfile_.empty() ? "memory" : outfile_.c_str(), resultCode);
2019-06-23 19:04:59 +00:00
}
resultCode_ = resultCode;
}
2013-11-29 16:33:56 +00:00
// Set this last to ensure no race conditions when checking Done. Users must always check
// Done before looking at the result code.
completed_ = true;
}
2012-10-30 12:20:55 +00:00
} // http