Files
allwpilib/src/main/native/cpp/HttpUtil.cpp

352 lines
10 KiB
C++
Raw Normal View History

2016-12-02 19:15:40 -08:00
/*----------------------------------------------------------------------------*/
2017-08-25 17:48:06 -07:00
/* Copyright (c) 2016-2017 FIRST. All Rights Reserved. */
2016-12-02 19:15:40 -08:00
/* Open Source Software - may be modified and shared by FRC teams. The code */
/* must be accompanied by the FIRST BSD license file in the root directory of */
/* the project. */
/*----------------------------------------------------------------------------*/
#include "HttpUtil.h"
#include <cctype>
2017-08-25 17:48:06 -07:00
#include <llvm/STLExtras.h>
#include <llvm/StringExtras.h>
#include <support/Base64.h>
#include <tcpsockets/TCPConnector.h>
#include "Log.h"
2016-12-02 19:15:40 -08:00
namespace cs {
// Reads a single line from `is` into `buf` and returns a view of `buf`.
//
// At most `maxLen` characters are consumed from the stream.  Carriage returns
// are consumed (and count against `maxLen`) but are never stored.  Reading
// stops after a '\n' has been stored, so a complete line ends with '\n'.
//
// `*error` is set to true if the stream reports an error (the characters
// gathered so far are still returned), and to false otherwise.
llvm::StringRef ReadLine(wpi::raw_istream& is, llvm::SmallVectorImpl<char>& buf,
                         int maxLen, bool* error) {
  buf.clear();

  for (int remaining = maxLen; remaining > 0; --remaining) {
    char ch;
    is.read(ch);
    if (is.has_error()) {
      // hand back whatever was collected before the failure
      *error = true;
      return llvm::StringRef(buf.data(), buf.size());
    }

    // drop '\r' entirely; everything else is kept
    if (ch != '\r') {
      buf.push_back(ch);
      if (ch == '\n') break;  // end of line reached
    }
  }

  *error = false;
  return llvm::StringRef(buf.data(), buf.size());
}
// Decodes a percent-encoded string into `buf` and returns a view of `buf`.
//
// '+' is decoded to a space and "%xx" (two hex digits) to the corresponding
// byte; every other character is copied unchanged.
//
// On a truncated or non-hexadecimal escape, `*error` is set to true and an
// empty StringRef is returned.  Otherwise `*error` is set to false.
llvm::StringRef UnescapeURI(llvm::StringRef str,
                            llvm::SmallVectorImpl<char>& buf, bool* error) {
  buf.clear();

  const size_t len = str.size();
  size_t pos = 0;
  while (pos < len) {
    const char ch = str[pos];

    if (ch != '%') {
      // ordinary character: copy it, translating '+' to ' '
      buf.push_back(ch == '+' ? ' ' : ch);
      ++pos;
      continue;
    }

    // an escape needs two more characters after the '%'
    if (pos + 2 >= len) {
      *error = true;
      return llvm::StringRef{};
    }

    // high nibble
    const unsigned hi = llvm::hexDigitValue(str[pos + 1]);
    if (hi == -1U) {
      *error = true;
      return llvm::StringRef{};
    }

    // low nibble
    const unsigned lo = llvm::hexDigitValue(str[pos + 2]);
    if (lo == -1U) {
      *error = true;
      return llvm::StringRef{};
    }

    buf.push_back((hi << 4) | lo);
    pos += 3;
  }

  *error = false;
  return llvm::StringRef{buf.data(), buf.size()};
}
// Percent-encodes `str` into `buf` and returns a view of `buf`.
//
// Alphanumerics and the characters '-', '_', '.', '~' are copied unchanged.
// If `spacePlus` is true, a space is written as '+'.  Every other byte is
// written as "%XX" using uppercase hexadecimal digits.
llvm::StringRef EscapeURI(llvm::StringRef str, llvm::SmallVectorImpl<char>& buf,
                          bool spacePlus) {
  static const char* const hexLut = "0123456789ABCDEF";

  buf.clear();
  for (auto i = str.begin(), end = str.end(); i != end; ++i) {
    // <cctype> classifiers require a value representable as unsigned char;
    // passing a negative plain char (bytes >= 0x80 where char is signed) is
    // undefined behavior, so work on the unsigned value.
    const unsigned char c = static_cast<unsigned char>(*i);

    // pass unreserved characters to output
    if (std::isalnum(c) || c == '-' || c == '_' || c == '.' || c == '~') {
      buf.push_back(*i);
      continue;
    }

    // encode space to +
    if (spacePlus && c == ' ') {
      buf.push_back('+');
      continue;
    }

    // convert others to %xx
    buf.push_back('%');
    buf.push_back(hexLut[(c >> 4) & 0x0f]);
    buf.push_back(hexLut[c & 0x0f]);
  }

  return llvm::StringRef{buf.data(), buf.size()};
}
// Reads HTTP header lines from `is` until the blank line that ends the
// header section, capturing the values of Content-Type and Content-Length.
//
// `contentType` / `contentLength` may be null; when non-null they are cleared
// first and then receive the (left-trimmed) field value.  A line that starts
// with whitespace is treated as a continuation of the previous field and its
// trimmed content is appended to that field's value.
//
// Header field names are matched case-insensitively, as HTTP requires.
//
// Returns true once the blank line is reached, false if reading a line
// reported an error first.
bool ParseHttpHeaders(wpi::raw_istream& is,
                      llvm::SmallVectorImpl<char>* contentType,
                      llvm::SmallVectorImpl<char>* contentLength) {
  if (contentType) contentType->clear();
  if (contentLength) contentLength->clear();

  bool inContentType = false;
  bool inContentLength = false;
  llvm::SmallString<64> lineBuf;
  for (;;) {
    bool error;
    llvm::StringRef line = ReadLine(is, lineBuf, 1024, &error).rtrim();
    if (error) return false;
    if (line.empty()) return true;  // empty line signals end of headers

    // header fields start at the beginning of the line
    // (cast: <cctype> functions are undefined for negative char values)
    if (!std::isspace(static_cast<unsigned char>(line[0]))) {
      inContentType = false;
      inContentLength = false;
      llvm::StringRef field;
      std::tie(field, line) = line.split(':');
      field = field.rtrim();
      // field names are case-insensitive ("content-type" == "Content-Type")
      if (field.equals_lower("content-type"))
        inContentType = true;
      else if (field.equals_lower("content-length"))
        inContentLength = true;
      else
        continue;  // ignore other fields
    }

    // collapse whitespace
    line = line.ltrim();

    // save field data
    if (inContentType && contentType)
      contentType->append(line.begin(), line.end());
    else if (inContentLength && contentLength)
      contentLength->append(line.begin(), line.end());
  }
}
// Consumes data from `is` until "--" followed by `boundary` has been read.
//
// If `saveBuf` is non-null, the bytes skipped over before the boundary are
// appended to it.  If `saveBuf` is null, leading '\r' / '\n' bytes are first
// discarded one at a time.
//
// Returns true when the boundary was found, false if the stream reported an
// error before that.
bool FindMultipartBoundary(wpi::raw_istream& is, llvm::StringRef boundary,
                           std::string* saveBuf) {
  llvm::SmallString<64> searchBuf;
  searchBuf.resize(boundary.size() + 2);
  // number of bytes at the front of searchBuf that are already valid and
  // must not be overwritten by the next read
  size_t searchPos = 0;

  // Per the spec, the --boundary should be preceded by \r\n, so do a first
  // pass of 1-byte reads to throw those away (common case) and keep the
  // last non-\r\n character in searchBuf.
  if (!saveBuf) {
    do {
      is.read(searchBuf.data(), 1);
      if (is.has_error()) return false;
    } while (searchBuf[0] == '\r' || searchBuf[0] == '\n');
    searchPos = 1;
  }

  // Look for --boundary.  Read boundarysize+2 bytes at a time
  // during the search to speed up the reads, then fast-scan for -,
  // and only then match the entire boundary.  This will be slow if
  // there's a bunch of continuous -'s in the output, but that's unlikely.
  for (;;) {
    is.read(searchBuf.data() + searchPos, searchBuf.size() - searchPos);
    if (is.has_error()) return false;

    // Did we find the boundary?
    if (searchBuf[0] == '-' && searchBuf[1] == '-' &&
        searchBuf.substr(2) == boundary)
      return true;

    // Fast-scan for '-' (skipping a leading '-' that was already examined)
    size_t pos = searchBuf.find('-', searchBuf[0] == '-' ? 1 : 0);
    if (pos == llvm::StringRef::npos) {
      if (saveBuf) saveBuf->append(searchBuf.data(), searchBuf.size());
      // The whole buffer has been consumed, so the next read must refill it
      // from the start.  Without this reset a stale searchPos would keep old
      // bytes at the front, which would then be saved a second time or take
      // part in a false boundary match.
      searchPos = 0;
    } else {
      if (saveBuf) saveBuf->append(searchBuf.data(), pos);

      // move '-' and following to start of buffer (next read will fill)
      std::memmove(searchBuf.data(), searchBuf.data() + pos,
                   searchBuf.size() - pos);
      searchPos = searchBuf.size() - pos;
    }
  }
}
// Parses an "http://[user[:password]@]host[:port]/path[?query][#fragment]"
// URL into its components.
//
// `url_` is the URL to parse (a copy is kept in `url`).  `cameraName` is only
// used as a prefix for logged error messages.
//
// `*error` is set to true (and an error is logged) when the scheme is not
// http, the "//" is missing, the host is empty, the port is not an integer,
// or a user / password / query component cannot be unescaped.  It is set to
// false when parsing succeeds.  User, password and query parameters are
// stored unescaped; the port defaults to 80 when none is given.
HttpLocation::HttpLocation(llvm::StringRef url_, bool* error,
                           llvm::StringRef cameraName)
    : url{url_} {
  // Split apart into components
  llvm::StringRef query{url_};

  // scheme:
  llvm::StringRef scheme;
  std::tie(scheme, query) = query.split(':');
  if (!scheme.equals_lower("http")) {
    ERROR(cameraName << ": only supports http URLs, got \"" << url << "\"");
    *error = true;
    return;
  }

  // "//"
  if (!query.startswith("//")) {
    ERROR(cameraName << ": expected http://..., got \"" << url << "\"");
    *error = true;
    return;
  }
  query = query.drop_front(2);

  // user:password@host:port/
  llvm::StringRef authority;
  std::tie(authority, query) = query.split('/');

  // Separate the optional userinfo from host:port.  Look for the '@'
  // explicitly: inferring its absence from an empty right-hand side would
  // turn "user@" (userinfo present, host missing) into a host named "user"
  // instead of reporting the empty host.
  llvm::StringRef userpass, hostport;
  size_t atPos = authority.find('@');
  if (atPos == llvm::StringRef::npos) {
    hostport = authority;
  } else {
    userpass = authority.substr(0, atPos);
    hostport = authority.substr(atPos + 1);
  }

  if (!userpass.empty()) {
    llvm::StringRef rawUser, rawPassword;
    std::tie(rawUser, rawPassword) = userpass.split(':');
    llvm::SmallString<64> userBuf, passBuf;
    user = UnescapeURI(rawUser, userBuf, error);
    if (*error) {
      ERROR(cameraName << ": could not unescape user \"" << rawUser
                       << "\" in \"" << url << "\"");
      return;
    }
    password = UnescapeURI(rawPassword, passBuf, error);
    if (*error) {
      ERROR(cameraName << ": could not unescape password \"" << rawPassword
                       << "\" in \"" << url << "\"");
      return;
    }
  }

  // host[:port] -- split on the last ':' so only the trailing part is the port
  llvm::StringRef portStr;
  std::tie(host, portStr) = hostport.rsplit(':');
  if (host.empty()) {
    ERROR(cameraName << ": host is empty in \"" << url << "\"");
    *error = true;
    return;
  }
  if (portStr.empty()) {
    port = 80;
  } else if (portStr.getAsInteger(10, port)) {
    ERROR(cameraName << ": port \"" << portStr << "\" is not an integer in \""
                     << url << "\"");
    *error = true;
    return;
  }

  // path?query#fragment
  std::tie(query, fragment) = query.split('#');
  std::tie(path, query) = query.split('?');

  // Split query string into parameters
  while (!query.empty()) {
    // split out next param and value
    llvm::StringRef rawParam, rawValue;
    std::tie(rawParam, query) = query.split('&');
    if (rawParam.empty()) continue;  // ignore "&&"
    std::tie(rawParam, rawValue) = rawParam.split('=');

    // unescape param
    *error = false;
    llvm::SmallString<64> paramBuf;
    llvm::StringRef param = UnescapeURI(rawParam, paramBuf, error);
    if (*error) {
      ERROR(cameraName << ": could not unescape parameter \"" << rawParam
                       << "\" in \"" << url << "\"");
      return;
    }

    // unescape value
    llvm::SmallString<64> valueBuf;
    llvm::StringRef value = UnescapeURI(rawValue, valueBuf, error);
    if (*error) {
      ERROR(cameraName << ": could not unescape value \"" << rawValue
                       << "\" in \"" << url << "\"");
      return;
    }

    params.emplace_back(std::make_pair(param, value));
  }

  *error = false;
}
void HttpRequest::SetAuth(const HttpLocation& loc) {
if (!loc.user.empty()) {
llvm::SmallString<64> userpass;
userpass += loc.user;
userpass += ':';
userpass += loc.password;
wpi::Base64Encode(userpass, &auth);
}
}
bool HttpConnection::Handshake(const HttpRequest& request,
llvm::StringRef cameraName) {
// send GET request
os << "GET /" << request.path << " HTTP/1.1\r\n";
os << "Host: " << request.host << "\r\n";
if (!request.auth.empty())
os << "Authorization: Basic " << request.auth << "\r\n";
os << "\r\n";
os.flush();
// read first line of response
bool error = false;
llvm::SmallString<64> lineBuf;
llvm::StringRef line = ReadLine(is, lineBuf, 1024, &error).rtrim();
if (error) {
WARNING(cameraName << ": \"" << request.host
<< "\": disconnected before response");
return false;
}
// see if we got a HTTP 200 response
llvm::StringRef httpver, code, codeText;
std::tie(httpver, line) = line.split(' ');
std::tie(code, codeText) = line.split(' ');
if (!httpver.startswith("HTTP")) {
WARNING(cameraName << ": \"" << request.host
<< "\": did not receive HTTP response");
return false;
}
if (code != "200") {
WARNING(cameraName << ": \"" << request.host << "\": received " << code
<< " " << codeText << " response");
return false;
}
// Parse headers
if (!ParseHttpHeaders(is, &contentType, &contentLength)) {
WARNING(cameraName << ": \"" << request.host
<< "\": disconnected during headers");
return false;
}
return true;
}
2016-12-02 19:15:40 -08:00
} // namespace cs