i2pd/libi2pd/HTTP.cpp

500 lines
14 KiB
C++
Raw Normal View History

2016-04-27 02:00:00 +02:00
/*
* Copyright (c) 2013-2017, The PurpleI2P Project
*
* This file is part of Purple i2pd project and licensed under BSD3
*
* See full license text in LICENSE file at top of project tree
*/
2017-02-05 04:39:54 +01:00
#include <algorithm>
#include <utility>
2018-02-16 19:56:44 +01:00
#include <stdio.h>
2016-06-14 20:37:22 +02:00
#include "util.h"
2016-04-27 02:00:00 +02:00
#include "HTTP.h"
#include <ctime>
2016-04-27 02:00:00 +02:00
namespace i2p {
namespace http {
2016-05-11 14:41:32 +02:00
/** Request methods recognised by is_http_method() */
const std::vector<std::string> HTTP_METHODS = {
	"GET", "HEAD", "POST", "PUT", "PATCH",
	"DELETE", "OPTIONS", "CONNECT"
};
/** Protocol versions recognised by is_http_version() */
const std::vector<std::string> HTTP_VERSIONS = {
	"HTTP/1.0", "HTTP/1.1"
};
/** Abbreviated weekday names, indexed by std::tm::tm_wday (0 = Sunday) */
const std::vector<const char *> weekdays = {
	"Sun", "Mon", "Tue", "Wed", "Thu", "Fri", "Sat"
};
/** Abbreviated month names, indexed by std::tm::tm_mon (0 = January) */
const std::vector<const char *> months = {
	"Jan", "Feb", "Mar", "Apr", "May", "Jun",
	"Jul", "Aug", "Sep", "Oct", "Nov", "Dec"
};
2016-04-27 02:00:00 +02:00
2016-05-11 14:41:32 +02:00
/**
 * @brief Check whether str is one of the entries of HTTP_VERSIONS
 * @param str  candidate protocol version, e.g. "HTTP/1.1"
 * @return true on an exact (case-sensitive) match
 */
inline bool is_http_version(const std::string & str) {
	return std::find(HTTP_VERSIONS.begin(), HTTP_VERSIONS.end(), str) != HTTP_VERSIONS.end();
}
2016-05-11 14:41:32 +02:00
/**
 * @brief Check whether str is one of the entries of HTTP_METHODS
 * @param str  candidate request method, e.g. "GET"
 * @return true on an exact (case-sensitive) match
 */
inline bool is_http_method(const std::string & str) {
	for (const auto & known : HTTP_METHODS) {
		if (known == str)
			return true;
	}
	return false;
}
2017-02-05 16:09:43 +01:00
2016-04-27 02:00:00 +02:00
/**
 * @brief Split line on delim and append the pieces to tokens
 * @param line    text to split
 * @param tokens  receives the pieces; existing elements are kept
 * @param delim   separator character
 * @param limit   when non-zero, splitting on delim stops once limit - 1 pieces
 *                were taken and the remainder is read up to the next '\n'
 */
void strsplit(const std::string & line, std::vector<std::string> &tokens, char delim, std::size_t limit = 0) {
	std::stringstream input(line);
	std::string piece;
	for (std::size_t index = 1; ; ++index) {
		/* from the limit-th piece on, '\n' replaces the caller's delimiter */
		const char sep = (limit > 0 && index >= limit) ? '\n' : delim;
		if (!std::getline(input, piece, sep))
			return;
		tokens.push_back(piece);
	}
}
2018-01-06 04:48:51 +01:00
/**
 * @brief Split one "Name: value" header line into its name and value
 *
 * The name is everything before the first ": "; whitespace following that
 * separator is skipped before the value starts.
 *
 * @param line  header line without the trailing CRLF
 * @return (name, value), or a pair of empty strings when line has no ": "
 */
static std::pair<std::string, std::string> parse_header_line(const std::string& line)
{
	std::size_t pos = 0;
	std::size_t len = 2; /* strlen(": ") */
	const std::size_t max = line.length();
	if ((pos = line.find(": ", pos)) == std::string::npos)
		return std::make_pair("", "");
	/* isspace() is undefined for negative values, so go through unsigned char */
	while ((pos + len) < max && isspace(static_cast<unsigned char>(line.at(pos + len))))
		len++;
	return std::make_pair(line.substr(0, pos), line.substr(pos + len));
}
void gen_rfc7231_date(std::string & out) {
std::time_t now = std::time(nullptr);
char buf[128];
std::tm *tm = std::gmtime(&now);
2018-02-16 19:56:44 +01:00
snprintf(buf, sizeof(buf), "%s, %02d %s %d %02d:%02d:%02d GMT",
weekdays[tm->tm_wday], tm->tm_mday, months[tm->tm_mon],
tm->tm_year + 1900, tm->tm_hour, tm->tm_min, tm->tm_sec
);
out = buf;
}
2016-04-27 02:00:00 +02:00
bool URL::parse(const char *str, std::size_t len) {
std::string url(str, len ? len : strlen(str));
return parse(url);
}
bool URL::parse(const std::string& url) {
std::size_t pos_p = 0; /* < current parse position */
std::size_t pos_c = 0; /* < work position */
2016-06-13 14:53:35 +02:00
if(url.at(0) != '/' || pos_p > 0) {
std::size_t pos_s = 0;
2016-04-27 02:00:00 +02:00
/* schema */
pos_c = url.find("://");
if (pos_c != std::string::npos) {
schema = url.substr(0, pos_c);
pos_p = pos_c + 3;
}
/* user[:pass] */
pos_s = url.find('/', pos_p); /* find first slash */
pos_c = url.find('@', pos_p); /* find end of 'user' or 'user:pass' part */
if (pos_c != std::string::npos && (pos_s == std::string::npos || pos_s > pos_c)) {
2016-04-27 02:00:00 +02:00
std::size_t delim = url.find(':', pos_p);
2018-02-11 12:05:41 +01:00
if (delim && delim != std::string::npos && delim < pos_c) {
2016-04-27 02:00:00 +02:00
user = url.substr(pos_p, delim - pos_p);
delim += 1;
pass = url.substr(delim, pos_c - delim);
2018-02-11 12:07:43 +01:00
} else if(delim) {
2016-04-27 02:00:00 +02:00
user = url.substr(pos_p, pos_c - pos_p);
}
pos_p = pos_c + 1;
2016-04-27 02:00:00 +02:00
}
/* hostname[:port][/path] */
pos_c = url.find_first_of(":/", pos_p);
if (pos_c == std::string::npos) {
/* only hostname, without post and path */
host = url.substr(pos_p, std::string::npos);
return true;
} else if (url.at(pos_c) == ':') {
host = url.substr(pos_p, pos_c - pos_p);
/* port[/path] */
pos_p = pos_c + 1;
pos_c = url.find('/', pos_p);
std::string port_str = (pos_c == std::string::npos)
? url.substr(pos_p, std::string::npos)
: url.substr(pos_p, pos_c - pos_p);
/* stoi throws exception on failure, we don't need it */
for (char c : port_str) {
if (c < '0' || c > '9')
return false;
port *= 10;
port += c - '0';
}
if (pos_c == std::string::npos)
return true; /* no path part */
pos_p = pos_c;
} else {
/* start of path part found */
host = url.substr(pos_p, pos_c - pos_p);
pos_p = pos_c;
}
}
/* pos_p now at start of path part */
pos_c = url.find_first_of("?#", pos_p);
if (pos_c == std::string::npos) {
/* only path, without fragment and query */
path = url.substr(pos_p, std::string::npos);
return true;
} else if (url.at(pos_c) == '?') {
/* found query part */
path = url.substr(pos_p, pos_c - pos_p);
pos_p = pos_c + 1;
pos_c = url.find('#', pos_p);
if (pos_c == std::string::npos) {
/* no fragment */
query = url.substr(pos_p, std::string::npos);
return true;
} else {
query = url.substr(pos_p, pos_c - pos_p);
pos_p = pos_c + 1;
}
} else {
/* found fragment part */
path = url.substr(pos_p, pos_c - pos_p);
pos_p = pos_c + 1;
}
/* pos_p now at start of fragment part */
frag = url.substr(pos_p, std::string::npos);
return true;
}
/**
 * @brief Break the query member into key/value pairs
 *
 * The query is split on '&'; each piece is split at its first '='. A piece
 * without '=' becomes a key with an empty value. When a key occurs more
 * than once the first occurrence is kept. No percent-decoding is done.
 *
 * @param params  cleared, then filled with the pairs found
 * @return always true
 */
bool URL::parse_query(std::map<std::string, std::string> & params) {
	std::vector<std::string> tokens;
	strsplit(query, tokens, '&');
	params.clear();
	for (const auto& it : tokens) {
		const std::size_t eq = it.find ('=');
		const bool has_value = (eq != std::string::npos);
		params.insert(std::pair<std::string, std::string>(
			has_value ? it.substr(0, eq) : it,
			has_value ? it.substr(eq + 1) : std::string()));
	}
	return true;
}
/**
 * @brief Reassemble the URL text from its components
 *
 * The "schema://[user[:pass]@]host[:port]" prefix is emitted only when a
 * schema is set; path, "?query" and "#frag" follow, the latter two only
 * when non-empty.
 *
 * @return the assembled URL
 */
std::string URL::to_string() {
	std::string result;
	if (!schema.empty()) {
		result += schema;
		result += "://";
		if (!user.empty()) {
			result += user;
			if (!pass.empty()) {
				result += ":";
				result += pass;
			}
			result += "@";
		}
		result += host;
		if (port) {
			result += ":";
			result += std::to_string(port);
		}
	}
	result += path;
	if (!query.empty()) {
		result += "?";
		result += query;
	}
	if (!frag.empty()) {
		result += "#";
		result += frag;
	}
	return result;
}
2017-02-05 16:09:43 +01:00
/**
 * @brief Tell whether host ends with ".i2p"
 * @return true when the last four characters of host are ".i2p"
 */
bool URL::is_i2p() const
{
	const std::size_t suffix_len = 4; /* strlen(".i2p") */
	/* check the length first: size() - 4 would wrap around for shorter hosts */
	if (host.size() < suffix_len)
		return false;
	return host.compare(host.size() - suffix_len, suffix_len, ".i2p") == 0;
}
/**
 * @brief Convenience overload of add_header() taking the value as std::string
 * @param name     header name
 * @param value    header value
 * @param replace  forwarded unchanged to the const char * overload
 */
void HTTPMsg::add_header(const char *name, std::string & value, bool replace) {
	const char *text = value.c_str();
	add_header(name, text, replace);
}
/**
 * @brief Set a header
 * @param name     header name
 * @param value    header value
 * @param replace  when the header already exists: true overwrites its value,
 *                 false leaves it as is
 */
void HTTPMsg::add_header(const char *name, const char *value, bool replace) {
	const bool present = headers.count(name) > 0;
	if (!present) {
		headers.insert(std::pair<std::string, std::string>(name, value));
		return;
	}
	/* already set: only touch it when the caller asked for replacement */
	if (replace)
		headers[name] = value;
}
/**
 * @brief Remove the header called name, if it is present
 * @param name  header name
 */
void HTTPMsg::del_header(const char *name) {
	const std::string key(name);
	headers.erase(key);
}
2016-04-27 02:00:00 +02:00
int HTTPReq::parse(const char *buf, size_t len) {
std::string str(buf, len);
return parse(str);
}
int HTTPReq::parse(const std::string& str) {
enum { REQ_LINE, HEADER_LINE } expect = REQ_LINE;
std::size_t eoh = str.find(HTTP_EOH); /* request head size */
std::size_t eol = 0, pos = 0;
URL url;
if (eoh == std::string::npos)
return 0; /* str not contains complete request */
while ((eol = str.find(CRLF, pos)) != std::string::npos) {
if (expect == REQ_LINE) {
std::string line = str.substr(pos, eol - pos);
std::vector<std::string> tokens;
strsplit(line, tokens, ' ');
if (tokens.size() != 3)
return -1;
2016-05-11 14:41:32 +02:00
if (!is_http_method(tokens[0]))
2016-04-27 02:00:00 +02:00
return -1;
2016-05-11 14:41:32 +02:00
if (!is_http_version(tokens[2]))
2016-04-27 02:00:00 +02:00
return -1;
if (!url.parse(tokens[1]))
return -1;
/* all ok */
method = tokens[0];
uri = tokens[1];
version = tokens[2];
expect = HEADER_LINE;
2018-01-06 04:48:51 +01:00
}
else
2017-02-05 04:39:54 +01:00
{
2016-04-27 02:00:00 +02:00
std::string line = str.substr(pos, eol - pos);
2017-02-05 04:39:54 +01:00
auto p = parse_header_line(line);
if (p.first.length () > 0)
headers.push_back (p);
2018-01-06 04:48:51 +01:00
else
2017-02-05 04:39:54 +01:00
return -1;
2016-04-27 02:00:00 +02:00
}
pos = eol + strlen(CRLF);
if (pos >= eoh)
break;
}
return eoh + strlen(HTTP_EOH);
}
2018-01-06 04:48:51 +01:00
void HTTPReq::write(std::ostream & o)
2017-02-05 04:39:54 +01:00
{
o << method << " " << uri << " " << version << CRLF;
2018-01-06 04:48:51 +01:00
for (auto & h : headers)
2018-01-06 05:01:44 +01:00
o << h.first << ": " << h.second << CRLF;
2017-02-05 04:39:54 +01:00
o << CRLF;
2016-04-27 02:00:00 +02:00
}
2016-11-20 18:13:11 +01:00
/**
 * @brief Serialize the request head into a string
 * @return the text produced by write()
 */
std::string HTTPReq::to_string()
{
	std::stringstream buffer;
	write(buffer);
	const std::string text = buffer.str();
	return text;
}
2017-02-05 04:39:54 +01:00
void HTTPReq::AddHeader (const std::string& name, const std::string& value)
2018-01-06 04:48:51 +01:00
{
2017-02-05 04:39:54 +01:00
headers.push_back (std::make_pair(name, value));
}
/**
 * @brief Change the value of the first header called name
 *
 * Nothing happens when no such header exists; the header is not added.
 *
 * @param name   header name, compared exactly
 * @param value  new value
 */
void HTTPReq::UpdateHeader (const std::string& name, const std::string& value)
{
	for (auto& it : headers)
	{
		if (it.first == name)
		{
			it.second = value;
			break; /* only the first match is updated */
		}
	}
}
void HTTPReq::RemoveHeader (const std::string& name, const std::string& exempt)
2017-02-05 04:39:54 +01:00
{
for (auto it = headers.begin (); it != headers.end ();)
{
2018-01-06 04:48:51 +01:00
if (!it->first.compare(0, name.length (), name) && it->first != exempt)
2017-02-05 04:39:54 +01:00
it = headers.erase (it);
else
it++;
2018-01-06 04:48:51 +01:00
}
}
2017-02-05 04:39:54 +01:00
2018-01-06 04:48:51 +01:00
std::string HTTPReq::GetHeader (const std::string& name) const
2017-02-05 04:39:54 +01:00
{
for (auto& it : headers)
if (it.first == name)
2018-01-06 04:48:51 +01:00
return it.second;
2017-02-05 04:39:54 +01:00
return "";
2018-01-06 04:48:51 +01:00
}
2017-02-12 21:11:19 +01:00
/**
 * @brief Tell whether the response uses chunked transfer coding
 * @return true when a "Transfer-Encoding" header exists and its value
 *         contains "chunked"
 */
bool HTTPRes::is_chunked() const
{
	auto it = headers.find("Transfer-Encoding");
	if (it == headers.end())
		return false; /* no header */
	/* chunked only when the token is present (the test used to be inverted) */
	return it->second.find("chunked") != std::string::npos;
}
2017-02-12 21:11:19 +01:00
/**
 * @brief Tell whether the response body is gzip-encoded
 * @param includingI2PGzip  when true, "x-i2p-gzip" counts as gzip as well
 * @return true when the "Content-Encoding" header value names "gzip", or
 *         "x-i2p-gzip" if includingI2PGzip is set
 */
bool HTTPRes::is_gzipped(bool includingI2PGzip) const
{
	auto it = headers.find("Content-Encoding");
	if (it == headers.end())
		return false; /* no header */
	const std::string & encoding = it->second;
	const std::string i2pPrefix = "x-i2p-";
	/* "gzip" is a substring of "x-i2p-gzip", so every hit must be told apart */
	std::size_t pos = 0;
	while ((pos = encoding.find("gzip", pos)) != std::string::npos) {
		const bool isI2PGzip = pos >= i2pPrefix.length() &&
			encoding.compare(pos - i2pPrefix.length(), i2pPrefix.length(), i2pPrefix) == 0;
		if (!isI2PGzip || includingI2PGzip)
			return true; /* gotcha! */
		pos += 4; /* strlen("gzip") */
	}
	return false;
}
2018-01-06 04:48:51 +01:00
2017-02-12 21:11:19 +01:00
/**
 * @brief Read the "Content-Length" header as a number
 * @return the header value, or -1 when the header is missing, does not start
 *         with a decimal number, is negative or does not fit into long int
 */
long int HTTPMsg::content_length() const
{
	auto it = headers.find("Content-Length");
	if (it == headers.end())
		return -1;
	const char *text = it->second.c_str();
	char *end = nullptr;
	errno = 0;
	const long int length = std::strtol(text, &end, 10);
	if (errno != 0)
		return -1; /* out of range */
	if (end == text)
		return -1; /* no digits at all; would otherwise be reported as 0 */
	if (length < 0)
		return -1; /* a negative length is meaningless */
	return length;
}
int HTTPRes::parse(const char *buf, size_t len) {
std::string str(buf, len);
return parse(str);
}
int HTTPRes::parse(const std::string& str) {
enum { RES_LINE, HEADER_LINE } expect = RES_LINE;
std::size_t eoh = str.find(HTTP_EOH); /* request head size */
std::size_t eol = 0, pos = 0;
if (eoh == std::string::npos)
return 0; /* str not contains complete request */
while ((eol = str.find(CRLF, pos)) != std::string::npos) {
if (expect == RES_LINE) {
std::string line = str.substr(pos, eol - pos);
std::vector<std::string> tokens;
strsplit(line, tokens, ' ', 3);
if (tokens.size() != 3)
return -1;
2016-05-11 14:41:32 +02:00
if (!is_http_version(tokens[0]))
2016-04-27 02:00:00 +02:00
return -1;
code = atoi(tokens[1].c_str());
if (code < 100 || code >= 600)
return -1;
/* all ok */
version = tokens[0];
status = tokens[2];
expect = HEADER_LINE;
} else {
std::string line = str.substr(pos, eol - pos);
2017-02-05 04:39:54 +01:00
auto p = parse_header_line(line);
if (p.first.length () > 0)
2018-01-06 04:48:51 +01:00
headers.insert (p);
else
2016-04-27 02:00:00 +02:00
return -1;
}
pos = eol + strlen(CRLF);
if (pos >= eoh)
break;
}
return eoh + strlen(HTTP_EOH);
}
/**
 * @brief Serialize the response: status line, headers, empty line, body
 *
 * The object is adjusted before it is written out:
 *  - a "Date" header is added to HTTP/1.1 responses which lack one;
 *  - a status text of "OK" is replaced by HTTPCodeToStatus(code) when code
 *    is not 200;
 *  - a "Content-Length" header is added when body is non-empty and the
 *    header is not set yet.
 *
 * @return the complete response text
 */
std::string HTTPRes::to_string() {
	if (version == "HTTP/1.1" && headers.count("Date") == 0) {
		std::string date;
		gen_rfc7231_date(date);
		add_header("Date", date.c_str());
	}
	if (status == "OK" && code != 200)
		status = HTTPCodeToStatus(code); // update
	if (body.length() > 0 && headers.count("Content-Length") == 0)
		add_header("Content-Length", std::to_string(body.length()).c_str());
	/* build response */
	std::stringstream ss;
	ss << version << " " << code << " " << status << CRLF;
	for (const auto & h : headers) {
		ss << h.first << ": " << h.second << CRLF;
	}
	ss << CRLF;
	if (body.length() > 0)
		ss << body;
	return ss.str();
}
/**
 * @brief Map a status code to its reason phrase
 * @param code  HTTP status code
 * @return pointer to a string literal; "Unknown Status" for codes which are
 *         not in the table
 */
const char * HTTPCodeToStatus(int code) {
	switch (code) {
		case 105: return "Name Not Resolved";
		/* success */
		case 200: return "OK";
		case 206: return "Partial Content";
		/* redirect */
		case 301: return "Moved Permanently";
		case 302: return "Found";
		case 304: return "Not Modified";
		case 307: return "Temporary Redirect";
		/* client error */
		case 400: return "Bad Request";
		case 401: return "Unauthorized";
		case 403: return "Forbidden";
		case 404: return "Not Found";
		case 407: return "Proxy Authentication Required";
		case 408: return "Request Timeout";
		/* server error */
		case 500: return "Internal Server Error";
		case 501: return "Not Implemented";
		case 502: return "Bad Gateway";
		case 503: return "Service Unavailable"; /* was mislabelled "Not Implemented" */
		case 504: return "Gateway Timeout";
		default: return "Unknown Status";
	}
}
/**
 * @brief Decode %XX escapes
 *
 * Only a '%' followed by two hexadecimal digits is decoded; any other '%'
 * is copied through unchanged. Decoded text is not scanned again, so
 * "%2541" becomes "%41".
 *
 * @param data        text to decode
 * @param allow_null  when false, "%00" is left in its escaped form
 * @return the decoded text
 */
std::string UrlDecode(const std::string& data, bool allow_null) {
	/* value of one hex digit, or -1 when c is not a hex digit */
	const auto hex_value = [](char c) -> int {
		if (c >= '0' && c <= '9') return c - '0';
		if (c >= 'a' && c <= 'f') return c - 'a' + 10;
		if (c >= 'A' && c <= 'F') return c - 'A' + 10;
		return -1;
	};
	std::string decoded(data);
	std::size_t pos = 0;
	while ((pos = decoded.find('%', pos)) != std::string::npos) {
		const int hi = (pos + 1 < decoded.length()) ? hex_value(decoded[pos + 1]) : -1;
		const int lo = (pos + 2 < decoded.length()) ? hex_value(decoded[pos + 2]) : -1;
		if (hi < 0 || lo < 0) {
			pos++; /* not an escape sequence: keep the '%' literally */
			continue;
		}
		const char c = static_cast<char>(hi * 16 + lo);
		if (c == '\0' && !allow_null) {
			pos += 3;
			continue;
		}
		decoded.replace(pos, 3, 1, c);
		pos++; /* step over the decoded character, it may itself be '%' */
	}
	return decoded;
}
/**
 * @brief Copy the payload of a chunked body from in to out
 *
 * Reads "<hex length>\r\n<data>\r\n" records until a record of length 0 or
 * the end of the input is reached.
 *
 * @param in   stream positioned at the first chunk-size line
 * @param out  receives the chunk data, without the chunk framing
 * @return false when a chunk size cannot be converted, exceeds 10Mb, or the
 *         input ends before the announced number of bytes was read;
 *         true otherwise
 */
bool MergeChunkedResponse (std::istream& in, std::ostream& out) {
	const unsigned long maxChunk = 10 * 1024 * 1024; /* 10Mb */
	std::string hexLen;
	std::vector<char> buf; /* reused for every chunk, released automatically */
	while (!in.eof ()) {
		std::getline (in, hexLen);
		errno = 0;
		const unsigned long len = std::strtoul(hexLen.c_str(), nullptr, 16);
		if (errno != 0)
			return false; /* conversion error */
		if (len == 0)
			return true; /* end of stream */
		if (len > maxChunk)
			return false; /* too large chunk */
		buf.resize (len);
		in.read (buf.data (), static_cast<std::streamsize>(len));
		if (static_cast<unsigned long>(in.gcount ()) != len)
			return false; /* truncated chunk: never emit bytes which were not read */
		out.write (buf.data (), static_cast<std::streamsize>(len));
		std::getline (in, hexLen); // read \r\n after chunk
	}
	return true;
}
} // http
} // i2p