0
0
Fork 0
mirror of https://github.com/matrix-construct/construct synced 2024-12-28 16:34:13 +01:00
construct/ircd/http.cc

734 lines
22 KiB
C++
Raw Normal View History

2016-11-29 16:23:38 +01:00
/*
* Copyright (C) 2016 Charybdis Development Team
* Copyright (C) 2016 Jason Volk <jason@zemos.net>
*
* Permission to use, copy, modify, and/or distribute this software for any
* purpose with or without fee is hereby granted, provided that the above
* copyright notice and this permission notice is present in all copies.
*
* THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
* IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
* WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
* DISCLAIMED. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT,
* INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
* (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
* SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
* HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT,
* STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING
* IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
* POSSIBILITY OF SUCH DAMAGE.
*/
#include <ircd/spirit.h>
2016-11-29 16:23:38 +01:00
// Declarations private to this translation unit's view of ircd::http:
// Boost.Spirit shorthands, the grammar/parser forward declarations and the
// helpers which format user-supplied header lists.
namespace ircd::http
{
// Namespace aliases for the Boost.Spirit components used by the grammar.
namespace spirit = boost::spirit;
namespace qi = spirit::qi;
namespace ascii = qi::ascii;
// Parser primitives and directives pulled in unqualified for rule definitions.
using spirit::unused_type;
using qi::lit;
using qi::string;
using qi::char_;
using qi::short_;
using qi::int_;
using qi::long_;
using qi::repeat;
using qi::omit;
using qi::raw;
using qi::attr;
using qi::eps;
// Rule collection, parameterized on iterator type and top-level attribute.
template<class it, class top = unused_type> struct grammar;
// Declares both the `parser` type and the single const instance of it which
// shares its name; both are defined further down in this file.
struct parser extern const parser;
// Bytes needed to print `headers`, each as "key: value\r\n" (no terminator).
size_t printed_size(const std::initializer_list<line::header> &headers);
// Formats `headers` into `buf` (capacity `max`) as "key: value\r\n" lines.
size_t print(char *const &buf, const size_t &max, const std::initializer_list<line::header> &headers);
}
std::map<ircd::http::code, ircd::string_view> ircd::http::reason
{
2017-04-03 05:59:18 +02:00
{ code::CONTINUE, "Continue" },
{ code::SWITCHING_PROTOCOLS, "Switching Protocols" },
2017-04-03 05:59:18 +02:00
{ code::OK, "OK" },
{ code::CREATED, "Created" },
{ code::ACCEPTED, "Accepted" },
{ code::NON_AUTHORITATIVE_INFORMATION, "Non-Authoritative Information" },
{ code::NO_CONTENT, "No Content" },
2017-04-07 01:54:20 +02:00
{ code::PARTIAL_CONTENT, "Partial Content" },
{ code::MOVED_PERMANENTLY, "Moved Permanently" },
{ code::FOUND, "Found" },
{ code::SEE_OTHER, "See Other" },
{ code::NOT_MODIFIED, "Not Modified" },
{ code::TEMPORARY_REDIRECT, "Temporary Redirect" },
{ code::PERMANENT_REDIRECT, "Permanent Redirect" },
2017-04-03 05:59:18 +02:00
{ code::BAD_REQUEST, "Bad Request" },
{ code::UNAUTHORIZED, "Unauthorized" },
{ code::FORBIDDEN, "Forbidden" },
{ code::NOT_FOUND, "Not Found" },
{ code::METHOD_NOT_ALLOWED, "Method Not Allowed" },
{ code::REQUEST_TIMEOUT, "Request Time-out" },
{ code::CONFLICT, "Conflict" },
{ code::REQUEST_URI_TOO_LONG, "Request URI Too Long" },
{ code::EXPECTATION_FAILED, "Expectation Failed" },
2017-04-07 01:54:20 +02:00
{ code::IM_A_TEAPOT, "Negative, I Am A Meat Popsicle" },
2017-04-03 05:59:18 +02:00
{ code::UNPROCESSABLE_ENTITY, "Unprocessable Entity" },
{ code::TOO_MANY_REQUESTS, "Too Many Requests" },
{ code::REQUEST_HEADER_FIELDS_TOO_LARGE, "Request Header Fields Too Large" },
2017-04-03 05:59:18 +02:00
{ code::INTERNAL_SERVER_ERROR, "Internal Server Error" },
{ code::NOT_IMPLEMENTED, "Not Implemented" },
{ code::SERVICE_UNAVAILABLE, "Service Unavailable" },
{ code::HTTP_VERSION_NOT_SUPPORTED, "HTTP Version Not Supported" },
{ code::INSUFFICIENT_STORAGE, "Insufficient Storage" },
};
2016-11-29 16:23:38 +01:00
// Fusion adaptations: expose each struct as a sequence so a Spirit rule's
// synthesized attribute can be assigned to it member-by-member, in the order
// the members are listed here.

// Request line: method, path, query, fragment, version.
BOOST_FUSION_ADAPT_STRUCT
(
	ircd::http::line::request,
	( decltype(ircd::http::line::request::method),    method    )
	( decltype(ircd::http::line::request::path),      path      )
	( decltype(ircd::http::line::request::query),     query     )
	( decltype(ircd::http::line::request::fragment),  fragment  )
	( decltype(ircd::http::line::request::version),   version   )
)

// Response (status) line: version, status, reason.
BOOST_FUSION_ADAPT_STRUCT
(
	ircd::http::line::response,
	( decltype(ircd::http::line::response::version),  version   )
	( decltype(ircd::http::line::response::status),   status    )
	( decltype(ircd::http::line::response::reason),   reason    )
)

// Header line: key/value pair.
BOOST_FUSION_ADAPT_STRUCT
(
	ircd::http::line::header,
	( decltype(ircd::http::line::header::first),      first     )
	( decltype(ircd::http::line::header::second),     second    )
)

// Query string element: key/value pair.
BOOST_FUSION_ADAPT_STRUCT
(
	ircd::http::query,
	( decltype(ircd::http::query::first),             first     )
	( decltype(ircd::http::query::second),            second    )
)
2016-11-29 16:23:38 +01:00
template<class it,
class top>
struct ircd::http::grammar
2016-11-29 16:23:38 +01:00
:qi::grammar<it, top>
,parse::grammar
{
template<class R = unused_type> using rule = qi::rule<it, R>;
rule<> NUL { lit('\0') ,"nul" };
2016-11-29 16:23:38 +01:00
// insignificant whitespaces
rule<> SP { lit('\x20') ,"space" };
rule<> HT { lit('\x09') ,"horizontal tab" };
rule<> ws { SP | HT ,"whitespace" };
rule<> CR { lit('\x0D') ,"carriage return" };
rule<> LF { lit('\x0A') ,"line feed" };
rule<> CRLF { CR >> LF ,"carriage return, line feed" };
2016-11-29 16:23:38 +01:00
rule<> illegal { NUL | CR | LF ,"illegal" };
rule<> colon { lit(':') ,"colon" };
rule<> slash { lit('/') ,"forward solidus" };
rule<> question { lit('?') ,"question mark" };
rule<> pound { lit('#') ,"pound sign" };
rule<> equal { lit('=') ,"equal sign" };
rule<> ampersand { lit('&') ,"ampersand" };
rule<string_view> token { raw[+(char_ - (illegal | ws))] ,"token" };
rule<string_view> string { raw[+(char_ - illegal)] ,"string" };
rule<string_view> line { *ws >> -string >> CRLF ,"line" };
rule<string_view> status { raw[repeat(3)[char_("0-9")]] ,"status" };
rule<short> status_code { short_ ,"status code" };
rule<string_view> reason { string ,"status" };
rule<string_view> head_key { raw[+(char_ - (illegal | ws | colon))] ,"head key" };
rule<string_view> head_val { string ,"head value" };
rule<line::header> header { head_key >> *ws >> colon >> *ws >> head_val ,"header" };
rule<unused_type> headers { (header % (*ws >> CRLF)) ,"headers" };
rule<> query_terminator { equal | question | ampersand | pound ,"query terminator" };
rule<> query_illegal { illegal | ws | query_terminator ,"query illegal" };
rule<string_view> query_key { raw[+(char_ - query_illegal)] ,"query key" };
rule<string_view> query_val { raw[*(char_ - query_illegal)] ,"query value" };
rule<string_view> method { token ,"method" };
rule<string_view> path { -slash >> raw[*(char_ - query_illegal)] ,"path" };
rule<string_view> fragment { pound >> -token ,"fragment" };
rule<string_view> version { token ,"version" };
rule<http::query> query
{
query_key >> -(equal >> query_val)
,"query"
};
rule<string_view> query_string
{
question >> -raw[(query_key >> -(equal >> query_val)) % ampersand]
,"query string"
};
rule<line::request> request_line
{
method >> +SP >> path >> -query_string >> -fragment >> +SP >> version
,"request line"
};
rule<line::response> response_line
{
version >> +SP >> status >> -(+SP >> reason)
,"response line"
};
rule<unused_type> request
{
request_line >> *ws >> CRLF >> -headers >> CRLF
,"request"
};
rule<unused_type> response
{
response_line >> *ws >> CRLF >> -headers >> CRLF
,"response"
};
grammar(rule<top> &top_rule, const char *const &name)
:grammar<it, top>::base_type
{
top_rule
}
,parse::grammar
{
name
}
{}
};
2016-11-29 16:23:38 +01:00
struct ircd::http::parser
2016-11-29 16:23:38 +01:00
:grammar<const char *, unused_type>
{
static size_t content_length(const string_view &val);
2016-11-29 16:23:38 +01:00
parser(): grammar { grammar::ws, "http.request" } {}
}
const ircd::http::parser;
2016-11-29 16:23:38 +01:00
/// Formats each header as "key: value\r\n" into a caller supplied buffer.
///
/// The key and value are printed with an explicit precision because a
/// string_view is not guaranteed to be NUL terminated. Output stops at the
/// first header which no longer fits (that header may be truncated); the
/// buffer is never written past `max` bytes.
///
/// @param buf      destination buffer
/// @param max      capacity of `buf` in bytes, including the terminating NUL
/// @param headers  the headers to print
/// @return number of characters actually stored in `buf`, excluding the NUL
size_t
ircd::http::print(char *const &buf,
                  const size_t &max,
                  const std::initializer_list<line::header> &headers)
{
	size_t ret(0);
	for(const auto &header : headers)
	{
		// Need room for at least one character plus the NUL.
		if(max <= ret + 1)
			break;

		const size_t room(max - ret);
		const int len
		{
			snprintf(buf + ret, room, "%.*s: %.*s\r\n",
			         int(header.first.size()),
			         header.first.data(),
			         int(header.second.size()),
			         header.second.data())
		};

		if(len < 0)
			break;

		// snprintf() returns the length it wanted to write; only count what
		// was stored so the offset can never run past the buffer.
		ret += std::min(size_t(len), room - 1);
	}

	return ret;
}
/// Computes the number of bytes print() produces for `headers`, excluding any
/// terminating NUL.
///
/// The binary operation takes the accumulator by const reference and returns
/// a new sum: a non-const lvalue reference parameter cannot bind to the moved
/// accumulator which std::accumulate passes as of C++20.
///
/// @param headers  the headers to measure
/// @return sum over all headers of key + ':' + SP + value + CRLF
size_t
ircd::http::printed_size(const std::initializer_list<line::header> &headers)
{
	return std::accumulate(begin(headers), end(headers), size_t(0), []
	(const size_t &ret, const auto &pair)
	{
		//            key                 :   SP  value                CRLF
		return ret + pair.first.size() + 1 + 1 + pair.second.size() + 2;
	});
}
2017-03-13 23:24:42 +01:00
/// Receives a request from the capstan: parses the head, offers it to the
/// optional `proffer` callback, then reads the content into `*c` if a
/// destination was given.
///
/// A scope guard runs when the body exits and discards whatever part of the
/// declared content length was not consumed after the head. If an exception
/// escapes and a `write_closure` was supplied, an error response is written
/// before the exception propagates to the caller.
ircd::http::request::request(parse::capstan &pc,
                             content *const &c,
                             const write_closure &write_closure,
                             const proffer &proffer,
                             const headers::closure &headers_closure)
try
{
	const head h{pc, headers_closure};

	// Where the content begins; everything parsed past here counts as consumed.
	const char *const content_mark(pc.parsed);
	const scope discard_unused_content{[&pc, &h, &content_mark]
	{
		const size_t used(pc.parsed - content_mark);
		const size_t left(h.content_length - used);
		http::content{pc, left, content::discard};
	}};

	if(proffer)
		proffer(h);

	if(c)
		*c = content{pc, h};
}
catch(const http::error &e)
{
	// An http::error carries its own status code and content for the reply.
	if(write_closure)
		http::response{e.code, e.content, write_closure};

	throw;
}
catch(const std::exception &e)
{
	// Anything else is reported as an internal server error.
	if(write_closure)
		http::response{http::INTERNAL_SERVER_ERROR, e.what(), write_closure};

	throw;
}
/// Composes a request and hands it to `closure` as a vector of buffers:
/// request line, Host header, Content-Length header, user headers followed by
/// the blank line, and finally the content.
///
/// All string_view arguments are printed with an explicit precision because
/// they are not guaranteed to be NUL terminated, and every length placed in
/// the vector is the number of bytes actually stored in the respective
/// buffer, not the length snprintf() wanted to write.
///
/// @param host     value of the Host header
/// @param method   request method; must not be empty
/// @param path     request path; printed after a leading '/'; must not be empty
/// @param query    query string without the '?'; may be empty
/// @param content  request body
/// @param closure  receives the composed buffers
/// @param headers  additional headers
ircd::http::request::request(const string_view &host,
                             const string_view &method,
                             const string_view &path,
                             const string_view &query,
                             const string_view &content,
                             const write_closure &closure,
                             const std::initializer_list<line::header> &headers)
{
	assert(!method.empty());
	assert(!path.empty());

	// Converts an snprintf() result into the count of bytes stored in a
	// buffer of capacity `max`.
	const auto stored([](const int &ret, const size_t &max) -> size_t
	{
		return ret < 0? 0 : std::min(size_t(ret), max - 1);
	});

	const auto &version{"HTTP/1.1"s};

	char request_line[2048]; const auto request_line_len
	{
		stored(snprintf(request_line, sizeof(request_line), "%.*s /%.*s%s%.*s %s\r\n",
		                int(method.size()),
		                method.data(),
		                int(path.size()),
		                path.data(),
		                query.empty()? "" : "?",
		                int(query.size()),
		                query.empty()? "" : query.data(),
		                version.data()),
		       sizeof(request_line))
	};

	char host_line[128] {"Host: "}; const auto host_line_len
	{
		6 + stored(snprintf(host_line + 6, sizeof(host_line) - 6, "%.*s\r\n",
		                    int(host.size()),
		                    host.data()),
		           sizeof(host_line) - 6)
	};

	char content_len[64]; const auto content_len_len
	{
		stored(snprintf(content_len, sizeof(content_len), "Content-Length: %zu\r\n",
		                content.size()),
		       sizeof(content_len))
	};

	// Room for the printed headers, the terminating CRLF and a NUL.
	char user_headers[printed_size(headers) + 2 + 1];

	// print() stores nothing for an empty list; start from an empty string.
	user_headers[0] = '\0';
	size_t user_headers_len
	{
		std::min(print(user_headers, sizeof(user_headers), headers), sizeof(user_headers) - 3)
	};

	// The blank line which ends the head.
	user_headers[user_headers_len++] = '\r';
	user_headers[user_headers_len++] = '\n';
	user_headers[user_headers_len] = '\0';

	const ilist<const_buffer> vector
	{
		{ request_line,    size_t(request_line_len)  },
		{ host_line,       size_t(host_line_len)     },
		{ content_len,     size_t(content_len_len)   },
		{ user_headers,    size_t(user_headers_len)  },
		{ content.data(),  content.size()            },
	};

	closure(vector);
}
2017-03-13 23:24:42 +01:00
/// Parses the request line and then every header line from the capstan.
/// The headers this class keeps (host, expect, te, content-length) are matched
/// case-insensitively; every header, recognized or not, is also passed to the
/// optional closure `c`.
ircd::http::request::head::head(parse::capstan &pc,
                                const headers::closure &c)
:line::request{pc}
{
	const auto each_header([this, &c](const auto &hdr)
	{
		if(iequals(hdr.first, "host"s))
			host = hdr.second;
		else if(iequals(hdr.first, "expect"s))
			expect = hdr.second;
		else if(iequals(hdr.first, "te"s))
			te = hdr.second;
		else if(iequals(hdr.first, "content-length"s))
			content_length = parser.content_length(hdr.second);

		if(c)
			c(hdr);
	});

	headers{pc, each_header};
}
2017-03-13 23:24:42 +01:00
/// Receives a response from the capstan: parses the head, offers it to the
/// optional `proffer` callback, then reads the content into `*c` if a
/// destination was given. A scope guard runs on exit and discards whatever
/// part of the declared content length was not consumed after the head.
ircd::http::response::response(parse::capstan &pc,
                               content *const &c,
                               const proffer &proffer,
                               const headers::closure &headers_closure)
{
	const head h{pc, headers_closure};

	// Where the content begins; everything parsed past here counts as consumed.
	const char *const content_mark(pc.parsed);
	const scope discard_unused_content{[&pc, &h, &content_mark]
	{
		const size_t used(pc.parsed - content_mark);
		const size_t left(h.content_length - used);
		http::content{pc, left, content::discard};
	}};

	if(proffer)
		proffer(h);

	if(c)
		*c = content{pc, h};
}
/// Composes a response and hands it to `closure` as a vector of buffers:
/// status line, Server, Date, Cache-Control, user headers, Content-Length,
/// the blank line, and finally the content. Some of the generated headers
/// are only emitted for certain ranges of status code.
///
/// The reason phrase is looked up without std::map::operator[], which would
/// insert an empty entry into the global table for an unknown code and hand
/// a null pointer to the formatter. Every length placed in the vector is the
/// number of bytes actually stored in the respective buffer.
///
/// @param code     status code of the response
/// @param content  response body
/// @param closure  receives the composed buffers
/// @param headers  additional headers
ircd::http::response::response(const code &code,
                               const string_view &content,
                               const write_closure &closure,
                               const std::initializer_list<line::header> &headers)
{
	// Converts an snprintf() result into the count of bytes stored in a
	// buffer of capacity `max`.
	const auto stored([](const int &ret, const size_t &max) -> size_t
	{
		return ret < 0? 0 : std::min(size_t(ret), max - 1);
	});

	// An unknown code yields an empty reason phrase.
	const auto reason_it(http::reason.find(code));
	const bool reason_known(reason_it != http::reason.end() && !reason_it->second.empty());
	const char *const reason_data(reason_known? reason_it->second.data() : "");
	const int reason_size(reason_known? int(reason_it->second.size()) : 0);

	char status_line[128]; const auto status_line_len
	{
		stored(snprintf(status_line, sizeof(status_line), "HTTP/1.1 %u %.*s\r\n",
		                uint(code),
		                reason_size,
		                reason_data),
		       sizeof(status_line))
	};

	char server_line[128]; const auto server_line_len
	{
		code >= 200 && code < 300?
			stored(snprintf(server_line, sizeof(server_line), "Server: %s (IRCd) %s\r\n",
			                BRANDING_NAME,
			                BRANDING_VERSION),
			       sizeof(server_line)):
			size_t(0)
	};

	// NOTE(review): HTTP-date is specified in GMT (IMF-fixdate); this prints
	// local time with a numeric zone offset. Confirm whether that is intended.
	const time_t ltime(time());
	struct tm *const tm(localtime(&ltime));
	char date_line[128]; const auto date_line_len
	{
		code < 400 || code >= 500?
			strftime(date_line, sizeof(date_line), "Date: %a, %d %b %Y %T %z\r\n", tm):
			0
	};

	char cache_line[64]; const auto cache_line_len
	{
		//TODO: real cache control subsystem
		(code >= 200 && code < 300) || (code >= 403 && code <= 405) || (code >= 300 && code < 400)?
			stored(snprintf(cache_line, sizeof(cache_line), "Cache-Control: %s\r\n",
			                "no-cache"),
			       sizeof(cache_line)):
			size_t(0)
	};

	char content_len[64]; const auto content_len_len
	{
		code != NO_CONTENT?
			stored(snprintf(content_len, sizeof(content_len), "Content-Length: %zu\r\n",
			                content.size()),
			       sizeof(content_len)):
			size_t(0)
	};

	// Printed size of the user headers plus one byte for the NUL.
	const size_t user_headers_bufsize
	{
		printed_size(headers) + 1
	};

	char user_headers[user_headers_bufsize]; const auto user_headers_len
	{
		std::min(print(user_headers, sizeof(user_headers), headers), sizeof(user_headers) - 1)
	};

	const ilist<const_buffer> iov
	{
		{ status_line,     size_t(status_line_len)   },
		{ server_line,     size_t(server_line_len)   },
		{ date_line,       size_t(date_line_len)     },
		{ cache_line,      size_t(cache_line_len)    },
		{ user_headers,    size_t(user_headers_len)  },
		{ content_len,     size_t(content_len_len)   },
		{ "\r\n",          2                         },
		{ content.data(),  content.size()            },
	};

	closure(iov);
}
2017-03-13 23:24:42 +01:00
/// Parses the response line and then every header line from the capstan.
/// The content-length header (matched case-insensitively) is kept; every
/// header is also passed to the optional closure `c`.
ircd::http::response::head::head(parse::capstan &pc,
                                 const headers::closure &c)
:line::response{pc}
{
	const auto each_header([this, &c](const auto &hdr)
	{
		if(iequals(hdr.first, "content-length"s))
			content_length = parser.content_length(hdr.second);

		if(c)
			c(hdr);
	});

	headers{pc, each_header};
}
2017-03-13 23:24:42 +01:00
// Views `length` bytes of content in the capstan's buffer, starting at the
// current parse position. Bytes not already buffered are requested through
// pc.reader. Throws parse::buffer_error if the parse position ends up short
// of base + length.
ircd::http::content::content(parse::capstan &pc,
const size_t &length)
:string_view{[&pc, &length]
{
// The view begins at the current parse position.
const char *const base(pc.parsed);
// Take what is already buffered but unparsed, up to the requested length.
const size_t have(std::min(pc.unparsed(), length));
size_t remain(length - have);
pc.parsed += have;
// Ask the reader for more while content is outstanding and pc.remaining()
// is nonzero (presumably free space in the buffer -- confirm against capstan).
while(remain && pc.remaining())
{
const auto read_max(std::min(remain, pc.remaining()));
pc.reader(pc.read, pc.read + read_max);
// NOTE(review): assumes pc.unparsed() now equals the bytes just read.
remain -= pc.unparsed();
pc.parsed = pc.read;
}
//assert(pc.parsed == base + length);
if(unlikely(pc.parsed < base + length))
throw parse::buffer_error("parse buffer short by %zu to hold %zu total bytes of content",
remain,
length);
// NUL terminate after the content when pc.remaining() is nonzero.
if(pc.remaining())
*pc.read = '\0';
assert(pc.parsed == pc.read);
return string_view { base, pc.parsed };
}()}
{
}
2017-03-13 23:24:42 +01:00
/// Discards `length` bytes of content instead of keeping them; the resulting
/// string_view is empty. The read pointer is moved back over whatever
/// unparsed bytes count toward `length`, and the rest is read in chunks into
/// a static scratch buffer whose contents are never used.
ircd::http::content::content(parse::capstan &pc,
                             const size_t &length,
                             discard_t)
:string_view{}
{
	static char buf[512] alignas(16);

	const size_t buffered(std::min(pc.unparsed(), length));
	size_t outstanding(length - buffered);
	pc.read -= buffered;
	while(outstanding)
	{
		// The reader is handed the cursor and it is then measured against
		// the start of the scratch buffer to learn how much arrived.
		char *cursor(buf);
		__builtin_prefetch(cursor, 1, 0);    // 1 = write, 0 = no cache
		pc.reader(cursor, cursor + std::min(outstanding, sizeof(buf)));
		outstanding -= std::distance(buf, cursor);
	}
}
2017-03-13 23:24:42 +01:00
/// Parses header lines from the capstan until one with an empty key is
/// produced, passing each preceding header to the closure `c` when one is
/// given.
ircd::http::headers::headers(parse::capstan &pc,
                             const closure &c)
{
	line::header h{pc};
	while(!h.first.empty())
	{
		if(c)
			c(h);

		h = line::header{pc};
	}
}
2016-11-29 16:23:38 +01:00
/// Parses one header line into this key/value pair. An empty line is not
/// parsed and leaves the pair as default-constructed. A line which does not
/// match the header rule raises an http::error with code BAD_REQUEST whose
/// content describes the offending input.
ircd::http::line::header::header(const line &line)
try
{
	// eps > rule: a failure of the rule throws instead of returning false.
	static const auto grammar
	{
		eps > parser.header
	};

	if(!line.empty())
	{
		const char *cursor(line.data());
		const char *const finish(line.data() + line.size());
		qi::parse(cursor, finish, grammar, *this);
	}
}
catch(const qi::expectation_failure<const char *> &e)
{
	const auto expected(ircd::string(e.what_));

	char message[256];
	fmt::snprintf(message, sizeof(message),
	              "I require a valid HTTP %s. You sent %zu invalid characters starting with `%s'.",
	              between(expected, "<", ">"),
	              ssize_t(e.last - e.first),
	              string_view{e.first, e.last});

	throw error(code::BAD_REQUEST, message);
}
/// Parses a response (status) line into version, status and reason. Unlike
/// the request and header line parsers in this file, an expectation failure
/// is not caught here and propagates as thrown by Spirit.
ircd::http::line::response::response(const line &line)
{
	// eps > rule: a failure of the rule throws instead of returning false.
	static const auto grammar
	{
		eps > parser.response_line
	};

	const char *cursor(line.data());
	const char *const finish(line.data() + line.size());
	qi::parse(cursor, finish, grammar, *this);
}
/// Parses a request line into method, path, query, fragment and version.
/// A line which does not match raises an http::error with code BAD_REQUEST
/// whose content describes the offending input.
ircd::http::line::request::request(const line &line)
try
{
	// eps > rule: a failure of the rule throws instead of returning false.
	static const auto grammar
	{
		eps > parser.request_line
	};

	const char *cursor(line.data());
	const char *const finish(line.data() + line.size());
	qi::parse(cursor, finish, grammar, *this);
}
catch(const qi::expectation_failure<const char *> &e)
{
	const auto expected(ircd::string(e.what_));

	char message[256];
	fmt::snprintf(message, sizeof(message),
	              "I require a valid HTTP %s. You sent %zu invalid characters starting with `%s'.",
	              between(expected, "<", ">"),
	              ssize_t(e.last - e.first),
	              string_view{e.first, e.last});

	throw error(code::BAD_REQUEST, message);
}
2017-03-13 23:24:42 +01:00
/// Extracts one line from the capstan by invoking it with a callback which
/// applies the line rule to the offered range. The view is whatever the rule
/// yields, or empty when the rule does not match.
ircd::http::line::line(parse::capstan &pc)
:string_view{[&pc]
{
	static const auto grammar
	{
		parser.line
	};

	string_view ret;
	pc([&ret](const char *&start, const char *const &stop)
	{
		const bool matched(qi::parse(start, stop, grammar, ret));

		// Drop any partial attribute left behind by a failed match.
		if(!matched)
			ret = {};

		return matched;
	});

	return ret;
}()}
{
}
/// Returns the value for `key` in this query string.
/// @throws std::out_of_range when the lookup yields an empty value, which is
///         the case both for a missing key and for a key with an empty value.
ircd::string_view
ircd::http::query::string::at(const string_view &key)
const
{
	const auto value((*this)[key]);
	if(!value.empty())
		return value;

	throw std::out_of_range("Failed to find value for required query string key");
}
/// Returns the value of the first element whose key equals `key`, or an
/// empty view when no element matches.
ircd::string_view
ircd::http::query::string::operator[](const string_view &key)
const
{
	string_view ret;
	until([&key, &ret](const query &element) -> bool
	{
		// Keep iterating past elements with a different key.
		if(!(element.first == key))
			return true;

		ret = element.second;
		return false; // false to break out of until()
	});

	return ret;
}
bool
ircd::http::query::string::until(const std::function<bool (const query &)> &closure)
const
{
const auto action([&closure](const auto &attribute, const auto &context, auto &halt)
{
halt = closure(attribute);
});
const parser::rule<unused_type> grammar
{
-parser.question >> (parser.query[action] % parser.ampersand)
};
const string_view &s(*this);
const char *start(s.data()), *const stop(s.data() + s.size());
return qi::parse(start, stop, grammar);
}
void
ircd::http::query::string::for_each(const std::function<void (const query &)> &closure)
const
{
const auto action([&closure](const auto &attribute, const auto &context, auto &halt)
{
closure(attribute);
});
const parser::rule<unused_type> grammar
{
-parser.question >> (parser.query[action] % parser.ampersand)
};
const string_view &s(*this);
const char *start(s.data()), *const stop(s.data() + s.size());
qi::parse(start, stop, grammar);
}
2017-03-11 02:46:25 +01:00
ircd::http::error::error(const enum code &code,
std::string content)
2016-11-29 16:23:38 +01:00
:ircd::error{generate_skip}
2017-03-11 02:46:25 +01:00
,code{code}
,content{std::move(content)}
2016-11-29 16:23:38 +01:00
{
snprintf(buf, sizeof(buf), "%d %s", int(code), reason[code].data());
}
/// Converts the textual status in `str` to an http::code.
/// @throws ircd::error when the text does not parse as a number or the
///         number lies outside [0, 1000).
ircd::http::code
ircd::http::status(const string_view &str)
{
	static const auto grammar
	{
		parser.status_code
	};

	short ret;
	const char *cursor(str.data());
	const char *const finish(cursor + str.size());
	const bool parsed(qi::parse(cursor, finish, grammar, ret));

	// `ret` is only examined after a successful parse.
	const bool valid(parsed && ret >= 0 && ret < 1000);
	if(!valid)
		throw ircd::error("Invalid HTTP status code");

	return http::code(ret);
}
/// Converts the value of a content-length header to a size.
/// @throws http::error with code BAD_REQUEST when the text does not parse as
///         a number or the number is negative.
size_t
ircd::http::parser::content_length(const string_view &str)
{
	static const parser::rule<long> grammar
	{
		long_
	};

	long ret;
	const char *cursor(str.data());
	const char *const finish(cursor + str.size());
	const bool parsed(qi::parse(cursor, finish, grammar, ret));

	// `ret` is only examined after a successful parse.
	const bool valid(parsed && ret >= 0);
	if(!valid)
		throw error(BAD_REQUEST, "Invalid content-length value");

	return ret;
}