Files
scylladb/httpd.cc
Avi Kivity 10695644d7 Get rid of regex in http parser
It's slow.  Replacing it doubles throughput to 110K req/s.
2014-08-20 16:37:11 +03:00

280 lines
10 KiB
C++

/*
* Copyright 2014 Cloudius Systems
*/
#include "reactor.hh"
#include "sstring.hh"
#include <iostream>
#include <algorithm>
#include <unordered_map>
#include <queue>
#include <bitset>
#include <limits>
#include <cctype>
class char_filter {
using uchar = unsigned char;
public:
template <typename Pred>
explicit char_filter(Pred pred) {
for (unsigned i = 0; i <= std::numeric_limits<uchar>::max(); ++i) {
_filter.set(i, pred(i));
}
}
bool operator()(char v) const { return _filter.test(uchar(v)); }
private:
std::bitset<1 << std::numeric_limits<uchar>::digits> _filter;
};
char_filter tchar([](char c) {
return std::isalnum(c) || std::string("-!#$%&'\\*\\+.^_`|~").find_first_of(c) != std::string::npos;
});
char_filter op_char([](char c) { return std::isupper(c); });
char_filter sp_char([](char c) { return std::isspace(c); });
char_filter nsp_char([](char c) { return !std::isspace(c); });
char_filter digit_char([](char c) { return std::isdigit(c); });
class http_server {
std::vector<pollable_fd> _listeners;
public:
void listen(ipv4_addr addr) {
listen_options lo;
lo.reuse_address = true;
_listeners.push_back(the_reactor.listen(make_ipv4_address(addr), lo));
do_accepts(_listeners.size() - 1);
}
void do_accepts(int which) {
_listeners[which].accept().then([this, which] (pollable_fd fd, socket_address addr) mutable {
(new connection(*this, std::move(fd), addr))->read();
do_accepts(which);
});
}
class connection {
http_server& _server;
pollable_fd _fd;
socket_address _addr;
input_stream_buffer<char> _read_buf;
output_stream_buffer<char> _write_buf;
bool _eof = false;
static constexpr size_t limit = 4096;
using tmp_buf = temporary_buffer<char>;
struct request {
sstring _method;
sstring _url;
sstring _version;
std::unordered_map<sstring, sstring> _headers;
};
sstring _last_header_name;
struct response {
sstring _response_line;
sstring _body;
std::unordered_map<sstring, sstring> _headers;
};
std::unique_ptr<request> _req;
std::unique_ptr<response> _resp;
std::queue<std::unique_ptr<response>> _pending_responses;
public:
connection(http_server& server, pollable_fd&& fd, socket_address addr)
: _server(server), _fd(std::move(fd)), _addr(addr), _read_buf(_fd, 8192)
, _write_buf(_fd, 8192) {}
void read() {
_read_buf.read_until(limit, '\n').then([this] (tmp_buf start_line) {
if (!start_line.size()) {
_eof = true;
maybe_done();
return;
}
_req = std::make_unique<request>();
size_t pos = 0;
size_t end = start_line.size();
while (pos < end && op_char(start_line[pos])) {
++pos;
}
if (pos == 0) {
return bad(std::move(_req));
}
_req->_method = sstring(start_line.begin(), pos);
if (pos == end || start_line[pos++] != ' ') {
return bad(std::move(_req));
}
auto url = pos;
while (pos < end && nsp_char(start_line[pos])) {
++pos;
}
_req->_url = sstring(start_line.begin() + url, pos - url);
if (pos == end || start_line[pos++] != ' ') {
return bad(std::move(_req));
}
if (pos == end || start_line[pos++] != 'H') {
return bad(std::move(_req));
}
if (pos == end || start_line[pos++] != 'T') {
return bad(std::move(_req));
}
if (pos == end || start_line[pos++] != 'T') {
return bad(std::move(_req));
}
if (pos == end || start_line[pos++] != 'P') {
return bad(std::move(_req));
}
if (pos == end || start_line[pos++] != '/') {
return bad(std::move(_req));
}
auto ver = pos;
if (pos == end || !digit_char(start_line[pos++])) {
return bad(std::move(_req));
}
if (pos == end || start_line[pos++] != '.') {
return bad(std::move(_req));
}
if (pos == end || !digit_char(start_line[pos++])) {
return bad(std::move(_req));
}
_req->_version = sstring(start_line.begin() + ver, pos - ver);
if (pos == end || start_line[pos++] != '\r') {
return bad(std::move(_req));
}
if (pos == end || start_line[pos++] != '\n') {
return bad(std::move(_req));
}
if (pos != end) {
return bad(std::move(_req));
}
if (_req->_method != "GET") {
return bad(std::move(_req));
}
_read_buf.read_until(limit, '\n').then([this] (tmp_buf header) {
parse_header(std::move(header));
});
});
}
void parse_header(tmp_buf header) {
if (header.size() == 2 && header[0] == '\r' && header[1] == '\n') {
generate_response(std::move(_req));
read();
return;
}
size_t pos = 0;
size_t end = header.size();
if (end < 2 || header[end-2] != '\r' || header[end-1] != '\n') {
return bad(std::move(_req));
}
while (tchar(header[pos])) {
++pos;
}
if (pos) {
sstring name = sstring(header.begin(), pos);
while (pos != end && sp_char(header[pos])) {
++pos;
}
if (pos == end || header[pos++] != ':') {
return bad(std::move(_req));
}
while (pos != end && sp_char(header[pos])) {
++pos;
}
while (pos != end && sp_char(header[end-1])) {
--end;
}
sstring value = sstring(header.begin() + pos, end - pos);
_req->_headers[name] = std::move(value);
_last_header_name = std::move(name);
} else {
while (sp_char(header[pos])) {
++pos;
}
while (pos != end && sp_char(header[end-1])) {
--end;
}
if (!pos || end == pos) {
return bad(std::move(_req));
}
_req->_headers[_last_header_name] += " ";
_req->_headers[_last_header_name] += sstring(header.begin() + pos, end - pos);
}
_read_buf.read_until(limit, '\n').then([this] (tmp_buf header) {
parse_header(std::move(header));
});
}
void bad(std::unique_ptr<request> req) {
auto resp = std::make_unique<response>();
resp->_response_line = "HTTP/1.1 400 BAD REQUEST\r\n\r\n";
respond(std::move(resp));
}
void respond(std::unique_ptr<response> resp) {
if (!_resp) {
_resp = std::move(resp);
start_response();
} else {
_pending_responses.push(std::move(resp));
}
}
void start_response() {
_resp->_headers["Content-Length"] = to_sstring(_resp->_body.size());
_write_buf.write(_resp->_response_line.begin(), _resp->_response_line.size()).then(
[this] (size_t n) mutable {
return write_response_headers(_resp->_headers.begin());
}).then([this] (size_t done) {
return _write_buf.write("\r\n", 2);
}).then([this] (size_t done) mutable {
return write_body();
}).then([this] (size_t done) {
return _write_buf.flush();
}).then([this] (bool done) {
_resp.reset();
if (!_pending_responses.empty()) {
_resp = std::move(_pending_responses.front());
_pending_responses.pop();
start_response();
} else {
maybe_done();
}
});
}
future<size_t> write_response_headers(std::unordered_map<sstring, sstring>::iterator hi) {
if (hi == _resp->_headers.end()) {
return make_ready_future<size_t>(0);
}
promise<size_t> pr;
auto fut = pr.get_future();
_write_buf.write(hi->first.begin(), hi->first.size()).then(
[hi, this, pr = std::move(pr)] (size_t done) mutable {
return _write_buf.write(": ", 2);
}).then([hi, this, pr = std::move(pr)] (size_t done) mutable {
return _write_buf.write(hi->second.begin(), hi->second.size());
}).then([hi, this, pr = std::move(pr)] (size_t done) mutable {
return _write_buf.write("\r\n", 2);
}).then([hi, this, pr = std::move(pr)] (size_t done) mutable {
return write_response_headers(++hi);
}).then([this, pr = std::move(pr)] (size_t done) mutable {
pr.set_value(done);
});
return fut;
}
void generate_response(std::unique_ptr<request> req) {
auto resp = std::make_unique<response>();
resp->_response_line = "HTTP/1.1 200 OK\r\n";
resp->_headers["Content-Type"] = "text/html";
resp->_body = "<html><head><title>this is the future</title></head><body><p>Future!!</p></body></html>";
respond(std::move(resp));
}
future<size_t> write_body() {
return _write_buf.write(_resp->_body.begin(), _resp->_body.size());
}
void maybe_done() {
if (_eof && !_req && !_resp && _pending_responses.empty()) {
delete this;
}
}
};
};
int main(int ac, char** av) {
http_server server;
server.listen({{}, 10000});
the_reactor.run();
return 0;
}