1 Star 1 Fork 0

俞寅达 / nicenet

加入 Gitee
与超过 1200万 开发者一起发现、参与优秀开源项目,私有仓库也完全免费 :)
免费加入
克隆/下载
HttpParser.hpp 30.25 KB
一键复制 编辑 原始数据 按行查看 历史
俞寅达 提交于 2021-10-05 13:03 . nicenet
12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638
#ifndef ___NICE_HTTPPARSER____
#define ___NICE_HTTPPARSER____
#include <algorithm>
#include <string.h>
#include <stdlib.h>
#include <string>
#include <vector>
#include <sstream>
#include <map>
#include "Common.hpp"
namespace nicehero
{
struct HttpRequestBase {
HttpRequestBase()
: versionMajor(0), versionMinor(0), keepAlive(false), remainSize(0)
{}
struct HeaderItem
{
std::string name;
std::string value;
};
std::string method;
std::string uri;
int versionMajor;
int versionMinor;
std::vector<HeaderItem> headers;
std::vector<char> content;
bool keepAlive;
int remainSize;
std::string paramsString;
std::map<std::string,std::string> params;
std::string inspect() const
{
std::stringstream stream;
stream << method << " " << uri << " HTTP/"
<< versionMajor << "." << versionMinor << "\n";
for (std::vector<HttpRequestBase::HeaderItem>::const_iterator it = headers.begin();
it != headers.end(); ++it)
{
stream << it->name << ": " << it->value << "\n";
}
std::string data(content.begin(), content.end());
stream << data << "\n";
stream << "+ keep-alive: " << keepAlive << "\n";;
return stream.str();
}
};
// Incremental parser that turns a byte stream into an HttpRequestBase.
//
// Feed successive buffers to parse(). It returns ParsingIncompleted until the
// whole message has been seen, ParsingCompleted once it has (req.remainSize
// then holds the number of bytes of the last buffer that were not consumed),
// or ParsingError on malformed input. The parser keeps its state between
// calls and never resets it, so use a fresh parser and a fresh request object
// for every message.
//
// A body is only read for POST and PUT requests: Content-Length and
// "Transfer-Encoding: chunked" are ignored for every other method.
// Transfer-Encoding is only recognised when its value is exactly "chunked"
// (case-insensitive); when both are present, chunked takes precedence.
class HttpRequestParser
{
public:
    HttpRequestParser()
        : state(RequestMethodStart), contentSize(0),
          chunkSize(0), chunked(false)
    {
    }

    enum ParseResult {
        ParsingCompleted,
        ParsingIncompleted,
        ParsingError
    };

    // Consumes the bytes in [begin, end) and updates req accordingly.
    ParseResult parse(HttpRequestBase &req, const char *begin, const char *end)
    {
        return consume(req, begin, end);
    }

private:
    // Predicate for std::find_if: true for the "Connection" header.
    static bool checkIfConnection(const HttpRequestBase::HeaderItem &item)
    {
        return StrCaseCmp(item.name.c_str(), "Connection") == 0;
    }

    // Caps the speculative reserve() made from a peer-supplied length so a
    // bogus header cannot force a huge allocation before any data arrives.
    static size_t reserveHint(size_t wanted)
    {
        const size_t limit = 64 * 1024;
        return wanted < limit ? wanted : limit;
    }

    // Appends one decimal digit to a version number. Returns false, leaving
    // value untouched, once the number would exceed 999; this keeps the
    // accumulation free of signed overflow on hostile input.
    static bool appendVersionDigit(int &value, char digit)
    {
        const int limit = 999;
        const int next = value * 10 + (digit - '0');
        if (next > limit)
        {
            return false;
        }
        value = next;
        return true;
    }

    // Parses a Content-Length value: optional surrounding spaces/tabs around
    // one or more decimal digits. Returns false for anything else (sign,
    // empty value, trailing junk) or if the number does not fit in size_t.
    static bool parseContentLength(const std::string &text, size_t &out)
    {
        size_t first = 0;
        size_t last = text.size();
        while (first < last && (text[first] == ' ' || text[first] == '\t'))
        {
            ++first;
        }
        while (last > first && (text[last - 1] == ' ' || text[last - 1] == '\t'))
        {
            --last;
        }
        if (first == last)
        {
            return false;
        }

        const size_t maxValue = static_cast<size_t>(-1);
        size_t value = 0;
        for (size_t i = first; i < last; ++i)
        {
            const char c = text[i];
            if (c < '0' || c > '9')
            {
                return false;
            }
            const size_t digit = static_cast<size_t>(c - '0');
            if (value > (maxValue - digit) / 10)
            {
                return false; // would overflow
            }
            value = value * 10 + digit;
        }
        out = value;
        return true;
    }

    // Value of a hexadecimal digit, or -1 if c is not one.
    static int hexValue(char c)
    {
        if (c >= '0' && c <= '9') return c - '0';
        if (c >= 'a' && c <= 'f') return c - 'a' + 10;
        if (c >= 'A' && c <= 'F') return c - 'A' + 10;
        return -1;
    }

    // Parses a non-empty string of hex digits into out. Returns false if the
    // string is empty, has a non-hex character or does not fit in size_t.
    static bool parseChunkSize(const std::string &text, size_t &out)
    {
        if (text.empty())
        {
            return false;
        }
        const size_t maxValue = static_cast<size_t>(-1);
        size_t value = 0;
        for (size_t i = 0; i < text.size(); ++i)
        {
            const int digit = hexValue(text[i]);
            if (digit < 0 || value > (maxValue >> 4))
            {
                return false;
            }
            value = (value << 4) | static_cast<size_t>(digit);
        }
        out = value;
        return true;
    }

    // The state machine: handles one byte per loop iteration.
    ParseResult consume(HttpRequestBase &req, const char *begin, const char *end)
    {
        while (begin != end)
        {
            const char input = *begin++;
            switch (state)
            {
            // ---- request line: METHOD SP URI SP HTTP/x.y CRLF ----
            case RequestMethodStart:
                if (!isChar(input) || isControl(input) || isSpecial(input))
                {
                    return ParsingError;
                }
                state = RequestMethod;
                req.method.push_back(input);
                break;
            case RequestMethod:
                if (input == ' ')
                {
                    state = RequestUriStart;
                }
                else if (!isChar(input) || isControl(input) || isSpecial(input))
                {
                    return ParsingError;
                }
                else
                {
                    req.method.push_back(input);
                }
                break;
            case RequestUriStart:
                if (isControl(input))
                {
                    return ParsingError;
                }
                state = RequestUri;
                req.uri.push_back(input);
                break;
            case RequestUri:
                if (input == ' ')
                {
                    state = RequestHttpVersion_h;
                }
                else if (input == '\r')
                {
                    // Line ends without a version token: report it as an
                    // HTTP/0.9 request and stop right here.
                    req.versionMajor = 0;
                    req.versionMinor = 9;
                    req.remainSize = int(end - begin);
                    return ParsingCompleted;
                }
                else if (isControl(input))
                {
                    return ParsingError;
                }
                else
                {
                    req.uri.push_back(input);
                }
                break;
            case RequestHttpVersion_h:
                if (input != 'H')
                {
                    return ParsingError;
                }
                state = RequestHttpVersion_ht;
                break;
            case RequestHttpVersion_ht:
                if (input != 'T')
                {
                    return ParsingError;
                }
                state = RequestHttpVersion_htt;
                break;
            case RequestHttpVersion_htt:
                if (input != 'T')
                {
                    return ParsingError;
                }
                state = RequestHttpVersion_http;
                break;
            case RequestHttpVersion_http:
                if (input != 'P')
                {
                    return ParsingError;
                }
                state = RequestHttpVersion_slash;
                break;
            case RequestHttpVersion_slash:
                if (input != '/')
                {
                    return ParsingError;
                }
                req.versionMajor = 0;
                req.versionMinor = 0;
                state = RequestHttpVersion_majorStart;
                break;
            case RequestHttpVersion_majorStart:
                if (!isDigit(input))
                {
                    return ParsingError;
                }
                req.versionMajor = input - '0';
                state = RequestHttpVersion_major;
                break;
            case RequestHttpVersion_major:
                if (input == '.')
                {
                    state = RequestHttpVersion_minorStart;
                }
                else if (!isDigit(input) || !appendVersionDigit(req.versionMajor, input))
                {
                    return ParsingError;
                }
                break;
            case RequestHttpVersion_minorStart:
                if (!isDigit(input))
                {
                    return ParsingError;
                }
                req.versionMinor = input - '0';
                state = RequestHttpVersion_minor;
                break;
            case RequestHttpVersion_minor:
                if (input == '\r')
                {
                    state = ResponseHttpVersion_newLine;
                }
                else if (!isDigit(input) || !appendVersionDigit(req.versionMinor, input))
                {
                    return ParsingError;
                }
                break;
            case ResponseHttpVersion_newLine:
                // Despite its name this state ends the request line.
                if (input != '\n')
                {
                    return ParsingError;
                }
                state = HeaderLineStart;
                break;

            // ---- header section ----
            case HeaderLineStart:
                if (input == '\r')
                {
                    state = ExpectingNewline_3; // blank line: end of headers
                }
                else if (!req.headers.empty() && (input == ' ' || input == '\t'))
                {
                    state = HeaderLws; // continuation of the previous header
                }
                else if (!isChar(input) || isControl(input) || isSpecial(input))
                {
                    return ParsingError;
                }
                else
                {
                    req.headers.push_back(HttpRequestBase::HeaderItem());
                    req.headers.back().name.reserve(16);
                    req.headers.back().value.reserve(16);
                    req.headers.back().name.push_back(input);
                    state = HeaderName;
                }
                break;
            case HeaderLws:
                if (input == '\r')
                {
                    state = ExpectingNewline_2;
                }
                else if (input == ' ' || input == '\t')
                {
                    // skip leading whitespace of the continuation line
                }
                else if (isControl(input))
                {
                    return ParsingError;
                }
                else
                {
                    state = HeaderValue;
                    req.headers.back().value.push_back(input);
                }
                break;
            case HeaderName:
                if (input == ':')
                {
                    state = SpaceBeforeHeaderValue;
                }
                else if (!isChar(input) || isControl(input) || isSpecial(input))
                {
                    return ParsingError;
                }
                else
                {
                    req.headers.back().name.push_back(input);
                }
                break;
            case SpaceBeforeHeaderValue:
                state = HeaderValue;
                if (input == ' ' || input == '\t')
                {
                    break;
                }
                // The whitespace after the colon is optional, so this byte is
                // already part of the value (or ends it): let HeaderValue
                // deal with it.
                // fall through
            case HeaderValue:
                if (input == '\r')
                {
                    if (req.method == "POST" || req.method == "PUT")
                    {
                        HttpRequestBase::HeaderItem &h = req.headers.back();
                        if (StrCaseCmp(h.name.c_str(), "Content-Length") == 0)
                        {
                            if (!parseContentLength(h.value, contentSize))
                            {
                                return ParsingError;
                            }
                            req.content.reserve(reserveHint(contentSize));
                        }
                        else if (StrCaseCmp(h.name.c_str(), "Transfer-Encoding") == 0)
                        {
                            if (StrCaseCmp(h.value.c_str(), "chunked") == 0)
                                chunked = true;
                        }
                    }
                    state = ExpectingNewline_2;
                }
                else if (isControl(input))
                {
                    return ParsingError;
                }
                else
                {
                    req.headers.back().value.push_back(input);
                }
                break;
            case ExpectingNewline_2:
                if (input != '\n')
                {
                    return ParsingError;
                }
                state = HeaderLineStart;
                break;
            case ExpectingNewline_3: {
                // The blank line must be a full CRLF whatever follows it.
                if (input != '\n')
                {
                    return ParsingError;
                }

                // An explicit Connection header decides keep-alive; without
                // one, only HTTP/1.1 and major versions above 1 default to it.
                std::vector<HttpRequestBase::HeaderItem>::iterator it = std::find_if(req.headers.begin(),
                    req.headers.end(),
                    checkIfConnection);
                if (it != req.headers.end())
                {
                    req.keepAlive = (StrCaseCmp(it->value.c_str(), "Keep-Alive") == 0);
                }
                else if (req.versionMajor > 1 || (req.versionMajor == 1 && req.versionMinor == 1))
                {
                    req.keepAlive = true;
                }

                if (chunked)
                {
                    state = ChunkSize;
                }
                else if (contentSize == 0)
                {
                    req.remainSize = int(end - begin);
                    return ParsingCompleted;
                }
                else
                {
                    state = Post;
                }
                break;
            }

            // ---- body with Content-Length ----
            case Post:
                --contentSize;
                req.content.push_back(input);
                if (contentSize == 0)
                {
                    req.remainSize = int(end - begin);
                    return ParsingCompleted;
                }
                break;

            // ---- chunked body ----
            case ChunkSize:
                if (hexValue(input) >= 0)
                {
                    chunkSizeStr.push_back(input);
                }
                else if (input == ';')
                {
                    state = ChunkExtensionName;
                }
                else if (input == '\r')
                {
                    state = ChunkSizeNewLine;
                }
                else
                {
                    return ParsingError;
                }
                break;
            case ChunkExtensionName:
                if (isAlnum(input) || input == ' ')
                {
                    // extensions are skipped, not stored
                }
                else if (input == '=')
                {
                    state = ChunkExtensionValue;
                }
                else if (input == '\r')
                {
                    state = ChunkSizeNewLine;
                }
                else
                {
                    return ParsingError;
                }
                break;
            case ChunkExtensionValue:
                if (isAlnum(input) || input == ' ')
                {
                    // skip
                }
                else if (input == '\r')
                {
                    state = ChunkSizeNewLine;
                }
                else
                {
                    return ParsingError;
                }
                break;
            case ChunkSizeNewLine:
                if (input != '\n' || !parseChunkSize(chunkSizeStr, chunkSize))
                {
                    return ParsingError;
                }
                chunkSizeStr.clear();
                if (chunkSize == 0)
                {
                    state = ChunkSizeNewLine_2; // last chunk: trailers or final CRLF
                }
                else
                {
                    req.content.reserve(req.content.size() + reserveHint(chunkSize));
                    state = ChunkData;
                }
                break;
            case ChunkSizeNewLine_2:
                if (input == '\r')
                {
                    state = ChunkSizeNewLine_3;
                }
                else if (isChar(input) && !isControl(input) && !isSpecial(input))
                {
                    state = ChunkTrailerName;
                }
                else
                {
                    return ParsingError;
                }
                break;
            case ChunkSizeNewLine_3:
                if (input != '\n')
                {
                    return ParsingError;
                }
                req.remainSize = int(end - begin);
                return ParsingCompleted;
            case ChunkTrailerName:
                // Trailers follow the same character rules as header names
                // and are skipped, not stored.
                if (input == ':')
                {
                    state = ChunkTrailerValue;
                }
                else if (!isChar(input) || isControl(input) || isSpecial(input))
                {
                    return ParsingError;
                }
                break;
            case ChunkTrailerValue:
                if (input == '\r')
                {
                    state = ChunkTrailerNewLine;
                }
                else if (isControl(input))
                {
                    return ParsingError;
                }
                break;
            case ChunkTrailerNewLine:
                if (input != '\n')
                {
                    return ParsingError;
                }
                state = ChunkSizeNewLine_2; // another trailer or the final CRLF
                break;
            case ChunkData:
                req.content.push_back(input);
                if (--chunkSize == 0)
                {
                    state = ChunkDataNewLine_1;
                }
                break;
            case ChunkDataNewLine_1:
                if (input != '\r')
                {
                    return ParsingError;
                }
                state = ChunkDataNewLine_2;
                break;
            case ChunkDataNewLine_2:
                if (input != '\n')
                {
                    return ParsingError;
                }
                state = ChunkSize;
                break;
            default:
                return ParsingError;
            }
        }
        return ParsingIncompleted;
    }

    // Check if a byte is an HTTP character (7-bit ASCII).
    static bool isChar(int c)
    {
        return c >= 0 && c <= 127;
    }

    // Check if a byte is an HTTP control character.
    static bool isControl(int c)
    {
        return (c >= 0 && c <= 31) || (c == 127);
    }

    // Check if a byte is defined as an HTTP special (separator) character.
    static bool isSpecial(int c)
    {
        switch (c)
        {
        case '(': case ')': case '<': case '>': case '@':
        case ',': case ';': case ':': case '\\': case '"':
        case '/': case '[': case ']': case '?': case '=':
        case '{': case '}': case ' ': case '\t':
            return true;
        default:
            return false;
        }
    }

    // Check if a byte is a decimal digit.
    static bool isDigit(int c)
    {
        return c >= '0' && c <= '9';
    }

    // Check if a byte is an ASCII letter or digit. Written out by hand so it
    // is locale-independent and well defined for negative char values.
    static bool isAlnum(int c)
    {
        return isDigit(c) || (c >= 'a' && c <= 'z') || (c >= 'A' && c <= 'Z');
    }

    // The current state of the parser. The Response* enumerators other than
    // ResponseHttpVersion_newLine are not used by this class.
    enum State
    {
        RequestMethodStart,
        RequestMethod,
        RequestUriStart,
        RequestUri,
        RequestHttpVersion_h,
        RequestHttpVersion_ht,
        RequestHttpVersion_htt,
        RequestHttpVersion_http,
        RequestHttpVersion_slash,
        RequestHttpVersion_majorStart,
        RequestHttpVersion_major,
        RequestHttpVersion_minorStart,
        RequestHttpVersion_minor,
        ResponseStatusStart,
        ResponseHttpVersion_ht,
        ResponseHttpVersion_htt,
        ResponseHttpVersion_http,
        ResponseHttpVersion_slash,
        ResponseHttpVersion_majorStart,
        ResponseHttpVersion_major,
        ResponseHttpVersion_minorStart,
        ResponseHttpVersion_minor,
        ResponseHttpVersion_spaceAfterVersion,
        ResponseHttpVersion_statusCodeStart,
        ResponseHttpVersion_spaceAfterStatusCode,
        ResponseHttpVersion_statusTextStart,
        ResponseHttpVersion_newLine,
        HeaderLineStart,
        HeaderLws,
        HeaderName,
        SpaceBeforeHeaderValue,
        HeaderValue,
        ExpectingNewline_2,
        ExpectingNewline_3,
        Post,
        ChunkSize,
        ChunkExtensionName,
        ChunkExtensionValue,
        ChunkSizeNewLine,
        ChunkSizeNewLine_2,
        ChunkSizeNewLine_3,
        ChunkTrailerName,
        ChunkTrailerValue,
        ChunkTrailerNewLine,
        ChunkDataNewLine_1,
        ChunkDataNewLine_2,
        ChunkData,
    } state;
    size_t contentSize;       // body bytes still expected (Content-Length mode)
    std::string chunkSizeStr; // hex digits of the chunk size being read
    size_t chunkSize;         // bytes still expected in the current chunk
    bool chunked;             // true once "Transfer-Encoding: chunked" was seen
};
// Plain data holder describing one HTTP response.
struct HttpResponseBase {
    // One "name: value" header line.
    struct HeaderItem
    {
        std::string name;
        std::string value;
    };

    // Starts as an HTTP/1.1 response with status code 404 and no keep-alive.
    HttpResponseBase()
        : versionMajor(1), versionMinor(1), keepAlive(false), statusCode(404)
    {}

    int versionMajor;                // X in "HTTP/X.Y"
    int versionMinor;                // Y in "HTTP/X.Y"
    std::vector<HeaderItem> headers; // headers in insertion order
    std::vector<char> content;       // message body bytes
    bool keepAlive;                  // whether the connection should stay open
    unsigned int statusCode;         // numeric status, e.g. 200
    std::string status;              // reason phrase, e.g. "OK"

    // Renders the response as text: status line, the stored headers, an
    // optional "Connection: keep-alive" line, a Content-Length line computed
    // from the body size, a blank line and the body. Lines end with "\n".
    std::string inspect() const
    {
        std::ostringstream out;

        out << "HTTP/" << versionMajor << "." << versionMinor
            << " " << statusCode << " " << status << "\n";

        for (size_t i = 0; i < headers.size(); ++i)
        {
            const HeaderItem &header = headers[i];
            out << header.name << ": " << header.value << "\n";
        }

        if (keepAlive)
        {
            out << "Connection: keep-alive\n";
        }
        out << "Content-Length: " << content.size() << "\n";
        out << "\n";
        out << std::string(content.begin(), content.end()) << "\n";

        return out.str();
    }
};
// Incremental parser that turns a byte stream into an HttpResponseBase.
//
// Feed successive buffers to parse(). It returns ParsingIncompleted until the
// whole message has been seen, ParsingCompleted once it has, or ParsingError
// on malformed input. The parser keeps its state between calls and never
// resets it, so use a fresh parser and a fresh response object per message.
//
// The body length comes from Content-Length or "Transfer-Encoding: chunked"
// (recognised only when the value is exactly "chunked", case-insensitive;
// chunked wins if both are present). A response carrying neither is reported
// complete at the end of its headers with an empty body.
class HttpResponseParser
{
public:
    HttpResponseParser()
        : state(ResponseStatusStart),
          contentSize(0),
          chunkSize(0),
          chunked(false)
    {
    }

    enum ParseResult {
        ParsingCompleted,
        ParsingIncompleted,
        ParsingError
    };

    // Consumes the bytes in [begin, end) and updates resp accordingly.
    ParseResult parse(HttpResponseBase &resp, const char *begin, const char *end)
    {
        return consume(resp, begin, end);
    }

private:
    // Predicate for std::find_if: true for the "Connection" header.
    static bool checkIfConnection(const HttpResponseBase::HeaderItem &item)
    {
        return StrCaseCmp(item.name.c_str(), "Connection") == 0;
    }

    // Caps the speculative reserve() made from a peer-supplied length so a
    // bogus header cannot force a huge allocation before any data arrives.
    static size_t reserveHint(size_t wanted)
    {
        const size_t limit = 64 * 1024;
        return wanted < limit ? wanted : limit;
    }

    // Appends one decimal digit to a version number. Returns false, leaving
    // value untouched, once the number would exceed 999; this keeps the
    // accumulation free of signed overflow on hostile input.
    static bool appendVersionDigit(int &value, char digit)
    {
        const int limit = 999;
        const int next = value * 10 + (digit - '0');
        if (next > limit)
        {
            return false;
        }
        value = next;
        return true;
    }

    // Parses a Content-Length value: optional surrounding spaces/tabs around
    // one or more decimal digits. Returns false for anything else (sign,
    // empty value, trailing junk) or if the number does not fit in size_t.
    static bool parseContentLength(const std::string &text, size_t &out)
    {
        size_t first = 0;
        size_t last = text.size();
        while (first < last && (text[first] == ' ' || text[first] == '\t'))
        {
            ++first;
        }
        while (last > first && (text[last - 1] == ' ' || text[last - 1] == '\t'))
        {
            --last;
        }
        if (first == last)
        {
            return false;
        }

        const size_t maxValue = static_cast<size_t>(-1);
        size_t value = 0;
        for (size_t i = first; i < last; ++i)
        {
            const char c = text[i];
            if (c < '0' || c > '9')
            {
                return false;
            }
            const size_t digit = static_cast<size_t>(c - '0');
            if (value > (maxValue - digit) / 10)
            {
                return false; // would overflow
            }
            value = value * 10 + digit;
        }
        out = value;
        return true;
    }

    // Value of a hexadecimal digit, or -1 if c is not one.
    static int hexValue(char c)
    {
        if (c >= '0' && c <= '9') return c - '0';
        if (c >= 'a' && c <= 'f') return c - 'a' + 10;
        if (c >= 'A' && c <= 'F') return c - 'A' + 10;
        return -1;
    }

    // Parses a non-empty string of hex digits into out. Returns false if the
    // string is empty, has a non-hex character or does not fit in size_t.
    static bool parseChunkSize(const std::string &text, size_t &out)
    {
        if (text.empty())
        {
            return false;
        }
        const size_t maxValue = static_cast<size_t>(-1);
        size_t value = 0;
        for (size_t i = 0; i < text.size(); ++i)
        {
            const int digit = hexValue(text[i]);
            if (digit < 0 || value > (maxValue >> 4))
            {
                return false;
            }
            value = (value << 4) | static_cast<size_t>(digit);
        }
        out = value;
        return true;
    }

    // The state machine: handles one byte per loop iteration.
    ParseResult consume(HttpResponseBase &resp, const char *begin, const char *end)
    {
        while (begin != end)
        {
            const char input = *begin++;
            switch (state)
            {
            // ---- status line: HTTP/x.y SP code SP reason CRLF ----
            case ResponseStatusStart:
                if (input != 'H')
                {
                    return ParsingError;
                }
                state = ResponseHttpVersion_ht;
                break;
            case ResponseHttpVersion_ht:
                if (input != 'T')
                {
                    return ParsingError;
                }
                state = ResponseHttpVersion_htt;
                break;
            case ResponseHttpVersion_htt:
                if (input != 'T')
                {
                    return ParsingError;
                }
                state = ResponseHttpVersion_http;
                break;
            case ResponseHttpVersion_http:
                if (input != 'P')
                {
                    return ParsingError;
                }
                state = ResponseHttpVersion_slash;
                break;
            case ResponseHttpVersion_slash:
                if (input != '/')
                {
                    return ParsingError;
                }
                resp.versionMajor = 0;
                resp.versionMinor = 0;
                state = ResponseHttpVersion_majorStart;
                break;
            case ResponseHttpVersion_majorStart:
                if (!isDigit(input))
                {
                    return ParsingError;
                }
                resp.versionMajor = input - '0';
                state = ResponseHttpVersion_major;
                break;
            case ResponseHttpVersion_major:
                if (input == '.')
                {
                    state = ResponseHttpVersion_minorStart;
                }
                else if (!isDigit(input) || !appendVersionDigit(resp.versionMajor, input))
                {
                    return ParsingError;
                }
                break;
            case ResponseHttpVersion_minorStart:
                if (!isDigit(input))
                {
                    return ParsingError;
                }
                resp.versionMinor = input - '0';
                state = ResponseHttpVersion_minor;
                break;
            case ResponseHttpVersion_minor:
                if (input == ' ')
                {
                    state = ResponseHttpVersion_statusCodeStart;
                    resp.statusCode = 0;
                }
                else if (!isDigit(input) || !appendVersionDigit(resp.versionMinor, input))
                {
                    return ParsingError;
                }
                break;
            case ResponseHttpVersion_statusCodeStart:
                if (!isDigit(input))
                {
                    return ParsingError;
                }
                resp.statusCode = input - '0';
                state = ResponseHttpVersion_statusCode;
                break;
            case ResponseHttpVersion_statusCode:
                if (isDigit(input))
                {
                    resp.statusCode = resp.statusCode * 10 + (input - '0');
                    // Reject as soon as the code leaves the valid range so an
                    // overlong number can never wrap back into it.
                    if (resp.statusCode > 999)
                    {
                        return ParsingError;
                    }
                }
                else if (resp.statusCode < 100 || input != ' ')
                {
                    return ParsingError;
                }
                else
                {
                    state = ResponseHttpVersion_statusTextStart;
                }
                break;
            case ResponseHttpVersion_statusTextStart:
                if (input == '\r')
                {
                    // Empty reason phrase: the status line ends here.
                    state = ResponseHttpVersion_newLine;
                }
                else if (isChar(input))
                {
                    resp.status += input;
                    state = ResponseHttpVersion_statusText;
                }
                else
                {
                    return ParsingError;
                }
                break;
            case ResponseHttpVersion_statusText:
                if (input == '\r')
                {
                    state = ResponseHttpVersion_newLine;
                }
                else if (isChar(input))
                {
                    resp.status += input;
                }
                else
                {
                    return ParsingError;
                }
                break;
            case ResponseHttpVersion_newLine:
                if (input != '\n')
                {
                    return ParsingError;
                }
                state = HeaderLineStart;
                break;

            // ---- header section ----
            case HeaderLineStart:
                if (input == '\r')
                {
                    state = ExpectingNewline_3; // blank line: end of headers
                }
                else if (!resp.headers.empty() && (input == ' ' || input == '\t'))
                {
                    state = HeaderLws; // continuation of the previous header
                }
                else if (!isChar(input) || isControl(input) || isSpecial(input))
                {
                    return ParsingError;
                }
                else
                {
                    resp.headers.push_back(HttpResponseBase::HeaderItem());
                    resp.headers.back().name.reserve(16);
                    resp.headers.back().value.reserve(16);
                    resp.headers.back().name.push_back(input);
                    state = HeaderName;
                }
                break;
            case HeaderLws:
                if (input == '\r')
                {
                    state = ExpectingNewline_2;
                }
                else if (input == ' ' || input == '\t')
                {
                    // skip leading whitespace of the continuation line
                }
                else if (isControl(input))
                {
                    return ParsingError;
                }
                else
                {
                    state = HeaderValue;
                    resp.headers.back().value.push_back(input);
                }
                break;
            case HeaderName:
                if (input == ':')
                {
                    state = SpaceBeforeHeaderValue;
                }
                else if (!isChar(input) || isControl(input) || isSpecial(input))
                {
                    return ParsingError;
                }
                else
                {
                    resp.headers.back().name.push_back(input);
                }
                break;
            case SpaceBeforeHeaderValue:
                state = HeaderValue;
                if (input == ' ' || input == '\t')
                {
                    break;
                }
                // The whitespace after the colon is optional, so this byte is
                // already part of the value (or ends it): let HeaderValue
                // deal with it.
                // fall through
            case HeaderValue:
                if (input == '\r')
                {
                    HttpResponseBase::HeaderItem &h = resp.headers.back();
                    if (StrCaseCmp(h.name.c_str(), "Content-Length") == 0)
                    {
                        if (!parseContentLength(h.value, contentSize))
                        {
                            return ParsingError;
                        }
                        resp.content.reserve(reserveHint(contentSize));
                    }
                    else if (StrCaseCmp(h.name.c_str(), "Transfer-Encoding") == 0)
                    {
                        if (StrCaseCmp(h.value.c_str(), "chunked") == 0)
                            chunked = true;
                    }
                    state = ExpectingNewline_2;
                }
                else if (isControl(input))
                {
                    return ParsingError;
                }
                else
                {
                    resp.headers.back().value.push_back(input);
                }
                break;
            case ExpectingNewline_2:
                if (input != '\n')
                {
                    return ParsingError;
                }
                state = HeaderLineStart;
                break;
            case ExpectingNewline_3: {
                // The blank line must be a full CRLF whatever follows it.
                if (input != '\n')
                {
                    return ParsingError;
                }

                // An explicit Connection header decides keep-alive; without
                // one, only HTTP/1.1 and major versions above 1 default to it.
                std::vector<HttpResponseBase::HeaderItem>::iterator it = std::find_if(resp.headers.begin(),
                    resp.headers.end(),
                    checkIfConnection);
                if (it != resp.headers.end())
                {
                    resp.keepAlive = (StrCaseCmp(it->value.c_str(), "Keep-Alive") == 0);
                }
                else if (resp.versionMajor > 1 || (resp.versionMajor == 1 && resp.versionMinor == 1))
                {
                    resp.keepAlive = true;
                }

                if (chunked)
                {
                    state = ChunkSize;
                }
                else if (contentSize == 0)
                {
                    return ParsingCompleted;
                }
                else
                {
                    state = Post;
                }
                break;
            }

            // ---- body with Content-Length ----
            case Post:
                --contentSize;
                resp.content.push_back(input);
                if (contentSize == 0)
                {
                    return ParsingCompleted;
                }
                break;

            // ---- chunked body ----
            case ChunkSize:
                if (hexValue(input) >= 0)
                {
                    chunkSizeStr.push_back(input);
                }
                else if (input == ';')
                {
                    state = ChunkExtensionName;
                }
                else if (input == '\r')
                {
                    state = ChunkSizeNewLine;
                }
                else
                {
                    return ParsingError;
                }
                break;
            case ChunkExtensionName:
                if (isAlnum(input) || input == ' ')
                {
                    // extensions are skipped, not stored
                }
                else if (input == '=')
                {
                    state = ChunkExtensionValue;
                }
                else if (input == '\r')
                {
                    state = ChunkSizeNewLine;
                }
                else
                {
                    return ParsingError;
                }
                break;
            case ChunkExtensionValue:
                if (isAlnum(input) || input == ' ')
                {
                    // skip
                }
                else if (input == '\r')
                {
                    state = ChunkSizeNewLine;
                }
                else
                {
                    return ParsingError;
                }
                break;
            case ChunkSizeNewLine:
                if (input != '\n' || !parseChunkSize(chunkSizeStr, chunkSize))
                {
                    return ParsingError;
                }
                chunkSizeStr.clear();
                if (chunkSize == 0)
                {
                    state = ChunkSizeNewLine_2; // last chunk: trailers or final CRLF
                }
                else
                {
                    resp.content.reserve(resp.content.size() + reserveHint(chunkSize));
                    state = ChunkData;
                }
                break;
            case ChunkSizeNewLine_2:
                if (input == '\r')
                {
                    state = ChunkSizeNewLine_3;
                }
                else if (isChar(input) && !isControl(input) && !isSpecial(input))
                {
                    state = ChunkTrailerName;
                }
                else
                {
                    return ParsingError;
                }
                break;
            case ChunkSizeNewLine_3:
                if (input != '\n')
                {
                    return ParsingError;
                }
                return ParsingCompleted;
            case ChunkTrailerName:
                // Trailers follow the same character rules as header names
                // and are skipped, not stored.
                if (input == ':')
                {
                    state = ChunkTrailerValue;
                }
                else if (!isChar(input) || isControl(input) || isSpecial(input))
                {
                    return ParsingError;
                }
                break;
            case ChunkTrailerValue:
                if (input == '\r')
                {
                    state = ChunkTrailerNewLine;
                }
                else if (isControl(input))
                {
                    return ParsingError;
                }
                break;
            case ChunkTrailerNewLine:
                if (input != '\n')
                {
                    return ParsingError;
                }
                state = ChunkSizeNewLine_2; // another trailer or the final CRLF
                break;
            case ChunkData:
                resp.content.push_back(input);
                if (--chunkSize == 0)
                {
                    state = ChunkDataNewLine_1;
                }
                break;
            case ChunkDataNewLine_1:
                if (input != '\r')
                {
                    return ParsingError;
                }
                state = ChunkDataNewLine_2;
                break;
            case ChunkDataNewLine_2:
                if (input != '\n')
                {
                    return ParsingError;
                }
                state = ChunkSize;
                break;
            default:
                return ParsingError;
            }
        }
        return ParsingIncompleted;
    }

    // Check if a byte is an HTTP character (7-bit ASCII).
    static bool isChar(int c)
    {
        return c >= 0 && c <= 127;
    }

    // Check if a byte is an HTTP control character.
    static bool isControl(int c)
    {
        return (c >= 0 && c <= 31) || (c == 127);
    }

    // Check if a byte is defined as an HTTP special (separator) character.
    static bool isSpecial(int c)
    {
        switch (c)
        {
        case '(': case ')': case '<': case '>': case '@':
        case ',': case ';': case ':': case '\\': case '"':
        case '/': case '[': case ']': case '?': case '=':
        case '{': case '}': case ' ': case '\t':
            return true;
        default:
            return false;
        }
    }

    // Check if a byte is a decimal digit.
    static bool isDigit(int c)
    {
        return c >= '0' && c <= '9';
    }

    // Check if a byte is an ASCII letter or digit. Written out by hand so it
    // is locale-independent and well defined for negative char values.
    static bool isAlnum(int c)
    {
        return isDigit(c) || (c >= 'a' && c <= 'z') || (c >= 'A' && c <= 'Z');
    }

    // The current state of the parser.
    enum State
    {
        ResponseStatusStart,
        ResponseHttpVersion_ht,
        ResponseHttpVersion_htt,
        ResponseHttpVersion_http,
        ResponseHttpVersion_slash,
        ResponseHttpVersion_majorStart,
        ResponseHttpVersion_major,
        ResponseHttpVersion_minorStart,
        ResponseHttpVersion_minor,
        ResponseHttpVersion_statusCodeStart,
        ResponseHttpVersion_statusCode,
        ResponseHttpVersion_statusTextStart,
        ResponseHttpVersion_statusText,
        ResponseHttpVersion_newLine,
        HeaderLineStart,
        HeaderLws,
        HeaderName,
        SpaceBeforeHeaderValue,
        HeaderValue,
        ExpectingNewline_2,
        ExpectingNewline_3,
        Post,
        ChunkSize,
        ChunkExtensionName,
        ChunkExtensionValue,
        ChunkSizeNewLine,
        ChunkSizeNewLine_2,
        ChunkSizeNewLine_3,
        ChunkTrailerName,
        ChunkTrailerValue,
        ChunkTrailerNewLine,
        ChunkDataNewLine_1,
        ChunkDataNewLine_2,
        ChunkData,
    } state;
    size_t contentSize;       // body bytes still expected (Content-Length mode)
    std::string chunkSizeStr; // hex digits of the chunk size being read
    size_t chunkSize;         // bytes still expected in the current chunk
    bool chunked;             // true once "Transfer-Encoding: chunked" was seen
};
// Splits a URL of the form
//     scheme://[username[:password]@]hostname[:port][/path][?query][#fragment]
// into its components. The components are stored as found; no percent-decoding
// is performed. IPv6 literals ("[::1]") are not supported and make the URL
// invalid. After a failed parse every component is empty.
class UrlParser
{
public:
    // Creates a parser holding no URL; isValid() is false.
    UrlParser()
        : valid(false)
    {
    }

    // Parses url immediately; check isValid() for the outcome.
    explicit UrlParser(const std::string &url)
        : valid(true)
    {
        parse(url);
    }

    // Discards any previous result, parses str and returns isValid().
    bool parse(const std::string &str)
    {
        url = Url();
        parse_(str);
        return isValid();
    }

    bool isValid() const
    {
        return valid;
    }

    std::string scheme() const
    {
        return url.scheme;
    }

    std::string username() const
    {
        return url.username;
    }

    std::string password() const
    {
        return url.password;
    }

    std::string hostname() const
    {
        return url.hostname;
    }

    // The port exactly as written in the URL; empty if none was given.
    std::string port() const
    {
        return url.port;
    }

    // Always starts with '/'; "/" when the URL has no path.
    std::string path() const
    {
        return url.path;
    }

    // Text between '?' and '#', without the leading '?'.
    std::string query() const
    {
        return url.query;
    }

    // Text after '#'.
    std::string fragment() const
    {
        return url.fragment;
    }

    // The explicit port if the URL has one; otherwise 443 when the scheme is
    // exactly "https" and 80 for anything else.
    uint16_t httpPort() const
    {
        const uint16_t defaultHttpPort = 80;
        const uint16_t defaultHttpsPort = 443;
        if (!url.port.empty())
        {
            return url.integerPort;
        }
        return scheme() == "https" ? defaultHttpsPort : defaultHttpPort;
    }

private:
    // ASCII-only character tests. Written out by hand so they are
    // locale-independent and well defined for negative char values.
    static bool isDigit(char ch)
    {
        return ch >= '0' && ch <= '9';
    }

    static bool isAlnum(char ch)
    {
        return isDigit(ch) || (ch >= 'a' && ch <= 'z') || (ch >= 'A' && ch <= 'Z');
    }

    // Letters, digits and the punctuation "-._~".
    bool isUnreserved(char ch) const
    {
        if (isAlnum(ch))
            return true;
        switch (ch)
        {
        case '-':
        case '.':
        case '_':
        case '~':
            return true;
        }
        return false;
    }

    // Marks the URL as invalid and clears everything parsed so far.
    void invalidate()
    {
        valid = false;
        url = Url();
    }

    // Stores digits (decimal digits only, possibly empty) as the port. A value
    // above 65535 cannot be a port and invalidates the URL.
    void assignPort(std::string &digits)
    {
        unsigned long value = 0;
        for (size_t i = 0; i < digits.size(); ++i)
        {
            value = value * 10 + static_cast<unsigned long>(digits[i] - '0');
            if (value > 65535UL)
            {
                invalidate();
                return;
            }
        }
        std::swap(url.port, digits);
        url.integerPort = static_cast<uint16_t>(value);
    }

    // The actual parser: a single pass over str, one character per step.
    void parse_(const std::string &str)
    {
        enum {
            Scheme,
            SlashAfterScheme1,
            SlashAfterScheme2,
            UsernameOrHostname,
            Password,
            Hostname,
            PortOrPassword,
            Port,
            Path,
            Query,
            Fragment
        } state = Scheme;

        // Until an '@', '/' or the end is seen, "a:b" may be either
        // "user:password" or "host:port"; both readings are buffered here.
        std::string usernameOrHostname;
        std::string portOrPassword;

        valid = true;
        url.path = "/";
        url.integerPort = 0;

        for (size_t i = 0; i < str.size() && valid; ++i)
        {
            const char ch = str[i];
            switch (state)
            {
            case Scheme:
                if (isAlnum(ch) || ch == '+' || ch == '-' || ch == '.')
                {
                    url.scheme += ch;
                }
                else if (ch == ':')
                {
                    state = SlashAfterScheme1;
                }
                else
                {
                    invalidate();
                }
                break;
            case SlashAfterScheme1:
                if (ch == '/')
                {
                    state = SlashAfterScheme2;
                }
                else if (isAlnum(ch))
                {
                    usernameOrHostname = ch;
                    state = UsernameOrHostname;
                }
                else
                {
                    invalidate();
                }
                break;
            case SlashAfterScheme2:
                if (ch == '/')
                {
                    state = UsernameOrHostname;
                }
                else
                {
                    invalidate();
                }
                break;
            case UsernameOrHostname:
                if (isUnreserved(ch) || ch == '%')
                {
                    usernameOrHostname += ch;
                }
                else if (ch == ':')
                {
                    state = PortOrPassword;
                }
                else if (ch == '@')
                {
                    state = Hostname;
                    std::swap(url.username, usernameOrHostname);
                }
                else if (ch == '/')
                {
                    state = Path;
                    std::swap(url.hostname, usernameOrHostname);
                }
                else
                {
                    invalidate();
                }
                break;
            case Password:
                if (isAlnum(ch) || ch == '%')
                {
                    url.password += ch;
                }
                else if (ch == '@')
                {
                    state = Hostname;
                }
                else
                {
                    invalidate();
                }
                break;
            case Hostname:
                // A '[' (IPv6 literal) is not supported and ends up in the
                // final else branch like any other unexpected character.
                if (isUnreserved(ch) || ch == '%')
                {
                    url.hostname += ch;
                }
                else if (ch == ':')
                {
                    state = Port;
                }
                else if (ch == '/')
                {
                    state = Path;
                }
                else
                {
                    invalidate();
                }
                break;
            case PortOrPassword:
                if (isDigit(ch))
                {
                    portOrPassword += ch;
                }
                else if (ch == '/')
                {
                    // It was "host:port" after all.
                    std::swap(url.hostname, usernameOrHostname);
                    assignPort(portOrPassword);
                    state = Path;
                }
                else if (ch == '@')
                {
                    // It was "user:password" with an all-digit (or empty)
                    // password.
                    std::swap(url.username, usernameOrHostname);
                    std::swap(url.password, portOrPassword);
                    state = Hostname;
                }
                else if (isAlnum(ch) || ch == '%')
                {
                    // A non-digit settles it: this is a password.
                    std::swap(url.username, usernameOrHostname);
                    std::swap(url.password, portOrPassword);
                    url.password += ch;
                    state = Password;
                }
                else
                {
                    invalidate();
                }
                break;
            case Port:
                if (isDigit(ch))
                {
                    portOrPassword += ch;
                }
                else if (ch == '/')
                {
                    assignPort(portOrPassword);
                    state = Path;
                }
                else
                {
                    invalidate();
                }
                break;
            case Path:
                if (ch == '#')
                {
                    state = Fragment;
                }
                else if (ch == '?')
                {
                    state = Query;
                }
                else
                {
                    url.path += ch;
                }
                break;
            case Query:
                if (ch == '#')
                {
                    state = Fragment;
                }
                else
                {
                    // Everything up to '#' is query data, including further
                    // '?' characters.
                    url.query += ch;
                }
                break;
            case Fragment:
                url.fragment += ch;
                break;
            }
        }

        if (!valid)
        {
            return;
        }

        // The input may end right after the port ("http://host:8080"); the
        // buffered digits still have to be stored.
        if (state == PortOrPassword || state == Port)
        {
            assignPort(portOrPassword);
            if (!valid)
            {
                return;
            }
        }

        // Likewise for a host name that was still buffered when input ended.
        if (!usernameOrHostname.empty())
            url.hostname = usernameOrHostname;
    }

    bool valid;

    // The parsed components. integerPort is the numeric form of port and is 0
    // when no port was given.
    struct Url
    {
        Url() : integerPort(0)
        {}
        std::string scheme;
        std::string username;
        std::string password;
        std::string hostname;
        std::string port;
        std::string path;
        std::string query;
        std::string fragment;
        uint16_t integerPort;
    } url;
};
}
#endif // !___NICE_HTTPPARSER____
马建仓 AI 助手
尝试更多
代码解读
代码找茬
代码优化
1
https://gitee.com/nicehero/nicenet.git
git@gitee.com:nicehero/nicenet.git
nicehero
nicenet
nicenet
master

搜索帮助

344bd9b3 5694891 D2dac590 5694891