SNode.C
Loading...
Searching...
No Matches
Parser.cpp
Go to the documentation of this file.
1/*
2 * SNode.C - a slim toolkit for network communication
3 * Copyright (C) Volker Christian <me@vchrist.at>
4 * 2020, 2021, 2022, 2023, 2024, 2025
5 *
6 * This program is free software: you can redistribute it and/or modify
7 * it under the terms of the GNU Lesser General Public License as published
8 * by the Free Software Foundation, either version 3 of the License, or
9 * (at your option) any later version.
10 *
11 * This program is distributed in the hope that it will be useful,
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 * GNU Lesser General Public License for more details.
15 *
16 * You should have received a copy of the GNU Lesser General Public License
17 * along with this program. If not, see <http://www.gnu.org/licenses/>.
18 */
19
20#include "web/http/Parser.h"
21
22#include "core/socket/stream/SocketContext.h"
23#include "web/http/decoder/Chunked.h"
24#include "web/http/decoder/HTTP10Response.h"
25#include "web/http/decoder/Identity.h"
26
27#ifndef DOXYGEN_SHOULD_SKIP_THIS
28
29#include "web/http/http_utils.h"
30
31#include <tuple>
32#include <utility>
33
34#endif /* DOXYGEN_SHOULD_SKIP_THIS */
35
36namespace web::http {
37
38 // HTTP/1.0 and HTTP/1.1
39 const std::regex Parser::httpVersionRegex("^HTTP/([1])[.]([0-1])$");
40
41 Parser::Parser(core::socket::stream::SocketContext* socketContext, const enum Parser::HTTPCompliance& compliance)
42 : hTTPCompliance(compliance)
43 , socketContext(socketContext)
44 , headerDecoder(socketContext)
45 , trailerDecoder(socketContext) {
46 }
47
49 reset();
50 }
51
52 void Parser::reset() {
54 headers.clear();
55 content.clear();
56 httpMinor = 0;
57 httpMajor = 0;
58 line.clear();
59 contentLength = 0;
60 contentLengthRead = 0;
61
62 for (ContentDecoder* contentDecoder : decoderQueue) {
63 delete contentDecoder;
64 }
65 decoderQueue.clear();
66
67 trailerFieldsExpected.clear();
68 }
69
71 std::size_t ret = 0;
72 std::size_t consumed = 0;
73
74 do {
75 switch (parserState) {
76 case ParserState::BEGIN:
77 begin();
78 parserState = ParserState::FIRSTLINE;
79 [[fallthrough]];
80 case ParserState::FIRSTLINE:
81 ret = readStartLine();
82 break;
83 case ParserState::HEADER:
84 ret = readHeader();
85 break;
86 case ParserState::BODY:
87 ret = readContent();
88 break;
89 case ParserState::TRAILER:
90 ret = readTrailer();
91 break;
92 case ParserState::ERROR:
93 break;
94 }
95 consumed += ret;
96 } while (ret > 0 && parserState != ParserState::BEGIN && parserState != ParserState::ERROR);
97
98 return consumed;
99 }
100
102 std::size_t consumed = 0;
103 std::size_t ret = 0;
104
105 do {
106 char ch = 0;
107 ret = socketContext->readFromPeer(&ch, 1);
108
109 if (ret > 0) {
110 consumed += ret;
111 if (ch == '\r' || ch == '\n') {
112 if (ch == '\n') {
113 parseStartLine(line);
114 line.clear();
115 }
116 } else {
117 line += ch;
118 }
119 }
120 } while (ret > 0 && parserState == ParserState::FIRSTLINE);
121
122 return consumed;
123 }
124
126 const std::size_t consumed = headerDecoder.read();
127
128 if (headerDecoder.isError()) {
129 parseError(headerDecoder.getErrorCode(), headerDecoder.getErrorReason());
130 } else if (headerDecoder.isComplete()) {
131 headers = std::move(headerDecoder.getHeader());
133 }
134
135 return consumed;
136 }
137
139 if (headers.contains("Content-Length")) {
140 contentLength = std::stoul(headers["Content-Length"]);
141 transferEncoding = TransferEncoding::Identity;
142 decoderQueue.emplace_back(new web::http::decoder::Identity(socketContext, contentLength));
143 }
144 if (headers.contains("Transfer-Encoding")) {
145 const std::string& encoding = headers["Transfer-Encoding"];
146
147 if (web::http::ciContains(encoding, "chunked")) {
148 transferEncoding = TransferEncoding::Chunked;
149 decoderQueue.emplace_back(new web::http::decoder::Chunked(socketContext));
150
151 if (headers.contains("Trailer")) {
152 std::string trailers = headers["Trailer"];
153
154 while (!trailers.empty()) {
155 std::string trailerField;
156 std::tie(trailerField, trailers) = httputils::str_split(trailers, ',');
157 httputils::str_trimm(trailerField);
158 trailerFieldsExpected.insert(trailerField);
159 trailerField.clear();
160 }
161 trailerDecoder.setFieldsExpected(trailerFieldsExpected);
162 }
163 }
164 if (web::http::ciContains(encoding, "compressed")) {
165 // decoderQueue.emplace_back(new web::http::decoder::Compress(socketContext));
166 }
167 if (web::http::ciContains(encoding, "deflate")) {
168 // decoderQueue.emplace_back(new web::http::decoder::Deflate(socketContext));
169 }
170 if (web::http::ciContains(encoding, "gzip")) {
171 // decoderQueue.emplace_back(new web::http::decoder::GZip(socketContext));
172 }
173 }
174 if (decoderQueue.empty()) {
175 transferEncoding = TransferEncoding::HTTP10;
176 decoderQueue.emplace_back(new web::http::decoder::HTTP10Response(socketContext));
177 }
178
179 if (headers.contains("Content-Encoding")) {
180 const std::string& encoding = headers["Content-Encoding"];
181
182 if (web::http::ciContains(encoding, "compressed")) {
183 // decoderQueue.emplace_back(new web::http::decoder::Compress(socketContext));
184 }
185 if (web::http::ciContains(encoding, "deflate")) {
186 // decoderQueue.emplace_back(new web::http::decoder::Deflate(socketContext));
187 }
188 if (web::http::ciContains(encoding, "gzip")) {
189 // decoderQueue.emplace_back(new web::http::decoder::GZip(socketContext));
190 }
191 if (web::http::ciContains(encoding, "br")) {
192 // decoderQueue.emplace_back(new web::http::decoder::Br(socketContext));
193 }
194 }
195 }
196
198 ContentDecoder* contentDecoder = decoderQueue.front();
199
200 const std::size_t consumed = contentDecoder->read();
201
202 if (contentDecoder->isComplete()) {
203 contentDecoder = decoderQueue.back();
204
205 std::vector<char> chunk = contentDecoder->getContent();
206 content.insert(content.end(), chunk.begin(), chunk.end());
207
208 if (transferEncoding == TransferEncoding::Chunked && headers.contains("Trailer")) {
210 } else {
212 }
213 } else if (contentDecoder->isError()) {
214 parseError(400, "Wrong content encoding");
215 }
216
217 return consumed;
218 }
219
221 const std::size_t consumed = trailerDecoder.read();
222
223 if (trailerDecoder.isError()) {
224 parseError(trailerDecoder.getErrorCode(), trailerDecoder.getErrorReason());
225 } else if (trailerDecoder.isComplete()) {
226 web::http::CiStringMap<std::string>&& trailer = trailerDecoder.getHeader();
227 headers.insert(trailer.begin(), trailer.end());
229 }
230
231 return consumed;
232 }
233
234 enum Parser::HTTPCompliance operator|(const enum Parser::HTTPCompliance& c1, const enum Parser::HTTPCompliance& c2) {
235 return static_cast<enum Parser::HTTPCompliance>(static_cast<unsigned short>(c1) | static_cast<unsigned short>(c2));
236 }
237
238 enum Parser::HTTPCompliance operator&(const enum Parser::HTTPCompliance& c1, const enum Parser::HTTPCompliance& c2) {
239 return static_cast<enum Parser::HTTPCompliance>(static_cast<unsigned short>(c1) & static_cast<unsigned short>(c2));
240 }
241
242} // namespace web::http
ParserState parserState
Definition Parser.h:78
std::size_t parse()
Definition Parser.cpp:70
friend enum HTTPCompliance operator&(const enum HTTPCompliance &c1, const enum HTTPCompliance &c2)
Definition Parser.cpp:238
virtual ~Parser()
Definition Parser.cpp:48
static const std::regex httpVersionRegex
Definition Parser.h:82
friend enum HTTPCompliance operator|(const enum HTTPCompliance &c1, const enum HTTPCompliance &c2)
Definition Parser.cpp:234
std::size_t readContent()
Definition Parser.cpp:197
virtual void parsingFinished()=0
std::size_t readTrailer()
Definition Parser.cpp:220
std::size_t readStartLine()
Definition Parser.cpp:101
virtual void analyzeHeader()
Definition Parser.cpp:138
std::size_t readHeader()
Definition Parser.cpp:125