src/rfc/detail/rules.cpp

95.8% Lines (159/166) 100.0% Functions (10/10)
src/rfc/detail/rules.cpp
Line TLA Hits Source Code
1 //
2 // Copyright (c) 2021 Vinnie Falco ([email protected])
3 //
4 // Distributed under the Boost Software License, Version 1.0. (See accompanying
5 // file LICENSE_1_0.txt or copy at http://www.boost.org/LICENSE_1_0.txt)
6 //
7 // Official repository: https://github.com/cppalliance/http
8 //
9
10 #include "src/rfc/detail/rules.hpp"
11
12 #include <boost/http/error.hpp>
13 #include <boost/http/detail/config.hpp>
14 #include <boost/http/rfc/token_rule.hpp>
15
16 #include <boost/core/detail/string_view.hpp>
17 #include <boost/url/grammar/delim_rule.hpp>
18 #include <boost/url/grammar/digit_chars.hpp>
19 #include <boost/url/grammar/error.hpp>
20 #include <boost/url/grammar/hexdig_chars.hpp>
21 #include <boost/url/grammar/lut_chars.hpp>
22 #include <boost/url/grammar/parse.hpp>
23 #include <boost/url/grammar/tuple_rule.hpp>
24
25 #include "src/rfc/detail/rules.hpp"
26
27 namespace boost {
28 namespace http {
29 namespace detail {
30
31 auto
32 26077 crlf_rule_t::
33 parse(
34 char const*& it,
35 char const* end) const noexcept ->
36 system::result<value_type>
37 {
38 26077 if(it == end)
39 4509 return grammar::error::need_more;
40 21568 if(*it != '\r')
41 29 return grammar::error::mismatch;
42 21539 ++it;
43 21539 if(it == end)
44 645 return grammar::error::need_more;
45 20894 if(*it != '\n')
46 51 return grammar::error::mismatch;
47 20843 ++it;
48 20843 return {};
49 }
50
51 //------------------------------------------------
52
53 auto
54 21683 version_rule_t::
55 parse(
56 char const*& it,
57 char const* end) const noexcept ->
58 system::result<value_type>
59 {
60 21683 value_type v = 0;
61 21683 if(it == end)
62 {
63 // expected "HTTP/"
64 1141 BOOST_HTTP_RETURN_EC(
65 grammar::error::need_more);
66 }
67 20542 if(end - it >= 5)
68 {
69 17528 if(std::memcmp(
70 it, "HTTP/", 5) != 0)
71 {
72 BOOST_HTTP_RETURN_EC(
73 grammar::error::mismatch);
74 }
75 17528 it += 5;
76 }
77 20542 if(it == end)
78 {
79 // expected DIGIT
80 683 BOOST_HTTP_RETURN_EC(
81 grammar::error::need_more);
82 }
83 19859 if(! grammar::digit_chars(*it))
84 {
85 // expected DIGIT
86 3014 BOOST_HTTP_RETURN_EC(
87 grammar::error::need_more);
88 }
89 16845 v = 10 * (*it++ - '0');
90 16845 if(it == end)
91 {
92 // expected "."
93 817 BOOST_HTTP_RETURN_EC(
94 grammar::error::need_more);
95 }
96 16028 if(*it != '.')
97 {
98 // expected "."
99 BOOST_HTTP_RETURN_EC(
100 grammar::error::need_more);
101 }
102 16028 ++it;
103 16028 if(it == end)
104 {
105 // expected DIGIT
106 663 BOOST_HTTP_RETURN_EC(
107 grammar::error::need_more);
108 }
109 15365 if(! grammar::digit_chars(*it))
110 {
111 // expected DIGIT
112 BOOST_HTTP_RETURN_EC(
113 grammar::error::need_more);
114 }
115 15365 v += *it++ - '0';
116 15365 return v;
117 }
118
119 //------------------------------------------------
120
121 auto
122 5105 status_code_rule_t::
123 parse(
124 char const*& it,
125 char const* end) const noexcept ->
126 system::result<value_type>
127 {
128 auto const dig =
129 11983 [](char c) -> int
130 {
131 11983 unsigned char uc(c - '0');
132 11983 if(uc > 9)
133 return -1;
134 11983 return uc;
135 };
136
137 5105 if(it == end)
138 {
139 // end
140 562 BOOST_HTTP_RETURN_EC(
141 grammar::error::need_more);
142 }
143 4543 auto it0 = it;
144 4543 int v = dig(*it);
145 4543 if(v == -1)
146 {
147 // expected DIGIT
148 BOOST_HTTP_RETURN_EC(
149 grammar::error::mismatch);
150 }
151 4543 value_type t;
152 4543 t.v = 100 * v;
153 4543 ++it;
154 4543 if(it == end)
155 {
156 // end
157 552 BOOST_HTTP_RETURN_EC(
158 grammar::error::need_more);
159 }
160 3991 v = dig(*it);
161 3991 if(v == -1)
162 {
163 // expected DIGIT
164 BOOST_HTTP_RETURN_EC(
165 grammar::error::mismatch);
166 }
167 3991 t.v = t.v + (10 * v);
168 3991 ++it;
169 3991 if(it == end)
170 {
171 // end
172 542 BOOST_HTTP_RETURN_EC(
173 grammar::error::need_more);
174 }
175 3449 v = dig(*it);
176 3449 if(v == -1)
177 {
178 // expected DIGIT
179 BOOST_HTTP_RETURN_EC(
180 grammar::error::need_more);
181 }
182 3449 t.v = t.v + v;
183 3449 ++it;
184
185 3449 t.s = core::string_view(it0, it - it0);
186 3449 t.st = int_to_status(t.v);
187 3449 return t;
188 }
189
190 //------------------------------------------------
191
192 auto
193 2917 reason_phrase_rule_t::
194 parse(
195 char const*& it,
196 char const* end) const noexcept ->
197 system::result<value_type>
198 {
199 2917 auto begin = it;
200 2917 it = grammar::find_if_not(it, end, ws_vchars);
201 2917 return core::string_view(begin, it);
202 }
203
204 //------------------------------------------------
205
206 auto
207 21201 field_name_rule_t::
208 parse(
209 char const*& it,
210 char const* end) const noexcept ->
211 system::result<value_type>
212 {
213 21201 if( it == end )
214 1 BOOST_HTTP_RETURN_EC(
215 grammar::error::need_more);
216
217 21200 value_type v;
218
219 21200 auto begin = it;
220 21200 auto rv = grammar::parse(
221 it, end, token_rule);
222 21200 if( rv.has_error() || (it != end) )
223 {
224 14501 if( it != begin )
225 {
226 14435 v = core::string_view(begin, it - begin);
227 14435 return v;
228 }
229 66 return error::bad_field_name;
230 }
231
232 6699 v = core::string_view(begin, end - begin);
233 6699 return v;
234 }
235
236 auto
237 14704 field_value_rule_t::
238 parse(
239 char const*& it,
240 char const* end) const noexcept ->
241 system::result<value_type>
242 {
243 14704 value_type v;
244 14704 if( it == end )
245 {
246 511 v.value = core::string_view(it, 0);
247 511 return v;
248 }
249
250 // field-line = field-name ":" OWS field-value OWS
251 // field-value = *field-content
252 // field-content = field-vchar
253 // [ 1*( SP / HTAB / field-vchar ) field-vchar ]
254 // field-vchar = VCHAR / obs-text
255 // obs-text = %x80-FF
256 // VCHAR = %x21-7E
257 // ; visible (printing) characters
258
259 62618 auto is_field_vchar = [](unsigned char ch)
260 {
261 62618 return (ch >= 0x21 && ch <= 0x7e) || ch >= 0x80;
262 };
263
264 14193 char const* s0 = nullptr;
265 14193 char const* s1 = nullptr;
266
267 14193 bool has_crlf = false;
268 14193 bool has_obs_fold = false;
269
270 93612 while( it < end )
271 {
272 90964 auto ch = *it;
273 90964 if( ws(ch) )
274 {
275 16105 ++it;
276 16105 continue;
277 }
278
279 74859 if( ch == '\r' )
280 {
281 // too short to know if we have a potential obs-fold
282 // occurrence
283 12241 if( end - it < 2 )
284 454 BOOST_HTTP_RETURN_EC(
285 grammar::error::need_more);
286
287 11787 if( it[1] != '\n' )
288 53 goto done;
289
290 11734 if( end - it < 3 )
291 416 BOOST_HTTP_RETURN_EC(
292 grammar::error::need_more);
293
294 11318 if(! ws(it[2]) )
295 {
296 10588 has_crlf = true;
297 10588 goto done;
298 }
299
300 730 has_obs_fold = true;
301 730 it = it + 3;
302 730 continue;
303 730 }
304
305 62618 if(! is_field_vchar(ch) )
306 {
307 34 goto done;
308 }
309
310 62584 if(! s0 )
311 13264 s0 = it;
312
313 62584 ++it;
314 62584 s1 = it;
315 }
316
317 2648 done:
318 // later routines wind up doing pointer
319 // subtraction using the .data() member
320 // of the value so we need a valid 0-len range
321 13323 if(! s0 )
322 {
323 765 s0 = it;
324 765 s1 = s0;
325 }
326
327 13323 v.value = core::string_view(s0, s1 - s0);
328 13323 v.has_crlf = has_crlf;
329 13323 v.has_obs_fold = has_obs_fold;
330 13323 return v;
331 }
332
333 auto
334 32015 field_rule_t::
335 parse(
336 char const*& it,
337 char const* end) const noexcept ->
338 system::result<value_type>
339 {
340 32015 if(it == end)
341 {
342 671 BOOST_HTTP_RETURN_EC(
343 grammar::error::need_more);
344 }
345 // check for leading CRLF
346 31344 if(it[0] == '\r')
347 {
348 10384 ++it;
349 10384 if(it == end)
350 {
351 367 BOOST_HTTP_RETURN_EC(
352 grammar::error::need_more);
353 }
354 10017 if(*it != '\n')
355 {
356 21 BOOST_HTTP_RETURN_EC(
357 grammar::error::mismatch);
358 }
359 // end of fields
360 9996 ++it;
361 9996 BOOST_HTTP_RETURN_EC(
362 grammar::error::end_of_range);
363 }
364
365 20960 value_type v;
366 auto rv = grammar::parse(
367 20960 it, end, grammar::tuple_rule(
368 field_name_rule,
369 20960 grammar::delim_rule(':'),
370 field_value_rule,
371 20960 crlf_rule));
372
373 20960 if( rv.has_error() )
374 10388 return rv.error();
375
376 10572 auto val = rv.value();
377 10572 v.name = std::get<0>(val);
378 10572 v.value = std::get<2>(val).value;
379 10572 v.has_obs_fold = std::get<2>(val).has_obs_fold;
380
381 10572 return v;
382 }
383
384 //------------------------------------------------
385
386 void
387 244 remove_obs_fold(
388 char* it,
389 char const* const end) noexcept
390 {
391 2262 while(it != end)
392 {
393 2236 if(*it != '\r')
394 {
395 1637 ++it;
396 1637 continue;
397 }
398 599 if(end - it < 3)
399 218 break;
400 381 BOOST_ASSERT(it[1] == '\n');
401 762 if( it[1] == '\n' &&
402 381 ws(it[2]))
403 {
404 378 it[0] = ' ';
405 378 it[1] = ' ';
406 378 it += 3;
407 }
408 else
409 {
410 3 ++it;
411 }
412 }
413 244 }
414
415 } // detail
416 } // http
417 } // boost
418