request_parser.cpp 5.9 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315
  1. //
  2. // request_parser.cpp
  3. // ~~~~~~~~~~~~~~~~~~
  4. //
  5. // Copyright (c) 2003-2019 Christopher M. Kohlhoff (chris at kohlhoff dot com)
  6. //
  7. // Distributed under the Boost Software License, Version 1.0. (See accompanying
  8. // file LICENSE_1_0.txt or copy at http://www.boost.org/LICENSE_1_0.txt)
  9. //
  10. #include "request_parser.hpp"
  11. #include "request.hpp"
  12. namespace http {
  13. namespace server {
  14. request_parser::request_parser()
  15. : state_(method_start)
  16. {
  17. }
  18. void request_parser::reset()
  19. {
  20. state_ = method_start;
  21. }
  22. request_parser::result_type request_parser::consume(request& req, char input)
  23. {
  24. switch (state_)
  25. {
  26. case method_start:
  27. if (!is_char(input) || is_ctl(input) || is_tspecial(input))
  28. {
  29. return bad;
  30. }
  31. else
  32. {
  33. state_ = method;
  34. req.method.push_back(input);
  35. return indeterminate;
  36. }
  37. case method:
  38. if (input == ' ')
  39. {
  40. state_ = uri;
  41. return indeterminate;
  42. }
  43. else if (!is_char(input) || is_ctl(input) || is_tspecial(input))
  44. {
  45. return bad;
  46. }
  47. else
  48. {
  49. req.method.push_back(input);
  50. return indeterminate;
  51. }
  52. case uri:
  53. if (input == ' ')
  54. {
  55. state_ = http_version_h;
  56. return indeterminate;
  57. }
  58. else if (is_ctl(input))
  59. {
  60. return bad;
  61. }
  62. else
  63. {
  64. req.uri.push_back(input);
  65. return indeterminate;
  66. }
  67. case http_version_h:
  68. if (input == 'H')
  69. {
  70. state_ = http_version_t_1;
  71. return indeterminate;
  72. }
  73. else
  74. {
  75. return bad;
  76. }
  77. case http_version_t_1:
  78. if (input == 'T')
  79. {
  80. state_ = http_version_t_2;
  81. return indeterminate;
  82. }
  83. else
  84. {
  85. return bad;
  86. }
  87. case http_version_t_2:
  88. if (input == 'T')
  89. {
  90. state_ = http_version_p;
  91. return indeterminate;
  92. }
  93. else
  94. {
  95. return bad;
  96. }
  97. case http_version_p:
  98. if (input == 'P')
  99. {
  100. state_ = http_version_slash;
  101. return indeterminate;
  102. }
  103. else
  104. {
  105. return bad;
  106. }
  107. case http_version_slash:
  108. if (input == '/')
  109. {
  110. req.http_version_major = 0;
  111. req.http_version_minor = 0;
  112. state_ = http_version_major_start;
  113. return indeterminate;
  114. }
  115. else
  116. {
  117. return bad;
  118. }
  119. case http_version_major_start:
  120. if (is_digit(input))
  121. {
  122. req.http_version_major = req.http_version_major * 10 + input - '0';
  123. state_ = http_version_major;
  124. return indeterminate;
  125. }
  126. else
  127. {
  128. return bad;
  129. }
  130. case http_version_major:
  131. if (input == '.')
  132. {
  133. state_ = http_version_minor_start;
  134. return indeterminate;
  135. }
  136. else if (is_digit(input))
  137. {
  138. req.http_version_major = req.http_version_major * 10 + input - '0';
  139. return indeterminate;
  140. }
  141. else
  142. {
  143. return bad;
  144. }
  145. case http_version_minor_start:
  146. if (is_digit(input))
  147. {
  148. req.http_version_minor = req.http_version_minor * 10 + input - '0';
  149. state_ = http_version_minor;
  150. return indeterminate;
  151. }
  152. else
  153. {
  154. return bad;
  155. }
  156. case http_version_minor:
  157. if (input == '\r')
  158. {
  159. state_ = expecting_newline_1;
  160. return indeterminate;
  161. }
  162. else if (is_digit(input))
  163. {
  164. req.http_version_minor = req.http_version_minor * 10 + input - '0';
  165. return indeterminate;
  166. }
  167. else
  168. {
  169. return bad;
  170. }
  171. case expecting_newline_1:
  172. if (input == '\n')
  173. {
  174. state_ = header_line_start;
  175. return indeterminate;
  176. }
  177. else
  178. {
  179. return bad;
  180. }
  181. case header_line_start:
  182. if (input == '\r')
  183. {
  184. state_ = expecting_newline_3;
  185. return indeterminate;
  186. }
  187. else if (!req.headers.empty() && (input == ' ' || input == '\t'))
  188. {
  189. state_ = header_lws;
  190. return indeterminate;
  191. }
  192. else if (!is_char(input) || is_ctl(input) || is_tspecial(input))
  193. {
  194. return bad;
  195. }
  196. else
  197. {
  198. req.headers.push_back(header());
  199. req.headers.back().name.push_back(input);
  200. state_ = header_name;
  201. return indeterminate;
  202. }
  203. case header_lws:
  204. if (input == '\r')
  205. {
  206. state_ = expecting_newline_2;
  207. return indeterminate;
  208. }
  209. else if (input == ' ' || input == '\t')
  210. {
  211. return indeterminate;
  212. }
  213. else if (is_ctl(input))
  214. {
  215. return bad;
  216. }
  217. else
  218. {
  219. state_ = header_value;
  220. req.headers.back().value.push_back(input);
  221. return indeterminate;
  222. }
  223. case header_name:
  224. if (input == ':')
  225. {
  226. state_ = space_before_header_value;
  227. return indeterminate;
  228. }
  229. else if (!is_char(input) || is_ctl(input) || is_tspecial(input))
  230. {
  231. return bad;
  232. }
  233. else
  234. {
  235. req.headers.back().name.push_back(input);
  236. return indeterminate;
  237. }
  238. case space_before_header_value:
  239. if (input == ' ')
  240. {
  241. state_ = header_value;
  242. return indeterminate;
  243. }
  244. else
  245. {
  246. return bad;
  247. }
  248. case header_value:
  249. if (input == '\r')
  250. {
  251. state_ = expecting_newline_2;
  252. return indeterminate;
  253. }
  254. else if (is_ctl(input))
  255. {
  256. return bad;
  257. }
  258. else
  259. {
  260. req.headers.back().value.push_back(input);
  261. return indeterminate;
  262. }
  263. case expecting_newline_2:
  264. if (input == '\n')
  265. {
  266. state_ = header_line_start;
  267. return indeterminate;
  268. }
  269. else
  270. {
  271. return bad;
  272. }
  273. case expecting_newline_3:
  274. return (input == '\n') ? good : bad;
  275. default:
  276. return bad;
  277. }
  278. }
  279. bool request_parser::is_char(int c)
  280. {
  281. return c >= 0 && c <= 127;
  282. }
  283. bool request_parser::is_ctl(int c)
  284. {
  285. return (c >= 0 && c <= 31) || (c == 127);
  286. }
  287. bool request_parser::is_tspecial(int c)
  288. {
  289. switch (c)
  290. {
  291. case '(': case ')': case '<': case '>': case '@':
  292. case ',': case ';': case ':': case '\\': case '"':
  293. case '/': case '[': case ']': case '?': case '=':
  294. case '{': case '}': case ' ': case '\t':
  295. return true;
  296. default:
  297. return false;
  298. }
  299. }
  300. bool request_parser::is_digit(int c)
  301. {
  302. return c >= '0' && c <= '9';
  303. }
  304. } // namespace server
  305. } // namespace http