/* http_parser.h */
  /* Copyright Joyent, Inc. and other Node contributors. All rights reserved.
   *
   * Permission is hereby granted, free of charge, to any person obtaining a copy
   * of this software and associated documentation files (the "Software"), to
   * deal in the Software without restriction, including without limitation the
   * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
   * sell copies of the Software, and to permit persons to whom the Software is
   * furnished to do so, subject to the following conditions:
   *
   * The above copyright notice and this permission notice shall be included in
   * all copies or substantial portions of the Software.
   *
   * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
   * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
   * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
   * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
   * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
   * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
   * IN THE SOFTWARE.
   */
  21. #ifndef http_parser_h
  22. #define http_parser_h
  23. #ifdef __cplusplus
  24. extern "C" {
  25. #endif
  /* Compile-time library version (major.minor.patch).
   * Also update SONAME in the Makefile whenever you change these.
   */
  #define HTTP_PARSER_VERSION_MAJOR 2
  #define HTTP_PARSER_VERSION_MINOR 9
  #define HTTP_PARSER_VERSION_PATCH 4
  30. #include <stddef.h>
  /* Fixed-width integer types used throughout this header.
   *
   * First branch: Windows builds that are neither MinGW nor Wine and whose
   * compiler is either not MSVC or is MSVC with _MSC_VER below 1600. There the
   * intN_t/uintN_t names are typedef'd from the compiler's __intN types.
   * Second branch: SunOS 5.9, which takes the types from <sys/inttypes.h>.
   * Everything else uses the standard <stdint.h>.
   */
  #if defined(_WIN32) && !defined(__MINGW32__) && \
      (!defined(_MSC_VER) || _MSC_VER < 1600) && !defined(__WINE__)
  # include <BaseTsd.h>
  typedef __int8 int8_t;
  typedef unsigned __int8 uint8_t;
  typedef __int16 int16_t;
  typedef unsigned __int16 uint16_t;
  typedef __int32 int32_t;
  typedef unsigned __int32 uint32_t;
  typedef __int64 int64_t;
  typedef unsigned __int64 uint64_t;
  #elif (defined(__sun) || defined(__sun__)) && defined(__SunOS_5_9)
  # include <sys/inttypes.h>
  #else
  # include <stdint.h>
  #endif
  /* Compile with -DHTTP_PARSER_STRICT=0 to make fewer checks, but run
   * faster. When the build does not define the macro it defaults to 1.
   */
  #ifndef HTTP_PARSER_STRICT
  # define HTTP_PARSER_STRICT 1
  #endif
  /* Maximum header size allowed. If the macro is not defined
   * before including this header then the default (80 KiB) is used. To
   * change the maximum header size, define the macro in the build
   * environment (e.g. -DHTTP_MAX_HEADER_SIZE=<value>). To remove
   * the effective limit on the size of the header, define the macro
   * to a very large number (e.g. -DHTTP_MAX_HEADER_SIZE=0x7fffffff).
   */
  #ifndef HTTP_MAX_HEADER_SIZE
  # define HTTP_MAX_HEADER_SIZE (80*1024)
  #endif
  /* Forward declarations so the callback typedefs below can name the parser. */
  typedef struct http_parser http_parser;
  typedef struct http_parser_settings http_parser_settings;

  /* Callbacks should return non-zero to indicate an error. The parser will
   * then halt execution.
   *
   * The one exception is on_headers_complete. In a HTTP_RESPONSE parser,
   * returning '1' from on_headers_complete tells the parser that it should
   * not expect a body. This is used when receiving a response to a HEAD
   * request, which may contain 'Content-Length' or 'Transfer-Encoding:
   * chunked' headers that indicate the presence of a body.
   *
   * Returning `2` from on_headers_complete tells the parser that it should
   * expect neither a body nor any further responses on this connection. This
   * is useful for handling responses to a CONNECT request, which may not
   * contain `Upgrade` or `Connection: upgrade` headers.
   *
   * An http_data_cb is not handed a complete string in one call: it will be
   * called arbitrarily many times for each string. E.g. you might get 10
   * callbacks for "on_url", each providing just a few characters more data.
   */
  typedef int (*http_data_cb) (http_parser *parser, const char *at, size_t length);
  typedef int (*http_cb) (http_parser *parser);
  /* Status Codes
   *
   * X-macro table: XX is invoked once per status as
   * XX(numeric code, identifier suffix, reason phrase).
   * The last entry deliberately has no trailing backslash, so the macro
   * ends there and cannot swallow whatever line follows it.
   */
  #define HTTP_STATUS_MAP(XX) \
    XX(100, CONTINUE, Continue) \
    XX(101, SWITCHING_PROTOCOLS, Switching Protocols) \
    XX(102, PROCESSING, Processing) \
    XX(200, OK, OK) \
    XX(201, CREATED, Created) \
    XX(202, ACCEPTED, Accepted) \
    XX(203, NON_AUTHORITATIVE_INFORMATION, Non-Authoritative Information) \
    XX(204, NO_CONTENT, No Content) \
    XX(205, RESET_CONTENT, Reset Content) \
    XX(206, PARTIAL_CONTENT, Partial Content) \
    XX(207, MULTI_STATUS, Multi-Status) \
    XX(208, ALREADY_REPORTED, Already Reported) \
    XX(226, IM_USED, IM Used) \
    XX(300, MULTIPLE_CHOICES, Multiple Choices) \
    XX(301, MOVED_PERMANENTLY, Moved Permanently) \
    XX(302, FOUND, Found) \
    XX(303, SEE_OTHER, See Other) \
    XX(304, NOT_MODIFIED, Not Modified) \
    XX(305, USE_PROXY, Use Proxy) \
    XX(307, TEMPORARY_REDIRECT, Temporary Redirect) \
    XX(308, PERMANENT_REDIRECT, Permanent Redirect) \
    XX(400, BAD_REQUEST, Bad Request) \
    XX(401, UNAUTHORIZED, Unauthorized) \
    XX(402, PAYMENT_REQUIRED, Payment Required) \
    XX(403, FORBIDDEN, Forbidden) \
    XX(404, NOT_FOUND, Not Found) \
    XX(405, METHOD_NOT_ALLOWED, Method Not Allowed) \
    XX(406, NOT_ACCEPTABLE, Not Acceptable) \
    XX(407, PROXY_AUTHENTICATION_REQUIRED, Proxy Authentication Required) \
    XX(408, REQUEST_TIMEOUT, Request Timeout) \
    XX(409, CONFLICT, Conflict) \
    XX(410, GONE, Gone) \
    XX(411, LENGTH_REQUIRED, Length Required) \
    XX(412, PRECONDITION_FAILED, Precondition Failed) \
    XX(413, PAYLOAD_TOO_LARGE, Payload Too Large) \
    XX(414, URI_TOO_LONG, URI Too Long) \
    XX(415, UNSUPPORTED_MEDIA_TYPE, Unsupported Media Type) \
    XX(416, RANGE_NOT_SATISFIABLE, Range Not Satisfiable) \
    XX(417, EXPECTATION_FAILED, Expectation Failed) \
    XX(421, MISDIRECTED_REQUEST, Misdirected Request) \
    XX(422, UNPROCESSABLE_ENTITY, Unprocessable Entity) \
    XX(423, LOCKED, Locked) \
    XX(424, FAILED_DEPENDENCY, Failed Dependency) \
    XX(426, UPGRADE_REQUIRED, Upgrade Required) \
    XX(428, PRECONDITION_REQUIRED, Precondition Required) \
    XX(429, TOO_MANY_REQUESTS, Too Many Requests) \
    XX(431, REQUEST_HEADER_FIELDS_TOO_LARGE, Request Header Fields Too Large) \
    XX(451, UNAVAILABLE_FOR_LEGAL_REASONS, Unavailable For Legal Reasons) \
    XX(500, INTERNAL_SERVER_ERROR, Internal Server Error) \
    XX(501, NOT_IMPLEMENTED, Not Implemented) \
    XX(502, BAD_GATEWAY, Bad Gateway) \
    XX(503, SERVICE_UNAVAILABLE, Service Unavailable) \
    XX(504, GATEWAY_TIMEOUT, Gateway Timeout) \
    XX(505, HTTP_VERSION_NOT_SUPPORTED, HTTP Version Not Supported) \
    XX(506, VARIANT_ALSO_NEGOTIATES, Variant Also Negotiates) \
    XX(507, INSUFFICIENT_STORAGE, Insufficient Storage) \
    XX(508, LOOP_DETECTED, Loop Detected) \
    XX(510, NOT_EXTENDED, Not Extended) \
    XX(511, NETWORK_AUTHENTICATION_REQUIRED, Network Authentication Required)

  /* One HTTP_STATUS_<name> enumerator per table row, valued at its code. */
  enum http_status
    {
  #define XX(num, name, string) HTTP_STATUS_##name = num,
    HTTP_STATUS_MAP(XX)
  #undef XX
    };
  /* Request Methods
   *
   * X-macro table: XX is invoked once per method as
   * XX(numeric id, identifier suffix, method token).
   * The ids run contiguously from 0. The last entry deliberately has no
   * trailing backslash, so the macro cannot swallow the line after it.
   */
  #define HTTP_METHOD_MAP(XX) \
    XX(0, DELETE, DELETE) \
    XX(1, GET, GET) \
    XX(2, HEAD, HEAD) \
    XX(3, POST, POST) \
    XX(4, PUT, PUT) \
    /* pathological */ \
    XX(5, CONNECT, CONNECT) \
    XX(6, OPTIONS, OPTIONS) \
    XX(7, TRACE, TRACE) \
    /* WebDAV */ \
    XX(8, COPY, COPY) \
    XX(9, LOCK, LOCK) \
    XX(10, MKCOL, MKCOL) \
    XX(11, MOVE, MOVE) \
    XX(12, PROPFIND, PROPFIND) \
    XX(13, PROPPATCH, PROPPATCH) \
    XX(14, SEARCH, SEARCH) \
    XX(15, UNLOCK, UNLOCK) \
    XX(16, BIND, BIND) \
    XX(17, REBIND, REBIND) \
    XX(18, UNBIND, UNBIND) \
    XX(19, ACL, ACL) \
    /* subversion */ \
    XX(20, REPORT, REPORT) \
    XX(21, MKACTIVITY, MKACTIVITY) \
    XX(22, CHECKOUT, CHECKOUT) \
    XX(23, MERGE, MERGE) \
    /* upnp */ \
    XX(24, MSEARCH, M-SEARCH) \
    XX(25, NOTIFY, NOTIFY) \
    XX(26, SUBSCRIBE, SUBSCRIBE) \
    XX(27, UNSUBSCRIBE, UNSUBSCRIBE) \
    /* RFC-5789 */ \
    XX(28, PATCH, PATCH) \
    XX(29, PURGE, PURGE) \
    /* CalDAV */ \
    XX(30, MKCALENDAR, MKCALENDAR) \
    /* RFC-2068, section 19.6.1.2 */ \
    XX(31, LINK, LINK) \
    XX(32, UNLINK, UNLINK) \
    /* icecast */ \
    XX(33, SOURCE, SOURCE)

  /* One HTTP_<name> enumerator per table row, valued at its id. */
  enum http_method
    {
  #define XX(num, name, string) HTTP_##name = num,
    HTTP_METHOD_MAP(XX)
  #undef XX
    };
  /* Message kind a parser is set up for; this is the `type` argument of
   * http_parser_init() and is stored in the 2-bit http_parser.type field.
   */
  enum http_parser_type
    { HTTP_REQUEST
    , HTTP_RESPONSE
    , HTTP_BOTH
    };
  /* Flag values for http_parser.flags field.
   *
   * Each enumerator is a distinct single bit; the eight of them exactly fill
   * the 8-bit `flags` bit-field in struct http_parser.
   */
  enum flags
    { F_CHUNKED               = 1 << 0
    , F_CONNECTION_KEEP_ALIVE = 1 << 1
    , F_CONNECTION_CLOSE      = 1 << 2
    , F_CONNECTION_UPGRADE    = 1 << 3
    , F_TRAILING              = 1 << 4
    , F_UPGRADE               = 1 << 5
    , F_SKIPBODY              = 1 << 6
    , F_CONTENTLENGTH         = 1 << 7
    };
  /* Map for errno-related constants
   *
   * The provided argument should be a macro that takes 2 arguments:
   * XX(identifier suffix, human-readable description).
   * The last entry deliberately has no trailing backslash, so the macro
   * ends there instead of splicing in the line that follows.
   */
  #define HTTP_ERRNO_MAP(XX) \
    /* No error */ \
    XX(OK, "success") \
    \
    /* Callback-related errors */ \
    XX(CB_message_begin, "the on_message_begin callback failed") \
    XX(CB_url, "the on_url callback failed") \
    XX(CB_header_field, "the on_header_field callback failed") \
    XX(CB_header_value, "the on_header_value callback failed") \
    XX(CB_headers_complete, "the on_headers_complete callback failed") \
    XX(CB_body, "the on_body callback failed") \
    XX(CB_message_complete, "the on_message_complete callback failed") \
    XX(CB_status, "the on_status callback failed") \
    XX(CB_chunk_header, "the on_chunk_header callback failed") \
    XX(CB_chunk_complete, "the on_chunk_complete callback failed") \
    \
    /* Parsing-related errors */ \
    XX(INVALID_EOF_STATE, "stream ended at an unexpected time") \
    XX(HEADER_OVERFLOW, \
       "too many header bytes seen; overflow detected") \
    XX(CLOSED_CONNECTION, \
       "data received after completed connection: close message") \
    XX(INVALID_VERSION, "invalid HTTP version") \
    XX(INVALID_STATUS, "invalid HTTP status code") \
    XX(INVALID_METHOD, "invalid HTTP method") \
    XX(INVALID_URL, "invalid URL") \
    XX(INVALID_HOST, "invalid host") \
    XX(INVALID_PORT, "invalid port") \
    XX(INVALID_PATH, "invalid path") \
    XX(INVALID_QUERY_STRING, "invalid query string") \
    XX(INVALID_FRAGMENT, "invalid fragment") \
    XX(LF_EXPECTED, "LF character expected") \
    XX(INVALID_HEADER_TOKEN, "invalid character in header") \
    XX(INVALID_CONTENT_LENGTH, \
       "invalid character in content-length header") \
    XX(UNEXPECTED_CONTENT_LENGTH, \
       "unexpected content-length header") \
    XX(INVALID_CHUNK_SIZE, \
       "invalid character in chunk size header") \
    XX(INVALID_CONSTANT, "invalid constant string") \
    XX(INVALID_INTERNAL_STATE, "encountered unexpected internal state") \
    XX(STRICT, "strict mode assertion failed") \
    XX(PAUSED, "parser is paused") \
    XX(UNKNOWN, "an unknown error occurred") \
    XX(INVALID_TRANSFER_ENCODING, \
       "request has invalid transfer-encoding")

  /* Define HPE_* values for each errno value above. The enumerators take
   * consecutive values in table order, starting with HPE_OK == 0.
   */
  #define HTTP_ERRNO_GEN(n, s) HPE_##n,
  enum http_errno {
    HTTP_ERRNO_MAP(HTTP_ERRNO_GEN)
  };
  #undef HTTP_ERRNO_GEN

  /* Get an http_errno value from an http_parser.
   * `p` is a pointer; its `http_errno` member is read and cast to the enum.
   */
  #define HTTP_PARSER_ERRNO(p) ((enum http_errno) (p)->http_errno)
  /* Per-connection parser state.
   *
   * The members are grouped by who may touch them: PRIVATE ones belong to the
   * parser, READ-ONLY ones may be inspected by the application, and PUBLIC
   * ones are the application's to use. The PRIVATE bit-fields add up to
   * 32 bits, as do the READ-ONLY bit-fields.
   */
  struct http_parser {
    /** PRIVATE **/
    unsigned int type : 2;         /* enum http_parser_type */
    unsigned int flags : 8;        /* F_* values from 'flags' enum; semi-public */
    unsigned int state : 7;        /* enum state from http_parser.c */
    unsigned int header_state : 7; /* enum header_state from http_parser.c */
    unsigned int index : 5;        /* index into current matcher */
    unsigned int uses_transfer_encoding : 1; /* Transfer-Encoding header is present */
    unsigned int allow_chunked_length : 1;   /* Allow headers with both
                                              * `Content-Length` and
                                              * `Transfer-Encoding: chunked` set */
    unsigned int lenient_http_headers : 1;   /* NOTE(review): presumably relaxes
                                              * header validation; confirm in
                                              * http_parser.c */

    uint32_t nread;          /* # bytes read in various scenarios */
    uint64_t content_length; /* # bytes in body. `(uint64_t) -1` (all bits one)
                              * if no Content-Length header.
                              */

    /** READ-ONLY **/
    unsigned short http_major;
    unsigned short http_minor;
    unsigned int status_code : 16; /* responses only */
    unsigned int method : 8;       /* requests only */
    unsigned int http_errno : 7;   /* read via HTTP_PARSER_ERRNO() */

    /* 1 = Upgrade header was present and the parser has exited because of that.
     * 0 = No upgrade header present.
     * Should be checked when http_parser_execute() returns in addition to
     * error checking.
     */
    unsigned int upgrade : 1;

    /** PUBLIC **/
    void *data; /* A pointer to get hook to the "connection" or "socket" object */
  };
  303. struct http_parser_settings {
  304. http_cb on_message_begin;
  305. http_data_cb on_url;
  306. http_data_cb on_status;
  307. http_data_cb on_header_field;
  308. http_data_cb on_header_value;
  309. http_cb on_headers_complete;
  310. http_data_cb on_body;
  311. http_cb on_message_complete;
  312. /* When on_chunk_header is called, the current chunk length is stored
  313. * in parser->content_length.
  314. */
  315. http_cb on_chunk_header;
  316. http_cb on_chunk_complete;
  317. };
  /* Indices of the URL components reported by http_parser_parse_url().
   * UF_MAX is the component count and sizes http_parser_url.field_data[].
   */
  enum http_parser_url_fields
    { UF_SCHEMA   = 0
    , UF_HOST     = 1
    , UF_PORT     = 2
    , UF_PATH     = 3
    , UF_QUERY    = 4
    , UF_FRAGMENT = 5
    , UF_USERINFO = 6
    , UF_MAX      = 7
    };

  /* Result structure for http_parser_parse_url().
   *
   * Callers should index into field_data[] with UF_* values iff field_set
   * has the relevant (1 << UF_*) bit set. As a courtesy to clients (and
   * because we probably have padding left over), we convert any port to
   * a uint16_t.
   */
  struct http_parser_url {
    uint16_t field_set; /* Bitmask of (1 << UF_*) values */
    uint16_t port;      /* Converted UF_PORT string */

    struct {
      uint16_t off; /* Offset into buffer in which field starts */
      uint16_t len; /* Length of run in buffer */
    } field_data[UF_MAX];
  };
  343. /* Returns the library version. Bits 16-23 contain the major version number,
  344. * bits 8-15 the minor version number and bits 0-7 the patch level.
  345. * Usage example:
  346. *
  347. * unsigned long version = http_parser_version();
  348. * unsigned major = (version >> 16) & 255;
  349. * unsigned minor = (version >> 8) & 255;
  350. * unsigned patch = version & 255;
  351. * printf("http_parser v%u.%u.%u\n", major, minor, patch);
  352. */
  353. unsigned long http_parser_version(void);
  354. void http_parser_init(http_parser *parser, enum http_parser_type type);
  355. /* Initialize http_parser_settings members to 0
  356. */
  357. void http_parser_settings_init(http_parser_settings *settings);
  358. /* Executes the parser. Returns number of parsed bytes. Sets
  359. * `parser->http_errno` on error. */
  360. size_t http_parser_execute(http_parser *parser,
  361. const http_parser_settings *settings,
  362. const char *data,
  363. size_t len);
  364. /* If http_should_keep_alive() in the on_headers_complete or
  365. * on_message_complete callback returns 0, then this should be
  366. * the last message on the connection.
  367. * If you are the server, respond with the "Connection: close" header.
  368. * If you are the client, close the connection.
  369. */
  370. int http_should_keep_alive(const http_parser *parser);
  371. /* Returns a string version of the HTTP method. */
  372. const char *http_method_str(enum http_method m);
  373. /* Returns a string version of the HTTP status code. */
  374. const char *http_status_str(enum http_status s);
  375. /* Return a string name of the given error */
  376. const char *http_errno_name(enum http_errno err);
  377. /* Return a string description of the given error */
  378. const char *http_errno_description(enum http_errno err);
  379. /* Initialize all http_parser_url members to 0 */
  380. void http_parser_url_init(struct http_parser_url *u);
  381. /* Parse a URL; return nonzero on failure */
  382. int http_parser_parse_url(const char *buf, size_t buflen,
  383. int is_connect,
  384. struct http_parser_url *u);
  385. /* Pause or un-pause the parser; a nonzero value pauses */
  386. void http_parser_pause(http_parser *parser, int paused);
  387. /* Checks if this is the final chunk of the body. */
  388. int http_body_is_final(const http_parser *parser);
  389. /* Change the maximum header size provided at compile time. */
  390. void http_parser_set_max_header_size(uint32_t size);
  391. #ifdef __cplusplus
  392. }
  393. #endif
  394. #endif