2011-06-03 20:12:14 +08:00
|
|
|
/* Copyright Joyent, Inc. and other Node contributors. All rights reserved.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to
 * deal in the Software without restriction, including without limitation the
 * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
 * sell copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
 * IN THE SOFTWARE.
 */
|
|
|
|
#ifndef http_parser_h
|
|
|
|
#define http_parser_h
|
|
|
|
#ifdef __cplusplus
|
|
|
|
extern "C" {
|
2009-11-21 23:27:02 +08:00
|
|
|
#endif
|
2009-05-03 20:09:16 +08:00
|
|
|
|
2011-06-03 20:12:14 +08:00
|
|
|
/* Version of the parser API declared by this header (major.minor). */
#define HTTP_PARSER_VERSION_MAJOR 1
#define HTTP_PARSER_VERSION_MINOR 0
|
2010-03-23 00:00:24 +08:00
|
|
|
|
2009-11-21 23:27:02 +08:00
|
|
|
#include <sys/types.h>

/* Fixed-width integer types, size_t and ssize_t.
 *
 * Windows toolchains (other than MinGW) that are either not MSVC at all, or
 * an MSVC older than Visual Studio 2010 (_MSC_VER < 1600), are not assumed
 * to provide <stdint.h>; for those the fixed-width types are spelled with
 * the __intN extension. Every other toolchain gets them from <stdint.h>.
 */
#if defined(_WIN32) && !defined(__MINGW32__) && \
    (!defined(_MSC_VER) || _MSC_VER < 1600)
#include <stddef.h> /* size_t, ptrdiff_t */
typedef __int8 int8_t;
typedef unsigned __int8 uint8_t;
typedef __int16 int16_t;
typedef unsigned __int16 uint16_t;
typedef __int32 int32_t;
typedef unsigned __int32 uint32_t;
typedef __int64 int64_t;
typedef unsigned __int64 uint64_t;

/* size_t is taken from <stddef.h> instead of being hand-declared as
 * 'unsigned int', which has the wrong width on 64-bit Windows. ssize_t is
 * declared as the signed type of matching width.
 */
typedef ptrdiff_t ssize_t;
#else
#include <stdint.h>
#endif
|
2010-03-23 00:00:24 +08:00
|
|
|
|
2009-11-21 23:27:02 +08:00
|
|
|
/* Compile with -DHTTP_PARSER_STRICT=0 to perform fewer checks, but run
 * faster. Strict mode is enabled (1) unless the build overrides it.
 */
#ifndef HTTP_PARSER_STRICT
# define HTTP_PARSER_STRICT 1
#endif
|
2009-05-03 20:09:16 +08:00
|
|
|
|
2011-08-06 17:58:44 +08:00
|
|
|
/* Compile with -DHTTP_PARSER_DEBUG=1 to add extra debugging information to
 * the error reporting facility. Debugging is disabled (0) unless the build
 * overrides it.
 */
#ifndef HTTP_PARSER_DEBUG
# define HTTP_PARSER_DEBUG 0
#endif
|
|
|
|
|
2010-03-23 00:00:24 +08:00
|
|
|
|
2010-02-03 08:40:54 +08:00
|
|
|
/* Maximum header size allowed, in bytes (80 KiB). */
#define HTTP_MAX_HEADER_SIZE (80*1024)
|
|
|
|
|
2010-03-23 00:00:24 +08:00
|
|
|
|
2009-05-03 20:09:16 +08:00
|
|
|
/* Forward declarations so the struct tags can be used without the 'struct'
 * keyword in the callback and function signatures below.
 *
 * NOTE(review): no definition of struct http_parser_result is visible in
 * this header - confirm the typedef is still needed.
 */
typedef struct http_parser http_parser;
typedef struct http_parser_settings http_parser_settings;
typedef struct http_parser_result http_parser_result;
|
2009-05-03 20:09:16 +08:00
|
|
|
|
2010-03-23 00:00:24 +08:00
|
|
|
|
|
|
|
/* Callbacks should return non-zero to indicate an error. The parser will
|
2009-11-21 23:27:02 +08:00
|
|
|
* then halt execution.
|
|
|
|
*
|
2010-05-26 09:41:31 +08:00
|
|
|
* The one exception is on_headers_complete. In a HTTP_RESPONSE parser
|
|
|
|
* returning '1' from on_headers_complete will tell the parser that it
|
|
|
|
* should not expect a body. This is used when receiving a response to a
|
|
|
|
* HEAD request which may contain 'Content-Length' or 'Transfer-Encoding:
|
|
|
|
* chunked' headers that indicate the presence of a body.
|
|
|
|
*
|
2009-05-03 20:09:16 +08:00
|
|
|
* http_data_cb does not return data chunks. It will be call arbitrarally
|
|
|
|
* many times for each string. E.G. you might get 10 callbacks for "on_path"
|
|
|
|
* each providing just a few characters more data.
|
|
|
|
*/
|
|
|
|
typedef int (*http_data_cb) (http_parser*, const char *at, size_t length);
|
|
|
|
typedef int (*http_cb) (http_parser*);
|
|
|
|
|
2010-03-23 00:00:24 +08:00
|
|
|
|
2009-05-03 20:09:16 +08:00
|
|
|
/* Request Methods.
 *
 * Enumerators are numbered consecutively starting from HTTP_DELETE = 0, so
 * the order below is significant.
 */
enum http_method
  { HTTP_DELETE    = 0
  , HTTP_GET
  , HTTP_HEAD
  , HTTP_POST
  , HTTP_PUT
  /* pathological */
  , HTTP_CONNECT
  , HTTP_OPTIONS
  , HTTP_TRACE
  /* webdav */
  , HTTP_COPY
  , HTTP_LOCK
  , HTTP_MKCOL
  , HTTP_MOVE
  , HTTP_PROPFIND
  , HTTP_PROPPATCH
  , HTTP_UNLOCK
  /* subversion */
  , HTTP_REPORT
  , HTTP_MKACTIVITY
  , HTTP_CHECKOUT
  , HTTP_MERGE
  /* upnp */
  , HTTP_MSEARCH
  , HTTP_NOTIFY
  , HTTP_SUBSCRIBE
  , HTTP_UNSUBSCRIBE
  /* RFC-5789 */
  , HTTP_PATCH
  };
|
2009-10-16 01:18:18 +08:00
|
|
|
|
2010-03-23 00:00:24 +08:00
|
|
|
|
2010-06-07 08:41:03 +08:00
|
|
|
/* Parser type, as passed to http_parser_init(). */
enum http_parser_type {
  HTTP_REQUEST,
  HTTP_RESPONSE,
  HTTP_BOTH
};
|
2010-01-09 17:52:49 +08:00
|
|
|
|
2010-03-23 00:00:24 +08:00
|
|
|
|
2011-06-03 20:12:14 +08:00
|
|
|
/* Flag values for http_parser.flags field.
 *
 * Each flag is a distinct single bit; the six flags occupy bits 0..5.
 */
enum flags
  { F_CHUNKED               = 1 << 0
  , F_CONNECTION_KEEP_ALIVE = 1 << 1
  , F_CONNECTION_CLOSE      = 1 << 2
  , F_TRAILING              = 1 << 3
  , F_UPGRADE               = 1 << 4
  , F_SKIPBODY              = 1 << 5
  };
|
|
|
|
|
|
|
|
|
2011-08-06 17:58:44 +08:00
|
|
|
/* Map for errno-related constants
 *
 * The provided argument should be a macro that takes 2 arguments: the
 * error name (used as the suffix of the HPE_* enumerator) and a string
 * literal describing the error. The macro is invoked once per entry, in
 * the order listed.
 */
#define HTTP_ERRNO_MAP(XX)                                           \
  /* No error */                                                     \
  XX(OK, "success")                                                  \
                                                                     \
  /* Callback-related errors */                                      \
  XX(CB_message_begin, "the on_message_begin callback failed")       \
  XX(CB_path, "the on_path callback failed")                         \
  XX(CB_query_string, "the on_query_string callback failed")         \
  XX(CB_url, "the on_url callback failed")                           \
  XX(CB_fragment, "the on_fragment callback failed")                 \
  XX(CB_header_field, "the on_header_field callback failed")         \
  XX(CB_header_value, "the on_header_value callback failed")         \
  XX(CB_headers_complete, "the on_headers_complete callback failed") \
  XX(CB_body, "the on_body callback failed")                         \
  XX(CB_message_complete, "the on_message_complete callback failed") \
                                                                     \
  /* Parsing-related errors */                                       \
  XX(INVALID_EOF_STATE, "stream ended at an unexpected time")        \
  XX(HEADER_OVERFLOW,                                                \
     "too many header bytes seen; overflow detected")                \
  XX(CLOSED_CONNECTION,                                              \
     "data received after completed connection: close message")      \
  XX(INVALID_VERSION, "invalid HTTP version")                        \
  XX(INVALID_STATUS, "invalid HTTP status code")                     \
  XX(INVALID_METHOD, "invalid HTTP method")                          \
  XX(INVALID_URL, "invalid URL")                                     \
  XX(INVALID_HOST, "invalid host")                                   \
  XX(INVALID_PORT, "invalid port")                                   \
  XX(INVALID_PATH, "invalid path")                                   \
  XX(INVALID_QUERY_STRING, "invalid query string")                   \
  XX(INVALID_FRAGMENT, "invalid fragment")                           \
  XX(LF_EXPECTED, "LF character expected")                           \
  XX(INVALID_HEADER_TOKEN, "invalid character in header")            \
  XX(INVALID_CONTENT_LENGTH,                                         \
     "invalid character in content-length header")                   \
  XX(INVALID_CHUNK_SIZE,                                             \
     "invalid character in chunk size header")                       \
  XX(INVALID_CONSTANT, "invalid constant string")                    \
  XX(INVALID_INTERNAL_STATE, "encountered unexpected internal state")\
  XX(STRICT, "strict mode assertion failed")                         \
  XX(UNKNOWN, "an unknown error occurred")


/* Define HPE_* values for each errno value above.
 *
 * The enumerators follow the order of HTTP_ERRNO_MAP, so HPE_OK is 0 and
 * every later entry is one greater than the previous one.
 */
#define HTTP_ERRNO_GEN(n, s) HPE_##n,
enum http_errno {
  HTTP_ERRNO_MAP(HTTP_ERRNO_GEN)
};
#undef HTTP_ERRNO_GEN
|
|
|
|
|
|
|
|
|
|
|
|
/* Get an http_errno value from an http_parser.
 *
 * 'p' is a pointer to the parser; its http_errno field is converted to
 * enum http_errno.
 */
#define HTTP_PARSER_ERRNO(p)            ((enum http_errno) (p)->http_errno)
|
|
|
|
|
|
|
|
/* Get the line number that generated the current error.
 *
 * Expands to the parser's error_lineno field when HTTP_PARSER_DEBUG is
 * non-zero, and to the constant 0 otherwise (the field does not exist in
 * non-debug builds).
 */
#if HTTP_PARSER_DEBUG
# define HTTP_PARSER_ERRNO_LINE(p)       ((p)->error_lineno)
#else
# define HTTP_PARSER_ERRNO_LINE(p)       0
#endif
|
|
|
|
|
|
|
|
|
2009-05-03 20:09:16 +08:00
|
|
|
/* Per-parser state.
 *
 * Fields are grouped by who may touch them: PRIVATE fields belong to the
 * parser implementation, READ-ONLY fields may be inspected by the caller,
 * and PUBLIC fields are free for the caller to use.
 */
struct http_parser {
  /** PRIVATE **/
  unsigned char type : 2;
  unsigned char flags : 6; /* F_* values from 'flags' enum; semi-public */
  unsigned char state;
  unsigned char header_state;
  unsigned char index;

  uint32_t nread;
  int64_t content_length;

  /** READ-ONLY **/
  unsigned short http_major;
  unsigned short http_minor;
  unsigned short status_code; /* responses only */
  unsigned char method;    /* requests only */
  unsigned char http_errno : 7; /* read through HTTP_PARSER_ERRNO() */

  /* 1 = Upgrade header was present and the parser has exited because of that.
   * 0 = No upgrade header present.
   * Should be checked when http_parser_execute() returns in addition to
   * error checking.
   */
  unsigned char upgrade : 1;

#if HTTP_PARSER_DEBUG
  /* Only present in debug builds; read through HTTP_PARSER_ERRNO_LINE(). */
  uint32_t error_lineno;
#endif

  /** PUBLIC **/
  void *data; /* A pointer to get hook to the "connection" or "socket" object */
};
|
2009-05-03 20:09:16 +08:00
|
|
|
|
|
|
|
|
2010-03-23 00:00:24 +08:00
|
|
|
struct http_parser_settings {
|
2009-05-03 20:09:16 +08:00
|
|
|
http_cb on_message_begin;
|
2009-11-21 23:27:02 +08:00
|
|
|
http_data_cb on_url;
|
2009-05-03 20:09:16 +08:00
|
|
|
http_data_cb on_header_field;
|
|
|
|
http_data_cb on_header_value;
|
|
|
|
http_cb on_headers_complete;
|
|
|
|
http_data_cb on_body;
|
|
|
|
http_cb on_message_complete;
|
|
|
|
};
|
|
|
|
|
2010-03-23 00:00:24 +08:00
|
|
|
|
2010-01-09 17:52:49 +08:00
|
|
|
/* Initialize 'parser' for the given parser 'type'.
 * NOTE(review): presumably must be called before http_parser_execute();
 * the implementation is not part of this header - confirm.
 */
void
http_parser_init(http_parser *parser,
                 enum http_parser_type type);
|
2010-03-23 00:00:24 +08:00
|
|
|
|
|
|
|
|
|
|
|
size_t http_parser_execute(http_parser *parser,
|
2010-05-26 09:41:31 +08:00
|
|
|
const http_parser_settings *settings,
|
2010-03-23 00:00:24 +08:00
|
|
|
const char *data,
|
|
|
|
size_t len);
|
|
|
|
|
|
|
|
|
|
|
|
/* If http_should_keep_alive() in the on_headers_complete or
|
|
|
|
* on_message_complete callback returns true, then this will be should be
|
|
|
|
* the last message on the connection.
|
|
|
|
* If you are the server, respond with the "Connection: close" header.
|
|
|
|
* If you are the client, close the connection.
|
2009-05-03 20:09:16 +08:00
|
|
|
*/
|
2009-11-21 23:27:02 +08:00
|
|
|
int http_should_keep_alive(http_parser *parser);
|
2009-05-03 20:09:16 +08:00
|
|
|
|
2010-06-24 12:10:13 +08:00
|
|
|
/* Returns a string version of the HTTP method. */
const char *http_method_str(enum http_method m);
|
|
|
|
|
|
|
|
/* Return a string name of the given error */
const char *http_errno_name(enum http_errno err);
|
|
|
|
|
|
|
|
/* Return a string description of the given error */
const char *http_errno_description(enum http_errno err);
|
2010-03-23 00:00:24 +08:00
|
|
|
|
2009-05-03 20:09:16 +08:00
|
|
|
#ifdef __cplusplus
|
|
|
|
}
|
2009-11-21 23:27:02 +08:00
|
|
|
#endif
|
2009-05-03 20:09:16 +08:00
|
|
|
#endif
|