mirror of
https://github.com/Xahau/xahaud.git
synced 2025-12-06 17:27:52 +00:00
3bcd986 Set version to 79 4f42f8c Remove spurious fallthrough guidance fa1ac16 Set version to 78 0cb9b63 Fix warning in root ca declaration f78c73a Tidy up file_posix unused variable 72ce9ef Tidy up dstream for existing Boost versions efe8e58 Add Boost.Locale utf8 benchmark comparison f7c745e Remove string_view_body 7a79efa Tidy up FieldsReader doc e51aefd Header file tidying 69898f4 Fix warning in zlib 53723c0 Add message keep_alive, chunked, content_length members d7af73b Fix spurious uninitialized warning ca42cc0 Tidy up invalid characters in test vector 48d3e60 Use make_unique_noinit a1ff804 span, string, vector bodies are public feab6a0 Documentation work 116c0b0 Add span_body 7fb901d Tidy up includes and javadocs f0f58be Add span 7a8982b Add vector_body 524f73a Tidy up basic_string_body a8ad67b Set version to 77 d555859 file_posix works without large file support 1bc30cb Set version to 76 9a1e7a8 Disable SSE4.2 optimizations 09af312 Fix parse illegal characters in obs-fold 7dd684c Add file_body_win32: 1bbc71c serializing file_body is not const 9a4b55e BodyReader, BodyWriter use two-phase init (API Change): dc400ce Serializer members are not const 1a33c37 Rename to serializer::keep_alive (API Change): 55935c5 Add serializer::chunked 63ace37 Add serializer::get 2c4047b BodyReader may construct from a non-const message 0a0a225 Use Boost.Config 6f83d07 Always go through write_some: 0e23066 Set version to 75 28f3ece Doc tidying 3495331 Using SSE4.2 intrinsics in basic_parser if available bc1f0ac file_body tests 4e03d7e Add serializer::limit 85e3ee8 Shrink serializer buffers using buffers_ref 78bcdb1 Tidy up BEAST_NO_BIG_VARIANTS 3ea6cf2 Construct buffer_prefix_view in-place 69f9f7a Use file_body for valid requests, string_body otherwise. 6f88f01 Set version to 74 93fed8e remove redundant flush() from example: e0f56da Fix Beast include directories for cmake targets 5ff9e0a Add file_posix 1bb5705 Remove common/file_body.hpp 5c89d87 Add file_body 67a55c8 Add file_win32 647d3b0 Add file_stdio and File concept 89c416c Set version to 73 0efc32f Fixes for gcc-4.8 c8910ab Initialize local variable in basic_parser 8a28193 Adjust benchmarks 81e51d8 Verify certificates in SSL clients a43f6d4 Jamroot tweak 8c85ee8 Put more... links on overload reference pages ff1104e Documentation tidy 826ff0e serializer::next replaces serializer::get (API Change): 8d67775 Refactor header and message constructors: 6c79f19 Add basic_parser tests 25127d9 basic_parser optimizations: 9d082fd Set version to 72 c88e2b9 Various improvements to http_server_fast.cpp: 20b0fdb Documentation tidying afd1fa7 Add websocket-server-async example 954b597 Add http-server-threaded example df8f253 Refactor file_body for best practices 11c1037 Newly constructed responses have a 200 OK result a648817 Refine Body::size specification 40aad37 Tidy up set payload in http-server-fast 52cefbc Set version to 71 8c51c77 Tidy up Jamroot /permissive- 5efecea Update README.md 5a47acd Tidy up http_sync_port error check a2af2b5 Concept check in basic_dynamic_body 8b80a6f Fix buffer overflow handling for string_body and mutable_body ec3b4fd Return std::size_t from Body::writer::put (API Change) effbb37 Check trailers in test f5368cf Call prepare_payload in HTTP example a3e5e01 Fix spurious on_chunk invocation 96d94eb Add options for building examples and tests. Move zlib test sources to test/zlib e0efdc7 Allow close, ping, and write to happen concurrently 9c1a419 Refactor websocket composed ops d5659a4 Fine tune websocket asserts b8e8943 std::pair "last" -> "first" in http_message.qbk c691bf4 Fix can/cannot thinko in FAQ. 6dd006b Documentation revision 6d2e315 Fix extra ; warning 78a065b Set version to 70 00c7e9d Fix HEAD response in file_service 67d70d2 Fix BEAST_FALLTHROUGH in config 4f33655 Add parser::on_header to set a callback 9c16b21 Add basic_parser header and body limits: b64d1f7 Rename to message::base (API Change): 436c66a Serialize in one step when possible 3e1061b Set version to 69 f709273 Add /permissive- to msvc toolchain 0dae464 Use BEAST_FALLTHROUGH to silence warnings a70d386 basic_parser optimizations 4269f35 Set version to 68 544327f Link statically on cmake MSVC e213ffe Add const_body, mutable_body to examples 0568763 Optimize field lookups 8fc3001 Use string_ref in older Boost versions 8af77da bad_target replaces bad_path (API Change): 325dd62 Adjust buffer size in fast server be59785 Doc erratum d9b44f3 Small speed up in fields comparisons 3e6ce38 Use Boost master on Appveyor 09f3d64 Split common tests to a new project adfd22a Remove BodyReader::is_deferred (API Change): 582d28d Change BodyReader, BodyWriter requirements (API Change): 8982e14 Set version to 67 daa58a2 Group common example headers afd8f1a Rename to http-server-fast 07cb9f7 control_callback replaces ping_callback (API Change): 91e83ed Use boost::string_view 067db87 Merge stream_base to stream and tidy d61241a Add http-server-small example eb08e92 Fix doc example link 7fb75d0 Set version to 66 df86723 Respect debug flag for marked output c08565a Squelch spurious warning on gcc 188ef7c Documentation work 1c62d3a Add http-server example 3f54582 basic_fields optimizations a8b05b8 Add header aliases b94eac3 Tidy up message piecewise ctors 9c48b52 Handle bad_alloc in parser 1b57c54 Fix costly potential value-init in parser 1edc41e Make consuming_buffers smaller 72ac918 Add serializer request/response aliases 18f7606 string_param optimizations c675252 Set version to 65 c398cdd Enable msvc warnings in Jamfile 380cceb Fix unused variable warnings 4172e7e Enable unused variable warning on msvc cmake f04d227 Fix integer warnings ca975b3 Fix narrowing in deflate_stream 2fab796 Fix narrowing in inflate_stream cff87f6 Fix narrowing in ostream 1956886 Fix narrowing in static_ostream 69cdc4b Fix integer types in deflate_stream::bi_reverse 3e3dd21 Enable narrowing warning on msvc cmake e11a294 Set version to 64 a00e070 Remove make_serializer (API Change): 8449697 Add link_directories to cmake 7b2b066 Doc tidying 158d3e8 async_write requires a non-const message: d13328b Better User-Agent in examples ebcb2c0 Exemplars are compiled code b9054d3 Simplify websocket write_op c2571fe Simplify ssl teardown composed op d8ad3d1 Simplify buffered_read_stream composed op f68dc34 Set version to 63 a99f7ef Control running with valgrind explicitly 4eb7af4 Tidy up Jamfiles 49b42a5 Tidy up CMakeLists.txt dadb54f Only run the tests under ubasan d1c7696 Move benchmarks to a separate project a4aada8 Only build and run tests in variant=coverage f835b9a Don't use cached Boost a0edd82 Put num_jobs back up on Travis a8d5823 Use std::to_string instead of lexical_cast 45d8b81 Set version to 62 09e07ce Put slow tests back for coverage builds 295b1d7 Doc tidy f58425c Squelch harmless not_connected errors 9b537f7 Add http::is_fields trait d43701b message::prepare_payload replaces message::prepare (API Change): 42ba289 Refine FieldsReader concept (API Change) bde90a1 Narrow the use of Fields parameters: 5f47526 parser requires basic_fields (API Change): 60f58e4 Avoid explicit operator bool for error 352f8de Clear the error faster 34befd8 Tidy up namespaces in examples 9e0b4b5 Doc fixes and tidy c003a2a Tidy up test build scripts and projects b929130 Add server-framework tests 03d4301 Increase detail::static_ostream coverage 80d7cbc Remove libssl-dev from a Travis matrix item 4c15db4 Set version to 61 1dfbd0b Don't run slow tests on certain targets 6bb1109 Use one job less on CI 6f58342 Tidy up resolver calls 530b044 Add multi_port to server-framework bfef5d1 Tidy up http-crawl example e2f2f33 Reorganize SSL examples adc301b Fix shadowing warnings c60185e Add server-framework SSL HTTP and WebSocket ports 7912fb8 Refactor WebSocket, HTTP examples: cd4b9e0 Flush the output stream in the example d046b20 Tidy up names in error categories 9d4a422 status-codes is unsigned (API Change) e3599b0 header::version is unsigned (API Change) a26b043 Add message::header_part() fc8d2e9 Tidy up some integer conversion warnings c91732e Reorganize SSL examples 9907b31 Documentation work 4b2e78e Use generic_cateogry for errno 38c46cd Remove Spirit dependency c111d6f Set version to 60 d78dc12 Documentation work 141a524 New server-framework, full featured server example: 3f7ffd9 Fix response message type in async websocket accept 13f3750 String comparisons are public interfaces 4e4bcf8 Set version to 59 5015cdb Remove obsolete doc/README.md 71c3f0a Fix base64 alphabet aa2b843 Change Body::size signature (API Change): 80a599a Documentation work 9c19449 Integrated Beast interface. 3f8097b Set version to 58 4581777 Better message formal parameter names 5879cd8 Fix parsing chunk size with leading zeroes 56bd228 Remove redundant code 534ca63 Use static string in basic_fields::reader a7b3810 basic_parser::put doc 1e4413f basic_fields::set optimization: 9b244c1 Fix basic_fields insert ordering 4f854d0 Avoid std::string in websocket dc8f146 Renamed to basic_fields::set (API Change): 660c465 Specification for http read 981285b Documentation tidy 983d676 Reorganize examples: a2a5c57 Qualify size_t in message template d86769c Fix unaligned reads in utf8-checker 8ba182c Set version to 57 42e2791 Update doc/ for docca 1ee0afd Merge commit '101d7dbfb9725674cb9ce5a4196f19aa1d4bb801' as 'doc/docca' 101d7db Squashed 'doc/docca/' content from commit c50b3ba5 900c04e Documentation work 8eee932 Fix warning in basic_parser.cpp 437a616 Fix message.hpp javadocs 18c68ce Set version to 56 b058e90 Convert buffer in range loops cbc9212 Add Beast INTERFACE CMake target 2914b59 More basic_parser tests ed5c317 Reset error codes ba14251 Test error code handling e45e50b Tidy up README.md build instructions 16efb9b Try harder to find Boost (cmake) e281d91 HTTP/1 is the default version 916fe4a Call on_chunk when the extension is empty 9855598 Add string_view_body 19d4520 Tidy up 6e59f9b Add provisional IANA header field names 84722f2 Revert "Add a Beast CMake interface target:" fde6929 Set version to 55 01f6cc4 Documentation work a7a388c read_size replaces read_size_helper: ed8f0bb Tidy up type_traits c2f6268 Avoid a parser allocation using non-flat buffer: 906db45 Add a Beast CMake interface target: 47f2541 Don't allocate memory to handle obs-fold 6a8912a Set version to 54 296ef3b Documentation work e3e9b61 Fix incorrect use of [[fallthrough]] 3c44398 Retain ownership when reading using a message a71bb2b basic_fields refactor (API Change): d8d3562 Add string_param 83b2558 basic_fields members and coverage c4f5fa5 consuming_buffers members and coverage e10507c multi_buffer members and coverage 0e6bd3f flat_buffer coverage 7351d6e static_buffer coverage 18a8ef5 Set version to 53 452df59 Remove extraneous doc file 3ef0359 Fix read_size_helper usage: b64e6d3 Fix basic_parser::maybe_flatten (#462) 76402f7 Set version to 52 b0ceb2a Add drain_buffer class 4c6735a flat_buffer is an AllocatorAwareContainer 9d5d4d5 Documentation work d4ec693 finish(error_code&) is a BodyReader requirement (API Change) 7b24cad opcode is private (API Change): 068c2ac Documentation work a1ff89b Disable std::future snippet for libstdc++ bug b5ef664 read_frame returns `bool` fin (API Change): 7911847 Remove opcode from read, async_read (API Change): c72d70f ping_callback is a member of stream (API Change): 720a309 write_buffer_size is a member of stream (API Change): 7ff0178 read_message_max is a member of stream (API Change): cd40964 read_buffer_size is a member of stream (API Change): a58e5e1 binary, text are members of stream (API Change): ad35846 auto_fragment is a member of stream (API Change): ccee139 Documentation work 13c64e3 Set version to 51 cafc8e2 Fix infinite loop in basic_parser dc4b69d Add construct, destroy to handler_alloc 58c2739 multi_buffer implementation change (API Change): dd7f5c0 DynamicBuffer benchmarks 1c4811b Use BOOST_STRINGIZE 31051ac Use BOOST_FALLTHROUGH 8f2430b Documentation work eb35b92 Fix file_body::get() not setting the more flag correctly 566244a Tidy up file_body 53cbeea Tune up static_buffer (API Change): 20c59b7 Fix operator<< for header a2c1117 Set version to 50 6045b74 http read_some, async_read_some don't return bytes (API Change): 4df6885 Fix chunk header parsing 36bf32b Fix test::pipe read_size bf69ce1 Fix chunk delimiter parsing 0c6b6b1 Add missing handler_alloc nested types a06b8f9 Tidy up message javadoc 3bd8260 Remove obsolete serializer allocator (API Change) 001c979 Remove message free functions (API Change) 745876b Remove message connection settings (API Change) bcf2c33 Body documentation work 1e303b0 Fields concept work 9d0464a Tidy up basic_fields, header, and concepts 3ba81b5 Use field in basic_parser b5f6cc1 Use field in basic_fields and call sites cfd6d14 Documentation reference tidy 2adc80a Protect basic_fields special members (API Change) d55b079 Fix basic_fields allocator awareness d8febda Documentation work 485a6e5 Refactor prepare (API Change) 9fd3071 Derive header from Fields (API Change) 8ad26b8 Use allocator more in basic_fields 0071039 Add verb to on_request for parsers (API Change) 74f6cbb Add field enumeration be0d74f Documentation fixes 054ac40 Remove header_parser (API Change) a007eba parser is constructible from other body types d89809f Documentation work (buffer_body) ac5bc4f Set version to 49 af47128 Documentation work a1848f0 Add HEAD request example ddfbfbf Use <iosfwd> instead of <ostream> e67c0ab Refactor header status, reason, and target (API Change): 60f044a Tidy up empty_body writer error 7d267f4 Canonicalize string_view parameter types ac175cb Refactor method and verb (API Change): e18efed Documentation work d77e423 Set version to 48 d3a5a05 Documentation work acf18fb Tidy up traits 6cb188e Remove detail::sync_ostream d6092bc Documentation work 4707b21 Rename to parser (API Change): 3cb385d Consolidate parsers to parser.hpp 290bdf1 Documentation work 7cb442c Make buffer_prefix_view public ef0b121 Rename to buffer_cat_view (API Change) b9df187 Tidy up chunk decorator (API Change): 458fa7e Set version to 47 fc83a03 Documentation work 1ee3013 Fix leak in basic_flat_buffer 55fbf76 Fix undefined behavior in pausation fe75a7c Refactor HTTP serialization and parsing (API Change): 50cba32 buffer_size overload for basic_multi_buffer::const_buffers_type d977bf2 Disable operator<< for buffer_body 5db707a Refactor treatment of status code and obsolete reason (API Change): 9a585a8 Refactor treatment of request-method (API Change): 3ae76d0 Set version to 46 6004712 Documentation work 34ea0b3 Refactor serialization algorithms: 407b046 Rename to make_serializer c29451a Refactor type_traits (API Change): 8578419 Refactor HTTP serialization (API Change): f8612aa Remove HTTP header aliases (API Change): b0054e3 Add test::pipe dfba72b Set version to 45 6ba3697 Disable reverse_iterator buffer_view test 266ebac buffer_view skips empty buffer sequences 96b9892 Documentation work c23f1e2 Fix header::reason 9796106 Better test::enable_yield_to 9a8bcb7 Fix message doc image 7a5e87e Workaround for boost::asio::basic_streambuf type check 663c275 Set version to 44 f205976 Make buffers_adapter meet requirements 8e39c60 Tidy up is_dynamic_buffer traits test 0088f7c Add buffers_adapter regression test 8a23de1 Fix README websocket example 949504a Fix async return values in docs cd9f41b Use BOOST_STATIC_ASSERT 1b616fa Tidy up and make get_lowest_layer public 612e616 Require Boost 1.58 or later 1b1daa7 Tidy up read_size_helper and dynamic buffers bf0145d Use BOOST_THROW_EXCEPTION e762818 Add GitHub issue template dab679c Set version to 43 386b817 Reformat README.md QR code 50e5123 Additional constructors for consuming_buffers f7289b9 Add write limit to test::string_ostream 3aa87e0 Tidy up buffer_prefix overloads and test bee583c Fix strict aliasing warnings in buffers_view 6b54d3a Require Boost 1.64.0 76f1084 Set version to 42 0bdb148 Make buffers_view a public interface 338fc81 Add formal review notes 784f965 Fix javadoc typo 823aee2 Set version to v41 88adbdd Remove handler helpers, tidy up hook invocations (API Change) 4974af2 Rename prepare_buffer(s) to buffer_prefix (API Change) ebd459b Tidy up websocket::close_code enum and constructors c3fd6f9 Tidy up formal parameter names 210cd70 Remove coveralls integration d811962 Concept revision and documentation (API Change): bdae92a Replace asynchronous helper macros with template aliases (API Change) df95a09 Move prepare_buffers to prepare_buffer.hpp (API Change) 787de21 Remove placeholders (API Change) c59b544 Trim Appveyor matrix rows b7184f3 Return http::error::end_of_stream on HTTP read eof (API Change) f2d8255 Set version to 40 40b9194 Tidy up .travis.yml: 9b240c7 Fix basic_streambuf movable trait 76a2617 Consolidate get_lowest_layer in type_traits.hpp 6d00321 Add to_static_string: f888136 Set version to 39 47c82b5 Better travis deps 4ed7865 Squelch openssl spurious leak and memory errors b6bc26f Fixed braced-init error with older gcc 59b2f8f ostream workaround for gcc 4.8.4 8363d86 Increase ostream test coverage 5631936 Tidy up HTTP reason_string (API Change): 2bf5150 Harmonize concepts and identifiers with net-ts (API Change): 728e9d8 Tidy up basic_parser javadocs 1c9067b Use beast::string_view alias 771c5ca Doc fixes and tidying e2b5c31 Rename to buffered_read_stream (API Change): a753f1c Rename to static_buffer, static_buffer_n (API Change): 24b6686 Rename to flat_buffer, basic_flat_buffer (API Change): 69259ef Rename to multi_buffer, basic_multi_buffer (API Change): bef9ae1 New buffers() replaces to_string() (API Change): a7ef4f5 New ostream() returns dynamic buffer output stream (API Change): 87fd60c Fix eof error on ssl::stream shutdown 606fc9d Add websocket async echo ssl server test: ff5e659 Refactor http::header contents (API Change): dd02097 Set version to 1.0.0-b38 5596e97 Prevent basic_fields operator[] assignment c2b32dc Remove websocket::keep_alive option (API Change): 32dbfb2 Refactor WebSocket error codes (API Change): dd6b500 WebSocket doc work 0b4d87c More flat_streambuf tests aacefb4 Add test_allocator to extras/test 931a5fb Simplify get_lowest_layer test ba4228a Use static_string for WebSocket handshakes: 6df3ff3 Refactor base64: 19b124d Refactor static_string: 30e8d16 Set version to 1.0.0-b37 b141020 Fix narrowing warning in table constants d554b81 Add -funsigned-char to asan build target bcc6ad8 Add ub sanitizer blacklist e1f08e9 Fix flat_streambuf: 7d08f59 Fix typo in documentation example 21ef97d Rename to http::dynamic_body, consolidate header: 45a2d73 Rename project to http-bench c86fee9 Move everything in basic_fields.hpp to fields.hpp (API Change) a14a5d6 Rename to detail::is_invocable 540d037 Rename to websocket::detail::pausation 84e1739 Document websocket::stream thread safety dc274af Add is_upgrade() free function: 2c17d04 Refactor websocket decorators (API Change): 235fe68 Provide websocket::stream accept() overloads (API Change): a715825 CMake hide command lines in .vcxproj Output windows 32024d8 Set version to 1.0.0-b36 f48b95f Update README.md d8db5f1 Set version to 1.0.0-b35 dd2a514 Tidy up doc declarations 2c50aba Fix README.md CMake instructions 4ffdce2 Update .gitignore for VS2017 403011f Remove http::empty_body (API Change) f47b661 New HTTP interfaces (API Change): f6835b8 Rename to BEAST_DOXYGEN 7e37723 Add flat_streambuf: 5b68faa Doc XSL support for list and table markdown 3de46de Make websocket::close_code a proper enum: 0128743 Tidy up MSVC CMake configuration ccd188e Add appveyor build script git-subtree-dir: src/beast git-subtree-split: 3bcd9865f80f12ba5faad35c564918f85b02e271
2469 lines
70 KiB
C
2469 lines
70 KiB
C
/* Based on src/http/ngx_http_parse.c from NGINX copyright Igor Sysoev
|
|
*
|
|
* Additional changes are licensed under the same terms as NGINX and
|
|
* copyright Joyent, Inc. and other Node contributors. All rights reserved.
|
|
*
|
|
* Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
* of this software and associated documentation files (the "Software"), to
|
|
* deal in the Software without restriction, including without limitation the
|
|
* rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
|
|
* sell copies of the Software, and to permit persons to whom the Software is
|
|
* furnished to do so, subject to the following conditions:
|
|
*
|
|
* The above copyright notice and this permission notice shall be included in
|
|
* all copies or substantial portions of the Software.
|
|
*
|
|
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
|
* AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
|
|
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
|
|
* IN THE SOFTWARE.
|
|
*/
|
|
#include "http_parser.h"
|
|
#include <assert.h>
|
|
#include <stddef.h>
|
|
#include <ctype.h>
|
|
#include <stdlib.h>
|
|
#include <string.h>
|
|
#include <limits.h>
|
|
|
|
#ifndef ULLONG_MAX
|
|
# define ULLONG_MAX ((uint64_t) -1) /* 2^64-1 */
|
|
#endif
|
|
|
|
#ifndef MIN
|
|
# define MIN(a,b) ((a) < (b) ? (a) : (b))
|
|
#endif
|
|
|
|
#ifndef ARRAY_SIZE
|
|
# define ARRAY_SIZE(a) (sizeof(a) / sizeof((a)[0]))
|
|
#endif
|
|
|
|
#ifndef BIT_AT
|
|
# define BIT_AT(a, i) \
|
|
(!!((unsigned int) (a)[(unsigned int) (i) >> 3] & \
|
|
(1 << ((unsigned int) (i) & 7))))
|
|
#endif
|
|
|
|
#ifndef ELEM_AT
|
|
# define ELEM_AT(a, i, v) ((unsigned int) (i) < ARRAY_SIZE(a) ? (a)[(i)] : (v))
|
|
#endif
|
|
|
|
#define SET_ERRNO(e) \
|
|
do { \
|
|
parser->http_errno = (e); \
|
|
} while(0)
|
|
|
|
#define CURRENT_STATE() p_state
|
|
#define UPDATE_STATE(V) p_state = (enum state) (V);
|
|
#define RETURN(V) \
|
|
do { \
|
|
parser->state = CURRENT_STATE(); \
|
|
return (V); \
|
|
} while (0);
|
|
#define REEXECUTE() \
|
|
goto reexecute; \
|
|
|
|
|
|
#ifdef __GNUC__
|
|
# define LIKELY(X) __builtin_expect(!!(X), 1)
|
|
# define UNLIKELY(X) __builtin_expect(!!(X), 0)
|
|
#else
|
|
# define LIKELY(X) (X)
|
|
# define UNLIKELY(X) (X)
|
|
#endif
|
|
|
|
|
|
/* Run the notify callback FOR, returning ER if it fails */
|
|
#define CALLBACK_NOTIFY_(FOR, ER) \
|
|
do { \
|
|
assert(HTTP_PARSER_ERRNO(parser) == HPE_OK); \
|
|
\
|
|
if (LIKELY(settings->on_##FOR)) { \
|
|
parser->state = CURRENT_STATE(); \
|
|
if (UNLIKELY(0 != settings->on_##FOR(parser))) { \
|
|
SET_ERRNO(HPE_CB_##FOR); \
|
|
} \
|
|
UPDATE_STATE(parser->state); \
|
|
\
|
|
/* We either errored above or got paused; get out */ \
|
|
if (UNLIKELY(HTTP_PARSER_ERRNO(parser) != HPE_OK)) { \
|
|
return (ER); \
|
|
} \
|
|
} \
|
|
} while (0)
|
|
|
|
/* Run the notify callback FOR and consume the current byte */
|
|
#define CALLBACK_NOTIFY(FOR) CALLBACK_NOTIFY_(FOR, p - data + 1)
|
|
|
|
/* Run the notify callback FOR and don't consume the current byte */
|
|
#define CALLBACK_NOTIFY_NOADVANCE(FOR) CALLBACK_NOTIFY_(FOR, p - data)
|
|
|
|
/* Run data callback FOR with LEN bytes, returning ER if it fails */
|
|
#define CALLBACK_DATA_(FOR, LEN, ER) \
|
|
do { \
|
|
assert(HTTP_PARSER_ERRNO(parser) == HPE_OK); \
|
|
\
|
|
if (FOR##_mark) { \
|
|
if (LIKELY(settings->on_##FOR)) { \
|
|
parser->state = CURRENT_STATE(); \
|
|
if (UNLIKELY(0 != \
|
|
settings->on_##FOR(parser, FOR##_mark, (LEN)))) { \
|
|
SET_ERRNO(HPE_CB_##FOR); \
|
|
} \
|
|
UPDATE_STATE(parser->state); \
|
|
\
|
|
/* We either errored above or got paused; get out */ \
|
|
if (UNLIKELY(HTTP_PARSER_ERRNO(parser) != HPE_OK)) { \
|
|
return (ER); \
|
|
} \
|
|
} \
|
|
FOR##_mark = NULL; \
|
|
} \
|
|
} while (0)
|
|
|
|
/* Run the data callback FOR and consume the current byte */
|
|
#define CALLBACK_DATA(FOR) \
|
|
CALLBACK_DATA_(FOR, p - FOR##_mark, p - data + 1)
|
|
|
|
/* Run the data callback FOR and don't consume the current byte */
|
|
#define CALLBACK_DATA_NOADVANCE(FOR) \
|
|
CALLBACK_DATA_(FOR, p - FOR##_mark, p - data)
|
|
|
|
/* Set the mark FOR; non-destructive if mark is already set */
|
|
#define MARK(FOR) \
|
|
do { \
|
|
if (!FOR##_mark) { \
|
|
FOR##_mark = p; \
|
|
} \
|
|
} while (0)
|
|
|
|
/* Don't allow the total size of the HTTP headers (including the status
|
|
* line) to exceed HTTP_MAX_HEADER_SIZE. This check is here to protect
|
|
* embedders against denial-of-service attacks where the attacker feeds
|
|
* us a never-ending header that the embedder keeps buffering.
|
|
*
|
|
* This check is arguably the responsibility of embedders but we're doing
|
|
* it on the embedder's behalf because most won't bother and this way we
|
|
* make the web a little safer. HTTP_MAX_HEADER_SIZE is still far bigger
|
|
* than any reasonable request or response so this should never affect
|
|
* day-to-day operation.
|
|
*/
|
|
#define COUNT_HEADER_SIZE(V) \
|
|
do { \
|
|
parser->nread += (V); \
|
|
if (UNLIKELY(parser->nread > (HTTP_MAX_HEADER_SIZE))) { \
|
|
SET_ERRNO(HPE_HEADER_OVERFLOW); \
|
|
goto error; \
|
|
} \
|
|
} while (0)
|
|
|
|
|
|
#define PROXY_CONNECTION "proxy-connection"
|
|
#define CONNECTION "connection"
|
|
#define CONTENT_LENGTH "content-length"
|
|
#define TRANSFER_ENCODING "transfer-encoding"
|
|
#define UPGRADE "upgrade"
|
|
#define CHUNKED "chunked"
|
|
#define KEEP_ALIVE "keep-alive"
|
|
#define CLOSE "close"
|
|
|
|
|
|
static const char *method_strings[] =
|
|
{
|
|
#define XX(num, name, string) #string,
|
|
HTTP_METHOD_MAP(XX)
|
|
#undef XX
|
|
};
|
|
|
|
|
|
/* Tokens as defined by rfc 2616. Also lowercases them.
|
|
* token = 1*<any CHAR except CTLs or separators>
|
|
* separators = "(" | ")" | "<" | ">" | "@"
|
|
* | "," | ";" | ":" | "\" | <">
|
|
* | "/" | "[" | "]" | "?" | "="
|
|
* | "{" | "}" | SP | HT
|
|
*/
|
|
static const char tokens[256] = {
|
|
/* 0 nul 1 soh 2 stx 3 etx 4 eot 5 enq 6 ack 7 bel */
|
|
0, 0, 0, 0, 0, 0, 0, 0,
|
|
/* 8 bs 9 ht 10 nl 11 vt 12 np 13 cr 14 so 15 si */
|
|
0, 0, 0, 0, 0, 0, 0, 0,
|
|
/* 16 dle 17 dc1 18 dc2 19 dc3 20 dc4 21 nak 22 syn 23 etb */
|
|
0, 0, 0, 0, 0, 0, 0, 0,
|
|
/* 24 can 25 em 26 sub 27 esc 28 fs 29 gs 30 rs 31 us */
|
|
0, 0, 0, 0, 0, 0, 0, 0,
|
|
/* 32 sp 33 ! 34 " 35 # 36 $ 37 % 38 & 39 ' */
|
|
0, '!', 0, '#', '$', '%', '&', '\'',
|
|
/* 40 ( 41 ) 42 * 43 + 44 , 45 - 46 . 47 / */
|
|
0, 0, '*', '+', 0, '-', '.', 0,
|
|
/* 48 0 49 1 50 2 51 3 52 4 53 5 54 6 55 7 */
|
|
'0', '1', '2', '3', '4', '5', '6', '7',
|
|
/* 56 8 57 9 58 : 59 ; 60 < 61 = 62 > 63 ? */
|
|
'8', '9', 0, 0, 0, 0, 0, 0,
|
|
/* 64 @ 65 A 66 B 67 C 68 D 69 E 70 F 71 G */
|
|
0, 'a', 'b', 'c', 'd', 'e', 'f', 'g',
|
|
/* 72 H 73 I 74 J 75 K 76 L 77 M 78 N 79 O */
|
|
'h', 'i', 'j', 'k', 'l', 'm', 'n', 'o',
|
|
/* 80 P 81 Q 82 R 83 S 84 T 85 U 86 V 87 W */
|
|
'p', 'q', 'r', 's', 't', 'u', 'v', 'w',
|
|
/* 88 X 89 Y 90 Z 91 [ 92 \ 93 ] 94 ^ 95 _ */
|
|
'x', 'y', 'z', 0, 0, 0, '^', '_',
|
|
/* 96 ` 97 a 98 b 99 c 100 d 101 e 102 f 103 g */
|
|
'`', 'a', 'b', 'c', 'd', 'e', 'f', 'g',
|
|
/* 104 h 105 i 106 j 107 k 108 l 109 m 110 n 111 o */
|
|
'h', 'i', 'j', 'k', 'l', 'm', 'n', 'o',
|
|
/* 112 p 113 q 114 r 115 s 116 t 117 u 118 v 119 w */
|
|
'p', 'q', 'r', 's', 't', 'u', 'v', 'w',
|
|
/* 120 x 121 y 122 z 123 { 124 | 125 } 126 ~ 127 del */
|
|
'x', 'y', 'z', 0, '|', 0, '~', 0 };
|
|
|
|
|
|
static const int8_t unhex[256] =
|
|
{-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1
|
|
,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1
|
|
,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1
|
|
, 0, 1, 2, 3, 4, 5, 6, 7, 8, 9,-1,-1,-1,-1,-1,-1
|
|
,-1,10,11,12,13,14,15,-1,-1,-1,-1,-1,-1,-1,-1,-1
|
|
,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1
|
|
,-1,10,11,12,13,14,15,-1,-1,-1,-1,-1,-1,-1,-1,-1
|
|
,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1
|
|
};
|
|
|
|
|
|
#if HTTP_PARSER_STRICT
|
|
# define T(v) 0
|
|
#else
|
|
# define T(v) v
|
|
#endif
|
|
|
|
|
|
static const uint8_t normal_url_char[32] = {
|
|
/* 0 nul 1 soh 2 stx 3 etx 4 eot 5 enq 6 ack 7 bel */
|
|
0 | 0 | 0 | 0 | 0 | 0 | 0 | 0,
|
|
/* 8 bs 9 ht 10 nl 11 vt 12 np 13 cr 14 so 15 si */
|
|
0 | T(2) | 0 | 0 | T(16) | 0 | 0 | 0,
|
|
/* 16 dle 17 dc1 18 dc2 19 dc3 20 dc4 21 nak 22 syn 23 etb */
|
|
0 | 0 | 0 | 0 | 0 | 0 | 0 | 0,
|
|
/* 24 can 25 em 26 sub 27 esc 28 fs 29 gs 30 rs 31 us */
|
|
0 | 0 | 0 | 0 | 0 | 0 | 0 | 0,
|
|
/* 32 sp 33 ! 34 " 35 # 36 $ 37 % 38 & 39 ' */
|
|
0 | 2 | 4 | 0 | 16 | 32 | 64 | 128,
|
|
/* 40 ( 41 ) 42 * 43 + 44 , 45 - 46 . 47 / */
|
|
1 | 2 | 4 | 8 | 16 | 32 | 64 | 128,
|
|
/* 48 0 49 1 50 2 51 3 52 4 53 5 54 6 55 7 */
|
|
1 | 2 | 4 | 8 | 16 | 32 | 64 | 128,
|
|
/* 56 8 57 9 58 : 59 ; 60 < 61 = 62 > 63 ? */
|
|
1 | 2 | 4 | 8 | 16 | 32 | 64 | 0,
|
|
/* 64 @ 65 A 66 B 67 C 68 D 69 E 70 F 71 G */
|
|
1 | 2 | 4 | 8 | 16 | 32 | 64 | 128,
|
|
/* 72 H 73 I 74 J 75 K 76 L 77 M 78 N 79 O */
|
|
1 | 2 | 4 | 8 | 16 | 32 | 64 | 128,
|
|
/* 80 P 81 Q 82 R 83 S 84 T 85 U 86 V 87 W */
|
|
1 | 2 | 4 | 8 | 16 | 32 | 64 | 128,
|
|
/* 88 X 89 Y 90 Z 91 [ 92 \ 93 ] 94 ^ 95 _ */
|
|
1 | 2 | 4 | 8 | 16 | 32 | 64 | 128,
|
|
/* 96 ` 97 a 98 b 99 c 100 d 101 e 102 f 103 g */
|
|
1 | 2 | 4 | 8 | 16 | 32 | 64 | 128,
|
|
/* 104 h 105 i 106 j 107 k 108 l 109 m 110 n 111 o */
|
|
1 | 2 | 4 | 8 | 16 | 32 | 64 | 128,
|
|
/* 112 p 113 q 114 r 115 s 116 t 117 u 118 v 119 w */
|
|
1 | 2 | 4 | 8 | 16 | 32 | 64 | 128,
|
|
/* 120 x 121 y 122 z 123 { 124 | 125 } 126 ~ 127 del */
|
|
1 | 2 | 4 | 8 | 16 | 32 | 64 | 0, };
|
|
|
|
#undef T
|
|
|
|
enum state
|
|
{ s_dead = 1 /* important that this is > 0 */
|
|
|
|
, s_start_req_or_res
|
|
, s_res_or_resp_H
|
|
, s_start_res
|
|
, s_res_H
|
|
, s_res_HT
|
|
, s_res_HTT
|
|
, s_res_HTTP
|
|
, s_res_first_http_major
|
|
, s_res_http_major
|
|
, s_res_first_http_minor
|
|
, s_res_http_minor
|
|
, s_res_first_status_code
|
|
, s_res_status_code
|
|
, s_res_status_start
|
|
, s_res_status
|
|
, s_res_line_almost_done
|
|
|
|
, s_start_req
|
|
|
|
, s_req_method
|
|
, s_req_spaces_before_url
|
|
, s_req_schema
|
|
, s_req_schema_slash
|
|
, s_req_schema_slash_slash
|
|
, s_req_server_start
|
|
, s_req_server
|
|
, s_req_server_with_at
|
|
, s_req_path
|
|
, s_req_query_string_start
|
|
, s_req_query_string
|
|
, s_req_fragment_start
|
|
, s_req_fragment
|
|
, s_req_http_start
|
|
, s_req_http_H
|
|
, s_req_http_HT
|
|
, s_req_http_HTT
|
|
, s_req_http_HTTP
|
|
, s_req_first_http_major
|
|
, s_req_http_major
|
|
, s_req_first_http_minor
|
|
, s_req_http_minor
|
|
, s_req_line_almost_done
|
|
|
|
, s_header_field_start
|
|
, s_header_field
|
|
, s_header_value_discard_ws
|
|
, s_header_value_discard_ws_almost_done
|
|
, s_header_value_discard_lws
|
|
, s_header_value_start
|
|
, s_header_value
|
|
, s_header_value_lws
|
|
|
|
, s_header_almost_done
|
|
|
|
, s_chunk_size_start
|
|
, s_chunk_size
|
|
, s_chunk_parameters
|
|
, s_chunk_size_almost_done
|
|
|
|
, s_headers_almost_done
|
|
, s_headers_done
|
|
|
|
/* Important: 's_headers_done' must be the last 'header' state. All
|
|
* states beyond this must be 'body' states. It is used for overflow
|
|
* checking. See the PARSING_HEADER() macro.
|
|
*/
|
|
|
|
, s_chunk_data
|
|
, s_chunk_data_almost_done
|
|
, s_chunk_data_done
|
|
|
|
, s_body_identity
|
|
, s_body_identity_eof
|
|
|
|
, s_message_done
|
|
};
|
|
|
|
|
|
#define PARSING_HEADER(state) (state <= s_headers_done)
|
|
|
|
|
|
enum header_states
|
|
{ h_general = 0
|
|
, h_C
|
|
, h_CO
|
|
, h_CON
|
|
|
|
, h_matching_connection
|
|
, h_matching_proxy_connection
|
|
, h_matching_content_length
|
|
, h_matching_transfer_encoding
|
|
, h_matching_upgrade
|
|
|
|
, h_connection
|
|
, h_content_length
|
|
, h_transfer_encoding
|
|
, h_upgrade
|
|
|
|
, h_matching_transfer_encoding_chunked
|
|
, h_matching_connection_token_start
|
|
, h_matching_connection_keep_alive
|
|
, h_matching_connection_close
|
|
, h_matching_connection_upgrade
|
|
, h_matching_connection_token
|
|
|
|
, h_transfer_encoding_chunked
|
|
, h_connection_keep_alive
|
|
, h_connection_close
|
|
, h_connection_upgrade
|
|
};
|
|
|
|
enum http_host_state
|
|
{
|
|
s_http_host_dead = 1
|
|
, s_http_userinfo_start
|
|
, s_http_userinfo
|
|
, s_http_host_start
|
|
, s_http_host_v6_start
|
|
, s_http_host
|
|
, s_http_host_v6
|
|
, s_http_host_v6_end
|
|
, s_http_host_v6_zone_start
|
|
, s_http_host_v6_zone
|
|
, s_http_host_port_start
|
|
, s_http_host_port
|
|
};
|
|
|
|
/* Macros for character classes; depends on strict-mode */
|
|
#define CR '\r'
|
|
#define LF '\n'
|
|
#define LOWER(c) (unsigned char)(c | 0x20)
|
|
#define IS_ALPHA(c) (LOWER(c) >= 'a' && LOWER(c) <= 'z')
|
|
#define IS_NUM(c) ((c) >= '0' && (c) <= '9')
|
|
#define IS_ALPHANUM(c) (IS_ALPHA(c) || IS_NUM(c))
|
|
#define IS_HEX(c) (IS_NUM(c) || (LOWER(c) >= 'a' && LOWER(c) <= 'f'))
|
|
#define IS_MARK(c) ((c) == '-' || (c) == '_' || (c) == '.' || \
|
|
(c) == '!' || (c) == '~' || (c) == '*' || (c) == '\'' || (c) == '(' || \
|
|
(c) == ')')
|
|
#define IS_USERINFO_CHAR(c) (IS_ALPHANUM(c) || IS_MARK(c) || (c) == '%' || \
|
|
(c) == ';' || (c) == ':' || (c) == '&' || (c) == '=' || (c) == '+' || \
|
|
(c) == '$' || (c) == ',')
|
|
|
|
#define STRICT_TOKEN(c) (tokens[(unsigned char)c])
|
|
|
|
#if HTTP_PARSER_STRICT
|
|
#define TOKEN(c) (tokens[(unsigned char)c])
|
|
#define IS_URL_CHAR(c) (BIT_AT(normal_url_char, (unsigned char)c))
|
|
#define IS_HOST_CHAR(c) (IS_ALPHANUM(c) || (c) == '.' || (c) == '-')
|
|
#else
|
|
#define TOKEN(c) ((c == ' ') ? ' ' : tokens[(unsigned char)c])
|
|
#define IS_URL_CHAR(c) \
|
|
(BIT_AT(normal_url_char, (unsigned char)c) || ((c) & 0x80))
|
|
#define IS_HOST_CHAR(c) \
|
|
(IS_ALPHANUM(c) || (c) == '.' || (c) == '-' || (c) == '_')
|
|
#endif
|
|
|
|
/**
|
|
* Verify that a char is a valid visible (printable) US-ASCII
|
|
* character or %x80-FF
|
|
**/
|
|
#define IS_HEADER_CHAR(ch) \
|
|
(ch == CR || ch == LF || ch == 9 || ((unsigned char)ch > 31 && ch != 127))
|
|
|
|
#define start_state (parser->type == HTTP_REQUEST ? s_start_req : s_start_res)
|
|
|
|
|
|
#if HTTP_PARSER_STRICT
|
|
# define STRICT_CHECK(cond) \
|
|
do { \
|
|
if (cond) { \
|
|
SET_ERRNO(HPE_STRICT); \
|
|
goto error; \
|
|
} \
|
|
} while (0)
|
|
# define NEW_MESSAGE() (http_should_keep_alive(parser) ? start_state : s_dead)
|
|
#else
|
|
# define STRICT_CHECK(cond)
|
|
# define NEW_MESSAGE() start_state
|
|
#endif
|
|
|
|
|
|
/* Map errno values to strings for human-readable output */
|
|
#define HTTP_STRERROR_GEN(n, s) { "HPE_" #n, s },
|
|
static struct {
|
|
const char *name;
|
|
const char *description;
|
|
} http_strerror_tab[] = {
|
|
HTTP_ERRNO_MAP(HTTP_STRERROR_GEN)
|
|
};
|
|
#undef HTTP_STRERROR_GEN
|
|
|
|
int http_message_needs_eof(const http_parser *parser);
|
|
|
|
/* Our URL parser.
|
|
*
|
|
* This is designed to be shared by http_parser_execute() for URL validation,
|
|
* hence it has a state transition + byte-for-byte interface. In addition, it
|
|
* is meant to be embedded in http_parser_parse_url(), which does the dirty
|
|
* work of turning state transitions URL components for its API.
|
|
*
|
|
* This function should only be invoked with non-space characters. It is
|
|
* assumed that the caller cares about (and can detect) the transition between
|
|
* URL and non-URL states by looking for these.
|
|
*/
|
|
static enum state
|
|
parse_url_char(enum state s, const char ch)
|
|
{
|
|
if (ch == ' ' || ch == '\r' || ch == '\n') {
|
|
return s_dead;
|
|
}
|
|
|
|
#if HTTP_PARSER_STRICT
|
|
if (ch == '\t' || ch == '\f') {
|
|
return s_dead;
|
|
}
|
|
#endif
|
|
|
|
switch (s) {
|
|
case s_req_spaces_before_url:
|
|
/* Proxied requests are followed by scheme of an absolute URI (alpha).
|
|
* All methods except CONNECT are followed by '/' or '*'.
|
|
*/
|
|
|
|
if (ch == '/' || ch == '*') {
|
|
return s_req_path;
|
|
}
|
|
|
|
if (IS_ALPHA(ch)) {
|
|
return s_req_schema;
|
|
}
|
|
|
|
break;
|
|
|
|
case s_req_schema:
|
|
if (IS_ALPHA(ch)) {
|
|
return s;
|
|
}
|
|
|
|
if (ch == ':') {
|
|
return s_req_schema_slash;
|
|
}
|
|
|
|
break;
|
|
|
|
case s_req_schema_slash:
|
|
if (ch == '/') {
|
|
return s_req_schema_slash_slash;
|
|
}
|
|
|
|
break;
|
|
|
|
case s_req_schema_slash_slash:
|
|
if (ch == '/') {
|
|
return s_req_server_start;
|
|
}
|
|
|
|
break;
|
|
|
|
case s_req_server_with_at:
|
|
if (ch == '@') {
|
|
return s_dead;
|
|
}
|
|
|
|
/* FALLTHROUGH */
|
|
case s_req_server_start:
|
|
case s_req_server:
|
|
if (ch == '/') {
|
|
return s_req_path;
|
|
}
|
|
|
|
if (ch == '?') {
|
|
return s_req_query_string_start;
|
|
}
|
|
|
|
if (ch == '@') {
|
|
return s_req_server_with_at;
|
|
}
|
|
|
|
if (IS_USERINFO_CHAR(ch) || ch == '[' || ch == ']') {
|
|
return s_req_server;
|
|
}
|
|
|
|
break;
|
|
|
|
case s_req_path:
|
|
if (IS_URL_CHAR(ch)) {
|
|
return s;
|
|
}
|
|
|
|
switch (ch) {
|
|
case '?':
|
|
return s_req_query_string_start;
|
|
|
|
case '#':
|
|
return s_req_fragment_start;
|
|
}
|
|
|
|
break;
|
|
|
|
case s_req_query_string_start:
|
|
case s_req_query_string:
|
|
if (IS_URL_CHAR(ch)) {
|
|
return s_req_query_string;
|
|
}
|
|
|
|
switch (ch) {
|
|
case '?':
|
|
/* allow extra '?' in query string */
|
|
return s_req_query_string;
|
|
|
|
case '#':
|
|
return s_req_fragment_start;
|
|
}
|
|
|
|
break;
|
|
|
|
case s_req_fragment_start:
|
|
if (IS_URL_CHAR(ch)) {
|
|
return s_req_fragment;
|
|
}
|
|
|
|
switch (ch) {
|
|
case '?':
|
|
return s_req_fragment;
|
|
|
|
case '#':
|
|
return s;
|
|
}
|
|
|
|
break;
|
|
|
|
case s_req_fragment:
|
|
if (IS_URL_CHAR(ch)) {
|
|
return s;
|
|
}
|
|
|
|
switch (ch) {
|
|
case '?':
|
|
case '#':
|
|
return s;
|
|
}
|
|
|
|
break;
|
|
|
|
default:
|
|
break;
|
|
}
|
|
|
|
/* We should never fall out of the switch above unless there's an error */
|
|
return s_dead;
|
|
}
|
|
|
|
size_t http_parser_execute (http_parser *parser,
|
|
const http_parser_settings *settings,
|
|
const char *data,
|
|
size_t len)
|
|
{
|
|
char c, ch;
|
|
int8_t unhex_val;
|
|
const char *p = data;
|
|
const char *header_field_mark = 0;
|
|
const char *header_value_mark = 0;
|
|
const char *url_mark = 0;
|
|
const char *body_mark = 0;
|
|
const char *status_mark = 0;
|
|
enum state p_state = (enum state) parser->state;
|
|
const unsigned int lenient = parser->lenient_http_headers;
|
|
|
|
/* We're in an error state. Don't bother doing anything. */
|
|
if (HTTP_PARSER_ERRNO(parser) != HPE_OK) {
|
|
return 0;
|
|
}
|
|
|
|
if (len == 0) {
|
|
switch (CURRENT_STATE()) {
|
|
case s_body_identity_eof:
|
|
/* Use of CALLBACK_NOTIFY() here would erroneously return 1 byte read if
|
|
* we got paused.
|
|
*/
|
|
CALLBACK_NOTIFY_NOADVANCE(message_complete);
|
|
return 0;
|
|
|
|
case s_dead:
|
|
case s_start_req_or_res:
|
|
case s_start_res:
|
|
case s_start_req:
|
|
return 0;
|
|
|
|
default:
|
|
SET_ERRNO(HPE_INVALID_EOF_STATE);
|
|
return 1;
|
|
}
|
|
}
|
|
|
|
|
|
if (CURRENT_STATE() == s_header_field)
|
|
header_field_mark = data;
|
|
if (CURRENT_STATE() == s_header_value)
|
|
header_value_mark = data;
|
|
switch (CURRENT_STATE()) {
|
|
case s_req_path:
|
|
case s_req_schema:
|
|
case s_req_schema_slash:
|
|
case s_req_schema_slash_slash:
|
|
case s_req_server_start:
|
|
case s_req_server:
|
|
case s_req_server_with_at:
|
|
case s_req_query_string_start:
|
|
case s_req_query_string:
|
|
case s_req_fragment_start:
|
|
case s_req_fragment:
|
|
url_mark = data;
|
|
break;
|
|
case s_res_status:
|
|
status_mark = data;
|
|
break;
|
|
default:
|
|
break;
|
|
}
|
|
|
|
for (p=data; p != data + len; p++) {
|
|
ch = *p;
|
|
|
|
if (PARSING_HEADER(CURRENT_STATE()))
|
|
COUNT_HEADER_SIZE(1);
|
|
|
|
reexecute:
|
|
switch (CURRENT_STATE()) {
|
|
|
|
case s_dead:
|
|
/* this state is used after a 'Connection: close' message
|
|
* the parser will error out if it reads another message
|
|
*/
|
|
if (LIKELY(ch == CR || ch == LF))
|
|
break;
|
|
|
|
SET_ERRNO(HPE_CLOSED_CONNECTION);
|
|
goto error;
|
|
|
|
case s_start_req_or_res:
|
|
{
|
|
if (ch == CR || ch == LF)
|
|
break;
|
|
parser->flags = 0;
|
|
parser->content_length = ULLONG_MAX;
|
|
|
|
if (ch == 'H') {
|
|
UPDATE_STATE(s_res_or_resp_H);
|
|
|
|
CALLBACK_NOTIFY(message_begin);
|
|
} else {
|
|
parser->type = HTTP_REQUEST;
|
|
UPDATE_STATE(s_start_req);
|
|
REEXECUTE();
|
|
}
|
|
|
|
break;
|
|
}
|
|
|
|
case s_res_or_resp_H:
|
|
if (ch == 'T') {
|
|
parser->type = HTTP_RESPONSE;
|
|
UPDATE_STATE(s_res_HT);
|
|
} else {
|
|
if (UNLIKELY(ch != 'E')) {
|
|
SET_ERRNO(HPE_INVALID_CONSTANT);
|
|
goto error;
|
|
}
|
|
|
|
parser->type = HTTP_REQUEST;
|
|
parser->method = HTTP_HEAD;
|
|
parser->index = 2;
|
|
UPDATE_STATE(s_req_method);
|
|
}
|
|
break;
|
|
|
|
case s_start_res:
|
|
{
|
|
parser->flags = 0;
|
|
parser->content_length = ULLONG_MAX;
|
|
|
|
switch (ch) {
|
|
case 'H':
|
|
UPDATE_STATE(s_res_H);
|
|
break;
|
|
|
|
case CR:
|
|
case LF:
|
|
break;
|
|
|
|
default:
|
|
SET_ERRNO(HPE_INVALID_CONSTANT);
|
|
goto error;
|
|
}
|
|
|
|
CALLBACK_NOTIFY(message_begin);
|
|
break;
|
|
}
|
|
|
|
case s_res_H:
|
|
STRICT_CHECK(ch != 'T');
|
|
UPDATE_STATE(s_res_HT);
|
|
break;
|
|
|
|
case s_res_HT:
|
|
STRICT_CHECK(ch != 'T');
|
|
UPDATE_STATE(s_res_HTT);
|
|
break;
|
|
|
|
case s_res_HTT:
|
|
STRICT_CHECK(ch != 'P');
|
|
UPDATE_STATE(s_res_HTTP);
|
|
break;
|
|
|
|
case s_res_HTTP:
|
|
STRICT_CHECK(ch != '/');
|
|
UPDATE_STATE(s_res_first_http_major);
|
|
break;
|
|
|
|
case s_res_first_http_major:
|
|
if (UNLIKELY(ch < '0' || ch > '9')) {
|
|
SET_ERRNO(HPE_INVALID_VERSION);
|
|
goto error;
|
|
}
|
|
|
|
parser->http_major = ch - '0';
|
|
UPDATE_STATE(s_res_http_major);
|
|
break;
|
|
|
|
/* major HTTP version or dot */
|
|
case s_res_http_major:
|
|
{
|
|
if (ch == '.') {
|
|
UPDATE_STATE(s_res_first_http_minor);
|
|
break;
|
|
}
|
|
|
|
if (!IS_NUM(ch)) {
|
|
SET_ERRNO(HPE_INVALID_VERSION);
|
|
goto error;
|
|
}
|
|
|
|
parser->http_major *= 10;
|
|
parser->http_major += ch - '0';
|
|
|
|
if (UNLIKELY(parser->http_major > 999)) {
|
|
SET_ERRNO(HPE_INVALID_VERSION);
|
|
goto error;
|
|
}
|
|
|
|
break;
|
|
}
|
|
|
|
/* first digit of minor HTTP version */
|
|
case s_res_first_http_minor:
|
|
if (UNLIKELY(!IS_NUM(ch))) {
|
|
SET_ERRNO(HPE_INVALID_VERSION);
|
|
goto error;
|
|
}
|
|
|
|
parser->http_minor = ch - '0';
|
|
UPDATE_STATE(s_res_http_minor);
|
|
break;
|
|
|
|
/* minor HTTP version or end of request line */
|
|
case s_res_http_minor:
|
|
{
|
|
if (ch == ' ') {
|
|
UPDATE_STATE(s_res_first_status_code);
|
|
break;
|
|
}
|
|
|
|
if (UNLIKELY(!IS_NUM(ch))) {
|
|
SET_ERRNO(HPE_INVALID_VERSION);
|
|
goto error;
|
|
}
|
|
|
|
parser->http_minor *= 10;
|
|
parser->http_minor += ch - '0';
|
|
|
|
if (UNLIKELY(parser->http_minor > 999)) {
|
|
SET_ERRNO(HPE_INVALID_VERSION);
|
|
goto error;
|
|
}
|
|
|
|
break;
|
|
}
|
|
|
|
case s_res_first_status_code:
|
|
{
|
|
if (!IS_NUM(ch)) {
|
|
if (ch == ' ') {
|
|
break;
|
|
}
|
|
|
|
SET_ERRNO(HPE_INVALID_STATUS);
|
|
goto error;
|
|
}
|
|
parser->status_code = ch - '0';
|
|
UPDATE_STATE(s_res_status_code);
|
|
break;
|
|
}
|
|
|
|
case s_res_status_code:
|
|
{
|
|
if (!IS_NUM(ch)) {
|
|
switch (ch) {
|
|
case ' ':
|
|
UPDATE_STATE(s_res_status_start);
|
|
break;
|
|
case CR:
|
|
UPDATE_STATE(s_res_line_almost_done);
|
|
break;
|
|
case LF:
|
|
UPDATE_STATE(s_header_field_start);
|
|
break;
|
|
default:
|
|
SET_ERRNO(HPE_INVALID_STATUS);
|
|
goto error;
|
|
}
|
|
break;
|
|
}
|
|
|
|
parser->status_code *= 10;
|
|
parser->status_code += ch - '0';
|
|
|
|
if (UNLIKELY(parser->status_code > 999)) {
|
|
SET_ERRNO(HPE_INVALID_STATUS);
|
|
goto error;
|
|
}
|
|
|
|
break;
|
|
}
|
|
|
|
case s_res_status_start:
|
|
{
|
|
if (ch == CR) {
|
|
UPDATE_STATE(s_res_line_almost_done);
|
|
break;
|
|
}
|
|
|
|
if (ch == LF) {
|
|
UPDATE_STATE(s_header_field_start);
|
|
break;
|
|
}
|
|
|
|
MARK(status);
|
|
UPDATE_STATE(s_res_status);
|
|
parser->index = 0;
|
|
break;
|
|
}
|
|
|
|
case s_res_status:
|
|
if (ch == CR) {
|
|
UPDATE_STATE(s_res_line_almost_done);
|
|
CALLBACK_DATA(status);
|
|
break;
|
|
}
|
|
|
|
if (ch == LF) {
|
|
UPDATE_STATE(s_header_field_start);
|
|
CALLBACK_DATA(status);
|
|
break;
|
|
}
|
|
|
|
break;
|
|
|
|
case s_res_line_almost_done:
|
|
STRICT_CHECK(ch != LF);
|
|
UPDATE_STATE(s_header_field_start);
|
|
break;
|
|
|
|
case s_start_req:
|
|
{
|
|
if (ch == CR || ch == LF)
|
|
break;
|
|
parser->flags = 0;
|
|
parser->content_length = ULLONG_MAX;
|
|
|
|
if (UNLIKELY(!IS_ALPHA(ch))) {
|
|
SET_ERRNO(HPE_INVALID_METHOD);
|
|
goto error;
|
|
}
|
|
|
|
parser->method = (enum http_method) 0;
|
|
parser->index = 1;
|
|
switch (ch) {
|
|
case 'A': parser->method = HTTP_ACL; break;
|
|
case 'B': parser->method = HTTP_BIND; break;
|
|
case 'C': parser->method = HTTP_CONNECT; /* or COPY, CHECKOUT */ break;
|
|
case 'D': parser->method = HTTP_DELETE; break;
|
|
case 'G': parser->method = HTTP_GET; break;
|
|
case 'H': parser->method = HTTP_HEAD; break;
|
|
case 'L': parser->method = HTTP_LOCK; /* or LINK */ break;
|
|
case 'M': parser->method = HTTP_MKCOL; /* or MOVE, MKACTIVITY, MERGE, M-SEARCH, MKCALENDAR */ break;
|
|
case 'N': parser->method = HTTP_NOTIFY; break;
|
|
case 'O': parser->method = HTTP_OPTIONS; break;
|
|
case 'P': parser->method = HTTP_POST;
|
|
/* or PROPFIND|PROPPATCH|PUT|PATCH|PURGE */
|
|
break;
|
|
case 'R': parser->method = HTTP_REPORT; /* or REBIND */ break;
|
|
case 'S': parser->method = HTTP_SUBSCRIBE; /* or SEARCH */ break;
|
|
case 'T': parser->method = HTTP_TRACE; break;
|
|
case 'U': parser->method = HTTP_UNLOCK; /* or UNSUBSCRIBE, UNBIND, UNLINK */ break;
|
|
default:
|
|
SET_ERRNO(HPE_INVALID_METHOD);
|
|
goto error;
|
|
}
|
|
UPDATE_STATE(s_req_method);
|
|
|
|
CALLBACK_NOTIFY(message_begin);
|
|
|
|
break;
|
|
}
|
|
|
|
case s_req_method:
|
|
{
|
|
const char *matcher;
|
|
if (UNLIKELY(ch == '\0')) {
|
|
SET_ERRNO(HPE_INVALID_METHOD);
|
|
goto error;
|
|
}
|
|
|
|
matcher = method_strings[parser->method];
|
|
if (ch == ' ' && matcher[parser->index] == '\0') {
|
|
UPDATE_STATE(s_req_spaces_before_url);
|
|
} else if (ch == matcher[parser->index]) {
|
|
; /* nada */
|
|
} else if (IS_ALPHA(ch)) {
|
|
|
|
switch (parser->method << 16 | parser->index << 8 | ch) {
|
|
#define XX(meth, pos, ch, new_meth) \
|
|
case (HTTP_##meth << 16 | pos << 8 | ch): \
|
|
parser->method = HTTP_##new_meth; break;
|
|
|
|
XX(POST, 1, 'U', PUT)
|
|
XX(POST, 1, 'A', PATCH)
|
|
XX(CONNECT, 1, 'H', CHECKOUT)
|
|
XX(CONNECT, 2, 'P', COPY)
|
|
XX(MKCOL, 1, 'O', MOVE)
|
|
XX(MKCOL, 1, 'E', MERGE)
|
|
XX(MKCOL, 2, 'A', MKACTIVITY)
|
|
XX(MKCOL, 3, 'A', MKCALENDAR)
|
|
XX(SUBSCRIBE, 1, 'E', SEARCH)
|
|
XX(REPORT, 2, 'B', REBIND)
|
|
XX(POST, 1, 'R', PROPFIND)
|
|
XX(PROPFIND, 4, 'P', PROPPATCH)
|
|
XX(PUT, 2, 'R', PURGE)
|
|
XX(LOCK, 1, 'I', LINK)
|
|
XX(UNLOCK, 2, 'S', UNSUBSCRIBE)
|
|
XX(UNLOCK, 2, 'B', UNBIND)
|
|
XX(UNLOCK, 3, 'I', UNLINK)
|
|
#undef XX
|
|
|
|
default:
|
|
SET_ERRNO(HPE_INVALID_METHOD);
|
|
goto error;
|
|
}
|
|
} else if (ch == '-' &&
|
|
parser->index == 1 &&
|
|
parser->method == HTTP_MKCOL) {
|
|
parser->method = HTTP_MSEARCH;
|
|
} else {
|
|
SET_ERRNO(HPE_INVALID_METHOD);
|
|
goto error;
|
|
}
|
|
|
|
++parser->index;
|
|
break;
|
|
}
|
|
|
|
case s_req_spaces_before_url:
|
|
{
|
|
if (ch == ' ') break;
|
|
|
|
MARK(url);
|
|
if (parser->method == HTTP_CONNECT) {
|
|
UPDATE_STATE(s_req_server_start);
|
|
}
|
|
|
|
UPDATE_STATE(parse_url_char(CURRENT_STATE(), ch));
|
|
if (UNLIKELY(CURRENT_STATE() == s_dead)) {
|
|
SET_ERRNO(HPE_INVALID_URL);
|
|
goto error;
|
|
}
|
|
|
|
break;
|
|
}
|
|
|
|
case s_req_schema:
|
|
case s_req_schema_slash:
|
|
case s_req_schema_slash_slash:
|
|
case s_req_server_start:
|
|
{
|
|
switch (ch) {
|
|
/* No whitespace allowed here */
|
|
case ' ':
|
|
case CR:
|
|
case LF:
|
|
SET_ERRNO(HPE_INVALID_URL);
|
|
goto error;
|
|
default:
|
|
UPDATE_STATE(parse_url_char(CURRENT_STATE(), ch));
|
|
if (UNLIKELY(CURRENT_STATE() == s_dead)) {
|
|
SET_ERRNO(HPE_INVALID_URL);
|
|
goto error;
|
|
}
|
|
}
|
|
|
|
break;
|
|
}
|
|
|
|
case s_req_server:
|
|
case s_req_server_with_at:
|
|
case s_req_path:
|
|
case s_req_query_string_start:
|
|
case s_req_query_string:
|
|
case s_req_fragment_start:
|
|
case s_req_fragment:
|
|
{
|
|
switch (ch) {
|
|
case ' ':
|
|
UPDATE_STATE(s_req_http_start);
|
|
CALLBACK_DATA(url);
|
|
break;
|
|
case CR:
|
|
case LF:
|
|
parser->http_major = 0;
|
|
parser->http_minor = 9;
|
|
UPDATE_STATE((ch == CR) ?
|
|
s_req_line_almost_done :
|
|
s_header_field_start);
|
|
CALLBACK_DATA(url);
|
|
break;
|
|
default:
|
|
UPDATE_STATE(parse_url_char(CURRENT_STATE(), ch));
|
|
if (UNLIKELY(CURRENT_STATE() == s_dead)) {
|
|
SET_ERRNO(HPE_INVALID_URL);
|
|
goto error;
|
|
}
|
|
}
|
|
break;
|
|
}
|
|
|
|
case s_req_http_start:
|
|
switch (ch) {
|
|
case 'H':
|
|
UPDATE_STATE(s_req_http_H);
|
|
break;
|
|
case ' ':
|
|
break;
|
|
default:
|
|
SET_ERRNO(HPE_INVALID_CONSTANT);
|
|
goto error;
|
|
}
|
|
break;
|
|
|
|
case s_req_http_H:
|
|
STRICT_CHECK(ch != 'T');
|
|
UPDATE_STATE(s_req_http_HT);
|
|
break;
|
|
|
|
case s_req_http_HT:
|
|
STRICT_CHECK(ch != 'T');
|
|
UPDATE_STATE(s_req_http_HTT);
|
|
break;
|
|
|
|
case s_req_http_HTT:
|
|
STRICT_CHECK(ch != 'P');
|
|
UPDATE_STATE(s_req_http_HTTP);
|
|
break;
|
|
|
|
case s_req_http_HTTP:
|
|
STRICT_CHECK(ch != '/');
|
|
UPDATE_STATE(s_req_first_http_major);
|
|
break;
|
|
|
|
/* first digit of major HTTP version */
|
|
case s_req_first_http_major:
|
|
if (UNLIKELY(ch < '1' || ch > '9')) {
|
|
SET_ERRNO(HPE_INVALID_VERSION);
|
|
goto error;
|
|
}
|
|
|
|
parser->http_major = ch - '0';
|
|
UPDATE_STATE(s_req_http_major);
|
|
break;
|
|
|
|
/* major HTTP version or dot */
|
|
case s_req_http_major:
|
|
{
|
|
if (ch == '.') {
|
|
UPDATE_STATE(s_req_first_http_minor);
|
|
break;
|
|
}
|
|
|
|
if (UNLIKELY(!IS_NUM(ch))) {
|
|
SET_ERRNO(HPE_INVALID_VERSION);
|
|
goto error;
|
|
}
|
|
|
|
parser->http_major *= 10;
|
|
parser->http_major += ch - '0';
|
|
|
|
if (UNLIKELY(parser->http_major > 999)) {
|
|
SET_ERRNO(HPE_INVALID_VERSION);
|
|
goto error;
|
|
}
|
|
|
|
break;
|
|
}
|
|
|
|
/* first digit of minor HTTP version */
|
|
case s_req_first_http_minor:
|
|
if (UNLIKELY(!IS_NUM(ch))) {
|
|
SET_ERRNO(HPE_INVALID_VERSION);
|
|
goto error;
|
|
}
|
|
|
|
parser->http_minor = ch - '0';
|
|
UPDATE_STATE(s_req_http_minor);
|
|
break;
|
|
|
|
/* minor HTTP version or end of request line */
|
|
case s_req_http_minor:
|
|
{
|
|
if (ch == CR) {
|
|
UPDATE_STATE(s_req_line_almost_done);
|
|
break;
|
|
}
|
|
|
|
if (ch == LF) {
|
|
UPDATE_STATE(s_header_field_start);
|
|
break;
|
|
}
|
|
|
|
/* XXX allow spaces after digit? */
|
|
|
|
if (UNLIKELY(!IS_NUM(ch))) {
|
|
SET_ERRNO(HPE_INVALID_VERSION);
|
|
goto error;
|
|
}
|
|
|
|
parser->http_minor *= 10;
|
|
parser->http_minor += ch - '0';
|
|
|
|
if (UNLIKELY(parser->http_minor > 999)) {
|
|
SET_ERRNO(HPE_INVALID_VERSION);
|
|
goto error;
|
|
}
|
|
|
|
break;
|
|
}
|
|
|
|
/* end of request line */
|
|
case s_req_line_almost_done:
|
|
{
|
|
if (UNLIKELY(ch != LF)) {
|
|
SET_ERRNO(HPE_LF_EXPECTED);
|
|
goto error;
|
|
}
|
|
|
|
UPDATE_STATE(s_header_field_start);
|
|
break;
|
|
}
|
|
|
|
case s_header_field_start:
|
|
{
|
|
if (ch == CR) {
|
|
UPDATE_STATE(s_headers_almost_done);
|
|
break;
|
|
}
|
|
|
|
if (ch == LF) {
|
|
/* they might be just sending \n instead of \r\n so this would be
|
|
* the second \n to denote the end of headers*/
|
|
UPDATE_STATE(s_headers_almost_done);
|
|
REEXECUTE();
|
|
}
|
|
|
|
c = TOKEN(ch);
|
|
|
|
if (UNLIKELY(!c)) {
|
|
SET_ERRNO(HPE_INVALID_HEADER_TOKEN);
|
|
goto error;
|
|
}
|
|
|
|
MARK(header_field);
|
|
|
|
parser->index = 0;
|
|
UPDATE_STATE(s_header_field);
|
|
|
|
switch (c) {
|
|
case 'c':
|
|
parser->header_state = h_C;
|
|
break;
|
|
|
|
case 'p':
|
|
parser->header_state = h_matching_proxy_connection;
|
|
break;
|
|
|
|
case 't':
|
|
parser->header_state = h_matching_transfer_encoding;
|
|
break;
|
|
|
|
case 'u':
|
|
parser->header_state = h_matching_upgrade;
|
|
break;
|
|
|
|
default:
|
|
parser->header_state = h_general;
|
|
break;
|
|
}
|
|
break;
|
|
}
|
|
|
|
case s_header_field:
|
|
{
|
|
const char* start = p;
|
|
for (; p != data + len; p++) {
|
|
ch = *p;
|
|
c = TOKEN(ch);
|
|
|
|
if (!c)
|
|
break;
|
|
|
|
switch (parser->header_state) {
|
|
case h_general:
|
|
break;
|
|
|
|
case h_C:
|
|
parser->index++;
|
|
parser->header_state = (c == 'o' ? h_CO : h_general);
|
|
break;
|
|
|
|
case h_CO:
|
|
parser->index++;
|
|
parser->header_state = (c == 'n' ? h_CON : h_general);
|
|
break;
|
|
|
|
case h_CON:
|
|
parser->index++;
|
|
switch (c) {
|
|
case 'n':
|
|
parser->header_state = h_matching_connection;
|
|
break;
|
|
case 't':
|
|
parser->header_state = h_matching_content_length;
|
|
break;
|
|
default:
|
|
parser->header_state = h_general;
|
|
break;
|
|
}
|
|
break;
|
|
|
|
/* connection */
|
|
|
|
case h_matching_connection:
|
|
parser->index++;
|
|
if (parser->index > sizeof(CONNECTION)-1
|
|
|| c != CONNECTION[parser->index]) {
|
|
parser->header_state = h_general;
|
|
} else if (parser->index == sizeof(CONNECTION)-2) {
|
|
parser->header_state = h_connection;
|
|
}
|
|
break;
|
|
|
|
/* proxy-connection */
|
|
|
|
case h_matching_proxy_connection:
|
|
parser->index++;
|
|
if (parser->index > sizeof(PROXY_CONNECTION)-1
|
|
|| c != PROXY_CONNECTION[parser->index]) {
|
|
parser->header_state = h_general;
|
|
} else if (parser->index == sizeof(PROXY_CONNECTION)-2) {
|
|
parser->header_state = h_connection;
|
|
}
|
|
break;
|
|
|
|
/* content-length */
|
|
|
|
case h_matching_content_length:
|
|
parser->index++;
|
|
if (parser->index > sizeof(CONTENT_LENGTH)-1
|
|
|| c != CONTENT_LENGTH[parser->index]) {
|
|
parser->header_state = h_general;
|
|
} else if (parser->index == sizeof(CONTENT_LENGTH)-2) {
|
|
if (parser->flags & F_CONTENTLENGTH) {
|
|
SET_ERRNO(HPE_UNEXPECTED_CONTENT_LENGTH);
|
|
goto error;
|
|
}
|
|
parser->header_state = h_content_length;
|
|
parser->flags |= F_CONTENTLENGTH;
|
|
}
|
|
break;
|
|
|
|
/* transfer-encoding */
|
|
|
|
case h_matching_transfer_encoding:
|
|
parser->index++;
|
|
if (parser->index > sizeof(TRANSFER_ENCODING)-1
|
|
|| c != TRANSFER_ENCODING[parser->index]) {
|
|
parser->header_state = h_general;
|
|
} else if (parser->index == sizeof(TRANSFER_ENCODING)-2) {
|
|
parser->header_state = h_transfer_encoding;
|
|
}
|
|
break;
|
|
|
|
/* upgrade */
|
|
|
|
case h_matching_upgrade:
|
|
parser->index++;
|
|
if (parser->index > sizeof(UPGRADE)-1
|
|
|| c != UPGRADE[parser->index]) {
|
|
parser->header_state = h_general;
|
|
} else if (parser->index == sizeof(UPGRADE)-2) {
|
|
parser->header_state = h_upgrade;
|
|
}
|
|
break;
|
|
|
|
case h_connection:
|
|
case h_content_length:
|
|
case h_transfer_encoding:
|
|
case h_upgrade:
|
|
if (ch != ' ') parser->header_state = h_general;
|
|
break;
|
|
|
|
default:
|
|
assert(0 && "Unknown header_state");
|
|
break;
|
|
}
|
|
}
|
|
|
|
COUNT_HEADER_SIZE(p - start);
|
|
|
|
if (p == data + len) {
|
|
--p;
|
|
break;
|
|
}
|
|
|
|
if (ch == ':') {
|
|
UPDATE_STATE(s_header_value_discard_ws);
|
|
CALLBACK_DATA(header_field);
|
|
break;
|
|
}
|
|
|
|
SET_ERRNO(HPE_INVALID_HEADER_TOKEN);
|
|
goto error;
|
|
}
|
|
|
|
case s_header_value_discard_ws:
|
|
if (ch == ' ' || ch == '\t') break;
|
|
|
|
if (ch == CR) {
|
|
UPDATE_STATE(s_header_value_discard_ws_almost_done);
|
|
break;
|
|
}
|
|
|
|
if (ch == LF) {
|
|
UPDATE_STATE(s_header_value_discard_lws);
|
|
break;
|
|
}
|
|
|
|
/* FALLTHROUGH */
|
|
|
|
case s_header_value_start:
|
|
{
|
|
MARK(header_value);
|
|
|
|
UPDATE_STATE(s_header_value);
|
|
parser->index = 0;
|
|
|
|
c = LOWER(ch);
|
|
|
|
switch (parser->header_state) {
|
|
case h_upgrade:
|
|
parser->flags |= F_UPGRADE;
|
|
parser->header_state = h_general;
|
|
break;
|
|
|
|
case h_transfer_encoding:
|
|
/* looking for 'Transfer-Encoding: chunked' */
|
|
if ('c' == c) {
|
|
parser->header_state = h_matching_transfer_encoding_chunked;
|
|
} else {
|
|
parser->header_state = h_general;
|
|
}
|
|
break;
|
|
|
|
case h_content_length:
|
|
if (UNLIKELY(!IS_NUM(ch))) {
|
|
SET_ERRNO(HPE_INVALID_CONTENT_LENGTH);
|
|
goto error;
|
|
}
|
|
|
|
parser->content_length = ch - '0';
|
|
break;
|
|
|
|
case h_connection:
|
|
/* looking for 'Connection: keep-alive' */
|
|
if (c == 'k') {
|
|
parser->header_state = h_matching_connection_keep_alive;
|
|
/* looking for 'Connection: close' */
|
|
} else if (c == 'c') {
|
|
parser->header_state = h_matching_connection_close;
|
|
} else if (c == 'u') {
|
|
parser->header_state = h_matching_connection_upgrade;
|
|
} else {
|
|
parser->header_state = h_matching_connection_token;
|
|
}
|
|
break;
|
|
|
|
/* Multi-value `Connection` header */
|
|
case h_matching_connection_token_start:
|
|
break;
|
|
|
|
default:
|
|
parser->header_state = h_general;
|
|
break;
|
|
}
|
|
break;
|
|
}
|
|
|
|
case s_header_value:
|
|
{
|
|
const char* start = p;
|
|
enum header_states h_state = (enum header_states) parser->header_state;
|
|
for (; p != data + len; p++) {
|
|
ch = *p;
|
|
if (ch == CR) {
|
|
UPDATE_STATE(s_header_almost_done);
|
|
parser->header_state = h_state;
|
|
CALLBACK_DATA(header_value);
|
|
break;
|
|
}
|
|
|
|
if (ch == LF) {
|
|
UPDATE_STATE(s_header_almost_done);
|
|
COUNT_HEADER_SIZE(p - start);
|
|
parser->header_state = h_state;
|
|
CALLBACK_DATA_NOADVANCE(header_value);
|
|
REEXECUTE();
|
|
}
|
|
|
|
if (!lenient && !IS_HEADER_CHAR(ch)) {
|
|
SET_ERRNO(HPE_INVALID_HEADER_TOKEN);
|
|
goto error;
|
|
}
|
|
|
|
c = LOWER(ch);
|
|
|
|
switch (h_state) {
|
|
case h_general:
|
|
{
|
|
const char* p_cr;
|
|
const char* p_lf;
|
|
size_t limit = data + len - p;
|
|
|
|
limit = MIN(limit, HTTP_MAX_HEADER_SIZE);
|
|
|
|
p_cr = (const char*) memchr(p, CR, limit);
|
|
p_lf = (const char*) memchr(p, LF, limit);
|
|
if (p_cr != NULL) {
|
|
if (p_lf != NULL && p_cr >= p_lf)
|
|
p = p_lf;
|
|
else
|
|
p = p_cr;
|
|
} else if (UNLIKELY(p_lf != NULL)) {
|
|
p = p_lf;
|
|
} else {
|
|
p = data + len;
|
|
}
|
|
--p;
|
|
|
|
break;
|
|
}
|
|
|
|
case h_connection:
|
|
case h_transfer_encoding:
|
|
assert(0 && "Shouldn't get here.");
|
|
break;
|
|
|
|
case h_content_length:
|
|
{
|
|
uint64_t t;
|
|
|
|
if (ch == ' ') break;
|
|
|
|
if (UNLIKELY(!IS_NUM(ch))) {
|
|
SET_ERRNO(HPE_INVALID_CONTENT_LENGTH);
|
|
parser->header_state = h_state;
|
|
goto error;
|
|
}
|
|
|
|
t = parser->content_length;
|
|
t *= 10;
|
|
t += ch - '0';
|
|
|
|
/* Overflow? Test against a conservative limit for simplicity. */
|
|
if (UNLIKELY((ULLONG_MAX - 10) / 10 < parser->content_length)) {
|
|
SET_ERRNO(HPE_INVALID_CONTENT_LENGTH);
|
|
parser->header_state = h_state;
|
|
goto error;
|
|
}
|
|
|
|
parser->content_length = t;
|
|
break;
|
|
}
|
|
|
|
/* Transfer-Encoding: chunked */
|
|
case h_matching_transfer_encoding_chunked:
|
|
parser->index++;
|
|
if (parser->index > sizeof(CHUNKED)-1
|
|
|| c != CHUNKED[parser->index]) {
|
|
h_state = h_general;
|
|
} else if (parser->index == sizeof(CHUNKED)-2) {
|
|
h_state = h_transfer_encoding_chunked;
|
|
}
|
|
break;
|
|
|
|
case h_matching_connection_token_start:
|
|
/* looking for 'Connection: keep-alive' */
|
|
if (c == 'k') {
|
|
h_state = h_matching_connection_keep_alive;
|
|
/* looking for 'Connection: close' */
|
|
} else if (c == 'c') {
|
|
h_state = h_matching_connection_close;
|
|
} else if (c == 'u') {
|
|
h_state = h_matching_connection_upgrade;
|
|
} else if (STRICT_TOKEN(c)) {
|
|
h_state = h_matching_connection_token;
|
|
} else if (c == ' ' || c == '\t') {
|
|
/* Skip lws */
|
|
} else {
|
|
h_state = h_general;
|
|
}
|
|
break;
|
|
|
|
/* looking for 'Connection: keep-alive' */
|
|
case h_matching_connection_keep_alive:
|
|
parser->index++;
|
|
if (parser->index > sizeof(KEEP_ALIVE)-1
|
|
|| c != KEEP_ALIVE[parser->index]) {
|
|
h_state = h_matching_connection_token;
|
|
} else if (parser->index == sizeof(KEEP_ALIVE)-2) {
|
|
h_state = h_connection_keep_alive;
|
|
}
|
|
break;
|
|
|
|
/* looking for 'Connection: close' */
|
|
case h_matching_connection_close:
|
|
parser->index++;
|
|
if (parser->index > sizeof(CLOSE)-1 || c != CLOSE[parser->index]) {
|
|
h_state = h_matching_connection_token;
|
|
} else if (parser->index == sizeof(CLOSE)-2) {
|
|
h_state = h_connection_close;
|
|
}
|
|
break;
|
|
|
|
/* looking for 'Connection: upgrade' */
|
|
case h_matching_connection_upgrade:
|
|
parser->index++;
|
|
if (parser->index > sizeof(UPGRADE) - 1 ||
|
|
c != UPGRADE[parser->index]) {
|
|
h_state = h_matching_connection_token;
|
|
} else if (parser->index == sizeof(UPGRADE)-2) {
|
|
h_state = h_connection_upgrade;
|
|
}
|
|
break;
|
|
|
|
case h_matching_connection_token:
|
|
if (ch == ',') {
|
|
h_state = h_matching_connection_token_start;
|
|
parser->index = 0;
|
|
}
|
|
break;
|
|
|
|
case h_transfer_encoding_chunked:
|
|
if (ch != ' ') h_state = h_general;
|
|
break;
|
|
|
|
case h_connection_keep_alive:
|
|
case h_connection_close:
|
|
case h_connection_upgrade:
|
|
if (ch == ',') {
|
|
if (h_state == h_connection_keep_alive) {
|
|
parser->flags |= F_CONNECTION_KEEP_ALIVE;
|
|
} else if (h_state == h_connection_close) {
|
|
parser->flags |= F_CONNECTION_CLOSE;
|
|
} else if (h_state == h_connection_upgrade) {
|
|
parser->flags |= F_CONNECTION_UPGRADE;
|
|
}
|
|
h_state = h_matching_connection_token_start;
|
|
parser->index = 0;
|
|
} else if (ch != ' ') {
|
|
h_state = h_matching_connection_token;
|
|
}
|
|
break;
|
|
|
|
default:
|
|
UPDATE_STATE(s_header_value);
|
|
h_state = h_general;
|
|
break;
|
|
}
|
|
}
|
|
parser->header_state = h_state;
|
|
|
|
COUNT_HEADER_SIZE(p - start);
|
|
|
|
if (p == data + len)
|
|
--p;
|
|
break;
|
|
}
|
|
|
|
case s_header_almost_done:
|
|
{
|
|
if (UNLIKELY(ch != LF)) {
|
|
SET_ERRNO(HPE_LF_EXPECTED);
|
|
goto error;
|
|
}
|
|
|
|
UPDATE_STATE(s_header_value_lws);
|
|
break;
|
|
}
|
|
|
|
case s_header_value_lws:
|
|
{
|
|
if (ch == ' ' || ch == '\t') {
|
|
UPDATE_STATE(s_header_value_start);
|
|
REEXECUTE();
|
|
}
|
|
|
|
/* finished the header */
|
|
switch (parser->header_state) {
|
|
case h_connection_keep_alive:
|
|
parser->flags |= F_CONNECTION_KEEP_ALIVE;
|
|
break;
|
|
case h_connection_close:
|
|
parser->flags |= F_CONNECTION_CLOSE;
|
|
break;
|
|
case h_transfer_encoding_chunked:
|
|
parser->flags |= F_CHUNKED;
|
|
break;
|
|
case h_connection_upgrade:
|
|
parser->flags |= F_CONNECTION_UPGRADE;
|
|
break;
|
|
default:
|
|
break;
|
|
}
|
|
|
|
UPDATE_STATE(s_header_field_start);
|
|
REEXECUTE();
|
|
}
|
|
|
|
case s_header_value_discard_ws_almost_done:
|
|
{
|
|
STRICT_CHECK(ch != LF);
|
|
UPDATE_STATE(s_header_value_discard_lws);
|
|
break;
|
|
}
|
|
|
|
case s_header_value_discard_lws:
|
|
{
|
|
if (ch == ' ' || ch == '\t') {
|
|
UPDATE_STATE(s_header_value_discard_ws);
|
|
break;
|
|
} else {
|
|
switch (parser->header_state) {
|
|
case h_connection_keep_alive:
|
|
parser->flags |= F_CONNECTION_KEEP_ALIVE;
|
|
break;
|
|
case h_connection_close:
|
|
parser->flags |= F_CONNECTION_CLOSE;
|
|
break;
|
|
case h_connection_upgrade:
|
|
parser->flags |= F_CONNECTION_UPGRADE;
|
|
break;
|
|
case h_transfer_encoding_chunked:
|
|
parser->flags |= F_CHUNKED;
|
|
break;
|
|
default:
|
|
break;
|
|
}
|
|
|
|
/* header value was empty */
|
|
MARK(header_value);
|
|
UPDATE_STATE(s_header_field_start);
|
|
CALLBACK_DATA_NOADVANCE(header_value);
|
|
REEXECUTE();
|
|
}
|
|
}
|
|
|
|
case s_headers_almost_done:
|
|
{
|
|
STRICT_CHECK(ch != LF);
|
|
|
|
if (parser->flags & F_TRAILING) {
|
|
/* End of a chunked request */
|
|
UPDATE_STATE(s_message_done);
|
|
CALLBACK_NOTIFY_NOADVANCE(chunk_complete);
|
|
REEXECUTE();
|
|
}
|
|
|
|
/* Cannot use chunked encoding and a content-length header together
|
|
per the HTTP specification. */
|
|
if ((parser->flags & F_CHUNKED) &&
|
|
(parser->flags & F_CONTENTLENGTH)) {
|
|
SET_ERRNO(HPE_UNEXPECTED_CONTENT_LENGTH);
|
|
goto error;
|
|
}
|
|
|
|
UPDATE_STATE(s_headers_done);
|
|
|
|
/* Set this here so that on_headers_complete() callbacks can see it */
|
|
parser->upgrade =
|
|
((parser->flags & (F_UPGRADE | F_CONNECTION_UPGRADE)) ==
|
|
(F_UPGRADE | F_CONNECTION_UPGRADE) ||
|
|
parser->method == HTTP_CONNECT);
|
|
|
|
/* Here we call the headers_complete callback. This is somewhat
|
|
* different than other callbacks because if the user returns 1, we
|
|
* will interpret that as saying that this message has no body. This
|
|
* is needed for the annoying case of recieving a response to a HEAD
|
|
* request.
|
|
*
|
|
* We'd like to use CALLBACK_NOTIFY_NOADVANCE() here but we cannot, so
|
|
* we have to simulate it by handling a change in errno below.
|
|
*/
|
|
if (settings->on_headers_complete) {
|
|
switch (settings->on_headers_complete(parser)) {
|
|
case 0:
|
|
break;
|
|
|
|
case 2:
|
|
parser->upgrade = 1;
|
|
|
|
case 1:
|
|
parser->flags |= F_SKIPBODY;
|
|
break;
|
|
|
|
default:
|
|
SET_ERRNO(HPE_CB_headers_complete);
|
|
RETURN(p - data); /* Error */
|
|
}
|
|
}
|
|
|
|
if (HTTP_PARSER_ERRNO(parser) != HPE_OK) {
|
|
RETURN(p - data);
|
|
}
|
|
|
|
REEXECUTE();
|
|
}
|
|
|
|
case s_headers_done:
|
|
{
|
|
int hasBody;
|
|
STRICT_CHECK(ch != LF);
|
|
|
|
parser->nread = 0;
|
|
|
|
hasBody = parser->flags & F_CHUNKED ||
|
|
(parser->content_length > 0 && parser->content_length != ULLONG_MAX);
|
|
if (parser->upgrade && (parser->method == HTTP_CONNECT ||
|
|
(parser->flags & F_SKIPBODY) || !hasBody)) {
|
|
/* Exit, the rest of the message is in a different protocol. */
|
|
UPDATE_STATE(NEW_MESSAGE());
|
|
CALLBACK_NOTIFY(message_complete);
|
|
RETURN((p - data) + 1);
|
|
}
|
|
|
|
if (parser->flags & F_SKIPBODY) {
|
|
UPDATE_STATE(NEW_MESSAGE());
|
|
CALLBACK_NOTIFY(message_complete);
|
|
} else if (parser->flags & F_CHUNKED) {
|
|
/* chunked encoding - ignore Content-Length header */
|
|
UPDATE_STATE(s_chunk_size_start);
|
|
} else {
|
|
if (parser->content_length == 0) {
|
|
/* Content-Length header given but zero: Content-Length: 0\r\n */
|
|
UPDATE_STATE(NEW_MESSAGE());
|
|
CALLBACK_NOTIFY(message_complete);
|
|
} else if (parser->content_length != ULLONG_MAX) {
|
|
/* Content-Length header given and non-zero */
|
|
UPDATE_STATE(s_body_identity);
|
|
} else {
|
|
if (!http_message_needs_eof(parser)) {
|
|
/* Assume content-length 0 - read the next */
|
|
UPDATE_STATE(NEW_MESSAGE());
|
|
CALLBACK_NOTIFY(message_complete);
|
|
} else {
|
|
/* Read body until EOF */
|
|
UPDATE_STATE(s_body_identity_eof);
|
|
}
|
|
}
|
|
}
|
|
|
|
break;
|
|
}
|
|
|
|
case s_body_identity:
|
|
{
|
|
uint64_t to_read = MIN(parser->content_length,
|
|
(uint64_t) ((data + len) - p));
|
|
|
|
assert(parser->content_length != 0
|
|
&& parser->content_length != ULLONG_MAX);
|
|
|
|
/* The difference between advancing content_length and p is because
|
|
* the latter will automaticaly advance on the next loop iteration.
|
|
* Further, if content_length ends up at 0, we want to see the last
|
|
* byte again for our message complete callback.
|
|
*/
|
|
MARK(body);
|
|
parser->content_length -= to_read;
|
|
p += to_read - 1;
|
|
|
|
if (parser->content_length == 0) {
|
|
UPDATE_STATE(s_message_done);
|
|
|
|
/* Mimic CALLBACK_DATA_NOADVANCE() but with one extra byte.
|
|
*
|
|
* The alternative to doing this is to wait for the next byte to
|
|
* trigger the data callback, just as in every other case. The
|
|
* problem with this is that this makes it difficult for the test
|
|
* harness to distinguish between complete-on-EOF and
|
|
* complete-on-length. It's not clear that this distinction is
|
|
* important for applications, but let's keep it for now.
|
|
*/
|
|
CALLBACK_DATA_(body, p - body_mark + 1, p - data);
|
|
REEXECUTE();
|
|
}
|
|
|
|
break;
|
|
}
|
|
|
|
/* read until EOF */
|
|
case s_body_identity_eof:
|
|
MARK(body);
|
|
p = data + len - 1;
|
|
|
|
break;
|
|
|
|
case s_message_done:
|
|
UPDATE_STATE(NEW_MESSAGE());
|
|
CALLBACK_NOTIFY(message_complete);
|
|
if (parser->upgrade) {
|
|
/* Exit, the rest of the message is in a different protocol. */
|
|
RETURN((p - data) + 1);
|
|
}
|
|
break;
|
|
|
|
case s_chunk_size_start:
|
|
{
|
|
assert(parser->nread == 1);
|
|
assert(parser->flags & F_CHUNKED);
|
|
|
|
unhex_val = unhex[(unsigned char)ch];
|
|
if (UNLIKELY(unhex_val == -1)) {
|
|
SET_ERRNO(HPE_INVALID_CHUNK_SIZE);
|
|
goto error;
|
|
}
|
|
|
|
parser->content_length = unhex_val;
|
|
UPDATE_STATE(s_chunk_size);
|
|
break;
|
|
}
|
|
|
|
case s_chunk_size:
|
|
{
|
|
uint64_t t;
|
|
|
|
assert(parser->flags & F_CHUNKED);
|
|
|
|
if (ch == CR) {
|
|
UPDATE_STATE(s_chunk_size_almost_done);
|
|
break;
|
|
}
|
|
|
|
unhex_val = unhex[(unsigned char)ch];
|
|
|
|
if (unhex_val == -1) {
|
|
if (ch == ';' || ch == ' ') {
|
|
UPDATE_STATE(s_chunk_parameters);
|
|
break;
|
|
}
|
|
|
|
SET_ERRNO(HPE_INVALID_CHUNK_SIZE);
|
|
goto error;
|
|
}
|
|
|
|
t = parser->content_length;
|
|
t *= 16;
|
|
t += unhex_val;
|
|
|
|
/* Overflow? Test against a conservative limit for simplicity. */
|
|
if (UNLIKELY((ULLONG_MAX - 16) / 16 < parser->content_length)) {
|
|
SET_ERRNO(HPE_INVALID_CONTENT_LENGTH);
|
|
goto error;
|
|
}
|
|
|
|
parser->content_length = t;
|
|
break;
|
|
}
|
|
|
|
case s_chunk_parameters:
|
|
{
|
|
assert(parser->flags & F_CHUNKED);
|
|
/* just ignore this shit. TODO check for overflow */
|
|
if (ch == CR) {
|
|
UPDATE_STATE(s_chunk_size_almost_done);
|
|
break;
|
|
}
|
|
break;
|
|
}
|
|
|
|
case s_chunk_size_almost_done:
|
|
{
|
|
assert(parser->flags & F_CHUNKED);
|
|
STRICT_CHECK(ch != LF);
|
|
|
|
parser->nread = 0;
|
|
|
|
if (parser->content_length == 0) {
|
|
parser->flags |= F_TRAILING;
|
|
UPDATE_STATE(s_header_field_start);
|
|
} else {
|
|
UPDATE_STATE(s_chunk_data);
|
|
}
|
|
CALLBACK_NOTIFY(chunk_header);
|
|
break;
|
|
}
|
|
|
|
case s_chunk_data:
|
|
{
|
|
uint64_t to_read = MIN(parser->content_length,
|
|
(uint64_t) ((data + len) - p));
|
|
|
|
assert(parser->flags & F_CHUNKED);
|
|
assert(parser->content_length != 0
|
|
&& parser->content_length != ULLONG_MAX);
|
|
|
|
/* See the explanation in s_body_identity for why the content
|
|
* length and data pointers are managed this way.
|
|
*/
|
|
MARK(body);
|
|
parser->content_length -= to_read;
|
|
p += to_read - 1;
|
|
|
|
if (parser->content_length == 0) {
|
|
UPDATE_STATE(s_chunk_data_almost_done);
|
|
}
|
|
|
|
break;
|
|
}
|
|
|
|
case s_chunk_data_almost_done:
|
|
assert(parser->flags & F_CHUNKED);
|
|
assert(parser->content_length == 0);
|
|
STRICT_CHECK(ch != CR);
|
|
UPDATE_STATE(s_chunk_data_done);
|
|
CALLBACK_DATA(body);
|
|
break;
|
|
|
|
case s_chunk_data_done:
|
|
assert(parser->flags & F_CHUNKED);
|
|
STRICT_CHECK(ch != LF);
|
|
parser->nread = 0;
|
|
UPDATE_STATE(s_chunk_size_start);
|
|
CALLBACK_NOTIFY(chunk_complete);
|
|
break;
|
|
|
|
default:
|
|
assert(0 && "unhandled state");
|
|
SET_ERRNO(HPE_INVALID_INTERNAL_STATE);
|
|
goto error;
|
|
}
|
|
}
|
|
|
|
/* Run callbacks for any marks that we have leftover after we ran our of
|
|
* bytes. There should be at most one of these set, so it's OK to invoke
|
|
* them in series (unset marks will not result in callbacks).
|
|
*
|
|
* We use the NOADVANCE() variety of callbacks here because 'p' has already
|
|
* overflowed 'data' and this allows us to correct for the off-by-one that
|
|
* we'd otherwise have (since CALLBACK_DATA() is meant to be run with a 'p'
|
|
* value that's in-bounds).
|
|
*/
|
|
|
|
assert(((header_field_mark ? 1 : 0) +
|
|
(header_value_mark ? 1 : 0) +
|
|
(url_mark ? 1 : 0) +
|
|
(body_mark ? 1 : 0) +
|
|
(status_mark ? 1 : 0)) <= 1);
|
|
|
|
CALLBACK_DATA_NOADVANCE(header_field);
|
|
CALLBACK_DATA_NOADVANCE(header_value);
|
|
CALLBACK_DATA_NOADVANCE(url);
|
|
CALLBACK_DATA_NOADVANCE(body);
|
|
CALLBACK_DATA_NOADVANCE(status);
|
|
|
|
RETURN(len);
|
|
|
|
error:
|
|
if (HTTP_PARSER_ERRNO(parser) == HPE_OK) {
|
|
SET_ERRNO(HPE_UNKNOWN);
|
|
}
|
|
|
|
RETURN(p - data);
|
|
}
|
|
|
|
|
|
/* Does the parser need to see an EOF to find the end of the message? */
|
|
int
|
|
http_message_needs_eof (const http_parser *parser)
|
|
{
|
|
if (parser->type == HTTP_REQUEST) {
|
|
return 0;
|
|
}
|
|
|
|
/* See RFC 2616 section 4.4 */
|
|
if (parser->status_code / 100 == 1 || /* 1xx e.g. Continue */
|
|
parser->status_code == 204 || /* No Content */
|
|
parser->status_code == 304 || /* Not Modified */
|
|
parser->flags & F_SKIPBODY) { /* response to a HEAD request */
|
|
return 0;
|
|
}
|
|
|
|
if ((parser->flags & F_CHUNKED) || parser->content_length != ULLONG_MAX) {
|
|
return 0;
|
|
}
|
|
|
|
return 1;
|
|
}
|
|
|
|
|
|
int
|
|
http_should_keep_alive (const http_parser *parser)
|
|
{
|
|
if (parser->http_major > 0 && parser->http_minor > 0) {
|
|
/* HTTP/1.1 */
|
|
if (parser->flags & F_CONNECTION_CLOSE) {
|
|
return 0;
|
|
}
|
|
} else {
|
|
/* HTTP/1.0 or earlier */
|
|
if (!(parser->flags & F_CONNECTION_KEEP_ALIVE)) {
|
|
return 0;
|
|
}
|
|
}
|
|
|
|
return !http_message_needs_eof(parser);
|
|
}
|
|
|
|
|
|
const char *
|
|
http_method_str (enum http_method m)
|
|
{
|
|
return ELEM_AT(method_strings, m, "<unknown>");
|
|
}
|
|
|
|
|
|
void
|
|
http_parser_init (http_parser *parser, enum http_parser_type t)
|
|
{
|
|
void *data = parser->data; /* preserve application data */
|
|
memset(parser, 0, sizeof(*parser));
|
|
parser->data = data;
|
|
parser->type = t;
|
|
parser->state = (t == HTTP_REQUEST ? s_start_req : (t == HTTP_RESPONSE ? s_start_res : s_start_req_or_res));
|
|
parser->http_errno = HPE_OK;
|
|
}
|
|
|
|
void
|
|
http_parser_settings_init(http_parser_settings *settings)
|
|
{
|
|
memset(settings, 0, sizeof(*settings));
|
|
}
|
|
|
|
const char *
|
|
http_errno_name(enum http_errno err) {
|
|
assert(((size_t) err) < ARRAY_SIZE(http_strerror_tab));
|
|
return http_strerror_tab[err].name;
|
|
}
|
|
|
|
const char *
|
|
http_errno_description(enum http_errno err) {
|
|
assert(((size_t) err) < ARRAY_SIZE(http_strerror_tab));
|
|
return http_strerror_tab[err].description;
|
|
}
|
|
|
|
static enum http_host_state
|
|
http_parse_host_char(enum http_host_state s, const char ch) {
|
|
switch(s) {
|
|
case s_http_userinfo:
|
|
case s_http_userinfo_start:
|
|
if (ch == '@') {
|
|
return s_http_host_start;
|
|
}
|
|
|
|
if (IS_USERINFO_CHAR(ch)) {
|
|
return s_http_userinfo;
|
|
}
|
|
break;
|
|
|
|
case s_http_host_start:
|
|
if (ch == '[') {
|
|
return s_http_host_v6_start;
|
|
}
|
|
|
|
if (IS_HOST_CHAR(ch)) {
|
|
return s_http_host;
|
|
}
|
|
|
|
break;
|
|
|
|
case s_http_host:
|
|
if (IS_HOST_CHAR(ch)) {
|
|
return s_http_host;
|
|
}
|
|
|
|
/* FALLTHROUGH */
|
|
case s_http_host_v6_end:
|
|
if (ch == ':') {
|
|
return s_http_host_port_start;
|
|
}
|
|
|
|
break;
|
|
|
|
case s_http_host_v6:
|
|
if (ch == ']') {
|
|
return s_http_host_v6_end;
|
|
}
|
|
|
|
/* FALLTHROUGH */
|
|
case s_http_host_v6_start:
|
|
if (IS_HEX(ch) || ch == ':' || ch == '.') {
|
|
return s_http_host_v6;
|
|
}
|
|
|
|
if (s == s_http_host_v6 && ch == '%') {
|
|
return s_http_host_v6_zone_start;
|
|
}
|
|
break;
|
|
|
|
case s_http_host_v6_zone:
|
|
if (ch == ']') {
|
|
return s_http_host_v6_end;
|
|
}
|
|
|
|
/* FALLTHROUGH */
|
|
case s_http_host_v6_zone_start:
|
|
/* RFC 6874 Zone ID consists of 1*( unreserved / pct-encoded) */
|
|
if (IS_ALPHANUM(ch) || ch == '%' || ch == '.' || ch == '-' || ch == '_' ||
|
|
ch == '~') {
|
|
return s_http_host_v6_zone;
|
|
}
|
|
break;
|
|
|
|
case s_http_host_port:
|
|
case s_http_host_port_start:
|
|
if (IS_NUM(ch)) {
|
|
return s_http_host_port;
|
|
}
|
|
|
|
break;
|
|
|
|
default:
|
|
break;
|
|
}
|
|
return s_http_host_dead;
|
|
}
|
|
|
|
static int
|
|
http_parse_host(const char * buf, struct http_parser_url *u, int found_at) {
|
|
assert(u->field_set & (1 << UF_HOST));
|
|
enum http_host_state s;
|
|
|
|
const char *p;
|
|
size_t buflen = u->field_data[UF_HOST].off + u->field_data[UF_HOST].len;
|
|
|
|
u->field_data[UF_HOST].len = 0;
|
|
|
|
s = found_at ? s_http_userinfo_start : s_http_host_start;
|
|
|
|
for (p = buf + u->field_data[UF_HOST].off; p < buf + buflen; p++) {
|
|
enum http_host_state new_s = http_parse_host_char(s, *p);
|
|
|
|
if (new_s == s_http_host_dead) {
|
|
return 1;
|
|
}
|
|
|
|
switch(new_s) {
|
|
case s_http_host:
|
|
if (s != s_http_host) {
|
|
u->field_data[UF_HOST].off = p - buf;
|
|
}
|
|
u->field_data[UF_HOST].len++;
|
|
break;
|
|
|
|
case s_http_host_v6:
|
|
if (s != s_http_host_v6) {
|
|
u->field_data[UF_HOST].off = p - buf;
|
|
}
|
|
u->field_data[UF_HOST].len++;
|
|
break;
|
|
|
|
case s_http_host_v6_zone_start:
|
|
case s_http_host_v6_zone:
|
|
u->field_data[UF_HOST].len++;
|
|
break;
|
|
|
|
case s_http_host_port:
|
|
if (s != s_http_host_port) {
|
|
u->field_data[UF_PORT].off = p - buf;
|
|
u->field_data[UF_PORT].len = 0;
|
|
u->field_set |= (1 << UF_PORT);
|
|
}
|
|
u->field_data[UF_PORT].len++;
|
|
break;
|
|
|
|
case s_http_userinfo:
|
|
if (s != s_http_userinfo) {
|
|
u->field_data[UF_USERINFO].off = p - buf ;
|
|
u->field_data[UF_USERINFO].len = 0;
|
|
u->field_set |= (1 << UF_USERINFO);
|
|
}
|
|
u->field_data[UF_USERINFO].len++;
|
|
break;
|
|
|
|
default:
|
|
break;
|
|
}
|
|
s = new_s;
|
|
}
|
|
|
|
/* Make sure we don't end somewhere unexpected */
|
|
switch (s) {
|
|
case s_http_host_start:
|
|
case s_http_host_v6_start:
|
|
case s_http_host_v6:
|
|
case s_http_host_v6_zone_start:
|
|
case s_http_host_v6_zone:
|
|
case s_http_host_port_start:
|
|
case s_http_userinfo:
|
|
case s_http_userinfo_start:
|
|
return 1;
|
|
default:
|
|
break;
|
|
}
|
|
|
|
return 0;
|
|
}
|
|
|
|
void
|
|
http_parser_url_init(struct http_parser_url *u) {
|
|
memset(u, 0, sizeof(*u));
|
|
}
|
|
|
|
int
|
|
http_parser_parse_url(const char *buf, size_t buflen, int is_connect,
|
|
struct http_parser_url *u)
|
|
{
|
|
enum state s;
|
|
const char *p;
|
|
enum http_parser_url_fields uf, old_uf;
|
|
int found_at = 0;
|
|
|
|
u->port = u->field_set = 0;
|
|
s = is_connect ? s_req_server_start : s_req_spaces_before_url;
|
|
old_uf = UF_MAX;
|
|
|
|
for (p = buf; p < buf + buflen; p++) {
|
|
s = parse_url_char(s, *p);
|
|
|
|
/* Figure out the next field that we're operating on */
|
|
switch (s) {
|
|
case s_dead:
|
|
return 1;
|
|
|
|
/* Skip delimeters */
|
|
case s_req_schema_slash:
|
|
case s_req_schema_slash_slash:
|
|
case s_req_server_start:
|
|
case s_req_query_string_start:
|
|
case s_req_fragment_start:
|
|
continue;
|
|
|
|
case s_req_schema:
|
|
uf = UF_SCHEMA;
|
|
break;
|
|
|
|
case s_req_server_with_at:
|
|
found_at = 1;
|
|
|
|
/* FALLTROUGH */
|
|
case s_req_server:
|
|
uf = UF_HOST;
|
|
break;
|
|
|
|
case s_req_path:
|
|
uf = UF_PATH;
|
|
break;
|
|
|
|
case s_req_query_string:
|
|
uf = UF_QUERY;
|
|
break;
|
|
|
|
case s_req_fragment:
|
|
uf = UF_FRAGMENT;
|
|
break;
|
|
|
|
default:
|
|
assert(!"Unexpected state");
|
|
return 1;
|
|
}
|
|
|
|
/* Nothing's changed; soldier on */
|
|
if (uf == old_uf) {
|
|
u->field_data[uf].len++;
|
|
continue;
|
|
}
|
|
|
|
u->field_data[uf].off = p - buf;
|
|
u->field_data[uf].len = 1;
|
|
|
|
u->field_set |= (1 << uf);
|
|
old_uf = uf;
|
|
}
|
|
|
|
/* host must be present if there is a schema */
|
|
/* parsing http:///toto will fail */
|
|
if ((u->field_set & (1 << UF_SCHEMA)) &&
|
|
(u->field_set & (1 << UF_HOST)) == 0) {
|
|
return 1;
|
|
}
|
|
|
|
if (u->field_set & (1 << UF_HOST)) {
|
|
if (http_parse_host(buf, u, found_at) != 0) {
|
|
return 1;
|
|
}
|
|
}
|
|
|
|
/* CONNECT requests can only contain "hostname:port" */
|
|
if (is_connect && u->field_set != ((1 << UF_HOST)|(1 << UF_PORT))) {
|
|
return 1;
|
|
}
|
|
|
|
if (u->field_set & (1 << UF_PORT)) {
|
|
/* Don't bother with endp; we've already validated the string */
|
|
unsigned long v = strtoul(buf + u->field_data[UF_PORT].off, NULL, 10);
|
|
|
|
/* Ports have a max value of 2^16 */
|
|
if (v > 0xffff) {
|
|
return 1;
|
|
}
|
|
|
|
u->port = (uint16_t) v;
|
|
}
|
|
|
|
return 0;
|
|
}
|
|
|
|
void
|
|
http_parser_pause(http_parser *parser, int paused) {
|
|
/* Users should only be pausing/unpausing a parser that is not in an error
|
|
* state. In non-debug builds, there's not much that we can do about this
|
|
* other than ignore it.
|
|
*/
|
|
if (HTTP_PARSER_ERRNO(parser) == HPE_OK ||
|
|
HTTP_PARSER_ERRNO(parser) == HPE_PAUSED) {
|
|
SET_ERRNO((paused) ? HPE_PAUSED : HPE_OK);
|
|
} else {
|
|
assert(0 && "Attempting to pause parser in error state");
|
|
}
|
|
}
|
|
|
|
int
|
|
http_body_is_final(const struct http_parser *parser) {
|
|
return parser->state == s_message_done;
|
|
}
|
|
|
|
unsigned long
|
|
http_parser_version(void) {
|
|
return HTTP_PARSER_VERSION_MAJOR * 0x10000 |
|
|
HTTP_PARSER_VERSION_MINOR * 0x00100 |
|
|
HTTP_PARSER_VERSION_PATCH * 0x00001;
|
|
}
|